summary | refs | log | tree | commit | diff | stats
path: root/Doc/lib/libhtmlparser.tex
diff options
context:
space:
mode:
author: Fred Drake <fdrake@acm.org>, 2001-07-05 16:34:36 (GMT)
committer: Fred Drake <fdrake@acm.org>, 2001-07-05 16:34:36 (GMT)
commit: 25211f5724087516f10ddb8a232d63e09a9b9bec (patch)
tree: 9b65993721a40b85f2c4490cae34b036c8ccf269 /Doc/lib/libhtmlparser.tex
parent: 5fe2c139d5d167f7acc4c795adf276fa66e4664c (diff)
download: cpython-25211f5724087516f10ddb8a232d63e09a9b9bec.zip
cpython-25211f5724087516f10ddb8a232d63e09a9b9bec.tar.gz
cpython-25211f5724087516f10ddb8a232d63e09a9b9bec.tar.bz2
Added more information on the differences between the htmllib and HTMLParser
modules.
Diffstat (limited to 'Doc/lib/libhtmlparser.tex')
-rw-r--r-- Doc/lib/libhtmlparser.tex 8
1 files changed, 7 insertions, 1 deletions
diff --git a/Doc/lib/libhtmlparser.tex b/Doc/lib/libhtmlparser.tex
index e8b4dd9..68c93e0 100644
--- a/Doc/lib/libhtmlparser.tex
+++ b/Doc/lib/libhtmlparser.tex
@@ -6,7 +6,9 @@
This module defines a class \class{HTMLParser} which serves as the
basis for parsing text files formatted in HTML\index{HTML} (HyperText
-Mark-up Language) and XHTML.\index{XHTML}
+Mark-up Language) and XHTML.\index{XHTML} Unlike the parser in
+\refmodule{htmllib}, this parser is not based on the SGML parser in
+\refmodule{sgmllib}.
\begin{classdesc}{HTMLParser}{}
@@ -15,6 +17,10 @@ The \class{HTMLParser} class is instantiated without arguments.
An HTMLParser instance is fed HTML data and calls handler functions
when tags begin and end. The \class{HTMLParser} class is meant to be
overridden by the user to provide a desired behavior.
+
+Unlike the parser in \refmodule{htmllib}, this parser does not check
+that end tags match start tags or call the end-tag handler for
+elements which are closed implicitly by closing an outer element.
\end{classdesc}