From d09def36d52af3e087433eb67c49da633436c602 Mon Sep 17 00:00:00 2001 From: Georg Brandl Date: Thu, 9 Mar 2006 13:27:14 +0000 Subject: Bug #1442874: handle "<!>", the empty SGML comment --- Lib/markupbase.py | 5 ++++- Lib/test/test_htmlparser.py | 2 +- 2 files changed, 5 insertions(+), 2 deletions(-) diff --git a/Lib/markupbase.py b/Lib/markupbase.py index 3d00a74..85b07a2 100644 --- a/Lib/markupbase.py +++ b/Lib/markupbase.py @@ -76,13 +76,16 @@ class ParserBase: rawdata = self.rawdata j = i + 2 assert rawdata[i:j] == "<!", "unexpected call to parse_declaration" + if rawdata[j:j+1] == ">": + # the empty comment <!> + return j + 1 if rawdata[j:j+1] in ("-", ""): # Start of comment followed by buffer boundary, # or just a buffer boundary. return -1 # A simple, practical version could look like: ((name|stringlit) S*) + '>' n = len(rawdata) - if rawdata[j:j+1] == '--': #comment + if rawdata[j:j+2] == '--': #comment # Locate --.*-- as the body of the comment return self.parse_comment(i) elif rawdata[j] == '[': #marked section diff --git a/Lib/test/test_htmlparser.py b/Lib/test/test_htmlparser.py index 4cb87df..54b90cd 100755 --- a/Lib/test/test_htmlparser.py +++ b/Lib/test/test_htmlparser.py @@ -115,7 +115,7 @@ comment1b--> <Img sRc='Bar' isMAP>sample text &#x201C; -<!--comment2a-- --comment2b--> +<!--comment2a-- --comment2b--><!> </Html> """, [ ("data", "\n"), -- cgit v0.12