From 0b9e3f750cc91e83d9614dd941545a8b29fa248a Mon Sep 17 00:00:00 2001
From: Fred Drake
Date: Tue, 12 Nov 2002 22:19:34 +0000
Subject: Handle the Content-Type header a little more appropriately: if it
 contains options, drop them to get the major/minor content type. Modified
 from the supplied patch to support more whitespace variation. Closes SF
 patch #613605.

---
 Tools/webchecker/webchecker.py | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/Tools/webchecker/webchecker.py b/Tools/webchecker/webchecker.py
index fd7f578..e8d0ed7 100755
--- a/Tools/webchecker/webchecker.py
+++ b/Tools/webchecker/webchecker.py
@@ -544,6 +544,9 @@ class Checker:
     def checkforhtml(self, info, url):
         if info.has_key('content-type'):
             ctype = cgi.parse_header(info['content-type'])[0].lower()
+            if ';' in ctype:
+                # handle content-type: text/html; charset=iso8859-1 :
+                ctype = ctype.split(';', 1)[0].strip()
         else:
             if url[-1:] == "/":
                 return 1
--
cgit v0.12