diff options
author | Neal Norwitz <nnorwitz@gmail.com> | 2005-09-30 04:46:49 (GMT) |
---|---|---|
committer | Neal Norwitz <nnorwitz@gmail.com> | 2005-09-30 04:46:49 (GMT) |
commit | 484d9a409a94e719329b41edaed38c1b16b8de7d (patch) | |
tree | a95cc808b2ce9df46b41a6ee8b45fb90ef00a68e | |
parent | aa93517de8b5e2b41644a22ae81ddec4f5d72991 (diff) | |
download | cpython-484d9a409a94e719329b41edaed38c1b16b8de7d.zip cpython-484d9a409a94e719329b41edaed38c1b16b8de7d.tar.gz cpython-484d9a409a94e719329b41edaed38c1b16b8de7d.tar.bz2 |
Patch #1309009: Fix segfault in pyexpat when the XML document is
in latin_1, but Python incorrectly assumes it is in UTF-8 format.
Will backport.
-rw-r--r-- | Lib/test/test_minidom.py | 9 | ||||
-rw-r--r-- | Misc/ACKS | 1 | ||||
-rw-r--r-- | Misc/NEWS | 3 | ||||
-rw-r--r-- | Modules/pyexpat.c | 7 |
4 files changed, 19 insertions, 1 deletions
diff --git a/Lib/test/test_minidom.py b/Lib/test/test_minidom.py
index 3154fbf..8b4c715 100644
--- a/Lib/test/test_minidom.py
+++ b/Lib/test/test_minidom.py
@@ -889,6 +889,15 @@ def testEncodings():
             and doc.toxml('utf-8') == '<?xml version="1.0" encoding="utf-8"?><foo>\xe2\x82\xac</foo>'
             and doc.toxml('iso-8859-15') == '<?xml version="1.0" encoding="iso-8859-15"?><foo>\xa4</foo>',
             "testEncodings - encoding EURO SIGN")
+
+    # Verify that character decoding errors throw exceptions instead of crashing
+    try:
+        doc = parseString('<fran\xe7ais>Comment \xe7a va ? Tr\xe8s bien ?</fran\xe7ais>')
+    except UnicodeDecodeError:
+        pass
+    else:
+        print 'parsing with bad encoding should raise a UnicodeDecodeError'
+
     doc.unlink()
 
 class UserDataHandler:
@@ -305,6 +305,7 @@ Flemming Kjær Jensen
 Jiba
 Orjan Johansen
 Simon Johnston
+Evan Jones
 Richard Jones
 Irmen de Jong
 Lucas de Jonge
@@ -153,6 +153,9 @@ present).
 Extension Modules
 -----------------
 
+- Patch #1309009, Fix segfault in pyexpat when the XML document is in latin_1,
+  but Python incorrectly assumes it is in UTF-8 format
+
 - Fix parse errors in the readline module when compiling without threads.
 
 - Patch #1288833: Removed thread lock from socket.getaddrinfo on
diff --git a/Modules/pyexpat.c b/Modules/pyexpat.c
index e6c14f8..438f760 100644
--- a/Modules/pyexpat.c
+++ b/Modules/pyexpat.c
@@ -417,6 +417,9 @@ string_intern(xmlparseobject *self, const char* str)
 {
     PyObject *result = STRING_CONV_FUNC(str);
     PyObject *value;
+    /* result can be NULL if the unicode conversion failed. */
+    if (!result)
+        return result;
     if (!self->intern)
         return result;
     value = PyDict_GetItem(self->intern, result);
@@ -572,7 +575,9 @@ my_StartElementHandler(void *userData,
             Py_DECREF(v);
         }
     }
-    args = Py_BuildValue("(NN)", string_intern(self, name), container);
+    args = string_intern(self, name);
+    if (args != NULL)
+        args = Py_BuildValue("(NN)", args, container);
     if (args == NULL) {
         Py_DECREF(container);
         return;