diff options
author | Raymond Hettinger <python@rcn.com> | 2016-09-12 06:18:03 (GMT) |
---|---|---|
committer | Raymond Hettinger <python@rcn.com> | 2016-09-12 06:18:03 (GMT) |
commit | 076366c2a52b1446eb684806f95e10c91366094a (patch) | |
tree | cb8d617ff122ea64fb9c8a3d45a59faa4a53d826 /Lib | |
parent | 4b73676c3d260b37b91dedbc0b286c4e779350e4 (diff) | |
download | cpython-076366c2a52b1446eb684806f95e10c91366094a.zip cpython-076366c2a52b1446eb684806f95e10c91366094a.tar.gz cpython-076366c2a52b1446eb684806f95e10c91366094a.tar.bz2 |
Issue #17582: xml.etree.ElementTree nows preserves whitespaces in attributes
(Patch by Duane Griffin. Reviewed and approved by Stefan Behnel.)
Diffstat (limited to 'Lib')
-rw-r--r-- | Lib/test/test_xml_etree.py | 8 | ||||
-rw-r--r-- | Lib/xml/etree/ElementTree.py | 11 |
2 files changed, 19 insertions, 0 deletions
diff --git a/Lib/test/test_xml_etree.py b/Lib/test/test_xml_etree.py index bc1dd14..fbfc0b0 100644 --- a/Lib/test/test_xml_etree.py +++ b/Lib/test/test_xml_etree.py @@ -405,6 +405,14 @@ class ElementTreeTest(unittest.TestCase): self.assertEqual(ET.tostring(elem), b'<test testa="testval" testb="test1" testc="test2">aa</test>') + elem = ET.Element('test') + elem.set('a', '\r') + elem.set('b', '\r\n') + elem.set('c', '\t\n\r ') + elem.set('d', '\n\n') + self.assertEqual(ET.tostring(elem), + b'<test a=" " b=" " c="	 " d=" " />') + def test_makeelement(self): # Test makeelement handling. diff --git a/Lib/xml/etree/ElementTree.py b/Lib/xml/etree/ElementTree.py index 6d1b0ab..92821c5 100644 --- a/Lib/xml/etree/ElementTree.py +++ b/Lib/xml/etree/ElementTree.py @@ -1083,8 +1083,19 @@ def _escape_attrib(text): text = text.replace(">", ">") if "\"" in text: text = text.replace("\"", """) + # The following business with carriage returns is to satisfy + # Section 2.11 of the XML specification, stating that + # CR or CR LN should be replaced with just LN + # http://www.w3.org/TR/REC-xml/#sec-line-ends + if "\r\n" in text: + text = text.replace("\r\n", "\n") + if "\r" in text: + text = text.replace("\r", "\n") + #The following four lines are issue 17582 if "\n" in text: text = text.replace("\n", " ") + if "\t" in text: + text = text.replace("\t", "	") return text except (TypeError, AttributeError): _raise_serialization_error(text) |