Merged revisions 81675 via svnmerge from

svn+ssh://pythondev@svn.python.org/python/trunk

........
r81675 | r.david.murray | 2010-06-03 11:43:20 -0400 (Thu, 03 Jun 2010) | 10 lines

#5610: use \Z not $ so we don't eat extra chars when body part ends with \r\n.

If a body part ended with \r\n, feedparser, using '$' to terminate its
search for the newline, would match on the \r\n, and think that it needed
to strip two characters in order to account for the line end before the
boundary. That made it chop one too many characters off the end of the
body part. Using \Z makes the match correct.

Patch and test by Tony Nelson.
........
author: R. David Murray <rdmurray@bitdance.com> 2010-06-16 02:19:40 (GMT)
committer: R. David Murray <rdmurray@bitdance.com> 2010-06-16 02:19:40 (GMT)
commit: 45e0e1444bfaa3d57b6adf3bd2a7ec9171407792 (patch)
tree: 317538a77f43d3478cff286a8f00795292b1288a /Lib
parent: 9691e59d77dfab8d996c6f04ed21c3f8b290c970 (diff)
download: cpython-45e0e1444bfaa3d57b6adf3bd2a7ec9171407792.zip
cpython-45e0e1444bfaa3d57b6adf3bd2a7ec9171407792.tar.gz
cpython-45e0e1444bfaa3d57b6adf3bd2a7ec9171407792.tar.bz2
2 files changed, 19 insertions, 1 deletions
diff --git a/Lib/email/feedparser.py b/Lib/email/feedparser.py
index bff17ba..a6853c2 100644
--- a/Lib/email/feedparser.py
+++ b/Lib/email/feedparser.py
@@ -28,7 +28,7 @@ from email import message
 
 NLCRE = re.compile('\r\n|\r|\n')
 NLCRE_bol = re.compile('(\r\n|\r|\n)')
-NLCRE_eol = re.compile('(\r\n|\r|\n)$')
+NLCRE_eol = re.compile('(\r\n|\r|\n)\Z')
 NLCRE_crack = re.compile('(\r\n|\r|\n)')
 # RFC 2822 $3.6.8 Optional fields.  ftext is %d33-57 / %d59-126, Any character
 # except controls, SP, and ":".
diff --git a/Lib/email/test/test_email.py b/Lib/email/test/test_email.py
index 79146a3..be0565e 100644
--- a/Lib/email/test/test_email.py
+++ b/Lib/email/test/test_email.py
@@ -2588,6 +2588,24 @@ Here's the message body
         eq(headers, ['A', 'B', 'CC'])
         eq(msg.get_payload(), 'body')
 
+    def test_CRLFLF_at_end_of_part(self):
+        # issue 5610: feedparser should not eat two chars from body part ending
+        # with "\r\n\n".
+        m = (
+            "From: foo@bar.com\n"
+            "To: baz\n"
+            "Mime-Version: 1.0\n"
+            "Content-Type: multipart/mixed; boundary=BOUNDARY\n"
+            "\n"
+            "--BOUNDARY\n"
+            "Content-Type: text/plain\n"
+            "\n"
+            "body ending with CRLF newline\r\n"
+            "\n"
+            "--BOUNDARY--\n"
+          )
+        msg = email.message_from_string(m)
+        self.assertTrue(msg.get_payload(0).get_payload().endswith('\r\n'))
 
 
 class TestBase64(unittest.TestCase):
author	R. David Murray <rdmurray@bitdance.com>	2010-06-16 02:19:40 (GMT)
committer	R. David Murray <rdmurray@bitdance.com>	2010-06-16 02:19:40 (GMT)
commit	45e0e1444bfaa3d57b6adf3bd2a7ec9171407792 (patch)
tree	317538a77f43d3478cff286a8f00795292b1288a /Lib
parent	9691e59d77dfab8d996c6f04ed21c3f8b290c970 (diff)
download	cpython-45e0e1444bfaa3d57b6adf3bd2a7ec9171407792.zip cpython-45e0e1444bfaa3d57b6adf3bd2a7ec9171407792.tar.gz cpython-45e0e1444bfaa3d57b6adf3bd2a7ec9171407792.tar.bz2