summary | refs | log | tree | commit | diff | stats
path: root/Lib/test/test_unicode.py
diff options
context:
space:
mode:
author: Ezio Melotti <ezio.melotti@gmail.com> 2010-06-05 19:21:32 (GMT)
committer: Ezio Melotti <ezio.melotti@gmail.com> 2010-06-05 19:21:32 (GMT)
commit: ab2eb0ee84ceb4b8f28653559248adb43a9502de (patch)
tree: 9324893ae15e346eaeb8663479344e0d0f732724 /Lib/test/test_unicode.py
parent: e57e50c8e77bc64e1ebab7a9ddf6f13fc3440c48 (diff)
download: cpython-ab2eb0ee84ceb4b8f28653559248adb43a9502de.zip
cpython-ab2eb0ee84ceb4b8f28653559248adb43a9502de.tar.gz
cpython-ab2eb0ee84ceb4b8f28653559248adb43a9502de.tar.bz2
Add a NEWS entry for r81758 and clarify a comment.
Diffstat (limited to 'Lib/test/test_unicode.py')
-rw-r--r-- Lib/test/test_unicode.py 6
1 files changed, 3 insertions, 3 deletions
diff --git a/Lib/test/test_unicode.py b/Lib/test/test_unicode.py
index 3171379..4550be8 100644
--- a/Lib/test/test_unicode.py
+++ b/Lib/test/test_unicode.py
@@ -670,9 +670,9 @@ class UnicodeTest(
('\xF4'+cb+'\xBF\xBF').decode, 'utf-8')
def test_issue8271(self):
- # Issue #8271: when a byte sequence is invalid, only the start byte
- # and all the valid continuation bytes should be replaced by U+FFFD,
- # not the number of bytes specified by the start byte.
+ # Issue #8271: during the decoding of an invalid UTF-8 byte sequence,
+ # only the start byte and the continuation byte(s) are now considered
+ # invalid, instead of the number of bytes specified by the start byte.
# See http://www.unicode.org/versions/Unicode5.2.0/ch03.pdf (page 95,
# table 3-8, Row 2) for more information about the algorithm used.
FFFD = u'\ufffd'