summary | refs | log | tree | commit | diff | stats
path: root/Lib/email
diff options
context:
space:
mode:
author R David Murray <rdmurray@bitdance.com> 2013-02-05 16:34:39 (GMT)
committer R David Murray <rdmurray@bitdance.com> 2013-02-05 16:34:39 (GMT)
commit c44911f49aeb0cdb54f006f99111b562b29fc46f (patch)
tree 0af78d63398d01f122b7dbdf947639c925919114 /Lib/email
parent 0b6119e478a98b35dbd40354e4f5826108b8ce87 (diff)
parent e201e9d584e2922997eeacad06ee6e84a6419d08 (diff)
download cpython-c44911f49aeb0cdb54f006f99111b562b29fc46f.zip
cpython-c44911f49aeb0cdb54f006f99111b562b29fc46f.tar.gz
cpython-c44911f49aeb0cdb54f006f99111b562b29fc46f.tar.bz2
Merge: #16948: Fix quopri encoding of non-latin1 character sets.
Diffstat (limited to 'Lib/email')
-rw-r--r-- Lib/email/charset.py 13
1 files changed, 13 insertions, 0 deletions
diff --git a/Lib/email/charset.py b/Lib/email/charset.py
index f22be2c..c106649 100644
--- a/Lib/email/charset.py
+++ b/Lib/email/charset.py
@@ -392,6 +392,19 @@ class Charset:
string = string.encode(self.output_charset)
return email.base64mime.body_encode(string)
elif self.body_encoding is QP:
+ # quoprimime.body_encode takes a string, but operates on it as if
+ # it were a list of byte codes. For a (minimal) history on why
+ # this is so, see changeset 0cf700464177. To correctly encode a
+ # character set, then, we must turn it into pseudo bytes via the
+ # latin1 charset, which will encode any byte as a single code point
+ # between 0 and 255, which is what body_encode is expecting.
+ #
+ # Note that this clause doesn't handle the case of a _payload that
+ # is already bytes. It never did, and the semantics of _payload
+ # being bytes have never been nailed down, so fixing that is a
+ # longer term TODO.
+ if isinstance(string, str):
+ string = string.encode(self.output_charset).decode('latin1')
return email.quoprimime.body_encode(string)
else:
if isinstance(string, str):