diff options
author | R David Murray <rdmurray@bitdance.com> | 2013-02-05 15:55:27 (GMT) |
---|---|---|
committer | R David Murray <rdmurray@bitdance.com> | 2013-02-05 15:55:27 (GMT) |
commit | e201e9d584e2922997eeacad06ee6e84a6419d08 (patch) | |
tree | 37e47281843a70b32983209108323c9a7130a2e4 /Lib/email | |
parent | 6e32442fd4b2f53347ab9415185257ed9c096c03 (diff) | |
parent | f581b372003de0ae604c14a1f1dc2e8c36ea277b (diff) | |
download | cpython-e201e9d584e2922997eeacad06ee6e84a6419d08.zip cpython-e201e9d584e2922997eeacad06ee6e84a6419d08.tar.gz cpython-e201e9d584e2922997eeacad06ee6e84a6419d08.tar.bz2 |
Merge: #16948: Fix quopri encoding of non-latin1 character sets.
Diffstat (limited to 'Lib/email')
-rw-r--r-- | Lib/email/charset.py | 13 |
1 file changed, 13 insertions, 0 deletions
```diff
diff --git a/Lib/email/charset.py b/Lib/email/charset.py
index f22be2c..c106649 100644
--- a/Lib/email/charset.py
+++ b/Lib/email/charset.py
@@ -392,6 +392,19 @@ class Charset:
                 string = string.encode(self.output_charset)
             return email.base64mime.body_encode(string)
         elif self.body_encoding is QP:
+            # quopromime.body_encode takes a string, but operates on it as if
+            # it were a list of byte codes. For a (minimal) history on why
+            # this is so, see changeset 0cf700464177. To correctly encode a
+            # character set, then, we must turn it into pseudo bytes via the
+            # latin1 charset, which will encode any byte as a single code point
+            # between 0 and 255, which is what body_encode is expecting.
+            #
+            # Note that this clause doesn't handle the case of a _payload that
+            # is already bytes. It never did, and the semantics of _payload
+            # being bytes has never been nailed down, so fixing that is a
+            # longer term TODO.
+            if isinstance(string, str):
+                string = string.encode(self.output_charset).decode('latin1')
             return email.quoprimime.body_encode(string)
         else:
             if isinstance(string, str):
```