summaryrefslogtreecommitdiffstats
path: root/Include/unicodeobject.h
diff options
context:
space:
mode:
authorMarc-André Lemburg <mal@egenix.com>2000-08-03 18:46:08 (GMT)
committerMarc-André Lemburg <mal@egenix.com>2000-08-03 18:46:08 (GMT)
commitbff879cabba567f1c57ae41c3c69bb1ac275860a (patch)
treef77dca0c907d47543bfe2d4acf40685d5e3c24ef /Include/unicodeobject.h
parent2b83b4601f9f588b46667b541b100b5924019a14 (diff)
downloadcpython-bff879cabba567f1c57ae41c3c69bb1ac275860a.zip
cpython-bff879cabba567f1c57ae41c3c69bb1ac275860a.tar.gz
cpython-bff879cabba567f1c57ae41c3c69bb1ac275860a.tar.bz2
This patch finalizes the move from UTF-8 to a default encoding in
the Python Unicode implementation. The internal buffer used for implementing the buffer protocol is renamed to defenc to make this change visible. It now holds the default encoded version of the Unicode object and is calculated on demand (NULL otherwise). Since the default encoding defaults to ASCII, this will mean that Unicode objects which hold non-ASCII characters will no longer work on C APIs using the "s" or "t" parser markers. C APIs must now explicitly provide Unicode support via the "u", "U" or "es"/"es#" parser markers in order to work with non-ASCII Unicode strings. (Note: this patch will also have to be applied to the 1.6 branch of the CVS tree.)
Diffstat (limited to 'Include/unicodeobject.h')
-rw-r--r--Include/unicodeobject.h5
1 files changed, 3 insertions, 2 deletions
diff --git a/Include/unicodeobject.h b/Include/unicodeobject.h
index af3a376..01dce94 100644
--- a/Include/unicodeobject.h
+++ b/Include/unicodeobject.h
@@ -204,8 +204,9 @@ typedef struct {
int length; /* Length of raw Unicode data in buffer */
Py_UNICODE *str; /* Raw Unicode buffer */
long hash; /* Hash value; -1 if not set */
- PyObject *utf8str; /* UTF-8 encoded version as Python string,
- or NULL */
+ PyObject *defenc; /* (Default) Encoded version as Python
+ string, or NULL; this is used for
+ implementing the buffer protocol */
} PyUnicodeObject;
extern DL_IMPORT(PyTypeObject) PyUnicode_Type;