summary refs log tree commit diff stats
path: root/Objects/stringobject.c
diff options
context:
space:
mode:
Diffstat (limited to 'Objects/stringobject.c')
-rw-r--r-- Objects/stringobject.c 83
1 files changed, 68 insertions, 15 deletions
diff --git a/Objects/stringobject.c b/Objects/stringobject.c
index 92adb49..c11a362 100644
--- a/Objects/stringobject.c
+++ b/Objects/stringobject.c
@@ -26,6 +26,19 @@ static PyStringObject *nullstring;
static PyObject *interned;
+#if defined(HAVE_MBTOWC) && defined(HAVE_WCHAR_H) /* multibyte-aware output is only compiled in when both feature macros are defined */
+# define PRINT_MULTIBYTE_STRING /* selects the mbtowc()-based loops in string_print() and PyString_Repr() */
+# include <locale.h>
+# include <wchar.h>
+# if defined(HAVE_ISWPRINT)
+# define _isprint iswprint /* printable test applied to the wchar_t decoded by mbtowc(); NOTE(review): ISO C declares iswprint() in <wctype.h>, which is not included here -- confirm it is visible on all supported platforms */
+# else
+# define _isprint isprint /* NOTE(review): isprint() is only defined for unsigned char values and EOF, but it is called with a wchar_t -- confirm this fallback is safe */
+# endif
+#endif
+
+static const char *hexchars = "0123456789abcdef"; /* lowercase hex digits, indexed by a 4-bit nibble when PyString_Repr() writes a \x escape */
+
/*
For both PyString_FromString() and PyString_FromStringAndSize(), the
parameter `size' denotes number of characters to allocate, not counting any
@@ -749,8 +762,14 @@ PyString_AsStringAndSize(register PyObject *obj,
static int
string_print(PyStringObject *op, FILE *fp, int flags)
{
+#ifndef PRINT_MULTIBYTE_STRING
int i;
char c;
+#else
+ char *scur, *send;
+ wchar_t c;
+ int cr;
+#endif
int quote;
/* XXX Ought to check for interrupts when writing long strings */
@@ -776,20 +795,36 @@ string_print(PyStringObject *op, FILE *fp, int flags)
quote = '"';
fputc(quote, fp);
+#ifndef PRINT_MULTIBYTE_STRING
for (i = 0; i < op->ob_size; i++) {
c = op->ob_sval[i];
+#else
+ for (scur = op->ob_sval, send = op->ob_sval + op->ob_size;
+ scur < send; scur += cr) {
+ if ((cr = mbtowc(&c, scur, send - scur)) <= 0)
+ goto non_printable;
+#endif
if (c == quote || c == '\\')
- fprintf(fp, "\\%c", c);
+ fputc('\\', fp), fputc(c, fp);
else if (c == '\t')
- fprintf(fp, "\\t");
+ fputs("\\t", fp);
else if (c == '\n')
- fprintf(fp, "\\n");
+ fputs("\\n", fp);
else if (c == '\r')
- fprintf(fp, "\\r");
- else if (c < ' ' || c >= 0x7f)
- fprintf(fp, "\\x%02x", c & 0xff);
- else
+ fputs("\\r", fp);
+#ifndef PRINT_MULTIBYTE_STRING
+ else if (' ' <= c && c < 0x7f)
fputc(c, fp);
+ else
+ fprintf(fp, "\\x%02x", c & 0xff);
+#else
+ else if (_isprint(c))
+ fwrite(scur, cr, 1, fp);
+ else {
+non_printable: cr = 1; /* unit to move cursor */
+ fprintf(fp, "\\x%02x", *scur & 0xff);
+ }
+#endif
}
fputc(quote, fp);
return 0;
@@ -810,8 +845,14 @@ PyString_Repr(PyObject *obj, int smartquotes)
return NULL;
}
else {
+#ifndef PRINT_MULTIBYTE_STRING
register int i;
register char c;
+#else
+ register char *scur, *send;
+ wchar_t c;
+ int cr;
+#endif
register char *p;
int quote;
@@ -824,11 +865,18 @@ PyString_Repr(PyObject *obj, int smartquotes)
p = PyString_AS_STRING(v);
*p++ = quote;
+#ifndef PRINT_MULTIBYTE_STRING
for (i = 0; i < op->ob_size; i++) {
/* There's at least enough room for a hex escape
and a closing quote. */
assert(newsize - (p - PyString_AS_STRING(v)) >= 5);
c = op->ob_sval[i];
+#else
+ for (scur = op->ob_sval, send = op->ob_sval + op->ob_size;
+ scur < send; scur += cr) {
+ if ((cr = mbtowc(&c, scur, send - scur)) <= 0)
+ goto non_printable;
+#endif
if (c == quote || c == '\\')
*p++ = '\\', *p++ = c;
else if (c == '\t')
@@ -837,15 +885,20 @@ PyString_Repr(PyObject *obj, int smartquotes)
*p++ = '\\', *p++ = 'n';
else if (c == '\r')
*p++ = '\\', *p++ = 'r';
- else if (c < ' ' || c >= 0x7f) {
- /* For performance, we don't want to call
- PyOS_snprintf here (extra layers of
- function call). */
- sprintf(p, "\\x%02x", c & 0xff);
- p += 4;
- }
- else
+#ifndef PRINT_MULTIBYTE_STRING
+ else if (' ' <= c && c < 0x7f)
*p++ = c;
+ else {
+#else
+ else if (_isprint(c))
+ memcpy(p, scur, cr), p += cr;
+ else {
+non_printable: cr = 1; c = *scur;
+#endif
+ *p++ = '\\'; *p++ = 'x';
+ *p++ = hexchars[(c >> 4) & 0x0f];
+ *p++ = hexchars[c & 0x0f];
+ }
}
assert(newsize - (p - PyString_AS_STRING(v)) >= 1);
*p++ = quote;