Fix PyUnicode_Substring() for start >= length and start > end

Remove the fast-path for 1-character string: unicode_fromascii() and _PyUnicode_FromUCS*() now have their own fast-path for 1-character strings.
author: Victor Stinner <victor.stinner@gmail.com> 2012-05-03 00:32:34 (GMT)
committer: Victor Stinner <victor.stinner@gmail.com> 2012-05-03 00:32:34 (GMT)
commit: 684d5fd42067109f46e94ea3ddab72ebd4e130ee (patch)
tree: e422af086c643d02ff3181177db6451ee23499db /Objects
parent: b6cd014d75394ca48e6113d614d36ed16fbe7b13 (diff)
download: cpython-684d5fd42067109f46e94ea3ddab72ebd4e130ee.zip
cpython-684d5fd42067109f46e94ea3ddab72ebd4e130ee.tar.gz
cpython-684d5fd42067109f46e94ea3ddab72ebd4e130ee.tar.bz2
1 files changed, 8 insertions, 6 deletions
diff --git a/Objects/unicodeobject.c b/Objects/unicodeobject.c
index f427fd3..09b5733 100644
--- a/Objects/unicodeobject.c
+++ b/Objects/unicodeobject.c
@@ -12067,20 +12067,22 @@ PyUnicode_Substring(PyObject *self, Py_ssize_t start, Py_ssize_t end)
     if (PyUnicode_READY(self) == -1)
         return NULL;
 
-    end = Py_MIN(end, PyUnicode_GET_LENGTH(self));
+    length = PyUnicode_GET_LENGTH(self);
+    end = Py_MIN(end, length);
 
-    if (start == 0 && end == PyUnicode_GET_LENGTH(self))
+    if (start == 0 && end == length)
         return unicode_result_unchanged(self);
 
-    length = end - start;
-    if (length == 1)
-        return unicode_getitem(self, start);
-
     if (start < 0 || end < 0) {
         PyErr_SetString(PyExc_IndexError, "string index out of range");
         return NULL;
     }
+    if (start >= length || end < start) {
+        assert(end == length);
+        return PyUnicode_New(0, 0);
+    }
 
+    length = end - start;
     if (PyUnicode_IS_ASCII(self)) {
         data = PyUnicode_1BYTE_DATA(self);
         return unicode_fromascii(data + start, length);
author	Victor Stinner <victor.stinner@gmail.com>	2012-05-03 00:32:34 (GMT)
committer	Victor Stinner <victor.stinner@gmail.com>	2012-05-03 00:32:34 (GMT)
commit	684d5fd42067109f46e94ea3ddab72ebd4e130ee (patch)
tree	e422af086c643d02ff3181177db6451ee23499db /Objects
parent	b6cd014d75394ca48e6113d614d36ed16fbe7b13 (diff)
download	cpython-684d5fd42067109f46e94ea3ddab72ebd4e130ee.zip cpython-684d5fd42067109f46e94ea3ddab72ebd4e130ee.tar.gz cpython-684d5fd42067109f46e94ea3ddab72ebd4e130ee.tar.bz2