diff options
author | Eric Smith <eric@trueblade.com> | 2007-08-26 22:27:13 (GMT) |
---|---|---|
committer | Eric Smith <eric@trueblade.com> | 2007-08-26 22:27:13 (GMT) |
commit | 7ade6485abde95c5cc9676ad3e476ba3aca98037 (patch) | |
tree | fa5710899c3e376f89eb6a6460e06f3feee62d58 | |
parent | 2bf4d5ba2881725bb7695bc0573bab0e2ca4fec5 (diff) | |
download | cpython-7ade6485abde95c5cc9676ad3e476ba3aca98037.zip cpython-7ade6485abde95c5cc9676ad3e476ba3aca98037.tar.gz cpython-7ade6485abde95c5cc9676ad3e476ba3aca98037.tar.bz2 |
PEP 3101: Completed string.Formatter class. Reimplemented field_name to object transformation.
-rw-r--r-- | Include/unicodeobject.h | 3 | ||||
-rw-r--r-- | Lib/string.py | 42 | ||||
-rw-r--r-- | Lib/test/test_string.py | 23 | ||||
-rw-r--r-- | Lib/test/test_unicode.py | 9 | ||||
-rw-r--r-- | Objects/stringlib/string_format.h | 425 | ||||
-rw-r--r-- | Objects/unicodeobject.c | 165 | ||||
-rw-r--r-- | Python/sysmodule.c | 27 |
7 files changed, 497 insertions, 197 deletions
diff --git a/Include/unicodeobject.h b/Include/unicodeobject.h index f940887..bc94a53 100644 --- a/Include/unicodeobject.h +++ b/Include/unicodeobject.h @@ -1440,8 +1440,7 @@ PyAPI_FUNC(Py_UNICODE*) Py_UNICODE_strchr( PyObject * _unicodeformatter_iterator(PyObject *str); PyObject * -_unicodeformatter_lookup(PyObject *field_name, PyObject *args, - PyObject *kwargs); +_unicodeformatter_field_name_split(PyObject *field_name); #ifdef __cplusplus } diff --git a/Lib/string.py b/Lib/string.py index 9df78af..edf5ae2 100644 --- a/Lib/string.py +++ b/Lib/string.py @@ -200,31 +200,59 @@ class Template(metaclass=_TemplateMetaclass): # exposed here via the sys module. sys was chosen because it's always # available and doesn't have to be dynamically loaded. -# The parser is implemented in sys._formatter_parser. -# The "object lookup" is implemented in sys._formatter_lookup +# The overall parser is implemented in sys._formatter_parser. +# The field name parser is implemented in sys._formatter_field_name_split -from sys import _formatter_parser, _formatter_lookup +from sys import _formatter_parser, _formatter_field_name_split class Formatter: def format(self, format_string, *args, **kwargs): return self.vformat(format_string, args, kwargs) def vformat(self, format_string, args, kwargs): + used_args = set() result = [] for (is_markup, literal, field_name, format_spec, conversion) in \ _formatter_parser(format_string): if is_markup: - # find the object - index, name, obj = _formatter_lookup(field_name, args, kwargs) + # given the field_name, find the object it references + + # split it into the first part, and and iterator that + # looks over the rest + first, rest = _formatter_field_name_split(field_name) + + used_args.add(first) + obj = self.get_value(first, args, kwargs) + + # loop through the rest of the field_name, doing + # getattr or getitem as needed + for is_attr, i in rest: + if is_attr: + obj = getattr(obj, i) + else: + obj = obj[i] + + # do any conversion on the resulting object + if conversion == 'r': + obj = repr(obj) + elif conversion == 's': + obj = str(obj) + + # format the object and append to the result + result.append(self.format_field(obj, format_spec)) else: result.append(literal) + self.check_unused_args(used_args, args, kwargs) return ''.join(result) def get_value(self, key, args, kwargs): - pass + if isinstance(key, int): + return args[key] + else: + return kwargs[key] def check_unused_args(self, used_args, args, kwargs): pass def format_field(self, value, format_spec): - pass + return format(value, format_spec) diff --git a/Lib/test/test_string.py b/Lib/test/test_string.py index ce9fe23..1706d2a 100644 --- a/Lib/test/test_string.py +++ b/Lib/test/test_string.py @@ -19,8 +19,27 @@ class ModuleTest(unittest.TestCase): fmt = string.Formatter() self.assertEqual(fmt.format("foo"), "foo") - # Formatter not working you for lookups - #self.assertEqual(fmt.format("foo{0}", "bar"), "foobar") + self.assertEqual(fmt.format("foo{0}", "bar"), "foobar") + self.assertEqual(fmt.format("foo{1}{0}-{1}", "bar", 6), "foo6bar-6") + self.assertEqual(fmt.format("-{arg!r}-", arg='test'), "-'test'-") + + class NamespaceFormatter(string.Formatter): + def __init__(self, namespace={}): + string.Formatter.__init__(self) + self.namespace = namespace + + def get_value(self, key, args, kwds): + if isinstance(key, str): + try: + # Check explicitly passed arguments first + return kwds[key] + except KeyError: + return self.namespace[key] + else: + string.Formatter.get_value(key, args, kwds) + + fmt = NamespaceFormatter({'greeting':'hello'}) + self.assertEqual(fmt.format("{greeting}, world!"), 'hello, world!') def test_maketrans(self): diff --git a/Lib/test/test_unicode.py b/Lib/test/test_unicode.py index ff0e015..c39ec09 100644 --- a/Lib/test/test_unicode.py +++ b/Lib/test/test_unicode.py @@ -449,6 +449,10 @@ class UnicodeTest( self.assertEqual('}}{{'.format(), '}{') self.assertEqual('}}x{{'.format(), '}x{') + # weird field names + self.assertEqual("{0[foo-bar]}".format({'foo-bar':'baz'}), 'baz') + self.assertEqual("{0[foo bar]}".format({'foo bar':'baz'}), 'baz') + self.assertEqual('{foo._x}'.format(foo=C(20)), '20') self.assertEqual('{1}{0}'.format(D(10), D(20)), '2010') self.assertEqual('{0._x.x}'.format(C(D('abc'))), 'abc') @@ -539,7 +543,11 @@ class UnicodeTest( self.assertRaises(ValueError, "}".format) self.assertRaises(ValueError, "abc{0:{}".format) self.assertRaises(ValueError, "{0".format) + self.assertRaises(ValueError, "{0.}".format) + self.assertRaises(ValueError, "{0[}".format) + self.assertRaises(ValueError, "{0]}".format) self.assertRaises(ValueError, "{0.[]}".format) + self.assertRaises(ValueError, "{0..foo}".format, 0) self.assertRaises(ValueError, "{0[0}".format) self.assertRaises(ValueError, "{0[0:foo}".format) self.assertRaises(ValueError, "{c]}".format) @@ -551,6 +559,7 @@ class UnicodeTest( self.assertRaises(ValueError, "{0!rs}".format) self.assertRaises(ValueError, "{!}".format) self.assertRaises(ValueError, "{:}".format) + self.assertRaises(ValueError, "{:s}".format) self.assertRaises(ValueError, "{}".format) # can't have a replacement on the field name portion diff --git a/Objects/stringlib/string_format.h b/Objects/stringlib/string_format.h index b81a7e3..2799141 100644 --- a/Objects/stringlib/string_format.h +++ b/Objects/stringlib/string_format.h @@ -72,23 +72,6 @@ SetError(const char *s) return PyErr_Format(PyExc_ValueError, "%s in format string", s); } -/* - check_input returns True if we still have characters - left in the input string. - - XXX: make this function go away when better error handling is - implemented. -*/ -Py_LOCAL_INLINE(int) -check_input(SubString *input) -{ - if (input->ptr < input->end) - return 1; - PyErr_SetString(PyExc_ValueError, - "unterminated replacement field"); - return 0; -} - /************************************************************************/ /*********** Output string management functions ****************/ /************************************************************************/ @@ -161,46 +144,22 @@ output_data(OutputString *output, const STRINGLIB_CHAR *s, Py_ssize_t count) /*********** Format string parsing -- integers and identifiers *********/ /************************************************************************/ -/* - end_identifier returns true if a character marks - the end of an identifier string. - - Although the PEP specifies that identifiers are - numbers or valid Python identifiers, we just let - getattr/getitem handle that, so the implementation - is more flexible than the PEP would indicate. -*/ -Py_LOCAL_INLINE(int) -end_identifier(STRINGLIB_CHAR c) +static Py_ssize_t +get_integer(const SubString *str) { - switch (c) { - case '.': case '[': case ']': - return 1; - default: - return 0; - } -} + Py_ssize_t accumulator = 0; + Py_ssize_t digitval; + Py_ssize_t oldaccumulator; + STRINGLIB_CHAR *p; -/* - get_integer consumes 0 or more decimal digit characters from an - input string, updates *result with the corresponding positive - integer, and returns the number of digits consumed. + /* empty string is an error */ + if (str->ptr >= str->end) + return -1; - returns -1 on error. -*/ -static int -get_integer(STRINGLIB_CHAR **ptr, STRINGLIB_CHAR *end, - Py_ssize_t *result) -{ - Py_ssize_t accumulator, digitval, oldaccumulator; - int numdigits; - accumulator = numdigits = 0; - for (;;(*ptr)++, numdigits++) { - if (*ptr >= end) - break; - digitval = STRINGLIB_TODECIMAL(**ptr); + for (p = str->ptr; p < str->end; p++) { + digitval = STRINGLIB_TODECIMAL(*p); if (digitval < 0) - break; + return -1; /* This trick was copied from old Unicode format code. It's cute, but would really suck on an old machine with a slow divide @@ -216,70 +175,215 @@ get_integer(STRINGLIB_CHAR **ptr, STRINGLIB_CHAR *end, } accumulator += digitval; } - *result = accumulator; - return numdigits; + return accumulator; } -/* - get_identifier is a bit of a misnomer. It returns a value for use - with getattr or getindex. This value will a string/unicode - object. The input cannot be zero length. Continues until end of - input, or end_identifier() returns true. -*/ +/************************************************************************/ +/******** Functions to get field objects and specification strings ******/ +/************************************************************************/ + +/* do the equivalent of obj.name */ static PyObject * -get_identifier(SubString *input) +getattr(PyObject *obj, SubString *name) { - STRINGLIB_CHAR *start; - - for (start = input->ptr; - input->ptr < input->end && !end_identifier(*input->ptr); - input->ptr++) - ; + PyObject *newobj; + PyObject *str = STRINGLIB_NEW(name->ptr, name->end - name->ptr); + if (str == NULL) + return NULL; + newobj = PyObject_GetAttr(obj, str); + Py_DECREF(str); + return newobj; +} - return STRINGLIB_NEW(start, input->ptr - start); +/* do the equivalent of obj[idx], where obj is a sequence */ +static PyObject * +getitem_sequence(PyObject *obj, Py_ssize_t idx) +{ + return PySequence_GetItem(obj, idx); +} - /* - We might want to add code here to check for invalid Python - identifiers. All identifiers are eventually passed to getattr - or getitem, so there is a check when used. However, we might - want to remove (or not) the ability to have strings like - "a/b" or " ab" or "-1" (which is not parsed as a number). - For now, this is left as an exercise for the first disgruntled - user... +/* do the equivalent of obj[idx], where obj is not a sequence */ +static PyObject * +getitem_idx(PyObject *obj, Py_ssize_t idx) +{ + PyObject *newobj; + PyObject *idx_obj = PyInt_FromSsize_t(idx); + if (idx_obj == NULL) + return NULL; + newobj = PyObject_GetItem(obj, idx_obj); + Py_DECREF(idx_obj); + return newobj; +} - if (XXX -- need check function) { - Py_DECREF(result); - PyErr_SetString(PyExc_ValueError, - "Invalid embedded Python identifier"); +/* do the equivalent of obj[name] */ +static PyObject * +getitem_str(PyObject *obj, SubString *name) +{ + PyObject *newobj; + PyObject *str = STRINGLIB_NEW(name->ptr, name->end - name->ptr); + if (str == NULL) return NULL; + newobj = PyObject_GetItem(obj, str); + Py_DECREF(str); + return newobj; +} + +typedef struct { + /* the entire string we're parsing. we assume that someone else + is managing its lifetime, and that it will exist for the + lifetime of the iterator. can be empty */ + SubString str; + + /* pointer to where we are inside field_name */ + STRINGLIB_CHAR *ptr; +} FieldNameIterator; + + +static int +FieldNameIterator_init(FieldNameIterator *self, STRINGLIB_CHAR *ptr, + Py_ssize_t len) +{ + SubString_init(&self->str, ptr, len); + self->ptr = self->str.ptr; + return 1; +} + +static int +_FieldNameIterator_attr(FieldNameIterator *self, SubString *name) +{ + STRINGLIB_CHAR c; + + name->ptr = self->ptr; + + /* return everything until '.' or '[' */ + while (self->ptr < self->str.end) { + switch (c = *self->ptr++) { + case '[': + case '.': + /* backup so that we this character will be seen next time */ + self->ptr--; + break; + default: + continue; + } + break; } - */ + /* end of string is okay */ + name->end = self->ptr; + return 1; } -/************************************************************************/ -/******** Functions to get field objects and specification strings ******/ -/************************************************************************/ +static int +_FieldNameIterator_item(FieldNameIterator *self, SubString *name) +{ + STRINGLIB_CHAR c; -/* get_field_and_spec is the main function in this section. It parses - the format string well enough to return a field object to render along - with a field specification string. -*/ + name->ptr = self->ptr; -/* - look up key in our keyword arguments + /* return everything until ']' */ + while (self->ptr < self->str.end) { + switch (c = *self->ptr++) { + case ']': + break; + default: + continue; + } + break; + } + /* end of string is okay */ + /* don't include the ']' */ + name->end = self->ptr-1; + return 1; +} + +/* returns 0 on error, 1 on non-error termination, and 2 if it returns a value */ +static int +FieldNameIterator_next(FieldNameIterator *self, int *is_attribute, + Py_ssize_t *name_idx, SubString *name) +{ + /* check at end of input */ + if (self->ptr >= self->str.end) + return 1; + + switch (*self->ptr++) { + case '.': + *is_attribute = 1; + if (_FieldNameIterator_attr(self, name) == 0) { + return 0; + } + *name_idx = -1; + break; + case '[': + *is_attribute = 0; + if (_FieldNameIterator_item(self, name) == 0) { + return 0; + } + *name_idx = get_integer(name); + break; + default: + /* interal error, can't get here */ + assert(0); + return 0; + } + + /* empty string is an error */ + if (name->ptr == name->end) { + PyErr_SetString(PyExc_ValueError, "Empty attribute in format string"); + return 0; + } + + return 2; +} + + +/* input: field_name + output: 'first' points to the part before the first '[' or '.' + 'first_idx' is -1 if 'first' is not an integer, otherwise + it's the value of first converted to an integer + 'rest' is an iterator to return the rest */ -static PyObject * -key_lookup(PyObject *kwargs, PyObject *key) +static int +field_name_split(STRINGLIB_CHAR *ptr, Py_ssize_t len, SubString *first, + Py_ssize_t *first_idx, FieldNameIterator *rest) { - PyObject *result; + STRINGLIB_CHAR c; + STRINGLIB_CHAR *p = ptr; + STRINGLIB_CHAR *end = ptr + len; + + /* find the part up until the first '.' or '[' */ + while (p < end) { + switch (c = *p++) { + case '[': + case '.': + /* backup so that we this character is available to the + "rest" iterator */ + p--; + break; + default: + continue; + } + break; + } + + /* set up the return values */ + SubString_init(first, ptr, p - ptr); + FieldNameIterator_init(rest, p, end - p); + + /* see if "first" is an integer, in which case it's used as an index */ + *first_idx = get_integer(first); - if (kwargs && (result = PyDict_GetItem(kwargs, key)) != NULL) { - Py_INCREF(result); - return result; + /* zero length string is an error */ + if (first->ptr >= first->end) { + PyErr_SetString(PyExc_ValueError, "empty field name"); + goto error; } - return NULL; + + return 1; +error: + return 0; } + /* get_field_object returns the object inside {}, before the format_spec. It handles getindex and getattr lookups and consumes @@ -288,80 +392,71 @@ key_lookup(PyObject *kwargs, PyObject *key) static PyObject * get_field_object(SubString *input, PyObject *args, PyObject *kwargs) { - PyObject *myobj, *subobj, *newobj; - STRINGLIB_CHAR c; + PyObject *obj = NULL; + int ok; + int is_attribute; + SubString name; + SubString first; Py_ssize_t index; - int isindex, isnumeric, isargument; - - index = isnumeric = 0; /* Just to shut up the compiler warnings */ + FieldNameIterator rest; - myobj = args; - Py_INCREF(myobj); + if (!field_name_split(input->ptr, input->end - input->ptr, &first, + &index, &rest)) { + goto error; + } - for (isindex=1, isargument=1;;) { - if (!check_input(input)) - break; - if (!isindex) { - if ((subobj = get_identifier(input)) == NULL) - break; - newobj = PyObject_GetAttr(myobj, subobj); - Py_DECREF(subobj); - } else { - isnumeric = (STRINGLIB_ISDECIMAL(*input->ptr)); - if (isnumeric) - /* XXX: add error checking */ - get_integer(&input->ptr, input->end, &index); - - if (isnumeric && PySequence_Check(myobj)) - newobj = PySequence_GetItem(myobj, index); - else { - /* XXX -- do we need PyLong_FromLongLong? - Using ssizet, not int... */ - subobj = isnumeric ? - PyInt_FromLong(index) : - get_identifier(input); - if (subobj == NULL) - break; - if (isargument) { - newobj = key_lookup(kwargs, subobj); - } else { - newobj = PyObject_GetItem(myobj, subobj); - } - Py_DECREF(subobj); - } + if (index == -1) { + /* look up in kwargs */ + PyObject *key = STRINGLIB_NEW(first.ptr, first.end - first.ptr); + if (key == NULL) + goto error; + if ((kwargs == NULL) || (obj = PyDict_GetItem(kwargs, key)) == NULL) { + PyErr_SetString(PyExc_ValueError, "Keyword argument not found " + "in format string"); + Py_DECREF(key); + goto error; } - Py_DECREF(myobj); - myobj = newobj; - if (myobj == NULL) - break; - if (!isargument && isindex) - if ((!check_input(input)) || (*(input->ptr++) != ']')) { - SetError("Expected ]"); - break; - } - - /* if at the end of input, return with myobj */ - if (input->ptr >= input->end) - return myobj; - - c = *input->ptr; - input->ptr++; - isargument = 0; - isindex = (c == '['); - if (!isindex && (c != '.')) { - SetError("Expected ., [, :, !, or }"); - break; + } else { + /* look up in args */ + obj = PySequence_GetItem(args, index); + if (obj == NULL) { + /* translate IndexError to a ValueError */ + PyErr_SetString(PyExc_ValueError, "Not enough positional arguments " + "in format string"); + goto error; } } - if ((myobj == NULL) && isargument) { - /* XXX: include more useful error information, like which - * keyword not found or which index missing */ - PyErr_Clear(); - return SetError(isnumeric - ? "Not enough positional arguments" - : "Keyword argument not found"); + + /* iterate over the rest of the field_name */ + while ((ok = FieldNameIterator_next(&rest, &is_attribute, &index, + &name)) == 2) { + PyObject *tmp; + + if (is_attribute) + /* getattr lookup "." */ + tmp = getattr(obj, &name); + else + /* getitem lookup "[]" */ + if (index == -1) + tmp = getitem_str(obj, &name); + else + if (PySequence_Check(obj)) + tmp = getitem_sequence(obj, index); + else + /* not a sequence */ + tmp = getitem_idx(obj, index); + if (tmp == NULL) + goto error; + + /* assign to obj */ + Py_DECREF(obj); + obj = tmp; } - Py_XDECREF(myobj); + /* end of iterator, this is the non-error case */ + if (ok == 1) + return obj; +error: + Py_XDECREF(obj); return NULL; } diff --git a/Objects/unicodeobject.c b/Objects/unicodeobject.c index d10d26f..1421bb2 100644 --- a/Objects/unicodeobject.c +++ b/Objects/unicodeobject.c @@ -9161,9 +9161,8 @@ typedef struct { static void formatteriter_dealloc(formatteriterobject *it) { - _PyObject_GC_UNTRACK(it); - Py_XDECREF(it->str); - PyObject_GC_Del(it); + Py_XDECREF(it->str); + PyObject_FREE(it); } /* returns a tuple: @@ -9313,7 +9312,7 @@ _unicodeformatter_iterator(PyObject *str) { formatteriterobject *it; - it = PyObject_GC_New(formatteriterobject, &PyFormatterIter_Type); + it = PyObject_New(formatteriterobject, &PyFormatterIter_Type); if (it == NULL) return NULL; @@ -9326,17 +9325,167 @@ _unicodeformatter_iterator(PyObject *str) PyUnicode_AS_UNICODE(str), PyUnicode_GET_SIZE(str)); - _PyObject_GC_TRACK(it); return (PyObject *)it; } -PyObject * -_unicodeformatter_lookup(PyObject *field_name, PyObject *args, - PyObject *kwargs) +/********************* FieldName Iterator ************************/ + +/* this is used to implement string.Formatter.vparse(). it parses + the field name into attribute and item values. */ + +typedef struct { + PyObject_HEAD + + /* we know this to be a unicode object, but since we just keep + it around to keep the object alive, having it as PyObject + is okay */ + PyObject *str; + + FieldNameIterator it_field; +} fieldnameiterobject; + +static void +fieldnameiter_dealloc(fieldnameiterobject *it) { + Py_XDECREF(it->str); + PyObject_FREE(it); +} + +/* returns a tuple: + (is_attr, value) + is_attr is true if we used attribute syntax (e.g., '.foo') + false if we used index syntax (e.g., '[foo]') + value is an integer or string +*/ +static PyObject * +fieldnameiter_next(fieldnameiterobject *it) +{ + int result; + int is_attr; + Py_ssize_t idx; + SubString name; + + result = FieldNameIterator_next(&it->it_field, &is_attr, + &idx, &name); + if (result == 0 || result == 1) { + /* if 0, error has already been set, if 1, iterator is empty */ + return NULL; + } else { + PyObject* result = NULL; + PyObject* is_attr_obj = NULL; + PyObject* obj = NULL; + + is_attr_obj = PyBool_FromLong(is_attr); + if (is_attr_obj == NULL) + goto error; + + /* either an integer or a string */ + if (idx != -1) + obj = PyInt_FromSsize_t(idx); + else + obj = STRINGLIB_NEW(name.ptr, name.end - name.ptr); + if (obj == NULL) + goto error; + + /* return a tuple of values */ + result = PyTuple_Pack(2, is_attr_obj, obj); + if (result == NULL) + goto error; + + return result; + + error: + Py_XDECREF(result); + Py_XDECREF(is_attr_obj); + Py_XDECREF(obj); + return NULL; + } return NULL; } +static PyMethodDef fieldnameiter_methods[] = { + {NULL, NULL} /* sentinel */ +}; + +static PyTypeObject PyFieldNameIter_Type = { + PyVarObject_HEAD_INIT(&PyType_Type, 0) + "fieldnameiterator", /* tp_name */ + sizeof(fieldnameiterobject), /* tp_basicsize */ + 0, /* tp_itemsize */ + /* methods */ + (destructor)fieldnameiter_dealloc, /* tp_dealloc */ + 0, /* tp_print */ + 0, /* tp_getattr */ + 0, /* tp_setattr */ + 0, /* tp_compare */ + 0, /* tp_repr */ + 0, /* tp_as_number */ + 0, /* tp_as_sequence */ + 0, /* tp_as_mapping */ + 0, /* tp_hash */ + 0, /* tp_call */ + 0, /* tp_str */ + PyObject_GenericGetAttr, /* tp_getattro */ + 0, /* tp_setattro */ + 0, /* tp_as_buffer */ + Py_TPFLAGS_DEFAULT, /* tp_flags */ + 0, /* tp_doc */ + 0, /* tp_traverse */ + 0, /* tp_clear */ + 0, /* tp_richcompare */ + 0, /* tp_weaklistoffset */ + PyObject_SelfIter, /* tp_iter */ + (iternextfunc)fieldnameiter_next, /* tp_iternext */ + fieldnameiter_methods, /* tp_methods */ + 0}; + +PyObject * +_unicodeformatter_field_name_split(PyObject *field_name) +{ + SubString first; + Py_ssize_t first_idx; + fieldnameiterobject *it; + + PyObject *first_obj = NULL; + PyObject *it_obj = NULL; + PyObject *result; + + it = PyObject_New(fieldnameiterobject, &PyFieldNameIter_Type); + if (it == NULL) + goto error; + it->str = NULL; + it_obj = (PyObject *)it; + + if (!field_name_split(STRINGLIB_STR(field_name), + STRINGLIB_LEN(field_name), + &first, &first_idx, &it->it_field)) + goto error; + + /* first becomes an integer, if possible, else a string */ + if (first_idx != -1) + first_obj = PyInt_FromSsize_t(first_idx); + else + /* convert "first" into a string object */ + first_obj = STRINGLIB_NEW(first.ptr, first.end - first.ptr); + if (first_obj == NULL) + goto error; + + /* take ownership, give the object to the iterator. this is + just to keep the field_name alive */ + Py_INCREF(field_name); + it->str = field_name; + + /* return a tuple of values */ + result = PyTuple_Pack(2, first_obj, it_obj); + if (result == NULL) + goto error; + + return result; +error: + Py_XDECREF(it_obj); + Py_XDECREF(first_obj); + return NULL; +} /********************* Unicode Iterator **************************/ diff --git a/Python/sysmodule.c b/Python/sysmodule.c index 10a7427..0c84db0 100644 --- a/Python/sysmodule.c +++ b/Python/sysmodule.c @@ -683,28 +683,28 @@ sys_formatter_iterator(PyObject *self, PyObject *args) return _unicodeformatter_iterator(str); } -/* sys_formatter_lookup is used to implement string.Formatter.vformat. - it takes an PEP 3101 "field name", args, and kwargs, and returns a - tuple (index, name, object). see unicodeobject.c's - _unicodeformatter_lookup for details */ +/* sys_formatter_field_name_split is used to implement + string.Formatter.vformat. it takes an PEP 3101 "field name", and + returns a tuple of (first, rest): "first", the part before the + first '.' or '['; and "rest", an iterator for the rest of the field + name. see unicodeobjects' _unicode_formatter_field_name_split for + details */ static PyObject * -sys_formatter_lookup(PyObject *self, PyObject *args) +sys_formatter_field_name_split(PyObject *self, PyObject *args) { PyObject *field_name; - PyObject *arg_args; - PyObject *kwargs; - if (!PyArg_ParseTuple(args, "OOO:_formatter_lookup", &field_name, - &arg_args, &kwargs)) + if (!PyArg_ParseTuple(args, "O:_formatter_field_name_split", + &field_name)) return NULL; if (!PyUnicode_Check(field_name)) { - PyErr_SetString(PyExc_TypeError, - "_formatter_lookup expects unicode object"); + PyErr_SetString(PyExc_TypeError, "_formatter_field_name_split " + "expects unicode object"); return NULL; } - return _unicodeformatter_lookup(field_name, arg_args, kwargs); + return _unicodeformatter_field_name_split(field_name); } @@ -773,7 +773,8 @@ static PyMethodDef sys_methods[] = { {"_current_frames", sys_current_frames, METH_NOARGS, current_frames_doc}, {"_formatter_parser", sys_formatter_iterator, METH_VARARGS}, - {"_formatter_lookup", sys_formatter_lookup, METH_VARARGS}, + {"_formatter_field_name_split", sys_formatter_field_name_split, + METH_VARARGS}, {"displayhook", sys_displayhook, METH_O, displayhook_doc}, {"exc_info", sys_exc_info, METH_NOARGS, exc_info_doc}, {"excepthook", sys_excepthook, METH_VARARGS, excepthook_doc}, |