diff options
Diffstat (limited to 'Tools/clinic/clinic.py')
-rwxr-xr-x | Tools/clinic/clinic.py | 351 |
1 files changed, 269 insertions, 82 deletions
diff --git a/Tools/clinic/clinic.py b/Tools/clinic/clinic.py index 82dfaaa..5b8786a 100755 --- a/Tools/clinic/clinic.py +++ b/Tools/clinic/clinic.py @@ -23,7 +23,6 @@ import sys import tempfile import textwrap - # TODO: # converters for # @@ -52,6 +51,8 @@ import textwrap # is too new for us. # +version = '1' + _empty = inspect._empty _void = inspect._void @@ -195,6 +196,46 @@ def linear_format(s, **kwargs): return output()[:-1] +def version_splitter(s): + """Splits a version string into a tuple of integers. + + The following ASCII characters are allowed, and employ + the following conversions: + a -> -3 + b -> -2 + c -> -1 + (This permits Python-style version strings such as "1.4b3".) + """ + version = [] + accumulator = [] + def flush(): + if not accumulator: + raise ValueError('Malformed version string: ' + repr(s)) + version.append(int(''.join(accumulator))) + accumulator.clear() + + for c in s: + if c.isdigit(): + accumulator.append(c) + elif c == '.': + flush() + elif c in 'abc': + flush() + version.append('abc'.index(c) - 3) + else: + raise ValueError('Illegal character ' + repr(c) + ' in version string ' + repr(s)) + flush() + return tuple(version) + +def version_comparitor(version1, version2): + iterator = itertools.zip_longest(version_splitter(version1), version_splitter(version2), fillvalue=0) + for i, (a, b) in enumerate(iterator): + if a < b: + return -1 + if a > b: + return 1 + return 0 + class CRenderData: def __init__(self): @@ -373,22 +414,22 @@ PyDoc_STRVAR({c_basename}__doc__, {docstring}); #define {methoddef_name} \\ - {{"{name}", (PyCFunction){c_basename}, {meth_flags}, {c_basename}__doc__}}, -""".replace('{meth_flags}', flags) + {{"{name}", (PyCFunction){c_basename}, {methoddef_flags}, {c_basename}__doc__}}, +""".replace('{methoddef_flags}', flags) - def meth_noargs_pyobject_template(self, meth_flags=""): - return self.template_base("METH_NOARGS", meth_flags) + """ + def meth_noargs_pyobject_template(self, methoddef_flags=""): + return self.template_base("METH_NOARGS", methoddef_flags) + """ static PyObject * -{c_basename}(PyObject *{self_name}) +{c_basename}({self_type}{self_name}) """ - def meth_noargs_template(self, meth_flags=""): - return self.template_base("METH_NOARGS", meth_flags) + """ + def meth_noargs_template(self, methoddef_flags=""): + return self.template_base("METH_NOARGS", methoddef_flags) + """ static {impl_return_type} {impl_prototype}; static PyObject * -{c_basename}(PyObject *{self_name}) +{c_basename}({self_type}{self_name}) {{ PyObject *return_value = NULL; {declarations} @@ -406,14 +447,14 @@ static {impl_return_type} {impl_prototype} """ - def meth_o_template(self, meth_flags=""): - return self.template_base("METH_O", meth_flags) + """ + def meth_o_template(self, methoddef_flags=""): + return self.template_base("METH_O", methoddef_flags) + """ static PyObject * {c_basename}({impl_parameters}) """ - def meth_o_return_converter_template(self, meth_flags=""): - return self.template_base("METH_O", meth_flags) + """ + def meth_o_return_converter_template(self, methoddef_flags=""): + return self.template_base("METH_O", methoddef_flags) + """ static {impl_return_type} {impl_prototype}; @@ -435,13 +476,13 @@ static {impl_return_type} {impl_prototype} """ - def option_group_template(self, meth_flags=""): - return self.template_base("METH_VARARGS", meth_flags) + """ + def option_group_template(self, methoddef_flags=""): + return self.template_base("METH_VARARGS", methoddef_flags) + """ static {impl_return_type} {impl_prototype}; static PyObject * -{c_basename}(PyObject *{self_name}, PyObject *args) +{c_basename}({self_type}{self_name}, PyObject *args) {{ PyObject *return_value = NULL; {declarations} @@ -460,13 +501,13 @@ static {impl_return_type} {impl_prototype} """ - def keywords_template(self, meth_flags=""): - return self.template_base("METH_VARARGS|METH_KEYWORDS", meth_flags) + """ + def keywords_template(self, methoddef_flags=""): + return self.template_base("METH_VARARGS|METH_KEYWORDS", methoddef_flags) + """ static {impl_return_type} {impl_prototype}; static PyObject * -{c_basename}(PyObject *{self_name}, PyObject *args, PyObject *kwargs) +{c_basename}({self_type}{self_name}, PyObject *args, PyObject *kwargs) {{ PyObject *return_value = NULL; static char *_keywords[] = {{{keywords}, NULL}}; @@ -489,13 +530,13 @@ static {impl_return_type} {impl_prototype} """ - def positional_only_template(self, meth_flags=""): - return self.template_base("METH_VARARGS", meth_flags) + """ + def positional_only_template(self, methoddef_flags=""): + return self.template_base("METH_VARARGS", methoddef_flags) + """ static {impl_return_type} {impl_prototype}; static PyObject * -{c_basename}(PyObject *{self_name}, PyObject *args) +{c_basename}({self_type}{self_name}, PyObject *args) {{ PyObject *return_value = NULL; {declarations} @@ -614,27 +655,6 @@ static {impl_return_type} add, output = text_accumulator() data = CRenderData() - if f.kind == STATIC_METHOD: - meth_flags = 'METH_STATIC' - self_name = "null" - else: - if f.kind == CALLABLE: - meth_flags = '' - self_name = "self" if f.cls else "module" - elif f.kind == CLASS_METHOD: - meth_flags = 'METH_CLASS' - self_name = "cls" - else: - fail("Unrecognized 'kind' " + repr(f.kind) + " for function " + f.name) - - data.impl_parameters.append("PyObject *" + self_name) - data.impl_arguments.append(self_name) - - if f.coexist: - if meth_flags: - meth_flags += '|' - meth_flags += 'METH_COEXIST' - parameters = list(f.parameters.values()) converters = [p.converter for p in parameters] @@ -654,8 +674,6 @@ static {impl_return_type} template_dict['docstring'] = self.docstring_for_c_string(f) - template_dict['self_name'] = self_name - positional = has_option_groups = False if parameters: @@ -680,6 +698,18 @@ static {impl_return_type} if has_option_groups: assert positional + # now insert our "self" (or whatever) parameters + # (we deliberately don't call render on self converters) + stock_self = self_converter('self', f) + template_dict['self_name'] = stock_self.name + template_dict['self_type'] = stock_self.type + data.impl_parameters.insert(0, f.self_converter.type + ("" if f.self_converter.type.endswith('*') else " ") + f.self_converter.name) + if f.self_converter.type != stock_self.type: + self_cast = '(' + f.self_converter.type + ')' + else: + self_cast = '' + data.impl_arguments.insert(0, self_cast + stock_self.name) + f.return_converter.render(f, data) template_dict['impl_return_type'] = f.return_converter.type @@ -701,25 +731,26 @@ static {impl_return_type} if not parameters: if default_return_converter: - template = self.meth_noargs_pyobject_template(meth_flags) + template = self.meth_noargs_pyobject_template(f.methoddef_flags) else: - template = self.meth_noargs_template(meth_flags) + template = self.meth_noargs_template(f.methoddef_flags) elif (len(parameters) == 1 and parameters[0].kind == inspect.Parameter.POSITIONAL_ONLY and not converters[0].is_optional() and isinstance(converters[0], object_converter) and converters[0].format_unit == 'O'): if default_return_converter: - template = self.meth_o_template(meth_flags) + template = self.meth_o_template(f.methoddef_flags) else: # HACK # we're using "impl_parameters" for the # non-impl function, because that works # better for METH_O. but that means we - # must surpress actually declaring the + # must supress actually declaring the # impl's parameters as variables in the # non-impl. but since it's METH_O, we - # only have one anyway, and it's the first one. + # only have one anyway, so + # we don't have any problem finding it. declarations_copy = list(data.declarations) before, pyobject, after = declarations_copy[0].partition('PyObject *') assert not before, "hack failed, see comment" @@ -727,16 +758,16 @@ static {impl_return_type} assert after and after[0].isalpha(), "hack failed, see comment" del declarations_copy[0] template_dict['declarations'] = "\n".join(declarations_copy) - template = self.meth_o_return_converter_template(meth_flags) + template = self.meth_o_return_converter_template(f.methoddef_flags) elif has_option_groups: self.render_option_group_parsing(f, template_dict) - template = self.option_group_template(meth_flags) + template = self.option_group_template(f.methoddef_flags) template = linear_format(template, option_group_parsing=template_dict['option_group_parsing']) elif positional: - template = self.positional_only_template(meth_flags) + template = self.positional_only_template(f.methoddef_flags) else: - template = self.keywords_template(meth_flags) + template = self.keywords_template(f.methoddef_flags) template = linear_format(template, declarations=template_dict['declarations'], @@ -1178,6 +1209,20 @@ class Function: self.docstring = docstring or '' self.kind = kind self.coexist = coexist + self.self_converter = None + + @property + def methoddef_flags(self): + flags = [] + if self.kind == CLASS_METHOD: + flags.append('METH_CLASS') + elif self.kind == STATIC_METHOD: + flags.append('METH_STATIC') + else: + assert self.kind == CALLABLE, "unknown kind: " + repr(self.kind) + if self.coexist: + flags.append('METH_COEXIST') + return '|'.join(flags) def __repr__(self): return '<clinic.Function ' + self.name + '>' @@ -1307,6 +1352,7 @@ class CConverter(metaclass=CConverterAutoRegister): # The C converter *function* to be used, if any. # (If this is not None, format_unit must be 'O&'.) converter = None + encoding = None impl_by_reference = False parse_by_reference = True @@ -1354,6 +1400,8 @@ class CConverter(metaclass=CConverterAutoRegister): # impl_arguments s = ("&" if self.impl_by_reference else "") + name data.impl_arguments.append(s) + if self.length: + data.impl_arguments.append(self.length_name()) # keywords data.keywords.append(name) @@ -1370,12 +1418,20 @@ class CConverter(metaclass=CConverterAutoRegister): # impl_parameters data.impl_parameters.append(self.simple_declaration(by_reference=self.impl_by_reference)) + if self.length: + data.impl_parameters.append("Py_ssize_clean_t " + self.length_name()) # cleanup cleanup = self.cleanup() if cleanup: data.cleanup.append('/* Cleanup for ' + name + ' */\n' + cleanup.rstrip() + "\n") + def length_name(self): + """Computes the name of the associated "length" variable.""" + if not self.length: + return None + return ensure_legal_c_identifier(self.name) + "_length" + # Why is this one broken out separately? # For "positional-only" function parsing, # which generates a bunch of PyArg_ParseTuple calls. @@ -1388,9 +1444,13 @@ class CConverter(metaclass=CConverterAutoRegister): if self.encoding: list.append(self.encoding) - s = ("&" if self.parse_by_reference else "") + ensure_legal_c_identifier(self.name) + legal_name = ensure_legal_c_identifier(self.name) + s = ("&" if self.parse_by_reference else "") + legal_name list.append(s) + if self.length: + list.append("&" + self.length_name()) + # # All the functions after here are intended as extension points. # @@ -1421,6 +1481,10 @@ class CConverter(metaclass=CConverterAutoRegister): declaration.append(" = ") declaration.append(default) declaration.append(";") + if self.length: + declaration.append('\nPy_ssize_clean_t ') + declaration.append(self.length_name()) + declaration.append(';') return "".join(declaration) def initialize(self): @@ -1462,7 +1526,7 @@ class byte_converter(CConverter): def converter_init(self, *, bitwise=False): if bitwise: - format_unit = 'B' + self.format_unit = 'B' class short_converter(CConverter): type = 'short' @@ -1478,15 +1542,17 @@ class unsigned_short_converter(CConverter): if not bitwise: fail("Unsigned shorts must be bitwise (for now).") -@add_legacy_c_converter('C', from_str=True) +@add_legacy_c_converter('C', types='str') class int_converter(CConverter): type = 'int' format_unit = 'i' c_ignored_default = "0" - def converter_init(self, *, from_str=False): - if from_str: - format_unit = 'C' + def converter_init(self, *, types='int'): + if types == 'str': + self.format_unit = 'C' + elif types != 'int': + fail("int_converter: illegal 'types' argument") class unsigned_int_converter(CConverter): type = 'unsigned int' @@ -1568,18 +1634,66 @@ class object_converter(CConverter): self.encoding = type -@add_legacy_c_converter('y', from_bytes=True) +@add_legacy_c_converter('s#', length=True) +@add_legacy_c_converter('y', type="bytes") +@add_legacy_c_converter('y#', type="bytes", length=True) @add_legacy_c_converter('z', nullable=True) +@add_legacy_c_converter('z#', nullable=True, length=True) class str_converter(CConverter): type = 'const char *' format_unit = 's' - def converter_init(self, *, nullable=False, from_bytes=False): - if from_bytes: - assert not nullable - format_unit = 'y' - if nullable: - format_unit = 'z' + def converter_init(self, *, encoding=None, types="str", + length=False, nullable=False, zeroes=False): + + types = set(types.strip().split()) + bytes_type = set(("bytes",)) + str_type = set(("str",)) + all_3_type = set(("bytearray",)) | bytes_type | str_type + is_bytes = types == bytes_type + is_str = types == str_type + is_all_3 = types == all_3_type + + self.length = bool(length) + format_unit = None + + if encoding: + self.encoding = encoding + + if is_str and not (length or zeroes or nullable): + format_unit = 'es' + elif is_all_3 and not (length or zeroes or nullable): + format_unit = 'et' + elif is_str and length and zeroes and not nullable: + format_unit = 'es#' + elif is_all_3 and length and not (nullable or zeroes): + format_unit = 'et#' + + if format_unit.endswith('#'): + # TODO set pointer to NULL + # TODO add cleanup for buffer + pass + + else: + if zeroes: + fail("str_converter: illegal combination of arguments (zeroes is only legal with an encoding)") + + if is_bytes and not (nullable or length): + format_unit = 'y' + elif is_bytes and length and not nullable: + format_unit = 'y#' + elif is_str and not (nullable or length): + format_unit = 's' + elif is_str and length and not nullable: + format_unit = 's#' + elif is_str and nullable and not length: + format_unit = 'z' + elif is_str and nullable and length: + format_unit = 'z#' + + if not format_unit: + fail("str_converter: illegal combination of arguments") + self.format_unit = format_unit class PyBytesObject_converter(CConverter): @@ -1594,36 +1708,89 @@ class unicode_converter(CConverter): type = 'PyObject *' format_unit = 'U' +@add_legacy_c_converter('u#', length=True) @add_legacy_c_converter('Z', nullable=True) +@add_legacy_c_converter('Z#', nullable=True, length=True) class Py_UNICODE_converter(CConverter): type = 'Py_UNICODE *' format_unit = 'u' - def converter_init(self, *, nullable=False): - if nullable: - format_unit = 'Z' + def converter_init(self, *, nullable=False, length=False): + format_unit = 'Z' if nullable else 'u' + if length: + format_unit += '#' + self.length = True + self.format_unit = format_unit -@add_legacy_c_converter('s*', zeroes=True) -@add_legacy_c_converter('w*', read_write=True) -@add_legacy_c_converter('z*', zeroes=True, nullable=True) +# +# We define three string conventions for buffer types in the 'types' argument: +# 'buffer' : any object supporting the buffer interface +# 'rwbuffer': any object supporting the buffer interface, but must be writeable +# 'robuffer': any object supporting the buffer interface, but must not be writeable +# +@add_legacy_c_converter('s*', types='str bytes bytearray buffer') +@add_legacy_c_converter('z*', types='str bytes bytearray buffer', nullable=True) +@add_legacy_c_converter('w*', types='bytearray rwbuffer') class Py_buffer_converter(CConverter): type = 'Py_buffer' format_unit = 'y*' impl_by_reference = True c_ignored_default = "{NULL, NULL, 0, 0, 0, 0, NULL, NULL, NULL, NULL, NULL}" - def converter_init(self, *, str=False, zeroes=False, nullable=False, read_write=False): - if not str: - assert not (zeroes or nullable or read_write) - elif read_write: - assert not (zeroes or nullable) - self.format_unit = 'w*' + def converter_init(self, *, types='bytes bytearray buffer', nullable=False): + types = set(types.strip().split()) + bytes_type = set(('bytes',)) + bytearray_type = set(('bytearray',)) + buffer_type = set(('buffer',)) + rwbuffer_type = set(('rwbuffer',)) + robuffer_type = set(('robuffer',)) + str_type = set(('str',)) + bytes_bytearray_buffer_type = bytes_type | bytearray_type | buffer_type + + format_unit = None + if types == (str_type | bytes_bytearray_buffer_type): + format_unit = 's*' if not nullable else 'z*' else: - assert zeroes - self.format_unit = 'z*' if nullable else 's*' + if nullable: + fail('Py_buffer_converter: illegal combination of arguments (nullable=True)') + elif types == (bytes_bytearray_buffer_type): + format_unit = 'y*' + elif types == (bytearray_type | rwuffer_type): + format_unit = 'w*' + if not format_unit: + fail("Py_buffer_converter: illegal combination of arguments") + + self.format_unit = format_unit def cleanup(self): - return "PyBuffer_Release(&" + ensure_legal_c_identifier(self.name) + ");\n" + name = ensure_legal_c_identifier(self.name) + return "".join(["if (", name, ".buf)\n PyBuffer_Release(&", name, ");\n"]) + + +class self_converter(CConverter): + """ + A special-case converter: + this is the default converter used for "self". + """ + type = "PyObject *" + def converter_init(self): + f = self.function + if f.kind == CALLABLE: + if f.cls: + self.name = "self" + else: + self.name = "module" + self.type = "PyModuleDef *" + elif f.kind == STATIC_METHOD: + self.name = "null" + self.type = "void *" + elif f.kind == CLASS_METHOD: + self.name = "cls" + self.type = "PyTypeObject *" + + def render(self, parameter, data): + fail("render() should never be called on self_converter instances") + def add_c_return_converter(f, name=None): @@ -1830,6 +1997,11 @@ class DSLParser: self.kind = CALLABLE self.coexist = False + def directive_version(self, required): + global version + if version_comparitor(version, required) < 0: + fail("Insufficient Clinic version!\n Version: " + version + "\n Required: " + required) + def directive_module(self, name): fields = name.split('.') new = fields.pop() @@ -1867,6 +2039,7 @@ class DSLParser: assert self.coexist == False self.coexist = True + def parse(self, block): self.reset() self.block = block @@ -2128,6 +2301,17 @@ class DSLParser: fail('{} is not a valid {}converter'.format(name, legacy_str)) converter = dict[name](parameter_name, self.function, value, **kwargs) + # special case: if it's the self converter, + # don't actually add it to the parameter list + if isinstance(converter, self_converter): + if self.function.parameters or (self.parameter_state != self.ps_required): + fail("The 'self' parameter, if specified, must be the very first thing in the parameter block.") + if self.function.self_converter: + fail("You can't specify the 'self' parameter more than once.") + self.function.self_converter = converter + self.parameter_state = self.ps_start + return + kind = inspect.Parameter.KEYWORD_ONLY if self.keyword_only else inspect.Parameter.POSITIONAL_OR_KEYWORD p = Parameter(parameter_name, kind, function=self.function, converter=converter, default=value, group=self.group) self.function.parameters[parameter_name] = p @@ -2224,6 +2408,9 @@ class DSLParser: # the final stanza of the DSL is the docstring. def state_function_docstring(self, line): + if not self.function.self_converter: + self.function.self_converter = self_converter("self", self.function) + if self.group: fail("Function " + self.function.name + " has a ] without a matching [.") |