/* Compile an expression node to intermediate code */ /* XXX TO DO: XXX add __doc__ attribute == co_doc to code object attributes? XXX (it's currently the first item of the co_const tuple) XXX Generate simple jump for break/return outside 'try...finally' XXX Allow 'continue' inside try-finally XXX New opcode for loading the initial index for a for loop XXX other JAR tricks? */ #include "Python.h" #include "node.h" #include "token.h" #include "graminit.h" #include "compile.h" #include "opcode.h" #include "structmember.h" #include /* Three symbols from graminit.h are also defined in Python.h, with Py_ prefixes to their names. Python.h can't include graminit.h (which defines too many confusing symbols), but we can check here that they haven't changed (which is very unlikely, but possible). */ #if Py_single_input != single_input #error "single_input has changed -- update Py_single_input in Python.h" #endif #if Py_file_input != file_input #error "file_input has changed -- update Py_file_input in Python.h" #endif #if Py_eval_input != eval_input #error "eval_input has changed -- update Py_eval_input in Python.h" #endif int Py_OptimizeFlag = 0; #define OP_DELETE 0 #define OP_ASSIGN 1 #define OP_APPLY 2 #define VAR_LOAD 0 #define VAR_STORE 1 #define VAR_DELETE 2 #define NAME_LOCAL 0 #define NAME_GLOBAL 1 #define NAME_DEFAULT 2 #define TYPE_FUNCTION 0 #define TYPE_CLASS 1 #define TYPE_MODULE 2 #define IMPLICIT_GLOBAL 1 #define EXPLICIT_GLOBAL 2 #define MANGLE_LEN 256 #define OFF(x) offsetof(PyCodeObject, x) static struct memberlist code_memberlist[] = { {"co_argcount", T_INT, OFF(co_argcount), READONLY}, {"co_nlocals", T_INT, OFF(co_nlocals), READONLY}, {"co_stacksize",T_INT, OFF(co_stacksize), READONLY}, {"co_flags", T_INT, OFF(co_flags), READONLY}, {"co_code", T_OBJECT, OFF(co_code), READONLY}, {"co_consts", T_OBJECT, OFF(co_consts), READONLY}, {"co_names", T_OBJECT, OFF(co_names), READONLY}, {"co_varnames", T_OBJECT, OFF(co_varnames), READONLY}, {"co_filename", T_OBJECT, OFF(co_filename), READONLY}, {"co_name", T_OBJECT, OFF(co_name), READONLY}, {"co_firstlineno", T_INT, OFF(co_firstlineno), READONLY}, {"co_lnotab", T_OBJECT, OFF(co_lnotab), READONLY}, {NULL} /* Sentinel */ }; static PyObject * code_getattr(PyCodeObject *co, char *name) { return PyMember_Get((char *)co, code_memberlist, name); } static void code_dealloc(PyCodeObject *co) { Py_XDECREF(co->co_code); Py_XDECREF(co->co_consts); Py_XDECREF(co->co_names); Py_XDECREF(co->co_varnames); Py_XDECREF(co->co_filename); Py_XDECREF(co->co_name); Py_XDECREF(co->co_lnotab); PyObject_DEL(co); } static PyObject * code_repr(PyCodeObject *co) { char buf[500]; int lineno = -1; char *filename = "???"; char *name = "???"; if (co->co_firstlineno != 0) lineno = co->co_firstlineno; if (co->co_filename && PyString_Check(co->co_filename)) filename = PyString_AsString(co->co_filename); if (co->co_name && PyString_Check(co->co_name)) name = PyString_AsString(co->co_name); sprintf(buf, "", name, co, filename, lineno); return PyString_FromString(buf); } static int code_compare(PyCodeObject *co, PyCodeObject *cp) { int cmp; cmp = PyObject_Compare(co->co_name, cp->co_name); if (cmp) return cmp; cmp = co->co_argcount - cp->co_argcount; if (cmp) return cmp; cmp = co->co_nlocals - cp->co_nlocals; if (cmp) return cmp; cmp = co->co_flags - cp->co_flags; if (cmp) return cmp; cmp = PyObject_Compare(co->co_code, cp->co_code); if (cmp) return cmp; cmp = PyObject_Compare(co->co_consts, cp->co_consts); if (cmp) return cmp; cmp = PyObject_Compare(co->co_names, cp->co_names); if (cmp) return cmp; cmp = PyObject_Compare(co->co_varnames, cp->co_varnames); return cmp; } static long code_hash(PyCodeObject *co) { long h, h0, h1, h2, h3, h4; h0 = PyObject_Hash(co->co_name); if (h0 == -1) return -1; h1 = PyObject_Hash(co->co_code); if (h1 == -1) return -1; h2 = PyObject_Hash(co->co_consts); if (h2 == -1) return -1; h3 = PyObject_Hash(co->co_names); if (h3 == -1) return -1; h4 = PyObject_Hash(co->co_varnames); if (h4 == -1) return -1; h = h0 ^ h1 ^ h2 ^ h3 ^ h4 ^ co->co_argcount ^ co->co_nlocals ^ co->co_flags; if (h == -1) h = -2; return h; } PyTypeObject PyCode_Type = { PyObject_HEAD_INIT(&PyType_Type) 0, "code", sizeof(PyCodeObject), 0, (destructor)code_dealloc, /*tp_dealloc*/ 0, /*tp_print*/ (getattrfunc)code_getattr, /*tp_getattr*/ 0, /*tp_setattr*/ (cmpfunc)code_compare, /*tp_compare*/ (reprfunc)code_repr, /*tp_repr*/ 0, /*tp_as_number*/ 0, /*tp_as_sequence*/ 0, /*tp_as_mapping*/ (hashfunc)code_hash, /*tp_hash*/ }; #define NAME_CHARS \ "0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ_abcdefghijklmnopqrstuvwxyz" /* all_name_chars(s): true iff all chars in s are valid NAME_CHARS */ static int all_name_chars(unsigned char *s) { static char ok_name_char[256]; static unsigned char *name_chars = (unsigned char *)NAME_CHARS; if (ok_name_char[*name_chars] == 0) { unsigned char *p; for (p = name_chars; *p; p++) ok_name_char[*p] = 1; } while (*s) { if (ok_name_char[*s++] == 0) return 0; } return 1; } PyCodeObject * PyCode_New(int argcount, int nlocals, int stacksize, int flags, PyObject *code, PyObject *consts, PyObject *names, PyObject *varnames, PyObject *filename, PyObject *name, int firstlineno, PyObject *lnotab) { PyCodeObject *co; int i; PyBufferProcs *pb; /* Check argument types */ if (argcount < 0 || nlocals < 0 || code == NULL || consts == NULL || !PyTuple_Check(consts) || names == NULL || !PyTuple_Check(names) || varnames == NULL || !PyTuple_Check(varnames) || name == NULL || !PyString_Check(name) || filename == NULL || !PyString_Check(filename) || lnotab == NULL || !PyString_Check(lnotab)) { PyErr_BadInternalCall(); return NULL; } pb = code->ob_type->tp_as_buffer; if (pb == NULL || pb->bf_getreadbuffer == NULL || pb->bf_getsegcount == NULL || (*pb->bf_getsegcount)(code, NULL) != 1) { PyErr_BadInternalCall(); return NULL; } /* Make sure names and varnames are all strings, & intern them */ for (i = PyTuple_Size(names); --i >= 0; ) { PyObject *v = PyTuple_GetItem(names, i); if (v == NULL || !PyString_Check(v)) { PyErr_BadInternalCall(); return NULL; } PyString_InternInPlace(&PyTuple_GET_ITEM(names, i)); } for (i = PyTuple_Size(varnames); --i >= 0; ) { PyObject *v = PyTuple_GetItem(varnames, i); if (v == NULL || !PyString_Check(v)) { PyErr_BadInternalCall(); return NULL; } PyString_InternInPlace(&PyTuple_GET_ITEM(varnames, i)); } /* Intern selected string constants */ for (i = PyTuple_Size(consts); --i >= 0; ) { PyObject *v = PyTuple_GetItem(consts, i); if (!PyString_Check(v)) continue; if (!all_name_chars((unsigned char *)PyString_AsString(v))) continue; PyString_InternInPlace(&PyTuple_GET_ITEM(consts, i)); } co = PyObject_NEW(PyCodeObject, &PyCode_Type); if (co != NULL) { co->co_argcount = argcount; co->co_nlocals = nlocals; co->co_stacksize = stacksize; co->co_flags = flags; Py_INCREF(code); co->co_code = code; Py_INCREF(consts); co->co_consts = consts; Py_INCREF(names); co->co_names = names; Py_INCREF(varnames); co->co_varnames = varnames; Py_INCREF(filename); co->co_filename = filename; Py_INCREF(name); co->co_name = name; co->co_firstlineno = firstlineno; Py_INCREF(lnotab); co->co_lnotab = lnotab; } return co; } /* Data structure used internally */ /* The compiler uses two passes to generate bytecodes. The first pass builds the symbol table. The second pass generates the bytecode. The first pass uses a single symtable struct. The second pass uses a compiling struct for each code block. The compiling structs share a reference to the symtable. The two passes communicate via symtable_load_symbols() and via is_local() and is_global(). The former initializes several slots in the compiling struct: c_varnames, c_locals, c_nlocals, c_argcount, c_globals, and c_flags. */ struct compiling { PyObject *c_code; /* string */ PyObject *c_consts; /* list of objects */ PyObject *c_const_dict; /* inverse of c_consts */ PyObject *c_names; /* list of strings (names) */ PyObject *c_name_dict; /* inverse of c_names */ PyObject *c_globals; /* dictionary (value=None) */ PyObject *c_locals; /* dictionary (value=localID) */ PyObject *c_varnames; /* list (inverse of c_locals) */ int c_nlocals; /* index of next local */ int c_argcount; /* number of top-level arguments */ int c_flags; /* same as co_flags */ int c_nexti; /* index into c_code */ int c_errors; /* counts errors occurred */ int c_infunction; /* set when compiling a function */ int c_interactive; /* generating code for interactive command */ int c_loops; /* counts nested loops */ int c_begin; /* begin of current loop, for 'continue' */ int c_block[CO_MAXBLOCKS]; /* stack of block types */ int c_nblocks; /* current block stack level */ char *c_filename; /* filename of current node */ char *c_name; /* name of object (e.g. function) */ int c_lineno; /* Current line number */ int c_stacklevel; /* Current stack level */ int c_maxstacklevel; /* Maximum stack level */ int c_firstlineno; PyObject *c_lnotab; /* Table mapping address to line number */ int c_last_addr, c_last_line, c_lnotab_next; char *c_private; /* for private name mangling */ int c_tmpname; /* temporary local name counter */ struct symtable *c_symtable; /* pointer to module symbol table */ }; /* The symbol table is constructed each time PyNode_Compile() is called. The table walks the entire parse tree and identifies each use or definition of a variable. The symbol table contains a dictionary for each code block in a module: The symbol dictionary for the block. They keys of these dictionaries are the name of all variables used or defined in the block; the integer values are used to store several flags, e.g. DEF_PARAM indicates that a variable is a parameter to a function. The slots st_cur, st_cur_id, and st_cur_type always refer to the current code block. The st_cur slot is the symbol dictionary. The st_cur_id slot is the id is the key in st_symbols. The st_cur_type slot is one of TYPE_FUNCTION, TYPE_CLASS, or TYPE_MODULE. The st_symbols slot is a dictionary that maps code block ids to symbol dictionaries. The keys are generated by a counter that is incremented each time a new code block is found. The counter is identifies a specific scope, because both passes walk the parse tree in the same order. The st_varnames slot is a dictionary that maps code block ids to parameter lists. The st_global slot always refers to the symbol dictionary for the module. */ struct symtable { PyObject *st_symbols; /* dictionary of symbol tables */ PyObject *st_varnames; /* dictionary of parameter lists */ PyObject *st_namespaces; /* pointer to list of namespaces */ PyObject *st_types; /* pointer to list of namespace types */ PyObject *st_cur; /* borrowed ref to dict in st_symbols */ PyObject *st_cur_id; /* int id of current code block */ int st_cur_type; /* type of current scope */ PyObject *st_global; /* borrowed ref to MODULE in st_symbols */ int st_scopes; /* number of scopes */ int st_errors; /* number of errors */ char *st_private; /* name of current class or NULL */ int st_tmpname; /* temporary name counter */ }; #define GLOBAL "global" #define NOOPT ".noopt" /* Flags for def-use information */ #define DEF_GLOBAL 1 #define DEF_LOCAL 2 #define DEF_PARAM 2<<1 #define USE 2<<2 #define DEF_STAR 2<<3 #define DEF_DOUBLESTAR 2<<4 #define DEF_INTUPLE 2<<5 /* Error message including line number */ static void com_error(struct compiling *c, PyObject *exc, char *msg) { PyObject *v, *tb, *tmp; if (c == NULL) { /* Error occurred via symtable call to is_constant_false */ PyErr_SetString(exc, msg); return; } c->c_errors++; if (c->c_lineno <= 1) { /* Unknown line number or single interactive command */ PyErr_SetString(exc, msg); return; } v = PyString_FromString(msg); if (v == NULL) return; /* MemoryError, too bad */ PyErr_SetObject(exc, v); Py_DECREF(v); /* add attributes for the line number and filename for the error */ PyErr_Fetch(&exc, &v, &tb); PyErr_NormalizeException(&exc, &v, &tb); tmp = PyInt_FromLong(c->c_lineno); if (tmp == NULL) PyErr_Clear(); else { if (PyObject_SetAttrString(v, "lineno", tmp)) PyErr_Clear(); Py_DECREF(tmp); } if (c->c_filename != NULL) { tmp = PyString_FromString(c->c_filename); if (tmp == NULL) PyErr_Clear(); else { if (PyObject_SetAttrString(v, "filename", tmp)) PyErr_Clear(); Py_DECREF(tmp); } } PyErr_Restore(exc, v, tb); } /* Interface to the block stack */ static void block_push(struct compiling *c, int type) { if (c->c_nblocks >= CO_MAXBLOCKS) { com_error(c, PyExc_SystemError, "too many statically nested blocks"); } else { c->c_block[c->c_nblocks++] = type; } } static void block_pop(struct compiling *c, int type) { if (c->c_nblocks > 0) c->c_nblocks--; if (c->c_block[c->c_nblocks] != type && c->c_errors == 0) { com_error(c, PyExc_SystemError, "bad block pop"); } } /* Prototype forward declarations */ static int com_init(struct compiling *, char *); static void com_free(struct compiling *); static void com_push(struct compiling *, int); static void com_pop(struct compiling *, int); static void com_done(struct compiling *); static void com_node(struct compiling *, node *); static void com_factor(struct compiling *, node *); static void com_addbyte(struct compiling *, int); static void com_addint(struct compiling *, int); static void com_addoparg(struct compiling *, int, int); static void com_addfwref(struct compiling *, int, int *); static void com_backpatch(struct compiling *, int); static int com_add(struct compiling *, PyObject *, PyObject *, PyObject *); static int com_addconst(struct compiling *, PyObject *); static int com_addname(struct compiling *, PyObject *); static void com_addopname(struct compiling *, int, node *); static void com_list(struct compiling *, node *, int); static void com_list_iter(struct compiling *, node *, node *, char *); static int com_argdefs(struct compiling *, node *); static void com_assign(struct compiling *, node *, int, node *); static void com_assign_name(struct compiling *, node *, int); static PyCodeObject *icompile(node *, struct compiling *); static PyCodeObject *jcompile(node *, char *, struct compiling *); static PyObject *parsestrplus(node *); static PyObject *parsestr(char *); static node *get_rawdocstring(node *); static int is_local(struct compiling *, char *); static int is_global(struct compiling *, char *); /* symtable operations */ static int symtable_build(struct compiling *, node *); static int symtable_load_symbols(struct compiling *); static struct symtable *symtable_init(void); static void symtable_free(struct symtable *); static int symtable_enter_scope(struct symtable *, char *, int); static int symtable_exit_scope(struct symtable *); static int symtable_update_cur(struct symtable *); static int symtable_add_def(struct symtable *, char *, int); static int symtable_add_use(struct symtable *, char *); static void symtable_node(struct symtable *, node *); static void symtable_funcdef(struct symtable *, node *); static void symtable_default_args(struct symtable *, node *); static void symtable_params(struct symtable *, node *); static void symtable_params_fplist(struct symtable *, node *n); static void symtable_global(struct symtable *, node *); static void symtable_import(struct symtable *, node *); static void symtable_assign(struct symtable *, node *); static void symtable_list_comprehension(struct symtable *, node *); /* helper */ static void do_pad(int pad) { int i; for (i = 0; i < pad; ++i) fprintf(stderr, " "); } static void dump(node *n, int pad, int depth) { int i; if (depth == 0) return; do_pad(pad); fprintf(stderr, "%d: %s\n", TYPE(n), STR(n)); if (depth > 0) depth--; for (i = 0; i < NCH(n); ++i) dump(CHILD(n, i), pad + 1, depth); } #define DUMP(N) dump(N, 0, -1) static int com_init(struct compiling *c, char *filename) { memset((void *)c, '\0', sizeof(struct compiling)); if ((c->c_code = PyString_FromStringAndSize((char *)NULL, 1000)) == NULL) goto fail; if ((c->c_consts = PyList_New(0)) == NULL) goto fail; if ((c->c_const_dict = PyDict_New()) == NULL) goto fail; if ((c->c_names = PyList_New(0)) == NULL) goto fail; if ((c->c_name_dict = PyDict_New()) == NULL) goto fail; if ((c->c_globals = PyDict_New()) == NULL) goto fail; if ((c->c_locals = PyDict_New()) == NULL) goto fail; if ((c->c_lnotab = PyString_FromStringAndSize((char *)NULL, 1000)) == NULL) goto fail; c->c_varnames = NULL; c->c_nlocals = 0; c->c_argcount = 0; c->c_flags = 0; c->c_nexti = 0; c->c_errors = 0; c->c_infunction = 0; c->c_interactive = 0; c->c_loops = 0; c->c_begin = 0; c->c_nblocks = 0; c->c_filename = filename; c->c_name = "?"; c->c_lineno = 0; c->c_stacklevel = 0; c->c_maxstacklevel = 0; c->c_firstlineno = 0; c->c_last_addr = 0; c->c_last_line = 0; c->c_lnotab_next = 0; c->c_tmpname = 0; c->c_symtable = NULL; return 1; fail: com_free(c); return 0; } static void com_free(struct compiling *c) { Py_XDECREF(c->c_code); Py_XDECREF(c->c_consts); Py_XDECREF(c->c_const_dict); Py_XDECREF(c->c_names); Py_XDECREF(c->c_name_dict); Py_XDECREF(c->c_globals); Py_XDECREF(c->c_locals); Py_XDECREF(c->c_varnames); Py_XDECREF(c->c_lnotab); } static void com_push(struct compiling *c, int n) { c->c_stacklevel += n; if (c->c_stacklevel > c->c_maxstacklevel) c->c_maxstacklevel = c->c_stacklevel; } static void com_pop(struct compiling *c, int n) { if (c->c_stacklevel < n) { /* fprintf(stderr, "%s:%d: underflow! nexti=%d, level=%d, n=%d\n", c->c_filename, c->c_lineno, c->c_nexti, c->c_stacklevel, n); */ c->c_stacklevel = 0; } else c->c_stacklevel -= n; } static void com_done(struct compiling *c) { if (c->c_code != NULL) _PyString_Resize(&c->c_code, c->c_nexti); if (c->c_lnotab != NULL) _PyString_Resize(&c->c_lnotab, c->c_lnotab_next); } static void com_addbyte(struct compiling *c, int byte) { int len; /*fprintf(stderr, "%3d: %3d\n", c->c_nexti, byte);*/ assert(byte >= 0 && byte <= 255); if (byte < 0 || byte > 255) { /* fprintf(stderr, "XXX compiling bad byte: %d\n", byte); fatal("com_addbyte: byte out of range"); */ com_error(c, PyExc_SystemError, "com_addbyte: byte out of range"); } if (c->c_code == NULL) return; len = PyString_Size(c->c_code); if (c->c_nexti >= len) { if (_PyString_Resize(&c->c_code, len+1000) != 0) { c->c_errors++; return; } } PyString_AsString(c->c_code)[c->c_nexti++] = byte; } static void com_addint(struct compiling *c, int x) { com_addbyte(c, x & 0xff); com_addbyte(c, x >> 8); /* XXX x should be positive */ } static void com_add_lnotab(struct compiling *c, int addr, int line) { int size; char *p; if (c->c_lnotab == NULL) return; size = PyString_Size(c->c_lnotab); if (c->c_lnotab_next+2 > size) { if (_PyString_Resize(&c->c_lnotab, size + 1000) < 0) { c->c_errors++; return; } } p = PyString_AsString(c->c_lnotab) + c->c_lnotab_next; *p++ = addr; *p++ = line; c->c_lnotab_next += 2; } static void com_set_lineno(struct compiling *c, int lineno) { c->c_lineno = lineno; if (c->c_firstlineno == 0) { c->c_firstlineno = c->c_last_line = lineno; } else { int incr_addr = c->c_nexti - c->c_last_addr; int incr_line = lineno - c->c_last_line; while (incr_addr > 0 || incr_line > 0) { int trunc_addr = incr_addr; int trunc_line = incr_line; if (trunc_addr > 255) trunc_addr = 255; if (trunc_line > 255) trunc_line = 255; com_add_lnotab(c, trunc_addr, trunc_line); incr_addr -= trunc_addr; incr_line -= trunc_line; } c->c_last_addr = c->c_nexti; c->c_last_line = lineno; } } static void com_addoparg(struct compiling *c, int op, int arg) { int extended_arg = arg >> 16; if (op == SET_LINENO) { com_set_lineno(c, arg); if (Py_OptimizeFlag) return; } if (extended_arg){ com_addbyte(c, EXTENDED_ARG); com_addint(c, extended_arg); arg &= 0xffff; } com_addbyte(c, op); com_addint(c, arg); } static void com_addfwref(struct compiling *c, int op, int *p_anchor) { /* Compile a forward reference for backpatching */ int here; int anchor; com_addbyte(c, op); here = c->c_nexti; anchor = *p_anchor; *p_anchor = here; com_addint(c, anchor == 0 ? 0 : here - anchor); } static void com_backpatch(struct compiling *c, int anchor) { unsigned char *code = (unsigned char *) PyString_AsString(c->c_code); int target = c->c_nexti; int dist; int prev; for (;;) { /* Make the JUMP instruction at anchor point to target */ prev = code[anchor] + (code[anchor+1] << 8); dist = target - (anchor+2); code[anchor] = dist & 0xff; dist >>= 8; code[anchor+1] = dist; dist >>= 8; if (dist) { com_error(c, PyExc_SystemError, "com_backpatch: offset too large"); break; } if (!prev) break; anchor -= prev; } } /* Handle literals and names uniformly */ static int com_add(struct compiling *c, PyObject *list, PyObject *dict, PyObject *v) { PyObject *w, *t, *np=NULL; long n; t = Py_BuildValue("(OO)", v, v->ob_type); if (t == NULL) goto fail; w = PyDict_GetItem(dict, t); if (w != NULL) { n = PyInt_AsLong(w); } else { n = PyList_Size(list); np = PyInt_FromLong(n); if (np == NULL) goto fail; if (PyList_Append(list, v) != 0) goto fail; if (PyDict_SetItem(dict, t, np) != 0) goto fail; Py_DECREF(np); } Py_DECREF(t); return n; fail: Py_XDECREF(np); Py_XDECREF(t); c->c_errors++; return 0; } static int com_addconst(struct compiling *c, PyObject *v) { return com_add(c, c->c_consts, c->c_const_dict, v); } static int com_addname(struct compiling *c, PyObject *v) { return com_add(c, c->c_names, c->c_name_dict, v); } static int mangle(char *p, char *name, char *buffer, size_t maxlen) { /* Name mangling: __private becomes _classname__private. This is independent from how the name is used. */ size_t nlen, plen; if (p == NULL || name == NULL || name[0] != '_' || name[1] != '_') return 0; nlen = strlen(name); if (nlen+2 >= maxlen) return 0; /* Don't mangle __extremely_long_names */ if (name[nlen-1] == '_' && name[nlen-2] == '_') return 0; /* Don't mangle __whatever__ */ /* Strip leading underscores from class name */ while (*p == '_') p++; if (*p == '\0') return 0; /* Don't mangle if class is just underscores */ plen = strlen(p); if (plen + nlen >= maxlen) plen = maxlen-nlen-2; /* Truncate class name if too long */ /* buffer = "_" + p[:plen] + name # i.e. 1+plen+nlen bytes */ buffer[0] = '_'; strncpy(buffer+1, p, plen); strcpy(buffer+1+plen, name); /* fprintf(stderr, "mangle %s -> %s\n", name, buffer); */ return 1; } static int com_mangle(struct compiling *c, char *name, char *buffer, size_t maxlen) { return mangle(c->c_private, name, buffer, maxlen); } static void com_addop_name(struct compiling *c, int op, char *name) { PyObject *v; int i; char buffer[MANGLE_LEN]; /* fprintf(stderr, "com_addop_name(%s, %d, %s)\n", c->c_name, op, name); */ if (com_mangle(c, name, buffer, sizeof(buffer))) name = buffer; if (name == NULL || (v = PyString_InternFromString(name)) == NULL) { c->c_errors++; i = 255; } else { i = com_addname(c, v); Py_DECREF(v); } com_addoparg(c, op, i); } static void com_addop_varname(struct compiling *c, int kind, char *name) { PyObject *v; int i; int scope; int op = STOP_CODE; char buffer[MANGLE_LEN]; if (com_mangle(c, name, buffer, sizeof(buffer))) name = buffer; if (name == NULL || (v = PyString_InternFromString(name)) == NULL) { c->c_errors++; i = 255; goto done; } scope = NAME_DEFAULT; if (c->c_symtable->st_cur_type == TYPE_FUNCTION && is_local(c, name)) { scope = NAME_LOCAL; } else { int g = is_global(c, name); if ((g & EXPLICIT_GLOBAL) || ((c->c_flags & CO_OPTIMIZED) && g)) scope = NAME_GLOBAL; } /* XXX Test can probably be eliminated once we reach 2.1 beta 1 */ if (!(is_local(c, name) || is_global(c, name))) { fprintf(stderr, "name: %s", name); fprintf(stderr, ", in %s, file '%s', line %d\n", c->c_name, c->c_filename, c->c_lineno); fprintf(stderr, "locals: %s\n", PyString_AS_STRING(PyObject_Repr(c->c_locals))); fprintf(stderr, "globals: %s\n", PyString_AS_STRING(PyObject_Repr(c->c_globals))); Py_FatalError("compiler did not label name as local or global"); } i = com_addname(c, v); if (scope == NAME_LOCAL) { PyObject *w = PyDict_GetItem(c->c_locals, v); if (w == NULL) { c->c_errors++; i = 255; goto done; } else i = PyInt_AsLong(w); } Py_DECREF(v); switch (kind) { case VAR_LOAD: switch (scope) { case NAME_LOCAL: op = LOAD_FAST; break; case NAME_GLOBAL: op = LOAD_GLOBAL; break; case NAME_DEFAULT: op = LOAD_NAME; } break; case VAR_STORE: switch (scope) { case NAME_LOCAL: op = STORE_FAST; break; case NAME_GLOBAL: op = STORE_GLOBAL; break; case NAME_DEFAULT: op = STORE_NAME; } break; case VAR_DELETE: switch (scope) { case NAME_LOCAL: op = DELETE_FAST; break; case NAME_GLOBAL: op = DELETE_GLOBAL; break; case NAME_DEFAULT: op = DELETE_NAME; } break; } done: com_addoparg(c, op, i); } static void com_addopname(struct compiling *c, int op, node *n) { char *name; char buffer[1000]; /* XXX it is possible to write this code without the 1000 chars on the total length of dotted names, I just can't be bothered right now */ if (TYPE(n) == STAR) name = "*"; else if (TYPE(n) == dotted_name) { char *p = buffer; int i; name = buffer; for (i = 0; i < NCH(n); i += 2) { char *s = STR(CHILD(n, i)); if (p + strlen(s) > buffer + (sizeof buffer) - 2) { com_error(c, PyExc_MemoryError, "dotted_name too long"); name = NULL; break; } if (p != buffer) *p++ = '.'; strcpy(p, s); p = strchr(p, '\0'); } } else { REQ(n, NAME); name = STR(n); } com_addop_name(c, op, name); } static PyObject * parsenumber(struct compiling *co, char *s) { char *end; long x; double dx; #ifndef WITHOUT_COMPLEX Py_complex c; int imflag; #endif errno = 0; end = s + strlen(s) - 1; #ifndef WITHOUT_COMPLEX imflag = *end == 'j' || *end == 'J'; #endif if (*end == 'l' || *end == 'L') return PyLong_FromString(s, (char **)0, 0); if (s[0] == '0') x = (long) PyOS_strtoul(s, &end, 0); else x = PyOS_strtol(s, &end, 0); if (*end == '\0') { if (errno != 0) { com_error(co, PyExc_OverflowError, "integer literal too large"); return NULL; } return PyInt_FromLong(x); } /* XXX Huge floats may silently fail */ #ifndef WITHOUT_COMPLEX if (imflag) { c.real = 0.; PyFPE_START_PROTECT("atof", return 0) c.imag = atof(s); PyFPE_END_PROTECT(c) return PyComplex_FromCComplex(c); } else #endif { PyFPE_START_PROTECT("atof", return 0) dx = atof(s); PyFPE_END_PROTECT(dx) return PyFloat_FromDouble(dx); } } static PyObject * parsestr(char *s) { PyObject *v; size_t len; char *buf; char *p; char *end; int c; int first = *s; int quote = first; int rawmode = 0; int unicode = 0; if (isalpha(quote) || quote == '_') { if (quote == 'u' || quote == 'U') { quote = *++s; unicode = 1; } if (quote == 'r' || quote == 'R') { quote = *++s; rawmode = 1; } } if (quote != '\'' && quote != '\"') { PyErr_BadInternalCall(); return NULL; } s++; len = strlen(s); if (len > INT_MAX) { PyErr_SetString(PyExc_OverflowError, "string to parse is too long"); return NULL; } if (s[--len] != quote) { PyErr_BadInternalCall(); return NULL; } if (len >= 4 && s[0] == quote && s[1] == quote) { s += 2; len -= 2; if (s[--len] != quote || s[--len] != quote) { PyErr_BadInternalCall(); return NULL; } } if (unicode || Py_UnicodeFlag) { if (rawmode) return PyUnicode_DecodeRawUnicodeEscape( s, len, NULL); else return PyUnicode_DecodeUnicodeEscape( s, len, NULL); } if (rawmode || strchr(s, '\\') == NULL) return PyString_FromStringAndSize(s, len); v = PyString_FromStringAndSize((char *)NULL, len); if (v == NULL) return NULL; p = buf = PyString_AsString(v); end = s + len; while (s < end) { if (*s != '\\') { *p++ = *s++; continue; } s++; switch (*s++) { /* XXX This assumes ASCII! */ case '\n': break; case '\\': *p++ = '\\'; break; case '\'': *p++ = '\''; break; case '\"': *p++ = '\"'; break; case 'b': *p++ = '\b'; break; case 'f': *p++ = '\014'; break; /* FF */ case 't': *p++ = '\t'; break; case 'n': *p++ = '\n'; break; case 'r': *p++ = '\r'; break; case 'v': *p++ = '\013'; break; /* VT */ case 'a': *p++ = '\007'; break; /* BEL, not classic C */ case '0': case '1': case '2': case '3': case '4': case '5': case '6': case '7': c = s[-1] - '0'; if ('0' <= *s && *s <= '7') { c = (c<<3) + *s++ - '0'; if ('0' <= *s && *s <= '7') c = (c<<3) + *s++ - '0'; } *p++ = c; break; case 'x': if (isxdigit(Py_CHARMASK(s[0])) && isxdigit(Py_CHARMASK(s[1]))) { unsigned int x = 0; c = Py_CHARMASK(*s); s++; if (isdigit(c)) x = c - '0'; else if (islower(c)) x = 10 + c - 'a'; else x = 10 + c - 'A'; x = x << 4; c = Py_CHARMASK(*s); s++; if (isdigit(c)) x += c - '0'; else if (islower(c)) x += 10 + c - 'a'; else x += 10 + c - 'A'; *p++ = x; break; } PyErr_SetString(PyExc_ValueError, "invalid \\x escape"); Py_DECREF(v); return NULL; default: *p++ = '\\'; *p++ = s[-1]; break; } } _PyString_Resize(&v, (int)(p - buf)); return v; } static PyObject * parsestrplus(node *n) { PyObject *v; int i; REQ(CHILD(n, 0), STRING); if ((v = parsestr(STR(CHILD(n, 0)))) != NULL) { /* String literal concatenation */ for (i = 1; i < NCH(n); i++) { PyObject *s; s = parsestr(STR(CHILD(n, i))); if (s == NULL) goto onError; if (PyString_Check(v) && PyString_Check(s)) { PyString_ConcatAndDel(&v, s); if (v == NULL) goto onError; } else { PyObject *temp; temp = PyUnicode_Concat(v, s); Py_DECREF(s); if (temp == NULL) goto onError; Py_DECREF(v); v = temp; } } } return v; onError: Py_XDECREF(v); return NULL; } static void com_list_for(struct compiling *c, node *n, node *e, char *t) { PyObject *v; int anchor = 0; int save_begin = c->c_begin; /* list_iter: for v in expr [list_iter] */ com_node(c, CHILD(n, 3)); /* expr */ v = PyInt_FromLong(0L); if (v == NULL) c->c_errors++; com_addoparg(c, LOAD_CONST, com_addconst(c, v)); com_push(c, 1); Py_XDECREF(v); c->c_begin = c->c_nexti; com_addoparg(c, SET_LINENO, n->n_lineno); com_addfwref(c, FOR_LOOP, &anchor); com_push(c, 1); com_assign(c, CHILD(n, 1), OP_ASSIGN, NULL); c->c_loops++; com_list_iter(c, n, e, t); c->c_loops--; com_addoparg(c, JUMP_ABSOLUTE, c->c_begin); c->c_begin = save_begin; com_backpatch(c, anchor); com_pop(c, 2); /* FOR_LOOP has popped these */ } static void com_list_if(struct compiling *c, node *n, node *e, char *t) { int anchor = 0; int a = 0; /* list_iter: 'if' test [list_iter] */ com_addoparg(c, SET_LINENO, n->n_lineno); com_node(c, CHILD(n, 1)); com_addfwref(c, JUMP_IF_FALSE, &a); com_addbyte(c, POP_TOP); com_pop(c, 1); com_list_iter(c, n, e, t); com_addfwref(c, JUMP_FORWARD, &anchor); com_backpatch(c, a); /* We jump here with an extra entry which we now pop */ com_addbyte(c, POP_TOP); com_backpatch(c, anchor); } static void com_list_iter(struct compiling *c, node *p, /* parent of list_iter node */ node *e, /* element expression node */ char *t /* name of result list temp local */) { /* list_iter is the last child in a listmaker, list_for, or list_if */ node *n = CHILD(p, NCH(p)-1); if (TYPE(n) == list_iter) { n = CHILD(n, 0); switch (TYPE(n)) { case list_for: com_list_for(c, n, e, t); break; case list_if: com_list_if(c, n, e, t); break; default: com_error(c, PyExc_SystemError, "invalid list_iter node type"); } } else { com_addop_varname(c, VAR_LOAD, t); com_push(c, 1); com_node(c, e); com_addoparg(c, CALL_FUNCTION, 1); com_addbyte(c, POP_TOP); com_pop(c, 2); } } static void com_list_comprehension(struct compiling *c, node *n) { /* listmaker: test list_for */ char tmpname[12]; sprintf(tmpname, "[%d]", ++c->c_tmpname); com_addoparg(c, BUILD_LIST, 0); com_addbyte(c, DUP_TOP); /* leave the result on the stack */ com_push(c, 2); com_addop_name(c, LOAD_ATTR, "append"); com_addop_varname(c, VAR_STORE, tmpname); com_pop(c, 1); com_list_for(c, CHILD(n, 1), CHILD(n, 0), tmpname); com_addop_varname(c, VAR_DELETE, tmpname); --c->c_tmpname; } static void com_listmaker(struct compiling *c, node *n) { /* listmaker: test ( list_for | (',' test)* [','] ) */ if (NCH(n) > 1 && TYPE(CHILD(n, 1)) == list_for) com_list_comprehension(c, n); else { int len = 0; int i; for (i = 0; i < NCH(n); i += 2, len++) com_node(c, CHILD(n, i)); com_addoparg(c, BUILD_LIST, len); com_pop(c, len-1); } } static void com_dictmaker(struct compiling *c, node *n) { int i; /* dictmaker: test ':' test (',' test ':' value)* [','] */ for (i = 0; i+2 < NCH(n); i += 4) { /* We must arrange things just right for STORE_SUBSCR. It wants the stack to look like (value) (dict) (key) */ com_addbyte(c, DUP_TOP); com_push(c, 1); com_node(c, CHILD(n, i+2)); /* value */ com_addbyte(c, ROT_TWO); com_node(c, CHILD(n, i)); /* key */ com_addbyte(c, STORE_SUBSCR); com_pop(c, 3); } } static void com_atom(struct compiling *c, node *n) { node *ch; PyObject *v; int i; REQ(n, atom); ch = CHILD(n, 0); switch (TYPE(ch)) { case LPAR: if (TYPE(CHILD(n, 1)) == RPAR) { com_addoparg(c, BUILD_TUPLE, 0); com_push(c, 1); } else com_node(c, CHILD(n, 1)); break; case LSQB: /* '[' [listmaker] ']' */ if (TYPE(CHILD(n, 1)) == RSQB) { com_addoparg(c, BUILD_LIST, 0); com_push(c, 1); } else com_listmaker(c, CHILD(n, 1)); break; case LBRACE: /* '{' [dictmaker] '}' */ com_addoparg(c, BUILD_MAP, 0); com_push(c, 1); if (TYPE(CHILD(n, 1)) == dictmaker) com_dictmaker(c, CHILD(n, 1)); break; case BACKQUOTE: com_node(c, CHILD(n, 1)); com_addbyte(c, UNARY_CONVERT); break; case NUMBER: if ((v = parsenumber(c, STR(ch))) == NULL) { i = 255; } else { i = com_addconst(c, v); Py_DECREF(v); } com_addoparg(c, LOAD_CONST, i); com_push(c, 1); break; case STRING: v = parsestrplus(n); if (v == NULL) { c->c_errors++; i = 255; } else { i = com_addconst(c, v); Py_DECREF(v); } com_addoparg(c, LOAD_CONST, i); com_push(c, 1); break; case NAME: com_addop_varname(c, VAR_LOAD, STR(ch)); com_push(c, 1); break; default: /* XXX fprintf(stderr, "node type %d\n", TYPE(ch)); */ com_error(c, PyExc_SystemError, "com_atom: unexpected node type"); } } static void com_slice(struct compiling *c, node *n, int op) { if (NCH(n) == 1) { com_addbyte(c, op); } else if (NCH(n) == 2) { if (TYPE(CHILD(n, 0)) != COLON) { com_node(c, CHILD(n, 0)); com_addbyte(c, op+1); } else { com_node(c, CHILD(n, 1)); com_addbyte(c, op+2); } com_pop(c, 1); } else { com_node(c, CHILD(n, 0)); com_node(c, CHILD(n, 2)); com_addbyte(c, op+3); com_pop(c, 2); } } static void com_augassign_slice(struct compiling *c, node *n, int opcode, node *augn) { if (NCH(n) == 1) { com_addbyte(c, DUP_TOP); com_push(c, 1); com_addbyte(c, SLICE); com_node(c, augn); com_addbyte(c, opcode); com_pop(c, 1); com_addbyte(c, ROT_TWO); com_addbyte(c, STORE_SLICE); com_pop(c, 2); } else if (NCH(n) == 2 && TYPE(CHILD(n, 0)) != COLON) { com_node(c, CHILD(n, 0)); com_addoparg(c, DUP_TOPX, 2); com_push(c, 2); com_addbyte(c, SLICE+1); com_pop(c, 1); com_node(c, augn); com_addbyte(c, opcode); com_pop(c, 1); com_addbyte(c, ROT_THREE); com_addbyte(c, STORE_SLICE+1); com_pop(c, 3); } else if (NCH(n) == 2) { com_node(c, CHILD(n, 1)); com_addoparg(c, DUP_TOPX, 2); com_push(c, 2); com_addbyte(c, SLICE+2); com_pop(c, 1); com_node(c, augn); com_addbyte(c, opcode); com_pop(c, 1); com_addbyte(c, ROT_THREE); com_addbyte(c, STORE_SLICE+2); com_pop(c, 3); } else { com_node(c, CHILD(n, 0)); com_node(c, CHILD(n, 2)); com_addoparg(c, DUP_TOPX, 3); com_push(c, 3); com_addbyte(c, SLICE+3); com_pop(c, 2); com_node(c, augn); com_addbyte(c, opcode); com_pop(c, 1); com_addbyte(c, ROT_FOUR); com_addbyte(c, STORE_SLICE+3); com_pop(c, 4); } } static void com_argument(struct compiling *c, node *n, PyObject **pkeywords) { node *m; REQ(n, argument); /* [test '='] test; really [keyword '='] test */ if (NCH(n) == 1) { if (*pkeywords != NULL) { com_error(c, PyExc_SyntaxError, "non-keyword arg after keyword arg"); } else { com_node(c, CHILD(n, 0)); } return; } m = n; do { m = CHILD(m, 0); } while (NCH(m) == 1); if (TYPE(m) != NAME) { com_error(c, PyExc_SyntaxError, "keyword can't be an expression"); } else { PyObject *v = PyString_InternFromString(STR(m)); if (v != NULL && *pkeywords == NULL) *pkeywords = PyDict_New(); if (v == NULL || *pkeywords == NULL) c->c_errors++; else { if (PyDict_GetItem(*pkeywords, v) != NULL) com_error(c, PyExc_SyntaxError, "duplicate keyword argument"); else if (PyDict_SetItem(*pkeywords, v, v) != 0) c->c_errors++; com_addoparg(c, LOAD_CONST, com_addconst(c, v)); com_push(c, 1); Py_DECREF(v); } } com_node(c, CHILD(n, 2)); } static void com_call_function(struct compiling *c, node *n) { if (TYPE(n) == RPAR) { com_addoparg(c, CALL_FUNCTION, 0); } else { PyObject *keywords = NULL; int i, na, nk; int lineno = n->n_lineno; int star_flag = 0; int starstar_flag = 0; int opcode; REQ(n, arglist); na = 0; nk = 0; for (i = 0; i < NCH(n); i += 2) { node *ch = CHILD(n, i); if (TYPE(ch) == STAR || TYPE(ch) == DOUBLESTAR) break; if (ch->n_lineno != lineno) { lineno = ch->n_lineno; com_addoparg(c, SET_LINENO, lineno); } com_argument(c, ch, &keywords); if (keywords == NULL) na++; else nk++; } Py_XDECREF(keywords); while (i < NCH(n)) { node *tok = CHILD(n, i); node *ch = CHILD(n, i+1); i += 3; switch (TYPE(tok)) { case STAR: star_flag = 1; break; case DOUBLESTAR: starstar_flag = 1; break; } com_node(c, ch); } if (na > 255 || nk > 255) { com_error(c, PyExc_SyntaxError, "more than 255 arguments"); } if (star_flag || starstar_flag) opcode = CALL_FUNCTION_VAR - 1 + star_flag + (starstar_flag << 1); else opcode = CALL_FUNCTION; com_addoparg(c, opcode, na | (nk << 8)); com_pop(c, na + 2*nk + star_flag + starstar_flag); } } static void com_select_member(struct compiling *c, node *n) { com_addopname(c, LOAD_ATTR, n); } static void com_sliceobj(struct compiling *c, node *n) { int i=0; int ns=2; /* number of slice arguments */ node *ch; /* first argument */ if (TYPE(CHILD(n,i)) == COLON) { com_addoparg(c, LOAD_CONST, com_addconst(c, Py_None)); com_push(c, 1); i++; } else { com_node(c, CHILD(n,i)); i++; REQ(CHILD(n,i),COLON); i++; } /* second argument */ if (i < NCH(n) && TYPE(CHILD(n,i)) == test) { com_node(c, CHILD(n,i)); i++; } else { com_addoparg(c, LOAD_CONST, com_addconst(c, Py_None)); com_push(c, 1); } /* remaining arguments */ for (; i < NCH(n); i++) { ns++; ch=CHILD(n,i); REQ(ch, sliceop); if (NCH(ch) == 1) { /* right argument of ':' missing */ com_addoparg(c, LOAD_CONST, com_addconst(c, Py_None)); com_push(c, 1); } else com_node(c, CHILD(ch,1)); } com_addoparg(c, BUILD_SLICE, ns); com_pop(c, 1 + (ns == 3)); } static void com_subscript(struct compiling *c, node *n) { node *ch; REQ(n, subscript); ch = CHILD(n,0); /* check for rubber index */ if (TYPE(ch) == DOT && TYPE(CHILD(n,1)) == DOT) { com_addoparg(c, LOAD_CONST, com_addconst(c, Py_Ellipsis)); com_push(c, 1); } else { /* check for slice */ if ((TYPE(ch) == COLON || NCH(n) > 1)) com_sliceobj(c, n); else { REQ(ch, test); com_node(c, ch); } } } static void com_subscriptlist(struct compiling *c, node *n, int assigning, node *augn) { int i, op; REQ(n, subscriptlist); /* Check to make backward compatible slice behavior for '[i:j]' */ if (NCH(n) == 1) { node *sub = CHILD(n, 0); /* subscript */ /* 'Basic' slice, should have exactly one colon. */ if ((TYPE(CHILD(sub, 0)) == COLON || (NCH(sub) > 1 && TYPE(CHILD(sub, 1)) == COLON)) && (TYPE(CHILD(sub,NCH(sub)-1)) != sliceop)) { switch (assigning) { case OP_DELETE: op = DELETE_SLICE; break; case OP_ASSIGN: op = STORE_SLICE; break; case OP_APPLY: op = SLICE; break; default: com_augassign_slice(c, sub, assigning, augn); return; } com_slice(c, sub, op); if (op == STORE_SLICE) com_pop(c, 2); else if (op == DELETE_SLICE) com_pop(c, 1); return; } } /* Else normal subscriptlist. Compile each subscript. */ for (i = 0; i < NCH(n); i += 2) com_subscript(c, CHILD(n, i)); /* Put multiple subscripts into a tuple */ if (NCH(n) > 1) { i = (NCH(n)+1) / 2; com_addoparg(c, BUILD_TUPLE, i); com_pop(c, i-1); } switch (assigning) { case OP_DELETE: op = DELETE_SUBSCR; i = 2; break; default: case OP_ASSIGN: op = STORE_SUBSCR; i = 3; break; case OP_APPLY: op = BINARY_SUBSCR; i = 1; break; } if (assigning > OP_APPLY) { com_addoparg(c, DUP_TOPX, 2); com_push(c, 2); com_addbyte(c, BINARY_SUBSCR); com_pop(c, 1); com_node(c, augn); com_addbyte(c, assigning); com_pop(c, 1); com_addbyte(c, ROT_THREE); } com_addbyte(c, op); com_pop(c, i); } static void com_apply_trailer(struct compiling *c, node *n) { REQ(n, trailer); switch (TYPE(CHILD(n, 0))) { case LPAR: com_call_function(c, CHILD(n, 1)); break; case DOT: com_select_member(c, CHILD(n, 1)); break; case LSQB: com_subscriptlist(c, CHILD(n, 1), OP_APPLY, NULL); break; default: com_error(c, PyExc_SystemError, "com_apply_trailer: unknown trailer type"); } } static void com_power(struct compiling *c, node *n) { int i; REQ(n, power); com_atom(c, CHILD(n, 0)); for (i = 1; i < NCH(n); i++) { if (TYPE(CHILD(n, i)) == DOUBLESTAR) { com_factor(c, CHILD(n, i+1)); com_addbyte(c, BINARY_POWER); com_pop(c, 1); break; } else com_apply_trailer(c, CHILD(n, i)); } } static void com_factor(struct compiling *c, node *n) { REQ(n, factor); if (TYPE(CHILD(n, 0)) == PLUS) { com_factor(c, CHILD(n, 1)); com_addbyte(c, UNARY_POSITIVE); } else if (TYPE(CHILD(n, 0)) == MINUS) { com_factor(c, CHILD(n, 1)); com_addbyte(c, UNARY_NEGATIVE); } else if (TYPE(CHILD(n, 0)) == TILDE) { com_factor(c, CHILD(n, 1)); com_addbyte(c, UNARY_INVERT); } else { com_power(c, CHILD(n, 0)); } } static void com_term(struct compiling *c, node *n) { int i; int op; REQ(n, term); com_factor(c, CHILD(n, 0)); for (i = 2; i < NCH(n); i += 2) { com_factor(c, CHILD(n, i)); switch (TYPE(CHILD(n, i-1))) { case STAR: op = BINARY_MULTIPLY; break; case SLASH: op = BINARY_DIVIDE; break; case PERCENT: op = BINARY_MODULO; break; default: com_error(c, PyExc_SystemError, "com_term: operator not *, / or %"); op = 255; } com_addbyte(c, op); com_pop(c, 1); } } static void com_arith_expr(struct compiling *c, node *n) { int i; int op; REQ(n, arith_expr); com_term(c, CHILD(n, 0)); for (i = 2; i < NCH(n); i += 2) { com_term(c, CHILD(n, i)); switch (TYPE(CHILD(n, i-1))) { case PLUS: op = BINARY_ADD; break; case MINUS: op = BINARY_SUBTRACT; break; default: com_error(c, PyExc_SystemError, "com_arith_expr: operator not + or -"); op = 255; } com_addbyte(c, op); com_pop(c, 1); } } static void com_shift_expr(struct compiling *c, node *n) { int i; int op; REQ(n, shift_expr); com_arith_expr(c, CHILD(n, 0)); for (i = 2; i < NCH(n); i += 2) { com_arith_expr(c, CHILD(n, i)); switch (TYPE(CHILD(n, i-1))) { case LEFTSHIFT: op = BINARY_LSHIFT; break; case RIGHTSHIFT: op = BINARY_RSHIFT; break; default: com_error(c, PyExc_SystemError, "com_shift_expr: operator not << or >>"); op = 255; } com_addbyte(c, op); com_pop(c, 1); } } static void com_and_expr(struct compiling *c, node *n) { int i; int op; REQ(n, and_expr); com_shift_expr(c, CHILD(n, 0)); for (i = 2; i < NCH(n); i += 2) { com_shift_expr(c, CHILD(n, i)); if (TYPE(CHILD(n, i-1)) == AMPER) { op = BINARY_AND; } else { com_error(c, PyExc_SystemError, "com_and_expr: operator not &"); op = 255; } com_addbyte(c, op); com_pop(c, 1); } } static void com_xor_expr(struct compiling *c, node *n) { int i; int op; REQ(n, xor_expr); com_and_expr(c, CHILD(n, 0)); for (i = 2; i < NCH(n); i += 2) { com_and_expr(c, CHILD(n, i)); if (TYPE(CHILD(n, i-1)) == CIRCUMFLEX) { op = BINARY_XOR; } else { com_error(c, PyExc_SystemError, "com_xor_expr: operator not ^"); op = 255; } com_addbyte(c, op); com_pop(c, 1); } } static void com_expr(struct compiling *c, node *n) { int i; int op; REQ(n, expr); com_xor_expr(c, CHILD(n, 0)); for (i = 2; i < NCH(n); i += 2) { com_xor_expr(c, CHILD(n, i)); if (TYPE(CHILD(n, i-1)) == VBAR) { op = BINARY_OR; } else { com_error(c, PyExc_SystemError, "com_expr: expr operator not |"); op = 255; } com_addbyte(c, op); com_pop(c, 1); } } static enum cmp_op cmp_type(node *n) { REQ(n, comp_op); /* comp_op: '<' | '>' | '=' | '>=' | '<=' | '<>' | '!=' | '==' | 'in' | 'not' 'in' | 'is' | 'is' not' */ if (NCH(n) == 1) { n = CHILD(n, 0); switch (TYPE(n)) { case LESS: return LT; case GREATER: return GT; case EQEQUAL: /* == */ case EQUAL: return EQ; case LESSEQUAL: return LE; case GREATEREQUAL: return GE; case NOTEQUAL: return NE; /* <> or != */ case NAME: if (strcmp(STR(n), "in") == 0) return IN; if (strcmp(STR(n), "is") == 0) return IS; } } else if (NCH(n) == 2) { switch (TYPE(CHILD(n, 0))) { case NAME: if (strcmp(STR(CHILD(n, 1)), "in") == 0) return NOT_IN; if (strcmp(STR(CHILD(n, 0)), "is") == 0) return IS_NOT; } } return BAD; } static void com_comparison(struct compiling *c, node *n) { int i; enum cmp_op op; int anchor; REQ(n, comparison); /* comparison: expr (comp_op expr)* */ com_expr(c, CHILD(n, 0)); if (NCH(n) == 1) return; /**************************************************************** The following code is generated for all but the last comparison in a chain: label: on stack: opcode: jump to: a a, b DUP_TOP a, b, b ROT_THREE b, a, b COMPARE_OP b, 0-or-1 JUMP_IF_FALSE L1 b, 1 POP_TOP b We are now ready to repeat this sequence for the next comparison in the chain. For the last we generate: b b, c COMPARE_OP 0-or-1 If there were any jumps to L1 (i.e., there was more than one comparison), we generate: 0-or-1 JUMP_FORWARD L2 L1: b, 0 ROT_TWO 0, b POP_TOP 0 L2: 0-or-1 ****************************************************************/ anchor = 0; for (i = 2; i < NCH(n); i += 2) { com_expr(c, CHILD(n, i)); if (i+2 < NCH(n)) { com_addbyte(c, DUP_TOP); com_push(c, 1); com_addbyte(c, ROT_THREE); } op = cmp_type(CHILD(n, i-1)); if (op == BAD) { com_error(c, PyExc_SystemError, "com_comparison: unknown comparison op"); } com_addoparg(c, COMPARE_OP, op); com_pop(c, 1); if (i+2 < NCH(n)) { com_addfwref(c, JUMP_IF_FALSE, &anchor); com_addbyte(c, POP_TOP); com_pop(c, 1); } } if (anchor) { int anchor2 = 0; com_addfwref(c, JUMP_FORWARD, &anchor2); com_backpatch(c, anchor); com_addbyte(c, ROT_TWO); com_addbyte(c, POP_TOP); com_backpatch(c, anchor2); } } static void com_not_test(struct compiling *c, node *n) { REQ(n, not_test); /* 'not' not_test | comparison */ if (NCH(n) == 1) { com_comparison(c, CHILD(n, 0)); } else { com_not_test(c, CHILD(n, 1)); com_addbyte(c, UNARY_NOT); } } static void com_and_test(struct compiling *c, node *n) { int i; int anchor; REQ(n, and_test); /* not_test ('and' not_test)* */ anchor = 0; i = 0; for (;;) { com_not_test(c, CHILD(n, i)); if ((i += 2) >= NCH(n)) break; com_addfwref(c, JUMP_IF_FALSE, &anchor); com_addbyte(c, POP_TOP); com_pop(c, 1); } if (anchor) com_backpatch(c, anchor); } static void com_test(struct compiling *c, node *n) { REQ(n, test); /* and_test ('or' and_test)* | lambdef */ if (NCH(n) == 1 && TYPE(CHILD(n, 0)) == lambdef) { PyObject *v; int i; int ndefs = com_argdefs(c, CHILD(n, 0)); symtable_enter_scope(c->c_symtable, "lambda", lambdef); v = (PyObject *) icompile(CHILD(n, 0), c); symtable_exit_scope(c->c_symtable); if (v == NULL) { c->c_errors++; i = 255; } else { i = com_addconst(c, v); Py_DECREF(v); } com_addoparg(c, LOAD_CONST, i); com_push(c, 1); com_addoparg(c, MAKE_FUNCTION, ndefs); com_pop(c, ndefs); } else { int anchor = 0; int i = 0; for (;;) { com_and_test(c, CHILD(n, i)); if ((i += 2) >= NCH(n)) break; com_addfwref(c, JUMP_IF_TRUE, &anchor); com_addbyte(c, POP_TOP); com_pop(c, 1); } if (anchor) com_backpatch(c, anchor); } } static void com_list(struct compiling *c, node *n, int toplevel) { /* exprlist: expr (',' expr)* [',']; likewise for testlist */ if (NCH(n) == 1 && !toplevel) { com_node(c, CHILD(n, 0)); } else { int i; int len; len = (NCH(n) + 1) / 2; for (i = 0; i < NCH(n); i += 2) com_node(c, CHILD(n, i)); com_addoparg(c, BUILD_TUPLE, len); com_pop(c, len-1); } } /* Begin of assignment compilation */ static void com_augassign_attr(struct compiling *c, node *n, int opcode, node *augn) { com_addbyte(c, DUP_TOP); com_push(c, 1); com_addopname(c, LOAD_ATTR, n); com_node(c, augn); com_addbyte(c, opcode); com_pop(c, 1); com_addbyte(c, ROT_TWO); com_addopname(c, STORE_ATTR, n); com_pop(c, 2); } static void com_assign_attr(struct compiling *c, node *n, int assigning) { com_addopname(c, assigning ? STORE_ATTR : DELETE_ATTR, n); com_pop(c, assigning ? 2 : 1); } static void com_assign_trailer(struct compiling *c, node *n, int assigning, node *augn) { REQ(n, trailer); switch (TYPE(CHILD(n, 0))) { case LPAR: /* '(' [exprlist] ')' */ com_error(c, PyExc_SyntaxError, "can't assign to function call"); break; case DOT: /* '.' NAME */ if (assigning > OP_APPLY) com_augassign_attr(c, CHILD(n, 1), assigning, augn); else com_assign_attr(c, CHILD(n, 1), assigning); break; case LSQB: /* '[' subscriptlist ']' */ com_subscriptlist(c, CHILD(n, 1), assigning, augn); break; default: com_error(c, PyExc_SystemError, "unknown trailer type"); } } static void com_assign_sequence(struct compiling *c, node *n, int assigning) { int i; if (TYPE(n) != testlist && TYPE(n) != listmaker) REQ(n, exprlist); if (assigning) { i = (NCH(n)+1)/2; com_addoparg(c, UNPACK_SEQUENCE, i); com_push(c, i-1); } for (i = 0; i < NCH(n); i += 2) com_assign(c, CHILD(n, i), assigning, NULL); } static void com_augassign_name(struct compiling *c, node *n, int opcode, node *augn) { REQ(n, NAME); com_addop_varname(c, VAR_LOAD, STR(n)); com_push(c, 1); com_node(c, augn); com_addbyte(c, opcode); com_pop(c, 1); com_assign_name(c, n, OP_ASSIGN); } static void com_assign_name(struct compiling *c, node *n, int assigning) { REQ(n, NAME); com_addop_varname(c, assigning ? VAR_STORE : VAR_DELETE, STR(n)); if (assigning) com_pop(c, 1); } static void com_assign(struct compiling *c, node *n, int assigning, node *augn) { /* Loop to avoid trivial recursion */ for (;;) { switch (TYPE(n)) { case exprlist: case testlist: if (NCH(n) > 1) { if (assigning > OP_APPLY) { com_error(c, PyExc_SyntaxError, "augmented assign to tuple not possible"); return; } com_assign_sequence(c, n, assigning); return; } n = CHILD(n, 0); break; case test: case and_test: case not_test: case comparison: case expr: case xor_expr: case and_expr: case shift_expr: case arith_expr: case term: case factor: if (NCH(n) > 1) { com_error(c, PyExc_SyntaxError, "can't assign to operator"); return; } n = CHILD(n, 0); break; case power: /* atom trailer* ('**' power)* */ /* ('+'|'-'|'~') factor | atom trailer* */ if (TYPE(CHILD(n, 0)) != atom) { com_error(c, PyExc_SyntaxError, "can't assign to operator"); return; } if (NCH(n) > 1) { /* trailer or exponent present */ int i; com_node(c, CHILD(n, 0)); for (i = 1; i+1 < NCH(n); i++) { if (TYPE(CHILD(n, i)) == DOUBLESTAR) { com_error(c, PyExc_SyntaxError, "can't assign to operator"); return; } com_apply_trailer(c, CHILD(n, i)); } /* NB i is still alive */ com_assign_trailer(c, CHILD(n, i), assigning, augn); return; } n = CHILD(n, 0); break; case atom: switch (TYPE(CHILD(n, 0))) { case LPAR: n = CHILD(n, 1); if (TYPE(n) == RPAR) { /* XXX Should allow () = () ??? */ com_error(c, PyExc_SyntaxError, "can't assign to ()"); return; } if (assigning > OP_APPLY) { com_error(c, PyExc_SyntaxError, "augmented assign to tuple not possible"); return; } break; case LSQB: n = CHILD(n, 1); if (TYPE(n) == RSQB) { com_error(c, PyExc_SyntaxError, "can't assign to []"); return; } if (assigning > OP_APPLY) { com_error(c, PyExc_SyntaxError, "augmented assign to list not possible"); return; } if (NCH(n) > 1 && TYPE(CHILD(n, 1)) == list_for) { com_error(c, PyExc_SyntaxError, "can't assign to list comprehension"); return; } com_assign_sequence(c, n, assigning); return; case NAME: if (assigning > OP_APPLY) com_augassign_name(c, CHILD(n, 0), assigning, augn); else com_assign_name(c, CHILD(n, 0), assigning); return; default: com_error(c, PyExc_SyntaxError, "can't assign to literal"); return; } break; case lambdef: com_error(c, PyExc_SyntaxError, "can't assign to lambda"); return; default: /* XXX fprintf(stderr, "node type %d\n", TYPE(n)); */ com_error(c, PyExc_SystemError, "com_assign: bad node"); return; } } } static void com_augassign(struct compiling *c, node *n) { int opcode; switch (STR(CHILD(CHILD(n, 1), 0))[0]) { case '+': opcode = INPLACE_ADD; break; case '-': opcode = INPLACE_SUBTRACT; break; case '/': opcode = INPLACE_DIVIDE; break; case '%': opcode = INPLACE_MODULO; break; case '<': opcode = INPLACE_LSHIFT; break; case '>': opcode = INPLACE_RSHIFT; break; case '&': opcode = INPLACE_AND; break; case '^': opcode = INPLACE_XOR; break; case '|': opcode = INPLACE_OR; break; case '*': if (STR(CHILD(CHILD(n, 1), 0))[1] == '*') opcode = INPLACE_POWER; else opcode = INPLACE_MULTIPLY; break; default: com_error(c, PyExc_SystemError, "com_augassign: bad operator"); return; } com_assign(c, CHILD(n, 0), opcode, CHILD(n, 2)); } static void com_expr_stmt(struct compiling *c, node *n) { REQ(n, expr_stmt); /* testlist (('=' testlist)* | augassign testlist) */ /* Forget it if we have just a doc string here */ if (!c->c_interactive && NCH(n) == 1 && get_rawdocstring(n) != NULL) return; if (NCH(n) == 1) { com_node(c, CHILD(n, NCH(n)-1)); if (c->c_interactive) com_addbyte(c, PRINT_EXPR); else com_addbyte(c, POP_TOP); com_pop(c, 1); } else if (TYPE(CHILD(n,1)) == augassign) com_augassign(c, n); else { int i; com_node(c, CHILD(n, NCH(n)-1)); for (i = 0; i < NCH(n)-2; i+=2) { if (i+2 < NCH(n)-2) { com_addbyte(c, DUP_TOP); com_push(c, 1); } com_assign(c, CHILD(n, i), OP_ASSIGN, NULL); } } } static void com_assert_stmt(struct compiling *c, node *n) { int a = 0, b = 0; int i; REQ(n, assert_stmt); /* 'assert' test [',' test] */ /* Generate code like for if __debug__: if not : raise AssertionError [, ] where is the second test, if present. */ /* XXX should __debug__ and AssertionError get inserted into the symbol table? they don't follow the normal rules because they are always loaded as globals */ if (Py_OptimizeFlag) return; com_addop_name(c, LOAD_GLOBAL, "__debug__"); com_push(c, 1); com_addfwref(c, JUMP_IF_FALSE, &a); com_addbyte(c, POP_TOP); com_pop(c, 1); com_node(c, CHILD(n, 1)); com_addfwref(c, JUMP_IF_TRUE, &b); com_addbyte(c, POP_TOP); com_pop(c, 1); /* Raise that exception! */ com_addop_name(c, LOAD_GLOBAL, "AssertionError"); com_push(c, 1); i = NCH(n)/2; /* Either 2 or 4 */ if (i > 1) com_node(c, CHILD(n, 3)); com_addoparg(c, RAISE_VARARGS, i); com_pop(c, i); /* The interpreter does not fall through */ /* All jumps converge here */ com_backpatch(c, a); com_backpatch(c, b); com_addbyte(c, POP_TOP); } static void com_print_stmt(struct compiling *c, node *n) { int i = 1; node* stream = NULL; REQ(n, print_stmt); /* 'print' (test ',')* [test] */ /* are we using the extended print form? */ if (NCH(n) >= 2 && TYPE(CHILD(n, 1)) == RIGHTSHIFT) { stream = CHILD(n, 2); com_node(c, stream); /* stack: [...] => [... stream] */ com_push(c, 1); if (NCH(n) > 3 && TYPE(CHILD(n, 3)) == COMMA) i = 4; else i = 3; } for (; i < NCH(n); i += 2) { if (stream != NULL) { com_addbyte(c, DUP_TOP); /* stack: [stream] => [stream stream] */ com_push(c, 1); com_node(c, CHILD(n, i)); /* stack: [stream stream] => [stream stream obj] */ com_addbyte(c, ROT_TWO); /* stack: [stream stream obj] => [stream obj stream] */ com_addbyte(c, PRINT_ITEM_TO); /* stack: [stream obj stream] => [stream] */ com_pop(c, 2); } else { com_node(c, CHILD(n, i)); /* stack: [...] => [... obj] */ com_addbyte(c, PRINT_ITEM); com_pop(c, 1); } } /* XXX Alternatively, LOAD_CONST '\n' and then PRINT_ITEM */ if (TYPE(CHILD(n, NCH(n)-1)) == COMMA) { if (stream != NULL) { /* must pop the extra stream object off the stack */ com_addbyte(c, POP_TOP); /* stack: [... stream] => [...] */ com_pop(c, 1); } } else { if (stream != NULL) { /* this consumes the last stream object on stack */ com_addbyte(c, PRINT_NEWLINE_TO); /* stack: [... stream] => [...] */ com_pop(c, 1); } else com_addbyte(c, PRINT_NEWLINE); } } static void com_return_stmt(struct compiling *c, node *n) { REQ(n, return_stmt); /* 'return' [testlist] */ if (!c->c_infunction) { com_error(c, PyExc_SyntaxError, "'return' outside function"); } if (NCH(n) < 2) { com_addoparg(c, LOAD_CONST, com_addconst(c, Py_None)); com_push(c, 1); } else com_node(c, CHILD(n, 1)); com_addbyte(c, RETURN_VALUE); com_pop(c, 1); } static void com_raise_stmt(struct compiling *c, node *n) { int i; REQ(n, raise_stmt); /* 'raise' [test [',' test [',' test]]] */ if (NCH(n) > 1) { com_node(c, CHILD(n, 1)); if (NCH(n) > 3) { com_node(c, CHILD(n, 3)); if (NCH(n) > 5) com_node(c, CHILD(n, 5)); } } i = NCH(n)/2; com_addoparg(c, RAISE_VARARGS, i); com_pop(c, i); } static void com_from_import(struct compiling *c, node *n) { com_addopname(c, IMPORT_FROM, CHILD(n, 0)); com_push(c, 1); if (NCH(n) > 1) { if (strcmp(STR(CHILD(n, 1)), "as") != 0) { com_error(c, PyExc_SyntaxError, "invalid syntax"); return; } com_addop_varname(c, VAR_STORE, STR(CHILD(n, 2))); } else com_addop_varname(c, VAR_STORE, STR(CHILD(n, 0))); com_pop(c, 1); } static void com_import_stmt(struct compiling *c, node *n) { int i; REQ(n, import_stmt); /* 'import' dotted_name (',' dotted_name)* | 'from' dotted_name 'import' ('*' | NAME (',' NAME)*) */ if (STR(CHILD(n, 0))[0] == 'f') { PyObject *tup; /* 'from' dotted_name 'import' ... */ REQ(CHILD(n, 1), dotted_name); if (TYPE(CHILD(n, 3)) == STAR) { tup = Py_BuildValue("(s)", "*"); } else { tup = PyTuple_New((NCH(n) - 2)/2); for (i = 3; i < NCH(n); i += 2) { PyTuple_SET_ITEM(tup, (i-3)/2, PyString_FromString(STR( CHILD(CHILD(n, i), 0)))); } } com_addoparg(c, LOAD_CONST, com_addconst(c, tup)); Py_DECREF(tup); com_push(c, 1); com_addopname(c, IMPORT_NAME, CHILD(n, 1)); if (TYPE(CHILD(n, 3)) == STAR) com_addbyte(c, IMPORT_STAR); else { for (i = 3; i < NCH(n); i += 2) com_from_import(c, CHILD(n, i)); com_addbyte(c, POP_TOP); } com_pop(c, 1); } else { /* 'import' ... */ for (i = 1; i < NCH(n); i += 2) { node *subn = CHILD(n, i); REQ(subn, dotted_as_name); com_addoparg(c, LOAD_CONST, com_addconst(c, Py_None)); com_push(c, 1); com_addopname(c, IMPORT_NAME, CHILD(subn, 0)); if (NCH(subn) > 1) { int j; if (strcmp(STR(CHILD(subn, 1)), "as") != 0) { com_error(c, PyExc_SyntaxError, "invalid syntax"); return; } for (j=2 ; j < NCH(CHILD(subn, 0)); j += 2) com_addopname(c, LOAD_ATTR, CHILD(CHILD(subn, 0), j)); com_addop_varname(c, VAR_STORE, STR(CHILD(subn, 2))); } else com_addop_varname(c, VAR_STORE, STR(CHILD(CHILD(subn, 0), 0))); com_pop(c, 1); } } } static void com_exec_stmt(struct compiling *c, node *n) { REQ(n, exec_stmt); /* exec_stmt: 'exec' expr ['in' expr [',' expr]] */ com_node(c, CHILD(n, 1)); if (NCH(n) >= 4) com_node(c, CHILD(n, 3)); else { com_addoparg(c, LOAD_CONST, com_addconst(c, Py_None)); com_push(c, 1); } if (NCH(n) >= 6) com_node(c, CHILD(n, 5)); else { com_addbyte(c, DUP_TOP); com_push(c, 1); } com_addbyte(c, EXEC_STMT); com_pop(c, 3); } static int is_constant_false(struct compiling *c, node *n) { PyObject *v; int i; /* argument c will be NULL when called from symtable_node() */ /* Label to avoid tail recursion */ next: switch (TYPE(n)) { case suite: if (NCH(n) == 1) { n = CHILD(n, 0); goto next; } /* Fall through */ case file_input: for (i = 0; i < NCH(n); i++) { node *ch = CHILD(n, i); if (TYPE(ch) == stmt) { n = ch; goto next; } } break; case stmt: case simple_stmt: case small_stmt: n = CHILD(n, 0); goto next; case expr_stmt: case testlist: case test: case and_test: case not_test: case comparison: case expr: case xor_expr: case and_expr: case shift_expr: case arith_expr: case term: case factor: case power: case atom: if (NCH(n) == 1) { n = CHILD(n, 0); goto next; } break; case NAME: if (Py_OptimizeFlag && strcmp(STR(n), "__debug__") == 0) return 1; break; case NUMBER: v = parsenumber(c, STR(n)); if (v == NULL) { PyErr_Clear(); break; } i = PyObject_IsTrue(v); Py_DECREF(v); return i == 0; case STRING: v = parsestr(STR(n)); if (v == NULL) { PyErr_Clear(); break; } i = PyObject_IsTrue(v); Py_DECREF(v); return i == 0; } return 0; } static void com_if_stmt(struct compiling *c, node *n) { int i; int anchor = 0; REQ(n, if_stmt); /*'if' test ':' suite ('elif' test ':' suite)* ['else' ':' suite] */ for (i = 0; i+3 < NCH(n); i+=4) { int a = 0; node *ch = CHILD(n, i+1); if (is_constant_false(c, ch)) continue; if (i > 0) com_addoparg(c, SET_LINENO, ch->n_lineno); com_node(c, ch); com_addfwref(c, JUMP_IF_FALSE, &a); com_addbyte(c, POP_TOP); com_pop(c, 1); com_node(c, CHILD(n, i+3)); com_addfwref(c, JUMP_FORWARD, &anchor); com_backpatch(c, a); /* We jump here with an extra entry which we now pop */ com_addbyte(c, POP_TOP); } if (i+2 < NCH(n)) com_node(c, CHILD(n, i+2)); if (anchor) com_backpatch(c, anchor); } static void com_while_stmt(struct compiling *c, node *n) { int break_anchor = 0; int anchor = 0; int save_begin = c->c_begin; REQ(n, while_stmt); /* 'while' test ':' suite ['else' ':' suite] */ com_addfwref(c, SETUP_LOOP, &break_anchor); block_push(c, SETUP_LOOP); c->c_begin = c->c_nexti; com_addoparg(c, SET_LINENO, n->n_lineno); com_node(c, CHILD(n, 1)); com_addfwref(c, JUMP_IF_FALSE, &anchor); com_addbyte(c, POP_TOP); com_pop(c, 1); c->c_loops++; com_node(c, CHILD(n, 3)); c->c_loops--; com_addoparg(c, JUMP_ABSOLUTE, c->c_begin); c->c_begin = save_begin; com_backpatch(c, anchor); /* We jump here with one entry more on the stack */ com_addbyte(c, POP_TOP); com_addbyte(c, POP_BLOCK); block_pop(c, SETUP_LOOP); if (NCH(n) > 4) com_node(c, CHILD(n, 6)); com_backpatch(c, break_anchor); } static void com_for_stmt(struct compiling *c, node *n) { PyObject *v; int break_anchor = 0; int anchor = 0; int save_begin = c->c_begin; REQ(n, for_stmt); /* 'for' exprlist 'in' exprlist ':' suite ['else' ':' suite] */ com_addfwref(c, SETUP_LOOP, &break_anchor); block_push(c, SETUP_LOOP); com_node(c, CHILD(n, 3)); v = PyInt_FromLong(0L); if (v == NULL) c->c_errors++; com_addoparg(c, LOAD_CONST, com_addconst(c, v)); com_push(c, 1); Py_XDECREF(v); c->c_begin = c->c_nexti; com_addoparg(c, SET_LINENO, n->n_lineno); com_addfwref(c, FOR_LOOP, &anchor); com_push(c, 1); com_assign(c, CHILD(n, 1), OP_ASSIGN, NULL); c->c_loops++; com_node(c, CHILD(n, 5)); c->c_loops--; com_addoparg(c, JUMP_ABSOLUTE, c->c_begin); c->c_begin = save_begin; com_backpatch(c, anchor); com_pop(c, 2); /* FOR_LOOP has popped these */ com_addbyte(c, POP_BLOCK); block_pop(c, SETUP_LOOP); if (NCH(n) > 8) com_node(c, CHILD(n, 8)); com_backpatch(c, break_anchor); } /* Code generated for "try: S finally: Sf" is as follows: SETUP_FINALLY L POP_BLOCK LOAD_CONST L: END_FINALLY The special instructions use the block stack. Each block stack entry contains the instruction that created it (here SETUP_FINALLY), the level of the value stack at the time the block stack entry was created, and a label (here L). SETUP_FINALLY: Pushes the current value stack level and the label onto the block stack. POP_BLOCK: Pops en entry from the block stack, and pops the value stack until its level is the same as indicated on the block stack. (The label is ignored.) END_FINALLY: Pops a variable number of entries from the *value* stack and re-raises the exception they specify. The number of entries popped depends on the (pseudo) exception type. The block stack is unwound when an exception is raised: when a SETUP_FINALLY entry is found, the exception is pushed onto the value stack (and the exception condition is cleared), and the interpreter jumps to the label gotten from the block stack. Code generated for "try: S except E1, V1: S1 except E2, V2: S2 ...": (The contents of the value stack is shown in [], with the top at the right; 'tb' is trace-back info, 'val' the exception's associated value, and 'exc' the exception.) Value stack Label Instruction Argument [] SETUP_EXCEPT L1 [] [] POP_BLOCK [] JUMP_FORWARD L0 [tb, val, exc] L1: DUP ) [tb, val, exc, exc] ) [tb, val, exc, exc, E1] COMPARE_OP EXC_MATCH ) only if E1 [tb, val, exc, 1-or-0] JUMP_IF_FALSE L2 ) [tb, val, exc, 1] POP ) [tb, val, exc] POP [tb, val] (or POP if no V1) [tb] POP [] JUMP_FORWARD L0 [tb, val, exc, 0] L2: POP [tb, val, exc] DUP .............................etc....................... [tb, val, exc, 0] Ln+1: POP [tb, val, exc] END_FINALLY # re-raise exception [] L0: Of course, parts are not generated if Vi or Ei is not present. */ static void com_try_except(struct compiling *c, node *n) { int except_anchor = 0; int end_anchor = 0; int else_anchor = 0; int i; node *ch; com_addfwref(c, SETUP_EXCEPT, &except_anchor); block_push(c, SETUP_EXCEPT); com_node(c, CHILD(n, 2)); com_addbyte(c, POP_BLOCK); block_pop(c, SETUP_EXCEPT); com_addfwref(c, JUMP_FORWARD, &else_anchor); com_backpatch(c, except_anchor); for (i = 3; i < NCH(n) && TYPE(ch = CHILD(n, i)) == except_clause; i += 3) { /* except_clause: 'except' [expr [',' var]] */ if (except_anchor == 0) { com_error(c, PyExc_SyntaxError, "default 'except:' must be last"); break; } except_anchor = 0; com_push(c, 3); /* tb, val, exc pushed by exception */ com_addoparg(c, SET_LINENO, ch->n_lineno); if (NCH(ch) > 1) { com_addbyte(c, DUP_TOP); com_push(c, 1); com_node(c, CHILD(ch, 1)); com_addoparg(c, COMPARE_OP, EXC_MATCH); com_pop(c, 1); com_addfwref(c, JUMP_IF_FALSE, &except_anchor); com_addbyte(c, POP_TOP); com_pop(c, 1); } com_addbyte(c, POP_TOP); com_pop(c, 1); if (NCH(ch) > 3) com_assign(c, CHILD(ch, 3), OP_ASSIGN, NULL); else { com_addbyte(c, POP_TOP); com_pop(c, 1); } com_addbyte(c, POP_TOP); com_pop(c, 1); com_node(c, CHILD(n, i+2)); com_addfwref(c, JUMP_FORWARD, &end_anchor); if (except_anchor) { com_backpatch(c, except_anchor); /* We come in with [tb, val, exc, 0] on the stack; one pop and it's the same as expected at the start of the loop */ com_addbyte(c, POP_TOP); } } /* We actually come in here with [tb, val, exc] but the END_FINALLY will zap those and jump around. The c_stacklevel does not reflect them so we need not pop anything. */ com_addbyte(c, END_FINALLY); com_backpatch(c, else_anchor); if (i < NCH(n)) com_node(c, CHILD(n, i+2)); com_backpatch(c, end_anchor); } static void com_try_finally(struct compiling *c, node *n) { int finally_anchor = 0; node *ch; com_addfwref(c, SETUP_FINALLY, &finally_anchor); block_push(c, SETUP_FINALLY); com_node(c, CHILD(n, 2)); com_addbyte(c, POP_BLOCK); block_pop(c, SETUP_FINALLY); block_push(c, END_FINALLY); com_addoparg(c, LOAD_CONST, com_addconst(c, Py_None)); /* While the generated code pushes only one item, the try-finally handling can enter here with up to three items. OK, here are the details: 3 for an exception, 2 for RETURN, 1 for BREAK. */ com_push(c, 3); com_backpatch(c, finally_anchor); ch = CHILD(n, NCH(n)-1); com_addoparg(c, SET_LINENO, ch->n_lineno); com_node(c, ch); com_addbyte(c, END_FINALLY); block_pop(c, END_FINALLY); com_pop(c, 3); /* Matches the com_push above */ } static void com_try_stmt(struct compiling *c, node *n) { REQ(n, try_stmt); /* 'try' ':' suite (except_clause ':' suite)+ ['else' ':' suite] | 'try' ':' suite 'finally' ':' suite */ if (TYPE(CHILD(n, 3)) != except_clause) com_try_finally(c, n); else com_try_except(c, n); } static node * get_rawdocstring(node *n) { int i; /* Label to avoid tail recursion */ next: switch (TYPE(n)) { case suite: if (NCH(n) == 1) { n = CHILD(n, 0); goto next; } /* Fall through */ case file_input: for (i = 0; i < NCH(n); i++) { node *ch = CHILD(n, i); if (TYPE(ch) == stmt) { n = ch; goto next; } } break; case stmt: case simple_stmt: case small_stmt: n = CHILD(n, 0); goto next; case expr_stmt: case testlist: case test: case and_test: case not_test: case comparison: case expr: case xor_expr: case and_expr: case shift_expr: case arith_expr: case term: case factor: case power: if (NCH(n) == 1) { n = CHILD(n, 0); goto next; } break; case atom: if (TYPE(CHILD(n, 0)) == STRING) return n; break; } return NULL; } static PyObject * get_docstring(node *n) { /* Don't generate doc-strings if run with -OO */ if (Py_OptimizeFlag > 1) return NULL; n = get_rawdocstring(n); if (n == NULL) return NULL; return parsestrplus(n); } static void com_suite(struct compiling *c, node *n) { REQ(n, suite); /* simple_stmt | NEWLINE INDENT NEWLINE* (stmt NEWLINE*)+ DEDENT */ if (NCH(n) == 1) { com_node(c, CHILD(n, 0)); } else { int i; for (i = 0; i < NCH(n); i++) { node *ch = CHILD(n, i); if (TYPE(ch) == stmt) com_node(c, ch); } } } /* ARGSUSED */ static void com_continue_stmt(struct compiling *c, node *n) { int i = c->c_nblocks; if (i-- > 0 && c->c_block[i] == SETUP_LOOP) { com_addoparg(c, JUMP_ABSOLUTE, c->c_begin); } else if (i <= 0) { /* at the outer level */ com_error(c, PyExc_SyntaxError, "'continue' not properly in loop"); } else { int j; for (j = 0; j <= i; ++j) { if (c->c_block[j] == SETUP_LOOP) break; } if (j < i+1) { /* there is a loop, but something interferes */ for (++j; j <= i; ++j) { if (c->c_block[i] == SETUP_EXCEPT || c->c_block[i] == SETUP_FINALLY) { com_error(c, PyExc_SyntaxError, "'continue' not supported inside 'try' clause"); return; } } } com_error(c, PyExc_SyntaxError, "'continue' not properly in loop"); } /* XXX Could allow it inside a 'finally' clause XXX if we could pop the exception still on the stack */ } static int com_argdefs(struct compiling *c, node *n) { int i, nch, nargs, ndefs; if (TYPE(n) == lambdef) { /* lambdef: 'lambda' [varargslist] ':' test */ n = CHILD(n, 1); } else { REQ(n, funcdef); /* funcdef: 'def' NAME parameters ... */ n = CHILD(n, 2); REQ(n, parameters); /* parameters: '(' [varargslist] ')' */ n = CHILD(n, 1); } if (TYPE(n) != varargslist) return 0; /* varargslist: (fpdef ['=' test] ',')* '*' ....... | fpdef ['=' test] (',' fpdef ['=' test])* [','] */ nch = NCH(n); nargs = 0; ndefs = 0; for (i = 0; i < nch; i++) { int t; if (TYPE(CHILD(n, i)) == STAR || TYPE(CHILD(n, i)) == DOUBLESTAR) break; nargs++; i++; if (i >= nch) t = RPAR; /* Anything except EQUAL or COMMA */ else t = TYPE(CHILD(n, i)); if (t == EQUAL) { i++; ndefs++; com_node(c, CHILD(n, i)); i++; if (i >= nch) break; t = TYPE(CHILD(n, i)); } else { /* Treat "(a=1, b)" as an error */ if (ndefs) com_error(c, PyExc_SyntaxError, "non-default argument follows default argument"); } if (t != COMMA) break; } return ndefs; } static void com_funcdef(struct compiling *c, node *n) { PyObject *v; int ndefs; REQ(n, funcdef); /* funcdef: 'def' NAME parameters ':' suite */ ndefs = com_argdefs(c, n); symtable_enter_scope(c->c_symtable, STR(CHILD(n, 1)), TYPE(n)); v = (PyObject *)icompile(n, c); symtable_exit_scope(c->c_symtable); if (v == NULL) c->c_errors++; else { int i = com_addconst(c, v); com_addoparg(c, LOAD_CONST, i); com_push(c, 1); com_addoparg(c, MAKE_FUNCTION, ndefs); com_pop(c, ndefs); com_addop_varname(c, VAR_STORE, STR(CHILD(n, 1))); com_pop(c, 1); Py_DECREF(v); } } static void com_bases(struct compiling *c, node *n) { int i; REQ(n, testlist); /* testlist: test (',' test)* [','] */ for (i = 0; i < NCH(n); i += 2) com_node(c, CHILD(n, i)); i = (NCH(n)+1) / 2; com_addoparg(c, BUILD_TUPLE, i); com_pop(c, i-1); } static void com_classdef(struct compiling *c, node *n) { int i; PyObject *v; char *name; REQ(n, classdef); /* classdef: class NAME ['(' testlist ')'] ':' suite */ if ((v = PyString_InternFromString(STR(CHILD(n, 1)))) == NULL) { c->c_errors++; return; } /* Push the class name on the stack */ i = com_addconst(c, v); com_addoparg(c, LOAD_CONST, i); com_push(c, 1); Py_DECREF(v); /* Push the tuple of base classes on the stack */ if (TYPE(CHILD(n, 2)) != LPAR) { com_addoparg(c, BUILD_TUPLE, 0); com_push(c, 1); } else com_bases(c, CHILD(n, 3)); name = STR(CHILD(n, 1)); symtable_enter_scope(c->c_symtable, name, TYPE(n)); v = (PyObject *)icompile(n, c); symtable_exit_scope(c->c_symtable); if (v == NULL) c->c_errors++; else { i = com_addconst(c, v); com_addoparg(c, LOAD_CONST, i); com_push(c, 1); com_addoparg(c, MAKE_FUNCTION, 0); com_addoparg(c, CALL_FUNCTION, 0); com_addbyte(c, BUILD_CLASS); com_pop(c, 2); com_addop_varname(c, VAR_STORE, STR(CHILD(n, 1))); Py_DECREF(v); } } static void com_node(struct compiling *c, node *n) { loop: switch (TYPE(n)) { /* Definition nodes */ case funcdef: com_funcdef(c, n); break; case classdef: com_classdef(c, n); break; /* Trivial parse tree nodes */ case stmt: case small_stmt: case flow_stmt: n = CHILD(n, 0); goto loop; case simple_stmt: /* small_stmt (';' small_stmt)* [';'] NEWLINE */ com_addoparg(c, SET_LINENO, n->n_lineno); { int i; for (i = 0; i < NCH(n)-1; i += 2) com_node(c, CHILD(n, i)); } break; case compound_stmt: com_addoparg(c, SET_LINENO, n->n_lineno); n = CHILD(n, 0); goto loop; /* Statement nodes */ case expr_stmt: com_expr_stmt(c, n); break; case print_stmt: com_print_stmt(c, n); break; case del_stmt: /* 'del' exprlist */ com_assign(c, CHILD(n, 1), OP_DELETE, NULL); break; case pass_stmt: break; case break_stmt: if (c->c_loops == 0) { com_error(c, PyExc_SyntaxError, "'break' outside loop"); } com_addbyte(c, BREAK_LOOP); break; case continue_stmt: com_continue_stmt(c, n); break; case return_stmt: com_return_stmt(c, n); break; case raise_stmt: com_raise_stmt(c, n); break; case import_stmt: com_import_stmt(c, n); break; case global_stmt: break; case exec_stmt: com_exec_stmt(c, n); break; case assert_stmt: com_assert_stmt(c, n); break; case if_stmt: com_if_stmt(c, n); break; case while_stmt: com_while_stmt(c, n); break; case for_stmt: com_for_stmt(c, n); break; case try_stmt: com_try_stmt(c, n); break; case suite: com_suite(c, n); break; /* Expression nodes */ case testlist: com_list(c, n, 0); break; case test: com_test(c, n); break; case and_test: com_and_test(c, n); break; case not_test: com_not_test(c, n); break; case comparison: com_comparison(c, n); break; case exprlist: com_list(c, n, 0); break; case expr: com_expr(c, n); break; case xor_expr: com_xor_expr(c, n); break; case and_expr: com_and_expr(c, n); break; case shift_expr: com_shift_expr(c, n); break; case arith_expr: com_arith_expr(c, n); break; case term: com_term(c, n); break; case factor: com_factor(c, n); break; case power: com_power(c, n); break; case atom: com_atom(c, n); break; default: /* XXX fprintf(stderr, "node type %d\n", TYPE(n)); */ com_error(c, PyExc_SystemError, "com_node: unexpected node type"); } } static void com_fplist(struct compiling *, node *); static void com_fpdef(struct compiling *c, node *n) { REQ(n, fpdef); /* fpdef: NAME | '(' fplist ')' */ if (TYPE(CHILD(n, 0)) == LPAR) com_fplist(c, CHILD(n, 1)); else { com_addop_varname(c, VAR_STORE, STR(CHILD(n, 0))); com_pop(c, 1); } } static void com_fplist(struct compiling *c, node *n) { REQ(n, fplist); /* fplist: fpdef (',' fpdef)* [','] */ if (NCH(n) == 1) { com_fpdef(c, CHILD(n, 0)); } else { int i = (NCH(n)+1)/2; com_addoparg(c, UNPACK_SEQUENCE, i); com_push(c, i-1); for (i = 0; i < NCH(n); i += 2) com_fpdef(c, CHILD(n, i)); } } /* XXX This function could probably be made simpler, because it doesn't do anything except generate code for complex arguments. */ static void com_arglist(struct compiling *c, node *n) { int nch, i; int complex = 0; char nbuf[10]; REQ(n, varargslist); /* varargslist: (fpdef ['=' test] ',')* (fpdef ['=' test] | '*' .....) */ nch = NCH(n); /* Enter all arguments in table of locals */ for (i = 0; i < nch; i++) { node *ch = CHILD(n, i); node *fp; char *name; if (TYPE(ch) == STAR || TYPE(ch) == DOUBLESTAR) break; REQ(ch, fpdef); /* fpdef: NAME | '(' fplist ')' */ fp = CHILD(ch, 0); if (TYPE(fp) == NAME) name = STR(fp); else { name = nbuf; sprintf(nbuf, ".%d", i); complex = 1; } /* all name updates handled by symtable */ if (++i >= nch) break; ch = CHILD(n, i); if (TYPE(ch) == EQUAL) i += 2; else REQ(ch, COMMA); } /* Handle *arguments */ if (i < nch) { node *ch; ch = CHILD(n, i); if (TYPE(ch) != DOUBLESTAR) { REQ(ch, STAR); ch = CHILD(n, i+1); if (TYPE(ch) == NAME) { i += 3; } } } /* Handle **keywords */ if (i < nch) { node *ch; ch = CHILD(n, i); if (TYPE(ch) != DOUBLESTAR) { REQ(ch, STAR); ch = CHILD(n, i+1); REQ(ch, STAR); ch = CHILD(n, i+2); } else ch = CHILD(n, i+1); REQ(ch, NAME); } if (complex) { /* Generate code for complex arguments only after having counted the simple arguments */ int ilocal = 0; for (i = 0; i < nch; i++) { node *ch = CHILD(n, i); node *fp; if (TYPE(ch) == STAR || TYPE(ch) == DOUBLESTAR) break; REQ(ch, fpdef); /* fpdef: NAME | '(' fplist ')' */ fp = CHILD(ch, 0); if (TYPE(fp) != NAME) { com_addoparg(c, LOAD_FAST, ilocal); com_push(c, 1); com_fpdef(c, ch); } ilocal++; if (++i >= nch) break; ch = CHILD(n, i); if (TYPE(ch) == EQUAL) i += 2; else REQ(ch, COMMA); } } } static void com_file_input(struct compiling *c, node *n) { int i; PyObject *doc; REQ(n, file_input); /* (NEWLINE | stmt)* ENDMARKER */ doc = get_docstring(n); if (doc != NULL) { int i = com_addconst(c, doc); Py_DECREF(doc); com_addoparg(c, LOAD_CONST, i); com_push(c, 1); com_addop_name(c, STORE_NAME, "__doc__"); com_pop(c, 1); } for (i = 0; i < NCH(n); i++) { node *ch = CHILD(n, i); if (TYPE(ch) != ENDMARKER && TYPE(ch) != NEWLINE) com_node(c, ch); } } /* Top-level compile-node interface */ static void compile_funcdef(struct compiling *c, node *n) { PyObject *doc; node *ch; REQ(n, funcdef); /* funcdef: 'def' NAME parameters ':' suite */ c->c_name = STR(CHILD(n, 1)); doc = get_docstring(CHILD(n, 4)); if (doc != NULL) { (void) com_addconst(c, doc); Py_DECREF(doc); } else (void) com_addconst(c, Py_None); /* No docstring */ ch = CHILD(n, 2); /* parameters: '(' [varargslist] ')' */ ch = CHILD(ch, 1); /* ')' | varargslist */ if (TYPE(ch) == varargslist) com_arglist(c, ch); c->c_infunction = 1; com_node(c, CHILD(n, 4)); c->c_infunction = 0; com_addoparg(c, LOAD_CONST, com_addconst(c, Py_None)); com_push(c, 1); com_addbyte(c, RETURN_VALUE); com_pop(c, 1); } static void compile_lambdef(struct compiling *c, node *n) { node *ch; REQ(n, lambdef); /* lambdef: 'lambda' [varargslist] ':' test */ c->c_name = ""; ch = CHILD(n, 1); (void) com_addconst(c, Py_None); /* No docstring */ if (TYPE(ch) == varargslist) { com_arglist(c, ch); ch = CHILD(n, 3); } else ch = CHILD(n, 2); com_node(c, ch); com_addbyte(c, RETURN_VALUE); com_pop(c, 1); } static void compile_classdef(struct compiling *c, node *n) { node *ch; PyObject *doc; REQ(n, classdef); /* classdef: 'class' NAME ['(' testlist ')'] ':' suite */ c->c_name = STR(CHILD(n, 1)); c->c_private = c->c_name; ch = CHILD(n, NCH(n)-1); /* The suite */ doc = get_docstring(ch); if (doc != NULL) { int i = com_addconst(c, doc); Py_DECREF(doc); com_addoparg(c, LOAD_CONST, i); com_push(c, 1); com_addop_name(c, STORE_NAME, "__doc__"); com_pop(c, 1); } else (void) com_addconst(c, Py_None); com_node(c, ch); com_addbyte(c, LOAD_LOCALS); com_push(c, 1); com_addbyte(c, RETURN_VALUE); com_pop(c, 1); } static void compile_node(struct compiling *c, node *n) { com_addoparg(c, SET_LINENO, n->n_lineno); switch (TYPE(n)) { case single_input: /* One interactive command */ /* NEWLINE | simple_stmt | compound_stmt NEWLINE */ c->c_interactive++; n = CHILD(n, 0); if (TYPE(n) != NEWLINE) com_node(c, n); com_addoparg(c, LOAD_CONST, com_addconst(c, Py_None)); com_push(c, 1); com_addbyte(c, RETURN_VALUE); com_pop(c, 1); c->c_interactive--; break; case file_input: /* A whole file, or built-in function exec() */ com_file_input(c, n); com_addoparg(c, LOAD_CONST, com_addconst(c, Py_None)); com_push(c, 1); com_addbyte(c, RETURN_VALUE); com_pop(c, 1); break; case eval_input: /* Built-in function input() */ com_node(c, CHILD(n, 0)); com_addbyte(c, RETURN_VALUE); com_pop(c, 1); break; case lambdef: /* anonymous function definition */ compile_lambdef(c, n); break; case funcdef: /* A function definition */ compile_funcdef(c, n); break; case classdef: /* A class definition */ compile_classdef(c, n); break; default: /* XXX fprintf(stderr, "node type %d\n", TYPE(n)); */ com_error(c, PyExc_SystemError, "compile_node: unexpected node type"); } } PyCodeObject * PyNode_Compile(node *n, char *filename) { return jcompile(n, filename, NULL); } static PyCodeObject * icompile(node *n, struct compiling *base) { return jcompile(n, base->c_filename, base); } static PyCodeObject * jcompile(node *n, char *filename, struct compiling *base) { struct compiling sc; PyCodeObject *co; if (!com_init(&sc, filename)) return NULL; if (base) { sc.c_private = base->c_private; sc.c_symtable = base->c_symtable; } else { sc.c_private = NULL; if (symtable_build(&sc, n) < 0) { com_free(&sc); return NULL; } } co = NULL; if (symtable_load_symbols(&sc) < 0) goto exit; compile_node(&sc, n); com_done(&sc); if (sc.c_errors == 0) { PyObject *consts, *names, *varnames, *filename, *name; consts = PyList_AsTuple(sc.c_consts); names = PyList_AsTuple(sc.c_names); varnames = PyList_AsTuple(sc.c_varnames); filename = PyString_InternFromString(sc.c_filename); name = PyString_InternFromString(sc.c_name); if (!PyErr_Occurred()) co = PyCode_New(sc.c_argcount, sc.c_nlocals, sc.c_maxstacklevel, sc.c_flags, sc.c_code, consts, names, varnames, filename, name, sc.c_firstlineno, sc.c_lnotab); Py_XDECREF(consts); Py_XDECREF(names); Py_XDECREF(varnames); Py_XDECREF(filename); Py_XDECREF(name); } else if (!PyErr_Occurred()) { /* This could happen if someone called PyErr_Clear() after an error was reported above. That's not supposed to happen, but I just plugged one case and I'm not sure there can't be others. In that case, raise SystemError so that at least it gets reported instead dumping core. */ PyErr_SetString(PyExc_SystemError, "lost syntax error"); } exit: if (base == NULL) symtable_free(sc.c_symtable); com_free(&sc); return co; } int PyCode_Addr2Line(PyCodeObject *co, int addrq) { int size = PyString_Size(co->co_lnotab) / 2; unsigned char *p = (unsigned char*)PyString_AsString(co->co_lnotab); int line = co->co_firstlineno; int addr = 0; while (--size >= 0) { addr += *p++; if (addr > addrq) break; line += *p++; } return line; } static int is_local(struct compiling *c, char *name) { if (PyDict_GetItemString(c->c_locals, name) != NULL) return 1; else return 0; } static int is_global(struct compiling *c, char *name) { PyObject *v; v = PyDict_GetItemString(c->c_globals, name); if (v == NULL) return 0; else if (v == Py_None) return IMPLICIT_GLOBAL; else return EXPLICIT_GLOBAL; } static int symtable_build(struct compiling *c, node *n) { if ((c->c_symtable = symtable_init()) == NULL) return -1; if (symtable_enter_scope(c->c_symtable, GLOBAL, TYPE(n)) < 0) return -1; symtable_node(c->c_symtable, n); /* reset for second pass */ c->c_symtable->st_scopes = 1; return 0; } static int symtable_load_symbols(struct compiling *c) { static PyObject *global = NULL; PyObject *name, *v, *varnames; int i, info, count, pos; struct symtable *st = c->c_symtable; varnames = PyDict_GetItem(st->st_varnames, st->st_cur_id); if (varnames == NULL) { varnames = PyList_New(0); if (varnames == NULL) return -1; } else Py_INCREF(varnames); c->c_varnames = varnames; count = PyList_GET_SIZE(varnames); c->c_argcount = count; for (i = 0; i < count; ++i) { v = PyInt_FromLong(i); if (PyDict_SetItem(c->c_locals, PyList_GET_ITEM(varnames, i), v) < 0) return -1; } /* XXX The cases below define the rules for whether a name is local or global. The logic could probably be clearer. */ pos = 0; while (PyDict_Next(st->st_cur, &pos, &name, &v)) { info = PyInt_AS_LONG(v); if (info & DEF_STAR) { c->c_argcount--; c->c_flags |= CO_VARARGS; } else if (info & DEF_DOUBLESTAR) { c->c_argcount--; c->c_flags |= CO_VARKEYWORDS; } else if (info & DEF_INTUPLE) c->c_argcount--; else if (info & DEF_GLOBAL) { if ((info & DEF_PARAM) && (PyString_AS_STRING(name)[0] != '.')){ char buf[500]; sprintf(buf, "name '%.400s' is local and global", PyString_AS_STRING(name)); com_error(c, PyExc_SyntaxError, buf); return -1; } if (global == NULL) { global = PyInt_FromLong(1); if (global == NULL) { return -1; } } if (PyDict_SetItem(c->c_globals, name, global) < 0) return -1; } else if ((info & USE) && !(info & (DEF_LOCAL | DEF_PARAM))) { if (PyDict_SetItem(c->c_globals, name, Py_None) < 0) return -1; } else if ((info & DEF_LOCAL) && !(info & DEF_PARAM)) { v = PyInt_FromLong(count++); if (PyDict_SetItem(c->c_locals, name, v) < 0) return -1; if (st->st_cur_type != TYPE_CLASS) if (PyList_Append(c->c_varnames, name) < 0) return -1; } } if (st->st_cur_type == TYPE_FUNCTION) c->c_nlocals = count; if (st->st_cur_type != TYPE_MODULE) c->c_flags |= CO_NEWLOCALS; if ((st->st_cur_type == TYPE_FUNCTION) && (PyDict_GetItemString(st->st_cur, NOOPT) == NULL)) c->c_flags |= CO_OPTIMIZED; return 0; } static struct symtable * symtable_init() { struct symtable *st; PyObject *d; st = (struct symtable *)PyMem_Malloc(sizeof(struct symtable)); if (st == NULL) return NULL; if ((st->st_namespaces = PyList_New(0)) == NULL) goto fail; if ((st->st_types = PyList_New(0)) == NULL) goto fail; if ((st->st_symbols = PyDict_New()) == NULL) goto fail; if ((st->st_varnames = PyDict_New()) == NULL) goto fail; if ((d = PyDict_New()) == NULL) goto fail; if (PyDict_SetItemString(st->st_symbols, GLOBAL, d) < 0) goto fail; st->st_global = d; st->st_cur = NULL; st->st_cur_id = NULL; st->st_cur_type = 0; st->st_scopes = 0; st->st_errors = 0; st->st_tmpname = 0; st->st_private = NULL; return st; fail: symtable_free(st); return NULL; } static void symtable_free(struct symtable *st) { Py_XDECREF(st->st_symbols); Py_XDECREF(st->st_varnames); Py_XDECREF(st->st_namespaces); Py_XDECREF(st->st_types); Py_XDECREF(st->st_cur_id); PyMem_Free((void *)st); } /* XXX name isn't used ... */ static int symtable_enter_scope(struct symtable *st, char *name, int type) { PyObject *o; o = PyInt_FromLong(st->st_scopes++); if (o == NULL) return -1; if (PyList_Append(st->st_namespaces, o) < 0) return -1; switch (type) { case funcdef: case lambdef: st->st_cur_type = TYPE_FUNCTION; break; case classdef: st->st_cur_type = TYPE_CLASS; break; case single_input: case eval_input: case file_input: st->st_cur_type = TYPE_MODULE; break; default: fprintf(stderr, "invalid symtable scope: %d\n", type); } o = PyInt_FromLong(st->st_cur_type); if (o == NULL) return -1; if (PyList_Append(st->st_types, o) < 0) return -1; return symtable_update_cur(st); } static int symtable_exit_scope(struct symtable *st) { PyObject *o; int end; end = PyList_GET_SIZE(st->st_namespaces) - 1; if (PySequence_DelItem(st->st_namespaces, end) < 0) return -1; if (PySequence_DelItem(st->st_types, end) < 0) return -1; o = PyList_GET_ITEM(st->st_types, end - 1); st->st_cur_type = PyInt_AS_LONG(o); return symtable_update_cur(st); } static int symtable_update_cur(struct symtable *st) { PyObject *s, *d, *l; int end; end = PyList_GET_SIZE(st->st_namespaces) - 1; s = PyList_GET_ITEM(st->st_namespaces, end); st->st_cur_id = s; d = PyDict_GetItem(st->st_symbols, s); if (d == NULL) { if ((d = PyDict_New()) == NULL) return -1; if (PyObject_SetItem(st->st_symbols, s, d) < 0) { Py_DECREF(d); return -1; } if (st->st_cur_type == TYPE_FUNCTION) { if ((l = PyList_New(0)) == NULL) return -1; if (PyDict_SetItem(st->st_varnames, s, l) < 0) return -1; } } st->st_cur = d; return 0; } static int symtable_mangle(struct symtable *st, char *name, char *buffer, size_t maxlen) { return mangle(st->st_private, name, buffer, maxlen); } static int symtable_add_def(struct symtable *st, char *name, int scope) { PyObject *s, *o; int val; char buffer[MANGLE_LEN]; if (symtable_mangle(st, name, buffer, sizeof(buffer))) name = buffer; if ((s = PyString_InternFromString(name)) == NULL) return -1; if ((o = PyDict_GetItem(st->st_cur, s))) { val = PyInt_AS_LONG(o); if ((scope & DEF_PARAM) && (val & DEF_PARAM)) { PyErr_Format(PyExc_SyntaxError, "duplicate argument '%s' in function definition", name); return -1; } val |= scope; } else val = scope; o = PyInt_FromLong(val); if (PyDict_SetItem(st->st_cur, s, o) < 0) { Py_DECREF(o); return -1; } Py_DECREF(o); if (scope & DEF_PARAM) { PyObject *l = PyDict_GetItem(st->st_varnames, st->st_cur_id); if (l == NULL) return -1; if (PyList_Append(l, s) < 0) return -1; } else if (scope & DEF_GLOBAL) { if ((o = PyDict_GetItem(st->st_global, s))) { val = PyInt_AS_LONG(o); val |= scope; } else val = scope; o = PyInt_FromLong(val); if (PyDict_SetItem(st->st_global, s, o) < 0) { Py_DECREF(o); return -1; } Py_DECREF(o); } return 0; } static int symtable_add_use(struct symtable *st, char *name) { PyObject *s, *o; int val; char buffer[MANGLE_LEN]; if (symtable_mangle(st, name, buffer, sizeof(buffer))) name = buffer; /* fprintf(stderr, "add_use(%s)\n", name); */ if ((s = PyString_InternFromString(name)) == NULL) return -1; if ((o = PyDict_GetItem(st->st_cur, s))) { val = PyInt_AS_LONG(o); val |= USE; } else val = USE; o = PyInt_FromLong(val); if (PyDict_SetItem(st->st_cur, s, o) < 0) { Py_DECREF(o); return -1; } Py_DECREF(o); return 0; } static void symtable_node(struct symtable *st, node *n) { int i, start = 0; loop: switch (TYPE(n)) { case funcdef: { char *func_name = STR(CHILD(n, 1)); symtable_add_def(st, func_name, DEF_LOCAL); symtable_default_args(st, CHILD(n, 2)); symtable_enter_scope(st, func_name, TYPE(n)); symtable_funcdef(st, n); symtable_exit_scope(st); break; } case lambdef: if (NCH(n) == 4) symtable_default_args(st, CHILD(n, 1)); symtable_enter_scope(st, "lambda", TYPE(n)); symtable_funcdef(st, n); symtable_exit_scope(st); break; case classdef: { char *tmp, *class_name = STR(CHILD(n, 1)); symtable_add_def(st, class_name, DEF_LOCAL); if (TYPE(CHILD(n, 2)) == LPAR) { node *bases = CHILD(n, 3); int i; for (i = 0; i < NCH(bases); i += 2) { symtable_node(st, CHILD(bases, i)); } } symtable_enter_scope(st, class_name, TYPE(n)); tmp = st->st_private; st->st_private = class_name; symtable_node(st, CHILD(n, NCH(n) - 1)); st->st_private = tmp; symtable_exit_scope(st); break; } case if_stmt: for (i = 0; i + 3 < NCH(n); i += 4) { if (is_constant_false(NULL, (CHILD(n, i + 1)))) continue; symtable_node(st, CHILD(n, i + 1)); symtable_node(st, CHILD(n, i + 3)); } if (i + 2 < NCH(n)) symtable_node(st, CHILD(n, i + 2)); break; case global_stmt: symtable_global(st, n); break; case import_stmt: symtable_import(st, n); break; case exec_stmt: if (PyDict_SetItemString(st->st_cur, NOOPT, Py_None) < 0) st->st_errors++; symtable_node(st, CHILD(n, 1)); if (NCH(n) > 2) symtable_node(st, CHILD(n, 3)); if (NCH(n) > 4) symtable_node(st, CHILD(n, 5)); break; case except_clause: if (NCH(n) == 4) symtable_assign(st, CHILD(n, 3)); if (NCH(n) > 1) { n = CHILD(n, 1); goto loop; } break; case del_stmt: symtable_assign(st, CHILD(n, 1)); break; case expr_stmt: if (NCH(n) == 1) n = CHILD(n, 0); else { if (TYPE(CHILD(n, 1)) == augassign) { symtable_assign(st, CHILD(n, 0)); symtable_node(st, CHILD(n, 2)); break; } else { int i; for (i = 0; i < NCH(n) - 2; i += 2) symtable_assign(st, CHILD(n, i)); n = CHILD(n, NCH(n) - 1); } } goto loop; /* watchout for fall-through logic below */ case listmaker: if (NCH(n) > 1 && TYPE(CHILD(n, 1)) == list_for) { symtable_list_comprehension(st, CHILD(n, 1)); n = CHILD(n, 0); goto loop; } case atom: if (TYPE(n) == atom && TYPE(CHILD(n, 0)) == NAME) { symtable_add_use(st, STR(CHILD(n, 0))); break; } case for_stmt: if (TYPE(n) == for_stmt) { symtable_assign(st, CHILD(n, 1)); start = 3; } default: if (NCH(n) == 1) { n = CHILD(n, 0); goto loop; } for (i = start; i < NCH(n); ++i) if (TYPE(CHILD(n, i)) >= single_input) symtable_node(st, CHILD(n, i)); } } static void symtable_funcdef(struct symtable *st, node *n) { node *body; if (TYPE(n) == lambdef) { if (NCH(n) == 4) symtable_params(st, CHILD(n, 1)); } else symtable_params(st, CHILD(n, 2)); body = CHILD(n, NCH(n) - 1); symtable_node(st, body); } /* The next two functions parse the argument tuple. symtable_default_arg() checks for names in the default arguments, which are references in the defining scope. symtable_params() parses the parameter names, which are defined in the function's body. varargslist: (fpdef ['=' test] ',')* ('*' NAME [',' '**' NAME] | '**' NAME) | fpdef ['=' test] (',' fpdef ['=' test])* [','] */ static void symtable_default_args(struct symtable *st, node *n) { node *c; int i; if (TYPE(n) == parameters) { n = CHILD(n, 1); if (TYPE(n) == RPAR) return; } REQ(n, varargslist); for (i = 0; i < NCH(n); i += 2) { c = CHILD(n, i); if (TYPE(c) == STAR || TYPE(c) == DOUBLESTAR) { break; } if (i > 0 && (TYPE(CHILD(n, i - 1)) == EQUAL)) symtable_node(st, CHILD(n, i)); } } static void symtable_params(struct symtable *st, node *n) { int i, complex = 0, ext = 0; node *c = NULL; if (TYPE(n) == parameters) { n = CHILD(n, 1); if (TYPE(n) == RPAR) return; } REQ(n, varargslist); for (i = 0; i < NCH(n); i += 2) { c = CHILD(n, i); if (TYPE(c) == STAR || TYPE(c) == DOUBLESTAR) { ext = 1; break; } if (TYPE(c) == test) { continue; } if (TYPE(CHILD(c, 0)) == NAME) symtable_add_def(st, STR(CHILD(c, 0)), DEF_PARAM); else { char nbuf[10]; sprintf(nbuf, ".%d", i); symtable_add_def(st, nbuf, DEF_PARAM); complex = 1; } } if (complex) { int j; for (j = 0; j < i; j += 2) { c = CHILD(n, j); if (TYPE(CHILD(c, 0)) == LPAR) symtable_params_fplist(st, CHILD(c, 1)); } } if (ext) { c = CHILD(n, i); if (TYPE(c) == STAR) { i++; symtable_add_def(st, STR(CHILD(n, i)), DEF_PARAM | DEF_STAR); i += 2; if (i >= NCH(n)) return; c = CHILD(n, i); } if (TYPE(c) == DOUBLESTAR) { i++; symtable_add_def(st, STR(CHILD(n, i)), DEF_PARAM | DEF_DOUBLESTAR); } } } static void symtable_params_fplist(struct symtable *st, node *n) { int i; node *c; REQ(n, fplist); for (i = 0; i < NCH(n); i += 2) { c = CHILD(n, i); REQ(c, fpdef); if (NCH(c) == 1) symtable_add_def(st, STR(CHILD(c, 0)), DEF_PARAM | DEF_INTUPLE); else symtable_params_fplist(st, CHILD(c, 1)); } } static void symtable_global(struct symtable *st, node *n) { int i; for (i = 1; i < NCH(n); i += 2) symtable_add_def(st, STR(CHILD(n, i)), DEF_GLOBAL); } static void symtable_list_comprehension(struct symtable *st, node *n) { char tmpname[12]; sprintf(tmpname, "[%d]", ++st->st_tmpname); symtable_add_def(st, tmpname, DEF_LOCAL); symtable_assign(st, CHILD(n, 1)); symtable_node(st, CHILD(n, 3)); if (NCH(n) == 5) symtable_node(st, CHILD(n, 4)); --st->st_tmpname; } static void symtable_import(struct symtable *st, node *n) { int i; /* import_stmt: 'import' dotted_as_name (',' dotted_as_name)* | 'from' dotted_name 'import' ('*' | import_as_name (',' import_as_name)*) import_as_name: NAME [NAME NAME] */ if (STR(CHILD(n, 0))[0] == 'f') { /* from */ if (TYPE(CHILD(n, 3)) == STAR) { if (PyDict_SetItemString(st->st_cur, NOOPT, Py_None) < 0) st->st_errors++; } else { for (i = 3; i < NCH(n); i += 2) { node *c = CHILD(n, i); if (NCH(c) > 1) /* import as */ symtable_assign(st, CHILD(c, 2)); else symtable_assign(st, CHILD(c, 0)); } } } else { for (i = 1; i < NCH(n); i += 2) { symtable_assign(st, CHILD(n, i)); } } } static void symtable_assign(struct symtable *st, node *n) { node *tmp; int i; for (;;) { /* fprintf(stderr, "symtable_assign(%d, %d)\n", TYPE(n), NCH(n)); */ switch (TYPE(n)) { case power: /* not sure that NCH(n) > 1 always means that none of the left-hand side names are targets of assignments */ if (NCH(n) > 2) { for (i = 2; i < NCH(n); ++i) if (TYPE(CHILD(n, i)) != DOUBLESTAR) symtable_node(st, CHILD(n, i)); } if (NCH(n) > 1) { symtable_node(st, CHILD(n, 0)); symtable_node(st, CHILD(n, 1)); } else { n = CHILD(n, 0); continue; } return; case listmaker: if (NCH(n) > 1 && TYPE(CHILD(n, 1)) == list_for) symtable_list_comprehension(st, CHILD(n, 1)); else { for (i = 0; i < NCH(n); i += 2) symtable_assign(st, CHILD(n, i)); } return; case exprlist: case testlist: if (NCH(n) == 1) { n = CHILD(n, 0); break; } else { int i; for (i = 0; i < NCH(n); i += 2) symtable_assign(st, CHILD(n, i)); return; } break; case atom: tmp = CHILD(n, 0); if (TYPE(tmp) == LPAR || TYPE(tmp) == LSQB) { n = CHILD(n, 1); continue; } else if (TYPE(tmp) == NAME) symtable_add_def(st, STR(tmp), DEF_LOCAL); return; case dotted_as_name: if (NCH(n) == 3) symtable_add_def(st, STR(CHILD(n, 2)), DEF_LOCAL); else symtable_add_def(st, STR(CHILD(CHILD(n, 0), 0)), DEF_LOCAL); return; case dotted_name: symtable_add_def(st, STR(CHILD(n, 0)), DEF_LOCAL); return; case NAME: symtable_add_def(st, STR(n), DEF_LOCAL); return; default: if (NCH(n) == 0) return; assert(NCH(n) == 1); n = CHILD(n, 0); break; } } }