summary | refs | log | tree | commit | diff | stats
path: root/Modules/pcremodule.c
diff options
context:
space:
mode:
Diffstat (limited to 'Modules/pcremodule.c')
-rw-r--r-- Modules/pcremodule.c 164
1 files changed, 50 insertions, 114 deletions
diff --git a/Modules/pcremodule.c b/Modules/pcremodule.c
index 7c4136a..d7615d1 100644
--- a/Modules/pcremodule.c
+++ b/Modules/pcremodule.c
@@ -222,7 +222,9 @@ PyPcre_compile(self, args)
{
PyMem_DEL(rv);
if (!PyErr_Occurred())
- PyErr_SetObject(ErrorObject, Py_BuildValue("si", error, erroroffset));
+ {
+ PyErr_SetObject(ErrorObject, Py_BuildValue("si", error, erroroffset));
+ }
return NULL;
}
rv->regex_extra=pcre_study(rv->regex, 0, &error);
@@ -243,47 +245,57 @@ PyPcre_compile(self, args)
}
static PyObject *
-PyPcre_expand_escape(self, args)
- PyObject *self;
- PyObject *args;
+PyPcre_expand_escape(pattern, pattern_len, indexptr, typeptr)
+ unsigned char *pattern;
+ int pattern_len, *indexptr, *typeptr;
{
- unsigned char c, *pattern;
- int index, pattern_len;
- const int context=REPLACEMENT;
-
- if (!PyArg_ParseTuple(args, "s#i", &pattern, &pattern_len, &index))
- return NULL;
+ unsigned char c;
+ int index = *indexptr;
+
if (pattern_len<=index)
{
PyErr_SetString(ErrorObject, "escape ends too soon");
return NULL;
}
c=pattern[index]; index++;
+ *typeptr=CHAR;
+
switch (c)
{
case('t'):
- return Py_BuildValue("ici", CHAR, (char)9, index);
+ *indexptr=index;
+ return Py_BuildValue("c", (char)9);
break;
case('n'):
- return Py_BuildValue("ici", CHAR, (char)10, index);
+ *indexptr = index;
+ return Py_BuildValue("c", (char)10);
break;
case('v'):
- return Py_BuildValue("ici", CHAR, (char)11, index);
+ *indexptr = index;
+ return Py_BuildValue("c", (char)11);
break;
case('r'):
- return Py_BuildValue("ici", CHAR, (char)13, index);
+ *indexptr = index;
+ return Py_BuildValue("c", (char)13);
break;
case('f'):
- return Py_BuildValue("ici", CHAR, (char)12, index);
+ *indexptr = index;
+ return Py_BuildValue("c", (char)12);
break;
case('a'):
- return Py_BuildValue("ici", CHAR, (char)7, index);
+ *indexptr = index;
+ return Py_BuildValue("c", (char)7);
break;
+ case('b'):
+ *indexptr=index;
+ return Py_BuildValue("c", (char)8);
+ break;
+
case('x'):
{
int end, length;
unsigned char *string;
- PyObject *v, *result;
+ PyObject *v;
end=index;
while (end<pattern_len &&
@@ -312,52 +324,11 @@ PyPcre_expand_escape(self, args)
free(string);
/* The evaluation raised an exception */
if (v==NULL) return NULL;
- result=Py_BuildValue("iOi", CHAR, v, end);
- Py_DECREF(v);
- return result;
+ *indexptr = end;
+ return v;
}
break;
- case('b'):
- if (context!=NORMAL)
- return Py_BuildValue("ici", CHAR, (char)8, index);
- else
- {
- unsigned char empty_string[1];
- empty_string[0]='\0';
- return Py_BuildValue("isi", WORD_BOUNDARY, empty_string, index);
- }
- break;
- case('B'):
- if (context!=NORMAL)
- return Py_BuildValue("ici", CHAR, 'B', index);
- else
- {
- unsigned char empty_string[1];
- empty_string[0]='\0';
- return Py_BuildValue("isi", NOT_WORD_BOUNDARY, empty_string, index);
- }
- break;
- case('A'):
- if (context!=NORMAL)
- return Py_BuildValue("ici", CHAR, 'A', index);
- else
- {
- unsigned char empty_string[1];
- empty_string[0]='\0';
- return Py_BuildValue("isi", BEGINNING_OF_BUFFER, empty_string, index);
- }
- break;
- case('Z'):
- if (context!=NORMAL)
- return Py_BuildValue("ici", CHAR, 'Z', index);
- else
- {
- unsigned char empty_string[1];
- empty_string[0]='\0';
- return Py_BuildValue("isi", END_OF_BUFFER, empty_string, index);
- }
- break;
case('E'): case('G'): case('L'): case('Q'):
case('U'): case('l'): case('u'):
{
@@ -367,26 +338,6 @@ PyPcre_expand_escape(self, args)
return NULL;
}
- case ('w'):
- return Py_BuildValue("ici", CHAR, 'w', index);
- break;
- case ('W'):
- return Py_BuildValue("ici", CHAR, 'W', index);
- break;
- case ('s'):
- return Py_BuildValue("ici", CHAR, 's', index);
- break;
- case ('S'):
- return Py_BuildValue("ici", CHAR, 'S', index);
- break;
-
- case ('d'):
- return Py_BuildValue("ici", CHAR, 'd', index);
- break;
- case ('D'):
- return Py_BuildValue("ici", CHAR, 'D', index);
- break;
-
case('g'):
{
int end, valid, i;
@@ -427,9 +378,9 @@ PyPcre_expand_escape(self, args)
return NULL;
}
- return Py_BuildValue("is#i", MEMORY_REFERENCE,
- pattern+index, end-index,
- end+1);
+ *typeptr = MEMORY_REFERENCE;
+ *indexptr = end+1;
+ return Py_BuildValue("s#", pattern+index, end-index);
}
break;
@@ -451,7 +402,8 @@ PyPcre_expand_escape(self, args)
PyErr_SetString(ErrorObject, "octal value out of range");
return NULL;
}
- return Py_BuildValue("ici", CHAR, (unsigned char)octval, i);
+ *indexptr = i;
+ return Py_BuildValue("c", (unsigned char)octval);
}
break;
case('1'): case('2'): case('3'): case('4'):
@@ -483,17 +435,12 @@ PyPcre_expand_escape(self, args)
PyErr_SetString(ErrorObject, "octal value out of range");
return NULL;
}
- return Py_BuildValue("ici", CHAR, (unsigned char)value, index+3);
+ *indexptr = index+3;
+ return Py_BuildValue("c", (unsigned char)value);
}
else
{
/* 2-digit form, so it's a memory reference */
- if (context==CHARCLASS)
- {
- PyErr_SetString(ErrorObject, "cannot reference a register "
- "from inside a character class");
- return NULL;
- }
value= 10*(pattern[index ]-'0') +
(pattern[index+1]-'0');
if (value<1 || EXTRACT_MAX<=value)
@@ -501,27 +448,24 @@ PyPcre_expand_escape(self, args)
PyErr_SetString(ErrorObject, "memory reference out of range");
return NULL;
}
- return Py_BuildValue("iii", MEMORY_REFERENCE,
- value, index+2);
+ *typeptr = MEMORY_REFERENCE;
+ *indexptr = index+2;
+ return Py_BuildValue("i", value);
}
}
else
{
/* Single-digit form, like \2, so it's a memory reference */
- if (context==CHARCLASS)
- {
- PyErr_SetString(ErrorObject, "cannot reference a register "
- "from inside a character class");
- return NULL;
- }
- return Py_BuildValue("iii", MEMORY_REFERENCE,
- pattern[index]-'0', index+1);
+ *typeptr = MEMORY_REFERENCE;
+ *indexptr = index+1;
+ return Py_BuildValue("i", pattern[index]-'0');
}
}
break;
default:
- return Py_BuildValue("ici", CHAR, c, index);
+ *indexptr = index;
+ return Py_BuildValue("c", c);
break;
}
}
@@ -547,7 +491,7 @@ PyPcre_expand(self, args)
{
if (repl[i]=='\\')
{
- PyObject *args, *t, *value;
+ PyObject *value;
int escape_type;
if (start!=i)
@@ -557,18 +501,14 @@ PyPcre_expand(self, args)
total_len += i-start;
}
i++;
- args=Py_BuildValue("Oi", repl_obj, i);
- t=PyPcre_expand_escape(NULL, args);
- Py_DECREF(args);
- if (t==NULL)
+ value=PyPcre_expand_escape(repl, size, &i, &escape_type);
+ if (value==NULL)
{
/* PyPcre_expand_escape triggered an exception of some sort,
so just return */
Py_DECREF(results);
return NULL;
}
- value=PyTuple_GetItem(t, 1);
- escape_type=PyInt_AsLong(PyTuple_GetItem(t, 0));
switch (escape_type)
{
case (CHAR):
@@ -599,7 +539,6 @@ PyPcre_expand(self, args)
PyErr_SetString(ErrorObject,
message);
Py_DECREF(result);
- Py_DECREF(t);
Py_DECREF(results);
return NULL;
}
@@ -610,15 +549,13 @@ PyPcre_expand(self, args)
}
break;
default:
- Py_DECREF(t);
Py_DECREF(results);
PyErr_SetString(ErrorObject,
"bad escape in replacement");
return NULL;
}
- i=start=PyInt_AsLong(PyTuple_GetItem(t, 2));
+ start=i;
i--; /* Decrement now, because the 'for' loop will increment it */
- Py_DECREF(t);
}
} /* endif repl[i]!='\\' */
@@ -690,7 +627,6 @@ void
initpcre()
{
PyObject *m, *d;
- int a;
/* Create the module and add the functions */
m = Py_InitModule("pcre", pcre_methods);