summaryrefslogtreecommitdiffstats
path: root/Parser
diff options
context:
space:
mode:
authorSerhiy Storchaka <storchaka@gmail.com>2015-11-14 13:11:17 (GMT)
committerSerhiy Storchaka <storchaka@gmail.com>2015-11-14 13:11:17 (GMT)
commit7e2b870b8593233306594237cd5286c60ec7a1e1 (patch)
tree612fa432059cc31904217e4bf55bed6c124576d0 /Parser
parent2463001a15f0f1dab1b82e71f3d37b1bc7bc701f (diff)
parent0d441119f5eb6437f6145e89e0963f75494d8a3f (diff)
downloadcpython-7e2b870b8593233306594237cd5286c60ec7a1e1.zip
cpython-7e2b870b8593233306594237cd5286c60ec7a1e1.tar.gz
cpython-7e2b870b8593233306594237cd5286c60ec7a1e1.tar.bz2
Issue #25388: Fixed tokenizer crash when processing undecodable source code
with a null byte.
Diffstat (limited to 'Parser')
-rw-r--r--Parser/tokenizer.c14
1 files changed, 6 insertions, 8 deletions
diff --git a/Parser/tokenizer.c b/Parser/tokenizer.c
index 04baeaf..6a528db 100644
--- a/Parser/tokenizer.c
+++ b/Parser/tokenizer.c
@@ -196,7 +196,8 @@ error_ret(struct tok_state *tok) /* XXX */
tok->decoding_erred = 1;
if (tok->fp != NULL && tok->buf != NULL) /* see PyTokenizer_Free */
PyMem_FREE(tok->buf);
- tok->buf = NULL;
+ tok->buf = tok->cur = tok->end = tok->inp = tok->start = NULL;
+ tok->done = E_DECODE;
return NULL; /* as if it were EOF */
}
@@ -952,11 +953,6 @@ tok_nextc(struct tok_state *tok)
}
buflen = PyBytes_GET_SIZE(u);
buf = PyBytes_AS_STRING(u);
- if (!buf) {
- Py_DECREF(u);
- tok->done = E_DECODE;
- return EOF;
- }
newtok = PyMem_MALLOC(buflen+1);
strcpy(newtok, buf);
Py_DECREF(u);
@@ -998,7 +994,6 @@ tok_nextc(struct tok_state *tok)
if (tok->buf != NULL)
PyMem_FREE(tok->buf);
tok->buf = newtok;
- tok->line_start = tok->buf;
tok->cur = tok->buf;
tok->line_start = tok->buf;
tok->inp = strchr(tok->buf, '\0');
@@ -1021,7 +1016,8 @@ tok_nextc(struct tok_state *tok)
}
if (decoding_fgets(tok->buf, (int)(tok->end - tok->buf),
tok) == NULL) {
- tok->done = E_EOF;
+ if (!tok->decoding_erred)
+ tok->done = E_EOF;
done = 1;
}
else {
@@ -1055,6 +1051,8 @@ tok_nextc(struct tok_state *tok)
return EOF;
}
tok->buf = newbuf;
+ tok->cur = tok->buf + cur;
+ tok->line_start = tok->cur;
tok->inp = tok->buf + curvalid;
tok->end = tok->buf + newsize;
tok->start = curstart < 0 ? NULL :