summaryrefslogtreecommitdiffstats
path: root/Parser
diff options
context:
space:
mode:
authorBatuhan Taskaya <batuhan@python.org>2021-07-20 15:42:12 (GMT)
committerGitHub <noreply@github.com>2021-07-20 15:42:12 (GMT)
commitfbc349ff790c21f1a59af939d42033470790c530 (patch)
tree8de9aad662539dc3c643c1ec1ecfaaf1d54f8af8 /Parser
parent4868b94c6089d457673b1ba5b5b64c2f38c435af (diff)
downloadcpython-fbc349ff790c21f1a59af939d42033470790c530.zip
cpython-fbc349ff790c21f1a59af939d42033470790c530.tar.gz
cpython-fbc349ff790c21f1a59af939d42033470790c530.tar.bz2
bpo-43950: Distinguish errors happening on character offset decoding (GH-27217)
Diffstat (limited to 'Parser')
-rw-r--r--Parser/pegen.c18
1 files changed, 13 insertions, 5 deletions
diff --git a/Parser/pegen.c b/Parser/pegen.c
index 3e8ddfb..106dba9 100644
--- a/Parser/pegen.c
+++ b/Parser/pegen.c
@@ -402,7 +402,7 @@ _PyPegen_byte_offset_to_character_offset(PyObject *line, Py_ssize_t col_offset)
{
const char *str = PyUnicode_AsUTF8(line);
if (!str) {
- return 0;
+ return -1;
}
Py_ssize_t len = strlen(str);
if (col_offset > len + 1) {
@@ -411,7 +411,7 @@ _PyPegen_byte_offset_to_character_offset(PyObject *line, Py_ssize_t col_offset)
assert(col_offset >= 0);
PyObject *text = PyUnicode_DecodeUTF8(str, col_offset, "replace");
if (!text) {
- return 0;
+ return -1;
}
Py_ssize_t size = PyUnicode_GET_LENGTH(text);
Py_DECREF(text);
@@ -499,9 +499,17 @@ _PyPegen_raise_error_known_location(Parser *p, PyObject *errtype,
if (p->tok->encoding != NULL) {
col_number = _PyPegen_byte_offset_to_character_offset(error_line, col_offset);
- end_col_number = end_col_number > 0 ?
- _PyPegen_byte_offset_to_character_offset(error_line, end_col_offset) :
- end_col_number;
+ if (col_number < 0) {
+ goto error;
+ }
+ if (end_col_number > 0) {
+ Py_ssize_t end_col_offset = _PyPegen_byte_offset_to_character_offset(error_line, end_col_number);
+ if (end_col_offset < 0) {
+ goto error;
+ } else {
+ end_col_number = end_col_offset;
+ }
+ }
}
tmp = Py_BuildValue("(OiiNii)", p->tok->filename, lineno, col_number, error_line, end_lineno, end_col_number);
if (!tmp) {