Commit 65fd0592 authored by Serhiy Storchaka's avatar Serhiy Storchaka

Issue #2382: SyntaxError cursor "^" now is written at correct position in most

cases when multibyte characters are in line (before "^").  This still not
works correctly with wide East Asian characters.
parent f7d2874d
...@@ -148,6 +148,19 @@ class ExceptionTests(unittest.TestCase): ...@@ -148,6 +148,19 @@ class ExceptionTests(unittest.TestCase):
ckmsg(s, "'continue' not properly in loop") ckmsg(s, "'continue' not properly in loop")
ckmsg("continue\n", "'continue' not properly in loop") ckmsg("continue\n", "'continue' not properly in loop")
def testSyntaxErrorOffset(self):
def check(src, lineno, offset):
with self.assertRaises(SyntaxError) as cm:
compile(src, '<fragment>', 'exec')
self.assertEqual(cm.exception.lineno, lineno)
self.assertEqual(cm.exception.offset, offset)
check('def fact(x):\n\treturn x!\n', 2, 10)
check('1 +\n', 1, 4)
check('def spam():\n print(1)\n print(2)', 3, 10)
check('Python = "Python" +', 1, 20)
check('Python = "\u1e54\xfd\u0163\u0125\xf2\xf1" +', 1, 20)
@cpython_only @cpython_only
def testSettingException(self): def testSettingException(self):
# test that setting an exception at the C level works even if the # test that setting an exception at the C level works even if the
......
...@@ -32,6 +32,9 @@ class SyntaxTracebackCases(unittest.TestCase): ...@@ -32,6 +32,9 @@ class SyntaxTracebackCases(unittest.TestCase):
def syntax_error_bad_indentation(self): def syntax_error_bad_indentation(self):
compile("def spam():\n print(1)\n print(2)", "?", "exec") compile("def spam():\n print(1)\n print(2)", "?", "exec")
def syntax_error_with_caret_non_ascii(self):
compile('Python = "\u1e54\xfd\u0163\u0125\xf2\xf1" +', "?", "exec")
def test_caret(self): def test_caret(self):
err = self.get_exception_format(self.syntax_error_with_caret, err = self.get_exception_format(self.syntax_error_with_caret,
SyntaxError) SyntaxError)
...@@ -46,6 +49,12 @@ class SyntaxTracebackCases(unittest.TestCase): ...@@ -46,6 +49,12 @@ class SyntaxTracebackCases(unittest.TestCase):
self.assertTrue(err[2].count('\n') == 1) # and no additional newline self.assertTrue(err[2].count('\n') == 1) # and no additional newline
self.assertTrue(err[1].find("+") == err[2].find("^")) # in the right place self.assertTrue(err[1].find("+") == err[2].find("^")) # in the right place
err = self.get_exception_format(self.syntax_error_with_caret_non_ascii,
SyntaxError)
self.assertIn("^", err[2]) # third line has caret
self.assertTrue(err[2].count('\n') == 1) # and no additional newline
self.assertTrue(err[1].find("+") == err[2].find("^")) # in the right place
def test_nocaret(self): def test_nocaret(self):
exc = SyntaxError("error", ("x.py", 23, None, "bad syntax")) exc = SyntaxError("error", ("x.py", 23, None, "bad syntax"))
err = traceback.format_exception_only(SyntaxError, exc) err = traceback.format_exception_only(SyntaxError, exc)
......
...@@ -10,6 +10,10 @@ What's New in Python 3.3.4 release candidate 1? ...@@ -10,6 +10,10 @@ What's New in Python 3.3.4 release candidate 1?
Core and Builtins Core and Builtins
----------------- -----------------
- Issue #2382: SyntaxError cursor "^" is now written at correct position in most
cases when multibyte characters are in line (before "^"). This still not
works correctly with wide East Asian characters.
- Issue #18960: The first line of Python script could be executed twice when - Issue #18960: The first line of Python script could be executed twice when
the source encoding was specified on the second line. Now the source encoding the source encoding was specified on the second line. Now the source encoding
declaration on the second line isn't effective if the first line contains declaration on the second line isn't effective if the first line contains
......
...@@ -2226,6 +2226,7 @@ err_input(perrdetail *err) ...@@ -2226,6 +2226,7 @@ err_input(perrdetail *err)
PyObject *v, *w, *errtype, *errtext; PyObject *v, *w, *errtype, *errtext;
PyObject *msg_obj = NULL; PyObject *msg_obj = NULL;
char *msg = NULL; char *msg = NULL;
int offset = err->offset;
errtype = PyExc_SyntaxError; errtype = PyExc_SyntaxError;
switch (err->error) { switch (err->error) {
...@@ -2310,11 +2311,20 @@ err_input(perrdetail *err) ...@@ -2310,11 +2311,20 @@ err_input(perrdetail *err)
errtext = Py_None; errtext = Py_None;
Py_INCREF(Py_None); Py_INCREF(Py_None);
} else { } else {
errtext = PyUnicode_DecodeUTF8(err->text, strlen(err->text), errtext = PyUnicode_DecodeUTF8(err->text, err->offset,
"replace"); "replace");
if (errtext != NULL) {
Py_ssize_t len = strlen(err->text);
offset = (int)PyUnicode_GET_LENGTH(errtext);
if (len != err->offset) {
Py_DECREF(errtext);
errtext = PyUnicode_DecodeUTF8(err->text, len,
"replace");
}
}
} }
v = Py_BuildValue("(OiiN)", err->filename, v = Py_BuildValue("(OiiN)", err->filename,
err->lineno, err->offset, errtext); err->lineno, offset, errtext);
if (v != NULL) { if (v != NULL) {
if (msg_obj) if (msg_obj)
w = Py_BuildValue("(OO)", msg_obj, v); w = Py_BuildValue("(OO)", msg_obj, v);
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment