Commit 4f5f0e54 authored by Serhiy Storchaka

Issue #16335: Fix integer overflow in unicode-escape decoder.

parent 410eee56
...@@ -8,6 +8,7 @@ Modified for Python 2.0 by Fredrik Lundh (fredrik@pythonware.com) ...@@ -8,6 +8,7 @@ Modified for Python 2.0 by Fredrik Lundh (fredrik@pythonware.com)
"""#" """#"
import unittest import unittest
import _testcapi
from test import support from test import support
...@@ -141,6 +142,21 @@ class UnicodeNamesTest(unittest.TestCase): ...@@ -141,6 +142,21 @@ class UnicodeNamesTest(unittest.TestCase):
str, b"\\NSPACE", 'unicode-escape', 'strict' str, b"\\NSPACE", 'unicode-escape', 'strict'
) )
@unittest.skipUnless(_testcapi.INT_MAX < _testcapi.PY_SSIZE_T_MAX,
                     "needs UINT_MAX < SIZE_MAX")
def test_issue16335(self):
    """Check that an over-long bogus \\N{...} name is rejected cleanly.

    Builds a ``\\N{SPACE<padding>}`` escape whose name is padded with
    ``UINT_MAX + 1`` filler bytes and asserts that decoding it with the
    'unicode-escape' codec raises UnicodeError with the message
    'unknown Unicode character name'.

    The test is skipped when INT_MAX is not smaller than PY_SSIZE_T_MAX,
    and whenever the required memory cannot be allocated.
    """
    # Length of the filler; one more than the largest C unsigned int.
    padding = _testcapi.UINT_MAX + 1

    # very very long bogus character name
    try:
        x = b'\\N{SPACE' + b'x' * padding + b'}'
    except MemoryError:
        raise unittest.SkipTest("not enough memory")
    self.assertEqual(len(x), len(b'\\N{SPACE}') + padding)

    # NOTE(review): decoding an input this large may itself need a large
    # allocation (decoder internals are not visible here). A MemoryError
    # at this stage is an environment limitation, so report it as a skip,
    # just as for the construction of the input above.
    try:
        with self.assertRaisesRegex(UnicodeError,
                                    'unknown Unicode character name'):
            x.decode('unicode-escape')
    except MemoryError:
        raise unittest.SkipTest("not enough memory")
def test_main(): def test_main():
support.run_unittest(UnicodeNamesTest) support.run_unittest(UnicodeNamesTest)
......
...@@ -3923,7 +3923,8 @@ PyObject *PyUnicode_DecodeUnicodeEscape(const char *s, ...@@ -3923,7 +3923,8 @@ PyObject *PyUnicode_DecodeUnicodeEscape(const char *s,
/* found a name. look it up in the unicode database */ /* found a name. look it up in the unicode database */
message = "unknown Unicode character name"; message = "unknown Unicode character name";
s++; s++;
if (ucnhash_CAPI->getcode(NULL, start, (int)(s-start-1), &chr)) if (s - start - 1 <= INT_MAX &&
ucnhash_CAPI->getcode(NULL, start, (int)(s-start-1), &chr))
goto store; goto store;
} }
} }
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment