Commit e2846548 authored by Mark Dickinson

Issue #14339: Improve speed of bin, oct and hex builtins. Patch by Serhiy...

Issue #14339: Improve speed of bin, oct and hex builtins.  Patch by Serhiy Storchaka (with minor modifications).
parent 1b5123aa
...@@ -10,6 +10,9 @@ What's New in Python 3.3.0 Alpha 3? ...@@ -10,6 +10,9 @@ What's New in Python 3.3.0 Alpha 3?
Core and Builtins Core and Builtins
----------------- -----------------
- Issue #14339: Speed improvements to bin, oct and hex functions. Patch by
Serhiy Storchaka.
- Issue #14098: New functions PyErr_GetExcInfo and PyErr_SetExcInfo. - Issue #14098: New functions PyErr_GetExcInfo and PyErr_SetExcInfo.
Patch by Stefan Behnel. Patch by Stefan Behnel.
......
...@@ -1672,11 +1672,10 @@ _PyLong_Format(PyObject *aa, int base) ...@@ -1672,11 +1672,10 @@ _PyLong_Format(PyObject *aa, int base)
{ {
register PyLongObject *a = (PyLongObject *)aa; register PyLongObject *a = (PyLongObject *)aa;
PyObject *v; PyObject *v;
Py_ssize_t i, sz; Py_ssize_t sz;
Py_ssize_t size_a; Py_ssize_t size_a;
char *p; Py_UCS1 *p;
char sign = '\0'; int negative;
char *buffer;
int bits; int bits;
assert(base == 2 || base == 8 || base == 10 || base == 16); assert(base == 2 || base == 8 || base == 10 || base == 16);
...@@ -1688,6 +1687,7 @@ _PyLong_Format(PyObject *aa, int base) ...@@ -1688,6 +1687,7 @@ _PyLong_Format(PyObject *aa, int base)
return NULL; return NULL;
} }
size_a = ABS(Py_SIZE(a)); size_a = ABS(Py_SIZE(a));
negative = Py_SIZE(a) < 0;
/* Compute a rough upper bound for the length of the string */ /* Compute a rough upper bound for the length of the string */
switch (base) { switch (base) {
...@@ -1704,33 +1704,40 @@ _PyLong_Format(PyObject *aa, int base) ...@@ -1704,33 +1704,40 @@ _PyLong_Format(PyObject *aa, int base)
assert(0); /* shouldn't ever get here */ assert(0); /* shouldn't ever get here */
bits = 0; /* to silence gcc warning */ bits = 0; /* to silence gcc warning */
} }
/* compute length of output string: allow 2 characters for prefix and
1 for possible '-' sign. */ /* Compute exact length 'sz' of output string. */
if (size_a > (PY_SSIZE_T_MAX - 3) / PyLong_SHIFT / sizeof(Py_UCS4)) { if (size_a == 0) {
PyErr_SetString(PyExc_OverflowError, sz = 3;
"int is too large to format");
return NULL;
} }
/* now size_a * PyLong_SHIFT + 3 <= PY_SSIZE_T_MAX, so the RHS below else {
is safe from overflow */ Py_ssize_t size_a_in_bits;
sz = 3 + (size_a * PyLong_SHIFT + (bits - 1)) / bits; /* Ensure overflow doesn't occur during computation of sz. */
assert(sz >= 0); if (size_a > (PY_SSIZE_T_MAX - 3) / PyLong_SHIFT) {
buffer = PyMem_Malloc(sz); PyErr_SetString(PyExc_OverflowError,
if (buffer == NULL) { "int is too large to format");
PyErr_NoMemory(); return NULL;
}
size_a_in_bits = (size_a - 1) * PyLong_SHIFT +
bits_in_digit(a->ob_digit[size_a - 1]);
/* Allow 2 characters for prefix and 1 for a '-' sign. */
sz = 2 + negative + (size_a_in_bits + (bits - 1)) / bits;
}
v = PyUnicode_New(sz, 'x');
if (v == NULL) {
return NULL; return NULL;
} }
p = &buffer[sz]; assert(PyUnicode_KIND(v) == PyUnicode_1BYTE_KIND);
if (Py_SIZE(a) < 0)
sign = '-';
if (Py_SIZE(a) == 0) { p = PyUnicode_1BYTE_DATA(v) + sz;
if (size_a == 0) {
*--p = '0'; *--p = '0';
} }
else { else {
/* JRH: special case for power-of-2 bases */ /* JRH: special case for power-of-2 bases */
twodigits accum = 0; twodigits accum = 0;
int accumbits = 0; /* # of bits in accum */ int accumbits = 0; /* # of bits in accum */
Py_ssize_t i;
for (i = 0; i < size_a; ++i) { for (i = 0; i < size_a; ++i) {
accum |= (twodigits)a->ob_digit[i] << accumbits; accum |= (twodigits)a->ob_digit[i] << accumbits;
accumbits += PyLong_SHIFT; accumbits += PyLong_SHIFT;
...@@ -1739,7 +1746,6 @@ _PyLong_Format(PyObject *aa, int base) ...@@ -1739,7 +1746,6 @@ _PyLong_Format(PyObject *aa, int base)
char cdigit; char cdigit;
cdigit = (char)(accum & (base - 1)); cdigit = (char)(accum & (base - 1));
cdigit += (cdigit < 10) ? '0' : 'a'-10; cdigit += (cdigit < 10) ? '0' : 'a'-10;
assert(p > buffer);
*--p = cdigit; *--p = cdigit;
accumbits -= bits; accumbits -= bits;
accum >>= bits; accum >>= bits;
...@@ -1754,10 +1760,9 @@ _PyLong_Format(PyObject *aa, int base) ...@@ -1754,10 +1760,9 @@ _PyLong_Format(PyObject *aa, int base)
else /* (base == 2) */ else /* (base == 2) */
*--p = 'b'; *--p = 'b';
*--p = '0'; *--p = '0';
if (sign) if (negative)
*--p = sign; *--p = '-';
v = PyUnicode_DecodeASCII(p, &buffer[sz] - p, NULL); assert(p == PyUnicode_1BYTE_DATA(v));
PyMem_Free(buffer);
return v; return v;
} }
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment