mirror of https://github.com/python/cpython
Merged revisions 75697 via svnmerge from
svn+ssh://pythondev@svn.python.org/python/trunk ........ r75697 | mark.dickinson | 2009-10-25 20:39:06 +0000 (Sun, 25 Oct 2009) | 3 lines Issue #1087418: Small performance boost for bitwise operations on longs. Initial patch by Gregory Smith; some tweaks added. ........
This commit is contained in:
parent
b6ef9633a9
commit
27a87a2aa2
|
@ -12,6 +12,8 @@ What's New in Python 3.2 Alpha 1?
|
||||||
Core and Builtins
|
Core and Builtins
|
||||||
-----------------
|
-----------------
|
||||||
|
|
||||||
|
- Issue #1087418: Boost performance of bitwise operations for longs.
|
||||||
|
|
||||||
- Support for AtheOS has been completely removed from the code base. It was
|
- Support for AtheOS has been completely removed from the code base. It was
|
||||||
disabled since Python 3.0.
|
disabled since Python 3.0.
|
||||||
|
|
||||||
|
|
|
@ -3638,6 +3638,22 @@ lshift_error:
|
||||||
return (PyObject *) maybe_small_long(z);
|
return (PyObject *) maybe_small_long(z);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/* Compute two's complement of digit vector a[0:m], writing result to
|
||||||
|
z[0:m]. The digit vector a need not be normalized, but should not
|
||||||
|
be entirely zero. a and z may point to the same digit vector. */
|
||||||
|
|
||||||
|
static void
|
||||||
|
v_complement(digit *z, digit *a, Py_ssize_t m)
|
||||||
|
{
|
||||||
|
Py_ssize_t i;
|
||||||
|
digit carry = 1;
|
||||||
|
for (i = 0; i < m; ++i) {
|
||||||
|
carry += a[i] ^ PyLong_MASK;
|
||||||
|
z[i] = carry & PyLong_MASK;
|
||||||
|
carry >>= PyLong_SHIFT;
|
||||||
|
}
|
||||||
|
assert(carry == 0);
|
||||||
|
}
|
||||||
|
|
||||||
/* Bitwise and/xor/or operations */
|
/* Bitwise and/xor/or operations */
|
||||||
|
|
||||||
|
@ -3646,60 +3662,49 @@ long_bitwise(PyLongObject *a,
|
||||||
int op, /* '&', '|', '^' */
|
int op, /* '&', '|', '^' */
|
||||||
PyLongObject *b)
|
PyLongObject *b)
|
||||||
{
|
{
|
||||||
digit maska, maskb; /* 0 or PyLong_MASK */
|
int nega, negb, negz;
|
||||||
int negz;
|
|
||||||
Py_ssize_t size_a, size_b, size_z, i;
|
Py_ssize_t size_a, size_b, size_z, i;
|
||||||
PyLongObject *z;
|
PyLongObject *z;
|
||||||
digit diga, digb;
|
|
||||||
PyObject *v;
|
|
||||||
|
|
||||||
if (Py_SIZE(a) < 0) {
|
/* Bitwise operations for negative numbers operate as though
|
||||||
a = (PyLongObject *) long_invert(a);
|
on a two's complement representation. So convert arguments
|
||||||
if (a == NULL)
|
from sign-magnitude to two's complement, and convert the
|
||||||
|
result back to sign-magnitude at the end. */
|
||||||
|
|
||||||
|
/* If a is negative, replace it by its two's complement. */
|
||||||
|
size_a = ABS(Py_SIZE(a));
|
||||||
|
nega = Py_SIZE(a) < 0;
|
||||||
|
if (nega) {
|
||||||
|
z = _PyLong_New(size_a);
|
||||||
|
if (z == NULL)
|
||||||
return NULL;
|
return NULL;
|
||||||
maska = PyLong_MASK;
|
v_complement(z->ob_digit, a->ob_digit, size_a);
|
||||||
|
a = z;
|
||||||
}
|
}
|
||||||
else {
|
else
|
||||||
|
/* Keep reference count consistent. */
|
||||||
Py_INCREF(a);
|
Py_INCREF(a);
|
||||||
maska = 0;
|
|
||||||
}
|
/* Same for b. */
|
||||||
if (Py_SIZE(b) < 0) {
|
size_b = ABS(Py_SIZE(b));
|
||||||
b = (PyLongObject *) long_invert(b);
|
negb = Py_SIZE(b) < 0;
|
||||||
if (b == NULL) {
|
if (negb) {
|
||||||
|
z = _PyLong_New(size_b);
|
||||||
|
if (z == NULL) {
|
||||||
Py_DECREF(a);
|
Py_DECREF(a);
|
||||||
return NULL;
|
return NULL;
|
||||||
}
|
}
|
||||||
maskb = PyLong_MASK;
|
v_complement(z->ob_digit, b->ob_digit, size_b);
|
||||||
|
b = z;
|
||||||
}
|
}
|
||||||
else {
|
else
|
||||||
Py_INCREF(b);
|
Py_INCREF(b);
|
||||||
maskb = 0;
|
|
||||||
}
|
|
||||||
|
|
||||||
negz = 0;
|
/* Swap a and b if necessary to ensure size_a >= size_b. */
|
||||||
switch (op) {
|
if (size_a < size_b) {
|
||||||
case '^':
|
z = a; a = b; b = z;
|
||||||
if (maska != maskb) {
|
size_z = size_a; size_a = size_b; size_b = size_z;
|
||||||
maska ^= PyLong_MASK;
|
negz = nega; nega = negb; negb = negz;
|
||||||
negz = -1;
|
|
||||||
}
|
|
||||||
break;
|
|
||||||
case '&':
|
|
||||||
if (maska && maskb) {
|
|
||||||
op = '|';
|
|
||||||
maska ^= PyLong_MASK;
|
|
||||||
maskb ^= PyLong_MASK;
|
|
||||||
negz = -1;
|
|
||||||
}
|
|
||||||
break;
|
|
||||||
case '|':
|
|
||||||
if (maska || maskb) {
|
|
||||||
op = '&';
|
|
||||||
maska ^= PyLong_MASK;
|
|
||||||
maskb ^= PyLong_MASK;
|
|
||||||
negz = -1;
|
|
||||||
}
|
|
||||||
break;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/* JRH: The original logic here was to allocate the result value (z)
|
/* JRH: The original logic here was to allocate the result value (z)
|
||||||
|
@ -3707,43 +3712,72 @@ long_bitwise(PyLongObject *a,
|
||||||
where the result is guaranteed to be shorter than that: AND of two
|
where the result is guaranteed to be shorter than that: AND of two
|
||||||
positives, OR of two negatives: use the shorter number. AND with
|
positives, OR of two negatives: use the shorter number. AND with
|
||||||
mixed signs: use the positive number. OR with mixed signs: use the
|
mixed signs: use the positive number. OR with mixed signs: use the
|
||||||
negative number. After the transformations above, op will be '&'
|
negative number.
|
||||||
iff one of these cases applies, and mask will be non-0 for operands
|
|
||||||
whose length should be ignored.
|
|
||||||
*/
|
*/
|
||||||
|
switch (op) {
|
||||||
|
case '^':
|
||||||
|
negz = nega ^ negb;
|
||||||
|
size_z = size_a;
|
||||||
|
break;
|
||||||
|
case '&':
|
||||||
|
negz = nega & negb;
|
||||||
|
size_z = negb ? size_a : size_b;
|
||||||
|
break;
|
||||||
|
case '|':
|
||||||
|
negz = nega | negb;
|
||||||
|
size_z = negb ? size_b : size_a;
|
||||||
|
break;
|
||||||
|
default:
|
||||||
|
PyErr_BadArgument();
|
||||||
|
return NULL;
|
||||||
|
}
|
||||||
|
|
||||||
size_a = Py_SIZE(a);
|
/* We allow an extra digit if z is negative, to make sure that
|
||||||
size_b = Py_SIZE(b);
|
the final two's complement of z doesn't overflow. */
|
||||||
size_z = op == '&'
|
z = _PyLong_New(size_z + negz);
|
||||||
? (maska
|
|
||||||
? size_b
|
|
||||||
: (maskb ? size_a : MIN(size_a, size_b)))
|
|
||||||
: MAX(size_a, size_b);
|
|
||||||
z = _PyLong_New(size_z);
|
|
||||||
if (z == NULL) {
|
if (z == NULL) {
|
||||||
Py_DECREF(a);
|
Py_DECREF(a);
|
||||||
Py_DECREF(b);
|
Py_DECREF(b);
|
||||||
return NULL;
|
return NULL;
|
||||||
}
|
}
|
||||||
|
|
||||||
for (i = 0; i < size_z; ++i) {
|
/* Compute digits for overlap of a and b. */
|
||||||
diga = (i < size_a ? a->ob_digit[i] : 0) ^ maska;
|
|
||||||
digb = (i < size_b ? b->ob_digit[i] : 0) ^ maskb;
|
|
||||||
switch(op) {
|
switch(op) {
|
||||||
case '&': z->ob_digit[i] = diga & digb; break;
|
case '&':
|
||||||
case '|': z->ob_digit[i] = diga | digb; break;
|
for (i = 0; i < size_b; ++i)
|
||||||
case '^': z->ob_digit[i] = diga ^ digb; break;
|
z->ob_digit[i] = a->ob_digit[i] & b->ob_digit[i];
|
||||||
|
break;
|
||||||
|
case '|':
|
||||||
|
for (i = 0; i < size_b; ++i)
|
||||||
|
z->ob_digit[i] = a->ob_digit[i] | b->ob_digit[i];
|
||||||
|
break;
|
||||||
|
case '^':
|
||||||
|
for (i = 0; i < size_b; ++i)
|
||||||
|
z->ob_digit[i] = a->ob_digit[i] ^ b->ob_digit[i];
|
||||||
|
break;
|
||||||
|
default:
|
||||||
|
PyErr_BadArgument();
|
||||||
|
return NULL;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/* Copy any remaining digits of a, inverting if necessary. */
|
||||||
|
if (op == '^' && negb)
|
||||||
|
for (; i < size_z; ++i)
|
||||||
|
z->ob_digit[i] = a->ob_digit[i] ^ PyLong_MASK;
|
||||||
|
else if (i < size_z)
|
||||||
|
memcpy(&z->ob_digit[i], &a->ob_digit[i],
|
||||||
|
(size_z-i)*sizeof(digit));
|
||||||
|
|
||||||
|
/* Complement result if negative. */
|
||||||
|
if (negz) {
|
||||||
|
Py_SIZE(z) = -(Py_SIZE(z));
|
||||||
|
z->ob_digit[size_z] = PyLong_MASK;
|
||||||
|
v_complement(z->ob_digit, z->ob_digit, size_z+1);
|
||||||
}
|
}
|
||||||
|
|
||||||
Py_DECREF(a);
|
Py_DECREF(a);
|
||||||
Py_DECREF(b);
|
Py_DECREF(b);
|
||||||
z = long_normalize(z);
|
return (PyObject *)maybe_small_long(long_normalize(z));
|
||||||
if (negz == 0)
|
|
||||||
return (PyObject *) maybe_small_long(z);
|
|
||||||
v = long_invert(z);
|
|
||||||
Py_DECREF(z);
|
|
||||||
return v;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
static PyObject *
|
static PyObject *
|
||||||
|
|
Loading…
Reference in New Issue