Merged revisions 75697 via svnmerge from

svn+ssh://pythondev@svn.python.org/python/trunk

........
  r75697 | mark.dickinson | 2009-10-25 20:39:06 +0000 (Sun, 25 Oct 2009) | 3 lines

  Issue #1087418: Small performance boost for bitwise operations on longs.
  Initial patch by Gregory Smith;  some tweaks added.
........
This commit is contained in:
Mark Dickinson 2009-10-25 20:43:34 +00:00
parent b6ef9633a9
commit 27a87a2aa2
2 changed files with 103 additions and 67 deletions

View File

@ -12,6 +12,8 @@ What's New in Python 3.2 Alpha 1?
Core and Builtins Core and Builtins
----------------- -----------------
- Issue #1087418: Boost performance of bitwise operations for longs.
- Support for AtheOS has been completely removed from the code base. It was - Support for AtheOS has been completely removed from the code base. It was
disabled since Python 3.0. disabled since Python 3.0.

View File

@ -3638,6 +3638,22 @@ lshift_error:
return (PyObject *) maybe_small_long(z); return (PyObject *) maybe_small_long(z);
} }
/* Compute two's complement of digit vector a[0:m], writing result to
z[0:m]. The digit vector a need not be normalized, but should not
be entirely zero. a and z may point to the same digit vector. */
static void
v_complement(digit *z, digit *a, Py_ssize_t m)
{
Py_ssize_t i;
digit carry = 1;
for (i = 0; i < m; ++i) {
carry += a[i] ^ PyLong_MASK;
z[i] = carry & PyLong_MASK;
carry >>= PyLong_SHIFT;
}
assert(carry == 0);
}
/* Bitwise and/xor/or operations */ /* Bitwise and/xor/or operations */
@ -3646,60 +3662,49 @@ long_bitwise(PyLongObject *a,
int op, /* '&', '|', '^' */ int op, /* '&', '|', '^' */
PyLongObject *b) PyLongObject *b)
{ {
digit maska, maskb; /* 0 or PyLong_MASK */ int nega, negb, negz;
int negz;
Py_ssize_t size_a, size_b, size_z, i; Py_ssize_t size_a, size_b, size_z, i;
PyLongObject *z; PyLongObject *z;
digit diga, digb;
PyObject *v;
if (Py_SIZE(a) < 0) { /* Bitwise operations for negative numbers operate as though
a = (PyLongObject *) long_invert(a); on a two's complement representation. So convert arguments
if (a == NULL) from sign-magnitude to two's complement, and convert the
result back to sign-magnitude at the end. */
/* If a is negative, replace it by its two's complement. */
size_a = ABS(Py_SIZE(a));
nega = Py_SIZE(a) < 0;
if (nega) {
z = _PyLong_New(size_a);
if (z == NULL)
return NULL; return NULL;
maska = PyLong_MASK; v_complement(z->ob_digit, a->ob_digit, size_a);
a = z;
} }
else { else
/* Keep reference count consistent. */
Py_INCREF(a); Py_INCREF(a);
maska = 0;
} /* Same for b. */
if (Py_SIZE(b) < 0) { size_b = ABS(Py_SIZE(b));
b = (PyLongObject *) long_invert(b); negb = Py_SIZE(b) < 0;
if (b == NULL) { if (negb) {
z = _PyLong_New(size_b);
if (z == NULL) {
Py_DECREF(a); Py_DECREF(a);
return NULL; return NULL;
} }
maskb = PyLong_MASK; v_complement(z->ob_digit, b->ob_digit, size_b);
b = z;
} }
else { else
Py_INCREF(b); Py_INCREF(b);
maskb = 0;
}
negz = 0; /* Swap a and b if necessary to ensure size_a >= size_b. */
switch (op) { if (size_a < size_b) {
case '^': z = a; a = b; b = z;
if (maska != maskb) { size_z = size_a; size_a = size_b; size_b = size_z;
maska ^= PyLong_MASK; negz = nega; nega = negb; negb = negz;
negz = -1;
}
break;
case '&':
if (maska && maskb) {
op = '|';
maska ^= PyLong_MASK;
maskb ^= PyLong_MASK;
negz = -1;
}
break;
case '|':
if (maska || maskb) {
op = '&';
maska ^= PyLong_MASK;
maskb ^= PyLong_MASK;
negz = -1;
}
break;
} }
/* JRH: The original logic here was to allocate the result value (z) /* JRH: The original logic here was to allocate the result value (z)
@ -3707,43 +3712,72 @@ long_bitwise(PyLongObject *a,
where the result is guaranteed to be shorter than that: AND of two where the result is guaranteed to be shorter than that: AND of two
positives, OR of two negatives: use the shorter number. AND with positives, OR of two negatives: use the shorter number. AND with
mixed signs: use the positive number. OR with mixed signs: use the mixed signs: use the positive number. OR with mixed signs: use the
negative number. After the transformations above, op will be '&' negative number.
iff one of these cases applies, and mask will be non-0 for operands
whose length should be ignored.
*/ */
switch (op) {
case '^':
negz = nega ^ negb;
size_z = size_a;
break;
case '&':
negz = nega & negb;
size_z = negb ? size_a : size_b;
break;
case '|':
negz = nega | negb;
size_z = negb ? size_b : size_a;
break;
default:
PyErr_BadArgument();
return NULL;
}
size_a = Py_SIZE(a); /* We allow an extra digit if z is negative, to make sure that
size_b = Py_SIZE(b); the final two's complement of z doesn't overflow. */
size_z = op == '&' z = _PyLong_New(size_z + negz);
? (maska
? size_b
: (maskb ? size_a : MIN(size_a, size_b)))
: MAX(size_a, size_b);
z = _PyLong_New(size_z);
if (z == NULL) { if (z == NULL) {
Py_DECREF(a); Py_DECREF(a);
Py_DECREF(b); Py_DECREF(b);
return NULL; return NULL;
} }
for (i = 0; i < size_z; ++i) { /* Compute digits for overlap of a and b. */
diga = (i < size_a ? a->ob_digit[i] : 0) ^ maska; switch(op) {
digb = (i < size_b ? b->ob_digit[i] : 0) ^ maskb; case '&':
switch (op) { for (i = 0; i < size_b; ++i)
case '&': z->ob_digit[i] = diga & digb; break; z->ob_digit[i] = a->ob_digit[i] & b->ob_digit[i];
case '|': z->ob_digit[i] = diga | digb; break; break;
case '^': z->ob_digit[i] = diga ^ digb; break; case '|':
} for (i = 0; i < size_b; ++i)
z->ob_digit[i] = a->ob_digit[i] | b->ob_digit[i];
break;
case '^':
for (i = 0; i < size_b; ++i)
z->ob_digit[i] = a->ob_digit[i] ^ b->ob_digit[i];
break;
default:
PyErr_BadArgument();
return NULL;
}
/* Copy any remaining digits of a, inverting if necessary. */
if (op == '^' && negb)
for (; i < size_z; ++i)
z->ob_digit[i] = a->ob_digit[i] ^ PyLong_MASK;
else if (i < size_z)
memcpy(&z->ob_digit[i], &a->ob_digit[i],
(size_z-i)*sizeof(digit));
/* Complement result if negative. */
if (negz) {
Py_SIZE(z) = -(Py_SIZE(z));
z->ob_digit[size_z] = PyLong_MASK;
v_complement(z->ob_digit, z->ob_digit, size_z+1);
} }
Py_DECREF(a); Py_DECREF(a);
Py_DECREF(b); Py_DECREF(b);
z = long_normalize(z); return (PyObject *)maybe_small_long(long_normalize(z));
if (negz == 0)
return (PyObject *) maybe_small_long(z);
v = long_invert(z);
Py_DECREF(z);
return v;
} }
static PyObject * static PyObject *