Commit b9abde9d authored by Kevin Modzelewski's avatar Kevin Modzelewski

Support the different int formats for struct.pack

The struct module just defers to PyLong_As* methods, so the
actual change here is improving our implementation of
_PyLong_AsByteArray, to add
- overflow and underflow checking
- twos-complement conversion (mpz_export ignores the sign)
- endianness
parent 65b4d12c
...@@ -345,16 +345,20 @@ extern "C" Box* pow_i64_i64(i64 lhs, i64 rhs) { ...@@ -345,16 +345,20 @@ extern "C" Box* pow_i64_i64(i64 lhs, i64 rhs) {
} }
assert(rhs > 0); assert(rhs > 0);
while (rhs) { while (true) {
if (rhs & 1) { if (rhs & 1) {
// TODO: could potentially avoid restarting the entire computation on overflow? // TODO: could potentially avoid restarting the entire computation on overflow?
if (__builtin_smull_overflow(rtn, curpow, &rtn)) if (__builtin_smull_overflow(rtn, curpow, &rtn))
return longPow(boxLong(lhs), boxLong(orig_rhs)); return longPow(boxLong(lhs), boxLong(orig_rhs));
} }
if (__builtin_smull_overflow(curpow, curpow, &curpow))
return longPow(boxLong(lhs), boxLong(orig_rhs));
rhs >>= 1; rhs >>= 1;
if (!rhs)
break;
if (__builtin_smull_overflow(curpow, curpow, &curpow))
return longPow(boxLong(lhs), boxLong(orig_rhs));
} }
return boxInt(rtn); return boxInt(rtn);
} }
......
...@@ -232,11 +232,11 @@ static int64_t asSignedLong(BoxedLong* self) { ...@@ -232,11 +232,11 @@ static int64_t asSignedLong(BoxedLong* self) {
static uint64_t asUnsignedLong(BoxedLong* self) { static uint64_t asUnsignedLong(BoxedLong* self) {
assert(self->cls == long_cls); assert(self->cls == long_cls);
// if this is ever true, we should raise a Python error, but I don't think we should hit it? if (mpz_sgn(self->n) == -1)
assert(mpz_cmp_si(self->n, 0) >= 0); raiseExcHelper(OverflowError, "can't convert negative value to unsigned long");
if (!mpz_fits_ulong_p(self->n)) if (!mpz_fits_ulong_p(self->n))
raiseExcHelper(OverflowError, "long int too large to convert to int"); raiseExcHelper(OverflowError, "long int too large to convert");
return mpz_get_ui(self->n); return mpz_get_ui(self->n);
} }
...@@ -259,7 +259,8 @@ extern "C" unsigned long PyLong_AsUnsignedLong(PyObject* vv) noexcept { ...@@ -259,7 +259,8 @@ extern "C" unsigned long PyLong_AsUnsignedLong(PyObject* vv) noexcept {
try { try {
return asUnsignedLong(l); return asUnsignedLong(l);
} catch (ExcInfo e) { } catch (ExcInfo e) {
abort(); setCAPIException(e);
return -1;
} }
} }
...@@ -483,11 +484,56 @@ extern "C" void* PyLong_AsVoidPtr(PyObject* vv) noexcept { ...@@ -483,11 +484,56 @@ extern "C" void* PyLong_AsVoidPtr(PyObject* vv) noexcept {
extern "C" int _PyLong_AsByteArray(PyLongObject* v, unsigned char* bytes, size_t n, int little_endian, extern "C" int _PyLong_AsByteArray(PyLongObject* v, unsigned char* bytes, size_t n, int little_endian,
int is_signed) noexcept { int is_signed) noexcept {
RELEASE_ASSERT(little_endian == 1, "not implemented"); const mpz_t* op = &((BoxedLong*)v)->n;
RELEASE_ASSERT(n == 8, "did not yet check if the behaviour is correct for sizes other than 8"); mpz_t modified;
int sign = mpz_sgn(*op);
// If the value is zero, then mpz_export won't touch any of the memory, so handle that here:
if (sign == 0) {
memset(bytes, 0, n);
return 0;
}
size_t max_bits = n * 8;
if (is_signed)
max_bits--;
size_t bits;
if (sign == -1) {
if (!is_signed) {
PyErr_SetString(PyExc_OverflowError, "can't convert negative long to unsigned");
return -1;
}
// GMP uses sign-magnitude representation, and mpz_export just returns the magnitude.
// This is the easiest way I could think of to convert to two's complement.
// Note: the common case for this function is n in 1/2/4/8, where we could potentially
// just extract the value and then do the two's complement conversion ourselves. But
// then we would have to worry about endianness, which we don't right now.
mpz_init(modified);
mpz_com(modified, *op);
bits = mpz_sizeinbase(modified, 2);
for (int i = 0; i < 8 * n; i++) {
mpz_combit(modified, i);
}
op = &modified;
} else {
bits = mpz_sizeinbase(*op, 2);
}
if (bits > max_bits) {
if (sign == -1)
mpz_clear(modified);
PyErr_SetString(PyExc_OverflowError, "long too big to convert");
return -1;
}
size_t count = 0; size_t count = 0;
mpz_export(bytes, &count, -1, n, 0, 0, ((BoxedLong*)v)->n); mpz_export(bytes, &count, 1, n, little_endian ? -1 : 1, 0, *op);
RELEASE_ASSERT(count <= n, "overflow handling is not yet implemented"); ASSERT(count == 1, "overflow? (%ld %ld)", count, n);
if (sign == -1)
mpz_clear(modified);
return 0; return 0;
} }
...@@ -897,7 +943,7 @@ Box* longLshift(BoxedLong* v1, Box* _v2) { ...@@ -897,7 +943,7 @@ Box* longLshift(BoxedLong* v1, Box* _v2) {
if (isSubclass(_v2->cls, long_cls)) { if (isSubclass(_v2->cls, long_cls)) {
BoxedLong* v2 = static_cast<BoxedLong*>(_v2); BoxedLong* v2 = static_cast<BoxedLong*>(_v2);
if (mpz_cmp_si(v2->n, 0) < 0) if (mpz_sgn(v2->n) < 0)
raiseExcHelper(ValueError, "negative shift count"); raiseExcHelper(ValueError, "negative shift count");
uint64_t n = asUnsignedLong(v2); uint64_t n = asUnsignedLong(v2);
...@@ -927,7 +973,7 @@ Box* longRshift(BoxedLong* v1, Box* _v2) { ...@@ -927,7 +973,7 @@ Box* longRshift(BoxedLong* v1, Box* _v2) {
if (isSubclass(_v2->cls, long_cls)) { if (isSubclass(_v2->cls, long_cls)) {
BoxedLong* v2 = static_cast<BoxedLong*>(_v2); BoxedLong* v2 = static_cast<BoxedLong*>(_v2);
if (mpz_cmp_si(v2->n, 0) < 0) if (mpz_sgn(v2->n) < 0)
raiseExcHelper(ValueError, "negative shift count"); raiseExcHelper(ValueError, "negative shift count");
uint64_t n = asUnsignedLong(v2); uint64_t n = asUnsignedLong(v2);
...@@ -1013,7 +1059,7 @@ Box* longDiv(BoxedLong* v1, Box* _v2) { ...@@ -1013,7 +1059,7 @@ Box* longDiv(BoxedLong* v1, Box* _v2) {
if (isSubclass(_v2->cls, long_cls)) { if (isSubclass(_v2->cls, long_cls)) {
BoxedLong* v2 = static_cast<BoxedLong*>(_v2); BoxedLong* v2 = static_cast<BoxedLong*>(_v2);
if (mpz_cmp_si(v2->n, 0) == 0) if (mpz_sgn(v2->n) == 0)
raiseExcHelper(ZeroDivisionError, "long division or modulo by zero"); raiseExcHelper(ZeroDivisionError, "long division or modulo by zero");
BoxedLong* r = new BoxedLong(); BoxedLong* r = new BoxedLong();
...@@ -1049,7 +1095,7 @@ Box* longMod(BoxedLong* v1, Box* _v2) { ...@@ -1049,7 +1095,7 @@ Box* longMod(BoxedLong* v1, Box* _v2) {
if (isSubclass(_v2->cls, long_cls)) { if (isSubclass(_v2->cls, long_cls)) {
BoxedLong* v2 = static_cast<BoxedLong*>(_v2); BoxedLong* v2 = static_cast<BoxedLong*>(_v2);
if (mpz_cmp_si(v2->n, 0) == 0) if (mpz_sgn(v2->n) == 0)
raiseExcHelper(ZeroDivisionError, "long division or modulo by zero"); raiseExcHelper(ZeroDivisionError, "long division or modulo by zero");
BoxedLong* r = new BoxedLong(); BoxedLong* r = new BoxedLong();
...@@ -1095,7 +1141,7 @@ extern "C" Box* longDivmod(BoxedLong* lhs, Box* _rhs) { ...@@ -1095,7 +1141,7 @@ extern "C" Box* longDivmod(BoxedLong* lhs, Box* _rhs) {
if (isSubclass(_rhs->cls, long_cls)) { if (isSubclass(_rhs->cls, long_cls)) {
BoxedLong* rhs = static_cast<BoxedLong*>(_rhs); BoxedLong* rhs = static_cast<BoxedLong*>(_rhs);
if (mpz_cmp_si(rhs->n, 0) == 0) if (mpz_sgn(rhs->n) == 0)
raiseExcHelper(ZeroDivisionError, "long division or modulo by zero"); raiseExcHelper(ZeroDivisionError, "long division or modulo by zero");
BoxedLong* q = new BoxedLong(); BoxedLong* q = new BoxedLong();
...@@ -1126,7 +1172,7 @@ Box* longRdiv(BoxedLong* v1, Box* _v2) { ...@@ -1126,7 +1172,7 @@ Box* longRdiv(BoxedLong* v1, Box* _v2) {
raiseExcHelper(TypeError, "descriptor '__rdiv__' requires a 'long' object but received a '%s'", raiseExcHelper(TypeError, "descriptor '__rdiv__' requires a 'long' object but received a '%s'",
getTypeName(v1)); getTypeName(v1));
if (mpz_cmp_si(v1->n, 0) == 0) if (mpz_sgn(v1->n) == 0)
raiseExcHelper(ZeroDivisionError, "long division or modulo by zero"); raiseExcHelper(ZeroDivisionError, "long division or modulo by zero");
if (isSubclass(_v2->cls, long_cls)) { if (isSubclass(_v2->cls, long_cls)) {
...@@ -1255,7 +1301,7 @@ Box* longNonzero(BoxedLong* self) { ...@@ -1255,7 +1301,7 @@ Box* longNonzero(BoxedLong* self) {
raiseExcHelper(TypeError, "descriptor '__pow__' requires a 'long' object but received a '%s'", raiseExcHelper(TypeError, "descriptor '__pow__' requires a 'long' object but received a '%s'",
getTypeName(self)); getTypeName(self));
if (mpz_cmp_si(self->n, 0) == 0) if (mpz_sgn(self->n) == 0)
return False; return False;
return True; return True;
} }
......
...@@ -89,3 +89,5 @@ for i1 in [1, I(2), 3, I(4)]: ...@@ -89,3 +89,5 @@ for i1 in [1, I(2), 3, I(4)]:
print -i1, +i1, ~i1, i1 < i2, i1 <= i2, i1 == i2, i1 > i2, i1 >= i2, i1 != i2, i1 | i2, i1 ^ i2, i1 & i2, i1 * i2, i1 + i2, i1 / i2, i1 - i2, i1 ** i2, i1 // i2 print -i1, +i1, ~i1, i1 < i2, i1 <= i2, i1 == i2, i1 > i2, i1 >= i2, i1 != i2, i1 | i2, i1 ^ i2, i1 & i2, i1 * i2, i1 + i2, i1 / i2, i1 - i2, i1 ** i2, i1 // i2
print int("12345", base=16) print int("12345", base=16)
print type(2 ** 48)
...@@ -2,3 +2,18 @@ import struct ...@@ -2,3 +2,18 @@ import struct
s = struct.pack("II", 1, 1234) s = struct.pack("II", 1, 1234)
print repr(s) print repr(s)
print struct.unpack("II", s) print struct.unpack("II", s)
nums = [0, 0x98, -0x12, 0x9876, -0x1234, 0x98765432, -0x12345678, 0x9876543212345678, -0x1234567812345678]
for exp in 7, 8, 15, 16, 31, 32, 63, 64:
nums += [2 ** exp, 2 ** exp - 1, -2 ** exp, -2 ** exp - 1]
for format in "bB?hHiIlLqQP":
for order in [""] + list("@=<>!"):
for num in nums:
try:
spec = "%s%s" % (order, format)
print (spec, hex(num)), repr(struct.pack(spec, num))
except struct.error as e:
print "struct.error:", e
except OverflowError as e:
print "OverflowError:", e
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment