py/mpz: Fix bugs with bitwise of -0 by ensuring all 0's are positive.

This commit makes sure that the value zero is always encoded in an mpz_t as neg=0 and len=0 (previously it was just len=0). This invariant is needed for some of the bitwise operations that operate on negative numbers, because they cannot handle -0. For example (-((1<<100)-(1<<100)))|1 was being computed as -65535, instead of 1. Fixes issue #8042. Signed-off-by: Damien George <damien@micropython.org>
2021-11-30 00:31:46 +11:00 · 2021-11-30 00:31:46 +11:00 · 2c139bbf4e
parent 05bea70979
commit 2c139bbf4e
3 changed files with 52 additions and 11 deletions
--- a/py/mpz.c
+++ b/py/mpz.c
@ -713,6 +713,7 @@ void mpz_set(mpz_t *dest, const mpz_t *src) {

 void mpz_set_from_int(mpz_t *z, mp_int_t val) {
    if (val == 0) {
+        z->neg = 0;
        z->len = 0;
        return;
    }
@ -899,10 +900,6 @@ bool mpz_is_even(const mpz_t *z) {
 #endif

 int mpz_cmp(const mpz_t *z1, const mpz_t *z2) {
-    // to catch comparison of -0 with +0
-    if (z1->len == 0 && z2->len == 0) {
-        return 0;
-    }
    int cmp = (int)z2->neg - (int)z1->neg;
    if (cmp != 0) {
        return cmp;
@ -1052,7 +1049,9 @@ void mpz_neg_inpl(mpz_t *dest, const mpz_t *z) {
    if (dest != z) {
        mpz_set(dest, z);
    }
-    dest->neg = 1 - dest->neg;
+    if (dest->len) {
+        dest->neg = 1 - dest->neg;
+    }
 }

 /* computes dest = ~z (= -z - 1)
@ -1148,7 +1147,7 @@ void mpz_add_inpl(mpz_t *dest, const mpz_t *lhs, const mpz_t *rhs) {
        dest->len = mpn_sub(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len);
    }

-    dest->neg = lhs->neg;
+    dest->neg = lhs->neg & !!dest->len;
 }

 /* computes dest = lhs - rhs
@ -1172,7 +1171,9 @@ void mpz_sub_inpl(mpz_t *dest, const mpz_t *lhs, const mpz_t *rhs) {
        dest->len = mpn_sub(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len);
    }

-    if (neg) {
+    if (dest->len == 0) {
+        dest->neg = 0;
+    } else if (neg) {
        dest->neg = 1 - lhs->neg;
    } else {
        dest->neg = lhs->neg;
@ -1484,14 +1485,16 @@ void mpz_divmod_inpl(mpz_t *dest_quo, mpz_t *dest_rem, const mpz_t *lhs, const m

    mpz_need_dig(dest_quo, lhs->len + 1); // +1 necessary?
    memset(dest_quo->dig, 0, (lhs->len + 1) * sizeof(mpz_dig_t));
+    dest_quo->neg = 0;
    dest_quo->len = 0;
    mpz_need_dig(dest_rem, lhs->len + 1); // +1 necessary?
    mpz_set(dest_rem, lhs);
    mpn_div(dest_rem->dig, &dest_rem->len, rhs->dig, rhs->len, dest_quo->dig, &dest_quo->len);
+    dest_rem->neg &= !!dest_rem->len;

    // check signs and do Python style modulo
    if (lhs->neg != rhs->neg) {
-        dest_quo->neg = 1;
+        dest_quo->neg = !!dest_quo->len;
        if (!mpz_is_zero(dest_rem)) {
            mpz_t mpzone;
            mpz_init_from_int(&mpzone, -1);
--- a/py/mpz.h
+++ b/py/mpz.h
@ -91,6 +91,7 @@ typedef int8_t mpz_dbl_dig_signed_t;
 #define MPZ_NUM_DIG_FOR_LL ((sizeof(long long) * 8 + MPZ_DIG_SIZE - 1) / MPZ_DIG_SIZE)

 typedef struct _mpz_t {
+    // Zero has neg=0, len=0.  Negative zero is not allowed.
    size_t neg : 1;
    size_t fixed_dig : 1;
    size_t alloc : (8 * sizeof(size_t) - 2);
@ -119,7 +120,7 @@ static inline bool mpz_is_zero(const mpz_t *z) {
    return z->len == 0;
 }
 static inline bool mpz_is_neg(const mpz_t *z) {
-    return z->len != 0 && z->neg != 0;
+    return z->neg != 0;
 }
 int mpz_cmp(const mpz_t *lhs, const mpz_t *rhs);

--- a/tests/basics/int_big_zeroone.py
+++ b/tests/basics/int_big_zeroone.py
@ -1,4 +1,4 @@
-# test [0,-0,1,-1] edge cases of bignum
+# test [0,1,-1] edge cases of bignum

 long_zero = (2**64) >> 65
 long_neg_zero = -long_zero
@ -13,7 +13,7 @@ print([~c for c in cases])
 print([c >> 1 for c in cases])
 print([c << 1 for c in cases])

-# comparison of 0/-0/+0
+# comparison of 0
 print(long_zero == 0)
 print(long_neg_zero == 0)
 print(long_one - 1 == 0)
@ -26,3 +26,40 @@ print(long_neg_zero < 1)
 print(long_neg_zero < -1)
 print(long_neg_zero > 1)
 print(long_neg_zero > -1)
+
+# generate zeros that involve negative numbers
+large = 1 << 70
+large_plus_one = large + 1
+zeros = (
+    large - large,
+    -large + large,
+    large + -large,
+    -(large - large),
+    large - large_plus_one + 1,
+    -large & (large - large),
+    -large ^ -large,
+    -large * (large - large),
+    (large - large) // -large,
+    -large // -large_plus_one,
+    -(large + large) % large,
+    (large + large) % -large,
+    -(large + large) % -large,
+)
+print(zeros)
+
+# compute arithmetic operations that may have problems with -0
+# (this checks that -0 is never generated in the zeros tuple)
+cases = (0, 1, -1) + zeros
+for lhs in cases:
+    print("-{} = {}".format(lhs, -lhs))
+    print("~{} = {}".format(lhs, ~lhs))
+    print("{} >> 1 = {}".format(lhs, lhs >> 1))
+    print("{} << 1 = {}".format(lhs, lhs << 1))
+    for rhs in cases:
+        print("{} == {} = {}".format(lhs, rhs, lhs == rhs))
+        print("{} + {} = {}".format(lhs, rhs, lhs + rhs))
+        print("{} - {} = {}".format(lhs, rhs, lhs - rhs))
+        print("{} * {} = {}".format(lhs, rhs, lhs * rhs))
+        print("{} | {} = {}".format(lhs, rhs, lhs | rhs))
+        print("{} & {} = {}".format(lhs, rhs, lhs & rhs))
+        print("{} ^ {} = {}".format(lhs, rhs, lhs ^ rhs))