const CHAR_BIT = 8; const du_int = c_ulonglong; const di_int = c_longlong; const si_int = c_int; const su_int = c_uint; const udwords = [2]su_int; const low = if (@compile_var("is_big_endian")) 1 else 0; const high = 1 - low; export fn __udivdi3(a: du_int, b: du_int) -> du_int { return __udivmoddi4(a, b, null); } fn du_int_to_udwords(x: du_int) -> udwords { // TODO ability to take address of params const x2 = x; return *(&udwords)(&x2); } export fn __udivmoddi4(a: du_int, b: du_int, maybe_rem: ?&du_int) -> du_int { const n_uword_bits = @sizeof(su_int) * CHAR_BIT; const n_udword_bits = @sizeof(du_int) * CHAR_BIT; var n = du_int_to_udwords(a); var d = du_int_to_udwords(b); var q: udwords = undefined; var r: udwords = undefined; var sr: c_uint = undefined; /* special cases, X is unknown, K != 0 */ if (n[high] == 0) { if (d[high] == 0) { /* 0 X * --- * 0 X */ if (const rem ?= maybe_rem) { *rem = n[low] % d[low]; } return n[low] / d[low]; } /* 0 X * --- * K X */ if (const rem ?= maybe_rem) { *rem = n[low]; } return 0; } /* n[high] != 0 */ if (d[low] == 0) { if (d[high] == 0) { /* K X * --- * 0 0 */ if (var rem ?= maybe_rem) { *rem = n[high] % d[low]; } return n[high] / d[low]; } /* d[high] != 0 */ if (n[low] == 0) { /* K 0 * --- * K 0 */ if (var rem ?= maybe_rem) { r[high] = n[high] % d[high]; r[low] = 0; *rem = *(&du_int)(&r[0]); } return n[high] / d[high]; } /* K K * --- * K 0 */ // if d is a power of 2 if ((d[high] & (d[high] - 1)) == 0) { if (var rem ?= maybe_rem) { r[low] = n[low]; r[high] = n[high] & (d[high] - 1); *rem = *(&du_int)(&r[0]); } return n[high] >> @ctz(@typeof(d[high]), d[high]); } /* K K * --- * K 0 */ sr = @clz(su_int, d[high]) - @clz(su_int, n[high]); /* 0 <= sr <= n_uword_bits - 2 or sr large */ if (sr > n_uword_bits - 2) { if (var rem ?= maybe_rem) { *rem = *(&du_int)(&n[0]); } return 0; } sr += 1; /* 1 <= sr <= n_uword_bits - 1 */ /* q.all = n.all << (n_udword_bits - sr); */ q[low] = 0; q[high] = n[low] << (n_uword_bits - sr); /* r.all = n.all >> sr; */ r[high] = n[high] >> sr; r[low] = (n[high] << (n_uword_bits - sr)) | (n[low] >> sr); } else { /* d[low] != 0 */ if (d[high] == 0) { /* K X * --- * 0 K */ /* if d is a power of 2 */ if ((d[low] & (d[low] - 1)) == 0) { if (var rem ?= maybe_rem) { *rem = n[low] & (d[low] - 1); } if (d[low] == 1) { return *(&du_int)(&n[0]); } sr = @ctz(@typeof(d[low]), d[low]); q[high] = n[high] >> sr; q[low] = (n[high] << (n_uword_bits - sr)) | (n[low] >> sr); return *(&du_int)(&q[0]); } /* K X * --- * 0 K */ sr = 1 + n_uword_bits + @clz(su_int, d[low]) - @clz(su_int, n[high]); /* 2 <= sr <= n_udword_bits - 1 * q.all = n.all << (n_udword_bits - sr); * r.all = n.all >> sr; */ if (sr == n_uword_bits) { q[low] = 0; q[high] = n[low]; r[high] = 0; r[low] = n[high]; } else if (sr < n_uword_bits) { // 2 <= sr <= n_uword_bits - 1 q[low] = 0; q[high] = n[low] << (n_uword_bits - sr); r[high] = n[high] >> sr; r[low] = (n[high] << (n_uword_bits - sr)) | (n[low] >> sr); } else { // n_uword_bits + 1 <= sr <= n_udword_bits - 1 q[low] = n[low] << (n_udword_bits - sr); q[high] = (n[high] << (n_udword_bits - sr)) | (n[low] >> (sr - n_uword_bits)); r[high] = 0; r[low] = n[high] >> (sr - n_uword_bits); } } else { /* K X * --- * K K */ sr = @clz(su_int, d[high]) - @clz(su_int, n[high]); /* 0 <= sr <= n_uword_bits - 1 or sr large */ if (sr > n_uword_bits - 1) { if (var rem ?= maybe_rem) { *rem = *(&du_int)(&n[0]); } return 0; } sr += 1; /* 1 <= sr <= n_uword_bits */ /* q.all = n.all << (n_udword_bits - sr); */ q[low] = 0; if (sr == n_uword_bits) { q[high] = n[low]; r[high] = 0; r[low] = n[high]; } else { q[high] = n[low] << (n_uword_bits - sr); r[high] = n[high] >> sr; r[low] = (n[high] << (n_uword_bits - sr)) | (n[low] >> sr); } } } /* Not a special case * q and r are initialized with: * q.all = n.all << (n_udword_bits - sr); * r.all = n.all >> sr; * 1 <= sr <= n_udword_bits - 1 */ var carry: su_int = 0; while (sr > 0) { /* r:q = ((r:q) << 1) | carry */ r[high] = (r[high] << 1) | (r[low] >> (n_uword_bits - 1)); r[low] = (r[low] << 1) | (q[high] >> (n_uword_bits - 1)); q[high] = (q[high] << 1) | (q[low] >> (n_uword_bits - 1)); q[low] = (q[low] << 1) | carry; /* carry = 0; * if (r.all >= d.all) * { * r.all -= d.all; * carry = 1; * } */ const s: di_int = (di_int)(*(&du_int)(&d[0]) - *(&du_int)(&r[0]) - 1) >> (n_udword_bits - 1); carry = su_int(s & 1); *(&du_int)(&r[0]) -= *(&du_int)(&d[0]) & c_ulonglong(s); sr -= 1; } *(&du_int)(&q[0]) = (*(&du_int)(&q[0]) << 1) | carry; if (var rem ?= maybe_rem) { *rem = *(&du_int)(&r[0]); } return *(&du_int)(&q[0]); } export fn __umoddi3(a: du_int, b: du_int) -> du_int { var r: du_int = undefined; __udivmoddi4(a, b, &r); return r; } #attribute("test") fn test_umoddi3() { test_one_umoddi3(0, 1, 0); test_one_umoddi3(2, 1, 0); test_one_umoddi3(0x8000000000000000, 1, 0x0); test_one_umoddi3(0x8000000000000000, 2, 0x0); test_one_umoddi3(0xFFFFFFFFFFFFFFFF, 2, 0x1); } fn test_one_umoddi3(a: du_int, b: du_int, expected_r: du_int) { const r = __umoddi3(a, b); assert(r == expected_r); } #attribute("test") fn test_udivmoddi4() { const cases = [][4]du_int { []du_int{0x0000000000000000, 0x0000000000000001, 0x0000000000000000, 0x0000000000000000}, []du_int{0x0000000080000000, 0x0000000100000001, 0x0000000000000000, 0x0000000080000000}, []du_int{0x7FFFFFFF00000001, 0x0000000000000001, 0x7FFFFFFF00000001, 0x0000000000000000}, []du_int{0x7FFFFFFF7FFFFFFF, 0xFFFFFFFFFFFFFFFF, 0x0000000000000000, 0x7FFFFFFF7FFFFFFF}, []du_int{0x8000000000000002, 0xFFFFFFFFFFFFFFFE, 0x0000000000000000, 0x8000000000000002}, []du_int{0x80000000FFFFFFFD, 0xFFFFFFFFFFFFFFFD, 0x0000000000000000, 0x80000000FFFFFFFD}, []du_int{0xFFFFFFFD00000010, 0xFFFFFFFF80000000, 0x0000000000000000, 0xFFFFFFFD00000010}, []du_int{0xFFFFFFFDFFFFFFFF, 0xFFFFFFFF7FFFFFFF, 0x0000000000000000, 0xFFFFFFFDFFFFFFFF}, []du_int{0xFFFFFFFE0747AE14, 0xFFFFFFFF0747AE14, 0x0000000000000000, 0xFFFFFFFE0747AE14}, []du_int{0xFFFFFFFF00000001, 0xFFFFFFFF078644FA, 0x0000000000000000, 0xFFFFFFFF00000001}, []du_int{0xFFFFFFFF80000000, 0xFFFFFFFF00000010, 0x0000000000000001, 0x000000007FFFFFF0}, []du_int{0xFFFFFFFFFFFFFFFF, 0xFFFFFFFFFFFFFFFF, 0x0000000000000001, 0x0000000000000000}, }; for (cases) |case| { test_one_udivmoddi4(case[0], case[1], case[2], case[3]); } } fn test_one_udivmoddi4(a: du_int, b: du_int, expected_q: du_int, expected_r: du_int) { var r: du_int = undefined; const q = __udivmoddi4(a, b, &r); assert(q == expected_q); assert(r == expected_r); } fn assert(b: bool) { if (!b) unreachable{}; }