commit 2e0524954405e05d8b2bfa4a15c293f26a4a080d (tree)
parent 10c97c26d964ea70230341468e05fdea533a77a3
Author: Matthew Lugg <mlugg@mlugg.co.uk>
Date: Sun, 21 Jun 2026 18:44:08 +0100
compiler_rt: update for new `@bitCast` semantics
Diffstat:
4 files changed, 71 insertions(+), 52 deletions(-)
diff --git a/lib/compiler_rt/float_from_int.zig b/lib/compiler_rt/float_from_int.zig
@@ -64,10 +64,21 @@ inline fn limb(limbs: []const u32, index: usize) u32 {
pub inline fn floatFromBigInt(comptime T: type, comptime signedness: std.builtin.Signedness, x: []const u32) T {
switch (x.len) {
0 => return 0,
- inline 1...4 => |limbs_len| return @floatFromInt(@as(
- @Int(signedness, 32 * limbs_len),
- @bitCast(x[0..limbs_len].*),
- )),
+ inline 1...4 => |limbs_len| {
+ const low_to_high: [limbs_len]u32 = switch (@import("builtin").cpu.arch.endian()) {
+ .little => x[0..limbs_len].*,
+ .big => switch (limbs_len) {
+ 1 => .{x[0]},
+ 2 => .{ x[1], x[0] },
+ 3 => .{ x[2], x[1], x[0] },
+ 4 => .{ x[3], x[2], x[1], x[0] },
+ else => comptime unreachable,
+ },
+ };
+ const I = @Int(signedness, 32 * limbs_len);
+ const int: I = @bitCast(low_to_high);
+ return @floatFromInt(int);
+ },
else => {},
}
diff --git a/lib/compiler_rt/int_from_float.zig b/lib/compiler_rt/int_from_float.zig
@@ -80,10 +80,18 @@ pub inline fn bigIntFromFloat(comptime signedness: std.builtin.Signedness, resul
switch (result.len) {
0 => return,
inline 1...4 => |limbs_len| {
- result[0..limbs_len].* = @bitCast(@as(
- @Int(signedness, 32 * limbs_len),
- @intFromFloat(a),
- ));
+ const I = @Int(signedness, 32 * limbs_len);
+ const low_to_high: [limbs_len]u32 = @bitCast(@as(I, @intFromFloat(a)));
+ result[0..limbs_len].* = switch (@import("builtin").cpu.arch.endian()) {
+ .little => low_to_high,
+ .big => switch (limbs_len) {
+ 1 => .{low_to_high[0]},
+ 2 => .{ low_to_high[1], low_to_high[0] },
+ 3 => .{ low_to_high[2], low_to_high[1], low_to_high[0] },
+ 4 => .{ low_to_high[3], low_to_high[2], low_to_high[1], low_to_high[0] },
+ else => comptime unreachable,
+ },
+ };
return;
},
else => {},
diff --git a/lib/compiler_rt/limb64.zig b/lib/compiler_rt/limb64.zig
@@ -75,7 +75,17 @@ fn asLimbs(v: anytype) Limbs(@TypeOf(v)) {
const int_info = @typeInfo(T).int;
const limb_cnt = comptime limbCount(int_info.bits);
const ET = @Int(int_info.signedness, limb_cnt * 64);
- return @bitCast(@as(ET, v));
+ const low_to_high: Limbs(T) = @bitCast(@as(ET, v));
+ switch (endian) {
+ .little => return low_to_high,
+ .big => {
+ var swapped: Limbs(T) = undefined;
+ for (low_to_high, 0..) |x, i| {
+ swapped[limb_cnt - i - 1] = x;
+ }
+ return swapped;
+ },
+ }
}
fn limbWrap(limb: u64, is_signed: bool, bits: u16) u64 {
@@ -944,11 +954,7 @@ inline fn add3(x: *[3]u64, start: usize, v0: u64) void {
fn mulwide(a: u64, b: u64) [2]u64 {
const muldXi = @import("mulXi3.zig").muldXi;
- const limbs: [2]u64 = @bitCast(muldXi(u64, a, b));
- return switch (endian) {
- .little => limbs,
- .big => .{ limbs[1], limbs[0] },
- };
+ return @bitCast(muldXi(u64, a, b));
}
fn __mulo_limb64(out_ptr: [*]u64, a_ptr: [*]const u64, b_ptr: [*]const u64, is_signed: bool, bits: u16) callconv(.c) bool {
diff --git a/lib/compiler_rt/udivmod.zig b/lib/compiler_rt/udivmod.zig
@@ -61,12 +61,6 @@ pub fn __umodti3(a: u128, b: u128) callconv(.c) u128 {
return r;
}
-const lo = switch (builtin.cpu.arch.endian()) {
- .big => 1,
- .little => 0,
-};
-const hi = 1 - lo;
-
// Let _u1 and _u0 be the high and low limbs of U respectively.
// Returns U / v_ and sets r = U % v_.
fn divwide_generic(comptime T: type, _u1: T, _u0: T, v_: T, r: *T) T {
@@ -158,22 +152,22 @@ pub fn udivmod(comptime T: type, a_: T, b_: T, maybe_rem: ?*T) T {
return 0;
}
- const a: [2]HalfT = @bitCast(a_);
- const b: [2]HalfT = @bitCast(b_);
+ const a: [2]HalfT = @bitCast(a_); // [0] is low bits, [1] is high bits
+ const b: [2]HalfT = @bitCast(b_); // [0] is low bits, [1] is high bits
var q: [2]HalfT = undefined;
var r: [2]HalfT = undefined;
// When the divisor fits in 64 bits, we can use an optimized path
- if (b[hi] == 0) {
- r[hi] = 0;
- if (a[hi] < b[lo]) {
+ if (b[1] == 0) {
+ r[1] = 0;
+ if (a[1] < b[0]) {
// The result fits in 64 bits
- q[hi] = 0;
- q[lo] = divwide(HalfT, a[hi], a[lo], b[lo], &r[lo]);
+ q[1] = 0;
+ q[0] = divwide(HalfT, a[1], a[0], b[0], &r[0]);
} else {
// First, divide with the high part to get the remainder. After that a_hi < b_lo.
- q[hi] = a[hi] / b[lo];
- q[lo] = divwide(HalfT, a[hi] % b[lo], a[lo], b[lo], &r[lo]);
+ q[1] = a[1] / b[0];
+ q[0] = divwide(HalfT, a[1] % b[0], a[0], b[0], &r[0]);
}
if (maybe_rem) |rem| {
rem.* = @bitCast(r);
@@ -181,21 +175,21 @@ pub fn udivmod(comptime T: type, a_: T, b_: T, maybe_rem: ?*T) T {
return @bitCast(q);
}
- // Large-divisor case: b[hi] != 0, so the quotient fits in one HalfT word.
+ // Large-divisor case: b[1] != 0, so the quotient fits in one HalfT word.
//
// Trial quotient via divwide (Knuth Vol 2, Section 4.3.1):
// Normalize the divisor so its high half has the MSB set, then use divwide
// on the top bits to get a trial quotient that is at most 1 too large.
// This replaces the O(shift) bit-by-bit loop with O(1) operations.
- const s: Log2Int(HalfT) = @intCast(@clz(b[hi]));
+ const s: Log2Int(HalfT) = @intCast(@clz(b[1]));
if (s == 0) {
- // b[hi] already has its MSB set, so b >= 2^(T_bits - 1). Since a >= b
+ // b[1] already has its MSB set, so b >= 2^(T_bits - 1). Since a >= b
// (we passed the b_ > a_ check), a >= 2^(T_bits - 1) too, meaning
- // a[hi] also has its MSB set. Therefore a / b < 2, and the quotient
+ // a[1] also has its MSB set. Therefore a / b < 2, and the quotient
// is exactly 1.
q = @bitCast(@as(T, 0));
- q[lo] = 1;
+ q[0] = 1;
if (maybe_rem) |rem| {
rem.* = a_ - b_;
}
@@ -207,12 +201,12 @@ pub fn udivmod(comptime T: type, a_: T, b_: T, maybe_rem: ?*T) T {
std.math.IntFittingRange(0, half_bits),
@intCast(s),
));
- const bn_hi: HalfT = (b[hi] << s) | (b[lo] >> sr);
+ const bn_hi: HalfT = (b[1] << s) | (b[0] >> sr);
// Trial numerator: the top (half_bits + s) bits of (a << s), as [a2:a1].
// a2 < bn_hi is guaranteed since a2 < 2^s and bn_hi >= 2^(half_bits - 1).
- const a2: HalfT = a[hi] >> sr;
- const a1: HalfT = (a[hi] << s) | (a[lo] >> sr);
+ const a2: HalfT = a[1] >> sr;
+ const a1: HalfT = (a[1] << s) | (a[0] >> sr);
// Trial quotient via divwide: q_hat = floor([a2:a1] / bn_hi).
// By Knuth's theorem (normalized divisor), q <= q_hat <= q + 1.
@@ -223,42 +217,42 @@ pub fn udivmod(comptime T: type, a_: T, b_: T, maybe_rem: ?*T) T {
// Compute the product using HalfT * HalfT -> T widening multiplications,
// which are native single-instruction ops when HalfT fits in a register
// (e.g. u64 * u64 -> u128 via mulq on x86_64, mul on aarch64).
- // product = q_hat * [b[hi]:b[lo]] = [p_top : p_mid : p_lo] (3 half-words)
- const prod_lo: T = @as(T, q_hat) * @as(T, b[lo]);
- const prod_hi: T = @as(T, q_hat) * @as(T, b[hi]);
+ // product = q_hat * [b[1]:b[0]] = [p_top : p_mid : p_lo] (3 half-words)
+ const prod_lo: T = @as(T, q_hat) * @as(T, b[0]);
+ const prod_hi: T = @as(T, q_hat) * @as(T, b[1]);
const prod_lo_parts: [2]HalfT = @bitCast(prod_lo);
const prod_hi_parts: [2]HalfT = @bitCast(prod_hi);
- const mid_add = @addWithOverflow(prod_hi_parts[lo], prod_lo_parts[hi]);
+ const mid_add = @addWithOverflow(prod_hi_parts[0], prod_lo_parts[1]);
var p_mid: HalfT = mid_add[0];
- const p_top: HalfT = prod_hi_parts[hi] +% @as(HalfT, mid_add[1]);
- var p_lo: HalfT = prod_lo_parts[lo];
+ const p_top: HalfT = prod_hi_parts[1] +% @as(HalfT, mid_add[1]);
+ var p_lo: HalfT = prod_lo_parts[0];
// If product > a, decrement q_hat (at most once, guaranteed by Knuth).
- if (p_top > 0 or p_mid > a[hi] or (p_mid == a[hi] and p_lo > a[lo])) {
+ if (p_top > 0 or p_mid > a[1] or (p_mid == a[1] and p_lo > a[0])) {
q_hat -= 1;
// Subtract b from the product for correct remainder computation.
// After correction, (q_hat * b) fits in T bits, so borrows into
// p_top cancel it to zero -- we only need [p_mid:p_lo].
- const sub_lo = @subWithOverflow(p_lo, b[lo]);
+ const sub_lo = @subWithOverflow(p_lo, b[0]);
p_lo = sub_lo[0];
- const sub_mid = @subWithOverflow(p_mid, b[hi]);
+ const sub_mid = @subWithOverflow(p_mid, b[1]);
const sub_mid2 = @subWithOverflow(sub_mid[0], @as(HalfT, sub_lo[1]));
p_mid = sub_mid2[0];
}
q = @bitCast(@as(T, 0));
- q[lo] = q_hat;
+ q[0] = q_hat;
if (maybe_rem) |rem| {
- // remainder = a - q_hat * b = [a[hi]:a[lo]] - [p_mid:p_lo]
+ // remainder = a - q_hat * b = [a[1]:a[0]] - [p_mid:p_lo]
// This subtraction is non-negative since q_hat <= true quotient.
- const rem_lo = @subWithOverflow(a[lo], p_lo);
- r[lo] = rem_lo[0];
- const rem_hi = @subWithOverflow(a[hi], p_mid);
+ const rem_lo = @subWithOverflow(a[0], p_lo);
+ r[0] = rem_lo[0];
+ const rem_hi = @subWithOverflow(a[1], p_mid);
const rem_hi2 = @subWithOverflow(rem_hi[0], @as(HalfT, rem_lo[1]));
- r[hi] = rem_hi2[0];
+ r[1] = rem_hi2[0];
rem.* = @bitCast(r);
}
return @bitCast(q);