const std = @import("std"); const builtin = @import("builtin"); const math = std.math; const compiler_rt = @import("../compiler_rt.zig"); const symbol = compiler_rt.symbol; comptime { symbol(&__mulosi4, "__mulosi4"); symbol(&__mulodi4, "__mulodi4"); symbol(&__muloti4, "__muloti4"); } // mulo - multiplication overflow // * return a*%b. // * return if a*b overflows => 1 else => 0 // - muloXi4_genericSmall as default // - muloXi4_genericFast for 2*bitsize <= usize inline fn muloXi4_genericSmall(comptime ST: type, a: ST, b: ST, overflow: *c_int) ST { overflow.* = 0; const min = math.minInt(ST); const res: ST = if (ST == i128 and builtin.target.cpu.arch.isWasm()) res: { // Despite compiler-rt being built with `-fno-builtin`, LLVM still converts this function to // a call to `__muloti4` on WASM. This is an upstream bug: circumvent it by directly calling // the "lower-level" compiler-rt routine for this wrapping multiplication. break :res @import("mulXi3.zig").__multi3(a, b); } else a *% b; // Hacker's Delight section Overflow subsection Multiplication // case a=-2^{31}, b=-1 problem, because // on some machines a*b = -2^{31} with overflow // Then -2^{31}/-1 overflows and any result is possible. // => check with a<0 and b=-2^{31} if ((a < 0 and b == min) or (a != 0 and @divTrunc(res, a) != b)) overflow.* = 1; return res; } inline fn muloXi4_genericFast(comptime ST: type, a: ST, b: ST, overflow: *c_int) ST { overflow.* = 0; const EST = switch (ST) { i32 => i64, i64 => i128, i128 => i256, else => unreachable, }; const min = math.minInt(ST); const max = math.maxInt(ST); const res: EST = @as(EST, a) * @as(EST, b); //invariant: -2^{bitwidth(EST)} < res < 2^{bitwidth(EST)-1} if (res < min or max < res) overflow.* = 1; return @as(ST, @truncate(res)); } pub fn __mulosi4(a: i32, b: i32, overflow: *c_int) callconv(.c) i32 { if (2 * @bitSizeOf(i32) <= @bitSizeOf(usize)) { return muloXi4_genericFast(i32, a, b, overflow); } else { return muloXi4_genericSmall(i32, a, b, overflow); } } pub fn __mulodi4(a: i64, b: i64, overflow: *c_int) callconv(.c) i64 { if (2 * @bitSizeOf(i64) <= @bitSizeOf(usize)) { return muloXi4_genericFast(i64, a, b, overflow); } else { return muloXi4_genericSmall(i64, a, b, overflow); } } pub fn __muloti4(a: i128, b: i128, overflow: *c_int) callconv(.c) i128 { if (2 * @bitSizeOf(i128) <= @bitSizeOf(usize)) { return muloXi4_genericFast(i128, a, b, overflow); } else { return muloXi4_genericSmall(i128, a, b, overflow); } } test { _ = @import("mulosi4_test.zig"); _ = @import("mulodi4_test.zig"); _ = @import("muloti4_test.zig"); }