Move leb128 and remove trivial *mem functions as discussed in #5588 (#6876) - zig

commit 48d60834fd61404ea009f7f970775f9c59de1240 (tree)
parent d9c36cb2506f1b8cb30c7e9e108c6005eea7cf66
Author: tgschultz <tgschultz@gmail.com>
Date:   Mon, 16 Nov 2020 17:51:54 -0600

Move leb128 and remove trivial *mem functions as discussed in #5588 (#6876)

* Move leb128 out of debug and remove trivial *mem functions as discussed in #5588

* Turns out one of the *Mem functions was used by MachO. Replaced with trivial use of FixedBufferStream.

Diffstat:
M lib/std/debug.zig  | 7 -------
D lib/std/debug/leb128.zig  | 441 -------------------------------------------------------------------------------
M lib/std/dwarf.zig  | 2 +-
A lib/std/leb128.zig  | 374 +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
M lib/std/std.zig  | 1 +
M src/codegen.zig  | 2 +-
M src/codegen/wasm.zig  | 2 +-
M src/link/Elf.zig  | 2 +-
M src/link/MachO/Trie.zig  | 19 +++++++++++--------
M src/link/Wasm.zig  | 2 +-

10 files changed, 391 insertions(+), 461 deletions(-)
diff --git a/lib/std/debug.zig b/lib/std/debug.zig
@@ -22,8 +22,6 @@ const maxInt = std.math.maxInt;
 const File = std.fs.File;
 const windows = std.os.windows;
 
-pub const leb = @import("debug/leb128.zig");
-
 pub const runtime_safety = switch (builtin.mode) {
     .Debug, .ReleaseSafe => true,
     .ReleaseFast, .ReleaseSmall => false,
@@ -1843,8 +1841,3 @@ pub fn dumpStackPointerAddr(prefix: []const u8) void {
     );
     std.debug.warn("{} sp = 0x{x}\n", .{ prefix, sp });
 }
-
-// Reference everything so it gets tested.
-test "" {
-    _ = leb;
-}
diff --git a/lib/std/debug/leb128.zig b/lib/std/debug/leb128.zig
@@ -1,441 +0,0 @@
-// SPDX-License-Identifier: MIT
-// Copyright (c) 2015-2020 Zig Contributors
-// This file is part of [zig](https://ziglang.org/), which is MIT licensed.
-// The MIT license requires this copyright notice to be included in all copies
-// and substantial portions of the software.
-const std = @import("std");
-const testing = std.testing;
-
-/// Read a single unsigned LEB128 value from the given reader as type T,
-/// or error.Overflow if the value cannot fit.
-pub fn readULEB128(comptime T: type, reader: anytype) !T {
-    const U = if (@typeInfo(T).Int.bits < 8) u8 else T;
-    const ShiftT = std.math.Log2Int(U);
-
-    const max_group = (@typeInfo(U).Int.bits + 6) / 7;
-
-    var value = @as(U, 0);
-    var group = @as(ShiftT, 0);
-
-    while (group < max_group) : (group += 1) {
-        const byte = try reader.readByte();
-        var temp = @as(U, byte & 0x7f);
-
-        if (@shlWithOverflow(U, temp, group * 7, &temp)) return error.Overflow;
-
-        value |= temp;
-        if (byte & 0x80 == 0) break;
-    } else {
-        return error.Overflow;
-    }
-
-    // only applies in the case that we extended to u8
-    if (U != T) {
-        if (value > std.math.maxInt(T)) return error.Overflow;
-    }
-
-    return @truncate(T, value);
-}
-
-/// Write a single unsigned integer as unsigned LEB128 to the given writer.
-pub fn writeULEB128(writer: anytype, uint_value: anytype) !void {
-    const T = @TypeOf(uint_value);
-    const U = if (@typeInfo(T).Int.bits < 8) u8 else T;
-    var value = @intCast(U, uint_value);
-
-    while (true) {
-        const byte = @truncate(u8, value & 0x7f);
-        value >>= 7;
-        if (value == 0) {
-            try writer.writeByte(byte);
-            break;
-        } else {
-            try writer.writeByte(byte | 0x80);
-        }
-    }
-}
-
-/// Read a single unsigned integer from the given memory as type T.
-/// The provided slice reference will be updated to point to the byte after the last byte read.
-pub fn readULEB128Mem(comptime T: type, ptr: *[]const u8) !T {
-    var buf = std.io.fixedBufferStream(ptr.*);
-    const value = try readULEB128(T, buf.reader());
-    ptr.*.ptr += buf.pos;
-    return value;
-}
-
-/// Write a single unsigned LEB128 integer to the given memory as unsigned LEB128,
-/// returning the number of bytes written.
-pub fn writeULEB128Mem(ptr: []u8, uint_value: anytype) !usize {
-    const T = @TypeOf(uint_value);
-    const max_group = (@typeInfo(T).Int.bits + 6) / 7;
-    var buf = std.io.fixedBufferStream(ptr);
-    try writeULEB128(buf.writer(), uint_value);
-    return buf.pos;
-}
-
-/// Read a single signed LEB128 value from the given reader as type T,
-/// or error.Overflow if the value cannot fit.
-pub fn readILEB128(comptime T: type, reader: anytype) !T {
-    const S = if (@typeInfo(T).Int.bits < 8) i8 else T;
-    const U = std.meta.Int(.unsigned, @typeInfo(S).Int.bits);
-    const ShiftU = std.math.Log2Int(U);
-
-    const max_group = (@typeInfo(U).Int.bits + 6) / 7;
-
-    var value = @as(U, 0);
-    var group = @as(ShiftU, 0);
-
-    while (group < max_group) : (group += 1) {
-        const byte = try reader.readByte();
-        var temp = @as(U, byte & 0x7f);
-
-        const shift = group * 7;
-        if (@shlWithOverflow(U, temp, shift, &temp)) {
-            // Overflow is ok so long as the sign bit is set and this is the last byte
-            if (byte & 0x80 != 0) return error.Overflow;
-            if (@bitCast(S, temp) >= 0) return error.Overflow;
-
-            // and all the overflowed bits are 1
-            const remaining_shift = @intCast(u3, @typeInfo(U).Int.bits - @as(u16, shift));
-            const remaining_bits = @bitCast(i8, byte | 0x80) >> remaining_shift;
-            if (remaining_bits != -1) return error.Overflow;
-        }
-
-        value |= temp;
-        if (byte & 0x80 == 0) {
-            const needs_sign_ext = group + 1 < max_group;
-            if (byte & 0x40 != 0 and needs_sign_ext) {
-                const ones = @as(S, -1);
-                value |= @bitCast(U, ones) << (shift + 7);
-            }
-            break;
-        }
-    } else {
-        return error.Overflow;
-    }
-
-    const result = @bitCast(S, value);
-    // Only applies if we extended to i8
-    if (S != T) {
-        if (result > std.math.maxInt(T) or result < std.math.minInt(T)) return error.Overflow;
-    }
-
-    return @truncate(T, result);
-}
-
-/// Write a single signed integer as signed LEB128 to the given writer.
-pub fn writeILEB128(writer: anytype, int_value: anytype) !void {
-    const T = @TypeOf(int_value);
-    const S = if (@typeInfo(T).Int.bits < 8) i8 else T;
-    const U = std.meta.Int(.unsigned, @typeInfo(S).Int.bits);
-
-    var value = @intCast(S, int_value);
-
-    while (true) {
-        const uvalue = @bitCast(U, value);
-        const byte = @truncate(u8, uvalue);
-        value >>= 6;
-        if (value == -1 or value == 0) {
-            try writer.writeByte(byte & 0x7F);
-            break;
-        } else {
-            value >>= 1;
-            try writer.writeByte(byte | 0x80);
-        }
-    }
-}
-
-/// Read a single singed LEB128 integer from the given memory as type T.
-/// The provided slice reference will be updated to point to the byte after the last byte read.
-pub fn readILEB128Mem(comptime T: type, ptr: *[]const u8) !T {
-    var buf = std.io.fixedBufferStream(ptr.*);
-    const value = try readILEB128(T, buf.reader());
-    ptr.*.ptr += buf.pos;
-    return value;
-}
-
-/// Write a single signed LEB128 integer to the given memory as unsigned LEB128,
-/// returning the number of bytes written.
-pub fn writeILEB128Mem(ptr: []u8, int_value: anytype) !usize {
-    const T = @TypeOf(int_value);
-    var buf = std.io.fixedBufferStream(ptr);
-    try writeILEB128(buf.writer(), int_value);
-    return buf.pos;
-}
-
-/// This is an "advanced" function. It allows one to use a fixed amount of memory to store a
-/// ULEB128. This defeats the entire purpose of using this data encoding; it will no longer use
-/// fewer bytes to store smaller numbers. The advantage of using a fixed width is that it makes
-/// fields have a predictable size and so depending on the use case this tradeoff can be worthwhile.
-/// An example use case of this is in emitting DWARF info where one wants to make a ULEB128 field
-/// "relocatable", meaning that it becomes possible to later go back and patch the number to be a
-/// different value without shifting all the following code.
-pub fn writeUnsignedFixed(comptime l: usize, ptr: *[l]u8, int: std.meta.Int(.unsigned, l * 7)) void {
-    const T = @TypeOf(int);
-    const U = if (@typeInfo(T).Int.bits < 8) u8 else T;
-    var value = @intCast(U, int);
-
-    comptime var i = 0;
-    inline while (i < (l - 1)) : (i += 1) {
-        const byte = @truncate(u8, value) | 0b1000_0000;
-        value >>= 7;
-        ptr[i] = byte;
-    }
-    ptr[i] = @truncate(u8, value);
-}
-
-test "writeUnsignedFixed" {
-    {
-        var buf: [4]u8 = undefined;
-        writeUnsignedFixed(4, &buf, 0);
-        testing.expect((try test_read_uleb128(u64, &buf)) == 0);
-    }
-    {
-        var buf: [4]u8 = undefined;
-        writeUnsignedFixed(4, &buf, 1);
-        testing.expect((try test_read_uleb128(u64, &buf)) == 1);
-    }
-    {
-        var buf: [4]u8 = undefined;
-        writeUnsignedFixed(4, &buf, 1000);
-        testing.expect((try test_read_uleb128(u64, &buf)) == 1000);
-    }
-    {
-        var buf: [4]u8 = undefined;
-        writeUnsignedFixed(4, &buf, 10000000);
-        testing.expect((try test_read_uleb128(u64, &buf)) == 10000000);
-    }
-}
-
-// tests
-fn test_read_stream_ileb128(comptime T: type, encoded: []const u8) !T {
-    var reader = std.io.fixedBufferStream(encoded);
-    return try readILEB128(T, reader.reader());
-}
-
-fn test_read_stream_uleb128(comptime T: type, encoded: []const u8) !T {
-    var reader = std.io.fixedBufferStream(encoded);
-    return try readULEB128(T, reader.reader());
-}
-
-fn test_read_ileb128(comptime T: type, encoded: []const u8) !T {
-    var reader = std.io.fixedBufferStream(encoded);
-    const v1 = try readILEB128(T, reader.reader());
-    var in_ptr = encoded;
-    const v2 = try readILEB128Mem(T, &in_ptr);
-    testing.expectEqual(v1, v2);
-    return v1;
-}
-
-fn test_read_uleb128(comptime T: type, encoded: []const u8) !T {
-    var reader = std.io.fixedBufferStream(encoded);
-    const v1 = try readULEB128(T, reader.reader());
-    var in_ptr = encoded;
-    const v2 = try readULEB128Mem(T, &in_ptr);
-    testing.expectEqual(v1, v2);
-    return v1;
-}
-
-fn test_read_ileb128_seq(comptime T: type, comptime N: usize, encoded: []const u8) !void {
-    var reader = std.io.fixedBufferStream(encoded);
-    var in_ptr = encoded;
-    var i: usize = 0;
-    while (i < N) : (i += 1) {
-        const v1 = try readILEB128(T, reader.reader());
-        const v2 = try readILEB128Mem(T, &in_ptr);
-        testing.expectEqual(v1, v2);
-    }
-}
-
-fn test_read_uleb128_seq(comptime T: type, comptime N: usize, encoded: []const u8) !void {
-    var reader = std.io.fixedBufferStream(encoded);
-    var in_ptr = encoded;
-    var i: usize = 0;
-    while (i < N) : (i += 1) {
-        const v1 = try readULEB128(T, reader.reader());
-        const v2 = try readULEB128Mem(T, &in_ptr);
-        testing.expectEqual(v1, v2);
-    }
-}
-
-test "deserialize signed LEB128" {
-    // Truncated
-    testing.expectError(error.EndOfStream, test_read_stream_ileb128(i64, "\x80"));
-
-    // Overflow
-    testing.expectError(error.Overflow, test_read_ileb128(i8, "\x80\x80\x40"));
-    testing.expectError(error.Overflow, test_read_ileb128(i16, "\x80\x80\x80\x40"));
-    testing.expectError(error.Overflow, test_read_ileb128(i32, "\x80\x80\x80\x80\x40"));
-    testing.expectError(error.Overflow, test_read_ileb128(i64, "\x80\x80\x80\x80\x80\x80\x80\x80\x80\x40"));
-    testing.expectError(error.Overflow, test_read_ileb128(i8, "\xff\x7e"));
-
-    // Decode SLEB128
-    testing.expect((try test_read_ileb128(i64, "\x00")) == 0);
-    testing.expect((try test_read_ileb128(i64, "\x01")) == 1);
-    testing.expect((try test_read_ileb128(i64, "\x3f")) == 63);
-    testing.expect((try test_read_ileb128(i64, "\x40")) == -64);
-    testing.expect((try test_read_ileb128(i64, "\x41")) == -63);
-    testing.expect((try test_read_ileb128(i64, "\x7f")) == -1);
-    testing.expect((try test_read_ileb128(i64, "\x80\x01")) == 128);
-    testing.expect((try test_read_ileb128(i64, "\x81\x01")) == 129);
-    testing.expect((try test_read_ileb128(i64, "\xff\x7e")) == -129);
-    testing.expect((try test_read_ileb128(i64, "\x80\x7f")) == -128);
-    testing.expect((try test_read_ileb128(i64, "\x81\x7f")) == -127);
-    testing.expect((try test_read_ileb128(i64, "\xc0\x00")) == 64);
-    testing.expect((try test_read_ileb128(i64, "\xc7\x9f\x7f")) == -12345);
-    testing.expect((try test_read_ileb128(i8, "\xff\x7f")) == -1);
-    testing.expect((try test_read_ileb128(i16, "\xff\xff\x7f")) == -1);
-    testing.expect((try test_read_ileb128(i32, "\xff\xff\xff\xff\x7f")) == -1);
-    testing.expect((try test_read_ileb128(i32, "\x80\x80\x80\x80\x08")) == -0x80000000);
-    testing.expect((try test_read_ileb128(i64, "\x80\x80\x80\x80\x80\x80\x80\x80\x80\x01")) == @bitCast(i64, @intCast(u64, 0x8000000000000000)));
-    testing.expect((try test_read_ileb128(i64, "\x80\x80\x80\x80\x80\x80\x80\x80\x40")) == -0x4000000000000000);
-    testing.expect((try test_read_ileb128(i64, "\x80\x80\x80\x80\x80\x80\x80\x80\x80\x7f")) == -0x8000000000000000);
-
-    // Decode unnormalized SLEB128 with extra padding bytes.
-    testing.expect((try test_read_ileb128(i64, "\x80\x00")) == 0);
-    testing.expect((try test_read_ileb128(i64, "\x80\x80\x00")) == 0);
-    testing.expect((try test_read_ileb128(i64, "\xff\x00")) == 0x7f);
-    testing.expect((try test_read_ileb128(i64, "\xff\x80\x00")) == 0x7f);
-    testing.expect((try test_read_ileb128(i64, "\x80\x81\x00")) == 0x80);
-    testing.expect((try test_read_ileb128(i64, "\x80\x81\x80\x00")) == 0x80);
-
-    // Decode sequence of SLEB128 values
-    try test_read_ileb128_seq(i64, 4, "\x81\x01\x3f\x80\x7f\x80\x80\x80\x00");
-}
-
-test "deserialize unsigned LEB128" {
-    // Truncated
-    testing.expectError(error.EndOfStream, test_read_stream_uleb128(u64, "\x80"));
-
-    // Overflow
-    testing.expectError(error.Overflow, test_read_uleb128(u8, "\x80\x02"));
-    testing.expectError(error.Overflow, test_read_uleb128(u8, "\x80\x80\x40"));
-    testing.expectError(error.Overflow, test_read_uleb128(u16, "\x80\x80\x84"));
-    testing.expectError(error.Overflow, test_read_uleb128(u16, "\x80\x80\x80\x40"));
-    testing.expectError(error.Overflow, test_read_uleb128(u32, "\x80\x80\x80\x80\x90"));
-    testing.expectError(error.Overflow, test_read_uleb128(u32, "\x80\x80\x80\x80\x40"));
-    testing.expectError(error.Overflow, test_read_uleb128(u64, "\x80\x80\x80\x80\x80\x80\x80\x80\x80\x40"));
-
-    // Decode ULEB128
-    testing.expect((try test_read_uleb128(u64, "\x00")) == 0);
-    testing.expect((try test_read_uleb128(u64, "\x01")) == 1);
-    testing.expect((try test_read_uleb128(u64, "\x3f")) == 63);
-    testing.expect((try test_read_uleb128(u64, "\x40")) == 64);
-    testing.expect((try test_read_uleb128(u64, "\x7f")) == 0x7f);
-    testing.expect((try test_read_uleb128(u64, "\x80\x01")) == 0x80);
-    testing.expect((try test_read_uleb128(u64, "\x81\x01")) == 0x81);
-    testing.expect((try test_read_uleb128(u64, "\x90\x01")) == 0x90);
-    testing.expect((try test_read_uleb128(u64, "\xff\x01")) == 0xff);
-    testing.expect((try test_read_uleb128(u64, "\x80\x02")) == 0x100);
-    testing.expect((try test_read_uleb128(u64, "\x81\x02")) == 0x101);
-    testing.expect((try test_read_uleb128(u64, "\x80\xc1\x80\x80\x10")) == 4294975616);
-    testing.expect((try test_read_uleb128(u64, "\x80\x80\x80\x80\x80\x80\x80\x80\x80\x01")) == 0x8000000000000000);
-
-    // Decode ULEB128 with extra padding bytes
-    testing.expect((try test_read_uleb128(u64, "\x80\x00")) == 0);
-    testing.expect((try test_read_uleb128(u64, "\x80\x80\x00")) == 0);
-    testing.expect((try test_read_uleb128(u64, "\xff\x00")) == 0x7f);
-    testing.expect((try test_read_uleb128(u64, "\xff\x80\x00")) == 0x7f);
-    testing.expect((try test_read_uleb128(u64, "\x80\x81\x00")) == 0x80);
-    testing.expect((try test_read_uleb128(u64, "\x80\x81\x80\x00")) == 0x80);
-
-    // Decode sequence of ULEB128 values
-    try test_read_uleb128_seq(u64, 4, "\x81\x01\x3f\x80\x7f\x80\x80\x80\x00");
-}
-
-fn test_write_leb128(value: anytype) !void {
-    const T = @TypeOf(value);
-    const t_signed = @typeInfo(T).Int.is_signed;
-    const signedness = if (t_signed) .signed else .unsigned;
-
-    const writeStream = if (t_signed) writeILEB128 else writeULEB128;
-    const writeMem = if (t_signed) writeILEB128Mem else writeULEB128Mem;
-    const readStream = if (t_signed) readILEB128 else readULEB128;
-    const readMem = if (t_signed) readILEB128Mem else readULEB128Mem;
-
-    // decode to a larger bit size too, to ensure sign extension
-    // is working as expected
-    const larger_type_bits = ((@typeInfo(T).Int.bits + 8) / 8) * 8;
-    const B = std.meta.Int(signedness, larger_type_bits);
-
-    const bytes_needed = bn: {
-        const S = std.meta.Int(signedness, @sizeOf(T) * 8);
-        if (@typeInfo(T).Int.bits <= 7) break :bn @as(u16, 1);
-
-        const unused_bits = if (value < 0) @clz(T, ~value) else @clz(T, value);
-        const used_bits: u16 = (@typeInfo(T).Int.bits - unused_bits) + @boolToInt(t_signed);
-        if (used_bits <= 7) break :bn @as(u16, 1);
-        break :bn ((used_bits + 6) / 7);
-    };
-
-    const max_groups = if (@typeInfo(T).Int.bits == 0) 1 else (@typeInfo(T).Int.bits + 6) / 7;
-
-    var buf: [max_groups]u8 = undefined;
-    var fbs = std.io.fixedBufferStream(&buf);
-
-    // stream write
-    try writeStream(fbs.writer(), value);
-    const w1_pos = fbs.pos;
-    testing.expect(w1_pos == bytes_needed);
-
-    // stream read
-    fbs.pos = 0;
-    const sr = try readStream(T, fbs.reader());
-    testing.expect(fbs.pos == w1_pos);
-    testing.expect(sr == value);
-
-    // bigger type stream read
-    fbs.pos = 0;
-    const bsr = try readStream(B, fbs.reader());
-    testing.expect(fbs.pos == w1_pos);
-    testing.expect(bsr == value);
-
-    // mem write
-    const w2_pos = try writeMem(&buf, value);
-    testing.expect(w2_pos == w1_pos);
-
-    // mem read
-    var buf_ref: []u8 = buf[0..];
-    const mr = try readMem(T, &buf_ref);
-    testing.expect(@ptrToInt(buf_ref.ptr) - @ptrToInt(&buf) == w2_pos);
-    testing.expect(mr == value);
-
-    // bigger type mem read
-    buf_ref = buf[0..];
-    const bmr = try readMem(T, &buf_ref);
-    testing.expect(@ptrToInt(buf_ref.ptr) - @ptrToInt(&buf) == w2_pos);
-    testing.expect(bmr == value);
-}
-
-test "serialize unsigned LEB128" {
-    const max_bits = 18;
-
-    comptime var t = 0;
-    inline while (t <= max_bits) : (t += 1) {
-        const T = std.meta.Int(.unsigned, t);
-        const min = std.math.minInt(T);
-        const max = std.math.maxInt(T);
-        var i = @as(std.meta.Int(.unsigned, @typeInfo(T).Int.bits + 1), min);
-
-        while (i <= max) : (i += 1) try test_write_leb128(@intCast(T, i));
-    }
-}
-
-test "serialize signed LEB128" {
-    // explicitly test i0 because starting `t` at 0
-    // will break the while loop
-    try test_write_leb128(@as(i0, 0));
-
-    const max_bits = 18;
-
-    comptime var t = 1;
-    inline while (t <= max_bits) : (t += 1) {
-        const T = std.meta.Int(.signed, t);
-        const min = std.math.minInt(T);
-        const max = std.math.maxInt(T);
-        var i = @as(std.meta.Int(.signed, @typeInfo(T).Int.bits + 1), min);
-
-        while (i <= max) : (i += 1) try test_write_leb128(@intCast(T, i));
-    }
-}
diff --git a/lib/std/dwarf.zig b/lib/std/dwarf.zig
@@ -10,7 +10,7 @@ const fs = std.fs;
 const io = std.io;
 const mem = std.mem;
 const math = std.math;
-const leb = @import("debug/leb128.zig");
+const leb = @import("leb128.zig");
 
 const ArrayList = std.ArrayList;
 
diff --git a/lib/std/leb128.zig b/lib/std/leb128.zig
@@ -0,0 +1,374 @@
+// SPDX-License-Identifier: MIT
+// Copyright (c) 2015-2020 Zig Contributors
+// This file is part of [zig](https://ziglang.org/), which is MIT licensed.
+// The MIT license requires this copyright notice to be included in all copies
+// and substantial portions of the software.
+const std = @import("std");
+const testing = std.testing;
+
+/// Read a single unsigned LEB128 value from the given reader as type T,
+/// or error.Overflow if the value cannot fit.
+pub fn readULEB128(comptime T: type, reader: anytype) !T {
+    const U = if (@typeInfo(T).Int.bits < 8) u8 else T;
+    const ShiftT = std.math.Log2Int(U);
+
+    const max_group = (@typeInfo(U).Int.bits + 6) / 7;
+
+    var value = @as(U, 0);
+    var group = @as(ShiftT, 0);
+
+    while (group < max_group) : (group += 1) {
+        const byte = try reader.readByte();
+        var temp = @as(U, byte & 0x7f);
+
+        if (@shlWithOverflow(U, temp, group * 7, &temp)) return error.Overflow;
+
+        value |= temp;
+        if (byte & 0x80 == 0) break;
+    } else {
+        return error.Overflow;
+    }
+
+    // only applies in the case that we extended to u8
+    if (U != T) {
+        if (value > std.math.maxInt(T)) return error.Overflow;
+    }
+
+    return @truncate(T, value);
+}
+
+/// Write a single unsigned integer as unsigned LEB128 to the given writer.
+pub fn writeULEB128(writer: anytype, uint_value: anytype) !void {
+    const T = @TypeOf(uint_value);
+    const U = if (@typeInfo(T).Int.bits < 8) u8 else T;
+    var value = @intCast(U, uint_value);
+
+    while (true) {
+        const byte = @truncate(u8, value & 0x7f);
+        value >>= 7;
+        if (value == 0) {
+            try writer.writeByte(byte);
+            break;
+        } else {
+            try writer.writeByte(byte | 0x80);
+        }
+    }
+}
+
+/// Read a single signed LEB128 value from the given reader as type T,
+/// or error.Overflow if the value cannot fit.
+pub fn readILEB128(comptime T: type, reader: anytype) !T {
+    const S = if (@typeInfo(T).Int.bits < 8) i8 else T;
+    const U = std.meta.Int(.unsigned, @typeInfo(S).Int.bits);
+    const ShiftU = std.math.Log2Int(U);
+
+    const max_group = (@typeInfo(U).Int.bits + 6) / 7;
+
+    var value = @as(U, 0);
+    var group = @as(ShiftU, 0);
+
+    while (group < max_group) : (group += 1) {
+        const byte = try reader.readByte();
+        var temp = @as(U, byte & 0x7f);
+
+        const shift = group * 7;
+        if (@shlWithOverflow(U, temp, shift, &temp)) {
+            // Overflow is ok so long as the sign bit is set and this is the last byte
+            if (byte & 0x80 != 0) return error.Overflow;
+            if (@bitCast(S, temp) >= 0) return error.Overflow;
+
+            // and all the overflowed bits are 1
+            const remaining_shift = @intCast(u3, @typeInfo(U).Int.bits - @as(u16, shift));
+            const remaining_bits = @bitCast(i8, byte | 0x80) >> remaining_shift;
+            if (remaining_bits != -1) return error.Overflow;
+        }
+
+        value |= temp;
+        if (byte & 0x80 == 0) {
+            const needs_sign_ext = group + 1 < max_group;
+            if (byte & 0x40 != 0 and needs_sign_ext) {
+                const ones = @as(S, -1);
+                value |= @bitCast(U, ones) << (shift + 7);
+            }
+            break;
+        }
+    } else {
+        return error.Overflow;
+    }
+
+    const result = @bitCast(S, value);
+    // Only applies if we extended to i8
+    if (S != T) {
+        if (result > std.math.maxInt(T) or result < std.math.minInt(T)) return error.Overflow;
+    }
+
+    return @truncate(T, result);
+}
+
+/// Write a single signed integer as signed LEB128 to the given writer.
+pub fn writeILEB128(writer: anytype, int_value: anytype) !void {
+    const T = @TypeOf(int_value);
+    const S = if (@typeInfo(T).Int.bits < 8) i8 else T;
+    const U = std.meta.Int(.unsigned, @typeInfo(S).Int.bits);
+
+    var value = @intCast(S, int_value);
+
+    while (true) {
+        const uvalue = @bitCast(U, value);
+        const byte = @truncate(u8, uvalue);
+        value >>= 6;
+        if (value == -1 or value == 0) {
+            try writer.writeByte(byte & 0x7F);
+            break;
+        } else {
+            value >>= 1;
+            try writer.writeByte(byte | 0x80);
+        }
+    }
+}
+
+/// This is an "advanced" function. It allows one to use a fixed amount of memory to store a
+/// ULEB128. This defeats the entire purpose of using this data encoding; it will no longer use
+/// fewer bytes to store smaller numbers. The advantage of using a fixed width is that it makes
+/// fields have a predictable size and so depending on the use case this tradeoff can be worthwhile.
+/// An example use case of this is in emitting DWARF info where one wants to make a ULEB128 field
+/// "relocatable", meaning that it becomes possible to later go back and patch the number to be a
+/// different value without shifting all the following code.
+pub fn writeUnsignedFixed(comptime l: usize, ptr: *[l]u8, int: std.meta.Int(.unsigned, l * 7)) void {
+    const T = @TypeOf(int);
+    const U = if (@typeInfo(T).Int.bits < 8) u8 else T;
+    var value = @intCast(U, int);
+
+    comptime var i = 0;
+    inline while (i < (l - 1)) : (i += 1) {
+        const byte = @truncate(u8, value) | 0b1000_0000;
+        value >>= 7;
+        ptr[i] = byte;
+    }
+    ptr[i] = @truncate(u8, value);
+}
+
+test "writeUnsignedFixed" {
+    {
+        var buf: [4]u8 = undefined;
+        writeUnsignedFixed(4, &buf, 0);
+        testing.expect((try test_read_uleb128(u64, &buf)) == 0);
+    }
+    {
+        var buf: [4]u8 = undefined;
+        writeUnsignedFixed(4, &buf, 1);
+        testing.expect((try test_read_uleb128(u64, &buf)) == 1);
+    }
+    {
+        var buf: [4]u8 = undefined;
+        writeUnsignedFixed(4, &buf, 1000);
+        testing.expect((try test_read_uleb128(u64, &buf)) == 1000);
+    }
+    {
+        var buf: [4]u8 = undefined;
+        writeUnsignedFixed(4, &buf, 10000000);
+        testing.expect((try test_read_uleb128(u64, &buf)) == 10000000);
+    }
+}
+
+// tests
+fn test_read_stream_ileb128(comptime T: type, encoded: []const u8) !T {
+    var reader = std.io.fixedBufferStream(encoded);
+    return try readILEB128(T, reader.reader());
+}
+
+fn test_read_stream_uleb128(comptime T: type, encoded: []const u8) !T {
+    var reader = std.io.fixedBufferStream(encoded);
+    return try readULEB128(T, reader.reader());
+}
+
+fn test_read_ileb128(comptime T: type, encoded: []const u8) !T {
+    var reader = std.io.fixedBufferStream(encoded);
+    const v1 = try readILEB128(T, reader.reader());
+    return v1;
+}
+
+fn test_read_uleb128(comptime T: type, encoded: []const u8) !T {
+    var reader = std.io.fixedBufferStream(encoded);
+    const v1 = try readULEB128(T, reader.reader());
+    return v1;
+}
+
+fn test_read_ileb128_seq(comptime T: type, comptime N: usize, encoded: []const u8) !void {
+    var reader = std.io.fixedBufferStream(encoded);
+    var i: usize = 0;
+    while (i < N) : (i += 1) {
+        const v1 = try readILEB128(T, reader.reader());
+    }
+}
+
+fn test_read_uleb128_seq(comptime T: type, comptime N: usize, encoded: []const u8) !void {
+    var reader = std.io.fixedBufferStream(encoded);
+    var i: usize = 0;
+    while (i < N) : (i += 1) {
+        const v1 = try readULEB128(T, reader.reader());
+    }
+}
+
+test "deserialize signed LEB128" {
+    // Truncated
+    testing.expectError(error.EndOfStream, test_read_stream_ileb128(i64, "\x80"));
+
+    // Overflow
+    testing.expectError(error.Overflow, test_read_ileb128(i8, "\x80\x80\x40"));
+    testing.expectError(error.Overflow, test_read_ileb128(i16, "\x80\x80\x80\x40"));
+    testing.expectError(error.Overflow, test_read_ileb128(i32, "\x80\x80\x80\x80\x40"));
+    testing.expectError(error.Overflow, test_read_ileb128(i64, "\x80\x80\x80\x80\x80\x80\x80\x80\x80\x40"));
+    testing.expectError(error.Overflow, test_read_ileb128(i8, "\xff\x7e"));
+
+    // Decode SLEB128
+    testing.expect((try test_read_ileb128(i64, "\x00")) == 0);
+    testing.expect((try test_read_ileb128(i64, "\x01")) == 1);
+    testing.expect((try test_read_ileb128(i64, "\x3f")) == 63);
+    testing.expect((try test_read_ileb128(i64, "\x40")) == -64);
+    testing.expect((try test_read_ileb128(i64, "\x41")) == -63);
+    testing.expect((try test_read_ileb128(i64, "\x7f")) == -1);
+    testing.expect((try test_read_ileb128(i64, "\x80\x01")) == 128);
+    testing.expect((try test_read_ileb128(i64, "\x81\x01")) == 129);
+    testing.expect((try test_read_ileb128(i64, "\xff\x7e")) == -129);
+    testing.expect((try test_read_ileb128(i64, "\x80\x7f")) == -128);
+    testing.expect((try test_read_ileb128(i64, "\x81\x7f")) == -127);
+    testing.expect((try test_read_ileb128(i64, "\xc0\x00")) == 64);
+    testing.expect((try test_read_ileb128(i64, "\xc7\x9f\x7f")) == -12345);
+    testing.expect((try test_read_ileb128(i8, "\xff\x7f")) == -1);
+    testing.expect((try test_read_ileb128(i16, "\xff\xff\x7f")) == -1);
+    testing.expect((try test_read_ileb128(i32, "\xff\xff\xff\xff\x7f")) == -1);
+    testing.expect((try test_read_ileb128(i32, "\x80\x80\x80\x80\x08")) == -0x80000000);
+    testing.expect((try test_read_ileb128(i64, "\x80\x80\x80\x80\x80\x80\x80\x80\x80\x01")) == @bitCast(i64, @intCast(u64, 0x8000000000000000)));
+    testing.expect((try test_read_ileb128(i64, "\x80\x80\x80\x80\x80\x80\x80\x80\x40")) == -0x4000000000000000);
+    testing.expect((try test_read_ileb128(i64, "\x80\x80\x80\x80\x80\x80\x80\x80\x80\x7f")) == -0x8000000000000000);
+
+    // Decode unnormalized SLEB128 with extra padding bytes.
+    testing.expect((try test_read_ileb128(i64, "\x80\x00")) == 0);
+    testing.expect((try test_read_ileb128(i64, "\x80\x80\x00")) == 0);
+    testing.expect((try test_read_ileb128(i64, "\xff\x00")) == 0x7f);
+    testing.expect((try test_read_ileb128(i64, "\xff\x80\x00")) == 0x7f);
+    testing.expect((try test_read_ileb128(i64, "\x80\x81\x00")) == 0x80);
+    testing.expect((try test_read_ileb128(i64, "\x80\x81\x80\x00")) == 0x80);
+
+    // Decode sequence of SLEB128 values
+    try test_read_ileb128_seq(i64, 4, "\x81\x01\x3f\x80\x7f\x80\x80\x80\x00");
+}
+
+test "deserialize unsigned LEB128" {
+    // Truncated
+    testing.expectError(error.EndOfStream, test_read_stream_uleb128(u64, "\x80"));
+
+    // Overflow
+    testing.expectError(error.Overflow, test_read_uleb128(u8, "\x80\x02"));
+    testing.expectError(error.Overflow, test_read_uleb128(u8, "\x80\x80\x40"));
+    testing.expectError(error.Overflow, test_read_uleb128(u16, "\x80\x80\x84"));
+    testing.expectError(error.Overflow, test_read_uleb128(u16, "\x80\x80\x80\x40"));
+    testing.expectError(error.Overflow, test_read_uleb128(u32, "\x80\x80\x80\x80\x90"));
+    testing.expectError(error.Overflow, test_read_uleb128(u32, "\x80\x80\x80\x80\x40"));
+    testing.expectError(error.Overflow, test_read_uleb128(u64, "\x80\x80\x80\x80\x80\x80\x80\x80\x80\x40"));
+
+    // Decode ULEB128
+    testing.expect((try test_read_uleb128(u64, "\x00")) == 0);
+    testing.expect((try test_read_uleb128(u64, "\x01")) == 1);
+    testing.expect((try test_read_uleb128(u64, "\x3f")) == 63);
+    testing.expect((try test_read_uleb128(u64, "\x40")) == 64);
+    testing.expect((try test_read_uleb128(u64, "\x7f")) == 0x7f);
+    testing.expect((try test_read_uleb128(u64, "\x80\x01")) == 0x80);
+    testing.expect((try test_read_uleb128(u64, "\x81\x01")) == 0x81);
+    testing.expect((try test_read_uleb128(u64, "\x90\x01")) == 0x90);
+    testing.expect((try test_read_uleb128(u64, "\xff\x01")) == 0xff);
+    testing.expect((try test_read_uleb128(u64, "\x80\x02")) == 0x100);
+    testing.expect((try test_read_uleb128(u64, "\x81\x02")) == 0x101);
+    testing.expect((try test_read_uleb128(u64, "\x80\xc1\x80\x80\x10")) == 4294975616);
+    testing.expect((try test_read_uleb128(u64, "\x80\x80\x80\x80\x80\x80\x80\x80\x80\x01")) == 0x8000000000000000);
+
+    // Decode ULEB128 with extra padding bytes
+    testing.expect((try test_read_uleb128(u64, "\x80\x00")) == 0);
+    testing.expect((try test_read_uleb128(u64, "\x80\x80\x00")) == 0);
+    testing.expect((try test_read_uleb128(u64, "\xff\x00")) == 0x7f);
+    testing.expect((try test_read_uleb128(u64, "\xff\x80\x00")) == 0x7f);
+    testing.expect((try test_read_uleb128(u64, "\x80\x81\x00")) == 0x80);
+    testing.expect((try test_read_uleb128(u64, "\x80\x81\x80\x00")) == 0x80);
+
+    // Decode sequence of ULEB128 values
+    try test_read_uleb128_seq(u64, 4, "\x81\x01\x3f\x80\x7f\x80\x80\x80\x00");
+}
+
+fn test_write_leb128(value: anytype) !void {
+    const T = @TypeOf(value);
+    const t_signed = @typeInfo(T).Int.is_signed;
+    const signedness = if (t_signed) .signed else .unsigned;
+
+    const writeStream = if (t_signed) writeILEB128 else writeULEB128;
+    const readStream = if (t_signed) readILEB128 else readULEB128;
+
+    // decode to a larger bit size too, to ensure sign extension
+    // is working as expected
+    const larger_type_bits = ((@typeInfo(T).Int.bits + 8) / 8) * 8;
+    const B = std.meta.Int(signedness, larger_type_bits);
+
+    const bytes_needed = bn: {
+        const S = std.meta.Int(signedness, @sizeOf(T) * 8);
+        if (@typeInfo(T).Int.bits <= 7) break :bn @as(u16, 1);
+
+        const unused_bits = if (value < 0) @clz(T, ~value) else @clz(T, value);
+        const used_bits: u16 = (@typeInfo(T).Int.bits - unused_bits) + @boolToInt(t_signed);
+        if (used_bits <= 7) break :bn @as(u16, 1);
+        break :bn ((used_bits + 6) / 7);
+    };
+
+    const max_groups = if (@typeInfo(T).Int.bits == 0) 1 else (@typeInfo(T).Int.bits + 6) / 7;
+
+    var buf: [max_groups]u8 = undefined;
+    var fbs = std.io.fixedBufferStream(&buf);
+
+    // stream write
+    try writeStream(fbs.writer(), value);
+    const w1_pos = fbs.pos;
+    testing.expect(w1_pos == bytes_needed);
+
+    // stream read
+    fbs.pos = 0;
+    const sr = try readStream(T, fbs.reader());
+    testing.expect(fbs.pos == w1_pos);
+    testing.expect(sr == value);
+
+    // bigger type stream read
+    fbs.pos = 0;
+    const bsr = try readStream(B, fbs.reader());
+    testing.expect(fbs.pos == w1_pos);
+    testing.expect(bsr == value);
+}
+
+test "serialize unsigned LEB128" {
+    const max_bits = 18;
+
+    comptime var t = 0;
+    inline while (t <= max_bits) : (t += 1) {
+        const T = std.meta.Int(.unsigned, t);
+        const min = std.math.minInt(T);
+        const max = std.math.maxInt(T);
+        var i = @as(std.meta.Int(.unsigned, @typeInfo(T).Int.bits + 1), min);
+
+        while (i <= max) : (i += 1) try test_write_leb128(@intCast(T, i));
+    }
+}
+
+test "serialize signed LEB128" {
+    // explicitly test i0 because starting `t` at 0
+    // will break the while loop
+    try test_write_leb128(@as(i0, 0));
+
+    const max_bits = 18;
+
+    comptime var t = 1;
+    inline while (t <= max_bits) : (t += 1) {
+        const T = std.meta.Int(.signed, t);
+        const min = std.math.minInt(T);
+        const max = std.math.maxInt(T);
+        var i = @as(std.meta.Int(.signed, @typeInfo(T).Int.bits + 1), min);
+
+        while (i <= max) : (i += 1) try test_write_leb128(@intCast(T, i));
+    }
+}
diff --git a/lib/std/std.zig b/lib/std/std.zig
@@ -65,6 +65,7 @@ pub const hash_map = @import("hash_map.zig");
 pub const heap = @import("heap.zig");
 pub const io = @import("io.zig");
 pub const json = @import("json.zig");
+pub const leb = @import("leb128.zig");
 pub const log = @import("log.zig");
 pub const macho = @import("macho.zig");
 pub const math = @import("math.zig");
diff --git a/src/codegen.zig b/src/codegen.zig
@@ -14,7 +14,7 @@ const Target = std.Target;
 const Allocator = mem.Allocator;
 const trace = @import("tracy.zig").trace;
 const DW = std.dwarf;
-const leb128 = std.debug.leb;
+const leb128 = std.leb;
 const log = std.log.scoped(.codegen);
 
 /// The codegen-related data that is stored in `ir.Inst.Block` instructions.
diff --git a/src/codegen/wasm.zig b/src/codegen/wasm.zig
@@ -2,7 +2,7 @@ const std = @import("std");
 const Allocator = std.mem.Allocator;
 const ArrayList = std.ArrayList;
 const assert = std.debug.assert;
-const leb = std.debug.leb;
+const leb = std.leb;
 const mem = std.mem;
 
 const Module = @import("../Module.zig");
diff --git a/src/link/Elf.zig b/src/link/Elf.zig
@@ -8,7 +8,7 @@ const fs = std.fs;
 const elf = std.elf;
 const log = std.log.scoped(.link);
 const DW = std.dwarf;
-const leb128 = std.debug.leb;
+const leb128 = std.leb;
 
 const ir = @import("../ir.zig");
 const Module = @import("../Module.zig");
diff --git a/src/link/MachO/Trie.zig b/src/link/MachO/Trie.zig
@@ -32,7 +32,7 @@ const Trie = @This();
 
 const std = @import("std");
 const mem = std.mem;
-const leb = std.debug.leb;
+const leb = std.leb;
 const log = std.log.scoped(.link);
 const testing = std.testing;
 const assert = std.debug.assert;
@@ -139,16 +139,18 @@ const Node = struct {
             // Terminal node info: encode export flags and vmaddr offset of this symbol.
             var info_buf_len: usize = 0;
             var info_buf: [@sizeOf(u64) * 2]u8 = undefined;
-            info_buf_len += try leb.writeULEB128Mem(info_buf[0..], self.export_flags.?);
-            info_buf_len += try leb.writeULEB128Mem(info_buf[info_buf_len..], offset);
+            var info_stream = std.io.fixedBufferStream(&info_buf);
+            try leb.writeULEB128(info_stream.writer(), self.export_flags.?);
+            try leb.writeULEB128(info_stream.writer(), offset);
 
             // Encode the size of the terminal node info.
             var size_buf: [@sizeOf(u64)]u8 = undefined;
-            const size_buf_len = try leb.writeULEB128Mem(size_buf[0..], info_buf_len);
+            var size_stream = std.io.fixedBufferStream(&size_buf);
+            try leb.writeULEB128(size_stream.writer(), info_stream.pos);
 
             // Now, write them to the output buffer.
-            buffer.appendSliceAssumeCapacity(size_buf[0..size_buf_len]);
-            buffer.appendSliceAssumeCapacity(info_buf[0..info_buf_len]);
+            buffer.appendSliceAssumeCapacity(size_buf[0..size_stream.pos]);
+            buffer.appendSliceAssumeCapacity(info_buf[0..info_stream.pos]);
         } else {
             // Non-terminal node is delimited by 0 byte.
             buffer.appendAssumeCapacity(0);
@@ -162,8 +164,9 @@ const Node = struct {
             buffer.appendAssumeCapacity(0);
 
             var buf: [@sizeOf(u64)]u8 = undefined;
-            const buf_len = try leb.writeULEB128Mem(buf[0..], edge.to.trie_offset.?);
-            buffer.appendSliceAssumeCapacity(buf[0..buf_len]);
+            var buf_stream = std.io.fixedBufferStream(&buf);
+            try leb.writeULEB128(buf_stream.writer(), edge.to.trie_offset.?);
+            buffer.appendSliceAssumeCapacity(buf[0..buf_stream.pos]);
         }
     }
 
diff --git a/src/link/Wasm.zig b/src/link/Wasm.zig
@@ -5,7 +5,7 @@ const mem = std.mem;
 const Allocator = std.mem.Allocator;
 const assert = std.debug.assert;
 const fs = std.fs;
-const leb = std.debug.leb;
+const leb = std.leb;
 const log = std.log.scoped(.link);
 
 const Module = @import("../Module.zig");

	zig fork of https://codeberg.org/ziglang/zig
	Log \| Files \| Refs \| README \| LICENSE

M	lib/std/debug.zig	\|	7	-------
D	lib/std/debug/leb128.zig	\|	441	-------------------------------------------------------------------------------
M	lib/std/dwarf.zig	\|	2	+-
A	lib/std/leb128.zig	\|	374	+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
M	lib/std/std.zig	\|	1	+
M	src/codegen.zig	\|	2	+-
M	src/codegen/wasm.zig	\|	2	+-
M	src/link/Elf.zig	\|	2	+-
M	src/link/MachO/Trie.zig	\|	19	+++++++++++--------
M	src/link/Wasm.zig	\|	2	+-