From a18fd41064493e742eacebc88e2afeadd54ff6f0 Mon Sep 17 00:00:00 2001
From: mlugg <mlugg@mlugg.co.uk>
Date: Wed, 17 Sep 2025 18:38:11 +0100
Subject: std: rework/remove ucontext_t

Our usage of `ucontext_t` in the standard library was kind of
problematic. We unnecessarily mimiced libc-specific structures, and our
`getcontext` implementation was overkill for our use case of stack
tracing.

This commit introduces a new namespace, `std.debug.cpu_context`, which
contains "context" types for various architectures (currently x86,
x86_64, ARM, and AARCH64) containing the general-purpose CPU registers;
the ones needed in practice for stack unwinding. Each implementation has
a function `current` which populates the structure using inline
assembly. The structure is user-overrideable, though that should only be
necessary if the standard library does not have an implementation for
the *architecture*: that is to say, none of this is OS-dependent.

Of course, in POSIX signal handlers, we get a `ucontext_t` from the
kernel. The function `std.debug.cpu_context.fromPosixSignalContext`
converts this to a `std.debug.cpu_context.Native` with a big ol' target
switch.

This functionality is not exposed from `std.c` or `std.posix`, and
neither are `ucontext_t`, `mcontext_t`, or `getcontext`. The rationale
is that these types and functions do not conform to a specific ABI, and
in fact tend to get updated over time based on CPU features and
extensions; in addition, different libcs use different structures which
are "partially compatible" with the kernel structure. Overall, it's a
mess, but all we need is the kernel context, so we can just define a
kernel-compatible structure as long as we don't claim C compatibility by
putting it in `std.c` or `std.posix`.

This change resulted in a few nice `std.debug` simplifications, but
nothing too noteworthy. However, the main benefit of this change is that
DWARF unwinding---sometimes necessary for collecting stack traces
reliably---now requires far less target-specific integration.

Also fix a bug I noticed in `PageAllocator` (I found this due to a bug
in my distro's QEMU distribution; thanks, broken QEMU patch!) and I
think a couple of minor bugs in `std.debug`.

Resolves: #23801
Resolves: #23802
---
 lib/std/debug/cpu_context.zig | 1019 +++++++++++++++++++++++++++++++++++++++++
 1 file changed, 1019 insertions(+)
 create mode 100644 lib/std/debug/cpu_context.zig

(limited to 'lib/std/debug/cpu_context.zig')

diff --git a/lib/std/debug/cpu_context.zig b/lib/std/debug/cpu_context.zig
new file mode 100644
index 0000000000..9859575fa3
--- /dev/null
+++ b/lib/std/debug/cpu_context.zig
@@ -0,0 +1,1019 @@
+/// Register state for the native architecture, used by `std.debug` for stack unwinding.
+/// `noreturn` if there is no implementation for the native architecture.
+/// This can be overriden by exposing a declaration `root.debug.CpuContext`.
+pub const Native = if (@hasDecl(root, "debug") and @hasDecl(root.debug, "CpuContext"))
+    root.debug.CpuContext
+else switch (native_arch) {
+    .x86 => X86,
+    .x86_64 => X86_64,
+    .arm, .armeb, .thumb, .thumbeb => Arm,
+    .aarch64, .aarch64_be => Aarch64,
+    else => noreturn,
+};
+
+pub const DwarfRegisterError = error{
+    InvalidRegister,
+    UnsupportedRegister,
+};
+
+pub fn fromPosixSignalContext(ctx_ptr: ?*const anyopaque) ?Native {
+    if (signal_ucontext_t == void) return null;
+    const uc: *const signal_ucontext_t = @ptrCast(@alignCast(ctx_ptr));
+    return switch (native_arch) {
+        .x86 => switch (native_os) {
+            .linux, .netbsd, .solaris, .illumos => .{ .gprs = .init(.{
+                .eax = uc.mcontext.gregs[std.posix.REG.EAX],
+                .ecx = uc.mcontext.gregs[std.posix.REG.ECX],
+                .edx = uc.mcontext.gregs[std.posix.REG.EDX],
+                .ebx = uc.mcontext.gregs[std.posix.REG.EBX],
+                .esp = uc.mcontext.gregs[std.posix.REG.ESP],
+                .ebp = uc.mcontext.gregs[std.posix.REG.EBP],
+                .esi = uc.mcontext.gregs[std.posix.REG.ESI],
+                .edi = uc.mcontext.gregs[std.posix.REG.EDI],
+                .eip = uc.mcontext.gregs[std.posix.REG.EIP],
+            }) },
+            else => null,
+        },
+        .x86_64 => switch (native_os) {
+            .linux, .solaris, .illumos => .{ .gprs = .init(.{
+                .rax = uc.mcontext.gregs[std.posix.REG.RAX],
+                .rdx = uc.mcontext.gregs[std.posix.REG.RDX],
+                .rcx = uc.mcontext.gregs[std.posix.REG.RCX],
+                .rbx = uc.mcontext.gregs[std.posix.REG.RBX],
+                .rsi = uc.mcontext.gregs[std.posix.REG.RSI],
+                .rdi = uc.mcontext.gregs[std.posix.REG.RDI],
+                .rbp = uc.mcontext.gregs[std.posix.REG.RBP],
+                .rsp = uc.mcontext.gregs[std.posix.REG.RSP],
+                .r8 = uc.mcontext.gregs[std.posix.REG.R8],
+                .r9 = uc.mcontext.gregs[std.posix.REG.R9],
+                .r10 = uc.mcontext.gregs[std.posix.REG.R10],
+                .r11 = uc.mcontext.gregs[std.posix.REG.R11],
+                .r12 = uc.mcontext.gregs[std.posix.REG.R12],
+                .r13 = uc.mcontext.gregs[std.posix.REG.R13],
+                .r14 = uc.mcontext.gregs[std.posix.REG.R14],
+                .r15 = uc.mcontext.gregs[std.posix.REG.R15],
+                .rip = uc.mcontext.gregs[std.posix.REG.RIP],
+            }) },
+            .freebsd => .{ .gprs = .init(.{
+                .rax = uc.mcontext.rax,
+                .rdx = uc.mcontext.rdx,
+                .rcx = uc.mcontext.rcx,
+                .rbx = uc.mcontext.rbx,
+                .rsi = uc.mcontext.rsi,
+                .rdi = uc.mcontext.rdi,
+                .rbp = uc.mcontext.rbp,
+                .rsp = uc.mcontext.rsp,
+                .r8 = uc.mcontext.r8,
+                .r9 = uc.mcontext.r9,
+                .r10 = uc.mcontext.r10,
+                .r11 = uc.mcontext.r11,
+                .r12 = uc.mcontext.r12,
+                .r13 = uc.mcontext.r13,
+                .r14 = uc.mcontext.r14,
+                .r15 = uc.mcontext.r15,
+                .rip = uc.mcontext.rip,
+            }) },
+            .openbsd => .{ .gprs = .init(.{
+                .rax = @bitCast(uc.sc_rax),
+                .rdx = @bitCast(uc.sc_rdx),
+                .rcx = @bitCast(uc.sc_rcx),
+                .rbx = @bitCast(uc.sc_rbx),
+                .rsi = @bitCast(uc.sc_rsi),
+                .rdi = @bitCast(uc.sc_rdi),
+                .rbp = @bitCast(uc.sc_rbp),
+                .rsp = @bitCast(uc.sc_rsp),
+                .r8 = @bitCast(uc.sc_r8),
+                .r9 = @bitCast(uc.sc_r9),
+                .r10 = @bitCast(uc.sc_r10),
+                .r11 = @bitCast(uc.sc_r11),
+                .r12 = @bitCast(uc.sc_r12),
+                .r13 = @bitCast(uc.sc_r13),
+                .r14 = @bitCast(uc.sc_r14),
+                .r15 = @bitCast(uc.sc_r15),
+                .rip = @bitCast(uc.sc_rip),
+            }) },
+            .macos, .ios => .{ .gprs = .init(.{
+                .rax = uc.mcontext.ss.rax,
+                .rdx = uc.mcontext.ss.rdx,
+                .rcx = uc.mcontext.ss.rcx,
+                .rbx = uc.mcontext.ss.rbx,
+                .rsi = uc.mcontext.ss.rsi,
+                .rdi = uc.mcontext.ss.rdi,
+                .rbp = uc.mcontext.ss.rbp,
+                .rsp = uc.mcontext.ss.rsp,
+                .r8 = uc.mcontext.ss.r8,
+                .r9 = uc.mcontext.ss.r9,
+                .r10 = uc.mcontext.ss.r10,
+                .r11 = uc.mcontext.ss.r11,
+                .r12 = uc.mcontext.ss.r12,
+                .r13 = uc.mcontext.ss.r13,
+                .r14 = uc.mcontext.ss.r14,
+                .r15 = uc.mcontext.ss.r15,
+                .rip = uc.mcontext.ss.rip,
+            }) },
+            else => null,
+        },
+        .arm, .armeb, .thumb, .thumbeb => switch (builtin.os.tag) {
+            .linux => .{
+                .r = .{
+                    uc.mcontext.arm_r0,
+                    uc.mcontext.arm_r1,
+                    uc.mcontext.arm_r2,
+                    uc.mcontext.arm_r3,
+                    uc.mcontext.arm_r4,
+                    uc.mcontext.arm_r5,
+                    uc.mcontext.arm_r6,
+                    uc.mcontext.arm_r7,
+                    uc.mcontext.arm_r8,
+                    uc.mcontext.arm_r9,
+                    uc.mcontext.arm_r10,
+                    uc.mcontext.arm_fp, // r11 = fp
+                    uc.mcontext.arm_ip, // r12 = ip
+                    uc.mcontext.arm_sp, // r13 = sp
+                    uc.mcontext.arm_lr, // r14 = lr
+                    uc.mcontext.arm_pc, // r15 = pc
+                },
+            },
+            else => null,
+        },
+        .aarch64, .aarch64_be => switch (builtin.os.tag) {
+            .macos, .ios, .tvos, .watchos, .visionos => .{
+                .x = uc.mcontext.ss.regs ++ @as([2]u64, .{
+                    uc.mcontext.ss.fp, // x29 = fp
+                    uc.mcontext.ss.lr, // x30 = lr
+                }),
+                .sp = uc.mcontext.ss.sp,
+                .pc = uc.mcontext.ss.pc,
+            },
+            .netbsd => .{
+                .x = uc.mcontext.gregs[0..31],
+                .sp = uc.mcontext.gregs[31],
+                .pc = uc.mcontext.gregs[32],
+            },
+            .freebsd => .{
+                .x = uc.mcontext.gpregs.x ++ @as([1]u64, .{
+                    uc.mcontext.gpregs.lr, // x30 = lr
+                }),
+                .sp = uc.mcontext.gpregs.sp,
+                // On aarch64, the register ELR_LR1 defines the address to return to after handling
+                // a CPU exception (ELR is "Exception Link Register"). FreeBSD's ucontext_t uses
+                // this as the field name, but it's the same thing as the context's PC.
+                .pc = uc.mcontext.gpregs.elr,
+            },
+            .openbsd => .{
+                .x = uc.sc_x ++ .{uc.sc_lr},
+                .sp = uc.sc_sp,
+                // Not a bug; see freebsd above for explanation.
+                .pc = uc.sc_elr,
+            },
+            .linux => .{
+                .x = uc.mcontext.regs,
+                .sp = uc.mcontext.sp,
+                .pc = uc.mcontext.pc,
+            },
+            else => null,
+        },
+        else => null,
+    };
+}
+
+pub fn fromWindowsContext(ctx: *const std.os.windows.CONTEXT) Native {
+    return switch (native_arch) {
+        .x86 => .{ .gprs = .init(.{
+            .eax = ctx.Eax,
+            .ecx = ctx.Ecx,
+            .edx = ctx.Edx,
+            .ebx = ctx.Ebx,
+            .esp = ctx.Esp,
+            .ebp = ctx.Ebp,
+            .esi = ctx.Esi,
+            .edi = ctx.Edi,
+            .eip = ctx.Eip,
+        }) },
+        .x86_64 => .{ .gprs = .init(.{
+            .rax = ctx.Rax,
+            .rdx = ctx.Rdx,
+            .rcx = ctx.Rcx,
+            .rbx = ctx.Rbx,
+            .rsi = ctx.Rsi,
+            .rdi = ctx.Rdi,
+            .rbp = ctx.Rbp,
+            .rsp = ctx.Rsp,
+            .r8 = ctx.R8,
+            .r9 = ctx.R9,
+            .r10 = ctx.R10,
+            .r11 = ctx.R11,
+            .r12 = ctx.R12,
+            .r13 = ctx.R13,
+            .r14 = ctx.R14,
+            .r15 = ctx.R15,
+            .rip = ctx.Rip,
+        }) },
+        .aarch64, .aarch64_be => .{
+            .x = ctx.DUMMYUNIONNAME.X[0..31].*,
+            .sp = ctx.Sp,
+            .pc = ctx.Pc,
+        },
+        else => comptime unreachable,
+    };
+}
+
+pub const X86 = struct {
+    /// The first 8 registers here intentionally match the order of registers pushed
+    /// by PUSHA, which is also the order used by the DWARF register mappings.
+    pub const Gpr = enum {
+        // zig fmt: off
+        eax, ecx, edx, ebx,
+        esp, ebp, esi, edi,
+        eip,
+        // zig fmt: on
+    };
+    gprs: std.enums.EnumArray(Gpr, u32),
+
+    pub inline fn current() X86 {
+        var ctx: X86 = undefined;
+        asm volatile (
+            \\movl %%eax, 0x00(%%edi)
+            \\movl %%ecx, 0x04(%%edi)
+            \\movl %%edx, 0x08(%%edi)
+            \\movl %%ebx, 0x0c(%%edi)
+            \\movl %%esp, 0x10(%%edi)
+            \\movl %%ebp, 0x14(%%edi)
+            \\movl %%esi, 0x18(%%edi)
+            \\movl %%edi, 0x1c(%%edi)
+            \\call 1f
+            \\1:
+            \\popl 0x20(%%edi)
+            :
+            : [gprs] "{edi}" (&ctx.gprs.values),
+            : .{ .memory = true });
+        return ctx;
+    }
+
+    pub fn dwarfRegisterBytes(ctx: *X86, register_num: u16) DwarfRegisterError![]u8 {
+        // System V Application Binary Interface Intel386 Architecture Processor Supplement Version 1.1
+        //   § 2.4.2 "DWARF Register Number Mapping"
+        switch (register_num) {
+            // The order of `Gpr` intentionally matches DWARF's mappings.
+            //
+            // x86-macos sometimes uses different mappings (ebp and esp are reversed when the unwind
+            // information is from `__eh_frame`). This deviation is not considered here, because
+            // x86-macos is a deprecated target which is not supported by the Zig Standard Library.
+            0...8 => return @ptrCast(&ctx.gprs.values[register_num]),
+
+            9 => return error.UnsupportedRegister, // rflags
+            11...18 => return error.UnsupportedRegister, // st0 - st7
+            21...28 => return error.UnsupportedRegister, // xmm0 - xmm7
+            29...36 => return error.UnsupportedRegister, // mm0 - mm7
+            39 => return error.UnsupportedRegister, // mxcsr
+            40...45 => return error.UnsupportedRegister, // es, cs, ss, ds, fs, gs
+            48 => return error.UnsupportedRegister, // tr
+            49 => return error.UnsupportedRegister, // ldtr
+            93...94 => return error.UnsupportedRegister, // fs.base, gs.base
+
+            else => return error.InvalidRegister,
+        }
+    }
+};
+
+pub const X86_64 = struct {
+    /// MLUGG TODO: explain this order. why does DWARF have this?
+    pub const Gpr = enum {
+        // zig fmt: off
+        rax, rdx, rcx, rbx,
+        rsi, rdi, rbp, rsp,
+        r8,  r9,  r10, r11,
+        r12, r13, r14, r15,
+        rip,
+        // zig fmt: on
+    };
+    gprs: std.enums.EnumArray(Gpr, u64),
+
+    pub inline fn current() X86_64 {
+        var ctx: X86_64 = undefined;
+        asm volatile (
+            \\movq %%rax, 0x00(%%rdi)
+            \\movq %%rdx, 0x08(%%rdi)
+            \\movq %%rcx, 0x10(%%rdi)
+            \\movq %%rbx, 0x18(%%rdi)
+            \\movq %%rsi, 0x20(%%rdi)
+            \\movq %%rdi, 0x28(%%rdi)
+            \\movq %%rbp, 0x30(%%rdi)
+            \\movq %%rsp, 0x38(%%rdi)
+            \\movq %%r8,  0x40(%%rdi)
+            \\movq %%r9,  0x48(%%rdi)
+            \\movq %%r10, 0x50(%%rdi)
+            \\movq %%r11, 0x58(%%rdi)
+            \\movq %%r12, 0x60(%%rdi)
+            \\movq %%r13, 0x68(%%rdi)
+            \\movq %%r14, 0x70(%%rdi)
+            \\movq %%r15, 0x78(%%rdi)
+            \\leaq (%%rip), %%rax
+            \\movq %%rax, 0x80(%%rdi)
+            \\movq 0x00(%%rdi), %%rax  // restore saved rax
+            :
+            : [gprs] "{rdi}" (&ctx.gprs.values),
+            : .{ .memory = true });
+        return ctx;
+    }
+
+    pub fn dwarfRegisterBytes(ctx: *X86_64, register_num: u16) DwarfRegisterError![]u8 {
+        // System V Application Binary Interface AMD64 Architecture Processor Supplement
+        //   § 3.6.2 "DWARF Register Number Mapping"
+        switch (register_num) {
+            // The order of `Gpr` intentionally matches DWARF's mappings.
+            0...16 => return @ptrCast(&ctx.gprs.values[register_num]),
+
+            17...32 => return error.UnsupportedRegister, // xmm0 - xmm15
+            33...40 => return error.UnsupportedRegister, // st0 - st7
+            41...48 => return error.UnsupportedRegister, // mm0 - mm7
+            49 => return error.UnsupportedRegister, // rflags
+            50...55 => return error.UnsupportedRegister, // es, cs, ss, ds, fs, gs
+            58...59 => return error.UnsupportedRegister, // fs.base, gs.base
+            62 => return error.UnsupportedRegister, // tr
+            63 => return error.UnsupportedRegister, // ldtr
+            64 => return error.UnsupportedRegister, // mxcsr
+            65 => return error.UnsupportedRegister, // fcw
+            66 => return error.UnsupportedRegister, // fsw
+
+            else => return error.InvalidRegister,
+        }
+    }
+};
+
+pub const Arm = struct {
+    /// The numbered general-purpose registers R0 - R15.
+    r: [16]u32,
+
+    pub inline fn current() Arm {
+        var ctx: Arm = undefined;
+        asm volatile (
+            \\// For compatibility with Thumb, we can't write r13 (sp) or r15 (pc) with stm.
+            \\stm r0, {r0-r12}
+            \\str r13, [r0, #0x34]
+            \\str r14, [r0, #0x38]
+            \\str r15, [r0, #0x3c]
+            :
+            : [r] "{r0}" (&ctx.r),
+            : .{ .memory = true });
+        return ctx;
+    }
+
+    pub fn dwarfRegisterBytes(ctx: *Arm, register_num: u16) DwarfRegisterError![]u8 {
+        // DWARF for the Arm(r) Architecture § 4.1 "DWARF register names"
+        switch (register_num) {
+            // The order of `Gpr` intentionally matches DWARF's mappings.
+            0...15 => return @ptrCast(&ctx.r[register_num]),
+
+            64...95 => return error.UnsupportedRegister, // S0 - S31
+            96...103 => return error.UnsupportedRegister, // F0 - F7
+            104...111 => return error.UnsupportedRegister, // wCGR0 - wCGR7, or ACC0 - ACC7
+            112...127 => return error.UnsupportedRegister, // wR0 - wR15
+            128 => return error.UnsupportedRegister, // SPSR
+            129 => return error.UnsupportedRegister, // SPSR_FIQ
+            130 => return error.UnsupportedRegister, // SPSR_IRQ
+            131 => return error.UnsupportedRegister, // SPSR_ABT
+            132 => return error.UnsupportedRegister, // SPSR_UND
+            133 => return error.UnsupportedRegister, // SPSR_SVC
+            143 => return error.UnsupportedRegister, // RA_AUTH_CODE
+            144...150 => return error.UnsupportedRegister, // R8_USR - R14_USR
+            151...157 => return error.UnsupportedRegister, // R8_FIQ - R14_FIQ
+            158...159 => return error.UnsupportedRegister, // R13_IRQ - R14_IRQ
+            160...161 => return error.UnsupportedRegister, // R13_ABT - R14_ABT
+            162...163 => return error.UnsupportedRegister, // R13_UND - R14_UND
+            164...165 => return error.UnsupportedRegister, // R13_SVC - R14_SVC
+            192...199 => return error.UnsupportedRegister, // wC0 - wC7
+            256...287 => return error.UnsupportedRegister, // D0 - D31
+            320 => return error.UnsupportedRegister, // TPIDRURO
+            321 => return error.UnsupportedRegister, // TPIDRURW
+            322 => return error.UnsupportedRegister, // TPIDPR
+            323 => return error.UnsupportedRegister, // HTPIDPR
+            8192...16383 => return error.UnsupportedRegister, // Unspecified vendor co-processor register
+
+            else => return error.InvalidRegister,
+        }
+    }
+};
+
+/// This is an `extern struct` so that inline assembly in `current` can use field offsets.
+pub const Aarch64 = extern struct {
+    /// The numbered general-purpose registers X0 - X30.
+    x: [31]u64,
+    sp: u64,
+    pc: u64,
+
+    pub inline fn current() Aarch64 {
+        var ctx: Aarch64 = undefined;
+        asm volatile (
+            \\stp x0,  x1,  [x0, #0x000]
+            \\stp x2,  x3,  [x0, #0x010]
+            \\stp x4,  x5,  [x0, #0x020]
+            \\stp x6,  x7,  [x0, #0x030]
+            \\stp x8,  x9,  [x0, #0x040]
+            \\stp x10, x11, [x0, #0x050]
+            \\stp x12, x13, [x0, #0x060]
+            \\stp x14, x15, [x0, #0x070]
+            \\stp x16, x17, [x0, #0x080]
+            \\stp x18, x19, [x0, #0x090]
+            \\stp x20, x21, [x0, #0x0a0]
+            \\stp x22, x23, [x0, #0x0b0]
+            \\stp x24, x25, [x0, #0x0c0]
+            \\stp x26, x27, [x0, #0x0d0]
+            \\stp x28, x29, [x0, #0x0e0]
+            \\str x30, [x0, #0x0f0]
+            \\mov x1, sp
+            \\str x1, [x0, #0x0f8]
+            \\adr x1, .
+            \\str x1, [x0, #0x100]
+            \\ldr x1, [x0, #0x008] // restore saved x1
+            :
+            : [gprs] "{x0}" (&ctx),
+            : .{ .memory = true });
+        return ctx;
+    }
+
+    pub fn dwarfRegisterBytes(ctx: *Aarch64, register_num: u16) DwarfRegisterError![]u8 {
+        // DWARF for the Arm(r) 64-bit Architecture (AArch64) § 4.1 "DWARF register names"
+        switch (register_num) {
+            // The order of `Gpr` intentionally matches DWARF's mappings.
+            0...30 => return @ptrCast(&ctx.x[register_num]),
+            31 => return @ptrCast(&ctx.sp),
+            32 => return @ptrCast(&ctx.pc),
+
+            33 => return error.UnsupportedRegister, // ELF_mode
+            34 => return error.UnsupportedRegister, // RA_SIGN_STATE
+            35 => return error.UnsupportedRegister, // TPIDRRO_ELO
+            36 => return error.UnsupportedRegister, // RPIDR_ELO
+            37 => return error.UnsupportedRegister, // RPIDR_EL1
+            38 => return error.UnsupportedRegister, // RPIDR_EL2
+            39 => return error.UnsupportedRegister, // RPIDR_EL3
+            46 => return error.UnsupportedRegister, // VG
+            47 => return error.UnsupportedRegister, // FFR
+            48...63 => return error.UnsupportedRegister, // P0 - P15
+            64...95 => return error.UnsupportedRegister, // V0 - V31
+            96...127 => return error.UnsupportedRegister, // Z0 - Z31
+
+            else => return error.InvalidRegister,
+        }
+    }
+};
+
+const signal_ucontext_t = switch (native_os) {
+    .linux => std.os.linux.ucontext_t,
+    .emscripten => std.os.emscripten.ucontext_t,
+    .freebsd => std.os.freebsd.ucontext_t,
+    .macos, .ios, .tvos, .watchos, .visionos => extern struct {
+        onstack: c_int,
+        sigmask: std.c.sigset_t,
+        stack: std.c.stack_t,
+        link: ?*signal_ucontext_t,
+        mcsize: u64,
+        mcontext: *mcontext_t,
+        const mcontext_t = switch (native_arch) {
+            .aarch64 => extern struct {
+                es: extern struct {
+                    far: u64, // Virtual Fault Address
+                    esr: u32, // Exception syndrome
+                    exception: u32, // Number of arm exception taken
+                },
+                ss: extern struct {
+                    /// General purpose registers
+                    regs: [29]u64,
+                    /// Frame pointer x29
+                    fp: u64,
+                    /// Link register x30
+                    lr: u64,
+                    /// Stack pointer x31
+                    sp: u64,
+                    /// Program counter
+                    pc: u64,
+                    /// Current program status register
+                    cpsr: u32,
+                    __pad: u32,
+                },
+                ns: extern struct {
+                    q: [32]u128,
+                    fpsr: u32,
+                    fpcr: u32,
+                },
+            },
+            .x86_64 => extern struct {
+                es: extern struct {
+                    trapno: u16,
+                    cpu: u16,
+                    err: u32,
+                    faultvaddr: u64,
+                },
+                ss: extern struct {
+                    rax: u64,
+                    rbx: u64,
+                    rcx: u64,
+                    rdx: u64,
+                    rdi: u64,
+                    rsi: u64,
+                    rbp: u64,
+                    rsp: u64,
+                    r8: u64,
+                    r9: u64,
+                    r10: u64,
+                    r11: u64,
+                    r12: u64,
+                    r13: u64,
+                    r14: u64,
+                    r15: u64,
+                    rip: u64,
+                    rflags: u64,
+                    cs: u64,
+                    fs: u64,
+                    gs: u64,
+                },
+                fs: extern struct {
+                    reserved: [2]c_int,
+                    fcw: u16,
+                    fsw: u16,
+                    ftw: u8,
+                    rsrv1: u8,
+                    fop: u16,
+                    ip: u32,
+                    cs: u16,
+                    rsrv2: u16,
+                    dp: u32,
+                    ds: u16,
+                    rsrv3: u16,
+                    mxcsr: u32,
+                    mxcsrmask: u32,
+                    stmm: [8]stmm_reg,
+                    xmm: [16]xmm_reg,
+                    rsrv4: [96]u8,
+                    reserved1: c_int,
+
+                    const stmm_reg = [16]u8;
+                    const xmm_reg = [16]u8;
+                },
+            },
+            else => void,
+        };
+    },
+    .solaris, .illumos => extern struct {
+        flags: u64,
+        link: ?*signal_ucontext_t,
+        sigmask: std.c.sigset_t,
+        stack: std.c.stack_t,
+        mcontext: mcontext_t,
+        brand_data: [3]?*anyopaque,
+        filler: [2]i64,
+        const mcontext_t = extern struct {
+            gregs: [28]u64,
+            fpregs: std.c.fpregset_t,
+        };
+    },
+    .openbsd => switch (builtin.cpu.arch) {
+        .x86_64 => extern struct {
+            sc_rdi: c_long,
+            sc_rsi: c_long,
+            sc_rdx: c_long,
+            sc_rcx: c_long,
+            sc_r8: c_long,
+            sc_r9: c_long,
+            sc_r10: c_long,
+            sc_r11: c_long,
+            sc_r12: c_long,
+            sc_r13: c_long,
+            sc_r14: c_long,
+            sc_r15: c_long,
+            sc_rbp: c_long,
+            sc_rbx: c_long,
+            sc_rax: c_long,
+            sc_gs: c_long,
+            sc_fs: c_long,
+            sc_es: c_long,
+            sc_ds: c_long,
+            sc_trapno: c_long,
+            sc_err: c_long,
+            sc_rip: c_long,
+            sc_cs: c_long,
+            sc_rflags: c_long,
+            sc_rsp: c_long,
+            sc_ss: c_long,
+
+            sc_fpstate: *anyopaque, // struct fxsave64 *
+            __sc_unused: c_int,
+            sc_mask: c_int,
+            sc_cookie: c_long,
+        },
+        .aarch64 => extern struct {
+            __sc_unused: c_int,
+            sc_mask: c_int,
+            sc_sp: c_ulong,
+            sc_lr: c_ulong,
+            sc_elr: c_ulong,
+            sc_spsr: c_ulong,
+            sc_x: [30]c_ulong,
+            sc_cookie: c_long,
+        },
+        else => void,
+    },
+    .netbsd => extern struct {
+        flags: u32,
+        link: ?*signal_ucontext_t,
+        sigmask: std.c.sigset_t,
+        stack: std.c.stack_t,
+        mcontext: mcontext_t,
+        __pad: [
+            switch (builtin.cpu.arch) {
+                .x86 => 4,
+                .mips, .mipsel, .mips64, .mips64el => 14,
+                .arm, .armeb, .thumb, .thumbeb => 1,
+                .sparc, .sparc64 => if (@sizeOf(usize) == 4) 43 else 8,
+                else => 0,
+            }
+        ]u32,
+        const mcontext_t = switch (builtin.cpu.arch) {
+            .aarch64, .aarch64_be => extern struct {
+                gregs: [35]u64,
+                fregs: [528]u8 align(16),
+                spare: [8]u64,
+            },
+            .x86 => extern struct {
+                gregs: [19]u32,
+                fpregs: [161]u32,
+                mc_tlsbase: u32,
+            },
+            .x86_64 => extern struct {
+                gregs: [26]u64,
+                mc_tlsbase: u64,
+                fpregs: [512]u8 align(8),
+            },
+            else => void,
+        };
+    },
+    .dragonfly => extern struct {
+        sigmask: std.c.sigset_t,
+        mcontext: mcontext_t,
+        link: ?*signal_ucontext_t,
+        stack: std.c.stack_t,
+        cofunc: ?*fn (?*signal_ucontext_t, ?*anyopaque) void,
+        arg: ?*void,
+        _spare: [4]c_int,
+        const mcontext_t = extern struct {
+            const register_t = isize;
+            onstack: register_t, // XXX - sigcontext compat.
+            rdi: register_t,
+            rsi: register_t,
+            rdx: register_t,
+            rcx: register_t,
+            r8: register_t,
+            r9: register_t,
+            rax: register_t,
+            rbx: register_t,
+            rbp: register_t,
+            r10: register_t,
+            r11: register_t,
+            r12: register_t,
+            r13: register_t,
+            r14: register_t,
+            r15: register_t,
+            xflags: register_t,
+            trapno: register_t,
+            addr: register_t,
+            flags: register_t,
+            err: register_t,
+            rip: register_t,
+            cs: register_t,
+            rflags: register_t,
+            rsp: register_t, // machine state
+            ss: register_t,
+
+            len: c_uint, // sizeof(mcontext_t)
+            fpformat: c_uint,
+            ownedfp: c_uint,
+            reserved: c_uint,
+            unused: [8]c_uint,
+
+            // NOTE! 64-byte aligned as of here. Also must match savefpu structure.
+            fpregs: [256]c_int align(64),
+        };
+    },
+    .serenity => extern struct {
+        link: ?*signal_ucontext_t,
+        sigmask: std.c.sigset_t,
+        stack: std.c.stack_t,
+        mcontext: mcontext_t,
+        const mcontext_t = switch (builtin.cpu.arch) {
+            // https://github.com/SerenityOS/serenity/blob/200e91cd7f1ec5453799a2720d4dc114a59cc289/Kernel/Arch/aarch64/mcontext.h#L15-L19
+            .aarch64 => extern struct {
+                x: [31]u64,
+                sp: u64,
+                pc: u64,
+            },
+            // https://github.com/SerenityOS/serenity/blob/66f8d0f031ef25c409dbb4fecaa454800fecae0f/Kernel/Arch/riscv64/mcontext.h#L15-L18
+            .riscv64 => extern struct {
+                x: [31]u64,
+                pc: u64,
+            },
+            // https://github.com/SerenityOS/serenity/blob/7b9ea3efdec9f86a1042893e8107d0b23aad8727/Kernel/Arch/x86_64/mcontext.h#L15-L40
+            .x86_64 => extern struct {
+                rax: u64,
+                rcx: u64,
+                rdx: u64,
+                rbx: u64,
+                rsp: u64,
+                rbp: u64,
+                rsi: u64,
+                rdi: u64,
+                rip: u64,
+                r8: u64,
+                r9: u64,
+                r10: u64,
+                r11: u64,
+                r12: u64,
+                r13: u64,
+                r14: u64,
+                r15: u64,
+                rflags: u64,
+                cs: u32,
+                ss: u32,
+                ds: u32,
+                es: u32,
+                fs: u32,
+                gs: u32,
+            },
+            else => void,
+        };
+    },
+    .haiku => extern struct {
+        link: ?*signal_ucontext_t,
+        sigmask: std.c.sigset_t,
+        stack: std.c.stack_t,
+        mcontext: mcontext_t,
+        const mcontext_t = switch (builtin.cpu.arch) {
+            .arm, .thumb => extern struct {
+                r0: u32,
+                r1: u32,
+                r2: u32,
+                r3: u32,
+                r4: u32,
+                r5: u32,
+                r6: u32,
+                r7: u32,
+                r8: u32,
+                r9: u32,
+                r10: u32,
+                r11: u32,
+                r12: u32,
+                r13: u32,
+                r14: u32,
+                r15: u32,
+                cpsr: u32,
+            },
+            .aarch64 => extern struct {
+                x: [10]u64,
+                lr: u64,
+                sp: u64,
+                elr: u64,
+                spsr: u64,
+                fp_q: [32]u128,
+                fpsr: u32,
+                fpcr: u32,
+            },
+            .m68k => extern struct {
+                pc: u32,
+                d0: u32,
+                d1: u32,
+                d2: u32,
+                d3: u32,
+                d4: u32,
+                d5: u32,
+                d6: u32,
+                d7: u32,
+                a0: u32,
+                a1: u32,
+                a2: u32,
+                a3: u32,
+                a4: u32,
+                a5: u32,
+                a6: u32,
+                a7: u32,
+                ccr: u8,
+                f0: f64,
+                f1: f64,
+                f2: f64,
+                f3: f64,
+                f4: f64,
+                f5: f64,
+                f6: f64,
+                f7: f64,
+                f8: f64,
+                f9: f64,
+                f10: f64,
+                f11: f64,
+                f12: f64,
+                f13: f64,
+            },
+            .mipsel => extern struct {
+                r0: u32,
+            },
+            .powerpc => extern struct {
+                pc: u32,
+                r0: u32,
+                r1: u32,
+                r2: u32,
+                r3: u32,
+                r4: u32,
+                r5: u32,
+                r6: u32,
+                r7: u32,
+                r8: u32,
+                r9: u32,
+                r10: u32,
+                r11: u32,
+                r12: u32,
+                f0: f64,
+                f1: f64,
+                f2: f64,
+                f3: f64,
+                f4: f64,
+                f5: f64,
+                f6: f64,
+                f7: f64,
+                f8: f64,
+                f9: f64,
+                f10: f64,
+                f11: f64,
+                f12: f64,
+                f13: f64,
+                reserved: u32,
+                fpscr: u32,
+                ctr: u32,
+                xer: u32,
+                cr: u32,
+                msr: u32,
+                lr: u32,
+            },
+            .riscv64 => extern struct {
+                x: [31]u64,
+                pc: u64,
+                f: [32]f64,
+                fcsr: u64,
+            },
+            .sparc64 => extern struct {
+                g1: u64,
+                g2: u64,
+                g3: u64,
+                g4: u64,
+                g5: u64,
+                g6: u64,
+                g7: u64,
+                o0: u64,
+                o1: u64,
+                o2: u64,
+                o3: u64,
+                o4: u64,
+                o5: u64,
+                sp: u64,
+                o7: u64,
+                l0: u64,
+                l1: u64,
+                l2: u64,
+                l3: u64,
+                l4: u64,
+                l5: u64,
+                l6: u64,
+                l7: u64,
+                i0: u64,
+                i1: u64,
+                i2: u64,
+                i3: u64,
+                i4: u64,
+                i5: u64,
+                fp: u64,
+                i7: u64,
+            },
+            .x86 => extern struct {
+                pub const old_extended_regs = extern struct {
+                    control: u16,
+                    reserved1: u16,
+                    status: u16,
+                    reserved2: u16,
+                    tag: u16,
+                    reserved3: u16,
+                    eip: u32,
+                    cs: u16,
+                    opcode: u16,
+                    datap: u32,
+                    ds: u16,
+                    reserved4: u16,
+                    fp_mmx: [8][10]u8,
+                };
+
+                pub const fp_register = extern struct { value: [10]u8, reserved: [6]u8 };
+
+                pub const xmm_register = extern struct { value: [16]u8 };
+
+                pub const new_extended_regs = extern struct {
+                    control: u16,
+                    status: u16,
+                    tag: u16,
+                    opcode: u16,
+                    eip: u32,
+                    cs: u16,
+                    reserved1: u16,
+                    datap: u32,
+                    ds: u16,
+                    reserved2: u16,
+                    mxcsr: u32,
+                    reserved3: u32,
+                    fp_mmx: [8]fp_register,
+                    xmmx: [8]xmm_register,
+                    reserved4: [224]u8,
+                };
+
+                pub const extended_regs = extern struct {
+                    state: extern union {
+                        old_format: old_extended_regs,
+                        new_format: new_extended_regs,
+                    },
+                    format: u32,
+                };
+
+                eip: u32,
+                eflags: u32,
+                eax: u32,
+                ecx: u32,
+                edx: u32,
+                esp: u32,
+                ebp: u32,
+                reserved: u32,
+                xregs: extended_regs,
+                edi: u32,
+                esi: u32,
+                ebx: u32,
+            },
+            .x86_64 => extern struct {
+                pub const fp_register = extern struct {
+                    value: [10]u8,
+                    reserved: [6]u8,
+                };
+
+                pub const xmm_register = extern struct {
+                    value: [16]u8,
+                };
+
+                pub const fpu_state = extern struct {
+                    control: u16,
+                    status: u16,
+                    tag: u16,
+                    opcode: u16,
+                    rip: u64,
+                    rdp: u64,
+                    mxcsr: u32,
+                    mscsr_mask: u32,
+
+                    fp_mmx: [8]fp_register,
+                    xmm: [16]xmm_register,
+                    reserved: [96]u8,
+                };
+
+                pub const xstate_hdr = extern struct {
+                    bv: u64,
+                    xcomp_bv: u64,
+                    reserved: [48]u8,
+                };
+
+                pub const savefpu = extern struct {
+                    fxsave: fpu_state,
+                    xstate: xstate_hdr,
+                    ymm: [16]xmm_register,
+                };
+
+                rax: u64,
+                rbx: u64,
+                rcx: u64,
+                rdx: u64,
+                rdi: u64,
+                rsi: u64,
+                rbp: u64,
+                r8: u64,
+                r9: u64,
+                r10: u64,
+                r11: u64,
+                r12: u64,
+                r13: u64,
+                r14: u64,
+                r15: u64,
+                rsp: u64,
+                rip: u64,
+                rflags: u64,
+                fpu: savefpu,
+            },
+            else => void,
+        };
+    },
+    else => void,
+};
+
+const std = @import("../std.zig");
+const root = @import("root");
+const builtin = @import("builtin");
+const native_arch = @import("builtin").target.cpu.arch;
+const native_os = @import("builtin").target.os.tag;
-- 
cgit v1.2.3


From dd8d59686a069fdb72d9f0753e3482ff99cce98c Mon Sep 17 00:00:00 2001
From: mlugg <mlugg@mlugg.co.uk>
Date: Wed, 17 Sep 2025 23:03:45 +0100
Subject: std.debug: miscellaneous fixes

Mostly on macOS, since Loris showed me a not-great stack trace, and I
spent 8 hours trying to make it better. The dyld shared cache is
designed in a way which makes this really hard to do right, and
documentation is non-existent, but this *seems* to work pretty well.
I'll leave the ruling on whether I did a good job to CI and our users.
---
 lib/std/c.zig                            |   3 +
 lib/std/c/darwin.zig                     |   8 ++
 lib/std/debug.zig                        |  75 ++++++++---
 lib/std/debug/SelfInfo.zig               |  54 +++-----
 lib/std/debug/SelfInfo/DarwinModule.zig  | 224 +++++++++++++++++++++----------
 lib/std/debug/SelfInfo/ElfModule.zig     |   2 +-
 lib/std/debug/SelfInfo/WindowsModule.zig |  36 ++++-
 lib/std/debug/cpu_context.zig            |   6 +
 8 files changed, 276 insertions(+), 132 deletions(-)

(limited to 'lib/std/debug/cpu_context.zig')

diff --git a/lib/std/c.zig b/lib/std/c.zig
index d1affab207..4c139d5023 100644
--- a/lib/std/c.zig
+++ b/lib/std/c.zig
@@ -10994,6 +10994,9 @@ pub extern "c" fn dlclose(handle: *anyopaque) c_int;
 pub extern "c" fn dlsym(handle: ?*anyopaque, symbol: [*:0]const u8) ?*anyopaque;
 pub extern "c" fn dlerror() ?[*:0]u8;
 
+pub const dladdr = if (native_os.isDarwin()) darwin.dladdr else {};
+pub const dl_info = if (native_os.isDarwin()) darwin.dl_info else {};
+
 pub extern "c" fn sync() void;
 pub extern "c" fn syncfs(fd: c_int) c_int;
 pub extern "c" fn fsync(fd: c_int) c_int;
diff --git a/lib/std/c/darwin.zig b/lib/std/c/darwin.zig
index 2ad979ecf2..cf7d3127eb 100644
--- a/lib/std/c/darwin.zig
+++ b/lib/std/c/darwin.zig
@@ -354,6 +354,14 @@ pub extern "c" fn _dyld_image_count() u32;
 pub extern "c" fn _dyld_get_image_header(image_index: u32) ?*mach_header;
 pub extern "c" fn _dyld_get_image_vmaddr_slide(image_index: u32) usize;
 pub extern "c" fn _dyld_get_image_name(image_index: u32) [*:0]const u8;
+pub extern "c" fn dladdr(addr: *const anyopaque, info: *dl_info) c_int;
+
+pub const dl_info = extern struct {
+    fname: [*:0]const u8,
+    fbase: *anyopaque,
+    sname: ?[*:0]const u8,
+    saddr: ?*anyopaque,
+};
 
 pub const COPYFILE = packed struct(u32) {
     ACL: bool = false,
diff --git a/lib/std/debug.zig b/lib/std/debug.zig
index 088152d873..5b7a6bf715 100644
--- a/lib/std/debug.zig
+++ b/lib/std/debug.zig
@@ -585,12 +585,14 @@ pub fn captureCurrentStackTrace(options: StackUnwindOptions, addr_buf: []usize)
     while (true) switch (it.next()) {
         .switch_to_fp => if (!it.stratOk(options.allow_unsafe_unwind)) break,
         .end => break,
-        .frame => |return_address| {
+        .frame => |pc_addr| {
             if (wait_for) |target| {
-                if (return_address != target) continue;
+                // Possible off-by-one error: `pc_addr` might be one less than the return address (so
+                // that it falls *inside* the function call), while `target` *is* a return address.
+                if (pc_addr != target and pc_addr + 1 != target) continue;
                 wait_for = null;
             }
-            if (frame_idx < addr_buf.len) addr_buf[frame_idx] = return_address;
+            if (frame_idx < addr_buf.len) addr_buf[frame_idx] = pc_addr;
             frame_idx += 1;
         },
     };
@@ -631,6 +633,7 @@ pub fn writeCurrentStackTrace(options: StackUnwindOptions, writer: *Writer, tty_
     var printed_any_frame = false;
     while (true) switch (it.next()) {
         .switch_to_fp => |unwind_error| {
+            if (StackIterator.fp_unwind_is_safe) continue; // no need to even warn
             const module_name = di.getModuleNameForAddress(di_gpa, unwind_error.address) catch "???";
             const caption: []const u8 = switch (unwind_error.err) {
                 error.MissingDebugInfo => "unwind info unavailable",
@@ -658,12 +661,14 @@ pub fn writeCurrentStackTrace(options: StackUnwindOptions, writer: *Writer, tty_
             }
         },
         .end => break,
-        .frame => |return_address| {
+        .frame => |pc_addr| {
             if (wait_for) |target| {
-                if (return_address != target) continue;
+                // Possible off-by-one error: `pc_addr` might be one less than the return address (so
+                // that it falls *inside* the function call), while `target` *is* a return address.
+                if (pc_addr != target and pc_addr + 1 != target) continue;
                 wait_for = null;
             }
-            try printSourceAtAddress(di_gpa, di, writer, return_address -| 1, tty_config);
+            try printSourceAtAddress(di_gpa, di, writer, pc_addr, tty_config);
             printed_any_frame = true;
         },
     };
@@ -703,8 +708,8 @@ pub fn writeStackTrace(st: *const std.builtin.StackTrace, writer: *Writer, tty_c
         },
     };
     const captured_frames = @min(n_frames, st.instruction_addresses.len);
-    for (st.instruction_addresses[0..captured_frames]) |return_address| {
-        try printSourceAtAddress(di_gpa, di, writer, return_address -| 1, tty_config);
+    for (st.instruction_addresses[0..captured_frames]) |pc_addr| {
+        try printSourceAtAddress(di_gpa, di, writer, pc_addr, tty_config);
     }
     if (n_frames > captured_frames) {
         tty_config.setColor(writer, .bold) catch {};
@@ -725,6 +730,8 @@ pub fn dumpStackTrace(st: *const std.builtin.StackTrace) void {
 const StackIterator = union(enum) {
     /// Unwinding using debug info (e.g. DWARF CFI).
     di: if (SelfInfo.supports_unwinding) SelfInfo.UnwindContext else noreturn,
+    /// We will first report the *current* PC of this `UnwindContext`, then we will switch to `di`.
+    di_first: if (SelfInfo.supports_unwinding) SelfInfo.UnwindContext else noreturn,
     /// Naive frame-pointer-based unwinding. Very simple, but typically unreliable.
     fp: usize,
 
@@ -742,9 +749,12 @@ const StackIterator = union(enum) {
         }
         if (opt_context_ptr) |context_ptr| {
             if (!SelfInfo.supports_unwinding) return error.CannotUnwindFromContext;
-            return .{ .di = .init(context_ptr) };
+            // Use `di_first` here so we report the PC in the context before unwinding any further.
+            return .{ .di_first = .init(context_ptr) };
         }
         if (SelfInfo.supports_unwinding and cpu_context.Native != noreturn) {
+            // We don't need `di_first` here, because our PC is in `std.debug`; we're only interested
+            // in our caller's frame and above.
             return .{ .di = .init(&.current()) };
         }
         return .{ .fp = @frameAddress() };
@@ -752,7 +762,7 @@ const StackIterator = union(enum) {
     fn deinit(si: *StackIterator) void {
         switch (si.*) {
             .fp => {},
-            .di => |*unwind_context| unwind_context.deinit(getDebugInfoAllocator()),
+            .di, .di_first => |*unwind_context| unwind_context.deinit(getDebugInfoAllocator()),
         }
     }
 
@@ -763,7 +773,7 @@ const StackIterator = union(enum) {
     /// Whether the current unwind strategy is allowed given `allow_unsafe`.
     fn stratOk(it: *const StackIterator, allow_unsafe: bool) bool {
         return switch (it.*) {
-            .di => true,
+            .di, .di_first => true,
             // If we omitted frame pointers from *this* compilation, FP unwinding would crash
             // immediately regardless of anything. But FPs could also be omitted from a different
             // linked object, so it's not guaranteed to be safe, unless the target specifically
@@ -773,11 +783,11 @@ const StackIterator = union(enum) {
     }
 
     const Result = union(enum) {
-        /// A stack frame has been found; this is the corresponding return address.
+        /// A stack frame has been found; this is the corresponding program counter address.
         frame: usize,
         /// The end of the stack has been reached.
         end,
-        /// We were using the `.di` strategy, but are now switching to `.fp` due to this error.
+        /// We were using `SelfInfo.UnwindInfo`, but are now switching to FP unwinding due to this error.
         switch_to_fp: struct {
             address: usize,
             err: SelfInfo.Error,
@@ -785,20 +795,25 @@ const StackIterator = union(enum) {
     };
     fn next(it: *StackIterator) Result {
         switch (it.*) {
+            .di_first => |unwind_context| {
+                const first_pc = unwind_context.pc;
+                if (first_pc == 0) return .end;
+                it.* = .{ .di = unwind_context };
+                return .{ .frame = first_pc };
+            },
             .di => |*unwind_context| {
                 const di = getSelfDebugInfo() catch unreachable;
                 const di_gpa = getDebugInfoAllocator();
-                if (di.unwindFrame(di_gpa, unwind_context)) |ra| {
-                    if (ra <= 1) return .end;
-                    return .{ .frame = ra };
-                } else |err| {
+                di.unwindFrame(di_gpa, unwind_context) catch |err| {
                     const pc = unwind_context.pc;
                     it.* = .{ .fp = unwind_context.getFp() };
                     return .{ .switch_to_fp = .{
                         .address = pc,
                         .err = err,
                     } };
-                }
+                };
+                const pc = unwind_context.pc;
+                return if (pc == 0) .end else .{ .frame = pc };
             },
             .fp => |fp| {
                 if (fp == 0) return .end; // we reached the "sentinel" base pointer
@@ -824,9 +839,9 @@ const StackIterator = union(enum) {
                 if (bp != 0 and bp <= fp) return .end;
 
                 it.fp = bp;
-                const ra = ra_ptr.*;
+                const ra = stripInstructionPtrAuthCode(ra_ptr.*);
                 if (ra <= 1) return .end;
-                return .{ .frame = ra };
+                return .{ .frame = ra - 1 };
             },
         }
     }
@@ -860,6 +875,26 @@ const StackIterator = union(enum) {
     }
 };
 
+/// Some platforms use pointer authentication: the upper bits of instruction pointers contain a
+/// signature. This function clears those signature bits to make the pointer directly usable.
+pub inline fn stripInstructionPtrAuthCode(ptr: usize) usize {
+    if (native_arch.isAARCH64()) {
+        // `hint 0x07` maps to `xpaclri` (or `nop` if the hardware doesn't support it)
+        // The save / restore is because `xpaclri` operates on x30 (LR)
+        return asm (
+            \\mov x16, x30
+            \\mov x30, x15
+            \\hint 0x07
+            \\mov x15, x30
+            \\mov x30, x16
+            : [ret] "={x15}" (-> usize),
+            : [ptr] "{x15}" (ptr),
+            : .{ .x16 = true });
+    }
+
+    return ptr;
+}
+
 fn printSourceAtAddress(gpa: Allocator, debug_info: *SelfInfo, writer: *Writer, address: usize, tty_config: tty.Config) Writer.Error!void {
     const symbol: Symbol = debug_info.getSymbolAtAddress(gpa, address) catch |err| switch (err) {
         error.MissingDebugInfo,
diff --git a/lib/std/debug/SelfInfo.zig b/lib/std/debug/SelfInfo.zig
index 321e67bb7c..efa9d782f6 100644
--- a/lib/std/debug/SelfInfo.zig
+++ b/lib/std/debug/SelfInfo.zig
@@ -2,7 +2,6 @@
 //! goal of minimal code bloat and compilation speed penalty.
 
 const builtin = @import("builtin");
-const native_os = builtin.os.tag;
 const native_endian = native_arch.endian();
 const native_arch = builtin.cpu.arch;
 
@@ -13,6 +12,8 @@ const assert = std.debug.assert;
 const Dwarf = std.debug.Dwarf;
 const CpuContext = std.debug.cpu_context.Native;
 
+const stripInstructionPtrAuthCode = std.debug.stripInstructionPtrAuthCode;
+
 const root = @import("root");
 
 const SelfInfo = @This();
@@ -52,7 +53,7 @@ pub fn deinit(self: *SelfInfo, gpa: Allocator) void {
     if (Module.LookupCache != void) self.lookup_cache.deinit(gpa);
 }
 
-pub fn unwindFrame(self: *SelfInfo, gpa: Allocator, context: *UnwindContext) Error!usize {
+pub fn unwindFrame(self: *SelfInfo, gpa: Allocator, context: *UnwindContext) Error!void {
     comptime assert(supports_unwinding);
     const module: Module = try .lookup(&self.lookup_cache, gpa, context.pc);
     const gop = try self.modules.getOrPut(gpa, module.key());
@@ -115,7 +116,7 @@ pub fn getModuleNameForAddress(self: *SelfInfo, gpa: Allocator, address: usize)
 /// pub const supports_unwinding: bool;
 /// /// Only required if `supports_unwinding == true`.
 /// pub const UnwindContext = struct {
-///     /// A PC value inside the function of the last unwound frame.
+///     /// A PC value representing the location in the last frame.
 ///     pc: usize,
 ///     pub fn init(ctx: *std.debug.cpu_context.Native, gpa: Allocator) Allocator.Error!UnwindContext;
 ///     pub fn deinit(uc: *UnwindContext, gpa: Allocator) void;
@@ -123,21 +124,22 @@ pub fn getModuleNameForAddress(self: *SelfInfo, gpa: Allocator, address: usize)
 ///     /// pointer is unknown, 0 may be returned instead.
 ///     pub fn getFp(uc: *UnwindContext) usize;
 /// };
-/// /// Only required if `supports_unwinding == true`. Unwinds a single stack frame and returns
-/// /// the next return address (which may be 0 indicating end of stack).
+/// /// Only required if `supports_unwinding == true`. Unwinds a single stack frame.
+/// /// The caller will read the new instruction poiter from the `pc` field.
+/// /// `pc = 0` indicates end of stack / no more frames.
 /// pub fn unwindFrame(
 ///     mod: *const Module,
 ///     gpa: Allocator,
 ///     di: *DebugInfo,
 ///     ctx: *UnwindContext,
-/// ) SelfInfo.Error!usize;
+/// ) SelfInfo.Error!void;
 /// ```
 const Module: type = Module: {
     // Allow overriding the target-specific `SelfInfo` implementation by exposing `root.debug.Module`.
     if (@hasDecl(root, "debug") and @hasDecl(root.debug, "Module")) {
         break :Module root.debug.Module;
     }
-    break :Module switch (native_os) {
+    break :Module switch (builtin.os.tag) {
         .linux,
         .netbsd,
         .freebsd,
@@ -222,7 +224,7 @@ pub const DwarfUnwindContext = struct {
                 const register = col.register orelse return error.InvalidRegister;
                 // The default type is usually undefined, but can be overriden by ABI authors.
                 // See the doc comment on `Dwarf.Unwind.VirtualMachine.RegisterRule.default`.
-                if (builtin.cpu.arch.isAARCH64() and register >= 19 and register <= 18) {
+                if (builtin.cpu.arch.isAARCH64() and register >= 19 and register <= 28) {
                     // Callee-saved registers are initialized as if they had the .same_value rule
                     const src = try context.cpu_context.dwarfRegisterBytes(register);
                     if (src.len != out.len) return error.RegisterSizeMismatch;
@@ -310,7 +312,7 @@ pub const DwarfUnwindContext = struct {
         unwind: *const Dwarf.Unwind,
         load_offset: usize,
         explicit_fde_offset: ?usize,
-    ) Error!usize {
+    ) Error!void {
         return unwindFrameInner(context, gpa, unwind, load_offset, explicit_fde_offset) catch |err| switch (err) {
             error.InvalidDebugInfo, error.MissingDebugInfo, error.OutOfMemory => |e| return e,
 
@@ -358,9 +360,10 @@ pub const DwarfUnwindContext = struct {
         unwind: *const Dwarf.Unwind,
         load_offset: usize,
         explicit_fde_offset: ?usize,
-    ) !usize {
-        if (!supports_unwinding) return error.UnsupportedCpuArchitecture;
-        if (context.pc == 0) return 0;
+    ) !void {
+        comptime assert(supports_unwinding);
+
+        if (context.pc == 0) return;
 
         const pc_vaddr = context.pc - load_offset;
 
@@ -430,12 +433,12 @@ pub const DwarfUnwindContext = struct {
             }
         }
 
-        const return_address: u64 = if (has_return_address) pc: {
+        const return_address: usize = if (has_return_address) pc: {
             const raw_ptr = try regNative(&new_cpu_context, cie.return_address_register);
             break :pc stripInstructionPtrAuthCode(raw_ptr.*);
         } else 0;
 
-        (try regNative(new_cpu_context, ip_reg_num)).* = return_address;
+        (try regNative(&new_cpu_context, ip_reg_num)).* = return_address;
 
         // The new CPU context is complete; flush changes.
         context.cpu_context = new_cpu_context;
@@ -444,11 +447,9 @@ pub const DwarfUnwindContext = struct {
         // *after* the call, it could (in the case of noreturn functions) actually point outside of
         // the caller's address range, meaning an FDE lookup would fail. We can handle this by
         // subtracting 1 from `return_address` so that the next lookup is guaranteed to land inside
-        // the `call` instruction`. The exception to this rule is signal frames, where the return
+        // the `call` instruction. The exception to this rule is signal frames, where the return
         // address is the same instruction that triggered the handler.
         context.pc = if (cie.is_signal_frame) return_address else return_address -| 1;
-
-        return return_address;
     }
     /// Since register rules are applied (usually) during a panic,
     /// checked addition / subtraction is used so that we can return
@@ -459,25 +460,6 @@ pub const DwarfUnwindContext = struct {
         else
             try std.math.sub(usize, base, @as(usize, @intCast(-offset)));
     }
-    /// Some platforms use pointer authentication - the upper bits of instruction pointers contain a signature.
-    /// This function clears these signature bits to make the pointer usable.
-    pub inline fn stripInstructionPtrAuthCode(ptr: usize) usize {
-        if (native_arch.isAARCH64()) {
-            // `hint 0x07` maps to `xpaclri` (or `nop` if the hardware doesn't support it)
-            // The save / restore is because `xpaclri` operates on x30 (LR)
-            return asm (
-                \\mov x16, x30
-                \\mov x30, x15
-                \\hint 0x07
-                \\mov x15, x30
-                \\mov x30, x16
-                : [ret] "={x15}" (-> usize),
-                : [ptr] "{x15}" (ptr),
-                : .{ .x16 = true });
-        }
-
-        return ptr;
-    }
 
     pub fn regNative(ctx: *CpuContext, num: u16) error{
         InvalidRegister,
diff --git a/lib/std/debug/SelfInfo/DarwinModule.zig b/lib/std/debug/SelfInfo/DarwinModule.zig
index fc2f1c89bb..e3cbeb7edd 100644
--- a/lib/std/debug/SelfInfo/DarwinModule.zig
+++ b/lib/std/debug/SelfInfo/DarwinModule.zig
@@ -1,6 +1,5 @@
 /// The runtime address where __TEXT is loaded.
 text_base: usize,
-load_offset: usize,
 name: []const u8,
 
 pub fn key(m: *const DarwinModule) usize {
@@ -12,38 +11,14 @@ pub const LookupCache = void;
 pub fn lookup(cache: *LookupCache, gpa: Allocator, address: usize) Error!DarwinModule {
     _ = cache;
     _ = gpa;
-    const image_count = std.c._dyld_image_count();
-    for (0..image_count) |image_idx| {
-        const header = std.c._dyld_get_image_header(@intCast(image_idx)) orelse continue;
-        const text_base = @intFromPtr(header);
-        if (address < text_base) continue;
-        const load_offset = std.c._dyld_get_image_vmaddr_slide(@intCast(image_idx));
-
-        // Find the __TEXT segment
-        var it: macho.LoadCommandIterator = .{
-            .ncmds = header.ncmds,
-            .buffer = @as([*]u8, @ptrCast(header))[@sizeOf(macho.mach_header_64)..][0..header.sizeofcmds],
-        };
-        const text_segment_cmd = while (it.next()) |load_cmd| {
-            if (load_cmd.cmd() != .SEGMENT_64) continue;
-            const segment_cmd = load_cmd.cast(macho.segment_command_64).?;
-            if (!mem.eql(u8, segment_cmd.segName(), "__TEXT")) continue;
-            break segment_cmd;
-        } else continue;
-
-        const seg_start = load_offset + text_segment_cmd.vmaddr;
-        assert(seg_start == text_base);
-        const seg_end = seg_start + text_segment_cmd.vmsize;
-        if (address < seg_start or address >= seg_end) continue;
-
-        // We've found the matching __TEXT segment. This is the image we need.
-        return .{
-            .text_base = text_base,
-            .load_offset = load_offset,
-            .name = mem.span(std.c._dyld_get_image_name(@intCast(image_idx))),
-        };
+    var info: std.c.dl_info = undefined;
+    switch (std.c.dladdr(@ptrFromInt(address), &info)) {
+        0 => return error.MissingDebugInfo,
+        else => return .{
+            .name = std.mem.span(info.fname),
+            .text_base = @intFromPtr(info.fbase),
+        },
     }
-    return error.MissingDebugInfo;
 }
 fn loadUnwindInfo(module: *const DarwinModule) DebugInfo.Unwind {
     const header: *std.macho.mach_header = @ptrFromInt(module.text_base);
@@ -52,56 +27,115 @@ fn loadUnwindInfo(module: *const DarwinModule) DebugInfo.Unwind {
         .ncmds = header.ncmds,
         .buffer = @as([*]u8, @ptrCast(header))[@sizeOf(macho.mach_header_64)..][0..header.sizeofcmds],
     };
-    const sections = while (it.next()) |load_cmd| {
+    const sections, const text_vmaddr = while (it.next()) |load_cmd| {
         if (load_cmd.cmd() != .SEGMENT_64) continue;
         const segment_cmd = load_cmd.cast(macho.segment_command_64).?;
         if (!mem.eql(u8, segment_cmd.segName(), "__TEXT")) continue;
-        break load_cmd.getSections();
+        break .{ load_cmd.getSections(), segment_cmd.vmaddr };
     } else unreachable;
 
+    const vmaddr_slide = module.text_base - text_vmaddr;
+
     var unwind_info: ?[]const u8 = null;
     var eh_frame: ?[]const u8 = null;
     for (sections) |sect| {
         if (mem.eql(u8, sect.sectName(), "__unwind_info")) {
-            const sect_ptr: [*]u8 = @ptrFromInt(@as(usize, @intCast(module.load_offset + sect.addr)));
+            const sect_ptr: [*]u8 = @ptrFromInt(@as(usize, @intCast(vmaddr_slide + sect.addr)));
             unwind_info = sect_ptr[0..@intCast(sect.size)];
         } else if (mem.eql(u8, sect.sectName(), "__eh_frame")) {
-            const sect_ptr: [*]u8 = @ptrFromInt(@as(usize, @intCast(module.load_offset + sect.addr)));
+            const sect_ptr: [*]u8 = @ptrFromInt(@as(usize, @intCast(vmaddr_slide + sect.addr)));
             eh_frame = sect_ptr[0..@intCast(sect.size)];
         }
     }
     return .{
+        .vmaddr_slide = vmaddr_slide,
         .unwind_info = unwind_info,
         .eh_frame = eh_frame,
     };
 }
 fn loadMachO(module: *const DarwinModule, gpa: Allocator) !DebugInfo.LoadedMachO {
-    const mapped_mem = try mapDebugInfoFile(module.name);
-    errdefer posix.munmap(mapped_mem);
+    const all_mapped_memory = try mapDebugInfoFile(module.name);
+    errdefer posix.munmap(all_mapped_memory);
+
+    // In most cases, the file we just mapped is a Mach-O binary. However, it could be a "universal
+    // binary": a simple file format which contains Mach-O binaries for multiple targets. For
+    // instance, `/usr/lib/dyld` is currently distributed as a universal binary containing images
+    // for both ARM64 Macs and x86_64 Macs.
+    if (all_mapped_memory.len < 4) return error.InvalidDebugInfo;
+    const magic = @as(*const u32, @ptrCast(all_mapped_memory.ptr)).*;
+    // The contents of a Mach-O file, which may or may not be the whole of `all_mapped_memory`.
+    const mapped_macho = switch (magic) {
+        macho.MH_MAGIC_64 => all_mapped_memory,
+
+        macho.FAT_CIGAM => mapped_macho: {
+            // This is the universal binary format (aka a "fat binary"). Annoyingly, the whole thing
+            // is big-endian, so we'll be swapping some bytes.
+            if (all_mapped_memory.len < @sizeOf(macho.fat_header)) return error.InvalidDebugInfo;
+            const hdr: *const macho.fat_header = @ptrCast(all_mapped_memory.ptr);
+            const archs_ptr: [*]const macho.fat_arch = @ptrCast(all_mapped_memory.ptr + @sizeOf(macho.fat_header));
+            const archs: []const macho.fat_arch = archs_ptr[0..@byteSwap(hdr.nfat_arch)];
+            const native_cpu_type = switch (builtin.cpu.arch) {
+                .x86_64 => macho.CPU_TYPE_X86_64,
+                .aarch64 => macho.CPU_TYPE_ARM64,
+                else => comptime unreachable,
+            };
+            for (archs) |*arch| {
+                if (@byteSwap(arch.cputype) != native_cpu_type) continue;
+                const offset = @byteSwap(arch.offset);
+                const size = @byteSwap(arch.size);
+                break :mapped_macho all_mapped_memory[offset..][0..size];
+            }
+            // Our native architecture was not present in the fat binary.
+            return error.MissingDebugInfo;
+        },
+
+        // Even on modern 64-bit targets, this format doesn't seem to be too extensively used. It
+        // will be fairly easy to add support here if necessary; it's very similar to above.
+        macho.FAT_CIGAM_64 => return error.UnsupportedDebugInfo,
 
-    const hdr: *const macho.mach_header_64 = @ptrCast(@alignCast(mapped_mem.ptr));
+        else => return error.InvalidDebugInfo,
+    };
+
+    const hdr: *const macho.mach_header_64 = @ptrCast(@alignCast(mapped_macho.ptr));
     if (hdr.magic != macho.MH_MAGIC_64)
         return error.InvalidDebugInfo;
 
-    const symtab: macho.symtab_command = symtab: {
+    const symtab: macho.symtab_command, const text_vmaddr: u64 = lc_iter: {
         var it: macho.LoadCommandIterator = .{
             .ncmds = hdr.ncmds,
-            .buffer = mapped_mem[@sizeOf(macho.mach_header_64)..][0..hdr.sizeofcmds],
+            .buffer = mapped_macho[@sizeOf(macho.mach_header_64)..][0..hdr.sizeofcmds],
         };
+        var symtab: ?macho.symtab_command = null;
+        var text_vmaddr: ?u64 = null;
         while (it.next()) |cmd| switch (cmd.cmd()) {
-            .SYMTAB => break :symtab cmd.cast(macho.symtab_command) orelse return error.InvalidDebugInfo,
+            .SYMTAB => symtab = cmd.cast(macho.symtab_command) orelse return error.InvalidDebugInfo,
+            .SEGMENT_64 => if (cmd.cast(macho.segment_command_64)) |seg_cmd| {
+                if (!mem.eql(u8, seg_cmd.segName(), "__TEXT")) continue;
+                text_vmaddr = seg_cmd.vmaddr;
+            },
             else => {},
         };
-        return error.MissingDebugInfo;
+        break :lc_iter .{
+            symtab orelse return error.MissingDebugInfo,
+            text_vmaddr orelse return error.MissingDebugInfo,
+        };
     };
 
-    const syms_ptr: [*]align(1) const macho.nlist_64 = @ptrCast(mapped_mem[symtab.symoff..]);
+    const syms_ptr: [*]align(1) const macho.nlist_64 = @ptrCast(mapped_macho[symtab.symoff..]);
     const syms = syms_ptr[0..symtab.nsyms];
-    const strings = mapped_mem[symtab.stroff..][0 .. symtab.strsize - 1 :0];
+    const strings = mapped_macho[symtab.stroff..][0 .. symtab.strsize - 1];
 
     var symbols: std.ArrayList(MachoSymbol) = try .initCapacity(gpa, syms.len);
     defer symbols.deinit(gpa);
 
+    // This map is temporary; it is used only to detect duplicates here. This is
+    // necessary because we prefer to use STAB ("symbolic debugging table") symbols,
+    // but they might not be present, so we track normal symbols too.
+    // Indices match 1-1 with those of `symbols`.
+    var symbol_names: std.StringArrayHashMapUnmanaged(void) = .empty;
+    defer symbol_names.deinit(gpa);
+    try symbol_names.ensureUnusedCapacity(gpa, syms.len);
+
     var ofile: u32 = undefined;
     var last_sym: MachoSymbol = undefined;
     var state: enum {
@@ -115,7 +149,25 @@ fn loadMachO(module: *const DarwinModule, gpa: Allocator) !DebugInfo.LoadedMachO
     } = .init;
 
     for (syms) |*sym| {
-        if (sym.n_type.bits.is_stab == 0) continue;
+        if (sym.n_type.bits.is_stab == 0) {
+            if (sym.n_strx == 0) continue;
+            switch (sym.n_type.bits.type) {
+                .undf, .pbud, .indr, .abs, _ => continue,
+                .sect => {
+                    const name = std.mem.sliceTo(strings[sym.n_strx..], 0);
+                    const gop = symbol_names.getOrPutAssumeCapacity(name);
+                    if (!gop.found_existing) {
+                        assert(gop.index == symbols.items.len);
+                        symbols.appendAssumeCapacity(.{
+                            .strx = sym.n_strx,
+                            .addr = sym.n_value,
+                            .ofile = MachoSymbol.unknown_ofile,
+                        });
+                    }
+                },
+            }
+            continue;
+        }
 
         // TODO handle globals N_GSYM, and statics N_STSYM
         switch (sym.n_type.stab) {
@@ -132,7 +184,6 @@ fn loadMachO(module: *const DarwinModule, gpa: Allocator) !DebugInfo.LoadedMachO
                     last_sym = .{
                         .strx = 0,
                         .addr = sym.n_value,
-                        .size = 0,
                         .ofile = ofile,
                     };
                 },
@@ -145,14 +196,22 @@ fn loadMachO(module: *const DarwinModule, gpa: Allocator) !DebugInfo.LoadedMachO
                 },
                 .fun_strx => {
                     state = .fun_size;
-                    last_sym.size = @intCast(sym.n_value);
                 },
                 else => return error.InvalidDebugInfo,
             },
             .ensym => switch (state) {
                 .fun_size => {
                     state = .ensym;
-                    symbols.appendAssumeCapacity(last_sym);
+                    if (last_sym.strx != 0) {
+                        const name = std.mem.sliceTo(strings[sym.n_strx..], 0);
+                        const gop = symbol_names.getOrPutAssumeCapacity(name);
+                        if (!gop.found_existing) {
+                            assert(gop.index == symbols.items.len);
+                            symbols.appendAssumeCapacity(last_sym);
+                        } else {
+                            symbols.items[gop.index] = last_sym;
+                        }
+                    }
                 },
                 else => return error.InvalidDebugInfo,
             },
@@ -168,9 +227,12 @@ fn loadMachO(module: *const DarwinModule, gpa: Allocator) !DebugInfo.LoadedMachO
     }
 
     switch (state) {
-        .init => return error.MissingDebugInfo,
+        .init => {
+            // Missing STAB symtab entries is still okay, unless there were also no normal symbols.
+            if (symbols.items.len == 0) return error.MissingDebugInfo;
+        },
         .oso_close => {},
-        else => return error.InvalidDebugInfo,
+        else => return error.InvalidDebugInfo, // corrupted STAB entries in symtab
     }
 
     const symbols_slice = try symbols.toOwnedSlice(gpa);
@@ -182,10 +244,11 @@ fn loadMachO(module: *const DarwinModule, gpa: Allocator) !DebugInfo.LoadedMachO
     mem.sort(MachoSymbol, symbols_slice, {}, MachoSymbol.addressLessThan);
 
     return .{
-        .mapped_memory = mapped_mem,
+        .mapped_memory = all_mapped_memory,
         .symbols = symbols_slice,
         .strings = strings,
         .ofiles = .empty,
+        .vaddr_offset = module.text_base - text_vmaddr,
     };
 }
 pub fn getSymbolAtAddress(module: *const DarwinModule, gpa: Allocator, di: *DebugInfo, address: usize) Error!std.debug.Symbol {
@@ -195,7 +258,7 @@ pub fn getSymbolAtAddress(module: *const DarwinModule, gpa: Allocator, di: *Debu
     };
     const loaded_macho = &di.loaded_macho.?;
 
-    const vaddr = address - module.load_offset;
+    const vaddr = address - loaded_macho.vaddr_offset;
     const symbol = MachoSymbol.find(loaded_macho.symbols, vaddr) orelse return .unknown;
 
     // offset of `address` from start of `symbol`
@@ -212,6 +275,11 @@ pub fn getSymbolAtAddress(module: *const DarwinModule, gpa: Allocator, di: *Debu
         .source_location = null,
     };
 
+    if (symbol.ofile == MachoSymbol.unknown_ofile) {
+        // We don't have STAB info, so can't track down the object file; all we can do is the symbol name.
+        return sym_only_result;
+    }
+
     const o_file: *DebugInfo.OFile = of: {
         const gop = try loaded_macho.ofiles.getOrPut(gpa, symbol.ofile);
         if (!gop.found_existing) {
@@ -233,7 +301,7 @@ pub fn getSymbolAtAddress(module: *const DarwinModule, gpa: Allocator, di: *Debu
     const compile_unit = o_file.dwarf.findCompileUnit(native_endian, symbol_ofile_vaddr) catch return sym_only_result;
 
     return .{
-        .name = o_file.dwarf.getSymbolName(symbol_ofile_vaddr) orelse stab_symbol,
+        .name = o_file.dwarf.getSymbolName(symbol_ofile_vaddr + address_symbol_offset) orelse stab_symbol,
         .compile_unit_name = compile_unit.die.getAttrString(
             &o_file.dwarf,
             native_endian,
@@ -256,7 +324,7 @@ pub const UnwindContext = std.debug.SelfInfo.DwarfUnwindContext;
 /// Unwind a frame using MachO compact unwind info (from __unwind_info).
 /// If the compact encoding can't encode a way to unwind a frame, it will
 /// defer unwinding to DWARF, in which case `.eh_frame` will be used if available.
-pub fn unwindFrame(module: *const DarwinModule, gpa: Allocator, di: *DebugInfo, context: *UnwindContext) Error!usize {
+pub fn unwindFrame(module: *const DarwinModule, gpa: Allocator, di: *DebugInfo, context: *UnwindContext) Error!void {
     return unwindFrameInner(module, gpa, di, context) catch |err| switch (err) {
         error.InvalidDebugInfo,
         error.MissingDebugInfo,
@@ -272,7 +340,7 @@ pub fn unwindFrame(module: *const DarwinModule, gpa: Allocator, di: *DebugInfo,
         => return error.InvalidDebugInfo,
     };
 }
-fn unwindFrameInner(module: *const DarwinModule, gpa: Allocator, di: *DebugInfo, context: *UnwindContext) !usize {
+fn unwindFrameInner(module: *const DarwinModule, gpa: Allocator, di: *DebugInfo, context: *UnwindContext) !void {
     if (di.unwind == null) di.unwind = module.loadUnwindInfo();
     const unwind = &di.unwind.?;
 
@@ -500,11 +568,11 @@ fn unwindFrameInner(module: *const DarwinModule, gpa: Allocator, di: *DebugInfo,
             },
             .DWARF => {
                 const eh_frame = unwind.eh_frame orelse return error.MissingDebugInfo;
-                const eh_frame_vaddr = @intFromPtr(eh_frame.ptr) - module.load_offset;
+                const eh_frame_vaddr = @intFromPtr(eh_frame.ptr) - unwind.vmaddr_slide;
                 return context.unwindFrame(
                     gpa,
                     &.initSection(.eh_frame, eh_frame_vaddr, eh_frame),
-                    module.load_offset,
+                    unwind.vmaddr_slide,
                     @intCast(encoding.value.x86_64.dwarf),
                 );
             },
@@ -520,11 +588,11 @@ fn unwindFrameInner(module: *const DarwinModule, gpa: Allocator, di: *DebugInfo,
             },
             .DWARF => {
                 const eh_frame = unwind.eh_frame orelse return error.MissingDebugInfo;
-                const eh_frame_vaddr = @intFromPtr(eh_frame.ptr) - module.load_offset;
+                const eh_frame_vaddr = @intFromPtr(eh_frame.ptr) - unwind.vmaddr_slide;
                 return context.unwindFrame(
                     gpa,
                     &.initSection(.eh_frame, eh_frame_vaddr, eh_frame),
-                    module.load_offset,
+                    unwind.vmaddr_slide,
                     @intCast(encoding.value.x86_64.dwarf),
                 );
             },
@@ -572,9 +640,7 @@ fn unwindFrameInner(module: *const DarwinModule, gpa: Allocator, di: *DebugInfo,
         else => comptime unreachable, // unimplemented
     };
 
-    context.pc = UnwindContext.stripInstructionPtrAuthCode(new_ip);
-    if (context.pc > 0) context.pc -= 1;
-    return new_ip;
+    context.pc = std.debug.stripInstructionPtrAuthCode(new_ip) -| 1;
 }
 pub const DebugInfo = struct {
     unwind: ?Unwind,
@@ -590,6 +656,7 @@ pub const DebugInfo = struct {
             for (loaded_macho.ofiles.values()) |*ofile| {
                 ofile.dwarf.deinit(gpa);
                 ofile.symbols_by_name.deinit(gpa);
+                posix.munmap(ofile.mapped_memory);
             }
             loaded_macho.ofiles.deinit(gpa);
             gpa.free(loaded_macho.symbols);
@@ -598,6 +665,9 @@ pub const DebugInfo = struct {
     }
 
     const Unwind = struct {
+        /// The slide applied to the following sections. So, `unwind_info.ptr` is this many bytes
+        /// higher than the vmaddr of `__unwind_info`, and likewise for `__eh_frame`.
+        vmaddr_slide: u64,
         // Backed by the in-memory sections mapped by the loader
         unwind_info: ?[]const u8,
         eh_frame: ?[]const u8,
@@ -606,21 +676,31 @@ pub const DebugInfo = struct {
     const LoadedMachO = struct {
         mapped_memory: []align(std.heap.page_size_min) const u8,
         symbols: []const MachoSymbol,
-        strings: [:0]const u8,
+        strings: []const u8,
         /// Key is index into `strings` of the file path.
         ofiles: std.AutoArrayHashMapUnmanaged(u32, OFile),
+        /// This is not necessarily the same as the vmaddr_slide that dyld would report. This is
+        /// because the segments in the file on disk might differ from the ones in memory. Normally
+        /// we wouldn't necessarily expect that to work, but /usr/lib/dyld is incredibly annoying:
+        /// it exists on disk (necessarily, because the kernel needs to load it!), but is also in
+        /// the dyld cache (dyld actually restart itself from cache after loading it), and the two
+        /// versions have (very) different segment base addresses. It's sort of like a large slide
+        /// has been applied to all addresses in memory. For an optimal experience, we consider the
+        /// on-disk vmaddr instead of the in-memory one.
+        vaddr_offset: usize,
     };
 
     const OFile = struct {
+        mapped_memory: []align(std.heap.page_size_min) const u8,
         dwarf: Dwarf,
-        strtab: [:0]const u8,
+        strtab: []const u8,
         symtab: []align(1) const macho.nlist_64,
         /// All named symbols in `symtab`. Stored `u32` key is the index into `symtab`. Accessed
         /// through `SymbolAdapter`, so that the symbol name is used as the logical key.
         symbols_by_name: std.ArrayHashMapUnmanaged(u32, void, void, true),
 
         const SymbolAdapter = struct {
-            strtab: [:0]const u8,
+            strtab: []const u8,
             symtab: []align(1) const macho.nlist_64,
             pub fn hash(ctx: SymbolAdapter, sym_name: []const u8) u32 {
                 _ = ctx;
@@ -663,7 +743,7 @@ pub const DebugInfo = struct {
 
         if (mapped_mem.len < symtab_cmd.stroff + symtab_cmd.strsize) return error.InvalidDebugInfo;
         if (mapped_mem[symtab_cmd.stroff + symtab_cmd.strsize - 1] != 0) return error.InvalidDebugInfo;
-        const strtab = mapped_mem[symtab_cmd.stroff..][0 .. symtab_cmd.strsize - 1 :0];
+        const strtab = mapped_mem[symtab_cmd.stroff..][0 .. symtab_cmd.strsize - 1];
 
         const n_sym_bytes = symtab_cmd.nsyms * @sizeOf(macho.nlist_64);
         if (mapped_mem.len < symtab_cmd.symoff + n_sym_bytes) return error.InvalidDebugInfo;
@@ -717,6 +797,7 @@ pub const DebugInfo = struct {
         try dwarf.open(gpa, native_endian);
 
         return .{
+            .mapped_memory = mapped_mem,
             .dwarf = dwarf,
             .strtab = strtab,
             .symtab = symtab,
@@ -728,8 +809,9 @@ pub const DebugInfo = struct {
 const MachoSymbol = struct {
     strx: u32,
     addr: u64,
-    size: u32,
+    /// Value may be `unknown_ofile`.
     ofile: u32,
+    const unknown_ofile = std.math.maxInt(u32);
     fn addressLessThan(context: void, lhs: MachoSymbol, rhs: MachoSymbol) bool {
         _ = context;
         return lhs.addr < rhs.addr;
@@ -754,9 +836,9 @@ const MachoSymbol = struct {
 
     test find {
         const symbols: []const MachoSymbol = &.{
-            .{ .addr = 100, .strx = undefined, .size = undefined, .ofile = undefined },
-            .{ .addr = 200, .strx = undefined, .size = undefined, .ofile = undefined },
-            .{ .addr = 300, .strx = undefined, .size = undefined, .ofile = undefined },
+            .{ .addr = 100, .strx = undefined, .ofile = undefined },
+            .{ .addr = 200, .strx = undefined, .ofile = undefined },
+            .{ .addr = 300, .strx = undefined, .ofile = undefined },
         };
 
         try testing.expectEqual(null, find(symbols, 0));
diff --git a/lib/std/debug/SelfInfo/ElfModule.zig b/lib/std/debug/SelfInfo/ElfModule.zig
index fde61d8140..e080665497 100644
--- a/lib/std/debug/SelfInfo/ElfModule.zig
+++ b/lib/std/debug/SelfInfo/ElfModule.zig
@@ -230,7 +230,7 @@ fn loadUnwindInfo(module: *const ElfModule, gpa: Allocator, di: *DebugInfo) Erro
         else => unreachable,
     }
 }
-pub fn unwindFrame(module: *const ElfModule, gpa: Allocator, di: *DebugInfo, context: *UnwindContext) Error!usize {
+pub fn unwindFrame(module: *const ElfModule, gpa: Allocator, di: *DebugInfo, context: *UnwindContext) Error!void {
     if (di.unwind[0] == null) try module.loadUnwindInfo(gpa, di);
     std.debug.assert(di.unwind[0] != null);
     for (&di.unwind) |*opt_unwind| {
diff --git a/lib/std/debug/SelfInfo/WindowsModule.zig b/lib/std/debug/SelfInfo/WindowsModule.zig
index 8c88bd8b2f..75abc39ff5 100644
--- a/lib/std/debug/SelfInfo/WindowsModule.zig
+++ b/lib/std/debug/SelfInfo/WindowsModule.zig
@@ -332,6 +332,34 @@ pub const UnwindContext = struct {
                     .Wcr = @splat(0),
                     .Wvr = @splat(0),
                 },
+                .thumb => .{
+                    .ContextFlags = 0,
+                    .R0 = ctx.r[0],
+                    .R1 = ctx.r[1],
+                    .R2 = ctx.r[2],
+                    .R3 = ctx.r[3],
+                    .R4 = ctx.r[4],
+                    .R5 = ctx.r[5],
+                    .R6 = ctx.r[6],
+                    .R7 = ctx.r[7],
+                    .R8 = ctx.r[8],
+                    .R9 = ctx.r[9],
+                    .R10 = ctx.r[10],
+                    .R11 = ctx.r[11],
+                    .R12 = ctx.r[12],
+                    .Sp = ctx.r[13],
+                    .Lr = ctx.r[14],
+                    .Pc = ctx.r[15],
+                    .Cpsr = 0,
+                    .Fpcsr = 0,
+                    .Padding = 0,
+                    .DUMMYUNIONNAME = .{ .S = @splat(0) },
+                    .Bvr = @splat(0),
+                    .Bcr = @splat(0),
+                    .Wvr = @splat(0),
+                    .Wcr = @splat(0),
+                    .Padding2 = @splat(0),
+                },
                 else => comptime unreachable,
             },
             .history_table = std.mem.zeroes(windows.UNWIND_HISTORY_TABLE),
@@ -345,7 +373,7 @@ pub const UnwindContext = struct {
         return ctx.cur.getRegs().bp;
     }
 };
-pub fn unwindFrame(module: *const WindowsModule, gpa: Allocator, di: *DebugInfo, context: *UnwindContext) !usize {
+pub fn unwindFrame(module: *const WindowsModule, gpa: Allocator, di: *DebugInfo, context: *UnwindContext) !void {
     _ = module;
     _ = gpa;
     _ = di;
@@ -374,10 +402,10 @@ pub fn unwindFrame(module: *const WindowsModule, gpa: Allocator, di: *DebugInfo,
     const next_regs = context.cur.getRegs();
     const tib = &windows.teb().NtTib;
     if (next_regs.sp < @intFromPtr(tib.StackLimit) or next_regs.sp > @intFromPtr(tib.StackBase)) {
-        return 0;
+        context.pc = 0;
+    } else {
+        context.pc = next_regs.ip -| 1;
     }
-    context.pc = next_regs.ip -| 1;
-    return next_regs.ip;
 }
 
 const WindowsModule = @This();
diff --git a/lib/std/debug/cpu_context.zig b/lib/std/debug/cpu_context.zig
index 9859575fa3..b9dd49767f 100644
--- a/lib/std/debug/cpu_context.zig
+++ b/lib/std/debug/cpu_context.zig
@@ -214,6 +214,12 @@ pub fn fromWindowsContext(ctx: *const std.os.windows.CONTEXT) Native {
             .sp = ctx.Sp,
             .pc = ctx.Pc,
         },
+        .thumb => .{ .r = .{
+            ctx.R0,  ctx.R1, ctx.R2,  ctx.R3,
+            ctx.R4,  ctx.R5, ctx.R6,  ctx.R7,
+            ctx.R8,  ctx.R9, ctx.R10, ctx.R11,
+            ctx.R12, ctx.Sp, ctx.Lr,  ctx.Pc,
+        } },
         else => comptime unreachable,
     };
 }
-- 
cgit v1.2.3


From 084e92879a1732374fac5f1a05a27f42b9306d22 Mon Sep 17 00:00:00 2001
From: mlugg <mlugg@mlugg.co.uk>
Date: Thu, 18 Sep 2025 15:52:02 +0100
Subject: std: don't get CPU context when using CBE targeting MSVC

Calling `current` here causes compilation failures as the C backend
currently does not emit valid MSVC inline assembly. This change means
that when building for MSVC with the self-hosted C backend, only FP
unwinding can be used.
---
 lib/std/debug.zig             | 8 +++++++-
 lib/std/debug/cpu_context.zig | 4 ++--
 2 files changed, 9 insertions(+), 3 deletions(-)

(limited to 'lib/std/debug/cpu_context.zig')

diff --git a/lib/std/debug.zig b/lib/std/debug.zig
index 23d134f84c..3d8bc565e7 100644
--- a/lib/std/debug.zig
+++ b/lib/std/debug.zig
@@ -756,7 +756,13 @@ const StackIterator = union(enum) {
             // Use `di_first` here so we report the PC in the context before unwinding any further.
             return .{ .di_first = .init(context_ptr) };
         }
-        if (SelfInfo.supports_unwinding and cpu_context.Native != noreturn) {
+        // Workaround the C backend being unable to use inline assembly on MSVC by disabling the
+        // call to `current`. This effectively constrains stack trace collection and dumping to FP
+        // unwinding when building with CBE for MSVC.
+        if (!(builtin.zig_backend == .stage2_c and builtin.target.abi == .msvc) and
+            SelfInfo.supports_unwinding and
+            cpu_context.Native != noreturn)
+        {
             // We don't need `di_first` here, because our PC is in `std.debug`; we're only interested
             // in our caller's frame and above.
             return .{ .di = .init(&.current()) };
diff --git a/lib/std/debug/cpu_context.zig b/lib/std/debug/cpu_context.zig
index b9dd49767f..fdf6ebd243 100644
--- a/lib/std/debug/cpu_context.zig
+++ b/lib/std/debug/cpu_context.zig
@@ -316,7 +316,7 @@ pub const X86_64 = struct {
             \\movq %%r15, 0x78(%%rdi)
             \\leaq (%%rip), %%rax
             \\movq %%rax, 0x80(%%rdi)
-            \\movq 0x00(%%rdi), %%rax  // restore saved rax
+            \\movq 0x00(%%rdi), %%rax
             :
             : [gprs] "{rdi}" (&ctx.gprs.values),
             : .{ .memory = true });
@@ -431,7 +431,7 @@ pub const Aarch64 = extern struct {
             \\str x1, [x0, #0x0f8]
             \\adr x1, .
             \\str x1, [x0, #0x100]
-            \\ldr x1, [x0, #0x008] // restore saved x1
+            \\ldr x1, [x0, #0x008]
             :
             : [gprs] "{x0}" (&ctx),
             : .{ .memory = true });
-- 
cgit v1.2.3


From f7e0ff8a5fb3e8426e8f64bba271eae358d123b4 Mon Sep 17 00:00:00 2001
From: mlugg <mlugg@mlugg.co.uk>
Date: Sat, 20 Sep 2025 15:16:42 +0100
Subject: std: clarify cpu_context register order rationale

---
 lib/std/debug/cpu_context.zig | 9 ++++++---
 1 file changed, 6 insertions(+), 3 deletions(-)

(limited to 'lib/std/debug/cpu_context.zig')

diff --git a/lib/std/debug/cpu_context.zig b/lib/std/debug/cpu_context.zig
index fdf6ebd243..6499de21b1 100644
--- a/lib/std/debug/cpu_context.zig
+++ b/lib/std/debug/cpu_context.zig
@@ -225,8 +225,9 @@ pub fn fromWindowsContext(ctx: *const std.os.windows.CONTEXT) Native {
 }
 
 pub const X86 = struct {
-    /// The first 8 registers here intentionally match the order of registers pushed
-    /// by PUSHA, which is also the order used by the DWARF register mappings.
+    /// The first 8 registers here intentionally match the order of registers in the x86 instruction
+    /// encoding. This order is inherited by the PUSHA instruction and the DWARF register mappings,
+    /// among other things.
     pub const Gpr = enum {
         // zig fmt: off
         eax, ecx, edx, ebx,
@@ -283,7 +284,9 @@ pub const X86 = struct {
 };
 
 pub const X86_64 = struct {
-    /// MLUGG TODO: explain this order. why does DWARF have this?
+    /// The order here intentionally matches the order of the DWARF register mappings. It's unclear
+    /// where those mappings actually originated from---the ordering of the first 4 registers seems
+    /// quite unusual---but it is currently convenient for us to match DWARF.
     pub const Gpr = enum {
         // zig fmt: off
         rax, rdx, rcx, rbx,
-- 
cgit v1.2.3


From a90eb50c8034134d9f22aeffb4ea11e83b056cc7 Mon Sep 17 00:00:00 2001
From: mlugg <mlugg@mlugg.co.uk>
Date: Sat, 27 Sep 2025 11:30:35 +0100
Subject: typo

---
 lib/std/debug/cpu_context.zig | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

(limited to 'lib/std/debug/cpu_context.zig')

diff --git a/lib/std/debug/cpu_context.zig b/lib/std/debug/cpu_context.zig
index 6499de21b1..1089e74aa6 100644
--- a/lib/std/debug/cpu_context.zig
+++ b/lib/std/debug/cpu_context.zig
@@ -146,7 +146,7 @@ pub fn fromPosixSignalContext(ctx_ptr: ?*const anyopaque) ?Native {
                 .pc = uc.mcontext.ss.pc,
             },
             .netbsd => .{
-                .x = uc.mcontext.gregs[0..31],
+                .x = uc.mcontext.gregs[0..31].*,
                 .sp = uc.mcontext.gregs[31],
                 .pc = uc.mcontext.gregs[32],
             },
-- 
cgit v1.2.3