From 4c3625d74546e22e1bd4695cc7bdde09f645bf30 Mon Sep 17 00:00:00 2001 From: Jakub Konka Date: Thu, 13 Jul 2023 14:33:33 +0200 Subject: check-object: dump ELF header --- lib/std/Build/Step/CheckObject.zig | 35 ++++++++++++++++++++++++++++++++++- 1 file changed, 34 insertions(+), 1 deletion(-) (limited to 'lib/std/Build/Step/CheckObject.zig') diff --git a/lib/std/Build/Step/CheckObject.zig b/lib/std/Build/Step/CheckObject.zig index 171734c450..d53352af80 100644 --- a/lib/std/Build/Step/CheckObject.zig +++ b/lib/std/Build/Step/CheckObject.zig @@ -1,5 +1,6 @@ const std = @import("std"); const assert = std.debug.assert; +const elf = std.elf; const fs = std.fs; const macho = std.macho; const math = std.math; @@ -338,7 +339,9 @@ fn make(step: *Step, prog_node: *std.Progress.Node) !void { .macho => try MachODumper.parseAndDump(step, contents, .{ .dump_symtab = self.dump_symtab, }), - .elf => @panic("TODO elf parser"), + .elf => try ElfDumper.parseAndDump(step, contents, .{ + .dump_symtab = self.dump_symtab, + }), .coff => @panic("TODO coff parser"), .wasm => try WasmDumper.parseAndDump(step, contents, .{ .dump_symtab = self.dump_symtab, @@ -695,6 +698,36 @@ const MachODumper = struct { } }; +const ElfDumper = struct { + const symtab_label = "symtab"; + + fn parseAndDump(step: *Step, bytes: []const u8, opts: Opts) ![]const u8 { + _ = opts; + + const gpa = step.owner.allocator; + var stream = std.io.fixedBufferStream(bytes); + const reader = stream.reader(); + + const hdr = try reader.readStruct(elf.Elf64_Ehdr); + if (!mem.eql(u8, hdr.e_ident[0..4], "\x7fELF")) { + return error.InvalidMagicNumber; + } + + var output = std.ArrayList(u8).init(gpa); + const writer = output.writer(); + + try dumpHeader(hdr, writer); + + return output.toOwnedSlice(); + } + + fn dumpHeader(hdr: elf.Elf64_Ehdr, writer: anytype) !void { + try writer.writeAll("header\n"); + try writer.print("type {s}\n", .{@tagName(hdr.e_type)}); + try writer.print("entry {x}\n", .{hdr.e_entry}); + } +}; + const WasmDumper = struct { const symtab_label = "symbols"; -- cgit v1.2.3 From 76dc0d516089da6cd7dfb5ee1634c7e4ccef6a4a Mon Sep 17 00:00:00 2001 From: Jakub Konka Date: Thu, 13 Jul 2023 17:01:26 +0200 Subject: check-object: dump some info on SHDRs --- lib/std/Build/Step/CheckObject.zig | 143 +++++++++++++++++++++++++++++++++++-- 1 file changed, 137 insertions(+), 6 deletions(-) (limited to 'lib/std/Build/Step/CheckObject.zig') diff --git a/lib/std/Build/Step/CheckObject.zig b/lib/std/Build/Step/CheckObject.zig index d53352af80..418aa9f681 100644 --- a/lib/std/Build/Step/CheckObject.zig +++ b/lib/std/Build/Step/CheckObject.zig @@ -701,9 +701,34 @@ const MachODumper = struct { const ElfDumper = struct { const symtab_label = "symtab"; - fn parseAndDump(step: *Step, bytes: []const u8, opts: Opts) ![]const u8 { - _ = opts; + const Symtab = struct { + symbols: []align(1) const elf.Elf64_Sym, + strings: []const u8, + + fn get(st: Symtab, index: usize) ?elf.Elf64_Sym { + if (index >= st.symbols.len) return null; + return st.symbols[index]; + } + + fn getName(st: Symtab, index: usize) ?[]const u8 { + const sym = st.get(index) orelse return null; + assert(sym.st_name < st.strings.len); + return mem.sliceTo(@ptrCast(st.strings.ptr + sym.st_name), 0); + } + }; + const Context = struct { + gpa: Allocator, + data: []const u8, + hdr: elf.Elf64_Ehdr, + shdrs: []align(1) const elf.Elf64_Shdr, + phdrs: []align(1) const elf.Elf64_Phdr, + shstrtab: []const u8, + symtab: ?Symtab = null, + dysymtab: ?Symtab = null, + }; + + fn parseAndDump(step: *Step, bytes: []const u8, opts: Opts) ![]const u8 { const gpa = step.owner.allocator; var stream = std.io.fixedBufferStream(bytes); const reader = stream.reader(); @@ -713,18 +738,124 @@ const ElfDumper = struct { return error.InvalidMagicNumber; } + const shdrs = @as([*]align(1) const elf.Elf64_Shdr, @ptrCast(bytes.ptr + hdr.e_shoff))[0..hdr.e_shnum]; + const phdrs = @as([*]align(1) const elf.Elf64_Phdr, @ptrCast(bytes.ptr + hdr.e_phoff))[0..hdr.e_phnum]; + + var ctx = Context{ + .gpa = gpa, + .data = bytes, + .hdr = hdr, + .shdrs = shdrs, + .phdrs = phdrs, + .shstrtab = undefined, + }; + ctx.shstrtab = getSectionContents(ctx, ctx.hdr.e_shstrndx); + + if (opts.dump_symtab) { + for (ctx.shdrs, 0..) |shdr, i| switch (shdr.sh_type) { + elf.SHT_SYMTAB, elf.SHT_DYNSYM => { + const raw = getSectionContents(ctx, i); + const nsyms = @divExact(raw.len, @sizeOf(elf.Elf64_Sym)); + const symbols = @as([*]align(1) const elf.Elf64_Sym, @ptrCast(raw.ptr))[0..nsyms]; + const strings = getSectionContents(ctx, shdr.sh_link); + + switch (shdr.sh_type) { + elf.SHT_SYMTAB => { + ctx.symtab = .{ + .symbols = symbols, + .strings = strings, + }; + }, + elf.SHT_DYNSYM => { + ctx.dysymtab = .{ + .symbols = symbols, + .strings = strings, + }; + }, + else => unreachable, + } + }, + + else => {}, + }; + } + var output = std.ArrayList(u8).init(gpa); const writer = output.writer(); - try dumpHeader(hdr, writer); + try dumpHeader(ctx, writer); + try dumpShdrs(ctx, writer); return output.toOwnedSlice(); } - fn dumpHeader(hdr: elf.Elf64_Ehdr, writer: anytype) !void { + fn getSectionName(ctx: Context, shndx: usize) []const u8 { + const shdr = ctx.shdrs[shndx]; + assert(shdr.sh_name < ctx.shstrtab.len); + return mem.sliceTo(@as([*:0]const u8, @ptrCast(ctx.shstrtab.ptr + shdr.sh_name)), 0); + } + + fn getSectionContents(ctx: Context, shndx: usize) []const u8 { + const shdr = ctx.shdrs[shndx]; + assert(shdr.sh_offset < ctx.data.len); + assert(shdr.sh_offset + shdr.sh_size <= ctx.data.len); + return ctx.data[shdr.sh_offset..][0..shdr.sh_size]; + } + + fn dumpHeader(ctx: Context, writer: anytype) !void { try writer.writeAll("header\n"); - try writer.print("type {s}\n", .{@tagName(hdr.e_type)}); - try writer.print("entry {x}\n", .{hdr.e_entry}); + try writer.print("type {s}\n", .{@tagName(ctx.hdr.e_type)}); + try writer.print("entry {x}\n", .{ctx.hdr.e_entry}); + } + + fn dumpShdrs(ctx: Context, writer: anytype) !void { + if (ctx.shdrs.len == 0) return; + + for (ctx.shdrs, 0..) |shdr, shndx| { + try writer.print("shdr {d}\n", .{shndx}); + try writer.print("name {s}\n", .{getSectionName(ctx, shndx)}); + try writer.print("type {s}\n", .{try fmtShType(ctx.gpa, shdr.sh_type)}); + } + } + + fn fmtShType(gpa: Allocator, sh_type: u32) ![]const u8 { + return switch (sh_type) { + elf.SHT_NULL => "NULL", + elf.SHT_PROGBITS => "PROGBITS", + elf.SHT_SYMTAB => "SYMTAB", + elf.SHT_STRTAB => "STRTAB", + elf.SHT_RELA => "RELA", + elf.SHT_HASH => "HASH", + elf.SHT_DYNAMIC => "DYNAMIC", + elf.SHT_NOTE => "NOTE", + elf.SHT_NOBITS => "NOBITS", + elf.SHT_REL => "REL", + elf.SHT_SHLIB => "SHLIB", + elf.SHT_DYNSYM => "DYNSYM", + elf.SHT_INIT_ARRAY => "INIT_ARRAY", + elf.SHT_FINI_ARRAY => "FINI_ARRAY", + elf.SHT_PREINIT_ARRAY => "PREINIT_ARRAY", + elf.SHT_GROUP => "GROUP", + elf.SHT_SYMTAB_SHNDX => "SYMTAB_SHNDX", + elf.SHT_X86_64_UNWIND => "X86_64_UNWIND", + elf.SHT_LLVM_ADDRSIG => "LLVM_ADDRSIG", + elf.SHT_GNU_HASH => "GNU_HASH", + elf.SHT_GNU_VERDEF => "VERDEF", + elf.SHT_GNU_VERNEED => "VERNEED", + elf.SHT_GNU_VERSYM => "VERSYM", + else => |sht| blk: { + if (elf.SHT_LOOS <= sht and sht < elf.SHT_HIOS) { + break :blk try std.fmt.allocPrint(gpa, "LOOS+0x{x}", .{sht - elf.SHT_LOOS}); + } + if (elf.SHT_LOPROC <= sht and sht < elf.SHT_HIPROC) { + break :blk try std.fmt.allocPrint(gpa, "LOPROC+0x{x}", .{sht - elf.SHT_LOPROC}); + } + if (elf.SHT_LOUSER <= sht and sht < elf.SHT_HIUSER) { + break :blk try std.fmt.allocPrint(gpa, "LOUSER+0x{x}", .{sht - elf.SHT_LOUSER}); + } + break :blk "UNKNOWN"; + }, + }; } }; -- cgit v1.2.3 From 33154b511cbf96e0c95e8bad0c5e19ba54371964 Mon Sep 17 00:00:00 2001 From: Jakub Konka Date: Thu, 13 Jul 2023 20:31:19 +0200 Subject: check-object: dump more info on SHDRs --- lib/std/Build/Step/CheckObject.zig | 4 ++++ 1 file changed, 4 insertions(+) (limited to 'lib/std/Build/Step/CheckObject.zig') diff --git a/lib/std/Build/Step/CheckObject.zig b/lib/std/Build/Step/CheckObject.zig index 418aa9f681..2458c15271 100644 --- a/lib/std/Build/Step/CheckObject.zig +++ b/lib/std/Build/Step/CheckObject.zig @@ -815,6 +815,10 @@ const ElfDumper = struct { try writer.print("shdr {d}\n", .{shndx}); try writer.print("name {s}\n", .{getSectionName(ctx, shndx)}); try writer.print("type {s}\n", .{try fmtShType(ctx.gpa, shdr.sh_type)}); + try writer.print("addr {x}\n", .{shdr.sh_addr}); + try writer.print("offset {x}\n", .{shdr.sh_offset}); + try writer.print("size {x}\n", .{shdr.sh_size}); + try writer.print("addralign {x}\n", .{shdr.sh_addralign}); } } -- cgit v1.2.3 From 77026c67a42050cf6c15531d784afbf16c67c23c Mon Sep 17 00:00:00 2001 From: Jakub Konka Date: Thu, 13 Jul 2023 21:27:18 +0200 Subject: check-object: dump info on PHDRs --- lib/std/Build/Step/CheckObject.zig | 141 +++++++++++++++++++++++++++---------- 1 file changed, 102 insertions(+), 39 deletions(-) (limited to 'lib/std/Build/Step/CheckObject.zig') diff --git a/lib/std/Build/Step/CheckObject.zig b/lib/std/Build/Step/CheckObject.zig index 2458c15271..5c24d53722 100644 --- a/lib/std/Build/Step/CheckObject.zig +++ b/lib/std/Build/Step/CheckObject.zig @@ -785,6 +785,7 @@ const ElfDumper = struct { try dumpHeader(ctx, writer); try dumpShdrs(ctx, writer); + try dumpPhdrs(ctx, writer); return output.toOwnedSlice(); } @@ -814,52 +815,114 @@ const ElfDumper = struct { for (ctx.shdrs, 0..) |shdr, shndx| { try writer.print("shdr {d}\n", .{shndx}); try writer.print("name {s}\n", .{getSectionName(ctx, shndx)}); - try writer.print("type {s}\n", .{try fmtShType(ctx.gpa, shdr.sh_type)}); + try writer.print("type {s}\n", .{fmtShType(shdr.sh_type)}); try writer.print("addr {x}\n", .{shdr.sh_addr}); try writer.print("offset {x}\n", .{shdr.sh_offset}); try writer.print("size {x}\n", .{shdr.sh_size}); try writer.print("addralign {x}\n", .{shdr.sh_addralign}); + // TODO dump formatted sh_flags } } - fn fmtShType(gpa: Allocator, sh_type: u32) ![]const u8 { - return switch (sh_type) { - elf.SHT_NULL => "NULL", - elf.SHT_PROGBITS => "PROGBITS", - elf.SHT_SYMTAB => "SYMTAB", - elf.SHT_STRTAB => "STRTAB", - elf.SHT_RELA => "RELA", - elf.SHT_HASH => "HASH", - elf.SHT_DYNAMIC => "DYNAMIC", - elf.SHT_NOTE => "NOTE", - elf.SHT_NOBITS => "NOBITS", - elf.SHT_REL => "REL", - elf.SHT_SHLIB => "SHLIB", - elf.SHT_DYNSYM => "DYNSYM", - elf.SHT_INIT_ARRAY => "INIT_ARRAY", - elf.SHT_FINI_ARRAY => "FINI_ARRAY", - elf.SHT_PREINIT_ARRAY => "PREINIT_ARRAY", - elf.SHT_GROUP => "GROUP", - elf.SHT_SYMTAB_SHNDX => "SYMTAB_SHNDX", - elf.SHT_X86_64_UNWIND => "X86_64_UNWIND", - elf.SHT_LLVM_ADDRSIG => "LLVM_ADDRSIG", - elf.SHT_GNU_HASH => "GNU_HASH", - elf.SHT_GNU_VERDEF => "VERDEF", - elf.SHT_GNU_VERNEED => "VERNEED", - elf.SHT_GNU_VERSYM => "VERSYM", - else => |sht| blk: { - if (elf.SHT_LOOS <= sht and sht < elf.SHT_HIOS) { - break :blk try std.fmt.allocPrint(gpa, "LOOS+0x{x}", .{sht - elf.SHT_LOOS}); - } - if (elf.SHT_LOPROC <= sht and sht < elf.SHT_HIPROC) { - break :blk try std.fmt.allocPrint(gpa, "LOPROC+0x{x}", .{sht - elf.SHT_LOPROC}); - } - if (elf.SHT_LOUSER <= sht and sht < elf.SHT_HIUSER) { - break :blk try std.fmt.allocPrint(gpa, "LOUSER+0x{x}", .{sht - elf.SHT_LOUSER}); - } - break :blk "UNKNOWN"; - }, - }; + fn fmtShType(sh_type: u32) std.fmt.Formatter(formatShType) { + return .{ .data = sh_type }; + } + + fn formatShType( + sh_type: u32, + comptime unused_fmt_string: []const u8, + options: std.fmt.FormatOptions, + writer: anytype, + ) !void { + _ = unused_fmt_string; + _ = options; + if (elf.SHT_LOOS <= sh_type and sh_type < elf.SHT_HIOS) { + try writer.print("LOOS+0x{x}", .{sh_type - elf.SHT_LOOS}); + } else if (elf.SHT_LOPROC <= sh_type and sh_type < elf.SHT_HIPROC) { + try writer.print("LOPROC+0x{x}", .{sh_type - elf.SHT_LOPROC}); + } else if (elf.SHT_LOUSER <= sh_type and sh_type < elf.SHT_HIUSER) { + try writer.print("LOUSER+0x{x}", .{sh_type - elf.SHT_LOUSER}); + } else { + const name = switch (sh_type) { + elf.SHT_NULL => "NULL", + elf.SHT_PROGBITS => "PROGBITS", + elf.SHT_SYMTAB => "SYMTAB", + elf.SHT_STRTAB => "STRTAB", + elf.SHT_RELA => "RELA", + elf.SHT_HASH => "HASH", + elf.SHT_DYNAMIC => "DYNAMIC", + elf.SHT_NOTE => "NOTE", + elf.SHT_NOBITS => "NOBITS", + elf.SHT_REL => "REL", + elf.SHT_SHLIB => "SHLIB", + elf.SHT_DYNSYM => "DYNSYM", + elf.SHT_INIT_ARRAY => "INIT_ARRAY", + elf.SHT_FINI_ARRAY => "FINI_ARRAY", + elf.SHT_PREINIT_ARRAY => "PREINIT_ARRAY", + elf.SHT_GROUP => "GROUP", + elf.SHT_SYMTAB_SHNDX => "SYMTAB_SHNDX", + elf.SHT_X86_64_UNWIND => "X86_64_UNWIND", + elf.SHT_LLVM_ADDRSIG => "LLVM_ADDRSIG", + elf.SHT_GNU_HASH => "GNU_HASH", + elf.SHT_GNU_VERDEF => "VERDEF", + elf.SHT_GNU_VERNEED => "VERNEED", + elf.SHT_GNU_VERSYM => "VERSYM", + else => "UNKNOWN", + }; + try writer.writeAll(name); + } + } + + fn dumpPhdrs(ctx: Context, writer: anytype) !void { + if (ctx.phdrs.len == 0) return; + + for (ctx.phdrs, 0..) |phdr, phndx| { + try writer.print("phdr {d}\n", .{phndx}); + try writer.print("type {s}\n", .{fmtPhType(phdr.p_type)}); + try writer.print("vaddr {x}\n", .{phdr.p_vaddr}); + try writer.print("paddr {x}\n", .{phdr.p_paddr}); + try writer.print("offset {x}\n", .{phdr.p_offset}); + try writer.print("memsz {x}\n", .{phdr.p_memsz}); + try writer.print("filesz {x}\n", .{phdr.p_filesz}); + try writer.print("align {x}\n", .{phdr.p_align}); + // TODO dump formatted p_flags + } + } + + fn fmtPhType(ph_type: u32) std.fmt.Formatter(formatPhType) { + return .{ .data = ph_type }; + } + + fn formatPhType( + ph_type: u32, + comptime unused_fmt_string: []const u8, + options: std.fmt.FormatOptions, + writer: anytype, + ) !void { + _ = unused_fmt_string; + _ = options; + if (elf.PT_LOOS <= ph_type and ph_type < elf.PT_HIOS) { + try writer.print("LOOS+0x{x}", .{ph_type - elf.PT_LOOS}); + } else if (elf.PT_LOPROC <= ph_type and ph_type < elf.PT_HIPROC) { + try writer.print("LOPROC+0x{x}", .{ph_type - elf.PT_LOPROC}); + } else { + const p_type = switch (ph_type) { + elf.PT_NULL => "NULL", + elf.PT_LOAD => "LOAD", + elf.PT_DYNAMIC => "DYNAMIC", + elf.PT_INTERP => "INTERP", + elf.PT_NOTE => "NOTE", + elf.PT_SHLIB => "SHLIB", + elf.PT_PHDR => "PHDR", + elf.PT_TLS => "TLS", + elf.PT_NUM => "NUM", + elf.PT_GNU_EH_FRAME => "GNU_EH_FRAME", + elf.PT_GNU_STACK => "GNU_STACK", + elf.PT_GNU_RELRO => "GNU_RELRO", + else => "UNKNOWN", + }; + try writer.writeAll(p_type); + } } }; -- cgit v1.2.3