aboutsummaryrefslogtreecommitdiff
path: root/src/arch
diff options
context:
space:
mode:
authorJakub Konka <kubkon@jakubkonka.com>2022-02-16 00:18:42 +0100
committerGitHub <noreply@github.com>2022-02-16 00:18:42 +0100
commit092b019a2feb6d7910c77a8dadc76b1ccc8dee53 (patch)
tree80e14ceb4135a49e69d4b60748762661979917eb /src/arch
parentcf5009f9af118716cbe97a28957cb1ca8d047f44 (diff)
parent1c975607e18711b7512057398065c315fa97464a (diff)
downloadzig-092b019a2feb6d7910c77a8dadc76b1ccc8dee53.tar.gz
zig-092b019a2feb6d7910c77a8dadc76b1ccc8dee53.zip
Merge pull request #10899 from ziglang/arm64-macos
aarch64,macos: handle GOT and direct loads in codegen
Diffstat (limited to 'src/arch')
-rw-r--r--src/arch/aarch64/CodeGen.zig118
-rw-r--r--src/arch/aarch64/Emit.zig134
-rw-r--r--src/arch/aarch64/Mir.zig20
3 files changed, 171 insertions, 101 deletions
diff --git a/src/arch/aarch64/CodeGen.zig b/src/arch/aarch64/CodeGen.zig
index b9d5a29f18..698f91a136 100644
--- a/src/arch/aarch64/CodeGen.zig
+++ b/src/arch/aarch64/CodeGen.zig
@@ -115,6 +115,14 @@ const MCValue = union(enum) {
/// The value is in memory at a hard-coded address.
/// If the type is a pointer, it means the pointer address is at this memory location.
memory: u64,
+ /// The value is in memory referenced indirectly via a GOT entry index.
+ /// If the type is a pointer, it means the pointer is referenced indirectly via GOT.
+ /// When lowered, linker will emit relocations of type ARM64_RELOC_GOT_LOAD_PAGE21 and ARM64_RELOC_GOT_LOAD_PAGEOFF12.
+ got_load: u32,
+ /// The value is in memory referenced directly via symbol index.
+ /// If the type is a pointer, it means the pointer is referenced directly via symbol index.
+ /// When lowered, linker will emit a relocation of type ARM64_RELOC_PAGE21 and ARM64_RELOC_PAGEOFF12.
+ direct_load: u32,
/// The value is one of the stack variables.
/// If the type is a pointer, it means the pointer address is in the stack at this offset.
stack_offset: u32,
@@ -1802,6 +1810,8 @@ fn load(self: *Self, dst_mcv: MCValue, ptr: MCValue, ptr_ty: Type) InnerError!vo
},
.memory,
.stack_offset,
+ .got_load,
+ .direct_load,
=> {
const reg = try self.register_manager.allocReg(null);
self.register_manager.freezeRegs(&.{reg});
@@ -1946,6 +1956,11 @@ fn store(self: *Self, ptr: MCValue, value: MCValue, ptr_ty: Type, value_ty: Type
const addr_reg = try self.copyToTmpRegister(ptr_ty, ptr);
try self.store(.{ .register = addr_reg }, value, ptr_ty, value_ty);
},
+ .got_load,
+ .direct_load,
+ => {
+ return self.fail("TODO implement storing to {}", .{ptr});
+ },
}
}
@@ -2114,6 +2129,8 @@ fn airCall(self: *Self, inst: Air.Inst.Index) !void {
.memory => unreachable,
.compare_flags_signed => unreachable,
.compare_flags_unsigned => unreachable,
+ .got_load => unreachable,
+ .direct_load => unreachable,
.register => |reg| {
try self.register_manager.getReg(reg, null);
try self.genSetReg(arg_ty, reg, arg_mcv);
@@ -2160,10 +2177,8 @@ fn airCall(self: *Self, inst: Air.Inst.Index) !void {
} else if (self.bin_file.cast(link.File.MachO)) |macho_file| {
if (func_value.castTag(.function)) |func_payload| {
const func = func_payload.data;
- // TODO I'm hacking my way through here by repurposing .memory for storing
- // index to the GOT target symbol index.
try self.genSetReg(Type.initTag(.u64), .x30, .{
- .memory = func.owner_decl.link.macho.local_sym_index,
+ .got_load = func.owner_decl.link.macho.local_sym_index,
});
// blr x30
_ = try self.addInst(.{
@@ -3015,6 +3030,12 @@ fn genSetStack(self: *Self, ty: Type, stack_offset: u32, mcv: MCValue) InnerErro
else => return self.fail("TODO implement storing other types abi_size={}", .{abi_size}),
}
},
+ .got_load,
+ .direct_load,
+ => |sym_index| {
+ _ = sym_index;
+ return self.fail("TODO implement set stack variable from {}", .{mcv});
+ },
.memory => |vaddr| {
_ = vaddr;
return self.fail("TODO implement set stack variable from memory vaddr", .{});
@@ -3151,22 +3172,34 @@ fn genSetReg(self: *Self, ty: Type, reg: Register, mcv: MCValue) InnerError!void
.data = .{ .rr = .{ .rd = reg, .rn = src_reg } },
});
},
- .memory => |addr| {
- const owner_decl = self.mod_fn.owner_decl;
- // TODO when refactoring LinkBlock, make this into a generic function.
- const atom_index = switch (self.bin_file.tag) {
- .macho => owner_decl.link.macho.local_sym_index,
- .elf => owner_decl.link.elf.local_sym_index,
- .plan9 => @intCast(u32, owner_decl.link.plan9.sym_index orelse 0),
- else => return self.fail("TODO handle aarch64 load memory in {}", .{self.bin_file.tag}),
+ .got_load,
+ .direct_load,
+ => |sym_index| {
+ const tag: Mir.Inst.Tag = switch (mcv) {
+ .got_load => .load_memory_got,
+ .direct_load => .load_memory_direct,
+ else => unreachable,
};
_ = try self.addInst(.{
+ .tag = tag,
+ .data = .{
+ .payload = try self.addExtra(Mir.LoadMemoryPie{
+ .register = @enumToInt(reg),
+ .atom_index = self.mod_fn.owner_decl.link.macho.local_sym_index,
+ .sym_index = sym_index,
+ }),
+ },
+ });
+ },
+ .memory => |addr| {
+ _ = try self.addInst(.{
.tag = .load_memory,
- .data = .{ .payload = try self.addExtra(Mir.LoadMemory{
- .atom_index = atom_index,
- .register = @enumToInt(reg),
- .addr = @intCast(u32, addr),
- }) },
+ .data = .{
+ .load_memory = .{
+ .register = @enumToInt(reg),
+ .addr = @intCast(u32, addr),
+ },
+ },
});
},
.stack_offset => |unadjusted_off| {
@@ -3385,9 +3418,9 @@ fn lowerDeclRef(self: *Self, tv: TypedValue, decl: *Module.Decl) InnerError!MCVa
const got_addr = got.p_vaddr + decl.link.elf.offset_table_index * ptr_bytes;
return MCValue{ .memory = got_addr };
} else if (self.bin_file.cast(link.File.MachO)) |_| {
- // TODO I'm hacking my way through here by repurposing .memory for storing
- // index to the GOT target symbol index.
- return MCValue{ .memory = decl.link.macho.local_sym_index };
+ // Because MachO is PIE-always-on, we defer memory address resolution until
+ // the linker has enough info to perform relocations.
+ return MCValue{ .got_load = decl.link.macho.local_sym_index };
} else if (self.bin_file.cast(link.File.Coff)) |coff_file| {
const got_addr = coff_file.offset_table_virtual_address + decl.link.coff.offset_table_index * ptr_bytes;
return MCValue{ .memory = got_addr };
@@ -3401,6 +3434,25 @@ fn lowerDeclRef(self: *Self, tv: TypedValue, decl: *Module.Decl) InnerError!MCVa
_ = tv;
}
+fn lowerUnnamedConst(self: *Self, tv: TypedValue) InnerError!MCValue {
+ log.debug("lowerUnnamedConst: ty = {}, val = {}", .{ tv.ty, tv.val });
+ const local_sym_index = self.bin_file.lowerUnnamedConst(tv, self.mod_fn.owner_decl) catch |err| {
+ return self.fail("lowering unnamed constant failed: {s}", .{@errorName(err)});
+ };
+ if (self.bin_file.cast(link.File.Elf)) |elf_file| {
+ const vaddr = elf_file.local_symbols.items[local_sym_index].st_value;
+ return MCValue{ .memory = vaddr };
+ } else if (self.bin_file.cast(link.File.MachO)) |_| {
+ return MCValue{ .direct_load = local_sym_index };
+ } else if (self.bin_file.cast(link.File.Coff)) |_| {
+ return self.fail("TODO lower unnamed const in COFF", .{});
+ } else if (self.bin_file.cast(link.File.Plan9)) |_| {
+ return self.fail("TODO lower unnamed const in Plan9", .{});
+ } else {
+ return self.fail("TODO lower unnamed const", .{});
+ }
+}
+
fn genTypedValue(self: *Self, typed_value: TypedValue) InnerError!MCValue {
if (typed_value.val.isUndef())
return MCValue{ .undef = {} };
@@ -3416,23 +3468,20 @@ fn genTypedValue(self: *Self, typed_value: TypedValue) InnerError!MCValue {
switch (typed_value.ty.zigTypeTag()) {
.Pointer => switch (typed_value.ty.ptrSize()) {
.Slice => {
- var buf: Type.SlicePtrFieldTypeBuffer = undefined;
- const ptr_type = typed_value.ty.slicePtrFieldType(&buf);
- const ptr_mcv = try self.genTypedValue(.{ .ty = ptr_type, .val = typed_value.val });
- const slice_len = typed_value.val.sliceLen();
- // Codegen can't handle some kinds of indirection. If the wrong union field is accessed here it may mean
- // the Sema code needs to use anonymous Decls or alloca instructions to store data.
- const ptr_imm = ptr_mcv.memory;
- _ = slice_len;
- _ = ptr_imm;
- // We need more general support for const data being stored in memory to make this work.
- return self.fail("TODO codegen for const slices", .{});
+ return self.lowerUnnamedConst(typed_value);
},
else => {
- if (typed_value.val.tag() == .int_u64) {
- return MCValue{ .immediate = typed_value.val.toUnsignedInt() };
+ switch (typed_value.val.tag()) {
+ .int_u64 => {
+ return MCValue{ .immediate = typed_value.val.toUnsignedInt() };
+ },
+ .slice => {
+ return self.lowerUnnamedConst(typed_value);
+ },
+ else => {
+ return self.fail("TODO codegen more kinds of const pointers: {}", .{typed_value.val.tag()});
+ },
}
- return self.fail("TODO codegen more kinds of const pointers", .{});
},
},
.Int => {
@@ -3516,6 +3565,9 @@ fn genTypedValue(self: *Self, typed_value: TypedValue) InnerError!MCValue {
return self.fail("TODO implement error union const of type '{}' (error)", .{typed_value.ty});
}
},
+ .Struct => {
+ return self.lowerUnnamedConst(typed_value);
+ },
else => return self.fail("TODO implement const of type '{}'", .{typed_value.ty}),
}
}
diff --git a/src/arch/aarch64/Emit.zig b/src/arch/aarch64/Emit.zig
index bc37cb56c6..77f400ea78 100644
--- a/src/arch/aarch64/Emit.zig
+++ b/src/arch/aarch64/Emit.zig
@@ -109,6 +109,8 @@ pub fn emitMir(
.eor_shifted_register => try emit.mirLogicalShiftedRegister(inst),
.load_memory => try emit.mirLoadMemory(inst),
+ .load_memory_got => try emit.mirLoadMemoryPie(inst),
+ .load_memory_direct => try emit.mirLoadMemoryPie(inst),
.ldp => try emit.mirLoadStoreRegisterPair(inst),
.stp => try emit.mirLoadStoreRegisterPair(inst),
@@ -205,21 +207,18 @@ fn instructionSize(emit: *Emit, inst: Mir.Inst.Index) usize {
}
switch (tag) {
+ .load_memory_got,
+ .load_memory_direct,
+ => return 2 * 4,
.load_memory => {
- if (emit.bin_file.options.pie) {
- // adrp, ldr
- return 2 * 4;
- } else {
- const payload = emit.mir.instructions.items(.data)[inst].payload;
- const load_memory = emit.mir.extraData(Mir.LoadMemory, payload).data;
- const addr = load_memory.addr;
-
- // movz, [movk, ...], ldr
- if (addr <= math.maxInt(u16)) return 2 * 4;
- if (addr <= math.maxInt(u32)) return 3 * 4;
- if (addr <= math.maxInt(u48)) return 4 * 4;
- return 5 * 4;
- }
+ const load_memory = emit.mir.instructions.items(.data)[inst].load_memory;
+ const addr = load_memory.addr;
+
+ // movz, [movk, ...], ldr
+ if (addr <= math.maxInt(u16)) return 2 * 4;
+ if (addr <= math.maxInt(u32)) return 3 * 4;
+ if (addr <= math.maxInt(u48)) return 4 * 4;
+ return 5 * 4;
},
.pop_regs, .push_regs => {
const reg_list = emit.mir.instructions.items(.data)[inst].reg_list;
@@ -658,58 +657,69 @@ fn mirLogicalShiftedRegister(emit: *Emit, inst: Mir.Inst.Index) !void {
fn mirLoadMemory(emit: *Emit, inst: Mir.Inst.Index) !void {
assert(emit.mir.instructions.items(.tag)[inst] == .load_memory);
- const payload = emit.mir.instructions.items(.data)[inst].payload;
- const load_memory = emit.mir.extraData(Mir.LoadMemory, payload).data;
+ const load_memory = emit.mir.instructions.items(.data)[inst].load_memory;
const reg = @intToEnum(Register, load_memory.register);
const addr = load_memory.addr;
+ // The value is in memory at a hard-coded address.
+ // If the type is a pointer, it means the pointer address is at this memory location.
+ try emit.moveImmediate(reg, addr);
+ try emit.writeInstruction(Instruction.ldr(
+ reg,
+ reg,
+ Instruction.LoadStoreOffset.none,
+ ));
+}
- if (emit.bin_file.options.pie) {
- // PC-relative displacement to the entry in the GOT table.
- // adrp
- const offset = @intCast(u32, emit.code.items.len);
- try emit.writeInstruction(Instruction.adrp(reg, 0));
-
- // ldr reg, reg, offset
- try emit.writeInstruction(Instruction.ldr(
- reg,
- reg,
- Instruction.LoadStoreOffset.imm(0),
- ));
-
- if (emit.bin_file.cast(link.File.MachO)) |macho_file| {
- const atom = macho_file.atom_by_index_table.get(load_memory.atom_index).?;
- // Page reloc for adrp instruction.
- try atom.relocs.append(emit.bin_file.allocator, .{
- .offset = offset,
- .target = .{ .local = addr },
- .addend = 0,
- .subtractor = null,
- .pcrel = true,
- .length = 2,
- .@"type" = @enumToInt(std.macho.reloc_type_arm64.ARM64_RELOC_GOT_LOAD_PAGE21),
- });
- // Pageoff reloc for adrp instruction.
- try atom.relocs.append(emit.bin_file.allocator, .{
- .offset = offset + 4,
- .target = .{ .local = addr },
- .addend = 0,
- .subtractor = null,
- .pcrel = false,
- .length = 2,
- .@"type" = @enumToInt(std.macho.reloc_type_arm64.ARM64_RELOC_GOT_LOAD_PAGEOFF12),
- });
- } else {
- return emit.fail("TODO implement load_memory for PIE GOT indirection on this platform", .{});
- }
+fn mirLoadMemoryPie(emit: *Emit, inst: Mir.Inst.Index) !void {
+ const tag = emit.mir.instructions.items(.tag)[inst];
+ const payload = emit.mir.instructions.items(.data)[inst].payload;
+ const data = emit.mir.extraData(Mir.LoadMemoryPie, payload).data;
+ const reg = @intToEnum(Register, data.register);
+
+ // PC-relative displacement to the entry in the GOT table.
+ // adrp
+ const offset = @intCast(u32, emit.code.items.len);
+ try emit.writeInstruction(Instruction.adrp(reg, 0));
+
+ // ldr reg, reg, offset
+ try emit.writeInstruction(Instruction.ldr(
+ reg,
+ reg,
+ Instruction.LoadStoreOffset.imm(0),
+ ));
+
+ if (emit.bin_file.cast(link.File.MachO)) |macho_file| {
+ const atom = macho_file.atom_by_index_table.get(data.atom_index).?;
+ // Page reloc for adrp instruction.
+ try atom.relocs.append(emit.bin_file.allocator, .{
+ .offset = offset,
+ .target = .{ .local = data.sym_index },
+ .addend = 0,
+ .subtractor = null,
+ .pcrel = true,
+ .length = 2,
+ .@"type" = switch (tag) {
+ .load_memory_got => @enumToInt(std.macho.reloc_type_arm64.ARM64_RELOC_GOT_LOAD_PAGE21),
+ .load_memory_direct => @enumToInt(std.macho.reloc_type_arm64.ARM64_RELOC_PAGE21),
+ else => unreachable,
+ },
+ });
+ // Pageoff reloc for adrp instruction.
+ try atom.relocs.append(emit.bin_file.allocator, .{
+ .offset = offset + 4,
+ .target = .{ .local = data.sym_index },
+ .addend = 0,
+ .subtractor = null,
+ .pcrel = false,
+ .length = 2,
+ .@"type" = switch (tag) {
+ .load_memory_got => @enumToInt(std.macho.reloc_type_arm64.ARM64_RELOC_GOT_LOAD_PAGEOFF12),
+ .load_memory_direct => @enumToInt(std.macho.reloc_type_arm64.ARM64_RELOC_PAGEOFF12),
+ else => unreachable,
+ },
+ });
} else {
- // The value is in memory at a hard-coded address.
- // If the type is a pointer, it means the pointer address is at this memory location.
- try emit.moveImmediate(reg, addr);
- try emit.writeInstruction(Instruction.ldr(
- reg,
- reg,
- Instruction.LoadStoreOffset.none,
- ));
+ return emit.fail("TODO implement load_memory for PIE GOT indirection on this platform", .{});
}
}
diff --git a/src/arch/aarch64/Mir.zig b/src/arch/aarch64/Mir.zig
index 92b0604347..62693f01d7 100644
--- a/src/arch/aarch64/Mir.zig
+++ b/src/arch/aarch64/Mir.zig
@@ -58,8 +58,12 @@ pub const Inst = struct {
eor_shifted_register,
/// Pseudo-instruction: Load memory
///
- /// Payload is `LoadMemory`
+ /// Payload is `load_memory`
load_memory,
+ /// Payload is `LoadMemoryPie`
+ load_memory_got,
+ /// Payload is `LoadMemoryPie`
+ load_memory_direct,
/// Load Pair of Registers
ldp,
/// Pseudo-instruction: Load from stack
@@ -157,8 +161,6 @@ pub const Inst = struct {
/// Used by e.g. svc
imm16: u16,
/// Index into `extra`. Meaning of what can be found there is context-dependent.
- ///
- /// Used by e.g. load_memory
payload: u32,
/// A register
///
@@ -298,6 +300,10 @@ pub const Inst = struct {
line: u32,
column: u32,
},
+ load_memory: struct {
+ register: u32,
+ addr: u32,
+ },
};
// Make sure we don't accidentally make instructions bigger than expected.
@@ -335,8 +341,10 @@ pub fn extraData(mir: Mir, comptime T: type, index: usize) struct { data: T, end
};
}
-pub const LoadMemory = struct {
- atom_index: u32,
+pub const LoadMemoryPie = struct {
register: u32,
- addr: u32,
+ /// Index of the containing atom.
+ atom_index: u32,
+ /// Index into the linker's symbol table.
+ sym_index: u32,
};