aboutsummaryrefslogtreecommitdiff
path: root/src/codegen/llvm.zig
diff options
context:
space:
mode:
Diffstat (limited to 'src/codegen/llvm.zig')
-rw-r--r--src/codegen/llvm.zig54
1 files changed, 35 insertions, 19 deletions
diff --git a/src/codegen/llvm.zig b/src/codegen/llvm.zig
index 6453ea04a3..e656150584 100644
--- a/src/codegen/llvm.zig
+++ b/src/codegen/llvm.zig
@@ -10286,7 +10286,7 @@ pub const FuncGen = struct {
return self.wip.cast(.addrspacecast, operand, try o.lowerType(inst_ty), "");
}
- fn amdgcnWorkIntrinsic(
+ fn workIntrinsic(
self: *FuncGen,
dimension: u32,
default: u32,
@@ -10303,44 +10303,60 @@ pub const FuncGen = struct {
fn airWorkItemId(self: *FuncGen, inst: Air.Inst.Index) !Builder.Value {
const o = self.ng.object;
const target = o.pt.zcu.getTarget();
- assert(target.cpu.arch == .amdgcn); // TODO is to port this function to other GPU architectures
const pl_op = self.air.instructions.items(.data)[@intFromEnum(inst)].pl_op;
const dimension = pl_op.payload;
- return self.amdgcnWorkIntrinsic(dimension, 0, "amdgcn.workitem.id");
+
+ return switch (target.cpu.arch) {
+ .amdgcn => self.workIntrinsic(dimension, 0, "amdgcn.workitem.id"),
+ .nvptx, .nvptx64 => self.workIntrinsic(dimension, 0, "nvvm.read.ptx.sreg.tid"),
+ else => unreachable,
+ };
}
fn airWorkGroupSize(self: *FuncGen, inst: Air.Inst.Index) !Builder.Value {
const o = self.ng.object;
const target = o.pt.zcu.getTarget();
- assert(target.cpu.arch == .amdgcn); // TODO is to port this function to other GPU architectures
const pl_op = self.air.instructions.items(.data)[@intFromEnum(inst)].pl_op;
const dimension = pl_op.payload;
- if (dimension >= 3) return .@"1";
-
- // Fetch the dispatch pointer, which points to this structure:
- // https://github.com/RadeonOpenCompute/ROCR-Runtime/blob/adae6c61e10d371f7cbc3d0e94ae2c070cab18a4/src/inc/hsa.h#L2913
- const dispatch_ptr =
- try self.wip.callIntrinsic(.normal, .none, .@"amdgcn.dispatch.ptr", &.{}, &.{}, "");
- // Load the work_group_* member from the struct as u16.
- // Just treat the dispatch pointer as an array of u16 to keep things simple.
- const workgroup_size_ptr = try self.wip.gep(.inbounds, .i16, dispatch_ptr, &.{
- try o.builder.intValue(try o.lowerType(Type.usize), 2 + dimension),
- }, "");
- const workgroup_size_alignment = comptime Builder.Alignment.fromByteUnits(2);
- return self.wip.load(.normal, .i16, workgroup_size_ptr, workgroup_size_alignment, "");
+ switch (target.cpu.arch) {
+ .amdgcn => {
+ if (dimension >= 3) return .@"1";
+
+ // Fetch the dispatch pointer, which points to this structure:
+ // https://github.com/RadeonOpenCompute/ROCR-Runtime/blob/adae6c61e10d371f7cbc3d0e94ae2c070cab18a4/src/inc/hsa.h#L2913
+ const dispatch_ptr =
+ try self.wip.callIntrinsic(.normal, .none, .@"amdgcn.dispatch.ptr", &.{}, &.{}, "");
+
+ // Load the work_group_* member from the struct as u16.
+ // Just treat the dispatch pointer as an array of u16 to keep things simple.
+ const workgroup_size_ptr = try self.wip.gep(.inbounds, .i16, dispatch_ptr, &.{
+ try o.builder.intValue(try o.lowerType(Type.usize), 2 + dimension),
+ }, "");
+ const workgroup_size_alignment = comptime Builder.Alignment.fromByteUnits(2);
+ return self.wip.load(.normal, .i16, workgroup_size_ptr, workgroup_size_alignment, "");
+ },
+ .nvptx, .nvptx64 => {
+ return self.workIntrinsic(dimension, 1, "nvvm.read.ptx.sreg.ntid");
+ },
+ else => unreachable,
+ }
}
fn airWorkGroupId(self: *FuncGen, inst: Air.Inst.Index) !Builder.Value {
const o = self.ng.object;
const target = o.pt.zcu.getTarget();
- assert(target.cpu.arch == .amdgcn); // TODO is to port this function to other GPU architectures
const pl_op = self.air.instructions.items(.data)[@intFromEnum(inst)].pl_op;
const dimension = pl_op.payload;
- return self.amdgcnWorkIntrinsic(dimension, 0, "amdgcn.workgroup.id");
+
+ return switch (target.cpu.arch) {
+ .amdgcn => self.workIntrinsic(dimension, 0, "amdgcn.workgroup.id"),
+ .nvptx, .nvptx64 => self.workIntrinsic(dimension, 0, "nvvm.read.ptx.sreg.ctaid"),
+ else => unreachable,
+ };
}
fn getErrorNameTable(self: *FuncGen) Allocator.Error!Builder.Variable.Index {