aboutsummaryrefslogtreecommitdiff
path: root/src/codegen/llvm.zig
diff options
context:
space:
mode:
authorVeikka Tuominen <git@vexu.eu>2022-03-11 13:12:32 +0200
committerVeikka Tuominen <git@vexu.eu>2022-03-11 13:12:32 +0200
commitcba68090a60c3de8eadbf8eb53e37620a1d66683 (patch)
tree19d972a0c3cab03307218e9fb757fd3fdc44c8a3 /src/codegen/llvm.zig
parentdb4262417009c0060e09a8cf8af088b76320aad0 (diff)
downloadzig-cba68090a60c3de8eadbf8eb53e37620a1d66683.tar.gz
zig-cba68090a60c3de8eadbf8eb53e37620a1d66683.zip
stage2: implement `@shuffle` at runtime
Diffstat (limited to 'src/codegen/llvm.zig')
-rw-r--r--src/codegen/llvm.zig38
1 files changed, 38 insertions, 0 deletions
diff --git a/src/codegen/llvm.zig b/src/codegen/llvm.zig
index d7df161b00..190fcd0ee6 100644
--- a/src/codegen/llvm.zig
+++ b/src/codegen/llvm.zig
@@ -3204,6 +3204,7 @@ pub const FuncGen = struct {
.tag_name => try self.airTagName(inst),
.error_name => try self.airErrorName(inst),
.splat => try self.airSplat(inst),
+ .shuffle => try self.airShuffle(inst),
.aggregate_init => try self.airAggregateInit(inst),
.union_init => try self.airUnionInit(inst),
.prefetch => try self.airPrefetch(inst),
@@ -5850,6 +5851,43 @@ pub const FuncGen = struct {
return self.builder.buildShuffleVector(op_vector, undef_vector, mask_llvm_ty.constNull(), "");
}
+ fn airShuffle(self: *FuncGen, inst: Air.Inst.Index) !?*const llvm.Value {
+ if (self.liveness.isUnused(inst)) return null;
+
+ const ty_pl = self.air.instructions.items(.data)[inst].ty_pl;
+ const extra = self.air.extraData(Air.Shuffle, ty_pl.payload).data;
+ const a = try self.resolveInst(extra.a);
+ const b = try self.resolveInst(extra.b);
+ const mask = self.air.values[extra.mask];
+ const mask_len = extra.mask_len;
+ const a_len = self.air.typeOf(extra.a).vectorLen();
+
+ // LLVM uses integers larger than the length of the first array to
+ // index into the second array. This was deemed unnecessarily fragile
+ // when changing code, so Zig uses negative numbers to index the
+ // second vector. These start at -1 and go down, and are easiest to use
+ // with the ~ operator. Here we convert between the two formats.
+ const values = try self.gpa.alloc(*const llvm.Value, mask_len);
+ defer self.gpa.free(values);
+
+ const llvm_i32 = self.context.intType(32);
+
+ for (values) |*val, i| {
+ var buf: Value.ElemValueBuffer = undefined;
+ const elem = mask.elemValueBuffer(i, &buf);
+ if (elem.isUndef()) {
+ val.* = llvm_i32.getUndef();
+ } else {
+ const int = elem.toSignedInt();
+ const unsigned = if (int >= 0) @intCast(u32, int) else @intCast(u32, ~int + a_len);
+ val.* = llvm_i32.constInt(unsigned, .False);
+ }
+ }
+
+ const llvm_mask_value = llvm.constVector(values.ptr, mask_len);
+ return self.builder.buildShuffleVector(a, b, llvm_mask_value, "");
+ }
+
fn airAggregateInit(self: *FuncGen, inst: Air.Inst.Index) !?*const llvm.Value {
if (self.liveness.isUnused(inst)) return null;