1 files changed, 101 insertions, 76 deletions
diff --git a/src/codegen/spirv.zig b/src/codegen/spirv.zig
index 00d7fa94f9..cbc6ae1eb3 100644
--- a/src/codegen/spirv.zig
+++ b/src/codegen/spirv.zig
@@ -632,11 +632,15 @@ const DeclGen = struct {
     /// Checks whether the type can be directly translated to SPIR-V vectors
     fn isVector(self: *DeclGen, ty: Type) bool {
         const mod = self.module;
+        const target = self.getTarget();
         if (ty.zigTypeTag(mod) != .Vector) return false;
         const elem_ty = ty.childType(mod);
+
         const len = ty.vectorLen(mod);
         const is_scalar = elem_ty.isNumeric(mod) or elem_ty.toIntern() == .bool_type;
-        return is_scalar and len > 1 and len <= 4;
+        const spirv_len = len > 1 and len <= 4;
+        const opencl_len = if (target.os.tag == .opencl) (len == 8 or len == 16) else false;
+        return is_scalar and (spirv_len or opencl_len);
     }
 
     fn arithmeticTypeInfo(self: *DeclGen, ty: Type) ArithmeticTypeInfo {
@@ -1968,7 +1972,10 @@ const DeclGen = struct {
             try self.func.prologue.emit(self.spv.gpa, .OpFunction, .{
                 .id_result_type = self.typeId(return_ty_ref),
                 .id_result = decl_id,
-                .function_control = .{}, // TODO: We can set inline here if the type requires it.
+                .function_control = switch (fn_info.cc) {
+                    .Inline => .{ .Inline = true },
+                    else => .{},
+                },
                 .function_type = prototype_id,
             });
 
@@ -2437,48 +2444,71 @@ const DeclGen = struct {
 
     fn minMax(self: *DeclGen, result_ty: Type, op: std.math.CompareOperator, lhs_id: IdRef, rhs_id: IdRef) !IdRef {
         const info = self.arithmeticTypeInfo(result_ty);
+        const target = self.getTarget();
 
-        var wip = try self.elementWise(result_ty, true);
+        const use_backup_codegen = target.os.tag == .opencl and info.class != .float;
+        var wip = try self.elementWise(result_ty, use_backup_codegen);
         defer wip.deinit();
+
         for (wip.results, 0..) |*result_id, i| {
             const lhs_elem_id = try wip.elementAt(result_ty, lhs_id, i);
             const rhs_elem_id = try wip.elementAt(result_ty, rhs_id, i);
 
-            // TODO: Use fmin for OpenCL
-            const cmp_id = try self.cmp(op, Type.bool, wip.ty, lhs_elem_id, rhs_elem_id);
-            const selection_id = switch (info.class) {
-                .float => blk: {
-                    // cmp uses OpFOrd. When we have 0 [<>] nan this returns false,
-                    // but we want it to pick lhs. Therefore we also have to check if
-                    // rhs is nan. We don't need to care about the result when both
-                    // are nan.
-                    const rhs_is_nan_id = self.spv.allocId();
-                    const bool_ty_ref = try self.resolveType(Type.bool, .direct);
-                    try self.func.body.emit(self.spv.gpa, .OpIsNan, .{
-                        .id_result_type = self.typeId(bool_ty_ref),
-                        .id_result = rhs_is_nan_id,
-                        .x = rhs_elem_id,
-                    });
-                    const float_cmp_id = self.spv.allocId();
-                    try self.func.body.emit(self.spv.gpa, .OpLogicalOr, .{
-                        .id_result_type = self.typeId(bool_ty_ref),
-                        .id_result = float_cmp_id,
-                        .operand_1 = cmp_id,
-                        .operand_2 = rhs_is_nan_id,
-                    });
-                    break :blk float_cmp_id;
-                },
-                else => cmp_id,
-            };
+            if (use_backup_codegen) {
+                const cmp_id = try self.cmp(op, Type.bool, wip.ty, lhs_elem_id, rhs_elem_id);
+                result_id.* = self.spv.allocId();
+                try self.func.body.emit(self.spv.gpa, .OpSelect, .{
+                    .id_result_type = wip.ty_id,
+                    .id_result = result_id.*,
+                    .condition = cmp_id,
+                    .object_1 = lhs_elem_id,
+                    .object_2 = rhs_elem_id,
+                });
+            } else {
+                const ext_inst: Word = switch (target.os.tag) {
+                    .opencl => switch (op) {
+                        .lt => 28, // fmin
+                        .gt => 27, // fmax
+                        else => unreachable,
+                    },
+                    .vulkan => switch (info.class) {
+                        .float => switch (op) {
+                            .lt => 37, // FMin
+                            .gt => 40, // FMax
+                            else => unreachable,
+                        },
+                        .integer, .strange_integer => switch (info.signedness) {
+                            .signed => switch (op) {
+                                .lt => 39, // SMin
+                                .gt => 42, // SMax
+                                else => unreachable,
+                            },
+                            .unsigned => switch (op) {
+                                .lt => 38, // UMin
+                                .gt => 41, // UMax
+                                else => unreachable,
+                            },
+                        },
+                        .composite_integer => unreachable, // TODO
+                        .bool => unreachable,
+                    },
+                    else => unreachable,
+                };
+                const set_id = switch (target.os.tag) {
+                    .opencl => try self.spv.importInstructionSet(.opencl),
+                    .vulkan => try self.spv.importInstructionSet(.glsl),
+                    else => unreachable,
+                };
 
-            result_id.* = self.spv.allocId();
-            try self.func.body.emit(self.spv.gpa, .OpSelect, .{
-                .id_result_type = wip.ty_id,
-                .id_result = result_id.*,
-                .condition = selection_id,
-                .object_1 = lhs_elem_id,
-                .object_2 = rhs_elem_id,
-            });
+                result_id.* = self.spv.allocId();
+                try self.func.body.emit(self.spv.gpa, .OpExtInst, .{
+                    .id_result_type = wip.ty_id,
+                    .id_result = result_id.*,
+                    .set = set_id,
+                    .instruction = .{ .inst = ext_inst },
+                    .id_ref_4 = &.{ lhs_elem_id, rhs_elem_id },
+                });
+            }
         }
         return wip.finalize();
     }
@@ -2607,57 +2637,52 @@ const DeclGen = struct {
     }
 
     fn airAbs(self: *DeclGen, inst: Air.Inst.Index) !?IdRef {
-        const mod = self.module;
+        const target = self.getTarget();
         const ty_op = self.air.instructions.items(.data)[@intFromEnum(inst)].ty_op;
         const operand_id = try self.resolve(ty_op.operand);
         // Note: operand_ty may be signed, while ty is always unsigned!
         const operand_ty = self.typeOf(ty_op.operand);
         const result_ty = self.typeOfIndex(inst);
-        const info = self.arithmeticTypeInfo(result_ty);
-        const operand_scalar_ty = operand_ty.scalarType(mod);
-        const operand_scalar_ty_ref = try self.resolveType(operand_scalar_ty, .direct);
+        const operand_info = self.arithmeticTypeInfo(operand_ty);
 
-        var wip = try self.elementWise(result_ty, true);
+        var wip = try self.elementWise(result_ty, false);
         defer wip.deinit();
 
-        const zero_id = switch (info.class) {
-            .float => try self.constFloat(operand_scalar_ty_ref, 0),
-            .integer, .strange_integer => try self.constInt(operand_scalar_ty_ref, 0),
-            .composite_integer => unreachable, // TODO
-            .bool => unreachable,
-        };
         for (wip.results, 0..) |*result_id, i| {
             const elem_id = try wip.elementAt(operand_ty, operand_id, i);
-            // Idk why spir-v doesn't have a dedicated abs() instruction in the base
-            // instruction set. For now we're just going to negate and check to avoid
-            // importing the extinst.
-            // TODO: Make this a call to compiler rt / ext inst
-            const neg_id = self.spv.allocId();
-            const args = .{
-                .id_result_type = self.typeId(operand_scalar_ty_ref),
-                .id_result = neg_id,
-                .operand_1 = zero_id,
-                .operand_2 = elem_id,
+
+            const ext_inst: Word = switch (target.os.tag) {
+                .opencl => switch (operand_info.class) {
+                    .float => 23, // fabs
+                    .integer, .strange_integer => switch (operand_info.signedness) {
+                        .signed => 141, // s_abs
+                        .unsigned => 201, // u_abs
+                    },
+                    .composite_integer => unreachable, // TODO
+                    .bool => unreachable,
+                },
+                .vulkan => switch (operand_info.class) {
+                    .float => 4, // FAbs
+                    .integer, .strange_integer => 5, // SAbs
+                    .composite_integer => unreachable, // TODO
+                    .bool => unreachable,
+                },
+                else => unreachable,
             };
-            switch (info.class) {
-                .float => try self.func.body.emit(self.spv.gpa, .OpFSub, args),
-                .integer, .strange_integer => try self.func.body.emit(self.spv.gpa, .OpISub, args),
-                .composite_integer => unreachable, // TODO
-                .bool => unreachable,
-            }
-            const neg_norm_id = try self.normalize(wip.ty_ref, neg_id, info);
-
-            const gt_zero_id = try self.cmp(.gt, Type.bool, operand_scalar_ty, elem_id, zero_id);
-            const abs_id = self.spv.allocId();
-            try self.func.body.emit(self.spv.gpa, .OpSelect, .{
-                .id_result_type = self.typeId(operand_scalar_ty_ref),
-                .id_result = abs_id,
-                .condition = gt_zero_id,
-                .object_1 = elem_id,
-                .object_2 = neg_norm_id,
+            const set_id = switch (target.os.tag) {
+                .opencl => try self.spv.importInstructionSet(.opencl),
+                .vulkan => try self.spv.importInstructionSet(.glsl),
+                else => unreachable,
+            };
+
+            result_id.* = self.spv.allocId();
+            try self.func.body.emit(self.spv.gpa, .OpExtInst, .{
+                .id_result_type = wip.ty_id,
+                .id_result = result_id.*,
+                .set = set_id,
+                .instruction = .{ .inst = ext_inst },
+                .id_ref_4 = &.{elem_id},
             });
-            // For Shader, we may need to cast from signed to unsigned here.
-            result_id.* = try self.bitCast(wip.ty, operand_scalar_ty, abs_id);
         }
         return try wip.finalize();
     }