diff options
Diffstat (limited to 'lib/std/target/amdgpu.zig')
| -rw-r--r-- | lib/std/target/amdgpu.zig | 1068 |
1 files changed, 534 insertions, 534 deletions
diff --git a/lib/std/target/amdgpu.zig b/lib/std/target/amdgpu.zig index 3d4b4950ca..f1954628c5 100644 --- a/lib/std/target/amdgpu.zig +++ b/lib/std/target/amdgpu.zig @@ -2,7 +2,7 @@ const Feature = @import("std").target.Feature; const Cpu = @import("std").target.Cpu; pub const feature_BitInsts16 = Feature{ - .name = "16-bit-insts", + .name = "BitInsts16", .llvm_name = "16-bit-insts", .description = "Has i16/f16 instructions", .dependencies = &[_]*const Feature { @@ -10,7 +10,7 @@ pub const feature_BitInsts16 = Feature{ }; pub const feature_addNoCarryInsts = Feature{ - .name = "add-no-carry-insts", + .name = "addNoCarryInsts", .llvm_name = "add-no-carry-insts", .description = "Have VALU add/sub instructions without carry out", .dependencies = &[_]*const Feature { @@ -18,7 +18,7 @@ pub const feature_addNoCarryInsts = Feature{ }; pub const feature_apertureRegs = Feature{ - .name = "aperture-regs", + .name = "apertureRegs", .llvm_name = "aperture-regs", .description = "Has Memory Aperture Base and Size Registers", .dependencies = &[_]*const Feature { @@ -26,7 +26,7 @@ pub const feature_apertureRegs = Feature{ }; pub const feature_atomicFaddInsts = Feature{ - .name = "atomic-fadd-insts", + .name = "atomicFaddInsts", .llvm_name = "atomic-fadd-insts", .description = "Has buffer_atomic_add_f32, buffer_atomic_pk_add_f16, global_atomic_add_f32, global_atomic_pk_add_f16 instructions", .dependencies = &[_]*const Feature { @@ -34,7 +34,7 @@ pub const feature_atomicFaddInsts = Feature{ }; pub const feature_autoWaitcntBeforeBarrier = Feature{ - .name = "auto-waitcnt-before-barrier", + .name = "autoWaitcntBeforeBarrier", .llvm_name = "auto-waitcnt-before-barrier", .description = "Hardware automatically inserts waitcnt before barrier", .dependencies = &[_]*const Feature { @@ -42,7 +42,7 @@ pub const feature_autoWaitcntBeforeBarrier = Feature{ }; pub const feature_ciInsts = Feature{ - .name = "ci-insts", + .name = "ciInsts", .llvm_name = "ci-insts", .description = "Additional instructions for CI+", .dependencies = &[_]*const Feature { @@ -50,7 +50,7 @@ pub const feature_ciInsts = Feature{ }; pub const feature_codeObjectV3 = Feature{ - .name = "code-object-v3", + .name = "codeObjectV3", .llvm_name = "code-object-v3", .description = "Generate code object version 3", .dependencies = &[_]*const Feature { @@ -66,7 +66,7 @@ pub const feature_cumode = Feature{ }; pub const feature_dlInsts = Feature{ - .name = "dl-insts", + .name = "dlInsts", .llvm_name = "dl-insts", .description = "Has v_fmac_f32 and v_xnor_b32 instructions", .dependencies = &[_]*const Feature { @@ -90,7 +90,7 @@ pub const feature_dpp8 = Feature{ }; pub const feature_noSramEccSupport = Feature{ - .name = "no-sram-ecc-support", + .name = "noSramEccSupport", .llvm_name = "no-sram-ecc-support", .description = "Hardware does not support SRAM ECC", .dependencies = &[_]*const Feature { @@ -98,7 +98,7 @@ pub const feature_noSramEccSupport = Feature{ }; pub const feature_noXnackSupport = Feature{ - .name = "no-xnack-support", + .name = "noXnackSupport", .llvm_name = "no-xnack-support", .description = "Hardware does not support XNACK", .dependencies = &[_]*const Feature { @@ -106,7 +106,7 @@ pub const feature_noXnackSupport = Feature{ }; pub const feature_dot1Insts = Feature{ - .name = "dot1-insts", + .name = "dot1Insts", .llvm_name = "dot1-insts", .description = "Has v_dot4_i32_i8 and v_dot8_i32_i4 instructions", .dependencies = &[_]*const Feature { @@ -114,7 +114,7 @@ pub const feature_dot1Insts = Feature{ }; pub const feature_dot2Insts = Feature{ - .name = "dot2-insts", + .name = "dot2Insts", .llvm_name = "dot2-insts", .description = "Has v_dot2_f32_f16, v_dot2_i32_i16, v_dot2_u32_u16, v_dot4_u32_u8, v_dot8_u32_u4 instructions", .dependencies = &[_]*const Feature { @@ -122,7 +122,7 @@ pub const feature_dot2Insts = Feature{ }; pub const feature_dot3Insts = Feature{ - .name = "dot3-insts", + .name = "dot3Insts", .llvm_name = "dot3-insts", .description = "Has v_dot8c_i32_i4 instruction", .dependencies = &[_]*const Feature { @@ -130,7 +130,7 @@ pub const feature_dot3Insts = Feature{ }; pub const feature_dot4Insts = Feature{ - .name = "dot4-insts", + .name = "dot4Insts", .llvm_name = "dot4-insts", .description = "Has v_dot2c_i32_i16 instruction", .dependencies = &[_]*const Feature { @@ -138,7 +138,7 @@ pub const feature_dot4Insts = Feature{ }; pub const feature_dot5Insts = Feature{ - .name = "dot5-insts", + .name = "dot5Insts", .llvm_name = "dot5-insts", .description = "Has v_dot2c_f32_f16 instruction", .dependencies = &[_]*const Feature { @@ -146,7 +146,7 @@ pub const feature_dot5Insts = Feature{ }; pub const feature_dot6Insts = Feature{ - .name = "dot6-insts", + .name = "dot6Insts", .llvm_name = "dot6-insts", .description = "Has v_dot4c_i32_i8 instruction", .dependencies = &[_]*const Feature { @@ -170,7 +170,7 @@ pub const feature_dumpcode = Feature{ }; pub const feature_enableDs128 = Feature{ - .name = "enable-ds128", + .name = "enableDs128", .llvm_name = "enable-ds128", .description = "Use ds_{read|write}_b128", .dependencies = &[_]*const Feature { @@ -178,7 +178,7 @@ pub const feature_enableDs128 = Feature{ }; pub const feature_loadStoreOpt = Feature{ - .name = "load-store-opt", + .name = "loadStoreOpt", .llvm_name = "load-store-opt", .description = "Enable SI load/store optimizer pass", .dependencies = &[_]*const Feature { @@ -186,7 +186,7 @@ pub const feature_loadStoreOpt = Feature{ }; pub const feature_enablePrtStrictNull = Feature{ - .name = "enable-prt-strict-null", + .name = "enablePrtStrictNull", .llvm_name = "enable-prt-strict-null", .description = "Enable zeroing of result registers for sparse texture fetches", .dependencies = &[_]*const Feature { @@ -194,7 +194,7 @@ pub const feature_enablePrtStrictNull = Feature{ }; pub const feature_siScheduler = Feature{ - .name = "si-scheduler", + .name = "siScheduler", .llvm_name = "si-scheduler", .description = "Enable SI Machine Scheduler", .dependencies = &[_]*const Feature { @@ -202,7 +202,7 @@ pub const feature_siScheduler = Feature{ }; pub const feature_unsafeDsOffsetFolding = Feature{ - .name = "unsafe-ds-offset-folding", + .name = "unsafeDsOffsetFolding", .llvm_name = "unsafe-ds-offset-folding", .description = "Force using DS instruction immediate offsets on SI", .dependencies = &[_]*const Feature { @@ -218,7 +218,7 @@ pub const feature_fmaf = Feature{ }; pub const feature_fp16Denormals = Feature{ - .name = "fp16-denormals", + .name = "fp16Denormals", .llvm_name = "fp16-denormals", .description = "Enable half precision denormal handling", .dependencies = &[_]*const Feature { @@ -227,7 +227,7 @@ pub const feature_fp16Denormals = Feature{ }; pub const feature_fp32Denormals = Feature{ - .name = "fp32-denormals", + .name = "fp32Denormals", .llvm_name = "fp32-denormals", .description = "Enable single precision denormal handling", .dependencies = &[_]*const Feature { @@ -243,7 +243,7 @@ pub const feature_fp64 = Feature{ }; pub const feature_fp64Denormals = Feature{ - .name = "fp64-denormals", + .name = "fp64Denormals", .llvm_name = "fp64-denormals", .description = "Enable double and half precision denormal handling", .dependencies = &[_]*const Feature { @@ -252,7 +252,7 @@ pub const feature_fp64Denormals = Feature{ }; pub const feature_fp64Fp16Denormals = Feature{ - .name = "fp64-fp16-denormals", + .name = "fp64Fp16Denormals", .llvm_name = "fp64-fp16-denormals", .description = "Enable double and half precision denormal handling", .dependencies = &[_]*const Feature { @@ -261,7 +261,7 @@ pub const feature_fp64Fp16Denormals = Feature{ }; pub const feature_fpExceptions = Feature{ - .name = "fp-exceptions", + .name = "fpExceptions", .llvm_name = "fp-exceptions", .description = "Enable floating point exceptions", .dependencies = &[_]*const Feature { @@ -269,7 +269,7 @@ pub const feature_fpExceptions = Feature{ }; pub const feature_fastFmaf = Feature{ - .name = "fast-fmaf", + .name = "fastFmaf", .llvm_name = "fast-fmaf", .description = "Assuming f32 fma is at least as fast as mul + add", .dependencies = &[_]*const Feature { @@ -277,7 +277,7 @@ pub const feature_fastFmaf = Feature{ }; pub const feature_flatAddressSpace = Feature{ - .name = "flat-address-space", + .name = "flatAddressSpace", .llvm_name = "flat-address-space", .description = "Support flat address space", .dependencies = &[_]*const Feature { @@ -285,7 +285,7 @@ pub const feature_flatAddressSpace = Feature{ }; pub const feature_flatForGlobal = Feature{ - .name = "flat-for-global", + .name = "flatForGlobal", .llvm_name = "flat-for-global", .description = "Force to generate flat instruction for global", .dependencies = &[_]*const Feature { @@ -293,7 +293,7 @@ pub const feature_flatForGlobal = Feature{ }; pub const feature_flatGlobalInsts = Feature{ - .name = "flat-global-insts", + .name = "flatGlobalInsts", .llvm_name = "flat-global-insts", .description = "Have global_* flat memory instructions", .dependencies = &[_]*const Feature { @@ -301,7 +301,7 @@ pub const feature_flatGlobalInsts = Feature{ }; pub const feature_flatInstOffsets = Feature{ - .name = "flat-inst-offsets", + .name = "flatInstOffsets", .llvm_name = "flat-inst-offsets", .description = "Flat instructions have immediate offset addressing mode", .dependencies = &[_]*const Feature { @@ -309,7 +309,7 @@ pub const feature_flatInstOffsets = Feature{ }; pub const feature_flatScratchInsts = Feature{ - .name = "flat-scratch-insts", + .name = "flatScratchInsts", .llvm_name = "flat-scratch-insts", .description = "Have scratch_* flat memory instructions", .dependencies = &[_]*const Feature { @@ -317,7 +317,7 @@ pub const feature_flatScratchInsts = Feature{ }; pub const feature_flatSegmentOffsetBug = Feature{ - .name = "flat-segment-offset-bug", + .name = "flatSegmentOffsetBug", .llvm_name = "flat-segment-offset-bug", .description = "GFX10 bug, inst_offset ignored in flat segment", .dependencies = &[_]*const Feature { @@ -325,7 +325,7 @@ pub const feature_flatSegmentOffsetBug = Feature{ }; pub const feature_fmaMixInsts = Feature{ - .name = "fma-mix-insts", + .name = "fmaMixInsts", .llvm_name = "fma-mix-insts", .description = "Has v_fma_mix_f32, v_fma_mixlo_f16, v_fma_mixhi_f16 instructions", .dependencies = &[_]*const Feature { @@ -333,7 +333,7 @@ pub const feature_fmaMixInsts = Feature{ }; pub const feature_gcn3Encoding = Feature{ - .name = "gcn3-encoding", + .name = "gcn3Encoding", .llvm_name = "gcn3-encoding", .description = "Encoding format for VI", .dependencies = &[_]*const Feature { @@ -341,7 +341,7 @@ pub const feature_gcn3Encoding = Feature{ }; pub const feature_gfx7Gfx8Gfx9Insts = Feature{ - .name = "gfx7-gfx8-gfx9-insts", + .name = "gfx7Gfx8Gfx9Insts", .llvm_name = "gfx7-gfx8-gfx9-insts", .description = "Instructions shared in GFX7, GFX8, GFX9", .dependencies = &[_]*const Feature { @@ -349,7 +349,7 @@ pub const feature_gfx7Gfx8Gfx9Insts = Feature{ }; pub const feature_gfx8Insts = Feature{ - .name = "gfx8-insts", + .name = "gfx8Insts", .llvm_name = "gfx8-insts", .description = "Additional instructions for GFX8+", .dependencies = &[_]*const Feature { @@ -357,7 +357,7 @@ pub const feature_gfx8Insts = Feature{ }; pub const feature_gfx9Insts = Feature{ - .name = "gfx9-insts", + .name = "gfx9Insts", .llvm_name = "gfx9-insts", .description = "Additional instructions for GFX9+", .dependencies = &[_]*const Feature { @@ -365,7 +365,7 @@ pub const feature_gfx9Insts = Feature{ }; pub const feature_gfx10Insts = Feature{ - .name = "gfx10-insts", + .name = "gfx10Insts", .llvm_name = "gfx10-insts", .description = "Additional instructions for GFX10+", .dependencies = &[_]*const Feature { @@ -373,7 +373,7 @@ pub const feature_gfx10Insts = Feature{ }; pub const feature_instFwdPrefetchBug = Feature{ - .name = "inst-fwd-prefetch-bug", + .name = "instFwdPrefetchBug", .llvm_name = "inst-fwd-prefetch-bug", .description = "S_INST_PREFETCH instruction causes shader to hang", .dependencies = &[_]*const Feature { @@ -381,7 +381,7 @@ pub const feature_instFwdPrefetchBug = Feature{ }; pub const feature_intClampInsts = Feature{ - .name = "int-clamp-insts", + .name = "intClampInsts", .llvm_name = "int-clamp-insts", .description = "Support clamp for integer destination", .dependencies = &[_]*const Feature { @@ -389,7 +389,7 @@ pub const feature_intClampInsts = Feature{ }; pub const feature_inv2piInlineImm = Feature{ - .name = "inv-2pi-inline-imm", + .name = "inv2piInlineImm", .llvm_name = "inv-2pi-inline-imm", .description = "Has 1 / (2 * pi) as inline immediate", .dependencies = &[_]*const Feature { @@ -413,7 +413,7 @@ pub const feature_ldsbankcount32 = Feature{ }; pub const feature_ldsBranchVmemWarHazard = Feature{ - .name = "lds-branch-vmem-war-hazard", + .name = "ldsBranchVmemWarHazard", .llvm_name = "lds-branch-vmem-war-hazard", .description = "Switching between LDS and VMEM-tex not waiting VM_VSRC=0", .dependencies = &[_]*const Feature { @@ -421,7 +421,7 @@ pub const feature_ldsBranchVmemWarHazard = Feature{ }; pub const feature_ldsMisalignedBug = Feature{ - .name = "lds-misaligned-bug", + .name = "ldsMisalignedBug", .llvm_name = "lds-misaligned-bug", .description = "Some GFX10 bug with misaligned multi-dword LDS access in WGP mode", .dependencies = &[_]*const Feature { @@ -453,7 +453,7 @@ pub const feature_localmemorysize65536 = Feature{ }; pub const feature_maiInsts = Feature{ - .name = "mai-insts", + .name = "maiInsts", .llvm_name = "mai-insts", .description = "Has mAI instructions", .dependencies = &[_]*const Feature { @@ -461,7 +461,7 @@ pub const feature_maiInsts = Feature{ }; pub const feature_mfmaInlineLiteralBug = Feature{ - .name = "mfma-inline-literal-bug", + .name = "mfmaInlineLiteralBug", .llvm_name = "mfma-inline-literal-bug", .description = "MFMA cannot use inline literal as SrcC", .dependencies = &[_]*const Feature { @@ -469,7 +469,7 @@ pub const feature_mfmaInlineLiteralBug = Feature{ }; pub const feature_mimgR128 = Feature{ - .name = "mimg-r128", + .name = "mimgR128", .llvm_name = "mimg-r128", .description = "Support 128-bit texture resources", .dependencies = &[_]*const Feature { @@ -477,7 +477,7 @@ pub const feature_mimgR128 = Feature{ }; pub const feature_madMixInsts = Feature{ - .name = "mad-mix-insts", + .name = "madMixInsts", .llvm_name = "mad-mix-insts", .description = "Has v_mad_mix_f32, v_mad_mixlo_f16, v_mad_mixhi_f16 instructions", .dependencies = &[_]*const Feature { @@ -485,7 +485,7 @@ pub const feature_madMixInsts = Feature{ }; pub const feature_maxPrivateElementSize4 = Feature{ - .name = "max-private-element-size-4", + .name = "maxPrivateElementSize4", .llvm_name = "max-private-element-size-4", .description = "Maximum private access size may be 4", .dependencies = &[_]*const Feature { @@ -493,7 +493,7 @@ pub const feature_maxPrivateElementSize4 = Feature{ }; pub const feature_maxPrivateElementSize8 = Feature{ - .name = "max-private-element-size-8", + .name = "maxPrivateElementSize8", .llvm_name = "max-private-element-size-8", .description = "Maximum private access size may be 8", .dependencies = &[_]*const Feature { @@ -501,7 +501,7 @@ pub const feature_maxPrivateElementSize8 = Feature{ }; pub const feature_maxPrivateElementSize16 = Feature{ - .name = "max-private-element-size-16", + .name = "maxPrivateElementSize16", .llvm_name = "max-private-element-size-16", .description = "Maximum private access size may be 16", .dependencies = &[_]*const Feature { @@ -517,7 +517,7 @@ pub const feature_movrel = Feature{ }; pub const feature_nsaEncoding = Feature{ - .name = "nsa-encoding", + .name = "nsaEncoding", .llvm_name = "nsa-encoding", .description = "Support NSA encoding for image instructions", .dependencies = &[_]*const Feature { @@ -525,7 +525,7 @@ pub const feature_nsaEncoding = Feature{ }; pub const feature_nsaToVmemBug = Feature{ - .name = "nsa-to-vmem-bug", + .name = "nsaToVmemBug", .llvm_name = "nsa-to-vmem-bug", .description = "MIMG-NSA followed by VMEM fail if EXEC_LO or EXEC_HI equals zero", .dependencies = &[_]*const Feature { @@ -533,7 +533,7 @@ pub const feature_nsaToVmemBug = Feature{ }; pub const feature_noDataDepHazard = Feature{ - .name = "no-data-dep-hazard", + .name = "noDataDepHazard", .llvm_name = "no-data-dep-hazard", .description = "Does not need SW waitstates", .dependencies = &[_]*const Feature { @@ -541,7 +541,7 @@ pub const feature_noDataDepHazard = Feature{ }; pub const feature_noSdstCmpx = Feature{ - .name = "no-sdst-cmpx", + .name = "noSdstCmpx", .llvm_name = "no-sdst-cmpx", .description = "V_CMPX does not write VCC/SGPR in addition to EXEC", .dependencies = &[_]*const Feature { @@ -549,7 +549,7 @@ pub const feature_noSdstCmpx = Feature{ }; pub const feature_offset3fBug = Feature{ - .name = "offset-3f-bug", + .name = "offset3fBug", .llvm_name = "offset-3f-bug", .description = "Branch offset of 3f hardware bug", .dependencies = &[_]*const Feature { @@ -557,7 +557,7 @@ pub const feature_offset3fBug = Feature{ }; pub const feature_pkFmacF16Inst = Feature{ - .name = "pk-fmac-f16-inst", + .name = "pkFmacF16Inst", .llvm_name = "pk-fmac-f16-inst", .description = "Has v_pk_fmac_f16 instruction", .dependencies = &[_]*const Feature { @@ -565,7 +565,7 @@ pub const feature_pkFmacF16Inst = Feature{ }; pub const feature_promoteAlloca = Feature{ - .name = "promote-alloca", + .name = "promoteAlloca", .llvm_name = "promote-alloca", .description = "Enable promote alloca pass", .dependencies = &[_]*const Feature { @@ -573,7 +573,7 @@ pub const feature_promoteAlloca = Feature{ }; pub const feature_r128A16 = Feature{ - .name = "r128-a16", + .name = "r128A16", .llvm_name = "r128-a16", .description = "Support 16 bit coordindates/gradients/lod/clamp/mip types on gfx9", .dependencies = &[_]*const Feature { @@ -581,7 +581,7 @@ pub const feature_r128A16 = Feature{ }; pub const feature_registerBanking = Feature{ - .name = "register-banking", + .name = "registerBanking", .llvm_name = "register-banking", .description = "Has register banking", .dependencies = &[_]*const Feature { @@ -597,7 +597,7 @@ pub const feature_sdwa = Feature{ }; pub const feature_sdwaMav = Feature{ - .name = "sdwa-mav", + .name = "sdwaMav", .llvm_name = "sdwa-mav", .description = "Support v_mac_f32/f16 with SDWA (Sub-DWORD Addressing) extension", .dependencies = &[_]*const Feature { @@ -605,7 +605,7 @@ pub const feature_sdwaMav = Feature{ }; pub const feature_sdwaOmod = Feature{ - .name = "sdwa-omod", + .name = "sdwaOmod", .llvm_name = "sdwa-omod", .description = "Support OMod with SDWA (Sub-DWORD Addressing) extension", .dependencies = &[_]*const Feature { @@ -613,7 +613,7 @@ pub const feature_sdwaOmod = Feature{ }; pub const feature_sdwaOutModsVopc = Feature{ - .name = "sdwa-out-mods-vopc", + .name = "sdwaOutModsVopc", .llvm_name = "sdwa-out-mods-vopc", .description = "Support clamp for VOPC with SDWA (Sub-DWORD Addressing) extension", .dependencies = &[_]*const Feature { @@ -621,7 +621,7 @@ pub const feature_sdwaOutModsVopc = Feature{ }; pub const feature_sdwaScalar = Feature{ - .name = "sdwa-scalar", + .name = "sdwaScalar", .llvm_name = "sdwa-scalar", .description = "Support scalar register with SDWA (Sub-DWORD Addressing) extension", .dependencies = &[_]*const Feature { @@ -629,7 +629,7 @@ pub const feature_sdwaScalar = Feature{ }; pub const feature_sdwaSdst = Feature{ - .name = "sdwa-sdst", + .name = "sdwaSdst", .llvm_name = "sdwa-sdst", .description = "Support scalar dst for VOPC with SDWA (Sub-DWORD Addressing) extension", .dependencies = &[_]*const Feature { @@ -637,7 +637,7 @@ pub const feature_sdwaSdst = Feature{ }; pub const feature_sgprInitBug = Feature{ - .name = "sgpr-init-bug", + .name = "sgprInitBug", .llvm_name = "sgpr-init-bug", .description = "VI SGPR initialization bug requiring a fixed SGPR allocation size", .dependencies = &[_]*const Feature { @@ -645,7 +645,7 @@ pub const feature_sgprInitBug = Feature{ }; pub const feature_smemToVectorWriteHazard = Feature{ - .name = "smem-to-vector-write-hazard", + .name = "smemToVectorWriteHazard", .llvm_name = "smem-to-vector-write-hazard", .description = "s_load_dword followed by v_cmp page faults", .dependencies = &[_]*const Feature { @@ -653,7 +653,7 @@ pub const feature_smemToVectorWriteHazard = Feature{ }; pub const feature_sMemrealtime = Feature{ - .name = "s-memrealtime", + .name = "sMemrealtime", .llvm_name = "s-memrealtime", .description = "Has s_memrealtime instruction", .dependencies = &[_]*const Feature { @@ -661,7 +661,7 @@ pub const feature_sMemrealtime = Feature{ }; pub const feature_sramEcc = Feature{ - .name = "sram-ecc", + .name = "sramEcc", .llvm_name = "sram-ecc", .description = "Enable SRAM ECC", .dependencies = &[_]*const Feature { @@ -669,7 +669,7 @@ pub const feature_sramEcc = Feature{ }; pub const feature_scalarAtomics = Feature{ - .name = "scalar-atomics", + .name = "scalarAtomics", .llvm_name = "scalar-atomics", .description = "Has atomic scalar memory instructions", .dependencies = &[_]*const Feature { @@ -677,7 +677,7 @@ pub const feature_scalarAtomics = Feature{ }; pub const feature_scalarFlatScratchInsts = Feature{ - .name = "scalar-flat-scratch-insts", + .name = "scalarFlatScratchInsts", .llvm_name = "scalar-flat-scratch-insts", .description = "Have s_scratch_* flat memory instructions", .dependencies = &[_]*const Feature { @@ -685,7 +685,7 @@ pub const feature_scalarFlatScratchInsts = Feature{ }; pub const feature_scalarStores = Feature{ - .name = "scalar-stores", + .name = "scalarStores", .llvm_name = "scalar-stores", .description = "Has store scalar memory instructions", .dependencies = &[_]*const Feature { @@ -693,7 +693,7 @@ pub const feature_scalarStores = Feature{ }; pub const feature_trapHandler = Feature{ - .name = "trap-handler", + .name = "trapHandler", .llvm_name = "trap-handler", .description = "Trap handler support", .dependencies = &[_]*const Feature { @@ -701,7 +701,7 @@ pub const feature_trapHandler = Feature{ }; pub const feature_trigReducedRange = Feature{ - .name = "trig-reduced-range", + .name = "trigReducedRange", .llvm_name = "trig-reduced-range", .description = "Requires use of fract on arguments to trig instructions", .dependencies = &[_]*const Feature { @@ -709,7 +709,7 @@ pub const feature_trigReducedRange = Feature{ }; pub const feature_unalignedBufferAccess = Feature{ - .name = "unaligned-buffer-access", + .name = "unalignedBufferAccess", .llvm_name = "unaligned-buffer-access", .description = "Support unaligned global loads and stores", .dependencies = &[_]*const Feature { @@ -717,7 +717,7 @@ pub const feature_unalignedBufferAccess = Feature{ }; pub const feature_unalignedScratchAccess = Feature{ - .name = "unaligned-scratch-access", + .name = "unalignedScratchAccess", .llvm_name = "unaligned-scratch-access", .description = "Support unaligned scratch loads and stores", .dependencies = &[_]*const Feature { @@ -725,7 +725,7 @@ pub const feature_unalignedScratchAccess = Feature{ }; pub const feature_unpackedD16Vmem = Feature{ - .name = "unpacked-d16-vmem", + .name = "unpackedD16Vmem", .llvm_name = "unpacked-d16-vmem", .description = "Has unpacked d16 vmem instructions", .dependencies = &[_]*const Feature { @@ -733,7 +733,7 @@ pub const feature_unpackedD16Vmem = Feature{ }; pub const feature_vgprIndexMode = Feature{ - .name = "vgpr-index-mode", + .name = "vgprIndexMode", .llvm_name = "vgpr-index-mode", .description = "Has VGPR mode register indexing", .dependencies = &[_]*const Feature { @@ -741,7 +741,7 @@ pub const feature_vgprIndexMode = Feature{ }; pub const feature_vmemToScalarWriteHazard = Feature{ - .name = "vmem-to-scalar-write-hazard", + .name = "vmemToScalarWriteHazard", .llvm_name = "vmem-to-scalar-write-hazard", .description = "VMEM instruction followed by scalar writing to EXEC mask, M0 or SGPR leads to incorrect execution.", .dependencies = &[_]*const Feature { @@ -749,7 +749,7 @@ pub const feature_vmemToScalarWriteHazard = Feature{ }; pub const feature_vop3Literal = Feature{ - .name = "vop3-literal", + .name = "vop3Literal", .llvm_name = "vop3-literal", .description = "Can use one literal in VOP3", .dependencies = &[_]*const Feature { @@ -765,7 +765,7 @@ pub const feature_vop3p = Feature{ }; pub const feature_vcmpxExecWarHazard = Feature{ - .name = "vcmpx-exec-war-hazard", + .name = "vcmpxExecWarHazard", .llvm_name = "vcmpx-exec-war-hazard", .description = "V_CMPX WAR hazard on EXEC (V_CMPX issue ONLY)", .dependencies = &[_]*const Feature { @@ -773,7 +773,7 @@ pub const feature_vcmpxExecWarHazard = Feature{ }; pub const feature_vcmpxPermlaneHazard = Feature{ - .name = "vcmpx-permlane-hazard", + .name = "vcmpxPermlaneHazard", .llvm_name = "vcmpx-permlane-hazard", .description = "TODO: describe me", .dependencies = &[_]*const Feature { @@ -821,7 +821,7 @@ pub const feature_xnack = Feature{ }; pub const feature_halfRate64Ops = Feature{ - .name = "half-rate-64-ops", + .name = "halfRate64Ops", .llvm_name = "half-rate-64-ops", .description = "Most fp64 instructions are half rate instead of quarter", .dependencies = &[_]*const Feature { @@ -942,15 +942,15 @@ pub const cpu_bonaire = Cpu{ &feature_noXnackSupport, &feature_ldsbankcount32, &feature_movrel, - &feature_flatAddressSpace, &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, &feature_wavefrontsize64, + &feature_ciInsts, + &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, &feature_mimgR128, &feature_noSramEccSupport, + &feature_flatAddressSpace, &feature_localmemorysize65536, - &feature_fp64, - &feature_ciInsts, }, }; @@ -962,28 +962,28 @@ pub const cpu_carrizo = Cpu{ &feature_fastFmaf, &feature_ldsbankcount32, &feature_unpackedD16Vmem, - &feature_sMemrealtime, - &feature_scalarStores, + &feature_BitInsts16, &feature_flatAddressSpace, - &feature_vgprIndexMode, - &feature_wavefrontsize64, - &feature_mimgR128, - &feature_intClampInsts, &feature_dpp, - &feature_movrel, - &feature_gcn3Encoding, - &feature_gfx8Insts, - &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, - &feature_sdwaMav, &feature_sdwa, - &feature_localmemorysize65536, - &feature_BitInsts16, - &feature_sdwaOutModsVopc, + &feature_mimgR128, &feature_inv2piInlineImm, - &feature_noSramEccSupport, + &feature_sdwaOutModsVopc, + &feature_sMemrealtime, + &feature_trigReducedRange, + &feature_vgprIndexMode, &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, + &feature_noSramEccSupport, + &feature_gfx8Insts, + &feature_localmemorysize65536, + &feature_movrel, + &feature_intClampInsts, + &feature_sdwaMav, + &feature_wavefrontsize64, &feature_ciInsts, + &feature_scalarStores, + &feature_gcn3Encoding, &feature_xnack, &feature_halfRate64Ops, }, @@ -997,28 +997,28 @@ pub const cpu_fiji = Cpu{ &feature_noXnackSupport, &feature_ldsbankcount32, &feature_unpackedD16Vmem, - &feature_sMemrealtime, - &feature_scalarStores, + &feature_BitInsts16, &feature_flatAddressSpace, - &feature_vgprIndexMode, - &feature_wavefrontsize64, - &feature_mimgR128, - &feature_intClampInsts, &feature_dpp, - &feature_movrel, - &feature_gcn3Encoding, - &feature_gfx8Insts, - &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, - &feature_sdwaMav, &feature_sdwa, - &feature_localmemorysize65536, - &feature_BitInsts16, - &feature_sdwaOutModsVopc, + &feature_mimgR128, &feature_inv2piInlineImm, - &feature_noSramEccSupport, + &feature_sdwaOutModsVopc, + &feature_sMemrealtime, + &feature_trigReducedRange, + &feature_vgprIndexMode, &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, + &feature_noSramEccSupport, + &feature_gfx8Insts, + &feature_localmemorysize65536, + &feature_movrel, + &feature_intClampInsts, + &feature_sdwaMav, + &feature_wavefrontsize64, &feature_ciInsts, + &feature_scalarStores, + &feature_gcn3Encoding, }, }; @@ -1031,7 +1031,7 @@ pub const cpu_generic = Cpu{ }; pub const cpu_genericHsa = Cpu{ - .name = "generic-hsa", + .name = "genericHsa", .llvm_name = "generic-hsa", .dependencies = &[_]*const Feature { &feature_flatAddressSpace, @@ -1047,40 +1047,40 @@ pub const cpu_gfx1010 = Cpu{ &feature_dlInsts, &feature_noXnackSupport, &feature_flatSegmentOffsetBug, - &feature_sdwaOmod, - &feature_sMemrealtime, - &feature_flatAddressSpace, - &feature_gfx9Insts, - &feature_fastFmaf, - &feature_flatScratchInsts, - &feature_mimgR128, - &feature_noSdstCmpx, - &feature_sdwaSdst, - &feature_vop3p, - &feature_intClampInsts, - &feature_dpp, - &feature_registerBanking, - &feature_movrel, - &feature_gfx8Insts, - &feature_sdwa, - &feature_noDataDepHazard, + &feature_vop3Literal, + &feature_apertureRegs, &feature_flatGlobalInsts, &feature_gfx10Insts, - &feature_localmemorysize65536, &feature_BitInsts16, - &feature_addNoCarryInsts, &feature_pkFmacF16Inst, + &feature_vop3p, + &feature_flatAddressSpace, + &feature_dpp, + &feature_inv2piInlineImm, + &feature_dpp8, + &feature_flatScratchInsts, &feature_flatInstOffsets, + &feature_mimgR128, + &feature_sdwa, &feature_fmaMixInsts, - &feature_sdwaScalar, - &feature_inv2piInlineImm, + &feature_sMemrealtime, &feature_vscnt, - &feature_apertureRegs, - &feature_dpp8, - &feature_noSramEccSupport, + &feature_fastFmaf, + &feature_registerBanking, + &feature_gfx9Insts, + &feature_sdwaSdst, + &feature_noSdstCmpx, &feature_fp64, + &feature_noSramEccSupport, + &feature_gfx8Insts, + &feature_localmemorysize65536, + &feature_movrel, + &feature_intClampInsts, + &feature_sdwaScalar, + &feature_sdwaOmod, + &feature_noDataDepHazard, &feature_ciInsts, - &feature_vop3Literal, + &feature_addNoCarryInsts, &feature_instFwdPrefetchBug, &feature_ldsbankcount32, &feature_ldsBranchVmemWarHazard, @@ -1111,40 +1111,40 @@ pub const cpu_gfx1011 = Cpu{ &feature_dot5Insts, &feature_dot6Insts, &feature_flatSegmentOffsetBug, - &feature_sdwaOmod, - &feature_sMemrealtime, - &feature_flatAddressSpace, - &feature_gfx9Insts, - &feature_fastFmaf, - &feature_flatScratchInsts, - &feature_mimgR128, - &feature_noSdstCmpx, - &feature_sdwaSdst, - &feature_vop3p, - &feature_intClampInsts, - &feature_dpp, - &feature_registerBanking, - &feature_movrel, - &feature_gfx8Insts, - &feature_sdwa, - &feature_noDataDepHazard, + &feature_vop3Literal, + &feature_apertureRegs, &feature_flatGlobalInsts, &feature_gfx10Insts, - &feature_localmemorysize65536, &feature_BitInsts16, - &feature_addNoCarryInsts, &feature_pkFmacF16Inst, + &feature_vop3p, + &feature_flatAddressSpace, + &feature_dpp, + &feature_inv2piInlineImm, + &feature_dpp8, + &feature_flatScratchInsts, &feature_flatInstOffsets, + &feature_mimgR128, + &feature_sdwa, &feature_fmaMixInsts, - &feature_sdwaScalar, - &feature_inv2piInlineImm, + &feature_sMemrealtime, &feature_vscnt, - &feature_apertureRegs, - &feature_dpp8, - &feature_noSramEccSupport, + &feature_fastFmaf, + &feature_registerBanking, + &feature_gfx9Insts, + &feature_sdwaSdst, + &feature_noSdstCmpx, &feature_fp64, + &feature_noSramEccSupport, + &feature_gfx8Insts, + &feature_localmemorysize65536, + &feature_movrel, + &feature_intClampInsts, + &feature_sdwaScalar, + &feature_sdwaOmod, + &feature_noDataDepHazard, &feature_ciInsts, - &feature_vop3Literal, + &feature_addNoCarryInsts, &feature_instFwdPrefetchBug, &feature_ldsbankcount32, &feature_ldsBranchVmemWarHazard, @@ -1174,40 +1174,40 @@ pub const cpu_gfx1012 = Cpu{ &feature_dot5Insts, &feature_dot6Insts, &feature_flatSegmentOffsetBug, - &feature_sdwaOmod, - &feature_sMemrealtime, - &feature_flatAddressSpace, - &feature_gfx9Insts, - &feature_fastFmaf, - &feature_flatScratchInsts, - &feature_mimgR128, - &feature_noSdstCmpx, - &feature_sdwaSdst, - &feature_vop3p, - &feature_intClampInsts, - &feature_dpp, - &feature_registerBanking, - &feature_movrel, - &feature_gfx8Insts, - &feature_sdwa, - &feature_noDataDepHazard, + &feature_vop3Literal, + &feature_apertureRegs, &feature_flatGlobalInsts, &feature_gfx10Insts, - &feature_localmemorysize65536, &feature_BitInsts16, - &feature_addNoCarryInsts, &feature_pkFmacF16Inst, + &feature_vop3p, + &feature_flatAddressSpace, + &feature_dpp, + &feature_inv2piInlineImm, + &feature_dpp8, + &feature_flatScratchInsts, &feature_flatInstOffsets, + &feature_mimgR128, + &feature_sdwa, &feature_fmaMixInsts, - &feature_sdwaScalar, - &feature_inv2piInlineImm, + &feature_sMemrealtime, &feature_vscnt, - &feature_apertureRegs, - &feature_dpp8, - &feature_noSramEccSupport, + &feature_fastFmaf, + &feature_registerBanking, + &feature_gfx9Insts, + &feature_sdwaSdst, + &feature_noSdstCmpx, &feature_fp64, + &feature_noSramEccSupport, + &feature_gfx8Insts, + &feature_localmemorysize65536, + &feature_movrel, + &feature_intClampInsts, + &feature_sdwaScalar, + &feature_sdwaOmod, + &feature_noDataDepHazard, &feature_ciInsts, - &feature_vop3Literal, + &feature_addNoCarryInsts, &feature_instFwdPrefetchBug, &feature_ldsbankcount32, &feature_ldsBranchVmemWarHazard, @@ -1236,11 +1236,11 @@ pub const cpu_gfx600 = Cpu{ &feature_ldsbankcount32, &feature_movrel, &feature_trigReducedRange, - &feature_mimgR128, - &feature_localmemorysize32768, &feature_wavefrontsize64, - &feature_noSramEccSupport, + &feature_localmemorysize32768, &feature_fp64, + &feature_noSramEccSupport, + &feature_mimgR128, &feature_halfRate64Ops, }, }; @@ -1254,11 +1254,11 @@ pub const cpu_gfx601 = Cpu{ &feature_ldsbankcount32, &feature_movrel, &feature_trigReducedRange, - &feature_mimgR128, - &feature_localmemorysize32768, &feature_wavefrontsize64, - &feature_noSramEccSupport, + &feature_localmemorysize32768, &feature_fp64, + &feature_noSramEccSupport, + &feature_mimgR128, }, }; @@ -1270,15 +1270,15 @@ pub const cpu_gfx700 = Cpu{ &feature_noXnackSupport, &feature_ldsbankcount32, &feature_movrel, - &feature_flatAddressSpace, &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, &feature_wavefrontsize64, + &feature_ciInsts, + &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, &feature_mimgR128, &feature_noSramEccSupport, + &feature_flatAddressSpace, &feature_localmemorysize65536, - &feature_fp64, - &feature_ciInsts, }, }; @@ -1291,15 +1291,15 @@ pub const cpu_gfx701 = Cpu{ &feature_fastFmaf, &feature_ldsbankcount32, &feature_movrel, - &feature_flatAddressSpace, &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, &feature_wavefrontsize64, + &feature_ciInsts, + &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, &feature_mimgR128, &feature_noSramEccSupport, + &feature_flatAddressSpace, &feature_localmemorysize65536, - &feature_fp64, - &feature_ciInsts, &feature_halfRate64Ops, }, }; @@ -1313,15 +1313,15 @@ pub const cpu_gfx702 = Cpu{ &feature_fastFmaf, &feature_ldsbankcount16, &feature_movrel, - &feature_flatAddressSpace, &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, &feature_wavefrontsize64, + &feature_ciInsts, + &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, &feature_mimgR128, &feature_noSramEccSupport, + &feature_flatAddressSpace, &feature_localmemorysize65536, - &feature_fp64, - &feature_ciInsts, }, }; @@ -1333,15 +1333,15 @@ pub const cpu_gfx703 = Cpu{ &feature_noXnackSupport, &feature_ldsbankcount16, &feature_movrel, - &feature_flatAddressSpace, &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, &feature_wavefrontsize64, + &feature_ciInsts, + &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, &feature_mimgR128, &feature_noSramEccSupport, + &feature_flatAddressSpace, &feature_localmemorysize65536, - &feature_fp64, - &feature_ciInsts, }, }; @@ -1353,15 +1353,15 @@ pub const cpu_gfx704 = Cpu{ &feature_noXnackSupport, &feature_ldsbankcount32, &feature_movrel, - &feature_flatAddressSpace, &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, &feature_wavefrontsize64, + &feature_ciInsts, + &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, &feature_mimgR128, &feature_noSramEccSupport, + &feature_flatAddressSpace, &feature_localmemorysize65536, - &feature_fp64, - &feature_ciInsts, }, }; @@ -1373,28 +1373,28 @@ pub const cpu_gfx801 = Cpu{ &feature_fastFmaf, &feature_ldsbankcount32, &feature_unpackedD16Vmem, - &feature_sMemrealtime, - &feature_scalarStores, + &feature_BitInsts16, &feature_flatAddressSpace, - &feature_vgprIndexMode, - &feature_wavefrontsize64, - &feature_mimgR128, - &feature_intClampInsts, &feature_dpp, - &feature_movrel, - &feature_gcn3Encoding, - &feature_gfx8Insts, - &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, - &feature_sdwaMav, &feature_sdwa, - &feature_localmemorysize65536, - &feature_BitInsts16, - &feature_sdwaOutModsVopc, + &feature_mimgR128, &feature_inv2piInlineImm, - &feature_noSramEccSupport, + &feature_sdwaOutModsVopc, + &feature_sMemrealtime, + &feature_trigReducedRange, + &feature_vgprIndexMode, &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, + &feature_noSramEccSupport, + &feature_gfx8Insts, + &feature_localmemorysize65536, + &feature_movrel, + &feature_intClampInsts, + &feature_sdwaMav, + &feature_wavefrontsize64, &feature_ciInsts, + &feature_scalarStores, + &feature_gcn3Encoding, &feature_xnack, &feature_halfRate64Ops, }, @@ -1409,28 +1409,28 @@ pub const cpu_gfx802 = Cpu{ &feature_ldsbankcount32, &feature_sgprInitBug, &feature_unpackedD16Vmem, - &feature_sMemrealtime, - &feature_scalarStores, + &feature_BitInsts16, &feature_flatAddressSpace, - &feature_vgprIndexMode, - &feature_wavefrontsize64, - &feature_mimgR128, - &feature_intClampInsts, &feature_dpp, - &feature_movrel, - &feature_gcn3Encoding, - &feature_gfx8Insts, - &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, - &feature_sdwaMav, &feature_sdwa, - &feature_localmemorysize65536, - &feature_BitInsts16, - &feature_sdwaOutModsVopc, + &feature_mimgR128, &feature_inv2piInlineImm, - &feature_noSramEccSupport, + &feature_sdwaOutModsVopc, + &feature_sMemrealtime, + &feature_trigReducedRange, + &feature_vgprIndexMode, &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, + &feature_noSramEccSupport, + &feature_gfx8Insts, + &feature_localmemorysize65536, + &feature_movrel, + &feature_intClampInsts, + &feature_sdwaMav, + &feature_wavefrontsize64, &feature_ciInsts, + &feature_scalarStores, + &feature_gcn3Encoding, }, }; @@ -1442,28 +1442,28 @@ pub const cpu_gfx803 = Cpu{ &feature_noXnackSupport, &feature_ldsbankcount32, &feature_unpackedD16Vmem, - &feature_sMemrealtime, - &feature_scalarStores, + &feature_BitInsts16, &feature_flatAddressSpace, - &feature_vgprIndexMode, - &feature_wavefrontsize64, - &feature_mimgR128, - &feature_intClampInsts, &feature_dpp, - &feature_movrel, - &feature_gcn3Encoding, - &feature_gfx8Insts, - &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, - &feature_sdwaMav, &feature_sdwa, - &feature_localmemorysize65536, - &feature_BitInsts16, - &feature_sdwaOutModsVopc, + &feature_mimgR128, &feature_inv2piInlineImm, - &feature_noSramEccSupport, + &feature_sdwaOutModsVopc, + &feature_sMemrealtime, + &feature_trigReducedRange, + &feature_vgprIndexMode, &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, + &feature_noSramEccSupport, + &feature_gfx8Insts, + &feature_localmemorysize65536, + &feature_movrel, + &feature_intClampInsts, + &feature_sdwaMav, + &feature_wavefrontsize64, &feature_ciInsts, + &feature_scalarStores, + &feature_gcn3Encoding, }, }; @@ -1473,28 +1473,28 @@ pub const cpu_gfx810 = Cpu{ .dependencies = &[_]*const Feature { &feature_codeObjectV3, &feature_ldsbankcount16, - &feature_sMemrealtime, - &feature_scalarStores, + &feature_BitInsts16, &feature_flatAddressSpace, - &feature_vgprIndexMode, - &feature_wavefrontsize64, - &feature_mimgR128, - &feature_intClampInsts, &feature_dpp, - &feature_movrel, - &feature_gcn3Encoding, - &feature_gfx8Insts, - &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, - &feature_sdwaMav, &feature_sdwa, - &feature_localmemorysize65536, - &feature_BitInsts16, - &feature_sdwaOutModsVopc, + &feature_mimgR128, &feature_inv2piInlineImm, - &feature_noSramEccSupport, + &feature_sdwaOutModsVopc, + &feature_sMemrealtime, + &feature_trigReducedRange, + &feature_vgprIndexMode, &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, + &feature_noSramEccSupport, + &feature_gfx8Insts, + &feature_localmemorysize65536, + &feature_movrel, + &feature_intClampInsts, + &feature_sdwaMav, + &feature_wavefrontsize64, &feature_ciInsts, + &feature_scalarStores, + &feature_gcn3Encoding, &feature_xnack, }, }; @@ -1506,36 +1506,36 @@ pub const cpu_gfx900 = Cpu{ &feature_codeObjectV3, &feature_noSramEccSupport, &feature_noXnackSupport, - &feature_sdwaOmod, - &feature_sMemrealtime, - &feature_scalarStores, + &feature_apertureRegs, + &feature_flatGlobalInsts, + &feature_BitInsts16, + &feature_vop3p, &feature_flatAddressSpace, - &feature_vgprIndexMode, - &feature_gfx9Insts, - &feature_r128A16, - &feature_fastFmaf, - &feature_wavefrontsize64, + &feature_dpp, + &feature_inv2piInlineImm, + &feature_sdwa, &feature_flatScratchInsts, + &feature_flatInstOffsets, + &feature_scalarFlatScratchInsts, + &feature_sMemrealtime, + &feature_fastFmaf, + &feature_gfx9Insts, &feature_sdwaSdst, - &feature_vop3p, - &feature_intClampInsts, - &feature_dpp, - &feature_scalarAtomics, - &feature_gcn3Encoding, - &feature_gfx8Insts, + &feature_vgprIndexMode, + &feature_fp64, &feature_gfx7Gfx8Gfx9Insts, - &feature_sdwa, - &feature_flatGlobalInsts, + &feature_gfx8Insts, &feature_localmemorysize65536, - &feature_BitInsts16, - &feature_addNoCarryInsts, - &feature_flatInstOffsets, + &feature_intClampInsts, &feature_sdwaScalar, - &feature_inv2piInlineImm, - &feature_apertureRegs, - &feature_fp64, + &feature_sdwaOmod, + &feature_scalarAtomics, + &feature_r128A16, + &feature_wavefrontsize64, &feature_ciInsts, - &feature_scalarFlatScratchInsts, + &feature_scalarStores, + &feature_gcn3Encoding, + &feature_addNoCarryInsts, &feature_ldsbankcount32, &feature_madMixInsts, }, @@ -1547,36 +1547,36 @@ pub const cpu_gfx902 = Cpu{ .dependencies = &[_]*const Feature { &feature_codeObjectV3, &feature_noSramEccSupport, - &feature_sdwaOmod, - &feature_sMemrealtime, - &feature_scalarStores, + &feature_apertureRegs, + &feature_flatGlobalInsts, + &feature_BitInsts16, + &feature_vop3p, &feature_flatAddressSpace, - &feature_vgprIndexMode, - &feature_gfx9Insts, - &feature_r128A16, - &feature_fastFmaf, - &feature_wavefrontsize64, + &feature_dpp, + &feature_inv2piInlineImm, + &feature_sdwa, &feature_flatScratchInsts, + &feature_flatInstOffsets, + &feature_scalarFlatScratchInsts, + &feature_sMemrealtime, + &feature_fastFmaf, + &feature_gfx9Insts, &feature_sdwaSdst, - &feature_vop3p, - &feature_intClampInsts, - &feature_dpp, - &feature_scalarAtomics, - &feature_gcn3Encoding, - &feature_gfx8Insts, + &feature_vgprIndexMode, + &feature_fp64, &feature_gfx7Gfx8Gfx9Insts, - &feature_sdwa, - &feature_flatGlobalInsts, + &feature_gfx8Insts, &feature_localmemorysize65536, - &feature_BitInsts16, - &feature_addNoCarryInsts, - &feature_flatInstOffsets, + &feature_intClampInsts, &feature_sdwaScalar, - &feature_inv2piInlineImm, - &feature_apertureRegs, - &feature_fp64, + &feature_sdwaOmod, + &feature_scalarAtomics, + &feature_r128A16, + &feature_wavefrontsize64, &feature_ciInsts, - &feature_scalarFlatScratchInsts, + &feature_scalarStores, + &feature_gcn3Encoding, + &feature_addNoCarryInsts, &feature_ldsbankcount32, &feature_madMixInsts, &feature_xnack, @@ -1591,36 +1591,36 @@ pub const cpu_gfx904 = Cpu{ &feature_noSramEccSupport, &feature_noXnackSupport, &feature_fmaMixInsts, - &feature_sdwaOmod, - &feature_sMemrealtime, - &feature_scalarStores, + &feature_apertureRegs, + &feature_flatGlobalInsts, + &feature_BitInsts16, + &feature_vop3p, &feature_flatAddressSpace, - &feature_vgprIndexMode, - &feature_gfx9Insts, - &feature_r128A16, - &feature_fastFmaf, - &feature_wavefrontsize64, + &feature_dpp, + &feature_inv2piInlineImm, + &feature_sdwa, &feature_flatScratchInsts, + &feature_flatInstOffsets, + &feature_scalarFlatScratchInsts, + &feature_sMemrealtime, + &feature_fastFmaf, + &feature_gfx9Insts, &feature_sdwaSdst, - &feature_vop3p, - &feature_intClampInsts, - &feature_dpp, - &feature_scalarAtomics, - &feature_gcn3Encoding, - &feature_gfx8Insts, + &feature_vgprIndexMode, + &feature_fp64, &feature_gfx7Gfx8Gfx9Insts, - &feature_sdwa, - &feature_flatGlobalInsts, + &feature_gfx8Insts, &feature_localmemorysize65536, - &feature_BitInsts16, - &feature_addNoCarryInsts, - &feature_flatInstOffsets, + &feature_intClampInsts, &feature_sdwaScalar, - &feature_inv2piInlineImm, - &feature_apertureRegs, - &feature_fp64, + &feature_sdwaOmod, + &feature_scalarAtomics, + &feature_r128A16, + &feature_wavefrontsize64, &feature_ciInsts, - &feature_scalarFlatScratchInsts, + &feature_scalarStores, + &feature_gcn3Encoding, + &feature_addNoCarryInsts, &feature_ldsbankcount32, }, }; @@ -1635,36 +1635,36 @@ pub const cpu_gfx906 = Cpu{ &feature_dot1Insts, &feature_dot2Insts, &feature_fmaMixInsts, - &feature_sdwaOmod, - &feature_sMemrealtime, - &feature_scalarStores, + &feature_apertureRegs, + &feature_flatGlobalInsts, + &feature_BitInsts16, + &feature_vop3p, &feature_flatAddressSpace, - &feature_vgprIndexMode, - &feature_gfx9Insts, - &feature_r128A16, - &feature_fastFmaf, - &feature_wavefrontsize64, + &feature_dpp, + &feature_inv2piInlineImm, + &feature_sdwa, &feature_flatScratchInsts, + &feature_flatInstOffsets, + &feature_scalarFlatScratchInsts, + &feature_sMemrealtime, + &feature_fastFmaf, + &feature_gfx9Insts, &feature_sdwaSdst, - &feature_vop3p, - &feature_intClampInsts, - &feature_dpp, - &feature_scalarAtomics, - &feature_gcn3Encoding, - &feature_gfx8Insts, + &feature_vgprIndexMode, + &feature_fp64, &feature_gfx7Gfx8Gfx9Insts, - &feature_sdwa, - &feature_flatGlobalInsts, + &feature_gfx8Insts, &feature_localmemorysize65536, - &feature_BitInsts16, - &feature_addNoCarryInsts, - &feature_flatInstOffsets, + &feature_intClampInsts, &feature_sdwaScalar, - &feature_inv2piInlineImm, - &feature_apertureRegs, - &feature_fp64, + &feature_sdwaOmod, + &feature_scalarAtomics, + &feature_r128A16, + &feature_wavefrontsize64, &feature_ciInsts, - &feature_scalarFlatScratchInsts, + &feature_scalarStores, + &feature_gcn3Encoding, + &feature_addNoCarryInsts, &feature_ldsbankcount32, &feature_halfRate64Ops, }, @@ -1684,36 +1684,36 @@ pub const cpu_gfx908 = Cpu{ &feature_dot5Insts, &feature_dot6Insts, &feature_fmaMixInsts, - &feature_sdwaOmod, - &feature_sMemrealtime, - &feature_scalarStores, + &feature_apertureRegs, + &feature_flatGlobalInsts, + &feature_BitInsts16, + &feature_vop3p, &feature_flatAddressSpace, - &feature_vgprIndexMode, - &feature_gfx9Insts, - &feature_r128A16, - &feature_fastFmaf, - &feature_wavefrontsize64, + &feature_dpp, + &feature_inv2piInlineImm, + &feature_sdwa, &feature_flatScratchInsts, + &feature_flatInstOffsets, + &feature_scalarFlatScratchInsts, + &feature_sMemrealtime, + &feature_fastFmaf, + &feature_gfx9Insts, &feature_sdwaSdst, - &feature_vop3p, - &feature_intClampInsts, - &feature_dpp, - &feature_scalarAtomics, - &feature_gcn3Encoding, - &feature_gfx8Insts, + &feature_vgprIndexMode, + &feature_fp64, &feature_gfx7Gfx8Gfx9Insts, - &feature_sdwa, - &feature_flatGlobalInsts, + &feature_gfx8Insts, &feature_localmemorysize65536, - &feature_BitInsts16, - &feature_addNoCarryInsts, - &feature_flatInstOffsets, + &feature_intClampInsts, &feature_sdwaScalar, - &feature_inv2piInlineImm, - &feature_apertureRegs, - &feature_fp64, + &feature_sdwaOmod, + &feature_scalarAtomics, + &feature_r128A16, + &feature_wavefrontsize64, &feature_ciInsts, - &feature_scalarFlatScratchInsts, + &feature_scalarStores, + &feature_gcn3Encoding, + &feature_addNoCarryInsts, &feature_ldsbankcount32, &feature_maiInsts, &feature_mfmaInlineLiteralBug, @@ -1728,36 +1728,36 @@ pub const cpu_gfx909 = Cpu{ .llvm_name = "gfx909", .dependencies = &[_]*const Feature { &feature_codeObjectV3, - &feature_sdwaOmod, - &feature_sMemrealtime, - &feature_scalarStores, + &feature_apertureRegs, + &feature_flatGlobalInsts, + &feature_BitInsts16, + &feature_vop3p, &feature_flatAddressSpace, - &feature_vgprIndexMode, - &feature_gfx9Insts, - &feature_r128A16, - &feature_fastFmaf, - &feature_wavefrontsize64, + &feature_dpp, + &feature_inv2piInlineImm, + &feature_sdwa, &feature_flatScratchInsts, + &feature_flatInstOffsets, + &feature_scalarFlatScratchInsts, + &feature_sMemrealtime, + &feature_fastFmaf, + &feature_gfx9Insts, &feature_sdwaSdst, - &feature_vop3p, - &feature_intClampInsts, - &feature_dpp, - &feature_scalarAtomics, - &feature_gcn3Encoding, - &feature_gfx8Insts, + &feature_vgprIndexMode, + &feature_fp64, &feature_gfx7Gfx8Gfx9Insts, - &feature_sdwa, - &feature_flatGlobalInsts, + &feature_gfx8Insts, &feature_localmemorysize65536, - &feature_BitInsts16, - &feature_addNoCarryInsts, - &feature_flatInstOffsets, + &feature_intClampInsts, &feature_sdwaScalar, - &feature_inv2piInlineImm, - &feature_apertureRegs, - &feature_fp64, + &feature_sdwaOmod, + &feature_scalarAtomics, + &feature_r128A16, + &feature_wavefrontsize64, &feature_ciInsts, - &feature_scalarFlatScratchInsts, + &feature_scalarStores, + &feature_gcn3Encoding, + &feature_addNoCarryInsts, &feature_ldsbankcount32, &feature_madMixInsts, &feature_xnack, @@ -1773,11 +1773,11 @@ pub const cpu_hainan = Cpu{ &feature_ldsbankcount32, &feature_movrel, &feature_trigReducedRange, - &feature_mimgR128, - &feature_localmemorysize32768, &feature_wavefrontsize64, - &feature_noSramEccSupport, + &feature_localmemorysize32768, &feature_fp64, + &feature_noSramEccSupport, + &feature_mimgR128, }, }; @@ -1790,15 +1790,15 @@ pub const cpu_hawaii = Cpu{ &feature_fastFmaf, &feature_ldsbankcount32, &feature_movrel, - &feature_flatAddressSpace, &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, &feature_wavefrontsize64, + &feature_ciInsts, + &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, &feature_mimgR128, &feature_noSramEccSupport, + &feature_flatAddressSpace, &feature_localmemorysize65536, - &feature_fp64, - &feature_ciInsts, &feature_halfRate64Ops, }, }; @@ -1812,28 +1812,28 @@ pub const cpu_iceland = Cpu{ &feature_ldsbankcount32, &feature_sgprInitBug, &feature_unpackedD16Vmem, - &feature_sMemrealtime, - &feature_scalarStores, + &feature_BitInsts16, &feature_flatAddressSpace, - &feature_vgprIndexMode, - &feature_wavefrontsize64, - &feature_mimgR128, - &feature_intClampInsts, &feature_dpp, - &feature_movrel, - &feature_gcn3Encoding, - &feature_gfx8Insts, - &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, - &feature_sdwaMav, &feature_sdwa, - &feature_localmemorysize65536, - &feature_BitInsts16, - &feature_sdwaOutModsVopc, + &feature_mimgR128, &feature_inv2piInlineImm, - &feature_noSramEccSupport, + &feature_sdwaOutModsVopc, + &feature_sMemrealtime, + &feature_trigReducedRange, + &feature_vgprIndexMode, &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, + &feature_noSramEccSupport, + &feature_gfx8Insts, + &feature_localmemorysize65536, + &feature_movrel, + &feature_intClampInsts, + &feature_sdwaMav, + &feature_wavefrontsize64, &feature_ciInsts, + &feature_scalarStores, + &feature_gcn3Encoding, }, }; @@ -1845,15 +1845,15 @@ pub const cpu_kabini = Cpu{ &feature_noXnackSupport, &feature_ldsbankcount16, &feature_movrel, - &feature_flatAddressSpace, &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, &feature_wavefrontsize64, + &feature_ciInsts, + &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, &feature_mimgR128, &feature_noSramEccSupport, + &feature_flatAddressSpace, &feature_localmemorysize65536, - &feature_fp64, - &feature_ciInsts, }, }; @@ -1865,15 +1865,15 @@ pub const cpu_kaveri = Cpu{ &feature_noXnackSupport, &feature_ldsbankcount32, &feature_movrel, - &feature_flatAddressSpace, &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, &feature_wavefrontsize64, + &feature_ciInsts, + &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, &feature_mimgR128, &feature_noSramEccSupport, + &feature_flatAddressSpace, &feature_localmemorysize65536, - &feature_fp64, - &feature_ciInsts, }, }; @@ -1885,15 +1885,15 @@ pub const cpu_mullins = Cpu{ &feature_noXnackSupport, &feature_ldsbankcount16, &feature_movrel, - &feature_flatAddressSpace, &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, &feature_wavefrontsize64, + &feature_ciInsts, + &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, &feature_mimgR128, &feature_noSramEccSupport, + &feature_flatAddressSpace, &feature_localmemorysize65536, - &feature_fp64, - &feature_ciInsts, }, }; @@ -1906,11 +1906,11 @@ pub const cpu_oland = Cpu{ &feature_ldsbankcount32, &feature_movrel, &feature_trigReducedRange, - &feature_mimgR128, - &feature_localmemorysize32768, &feature_wavefrontsize64, - &feature_noSramEccSupport, + &feature_localmemorysize32768, &feature_fp64, + &feature_noSramEccSupport, + &feature_mimgR128, }, }; @@ -1923,11 +1923,11 @@ pub const cpu_pitcairn = Cpu{ &feature_ldsbankcount32, &feature_movrel, &feature_trigReducedRange, - &feature_mimgR128, - &feature_localmemorysize32768, &feature_wavefrontsize64, - &feature_noSramEccSupport, + &feature_localmemorysize32768, &feature_fp64, + &feature_noSramEccSupport, + &feature_mimgR128, }, }; @@ -1939,28 +1939,28 @@ pub const cpu_polaris10 = Cpu{ &feature_noXnackSupport, &feature_ldsbankcount32, &feature_unpackedD16Vmem, - &feature_sMemrealtime, - &feature_scalarStores, + &feature_BitInsts16, &feature_flatAddressSpace, - &feature_vgprIndexMode, - &feature_wavefrontsize64, - &feature_mimgR128, - &feature_intClampInsts, &feature_dpp, - &feature_movrel, - &feature_gcn3Encoding, - &feature_gfx8Insts, - &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, - &feature_sdwaMav, &feature_sdwa, - &feature_localmemorysize65536, - &feature_BitInsts16, - &feature_sdwaOutModsVopc, + &feature_mimgR128, &feature_inv2piInlineImm, - &feature_noSramEccSupport, + &feature_sdwaOutModsVopc, + &feature_sMemrealtime, + &feature_trigReducedRange, + &feature_vgprIndexMode, &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, + &feature_noSramEccSupport, + &feature_gfx8Insts, + &feature_localmemorysize65536, + &feature_movrel, + &feature_intClampInsts, + &feature_sdwaMav, + &feature_wavefrontsize64, &feature_ciInsts, + &feature_scalarStores, + &feature_gcn3Encoding, }, }; @@ -1972,28 +1972,28 @@ pub const cpu_polaris11 = Cpu{ &feature_noXnackSupport, &feature_ldsbankcount32, &feature_unpackedD16Vmem, - &feature_sMemrealtime, - &feature_scalarStores, + &feature_BitInsts16, &feature_flatAddressSpace, - &feature_vgprIndexMode, - &feature_wavefrontsize64, - &feature_mimgR128, - &feature_intClampInsts, &feature_dpp, - &feature_movrel, - &feature_gcn3Encoding, - &feature_gfx8Insts, - &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, - &feature_sdwaMav, &feature_sdwa, - &feature_localmemorysize65536, - &feature_BitInsts16, - &feature_sdwaOutModsVopc, + &feature_mimgR128, &feature_inv2piInlineImm, - &feature_noSramEccSupport, + &feature_sdwaOutModsVopc, + &feature_sMemrealtime, + &feature_trigReducedRange, + &feature_vgprIndexMode, &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, + &feature_noSramEccSupport, + &feature_gfx8Insts, + &feature_localmemorysize65536, + &feature_movrel, + &feature_intClampInsts, + &feature_sdwaMav, + &feature_wavefrontsize64, &feature_ciInsts, + &feature_scalarStores, + &feature_gcn3Encoding, }, }; @@ -2003,28 +2003,28 @@ pub const cpu_stoney = Cpu{ .dependencies = &[_]*const Feature { &feature_codeObjectV3, &feature_ldsbankcount16, - &feature_sMemrealtime, - &feature_scalarStores, + &feature_BitInsts16, &feature_flatAddressSpace, - &feature_vgprIndexMode, - &feature_wavefrontsize64, - &feature_mimgR128, - &feature_intClampInsts, &feature_dpp, - &feature_movrel, - &feature_gcn3Encoding, - &feature_gfx8Insts, - &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, - &feature_sdwaMav, &feature_sdwa, - &feature_localmemorysize65536, - &feature_BitInsts16, - &feature_sdwaOutModsVopc, + &feature_mimgR128, &feature_inv2piInlineImm, - &feature_noSramEccSupport, + &feature_sdwaOutModsVopc, + &feature_sMemrealtime, + &feature_trigReducedRange, + &feature_vgprIndexMode, &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, + &feature_noSramEccSupport, + &feature_gfx8Insts, + &feature_localmemorysize65536, + &feature_movrel, + &feature_intClampInsts, + &feature_sdwaMav, + &feature_wavefrontsize64, &feature_ciInsts, + &feature_scalarStores, + &feature_gcn3Encoding, &feature_xnack, }, }; @@ -2039,11 +2039,11 @@ pub const cpu_tahiti = Cpu{ &feature_ldsbankcount32, &feature_movrel, &feature_trigReducedRange, - &feature_mimgR128, - &feature_localmemorysize32768, &feature_wavefrontsize64, - &feature_noSramEccSupport, + &feature_localmemorysize32768, &feature_fp64, + &feature_noSramEccSupport, + &feature_mimgR128, &feature_halfRate64Ops, }, }; @@ -2057,28 +2057,28 @@ pub const cpu_tonga = Cpu{ &feature_ldsbankcount32, &feature_sgprInitBug, &feature_unpackedD16Vmem, - &feature_sMemrealtime, - &feature_scalarStores, + &feature_BitInsts16, &feature_flatAddressSpace, - &feature_vgprIndexMode, - &feature_wavefrontsize64, - &feature_mimgR128, - &feature_intClampInsts, &feature_dpp, - &feature_movrel, - &feature_gcn3Encoding, - &feature_gfx8Insts, - &feature_trigReducedRange, - &feature_gfx7Gfx8Gfx9Insts, - &feature_sdwaMav, &feature_sdwa, - &feature_localmemorysize65536, - &feature_BitInsts16, - &feature_sdwaOutModsVopc, + &feature_mimgR128, &feature_inv2piInlineImm, - &feature_noSramEccSupport, + &feature_sdwaOutModsVopc, + &feature_sMemrealtime, + &feature_trigReducedRange, + &feature_vgprIndexMode, &feature_fp64, + &feature_gfx7Gfx8Gfx9Insts, + &feature_noSramEccSupport, + &feature_gfx8Insts, + &feature_localmemorysize65536, + &feature_movrel, + &feature_intClampInsts, + &feature_sdwaMav, + &feature_wavefrontsize64, &feature_ciInsts, + &feature_scalarStores, + &feature_gcn3Encoding, }, }; @@ -2091,11 +2091,11 @@ pub const cpu_verde = Cpu{ &feature_ldsbankcount32, &feature_movrel, &feature_trigReducedRange, - &feature_mimgR128, - &feature_localmemorysize32768, &feature_wavefrontsize64, - &feature_noSramEccSupport, + &feature_localmemorysize32768, &feature_fp64, + &feature_noSramEccSupport, + &feature_mimgR128, }, }; |
