[llvm] bd7c6e3 - [AMDGPU] Precommit lit test for wwm-reg AV spill pseudos D155646.

Christudasan Devadasan via llvm-commits llvm-commits at lists.llvm.org
Sat Aug 12 03:51:12 PDT 2023


Author: Christudasan Devadasan
Date: 2023-08-12T16:18:18+05:30
New Revision: bd7c6e3c48e9281ceeaae3a93cc493b35a3c9f29

URL: https://github.com/llvm/llvm-project/commit/bd7c6e3c48e9281ceeaae3a93cc493b35a3c9f29
DIFF: https://github.com/llvm/llvm-project/commit/bd7c6e3c48e9281ceeaae3a93cc493b35a3c9f29.diff

LOG: [AMDGPU] Precommit lit test for wwm-reg AV spill pseudos D155646.

Added: 
    llvm/test/CodeGen/AMDGPU/wwm-spill-superclass-pseudo.mir

Modified: 
    

Removed: 
    


################################################################################
diff  --git a/llvm/test/CodeGen/AMDGPU/wwm-spill-superclass-pseudo.mir b/llvm/test/CodeGen/AMDGPU/wwm-spill-superclass-pseudo.mir
new file mode 100644
index 00000000000000..9c4b0107b18fc0
--- /dev/null
+++ b/llvm/test/CodeGen/AMDGPU/wwm-spill-superclass-pseudo.mir
@@ -0,0 +1,85 @@
+# RUN: not --crash llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx908 -start-before=si-lower-sgpr-spills -stop-after=greedy,1 -verify-machineinstrs --stress-regalloc=2 %s -o /dev/null 2>&1 | FileCheck %s
+
+# This test would fail as there is no wwm-register spill pseudo instructions supported for the vector superclass (AV).
+# Currently there is only VGPR_32 regclass spilling allowed for wwm-registers.
+
+# CHECK: Bad machine code: Illegal virtual register for instruction
+# CHECK: instruction: {{.*}}    [[AV_REG:%[0-9]+]]:av_32 = SI_SPILL_WWM_V32_RESTORE
+# CHECK-NEXT: - operand 0:   [[AV_REG]]:av_32
+# CHECK-NEXT: Expected a VGPR_32 register, but got a AV_32 register
+
+name:            test_wwm_reg_superclass_spill
+tracksRegLiveness: true
+stack:
+  - { id: 0, name: '', type: spill-slot, offset: 0, size: 8, alignment: 8,
+      stack-id: sgpr-spill, callee-saved-register: '', callee-saved-restored: true}
+machineFunctionInfo:
+  isEntryFunction: true
+  stackPtrOffsetReg: '$sgpr32'
+  sgprForEXECCopy:   '$sgpr100_sgpr101'
+body:             |
+  bb.0:
+    $vgpr0 = IMPLICIT_DEF
+    $sgpr0_sgpr1 = IMPLICIT_DEF
+    %temp0:vgpr_32(s32) = COPY $vgpr0
+    %temp1:vgpr_32 = V_MOV_B32_e32 0, implicit $exec
+    $vcc = S_AND_B64 $exec, $sgpr0_sgpr1, implicit-def dead $scc
+    S_CBRANCH_VCCNZ %bb.2, implicit $vcc
+    S_BRANCH %bb.1
+
+  bb.1:
+    %temp2:vreg_64 = IMPLICIT_DEF
+    %temp1:vgpr_32 = FLAT_LOAD_DWORD %temp2, 0, 0, implicit $exec, implicit $flat_scr
+
+  bb.2:
+    %temp3:vreg_64 = V_MOV_B64_PSEUDO 0, implicit $exec
+    $sgpr2_sgpr3 = IMPLICIT_DEF
+    $sgpr4_sgpr5 = IMPLICIT_DEF
+    %temp4:vgpr_32 = FLAT_LOAD_UBYTE %temp3, 0, 0, implicit $exec, implicit $flat_scr
+    S_CBRANCH_EXECZ %bb.5, implicit $exec
+    S_BRANCH %bb.4
+
+  bb.3:
+    S_BRANCH %bb.8
+
+  bb.4:
+    liveins: $sgpr0_sgpr1, $sgpr2_sgpr3, $sgpr4_sgpr5
+    SI_SPILL_S64_SAVE killed $sgpr2_sgpr3, %stack.0, implicit $exec, implicit $sgpr32
+    $sgpr56_sgpr57 = S_LOAD_DWORDX2_IMM $sgpr4_sgpr5, 48, 0
+    $sgpr2 = S_MOV_B32 124
+    %temp5:vreg_64 = COPY  $sgpr56_sgpr57
+    %temp6:vreg_64, dead  $sgpr2_sgpr3 = V_MAD_U64_U32_e64 %temp0(s32), killed $sgpr2, %temp5, 0, implicit $exec
+    %temp7:vreg_64 = V_MOV_B64_PSEUDO 0, implicit $exec
+    undef %temp8.sub0:vreg_64 = FLAT_LOAD_DWORD %temp7, 0, 0, implicit $exec, implicit $flat_scr
+    $sgpr44_sgpr45_sgpr46_sgpr47 = S_LOAD_DWORDX4_IMM  $sgpr4_sgpr5, 88, 0
+    $sgpr58_sgpr59 = S_LOAD_DWORDX2_IMM  $sgpr4_sgpr5, 104, 0
+    $sgpr62_sgpr63 = S_XOR_B64  $sgpr0_sgpr1, -1, implicit-def dead $scc
+    $sgpr60_sgpr61 = S_MOV_B64 0
+    S_BRANCH %bb.6
+
+  bb.5:
+    S_CBRANCH_EXECZ %bb.8, implicit $exec
+    S_BRANCH %bb.3
+
+  bb.6:
+    liveins: $sgpr0_sgpr1, $sgpr60_sgpr61
+    %temp9:vgpr_32 = nofpexcept V_ADD_F32_e32 0, %temp1, implicit $mode, implicit $exec
+    %temp10:vgpr_32 = V_AND_B32_e32 2147483647, %temp9, implicit $exec
+    %temp11:vgpr_32 = V_AND_B32_e32 65535, %temp4, implicit $exec
+    undef %temp12.sub1:vreg_64 = V_MOV_B32_e32 0, implicit $exec
+    FLAT_STORE_DWORD %temp7, %temp12.sub1, 0, 0, implicit $exec, implicit $flat_scr
+    %temp13:vgpr_32 = V_CNDMASK_B32_e64 0, 1065353216, 0, 0, $sgpr0_sgpr1, implicit $exec
+    $sgpr19 = IMPLICIT_DEF
+    %temp14:vgpr_32 = nofpexcept V_MUL_F32_e64 0, 0, 0, $sgpr19, 0, 0, implicit $mode, implicit $exec
+    $sgpr17 = IMPLICIT_DEF
+
+  bb.7:
+    liveins: $sgpr60_sgpr61
+    $exec = S_OR_B64 $exec, killed $sgpr60_sgpr61, implicit-def $scc
+    $sgpr2_sgpr3 = SI_SPILL_S64_RESTORE %stack.0, implicit $exec, implicit $sgpr32
+    S_BRANCH %bb.5
+
+  bb.8:
+    S_ENDPGM 0
+
+...


        


More information about the llvm-commits mailing list