[PATCH] D75857: [AMDGPU] Fix using physical registers in vector instructions

Sebastian Neubauer via Phabricator via llvm-commits llvm-commits at lists.llvm.org
Wed Mar 11 09:04:42 PDT 2020


Flakebi updated this revision to Diff 249637.
Flakebi added a comment.

Add test


Repository:
  rG LLVM Github Monorepo

CHANGES SINCE LAST ACTION
  https://reviews.llvm.org/D75857/new/

https://reviews.llvm.org/D75857

Files:
  llvm/lib/Target/AMDGPU/SIInstrInfo.cpp
  llvm/test/CodeGen/AMDGPU/vop3-physical-reg.mir


Index: llvm/test/CodeGen/AMDGPU/vop3-physical-reg.mir
===================================================================
--- /dev/null
+++ llvm/test/CodeGen/AMDGPU/vop3-physical-reg.mir
@@ -0,0 +1,42 @@
+# RUN: llc -march=amdgcn -mcpu=kaveri -run-pass=si-peephole-sdwa -o - %s | FileCheck -check-prefix=CI -check-prefix=GCN %s
+# RUN: llc -march=amdgcn -mcpu=fiji -run-pass=si-peephole-sdwa -o - %s | FileCheck -check-prefix=VI -check-prefix=GCN %s
+# RUN: llc -march=amdgcn -mcpu=gfx900 -run-pass=si-peephole-sdwa -o - %s | FileCheck -check-prefix=GFX9 -check-prefix=GCN %s
+# RUN: llc -march=amdgcn -mcpu=gfx1010 -run-pass=si-peephole-sdwa -o - %s | FileCheck -check-prefix=GFX10 -check-prefix=GCN %s
+
+# Allow physical registers as vop3 operands
+
+# GCN-LABEL: {{^}}name: vop3_reg
+
+# GCN: %{{[0-9]+}}:vgpr_32 = V_BCNT_U32_B32_e64 $exec_lo, 0, implicit-def $vcc, implicit $exec
+# GCN: %{{[0-9]+}}:vgpr_32 = V_BCNT_U32_B32_e64 $exec_hi, 0, implicit-def $vcc, implicit $exec
+# GCN: %{{[0-9]+}}:vgpr_32 = V_MBCNT_LO_U32_B32_e64 $exec_lo, 0, implicit-def $vcc, implicit $exec
+# GCN: %{{[0-9]+}}:vgpr_32 = V_MBCNT_HI_U32_B32_e64 $exec_hi, %{{[0-9]+}}, implicit-def $vcc, implicit $exec
+
+---
+name:            vop3_reg
+tracksRegLiveness: true
+registers:
+  - { id: 0, class: vreg_64 }
+  - { id: 1, class: vgpr_32 }
+  - { id: 2, class: vgpr_32 }
+  - { id: 3, class: vgpr_32 }
+  - { id: 4, class: vgpr_32 }
+  - { id: 9, class: sreg_64 }
+body:             |
+  bb.0:
+    liveins: $vgpr0_vgpr1, $vgpr2, $sgpr30_sgpr31
+
+    %9 = COPY $sgpr30_sgpr31
+    %0 = COPY $vgpr0_vgpr1
+
+    %1 = V_BCNT_U32_B32_e64 $exec_lo, 0, implicit-def $vcc, implicit $exec
+    %2 = V_BCNT_U32_B32_e64 $exec_hi, 0, implicit-def $vcc, implicit $exec
+    %3 = V_MBCNT_LO_U32_B32_e64 $exec_lo, 0, implicit-def $vcc, implicit $exec
+    %4 = V_MBCNT_HI_U32_B32_e64 $exec_hi, %3, implicit-def $vcc, implicit $exec
+
+    FLAT_STORE_DWORD %0, %1, 0, 0, 0, 0, implicit $exec, implicit $flat_scr :: (store 4)
+    FLAT_STORE_DWORD %0, %2, 0, 0, 0, 0, implicit $exec, implicit $flat_scr :: (store 4)
+    FLAT_STORE_DWORD %0, %3, 0, 0, 0, 0, implicit $exec, implicit $flat_scr :: (store 4)
+    FLAT_STORE_DWORD %0, %4, 0, 0, 0, 0, implicit $exec, implicit $flat_scr :: (store 4)
+    $sgpr30_sgpr31 = COPY %9
+    S_SETPC_B64_return $sgpr30_sgpr31
Index: llvm/lib/Target/AMDGPU/SIInstrInfo.cpp
===================================================================
--- llvm/lib/Target/AMDGPU/SIInstrInfo.cpp
+++ llvm/lib/Target/AMDGPU/SIInstrInfo.cpp
@@ -4294,13 +4294,22 @@
       continue;
     }
 
-    if (RI.hasAGPRs(MRI.getRegClass(MO.getReg())) &&
-        !isOperandLegal(MI, Idx, &MO)) {
+    bool IsSGPR = false;
+    bool IsAGPR = false;
+    if (MO.getReg().isVirtual()) {
+      IsAGPR = RI.hasAGPRs(MRI.getRegClass(MO.getReg()));
+      IsSGPR = RI.isSGPRClass(MRI.getRegClass(MO.getReg()));
+    } else {
+      IsAGPR = RI.isAGPR(MRI, MO.getReg());
+      IsAGPR = RI.isSGPRReg(MRI, MO.getReg());
+    }
+
+    if (IsAGPR && !isOperandLegal(MI, Idx, &MO)) {
       legalizeOpWithMove(MI, Idx);
       continue;
     }
 
-    if (!RI.isSGPRClass(MRI.getRegClass(MO.getReg())))
+    if (!IsSGPR)
       continue; // VGPRs are legal
 
     // We can use one SGPR in each VOP3 instruction prior to GFX10
@@ -5929,9 +5938,14 @@
 
     // If this could be a VGPR or an SGPR, Check the dynamic register class.
     Register Reg = MO.getReg();
-    const TargetRegisterClass *RegRC = MRI.getRegClass(Reg);
-    if (RI.isSGPRClass(RegRC))
-      UsedSGPRs[i] = Reg;
+    if (Reg.isVirtual()) {
+      const TargetRegisterClass *RegRC = MRI.getRegClass(Reg);
+      if (RI.isSGPRClass(RegRC))
+        UsedSGPRs[i] = Reg;
+    } else {
+      if (RI.isSGPRReg(MRI, Reg))
+        UsedSGPRs[i] = Reg;
+    }
   }
 
   // We don't have a required SGPR operand, so we have a bit more freedom in


-------------- next part --------------
A non-text attachment was scrubbed...
Name: D75857.249637.patch
Type: text/x-patch
Size: 3882 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/llvm-commits/attachments/20200311/33762395/attachment-0001.bin>


More information about the llvm-commits mailing list