[llvm] 5230f6c - [llvm][GenericUniformity] Prevent assert while calculating temporal divergence

Yashwant Singh via llvm-commits llvm-commits at lists.llvm.org
Wed Mar 1 23:13:40 PST 2023


Author: Yashwant Singh
Date: 2023-03-02T12:42:35+05:30
New Revision: 5230f6c1c274778d9204288667c62c8b199cab65

URL: https://github.com/llvm/llvm-project/commit/5230f6c1c274778d9204288667c62c8b199cab65
DIFF: https://github.com/llvm/llvm-project/commit/5230f6c1c274778d9204288667c62c8b199cab65.diff

LOG: [llvm][GenericUniformity] Prevent assert while calculating temporal divergence

analyzeTemporalDivergence() was missing the check for always-uniform before
evaluating weather an instruction depends on a value defined in the cycle.
Fix for #60638
https://github.com/llvm/llvm-project/issues/60638

Reviewed By: sameerds, foad, #amdgpu

Differential Revision: https://reviews.llvm.org/D144070

Added: 
    llvm/test/Analysis/DivergenceAnalysis/AMDGPU/MIR/uses-value-from-cycle.mir

Modified: 
    llvm/include/llvm/ADT/GenericUniformityImpl.h
    llvm/lib/Analysis/UniformityAnalysis.cpp
    llvm/lib/CodeGen/MachineUniformityAnalysis.cpp

Removed: 
    


################################################################################
diff  --git a/llvm/include/llvm/ADT/GenericUniformityImpl.h b/llvm/include/llvm/ADT/GenericUniformityImpl.h
index 294edfba113da..4784d90cafc96 100644
--- a/llvm/include/llvm/ADT/GenericUniformityImpl.h
+++ b/llvm/include/llvm/ADT/GenericUniformityImpl.h
@@ -811,10 +811,10 @@ void GenericUniformityAnalysisImpl<ContextT>::analyzeTemporalDivergence(
 
   LLVM_DEBUG(dbgs() << "Analyze temporal divergence: " << Context.print(&I)
                     << "\n");
-  if (!usesValueFromCycle(I, OuterDivCycle))
+  if (isAlwaysUniform(I))
     return;
 
-  if (isAlwaysUniform(I))
+  if (!usesValueFromCycle(I, OuterDivCycle))
     return;
 
   if (markDivergent(I))

diff  --git a/llvm/lib/Analysis/UniformityAnalysis.cpp b/llvm/lib/Analysis/UniformityAnalysis.cpp
index df7fd40159bb2..bf1d3a61f75d7 100644
--- a/llvm/lib/Analysis/UniformityAnalysis.cpp
+++ b/llvm/lib/Analysis/UniformityAnalysis.cpp
@@ -73,8 +73,7 @@ void llvm::GenericUniformityAnalysisImpl<SSAContext>::pushUsers(
 template <>
 bool llvm::GenericUniformityAnalysisImpl<SSAContext>::usesValueFromCycle(
     const Instruction &I, const Cycle &DefCycle) const {
-  if (isAlwaysUniform(I))
-    return false;
+  assert(!isAlwaysUniform(I));
   for (const Use &U : I.operands()) {
     if (auto *I = dyn_cast<Instruction>(&U)) {
       if (DefCycle.contains(I->getParent()))

diff  --git a/llvm/lib/CodeGen/MachineUniformityAnalysis.cpp b/llvm/lib/CodeGen/MachineUniformityAnalysis.cpp
index 2fe5e40a58c25..2aa09f73ed2c8 100644
--- a/llvm/lib/CodeGen/MachineUniformityAnalysis.cpp
+++ b/llvm/lib/CodeGen/MachineUniformityAnalysis.cpp
@@ -102,7 +102,12 @@ bool llvm::GenericUniformityAnalysisImpl<MachineSSAContext>::usesValueFromCycle(
     if (!Op.isReg() || !Op.readsReg())
       continue;
     auto Reg = Op.getReg();
-    assert(Reg.isVirtual());
+
+    // FIXME: Physical registers need to be properly checked instead of always
+    // returning true
+    if (Reg.isPhysical())
+      return true;
+
     auto *Def = F.getRegInfo().getVRegDef(Reg);
     if (DefCycle.contains(Def->getParent()))
       return true;

diff  --git a/llvm/test/Analysis/DivergenceAnalysis/AMDGPU/MIR/uses-value-from-cycle.mir b/llvm/test/Analysis/DivergenceAnalysis/AMDGPU/MIR/uses-value-from-cycle.mir
new file mode 100644
index 0000000000000..b7e0d5449d2e8
--- /dev/null
+++ b/llvm/test/Analysis/DivergenceAnalysis/AMDGPU/MIR/uses-value-from-cycle.mir
@@ -0,0 +1,66 @@
+# RUN: llc -mtriple=amdgcn-- -mcpu=gfx1030 -run-pass=print-machine-uniformity -o - %s 2>&1 | FileCheck %s
+---
+name:            f1
+tracksRegLiveness: true
+body:             |
+  ; CHECK-LABEL: MachineUniformityInfo for function: f1
+  bb.1:
+    %3:_(s32) = G_CONSTANT i32 0
+    %25:_(s32) = G_IMPLICIT_DEF
+  
+  bb.2:
+    %0:_(s32) = G_PHI %22(s32), %bb.5, %3(s32), %bb.1
+    %1:_(s32) = G_PHI %3(s32), %bb.1, %20(s32), %bb.5
+    %2:_(s32) = G_PHI %3(s32), %bb.1, %19(s32), %bb.5
+    %36:_(s32) = G_CONSTANT i32 0
+    %4:_(s1) = G_ICMP intpred(slt), %1(s32), %36
+  
+  bb.3:
+    successors: %bb.4(0x04000000), %bb.3(0x7c000000)
+  
+    %5:_(s32) = G_PHI %38(s32), %bb.3, %1(s32), %bb.2
+    %38:_(s32) = G_CONSTANT i32 0
+    G_BRCOND %4(s1), %bb.3
+    G_BR %bb.4
+  
+  bb.4:
+    successors: %bb.7, %bb.5
+  
+    %6:_(s32) = G_PHI %5(s32), %bb.3
+    %33:_(s1) = G_CONSTANT i1 true
+    %7:_(s64) = G_SEXT %2(s32)
+    %39:_(s32) = G_CONSTANT i32 2
+    %10:_(s64) = G_SHL %7, %39(s32)
+    %11:_(p0) = G_INTTOPTR %10(s64)
+    %13:_(s32) = G_LOAD %11(p0) :: (load (s32))
+    %37:_(s32) = G_CONSTANT i32 0
+    %14:sreg_32_xm0_xexec(s1) = G_ICMP intpred(slt), %13(s32), %37
+    %16:sreg_32_xm0_xexec(s32) = SI_IF %14(s1), %bb.5, implicit-def $exec, implicit-def $scc, implicit $exec
+    G_BR %bb.7
+  
+  bb.5:
+    successors: %bb.6(0x04000000), %bb.2(0x7c000000)
+    ; CHECK: DIVERGENT: %{{[0-9]}}: %{{[0-9]}}:_(s32) = G_PHI
+    ; CHECK: DIVERGENT: %{{[0-9]}}: %{{[0-9]}}:_(s32) = G_PHI
+    ; CHECK: DIVERGENT: %{{[0-9]}}: %{{[0-9]}}:_(s32) = G_PHI
+    ; CHECK-NOT: DIVERGENT: %{{[0-9]}}: %{{[0-9]}}:sreg_32_xm0_xexec(s32) = G_INTRINSIC intrinsic(@llvm.amdgcn.if.break)
+    %19:_(s32) = G_PHI %18(s32), %bb.7, %25(s32), %bb.4
+    %20:_(s32) = G_PHI %6(s32), %bb.7, %25(s32), %bb.4
+    %21:_(s1) = G_PHI %34(s1), %bb.7, %33(s1), %bb.4
+    G_INTRINSIC_W_SIDE_EFFECTS intrinsic(@llvm.amdgcn.end.cf), %16(s32)
+    %22:sreg_32_xm0_xexec(s32) = G_INTRINSIC intrinsic(@llvm.amdgcn.if.break), %21(s1), %0(s32)
+    SI_LOOP %22(s32), %bb.2, implicit-def $exec, implicit-def $scc, implicit $exec
+    G_BR %bb.6
+  
+  bb.6:
+    %24:_(s32) = G_PHI %22(s32), %bb.5
+    G_INTRINSIC_W_SIDE_EFFECTS intrinsic(@llvm.amdgcn.end.cf), %24(s32)
+    SI_RETURN
+  
+  bb.7:
+    %34:_(s1) = G_CONSTANT i1 false
+    %35:_(s32) = G_CONSTANT i32 1
+    %18:_(s32) = G_OR %2, %35
+    G_BR %bb.5
+
+...


        


More information about the llvm-commits mailing list