[llvm] 45090b3 - [SLP]Check the whole def-use chain in the tree to find proper dominance, if the last instruction is the same

Alexey Bataev via llvm-commits llvm-commits at lists.llvm.org
Tue Mar 18 10:01:21 PDT 2025


Author: Alexey Bataev
Date: 2025-03-18T10:01:13-07:00
New Revision: 45090b3059562b32723cd25679db75d1574ab04e

URL: https://github.com/llvm/llvm-project/commit/45090b3059562b32723cd25679db75d1574ab04e
DIFF: https://github.com/llvm/llvm-project/commit/45090b3059562b32723cd25679db75d1574ab04e.diff

LOG: [SLP]Check the whole def-use chain in the tree to find proper dominance, if the last instruction is the same

If the insertion point (last instruction) of the user nodes is the same,
need to check the whole def-use chain in the tree to find proper
dominance to prevent a compiler crash.

Fixes #131818

Added: 
    llvm/test/Transforms/SLPVectorizer/X86/same-last-instruction-different-parents.ll

Modified: 
    llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp

Removed: 
    


################################################################################
diff  --git a/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp b/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp
index 24171f1d9a065..4a835bc797ab6 100644
--- a/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp
+++ b/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp
@@ -14086,11 +14086,18 @@ BoUpSLP::isGatherShuffledSingleRegisterEntry(
   auto CheckParentNodes = [&](const TreeEntry *User1, const TreeEntry *User2,
                               unsigned EdgeIdx) {
     const TreeEntry *Ptr1 = User1;
+    const TreeEntry *Ptr2 = User2;
+    SmallDenseMap<const TreeEntry *, unsigned> PtrToIdx;
+    while (Ptr2) {
+      PtrToIdx.try_emplace(Ptr2, EdgeIdx);
+      EdgeIdx = Ptr2->UserTreeIndex.EdgeIdx;
+      Ptr2 = Ptr2->UserTreeIndex.UserTE;
+    }
     while (Ptr1) {
       unsigned Idx = Ptr1->UserTreeIndex.EdgeIdx;
       Ptr1 = Ptr1->UserTreeIndex.UserTE;
-      if (Ptr1 == User2)
-        return Idx < EdgeIdx;
+      if (auto It = PtrToIdx.find(Ptr1); It != PtrToIdx.end())
+        return Idx < It->second;
     }
     return false;
   };

diff  --git a/llvm/test/Transforms/SLPVectorizer/X86/same-last-instruction-
diff erent-parents.ll b/llvm/test/Transforms/SLPVectorizer/X86/same-last-instruction-
diff erent-parents.ll
new file mode 100644
index 0000000000000..ef75a8dd99169
--- /dev/null
+++ b/llvm/test/Transforms/SLPVectorizer/X86/same-last-instruction-
diff erent-parents.ll
@@ -0,0 +1,64 @@
+; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
+; RUN: opt -S --passes=slp-vectorizer -mtriple=x86_64-unknown-linux-gnu < %s | FileCheck %s
+
+define i32 @test(i32 %0, i1 %1) {
+; CHECK-LABEL: define i32 @test(
+; CHECK-SAME: i32 [[TMP0:%.*]], i1 [[TMP1:%.*]]) {
+; CHECK-NEXT:    [[TMP3:%.*]] = insertelement <2 x i32> poison, i32 [[TMP0]], i32 0
+; CHECK-NEXT:    [[TMP4:%.*]] = shufflevector <2 x i32> [[TMP3]], <2 x i32> poison, <2 x i32> zeroinitializer
+; CHECK-NEXT:    [[TMP5:%.*]] = sitofp <2 x i32> [[TMP4]] to <2 x double>
+; CHECK-NEXT:    [[TMP6:%.*]] = sitofp <2 x i32> [[TMP4]] to <2 x double>
+; CHECK-NEXT:    br i1 [[TMP1]], label %[[BB7:.*]], label %[[BB9:.*]]
+; CHECK:       [[BB7]]:
+; CHECK-NEXT:    [[TMP8:%.*]] = call <2 x double> @llvm.fmuladd.v2f64(<2 x double> [[TMP6]], <2 x double> zeroinitializer, <2 x double> zeroinitializer)
+; CHECK-NEXT:    br label %[[BB16:.*]]
+; CHECK:       [[BB9]]:
+; CHECK-NEXT:    br i1 false, label %[[BB14:.*]], label %[[BB10:.*]]
+; CHECK:       [[BB10]]:
+; CHECK-NEXT:    [[TMP11:%.*]] = call <2 x double> @llvm.copysign.v2f64(<2 x double> zeroinitializer, <2 x double> [[TMP5]])
+; CHECK-NEXT:    [[TMP12:%.*]] = shufflevector <2 x double> [[TMP6]], <2 x double> <double 0.000000e+00, double poison>, <2 x i32> <i32 2, i32 1>
+; CHECK-NEXT:    [[TMP13:%.*]] = call <2 x double> @llvm.fmuladd.v2f64(<2 x double> [[TMP11]], <2 x double> [[TMP12]], <2 x double> zeroinitializer)
+; CHECK-NEXT:    br label %[[BB14]]
+; CHECK:       [[BB14]]:
+; CHECK-NEXT:    [[TMP15:%.*]] = phi <2 x double> [ [[TMP13]], %[[BB10]] ], [ zeroinitializer, %[[BB9]] ]
+; CHECK-NEXT:    br label %[[BB16]]
+; CHECK:       [[BB16]]:
+; CHECK-NEXT:    [[TMP17:%.*]] = phi <2 x double> [ [[TMP15]], %[[BB14]] ], [ [[TMP8]], %[[BB7]] ]
+; CHECK-NEXT:    [[TMP18:%.*]] = extractelement <2 x double> [[TMP17]], i32 0
+; CHECK-NEXT:    [[TMP19:%.*]] = extractelement <2 x double> [[TMP17]], i32 1
+; CHECK-NEXT:    [[TMP20:%.*]] = fmul double [[TMP19]], [[TMP18]]
+; CHECK-NEXT:    [[TMP21:%.*]] = fptosi double [[TMP20]] to i32
+; CHECK-NEXT:    ret i32 [[TMP21]]
+;
+  %3 = sitofp i32 %0 to double
+  %4 = sitofp i32 %0 to double
+  %5 = sitofp i32 %0 to double
+  br i1 %1, label %6, label %9
+
+6:
+  %7 = tail call double @llvm.fmuladd.f64(double %4, double 0.000000e+00, double 0.000000e+00)
+  %8 = tail call double @llvm.fmuladd.f64(double %5, double 0.000000e+00, double 0.000000e+00)
+  br label %18
+
+9:
+  br i1 false, label %15, label %10
+
+10:
+  %11 = call double @llvm.copysign.f64(double 0.000000e+00, double %3)
+  %12 = tail call double @llvm.fmuladd.f64(double %11, double %4, double 0.000000e+00)
+  %13 = call double @llvm.copysign.f64(double 0.000000e+00, double %5)
+  %14 = tail call double @llvm.fmuladd.f64(double %13, double 0.000000e+00, double 0.000000e+00)
+  br label %15
+
+15:
+  %16 = phi double [ %12, %10 ], [ 0.000000e+00, %9 ]
+  %17 = phi double [ %14, %10 ], [ 0.000000e+00, %9 ]
+  br label %18
+
+18:
+  %19 = phi double [ %17, %15 ], [ %8, %6 ]
+  %20 = phi double [ %16, %15 ], [ %7, %6 ]
+  %21 = fmul double %20, %19
+  %22 = fptosi double %21 to i32
+  ret i32 %22
+}


        


More information about the llvm-commits mailing list