[llvm] r365104 - [PowerPC] Hardware Loop branch instruction's condition may not be icmp.

Chen Zheng via llvm-commits llvm-commits at lists.llvm.org
Wed Jul 3 18:51:48 PDT 2019


Author: shchenz
Date: Wed Jul  3 18:51:47 2019
New Revision: 365104

URL: http://llvm.org/viewvc/llvm-project?rev=365104&view=rev
Log:
[PowerPC] Hardware Loop branch instruction's condition may not be icmp.
This fixes pr42492.
Differential Revision: https://reviews.llvm.org/D64124

Added:
    llvm/trunk/test/CodeGen/PowerPC/pr42492.ll
Modified:
    llvm/trunk/lib/Transforms/Scalar/LoopStrengthReduce.cpp
    llvm/trunk/test/Transforms/HardwareLoops/unscevable.ll

Modified: llvm/trunk/lib/Transforms/Scalar/LoopStrengthReduce.cpp
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Transforms/Scalar/LoopStrengthReduce.cpp?rev=365104&r1=365103&r2=365104&view=diff
==============================================================================
--- llvm/trunk/lib/Transforms/Scalar/LoopStrengthReduce.cpp (original)
+++ llvm/trunk/lib/Transforms/Scalar/LoopStrengthReduce.cpp Wed Jul  3 18:51:47 2019
@@ -3269,7 +3269,7 @@ void LSRInstance::CollectFixupsAndInitia
       if (CI->isEquality()) {
         // If CI can be saved in some target, like replaced inside hardware loop
         // in PowerPC, no need to generate initial formulae for it.
-        if (SaveCmp && CI == cast<ICmpInst>(ExitBranch->getCondition()))
+        if (SaveCmp && CI == dyn_cast<ICmpInst>(ExitBranch->getCondition()))
           continue;
         // Swap the operands if needed to put the OperandValToReplace on the
         // left, for consistency.

Added: llvm/trunk/test/CodeGen/PowerPC/pr42492.ll
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/CodeGen/PowerPC/pr42492.ll?rev=365104&view=auto
==============================================================================
--- llvm/trunk/test/CodeGen/PowerPC/pr42492.ll (added)
+++ llvm/trunk/test/CodeGen/PowerPC/pr42492.ll Wed Jul  3 18:51:47 2019
@@ -0,0 +1,41 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+; RUN: llc -mtriple=powerpc64-unknown-linux-gnu -mcpu=pwr9 < %s | FileCheck %s
+
+define void @f(i8*, i8*, i64*) {
+; Check we don't assert and this is not a Hardware Loop
+; CHECK-LABEL: f:
+; CHECK:  .LBB0_2: #
+; CHECK-NEXT:    cmplwi
+; CHECK-NEXT:    cmpd
+; CHECK-NEXT:    sldi
+; CHECK-NEXT:    cror
+; CHECK-NEXT:    addi
+; CHECK-NEXT:    bc
+
+  %4 = icmp eq i8* %0, %1
+  br i1 %4, label %9, label %5
+
+5:                                                ; preds = %3
+  %6 = getelementptr inbounds i64, i64* %2, i64 1
+  %7 = load i64, i64* %6, align 8
+  br label %10
+
+8:                                                ; preds = %10
+  store i64 %14, i64* %6, align 8
+  br label %9
+
+9:                                                ; preds = %8, %3
+  ret void
+
+10:                                               ; preds = %5, %10
+  %11 = phi i64 [ %7, %5 ], [ %14, %10 ]
+  %12 = phi i32 [ 0, %5 ], [ %15, %10 ]
+  %13 = phi i8* [ %0, %5 ], [ %16, %10 ]
+  %14 = shl nsw i64 %11, 4
+  %15 = add nuw nsw i32 %12, 1
+  %16 = getelementptr inbounds i8, i8* %13, i64 1
+  %17 = icmp ugt i32 %12, 14
+  %18 = icmp eq i8* %16, %1
+  %19 = or i1 %18, %17
+  br i1 %19, label %8, label %10
+}

Modified: llvm/trunk/test/Transforms/HardwareLoops/unscevable.ll
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/Transforms/HardwareLoops/unscevable.ll?rev=365104&r1=365103&r2=365104&view=diff
==============================================================================
--- llvm/trunk/test/Transforms/HardwareLoops/unscevable.ll (original)
+++ llvm/trunk/test/Transforms/HardwareLoops/unscevable.ll Wed Jul  3 18:51:47 2019
@@ -45,3 +45,35 @@ while.body:
 while.end:
   ret void
 }
+
+; CHECK-LABEL: variant_counter2
+; CHECK-NOT: set.loop.iterations
+; CHECK-NOT: loop.decrement
+define void @variant_counter2(i8*, i8*, i64*) {
+  %4 = icmp eq i8* %0, %1
+  br i1 %4, label %9, label %5
+
+5:                                                ; preds = %3
+  %6 = getelementptr inbounds i64, i64* %2, i64 1
+  %7 = load i64, i64* %6, align 8
+  br label %10
+
+8:                                                ; preds = %10
+  store i64 %14, i64* %6, align 8
+  br label %9
+
+9:                                                ; preds = %8, %3
+  ret void
+
+10:                                               ; preds = %5, %10
+  %11 = phi i64 [ %7, %5 ], [ %14, %10 ]
+  %12 = phi i32 [ 0, %5 ], [ %15, %10 ]
+  %13 = phi i8* [ %0, %5 ], [ %16, %10 ]
+  %14 = shl nsw i64 %11, 4
+  %15 = add nuw nsw i32 %12, 1
+  %16 = getelementptr inbounds i8, i8* %13, i64 1
+  %17 = icmp ugt i32 %12, 14
+  %18 = icmp eq i8* %16, %1
+  %19 = or i1 %18, %17
+  br i1 %19, label %8, label %10
+}




More information about the llvm-commits mailing list