[PATCH] D98263: [LoopInterchange] fix tightlyNested() in LoopInterchange legality
Congzhe Cao via Phabricator via llvm-commits
llvm-commits at lists.llvm.org
Wed Mar 10 18:41:07 PST 2021
congzhe updated this revision to Diff 329817.
congzhe added a comment.
Updated the patch based on the latest trunk code.
Repository:
rG LLVM Github Monorepo
CHANGES SINCE LAST ACTION
https://reviews.llvm.org/D98263/new/
https://reviews.llvm.org/D98263
Files:
llvm/lib/Transforms/Scalar/LoopInterchange.cpp
llvm/test/Transforms/LoopInterchange/not-interchanged-tightly-nested.ll
Index: llvm/test/Transforms/LoopInterchange/not-interchanged-tightly-nested.ll
===================================================================
--- llvm/test/Transforms/LoopInterchange/not-interchanged-tightly-nested.ll
+++ llvm/test/Transforms/LoopInterchange/not-interchanged-tightly-nested.ll
@@ -9,6 +9,7 @@
@B = common global [100 x i32] zeroinitializer
@C = common global [100 x [100 x i32]] zeroinitializer
@D = common global [100 x [100 x [100 x i32]]] zeroinitializer
+ at E = common global [100 x [100 x i64]] zeroinitializer
;; Loops not tightly nested are not interchanged
;; for(int j=0;j<N;j++) {
@@ -103,3 +104,39 @@
for.end12:
ret void
}
+
+;; The following Loop is not considered tightly nested and is not interchanged.
+; CHECK: Not interchanging loops. Cannot prove legality.
+define void @interchange_07(i64 %k, i64 %N, i64 signext %ny) {
+entry:
+ br label %for1.header
+
+for1.header:
+ %j23 = phi i64 [ 0, %entry ], [ %j.next24, %for1.inc10 ]
+ %cmp21 = icmp slt i64 0, %ny
+ br label %singleSucc
+
+singleSucc:
+ br i1 %cmp21, label %preheader.j, label %for1.inc10
+
+preheader.j:
+ br label %for2
+
+for2:
+ %j = phi i64 [ %j.next, %for2 ], [ 0, %preheader.j ]
+ %arrayidx5 = getelementptr inbounds [100 x [100 x i64]], [100 x [100 x i64]]* @E, i64 0, i64 %j, i64 %j23
+ %lv = load i64, i64* %arrayidx5
+ %add = add nsw i64 %lv, %k
+ store i64 %add, i64* %arrayidx5
+ %j.next = add nuw nsw i64 %j, 1
+ %exitcond = icmp eq i64 %j, 99
+ br i1 %exitcond, label %for1.inc10, label %for2
+
+for1.inc10:
+ %j.next24 = add nuw nsw i64 %j23, 1
+ %exitcond26 = icmp eq i64 %j23, 99
+ br i1 %exitcond26, label %for.end12, label %for1.header
+
+for.end12:
+ ret void
+}
Index: llvm/lib/Transforms/Scalar/LoopInterchange.cpp
===================================================================
--- llvm/lib/Transforms/Scalar/LoopInterchange.cpp
+++ llvm/lib/Transforms/Scalar/LoopInterchange.cpp
@@ -19,6 +19,7 @@
#include "llvm/ADT/StringRef.h"
#include "llvm/Analysis/DependenceAnalysis.h"
#include "llvm/Analysis/LoopInfo.h"
+#include "llvm/Analysis/LoopNestAnalysis.h"
#include "llvm/Analysis/LoopPass.h"
#include "llvm/Analysis/OptimizationRemarkEmitter.h"
#include "llvm/Analysis/ScalarEvolution.h"
@@ -617,6 +618,22 @@
containsUnsafeInstructions(InnerLoopPreHeader))
return false;
+ BasicBlock *InnerLoopExit = InnerLoop->getExitBlock();
+ // Ensure the inner loop exit block flow to the outer loop latch possibly
+ // through empty blocks
+ const BasicBlock &SuccInner =
+ LoopNest::skipEmptyBlockUntil(InnerLoopExit, OuterLoopLatch);
+ if (&SuccInner != OuterLoopLatch) {
+ LLVM_DEBUG(dbgs() << "Inner loop exit block " << *InnerLoopExit
+ << " does not lead to the outer loop latch.\n";);
+ return false;
+ }
+ // The inner loop exit block does flow to the outer loop latch and not some
+ // other BBs, now make sure it contains safe instructions, since it will be
+ // move into the (new) inner loop after interchange
+ if (containsUnsafeInstructions(InnerLoopExit))
+ return false;
+
LLVM_DEBUG(dbgs() << "Loops are perfectly nested\n");
// We have a perfect loop nest.
return true;
-------------- next part --------------
A non-text attachment was scrubbed...
Name: D98263.329817.patch
Type: text/x-patch
Size: 3212 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/llvm-commits/attachments/20210311/a064be31/attachment.bin>
More information about the llvm-commits
mailing list