[llvm-branch-commits] [llvm] [LoopInterchange] Reject if outer reduction value has extra user (PR #203241)

Ryotaro Kasuga via llvm-branch-commits llvm-branch-commits at lists.llvm.org
Thu Jun 11 03:52:37 PDT 2026


https://github.com/kasuga-fj created https://github.com/llvm/llvm-project/pull/203241

None

>From b52e2b3a64f465de2a06f741af92d3b46d357b5a Mon Sep 17 00:00:00 2001
From: Ryotaro Kasuga <kasuga.ryotaro at fujitsu.com>
Date: Thu, 11 Jun 2026 10:51:12 +0000
Subject: [PATCH] [LoopInterchange] Reject if outer reduction value has extra
 user

---
 .../lib/Transforms/Scalar/LoopInterchange.cpp |  18 ++
 .../reduction-extra-use-in-inner-loop.ll      | 266 +++++++++++++++---
 2 files changed, 240 insertions(+), 44 deletions(-)

diff --git a/llvm/lib/Transforms/Scalar/LoopInterchange.cpp b/llvm/lib/Transforms/Scalar/LoopInterchange.cpp
index 543f527941b29..5e0af6fe728bb 100644
--- a/llvm/lib/Transforms/Scalar/LoopInterchange.cpp
+++ b/llvm/lib/Transforms/Scalar/LoopInterchange.cpp
@@ -1280,6 +1280,24 @@ bool LoopInterchangeLegality::checkInductionsAndReductions(Loop *OuterLoop) {
           });
           return false;
         }
+
+        // Reject if PHI has any user other than InnerRedPhi. A typical case:
+        //
+        //   o.header:
+        //     %red.o = phi [ 0, ... ], [ %red.next, %o.latch ]
+        //     br label %i.header
+        //
+        //   i.header:
+        //     %red.i = phi [ %red.o, %o.header ], [ %red.next, %i.latch ]
+        //     br label %i.body
+        //
+        //   i.body:
+        //     store %red.o to %mem
+        //     ...
+        //
+        if (!all_of(PHI.users(), [InnerRedPhi](User *U) { return U == InnerRedPhi; }))
+          return false;
+
         OuterInnerReductions.insert(&PHI);
         OuterInnerReductions.insert(InnerRedPhi);
       } else {
diff --git a/llvm/test/Transforms/LoopInterchange/reduction-extra-use-in-inner-loop.ll b/llvm/test/Transforms/LoopInterchange/reduction-extra-use-in-inner-loop.ll
index 83d93168a9877..02665f40575f5 100644
--- a/llvm/test/Transforms/LoopInterchange/reduction-extra-use-in-inner-loop.ll
+++ b/llvm/test/Transforms/LoopInterchange/reduction-extra-use-in-inner-loop.ll
@@ -2,8 +2,8 @@
 ; RUN: opt < %s -passes=loop-interchange -loop-interchange-profitabilities=ignore -S | FileCheck %s
 
 ; sum = 0;
-; for (i = 0; i < 4; i++)
-;   for (j = 0, sum_i = sum; j < 4; j++) {
+; for (i = 0, sum_i = sum; i < 2; i++)
+;   for (j = 0; j < 2; j++) {
 ;     sum += A[j][i];
 ;     B[j][i] = sum_i;
 ;   }
@@ -11,54 +11,128 @@
 ; Interchanging the loops will become as follows:
 ;
 ; sum = 0;
-; for (j = 0; j < 4; j++)
-;   for (i = 0, sum_j = sum; i < 4; i++) {
-;     sum_j += A[j][i];
+; for (j = 0, sum_j = sum; j < 2; j++)
+;   for (i = 0; i < 2; i++) {
+;     sum += A[j][i];
 ;     B[j][i] = sum_j;
 ;   }
 ;
-; This is invalid transformation because the contens of the array `B` will be
-; different.
+; This is an invalid transformation. Consider the case when `A` is as follows:
+;
+;  A = {{ 0, 0 }, { 1, 1 }}
 ;
-; FIXME: The loops are now interchanged.
+; In this case, `sum_i` evolves 0 -> 1, while `sum_j` evolves 0 -> 0.
 ;
-define i8 @extra_reduction_use_in_inner(ptr noalias %A, ptr noalias %B) {
-; CHECK-LABEL: define i8 @extra_reduction_use_in_inner(
+define i8 @extra_reduction_use_in_inner0(ptr noalias %A, ptr noalias %B) {
+; CHECK-LABEL: define i8 @extra_reduction_use_in_inner0(
 ; CHECK-SAME: ptr noalias [[A:%.*]], ptr noalias [[B:%.*]]) {
-; CHECK-NEXT:  [[ENTRY:.*:]]
-; CHECK-NEXT:    br label %[[INNER_PREHEADER:.*]]
-; CHECK:       [[OUTER_HEADER_PREHEADER:.*]]:
-; CHECK-NEXT:    br label %[[OUTER_HEADER:.*]]
-; CHECK:       [[OUTER_HEADER]]:
-; CHECK-NEXT:    [[I:%.*]] = phi i64 [ [[I_NEXT:%.*]], %[[OUTER_LATCH:.*]] ], [ 0, %[[OUTER_HEADER_PREHEADER]] ]
-; CHECK-NEXT:    [[SUM_INNER:%.*]] = phi i8 [ [[SUM_NEXT:%.*]], %[[OUTER_LATCH]] ], [ [[SUM:%.*]], %[[OUTER_HEADER_PREHEADER]] ]
-; CHECK-NEXT:    br label %[[INNER_SPLIT1:.*]]
-; CHECK:       [[INNER_PREHEADER]]:
+; CHECK-NEXT:  [[INNER_PREHEADER:.*]]:
 ; CHECK-NEXT:    br label %[[INNER:.*]]
 ; CHECK:       [[INNER]]:
-; CHECK-NEXT:    [[J:%.*]] = phi i64 [ [[TMP0:%.*]], %[[INNER_SPLIT:.*]] ], [ 0, %[[INNER_PREHEADER]] ]
-; CHECK-NEXT:    [[SUM]] = phi i8 [ [[SUM_LCSSA:%.*]], %[[INNER_SPLIT]] ], [ 0, %[[INNER_PREHEADER]] ]
-; CHECK-NEXT:    br label %[[OUTER_HEADER_PREHEADER]]
-; CHECK:       [[INNER_SPLIT1]]:
-; CHECK-NEXT:    [[GEP_A:%.*]] = getelementptr [4 x i8], ptr [[A]], i64 [[J]], i64 [[I]]
+; CHECK-NEXT:    [[I:%.*]] = phi i64 [ 0, %[[INNER_PREHEADER]] ], [ [[I_NEXT:%.*]], %[[OUTER_LATCH:.*]] ]
+; CHECK-NEXT:    [[SUM:%.*]] = phi i8 [ 0, %[[INNER_PREHEADER]] ], [ [[SUM_LCSSA:%.*]], %[[OUTER_LATCH]] ]
+; CHECK-NEXT:    br label %[[OUTER_HEADER_PREHEADER:.*]]
+; CHECK:       [[OUTER_HEADER_PREHEADER]]:
+; CHECK-NEXT:    [[J:%.*]] = phi i64 [ 0, %[[INNER]] ], [ [[TMP0:%.*]], %[[OUTER_HEADER_PREHEADER]] ]
+; CHECK-NEXT:    [[SUM_INNER:%.*]] = phi i8 [ [[SUM]], %[[INNER]] ], [ [[SUM_NEXT:%.*]], %[[OUTER_HEADER_PREHEADER]] ]
+; CHECK-NEXT:    [[GEP_A:%.*]] = getelementptr [2 x i8], ptr [[A]], i64 [[J]], i64 [[I]]
 ; CHECK-NEXT:    [[A:%.*]] = load i8, ptr [[GEP_A]], align 1
 ; CHECK-NEXT:    [[SUM_NEXT]] = add i8 [[SUM_INNER]], [[A]]
-; CHECK-NEXT:    [[GEP_B:%.*]] = getelementptr [4 x i8], ptr [[B]], i64 [[J]], i64 [[I]]
+; CHECK-NEXT:    [[GEP_B:%.*]] = getelementptr [2 x i8], ptr [[B]], i64 [[J]], i64 [[I]]
 ; CHECK-NEXT:    store i8 [[SUM]], ptr [[GEP_B]], align 1
-; CHECK-NEXT:    [[J_NEXT:%.*]] = add i64 [[J]], 1
-; CHECK-NEXT:    [[EC_J:%.*]] = icmp eq i64 [[J_NEXT]], 4
-; CHECK-NEXT:    br label %[[OUTER_LATCH]]
-; CHECK:       [[INNER_SPLIT]]:
-; CHECK-NEXT:    [[SUM_LCSSA]] = phi i8 [ [[SUM_NEXT]], %[[OUTER_LATCH]] ]
 ; CHECK-NEXT:    [[TMP0]] = add i64 [[J]], 1
-; CHECK-NEXT:    [[TMP1:%.*]] = icmp eq i64 [[TMP0]], 4
-; CHECK-NEXT:    br i1 [[TMP1]], label %[[EXIT:.*]], label %[[INNER]]
+; CHECK-NEXT:    [[TMP1:%.*]] = icmp eq i64 [[TMP0]], 2
+; CHECK-NEXT:    br i1 [[TMP1]], label %[[OUTER_LATCH]], label %[[OUTER_HEADER_PREHEADER]]
+; CHECK:       [[OUTER_LATCH]]:
+; CHECK-NEXT:    [[SUM_LCSSA]] = phi i8 [ [[SUM_NEXT]], %[[OUTER_HEADER_PREHEADER]] ]
+; CHECK-NEXT:    [[I_NEXT]] = add i64 [[I]], 1
+; CHECK-NEXT:    [[EC_I:%.*]] = icmp eq i64 [[I_NEXT]], 2
+; CHECK-NEXT:    br i1 [[EC_I]], label %[[EXIT:.*]], label %[[INNER]]
+; CHECK:       [[EXIT]]:
+; CHECK-NEXT:    [[RES:%.*]] = phi i8 [ [[SUM_LCSSA]], %[[OUTER_LATCH]] ]
+; CHECK-NEXT:    ret i8 [[RES]]
+;
+entry:
+  br label %outer.header
+
+outer.header:
+  %i = phi i64 [ 0, %entry ], [ %i.next, %outer.latch ]
+  %sum.outer = phi i8 [ 0, %entry ], [ %sum.lcssa, %outer.latch ]
+  br label %inner
+
+inner:
+  %j = phi i64 [ 0, %outer.header ], [ %j.next, %inner ]
+  %sum.inner = phi i8 [ %sum.outer, %outer.header ], [ %sum.inner.next, %inner ]
+  %gep.A = getelementptr [2 x i8], ptr %A, i64 %j, i64 %i
+  %a = load i8, ptr %gep.A
+  %sum.inner.next = add i8 %sum.inner, %a
+  %gep.B = getelementptr [2 x i8], ptr %B, i64 %j, i64 %i
+  store i8 %sum.outer, ptr %gep.B
+  %j.next = add i64 %j, 1
+  %ec.j = icmp eq i64 %j.next, 2
+  br i1 %ec.j, label %outer.latch, label %inner
+
+outer.latch:
+  %sum.lcssa = phi i8 [ %sum.inner.next, %inner ]
+  %i.next = add i64 %i, 1
+  %ec.i = icmp eq i64 %i.next, 2
+  br i1 %ec.i, label %exit, label %outer.header
+
+exit:
+  %res = phi i8 [ %sum.lcssa, %outer.latch ]
+  ret i8 %res
+}
+
+; sum = 0;
+; for (i = 0; i < 2; i++)
+;   for (j = 0; j < 2; j++) {
+;     sum += A[j][i];
+;     B[j][i] = sum;
+;   }
+;
+; Interchanging the loops will become as follows:
+;
+; sum = 0;
+; for (j = 0; j < 2; j++)
+;   for (i = 0; i < 2; i++) {
+;     sum += A[j][i];
+;     B[j][i] = sum;
+;   }
+;
+; This is an invalid transformation. Consider the case when `A` is as follows:
+;
+;  A = {{ 0, 1 }, { 0, 0 }}
+;
+; In this case, in the original loops, `sum` evolves 0 -> 0 -> 1 -> 1, while in
+; the interchanged loops, `sum` evolves 0 -> 1 -> 1 -> 1.
+;
+define i8 @extra_reduction_use_in_inner1(ptr noalias %A, ptr noalias %B) {
+; CHECK-LABEL: define i8 @extra_reduction_use_in_inner1(
+; CHECK-SAME: ptr noalias [[A:%.*]], ptr noalias [[B:%.*]]) {
+; CHECK-NEXT:  [[ENTRY:.*]]:
+; CHECK-NEXT:    br label %[[OUTER_HEADER:.*]]
+; CHECK:       [[OUTER_HEADER]]:
+; CHECK-NEXT:    [[I:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[I_NEXT:%.*]], %[[OUTER_LATCH:.*]] ]
+; CHECK-NEXT:    [[SUM_OUTER:%.*]] = phi i8 [ 0, %[[ENTRY]] ], [ [[SUM_LCSSA:%.*]], %[[OUTER_LATCH]] ]
+; CHECK-NEXT:    br label %[[INNER:.*]]
+; CHECK:       [[INNER]]:
+; CHECK-NEXT:    [[J:%.*]] = phi i64 [ 0, %[[OUTER_HEADER]] ], [ [[J_NEXT:%.*]], %[[INNER]] ]
+; CHECK-NEXT:    [[SUM_INNER:%.*]] = phi i8 [ [[SUM_OUTER]], %[[OUTER_HEADER]] ], [ [[SUM_NEXT:%.*]], %[[INNER]] ]
+; CHECK-NEXT:    [[GEP_A:%.*]] = getelementptr [2 x i8], ptr [[A]], i64 [[J]], i64 [[I]]
+; CHECK-NEXT:    [[A:%.*]] = load i8, ptr [[GEP_A]], align 1
+; CHECK-NEXT:    [[SUM_NEXT]] = add i8 [[SUM_INNER]], [[A]]
+; CHECK-NEXT:    [[GEP_B:%.*]] = getelementptr [2 x i8], ptr [[B]], i64 [[J]], i64 [[I]]
+; CHECK-NEXT:    store i8 [[SUM_NEXT]], ptr [[GEP_B]], align 1
+; CHECK-NEXT:    [[J_NEXT]] = add i64 [[J]], 1
+; CHECK-NEXT:    [[EC_J:%.*]] = icmp eq i64 [[J_NEXT]], 2
+; CHECK-NEXT:    br i1 [[EC_J]], label %[[OUTER_LATCH]], label %[[INNER]]
 ; CHECK:       [[OUTER_LATCH]]:
+; CHECK-NEXT:    [[SUM_LCSSA]] = phi i8 [ [[SUM_NEXT]], %[[INNER]] ]
 ; CHECK-NEXT:    [[I_NEXT]] = add i64 [[I]], 1
-; CHECK-NEXT:    [[EC_I:%.*]] = icmp eq i64 [[I_NEXT]], 4
-; CHECK-NEXT:    br i1 [[EC_I]], label %[[INNER_SPLIT]], label %[[OUTER_HEADER]]
+; CHECK-NEXT:    [[EC_I:%.*]] = icmp eq i64 [[I_NEXT]], 2
+; CHECK-NEXT:    br i1 [[EC_I]], label %[[EXIT:.*]], label %[[OUTER_HEADER]]
 ; CHECK:       [[EXIT]]:
-; CHECK-NEXT:    [[RES:%.*]] = phi i8 [ [[SUM_LCSSA]], %[[INNER_SPLIT]] ]
+; CHECK-NEXT:    [[RES:%.*]] = phi i8 [ [[SUM_LCSSA]], %[[OUTER_LATCH]] ]
 ; CHECK-NEXT:    ret i8 [[RES]]
 ;
 entry:
@@ -66,28 +140,132 @@ entry:
 
 outer.header:
   %i = phi i64 [ 0, %entry ], [ %i.next, %outer.latch ]
-  %sum = phi i8 [ 0, %entry ], [ %sum.lcssa, %outer.latch ]
+  %sum.outer = phi i8 [ 0, %entry ], [ %sum.lcssa, %outer.latch ]
   br label %inner
 
 inner:
   %j = phi i64 [ 0, %outer.header ], [ %j.next, %inner ]
-  %sum.inner = phi i8 [ %sum, %outer.header ], [ %sum.next, %inner ]
-  %gep.A = getelementptr [4 x i8], ptr %A, i64 %j, i64 %i
+  %sum.inner = phi i8 [ %sum.outer, %outer.header ], [ %sum.inner.next, %inner ]
+  %gep.A = getelementptr [2 x i8], ptr %A, i64 %j, i64 %i
   %a = load i8, ptr %gep.A
-  %sum.next = add i8 %sum.inner, %a
-  %gep.B = getelementptr [4 x i8], ptr %B, i64 %j, i64 %i
-  store i8 %sum, ptr %gep.B
+  %sum.inner.next = add i8 %sum.inner, %a
+  %gep.B = getelementptr [2 x i8], ptr %B, i64 %j, i64 %i
+  store i8 %sum.inner.next, ptr %gep.B
   %j.next = add i64 %j, 1
-  %ec.j = icmp eq i64 %j.next, 4
+  %ec.j = icmp eq i64 %j.next, 2
   br i1 %ec.j, label %outer.latch, label %inner
 
 outer.latch:
-  %sum.lcssa = phi i8 [ %sum.next, %inner ]
+  %sum.lcssa = phi i8 [ %sum.inner.next, %inner ]
   %i.next = add i64 %i, 1
-  %ec.i = icmp eq i64 %i.next, 4
+  %ec.i = icmp eq i64 %i.next, 2
   br i1 %ec.i, label %exit, label %outer.header
 
 exit:
   %res = phi i8 [ %sum.lcssa, %outer.latch ]
   ret i8 %res
 }
+
+; sum = 0;
+; for (i = 0, sum_i = sum; i < 2; i++)
+;   for (j = 0; j < 2; j++)
+;     for (k = 0; k < 2; k++) {
+;       sum += A[k][j][i];
+;       B[k][j][i] = sum_i;
+;     }
+;
+; In this case, interchanging the j-loop and the k-loop is legal.
+;
+define i8 @extra_reduction_use_in_inner2(ptr noalias %A, ptr noalias %B) {
+; CHECK-LABEL: define i8 @extra_reduction_use_in_inner2(
+; CHECK-SAME: ptr noalias [[A:%.*]], ptr noalias [[B:%.*]]) {
+; CHECK-NEXT:  [[ENTRY:.*]]:
+; CHECK-NEXT:    br label %[[OUTER_HEADER:.*]]
+; CHECK:       [[OUTER_HEADER]]:
+; CHECK-NEXT:    [[I:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[I_NEXT:%.*]], %[[OUTER_LATCH:.*]] ]
+; CHECK-NEXT:    [[SUM_OUTER:%.*]] = phi i8 [ 0, %[[ENTRY]] ], [ [[SUM_OUTER_LCSSA:%.*]], %[[OUTER_LATCH]] ]
+; CHECK-NEXT:    br label %[[MIDDLE_HEADER_PREHEADER:.*]]
+; CHECK:       [[MIDDLE_HEADER_PREHEADER]]:
+; CHECK-NEXT:    br label %[[MIDDLE_HEADER:.*]]
+; CHECK:       [[MIDDLE_HEADER]]:
+; CHECK-NEXT:    [[J:%.*]] = phi i64 [ [[TMP2:%.*]], %[[MIDDLE_LATCH_SPLIT:.*]] ], [ 0, %[[MIDDLE_HEADER_PREHEADER]] ]
+; CHECK-NEXT:    [[SUM_MIDDLE:%.*]] = phi i8 [ [[SUM_MIDDLE_LCSSA:%.*]], %[[MIDDLE_LATCH_SPLIT]] ], [ [[SUM_OUTER]], %[[MIDDLE_HEADER_PREHEADER]] ]
+; CHECK-NEXT:    br label %[[INNER_PREHEADER:.*]]
+; CHECK:       [[INNER_PREHEADER]]:
+; CHECK-NEXT:    br label %[[INNER:.*]]
+; CHECK:       [[INNER]]:
+; CHECK-NEXT:    [[K:%.*]] = phi i64 [ [[TMP0:%.*]], %[[INNER_SPLIT:.*]] ], [ 0, %[[INNER_PREHEADER]] ]
+; CHECK-NEXT:    [[SUM_INNER:%.*]] = phi i8 [ [[SUM_INNER_NEXT:%.*]], %[[INNER_SPLIT]] ], [ [[SUM_MIDDLE]], %[[INNER_PREHEADER]] ]
+; CHECK-NEXT:    br label %[[INNER_SPLIT1:.*]]
+; CHECK:       [[INNER_SPLIT1]]:
+; CHECK-NEXT:    [[GEP_A:%.*]] = getelementptr [2 x [2 x i8]], ptr [[A]], i64 [[K]], i64 [[J]], i64 [[I]]
+; CHECK-NEXT:    [[A:%.*]] = load i8, ptr [[GEP_A]], align 1
+; CHECK-NEXT:    [[SUM_INNER_NEXT]] = add i8 [[SUM_INNER]], [[A]]
+; CHECK-NEXT:    [[GEP_B:%.*]] = getelementptr [2 x [2 x i8]], ptr [[B]], i64 [[K]], i64 [[J]], i64 [[I]]
+; CHECK-NEXT:    store i8 [[SUM_OUTER]], ptr [[GEP_B]], align 1
+; CHECK-NEXT:    [[K_NEXT:%.*]] = add i64 [[K]], 1
+; CHECK-NEXT:    [[EC_K:%.*]] = icmp eq i64 [[K_NEXT]], 2
+; CHECK-NEXT:    br label %[[MIDDLE_LATCH:.*]]
+; CHECK:       [[INNER_SPLIT]]:
+; CHECK-NEXT:    [[TMP0]] = add i64 [[K]], 1
+; CHECK-NEXT:    [[TMP1:%.*]] = icmp eq i64 [[TMP0]], 2
+; CHECK-NEXT:    br i1 [[TMP1]], label %[[MIDDLE_LATCH_SPLIT]], label %[[INNER]]
+; CHECK:       [[MIDDLE_LATCH]]:
+; CHECK-NEXT:    [[J_NEXT:%.*]] = add i64 [[J]], 1
+; CHECK-NEXT:    [[EC_J:%.*]] = icmp eq i64 [[J_NEXT]], 2
+; CHECK-NEXT:    br label %[[INNER_SPLIT]]
+; CHECK:       [[MIDDLE_LATCH_SPLIT]]:
+; CHECK-NEXT:    [[SUM_MIDDLE_LCSSA]] = phi i8 [ [[SUM_INNER_NEXT]], %[[INNER_SPLIT]] ]
+; CHECK-NEXT:    [[TMP2]] = add i64 [[J]], 1
+; CHECK-NEXT:    [[TMP3:%.*]] = icmp eq i64 [[TMP2]], 2
+; CHECK-NEXT:    br i1 [[TMP3]], label %[[OUTER_LATCH]], label %[[MIDDLE_HEADER]]
+; CHECK:       [[OUTER_LATCH]]:
+; CHECK-NEXT:    [[SUM_OUTER_LCSSA]] = phi i8 [ [[SUM_MIDDLE_LCSSA]], %[[MIDDLE_LATCH_SPLIT]] ]
+; CHECK-NEXT:    [[I_NEXT]] = add i64 [[I]], 1
+; CHECK-NEXT:    [[EC_I:%.*]] = icmp eq i64 [[I_NEXT]], 2
+; CHECK-NEXT:    br i1 [[EC_I]], label %[[EXIT:.*]], label %[[OUTER_HEADER]]
+; CHECK:       [[EXIT]]:
+; CHECK-NEXT:    [[RES:%.*]] = phi i8 [ [[SUM_OUTER_LCSSA]], %[[OUTER_LATCH]] ]
+; CHECK-NEXT:    ret i8 [[RES]]
+;
+entry:
+  br label %outer.header
+
+outer.header:
+  %i = phi i64 [ 0, %entry ], [ %i.next, %outer.latch ]
+  %sum.outer = phi i8 [ 0, %entry ], [ %sum.outer.lcssa, %outer.latch ]
+  br label %middle.header
+
+middle.header:
+  %j = phi i64 [ 0, %outer.header ], [ %j.next, %middle.latch ]
+  %sum.middle = phi i8 [ %sum.outer, %outer.header ], [ %sum.middle.lcssa, %middle.latch ]
+  br label %inner
+
+inner:
+  %k = phi i64 [ 0, %middle.header ], [ %k.next, %inner ]
+  %sum.inner = phi i8 [ %sum.middle, %middle.header ], [ %sum.inner.next, %inner ]
+  %gep.A = getelementptr [2 x [2 x i8]], ptr %A, i64 %k, i64 %j, i64 %i
+  %a = load i8, ptr %gep.A
+  %sum.inner.next = add i8 %sum.inner, %a
+  %gep.B = getelementptr [2 x [2 x i8]], ptr %B, i64 %k, i64 %j, i64 %i
+  store i8 %sum.outer, ptr %gep.B
+  %k.next = add i64 %k, 1
+  %ec.k = icmp eq i64 %k.next, 2
+  br i1 %ec.k, label %middle.latch, label %inner
+
+middle.latch:
+  %sum.middle.lcssa = phi i8 [ %sum.inner.next, %inner ]
+  %j.next = add i64 %j, 1
+  %ec.j = icmp eq i64 %j.next, 2
+  br i1 %ec.j, label %outer.latch, label %middle.header
+
+outer.latch:
+  %sum.outer.lcssa = phi i8 [ %sum.middle.lcssa, %middle.latch ]
+  %i.next = add i64 %i, 1
+  %ec.i = icmp eq i64 %i.next, 2
+  br i1 %ec.i, label %exit, label %outer.header
+
+exit:
+  %res = phi i8 [ %sum.outer.lcssa, %outer.latch ]
+  ret i8 %res
+}



More information about the llvm-branch-commits mailing list