[llvm] 7ee30a0 - [NFC][LAA] Match-up type sizes for possible extensions, based on actual bit-size rather than rounded-up byte size.

Chang-Sun Lin Jr via llvm-commits llvm-commits at lists.llvm.org
Fri Apr 22 23:16:59 PDT 2022


Author: Chang-Sun Lin Jr
Date: 2022-04-22T23:16:20-07:00
New Revision: 7ee30a0e24a173c38253e235cc6e021a52e17c17

URL: https://github.com/llvm/llvm-project/commit/7ee30a0e24a173c38253e235cc6e021a52e17c17
DIFF: https://github.com/llvm/llvm-project/commit/7ee30a0e24a173c38253e235cc6e021a52e17c17.diff

LOG: [NFC][LAA] Match-up type sizes for possible extensions, based on actual bit-size rather than rounded-up byte size.

Differential Revision: https://reviews.llvm.org/D119200

Added: 
    llvm/test/Transforms/LoopLoadElim/loop-i1-count.ll

Modified: 
    llvm/lib/Analysis/LoopAccessAnalysis.cpp

Removed: 
    


################################################################################
diff  --git a/llvm/lib/Analysis/LoopAccessAnalysis.cpp b/llvm/lib/Analysis/LoopAccessAnalysis.cpp
index e024dc3197e71..b1773dbbaad63 100644
--- a/llvm/lib/Analysis/LoopAccessAnalysis.cpp
+++ b/llvm/lib/Analysis/LoopAccessAnalysis.cpp
@@ -1456,13 +1456,13 @@ static bool isSafeDependenceDistance(const DataLayout &DL, ScalarEvolution &SE,
 
   const SCEV *CastedDist = &Dist;
   const SCEV *CastedProduct = Product;
-  uint64_t DistTypeSize = DL.getTypeAllocSize(Dist.getType());
-  uint64_t ProductTypeSize = DL.getTypeAllocSize(Product->getType());
+  uint64_t DistTypeSizeBits = DL.getTypeSizeInBits(Dist.getType());
+  uint64_t ProductTypeSizeBits = DL.getTypeSizeInBits(Product->getType());
 
   // The dependence distance can be positive/negative, so we sign extend Dist;
   // The multiplication of the absolute stride in bytes and the
   // backedgeTakenCount is non-negative, so we zero extend Product.
-  if (DistTypeSize > ProductTypeSize)
+  if (DistTypeSizeBits > ProductTypeSizeBits)
     CastedProduct = SE.getZeroExtendExpr(Product, Dist.getType());
   else
     CastedDist = SE.getNoopOrSignExtend(&Dist, Product->getType());
@@ -2277,12 +2277,12 @@ void LoopAccessInfo::collectStridedAccess(Value *MemAccess) {
   // The Stride can be positive/negative, so we sign extend Stride;
   // The backedgeTakenCount is non-negative, so we zero extend BETakenCount.
   const DataLayout &DL = TheLoop->getHeader()->getModule()->getDataLayout();
-  uint64_t StrideTypeSize = DL.getTypeAllocSize(StrideExpr->getType());
-  uint64_t BETypeSize = DL.getTypeAllocSize(BETakenCount->getType());
+  uint64_t StrideTypeSizeBits = DL.getTypeSizeInBits(StrideExpr->getType());
+  uint64_t BETypeSizeBits = DL.getTypeSizeInBits(BETakenCount->getType());
   const SCEV *CastedStride = StrideExpr;
   const SCEV *CastedBECount = BETakenCount;
   ScalarEvolution *SE = PSE->getSE();
-  if (BETypeSize >= StrideTypeSize)
+  if (BETypeSizeBits >= StrideTypeSizeBits)
     CastedStride = SE->getNoopOrSignExtend(StrideExpr, BETakenCount->getType());
   else
     CastedBECount = SE->getZeroExtendExpr(BETakenCount, StrideExpr->getType());

diff  --git a/llvm/test/Transforms/LoopLoadElim/loop-i1-count.ll b/llvm/test/Transforms/LoopLoadElim/loop-i1-count.ll
new file mode 100644
index 0000000000000..7ee12c8665adc
--- /dev/null
+++ b/llvm/test/Transforms/LoopLoadElim/loop-i1-count.ll
@@ -0,0 +1,44 @@
+; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
+; RUN: opt -S -passes=loop-load-elim %s | FileCheck %s
+
+; The backedge taken count of this loop is an i1 type, and the IV is i8.
+; The math in LoopAccessAnalysis was rounding the type sizes to bytes and
+; believing them equal, causing a size mismatch.
+
+target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128"
+
+ at a = external dso_local local_unnamed_addr global [1 x i32], align 4
+
+define dso_local void @test(i8 %inc) local_unnamed_addr {
+; CHECK-LABEL: @test(
+; CHECK-NEXT:  entry:
+; CHECK-NEXT:    br label [[FOR_COND3:%.*]]
+; CHECK:       for.cond3:
+; CHECK-NEXT:    [[H_0:%.*]] = phi i8 [ 0, [[ENTRY:%.*]] ], [ [[ADD:%.*]], [[COND_END_FOR_COND_CLEANUP_LOOPEXIT_CRIT_EDGE:%.*]] ]
+; CHECK-NEXT:    [[IDXPROM11:%.*]] = sext i8 [[H_0]] to i64
+; CHECK-NEXT:    [[ARRAYIDX27:%.*]] = getelementptr inbounds [1 x i32], [1 x i32]* @a, i64 0, i64 [[IDXPROM11]]
+; CHECK-NEXT:    br label [[FOR_BODY:%.*]]
+; CHECK:       cond.end.for.cond.cleanup.loopexit_crit_edge:
+; CHECK-NEXT:    [[ADD]] = add i8 [[H_0]], [[INC:%.*]]
+; CHECK-NEXT:    br label [[FOR_COND3]]
+; CHECK:       for.body:
+; CHECK-NEXT:    store i32 0, i32* [[ARRAYIDX27]], align 4
+; CHECK-NEXT:    br i1 true, label [[COND_END_FOR_COND_CLEANUP_LOOPEXIT_CRIT_EDGE]], label [[FOR_BODY]]
+;
+entry:
+  br label %for.cond3
+
+for.cond3:                                        ; preds = %cond.end.for.cond.cleanup.loopexit_crit_edge, %entry
+  %h.0 = phi i8 [ 0, %entry ], [ %add, %cond.end.for.cond.cleanup.loopexit_crit_edge ]
+  %idxprom11 = sext i8 %h.0 to i64
+  %arrayidx27 = getelementptr inbounds [1 x i32], [1 x i32]* @a, i64 0, i64 %idxprom11
+  br label %for.body
+
+cond.end.for.cond.cleanup.loopexit_crit_edge:     ; preds = %for.body
+  %add = add i8 %h.0, %inc
+  br label %for.cond3
+
+for.body:                                         ; preds = %for.body, %for.cond3
+  store i32 0, i32* %arrayidx27, align 4
+  br i1 true, label %cond.end.for.cond.cleanup.loopexit_crit_edge, label %for.body
+}


        


More information about the llvm-commits mailing list