[llvm] r237993 - [Unroll] Extract the logic for caching SCEV-modeled GEPs with their

Thu May 21 20:02:22 PDT 2015

Author: chandlerc
Date: Thu May 21 22:02:22 2015
New Revision: 237993

URL: http://llvm.org/viewvc/llvm-project?rev=237993&view=rev
Log:
[Unroll] Extract the logic for caching SCEV-modeled GEPs with their
simplified model for use simulating each iteration into a separate
helper function that just returns the cache.

Building this cache had nothing to do with the rest of the unroll
analysis and so this removes an unnecessary coupling, etc. It should
also make it easier to think about the concept of providing fast cached
access to basic SCEV models as an orthogonal concept to the overall
unroll simulation.

I'd really like to see this kind of caching logic folded into SCEV
itself, it seems weird for us to provide it at this layer rather than
making repeated queries into SCEV fast all on their own.

No functionality changed.

Modified:
    llvm/trunk/lib/Transforms/Scalar/LoopUnrollPass.cpp

Modified: llvm/trunk/lib/Transforms/Scalar/LoopUnrollPass.cpp
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Transforms/Scalar/LoopUnrollPass.cpp?rev=237993&r1=237992&r2=237993&view=diff
==============================================================================

--- llvm/trunk/lib/Transforms/Scalar/LoopUnrollPass.cpp (original)
+++ llvm/trunk/lib/Transforms/Scalar/LoopUnrollPass.cpp Thu May 21 22:02:22 2015
@@ -317,7 +317,82 @@ struct FindConstantPointers {
   }
   bool isDone() const { return !IndexIsConstant; }
 };
+} // End anonymous namespace.
 
+namespace {
+/// \brief Struct to represent a GEP whose start and step are known fixed
+/// offsets from a base address due to SCEV's analysis.
+struct SCEVGEPDescriptor {
+  Value *BaseAddr;
+  unsigned Start;
+  unsigned Step;
+};
+} // End anonymous namespace.
+
+/// \brief Build a cache of all the GEP instructions which SCEV can describe.
+///
+/// Visit all GEPs in the loop and find those which after complete loop
+/// unrolling would become a constant, or BaseAddress+Constant. For those where
+/// we can identify small constant starts and steps from a base address, return
+/// a map from the GEP to the base, start, and step relevant for that GEP. This
+/// is essentially a simplified and fast to query form of the SCEV analysis
+/// which we can afford to look into repeatedly for different iterations of the
+/// loop.
+static SmallDenseMap<Value *, SCEVGEPDescriptor>
+buildSCEVGEPCache(const Loop &L, ScalarEvolution &SE) {
+  SmallDenseMap<Value *, SCEVGEPDescriptor> Cache;
+
+  for (auto BB : L.getBlocks()) {
+    for (Instruction &I : *BB) {
+      if (GetElementPtrInst *GEP = dyn_cast<GetElementPtrInst>(&I)) {
+        Value *V = cast<Value>(GEP);
+        if (!SE.isSCEVable(V->getType()))
+            continue;
+        const SCEV *S = SE.getSCEV(V);
+        // FIXME: Hoist the initialization out of the loop.
+        FindConstantPointers Visitor(&L, SE);
+        SCEVTraversal<FindConstantPointers> T(Visitor);
+        // Try to find (BaseAddress+Step+Offset) tuple.
+        // If succeeded, save it to the cache - it might help in folding
+        // loads.
+        T.visitAll(S);
+        if (!Visitor.IndexIsConstant || !Visitor.BaseAddress)
+          continue;
+
+        const SCEV *BaseAddrSE = SE.getSCEV(Visitor.BaseAddress);
+        if (BaseAddrSE->getType() != S->getType())
+          continue;
+        const SCEV *OffSE = SE.getMinusSCEV(S, BaseAddrSE);
+        const SCEVAddRecExpr *AR = dyn_cast<SCEVAddRecExpr>(OffSE);
+
+        if (!AR)
+          continue;
+
+        const SCEVConstant *StepSE =
+            dyn_cast<SCEVConstant>(AR->getStepRecurrence(SE));
+        const SCEVConstant *StartSE = dyn_cast<SCEVConstant>(AR->getStart());
+        if (!StepSE || !StartSE)
+          continue;
+
+        // Check and skip caching if doing so would require lots of bits to
+        // avoid overflow.
+        APInt Start = StartSE->getValue()->getValue();
+        APInt Step = StepSE->getValue()->getValue();
+        if (Start.getActiveBits() > 32 || Step.getActiveBits() > 32)
+          continue;
+
+        // We found a cacheable SCEV model for the GEP.
+        Cache[V] = {Visitor.BaseAddress,
+                    (unsigned)Start.getLimitedValue(),
+                    (unsigned)Step.getLimitedValue()};
+      }
+    }
+  }
+
+  return Cache;
+}
+
+namespace {
 // This class is used to get an estimate of the optimization effects that we
 // could get from complete loop unrolling. It comes from the fact that some
 // loads might be replaced with concrete constant values and that could trigger
@@ -338,12 +413,6 @@ class UnrollAnalyzer : public InstVisito
   typedef InstVisitor<UnrollAnalyzer, bool> Base;
   friend class InstVisitor<UnrollAnalyzer, bool>;
 
-  struct SCEVGEPDescriptor {
-    Value *BaseAddr;
-    unsigned Start;
-    unsigned Step;
-  };
-
   /// \brief The loop we're going to analyze.
   const Loop *L;
 
@@ -364,13 +433,13 @@ class UnrollAnalyzer : public InstVisito
   // To avoid requesting SCEV info on every iteration, request it once, and
   // for each value that would become ConstAddress+Constant after loop
   // unrolling, save the corresponding data.
-  SmallDenseMap<Value *, SCEVGEPDescriptor> SCEVCache;
+  SmallDenseMap<Value *, SCEVGEPDescriptor> SCEVGEPCache;
 
   /// \brief Number of currently simulated iteration.
   ///
   /// If an expression is ConstAddress+Constant, then the Constant is
   /// Start + Iteration*Step, where Start and Step could be obtained from
-  /// SCEVCache.
+  /// SCEVGEPCache.
   unsigned Iteration;
 
   /// \brief Upper threshold for complete unrolling.
@@ -415,8 +484,8 @@ class UnrollAnalyzer : public InstVisito
       if (Constant *SimplifiedAddrOp = SimplifiedValues.lookup(AddrOp))
         AddrOp = SimplifiedAddrOp;
 
-    auto It = SCEVCache.find(AddrOp);
-    if (It == SCEVCache.end())
+    auto It = SCEVGEPCache.find(AddrOp);
+    if (It == SCEVGEPCache.end())
       return false;
     SCEVGEPDescriptor GEPDesc = It->second;
 
@@ -451,61 +520,6 @@ class UnrollAnalyzer : public InstVisito
     return true;
   }
 
-  /// Visit all GEPs in the loop and find those which after complete loop
-  /// unrolling would become a constant, or BaseAddress+Constant.
-  ///
-  /// Such GEPs could allow to evaluate a load to a constant later - for now we
-  /// just store the corresponding BaseAddress and StartValue with StepValue in
-  /// the SCEVCache.
-  void cacheSCEVResults() {
-    for (auto BB : L->getBlocks()) {
-      for (Instruction &I : *BB) {
-        if (GetElementPtrInst *GEP = dyn_cast<GetElementPtrInst>(&I)) {
-          Value *V = cast<Value>(GEP);
-          if (!SE.isSCEVable(V->getType()))
-              continue;
-          const SCEV *S = SE.getSCEV(V);
-          // FIXME: Hoist the initialization out of the loop.
-          FindConstantPointers Visitor(L, SE);
-          SCEVTraversal<FindConstantPointers> T(Visitor);
-          // Try to find (BaseAddress+Step+Offset) tuple.
-          // If succeeded, save it to the cache - it might help in folding
-          // loads.
-          T.visitAll(S);
-          if (!Visitor.IndexIsConstant || !Visitor.BaseAddress)
-            continue;
-
-          const SCEV *BaseAddrSE = SE.getSCEV(Visitor.BaseAddress);
-          if (BaseAddrSE->getType() != S->getType())
-            continue;
-          const SCEV *OffSE = SE.getMinusSCEV(S, BaseAddrSE);
-          const SCEVAddRecExpr *AR = dyn_cast<SCEVAddRecExpr>(OffSE);
-
-          if (!AR)
-            continue;
-
-          const SCEVConstant *StepSE =
-              dyn_cast<SCEVConstant>(AR->getStepRecurrence(SE));
-          const SCEVConstant *StartSE = dyn_cast<SCEVConstant>(AR->getStart());
-          if (!StepSE || !StartSE)
-            continue;
-
-          // Check and skip caching if doing so would require lots of bits to
-          // avoid overflow.
-          APInt Start = StartSE->getValue()->getValue();
-          APInt Step = StepSE->getValue()->getValue();
-          if (Start.getActiveBits() > 32 || Step.getActiveBits() > 32)
-            continue;
-
-          // We found a cacheable SCEV model for the GEP.
-          SCEVCache[V] = {Visitor.BaseAddress,
-                          (unsigned)Start.getLimitedValue(),
-                          (unsigned)Step.getLimitedValue()};
-        }
-      }
-    }
-  }
-
 public:
   UnrollAnalyzer(const Loop *L, unsigned TripCount, ScalarEvolution &SE,
                  const TargetTransformInfo &TTI, unsigned MaxUnrolledLoopSize)
@@ -546,8 +560,8 @@ public:
       return false;
 
     // To avoid compute SCEV-expressions on every iteration, compute them once
-    // and store interesting to us in SCEVCache.
-    cacheSCEVResults();
+    // and store interesting to us in SCEVGEPCache.
+    SCEVGEPCache = buildSCEVGEPCache(*L, SE);
 
     // Simulate execution of each iteration of the loop counting instructions,
     // which would be simplified.