[llvm] [AArch64] Add flag to control unrolling for small multi-exit loops (PR #131998)
Igor Kirillov via llvm-commits
llvm-commits at lists.llvm.org
Thu Mar 27 02:22:13 PDT 2025
================
@@ -4237,6 +4242,81 @@ getFalkorUnrollingPreferences(Loop *L, ScalarEvolution &SE,
}
}
+static bool shouldUnrollLoopWithInstruction(Instruction &I,
+ AArch64TTIImpl &TTI) {
+ // Don't unroll vectorised loop.
+ if (I.getType()->isVectorTy())
+ return false;
+
+ if (isa<CallInst>(I) || isa<InvokeInst>(I)) {
+ if (const Function *F = cast<CallBase>(I).getCalledFunction())
+ if (!TTI.isLoweredToCall(F))
+ return true;
+ return false;
+ }
+
+ return true;
+}
+
+static InstructionCost getSizeOfLoop(Loop *L, AArch64TTIImpl &TTI) {
+ // Estimate the size of the loop.
+ InstructionCost Size = 0;
+ for (auto *BB : L->getBlocks()) {
+ for (auto &I : *BB) {
+ if (!shouldUnrollLoopWithInstruction(I, TTI))
+ return InstructionCost::getInvalid();
+
+ SmallVector<const Value *, 4> Operands(I.operand_values());
+ InstructionCost Cost =
+ TTI.getInstructionCost(&I, Operands, TTI::TCK_CodeSize);
+ // This can happen with intrinsics that don't currently have a cost model
+ // or for some operations that require SVE.
+ if (!Cost.isValid())
+ return InstructionCost::getInvalid();
+ Size += *Cost.getValue();
+ }
+ }
+ return Size;
+}
+
+static bool shouldUnrollMultiExitLoop(Loop *L, ScalarEvolution &SE,
+ AArch64TTIImpl &TTI) {
+ // Only consider loops with unknown trip counts for which we can determine
+ // a symbolic expression. Multi-exit loops with small known trip counts will
+ // likely be unrolled anyway.
+ const SCEV *BTC = SE.getSymbolicMaxBackedgeTakenCount(L);
+ if (isa<SCEVConstant>(BTC) || isa<SCEVCouldNotCompute>(BTC))
+ return false;
+
+ // It might not be worth unrolling loops with low max trip counts. Restrict
+ // this to max trip counts > 32 for now.
+ unsigned MaxTC = SE.getSmallConstantMaxTripCount(L);
+ if (MaxTC > 0 && MaxTC <= 32)
+ return false;
+
+ if (findStringMetadataForLoop(L, "llvm.loop.isvectorized"))
+ return false;
+
+ // Estimate the size of the loop.
+ InstructionCost Size = getSizeOfLoop(L, TTI);
+ if (!Size.isValid())
+ return false;
+
+ // Small search loops with multiple exits can be highly beneficial to unroll.
+ // We only care about loops with exactly two exiting blocks, although each
+ // block could jump to the same exit block.
+ SmallVector<BasicBlock *> Blocks(L->getBlocks());
----------------
igogo-x86 wrote:
I think we can avoid copying blocks here by ArrayRef or auto&:
```
ArrayRef<BasicBlock*> Blocks = L->getBlocks();
```
https://github.com/llvm/llvm-project/pull/131998
More information about the llvm-commits
mailing list