[Mlir-commits] [mlir] [mlir][SCF] Add support for peeling the first iteration out of the loop (PR #74015)
llvmlistbot at llvm.org
llvmlistbot at llvm.org
Wed Dec 6 23:49:37 PST 2023
================
@@ -205,32 +222,92 @@ LogicalResult mlir::scf::peelForLoopAndSimplifyBounds(RewriterBase &rewriter,
return success();
}
+LogicalResult mlir::scf::peelFirstIterationForLoop(RewriterBase &b, ForOp forOp,
+ ForOp &firstIteration) {
+ RewriterBase::InsertionGuard guard(b);
+ auto lbInt = getConstantIntValue(forOp.getLowerBound());
+ auto ubInt = getConstantIntValue(forOp.getUpperBound());
+ auto stepInt = getConstantIntValue(forOp.getStep());
+
+ // Peeling is not needed if there is one or less iteration.
+ if (lbInt && ubInt && stepInt && (*ubInt - *lbInt) / *stepInt <= 1)
+ return success();
+
+ // Slow path: Examine the ops that define lb, ub and step.
+ AffineExpr sym0, sym1, sym2;
+ bindSymbols(b.getContext(), sym0, sym1, sym2);
+ SmallVector<Value> operands{forOp.getLowerBound(), forOp.getUpperBound(),
+ forOp.getStep()};
+ AffineMap map = AffineMap::get(0, 3, {(sym1 - sym0) % sym2});
+ affine::fullyComposeAffineMapAndOperands(&map, &operands);
+ if (auto constExpr = dyn_cast<AffineConstantExpr>(map.getResult(0)))
+ if (constExpr.getValue() == 0)
+ return failure();
+
+ // New lower bound for main loop: %lb + %step
+ auto ubMap = AffineMap::get(0, 3, {sym0 + sym2});
+ b.setInsertionPoint(forOp);
+ auto loc = forOp.getLoc();
+ Value splitBound = b.createOrFold<AffineApplyOp>(
+ loc, ubMap,
+ ValueRange{forOp.getLowerBound(), forOp.getUpperBound(),
+ forOp.getStep()});
+
+ // Peel the first iteration.
+ b.setInsertionPoint(forOp);
+ firstIteration = cast<ForOp>(b.clone(*forOp.getOperation()));
----------------
MaheshRavishankar wrote:
If you use the `mlir::clone` method, you can update the operands during cloning. Updating the operands as done below can cause some strange issues when there is a listener involved.
https://github.com/llvm/llvm-project/pull/74015
More information about the Mlir-commits
mailing list