[llvm] [LV] Strengthen calls to collectInstsToScalarize (NFC) (PR #130642)
Ramkumar Ramachandra via llvm-commits
llvm-commits at lists.llvm.org
Thu Mar 27 07:09:22 PDT 2025
https://github.com/artagnon updated https://github.com/llvm/llvm-project/pull/130642
>From 85ac80f8d04a77b341183975ece4cf9a1b863fc9 Mon Sep 17 00:00:00 2001
From: Ramkumar Ramachandra <ramkumar.ramachandra at codasip.com>
Date: Mon, 10 Mar 2025 17:23:50 +0000
Subject: [PATCH 1/2] [LV] Strengthen calls to collectInstsToScalarize (NFC)
Avoid the pattern of always calling collectInstsToScalarize after
collectUniformsAndScalars, and call it in collectUniformsAndScalars
instead. Also strengthen checks for early exits in the function.
---
.../Transforms/Vectorize/LoopVectorize.cpp | 25 ++++++++-----------
1 file changed, 10 insertions(+), 15 deletions(-)
diff --git a/llvm/lib/Transforms/Vectorize/LoopVectorize.cpp b/llvm/lib/Transforms/Vectorize/LoopVectorize.cpp
index 67509bd598f6a..598a6663e1ba8 100644
--- a/llvm/lib/Transforms/Vectorize/LoopVectorize.cpp
+++ b/llvm/lib/Transforms/Vectorize/LoopVectorize.cpp
@@ -980,7 +980,6 @@ class LoopVectorizationCostModel {
/// \return true if the UserVF is a feasible VF to be chosen.
bool selectUserVectorizationFactor(ElementCount UserVF) {
collectUniformsAndScalars(UserVF);
- collectInstsToScalarize(UserVF);
return expectedCost(UserVF).isValid();
}
@@ -1250,6 +1249,7 @@ class LoopVectorizationCostModel {
collectLoopUniforms(VF);
setVectorizedCallDecision(VF);
collectLoopScalars(VF);
+ collectInstsToScalarize(VF);
}
/// Returns true if the target machine supports masked store operation
@@ -5357,11 +5357,14 @@ bool LoopVectorizationCostModel::useEmulatedMaskMemRefHack(Instruction *I,
}
void LoopVectorizationCostModel::collectInstsToScalarize(ElementCount VF) {
- // If we aren't vectorizing the loop, or if we've already collected the
- // instructions to scalarize, there's nothing to do. Collection may already
- // have occurred if we have a user-selected VF and are now computing the
- // expected cost for interleaving.
- if (VF.isScalar() || VF.isZero() || InstsToScalarize.contains(VF))
+ assert(VF.isVector() && "Expected VF >= 2");
+
+ // If we've already collected the instructions to scalarize or the predicated
+ // BBs after vectorization, there's nothing to do. Collection may already have
+ // occurred if we have a user-selected VF and are now computing the expected
+ // cost for interleaving.
+ if (InstsToScalarize.contains(VF) ||
+ PredicatedBBsAfterVectorization.contains(VF))
return;
// Initialize a mapping for VF in InstsToScalalarize. If we find that it's
@@ -5369,8 +5372,6 @@ void LoopVectorizationCostModel::collectInstsToScalarize(ElementCount VF) {
// map will indicate that we've analyzed it already.
ScalarCostsTy &ScalarCostsVF = InstsToScalarize[VF];
- PredicatedBBsAfterVectorization[VF].clear();
-
// Find all the instructions that are scalar with predication in the loop and
// determine if it would be better to not if-convert the blocks they are in.
// If so, we also record the instructions to scalarize.
@@ -7160,16 +7161,10 @@ void LoopVectorizationPlanner::plan(ElementCount UserVF, unsigned UserIC) {
VFCandidates.push_back(VF);
CM.collectInLoopReductions();
- for (const auto &VF : VFCandidates) {
+ for (const auto &VF : VFCandidates)
// Collect Uniform and Scalar instructions after vectorization with VF.
CM.collectUniformsAndScalars(VF);
- // Collect the instructions (and their associated costs) that will be more
- // profitable to scalarize.
- if (VF.isVector())
- CM.collectInstsToScalarize(VF);
- }
-
buildVPlansWithVPRecipes(ElementCount::getFixed(1), MaxFactors.FixedVF);
buildVPlansWithVPRecipes(ElementCount::getScalable(1), MaxFactors.ScalableVF);
>From a65c77f55d61aca1970c3b7572e4bb58649f152d Mon Sep 17 00:00:00 2001
From: Ramkumar Ramachandra <ramkumar.ramachandra at codasip.com>
Date: Thu, 27 Mar 2025 14:06:52 +0000
Subject: [PATCH 2/2] [LV] Address review
---
llvm/lib/Transforms/Vectorize/LoopVectorize.cpp | 13 +++++++------
1 file changed, 7 insertions(+), 6 deletions(-)
diff --git a/llvm/lib/Transforms/Vectorize/LoopVectorize.cpp b/llvm/lib/Transforms/Vectorize/LoopVectorize.cpp
index 598a6663e1ba8..8e8057ad9672a 100644
--- a/llvm/lib/Transforms/Vectorize/LoopVectorize.cpp
+++ b/llvm/lib/Transforms/Vectorize/LoopVectorize.cpp
@@ -979,7 +979,7 @@ class LoopVectorizationCostModel {
/// Setup cost-based decisions for user vectorization factor.
/// \return true if the UserVF is a feasible VF to be chosen.
bool selectUserVectorizationFactor(ElementCount UserVF) {
- collectUniformsAndScalars(UserVF);
+ collectNonVectorized(UserVF);
return expectedCost(UserVF).isValid();
}
@@ -1235,13 +1235,13 @@ class LoopVectorizationCostModel {
/// the loop.
void collectInstsToScalarize(ElementCount VF);
- /// Collect Uniform and Scalar values for the given \p VF.
+ /// Collect Uniforms, Scalars, and Insts to Scalarize for the given \p VF.
/// The sets depend on CM decision for Load/Store instructions
/// that may be vectorized as interleave, gather-scatter or scalarized.
/// Also make a decision on what to do about call instructions in the loop
/// at that VF -- scalarize, call a known vector routine, or call a
/// vector intrinsic.
- void collectUniformsAndScalars(ElementCount VF) {
+ void collectNonVectorized(ElementCount VF) {
// Do the analysis once.
if (VF.isScalar() || Uniforms.contains(VF))
return;
@@ -5260,7 +5260,7 @@ LoopVectorizationCostModel::calculateRegisterUsage(ArrayRef<ElementCount> VFs) {
RegUsage[ClassID] += 1;
}
} else {
- collectUniformsAndScalars(VFs[J]);
+ collectNonVectorized(VFs[J]);
for (auto *Inst : OpenIntervals) {
// Skip ignored values for VF > 1.
if (VecValuesToIgnore.count(Inst))
@@ -7161,9 +7161,10 @@ void LoopVectorizationPlanner::plan(ElementCount UserVF, unsigned UserIC) {
VFCandidates.push_back(VF);
CM.collectInLoopReductions();
- for (const auto &VF : VFCandidates)
+ for (const auto &VF : VFCandidates) {
// Collect Uniform and Scalar instructions after vectorization with VF.
- CM.collectUniformsAndScalars(VF);
+ CM.collectNonVectorized(VF);
+ }
buildVPlansWithVPRecipes(ElementCount::getFixed(1), MaxFactors.FixedVF);
buildVPlansWithVPRecipes(ElementCount::getScalable(1), MaxFactors.ScalableVF);
More information about the llvm-commits
mailing list