[llvm] [SLP]Do not count extractelement costs in unreachable/landing pad blocks. (PR #105667)
Alexey Bataev via llvm-commits
llvm-commits at lists.llvm.org
Thu Aug 22 07:16:03 PDT 2024
https://github.com/alexey-bataev created https://github.com/llvm/llvm-project/pull/105667
If the external user of the scalar to be extracted is in an unreachable or
landing pad block, we can skip counting the cost of that extractelement.
>From 30304074ec485eed7fbaedf8526b3c9c8ca9ad29 Mon Sep 17 00:00:00 2001
From: Alexey Bataev <a.bataev at outlook.com>
Date: Thu, 22 Aug 2024 14:15:49 +0000
Subject: [PATCH] =?UTF-8?q?[=F0=9D=98=80=F0=9D=97=BD=F0=9D=97=BF]=20initia?=
=?UTF-8?q?l=20version?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit
Created using spr 1.3.5
---
llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp | 16 ++++++++++------
.../X86/same-scalar-in-same-phi-extract.ll | 3 ++-
2 files changed, 12 insertions(+), 7 deletions(-)
diff --git a/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp b/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp
index 8f70a43465b8ac..d7763a022f3b6e 100644
--- a/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp
+++ b/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp
@@ -10768,17 +10768,21 @@ InstructionCost BoUpSLP::getTreeCost(ArrayRef<Value *> VectorizedVals) {
std::optional<DenseMap<Value *, unsigned>> ValueToExtUses;
DenseMap<const TreeEntry *, DenseSet<Value *>> ExtractsCount;
for (ExternalUser &EU : ExternalUses) {
+ // Uses by ephemeral values are free (because the ephemeral value will be
+ // removed prior to code generation, and so the extraction will be
+ // removed as well) as well as uses in unreachable blocks or in landing pads
+ // (rarely executed).
+ if (EphValues.count(EU.User) ||
+ (EU.User &&
+ (!DT->isReachableFromEntry(cast<Instruction>(EU.User)->getParent()) ||
+ cast<Instruction>(EU.User)->getParent()->isLandingPad())))
+ continue;
+
// We only add extract cost once for the same scalar.
if (!isa_and_nonnull<InsertElementInst>(EU.User) &&
!ExtractCostCalculated.insert(EU.Scalar).second)
continue;
- // Uses by ephemeral values are free (because the ephemeral value will be
- // removed prior to code generation, and so the extraction will be
- // removed as well).
- if (EphValues.count(EU.User))
- continue;
-
// No extract cost for vector "scalar"
if (isa<FixedVectorType>(EU.Scalar->getType()))
continue;
diff --git a/llvm/test/Transforms/SLPVectorizer/X86/same-scalar-in-same-phi-extract.ll b/llvm/test/Transforms/SLPVectorizer/X86/same-scalar-in-same-phi-extract.ll
index 8bcf650d41d931..f1be11d0d0fc51 100644
--- a/llvm/test/Transforms/SLPVectorizer/X86/same-scalar-in-same-phi-extract.ll
+++ b/llvm/test/Transforms/SLPVectorizer/X86/same-scalar-in-same-phi-extract.ll
@@ -5,7 +5,6 @@ define void @test(i32 %arg) {
; CHECK-LABEL: define void @test(
; CHECK-SAME: i32 [[ARG:%.*]]) {
; CHECK-NEXT: bb:
-; CHECK-NEXT: [[TMP2:%.*]] = zext i32 [[ARG]] to i64
; CHECK-NEXT: [[TMP0:%.*]] = insertelement <2 x i32> <i32 poison, i32 0>, i32 [[ARG]], i32 0
; CHECK-NEXT: br label [[BB2:%.*]]
; CHECK: bb2:
@@ -15,6 +14,8 @@ define void @test(i32 %arg) {
; CHECK-NEXT: i32 1, label [[BB4:%.*]]
; CHECK-NEXT: ]
; CHECK: bb3:
+; CHECK-NEXT: [[TMP1:%.*]] = extractelement <2 x i32> [[TMP0]], i32 0
+; CHECK-NEXT: [[TMP2:%.*]] = zext i32 [[TMP1]] to i64
; CHECK-NEXT: switch i32 0, label [[BB10]] [
; CHECK-NEXT: i32 18, label [[BB7:%.*]]
; CHECK-NEXT: i32 1, label [[BB7]]
More information about the llvm-commits mailing list