[PATCH] D145678: [RISCV] Model interleave and deinterleave shuffles in cost model
Luke Lau via Phabricator via llvm-commits
llvm-commits at lists.llvm.org
Thu Mar 9 17:10:10 PST 2023
This revision was automatically updated to reflect the committed changes.
Closed by commit rGc417266db506: [RISCV] Model interleave and deinterleave shuffles in cost model (authored by luke).
Repository:
rG LLVM Github Monorepo
CHANGES SINCE LAST ACTION
https://reviews.llvm.org/D145678/new/
https://reviews.llvm.org/D145678
Files:
llvm/lib/Target/RISCV/RISCVTargetTransformInfo.cpp
llvm/test/Analysis/CostModel/RISCV/shuffle-interleave.ll
Index: llvm/test/Analysis/CostModel/RISCV/shuffle-interleave.ll
===================================================================
--- llvm/test/Analysis/CostModel/RISCV/shuffle-interleave.ll
+++ llvm/test/Analysis/CostModel/RISCV/shuffle-interleave.ll
@@ -4,7 +4,7 @@
define <8 x i8> @interleave2_v8i8(<4 x i8> %v0, <4 x i8> %v1) {
; CHECK-LABEL: 'interleave2_v8i8'
; CHECK-NEXT: Cost Model: Found an estimated cost of 15 for instruction: %concat = shufflevector <4 x i8> %v0, <4 x i8> %v1, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
-; CHECK-NEXT: Cost Model: Found an estimated cost of 30 for instruction: %res = shufflevector <8 x i8> %concat, <8 x i8> poison, <8 x i32> <i32 0, i32 4, i32 1, i32 5, i32 2, i32 6, i32 3, i32 7>
+; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %res = shufflevector <8 x i8> %concat, <8 x i8> poison, <8 x i32> <i32 0, i32 4, i32 1, i32 5, i32 2, i32 6, i32 3, i32 7>
; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret <8 x i8> %res
;
%concat = shufflevector <4 x i8> %v0, <4 x i8> %v1, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
@@ -15,7 +15,7 @@
define <8 x i32> @interleave2_v8i32(<4 x i32> %v0, <4 x i32> %v1) {
; CHECK-LABEL: 'interleave2_v8i32'
; CHECK-NEXT: Cost Model: Found an estimated cost of 15 for instruction: %concat = shufflevector <4 x i32> %v0, <4 x i32> %v1, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
-; CHECK-NEXT: Cost Model: Found an estimated cost of 30 for instruction: %res = shufflevector <8 x i32> %concat, <8 x i32> poison, <8 x i32> <i32 0, i32 4, i32 1, i32 5, i32 2, i32 6, i32 3, i32 7>
+; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %res = shufflevector <8 x i32> %concat, <8 x i32> poison, <8 x i32> <i32 0, i32 4, i32 1, i32 5, i32 2, i32 6, i32 3, i32 7>
; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret <8 x i32> %res
;
%concat = shufflevector <4 x i32> %v0, <4 x i32> %v1, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
Index: llvm/lib/Target/RISCV/RISCVTargetTransformInfo.cpp
===================================================================
--- llvm/lib/Target/RISCV/RISCVTargetTransformInfo.cpp
+++ llvm/lib/Target/RISCV/RISCVTargetTransformInfo.cpp
@@ -8,7 +8,9 @@
#include "RISCVTargetTransformInfo.h"
#include "MCTargetDesc/RISCVMatInt.h"
+#include "llvm/ADT/STLExtras.h"
#include "llvm/Analysis/TargetTransformInfo.h"
+#include "llvm/Analysis/VectorUtils.h"
#include "llvm/CodeGen/BasicTTIImpl.h"
#include "llvm/CodeGen/CostTable.h"
#include "llvm/CodeGen/TargetLowering.h"
@@ -323,6 +325,34 @@
return LT.first * getLMULCost(LT.second);
}
+ if (isa<FixedVectorType>(Tp) && Kind == TTI::SK_PermuteSingleSrc &&
+ Mask.size() >= 2) {
+ std::pair<InstructionCost, MVT> LT = getTypeLegalizationCost(Tp);
+ if (LT.second.isFixedLengthVector()) {
+ MVT EltTp = LT.second.getVectorElementType();
+ // If the size of the element is < ELEN then shuffles of interleaves and
+ // deinterleaves of 2 vectors can be lowered into the following sequences
+ if (EltTp.getScalarSizeInBits() < ST->getELEN()) {
+ auto InterleaveMask = createInterleaveMask(Mask.size() / 2, 2);
+ // Example sequence:
+ // vsetivli zero, 4, e8, mf4, ta, ma (ignored)
+ // vwaddu.vv v10, v8, v9
+ // li a0, -1 (ignored)
+ // vwmaccu.vx v10, a0, v9
+ if (equal(InterleaveMask, Mask))
+ return 2 * LT.first * getLMULCost(LT.second);
+
+ if (Mask[0] == 0 || Mask[0] == 1) {
+ auto DeinterleaveMask = createStrideMask(Mask[0], 2, Mask.size());
+ // Example sequence:
+ // vnsrl.wi v10, v8, 0
+ if (equal(DeinterleaveMask, Mask))
+ return LT.first * getLMULCost(LT.second);
+ }
+ }
+ }
+ }
+
return BaseT::getShuffleCost(Kind, Tp, Mask, CostKind, Index, SubTp);
}
-------------- next part --------------
A non-text attachment was scrubbed...
Name: D145678.503987.patch
Type: text/x-patch
Size: 4038 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/llvm-commits/attachments/20230310/3529ebc7/attachment.bin>
More information about the llvm-commits mailing list