[llvm] [X86] Add growShuffleMask helper to grow the shuffle mask for a larger value type. NFC. (PR #134243)
Simon Pilgrim via llvm-commits
llvm-commits at lists.llvm.org
Thu Apr 3 05:49:27 PDT 2025
https://github.com/RKSimon created https://github.com/llvm/llvm-project/pull/134243
Prep work for #133947
>From 8440fe71948e3a09f7b7d0552ad4b5cd2313a467 Mon Sep 17 00:00:00 2001
From: Simon Pilgrim <llvm-dev at redking.me.uk>
Date: Thu, 3 Apr 2025 13:45:40 +0100
Subject: [PATCH] [X86] Add growShuffleMask helper to grow the shuffle mask for
a larger value type. NFC.
Prep work for #133947
---
llvm/lib/Target/X86/X86ISelLowering.cpp | 28 ++++++++++++++++++-------
1 file changed, 20 insertions(+), 8 deletions(-)
diff --git a/llvm/lib/Target/X86/X86ISelLowering.cpp b/llvm/lib/Target/X86/X86ISelLowering.cpp
index 8271d9c486650..d1be19539b642 100644
--- a/llvm/lib/Target/X86/X86ISelLowering.cpp
+++ b/llvm/lib/Target/X86/X86ISelLowering.cpp
@@ -3941,6 +3941,24 @@ static bool canScaleShuffleElements(ArrayRef<int> Mask, unsigned NumDstElts) {
return scaleShuffleElements(Mask, NumDstElts, ScaledMask);
}
+// Helper to grow the shuffle mask for a larger value type.
+// NOTE: This is different to scaleShuffleElements which is a same size type.
+static void growShuffleMask(ArrayRef<int> SrcMask,
+ SmallVectorImpl<int> &DstMask,
+ unsigned SrcSizeInBits, unsigned DstSizeInBits) {
+ assert(DstMask.empty() && "Expected an empty shuffle mas");
+ assert((DstSizeInBits % SrcSizeInBits) == 0 && "Illegal shuffle scale");
+ unsigned Scale = DstSizeInBits / SrcSizeInBits;
+ unsigned NumSrcElts = SrcMask.size();
+ DstMask.assign(SrcMask.begin(), SrcMask.end());
+ for (int &M : DstMask) {
+ if (M < 0)
+ continue;
+ M = (M % NumSrcElts) + ((M / NumSrcElts) * Scale * NumSrcElts);
+ }
+ DstMask.append((Scale - 1) * NumSrcElts, SM_SentinelUndef);
+}
+
/// Returns true if Elt is a constant zero or a floating point constant +0.0.
bool X86::isZeroNode(SDValue Elt) {
return isNullConstant(Elt) || isNullFPConstant(Elt);
@@ -40456,19 +40474,13 @@ static SDValue combineX86ShuffleChainWithExtract(
}
// Bail if we fail to find a source larger than the existing root.
- unsigned Scale = WideSizeInBits / RootSizeInBits;
if (WideSizeInBits <= RootSizeInBits ||
(WideSizeInBits % RootSizeInBits) != 0)
return SDValue();
// Create new mask for larger type.
- SmallVector<int, 64> WideMask(BaseMask);
- for (int &M : WideMask) {
- if (M < 0)
- continue;
- M = (M % NumMaskElts) + ((M / NumMaskElts) * Scale * NumMaskElts);
- }
- WideMask.append((Scale - 1) * NumMaskElts, SM_SentinelUndef);
+ SmallVector<int, 64> WideMask;
+ growShuffleMask(BaseMask, WideMask, RootSizeInBits, WideSizeInBits);
// Attempt to peek through inputs and adjust mask when we extract from an
// upper subvector.
More information about the llvm-commits
mailing list