[llvm] [GISel][AMDGPU] Expand ShuffleVector (PR #124527)
Matt Arsenault via llvm-commits
llvm-commits at lists.llvm.org
Sun Feb 16 04:35:33 PST 2025
================
@@ -384,6 +384,69 @@ void CombinerHelper::applyCombineConcatVectors(
MI.eraseFromParent();
}
+bool CombinerHelper::matchCombineShuffleExtract(MachineInstr &MI,
+ int64_t &Idx) const {
+ assert(MI.getOpcode() == TargetOpcode::G_SHUFFLE_VECTOR &&
+ "Invalid instruction");
+ auto &Shuffle = cast<GShuffleVector>(MI);
+
+ auto SrcVec1 = Shuffle.getSrc1Reg();
+ int SrcVec2 = Shuffle.getSrc2Reg();
+
+ LLT SrcVec1Type = MRI.getType(SrcVec1);
+ LLT SrcVec2Type = MRI.getType(SrcVec2);
+ if (!SrcVec1Type.isVector() || !SrcVec2Type.isVector()) {
+ return false;
+ }
+
+ auto Mask = Shuffle.getMask();
+ int Width = MRI.getType(SrcVec1).getNumElements();
+ int Width2 = MRI.getType(SrcVec2).getNumElements();
+
+ if (!llvm::isPowerOf2_32(Width))
+ return false;
+
+ // Check if all elements are extracted from the same vector, or within single
+ // vector.
+ auto MaxValue = *std::max_element(Mask.begin(), Mask.end());
+ auto MinValue = *std::min_element(Mask.begin(), Mask.end());
+ if (MaxValue >= Width && MinValue < Width) {
+ return false;
+ }
+
+ // Check that the extractee length is power of 2.
+ if ((MaxValue < Width && !llvm::isPowerOf2_32(Width)) ||
+ (MinValue >= Width && !llvm::isPowerOf2_32(Width2))) {
+ return false;
+ }
+
+ // Check if the extractee's order is kept, and they should be consecutive.
+ for (size_t i = 1; i < Mask.size(); ++i) {
+ if (Mask[i] != Mask[i - 1] + 1) {
+ return false; // Not consecutive
+ }
+ }
+
+ Idx = Mask.front();
+ return true;
+}
+
+void CombinerHelper::applyCombineShuffleExtract(MachineInstr &MI,
+ int64_t Idx) const {
+ auto &Shuffle = cast<GShuffleVector>(MI);
+
+ auto SrcVec1 = Shuffle.getSrc1Reg();
+ auto SrcVec2 = Shuffle.getSrc2Reg();
+ auto EltTy = MRI.getType(SrcVec1).getElementType();
+ int Width = MRI.getType(SrcVec1).getNumElements();
+
+ auto SrcVec = Idx < Width ? SrcVec1 : SrcVec2;
+
+ Builder.buildExtract(MI.getOperand(0).getReg(), SrcVec,
----------------
arsenm wrote:
No, G_EXTRACT. G_EXTRACT_SUBVECTOR and G_EXTRACT_VECTOR_ELT are better defined, typed operations
https://github.com/llvm/llvm-project/pull/124527
More information about the llvm-commits
mailing list