[llvm] 8cf3988 - [X86] combineConcatVectorOps - add pmaddwd/pmaddubsw handling
Simon Pilgrim via llvm-commits
llvm-commits at lists.llvm.org
Fri Jun 21 05:25:46 PDT 2024
Author: Simon Pilgrim
Date: 2024-06-21T13:25:29+01:00
New Revision: 8cf39881d17becb1afef85190a602c4f76fe70d4
URL: https://github.com/llvm/llvm-project/commit/8cf39881d17becb1afef85190a602c4f76fe70d4
DIFF: https://github.com/llvm/llvm-project/commit/8cf39881d17becb1afef85190a602c4f76fe70d4.diff
LOG: [X86] combineConcatVectorOps - add pmaddwd/pmaddubsw handling
Added:
Modified:
llvm/lib/Target/X86/X86ISelLowering.cpp
llvm/test/CodeGen/X86/combine-pmadd.ll
Removed:
################################################################################
diff --git a/llvm/lib/Target/X86/X86ISelLowering.cpp b/llvm/lib/Target/X86/X86ISelLowering.cpp
index 2d5066dd8854c..f51a5e6c45184 100644
--- a/llvm/lib/Target/X86/X86ISelLowering.cpp
+++ b/llvm/lib/Target/X86/X86ISelLowering.cpp
@@ -55921,6 +55921,8 @@ static SDValue combineConcatVectorOps(const SDLoc &DL, MVT VT,
break;
case X86ISD::PSHUFB:
case X86ISD::PSADBW:
+ case X86ISD::VPMADDUBSW:
+ case X86ISD::VPMADDWD:
if (!IsSplat && ((VT.is256BitVector() && Subtarget.hasInt256()) ||
(VT.is512BitVector() && Subtarget.useBWIRegs()))) {
MVT SrcVT = Op0.getOperand(0).getSimpleValueType();
diff --git a/llvm/test/CodeGen/X86/combine-pmadd.ll b/llvm/test/CodeGen/X86/combine-pmadd.ll
index c4a28fe2eda34..c1bb310ec0119 100644
--- a/llvm/test/CodeGen/X86/combine-pmadd.ll
+++ b/llvm/test/CodeGen/X86/combine-pmadd.ll
@@ -51,9 +51,11 @@ define <8 x i32> @combine_pmaddwd_concat(<8 x i16> %a0, <8 x i16> %a1, <8 x i16>
;
; AVX2-LABEL: combine_pmaddwd_concat:
; AVX2: # %bb.0:
-; AVX2-NEXT: vpmaddwd %xmm1, %xmm0, %xmm0
-; AVX2-NEXT: vpmaddwd %xmm3, %xmm2, %xmm1
-; AVX2-NEXT: vinserti128 $1, %xmm1, %ymm0, %ymm0
+; AVX2-NEXT: # kill: def $xmm1 killed $xmm1 def $ymm1
+; AVX2-NEXT: # kill: def $xmm0 killed $xmm0 def $ymm0
+; AVX2-NEXT: vinserti128 $1, %xmm3, %ymm1, %ymm1
+; AVX2-NEXT: vinserti128 $1, %xmm2, %ymm0, %ymm0
+; AVX2-NEXT: vpmaddwd %ymm1, %ymm0, %ymm0
; AVX2-NEXT: retq
%1 = call <4 x i32> @llvm.x86.sse2.pmadd.wd(<8 x i16> %a0, <8 x i16> %a1)
%2 = call <4 x i32> @llvm.x86.sse2.pmadd.wd(<8 x i16> %a2, <8 x i16> %a3)
@@ -116,9 +118,11 @@ define <16 x i16> @combine_pmaddubsw_concat(<16 x i8> %a0, <16 x i8> %a1, <16 x
;
; AVX2-LABEL: combine_pmaddubsw_concat:
; AVX2: # %bb.0:
-; AVX2-NEXT: vpmaddubsw %xmm1, %xmm0, %xmm0
-; AVX2-NEXT: vpmaddubsw %xmm3, %xmm2, %xmm1
-; AVX2-NEXT: vinserti128 $1, %xmm1, %ymm0, %ymm0
+; AVX2-NEXT: # kill: def $xmm1 killed $xmm1 def $ymm1
+; AVX2-NEXT: # kill: def $xmm0 killed $xmm0 def $ymm0
+; AVX2-NEXT: vinserti128 $1, %xmm3, %ymm1, %ymm1
+; AVX2-NEXT: vinserti128 $1, %xmm2, %ymm0, %ymm0
+; AVX2-NEXT: vpmaddubsw %ymm1, %ymm0, %ymm0
; AVX2-NEXT: retq
%1 = call <8 x i16> @llvm.x86.ssse3.pmadd.ub.sw.128(<16 x i8> %a0, <16 x i8> %a1)
%2 = call <8 x i16> @llvm.x86.ssse3.pmadd.ub.sw.128(<16 x i8> %a2, <16 x i8> %a3)
More information about the llvm-commits
mailing list