[llvm] 411deb9 - [DAG] ScalarizeVectorResult - add ISD::MULHS/ISD::MULHU handling
Simon Pilgrim via llvm-commits
llvm-commits at lists.llvm.org
Thu Jun 22 03:11:02 PDT 2023
Author: Simon Pilgrim
Date: 2023-06-22T11:09:55+01:00
New Revision: 411deb97cfaf0266b5283c99aa6e9748763ced0c
URL: https://github.com/llvm/llvm-project/commit/411deb97cfaf0266b5283c99aa6e9748763ced0c
DIFF: https://github.com/llvm/llvm-project/commit/411deb97cfaf0266b5283c99aa6e9748763ced0c.diff
LOG: [DAG] ScalarizeVectorResult - add ISD::MULHS/ISD::MULHU handling
Fixes #63439
Added:
llvm/test/CodeGen/X86/pr63439.ll
Modified:
llvm/lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp
Removed:
################################################################################
diff --git a/llvm/lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp b/llvm/lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp
index 1a29aaff1b8c7..8b546ee415728 100644
--- a/llvm/lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp
+++ b/llvm/lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp
@@ -143,6 +143,8 @@ void DAGTypeLegalizer::ScalarizeVectorResult(SDNode *N, unsigned ResNo) {
case ISD::FREM:
case ISD::FSUB:
case ISD::MUL:
+ case ISD::MULHS:
+ case ISD::MULHU:
case ISD::OR:
case ISD::SDIV:
case ISD::SREM:
diff --git a/llvm/test/CodeGen/X86/pr63439.ll b/llvm/test/CodeGen/X86/pr63439.ll
new file mode 100644
index 0000000000000..155da0c629127
--- /dev/null
+++ b/llvm/test/CodeGen/X86/pr63439.ll
@@ -0,0 +1,52 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+; RUN: llc < %s -mtriple=x86_64-- -mattr=+sse4.1 | FileCheck %s --check-prefixes=CHECK,SSE
+; RUN: llc < %s -mtriple=x86_64-- -mattr=+avx2 | FileCheck %s --check-prefixes=CHECK,AVX
+
+define i16 @mulhs(i16 %a0, i16 %a1) {
+; CHECK-LABEL: mulhs:
+; CHECK: # %bb.0:
+; CHECK-NEXT: movswl %si, %ecx
+; CHECK-NEXT: movswl %di, %eax
+; CHECK-NEXT: imull %ecx, %eax
+; CHECK-NEXT: shrl $16, %eax
+; CHECK-NEXT: # kill: def $ax killed $ax killed $eax
+; CHECK-NEXT: retq
+ %x0 = sext i16 %a0 to i32
+ %x1 = sext i16 %a1 to i32
+ %v0 = insertelement <1 x i32> <i32 undef>, i32 %x0, i32 0
+ %v1 = insertelement <1 x i32> <i32 undef>, i32 %x1, i32 0
+ %mul = mul nsw <1 x i32> %v0, %v1
+ %lshr = lshr <1 x i32> %mul, <i32 16>
+ %trunc = trunc <1 x i32> %lshr to <1 x i16>
+ %res = extractelement <1 x i16> %trunc, i32 0
+ ret i16 %res
+}
+
+define i16 @mulhu(i16 %a0, i16 %a1) {
+; SSE-LABEL: mulhu:
+; SSE: # %bb.0:
+; SSE-NEXT: movzwl %si, %ecx
+; SSE-NEXT: movzwl %di, %eax
+; SSE-NEXT: imull %ecx, %eax
+; SSE-NEXT: shrl $16, %eax
+; SSE-NEXT: # kill: def $ax killed $ax killed $eax
+; SSE-NEXT: retq
+;
+; AVX-LABEL: mulhu:
+; AVX: # %bb.0:
+; AVX-NEXT: vmovd %edi, %xmm0
+; AVX-NEXT: vmovd %esi, %xmm1
+; AVX-NEXT: vpmulhuw %xmm1, %xmm0, %xmm0
+; AVX-NEXT: vmovd %xmm0, %eax
+; AVX-NEXT: # kill: def $ax killed $ax killed $eax
+; AVX-NEXT: retq
+ %x0 = zext i16 %a0 to i32
+ %x1 = zext i16 %a1 to i32
+ %v0 = insertelement <1 x i32> <i32 undef>, i32 %x0, i32 0
+ %v1 = insertelement <1 x i32> <i32 undef>, i32 %x1, i32 0
+ %mul = mul nsw <1 x i32> %v0, %v1
+ %lshr = lshr <1 x i32> %mul, <i32 16>
+ %trunc = trunc <1 x i32> %lshr to <1 x i16>
+ %res = extractelement <1 x i16> %trunc, i32 0
+ ret i16 %res
+}
More information about the llvm-commits
mailing list