[llvm] 9e83333 - [AArch64][SelectionDAG] Eliminates redundant zero-extension for 32-bit popcount
via llvm-commits
llvm-commits at lists.llvm.org
Mon Jan 9 00:08:46 PST 2023
Author: zhongyunde
Date: 2023-01-09T16:08:16+08:00
New Revision: 9e83333445715e737ea78e42e082c99c8ebcb7df
URL: https://github.com/llvm/llvm-project/commit/9e83333445715e737ea78e42e082c99c8ebcb7df
DIFF: https://github.com/llvm/llvm-project/commit/9e83333445715e737ea78e42e082c99c8ebcb7df.diff
LOG: [AArch64][SelectionDAG] Eliminates redundant zero-extension for 32-bit popcount
Fix https://github.com/llvm/llvm-project/issues/59597.
mov w8, w0 + fmov d0, x8 ==> fmov s0, w0
Reviewed By: dmgreen, efriedma
Differential Revision: https://reviews.llvm.org/D140649
Added:
Modified:
llvm/lib/Target/AArch64/AArch64InstrInfo.td
llvm/test/CodeGen/AArch64/arm64-popcnt.ll
Removed:
################################################################################
diff --git a/llvm/lib/Target/AArch64/AArch64InstrInfo.td b/llvm/lib/Target/AArch64/AArch64InstrInfo.td
index 66b03eaae5ffc..de9da9e09f3b1 100644
--- a/llvm/lib/Target/AArch64/AArch64InstrInfo.td
+++ b/llvm/lib/Target/AArch64/AArch64InstrInfo.td
@@ -5843,6 +5843,10 @@ def : Pat<(v8i8 (scalar_to_vector GPR32:$Rn)),
(SUBREG_TO_REG (i32 0),
(f32 (COPY_TO_REGCLASS GPR32:$Rn, FPR32)), ssub)>;
+// The top bits will be zero from the FMOVWSr
+def : Pat<(v8i8 (bitconvert (i64 (zext GPR32:$Rn)))),
+ (SUBREG_TO_REG (i32 0), (f32 (FMOVWSr GPR32:$Rn)), ssub)>;
+
def : Pat<(v8i16 (scalar_to_vector GPR32:$Rn)),
(SUBREG_TO_REG (i32 0),
(f32 (COPY_TO_REGCLASS GPR32:$Rn, FPR32)), ssub)>;
diff --git a/llvm/test/CodeGen/AArch64/arm64-popcnt.ll b/llvm/test/CodeGen/AArch64/arm64-popcnt.ll
index 2a4b30a9078d0..a1ee453e8d6a5 100644
--- a/llvm/test/CodeGen/AArch64/arm64-popcnt.ll
+++ b/llvm/test/CodeGen/AArch64/arm64-popcnt.ll
@@ -6,8 +6,7 @@
define i32 @cnt32_advsimd(i32 %x) nounwind readnone {
; CHECK-LABEL: cnt32_advsimd:
; CHECK: // %bb.0:
-; CHECK-NEXT: mov w8, w0
-; CHECK-NEXT: fmov d0, x8
+; CHECK-NEXT: fmov s0, w0
; CHECK-NEXT: cnt.8b v0, v0
; CHECK-NEXT: uaddlv.8b h0, v0
; CHECK-NEXT: fmov w0, s0
@@ -42,7 +41,7 @@ define i32 @cnt32_advsimd_2(<2 x i32> %x) {
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $d0 killed $d0 def $q0
; CHECK-NEXT: fmov w8, s0
-; CHECK-NEXT: fmov d0, x8
+; CHECK-NEXT: fmov s0, w8
; CHECK-NEXT: cnt.8b v0, v0
; CHECK-NEXT: uaddlv.8b h0, v0
; CHECK-NEXT: fmov w0, s0
@@ -267,6 +266,13 @@ define i1 @ctpop32_ne_one(i32 %x) nounwind readnone {
; CHECK-NONEON-NEXT: ccmp w0, #0, #4, eq
; CHECK-NONEON-NEXT: cset w0, eq
; CHECK-NONEON-NEXT: ret
+;
+; CHECK-CSSC-LABEL: ctpop32_ne_one:
+; CHECK-CSSC: // %bb.0:
+; CHECK-CSSC-NEXT: cnt w8, w0
+; CHECK-CSSC-NEXT: cmp w8, #1
+; CHECK-CSSC-NEXT: cset w0, ne
+; CHECK-CSSC-NEXT: ret
%count = tail call i32 @llvm.ctpop.i32(i32 %x)
%cmp = icmp ne i32 %count, 1
ret i1 %cmp
More information about the llvm-commits
mailing list