[llvm] 6c59dfb - [X86] Add test showing failure to remove freeze from all_of pattern
Simon Pilgrim via llvm-commits
llvm-commits at lists.llvm.org
Tue Sep 3 02:16:15 PDT 2024
Author: Simon Pilgrim
Date: 2024-09-03T10:15:51+01:00
New Revision: 6c59dfb0184aa11ec202f1cd8aee9e971a1565a4
URL: https://github.com/llvm/llvm-project/commit/6c59dfb0184aa11ec202f1cd8aee9e971a1565a4
DIFF: https://github.com/llvm/llvm-project/commit/6c59dfb0184aa11ec202f1cd8aee9e971a1565a4.diff
LOG: [X86] Add test showing failure to remove freeze from all_of pattern
Added:
Modified:
llvm/test/CodeGen/X86/movmsk-cmp.ll
Removed:
################################################################################
diff --git a/llvm/test/CodeGen/X86/movmsk-cmp.ll b/llvm/test/CodeGen/X86/movmsk-cmp.ll
index 253f990f8735ee..5bc2e12d502dc4 100644
--- a/llvm/test/CodeGen/X86/movmsk-cmp.ll
+++ b/llvm/test/CodeGen/X86/movmsk-cmp.ll
@@ -4425,6 +4425,61 @@ define i32 @PR39665_c_ray_opt(<2 x double> %x, <2 x double> %y) {
ret i32 %r
}
+define i32 @PR39665_c_ray_select(<2 x double> %x, <2 x double> %y) {
+; SSE-LABEL: PR39665_c_ray_select:
+; SSE: # %bb.0:
+; SSE-NEXT: cmpltpd %xmm0, %xmm1
+; SSE-NEXT: psllq $63, %xmm1
+; SSE-NEXT: movmskpd %xmm1, %eax
+; SSE-NEXT: cmpl $3, %eax
+; SSE-NEXT: movl $42, %ecx
+; SSE-NEXT: movl $99, %eax
+; SSE-NEXT: cmovel %ecx, %eax
+; SSE-NEXT: retq
+;
+; AVX1OR2-LABEL: PR39665_c_ray_select:
+; AVX1OR2: # %bb.0:
+; AVX1OR2-NEXT: vcmpltpd %xmm0, %xmm1, %xmm0
+; AVX1OR2-NEXT: vpsllq $63, %xmm0, %xmm0
+; AVX1OR2-NEXT: vpcmpeqd %xmm1, %xmm1, %xmm1
+; AVX1OR2-NEXT: vtestpd %xmm1, %xmm0
+; AVX1OR2-NEXT: movl $42, %ecx
+; AVX1OR2-NEXT: movl $99, %eax
+; AVX1OR2-NEXT: cmovbl %ecx, %eax
+; AVX1OR2-NEXT: retq
+;
+; KNL-LABEL: PR39665_c_ray_select:
+; KNL: # %bb.0:
+; KNL-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1
+; KNL-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0
+; KNL-NEXT: vcmpltpd %zmm0, %zmm1, %k0
+; KNL-NEXT: knotw %k0, %k0
+; KNL-NEXT: kmovw %k0, %eax
+; KNL-NEXT: testb $3, %al
+; KNL-NEXT: movl $42, %ecx
+; KNL-NEXT: movl $99, %eax
+; KNL-NEXT: cmovel %ecx, %eax
+; KNL-NEXT: vzeroupper
+; KNL-NEXT: retq
+;
+; SKX-LABEL: PR39665_c_ray_select:
+; SKX: # %bb.0:
+; SKX-NEXT: vcmpltpd %xmm0, %xmm1, %k0
+; SKX-NEXT: knotw %k0, %k0
+; SKX-NEXT: kmovd %k0, %eax
+; SKX-NEXT: testb $3, %al
+; SKX-NEXT: movl $42, %ecx
+; SKX-NEXT: movl $99, %eax
+; SKX-NEXT: cmovel %ecx, %eax
+; SKX-NEXT: retq
+ %cmp = fcmp fast ogt <2 x double> %x, %y
+ %b0 = extractelement <2 x i1> %cmp, i64 0
+ %b1 = extractelement <2 x i1> %cmp, i64 1
+ %b = select i1 %b0, i1 %b1, i1 false
+ %r = select i1 %b, i32 42, i32 99
+ ret i32 %r
+}
+
define i32 @pr67287(<2 x i64> %broadcast.splatinsert25) {
; SSE2-LABEL: pr67287:
; SSE2: # %bb.0: # %entry
@@ -4438,10 +4493,10 @@ define i32 @pr67287(<2 x i64> %broadcast.splatinsert25) {
; SSE2-NEXT: movd %xmm1, %ecx
; SSE2-NEXT: orb %al, %cl
; SSE2-NEXT: testb $1, %cl
-; SSE2-NEXT: je .LBB97_2
+; SSE2-NEXT: je .LBB98_2
; SSE2-NEXT: # %bb.1:
; SSE2-NEXT: movw $0, 0
-; SSE2-NEXT: .LBB97_2: # %middle.block
+; SSE2-NEXT: .LBB98_2: # %middle.block
; SSE2-NEXT: xorl %eax, %eax
; SSE2-NEXT: retq
;
@@ -4456,10 +4511,10 @@ define i32 @pr67287(<2 x i64> %broadcast.splatinsert25) {
; SSE41-NEXT: movd %xmm0, %ecx
; SSE41-NEXT: orb %al, %cl
; SSE41-NEXT: testb $1, %cl
-; SSE41-NEXT: je .LBB97_2
+; SSE41-NEXT: je .LBB98_2
; SSE41-NEXT: # %bb.1:
; SSE41-NEXT: movw $0, 0
-; SSE41-NEXT: .LBB97_2: # %middle.block
+; SSE41-NEXT: .LBB98_2: # %middle.block
; SSE41-NEXT: xorl %eax, %eax
; SSE41-NEXT: retq
;
@@ -4473,10 +4528,10 @@ define i32 @pr67287(<2 x i64> %broadcast.splatinsert25) {
; AVX1-NEXT: vmovd %xmm0, %ecx
; AVX1-NEXT: orb %al, %cl
; AVX1-NEXT: testb $1, %cl
-; AVX1-NEXT: je .LBB97_2
+; AVX1-NEXT: je .LBB98_2
; AVX1-NEXT: # %bb.1:
; AVX1-NEXT: movw $0, 0
-; AVX1-NEXT: .LBB97_2: # %middle.block
+; AVX1-NEXT: .LBB98_2: # %middle.block
; AVX1-NEXT: xorl %eax, %eax
; AVX1-NEXT: retq
;
@@ -4490,10 +4545,10 @@ define i32 @pr67287(<2 x i64> %broadcast.splatinsert25) {
; AVX2-NEXT: vmovd %xmm0, %ecx
; AVX2-NEXT: orb %al, %cl
; AVX2-NEXT: testb $1, %cl
-; AVX2-NEXT: je .LBB97_2
+; AVX2-NEXT: je .LBB98_2
; AVX2-NEXT: # %bb.1:
; AVX2-NEXT: movw $0, 0
-; AVX2-NEXT: .LBB97_2: # %middle.block
+; AVX2-NEXT: .LBB98_2: # %middle.block
; AVX2-NEXT: xorl %eax, %eax
; AVX2-NEXT: retq
;
@@ -4508,10 +4563,10 @@ define i32 @pr67287(<2 x i64> %broadcast.splatinsert25) {
; KNL-NEXT: setne %cl
; KNL-NEXT: orb %cl, %al
; KNL-NEXT: testb $1, %al
-; KNL-NEXT: je .LBB97_2
+; KNL-NEXT: je .LBB98_2
; KNL-NEXT: # %bb.1:
; KNL-NEXT: movw $0, 0
-; KNL-NEXT: .LBB97_2: # %middle.block
+; KNL-NEXT: .LBB98_2: # %middle.block
; KNL-NEXT: xorl %eax, %eax
; KNL-NEXT: vzeroupper
; KNL-NEXT: retq
@@ -4526,10 +4581,10 @@ define i32 @pr67287(<2 x i64> %broadcast.splatinsert25) {
; SKX-NEXT: kmovd %k0, %ecx
; SKX-NEXT: orb %al, %cl
; SKX-NEXT: testb $1, %cl
-; SKX-NEXT: je .LBB97_2
+; SKX-NEXT: je .LBB98_2
; SKX-NEXT: # %bb.1:
; SKX-NEXT: movw $0, 0
-; SKX-NEXT: .LBB97_2: # %middle.block
+; SKX-NEXT: .LBB98_2: # %middle.block
; SKX-NEXT: xorl %eax, %eax
; SKX-NEXT: retq
entry:
More information about the llvm-commits
mailing list