[llvm] 4da6a98 - [X86] Add test case for Issue #59526

Simon Pilgrim via llvm-commits llvm-commits at lists.llvm.org
Thu Dec 15 08:21:58 PST 2022


Author: Simon Pilgrim
Date: 2022-12-15T16:19:41Z
New Revision: 4da6a983ad07cc777e7d0bdd593c4f275b42f2ee

URL: https://github.com/llvm/llvm-project/commit/4da6a983ad07cc777e7d0bdd593c4f275b42f2ee
DIFF: https://github.com/llvm/llvm-project/commit/4da6a983ad07cc777e7d0bdd593c4f275b42f2ee.diff

LOG: [X86] Add test case for Issue #59526

Added: 
    

Modified: 
    llvm/test/CodeGen/X86/bitcast-vector-bool.ll

Removed: 
    


################################################################################
diff  --git a/llvm/test/CodeGen/X86/bitcast-vector-bool.ll b/llvm/test/CodeGen/X86/bitcast-vector-bool.ll
index de132c1c7ef4..6d87c3101380 100644
--- a/llvm/test/CodeGen/X86/bitcast-vector-bool.ll
+++ b/llvm/test/CodeGen/X86/bitcast-vector-bool.ll
@@ -722,3 +722,74 @@ define [2 x i8] @PR58546(<16 x float> %a0) {
   %6 = insertvalue [2 x i8] %5, i8 %4, 1
   ret [2 x i8] %6
 }
+
+define i8 @PR59526(<8 x i32> %a, <8 x i32> %b, ptr %mask) { ; Issue #59526 test - returns 1 if any lane has %a == %b and a negative element loaded from %mask, else 0
+; SSE2-SSSE3-LABEL: PR59526:
+; SSE2-SSSE3:       # %bb.0:
+; SSE2-SSSE3-NEXT:    pcmpeqd %xmm3, %xmm1
+; SSE2-SSSE3-NEXT:    pcmpeqd %xmm2, %xmm0
+; SSE2-SSSE3-NEXT:    packssdw %xmm1, %xmm0
+; SSE2-SSSE3-NEXT:    movdqu (%rdi), %xmm1
+; SSE2-SSSE3-NEXT:    movdqu 16(%rdi), %xmm2
+; SSE2-SSSE3-NEXT:    pxor %xmm3, %xmm3
+; SSE2-SSSE3-NEXT:    pxor %xmm4, %xmm4
+; SSE2-SSSE3-NEXT:    pcmpgtd %xmm2, %xmm4
+; SSE2-SSSE3-NEXT:    pcmpgtd %xmm1, %xmm3
+; SSE2-SSSE3-NEXT:    packssdw %xmm4, %xmm3
+; SSE2-SSSE3-NEXT:    pand %xmm0, %xmm3
+; SSE2-SSSE3-NEXT:    pmovmskb %xmm3, %eax
+; SSE2-SSSE3-NEXT:    testl %eax, %eax
+; SSE2-SSSE3-NEXT:    setne %al
+; SSE2-SSSE3-NEXT:    retq
+;
+; AVX1-LABEL: PR59526:
+; AVX1:       # %bb.0:
+; AVX1-NEXT:    vpcmpeqd %xmm1, %xmm0, %xmm2
+; AVX1-NEXT:    vextractf128 $1, %ymm1, %xmm1
+; AVX1-NEXT:    vextractf128 $1, %ymm0, %xmm0
+; AVX1-NEXT:    vpcmpeqd %xmm1, %xmm0, %xmm0
+; AVX1-NEXT:    vpxor %xmm1, %xmm1, %xmm1
+; AVX1-NEXT:    vpcmpgtd (%rdi), %xmm1, %xmm3
+; AVX1-NEXT:    vpand %xmm3, %xmm2, %xmm2
+; AVX1-NEXT:    vpcmpgtd 16(%rdi), %xmm1, %xmm1
+; AVX1-NEXT:    vpand %xmm1, %xmm0, %xmm0
+; AVX1-NEXT:    vpackssdw %xmm0, %xmm2, %xmm0
+; AVX1-NEXT:    vpmovmskb %xmm0, %eax
+; AVX1-NEXT:    testl %eax, %eax
+; AVX1-NEXT:    setne %al
+; AVX1-NEXT:    vzeroupper
+; AVX1-NEXT:    retq
+;
+; AVX2-LABEL: PR59526:
+; AVX2:       # %bb.0:
+; AVX2-NEXT:    vpcmpeqd %ymm1, %ymm0, %ymm0
+; AVX2-NEXT:    vpxor %xmm1, %xmm1, %xmm1
+; AVX2-NEXT:    vpcmpgtd (%rdi), %ymm1, %ymm1
+; AVX2-NEXT:    vpand %ymm1, %ymm0, %ymm0
+; AVX2-NEXT:    vextracti128 $1, %ymm0, %xmm1
+; AVX2-NEXT:    vpackssdw %xmm1, %xmm0, %xmm0
+; AVX2-NEXT:    vpmovmskb %xmm0, %eax
+; AVX2-NEXT:    testl %eax, %eax
+; AVX2-NEXT:    setne %al
+; AVX2-NEXT:    vzeroupper
+; AVX2-NEXT:    retq
+;
+; AVX512-LABEL: PR59526:
+; AVX512:       # %bb.0:
+; AVX512-NEXT:    vpcmpeqd %ymm1, %ymm0, %k1
+; AVX512-NEXT:    vpxor %xmm0, %xmm0, %xmm0
+; AVX512-NEXT:    vpcmpgtd (%rdi), %ymm0, %k0 {%k1}
+; AVX512-NEXT:    kmovd %k0, %eax
+; AVX512-NEXT:    testb %al, %al
+; AVX512-NEXT:    setne %al
+; AVX512-NEXT:    vzeroupper
+; AVX512-NEXT:    retq
+  %cmp.eq = icmp eq <8 x i32> %a, %b ; per-lane %a == %b
+  %load = load <8 x i32>, ptr %mask, align 1 ; align 1, so no alignment is assumed for %mask
+  %cmp.slt = icmp slt <8 x i32> %load, zeroinitializer ; lane is true when the loaded element is negative
+  %sel = select <8 x i1> %cmp.eq, <8 x i1> %cmp.slt, <8 x i1> zeroinitializer ; per-lane cmp.eq ? cmp.slt : false, i.e. a logical AND written as a select
+  %bc = bitcast <8 x i1> %sel to i8 ; pack the eight i1 lanes into a single i8
+  %cmp = icmp ne i8 %bc, 0 ; true if any lane bit is set
+  %conv = zext i1 %cmp to i8 ; widen the i1 result to the i8 return type (0 or 1)
+  ret i8 %conv
+}


        


More information about the llvm-commits mailing list