[llvm] r368575 - [X86][SSE] Add test showing missing demanded elts PSADBW handling

Simon Pilgrim via llvm-commits llvm-commits at lists.llvm.org
Mon Aug 12 07:01:16 PDT 2019


Author: rksimon
Date: Mon Aug 12 07:01:16 2019
New Revision: 368575

URL: http://llvm.org/viewvc/llvm-project?rev=368575&view=rev
Log:
[X86][SSE] Add test showing missing demanded elts PSADBW handling

Modified:
    llvm/trunk/test/CodeGen/X86/psadbw.ll

Modified: llvm/trunk/test/CodeGen/X86/psadbw.ll
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/CodeGen/X86/psadbw.ll?rev=368575&r1=368574&r2=368575&view=diff
==============================================================================
--- llvm/trunk/test/CodeGen/X86/psadbw.ll (original)
+++ llvm/trunk/test/CodeGen/X86/psadbw.ll Mon Aug 12 07:01:16 2019
@@ -13,5 +13,31 @@ define <2 x i64> @combine_psadbw_shift(<
   ret <2 x i64> %4
 }
 
+; Only result element 0 is demanded, and it depends solely on the low 8 bytes of each source, so the shuffles of the upper 8 bytes should fold away.
+define i64 @combine_psadbw_demandedelt(<16 x i8> %0, <16 x i8> %1) {
+; X86-LABEL: combine_psadbw_demandedelt:
+; X86:       # %bb.0:
+; X86-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[0,1,3,2]
+; X86-NEXT:    pshufd {{.*#+}} xmm1 = xmm1[0,1,3,2]
+; X86-NEXT:    psadbw %xmm0, %xmm1
+; X86-NEXT:    movd %xmm1, %eax
+; X86-NEXT:    pshufd {{.*#+}} xmm0 = xmm1[1,1,2,3]
+; X86-NEXT:    movd %xmm0, %edx
+; X86-NEXT:    retl
+;
+; X64-LABEL: combine_psadbw_demandedelt:
+; X64:       # %bb.0:
+; X64-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[0,1,3,2]
+; X64-NEXT:    pshufd {{.*#+}} xmm1 = xmm1[0,1,3,2]
+; X64-NEXT:    psadbw %xmm0, %xmm1
+; X64-NEXT:    movq %xmm1, %rax
+; X64-NEXT:    retq
+  %3 = shufflevector <16 x i8> %0, <16 x i8> %0, <16 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 12, i32 13, i32 14, i32 15, i32 8, i32 9, i32 10, i32 11>
+  %4 = shufflevector <16 x i8> %1, <16 x i8> %1, <16 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 12, i32 13, i32 14, i32 15, i32 8, i32 9, i32 10, i32 11>
+  %5 = tail call <2 x i64> @llvm.x86.sse2.psad.bw(<16 x i8> %3, <16 x i8> %4)
+  %6 = extractelement <2 x i64> %5, i32 0
+  ret i64 %6
+}
+
 declare <2 x i64> @llvm.x86.sse2.psad.bw(<16 x i8>, <16 x i8>)
 




More information about the llvm-commits mailing list