[llvm] r272714 - [x86] add current codegen tests for PR27924
Sanjay Patel via llvm-commits
llvm-commits at lists.llvm.org
Tue Jun 14 14:25:46 PDT 2016
Author: spatel
Date: Tue Jun 14 16:25:46 2016
New Revision: 272714
URL: http://llvm.org/viewvc/llvm-project?rev=272714&view=rev
Log:
[x86] add current codegen tests for PR27924
Added:
llvm/trunk/test/CodeGen/X86/vector-compare-combines.ll
Added: llvm/trunk/test/CodeGen/X86/vector-compare-combines.ll
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/CodeGen/X86/vector-compare-combines.ll?rev=272714&view=auto
==============================================================================
--- llvm/trunk/test/CodeGen/X86/vector-compare-combines.ll (added)
+++ llvm/trunk/test/CodeGen/X86/vector-compare-combines.ll Tue Jun 14 16:25:46 2016
@@ -0,0 +1,51 @@
+; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
+; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse4.2 | FileCheck %s --check-prefix=SSE --check-prefix=SSE42
+; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx | FileCheck %s --check-prefix=AVX --check-prefix=AVX1
+
+; FIXME: If we have SSE/AVX intrinsics in the code, we miss obvious combines
+; unless we do them late on X86-specific nodes.
+
+declare <4 x i32> @llvm.x86.sse41.pmaxsd(<4 x i32>, <4 x i32>)
+
+define <4 x i32> @PR27924_cmpeq(<4 x i32> %a, <4 x i32> %b) {
+; SSE-LABEL: PR27924_cmpeq:
+; SSE: # BB#0:
+; SSE-NEXT: pmaxsd %xmm1, %xmm0
+; SSE-NEXT: pcmpeqd %xmm0, %xmm0
+; SSE-NEXT: retq
+;
+; AVX-LABEL: PR27924_cmpeq:
+; AVX: # BB#0:
+; AVX-NEXT: vpmaxsd %xmm1, %xmm0, %xmm0
+; AVX-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0
+; AVX-NEXT: retq
+;
+ %cmp = icmp sgt <4 x i32> %a, %b
+ %max = select <4 x i1> %cmp, <4 x i32> %a, <4 x i32> %b
+ %sse_max = tail call <4 x i32> @llvm.x86.sse41.pmaxsd(<4 x i32> %a, <4 x i32> %b)
+ %truth = icmp eq <4 x i32> %max, %sse_max
+ %ret = sext <4 x i1> %truth to <4 x i32>
+ ret <4 x i32> %ret
+}
+
+define <4 x i32> @PR27924_cmpgt(<4 x i32> %a, <4 x i32> %b) {
+; SSE-LABEL: PR27924_cmpgt:
+; SSE: # BB#0:
+; SSE-NEXT: pmaxsd %xmm1, %xmm0
+; SSE-NEXT: pcmpgtd %xmm0, %xmm0
+; SSE-NEXT: retq
+;
+; AVX-LABEL: PR27924_cmpgt:
+; AVX: # BB#0:
+; AVX-NEXT: vpmaxsd %xmm1, %xmm0, %xmm0
+; AVX-NEXT: vpcmpgtd %xmm0, %xmm0, %xmm0
+; AVX-NEXT: retq
+;
+ %cmp = icmp sgt <4 x i32> %a, %b
+ %max = select <4 x i1> %cmp, <4 x i32> %a, <4 x i32> %b
+ %sse_max = tail call <4 x i32> @llvm.x86.sse41.pmaxsd(<4 x i32> %a, <4 x i32> %b)
+ %untruth = icmp sgt <4 x i32> %max, %sse_max
+ %ret = sext <4 x i1> %untruth to <4 x i32>
+ ret <4 x i32> %ret
+}
+
More information about the llvm-commits
mailing list