[llvm] r328546 - [SLP] Add a test case. NFC.
Haicheng Wu via llvm-commits
llvm-commits at lists.llvm.org
Mon Mar 26 09:47:37 PDT 2018
Author: haicheng
Date: Mon Mar 26 09:47:37 2018
New Revision: 328546
URL: http://llvm.org/viewvc/llvm-project?rev=328546&view=rev
Log:
[SLP] Add a test case. NFC.
Added:
llvm/trunk/test/Transforms/SLPVectorizer/AArch64/ext-trunc.ll
Added: llvm/trunk/test/Transforms/SLPVectorizer/AArch64/ext-trunc.ll
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/Transforms/SLPVectorizer/AArch64/ext-trunc.ll?rev=328546&view=auto
==============================================================================
--- llvm/trunk/test/Transforms/SLPVectorizer/AArch64/ext-trunc.ll (added)
+++ llvm/trunk/test/Transforms/SLPVectorizer/AArch64/ext-trunc.ll Mon Mar 26 09:47:37 2018
@@ -0,0 +1,38 @@
+; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
+; RUN: opt -S -slp-vectorizer -mtriple=aarch64--linux-gnu -instcombine < %s | FileCheck %s
+
+target datalayout = "e-m:e-i32:64-i128:128-n32:64-S128"
+
+declare void @foo(i64, i64, i64, i64)
+
+define void @test(<4 x i16> %a, <4 x i16> %b, i64* %p) {
+; Intent: the sub and its zext sources should keep their original types (not be extended). NOTE(review): the assertions below expect <4 x i64> while the input IR uses <4 x i32> -- presumably they record the tool output at the time of this commit; confirm.
+; CHECK-LABEL: @test(
+; CHECK-NEXT: entry:
+; CHECK-NEXT: [[Z0:%.*]] = zext <4 x i16> [[A:%.*]] to <4 x i64>
+; CHECK-NEXT: [[Z1:%.*]] = zext <4 x i16> [[B:%.*]] to <4 x i64>
+; CHECK-NEXT: [[SUB0:%.*]] = sub nsw <4 x i64> [[Z0]], [[Z1]]
+;
+entry:
+ %z0 = zext <4 x i16> %a to <4 x i32>
+ %z1 = zext <4 x i16> %b to <4 x i32>
+ %sub0 = sub <4 x i32> %z0, %z1
+ %e0 = extractelement <4 x i32> %sub0, i32 0
+ %s0 = sext i32 %e0 to i64
+ %gep0 = getelementptr inbounds i64, i64* %p, i64 %s0
+ %load0 = load i64, i64* %gep0
+ %e1 = extractelement <4 x i32> %sub0, i32 1
+ %s1 = sext i32 %e1 to i64
+ %gep1 = getelementptr inbounds i64, i64* %p, i64 %s1
+ %load1 = load i64, i64* %gep1
+ %e2 = extractelement <4 x i32> %sub0, i32 2
+ %s2 = sext i32 %e2 to i64
+ %gep2 = getelementptr inbounds i64, i64* %p, i64 %s2
+ %load2 = load i64, i64* %gep2
+ %e3 = extractelement <4 x i32> %sub0, i32 3
+ %s3 = sext i32 %e3 to i64
+ %gep3 = getelementptr inbounds i64, i64* %p, i64 %s3
+ %load3 = load i64, i64* %gep3
+ call void @foo(i64 %load0, i64 %load1, i64 %load2, i64 %load3)
+ ret void
+}
More information about the llvm-commits mailing list