[llvm] c40f4f2 - [SLP][NFC]Add a test for improved shuffles in buildvector sequences,
Alexey Bataev via llvm-commits
llvm-commits at lists.llvm.org
Tue May 10 05:53:09 PDT 2022
Author: Alexey Bataev
Date: 2022-05-10T05:51:44-07:00
New Revision: c40f4f2880f5b14344fbb5e2dc4486a6c11ab4dc
URL: https://github.com/llvm/llvm-project/commit/c40f4f2880f5b14344fbb5e2dc4486a6c11ab4dc
DIFF: https://github.com/llvm/llvm-project/commit/c40f4f2880f5b14344fbb5e2dc4486a6c11ab4dc.diff
LOG: [SLP][NFC]Add a test for improved shuffles in buildvector sequences,
NFC.
Added:
llvm/test/Transforms/SLPVectorizer/X86/buildvector-shuffle.ll
Modified:
Removed:
################################################################################
diff --git a/llvm/test/Transforms/SLPVectorizer/X86/buildvector-shuffle.ll b/llvm/test/Transforms/SLPVectorizer/X86/buildvector-shuffle.ll
new file mode 100644
index 000000000000..3b0ec888de66
--- /dev/null
+++ b/llvm/test/Transforms/SLPVectorizer/X86/buildvector-shuffle.ll
@@ -0,0 +1,89 @@
+; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
+; RUN: opt -S -slp-vectorizer -mtriple=x86_64-unknown-linux-gnu < %s | FileCheck %s
+
+define void @b() {
+; CHECK-LABEL: @b(
+; CHECK-NEXT: entry:
+; CHECK-NEXT: [[TMP0:%.*]] = insertelement <4 x float> poison, float 0x7FF8000000000000, i32 0
+; CHECK-NEXT: [[TMP1:%.*]] = shufflevector <4 x float> [[TMP0]], <4 x float> <float 0xFFF8000000000000, float 0xFFF8000000000000, float undef, float undef>, <4 x i32> <i32 0, i32 4, i32 5, i32 3>
+; CHECK-NEXT: [[TMP2:%.*]] = insertelement <4 x float> [[TMP1]], float 0x7FF8000000000000, i32 3
+; CHECK-NEXT: [[TMP3:%.*]] = call <4 x float> @llvm.fmuladd.v4f32(<4 x float> [[TMP2]], <4 x float> zeroinitializer, <4 x float> zeroinitializer)
+; CHECK-NEXT: [[TMP4:%.*]] = fmul <4 x float> [[TMP3]], <float undef, float undef, float undef, float 2.000000e+00>
+; CHECK-NEXT: [[TMP5:%.*]] = fdiv <4 x float> [[TMP4]], zeroinitializer
+; CHECK-NEXT: store <4 x float> [[TMP5]], ptr undef, align 4
+; CHECK-NEXT: ret void
+; Scalar input below: four fmuladd/fmul/fdiv chains stored to float slots 0-3 off one undef base pointer; the assertions above expect one <4 x float> chain and a single vector store.
+entry:
+ %mul = fmul float undef, 2.000000e+00 ; feeds slot 0 via %i and, negated, slot 2 via %neg7
+ %i = tail call float @llvm.fmuladd.f32(float %mul, float 0.000000e+00, float 0.000000e+00) ; slot 0 chain
+ %mul2 = fmul float undef, %i
+ %add = fadd float undef, 1.000000e+00 ; feeds slot 1 negated via %neg and slot 3 directly via %i3
+ %neg = fneg float %add
+ %i1 = tail call float @llvm.fmuladd.f32(float %neg, float 0.000000e+00, float 0.000000e+00) ; slot 1 chain
+ %mul4 = fmul float undef, %i1
+ %neg7 = fneg float %mul
+ %i2 = tail call float @llvm.fmuladd.f32(float %neg7, float 0.000000e+00, float 0.000000e+00) ; slot 2 chain
+ %mul8 = fmul float undef, %i2
+ %i3 = tail call float @llvm.fmuladd.f32(float %add, float 0.000000e+00, float 0.000000e+00) ; slot 3 chain
+ %mul11 = fmul float %i3, 2.000000e+00 ; only slot 3 multiplies the fmuladd result by the constant 2.0
+ %div = fdiv float %mul2, 0.000000e+00
+ store float %div, ptr undef, align 4 ; slot 0
+ %div12 = fdiv float %mul4, 0.000000e+00
+ %arrayidx13 = getelementptr inbounds float, ptr undef, i64 1
+ store float %div12, ptr %arrayidx13, align 4 ; slot 1
+ %div14 = fdiv float %mul8, 0.000000e+00
+ %arrayidx15 = getelementptr inbounds float, ptr undef, i64 2
+ store float %div14, ptr %arrayidx15, align 4 ; slot 2
+ %div16 = fdiv float %mul11, 0.000000e+00
+ %arrayidx17 = getelementptr inbounds float, ptr undef, i64 3
+ store float %div16, ptr %arrayidx17, align 4 ; slot 3
+ ret void
+}
+
+declare float @llvm.fmuladd.f32(float, float, float)
+
+define void @test(float %a) {
+; CHECK-LABEL: @test(
+; CHECK-NEXT: entry:
+; CHECK-NEXT: [[TMP0:%.*]] = insertelement <2 x float> poison, float [[A:%.*]], i32 0
+; CHECK-NEXT: [[TMP1:%.*]] = insertelement <2 x float> [[TMP0]], float [[A]], i32 1
+; CHECK-NEXT: br label [[LOOP:%.*]]
+; CHECK: loop:
+; CHECK-NEXT: [[TMP2:%.*]] = fadd <2 x float> zeroinitializer, [[TMP1]]
+; CHECK-NEXT: [[TMP3:%.*]] = extractelement <2 x float> [[TMP2]], i32 0
+; CHECK-NEXT: [[AGG:%.*]] = insertelement <2 x float> [[TMP2]], float [[TMP3]], i64 1
+; CHECK-NEXT: br label [[LOOP]]
+; Scalar input below: two fadds of 0.0 + %a build a <2 x float>, then lane 1 is overwritten with the lane-0 value; the assertions above expect one <2 x float> fadd plus an extract of lane 0 re-inserted into lane 1.
+entry:
+ br label %loop
+
+loop:
+ %add.i157 = fadd float 0.000000e+00, %a
+ %add23.i = fadd float 0.000000e+00, %a ; same operands as %add.i157
+ %insert = insertelement <2 x float> zeroinitializer, float %add.i157, i64 0
+ %insert.i = insertelement <2 x float> %insert, float %add23.i, i64 1
+ %agg = insertelement <2 x float> %insert.i, float %add.i157, i64 1 ; overwrites lane 1 set by %insert.i
+ br label %loop ; unconditional back-edge: the function has no return
+}
+
+define internal void @test1() {
+; CHECK-LABEL: @test1(
+; CHECK-NEXT: entry:
+; CHECK-NEXT: br label [[LOOP:%.*]]
+; CHECK: loop:
+; CHECK-NEXT: [[DOTSROA_025_4_VEC_INSERT_US_I:%.*]] = insertelement <2 x float> zeroinitializer, float 0.000000e+00, i64 0
+; CHECK-NEXT: br label [[LOOP]]
+; Scalar input below: all-constant fadds feed a two-lane insertelement sequence whose lane 0 is then overwritten; the assertions above expect a single insertelement of constant 0.0 into lane 0 to be the only instruction left in the loop.
+entry:
+ br label %loop
+
+loop:
+ %0 = fadd float 0.000000e+00, 0.000000e+00
+ %1 = fadd float 0.000000e+00, 0.000000e+00
+ %2 = fadd float %0, 0.000000e+00
+ %3 = fadd float %1, 0.000000e+00
+ %.sroa.3.8.vec.insert.i.us.i = insertelement <2 x float> zeroinitializer, float %2, i64 0
+ %.sroa.3.12.vec.insert.i.us.i = insertelement <2 x float> %.sroa.3.8.vec.insert.i.us.i, float %3, i64 1
+ %.sroa.025.4.vec.insert.us.i = insertelement <2 x float> %.sroa.3.12.vec.insert.i.us.i, float %0, i64 0 ; overwrites lane 0 (previously %2) with %0
+ br label %loop ; unconditional back-edge: the function has no return
+}
More information about the llvm-commits mailing list