[llvm] be7014e - [SLP][NFC]Add a test with non-power-of-2 (but still whole vector) operands.
Alexey Bataev via llvm-commits
llvm-commits at lists.llvm.org
Wed Aug 28 10:08:34 PDT 2024
Author: Alexey Bataev
Date: 2024-08-28T10:08:20-07:00
New Revision: be7014e95af5868a6ac5c700ad02bf819159a62d
URL: https://github.com/llvm/llvm-project/commit/be7014e95af5868a6ac5c700ad02bf819159a62d
DIFF: https://github.com/llvm/llvm-project/commit/be7014e95af5868a6ac5c700ad02bf819159a62d.diff
LOG: [SLP][NFC]Add a test with non-power-of-2 (but still whole vector) operands.
Added:
llvm/test/Transforms/SLPVectorizer/RISCV/reduction-whole-regs-loads.ll
Modified:
Removed:
################################################################################
diff --git a/llvm/test/Transforms/SLPVectorizer/RISCV/reduction-whole-regs-loads.ll b/llvm/test/Transforms/SLPVectorizer/RISCV/reduction-whole-regs-loads.ll
new file mode 100644
index 00000000000000..54dc33dbc0d00b
--- /dev/null
+++ b/llvm/test/Transforms/SLPVectorizer/RISCV/reduction-whole-regs-loads.ll
@@ -0,0 +1,45 @@
+; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
+; RUN: opt < %s -passes=slp-vectorizer -S -mtriple=riscv64-unknown-linux -mattr=+v -slp-threshold=-100 | FileCheck %s
+
+define i64 @test(ptr %p) {
+; CHECK-LABEL: @test(
+; CHECK-NEXT: entry:
+; CHECK-NEXT: [[ARRAYIDX_4:%.*]] = getelementptr inbounds i64, ptr [[P:%.*]], i64 4
+; CHECK-NEXT: [[TMP0:%.*]] = load <4 x i64>, ptr [[P]], align 4
+; CHECK-NEXT: [[TMP1:%.*]] = load <2 x i64>, ptr [[ARRAYIDX_4]], align 4
+; CHECK-NEXT: [[TMP2:%.*]] = shufflevector <4 x i64> [[TMP0]], <4 x i64> poison, <8 x i32> <i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 poison, i32 0, i32 0>
+; CHECK-NEXT: [[TMP3:%.*]] = call <8 x i64> @llvm.vector.insert.v8i64.v4i64(<8 x i64> [[TMP2]], <4 x i64> [[TMP0]], i64 0)
+; CHECK-NEXT: [[TMP4:%.*]] = call <8 x i64> @llvm.vector.insert.v8i64.v2i64(<8 x i64> [[TMP3]], <2 x i64> [[TMP1]], i64 4)
+; CHECK-NEXT: [[TMP5:%.*]] = mul <8 x i64> [[TMP4]], <i64 42, i64 42, i64 42, i64 42, i64 42, i64 42, i64 42, i64 42>
+; CHECK-NEXT: [[TMP6:%.*]] = call i64 @llvm.vector.reduce.add.v8i64(<8 x i64> [[TMP5]])
+; CHECK-NEXT: ret i64 [[TMP6]]
+;
+entry:
+ %arrayidx.1 = getelementptr inbounds i64, ptr %p, i64 1
+ %arrayidx.2 = getelementptr inbounds i64, ptr %p, i64 2
+ %arrayidx.3 = getelementptr inbounds i64, ptr %p, i64 3
+ %arrayidx.4 = getelementptr inbounds i64, ptr %p, i64 4
+ %arrayidx.5 = getelementptr inbounds i64, ptr %p, i64 5
+ %tmp = load i64, ptr %p, align 4
+ %mul = mul i64 %tmp, 42
+ %tmp1 = load i64, ptr %arrayidx.1, align 4
+ %mul1 = mul i64 %tmp1, 42
+ %add = add i64 %mul, %mul1
+ %tmp2 = load i64, ptr %arrayidx.2, align 4
+ %mul2 = mul i64 %tmp2, 42
+ %add1 = add i64 %add, %mul2
+ %tmp3 = load i64, ptr %arrayidx.3, align 4
+ %mul3 = mul i64 %tmp3, 42
+ %add2 = add i64 %add1, %mul3
+ %tmp4 = load i64, ptr %arrayidx.4, align 4
+ %mul4 = mul i64 %tmp4, 42
+ %add3 = add i64 %add2, %mul4
+ %tmp5 = load i64, ptr %arrayidx.5, align 4
+ %mul5 = mul i64 %tmp5, 42
+ %add4 = add i64 %add3, %mul5
+ %mul6 = mul i64 %tmp, 42
+ %add5 = add i64 %add4, %mul6
+ %mul7 = mul i64 %tmp, 42
+ %add6 = add i64 %add5, %mul7
+ ret i64 %add6
+}
More information about the llvm-commits
mailing list