[llvm] 65ac12d - [SLP][NFC]Add a test with incorrect minbitwidth analysis for reduced operands
Alexey Bataev via llvm-commits
llvm-commits at lists.llvm.org
Thu Aug 15 07:26:57 PDT 2024
Author: Alexey Bataev
Date: 2024-08-15T07:26:44-07:00
New Revision: 65ac12d3c9877ecf5b97552364e7eead887d94eb
URL: https://github.com/llvm/llvm-project/commit/65ac12d3c9877ecf5b97552364e7eead887d94eb
DIFF: https://github.com/llvm/llvm-project/commit/65ac12d3c9877ecf5b97552364e7eead887d94eb.diff
LOG: [SLP][NFC]Add a test with incorrect minbitwidth analysis for reduced operands
Added:
llvm/test/Transforms/SLPVectorizer/X86/operand-is-reduced-val.ll
Modified:
Removed:
################################################################################
diff --git a/llvm/test/Transforms/SLPVectorizer/X86/operand-is-reduced-val.ll b/llvm/test/Transforms/SLPVectorizer/X86/operand-is-reduced-val.ll
new file mode 100644
index 00000000000000..5fb93e27539d8e
--- /dev/null
+++ b/llvm/test/Transforms/SLPVectorizer/X86/operand-is-reduced-val.ll
@@ -0,0 +1,46 @@
+; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
+; RUN: opt -S --passes=slp-vectorizer -mtriple=x86_64-unknown-linux < %s -slp-threshold=-10 | FileCheck %s
+
+define i64 @src(i32 %a) { ; scalar i64 add chain built from five copies of (sext(%a) + 4294967297) and four (value & 1) terms
+; CHECK-LABEL: define i64 @src(
+; CHECK-SAME: i32 [[A:%.*]]) {
+; CHECK-NEXT: [[ENTRY:.*:]]
+; CHECK-NEXT: [[TMP17:%.*]] = sext i32 [[A]] to i64
+; CHECK-NEXT: [[TMP1:%.*]] = insertelement <4 x i32> poison, i32 [[A]], i32 0
+; CHECK-NEXT: [[TMP2:%.*]] = shufflevector <4 x i32> [[TMP1]], <4 x i32> poison, <4 x i32> zeroinitializer
+; CHECK-NEXT: [[TMP3:%.*]] = add <4 x i32> [[TMP2]], <i32 1, i32 1, i32 1, i32 1>
+; CHECK-NEXT: [[TMP4:%.*]] = sext <4 x i32> [[TMP3]] to <4 x i64>
+; CHECK-NEXT: [[TMP5:%.*]] = and <4 x i32> [[TMP3]], <i32 1, i32 1, i32 1, i32 1>
+; CHECK-NEXT: [[TMP6:%.*]] = zext <4 x i32> [[TMP5]] to <4 x i64>
+; CHECK-NEXT: [[TMP18:%.*]] = call i64 @llvm.vector.reduce.add.v4i64(<4 x i64> [[TMP6]])
+; CHECK-NEXT: [[TMP16:%.*]] = call i64 @llvm.vector.reduce.add.v4i64(<4 x i64> [[TMP4]])
+; CHECK-NEXT: [[TMP19:%.*]] = add i64 [[TMP18]], [[TMP16]]
+; CHECK-NEXT: [[OP_RDX1:%.*]] = add i64 [[TMP19]], 4294967297
+; CHECK-NEXT: [[TMP21:%.*]] = add i64 [[OP_RDX1]], [[TMP17]]
+; CHECK-NEXT: ret i64 [[TMP21]]
+;
+entry:
+ %0 = sext i32 %a to i64 ; widen %a to i64 (the same sext is repeated for every term below)
+ %1 = add nsw i64 %0, 4294967297 ; 4294967297 = 2^32 + 1, a constant that needs more than 32 bits
+ %2 = sext i32 %a to i64
+ %3 = add nsw i64 %2, 4294967297 ; NOTE(review): the expected output above does this add as <4 x i32> with constant 1 and only then sign-extends - presumably the narrowing this test is meant to expose; confirm
+ %4 = add i64 %3, %1 ; start of the running sum
+ %5 = and i64 %3, 1 ; low bit of the widened term
+ %6 = add i64 %4, %5 ; running sum += low bit
+ %7 = sext i32 %a to i64
+ %8 = add nsw i64 %7, 4294967297
+ %9 = add i64 %8, %6 ; running sum += third term
+ %10 = and i64 %8, 1
+ %11 = add i64 %9, %10
+ %12 = sext i32 %a to i64
+ %13 = add nsw i64 %12, 4294967297
+ %14 = add i64 %13, %11 ; running sum += fourth term
+ %15 = and i64 %13, 1
+ %16 = add i64 %14, %15
+ %17 = sext i32 %a to i64
+ %18 = add nsw i64 %17, 4294967297
+ %19 = add i64 %18, %16 ; running sum += fifth term
+ %20 = and i64 %18, 1
+ %21 = add i64 %19, %20 ; last low-bit term added; %21 is the full sum
+ ret i64 %21
+}
More information about the llvm-commits mailing list