[llvm] [InstCombine] Fold minmax intrinsic using KnownBits information (PR #76242)
Yingwei Zheng via llvm-commits
llvm-commits at lists.llvm.org
Fri Dec 22 08:32:51 PST 2023
https://github.com/dtcxzyw updated https://github.com/llvm/llvm-project/pull/76242
>From a863b121c7b28f2c30439ccbd70927ed481835cb Mon Sep 17 00:00:00 2001
From: Yingwei Zheng <dtcxzyw2333 at gmail.com>
Date: Fri, 22 Dec 2023 22:30:41 +0800
Subject: [PATCH 1/2] [InstCombine] Add pre-commit tests. NFC.
---
.../InstCombine/minmax-intrinsics.ll | 68 +++++++++++++++++++
1 file changed, 68 insertions(+)
diff --git a/llvm/test/Transforms/InstCombine/minmax-intrinsics.ll b/llvm/test/Transforms/InstCombine/minmax-intrinsics.ll
index f3833a420ee835..d8a6f5bcf27586 100644
--- a/llvm/test/Transforms/InstCombine/minmax-intrinsics.ll
+++ b/llvm/test/Transforms/InstCombine/minmax-intrinsics.ll
@@ -2489,3 +2489,71 @@ define i1 @PR57986() {
%umin = call i1 @llvm.umin.i1(i1 ptrtoint (ptr @g to i1), i1 true)
ret i1 %umin
}
+
+define i8 @fold_umax_with_knownbits_info(i8 %a, i8 %b) {
+; CHECK-LABEL: @fold_umax_with_knownbits_info(
+; CHECK-NEXT: entry:
+; CHECK-NEXT: [[A1:%.*]] = or i8 [[A:%.*]], 1
+; CHECK-NEXT: [[A2:%.*]] = shl i8 [[B:%.*]], 1
+; CHECK-NEXT: [[SUB:%.*]] = sub i8 [[A1]], [[A2]]
+; CHECK-NEXT: [[VAL:%.*]] = call i8 @llvm.umax.i8(i8 [[SUB]], i8 1)
+; CHECK-NEXT: ret i8 [[VAL]]
+;
+entry:
+ %a1 = or i8 %a, 1
+ %a2 = shl i8 %b, 1
+ %sub = sub i8 %a1, %a2
+ %val = call i8 @llvm.umax.i8(i8 %sub, i8 1)
+ ret i8 %val
+}
+
+define i8 @fold_umin_with_knownbits_info(i8 %a, i8 %b) {
+; CHECK-LABEL: @fold_umin_with_knownbits_info(
+; CHECK-NEXT: entry:
+; CHECK-NEXT: [[A1:%.*]] = or i8 [[A:%.*]], 3
+; CHECK-NEXT: [[A2:%.*]] = shl i8 [[B:%.*]], 2
+; CHECK-NEXT: [[SUB:%.*]] = sub i8 [[A1]], [[A2]]
+; CHECK-NEXT: [[VAL:%.*]] = call i8 @llvm.umin.i8(i8 [[SUB]], i8 3)
+; CHECK-NEXT: ret i8 [[VAL]]
+;
+entry:
+ %a1 = or i8 %a, 3
+ %a2 = shl i8 %b, 2
+ %sub = sub i8 %a1, %a2
+ %val = call i8 @llvm.umin.i8(i8 %sub, i8 3)
+ ret i8 %val
+}
+
+define i8 @fold_umax_with_knownbits_info_fail(i8 %a, i8 %b) {
+; CHECK-LABEL: @fold_umax_with_knownbits_info_fail(
+; CHECK-NEXT: entry:
+; CHECK-NEXT: [[A1:%.*]] = or i8 [[A:%.*]], 2
+; CHECK-NEXT: [[A2:%.*]] = shl i8 [[B:%.*]], 1
+; CHECK-NEXT: [[SUB:%.*]] = sub i8 [[A1]], [[A2]]
+; CHECK-NEXT: [[VAL:%.*]] = call i8 @llvm.umax.i8(i8 [[SUB]], i8 1)
+; CHECK-NEXT: ret i8 [[VAL]]
+;
+entry:
+ %a1 = or i8 %a, 2
+ %a2 = shl i8 %b, 1
+ %sub = sub i8 %a1, %a2
+ %val = call i8 @llvm.umax.i8(i8 %sub, i8 1)
+ ret i8 %val
+}
+
+define i8 @fold_umin_with_knownbits_info_fail(i8 %a, i8 %b) {
+; CHECK-LABEL: @fold_umin_with_knownbits_info_fail(
+; CHECK-NEXT: entry:
+; CHECK-NEXT: [[A1:%.*]] = or i8 [[A:%.*]], 1
+; CHECK-NEXT: [[A2:%.*]] = shl i8 [[B:%.*]], 2
+; CHECK-NEXT: [[SUB:%.*]] = sub i8 [[A1]], [[A2]]
+; CHECK-NEXT: [[VAL:%.*]] = call i8 @llvm.umin.i8(i8 [[SUB]], i8 3)
+; CHECK-NEXT: ret i8 [[VAL]]
+;
+entry:
+ %a1 = or i8 %a, 1
+ %a2 = shl i8 %b, 2
+ %sub = sub i8 %a1, %a2
+ %val = call i8 @llvm.umin.i8(i8 %sub, i8 3)
+ ret i8 %val
+}
>From 94c65a141a052df42508d40b0d6813721dba77fc Mon Sep 17 00:00:00 2001
From: Yingwei Zheng <dtcxzyw2333 at gmail.com>
Date: Fri, 22 Dec 2023 22:44:54 +0800
Subject: [PATCH 2/2] [InstCombine] Fold minmax intrinsic using KnownBits information
---
llvm/include/llvm/Analysis/ValueTracking.h | 5 +++++
llvm/lib/Analysis/ValueTracking.cpp | 8 ++++----
.../Transforms/InstCombine/InstCombineCalls.cpp | 15 +++++++++++++++
.../Transforms/InstCombine/minmax-intrinsics.ll | 9 ++-------
4 files changed, 26 insertions(+), 11 deletions(-)
diff --git a/llvm/include/llvm/Analysis/ValueTracking.h b/llvm/include/llvm/Analysis/ValueTracking.h
index a3186e61b94adf..baa16306ebf5df 100644
--- a/llvm/include/llvm/Analysis/ValueTracking.h
+++ b/llvm/include/llvm/Analysis/ValueTracking.h
@@ -863,6 +863,11 @@ ConstantRange computeConstantRange(const Value *V, bool ForSigned,
const DominatorTree *DT = nullptr,
unsigned Depth = 0);
+/// Combine constant ranges from computeConstantRange() and computeKnownBits().
+ConstantRange
+computeConstantRangeIncludingKnownBits(const WithCache<const Value *> &V,
+ bool ForSigned, const SimplifyQuery &SQ);
+
/// Return true if this function can prove that the instruction I will
/// always transfer execution to one of its successors (including the next
/// instruction that follows within a basic block). E.g. this is not
diff --git a/llvm/lib/Analysis/ValueTracking.cpp b/llvm/lib/Analysis/ValueTracking.cpp
index 769d921eb1e8d1..cac2602d455f9d 100644
--- a/llvm/lib/Analysis/ValueTracking.cpp
+++ b/llvm/lib/Analysis/ValueTracking.cpp
@@ -6289,10 +6289,10 @@ static OverflowResult mapOverflowResult(ConstantRange::OverflowResult OR) {
}
/// Combine constant ranges from computeConstantRange() and computeKnownBits().
-static ConstantRange
-computeConstantRangeIncludingKnownBits(const WithCache<const Value *> &V,
- bool ForSigned,
- const SimplifyQuery &SQ) {
+ConstantRange
+llvm::computeConstantRangeIncludingKnownBits(const WithCache<const Value *> &V,
+ bool ForSigned,
+ const SimplifyQuery &SQ) {
ConstantRange CR1 =
ConstantRange::fromKnownBits(V.getKnownBits(SQ), ForSigned);
ConstantRange CR2 = computeConstantRange(V, ForSigned, SQ.IIQ.UseInstrInfo);
diff --git a/llvm/lib/Transforms/InstCombine/InstCombineCalls.cpp b/llvm/lib/Transforms/InstCombine/InstCombineCalls.cpp
index a272357fa04a41..ff2bb1c6eb8756 100644
--- a/llvm/lib/Transforms/InstCombine/InstCombineCalls.cpp
+++ b/llvm/lib/Transforms/InstCombine/InstCombineCalls.cpp
@@ -1796,6 +1796,21 @@ Instruction *InstCombinerImpl::visitCallInst(CallInst &CI) {
if (Instruction *NewMinMax = factorizeMinMaxTree(II))
return NewMinMax;
+ // Try to fold minmax based on range information
+ ICmpInst::Predicate Pred =
+ ICmpInst::getNonStrictPredicate(MinMaxIntrinsic::getPredicate(IID));
+ bool IsSigned = MinMaxIntrinsic::isSigned(IID);
+ const auto LHS_CR = llvm::computeConstantRangeIncludingKnownBits(
+ I0, IsSigned, SQ.getWithInstruction(II));
+ if (!LHS_CR.isFullSet()) {
+ const auto RHS_CR = llvm::computeConstantRangeIncludingKnownBits(
+ I1, IsSigned, SQ.getWithInstruction(II));
+ if (LHS_CR.icmp(Pred, RHS_CR))
+ return replaceInstUsesWith(*II, I0);
+ if (RHS_CR.icmp(Pred, LHS_CR))
+ return replaceInstUsesWith(*II, I1);
+ }
+
break;
}
case Intrinsic::bitreverse: {
diff --git a/llvm/test/Transforms/InstCombine/minmax-intrinsics.ll b/llvm/test/Transforms/InstCombine/minmax-intrinsics.ll
index d8a6f5bcf27586..500ea0aa73f741 100644
--- a/llvm/test/Transforms/InstCombine/minmax-intrinsics.ll
+++ b/llvm/test/Transforms/InstCombine/minmax-intrinsics.ll
@@ -2496,8 +2496,7 @@ define i8 @fold_umax_with_knownbits_info(i8 %a, i8 %b) {
; CHECK-NEXT: [[A1:%.*]] = or i8 [[A:%.*]], 1
; CHECK-NEXT: [[A2:%.*]] = shl i8 [[B:%.*]], 1
; CHECK-NEXT: [[SUB:%.*]] = sub i8 [[A1]], [[A2]]
-; CHECK-NEXT: [[VAL:%.*]] = call i8 @llvm.umax.i8(i8 [[SUB]], i8 1)
-; CHECK-NEXT: ret i8 [[VAL]]
+; CHECK-NEXT: ret i8 [[SUB]]
;
entry:
%a1 = or i8 %a, 1
@@ -2510,11 +2509,7 @@ entry:
define i8 @fold_umin_with_knownbits_info(i8 %a, i8 %b) {
; CHECK-LABEL: @fold_umin_with_knownbits_info(
; CHECK-NEXT: entry:
-; CHECK-NEXT: [[A1:%.*]] = or i8 [[A:%.*]], 3
-; CHECK-NEXT: [[A2:%.*]] = shl i8 [[B:%.*]], 2
-; CHECK-NEXT: [[SUB:%.*]] = sub i8 [[A1]], [[A2]]
-; CHECK-NEXT: [[VAL:%.*]] = call i8 @llvm.umin.i8(i8 [[SUB]], i8 3)
-; CHECK-NEXT: ret i8 [[VAL]]
+; CHECK-NEXT: ret i8 3
;
entry:
%a1 = or i8 %a, 3
More information about the llvm-commits mailing list