[llvm] b774f14 - [DAG] Calculate the number of sign bits for constant BUILD_VECTOR directly.
David Green via llvm-commits
llvm-commits at lists.llvm.org
Sun May 7 14:31:16 PDT 2023
Author: David Green
Date: 2023-05-07T22:31:10+01:00
New Revision: b774f14841a295187c9f77545b70b60b6f1b3351
URL: https://github.com/llvm/llvm-project/commit/b774f14841a295187c9f77545b70b60b6f1b3351
DIFF: https://github.com/llvm/llvm-project/commit/b774f14841a295187c9f77545b70b60b6f1b3351.diff
LOG: [DAG] Calculate the number of sign bits for constant BUILD_VECTOR directly.
For constant BUILD_VECTORs the operands need to be legal types. This can mean
that when the number of sign bits is calculated it may look that the entire
constant and inefficiently produce less sign bits than it could. For example i8
vectors could use i32 elements, for which 0x000000ff would be incorrectly
limited to 1 sign bit as the original value has 24 sign bits. This makes it
look at the constant directly, truncated to the correct type for the element so
that it can correctly return 8.
Differential Revision: https://reviews.llvm.org/D149956
Added:
Modified:
llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
llvm/test/CodeGen/AArch64/dag-combine-setcc.ll
Removed:
################################################################################
diff --git a/llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp b/llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
index f19f5644132af..9d5ca06ada5d7 100644
--- a/llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
+++ b/llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
@@ -4130,14 +4130,20 @@ unsigned SelectionDAG::ComputeNumSignBits(SDValue Op, const APInt &DemandedElts,
continue;
SDValue SrcOp = Op.getOperand(i);
- Tmp2 = ComputeNumSignBits(SrcOp, Depth + 1);
+ // BUILD_VECTOR can implicitly truncate sources, we handle this specially
+ // for constant nodes to ensure we only look at the sign bits.
+ if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(SrcOp)) {
+ APInt T = C->getAPIntValue().trunc(VTBits);
+ Tmp2 = T.getNumSignBits();
+ } else {
+ Tmp2 = ComputeNumSignBits(SrcOp, Depth + 1);
- // BUILD_VECTOR can implicitly truncate sources, we must handle this.
- if (SrcOp.getValueSizeInBits() != VTBits) {
- assert(SrcOp.getValueSizeInBits() > VTBits &&
- "Expected BUILD_VECTOR implicit truncation");
- unsigned ExtraBits = SrcOp.getValueSizeInBits() - VTBits;
- Tmp2 = (Tmp2 > ExtraBits ? Tmp2 - ExtraBits : 1);
+ if (SrcOp.getValueSizeInBits() != VTBits) {
+ assert(SrcOp.getValueSizeInBits() > VTBits &&
+ "Expected BUILD_VECTOR implicit truncation");
+ unsigned ExtraBits = SrcOp.getValueSizeInBits() - VTBits;
+ Tmp2 = (Tmp2 > ExtraBits ? Tmp2 - ExtraBits : 1);
+ }
}
Tmp = std::min(Tmp, Tmp2);
}
diff --git a/llvm/test/CodeGen/AArch64/dag-combine-setcc.ll b/llvm/test/CodeGen/AArch64/dag-combine-setcc.ll
index 71b4ed3880e66..f6c4c8429fd45 100644
--- a/llvm/test/CodeGen/AArch64/dag-combine-setcc.ll
+++ b/llvm/test/CodeGen/AArch64/dag-combine-setcc.ll
@@ -226,8 +226,6 @@ define i1 @combine_setcc_ne_vecreduce_and_v32i1(<32 x i8> %a) {
; CHECK-NEXT: mov w8, #1 // =0x1
; CHECK-NEXT: cmeq v1.16b, v1.16b, #0
; CHECK-NEXT: bic v0.16b, v0.16b, v1.16b
-; CHECK-NEXT: shl v0.16b, v0.16b, #7
-; CHECK-NEXT: cmlt v0.16b, v0.16b, #0
; CHECK-NEXT: uminv b0, v0.16b
; CHECK-NEXT: fmov w9, s0
; CHECK-NEXT: bic w0, w8, w9
@@ -249,8 +247,6 @@ define i1 @combine_setcc_ne_vecreduce_and_v64i1(<64 x i8> %a) {
; CHECK-NEXT: bic v1.16b, v1.16b, v3.16b
; CHECK-NEXT: bic v0.16b, v0.16b, v2.16b
; CHECK-NEXT: and v0.16b, v0.16b, v1.16b
-; CHECK-NEXT: shl v0.16b, v0.16b, #7
-; CHECK-NEXT: cmlt v0.16b, v0.16b, #0
; CHECK-NEXT: uminv b0, v0.16b
; CHECK-NEXT: fmov w9, s0
; CHECK-NEXT: bic w0, w8, w9
More information about the llvm-commits
mailing list