[llvm] [AArch64] Lower for power of 2 signed divides with scalar type (PR #97879)
via llvm-commits
llvm-commits at lists.llvm.org
Sat Jul 6 00:26:27 PDT 2024
llvmbot wrote:
<!--LLVM PR SUMMARY COMMENT-->
@llvm/pr-subscribers-backend-aarch64
Author: Allen (vfdff)
<details>
<summary>Changes</summary>
Expected same assemble for code which doesn't use sve registers when we compile it with/without -msve-vector-bits=256.
Fix https://github.com/llvm/llvm-project/issues/97821
---
Full diff: https://github.com/llvm/llvm-project/pull/97879.diff
2 Files Affected:
- (modified) llvm/lib/Target/AArch64/AArch64ISelLowering.cpp (+3-2)
- (modified) llvm/test/CodeGen/AArch64/sve-fixed-length-sdiv-pow2.ll (+17)
``````````diff
diff --git a/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp b/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp
index 9f6f66e9e0c70..f072c9a9b2178 100644
--- a/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp
+++ b/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp
@@ -17544,13 +17544,14 @@ AArch64TargetLowering::BuildSDIVPow2(SDNode *N, const APInt &Divisor,
SmallVectorImpl<SDNode *> &Created) const {
AttributeList Attr = DAG.getMachineFunction().getFunction().getAttributes();
if (isIntDivCheap(N->getValueType(0), Attr))
- return SDValue(N,0); // Lower SDIV as SDIV
+ return SDValue(N, 0); // Lower SDIV as SDIV
EVT VT = N->getValueType(0);
// For scalable and fixed types, mark them as cheap so we can handle it much
// later. This allows us to handle larger than legal types.
- if (VT.isScalableVector() || Subtarget->useSVEForFixedLengthVectors())
+ if (VT.isScalableVector() ||
+ (!VT.isScalarInteger() && Subtarget->useSVEForFixedLengthVectors()))
return SDValue(N, 0);
// fold (sdiv X, pow2)
diff --git a/llvm/test/CodeGen/AArch64/sve-fixed-length-sdiv-pow2.ll b/llvm/test/CodeGen/AArch64/sve-fixed-length-sdiv-pow2.ll
index 21a5abdeaa4d5..46c5ec375721c 100644
--- a/llvm/test/CodeGen/AArch64/sve-fixed-length-sdiv-pow2.ll
+++ b/llvm/test/CodeGen/AArch64/sve-fixed-length-sdiv-pow2.ll
@@ -383,4 +383,21 @@ define void @sdiv_v32i64(ptr %a) vscale_range(16,0) #0 {
ret void
}
+define i32 @sdiv_int(i32 %begin, i32 %first) #0 {
+; CHECK-LABEL: sdiv_int:
+; CHECK: // %bb.0:
+; CHECK-NEXT: sub w8, w0, w1
+; CHECK-NEXT: add w9, w8, #1
+; CHECK-NEXT: add w10, w8, #2
+; CHECK-NEXT: cmp w9, #0
+; CHECK-NEXT: csinc w8, w10, w8, lt
+; CHECK-NEXT: sub w0, w0, w8, asr #1
+; CHECK-NEXT: ret
+ %sub = add i32 %begin, 1
+ %add = sub i32 %sub, %first
+ %div.neg = sdiv i32 %add, -2
+ %sub1 = add i32 %div.neg, %begin
+ ret i32 %sub1
+}
+
attributes #0 = { "target-features"="+sve" }
``````````
</details>
https://github.com/llvm/llvm-project/pull/97879
More information about the llvm-commits
mailing list