[PATCH] D133235: [DAGCombiner] More opportunities to fuse fmul and fadd to fma aggressively
Dmitry Vassiliev via Phabricator via llvm-commits
llvm-commits at lists.llvm.org
Mon Sep 5 21:55:14 PDT 2022
slydiman updated this revision to Diff 458094.
Repository:
rG LLVM Github Monorepo
CHANGES SINCE LAST ACTION
https://reviews.llvm.org/D133235/new/
https://reviews.llvm.org/D133235
Files:
llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
llvm/test/CodeGen/NVPTX/fma-assoc.ll
Index: llvm/test/CodeGen/NVPTX/fma-assoc.ll
===================================================================
--- llvm/test/CodeGen/NVPTX/fma-assoc.ll
+++ llvm/test/CodeGen/NVPTX/fma-assoc.ll
@@ -39,3 +39,23 @@
ret double %3
}
+define float @FoldFAddFMAFMAFMul(float %a, float %b, float %c, float %d,
+ float %x, float %y, float %z) {
+; CHECK-LABEL: FoldFAddFMAFMAFMul(
+; fold (fadd x, (fma a, b, (fma c, d, (fmul y, z))))
+; -> (fma y, z, (fma a, b, (fma c, d, x)))
+; CHECK-NOT: mul.f32
+; CHECK: fma.rn.f32
+; CHECK: fma.rn.f32
+; CHECK: fma.rn.f32
+; CHECK-NOT: add.f32
+ %mul = fmul float %y, %z
+ %fma1 = call float @llvm.fma.f32(float %c, float %d, float %mul)
+ %fma2 = call float @llvm.fma.f32(float %a, float %b, float %fma1)
+ %res = fadd float %x, %fma2
+ ret float %res
+}
+
+declare float @llvm.fma.f32(float, float, float) #0
+
+attributes #0 = { nounwind readnone }
Index: llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
===================================================================
--- llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
+++ llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
@@ -14202,6 +14202,28 @@
// More folding opportunities when target permits.
if (Aggressive) {
+ // fold (fadd x, (fma a, b, (fma c, d, (fmul y, z))))
+ // -> (fma y, z, (fma a, b, (fma c, d, x)))
+ auto FoldFAddFMAFMAFMul = [&](SDValue A, SDValue B, SDValue C, SDValue D,
+ SDValue X, SDValue Y, SDValue Z) {
+ return DAG.getNode(
+ PreferredFusedOpcode, SL, VT, Y, Z,
+ DAG.getNode(PreferredFusedOpcode, SL, VT, A, B,
+ DAG.getNode(PreferredFusedOpcode, SL, VT, C, D, X)));
+ };
+ if (isFusedOp(N1)) {
+ SDValue FMA1_N2 = N1.getOperand(2);
+ if (isFusedOp(FMA1_N2)) {
+ SDValue FMA2_N2 = FMA1_N2.getOperand(2);
+ if (FMA2_N2.getOpcode() == ISD::FMUL) {
+ return FoldFAddFMAFMAFMul(
+ N1.getOperand(0), N1.getOperand(1), FMA1_N2.getOperand(0),
+ FMA1_N2.getOperand(1), N0, FMA2_N2.getOperand(0),
+ FMA2_N2.getOperand(1));
+ }
+ }
+ }
+
// fold (fadd (fma x, y, (fpext (fmul u, v))), z)
// -> (fma x, y, (fma (fpext u), (fpext v), z))
auto FoldFAddFMAFPExtFMul = [&](SDValue X, SDValue Y, SDValue U, SDValue V,
-------------- next part --------------
A non-text attachment was scrubbed...
Name: D133235.458094.patch
Type: text/x-patch
Size: 2366 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/llvm-commits/attachments/20220906/722870da/attachment.bin>
More information about the llvm-commits
mailing list