[llvm] d46751a - [GlobalISel][AArch64] Lower G_FMAD
Jessica Paquette via llvm-commits
llvm-commits at lists.llvm.org
Mon Oct 3 15:15:49 PDT 2022
Author: Jessica Paquette
Date: 2022-10-03T15:15:17-07:00
New Revision: d46751a5721c7e3ab83bc5ecd760e8ba7c84bb30
URL: https://github.com/llvm/llvm-project/commit/d46751a5721c7e3ab83bc5ecd760e8ba7c84bb30
DIFF: https://github.com/llvm/llvm-project/commit/d46751a5721c7e3ab83bc5ecd760e8ba7c84bb30.diff
LOG: [GlobalISel][AArch64] Lower G_FMAD
Noticed this falling back on CTMark at -Os (bullet).
Seems like we have no 1:1 matching for it, so match SDAG and just lower.
Add testcases for common legal cases as well.
Differential Revision: https://reviews.llvm.org/D135111
Added:
llvm/test/CodeGen/AArch64/GlobalISel/legalize-fmad.mir
Modified:
llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp
Removed:
################################################################################
diff --git a/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp b/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp
index d7448e4df146..093b1811a55d 100644
--- a/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp
+++ b/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp
@@ -824,6 +824,8 @@ AArch64LegalizerInfo::AArch64LegalizerInfo(const AArch64Subtarget &ST)
// TODO: s16 support.
getActionDefinitionsBuilder(G_FCOPYSIGN).customFor({{s32, s32}, {s64, s64}});
+ getActionDefinitionsBuilder(G_FMAD).lower();
+
getLegacyLegalizerInfo().computeTables();
verify(*ST.getInstrInfo());
}
diff --git a/llvm/test/CodeGen/AArch64/GlobalISel/legalize-fmad.mir b/llvm/test/CodeGen/AArch64/GlobalISel/legalize-fmad.mir
new file mode 100644
index 000000000000..73edd07ea699
--- /dev/null
+++ b/llvm/test/CodeGen/AArch64/GlobalISel/legalize-fmad.mir
@@ -0,0 +1,148 @@
+# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
+# RUN: llc -verify-machineinstrs -mtriple=aarch64 -run-pass=legalizer %s -o - | FileCheck %s
+
+...
+---
+name: s16
+tracksRegLiveness: true
+body: |
+ bb.0:
+ liveins: $h0, $h1, $h2
+ ; CHECK-LABEL: name: s16
+ ; CHECK: liveins: $h0, $h1, $h2
+ ; CHECK-NEXT: {{ $}}
+ ; CHECK-NEXT: %op0:_(s16) = COPY $h0
+ ; CHECK-NEXT: %op1:_(s16) = COPY $h1
+ ; CHECK-NEXT: %op2:_(s16) = COPY $h2
+ ; CHECK-NEXT: [[FPEXT:%[0-9]+]]:_(s32) = G_FPEXT %op0(s16)
+ ; CHECK-NEXT: [[FPEXT1:%[0-9]+]]:_(s32) = G_FPEXT %op1(s16)
+ ; CHECK-NEXT: [[FMUL:%[0-9]+]]:_(s32) = G_FMUL [[FPEXT]], [[FPEXT1]]
+ ; CHECK-NEXT: [[FPTRUNC:%[0-9]+]]:_(s16) = G_FPTRUNC [[FMUL]](s32)
+ ; CHECK-NEXT: [[FPEXT2:%[0-9]+]]:_(s32) = G_FPEXT [[FPTRUNC]](s16)
+ ; CHECK-NEXT: [[FPEXT3:%[0-9]+]]:_(s32) = G_FPEXT %op2(s16)
+ ; CHECK-NEXT: [[FADD:%[0-9]+]]:_(s32) = G_FADD [[FPEXT2]], [[FPEXT3]]
+ ; CHECK-NEXT: %fmad:_(s16) = G_FPTRUNC [[FADD]](s32)
+ ; CHECK-NEXT: $h0 = COPY %fmad(s16)
+ ; CHECK-NEXT: RET_ReallyLR implicit $h0
+ %op0:_(s16) = COPY $h0
+ %op1:_(s16) = COPY $h1
+ %op2:_(s16) = COPY $h2
+ %fmad:_(s16) = G_FMAD %op0, %op1, %op2
+ $h0 = COPY %fmad
+ RET_ReallyLR implicit $h0
+...
+---
+name: s32
+tracksRegLiveness: true
+body: |
+ bb.0:
+ liveins: $s0, $s1, $s2
+ ; CHECK-LABEL: name: s32
+ ; CHECK: liveins: $s0, $s1, $s2
+ ; CHECK-NEXT: {{ $}}
+ ; CHECK-NEXT: %op0:_(s32) = COPY $s0
+ ; CHECK-NEXT: %op1:_(s32) = COPY $s1
+ ; CHECK-NEXT: %op2:_(s32) = COPY $s2
+ ; CHECK-NEXT: [[FMUL:%[0-9]+]]:_(s32) = G_FMUL %op0, %op1
+ ; CHECK-NEXT: %fmad:_(s32) = G_FADD [[FMUL]], %op2
+ ; CHECK-NEXT: $s0 = COPY %fmad(s32)
+ ; CHECK-NEXT: RET_ReallyLR implicit $s0
+ %op0:_(s32) = COPY $s0
+ %op1:_(s32) = COPY $s1
+ %op2:_(s32) = COPY $s2
+ %fmad:_(s32) = G_FMAD %op0, %op1, %op2
+ $s0 = COPY %fmad
+ RET_ReallyLR implicit $s0
+...
+---
+name: s64
+tracksRegLiveness: true
+body: |
+ bb.0:
+ liveins: $d0, $d1, $d2
+ ; CHECK-LABEL: name: s64
+ ; CHECK: liveins: $d0, $d1, $d2
+ ; CHECK-NEXT: {{ $}}
+ ; CHECK-NEXT: %op0:_(s64) = COPY $d0
+ ; CHECK-NEXT: %op1:_(s64) = COPY $d1
+ ; CHECK-NEXT: %op2:_(s64) = COPY $d2
+ ; CHECK-NEXT: [[FMUL:%[0-9]+]]:_(s64) = G_FMUL %op0, %op1
+ ; CHECK-NEXT: %fmad:_(s64) = G_FADD [[FMUL]], %op2
+ ; CHECK-NEXT: $d0 = COPY %fmad(s64)
+ ; CHECK-NEXT: RET_ReallyLR implicit $d0
+ %op0:_(s64) = COPY $d0
+ %op1:_(s64) = COPY $d1
+ %op2:_(s64) = COPY $d2
+ %fmad:_(s64) = G_FMAD %op0, %op1, %op2
+ $d0 = COPY %fmad
+ RET_ReallyLR implicit $d0
+...
+---
+name: v2s32
+tracksRegLiveness: true
+body: |
+ bb.0:
+ liveins: $d0, $d1, $d2
+ ; CHECK-LABEL: name: v2s32
+ ; CHECK: liveins: $d0, $d1, $d2
+ ; CHECK-NEXT: {{ $}}
+ ; CHECK-NEXT: %op0:_(<2 x s32>) = COPY $d0
+ ; CHECK-NEXT: %op1:_(<2 x s32>) = COPY $d1
+ ; CHECK-NEXT: %op2:_(<2 x s32>) = COPY $d2
+ ; CHECK-NEXT: [[FMUL:%[0-9]+]]:_(<2 x s32>) = G_FMUL %op0, %op1
+ ; CHECK-NEXT: %fmad:_(<2 x s32>) = G_FADD [[FMUL]], %op2
+ ; CHECK-NEXT: $d0 = COPY %fmad(<2 x s32>)
+ ; CHECK-NEXT: RET_ReallyLR implicit $d0
+ %op0:_(<2 x s32>) = COPY $d0
+ %op1:_(<2 x s32>) = COPY $d1
+ %op2:_(<2 x s32>) = COPY $d2
+ %fmad:_(<2 x s32>) = G_FMAD %op0, %op1, %op2
+ $d0 = COPY %fmad
+ RET_ReallyLR implicit $d0
+...
+---
+name: v4s32
+tracksRegLiveness: true
+body: |
+ bb.0:
+ liveins: $q0, $q1, $q2
+ ; CHECK-LABEL: name: v4s32
+ ; CHECK: liveins: $q0, $q1, $q2
+ ; CHECK-NEXT: {{ $}}
+ ; CHECK-NEXT: %op0:_(<4 x s32>) = COPY $q0
+ ; CHECK-NEXT: %op1:_(<4 x s32>) = COPY $q1
+ ; CHECK-NEXT: %op2:_(<4 x s32>) = COPY $q2
+ ; CHECK-NEXT: [[FMUL:%[0-9]+]]:_(<4 x s32>) = G_FMUL %op0, %op1
+ ; CHECK-NEXT: %fmad:_(<4 x s32>) = G_FADD [[FMUL]], %op2
+ ; CHECK-NEXT: $q0 = COPY %fmad(<4 x s32>)
+ ; CHECK-NEXT: RET_ReallyLR implicit $q0
+ %op0:_(<4 x s32>) = COPY $q0
+ %op1:_(<4 x s32>) = COPY $q1
+ %op2:_(<4 x s32>) = COPY $q2
+ %fmad:_(<4 x s32>) = G_FMAD %op0, %op1, %op2
+ $q0 = COPY %fmad
+ RET_ReallyLR implicit $q0
+...
+---
+name: v2s64
+tracksRegLiveness: true
+body: |
+ bb.0:
+ liveins: $q0, $q1, $q2
+ ; CHECK-LABEL: name: v2s64
+ ; CHECK: liveins: $q0, $q1, $q2
+ ; CHECK-NEXT: {{ $}}
+ ; CHECK-NEXT: %op0:_(<2 x s64>) = COPY $q0
+ ; CHECK-NEXT: %op1:_(<2 x s64>) = COPY $q1
+ ; CHECK-NEXT: %op2:_(<2 x s64>) = COPY $q2
+ ; CHECK-NEXT: [[FMUL:%[0-9]+]]:_(<2 x s64>) = G_FMUL %op0, %op1
+ ; CHECK-NEXT: %fmad:_(<2 x s64>) = G_FADD [[FMUL]], %op2
+ ; CHECK-NEXT: $q0 = COPY %fmad(<2 x s64>)
+ ; CHECK-NEXT: RET_ReallyLR implicit $q0
+ %op0:_(<2 x s64>) = COPY $q0
+ %op1:_(<2 x s64>) = COPY $q1
+ %op2:_(<2 x s64>) = COPY $q2
+ %fmad:_(<2 x s64>) = G_FMAD %op0, %op1, %op2
+ $q0 = COPY %fmad
+ RET_ReallyLR implicit $q0
+...
More information about the llvm-commits
mailing list