[llvm] 9e4d726 - [AArch64] Improve schedule modelling on the Cortex-A55
Nicholas Guy via llvm-commits
llvm-commits at lists.llvm.org
Tue Sep 21 05:04:11 PDT 2021
Author: Nicholas Guy
Date: 2021-09-21T13:03:34+01:00
New Revision: 9e4d72675f476386cf6555cd5a1014cdd8d9facb
URL: https://github.com/llvm/llvm-project/commit/9e4d72675f476386cf6555cd5a1014cdd8d9facb
DIFF: https://github.com/llvm/llvm-project/commit/9e4d72675f476386cf6555cd5a1014cdd8d9facb.diff
LOG: [AArch64] Improve schedule modelling on the Cortex-A55
Enables the FuseAddress feature in the Cortex-A55 scheduling model
Differential Revision: https://reviews.llvm.org/D109323
Added:
llvm/test/CodeGen/AArch64/a55-fuse-address.mir
Modified:
llvm/lib/Target/AArch64/AArch64.td
Removed:
################################################################################
diff --git a/llvm/lib/Target/AArch64/AArch64.td b/llvm/lib/Target/AArch64/AArch64.td
index a7af4e61e59ef..5c1bf783ba2a9 100644
--- a/llvm/lib/Target/AArch64/AArch64.td
+++ b/llvm/lib/Target/AArch64/AArch64.td
@@ -615,6 +615,7 @@ def ProcA55 : SubtargetFeature<"a55", "ARMProcFamily", "CortexA55",
FeatureRCPC,
FeaturePerfMon,
FeaturePostRAScheduler,
+ FeatureFuseAddress,
]>;
def ProcA57 : SubtargetFeature<"a57", "ARMProcFamily", "CortexA57",
diff --git a/llvm/test/CodeGen/AArch64/a55-fuse-address.mir b/llvm/test/CodeGen/AArch64/a55-fuse-address.mir
new file mode 100644
index 0000000000000..bd6518ae8f0a6
--- /dev/null
+++ b/llvm/test/CodeGen/AArch64/a55-fuse-address.mir
@@ -0,0 +1,45 @@
+# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
+# RUN: llc -o - %s -mtriple=aarch64 -run-pass=machine-scheduler -verify-machineinstrs | FileCheck %s
+--- |
+ target datalayout = "e-m:e-i8:8:32-i16:16:32-i64:64-i128:128-n32:64-S128"
+ target triple = "aarch64-arm-none-eabi"
+
+ @a = dso_local global i32 2, align 4
+ @b = dso_local global i32 4, align 4
+
+ define i32 @fuseaddress(i32 %num) #0 {
+ entry:
+ %0 = load i32, i32* @a, align 4
+ %1 = load i32, i32* @b, align 4
+ %mul = mul nsw i32 %0, %1
+ ret i32 %mul
+ }
+
+ attributes #0 = { "target-cpu"="cortex-a55" }
+
+---
+name: fuseaddress
+legalized: true
+regBankSelected: true
+tracksRegLiveness: true
+liveins:
+ - { reg: '$w0' }
+body: |
+ bb.0.entry:
+ liveins: $w0
+ ; CHECK-LABEL: name: fuseaddress
+ ; CHECK: liveins: $w0
+ ; CHECK: [[ADRP:%[0-9]+]]:gpr64common = ADRP target-flags(aarch64-page) @a
+ ; CHECK: [[LDRWui:%[0-9]+]]:gpr32 = LDRWui [[ADRP]], target-flags(aarch64-pageoff, aarch64-nc) @a :: (dereferenceable load (s32) from @a)
+ ; CHECK: [[ADRP1:%[0-9]+]]:gpr64common = ADRP target-flags(aarch64-page) @b
+ ; CHECK: [[LDRWui1:%[0-9]+]]:gpr32 = LDRWui [[ADRP1]], target-flags(aarch64-pageoff, aarch64-nc) @b :: (dereferenceable load (s32) from @b)
+ ; CHECK: [[MADDWrrr:%[0-9]+]]:gpr32 = nsw MADDWrrr [[LDRWui]], [[LDRWui1]], $wzr
+ ; CHECK: $w0 = COPY [[MADDWrrr]]
+ ; CHECK: RET_ReallyLR implicit $w0
+ %1:gpr64common = ADRP target-flags(aarch64-page) @a
+ %4:gpr64common = ADRP target-flags(aarch64-page) @b
+ %2:gpr32 = LDRWui killed %1:gpr64common, target-flags(aarch64-pageoff, aarch64-nc) @a :: (dereferenceable load (s32) from @a)
+ %5:gpr32 = LDRWui killed %4:gpr64common, target-flags(aarch64-pageoff, aarch64-nc) @b :: (dereferenceable load (s32) from @b)
+ %6:gpr32 = nsw MADDWrrr killed %2:gpr32, killed %5:gpr32, $wzr
+ $w0 = COPY %6:gpr32
+ RET_ReallyLR implicit $w0
More information about the llvm-commits
mailing list