[llvm] 9e4d726 - [AArch64] Improve schedule modelling on the Cortex-A55

Nicholas Guy via llvm-commits llvm-commits at lists.llvm.org
Tue Sep 21 05:04:11 PDT 2021


Author: Nicholas Guy
Date: 2021-09-21T13:03:34+01:00
New Revision: 9e4d72675f476386cf6555cd5a1014cdd8d9facb

URL: https://github.com/llvm/llvm-project/commit/9e4d72675f476386cf6555cd5a1014cdd8d9facb
DIFF: https://github.com/llvm/llvm-project/commit/9e4d72675f476386cf6555cd5a1014cdd8d9facb.diff

LOG: [AArch64] Improve schedule modelling on the Cortex-A55

Enables the FuseAddress feature in the Cortex-A55 scheduling model

Differential Revision: https://reviews.llvm.org/D109323

Added: 
    llvm/test/CodeGen/AArch64/a55-fuse-address.mir

Modified: 
    llvm/lib/Target/AArch64/AArch64.td

Removed: 
    


################################################################################
diff  --git a/llvm/lib/Target/AArch64/AArch64.td b/llvm/lib/Target/AArch64/AArch64.td
index a7af4e61e59ef..5c1bf783ba2a9 100644
--- a/llvm/lib/Target/AArch64/AArch64.td
+++ b/llvm/lib/Target/AArch64/AArch64.td
@@ -615,6 +615,7 @@ def ProcA55     : SubtargetFeature<"a55", "ARMProcFamily", "CortexA55",
                                    FeatureRCPC,
                                    FeaturePerfMon,
                                    FeaturePostRAScheduler,
+                                   FeatureFuseAddress,
                                    ]>;
 
 def ProcA57     : SubtargetFeature<"a57", "ARMProcFamily", "CortexA57",

diff  --git a/llvm/test/CodeGen/AArch64/a55-fuse-address.mir b/llvm/test/CodeGen/AArch64/a55-fuse-address.mir
new file mode 100644
index 0000000000000..bd6518ae8f0a6
--- /dev/null
+++ b/llvm/test/CodeGen/AArch64/a55-fuse-address.mir
@@ -0,0 +1,45 @@
+# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
+# RUN: llc -o - %s -mtriple=aarch64 -run-pass=machine-scheduler -verify-machineinstrs | FileCheck %s
+--- |
+  target datalayout = "e-m:e-i8:8:32-i16:16:32-i64:64-i128:128-n32:64-S128"
+  target triple = "aarch64-arm-none-eabi"
+
+  @a = dso_local global i32 2, align 4
+  @b = dso_local global i32 4, align 4
+
+  define i32 @fuseaddress(i32 %num) #0 {
+  entry:
+    %0 = load i32, i32* @a, align 4
+    %1 = load i32, i32* @b, align 4
+    %mul = mul nsw i32 %0, %1
+    ret i32 %mul
+  }
+
+  attributes #0 = { "target-cpu"="cortex-a55" }
+
+---
+name: fuseaddress
+legalized: true
+regBankSelected: true
+tracksRegLiveness: true
+liveins:
+  - { reg: '$w0' }
+body: |
+  bb.0.entry:
+    liveins: $w0
+    ; CHECK-LABEL: name: fuseaddress
+    ; CHECK: liveins: $w0
+    ; CHECK: [[ADRP:%[0-9]+]]:gpr64common = ADRP target-flags(aarch64-page) @a
+    ; CHECK: [[LDRWui:%[0-9]+]]:gpr32 = LDRWui [[ADRP]], target-flags(aarch64-pageoff, aarch64-nc) @a :: (dereferenceable load (s32) from @a)
+    ; CHECK: [[ADRP1:%[0-9]+]]:gpr64common = ADRP target-flags(aarch64-page) @b
+    ; CHECK: [[LDRWui1:%[0-9]+]]:gpr32 = LDRWui [[ADRP1]], target-flags(aarch64-pageoff, aarch64-nc) @b :: (dereferenceable load (s32) from @b)
+    ; CHECK: [[MADDWrrr:%[0-9]+]]:gpr32 = nsw MADDWrrr [[LDRWui]], [[LDRWui1]], $wzr
+    ; CHECK: $w0 = COPY [[MADDWrrr]]
+    ; CHECK: RET_ReallyLR implicit $w0
+    %1:gpr64common = ADRP target-flags(aarch64-page) @a
+    %4:gpr64common = ADRP target-flags(aarch64-page) @b
+    %2:gpr32 = LDRWui killed %1:gpr64common, target-flags(aarch64-pageoff, aarch64-nc) @a :: (dereferenceable load (s32) from @a)
+    %5:gpr32 = LDRWui killed %4:gpr64common, target-flags(aarch64-pageoff, aarch64-nc) @b :: (dereferenceable load (s32) from @b)
+    %6:gpr32 = nsw MADDWrrr killed %2:gpr32, killed %5:gpr32, $wzr
+    $w0 = COPY %6:gpr32
+    RET_ReallyLR implicit $w0


        


More information about the llvm-commits mailing list