[llvm] [M68k] implement -mxgot (PR #119803)

via llvm-commits llvm-commits at lists.llvm.org
Thu Dec 12 19:03:55 PST 2024


https://github.com/knickish updated https://github.com/llvm/llvm-project/pull/119803

>From 35825eca71f3834f9314c40a6c9d8c32ce4340bd Mon Sep 17 00:00:00 2001
From: kirk <knickish at gmail.com>
Date: Wed, 11 Dec 2024 19:42:43 +0000
Subject: [PATCH] [M68k] implement -mxgot

---
 llvm/lib/Target/M68k/M68k.td                  |  3 +
 llvm/lib/Target/M68k/M68kInstrInfo.cpp        | 23 ++++++-
 llvm/lib/Target/M68k/M68kSubtarget.cpp        |  4 +-
 llvm/lib/Target/M68k/M68kSubtarget.h          |  5 ++
 llvm/lib/Target/M68k/M68kTargetMachine.cpp    |  1 +
 llvm/lib/Target/M68k/M68kTargetMachine.h      |  1 +
 .../M68k/MCTargetDesc/M68kAsmBackend.cpp      | 65 ++++++++++++++++---
 llvm/test/CodeGen/M68k/xgot.ll                | 51 +++++++++++++++
 .../MC/M68k/Relocations/PIC/data-gotoff.s     | 37 ++++++++++-
 9 files changed, 175 insertions(+), 15 deletions(-)
 create mode 100644 llvm/test/CodeGen/M68k/xgot.ll

diff --git a/llvm/lib/Target/M68k/M68k.td b/llvm/lib/Target/M68k/M68k.td
index dab66d10229559..7fd48d6a7c46d4 100644
--- a/llvm/lib/Target/M68k/M68k.td
+++ b/llvm/lib/Target/M68k/M68k.td
@@ -65,6 +65,9 @@ foreach i = {0-7} in
       SubtargetFeature<"reserve-d"#i, "UserReservedRegister[M68k::D"#i#"]",
                        "true", "Reserve D"#i#" register">;
 
+def FeatureXGOT
+    : SubtargetFeature<"xgot", "UseXGOT", "true", "Assume 32-bit GOT">;
+
 //===----------------------------------------------------------------------===//
 // M68k processors supported.
 //===----------------------------------------------------------------------===//
diff --git a/llvm/lib/Target/M68k/M68kInstrInfo.cpp b/llvm/lib/Target/M68k/M68kInstrInfo.cpp
index 63404645209508..da5ce0bd606a9c 100644
--- a/llvm/lib/Target/M68k/M68kInstrInfo.cpp
+++ b/llvm/lib/Target/M68k/M68kInstrInfo.cpp
@@ -17,6 +17,7 @@
 #include "M68kMachineFunction.h"
 #include "M68kTargetMachine.h"
 #include "MCTargetDesc/M68kMCCodeEmitter.h"
+#include "MCTargetDesc/M68kMCTargetDesc.h"
 
 #include "llvm/ADT/STLExtras.h"
 #include "llvm/ADT/ScopeExit.h"
@@ -936,6 +937,7 @@ struct M68kGlobalBaseReg : public MachineFunctionPass {
   bool runOnMachineFunction(MachineFunction &MF) override {
     const M68kSubtarget &STI = MF.getSubtarget<M68kSubtarget>();
     M68kMachineFunctionInfo *MxFI = MF.getInfo<M68kMachineFunctionInfo>();
+    MachineRegisterInfo &RegInfo = MF.getRegInfo();
 
     unsigned GlobalBaseReg = MxFI->getGlobalBaseReg();
 
@@ -949,9 +951,24 @@ struct M68kGlobalBaseReg : public MachineFunctionPass {
     DebugLoc DL = FirstMBB.findDebugLoc(MBBI);
     const M68kInstrInfo *TII = STI.getInstrInfo();
 
-    // Generate lea (__GLOBAL_OFFSET_TABLE_,%PC), %A5
-    BuildMI(FirstMBB, MBBI, DL, TII->get(M68k::LEA32q), GlobalBaseReg)
-        .addExternalSymbol("_GLOBAL_OFFSET_TABLE_", M68kII::MO_GOTPCREL);
+    if (STI.useXGOT()) {
+      Register LoadPC = RegInfo.createVirtualRegister(&M68k::AR32_NOSPRegClass);
+      Register LoadGOT =
+          RegInfo.createVirtualRegister(&M68k::AR32_NOSPRegClass);
+      BuildMI(FirstMBB, MBBI, DL, TII->get(M68k::LEA32q), LoadPC).addImm(0);
+      BuildMI(FirstMBB, MBBI, DL, TII->get(M68k::LEA32b), LoadGOT)
+          .addExternalSymbol("_GLOBAL_OFFSET_TABLE_");
+      ;
+      BuildMI(FirstMBB, MBBI, DL, TII->get(M68k::SUB32ar), GlobalBaseReg)
+          .addReg(LoadPC)
+          .addReg(LoadGOT);
+
+      // continue here
+    } else {
+      // Generate lea (__GLOBAL_OFFSET_TABLE_,%PC), %A5
+      BuildMI(FirstMBB, MBBI, DL, TII->get(M68k::LEA32q), GlobalBaseReg)
+          .addExternalSymbol("_GLOBAL_OFFSET_TABLE_", M68kII::MO_GOTPCREL);
+    }
 
     return true;
   }
diff --git a/llvm/lib/Target/M68k/M68kSubtarget.cpp b/llvm/lib/Target/M68k/M68kSubtarget.cpp
index 53ec574ae5596c..44927d37bd2c00 100644
--- a/llvm/lib/Target/M68k/M68kSubtarget.cpp
+++ b/llvm/lib/Target/M68k/M68kSubtarget.cpp
@@ -25,6 +25,7 @@
 #include "llvm/IR/Attributes.h"
 #include "llvm/IR/Function.h"
 #include "llvm/MC/TargetRegistry.h"
+#include "llvm/Support/CodeGen.h"
 #include "llvm/Support/CommandLine.h"
 #include "llvm/Support/ErrorHandling.h"
 
@@ -50,7 +51,8 @@ void M68kSubtarget::anchor() {}
 
 M68kSubtarget::M68kSubtarget(const Triple &TT, StringRef CPU, StringRef FS,
                              const M68kTargetMachine &TM)
-    : M68kGenSubtargetInfo(TT, CPU, /*TuneCPU*/ CPU, FS), TM(TM), TSInfo(),
+    : M68kGenSubtargetInfo(TT, CPU, /*TuneCPU*/ CPU, FS),
+      UseXGOT(this->useXGOT()), TM(TM), TSInfo(),
       InstrInfo(initializeSubtargetDependencies(CPU, TT, FS, TM)),
       FrameLowering(*this, this->getStackAlignment()), TLInfo(TM, *this),
       TargetTriple(TT) {
diff --git a/llvm/lib/Target/M68k/M68kSubtarget.h b/llvm/lib/Target/M68k/M68kSubtarget.h
index c08a9786fb27ba..19128856d30649 100644
--- a/llvm/lib/Target/M68k/M68kSubtarget.h
+++ b/llvm/lib/Target/M68k/M68kSubtarget.h
@@ -51,6 +51,9 @@ class M68kSubtarget : public M68kGenSubtargetInfo {
   enum SubtargetEnum { M00, M10, M20, M30, M40, M60 };
   SubtargetEnum SubtargetKind = M00;
 
+  // Assume 32-bit GOT.
+  bool UseXGOT = false;
+
   enum FPKindEnum { M881, M882 };
   std::optional<FPKindEnum> FPUKind;
 
@@ -98,6 +101,8 @@ class M68kSubtarget : public M68kGenSubtargetInfo {
 
   bool useSmallSection() const { return UseSmallSection; }
 
+  bool useXGOT() const { return UseXGOT; }
+
   const Triple &getTargetTriple() const { return TargetTriple; }
 
   bool isTargetELF() const { return TargetTriple.isOSBinFormatELF(); }
diff --git a/llvm/lib/Target/M68k/M68kTargetMachine.cpp b/llvm/lib/Target/M68k/M68kTargetMachine.cpp
index 2f5a2e8288a261..839db3a6da5fe5 100644
--- a/llvm/lib/Target/M68k/M68kTargetMachine.cpp
+++ b/llvm/lib/Target/M68k/M68kTargetMachine.cpp
@@ -105,6 +105,7 @@ M68kTargetMachine::M68kTargetMachine(const Target &T, const Triple &TT,
                                ::getEffectiveCodeModel(CM, JIT), OL),
       TLOF(std::make_unique<M68kELFTargetObjectFile>()),
       Subtarget(TT, CPU, FS, *this) {
+  setCodeModel(::getEffectiveCodeModel(CM, JIT));
   initAsmInfo();
 }
 
diff --git a/llvm/lib/Target/M68k/M68kTargetMachine.h b/llvm/lib/Target/M68k/M68kTargetMachine.h
index c2648f5d38c5ea..25a721aba3c8ec 100644
--- a/llvm/lib/Target/M68k/M68kTargetMachine.h
+++ b/llvm/lib/Target/M68k/M68kTargetMachine.h
@@ -21,6 +21,7 @@
 #include "llvm/CodeGen/Passes.h"
 #include "llvm/CodeGen/SelectionDAGISel.h"
 #include "llvm/CodeGen/TargetFrameLowering.h"
+#include "llvm/Support/CodeGen.h"
 
 #include <optional>
 
diff --git a/llvm/lib/Target/M68k/MCTargetDesc/M68kAsmBackend.cpp b/llvm/lib/Target/M68k/MCTargetDesc/M68kAsmBackend.cpp
index 04777677cbf218..432915e972538a 100644
--- a/llvm/lib/Target/M68k/MCTargetDesc/M68kAsmBackend.cpp
+++ b/llvm/lib/Target/M68k/MCTargetDesc/M68kAsmBackend.cpp
@@ -93,8 +93,11 @@ class M68kAsmBackend : public MCAsmBackend {
   bool mayNeedRelaxation(const MCInst &Inst,
                          const MCSubtargetInfo &STI) const override;
 
-  bool fixupNeedsRelaxation(const MCFixup &Fixup,
-                            uint64_t Value) const override;
+  bool fixupNeedsRelaxationAdvanced(const MCAssembler &Asm,
+                                    const MCFixup &Fixup, bool Resolved,
+                                    uint64_t Value,
+                                    const MCRelaxableFragment *DF,
+                                    const bool WasForced) const override;
 
   void relaxInstruction(MCInst &Inst,
                         const MCSubtargetInfo &STI) const override;
@@ -191,6 +194,31 @@ static unsigned getRelaxedOpcodeBranch(const MCInst &Inst) {
   }
 }
 
+static bool RelaxesTo32Bit(const MCInst &Inst) {
+  unsigned Op = Inst.getOpcode();
+  switch (Op) {
+  default:
+    return false;
+
+  case M68k::BRA16:
+  case M68k::Bcc16:
+  case M68k::Bls16:
+  case M68k::Blt16:
+  case M68k::Beq16:
+  case M68k::Bmi16:
+  case M68k::Bne16:
+  case M68k::Bge16:
+  case M68k::Bcs16:
+  case M68k::Bpl16:
+  case M68k::Bgt16:
+  case M68k::Bhi16:
+  case M68k::Bvc16:
+  case M68k::Ble16:
+  case M68k::Bvs16:
+    return true;
+  }
+}
+
 static unsigned getRelaxedOpcodeArith(const MCInst &Inst) {
   unsigned Op = Inst.getOpcode();
   // NOTE there will be some relaxations for PCD and ARD mem for x20
@@ -224,22 +252,42 @@ bool M68kAsmBackend::mayNeedRelaxation(const MCInst &Inst,
   return false;
 }
 
-bool M68kAsmBackend::fixupNeedsRelaxation(const MCFixup &Fixup,
-                                          uint64_t UnsignedValue) const {
+bool M68kAsmBackend::fixupNeedsRelaxationAdvanced(const MCAssembler &Asm,
+                                                  const MCFixup &Fixup,
+                                                  bool Resolved,
+                                                  uint64_t UnsignedValue,
+                                                  const MCRelaxableFragment *DF,
+                                                  const bool WasForced) const {
   int64_t Value = static_cast<int64_t>(UnsignedValue);
 
-  if (!isInt<32>(Value) || (!Allows32BitBranch && !isInt<16>(Value)))
+  if (!isInt<32>(Value) || (!Allows32BitBranch && !isInt<16>(Value))) {
     llvm_unreachable("Cannot relax the instruction, value does not fit");
+  }
+
+  bool InstrCanRelax = false;
+  if (Allows32BitBranch) {
+    // mayNeedRelaxation checks that there's actually an instr to relax to
+    // before reaching this point, and all instrs are available for this CPU
+    InstrCanRelax = true;
+  } else {
+    // We're using a CPU that can only handle 16 bit branches, we can't relax
+    // unless it's an 8->16 bit relaxation
+    InstrCanRelax = !RelaxesTo32Bit(DF->getInst());
+  }
+  // For unresolved fixups, make sure we relax them as much as is possible
+  // for the CPU type.
+  bool RelaxBecauseUnresolved = !Resolved && InstrCanRelax;
 
   // Relax if the value is too big for a (signed) i8
   // (or signed i16 if 32 bit branches can be used). This means
   // that byte-wide instructions have to matched by default
   unsigned KindLog2Size = getFixupKindLog2Size(Fixup.getKind());
   bool FixupFieldTooSmall = false;
-  if (!isInt<8>(Value) && KindLog2Size == 0)
+  if (!isInt<8>(Value) && KindLog2Size == 0) {
     FixupFieldTooSmall = true;
-  else if (!isInt<16>(Value) && KindLog2Size <= 1)
+  } else if (!isInt<16>(Value) && KindLog2Size <= 1) {
     FixupFieldTooSmall = true;
+  }
 
   // NOTE
   // A branch to the immediately following instruction automatically
@@ -247,7 +295,8 @@ bool M68kAsmBackend::fixupNeedsRelaxation(const MCFixup &Fixup,
   // displacement field contains $00 (zero offset).
   bool ZeroDisplacementNeedsFixup = Value == 0 && KindLog2Size == 0;
 
-  return ZeroDisplacementNeedsFixup || FixupFieldTooSmall;
+  return ZeroDisplacementNeedsFixup || FixupFieldTooSmall ||
+         RelaxBecauseUnresolved;
 }
 
 // NOTE Can tblgen help at all here to verify there aren't other instructions
diff --git a/llvm/test/CodeGen/M68k/xgot.ll b/llvm/test/CodeGen/M68k/xgot.ll
new file mode 100644
index 00000000000000..ad7ebc2fb38d1b
--- /dev/null
+++ b/llvm/test/CodeGen/M68k/xgot.ll
@@ -0,0 +1,51 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 4
+; RUN: llc -mtriple=m68k --show-mc-encoding -mattr=+xgot -relocation-model=pic -code-model=large < %s | FileCheck %s
+
+ at VBRTag = external global [2147483647 x i8]
+
+define i1 @folded_offset(i32 %conv29) {
+; CHECK-LABEL: folded_offset:
+; CHECK:         .cfi_startproc
+; CHECK-NEXT:  ; %bb.0: ; %entry
+; CHECK-NEXT:    lea (0,%pc), %a0 ; encoding: [0x41,0xfa,0x00,0x00]
+; CHECK-NEXT:    lea _GLOBAL_OFFSET_TABLE_, %a1 ; encoding: [0x43,0xf9,A,A,A,A]
+; CHECK-NEXT:    ; fixup A - offset: 2, value: _GLOBAL_OFFSET_TABLE_, kind: FK_Data_4
+; CHECK-NEXT:    suba.l %a1, %a0 ; encoding: [0x91,0xc9]
+; CHECK-NEXT:    move.l #VBRTag at GOTOFF, %d0 ; encoding: [0x20,0x3c,A,A,A,A]
+; CHECK-NEXT:    ; fixup A - offset: 2, value: VBRTag at GOTOFF, kind: FK_Data_4
+; CHECK-NEXT:    move.b (1,%a0,%d0), %d0 ; encoding: [0x10,0x30,0x08,0x01]
+; CHECK-NEXT:    ext.w %d0 ; encoding: [0x48,0x80]
+; CHECK-NEXT:    ext.l %d0 ; encoding: [0x48,0xc0]
+; CHECK-NEXT:    sub.l (4,%sp), %d0 ; encoding: [0x90,0xaf,0x00,0x04]
+; CHECK-NEXT:    seq %d0 ; encoding: [0x57,0xc0]
+; CHECK-NEXT:    rts ; encoding: [0x4e,0x75]
+entry:
+  %0 = load i8, ptr getelementptr inbounds ([2147483647 x i8], ptr @VBRTag, i32 0, i32 1), align 1
+  %conv30 = sext i8 %0 to i32
+  %cmp31.not = icmp eq i32 %conv30, %conv29
+  ret i1 %cmp31.not
+}
+
+define i1 @non_folded_offset(i32 %conv29) {
+; CHECK-LABEL: non_folded_offset:
+; CHECK:         .cfi_startproc
+; CHECK-NEXT:  ; %bb.0: ; %entry
+; CHECK-NEXT:    lea (0,%pc), %a0 ; encoding: [0x41,0xfa,0x00,0x00]
+; CHECK-NEXT:    lea _GLOBAL_OFFSET_TABLE_, %a1 ; encoding: [0x43,0xf9,A,A,A,A]
+; CHECK-NEXT:    ; fixup A - offset: 2, value: _GLOBAL_OFFSET_TABLE_, kind: FK_Data_4
+; CHECK-NEXT:    suba.l %a1, %a0 ; encoding: [0x91,0xc9]
+; CHECK-NEXT:    move.l #2147483645, %d0 ; encoding: [0x20,0x3c,0x7f,0xff,0xff,0xfd]
+; CHECK-NEXT:    adda.l #VBRTag at GOTOFF, %a0 ; encoding: [0xd1,0xfc,A,A,A,A]
+; CHECK-NEXT:    ; fixup A - offset: 2, value: VBRTag at GOTOFF, kind: FK_Data_4
+; CHECK-NEXT:    move.b (0,%a0,%d0), %d0 ; encoding: [0x10,0x30,0x08,0x00]
+; CHECK-NEXT:    ext.w %d0 ; encoding: [0x48,0x80]
+; CHECK-NEXT:    ext.l %d0 ; encoding: [0x48,0xc0]
+; CHECK-NEXT:    sub.l (4,%sp), %d0 ; encoding: [0x90,0xaf,0x00,0x04]
+; CHECK-NEXT:    seq %d0 ; encoding: [0x57,0xc0]
+; CHECK-NEXT:    rts ; encoding: [0x4e,0x75]
+entry:
+  %0 = load i8, ptr getelementptr inbounds ([2147483647 x i8], ptr @VBRTag, i32 0, i32 2147483645), align 1
+  %conv30 = sext i8 %0 to i32
+  %cmp31.not = icmp eq i32 %conv30, %conv29
+  ret i1 %cmp31.not
+}
diff --git a/llvm/test/MC/M68k/Relocations/PIC/data-gotoff.s b/llvm/test/MC/M68k/Relocations/PIC/data-gotoff.s
index ca1ce52de1ca75..0de930b6fd6582 100644
--- a/llvm/test/MC/M68k/Relocations/PIC/data-gotoff.s
+++ b/llvm/test/MC/M68k/Relocations/PIC/data-gotoff.s
@@ -2,18 +2,49 @@
 ; RUN:   | llvm-readobj -r - | FileCheck -check-prefix=RELOC %s
 ; RUN: llvm-mc -triple m68k -show-encoding --position-independent %s -o - \
 ; RUN:   | FileCheck -check-prefix=INSTR -check-prefix=FIXUP %s
+; RUN: llvm-mc -triple m68k -filetype=obj -mattr=+xgot --position-independent %s -o - \
+; RUN:   | llvm-readobj -r - | FileCheck -check-prefix=RELOC-XGOT %s
+; RUN: llvm-mc -triple m68k -show-encoding -mattr=+xgot --position-independent %s -o - \
+; RUN:   | FileCheck -check-prefix=INSTR -check-prefix=FIXUP-XGOT %s
+
+; RUN: llvm-mc -triple m68k --mcpu=M68020 -filetype=obj --position-independent %s -o - \
+; RUN:   | llvm-readobj -r - | FileCheck -check-prefix=RELOC32 %s
+; RUN: llvm-mc -triple m68k --mcpu=M68020 -show-encoding --position-independent %s -o - \
+; RUN:   | FileCheck -check-prefix=INSTR -check-prefix=FIXUP32 %s
+; RUN: llvm-mc -triple m68k --mcpu=M68020 -filetype=obj -mattr=+xgot --position-independent %s -o - \
+; RUN:   | llvm-readobj -r - | FileCheck -check-prefix=RELOC-XGOT32 %s
+; RUN: llvm-mc -triple m68k --mcpu=M68020 -show-encoding -mattr=+xgot --position-independent %s -o - \
+; RUN:   | FileCheck -check-prefix=INSTR -check-prefix=FIXUP-XGOT32 %s
 
-; RELOC: R_68K_GOTOFF8 dst1 0x0
 ; INSTR: move.l  (dst1 at GOTOFF,%a5,%d0), %d0
+; RELOC: R_68K_GOTOFF8 dst1 0x0
+; RELOC32: R_68K_GOTOFF8 dst1 0x0
+; RELOC-XGOT: R_68K_GOTOFF8 dst1 0x0
+; RELOC-XGO32T: R_68K_GOTOFF8 dst1 0x0
 ; FIXUP: fixup A - offset: 3, value: dst1 at GOTOFF, kind: FK_Data_1
+; FIXUP32: fixup A - offset: 3, value: dst1 at GOTOFF, kind: FK_Data_1
+; FIXUP-XGOT: fixup A - offset: 3, value: dst1 at GOTOFF, kind: FK_Data_1
+; FIXUP-XGOT32: fixup A - offset: 3, value: dst1 at GOTOFF, kind: FK_Data_1
 move.l	(dst1 at GOTOFF,%a5,%d0), %d0
 
-; RELOC: R_68K_GOTOFF16 dst2 0x0
 ; INSTR: move.l  (dst2 at GOTOFF,%a5), %d0
+; RELOC: R_68K_GOTOFF16 dst2 0x0
+; RELOC32: R_68K_GOTOFF16 dst2 0x0
+; RELOC-XGOT: R_68K_GOTOFF16 dst2 0x0
+; RELOC-XGOT32: R_68K_GOTOFF16 dst2 0x0
 ; FIXUP: fixup A - offset: 2, value: dst2 at GOTOFF, kind: FK_Data_2
+; FIXUP32: fixup A - offset: 2, value: dst2 at GOTOFF, kind: FK_Data_2
+; FIXUP-XGOT: fixup A - offset: 2, value: dst2 at GOTOFF, kind: FK_Data_2
+; FIXUP-XGOT32: fixup A - offset: 2, value: dst2 at GOTOFF, kind: FK_Data_2
 move.l	(dst2 at GOTOFF,%a5), %d0
 
-; RELOC: R_68K_GOTPCREL16 dst3 0x0
 ; INSTR: lea     (dst3 at GOTPCREL,%pc), %a5
+; RELOC: R_68K_GOTPCREL16 dst3 0x0
+; RELOC32: R_68K_GOTPCREL16 dst3 0x0
+; RELOC-XGOT: R_68K_GOTPCREL16 dst3 0x0
+; RELOC-XGOT32: R_68K_GOTPCREL16 dst3 0x0
 ; FIXUP: fixup A - offset: 2, value: dst3 at GOTPCREL, kind: FK_PCRel_2
+; FIXUP32: fixup A - offset: 2, value: dst3 at GOTPCREL, kind: FK_PCRel_2
+; FIXUP-XGOT: fixup A - offset: 2, value: dst3 at GOTPCREL, kind: FK_PCRel_2
+; FIXUP-XGOT32: fixup A - offset: 2, value: dst3 at GOTPCREL, kind: FK_PCRel_2
 lea	(dst3 at GOTPCREL,%pc), %a5



More information about the llvm-commits mailing list