[llvm] 845cc96 - [clang][llvm][aarch64][win] Add a clang flag and module attribute for import call optimization, and remove LLVM flag (#122831)
via llvm-commits
llvm-commits at lists.llvm.org
Thu Jan 30 09:51:47 PST 2025
Author: Daniel Paoliello
Date: 2025-01-30T09:51:43-08:00
New Revision: 845cc968e987492bda6a62c9a87cd96cfc631d5b
URL: https://github.com/llvm/llvm-project/commit/845cc968e987492bda6a62c9a87cd96cfc631d5b
DIFF: https://github.com/llvm/llvm-project/commit/845cc968e987492bda6a62c9a87cd96cfc631d5b.diff
LOG: [clang][llvm][aarch64][win] Add a clang flag and module attribute for import call optimization, and remove LLVM flag (#122831)
Switches import call optimization from being enabled by an LLVM flag to
instead using a module attribute, and creates a new Clang flag that will
set that attribute. This addresses the concern raised in the original
PR:
<https://github.com/llvm/llvm-project/pull/121516#discussion_r1911763991>
This change also only creates the Called Global info if the module
attribute is present, addressing this concern:
<https://github.com/llvm/llvm-project/pull/122762#pullrequestreview-2547595934>
Added:
clang/test/CodeGen/import-call-optimization.c
Modified:
clang/include/clang/Basic/CodeGenOptions.def
clang/include/clang/Driver/Options.td
clang/lib/CodeGen/CodeGenModule.cpp
llvm/lib/Target/AArch64/AArch64AsmPrinter.cpp
llvm/lib/Target/AArch64/AArch64ISelLowering.cpp
llvm/test/CodeGen/AArch64/win-import-call-optimization-nocalls.ll
llvm/test/CodeGen/AArch64/win-import-call-optimization.ll
Removed:
################################################################################
diff --git a/clang/include/clang/Basic/CodeGenOptions.def b/clang/include/clang/Basic/CodeGenOptions.def
index 259972bdf8f001..386652d2efa9e1 100644
--- a/clang/include/clang/Basic/CodeGenOptions.def
+++ b/clang/include/clang/Basic/CodeGenOptions.def
@@ -465,6 +465,10 @@ ENUM_CODEGENOPT(ZeroCallUsedRegs, llvm::ZeroCallUsedRegs::ZeroCallUsedRegsKind,
/// non-deleting destructors. (No effect on Microsoft ABI.)
CODEGENOPT(CtorDtorReturnThis, 1, 0)
+/// Enables emitting Import Call sections on supported targets that can be used
+/// by the Windows kernel to enable import call optimization.
+CODEGENOPT(ImportCallOptimization, 1, 0)
+
/// FIXME: Make DebugOptions its own top-level .def file.
#include "DebugOptions.def"
diff --git a/clang/include/clang/Driver/Options.td b/clang/include/clang/Driver/Options.td
index f7a425bbd5eb7c..d8123cc39fdc95 100644
--- a/clang/include/clang/Driver/Options.td
+++ b/clang/include/clang/Driver/Options.td
@@ -7587,6 +7587,11 @@ def fexperimental_assignment_tracking_EQ : Joined<["-"], "fexperimental-assignme
def enable_tlsdesc : Flag<["-"], "enable-tlsdesc">,
MarshallingInfoFlag<CodeGenOpts<"EnableTLSDESC">>;
+def import_call_optimization : Flag<["-"], "import-call-optimization">,
+ HelpText<"Emit Import Call sections on supported targets that can be used "
+ "by the Windows kernel to enable import call optimization">,
+ MarshallingInfoFlag<CodeGenOpts<"ImportCallOptimization">>;
+
} // let Visibility = [CC1Option]
//===----------------------------------------------------------------------===//
diff --git a/clang/lib/CodeGen/CodeGenModule.cpp b/clang/lib/CodeGen/CodeGenModule.cpp
index a015d64f4065aa..05879cd486a8c9 100644
--- a/clang/lib/CodeGen/CodeGenModule.cpp
+++ b/clang/lib/CodeGen/CodeGenModule.cpp
@@ -1293,6 +1293,11 @@ void CodeGenModule::Release() {
if (LangOpts.EHAsynch)
getModule().addModuleFlag(llvm::Module::Warning, "eh-asynch", 1);
+ // Emit Import Call section.
+ if (CodeGenOpts.ImportCallOptimization)
+ getModule().addModuleFlag(llvm::Module::Warning, "import-call-optimization",
+ 1);
+
// Indicate whether this Module was compiled with -fopenmp
if (getLangOpts().OpenMP && !getLangOpts().OpenMPSimd)
getModule().addModuleFlag(llvm::Module::Max, "openmp", LangOpts.OpenMP);
diff --git a/clang/test/CodeGen/import-call-optimization.c b/clang/test/CodeGen/import-call-optimization.c
new file mode 100644
index 00000000000000..cc4e37fda7bb1d
--- /dev/null
+++ b/clang/test/CodeGen/import-call-optimization.c
@@ -0,0 +1,5 @@
+// RUN: %clang_cc1 -import-call-optimization -emit-llvm %s -o - | FileCheck %s
+
+void f(void) {}
+
+// CHECK: !"import-call-optimization", i32 1}
diff --git a/llvm/lib/Target/AArch64/AArch64AsmPrinter.cpp b/llvm/lib/Target/AArch64/AArch64AsmPrinter.cpp
index c6b4a219d201f7..f1f25b65fc53fa 100644
--- a/llvm/lib/Target/AArch64/AArch64AsmPrinter.cpp
+++ b/llvm/lib/Target/AArch64/AArch64AsmPrinter.cpp
@@ -78,11 +78,6 @@ static cl::opt<PtrauthCheckMode> PtrauthAuthChecks(
cl::desc("Check pointer authentication auth/resign failures"),
cl::init(Default));
-static cl::opt<bool> EnableImportCallOptimization(
- "aarch64-win-import-call-optimization", cl::Hidden,
- cl::desc("Enable import call optimization for AArch64 Windows"),
- cl::init(false));
-
#define DEBUG_TYPE "asm-printer"
namespace {
@@ -95,6 +90,7 @@ class AArch64AsmPrinter : public AsmPrinter {
#ifndef NDEBUG
unsigned InstsEmitted;
#endif
+ bool EnableImportCallOptimization = false;
DenseMap<MCSection *, std::vector<std::pair<MCSymbol *, MCSymbol *>>>
SectionToImportedFunctionCalls;
@@ -344,6 +340,9 @@ void AArch64AsmPrinter::emitStartOfAsmFile(Module &M) {
OutStreamer->emitSymbolAttribute(S, MCSA_Global);
OutStreamer->emitAssignment(
S, MCConstantExpr::create(Feat00Value, MMI->getContext()));
+
+ if (M.getModuleFlag("import-call-optimization"))
+ EnableImportCallOptimization = true;
}
if (!TT.isOSBinFormatELF())
@@ -3172,8 +3171,7 @@ void AArch64AsmPrinter::emitInstruction(const MachineInstr *MI) {
void AArch64AsmPrinter::recordIfImportCall(
const llvm::MachineInstr *BranchInst) {
- if (!EnableImportCallOptimization ||
- !TM.getTargetTriple().isOSBinFormatCOFF())
+ if (!EnableImportCallOptimization)
return;
auto [GV, OpFlags] = BranchInst->getMF()->tryGetCalledGlobal(BranchInst);
diff --git a/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp b/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp
index 02f2aecfdfefe1..a396198013fc3c 100644
--- a/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp
+++ b/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp
@@ -9573,7 +9573,8 @@ AArch64TargetLowering::LowerCall(CallLoweringInfo &CLI,
DAG.addNoMergeSiteInfo(Ret.getNode(), CLI.NoMerge);
DAG.addCallSiteInfo(Ret.getNode(), std::move(CSInfo));
- if (CalledGlobal)
+ if (CalledGlobal &&
+ MF.getFunction().getParent()->getModuleFlag("import-call-optimization"))
DAG.addCalledGlobal(Ret.getNode(), CalledGlobal, OpFlags);
return Ret;
}
@@ -9586,7 +9587,8 @@ AArch64TargetLowering::LowerCall(CallLoweringInfo &CLI,
DAG.addNoMergeSiteInfo(Chain.getNode(), CLI.NoMerge);
InGlue = Chain.getValue(1);
DAG.addCallSiteInfo(Chain.getNode(), std::move(CSInfo));
- if (CalledGlobal)
+ if (CalledGlobal &&
+ MF.getFunction().getParent()->getModuleFlag("import-call-optimization"))
DAG.addCalledGlobal(Chain.getNode(), CalledGlobal, OpFlags);
uint64_t CalleePopBytes =
diff --git a/llvm/test/CodeGen/AArch64/win-import-call-optimization-nocalls.ll b/llvm/test/CodeGen/AArch64/win-import-call-optimization-nocalls.ll
index 81d6d6369dcbf4..b17f2d113c0d29 100644
--- a/llvm/test/CodeGen/AArch64/win-import-call-optimization-nocalls.ll
+++ b/llvm/test/CodeGen/AArch64/win-import-call-optimization-nocalls.ll
@@ -1,4 +1,4 @@
-; RUN: llc -mtriple=aarch64-pc-windows-msvc -aarch64-win-import-call-optimization < %s | FileCheck %s
+; RUN: llc -mtriple=aarch64-pc-windows-msvc < %s | FileCheck %s
define dso_local void @normal_call() local_unnamed_addr {
entry:
@@ -16,3 +16,6 @@ declare void @a() local_unnamed_addr
; CHECK-LABEL .section .impcall,"yi"
; CHECK-NEXT .asciz "Imp_Call_V1"
; CHECK-NOT .secnum
+
+!llvm.module.flags = !{!0}
+!0 = !{i32 1, !"import-call-optimization", i32 1}
diff --git a/llvm/test/CodeGen/AArch64/win-import-call-optimization.ll b/llvm/test/CodeGen/AArch64/win-import-call-optimization.ll
index 6bb118ba1e1596..2cf0f8bb6baa5c 100644
--- a/llvm/test/CodeGen/AArch64/win-import-call-optimization.ll
+++ b/llvm/test/CodeGen/AArch64/win-import-call-optimization.ll
@@ -1,7 +1,4 @@
-; RUN: llc -mtriple=aarch64-pc-windows-msvc -aarch64-win-import-call-optimization < %s | FileCheck %s --check-prefix=CHECK-ENABLED
-; RUN: llc -mtriple=aarch64-pc-windows-msvc < %s | FileCheck %s --check-prefix=CHECK-DISABLED
-
-; CHECK-DISABLED-NOT: .section .impcall
+; RUN: llc -mtriple=aarch64-pc-windows-msvc < %s | FileCheck %s --check-prefix=CHECK
define dso_local void @normal_call() local_unnamed_addr section "nc_sect" {
entry:
@@ -9,40 +6,43 @@ entry:
call void @a()
ret void
}
-; CHECK-ENABLED-LABEL: normal_call:
-; CHECK-ENABLED: adrp [[ADRPREG:x[0-9]+]], __imp_a
-; CHECK-ENABLED-NEXT: ldr [[LDRREG:x[0-9]+]], [[[ADRPREG]], :lo12:__imp_a]
-; CHECK-ENABLED-NEXT: .Limpcall0:
-; CHECK-ENABLED-NEXT: blr [[LDRREG]]
-; CHECK-ENABLED-NEXT: .Limpcall1:
-; CHECK-ENABLED-NEXT: blr [[LDRREG]]
+; CHECK-LABEL: normal_call:
+; CHECK: adrp [[ADRPREG:x[0-9]+]], __imp_a
+; CHECK-NEXT: ldr [[LDRREG:x[0-9]+]], [[[ADRPREG]], :lo12:__imp_a]
+; CHECK-NEXT: .Limpcall0:
+; CHECK-NEXT: blr [[LDRREG]]
+; CHECK-NEXT: .Limpcall1:
+; CHECK-NEXT: blr [[LDRREG]]
define dso_local void @tail_call() local_unnamed_addr section "tc_sect" {
entry:
tail call void @b()
ret void
}
-; CHECK-ENABLED-LABEL: tail_call:
-; CHECK-ENABLED: adrp [[ADRPREG:x[0-9]+]], __imp_b
-; CHECK-ENABLED-NEXT: ldr [[LDRREG:x[0-9]+]], [[[ADRPREG]], :lo12:__imp_b]
-; CHECK-ENABLED-NEXT: .Limpcall2:
-; CHECK-ENABLED-NEXT: br [[LDRREG]]
+; CHECK-LABEL: tail_call:
+; CHECK: adrp [[ADRPREG:x[0-9]+]], __imp_b
+; CHECK-NEXT: ldr [[LDRREG:x[0-9]+]], [[[ADRPREG]], :lo12:__imp_b]
+; CHECK-NEXT: .Limpcall2:
+; CHECK-NEXT: br [[LDRREG]]
declare dllimport void @a() local_unnamed_addr
declare dllimport void @b() local_unnamed_addr
-; CHECK-ENABLED-LABEL .section .impcall,"yi"
-; CHECK-ENABLED-NEXT .asciz "Imp_Call_V1"
-; CHECK-ENABLED-NEXT .word 32
-; CHECK-ENABLED-NEXT .secnum nc_sect
-; CHECK-ENABLED-NEXT .word 19
-; CHECK-ENABLED-NEXT .secoffset .Limpcall0
-; CHECK-ENABLED-NEXT .symidx __imp_a
-; CHECK-ENABLED-NEXT .word 19
-; CHECK-ENABLED-NEXT .secoffset .Limpcall1
-; CHECK-ENABLED-NEXT .symidx __imp_a
-; CHECK-ENABLED-NEXT .word 20
-; CHECK-ENABLED-NEXT .secnum tc_sect
-; CHECK-ENABLED-NEXT .word 19
-; CHECK-ENABLED-NEXT .secoffset .Limpcall2
-; CHECK-ENABLED-NEXT .symidx __imp_b
+; CHECK-LABEL .section .impcall,"yi"
+; CHECK-NEXT .asciz "Imp_Call_V1"
+; CHECK-NEXT .word 32
+; CHECK-NEXT .secnum nc_sect
+; CHECK-NEXT .word 19
+; CHECK-NEXT .secoffset .Limpcall0
+; CHECK-NEXT .symidx __imp_a
+; CHECK-NEXT .word 19
+; CHECK-NEXT .secoffset .Limpcall1
+; CHECK-NEXT .symidx __imp_a
+; CHECK-NEXT .word 20
+; CHECK-NEXT .secnum tc_sect
+; CHECK-NEXT .word 19
+; CHECK-NEXT .secoffset .Limpcall2
+; CHECK-NEXT .symidx __imp_b
+
+!llvm.module.flags = !{!0}
+!0 = !{i32 1, !"import-call-optimization", i32 1}
More information about the llvm-commits
mailing list