[PATCH] D139045: [HIP] support --offload-arch=native
Yaxun Liu via Phabricator via cfe-commits
cfe-commits at lists.llvm.org
Mon Dec 12 12:54:11 PST 2022
yaxunl updated this revision to Diff 482234.
yaxunl retitled this revision from "[HIP] use detected GPU in --offload-arch" to "[HIP] support --offload-arch=native".
yaxunl edited the summary of this revision.
yaxunl added a comment.
Use the detected GPU when --offload-arch=native is specified, based on the RFC discussion.
CHANGES SINCE LAST ACTION
https://reviews.llvm.org/D139045/new/
https://reviews.llvm.org/D139045
Files:
clang/lib/Driver/Driver.cpp
clang/lib/Driver/ToolChains/AMDGPU.h
Index: clang/lib/Driver/ToolChains/AMDGPU.h
===================================================================
--- clang/lib/Driver/ToolChains/AMDGPU.h
+++ clang/lib/Driver/ToolChains/AMDGPU.h
@@ -107,6 +107,9 @@
llvm::Error getSystemGPUArch(const llvm::opt::ArgList &Args,
std::string &GPUArch) const;
+ llvm::Error detectSystemGPUs(const llvm::opt::ArgList &Args,
+ SmallVector<std::string, 1> &GPUArchs) const;
+
protected:
/// Check and diagnose invalid target ID specified by -mcpu.
virtual void checkTargetID(const llvm::opt::ArgList &DriverArgs) const;
@@ -126,8 +129,6 @@
/// Get GPU arch from -mcpu without checking.
StringRef getGPUArch(const llvm::opt::ArgList &DriverArgs) const;
- llvm::Error detectSystemGPUs(const llvm::opt::ArgList &Args,
- SmallVector<std::string, 1> &GPUArchs) const;
};
class LLVM_LIBRARY_VISIBILITY ROCMToolChain : public AMDGPUToolChain {
Index: clang/lib/Driver/Driver.cpp
===================================================================
--- clang/lib/Driver/Driver.cpp
+++ clang/lib/Driver/Driver.cpp
@@ -3055,6 +3055,7 @@
}
// Collect all offload arch parameters, removing duplicates.
+ const StringRef NativeArchStr = "native";
std::set<StringRef> GpuArchs;
bool Error = false;
for (Arg *A : Args) {
@@ -3067,6 +3068,15 @@
if (A->getOption().matches(options::OPT_no_offload_arch_EQ) &&
ArchStr == "all") {
GpuArchs.clear();
+ } else if (ArchStr == NativeArchStr &&
+ ToolChains.front()->getTriple().isAMDGPU()) {
+ auto *TC = static_cast<const toolchains::HIPAMDToolChain *>(
+ ToolChains.front());
+ SmallVector<std::string, 1> GPUs;
+ if (!TC->detectSystemGPUs(Args, GPUs)) {
+ for (auto GPU : GPUs)
+ GpuArchs.insert(Args.MakeArgString(GPU));
+ }
} else {
ArchStr = getCanonicalOffloadArch(ArchStr);
if (ArchStr.empty()) {
-------------- next part --------------
A non-text attachment was scrubbed...
Name: D139045.482234.patch
Type: text/x-patch
Size: 2124 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/cfe-commits/attachments/20221212/df9d5767/attachment.bin>
More information about the cfe-commits
mailing list