[llvm] aead088 - [AMDGPU] Avoid repeated hash lookups (NFC) (#131419)
via llvm-commits
llvm-commits at lists.llvm.org
Fri Mar 14 23:54:53 PDT 2025
- Previous message: [llvm] 1762f16 - [InstCombine] Fold `umax/umin(nuw_shl(z, x), nuw_shl(z, y)) -> nuw_shl(z, umax/umin(x, y))` and `umax/umin(nuw_shl(x, z), nuw_shl(y, z)) -> nuw_shl(umax/umin(x, y), z)` (#131076)
- Next message: [llvm] 2ada0c1 - [AArch64] Move fixELFSymbolsInTLSFixups to getRelocType
- Messages sorted by:
[ date ]
[ thread ]
[ subject ]
[ author ]
Author: Kazu Hirata
Date: 2025-03-14T23:54:49-07:00
New Revision: aead088f02b9452ac151a77e05228ad9458a6eb5
URL: https://github.com/llvm/llvm-project/commit/aead088f02b9452ac151a77e05228ad9458a6eb5
DIFF: https://github.com/llvm/llvm-project/commit/aead088f02b9452ac151a77e05228ad9458a6eb5.diff
LOG: [AMDGPU] Avoid repeated hash lookups (NFC) (#131419)
Added:
Modified:
llvm/lib/Target/AMDGPU/SIMachineFunctionInfo.cpp
Removed:
################################################################################
diff --git a/llvm/lib/Target/AMDGPU/SIMachineFunctionInfo.cpp b/llvm/lib/Target/AMDGPU/SIMachineFunctionInfo.cpp
index abd19c988a7eb..93b030b0e0a70 100644
--- a/llvm/lib/Target/AMDGPU/SIMachineFunctionInfo.cpp
+++ b/llvm/lib/Target/AMDGPU/SIMachineFunctionInfo.cpp
@@ -254,8 +254,8 @@ Register SIMachineFunctionInfo::addLDSKernelId() {
SmallVectorImpl<MCRegister> *SIMachineFunctionInfo::addPreloadedKernArg(
const SIRegisterInfo &TRI, const TargetRegisterClass *RC,
unsigned AllocSizeDWord, int KernArgIdx, int PaddingSGPRs) {
- assert(!ArgInfo.PreloadKernArgs.count(KernArgIdx) &&
- "Preload kernel argument allocated twice.");
+ auto [It, Inserted] = ArgInfo.PreloadKernArgs.try_emplace(KernArgIdx);
+ assert(Inserted && "Preload kernel argument allocated twice.");
NumUserSGPRs += PaddingSGPRs;
// If the available register tuples are aligned with the kernarg to be
// preloaded use that register, otherwise we need to use a set of SGPRs and
@@ -264,20 +264,22 @@ SmallVectorImpl<MCRegister> *SIMachineFunctionInfo::addPreloadedKernArg(
ArgInfo.FirstKernArgPreloadReg = getNextUserSGPR();
Register PreloadReg =
TRI.getMatchingSuperReg(getNextUserSGPR(), AMDGPU::sub0, RC);
+ auto &Regs = It->second.Regs;
if (PreloadReg &&
(RC == &AMDGPU::SReg_32RegClass || RC == &AMDGPU::SReg_64RegClass)) {
- ArgInfo.PreloadKernArgs[KernArgIdx].Regs.push_back(PreloadReg);
+ Regs.push_back(PreloadReg);
NumUserSGPRs += AllocSizeDWord;
} else {
+ Regs.reserve(AllocSizeDWord);
for (unsigned I = 0; I < AllocSizeDWord; ++I) {
- ArgInfo.PreloadKernArgs[KernArgIdx].Regs.push_back(getNextUserSGPR());
+ Regs.push_back(getNextUserSGPR());
NumUserSGPRs++;
}
}
// Track the actual number of SGPRs that HW will preload to.
UserSGPRInfo.allocKernargPreloadSGPRs(AllocSizeDWord + PaddingSGPRs);
- return &ArgInfo.PreloadKernArgs[KernArgIdx].Regs;
+ return &Regs;
}
void SIMachineFunctionInfo::allocateWWMSpill(MachineFunction &MF, Register VGPR,
- Previous message: [llvm] 1762f16 - [InstCombine] Fold `umax/umin(nuw_shl(z, x), nuw_shl(z, y)) -> nuw_shl(z, umax/umin(x, y))` and `umax/umin(nuw_shl(x, z), nuw_shl(y, z)) -> nuw_shl(umax/umin(x, y), z)` (#131076)
- Next message: [llvm] 2ada0c1 - [AArch64] Move fixELFSymbolsInTLSFixups to getRelocType
- Messages sorted by:
[ date ]
[ thread ]
[ subject ]
[ author ]
More information about the llvm-commits
mailing list