[llvm] [AMDGPU] Handle lowering addrspace casts from LDS to FLAT address in amdgpu-sw-lower-lds. (PR #121214)
Matt Arsenault via llvm-commits
llvm-commits at lists.llvm.org
Mon Feb 17 22:00:44 PST 2025
================
@@ -668,22 +668,18 @@ Value *AMDGPUSwLowerLDS::getTranslatedGlobalMemoryPtrOfLDS(Value *LoadMallocPtr,
Value *LDSPtr) {
assert(LDSPtr && "Invalid LDS pointer operand");
Type *LDSPtrType = LDSPtr->getType();
-
- if (LDSPtrType->isVectorTy()) {
+ auto &Ctx = M.getContext();
+ const auto &DL = M.getDataLayout();
+ auto *IntPtrTy = DL.getIntPtrType(Ctx, AMDGPUAS::LOCAL_ADDRESS);
+ if (auto *VecPtrTy = dyn_cast<VectorType>(LDSPtrType)) {
// Handle vector of pointers
- VectorType *VecPtrTy = cast<VectorType>(LDSPtrType);
ElementCount NumElements = VecPtrTy->getElementCount();
- Type *Int32VecTy = VectorType::get(IRB.getInt32Ty(), NumElements);
- Value *PtrToInt = IRB.CreatePtrToInt(LDSPtr, Int32VecTy);
+ Type *IntVecTy = VectorType::get(IntPtrTy, NumElements);
+ Value *PtrToInt = IRB.CreatePtrToInt(LDSPtr, IntVecTy);
// Create vector of pointers to global address space
- Type *GlobalPtrVecTy =
- VectorType::get(IRB.getPtrTy(AMDGPUAS::GLOBAL_ADDRESS), NumElements);
- Value *GlobalPtrVec =
- IRB.CreateInBoundsGEP(IRB.getInt8Ty(), LoadMallocPtr, PtrToInt);
- GlobalPtrVec = IRB.CreateBitCast(GlobalPtrVec, GlobalPtrVecTy);
- return GlobalPtrVec;
+ return IRB.CreateInBoundsGEP(IRB.getInt8Ty(), LoadMallocPtr, PtrToInt);
----------------
arsenm wrote:
You can use the same code for the scalar case. The GEP supports scalar base with vector offset, you just need to use the correct type
https://github.com/llvm/llvm-project/pull/121214
More information about the llvm-commits
mailing list