[PATCH] D109773: [AMDGPU] Inline non-kernel functions using extern lds
Vang Thao via Phabricator via llvm-commits
llvm-commits at lists.llvm.org
Thu Sep 16 10:59:40 PDT 2021
This revision was automatically updated to reflect the committed changes.
Closed by commit rG106959acc15c: [AMDGPU] Inline non-kernel functions using extern lds (authored by vangthao).
Repository:
rG LLVM Github Monorepo
CHANGES SINCE LAST ACTION
https://reviews.llvm.org/D109773/new/
https://reviews.llvm.org/D109773
Files:
llvm/lib/Target/AMDGPU/AMDGPUAlwaysInlinePass.cpp
llvm/test/CodeGen/AMDGPU/hip.extern.shared.array.ll
Index: llvm/test/CodeGen/AMDGPU/hip.extern.shared.array.ll
===================================================================
--- llvm/test/CodeGen/AMDGPU/hip.extern.shared.array.ll
+++ llvm/test/CodeGen/AMDGPU/hip.extern.shared.array.ll
@@ -135,4 +135,25 @@
ret void
}
+; CHECK-LABEL: dynamic_shared_array_with_call:
+; CHECK-NOT: s_swappc_b64
+define amdgpu_kernel void @dynamic_shared_array_with_call(float addrspace(1)* nocapture readnone %out) local_unnamed_addr {
+ %tid.x = tail call i32 @llvm.amdgcn.workitem.id.x()
+ %1 = sext i32 %tid.x to i64
+ %arrayidx0 = getelementptr inbounds [512 x float], [512 x float] addrspace(3)* @lds0, i64 0, i64 %1
+ %val0 = load float, float addrspace(3)* %arrayidx0, align 4
+ tail call void @store_value(float %val0)
+ ret void
+}
+
+; CHECK-NOT: store_value
+define linkonce_odr hidden void @store_value(float %val1) local_unnamed_addr {
+entry:
+ %tid.x = tail call i32 @llvm.amdgcn.workitem.id.x()
+ %0 = sext i32 %tid.x to i64
+ %arrayidx1 = getelementptr inbounds [0 x float], [0 x float] addrspace(3)* @dynamic_shared0, i64 0, i64 %0
+ store float %val1, float addrspace(3)* %arrayidx1, align 4
+ ret void
+}
+
declare i32 @llvm.amdgcn.workitem.id.x()
Index: llvm/lib/Target/AMDGPU/AMDGPUAlwaysInlinePass.cpp
===================================================================
--- llvm/lib/Target/AMDGPU/AMDGPUAlwaysInlinePass.cpp
+++ llvm/lib/Target/AMDGPU/AMDGPUAlwaysInlinePass.cpp
@@ -122,7 +122,7 @@
unsigned AS = GV.getAddressSpace();
if ((AS == AMDGPUAS::REGION_ADDRESS) ||
(AS == AMDGPUAS::LOCAL_ADDRESS &&
- !AMDGPUTargetMachine::EnableLowerModuleLDS))
+ (!AMDGPUTargetMachine::EnableLowerModuleLDS || !GV.hasInitializer())))
recursivelyVisitUsers(GV, FuncsToAlwaysInline);
}
-------------- next part --------------
A non-text attachment was scrubbed...
Name: D109773.372998.patch
Type: text/x-patch
Size: 1801 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/llvm-commits/attachments/20210916/bd544a17/attachment.bin>
More information about the llvm-commits
mailing list