[Openmp-commits] [PATCH] D105229: [libomptarget][nfc] Replace out arguments with struct return
Jon Chesterfield via Phabricator via Openmp-commits
openmp-commits at lists.llvm.org
Wed Jun 30 14:29:39 PDT 2021
JonChesterfield updated this revision to Diff 355688.
JonChesterfield added a comment.
Herald added a reviewer: jdoerfert.
Herald added a subscriber: sstefan1.
- hoist access to device id
Repository:
rG LLVM Github Monorepo
CHANGES SINCE LAST ACTION
https://reviews.llvm.org/D105229/new/
https://reviews.llvm.org/D105229
Files:
openmp/libomptarget/plugins/amdgpu/src/rtl.cpp
Index: openmp/libomptarget/plugins/amdgpu/src/rtl.cpp
===================================================================
--- openmp/libomptarget/plugins/amdgpu/src/rtl.cpp
+++ openmp/libomptarget/plugins/amdgpu/src/rtl.cpp
@@ -1884,14 +1884,21 @@
// Inputs: Max_Teams, Max_WG_Size, Warp_Size, ExecutionMode,
// EnvTeamLimit, EnvNumTeams, num_teams, thread_limit,
// loop_tripcount.
-void getLaunchVals(int &threadsPerGroup, int &num_groups, int ConstWGSize,
- int ExecutionMode, int EnvTeamLimit, int EnvNumTeams,
- int num_teams, int thread_limit, uint64_t loop_tripcount,
- int32_t device_id) {
+struct launchVals {
+ int threadsPerGroup;
+ int num_groups;
+};
+
+launchVals getLaunchVals(int ConstWGSize, int ExecutionMode, int EnvTeamLimit,
+ int EnvNumTeams, int num_teams, int thread_limit,
+ uint64_t loop_tripcount, int DeviceNumTeams) {
+
+ int threadsPerGroup = RTLDeviceInfoTy::Default_WG_Size;
+ int num_groups = 0;
int Max_Teams = DeviceInfo.EnvMaxTeamsDefault > 0
? DeviceInfo.EnvMaxTeamsDefault
- : DeviceInfo.NumTeams[device_id];
+ : DeviceNumTeams;
if (Max_Teams > DeviceInfo.HardTeamLimit)
Max_Teams = DeviceInfo.HardTeamLimit;
@@ -2021,6 +2028,11 @@
}
DP("Final %d num_groups and %d threadsPerGroup\n", num_groups,
threadsPerGroup);
+
+ launchVals res;
+ res.threadsPerGroup = threadsPerGroup;
+ res.num_groups = num_groups;
+ return res;
}
static uint64_t acquire_available_packet_id(hsa_queue_t *queue) {
@@ -2098,17 +2110,15 @@
/*
* Set limit based on ThreadsPerGroup and GroupsPerDevice
*/
- int num_groups = 0;
-
- int threadsPerGroup = RTLDeviceInfoTy::Default_WG_Size;
-
- getLaunchVals(threadsPerGroup, num_groups, KernelInfo->ConstWGSize,
- KernelInfo->ExecutionMode, DeviceInfo.EnvTeamLimit,
- DeviceInfo.EnvNumTeams,
- num_teams, // From run_region arg
- thread_limit, // From run_region arg
- loop_tripcount, // From run_region arg
- KernelInfo->device_id);
+ launchVals LV =
+ getLaunchVals(KernelInfo->ConstWGSize, KernelInfo->ExecutionMode,
+ DeviceInfo.EnvTeamLimit, DeviceInfo.EnvNumTeams,
+ num_teams, // From run_region arg
+ thread_limit, // From run_region arg
+ loop_tripcount, // From run_region arg
+ DeviceInfo.NumTeams[KernelInfo->device_id]);
+ int num_groups = LV.num_groups;
+ int threadsPerGroup = LV.threadsPerGroup;
if (print_kernel_trace >= LAUNCH) {
// enum modes are SPMD, GENERIC, NONE 0,1,2
-------------- next part --------------
A non-text attachment was scrubbed...
Name: D105229.355688.patch
Type: text/x-patch
Size: 2804 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/openmp-commits/attachments/20210630/6f203c7e/attachment-0001.bin>
More information about the Openmp-commits
mailing list