[Openmp-commits] [PATCH] D105229: [libomptarget][nfc] Replace out arguments with struct return
Jon Chesterfield via Phabricator via Openmp-commits
openmp-commits at lists.llvm.org
Wed Jun 30 14:20:26 PDT 2021
JonChesterfield created this revision.
JonChesterfield added reviewers: pdhaliwal, dhruvachak, ronlieb.
Herald added subscribers: kerbowa, nhaehnle, jvesely.
JonChesterfield requested review of this revision.
Herald added a project: OpenMP.
Herald added a subscriber: openmp-commits.
[libomptarget][nfc] Replace out arguments with struct return
A step towards making this function sufficiently self-contained that it
can be tested easily. No functional change intended here; variable
names are left unchanged.
Repository:
rG LLVM Github Monorepo
https://reviews.llvm.org/D105229
Files:
openmp/libomptarget/plugins/amdgpu/src/rtl.cpp
Index: openmp/libomptarget/plugins/amdgpu/src/rtl.cpp
===================================================================
--- openmp/libomptarget/plugins/amdgpu/src/rtl.cpp
+++ openmp/libomptarget/plugins/amdgpu/src/rtl.cpp
@@ -1884,10 +1884,17 @@
// Inputs: Max_Teams, Max_WG_Size, Warp_Size, ExecutionMode,
// EnvTeamLimit, EnvNumTeams, num_teams, thread_limit,
// loop_tripcount.
-void getLaunchVals(int &threadsPerGroup, int &num_groups, int ConstWGSize,
- int ExecutionMode, int EnvTeamLimit, int EnvNumTeams,
- int num_teams, int thread_limit, uint64_t loop_tripcount,
- int32_t device_id) {
+struct launchVals {
+ int threadsPerGroup;
+ int num_groups;
+};
+
+launchVals getLaunchVals(int ConstWGSize, int ExecutionMode, int EnvTeamLimit,
+ int EnvNumTeams, int num_teams, int thread_limit,
+ uint64_t loop_tripcount, int32_t device_id) {
+
+ int threadsPerGroup = RTLDeviceInfoTy::Default_WG_Size;
+ int num_groups = 0;
int Max_Teams = DeviceInfo.EnvMaxTeamsDefault > 0
? DeviceInfo.EnvMaxTeamsDefault
@@ -2021,6 +2028,11 @@
}
DP("Final %d num_groups and %d threadsPerGroup\n", num_groups,
threadsPerGroup);
+
+ launchVals res;
+ res.threadsPerGroup = threadsPerGroup;
+ res.num_groups = num_groups;
+ return res;
}
static uint64_t acquire_available_packet_id(hsa_queue_t *queue) {
@@ -2098,17 +2110,15 @@
/*
* Set limit based on ThreadsPerGroup and GroupsPerDevice
*/
- int num_groups = 0;
-
- int threadsPerGroup = RTLDeviceInfoTy::Default_WG_Size;
-
- getLaunchVals(threadsPerGroup, num_groups, KernelInfo->ConstWGSize,
- KernelInfo->ExecutionMode, DeviceInfo.EnvTeamLimit,
- DeviceInfo.EnvNumTeams,
- num_teams, // From run_region arg
- thread_limit, // From run_region arg
- loop_tripcount, // From run_region arg
- KernelInfo->device_id);
+ launchVals LV =
+ getLaunchVals(KernelInfo->ConstWGSize, KernelInfo->ExecutionMode,
+ DeviceInfo.EnvTeamLimit, DeviceInfo.EnvNumTeams,
+ num_teams, // From run_region arg
+ thread_limit, // From run_region arg
+ loop_tripcount, // From run_region arg
+ KernelInfo->device_id);
+ int num_groups = LV.num_groups;
+ int threadsPerGroup = LV.threadsPerGroup;
if (print_kernel_trace >= LAUNCH) {
// enum modes are SPMD, GENERIC, NONE 0,1,2
-------------- next part --------------
A non-text attachment was scrubbed...
Name: D105229.355683.patch
Type: text/x-patch
Size: 2594 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/openmp-commits/attachments/20210630/26acace4/attachment.bin>
More information about the Openmp-commits
mailing list