[Openmp-commits] [PATCH] D42686: [libomptarget] Only use CUDA Driver API
Jonas Hahnfeld via Phabricator via Openmp-commits
openmp-commits at lists.llvm.org
Tue Jan 30 06:56:40 PST 2018
Hahnfeld updated this revision to Diff 131965.
Hahnfeld marked 3 inline comments as done.
Hahnfeld added a comment.
Remove `assert`s.
https://reviews.llvm.org/D42686
Files:
libomptarget/plugins/cuda/src/rtl.cpp
Index: libomptarget/plugins/cuda/src/rtl.cpp
===================================================================
--- libomptarget/plugins/cuda/src/rtl.cpp
+++ libomptarget/plugins/cuda/src/rtl.cpp
@@ -14,7 +14,6 @@
#include <cassert>
#include <cstddef>
#include <cuda.h>
-#include <cuda_runtime_api.h>
#include <list>
#include <string>
#include <vector>
@@ -280,9 +279,9 @@
}
// scan properties to determine number of threads/block and blocks/grid.
- struct cudaDeviceProp Properties;
- cudaError_t error = cudaGetDeviceProperties(&Properties, device_id);
- if (error != cudaSuccess) {
+ CUdevprop Properties;
+ err = cuDeviceGetProperties(&Properties, cuDevice);
+ if (err != CUDA_SUCCESS) {
DP("Error getting device Properties, use defaults\n");
DeviceInfo.BlocksPerGrid[device_id] = RTLDeviceInfoTy::DefaultNumTeams;
DeviceInfo.ThreadsPerBlock[device_id] = RTLDeviceInfoTy::DefaultNumThreads;
@@ -314,8 +313,8 @@
RTLDeviceInfoTy::HardThreadLimit);
}
- // Get warp size
- DeviceInfo.WarpSize[device_id] = Properties.warpSize;
+ // According to the documentation, SIMDWidth is "Warp size in threads".
+ DeviceInfo.WarpSize[device_id] = Properties.SIMDWidth;
}
// Adjust teams to the env variables
@@ -678,17 +677,16 @@
if (err != CUDA_SUCCESS) {
DP("Device kernel launch failed!\n");
CUDA_ERR_STRING(err);
- assert(err == CUDA_SUCCESS && "Unable to launch target execution!");
return OFFLOAD_FAIL;
}
DP("Launch of entry point at " DPxMOD " successful!\n",
DPxPTR(tgt_entry_ptr));
- cudaError_t sync_error = cudaDeviceSynchronize();
- if (sync_error != cudaSuccess) {
- DP("Kernel execution error at " DPxMOD ", %s.\n", DPxPTR(tgt_entry_ptr),
- cudaGetErrorString(sync_error));
+ CUresult sync_err = cuCtxSynchronize();
+ if (sync_err != CUDA_SUCCESS) {
+ DP("Kernel execution error at " DPxMOD "!\n", DPxPTR(tgt_entry_ptr));
+ CUDA_ERR_STRING(sync_err);
return OFFLOAD_FAIL;
} else {
DP("Kernel execution at " DPxMOD " successful!\n", DPxPTR(tgt_entry_ptr));
-------------- next part --------------
A non-text attachment was scrubbed...
Name: D42686.131965.patch
Type: text/x-patch
Size: 2100 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/openmp-commits/attachments/20180130/a0bda7cd/attachment-0001.bin>
More information about the Openmp-commits
mailing list