[Openmp-commits] [PATCH] D73077: [libomptarget] Implement wavefront functions for amdgcn
Jon Chesterfield via Phabricator via Openmp-commits
openmp-commits at lists.llvm.org
Mon Jan 20 18:16:05 PST 2020
JonChesterfield created this revision.
JonChesterfield added reviewers: jdoerfert, ABataev, grokos.
Herald added subscribers: openmp-commits, jvesely.
Herald added a project: OpenMP.
JonChesterfield added a comment.
Fills in some of the unresolved symbols for amdgcn target_impl with intrinsic calls. This is somewhat architecture-specific, but that seems OK in this context.
[libomptarget] Implement wavefront functions for amdgcn
Repository:
rG LLVM Github Monorepo
https://reviews.llvm.org/D73077
Files:
openmp/libomptarget/deviceRTLs/amdgcn/src/target_impl.hip
Index: openmp/libomptarget/deviceRTLs/amdgcn/src/target_impl.hip
===================================================================
--- openmp/libomptarget/deviceRTLs/amdgcn/src/target_impl.hip
+++ openmp/libomptarget/deviceRTLs/amdgcn/src/target_impl.hip
@@ -12,6 +12,32 @@
#include "target_impl.h"
+// Implementations initially derived from hcc
+
+static DEVICE uint32_t getLaneId(void) {
+ return __builtin_amdgcn_mbcnt_hi(~0u, __builtin_amdgcn_mbcnt_lo(~0u, 0u));
+}
+
+// Returns a 64-bit mask of the lanes below the calling thread's lane number,
+// restricted to the lanes set in __kmpc_impl_activemask()
+DEVICE __kmpc_impl_lanemask_t __kmpc_impl_lanemask_lt() {
+ uint32_t lane = getLaneId();
+ int64_t ballot = __kmpc_impl_activemask();
+ uint64_t mask = ((uint64_t)1 << lane) - (uint64_t)1;
+ return mask & ballot;
+}
+
+// Returns a 64-bit mask of the lanes above the calling thread's lane number,
+// restricted to the lanes set in __kmpc_impl_activemask()
+DEVICE __kmpc_impl_lanemask_t __kmpc_impl_lanemask_gt() {
+ uint32_t lane = getLaneId();
+ if (lane == 63)
+ return 0;
+ uint64_t ballot = __kmpc_impl_activemask();
+ uint64_t mask = (~((uint64_t)0)) << (lane + 1);
+ return mask & ballot;
+}
+
DEVICE double __kmpc_impl_get_wtick() { return ((double)1E-9); }
EXTERN uint64_t __clock64();
@@ -19,6 +45,28 @@
return ((double)1.0 / 745000000.0) * __clock64();
}
+// warp vote function
+DEVICE __kmpc_impl_lanemask_t __kmpc_impl_activemask() {
+ // 33 is ICMP_NE from llvm/include/llvm/IR/InstrTypes.h
+ return __builtin_amdgcn_uicmp(1, 0, 33);
+}
+
+DEVICE int32_t __kmpc_impl_shfl_sync(__kmpc_impl_lanemask_t, int32_t var,
+ int32_t srcLane) {
+ int width = WARPSIZE;
+ int self = getLaneId();
+ int index = srcLane + (self & ~(width - 1));
+ return __builtin_amdgcn_ds_bpermute(index << 2, var);
+}
+
+DEVICE int32_t __kmpc_impl_shfl_down_sync(__kmpc_impl_lanemask_t, int32_t var,
+ uint32_t laneDelta, int32_t width) {
+ int self = getLaneId();
+ int index = self + laneDelta;
+ index = (int)(laneDelta + (self & (width - 1))) >= width ? self : index;
+ return __builtin_amdgcn_ds_bpermute(index << 2, var);
+}
+
EXTERN uint64_t __ockl_get_local_size(uint32_t);
EXTERN uint64_t __ockl_get_num_groups(uint32_t);
DEVICE int GetNumberOfBlocksInKernel() { return __ockl_get_num_groups(0); }
-------------- next part --------------
A non-text attachment was scrubbed...
Name: D73077.239221.patch
Type: text/x-patch
Size: 2378 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/openmp-commits/attachments/20200121/3546ef3d/attachment-0001.bin>
More information about the Openmp-commits
mailing list