[Openmp-commits] [openmp] r319970 - [libomptarget] Split device functionality
Jonas Hahnfeld via Openmp-commits
openmp-commits at lists.llvm.org
Wed Dec 6 13:59:10 PST 2017
Author: hahnfeld
Date: Wed Dec 6 13:59:09 2017
New Revision: 319970
URL: http://llvm.org/viewvc/llvm-project?rev=319970&view=rev
Log:
[libomptarget] Split device functionality
This is the second patch to split the current monolithic
implementation into separate files. Note that this change
doesn't cleanup the code yet.
Differential Revision: https://reviews.llvm.org/D40799
Added:
openmp/trunk/libomptarget/src/device.cpp
Modified:
openmp/trunk/libomptarget/src/CMakeLists.txt
openmp/trunk/libomptarget/src/device.h
openmp/trunk/libomptarget/src/omptarget.cpp
Modified: openmp/trunk/libomptarget/src/CMakeLists.txt
URL: http://llvm.org/viewvc/llvm-project/openmp/trunk/libomptarget/src/CMakeLists.txt?rev=319970&r1=319969&r2=319970&view=diff
==============================================================================
--- openmp/trunk/libomptarget/src/CMakeLists.txt (original)
+++ openmp/trunk/libomptarget/src/CMakeLists.txt Wed Dec 6 13:59:09 2017
@@ -14,6 +14,7 @@
libomptarget_say("Building offloading runtime library libomptarget.")
set(src_files
+ device.cpp
rtl.cpp
omptarget.cpp
)
Added: openmp/trunk/libomptarget/src/device.cpp
URL: http://llvm.org/viewvc/llvm-project/openmp/trunk/libomptarget/src/device.cpp?rev=319970&view=auto
==============================================================================
--- openmp/trunk/libomptarget/src/device.cpp (added)
+++ openmp/trunk/libomptarget/src/device.cpp Wed Dec 6 13:59:09 2017
@@ -0,0 +1,334 @@
+//===--------- device.cpp - Target independent OpenMP target RTL ----------===//
+//
+// The LLVM Compiler Infrastructure
+//
+// This file is dual licensed under the MIT and the University of Illinois Open
+// Source Licenses. See LICENSE.txt for details.
+//
+//===----------------------------------------------------------------------===//
+//
+// Functionality for managing devices that are handled by RTL plugins.
+//
+//===----------------------------------------------------------------------===//
+
+#include "device.h"
+#include "private.h"
+#include "rtl.h"
+
+#include <cassert>
+#include <climits>
+#include <string>
+
+/// Map between Device ID (i.e. openmp device id) and its DeviceTy.
+DevicesTy Devices;
+
+int DeviceTy::associatePtr(void *HstPtrBegin, void *TgtPtrBegin, int64_t Size) {
+ DataMapMtx.lock();
+
+ // Check if entry exists
+ for (auto &HT : HostDataToTargetMap) {
+ if ((uintptr_t)HstPtrBegin == HT.HstPtrBegin) {
+ // Mapping already exists
+ bool isValid = HT.HstPtrBegin == (uintptr_t) HstPtrBegin &&
+ HT.HstPtrEnd == (uintptr_t) HstPtrBegin + Size &&
+ HT.TgtPtrBegin == (uintptr_t) TgtPtrBegin;
+ DataMapMtx.unlock();
+ if (isValid) {
+ DP("Attempt to re-associate the same device ptr+offset with the same "
+ "host ptr, nothing to do\n");
+ return OFFLOAD_SUCCESS;
+ } else {
+ DP("Not allowed to re-associate a different device ptr+offset with the "
+ "same host ptr\n");
+ return OFFLOAD_FAIL;
+ }
+ }
+ }
+
+ // Mapping does not exist, allocate it
+ HostDataToTargetTy newEntry;
+
+ // Set up missing fields
+ newEntry.HstPtrBase = (uintptr_t) HstPtrBegin;
+ newEntry.HstPtrBegin = (uintptr_t) HstPtrBegin;
+ newEntry.HstPtrEnd = (uintptr_t) HstPtrBegin + Size;
+ newEntry.TgtPtrBegin = (uintptr_t) TgtPtrBegin;
+ // refCount must be infinite
+ newEntry.RefCount = INF_REF_CNT;
+
+ DP("Creating new map entry: HstBase=" DPxMOD ", HstBegin=" DPxMOD ", HstEnd="
+ DPxMOD ", TgtBegin=" DPxMOD "\n", DPxPTR(newEntry.HstPtrBase),
+ DPxPTR(newEntry.HstPtrBegin), DPxPTR(newEntry.HstPtrEnd),
+ DPxPTR(newEntry.TgtPtrBegin));
+ HostDataToTargetMap.push_front(newEntry);
+
+ DataMapMtx.unlock();
+
+ return OFFLOAD_SUCCESS;
+}
+
+int DeviceTy::disassociatePtr(void *HstPtrBegin) {
+ DataMapMtx.lock();
+
+ // Check if entry exists
+ for (HostDataToTargetListTy::iterator ii = HostDataToTargetMap.begin();
+ ii != HostDataToTargetMap.end(); ++ii) {
+ if ((uintptr_t)HstPtrBegin == ii->HstPtrBegin) {
+ // Mapping exists
+ if (CONSIDERED_INF(ii->RefCount)) {
+ DP("Association found, removing it\n");
+ HostDataToTargetMap.erase(ii);
+ DataMapMtx.unlock();
+ return OFFLOAD_SUCCESS;
+ } else {
+ DP("Trying to disassociate a pointer which was not mapped via "
+ "omp_target_associate_ptr\n");
+ break;
+ }
+ }
+ }
+
+ // Mapping not found
+ DataMapMtx.unlock();
+ DP("Association not found\n");
+ return OFFLOAD_FAIL;
+}
+
+// Get ref count of map entry containing HstPtrBegin
+long DeviceTy::getMapEntryRefCnt(void *HstPtrBegin) {
+ uintptr_t hp = (uintptr_t)HstPtrBegin;
+ long RefCnt = -1;
+
+ DataMapMtx.lock();
+ for (auto &HT : HostDataToTargetMap) {
+ if (hp >= HT.HstPtrBegin && hp < HT.HstPtrEnd) {
+ DP("DeviceTy::getMapEntry: requested entry found\n");
+ RefCnt = HT.RefCount;
+ break;
+ }
+ }
+ DataMapMtx.unlock();
+
+ if (RefCnt < 0) {
+ DP("DeviceTy::getMapEntry: requested entry not found\n");
+ }
+
+ return RefCnt;
+}
+
+LookupResult DeviceTy::lookupMapping(void *HstPtrBegin, int64_t Size) {
+ uintptr_t hp = (uintptr_t)HstPtrBegin;
+ LookupResult lr;
+
+ DP("Looking up mapping(HstPtrBegin=" DPxMOD ", Size=%ld)...\n", DPxPTR(hp),
+ Size);
+ for (lr.Entry = HostDataToTargetMap.begin();
+ lr.Entry != HostDataToTargetMap.end(); ++lr.Entry) {
+ auto &HT = *lr.Entry;
+ // Is it contained?
+ lr.Flags.IsContained = hp >= HT.HstPtrBegin && hp < HT.HstPtrEnd &&
+ (hp+Size) <= HT.HstPtrEnd;
+ // Does it extend into an already mapped region?
+ lr.Flags.ExtendsBefore = hp < HT.HstPtrBegin && (hp+Size) > HT.HstPtrBegin;
+ // Does it extend beyond the mapped region?
+ lr.Flags.ExtendsAfter = hp < HT.HstPtrEnd && (hp+Size) > HT.HstPtrEnd;
+
+ if (lr.Flags.IsContained || lr.Flags.ExtendsBefore ||
+ lr.Flags.ExtendsAfter) {
+ break;
+ }
+ }
+
+ if (lr.Flags.ExtendsBefore) {
+ DP("WARNING: Pointer is not mapped but section extends into already "
+ "mapped data\n");
+ }
+ if (lr.Flags.ExtendsAfter) {
+ DP("WARNING: Pointer is already mapped but section extends beyond mapped "
+ "region\n");
+ }
+
+ return lr;
+}
+
+// Used by target_data_begin
+// Return the target pointer begin (where the data will be moved).
+// Allocate memory if this is the first occurrence if this mapping.
+// Increment the reference counter.
+// If NULL is returned, then either data allocation failed or the user tried
+// to do an illegal mapping.
+void *DeviceTy::getOrAllocTgtPtr(void *HstPtrBegin, void *HstPtrBase,
+ int64_t Size, bool &IsNew, bool IsImplicit, bool UpdateRefCount) {
+ void *rc = NULL;
+ DataMapMtx.lock();
+ LookupResult lr = lookupMapping(HstPtrBegin, Size);
+
+ // Check if the pointer is contained.
+ if (lr.Flags.IsContained ||
+ ((lr.Flags.ExtendsBefore || lr.Flags.ExtendsAfter) && IsImplicit)) {
+ auto &HT = *lr.Entry;
+ IsNew = false;
+
+ if (UpdateRefCount)
+ ++HT.RefCount;
+
+ uintptr_t tp = HT.TgtPtrBegin + ((uintptr_t)HstPtrBegin - HT.HstPtrBegin);
+ DP("Mapping exists%s with HstPtrBegin=" DPxMOD ", TgtPtrBegin=" DPxMOD ", "
+ "Size=%ld,%s RefCount=%s\n", (IsImplicit ? " (implicit)" : ""),
+ DPxPTR(HstPtrBegin), DPxPTR(tp), Size,
+ (UpdateRefCount ? " updated" : ""),
+ (CONSIDERED_INF(HT.RefCount)) ? "INF" :
+ std::to_string(HT.RefCount).c_str());
+ rc = (void *)tp;
+ } else if ((lr.Flags.ExtendsBefore || lr.Flags.ExtendsAfter) && !IsImplicit) {
+ // Explicit extension of mapped data - not allowed.
+ DP("Explicit extension of mapping is not allowed.\n");
+ } else if (Size) {
+ // If it is not contained and Size > 0 we should create a new entry for it.
+ IsNew = true;
+ uintptr_t tp = (uintptr_t)RTL->data_alloc(RTLDeviceID, Size, HstPtrBegin);
+ DP("Creating new map entry: HstBase=" DPxMOD ", HstBegin=" DPxMOD ", "
+ "HstEnd=" DPxMOD ", TgtBegin=" DPxMOD "\n", DPxPTR(HstPtrBase),
+ DPxPTR(HstPtrBegin), DPxPTR((uintptr_t)HstPtrBegin + Size), DPxPTR(tp));
+ HostDataToTargetMap.push_front(HostDataToTargetTy((uintptr_t)HstPtrBase,
+ (uintptr_t)HstPtrBegin, (uintptr_t)HstPtrBegin + Size, tp));
+ rc = (void *)tp;
+ }
+
+ DataMapMtx.unlock();
+ return rc;
+}
+
+// Used by target_data_begin, target_data_end, target_data_update and target.
+// Return the target pointer begin (where the data will be moved).
+// Decrement the reference counter if called from target_data_end.
+void *DeviceTy::getTgtPtrBegin(void *HstPtrBegin, int64_t Size, bool &IsLast,
+ bool UpdateRefCount) {
+ void *rc = NULL;
+ DataMapMtx.lock();
+ LookupResult lr = lookupMapping(HstPtrBegin, Size);
+
+ if (lr.Flags.IsContained || lr.Flags.ExtendsBefore || lr.Flags.ExtendsAfter) {
+ auto &HT = *lr.Entry;
+ IsLast = !(HT.RefCount > 1);
+
+ if (HT.RefCount > 1 && UpdateRefCount)
+ --HT.RefCount;
+
+ uintptr_t tp = HT.TgtPtrBegin + ((uintptr_t)HstPtrBegin - HT.HstPtrBegin);
+ DP("Mapping exists with HstPtrBegin=" DPxMOD ", TgtPtrBegin=" DPxMOD ", "
+ "Size=%ld,%s RefCount=%s\n", DPxPTR(HstPtrBegin), DPxPTR(tp), Size,
+ (UpdateRefCount ? " updated" : ""),
+ (CONSIDERED_INF(HT.RefCount)) ? "INF" :
+ std::to_string(HT.RefCount).c_str());
+ rc = (void *)tp;
+ } else {
+ IsLast = false;
+ }
+
+ DataMapMtx.unlock();
+ return rc;
+}
+
+// Return the target pointer begin (where the data will be moved).
+// Lock-free version called when loading global symbols from the fat binary.
+void *DeviceTy::getTgtPtrBegin(void *HstPtrBegin, int64_t Size) {
+ uintptr_t hp = (uintptr_t)HstPtrBegin;
+ LookupResult lr = lookupMapping(HstPtrBegin, Size);
+ if (lr.Flags.IsContained || lr.Flags.ExtendsBefore || lr.Flags.ExtendsAfter) {
+ auto &HT = *lr.Entry;
+ uintptr_t tp = HT.TgtPtrBegin + (hp - HT.HstPtrBegin);
+ return (void *)tp;
+ }
+
+ return NULL;
+}
+
+int DeviceTy::deallocTgtPtr(void *HstPtrBegin, int64_t Size, bool ForceDelete) {
+ // Check if the pointer is contained in any sub-nodes.
+ int rc;
+ DataMapMtx.lock();
+ LookupResult lr = lookupMapping(HstPtrBegin, Size);
+ if (lr.Flags.IsContained || lr.Flags.ExtendsBefore || lr.Flags.ExtendsAfter) {
+ auto &HT = *lr.Entry;
+ if (ForceDelete)
+ HT.RefCount = 1;
+ if (--HT.RefCount <= 0) {
+ assert(HT.RefCount == 0 && "did not expect a negative ref count");
+ DP("Deleting tgt data " DPxMOD " of size %ld\n",
+ DPxPTR(HT.TgtPtrBegin), Size);
+ RTL->data_delete(RTLDeviceID, (void *)HT.TgtPtrBegin);
+ DP("Removing%s mapping with HstPtrBegin=" DPxMOD ", TgtPtrBegin=" DPxMOD
+ ", Size=%ld\n", (ForceDelete ? " (forced)" : ""),
+ DPxPTR(HT.HstPtrBegin), DPxPTR(HT.TgtPtrBegin), Size);
+ HostDataToTargetMap.erase(lr.Entry);
+ }
+ rc = OFFLOAD_SUCCESS;
+ } else {
+ DP("Section to delete (hst addr " DPxMOD ") does not exist in the allocated"
+ " memory\n", DPxPTR(HstPtrBegin));
+ rc = OFFLOAD_FAIL;
+ }
+
+ DataMapMtx.unlock();
+ return rc;
+}
+
+/// Init device, should not be called directly.
+void DeviceTy::init() {
+ int32_t rc = RTL->init_device(RTLDeviceID);
+ if (rc == OFFLOAD_SUCCESS) {
+ IsInit = true;
+ }
+}
+
+/// Thread-safe method to initialize the device only once.
+int32_t DeviceTy::initOnce() {
+ std::call_once(InitFlag, &DeviceTy::init, this);
+
+ // At this point, if IsInit is true, then either this thread or some other
+ // thread in the past successfully initialized the device, so we can return
+ // OFFLOAD_SUCCESS. If this thread executed init() via call_once() and it
+ // failed, return OFFLOAD_FAIL. If call_once did not invoke init(), it means
+ // that some other thread already attempted to execute init() and if IsInit
+ // is still false, return OFFLOAD_FAIL.
+ if (IsInit)
+ return OFFLOAD_SUCCESS;
+ else
+ return OFFLOAD_FAIL;
+}
+
+// Load binary to device.
+__tgt_target_table *DeviceTy::load_binary(void *Img) {
+ RTL->Mtx.lock();
+ __tgt_target_table *rc = RTL->load_binary(RTLDeviceID, Img);
+ RTL->Mtx.unlock();
+ return rc;
+}
+
+// Submit data to device.
+int32_t DeviceTy::data_submit(void *TgtPtrBegin, void *HstPtrBegin,
+ int64_t Size) {
+ return RTL->data_submit(RTLDeviceID, TgtPtrBegin, HstPtrBegin, Size);
+}
+
+// Retrieve data from device.
+int32_t DeviceTy::data_retrieve(void *HstPtrBegin, void *TgtPtrBegin,
+ int64_t Size) {
+ return RTL->data_retrieve(RTLDeviceID, HstPtrBegin, TgtPtrBegin, Size);
+}
+
+// Run region on device
+int32_t DeviceTy::run_region(void *TgtEntryPtr, void **TgtVarsPtr,
+ ptrdiff_t *TgtOffsets, int32_t TgtVarsSize) {
+ return RTL->run_region(RTLDeviceID, TgtEntryPtr, TgtVarsPtr, TgtOffsets,
+ TgtVarsSize);
+}
+
+// Run team region on device.
+int32_t DeviceTy::run_team_region(void *TgtEntryPtr, void **TgtVarsPtr,
+ ptrdiff_t *TgtOffsets, int32_t TgtVarsSize, int32_t NumTeams,
+ int32_t ThreadLimit, uint64_t LoopTripCount) {
+ return RTL->run_team_region(RTLDeviceID, TgtEntryPtr, TgtVarsPtr, TgtOffsets,
+ TgtVarsSize, NumTeams, ThreadLimit, LoopTripCount);
+}
Modified: openmp/trunk/libomptarget/src/device.h
URL: http://llvm.org/viewvc/llvm-project/openmp/trunk/libomptarget/src/device.h?rev=319970&r1=319969&r2=319970&view=diff
==============================================================================
--- openmp/trunk/libomptarget/src/device.h (original)
+++ openmp/trunk/libomptarget/src/device.h Wed Dec 6 13:59:09 2017
@@ -15,6 +15,7 @@
#define _OMPTARGET_DEVICE_H
#include <cstddef>
+#include <climits>
#include <list>
#include <map>
#include <mutex>
@@ -25,6 +26,9 @@ struct RTLInfoTy;
struct __tgt_bin_desc;
struct __tgt_target_table;
+#define INF_REF_CNT (LONG_MAX>>1) // leave room for additions/subtractions
+#define CONSIDERED_INF(x) (x > (INF_REF_CNT>>1))
+
/// Map between host data and target data.
struct HostDataToTargetTy {
uintptr_t HstPtrBase; // host info.
Modified: openmp/trunk/libomptarget/src/omptarget.cpp
URL: http://llvm.org/viewvc/llvm-project/openmp/trunk/libomptarget/src/omptarget.cpp?rev=319970&r1=319969&r2=319970&view=diff
==============================================================================
--- openmp/trunk/libomptarget/src/omptarget.cpp (original)
+++ openmp/trunk/libomptarget/src/omptarget.cpp Wed Dec 6 13:59:09 2017
@@ -21,19 +21,12 @@
#include <cassert>
#include <climits>
#include <cstring>
-#include <string>
#include <vector>
#ifdef OMPTARGET_DEBUG
int DebugLevel = 0;
#endif // OMPTARGET_DEBUG
-#define INF_REF_CNT (LONG_MAX>>1) // leave room for additions/subtractions
-#define CONSIDERED_INF(x) (x > (INF_REF_CNT>>1))
-
-/// Map between Device ID (i.e. openmp device id) and its DeviceTy.
-DevicesTy Devices;
-
/// Check whether a device has an associated RTL and initialize it if it's not
/// already initialized.
static bool device_is_ready(int device_num) {
@@ -330,320 +323,6 @@ EXTERN int omp_target_disassociate_ptr(v
}
////////////////////////////////////////////////////////////////////////////////
-// functionality for device
-
-int DeviceTy::associatePtr(void *HstPtrBegin, void *TgtPtrBegin, int64_t Size) {
- DataMapMtx.lock();
-
- // Check if entry exists
- for (auto &HT : HostDataToTargetMap) {
- if ((uintptr_t)HstPtrBegin == HT.HstPtrBegin) {
- // Mapping already exists
- bool isValid = HT.HstPtrBegin == (uintptr_t) HstPtrBegin &&
- HT.HstPtrEnd == (uintptr_t) HstPtrBegin + Size &&
- HT.TgtPtrBegin == (uintptr_t) TgtPtrBegin;
- DataMapMtx.unlock();
- if (isValid) {
- DP("Attempt to re-associate the same device ptr+offset with the same "
- "host ptr, nothing to do\n");
- return OFFLOAD_SUCCESS;
- } else {
- DP("Not allowed to re-associate a different device ptr+offset with the "
- "same host ptr\n");
- return OFFLOAD_FAIL;
- }
- }
- }
-
- // Mapping does not exist, allocate it
- HostDataToTargetTy newEntry;
-
- // Set up missing fields
- newEntry.HstPtrBase = (uintptr_t) HstPtrBegin;
- newEntry.HstPtrBegin = (uintptr_t) HstPtrBegin;
- newEntry.HstPtrEnd = (uintptr_t) HstPtrBegin + Size;
- newEntry.TgtPtrBegin = (uintptr_t) TgtPtrBegin;
- // refCount must be infinite
- newEntry.RefCount = INF_REF_CNT;
-
- DP("Creating new map entry: HstBase=" DPxMOD ", HstBegin=" DPxMOD ", HstEnd="
- DPxMOD ", TgtBegin=" DPxMOD "\n", DPxPTR(newEntry.HstPtrBase),
- DPxPTR(newEntry.HstPtrBegin), DPxPTR(newEntry.HstPtrEnd),
- DPxPTR(newEntry.TgtPtrBegin));
- HostDataToTargetMap.push_front(newEntry);
-
- DataMapMtx.unlock();
-
- return OFFLOAD_SUCCESS;
-}
-
-int DeviceTy::disassociatePtr(void *HstPtrBegin) {
- DataMapMtx.lock();
-
- // Check if entry exists
- for (HostDataToTargetListTy::iterator ii = HostDataToTargetMap.begin();
- ii != HostDataToTargetMap.end(); ++ii) {
- if ((uintptr_t)HstPtrBegin == ii->HstPtrBegin) {
- // Mapping exists
- if (CONSIDERED_INF(ii->RefCount)) {
- DP("Association found, removing it\n");
- HostDataToTargetMap.erase(ii);
- DataMapMtx.unlock();
- return OFFLOAD_SUCCESS;
- } else {
- DP("Trying to disassociate a pointer which was not mapped via "
- "omp_target_associate_ptr\n");
- break;
- }
- }
- }
-
- // Mapping not found
- DataMapMtx.unlock();
- DP("Association not found\n");
- return OFFLOAD_FAIL;
-}
-
-// Get ref count of map entry containing HstPtrBegin
-long DeviceTy::getMapEntryRefCnt(void *HstPtrBegin) {
- uintptr_t hp = (uintptr_t)HstPtrBegin;
- long RefCnt = -1;
-
- DataMapMtx.lock();
- for (auto &HT : HostDataToTargetMap) {
- if (hp >= HT.HstPtrBegin && hp < HT.HstPtrEnd) {
- DP("DeviceTy::getMapEntry: requested entry found\n");
- RefCnt = HT.RefCount;
- break;
- }
- }
- DataMapMtx.unlock();
-
- if (RefCnt < 0) {
- DP("DeviceTy::getMapEntry: requested entry not found\n");
- }
-
- return RefCnt;
-}
-
-LookupResult DeviceTy::lookupMapping(void *HstPtrBegin, int64_t Size) {
- uintptr_t hp = (uintptr_t)HstPtrBegin;
- LookupResult lr;
-
- DP("Looking up mapping(HstPtrBegin=" DPxMOD ", Size=%ld)...\n", DPxPTR(hp),
- Size);
- for (lr.Entry = HostDataToTargetMap.begin();
- lr.Entry != HostDataToTargetMap.end(); ++lr.Entry) {
- auto &HT = *lr.Entry;
- // Is it contained?
- lr.Flags.IsContained = hp >= HT.HstPtrBegin && hp < HT.HstPtrEnd &&
- (hp+Size) <= HT.HstPtrEnd;
- // Does it extend into an already mapped region?
- lr.Flags.ExtendsBefore = hp < HT.HstPtrBegin && (hp+Size) > HT.HstPtrBegin;
- // Does it extend beyond the mapped region?
- lr.Flags.ExtendsAfter = hp < HT.HstPtrEnd && (hp+Size) > HT.HstPtrEnd;
-
- if (lr.Flags.IsContained || lr.Flags.ExtendsBefore ||
- lr.Flags.ExtendsAfter) {
- break;
- }
- }
-
- if (lr.Flags.ExtendsBefore) {
- DP("WARNING: Pointer is not mapped but section extends into already "
- "mapped data\n");
- }
- if (lr.Flags.ExtendsAfter) {
- DP("WARNING: Pointer is already mapped but section extends beyond mapped "
- "region\n");
- }
-
- return lr;
-}
-
-// Used by target_data_begin
-// Return the target pointer begin (where the data will be moved).
-// Allocate memory if this is the first occurrence if this mapping.
-// Increment the reference counter.
-// If NULL is returned, then either data allocation failed or the user tried
-// to do an illegal mapping.
-void *DeviceTy::getOrAllocTgtPtr(void *HstPtrBegin, void *HstPtrBase,
- int64_t Size, bool &IsNew, bool IsImplicit, bool UpdateRefCount) {
- void *rc = NULL;
- DataMapMtx.lock();
- LookupResult lr = lookupMapping(HstPtrBegin, Size);
-
- // Check if the pointer is contained.
- if (lr.Flags.IsContained ||
- ((lr.Flags.ExtendsBefore || lr.Flags.ExtendsAfter) && IsImplicit)) {
- auto &HT = *lr.Entry;
- IsNew = false;
-
- if (UpdateRefCount)
- ++HT.RefCount;
-
- uintptr_t tp = HT.TgtPtrBegin + ((uintptr_t)HstPtrBegin - HT.HstPtrBegin);
- DP("Mapping exists%s with HstPtrBegin=" DPxMOD ", TgtPtrBegin=" DPxMOD ", "
- "Size=%ld,%s RefCount=%s\n", (IsImplicit ? " (implicit)" : ""),
- DPxPTR(HstPtrBegin), DPxPTR(tp), Size,
- (UpdateRefCount ? " updated" : ""),
- (CONSIDERED_INF(HT.RefCount)) ? "INF" :
- std::to_string(HT.RefCount).c_str());
- rc = (void *)tp;
- } else if ((lr.Flags.ExtendsBefore || lr.Flags.ExtendsAfter) && !IsImplicit) {
- // Explicit extension of mapped data - not allowed.
- DP("Explicit extension of mapping is not allowed.\n");
- } else if (Size) {
- // If it is not contained and Size > 0 we should create a new entry for it.
- IsNew = true;
- uintptr_t tp = (uintptr_t)RTL->data_alloc(RTLDeviceID, Size, HstPtrBegin);
- DP("Creating new map entry: HstBase=" DPxMOD ", HstBegin=" DPxMOD ", "
- "HstEnd=" DPxMOD ", TgtBegin=" DPxMOD "\n", DPxPTR(HstPtrBase),
- DPxPTR(HstPtrBegin), DPxPTR((uintptr_t)HstPtrBegin + Size), DPxPTR(tp));
- HostDataToTargetMap.push_front(HostDataToTargetTy((uintptr_t)HstPtrBase,
- (uintptr_t)HstPtrBegin, (uintptr_t)HstPtrBegin + Size, tp));
- rc = (void *)tp;
- }
-
- DataMapMtx.unlock();
- return rc;
-}
-
-// Used by target_data_begin, target_data_end, target_data_update and target.
-// Return the target pointer begin (where the data will be moved).
-// Decrement the reference counter if called from target_data_end.
-void *DeviceTy::getTgtPtrBegin(void *HstPtrBegin, int64_t Size, bool &IsLast,
- bool UpdateRefCount) {
- void *rc = NULL;
- DataMapMtx.lock();
- LookupResult lr = lookupMapping(HstPtrBegin, Size);
-
- if (lr.Flags.IsContained || lr.Flags.ExtendsBefore || lr.Flags.ExtendsAfter) {
- auto &HT = *lr.Entry;
- IsLast = !(HT.RefCount > 1);
-
- if (HT.RefCount > 1 && UpdateRefCount)
- --HT.RefCount;
-
- uintptr_t tp = HT.TgtPtrBegin + ((uintptr_t)HstPtrBegin - HT.HstPtrBegin);
- DP("Mapping exists with HstPtrBegin=" DPxMOD ", TgtPtrBegin=" DPxMOD ", "
- "Size=%ld,%s RefCount=%s\n", DPxPTR(HstPtrBegin), DPxPTR(tp), Size,
- (UpdateRefCount ? " updated" : ""),
- (CONSIDERED_INF(HT.RefCount)) ? "INF" :
- std::to_string(HT.RefCount).c_str());
- rc = (void *)tp;
- } else {
- IsLast = false;
- }
-
- DataMapMtx.unlock();
- return rc;
-}
-
-// Return the target pointer begin (where the data will be moved).
-// Lock-free version called when loading global symbols from the fat binary.
-void *DeviceTy::getTgtPtrBegin(void *HstPtrBegin, int64_t Size) {
- uintptr_t hp = (uintptr_t)HstPtrBegin;
- LookupResult lr = lookupMapping(HstPtrBegin, Size);
- if (lr.Flags.IsContained || lr.Flags.ExtendsBefore || lr.Flags.ExtendsAfter) {
- auto &HT = *lr.Entry;
- uintptr_t tp = HT.TgtPtrBegin + (hp - HT.HstPtrBegin);
- return (void *)tp;
- }
-
- return NULL;
-}
-
-int DeviceTy::deallocTgtPtr(void *HstPtrBegin, int64_t Size, bool ForceDelete) {
- // Check if the pointer is contained in any sub-nodes.
- int rc;
- DataMapMtx.lock();
- LookupResult lr = lookupMapping(HstPtrBegin, Size);
- if (lr.Flags.IsContained || lr.Flags.ExtendsBefore || lr.Flags.ExtendsAfter) {
- auto &HT = *lr.Entry;
- if (ForceDelete)
- HT.RefCount = 1;
- if (--HT.RefCount <= 0) {
- assert(HT.RefCount == 0 && "did not expect a negative ref count");
- DP("Deleting tgt data " DPxMOD " of size %ld\n",
- DPxPTR(HT.TgtPtrBegin), Size);
- RTL->data_delete(RTLDeviceID, (void *)HT.TgtPtrBegin);
- DP("Removing%s mapping with HstPtrBegin=" DPxMOD ", TgtPtrBegin=" DPxMOD
- ", Size=%ld\n", (ForceDelete ? " (forced)" : ""),
- DPxPTR(HT.HstPtrBegin), DPxPTR(HT.TgtPtrBegin), Size);
- HostDataToTargetMap.erase(lr.Entry);
- }
- rc = OFFLOAD_SUCCESS;
- } else {
- DP("Section to delete (hst addr " DPxMOD ") does not exist in the allocated"
- " memory\n", DPxPTR(HstPtrBegin));
- rc = OFFLOAD_FAIL;
- }
-
- DataMapMtx.unlock();
- return rc;
-}
-
-/// Init device, should not be called directly.
-void DeviceTy::init() {
- int32_t rc = RTL->init_device(RTLDeviceID);
- if (rc == OFFLOAD_SUCCESS) {
- IsInit = true;
- }
-}
-
-/// Thread-safe method to initialize the device only once.
-int32_t DeviceTy::initOnce() {
- std::call_once(InitFlag, &DeviceTy::init, this);
-
- // At this point, if IsInit is true, then either this thread or some other
- // thread in the past successfully initialized the device, so we can return
- // OFFLOAD_SUCCESS. If this thread executed init() via call_once() and it
- // failed, return OFFLOAD_FAIL. If call_once did not invoke init(), it means
- // that some other thread already attempted to execute init() and if IsInit
- // is still false, return OFFLOAD_FAIL.
- if (IsInit)
- return OFFLOAD_SUCCESS;
- else
- return OFFLOAD_FAIL;
-}
-
-// Load binary to device.
-__tgt_target_table *DeviceTy::load_binary(void *Img) {
- RTL->Mtx.lock();
- __tgt_target_table *rc = RTL->load_binary(RTLDeviceID, Img);
- RTL->Mtx.unlock();
- return rc;
-}
-
-// Submit data to device.
-int32_t DeviceTy::data_submit(void *TgtPtrBegin, void *HstPtrBegin,
- int64_t Size) {
- return RTL->data_submit(RTLDeviceID, TgtPtrBegin, HstPtrBegin, Size);
-}
-
-// Retrieve data from device.
-int32_t DeviceTy::data_retrieve(void *HstPtrBegin, void *TgtPtrBegin,
- int64_t Size) {
- return RTL->data_retrieve(RTLDeviceID, HstPtrBegin, TgtPtrBegin, Size);
-}
-
-// Run region on device
-int32_t DeviceTy::run_region(void *TgtEntryPtr, void **TgtVarsPtr,
- ptrdiff_t *TgtOffsets, int32_t TgtVarsSize) {
- return RTL->run_region(RTLDeviceID, TgtEntryPtr, TgtVarsPtr, TgtOffsets,
- TgtVarsSize);
-}
-
-// Run team region on device.
-int32_t DeviceTy::run_team_region(void *TgtEntryPtr, void **TgtVarsPtr,
- ptrdiff_t *TgtOffsets, int32_t TgtVarsSize, int32_t NumTeams,
- int32_t ThreadLimit, uint64_t LoopTripCount) {
- return RTL->run_team_region(RTLDeviceID, TgtEntryPtr, TgtVarsPtr, TgtOffsets,
- TgtVarsSize, NumTeams, ThreadLimit, LoopTripCount);
-}
-
-////////////////////////////////////////////////////////////////////////////////
/// adds a target shared library to the target execution image
EXTERN void __tgt_register_lib(__tgt_bin_desc *desc) {
RTLs.RegisterLib(desc);
More information about the Openmp-commits
mailing list