[clang] [llvm] [OpenMP] Adds omp_target_is_accessible routine (PR #138294)
Nicole Aschenbrenner via cfe-commits
cfe-commits at lists.llvm.org
Tue Oct 21 23:45:30 PDT 2025
https://github.com/nicebert updated https://github.com/llvm/llvm-project/pull/138294
>From 025d36ef4386bf017e3a8db4f42076a6350ff4ff Mon Sep 17 00:00:00 2001
From: Nicole Aschenbrenner <nicole.aschenbrenner at amd.com>
Date: Fri, 2 May 2025 09:58:23 -0400
Subject: [PATCH 01/18] [OpenMP] Adds omp_target_is_accessible routine
Adds implementation of omp_target_is_accessible routine with
5.1 behaviour, checking if a host pointer is acccessible from a device
without running on the device (from the host).
---
clang/docs/OpenMPSupport.rst | 2 +-
offload/include/device.h | 3 ++
offload/include/omptarget.h | 1 +
offload/libomptarget/OpenMP/API.cpp | 45 ++++++++++++++++++-
offload/libomptarget/device.cpp | 4 ++
offload/libomptarget/exports | 1 +
offload/plugins-nextgen/amdgpu/src/rtl.cpp | 2 +
.../common/include/PluginInterface.h | 7 +++
.../common/src/PluginInterface.cpp | 8 ++++
offload/test/mapping/is_accessible.cpp | 40 +++++++++++++++++
10 files changed, 111 insertions(+), 2 deletions(-)
create mode 100644 offload/test/mapping/is_accessible.cpp
diff --git a/clang/docs/OpenMPSupport.rst b/clang/docs/OpenMPSupport.rst
index 58cd10ad4d8fa..838d329041baa 100644
--- a/clang/docs/OpenMPSupport.rst
+++ b/clang/docs/OpenMPSupport.rst
@@ -256,7 +256,7 @@ implementation.
+------------------------------+--------------------------------------------------------------+--------------------------+-----------------------------------------------------------------------+
| device | device-specific environment variables | :none:`unclaimed` | |
+------------------------------+--------------------------------------------------------------+--------------------------+-----------------------------------------------------------------------+
-| device | omp_target_is_accessible routine | :none:`unclaimed` | |
+| device | omp_target_is_accessible routine | :part:`worked on` | https://github.com/llvm/llvm-project/pull/138294 |
+------------------------------+--------------------------------------------------------------+--------------------------+-----------------------------------------------------------------------+
| device | omp_get_mapped_ptr routine | :good:`done` | D141545 |
+------------------------------+--------------------------------------------------------------+--------------------------+-----------------------------------------------------------------------+
diff --git a/offload/include/device.h b/offload/include/device.h
index f4b10abbaa3fd..c82d947de6891 100644
--- a/offload/include/device.h
+++ b/offload/include/device.h
@@ -152,6 +152,9 @@ struct DeviceTy {
/// Ask the device whether the runtime should use auto zero-copy.
bool useAutoZeroCopy();
+ /// Ask the device whether it supports unified memory.
+ bool supportsUnifiedMemory();
+
/// Check if there are pending images for this device.
bool hasPendingImages() const { return HasPendingImages; }
diff --git a/offload/include/omptarget.h b/offload/include/omptarget.h
index 6971780c7bdb5..8af8c4f659b35 100644
--- a/offload/include/omptarget.h
+++ b/offload/include/omptarget.h
@@ -280,6 +280,7 @@ int omp_get_initial_device(void);
void *omp_target_alloc(size_t Size, int DeviceNum);
void omp_target_free(void *DevicePtr, int DeviceNum);
int omp_target_is_present(const void *Ptr, int DeviceNum);
+int omp_target_is_accessible(const void *Ptr, size_t Size, int DeviceNum);
int omp_target_memcpy(void *Dst, const void *Src, size_t Length,
size_t DstOffset, size_t SrcOffset, int DstDevice,
int SrcDevice);
diff --git a/offload/libomptarget/OpenMP/API.cpp b/offload/libomptarget/OpenMP/API.cpp
index 4576f9bd06121..3ad54220c1135 100644
--- a/offload/libomptarget/OpenMP/API.cpp
+++ b/offload/libomptarget/OpenMP/API.cpp
@@ -93,7 +93,8 @@ EXTERN int omp_get_device_num(void) {
EXTERN int omp_get_initial_device(void) {
TIMESCOPE();
OMPT_IF_BUILT(ReturnAddressSetterRAII RA(__builtin_return_address(0)));
- int HostDevice = omp_get_num_devices();
+ int NumDevices = omp_get_num_devices();
+ int HostDevice = NumDevices == 0 ? -1 : NumDevices;
DP("Call to omp_get_initial_device returning %d\n", HostDevice);
return HostDevice;
}
@@ -195,6 +196,48 @@ EXTERN int omp_target_is_present(const void *Ptr, int DeviceNum) {
return Rc;
}
+/// Check whether a pointer is accessible from a device.
+/// the functionality is available in OpenMP 5.1 and later
+/// OpenMP 5.1
+/// omp_target_is_accessible checks whether a host pointer is accessible from a
+/// device OpenMP 6.0 removes restriction on pointer, allowing any pointer
+/// interpreted as a pointer in the address space of the given device.
+EXTERN int omp_target_is_accessible(const void *Ptr, size_t Size,
+ int DeviceNum) {
+ TIMESCOPE();
+ OMPT_IF_BUILT(ReturnAddressSetterRAII RA(__builtin_return_address(0)));
+ DP("Call to omp_target_is_accessible for device %d, address " DPxMOD
+ ", size %zu\n",
+ DeviceNum, DPxPTR(Ptr), Size);
+
+ if (!Ptr) {
+ DP("Call to omp_target_is_accessible with NULL ptr returning false\n");
+ return false;
+ }
+
+ if (DeviceNum == omp_get_initial_device()) {
+ DP("Call to omp_target_is_accessible on host, returning true\n");
+ return true;
+ }
+
+ // the device number must refer to a valid device
+ auto DeviceOrErr = PM->getDevice(DeviceNum);
+ if (!DeviceOrErr)
+ FATAL_MESSAGE(DeviceNum, "%s", toString(DeviceOrErr.takeError()).c_str());
+
+ // for OpenMP 5.1 the routine checks whether a host pointer is accessible from
+ // the device this requires for the device to support unified shared memory
+ if (DeviceOrErr->supportsUnifiedMemory()) {
+ DP("Device %d supports unified memory, returning true\n", DeviceNum);
+ return true;
+ }
+
+ // functionality to check whether a device pointer is accessible from a device
+ // (OpenMP 6.0) from the host might not be possible
+ DP("Device %d does not support unified memory, returning false\n", DeviceNum);
+ return false;
+}
+
EXTERN int omp_target_memcpy(void *Dst, const void *Src, size_t Length,
size_t DstOffset, size_t SrcOffset, int DstDevice,
int SrcDevice) {
diff --git a/offload/libomptarget/device.cpp b/offload/libomptarget/device.cpp
index f88e30ae9e76b..584c967c1a178 100644
--- a/offload/libomptarget/device.cpp
+++ b/offload/libomptarget/device.cpp
@@ -281,3 +281,7 @@ bool DeviceTy::useAutoZeroCopy() {
return false;
return RTL->use_auto_zero_copy(RTLDeviceID);
}
+
+bool DeviceTy::supportsUnifiedMemory() {
+ return RTL->supports_unified_memory(RTLDeviceID);
+}
diff --git a/offload/libomptarget/exports b/offload/libomptarget/exports
index 2406776c1fb5f..94be34b2fbf77 100644
--- a/offload/libomptarget/exports
+++ b/offload/libomptarget/exports
@@ -42,6 +42,7 @@ VERS1.0 {
omp_get_initial_device;
omp_target_alloc;
omp_target_free;
+ omp_target_is_accessible;
omp_target_is_present;
omp_target_memcpy;
omp_target_memcpy_rect;
diff --git a/offload/plugins-nextgen/amdgpu/src/rtl.cpp b/offload/plugins-nextgen/amdgpu/src/rtl.cpp
index f8db9bf0ae739..bdccb988e8d9e 100644
--- a/offload/plugins-nextgen/amdgpu/src/rtl.cpp
+++ b/offload/plugins-nextgen/amdgpu/src/rtl.cpp
@@ -2821,6 +2821,8 @@ struct AMDGPUDeviceTy : public GenericDeviceTy, AMDGenericDeviceTy {
return ((IsAPU || OMPX_ApuMaps) && IsXnackEnabled);
}
+ bool supportsUnifiedMemoryImpl() override { return IsXnackEnabled; }
+
/// Getters and setters for stack and heap sizes.
Error getDeviceStackSize(uint64_t &Value) override {
Value = StackSize;
diff --git a/offload/plugins-nextgen/common/include/PluginInterface.h b/offload/plugins-nextgen/common/include/PluginInterface.h
index 8c17a2ee07047..d0c350c2cf50b 100644
--- a/offload/plugins-nextgen/common/include/PluginInterface.h
+++ b/offload/plugins-nextgen/common/include/PluginInterface.h
@@ -1003,6 +1003,10 @@ struct GenericDeviceTy : public DeviceAllocatorTy {
bool useAutoZeroCopy();
virtual bool useAutoZeroCopyImpl() { return false; }
+ /// Returns true if the device has unified memory capabilities
+ bool supportsUnifiedMemory();
+ virtual bool supportsUnifiedMemoryImpl() { return false; }
+
/// Allocate and construct a kernel object.
virtual Expected<GenericKernelTy &> constructKernel(const char *Name) = 0;
@@ -1402,6 +1406,9 @@ struct GenericPluginTy {
/// Returns if the plugin can support automatic copy.
int32_t use_auto_zero_copy(int32_t DeviceId);
+ /// Returns if the the device supports unified memory.
+ int32_t supports_unified_memory(int32_t DeviceId);
+
/// Look up a global symbol in the given binary.
int32_t get_global(__tgt_device_binary Binary, uint64_t Size,
const char *Name, void **DevicePtr);
diff --git a/offload/plugins-nextgen/common/src/PluginInterface.cpp b/offload/plugins-nextgen/common/src/PluginInterface.cpp
index 94a050b559efe..315c522e7dccb 100644
--- a/offload/plugins-nextgen/common/src/PluginInterface.cpp
+++ b/offload/plugins-nextgen/common/src/PluginInterface.cpp
@@ -1629,6 +1629,10 @@ Error GenericDeviceTy::syncEvent(void *EventPtr) {
bool GenericDeviceTy::useAutoZeroCopy() { return useAutoZeroCopyImpl(); }
+bool GenericDeviceTy::supportsUnifiedMemory() {
+ return supportsUnifiedMemoryImpl();
+}
+
Error GenericPluginTy::init() {
if (Initialized)
return Plugin::success();
@@ -2181,6 +2185,10 @@ int32_t GenericPluginTy::use_auto_zero_copy(int32_t DeviceId) {
return getDevice(DeviceId).useAutoZeroCopy();
}
+int32_t GenericPluginTy::supports_unified_memory(int32_t DeviceId) {
+ return getDevice(DeviceId).supportsUnifiedMemory();
+}
+
int32_t GenericPluginTy::get_global(__tgt_device_binary Binary, uint64_t Size,
const char *Name, void **DevicePtr) {
assert(Binary.handle && "Invalid device binary handle");
diff --git a/offload/test/mapping/is_accessible.cpp b/offload/test/mapping/is_accessible.cpp
new file mode 100644
index 0000000000000..6d6a0048e01f3
--- /dev/null
+++ b/offload/test/mapping/is_accessible.cpp
@@ -0,0 +1,40 @@
+// RUN: %libomptarget-compilexx-generic
+// RUN: env HSA_XNACK=1 %libomptarget-run-generic 2>&1 \
+// RUN: | %fcheck-generic
+
+// RUN: %libomptarget-compilexx-generic
+// RUN: env HSA_XNACK=0 %libomptarget-run-generic 2>&1 \
+// RUN: | %fcheck-generic -check-prefix=NO_USM
+
+// REQUIRES: unified_shared_memory
+// REQUIRES: amdgpu
+
+// CHECK: SUCCESS
+// NO_USM: Not accessible
+
+#include <assert.h>
+#include <iostream>
+#include <omp.h>
+#include <stdio.h>
+
+int main() {
+ int n = 10000;
+ int *a = new int[n];
+ int err = 0;
+
+ // program must be executed with HSA_XNACK=1
+ if (!omp_target_is_accessible(a, n * sizeof(int), /*device_num=*/0))
+ printf("Not accessible\n");
+ else {
+#pragma omp target teams distribute parallel for
+ for (int i = 0; i < n; i++)
+ a[i] = i;
+
+ for (int i = 0; i < n; i++)
+ if (a[i] != i)
+ err++;
+ }
+
+ printf("%s\n", err == 0 ? "SUCCESS" : "FAIL");
+ return err;
+}
>From b33b27ea15da8885f5db7871fdbfe7593c9bd5ec Mon Sep 17 00:00:00 2001
From: nicebert <110385235+nicebert at users.noreply.github.com>
Date: Mon, 28 Jul 2025 16:49:21 +0200
Subject: [PATCH 02/18] Update offload/libomptarget/OpenMP/API.cpp
Co-authored-by: Shilei Tian <i at tianshilei.me>
---
offload/libomptarget/OpenMP/API.cpp | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/offload/libomptarget/OpenMP/API.cpp b/offload/libomptarget/OpenMP/API.cpp
index 3ad54220c1135..2958779397946 100644
--- a/offload/libomptarget/OpenMP/API.cpp
+++ b/offload/libomptarget/OpenMP/API.cpp
@@ -220,7 +220,7 @@ EXTERN int omp_target_is_accessible(const void *Ptr, size_t Size,
return true;
}
- // the device number must refer to a valid device
+ // The device number must refer to a valid device
auto DeviceOrErr = PM->getDevice(DeviceNum);
if (!DeviceOrErr)
FATAL_MESSAGE(DeviceNum, "%s", toString(DeviceOrErr.takeError()).c_str());
>From bf01578259844418a3f0d5f3eeb48dba6c57aad3 Mon Sep 17 00:00:00 2001
From: nicebert <110385235+nicebert at users.noreply.github.com>
Date: Mon, 28 Jul 2025 16:49:57 +0200
Subject: [PATCH 03/18] Fix comment spelling
Co-authored-by: Shilei Tian <i at tianshilei.me>
---
offload/libomptarget/OpenMP/API.cpp | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/offload/libomptarget/OpenMP/API.cpp b/offload/libomptarget/OpenMP/API.cpp
index 2958779397946..5dc294381d545 100644
--- a/offload/libomptarget/OpenMP/API.cpp
+++ b/offload/libomptarget/OpenMP/API.cpp
@@ -225,7 +225,7 @@ EXTERN int omp_target_is_accessible(const void *Ptr, size_t Size,
if (!DeviceOrErr)
FATAL_MESSAGE(DeviceNum, "%s", toString(DeviceOrErr.takeError()).c_str());
- // for OpenMP 5.1 the routine checks whether a host pointer is accessible from
+ // For OpenMP 5.1 the routine checks whether a host pointer is accessible from
// the device this requires for the device to support unified shared memory
if (DeviceOrErr->supportsUnifiedMemory()) {
DP("Device %d supports unified memory, returning true\n", DeviceNum);
>From d20f4d5c171852ca42115d0dddd8f329dde6db80 Mon Sep 17 00:00:00 2001
From: Nicole Aschenbrenner <nicole.aschenbrenner at amd.com>
Date: Fri, 2 May 2025 09:58:23 -0400
Subject: [PATCH 04/18] [OpenMP] Adds omp_target_is_accessible routine
Adds implementation of omp_target_is_accessible routine with
5.1 behaviour, checking if a host pointer is acccessible from a device
without running on the device (from the host).
---
offload/libomptarget/OpenMP/API.cpp | 12 ++++++++++--
1 file changed, 10 insertions(+), 2 deletions(-)
diff --git a/offload/libomptarget/OpenMP/API.cpp b/offload/libomptarget/OpenMP/API.cpp
index 5dc294381d545..2b92d2c9c3f2d 100644
--- a/offload/libomptarget/OpenMP/API.cpp
+++ b/offload/libomptarget/OpenMP/API.cpp
@@ -220,18 +220,26 @@ EXTERN int omp_target_is_accessible(const void *Ptr, size_t Size,
return true;
}
- // The device number must refer to a valid device
+ // the device number must refer to a valid device
auto DeviceOrErr = PM->getDevice(DeviceNum);
if (!DeviceOrErr)
FATAL_MESSAGE(DeviceNum, "%s", toString(DeviceOrErr.takeError()).c_str());
- // For OpenMP 5.1 the routine checks whether a host pointer is accessible from
+ // TODO: Add check for openmp version compatability
+
+ // for OpenMP 5.1 the routine checks whether a host pointer is accessible from
// the device this requires for the device to support unified shared memory
if (DeviceOrErr->supportsUnifiedMemory()) {
DP("Device %d supports unified memory, returning true\n", DeviceNum);
return true;
}
+ // TODO: Provide stubs & implementation to check whether a pointer is accessible from a given device
+ // using hsa_amd_pointer_info for AMDGPU implementation
+ // for OpenMP 6.x the specification is required to return true if
+ // the accessibility of the pointer can be determined otherwise it's allowed to return false
+ // the specification will be clarified from the current wording
+
// functionality to check whether a device pointer is accessible from a device
// (OpenMP 6.0) from the host might not be possible
DP("Device %d does not support unified memory, returning false\n", DeviceNum);
>From cb872425f16aa0c4de1905a2fb7e9a6971ef5d88 Mon Sep 17 00:00:00 2001
From: Nicole Aschenbrenner <nicole.aschenbrenner at amd.com>
Date: Fri, 2 May 2025 09:58:23 -0400
Subject: [PATCH 05/18] [OpenMP] Adds omp_target_is_accessible routine
Adds implementation of omp_target_is_accessible routine with
5.1 behaviour, checking if a host pointer is acccessible from a device
without running on the device (from the host).
---
offload/libomptarget/OpenMP/API.cpp | 13 +++++++++++--
1 file changed, 11 insertions(+), 2 deletions(-)
diff --git a/offload/libomptarget/OpenMP/API.cpp b/offload/libomptarget/OpenMP/API.cpp
index 5dc294381d545..4d804934c47ed 100644
--- a/offload/libomptarget/OpenMP/API.cpp
+++ b/offload/libomptarget/OpenMP/API.cpp
@@ -220,18 +220,27 @@ EXTERN int omp_target_is_accessible(const void *Ptr, size_t Size,
return true;
}
- // The device number must refer to a valid device
+ // the device number must refer to a valid device
auto DeviceOrErr = PM->getDevice(DeviceNum);
if (!DeviceOrErr)
FATAL_MESSAGE(DeviceNum, "%s", toString(DeviceOrErr.takeError()).c_str());
- // For OpenMP 5.1 the routine checks whether a host pointer is accessible from
+ // TODO: Add check for openmp version compatability
+
+ // for OpenMP 5.1 the routine checks whether a host pointer is accessible from
// the device this requires for the device to support unified shared memory
if (DeviceOrErr->supportsUnifiedMemory()) {
DP("Device %d supports unified memory, returning true\n", DeviceNum);
return true;
}
+ // TODO: Provide stubs & implementation to check whether a pointer is
+ // accessible from a given device using hsa_amd_pointer_info for AMDGPU
+ // implementation for OpenMP 6.x the specification is required to return true
+ // if the accessibility of the pointer can be determined otherwise it's
+ // allowed to return false the specification will be clarified from the
+ // current wording
+
// functionality to check whether a device pointer is accessible from a device
// (OpenMP 6.0) from the host might not be possible
DP("Device %d does not support unified memory, returning false\n", DeviceNum);
>From 95ab6fe61af091a0bbf8b3337ba8073adb01aad2 Mon Sep 17 00:00:00 2001
From: Nicole Aschenbrenner <nicole.aschenbrenner at amd.com>
Date: Fri, 1 Aug 2025 04:55:50 -0500
Subject: [PATCH 06/18] [OpenMP] Reverts omp_get_initial_device changes
---
offload/libomptarget/OpenMP/API.cpp | 3 +--
1 file changed, 1 insertion(+), 2 deletions(-)
diff --git a/offload/libomptarget/OpenMP/API.cpp b/offload/libomptarget/OpenMP/API.cpp
index 4d804934c47ed..80bfb7f689a75 100644
--- a/offload/libomptarget/OpenMP/API.cpp
+++ b/offload/libomptarget/OpenMP/API.cpp
@@ -93,8 +93,7 @@ EXTERN int omp_get_device_num(void) {
EXTERN int omp_get_initial_device(void) {
TIMESCOPE();
OMPT_IF_BUILT(ReturnAddressSetterRAII RA(__builtin_return_address(0)));
- int NumDevices = omp_get_num_devices();
- int HostDevice = NumDevices == 0 ? -1 : NumDevices;
+ int HostDevice = omp_get_num_devices();
DP("Call to omp_get_initial_device returning %d\n", HostDevice);
return HostDevice;
}
>From 9d974242181604bf55d5054698f1d4f9ac68a7ad Mon Sep 17 00:00:00 2001
From: Nicole Aschenbrenner <nicole.aschenbrenner at amd.com>
Date: Fri, 2 May 2025 09:58:23 -0400
Subject: [PATCH 07/18] [OpenMP] Adds omp_target_is_accessible routine
Adds implementation of omp_target_is_accessible routine with
5.1 behaviour, checking if a host pointer is acccessible from a device
without running on the device (from the host).
---
offload/include/device.h | 3 ++
offload/include/omptarget.h | 1 +
offload/libomptarget/OpenMP/API.cpp | 45 ++++++++++++++++++-
offload/libomptarget/device.cpp | 4 ++
offload/libomptarget/exports | 1 +
offload/plugins-nextgen/amdgpu/src/rtl.cpp | 2 +
.../common/include/PluginInterface.h | 7 +++
.../common/src/PluginInterface.cpp | 8 ++++
offload/test/mapping/is_accessible.cpp | 40 +++++++++++++++++
9 files changed, 110 insertions(+), 1 deletion(-)
create mode 100644 offload/test/mapping/is_accessible.cpp
diff --git a/offload/include/device.h b/offload/include/device.h
index bf93ce0460aef..24c36c73ce4ee 100644
--- a/offload/include/device.h
+++ b/offload/include/device.h
@@ -158,6 +158,9 @@ struct DeviceTy {
/// Ask the device whether the runtime should use auto zero-copy.
bool useAutoZeroCopy();
+ /// Ask the device whether it supports unified memory.
+ bool supportsUnifiedMemory();
+
/// Check if there are pending images for this device.
bool hasPendingImages() const { return HasPendingImages; }
diff --git a/offload/include/omptarget.h b/offload/include/omptarget.h
index 8fd722bb15022..6328e29127aa4 100644
--- a/offload/include/omptarget.h
+++ b/offload/include/omptarget.h
@@ -280,6 +280,7 @@ int omp_get_initial_device(void);
void *omp_target_alloc(size_t Size, int DeviceNum);
void omp_target_free(void *DevicePtr, int DeviceNum);
int omp_target_is_present(const void *Ptr, int DeviceNum);
+int omp_target_is_accessible(const void *Ptr, size_t Size, int DeviceNum);
int omp_target_memcpy(void *Dst, const void *Src, size_t Length,
size_t DstOffset, size_t SrcOffset, int DstDevice,
int SrcDevice);
diff --git a/offload/libomptarget/OpenMP/API.cpp b/offload/libomptarget/OpenMP/API.cpp
index b0f0573833713..91704b444a70c 100644
--- a/offload/libomptarget/OpenMP/API.cpp
+++ b/offload/libomptarget/OpenMP/API.cpp
@@ -94,7 +94,8 @@ EXTERN int omp_get_device_num(void) {
EXTERN int omp_get_initial_device(void) {
TIMESCOPE();
OMPT_IF_BUILT(ReturnAddressSetterRAII RA(__builtin_return_address(0)));
- int HostDevice = omp_get_num_devices();
+ int NumDevices = omp_get_num_devices();
+ int HostDevice = NumDevices == 0 ? -1 : NumDevices;
DP("Call to omp_get_initial_device returning %d\n", HostDevice);
return HostDevice;
}
@@ -196,6 +197,48 @@ EXTERN int omp_target_is_present(const void *Ptr, int DeviceNum) {
return Rc;
}
+/// Check whether a pointer is accessible from a device.
+/// the functionality is available in OpenMP 5.1 and later
+/// OpenMP 5.1
+/// omp_target_is_accessible checks whether a host pointer is accessible from a
+/// device OpenMP 6.0 removes restriction on pointer, allowing any pointer
+/// interpreted as a pointer in the address space of the given device.
+EXTERN int omp_target_is_accessible(const void *Ptr, size_t Size,
+ int DeviceNum) {
+ TIMESCOPE();
+ OMPT_IF_BUILT(ReturnAddressSetterRAII RA(__builtin_return_address(0)));
+ DP("Call to omp_target_is_accessible for device %d, address " DPxMOD
+ ", size %zu\n",
+ DeviceNum, DPxPTR(Ptr), Size);
+
+ if (!Ptr) {
+ DP("Call to omp_target_is_accessible with NULL ptr returning false\n");
+ return false;
+ }
+
+ if (DeviceNum == omp_get_initial_device()) {
+ DP("Call to omp_target_is_accessible on host, returning true\n");
+ return true;
+ }
+
+ // the device number must refer to a valid device
+ auto DeviceOrErr = PM->getDevice(DeviceNum);
+ if (!DeviceOrErr)
+ FATAL_MESSAGE(DeviceNum, "%s", toString(DeviceOrErr.takeError()).c_str());
+
+ // for OpenMP 5.1 the routine checks whether a host pointer is accessible from
+ // the device this requires for the device to support unified shared memory
+ if (DeviceOrErr->supportsUnifiedMemory()) {
+ DP("Device %d supports unified memory, returning true\n", DeviceNum);
+ return true;
+ }
+
+ // functionality to check whether a device pointer is accessible from a device
+ // (OpenMP 6.0) from the host might not be possible
+ DP("Device %d does not support unified memory, returning false\n", DeviceNum);
+ return false;
+}
+
EXTERN int omp_target_memcpy(void *Dst, const void *Src, size_t Length,
size_t DstOffset, size_t SrcOffset, int DstDevice,
int SrcDevice) {
diff --git a/offload/libomptarget/device.cpp b/offload/libomptarget/device.cpp
index 71423ae0c94d9..ea46037059686 100644
--- a/offload/libomptarget/device.cpp
+++ b/offload/libomptarget/device.cpp
@@ -367,3 +367,7 @@ bool DeviceTy::useAutoZeroCopy() {
return false;
return RTL->use_auto_zero_copy(RTLDeviceID);
}
+
+bool DeviceTy::supportsUnifiedMemory() {
+ return RTL->supports_unified_memory(RTLDeviceID);
+}
diff --git a/offload/libomptarget/exports b/offload/libomptarget/exports
index 8e2db6ba8bba4..95ddd03bb46a3 100644
--- a/offload/libomptarget/exports
+++ b/offload/libomptarget/exports
@@ -43,6 +43,7 @@ VERS1.0 {
omp_get_initial_device;
omp_target_alloc;
omp_target_free;
+ omp_target_is_accessible;
omp_target_is_present;
omp_target_memcpy;
omp_target_memcpy_rect;
diff --git a/offload/plugins-nextgen/amdgpu/src/rtl.cpp b/offload/plugins-nextgen/amdgpu/src/rtl.cpp
index c26cfe961aa0e..761761bcdb6e1 100644
--- a/offload/plugins-nextgen/amdgpu/src/rtl.cpp
+++ b/offload/plugins-nextgen/amdgpu/src/rtl.cpp
@@ -3027,6 +3027,8 @@ struct AMDGPUDeviceTy : public GenericDeviceTy, AMDGenericDeviceTy {
return ((IsAPU || OMPX_ApuMaps) && IsXnackEnabled);
}
+ bool supportsUnifiedMemoryImpl() override { return IsXnackEnabled; }
+
/// Getters and setters for stack and heap sizes.
Error getDeviceStackSize(uint64_t &Value) override {
Value = StackSize;
diff --git a/offload/plugins-nextgen/common/include/PluginInterface.h b/offload/plugins-nextgen/common/include/PluginInterface.h
index 6ff3ef8cda177..e5731ec13d869 100644
--- a/offload/plugins-nextgen/common/include/PluginInterface.h
+++ b/offload/plugins-nextgen/common/include/PluginInterface.h
@@ -1093,6 +1093,10 @@ struct GenericDeviceTy : public DeviceAllocatorTy {
bool useAutoZeroCopy();
virtual bool useAutoZeroCopyImpl() { return false; }
+ /// Returns true if the device has unified memory capabilities
+ bool supportsUnifiedMemory();
+ virtual bool supportsUnifiedMemoryImpl() { return false; }
+
virtual Expected<omp_interop_val_t *>
createInterop(int32_t InteropType, interop_spec_t &InteropSpec) {
return nullptr;
@@ -1523,6 +1527,9 @@ struct GenericPluginTy {
/// Returns if the plugin can support automatic copy.
int32_t use_auto_zero_copy(int32_t DeviceId);
+ /// Returns if the the device supports unified memory.
+ int32_t supports_unified_memory(int32_t DeviceId);
+
/// Look up a global symbol in the given binary.
int32_t get_global(__tgt_device_binary Binary, uint64_t Size,
const char *Name, void **DevicePtr);
diff --git a/offload/plugins-nextgen/common/src/PluginInterface.cpp b/offload/plugins-nextgen/common/src/PluginInterface.cpp
index 36cdd6035e26d..6f7c12810c111 100644
--- a/offload/plugins-nextgen/common/src/PluginInterface.cpp
+++ b/offload/plugins-nextgen/common/src/PluginInterface.cpp
@@ -1607,6 +1607,10 @@ Error GenericDeviceTy::syncEvent(void *EventPtr) {
bool GenericDeviceTy::useAutoZeroCopy() { return useAutoZeroCopyImpl(); }
+bool GenericDeviceTy::supportsUnifiedMemory() {
+ return supportsUnifiedMemoryImpl();
+}
+
Error GenericPluginTy::init() {
if (Initialized)
return Plugin::success();
@@ -2159,6 +2163,10 @@ int32_t GenericPluginTy::use_auto_zero_copy(int32_t DeviceId) {
return getDevice(DeviceId).useAutoZeroCopy();
}
+int32_t GenericPluginTy::supports_unified_memory(int32_t DeviceId) {
+ return getDevice(DeviceId).supportsUnifiedMemory();
+}
+
int32_t GenericPluginTy::get_global(__tgt_device_binary Binary, uint64_t Size,
const char *Name, void **DevicePtr) {
assert(Binary.handle && "Invalid device binary handle");
diff --git a/offload/test/mapping/is_accessible.cpp b/offload/test/mapping/is_accessible.cpp
new file mode 100644
index 0000000000000..6d6a0048e01f3
--- /dev/null
+++ b/offload/test/mapping/is_accessible.cpp
@@ -0,0 +1,40 @@
+// RUN: %libomptarget-compilexx-generic
+// RUN: env HSA_XNACK=1 %libomptarget-run-generic 2>&1 \
+// RUN: | %fcheck-generic
+
+// RUN: %libomptarget-compilexx-generic
+// RUN: env HSA_XNACK=0 %libomptarget-run-generic 2>&1 \
+// RUN: | %fcheck-generic -check-prefix=NO_USM
+
+// REQUIRES: unified_shared_memory
+// REQUIRES: amdgpu
+
+// CHECK: SUCCESS
+// NO_USM: Not accessible
+
+#include <assert.h>
+#include <iostream>
+#include <omp.h>
+#include <stdio.h>
+
+int main() {
+ int n = 10000;
+ int *a = new int[n];
+ int err = 0;
+
+ // program must be executed with HSA_XNACK=1
+ if (!omp_target_is_accessible(a, n * sizeof(int), /*device_num=*/0))
+ printf("Not accessible\n");
+ else {
+#pragma omp target teams distribute parallel for
+ for (int i = 0; i < n; i++)
+ a[i] = i;
+
+ for (int i = 0; i < n; i++)
+ if (a[i] != i)
+ err++;
+ }
+
+ printf("%s\n", err == 0 ? "SUCCESS" : "FAIL");
+ return err;
+}
>From 34acf275b212052e712f77688d7bc32dc9e2caf3 Mon Sep 17 00:00:00 2001
From: nicebert <110385235+nicebert at users.noreply.github.com>
Date: Mon, 28 Jul 2025 16:49:21 +0200
Subject: [PATCH 08/18] Update offload/libomptarget/OpenMP/API.cpp
Co-authored-by: Shilei Tian <i at tianshilei.me>
---
offload/libomptarget/OpenMP/API.cpp | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/offload/libomptarget/OpenMP/API.cpp b/offload/libomptarget/OpenMP/API.cpp
index 91704b444a70c..4c56fd34a02cd 100644
--- a/offload/libomptarget/OpenMP/API.cpp
+++ b/offload/libomptarget/OpenMP/API.cpp
@@ -221,7 +221,7 @@ EXTERN int omp_target_is_accessible(const void *Ptr, size_t Size,
return true;
}
- // the device number must refer to a valid device
+ // The device number must refer to a valid device
auto DeviceOrErr = PM->getDevice(DeviceNum);
if (!DeviceOrErr)
FATAL_MESSAGE(DeviceNum, "%s", toString(DeviceOrErr.takeError()).c_str());
>From d4ecaf6f802e7613e826ef9e2e4fd1b78d0b5140 Mon Sep 17 00:00:00 2001
From: nicebert <110385235+nicebert at users.noreply.github.com>
Date: Mon, 28 Jul 2025 16:49:57 +0200
Subject: [PATCH 09/18] Fix comment spelling
Co-authored-by: Shilei Tian <i at tianshilei.me>
---
offload/libomptarget/OpenMP/API.cpp | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/offload/libomptarget/OpenMP/API.cpp b/offload/libomptarget/OpenMP/API.cpp
index 4c56fd34a02cd..4a9354842446b 100644
--- a/offload/libomptarget/OpenMP/API.cpp
+++ b/offload/libomptarget/OpenMP/API.cpp
@@ -226,7 +226,7 @@ EXTERN int omp_target_is_accessible(const void *Ptr, size_t Size,
if (!DeviceOrErr)
FATAL_MESSAGE(DeviceNum, "%s", toString(DeviceOrErr.takeError()).c_str());
- // for OpenMP 5.1 the routine checks whether a host pointer is accessible from
+ // For OpenMP 5.1 the routine checks whether a host pointer is accessible from
// the device this requires for the device to support unified shared memory
if (DeviceOrErr->supportsUnifiedMemory()) {
DP("Device %d supports unified memory, returning true\n", DeviceNum);
>From 2792290a1d9638bf9eca0e9c6196be3a8268597b Mon Sep 17 00:00:00 2001
From: Nicole Aschenbrenner <nicole.aschenbrenner at amd.com>
Date: Fri, 2 May 2025 09:58:23 -0400
Subject: [PATCH 10/18] [OpenMP] Adds omp_target_is_accessible routine
Adds implementation of omp_target_is_accessible routine with
5.1 behaviour, checking if a host pointer is acccessible from a device
without running on the device (from the host).
---
offload/libomptarget/OpenMP/API.cpp | 13 +++++++++++--
1 file changed, 11 insertions(+), 2 deletions(-)
diff --git a/offload/libomptarget/OpenMP/API.cpp b/offload/libomptarget/OpenMP/API.cpp
index 4a9354842446b..11eb219ef14a9 100644
--- a/offload/libomptarget/OpenMP/API.cpp
+++ b/offload/libomptarget/OpenMP/API.cpp
@@ -221,18 +221,27 @@ EXTERN int omp_target_is_accessible(const void *Ptr, size_t Size,
return true;
}
- // The device number must refer to a valid device
+ // the device number must refer to a valid device
auto DeviceOrErr = PM->getDevice(DeviceNum);
if (!DeviceOrErr)
FATAL_MESSAGE(DeviceNum, "%s", toString(DeviceOrErr.takeError()).c_str());
- // For OpenMP 5.1 the routine checks whether a host pointer is accessible from
+ // TODO: Add check for openmp version compatability
+
+ // for OpenMP 5.1 the routine checks whether a host pointer is accessible from
// the device this requires for the device to support unified shared memory
if (DeviceOrErr->supportsUnifiedMemory()) {
DP("Device %d supports unified memory, returning true\n", DeviceNum);
return true;
}
+ // TODO: Provide stubs & implementation to check whether a pointer is
+ // accessible from a given device using hsa_amd_pointer_info for AMDGPU
+ // implementation for OpenMP 6.x the specification is required to return true
+ // if the accessibility of the pointer can be determined otherwise it's
+ // allowed to return false the specification will be clarified from the
+ // current wording
+
// functionality to check whether a device pointer is accessible from a device
// (OpenMP 6.0) from the host might not be possible
DP("Device %d does not support unified memory, returning false\n", DeviceNum);
>From 712bdd101e0c727da69af5e01d468885fcf99df0 Mon Sep 17 00:00:00 2001
From: Nicole Aschenbrenner <nicole.aschenbrenner at amd.com>
Date: Fri, 1 Aug 2025 04:55:50 -0500
Subject: [PATCH 11/18] [OpenMP] Reverts omp_get_initial_device changes
---
offload/libomptarget/OpenMP/API.cpp | 3 +--
1 file changed, 1 insertion(+), 2 deletions(-)
diff --git a/offload/libomptarget/OpenMP/API.cpp b/offload/libomptarget/OpenMP/API.cpp
index 11eb219ef14a9..3632f0ffe7d99 100644
--- a/offload/libomptarget/OpenMP/API.cpp
+++ b/offload/libomptarget/OpenMP/API.cpp
@@ -94,8 +94,7 @@ EXTERN int omp_get_device_num(void) {
EXTERN int omp_get_initial_device(void) {
TIMESCOPE();
OMPT_IF_BUILT(ReturnAddressSetterRAII RA(__builtin_return_address(0)));
- int NumDevices = omp_get_num_devices();
- int HostDevice = NumDevices == 0 ? -1 : NumDevices;
+ int HostDevice = omp_get_num_devices();
DP("Call to omp_get_initial_device returning %d\n", HostDevice);
return HostDevice;
}
>From dd1574782d5ad679ed73c834169a5227f88d5dec Mon Sep 17 00:00:00 2001
From: Nicole Aschenbrenner <nicole.aschenbrenner at amd.com>
Date: Mon, 15 Sep 2025 07:12:51 -0500
Subject: [PATCH 12/18] [OpenMP] Rework implementation to be conform to OpenMP
6.0
Removes restriction on Ptr to host pointers.
Provides accessibility check for AMDGPU through HSA + default implementation returning false.
---
offload/include/device.h | 4 ++--
offload/libomptarget/OpenMP/API.cpp | 21 +------------------
offload/libomptarget/device.cpp | 6 +++---
offload/plugins-nextgen/amdgpu/src/rtl.cpp | 21 ++++++++++++++++++-
.../common/include/PluginInterface.h | 11 +++++-----
.../common/src/PluginInterface.cpp | 8 +++----
6 files changed, 35 insertions(+), 36 deletions(-)
diff --git a/offload/include/device.h b/offload/include/device.h
index 24c36c73ce4ee..4e27943d1dbc1 100644
--- a/offload/include/device.h
+++ b/offload/include/device.h
@@ -158,8 +158,8 @@ struct DeviceTy {
/// Ask the device whether the runtime should use auto zero-copy.
bool useAutoZeroCopy();
- /// Ask the device whether it supports unified memory.
- bool supportsUnifiedMemory();
+ /// Ask the device whether the storage is accessible.
+ bool isAccessiblePtr(const void *Ptr, size_t Size);
/// Check if there are pending images for this device.
bool hasPendingImages() const { return HasPendingImages; }
diff --git a/offload/libomptarget/OpenMP/API.cpp b/offload/libomptarget/OpenMP/API.cpp
index 3632f0ffe7d99..12a3a0cfb783a 100644
--- a/offload/libomptarget/OpenMP/API.cpp
+++ b/offload/libomptarget/OpenMP/API.cpp
@@ -225,26 +225,7 @@ EXTERN int omp_target_is_accessible(const void *Ptr, size_t Size,
if (!DeviceOrErr)
FATAL_MESSAGE(DeviceNum, "%s", toString(DeviceOrErr.takeError()).c_str());
- // TODO: Add check for openmp version compatability
-
- // for OpenMP 5.1 the routine checks whether a host pointer is accessible from
- // the device this requires for the device to support unified shared memory
- if (DeviceOrErr->supportsUnifiedMemory()) {
- DP("Device %d supports unified memory, returning true\n", DeviceNum);
- return true;
- }
-
- // TODO: Provide stubs & implementation to check whether a pointer is
- // accessible from a given device using hsa_amd_pointer_info for AMDGPU
- // implementation for OpenMP 6.x the specification is required to return true
- // if the accessibility of the pointer can be determined otherwise it's
- // allowed to return false the specification will be clarified from the
- // current wording
-
- // functionality to check whether a device pointer is accessible from a device
- // (OpenMP 6.0) from the host might not be possible
- DP("Device %d does not support unified memory, returning false\n", DeviceNum);
- return false;
+ return DeviceOrErr->isAccessiblePtr(Ptr, Size);
}
EXTERN int omp_target_memcpy(void *Dst, const void *Src, size_t Length,
diff --git a/offload/libomptarget/device.cpp b/offload/libomptarget/device.cpp
index ea46037059686..1fd853534eeaa 100644
--- a/offload/libomptarget/device.cpp
+++ b/offload/libomptarget/device.cpp
@@ -368,6 +368,6 @@ bool DeviceTy::useAutoZeroCopy() {
return RTL->use_auto_zero_copy(RTLDeviceID);
}
-bool DeviceTy::supportsUnifiedMemory() {
- return RTL->supports_unified_memory(RTLDeviceID);
-}
+bool DeviceTy::isAccessiblePtr(const void *Ptr, size_t Size) {
+ return RTL->is_accessible_ptr(RTLDeviceID, Ptr, Size);
+}
\ No newline at end of file
diff --git a/offload/plugins-nextgen/amdgpu/src/rtl.cpp b/offload/plugins-nextgen/amdgpu/src/rtl.cpp
index 761761bcdb6e1..9a6e25ab57303 100644
--- a/offload/plugins-nextgen/amdgpu/src/rtl.cpp
+++ b/offload/plugins-nextgen/amdgpu/src/rtl.cpp
@@ -3027,7 +3027,26 @@ struct AMDGPUDeviceTy : public GenericDeviceTy, AMDGenericDeviceTy {
return ((IsAPU || OMPX_ApuMaps) && IsXnackEnabled);
}
- bool supportsUnifiedMemoryImpl() override { return IsXnackEnabled; }
+ bool isAccessiblePtrImpl(const void *Ptr, size_t Size) override {
+ hsa_amd_pointer_info_t Info;
+ Info.size = sizeof(hsa_amd_pointer_info_t);
+
+ hsa_agent_t *Agents = nullptr;
+ uint32_t Count = 0;
+ hsa_status_t Status = hsa_amd_pointer_info(Ptr, &Info, malloc, &Count, &Agents);
+
+ if (Status != HSA_STATUS_SUCCESS)
+ return false;
+
+ // Checks if the pointer is known by HSA and accessible by the device
+ for(uint32_t i = 0; i < Count; i++)
+ if(Agents[i].handle == getAgent().handle)
+ return Info.sizeInBytes >= Size;
+
+ // If the pointer is unknown to HSA it's assumed a host pointer
+ // in that case the device can access it on unified memory support is enabled
+ return IsXnackEnabled;
+ }
/// Getters and setters for stack and heap sizes.
Error getDeviceStackSize(uint64_t &Value) override {
diff --git a/offload/plugins-nextgen/common/include/PluginInterface.h b/offload/plugins-nextgen/common/include/PluginInterface.h
index e5731ec13d869..391700487ab89 100644
--- a/offload/plugins-nextgen/common/include/PluginInterface.h
+++ b/offload/plugins-nextgen/common/include/PluginInterface.h
@@ -1093,9 +1093,10 @@ struct GenericDeviceTy : public DeviceAllocatorTy {
bool useAutoZeroCopy();
virtual bool useAutoZeroCopyImpl() { return false; }
- /// Returns true if the device has unified memory capabilities
- bool supportsUnifiedMemory();
- virtual bool supportsUnifiedMemoryImpl() { return false; }
+ /// Returns true if the plugin can guarantee that the associated
+ /// storage is accessible
+ bool isAccessiblePtr(const void *Ptr, size_t Size);
+ virtual bool isAccessiblePtrImpl(const void *Ptr, size_t Size) { return false; }
virtual Expected<omp_interop_val_t *>
createInterop(int32_t InteropType, interop_spec_t &InteropSpec) {
@@ -1527,8 +1528,8 @@ struct GenericPluginTy {
/// Returns if the plugin can support automatic copy.
int32_t use_auto_zero_copy(int32_t DeviceId);
- /// Returns if the the device supports unified memory.
- int32_t supports_unified_memory(int32_t DeviceId);
+ /// Returns if the associated storage is accessible for a given device.
+ int32_t is_accessible_ptr(int32_t DeviceId, const void *Ptr, size_t Size);
/// Look up a global symbol in the given binary.
int32_t get_global(__tgt_device_binary Binary, uint64_t Size,
diff --git a/offload/plugins-nextgen/common/src/PluginInterface.cpp b/offload/plugins-nextgen/common/src/PluginInterface.cpp
index 6f7c12810c111..e4a8be19d61bb 100644
--- a/offload/plugins-nextgen/common/src/PluginInterface.cpp
+++ b/offload/plugins-nextgen/common/src/PluginInterface.cpp
@@ -1607,9 +1607,7 @@ Error GenericDeviceTy::syncEvent(void *EventPtr) {
bool GenericDeviceTy::useAutoZeroCopy() { return useAutoZeroCopyImpl(); }
-bool GenericDeviceTy::supportsUnifiedMemory() {
- return supportsUnifiedMemoryImpl();
-}
+bool GenericDeviceTy::isAccessiblePtr(const void *Ptr, size_t Size) { return isAccessiblePtrImpl(Ptr, Size); }
Error GenericPluginTy::init() {
if (Initialized)
@@ -2163,8 +2161,8 @@ int32_t GenericPluginTy::use_auto_zero_copy(int32_t DeviceId) {
return getDevice(DeviceId).useAutoZeroCopy();
}
-int32_t GenericPluginTy::supports_unified_memory(int32_t DeviceId) {
- return getDevice(DeviceId).supportsUnifiedMemory();
+int32_t GenericPluginTy::is_accessible_ptr(int32_t DeviceId, const void *Ptr, size_t Size) {
+ return getDevice(DeviceId).isAccessiblePtr(Ptr, Size);
}
int32_t GenericPluginTy::get_global(__tgt_device_binary Binary, uint64_t Size,
>From e9dccd6c1b43446ec250c30223611a86bebaaf9b Mon Sep 17 00:00:00 2001
From: Nicole Aschenbrenner <nicole.aschenbrenner at amd.com>
Date: Wed, 17 Sep 2025 07:35:18 -0500
Subject: [PATCH 13/18] Applies git-clang-format
---
offload/plugins-nextgen/amdgpu/src/rtl.cpp | 12 +++++++-----
.../plugins-nextgen/common/include/PluginInterface.h | 4 +++-
.../plugins-nextgen/common/src/PluginInterface.cpp | 7 +++++--
3 files changed, 15 insertions(+), 8 deletions(-)
diff --git a/offload/plugins-nextgen/amdgpu/src/rtl.cpp b/offload/plugins-nextgen/amdgpu/src/rtl.cpp
index 9a6e25ab57303..47ee878fd167b 100644
--- a/offload/plugins-nextgen/amdgpu/src/rtl.cpp
+++ b/offload/plugins-nextgen/amdgpu/src/rtl.cpp
@@ -3033,18 +3033,20 @@ struct AMDGPUDeviceTy : public GenericDeviceTy, AMDGenericDeviceTy {
hsa_agent_t *Agents = nullptr;
uint32_t Count = 0;
- hsa_status_t Status = hsa_amd_pointer_info(Ptr, &Info, malloc, &Count, &Agents);
-
+ hsa_status_t Status =
+ hsa_amd_pointer_info(Ptr, &Info, malloc, &Count, &Agents);
+
if (Status != HSA_STATUS_SUCCESS)
return false;
// Checks if the pointer is known by HSA and accessible by the device
- for(uint32_t i = 0; i < Count; i++)
- if(Agents[i].handle == getAgent().handle)
+ for (uint32_t i = 0; i < Count; i++)
+ if (Agents[i].handle == getAgent().handle)
return Info.sizeInBytes >= Size;
// If the pointer is unknown to HSA it's assumed a host pointer
- // in that case the device can access it on unified memory support is enabled
+ // in that case the device can access it on unified memory support is
+ // enabled
return IsXnackEnabled;
}
diff --git a/offload/plugins-nextgen/common/include/PluginInterface.h b/offload/plugins-nextgen/common/include/PluginInterface.h
index 391700487ab89..dfb9f5b4886bd 100644
--- a/offload/plugins-nextgen/common/include/PluginInterface.h
+++ b/offload/plugins-nextgen/common/include/PluginInterface.h
@@ -1096,7 +1096,9 @@ struct GenericDeviceTy : public DeviceAllocatorTy {
/// Returns true if the plugin can guarantee that the associated
/// storage is accessible
bool isAccessiblePtr(const void *Ptr, size_t Size);
- virtual bool isAccessiblePtrImpl(const void *Ptr, size_t Size) { return false; }
+ virtual bool isAccessiblePtrImpl(const void *Ptr, size_t Size) {
+ return false;
+ }
virtual Expected<omp_interop_val_t *>
createInterop(int32_t InteropType, interop_spec_t &InteropSpec) {
diff --git a/offload/plugins-nextgen/common/src/PluginInterface.cpp b/offload/plugins-nextgen/common/src/PluginInterface.cpp
index e4a8be19d61bb..2ff644f43ce40 100644
--- a/offload/plugins-nextgen/common/src/PluginInterface.cpp
+++ b/offload/plugins-nextgen/common/src/PluginInterface.cpp
@@ -1607,7 +1607,9 @@ Error GenericDeviceTy::syncEvent(void *EventPtr) {
bool GenericDeviceTy::useAutoZeroCopy() { return useAutoZeroCopyImpl(); }
-bool GenericDeviceTy::isAccessiblePtr(const void *Ptr, size_t Size) { return isAccessiblePtrImpl(Ptr, Size); }
+bool GenericDeviceTy::isAccessiblePtr(const void *Ptr, size_t Size) {
+ return isAccessiblePtrImpl(Ptr, Size);
+}
Error GenericPluginTy::init() {
if (Initialized)
@@ -2161,7 +2163,8 @@ int32_t GenericPluginTy::use_auto_zero_copy(int32_t DeviceId) {
return getDevice(DeviceId).useAutoZeroCopy();
}
-int32_t GenericPluginTy::is_accessible_ptr(int32_t DeviceId, const void *Ptr, size_t Size) {
+int32_t GenericPluginTy::is_accessible_ptr(int32_t DeviceId, const void *Ptr,
+ size_t Size) {
return getDevice(DeviceId).isAccessiblePtr(Ptr, Size);
}
>From 4b51745f3914b61837dfa41668d544a9d1e01ee6 Mon Sep 17 00:00:00 2001
From: Nicole Aschenbrenner <nicole.aschenbrenner at amd.com>
Date: Fri, 19 Sep 2025 03:49:29 -0500
Subject: [PATCH 14/18] Fixes formatting and comment issues.
---
offload/libomptarget/OpenMP/API.cpp | 8 ++------
offload/libomptarget/device.cpp | 2 +-
2 files changed, 3 insertions(+), 7 deletions(-)
diff --git a/offload/libomptarget/OpenMP/API.cpp b/offload/libomptarget/OpenMP/API.cpp
index 12a3a0cfb783a..aa96dd336bfb8 100644
--- a/offload/libomptarget/OpenMP/API.cpp
+++ b/offload/libomptarget/OpenMP/API.cpp
@@ -197,11 +197,7 @@ EXTERN int omp_target_is_present(const void *Ptr, int DeviceNum) {
}
/// Check whether a pointer is accessible from a device.
-/// the functionality is available in OpenMP 5.1 and later
-/// OpenMP 5.1
-/// omp_target_is_accessible checks whether a host pointer is accessible from a
-/// device OpenMP 6.0 removes restriction on pointer, allowing any pointer
-/// interpreted as a pointer in the address space of the given device.
+/// Returns true when accessibility is guaranteed otherwise returns false.
EXTERN int omp_target_is_accessible(const void *Ptr, size_t Size,
int DeviceNum) {
TIMESCOPE();
@@ -220,7 +216,7 @@ EXTERN int omp_target_is_accessible(const void *Ptr, size_t Size,
return true;
}
- // the device number must refer to a valid device
+ // The device number must refer to a valid device
auto DeviceOrErr = PM->getDevice(DeviceNum);
if (!DeviceOrErr)
FATAL_MESSAGE(DeviceNum, "%s", toString(DeviceOrErr.takeError()).c_str());
diff --git a/offload/libomptarget/device.cpp b/offload/libomptarget/device.cpp
index 1fd853534eeaa..ee36fbed935a5 100644
--- a/offload/libomptarget/device.cpp
+++ b/offload/libomptarget/device.cpp
@@ -370,4 +370,4 @@ bool DeviceTy::useAutoZeroCopy() {
bool DeviceTy::isAccessiblePtr(const void *Ptr, size_t Size) {
return RTL->is_accessible_ptr(RTLDeviceID, Ptr, Size);
-}
\ No newline at end of file
+}
>From 79dd36f8243d4dc4d40d79b74edf50ac2170c744 Mon Sep 17 00:00:00 2001
From: Nicole Aschenbrenner <nicole.aschenbrenner at amd.com>
Date: Fri, 19 Sep 2025 04:05:40 -0500
Subject: [PATCH 15/18] [OpenMP] Fixes check for host device number
The implemetation is allowed to return -1 for the host device number.
To be complient with the spec both the device number needs to be checked against both -1
as well as the value returned by omp_get_initial_device.
---
offload/libomptarget/OpenMP/API.cpp | 4 ++--
1 file changed, 2 insertions(+), 2 deletions(-)
diff --git a/offload/libomptarget/OpenMP/API.cpp b/offload/libomptarget/OpenMP/API.cpp
index aa96dd336bfb8..7901a8e934fb6 100644
--- a/offload/libomptarget/OpenMP/API.cpp
+++ b/offload/libomptarget/OpenMP/API.cpp
@@ -197,7 +197,7 @@ EXTERN int omp_target_is_present(const void *Ptr, int DeviceNum) {
}
/// Check whether a pointer is accessible from a device.
-/// Returns true when accessibility is guaranteed otherwise returns false.
+/// Returns true when accessibility is guaranteed otherwise returns false.
EXTERN int omp_target_is_accessible(const void *Ptr, size_t Size,
int DeviceNum) {
TIMESCOPE();
@@ -211,7 +211,7 @@ EXTERN int omp_target_is_accessible(const void *Ptr, size_t Size,
return false;
}
- if (DeviceNum == omp_get_initial_device()) {
+ if (DeviceNum == omp_get_initial_device() || DeviceNum == -1) {
DP("Call to omp_target_is_accessible on host, returning true\n");
return true;
}
>From 588c3949a43cc97882af354e384d7580ea62d7cb Mon Sep 17 00:00:00 2001
From: Nicole Aschenbrenner <nicole.aschenbrenner at amd.com>
Date: Fri, 19 Sep 2025 04:09:24 -0500
Subject: [PATCH 16/18] Fixes formatting
---
offload/libomptarget/OpenMP/API.cpp | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/offload/libomptarget/OpenMP/API.cpp b/offload/libomptarget/OpenMP/API.cpp
index 7901a8e934fb6..48b086d671285 100644
--- a/offload/libomptarget/OpenMP/API.cpp
+++ b/offload/libomptarget/OpenMP/API.cpp
@@ -197,7 +197,7 @@ EXTERN int omp_target_is_present(const void *Ptr, int DeviceNum) {
}
/// Check whether a pointer is accessible from a device.
-/// Returns true when accessibility is guaranteed otherwise returns false.
+/// Returns true when accessibility is guaranteed otherwise returns false.
EXTERN int omp_target_is_accessible(const void *Ptr, size_t Size,
int DeviceNum) {
TIMESCOPE();
>From 8961e19bd072b67554261e639ae617ca573c411b Mon Sep 17 00:00:00 2001
From: Nicole Aschenbrenner <nicole.aschenbrenner at amd.com>
Date: Tue, 14 Oct 2025 14:51:18 +0200
Subject: [PATCH 17/18] Review nit add braces to for loop body
Co-authored-by: Shilei Tian <i at tianshilei.me>
---
offload/plugins-nextgen/amdgpu/src/rtl.cpp | 3 ++-
1 file changed, 2 insertions(+), 1 deletion(-)
diff --git a/offload/plugins-nextgen/amdgpu/src/rtl.cpp b/offload/plugins-nextgen/amdgpu/src/rtl.cpp
index bdac35ae971c4..1a8cae35dfa38 100644
--- a/offload/plugins-nextgen/amdgpu/src/rtl.cpp
+++ b/offload/plugins-nextgen/amdgpu/src/rtl.cpp
@@ -3040,9 +3040,10 @@ struct AMDGPUDeviceTy : public GenericDeviceTy, AMDGenericDeviceTy {
return false;
// Checks if the pointer is known by HSA and accessible by the device
- for (uint32_t i = 0; i < Count; i++)
+ for (uint32_t i = 0; i < Count; i++) {
if (Agents[i].handle == getAgent().handle)
return Info.sizeInBytes >= Size;
+ }
// If the pointer is unknown to HSA it's assumed a host pointer
// in that case the device can access it on unified memory support is
>From 357ccd9ba08d3c3c92e56d98d379eacfbaa7ebf4 Mon Sep 17 00:00:00 2001
From: Nicole Aschenbrenner <nicole.aschenbrenner at amd.com>
Date: Thu, 16 Oct 2025 09:14:45 -0500
Subject: [PATCH 18/18] [OpenMP] Changes error handling for
omp_target_is_accessible
Addresses rewiev comments.
Changes LIT test to XFAIL on nvptx.
Changes implementation to provide better debug information to the user about failures.
---
offload/plugins-nextgen/amdgpu/src/rtl.cpp | 6 +++---
.../common/include/PluginInterface.h | 9 +++++----
.../plugins-nextgen/common/src/PluginInterface.cpp | 14 ++++++++++++--
offload/test/mapping/is_accessible.cpp | 2 +-
4 files changed, 21 insertions(+), 10 deletions(-)
diff --git a/offload/plugins-nextgen/amdgpu/src/rtl.cpp b/offload/plugins-nextgen/amdgpu/src/rtl.cpp
index bdac35ae971c4..c04fa78d79488 100644
--- a/offload/plugins-nextgen/amdgpu/src/rtl.cpp
+++ b/offload/plugins-nextgen/amdgpu/src/rtl.cpp
@@ -3027,7 +3027,7 @@ struct AMDGPUDeviceTy : public GenericDeviceTy, AMDGenericDeviceTy {
return ((IsAPU || OMPX_ApuMaps) && IsXnackEnabled);
}
- bool isAccessiblePtrImpl(const void *Ptr, size_t Size) override {
+ Expected<bool> isAccessiblePtrImpl(const void *Ptr, size_t Size) override {
hsa_amd_pointer_info_t Info;
Info.size = sizeof(hsa_amd_pointer_info_t);
@@ -3036,8 +3036,8 @@ struct AMDGPUDeviceTy : public GenericDeviceTy, AMDGenericDeviceTy {
hsa_status_t Status =
hsa_amd_pointer_info(Ptr, &Info, malloc, &Count, &Agents);
- if (Status != HSA_STATUS_SUCCESS)
- return false;
+ if (auto Err = Plugin::check(Status, "error in hsa_amd_pointer_info: %s"))
+ return std::move(Err);
// Checks if the pointer is known by HSA and accessible by the device
for (uint32_t i = 0; i < Count; i++)
diff --git a/offload/plugins-nextgen/common/include/PluginInterface.h b/offload/plugins-nextgen/common/include/PluginInterface.h
index 907c21ec662d3..44b6c26cec95f 100644
--- a/offload/plugins-nextgen/common/include/PluginInterface.h
+++ b/offload/plugins-nextgen/common/include/PluginInterface.h
@@ -1071,10 +1071,7 @@ struct GenericDeviceTy : public DeviceAllocatorTy {
/// Returns true if the plugin can guarantee that the associated
/// storage is accessible
- bool isAccessiblePtr(const void *Ptr, size_t Size);
- virtual bool isAccessiblePtrImpl(const void *Ptr, size_t Size) {
- return false;
- }
+ Expected<bool> isAccessiblePtr(const void *Ptr, size_t Size);
virtual Expected<omp_interop_val_t *>
createInterop(int32_t InteropType, interop_spec_t &InteropSpec) {
@@ -1176,6 +1173,10 @@ struct GenericDeviceTy : public DeviceAllocatorTy {
/// Per device setting of MemoryManager's Threshold
virtual size_t getMemoryManagerSizeThreshold() { return 0; }
+ virtual Expected<bool> isAccessiblePtrImpl(const void *Ptr, size_t Size) {
+ return false;
+ }
+
/// Environment variables defined by the OpenMP standard.
Int32Envar OMP_TeamLimit;
Int32Envar OMP_NumTeams;
diff --git a/offload/plugins-nextgen/common/src/PluginInterface.cpp b/offload/plugins-nextgen/common/src/PluginInterface.cpp
index 0ab3d8dc4c69c..b5b1dbdd4d568 100644
--- a/offload/plugins-nextgen/common/src/PluginInterface.cpp
+++ b/offload/plugins-nextgen/common/src/PluginInterface.cpp
@@ -1593,7 +1593,7 @@ Error GenericDeviceTy::syncEvent(void *EventPtr) {
bool GenericDeviceTy::useAutoZeroCopy() { return useAutoZeroCopyImpl(); }
-bool GenericDeviceTy::isAccessiblePtr(const void *Ptr, size_t Size) {
+Expected<bool> GenericDeviceTy::isAccessiblePtr(const void *Ptr, size_t Size) {
return isAccessiblePtrImpl(Ptr, Size);
}
@@ -2153,7 +2153,17 @@ int32_t GenericPluginTy::use_auto_zero_copy(int32_t DeviceId) {
int32_t GenericPluginTy::is_accessible_ptr(int32_t DeviceId, const void *Ptr,
size_t Size) {
- return getDevice(DeviceId).isAccessiblePtr(Ptr, Size);
+ auto HandleError = [&](Error Err) -> bool {
+ [[maybe_unused]] std::string ErrStr = toString(std::move(Err));
+ DP("Failure while checking accessibility of pointer %p for device %d: %s", Ptr, DeviceId, ErrStr.c_str());
+ return false;
+ };
+
+ auto AccessibleOrErr = getDevice(DeviceId).isAccessiblePtr(Ptr, Size);
+ if (Error Err = AccessibleOrErr.takeError())
+ return HandleError(std::move(Err));
+
+ return *AccessibleOrErr;
}
int32_t GenericPluginTy::get_global(__tgt_device_binary Binary, uint64_t Size,
diff --git a/offload/test/mapping/is_accessible.cpp b/offload/test/mapping/is_accessible.cpp
index 6d6a0048e01f3..7fb23893408ea 100644
--- a/offload/test/mapping/is_accessible.cpp
+++ b/offload/test/mapping/is_accessible.cpp
@@ -7,7 +7,7 @@
// RUN: | %fcheck-generic -check-prefix=NO_USM
// REQUIRES: unified_shared_memory
-// REQUIRES: amdgpu
+// XFAIL: nvptx
// CHECK: SUCCESS
// NO_USM: Not accessible
More information about the cfe-commits
mailing list