[Openmp-commits] [openmp] [OpenMP] Add interface for flushing with memory order and scope (PR #133325)
Hansang Bae via Openmp-commits
openmp-commits at lists.llvm.org
Thu Mar 27 14:46:47 PDT 2025
https://github.com/hansangbae created https://github.com/llvm/llvm-project/pull/133325
Current specification allows user input to the flush construct via
clauses for memory order and scope.
>From 7bcdea6fe418cd804c1e017065ce5bc34365d919 Mon Sep 17 00:00:00 2001
From: Hansang Bae <hansang.bae at intel.com>
Date: Thu, 27 Mar 2025 15:00:52 -0500
Subject: [PATCH] [OpenMP] Add interface for flushing with memory order and
scope
Current specification allows user input to the flush construct via
clauses for memory order and scope.
---
openmp/runtime/src/dllexports | 1 +
openmp/runtime/src/kmp.h | 2 +
openmp/runtime/src/kmp_csupport.cpp | 33 +++++++++++
.../test/flush/omp_flush_acquire_release.c | 58 +++++++++++++++++++
4 files changed, 94 insertions(+)
create mode 100644 openmp/runtime/test/flush/omp_flush_acquire_release.c
diff --git a/openmp/runtime/src/dllexports b/openmp/runtime/src/dllexports
index 0667d53c35a18..fae1a381ee7ec 100644
--- a/openmp/runtime/src/dllexports
+++ b/openmp/runtime/src/dllexports
@@ -221,6 +221,7 @@
# __kmpc_end_taskq 128
# __kmpc_end_taskq_task 129
__kmpc_flush 130
+ __kmpc_flush_explicit
__kmpc_for_static_fini 135
__kmpc_for_static_init_4 136
__kmpc_for_static_init_8 137
diff --git a/openmp/runtime/src/kmp.h b/openmp/runtime/src/kmp.h
index 3d34513491154..6d48f9faafca8 100644
--- a/openmp/runtime/src/kmp.h
+++ b/openmp/runtime/src/kmp.h
@@ -4204,6 +4204,8 @@ KMP_EXPORT void __kmpc_serialized_parallel(ident_t *, kmp_int32 global_tid);
KMP_EXPORT void __kmpc_end_serialized_parallel(ident_t *, kmp_int32 global_tid);
KMP_EXPORT void __kmpc_flush(ident_t *);
+KMP_EXPORT void __kmpc_flush_explicit(ident_t *, kmp_int32 order,
+ kmp_int32 scope);
KMP_EXPORT void __kmpc_barrier(ident_t *, kmp_int32 global_tid);
KMP_EXPORT kmp_int32 __kmpc_master(ident_t *, kmp_int32 global_tid);
KMP_EXPORT void __kmpc_end_master(ident_t *, kmp_int32 global_tid);
diff --git a/openmp/runtime/src/kmp_csupport.cpp b/openmp/runtime/src/kmp_csupport.cpp
index fdbf9ff45e354..d505f4f18405b 100644
--- a/openmp/runtime/src/kmp_csupport.cpp
+++ b/openmp/runtime/src/kmp_csupport.cpp
@@ -801,6 +801,39 @@ void __kmpc_flush(ident_t *loc) {
#endif
}
+/*!
+ at ingroup SYNCHRONIZATION
+ at param loc source location information.
+ at param order memory order input from user.
+ at param scope memory scope input from user.
+Perform memory fence with explicit memory semantics.
+*/
+void __kmpc_flush_explicit(ident_t *loc, kmp_int32 order, kmp_int32 scope) {
+ // `scope` is not used on the initial device.
+ switch (order) {
+ case std::memory_order_relaxed:
+ [[fallthrough]];
+ case std::memory_order_acquire:
+ [[fallthrough]];
+ case std::memory_order_release:
+ [[fallthrough]];
+ case std::memory_order_acq_rel:
+ [[fallthrough]];
+ case std::memory_order_seq_cst:
+ std::atomic_thread_fence(static_cast<std::memory_order>(order));
+ break;
+ default:
+ KMP_BUILTIN_UNREACHABLE;
+ }
+
+#if OMPT_SUPPORT && OMPT_OPTIONAL
+ if (ompt_enabled.ompt_callback_flush) {
+ ompt_callbacks.ompt_callback(ompt_callback_flush)(
+ __ompt_get_thread_data_internal(), OMPT_GET_RETURN_ADDRESS(0));
+ }
+#endif
+}
+
/* -------------------------------------------------------------------------- */
/*!
@ingroup SYNCHRONIZATION
diff --git a/openmp/runtime/test/flush/omp_flush_acquire_release.c b/openmp/runtime/test/flush/omp_flush_acquire_release.c
new file mode 100644
index 0000000000000..b3dd42d888e92
--- /dev/null
+++ b/openmp/runtime/test/flush/omp_flush_acquire_release.c
@@ -0,0 +1,58 @@
+// RUN: %libomp-compile-and-run
+// REQUIRES: clang
+
+// Test is based on OpenMP API Example (omp_5.0) acquire_release3.c
+// https://github.com/OpenMP/Examples/blob/main/synchronization/sources/acquire_release.3.c
+
+#include <stdio.h>
+#include <omp.h>
+
+typedef void ident_t;
+extern void __kmpc_flush_explicit(ident_t *, int order, int scope);
+
+int test_memorder(int write_order, int read_order) {
+ int x = 0, y = 0;
+ int num_fails = 0;
+#pragma omp parallel num_threads(2)
+ {
+ int thrd = omp_get_thread_num();
+ if (thrd == 0) {
+ x = 10;
+ __kmpc_flush_explicit(NULL, write_order, 0);
+#pragma omp atomic write // or with relaxed clause
+ y = 1;
+ } else {
+ int tmp = 0;
+ while (tmp == 0) {
+#pragma omp atomic read // or with relaxed clause
+ tmp = y;
+ }
+ __kmpc_flush_explicit(NULL, read_order, 0);
+ // printf("x = %d\n", x); // always "x = 10"
+ if (x != 10)
+ num_fails++;
+ }
+ }
+ return num_fails;
+}
+
+int main() {
+ // Clang-based compiler has predefined macro __ATOMIC_<memory_order>.
+ int write_order[3] = {__ATOMIC_SEQ_CST, __ATOMIC_ACQ_REL, __ATOMIC_RELEASE};
+ int read_order[3] = {__ATOMIC_SEQ_CST, __ATOMIC_ACQ_REL, __ATOMIC_ACQUIRE};
+
+ // Repeat 1000 times
+ for (int n = 0; n < 1000; n++) {
+ for (int i = 0; i < 3; i++) {
+ for (int j = 0; j < 3; j++) {
+ if (test_memorder(write_order[i], read_order[j])) {
+ printf("failed\n");
+ exit(EXIT_FAILURE);
+ }
+ }
+ }
+ }
+
+ printf("passed\n");
+ return EXIT_SUCCESS;
+}
More information about the Openmp-commits
mailing list