[Openmp-commits] [PATCH] D62398: [OPENMP][NVPTX]Perform memory flush if number of threads to sync is 1 or less.
Alexey Bataev via Phabricator via Openmp-commits
openmp-commits at lists.llvm.org
Fri May 24 08:28:25 PDT 2019
ABataev created this revision.
ABataev added reviewers: grokos, gtbercea, kkwli0.
Herald added subscribers: jdoerfert, guansong.
Herald added a project: OpenMP.
According to the OpenMP standard, barrier operation must perform
implicit flush operation. Currently, if there is only one thread in the
team, barrier does not flush the memory. Patch fixes this problem.
Repository:
rOMP OpenMP
https://reviews.llvm.org/D62398
Files:
libomptarget/deviceRTLs/nvptx/src/sync.cu
libomptarget/deviceRTLs/nvptx/test/parallel/barrier.c
Index: libomptarget/deviceRTLs/nvptx/test/parallel/barrier.c
===================================================================
--- /dev/null
+++ libomptarget/deviceRTLs/nvptx/test/parallel/barrier.c
@@ -0,0 +1,34 @@
+// RUN: %compile-run-and-check
+
+#include <omp.h>
+#include <stdio.h>
+
+int main(int argc, char *argv[]) {
+ int data, flag = 0;
+#pragma omp target teams num_teams(2) map(to : data, flag) thread_limit(1)
+#pragma omp parallel num_threads(1)
+ {
+ if (omp_get_team_num() == 0) {
+ /* Write to the data buffer that will be read by thread */
+ data = 42;
+/* Flush data to thread 1 and strictly order the write to data
+ relative to the write to the flag */
+#pragma omp barrier
+ /* Set flag to release thread 1 */
+ flag = 1;
+/* Flush flag to ensure that thread 1 sees S-21 the change */
+#pragma omp barrier
+ } else if (omp_get_team_num() == 1) {
+/* Loop until we see the update to the flag */
+#pragma omp barrier
+ while (flag < 1) {
+#pragma omp barrier
+ }
+#pragma omp barrier
+ // CHECK: data=42.
+ /* Values data will be 42, value of flag still undefined */
+ printf("data=%d.\n", data);
+ }
+ }
+ return 0;
+}
Index: libomptarget/deviceRTLs/nvptx/src/sync.cu
===================================================================
--- libomptarget/deviceRTLs/nvptx/src/sync.cu
+++ libomptarget/deviceRTLs/nvptx/src/sync.cu
@@ -62,6 +62,9 @@
// Barrier #1 is for synchronization among active threads.
named_sync(L1_BARRIER, threads);
}
+ } else {
+ // Still need to flush the memory per the standard.
+ __kmpc_flush(loc_ref);
} // numberOfActiveOMPThreads > 1
PRINT0(LD_SYNC, "completed kmpc_barrier\n");
}
-------------- next part --------------
A non-text attachment was scrubbed...
Name: D62398.201258.patch
Type: text/x-patch
Size: 1746 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/openmp-commits/attachments/20190524/a7c25b76/attachment-0001.bin>
More information about the Openmp-commits
mailing list