[libclc] r219007 - Implement async_work_group_strided_copy builtin v2

Tom Stellard thomas.stellard at amd.com
Fri Oct 3 12:49:38 PDT 2014


Author: tstellar
Date: Fri Oct  3 14:49:37 2014
New Revision: 219007

URL: http://llvm.org/viewvc/llvm-project?rev=219007&view=rev
Log:
Implement async_work_group_strided_copy builtin v2

This is a simple implementation which just copies data synchronously.

v2:
  - Use size_t.

Added:
    libclc/trunk/generic/include/clc/async/async_work_group_strided_copy.h
    libclc/trunk/generic/include/clc/async/async_work_group_strided_copy.inc
    libclc/trunk/generic/lib/async/async_work_group_strided_copy.cl
    libclc/trunk/generic/lib/async/async_work_group_strided_copy.inc
Modified:
    libclc/trunk/generic/include/clc/clc.h
    libclc/trunk/generic/lib/SOURCES

Added: libclc/trunk/generic/include/clc/async/async_work_group_strided_copy.h
URL: http://llvm.org/viewvc/llvm-project/libclc/trunk/generic/include/clc/async/async_work_group_strided_copy.h?rev=219007&view=auto
==============================================================================
--- libclc/trunk/generic/include/clc/async/async_work_group_strided_copy.h (added)
+++ libclc/trunk/generic/include/clc/async/async_work_group_strided_copy.h Fri Oct  3 14:49:37 2014
@@ -0,0 +1,15 @@
+#define __CLC_DST_ADDR_SPACE local  /* pass 1: destination is local */
+#define __CLC_SRC_ADDR_SPACE global /* pass 1: source is global */
+#define __CLC_BODY <clc/async/async_work_group_strided_copy.inc>
+#include <clc/async/gentype.inc>
+#undef __CLC_DST_ADDR_SPACE
+#undef __CLC_SRC_ADDR_SPACE
+#undef __CLC_BODY
+/* Pass 2: the same body again with the two address spaces swapped. */
+#define __CLC_DST_ADDR_SPACE global
+#define __CLC_SRC_ADDR_SPACE local
+#define __CLC_BODY <clc/async/async_work_group_strided_copy.inc>
+#include <clc/async/gentype.inc>
+#undef __CLC_DST_ADDR_SPACE
+#undef __CLC_SRC_ADDR_SPACE
+#undef __CLC_BODY

Added: libclc/trunk/generic/include/clc/async/async_work_group_strided_copy.inc
URL: http://llvm.org/viewvc/llvm-project/libclc/trunk/generic/include/clc/async/async_work_group_strided_copy.inc?rev=219007&view=auto
==============================================================================
--- libclc/trunk/generic/include/clc/async/async_work_group_strided_copy.inc (added)
+++ libclc/trunk/generic/include/clc/async/async_work_group_strided_copy.inc Fri Oct  3 14:49:37 2014
@@ -0,0 +1,6 @@
+/* Prototype; address spaces come from __CLC_{DST,SRC}_ADDR_SPACE. */
+_CLC_OVERLOAD _CLC_DECL event_t async_work_group_strided_copy(
+    __CLC_DST_ADDR_SPACE __CLC_GENTYPE *dst,
+    const __CLC_SRC_ADDR_SPACE __CLC_GENTYPE *src,
+    size_t num_gentypes, size_t stride,
+    event_t event);

Modified: libclc/trunk/generic/include/clc/clc.h
URL: http://llvm.org/viewvc/llvm-project/libclc/trunk/generic/include/clc/clc.h?rev=219007&r1=219006&r2=219007&view=diff
==============================================================================
--- libclc/trunk/generic/include/clc/clc.h (original)
+++ libclc/trunk/generic/include/clc/clc.h Fri Oct  3 14:49:37 2014
@@ -137,6 +137,7 @@
 #include <clc/synchronization/barrier.h>
 
 /* 6.11.10 Async Copy and Prefetch Functions */
+#include <clc/async/async_work_group_strided_copy.h>
 #include <clc/async/prefetch.h>
 #include <clc/async/wait_group_events.h>
 

Modified: libclc/trunk/generic/lib/SOURCES
URL: http://llvm.org/viewvc/llvm-project/libclc/trunk/generic/lib/SOURCES?rev=219007&r1=219006&r2=219007&view=diff
==============================================================================
--- libclc/trunk/generic/lib/SOURCES (original)
+++ libclc/trunk/generic/lib/SOURCES Fri Oct  3 14:49:37 2014
@@ -1,3 +1,4 @@
+async/async_work_group_strided_copy.cl
 async/prefetch.cl
 async/wait_group_events.cl
 atomic/atomic_xchg.cl

Added: libclc/trunk/generic/lib/async/async_work_group_strided_copy.cl
URL: http://llvm.org/viewvc/llvm-project/libclc/trunk/generic/lib/async/async_work_group_strided_copy.cl?rev=219007&view=auto
==============================================================================
--- libclc/trunk/generic/lib/async/async_work_group_strided_copy.cl (added)
+++ libclc/trunk/generic/lib/async/async_work_group_strided_copy.cl Fri Oct  3 14:49:37 2014
@@ -0,0 +1,9 @@
+#include <clc/clc.h>
+/* Turn on cl_khr_fp64 when the compiler defines that macro. */
+#ifdef cl_khr_fp64
+#pragma OPENCL EXTENSION cl_khr_fp64 : enable
+#endif
+/* gentype.inc (not shown) presumably includes __CLC_BODY per type -- TODO. */
+#define __CLC_BODY <async_work_group_strided_copy.inc>
+#include <clc/async/gentype.inc>
+#undef __CLC_BODY

Added: libclc/trunk/generic/lib/async/async_work_group_strided_copy.inc
URL: http://llvm.org/viewvc/llvm-project/libclc/trunk/generic/lib/async/async_work_group_strided_copy.inc?rev=219007&view=auto
==============================================================================
--- libclc/trunk/generic/lib/async/async_work_group_strided_copy.inc (added)
+++ libclc/trunk/generic/lib/async/async_work_group_strided_copy.inc Fri Oct  3 14:49:37 2014
@@ -0,0 +1,34 @@
+
+#define STRIDED_COPY(dst, src, num_gentypes, dst_stride, src_stride)       \
+  size_t size = get_local_size(0) * get_local_size(1) * get_local_size(2); \
+  size_t id = (get_local_size(1) * get_local_size(2) * get_local_id(0)) +  \
+              (get_local_size(2) * get_local_id(1)) +                      \
+              get_local_id(2);                                             \
+  size_t i;                                                                \
+                                                                           \
+  for (i = id; i < num_gentypes; i += size) {                              \
+    dst[i * dst_stride] = src[i * src_stride];                             \
+  }
+
+
+/* Global -> local: src is read every src_stride elements, dst is packed. */
+_CLC_OVERLOAD _CLC_DEF event_t async_work_group_strided_copy(
+    local __CLC_GENTYPE *dst, const global __CLC_GENTYPE *src,
+    size_t num_gentypes, size_t src_stride, event_t event) {
+  /* A dst stride of 1 writes consecutive elements of dst. */
+  STRIDED_COPY(dst, src, num_gentypes, 1, src_stride);
+
+  /* No new event is created; the caller's event is handed straight back. */
+  return event;
+}
+
+/* Local -> global: src is packed, dst is written with stride dst_stride. */
+_CLC_OVERLOAD _CLC_DEF event_t async_work_group_strided_copy(
+    global __CLC_GENTYPE *dst, const local __CLC_GENTYPE *src,
+    size_t num_gentypes, size_t dst_stride, event_t event) {
+  /* A src stride of 1 reads consecutive elements of src. */
+  STRIDED_COPY(dst, src, num_gentypes, dst_stride, 1);
+
+  /* No new event is created; the caller's event is handed straight back. */
+  return event;
+}





More information about the cfe-commits mailing list