[Beignet] [PATCH 3/9] [OCL20] utest: add generic atomic test.
xionghu.luo at intel.com
xionghu.luo at intel.com
Wed Feb 24 15:09:39 UTC 2016
From: Luo Xionghu <xionghu.luo at intel.com>
only dword is supported so far.
Signed-off-by: Luo Xionghu <xionghu.luo at intel.com>
---
kernels/compiler_generic_atomic.cl | 32 +++++++++++++++++++++++++++
utests/CMakeLists.txt | 1 +
utests/compiler_generic_atomic.cpp | 45 ++++++++++++++++++++++++++++++++++++++
3 files changed, 78 insertions(+)
create mode 100644 kernels/compiler_generic_atomic.cl
create mode 100644 utests/compiler_generic_atomic.cpp
diff --git a/kernels/compiler_generic_atomic.cl b/kernels/compiler_generic_atomic.cl
new file mode 100644
index 0000000..63947ec
--- /dev/null
+++ b/kernels/compiler_generic_atomic.cl
@@ -0,0 +1,32 @@
+#define GENERIC_KERNEL(T) \
+kernel void compiler_generic_atomic_##T(global T *src, global T *dst) \
+{ \
+ size_t gid = get_global_id(0); \
+ size_t lid = get_local_id(0); \
+ private T pdata[16]; \
+ local T ldata[16]; \
+ generic T * p1 = &pdata[lid]; \
+ generic T * p2 = &ldata[lid]; \
+ generic T *p = (gid & 1) ? p1 : p2; \
+ /* below expression is not supported by clang now */ \
+ /* generic T *p = (gid & 1) ? p1 : (T *)&ldata[lid]; */ \
+ *p = src[gid]; \
+ /* fill other data */ \
+ if(gid&1) { \
+ ldata[lid] = 20; \
+ } else { \
+ for (int i = 0; i < 16; i++) { \
+ pdata[i] = src[lid];; \
+ } \
+ } \
+ barrier(CLK_LOCAL_MEM_FENCE); \
+ \
+ generic T * q1 = &pdata[lid]; \
+ generic T * q2 = &ldata[lid]; \
+ generic T *q = (gid & 1) ? q1 : q2; \
+ dst[gid] = atomic_add(q , pdata[lid]); \
+}
+
+GENERIC_KERNEL(int)
+//GENERIC_KERNEL(long)
+
diff --git a/utests/CMakeLists.txt b/utests/CMakeLists.txt
index d1443aa..84f8fff 100644
--- a/utests/CMakeLists.txt
+++ b/utests/CMakeLists.txt
@@ -79,6 +79,7 @@ set (utests_sources
compiler_global_constant_2.cpp
compiler_group_size.cpp
compiler_generic_pointer.cpp
+ compiler_generic_atomic.cpp
compiler_hadd.cpp
compiler_if_else.cpp
compiler_integer_division.cpp
diff --git a/utests/compiler_generic_atomic.cpp b/utests/compiler_generic_atomic.cpp
new file mode 100644
index 0000000..9ed5f53
--- /dev/null
+++ b/utests/compiler_generic_atomic.cpp
@@ -0,0 +1,45 @@
+#include "utest_helper.hpp"
+
+template<typename T>
+void test_atomic(const char* kernelName)
+{
+ const int n = 16;
+ T cpu_src[16];
+
+ // Setup kernel and buffers
+ OCL_CALL(cl_kernel_init, "compiler_generic_atomic.cl", kernelName, SOURCE, "-cl-std=CL2.0");
+ OCL_CREATE_BUFFER(buf[0], 0, n * sizeof(T), NULL);
+ OCL_CREATE_BUFFER(buf[1], 0, n * sizeof(T), NULL);
+ OCL_SET_ARG(0, sizeof(cl_mem), &buf[0]);
+ OCL_SET_ARG(1, sizeof(cl_mem), &buf[1]);
+ globals[0] = 16;
+ locals[0] = 16;
+
+ OCL_MAP_BUFFER(0);
+ for (int i = 0; i < n; ++i)
+ cpu_src[i] = ((T*)buf_data[0])[i] = (T)i;
+ OCL_UNMAP_BUFFER(0);
+
+ // Run the kernel on GPU
+ OCL_NDRANGE(1);
+
+ // Compare
+ OCL_MAP_BUFFER(1);
+ for (int32_t i = 0; i < n; ++i) {
+// printf("i=%d dst=%d\n", i, ((T*)buf_data[1])[i]);
+ OCL_ASSERT(((T*)buf_data[1])[i] == 2 * cpu_src[i]);
+ }
+ OCL_UNMAP_BUFFER(1);
+}
+
+#define GENERIC_ATOMIC_TEST(T) \
+void compiler_generic_atomic_##T() { \
+ test_atomic<T>("compiler_generic_atomic_"#T); \
+} \
+MAKE_UTEST_FROM_FUNCTION(compiler_generic_atomic_##T);
+
+GENERIC_ATOMIC_TEST(int)
+//GENERIC_TEST(long)
+
+
+
--
2.1.4
More information about the Beignet
mailing list