[Beignet] [PATCH 18/19] OCL20: add device enqueue test case.

Yang Rong rong.r.yang at intel.com
Mon Nov 28 11:32:44 UTC 2016


Signed-off-by: Yang Rong <rong.r.yang at intel.com>
Reviewed-by: Pan Xiuli <xiuli.pan at intel.com>
---
 kernels/compiler_device_enqueue.cl | 18 ++++++++++++++++++
 utests/CMakeLists.txt              |  3 ++-
 utests/compiler_device_enqueue.cpp | 36 ++++++++++++++++++++++++++++++++++++
 3 files changed, 56 insertions(+), 1 deletion(-)
 create mode 100644 kernels/compiler_device_enqueue.cl
 create mode 100644 utests/compiler_device_enqueue.cpp

diff --git a/kernels/compiler_device_enqueue.cl b/kernels/compiler_device_enqueue.cl
new file mode 100644
index 0000000..cb20142
--- /dev/null
+++ b/kernels/compiler_device_enqueue.cl
@@ -0,0 +1,18 @@
+void block_fn(__global uint* val)
+{
+  atomic_add(val, (uint)get_global_id(0));  // atomically add this work-item's global id to *val
+}
+
+kernel void compiler_device_enqueue(uint glob_size_arr, __global uint* val)
+{
+  // Per work-item: enqueue glob_size_arr child launches that all run block_fn on val[gid].
+  const size_t gid = get_global_id(0);
+  for(int launch = 0; launch < glob_size_arr; launch++)
+  {
+    queue_t queue = get_default_queue();
+    ndrange_t range = ndrange_1D(glob_size_arr);
+    __global uint * slot = val + gid;
+    void (^child)(void) = ^{ block_fn(slot); };
+    enqueue_kernel(queue, CLK_ENQUEUE_FLAGS_WAIT_KERNEL, range, child);
+  }
+}
diff --git a/utests/CMakeLists.txt b/utests/CMakeLists.txt
index 0ca7f77..969b695 100644
--- a/utests/CMakeLists.txt
+++ b/utests/CMakeLists.txt
@@ -306,7 +306,8 @@ if (ENABLE_OPENCL_20)
       compiler_sampler.cpp
       compiler_generic_pointer.cpp
       runtime_pipe_query.cpp
-      compiler_pipe_builtin.cpp)
+      compiler_pipe_builtin.cpp
+      compiler_device_enqueue.cpp)
 endif (ENABLE_OPENCL_20)
 
 if (NOT_BUILD_STAND_ALONE_UTEST)
diff --git a/utests/compiler_device_enqueue.cpp b/utests/compiler_device_enqueue.cpp
new file mode 100644
index 0000000..a9e3e2d
--- /dev/null
+++ b/utests/compiler_device_enqueue.cpp
@@ -0,0 +1,36 @@
+#include "utest_helper.hpp"
+
+// Host side of the device-enqueue utest: runs the kernel over n work-items, then checks all n slots of buf[0].
+void compiler_device_enqueue(void)
+{
+  const size_t n = 32;
+  const uint32_t global_sz = 3;
+  uint32_t result = 0;
+
+  // Setup kernel and buffers
+  OCL_CREATE_KERNEL("compiler_device_enqueue");
+  OCL_CREATE_BUFFER(buf[0], 0, n * sizeof(uint32_t), NULL);
+  OCL_SET_ARG(0, sizeof(uint32_t), &global_sz);
+  OCL_SET_ARG(1, sizeof(cl_mem), &buf[0]);
+
+  OCL_MAP_BUFFER(0);
+  for(uint32_t i = 0; i < n; ++i)
+    ((uint32_t *)buf_data[0])[i] = 0;  // clear exactly the n uint32_t slots the buffer holds
+  OCL_UNMAP_BUFFER(0);
+
+  // Run the kernel
+  globals[0] = n;
+  locals[0] = 16;
+  OCL_NDRANGE(1);
+
+  // Expected slot value: global_sz child launches, each adding the ids 0 .. global_sz-1.
+  for(uint32_t i = 0; i < global_sz; ++i) { result += i; }
+  result *= global_sz;
+
+  OCL_MAP_BUFFER(0);
+  for (uint32_t i = 0; i < n; ++i)
+    OCL_ASSERT(((uint32_t *)buf_data[0])[i] == result);
+  OCL_UNMAP_BUFFER(0);
+}
+
+MAKE_UTEST_FROM_FUNCTION(compiler_device_enqueue);  // NOTE(review): presumably registers the test with the utest runner - confirm against the macro definition
-- 
2.1.4



More information about the Beignet mailing list