[Beignet] [PATCH 2/2] add utest for __gen_ocl_simd_shuffle and __gen_ocl_get_simd_size/id
Guo Yejun
yejun.guo at intel.com
Thu Mar 19 22:58:47 PDT 2015
Signed-off-by: Guo Yejun <yejun.guo at intel.com>
---
kernels/compiler_simd_shuffle.cl | 15 ++++++++++++++
utests/CMakeLists.txt | 1 +
utests/compiler_simd_shuffle.cpp | 44 ++++++++++++++++++++++++++++++++++++++++
3 files changed, 60 insertions(+)
create mode 100644 kernels/compiler_simd_shuffle.cl
create mode 100644 utests/compiler_simd_shuffle.cpp
diff --git a/kernels/compiler_simd_shuffle.cl b/kernels/compiler_simd_shuffle.cl
new file mode 100644
index 0000000..50588de
--- /dev/null
+++ b/kernels/compiler_simd_shuffle.cl
@@ -0,0 +1,15 @@
+__kernel void compiler_simd_shuffle(global int *dst, int c) // dst layout: [simd size][3 ints per work-item]; c is the lane index for the first shuffle
+{
+ int i = get_global_id(0);
+ if (i == 0) // only work-item 0 records the SIMD size
+ dst[0] = __gen_ocl_get_simd_size();
+ dst++; // step past the SIMD-size slot; per-work-item triples start here
+
+ int from = i; // value each work-item contributes to the shuffles: its own global id
+ int o0 = __gen_ocl_get_simd_id(); // host test expects this to equal i % simd size
+ int o1 = __gen_ocl_simd_shuffle(from, c); // lane index comes from the kernel argument
+ int o2 = __gen_ocl_simd_shuffle(from, 5); // lane index is the literal 5
+ dst[i*3] = o0; // triple for work-item i: simd id, shuffle by c, shuffle by 5
+ dst[i*3+1] = o1;
+ dst[i*3+2] = o2;
+}
diff --git a/utests/CMakeLists.txt b/utests/CMakeLists.txt
index 06baa68..858df13 100644
--- a/utests/CMakeLists.txt
+++ b/utests/CMakeLists.txt
@@ -189,6 +189,7 @@ set (utests_sources
compiler_getelementptr_bitcast.cpp
compiler_simd_any.cpp
compiler_simd_all.cpp
+ compiler_simd_shuffle.cpp
compiler_time_stamp.cpp
compiler_double_precision.cpp
load_program_from_gen_bin.cpp
diff --git a/utests/compiler_simd_shuffle.cpp b/utests/compiler_simd_shuffle.cpp
new file mode 100644
index 0000000..63b9d21
--- /dev/null
+++ b/utests/compiler_simd_shuffle.cpp
@@ -0,0 +1,44 @@
+#include "utest_helper.hpp"
+
+void compiler_simd_shuffle(void) // runs the compiler_simd_shuffle kernel and checks SIMD id and shuffle results per work-item
+{
+ const size_t n = 32; // number of work-items launched (becomes globals[0])
+ const int32_t buf_size = 3 * n + 1; // one slot for the SIMD size plus three ints per work-item
+
+ // Setup kernel and buffers
+ OCL_CREATE_KERNEL("compiler_simd_shuffle");
+ OCL_CREATE_BUFFER(buf[0], 0, buf_size * sizeof(int), NULL);
+ OCL_SET_ARG(0, sizeof(cl_mem), &buf[0]);
+
+ int c = 3; // lane index handed to the kernel's first shuffle
+ OCL_SET_ARG(1, sizeof(int), &c);
+
+ globals[0] = n;
+ locals[0] = 16;
+
+ OCL_MAP_BUFFER(0);
+ for (int32_t i = 0; i < buf_size; ++i)
+ ((int*)buf_data[0])[i] = -1; // -1 is a value none of the checks below accept
+ OCL_UNMAP_BUFFER(0);
+
+ // Run the kernel on GPU
+ OCL_NDRANGE(1);
+
+ // Compare
+ OCL_MAP_BUFFER(0);
+ int* dst = (int *)buf_data[0];
+ int simdsize = dst[0]; // the kernel stores the SIMD size in slot 0
+ OCL_ASSERT(simdsize == 8 || simdsize == 16); // only these two SIMD sizes are accepted
+
+ dst++; // step past the SIMD-size slot, mirroring the kernel
+ for (int32_t i = 0; i < (int32_t) n; ++i){
+ int round = i / simdsize; // which simdsize-wide run of work-items i falls in
+ int index = i % simdsize; // expected SIMD id of work-item i
+ OCL_ASSERT(index == dst[3*i]);
+ OCL_ASSERT((round * simdsize + c) == dst[3*i+1]); // shuffle by c must yield the global id at lane c of the same run
+ OCL_ASSERT((round * simdsize + 5) == dst[3*i+2]); // same check for the kernel's literal lane 5
+ }
+ OCL_UNMAP_BUFFER(0);
+}
+
+MAKE_UTEST_FROM_FUNCTION(compiler_simd_shuffle);
--
1.9.1
More information about the Beignet mailing list