[Beignet] [PATCH] Temporarily change the global barrier test to check whether the local barrier needs a fence.

Yang Rong rong.r.yang at intel.com
Mon Jun 17 20:24:12 PDT 2013


Signed-off-by: Yang Rong <rong.r.yang at intel.com>
---
 kernels/compiler_global_memory_barrier.cl |    4 ++--
 utests/compiler_global_memory_barrier.cpp |    9 +++++----
 2 files changed, 7 insertions(+), 6 deletions(-)

diff --git a/kernels/compiler_global_memory_barrier.cl b/kernels/compiler_global_memory_barrier.cl
index 99bb940..705517d 100644
--- a/kernels/compiler_global_memory_barrier.cl
+++ b/kernels/compiler_global_memory_barrier.cl
@@ -1,7 +1,7 @@
-__kernel void compiler_global_memory_barrier(__global int *dst, __global int *src) {
+__kernel void compiler_global_memory_barrier(__global int *dst, __local int *src) {
   src[get_local_size(0) * (2 * get_group_id(0)) + get_local_id(0)] = get_local_id(0);
   src[get_local_size(0) * (2 * get_group_id(0) + 1) + get_local_id(0)] = get_local_id(0);
-  barrier(CLK_GLOBAL_MEM_FENCE);
+  barrier(CLK_LOCAL_MEM_FENCE);
   dst[get_local_size(0) * (2 * get_group_id(0)) + get_local_id(0)] = src[get_local_size(0) * 2 * get_group_id(0) + get_local_size(0) - (get_local_id(0) + 1)];
   dst[get_local_size(0) * (2 * get_group_id(0) + 1) + get_local_id(0)] = src[get_local_size(0) * (2 * get_group_id(0) + 1) + get_local_size(0) - (get_local_id(0) + 1)];
 }
diff --git a/utests/compiler_global_memory_barrier.cpp b/utests/compiler_global_memory_barrier.cpp
index a6496a7..311d093 100644
--- a/utests/compiler_global_memory_barrier.cpp
+++ b/utests/compiler_global_memory_barrier.cpp
@@ -4,16 +4,17 @@ static void compiler_global_memory_barrier(void)
 {
   const size_t n = 16*1024;
 
+  globals[0] = n/2;
+  locals[0] = 32;
+
   // Setup kernel and buffers
   OCL_CREATE_KERNEL("compiler_global_memory_barrier");
   OCL_CREATE_BUFFER(buf[0], 0, n * sizeof(uint32_t), NULL);
-  OCL_CREATE_BUFFER(buf[1], 0, n * sizeof(uint32_t), NULL);
+  //OCL_CREATE_BUFFER(buf[1], 0, n * sizeof(uint32_t), NULL);
   OCL_SET_ARG(0, sizeof(cl_mem), &buf[0]);
-  OCL_SET_ARG(1, sizeof(cl_mem), &buf[1]);
+  OCL_SET_ARG(1, locals[0] * 2 * sizeof(uint32_t), NULL);
 
   // Run the kernel
-  globals[0] = n/2;
-  locals[0] = 32;
   OCL_NDRANGE(1);
   OCL_MAP_BUFFER(0);
 
-- 
1.7.10.4



More information about the Beignet mailing list