[Beignet] [PATCH OCL20 06/11] Runtime: Add support of OCL2.0 device queries

Xiuli Pan xiuli.pan at intel.com
Wed Mar 2 03:01:59 UTC 2016


From: Pan Xiuli <xiuli.pan at intel.com>

Add device queries for OpenCL 2.0

Signed-off-by: Pan Xiuli <xiuli.pan at intel.com>
---
 src/cl_device_id.c | 14 +++++++++++++-
 src/cl_device_id.h | 16 ++++++++++++++--
 src/cl_gt_device.h | 14 +++++++++++++-
 3 files changed, 40 insertions(+), 4 deletions(-)

diff --git a/src/cl_device_id.c b/src/cl_device_id.c
index 99320be..9017769 100644
--- a/src/cl_device_id.c
+++ b/src/cl_device_id.c
@@ -786,6 +786,7 @@ cl_get_device_info(cl_device_id     device,
     DECL_FIELD(IMAGE_SUPPORT, image_support)
     DECL_FIELD(MAX_READ_IMAGE_ARGS, max_read_image_args)
     DECL_FIELD(MAX_WRITE_IMAGE_ARGS, max_write_image_args)
+    DECL_FIELD(MAX_READ_WRITE_IMAGE_ARGS, max_read_write_image_args)
     DECL_FIELD(IMAGE_MAX_ARRAY_SIZE, image_max_array_size)
     DECL_FIELD(IMAGE2D_MAX_WIDTH, image2d_max_width)
     DECL_FIELD(IMAGE2D_MAX_HEIGHT, image2d_max_height)
@@ -806,6 +807,8 @@ cl_get_device_info(cl_device_id     device,
     DECL_FIELD(MAX_CONSTANT_BUFFER_SIZE, max_constant_buffer_size)
     DECL_FIELD(IMAGE_MAX_BUFFER_SIZE, image_mem_size)
     DECL_FIELD(MAX_CONSTANT_ARGS, max_constant_args)
+    DECL_FIELD(MAX_GLOBAL_VARIABLE_SIZE, max_global_variable_size)
+    DECL_FIELD(GLOBAL_VARIABLE_PREFERRED_TOTAL_SIZE, global_variable_preferred_total_size)
     DECL_FIELD(LOCAL_MEM_TYPE, local_mem_type)
     DECL_FIELD(LOCAL_MEM_SIZE, local_mem_size)
     DECL_FIELD(ERROR_CORRECTION_SUPPORT, error_correction_support)
@@ -817,6 +820,12 @@ cl_get_device_info(cl_device_id     device,
     DECL_FIELD(LINKER_AVAILABLE, linker_available)
     DECL_FIELD(EXECUTION_CAPABILITIES, execution_capabilities)
     DECL_FIELD(QUEUE_PROPERTIES, queue_properties)
+    //DECL_FIELD(QUEUE_ON_HOST_PROPERTIES, queue_on_host_properties)
+    DECL_FIELD(QUEUE_ON_DEVICE_PROPERTIES, queue_on_device_properties)
+    DECL_FIELD(QUEUE_ON_DEVICE_PREFERRED_SIZE, queue_on_device_preferred_size)
+    DECL_FIELD(QUEUE_ON_DEVICE_MAX_SIZE, queue_on_device_max_size)
+    DECL_FIELD(MAX_ON_DEVICE_QUEUES, max_on_device_queues)
+    DECL_FIELD(MAX_ON_DEVICE_EVENTS, max_on_device_events)
     DECL_FIELD(PLATFORM, platform)
     DECL_FIELD(PRINTF_BUFFER_SIZE, printf_buffer_size)
     DECL_FIELD(PREFERRED_INTEROP_USER_SYNC, interop_user_sync)
@@ -834,9 +843,12 @@ cl_get_device_info(cl_device_id     device,
     DECL_FIELD(PARTITION_AFFINITY_DOMAIN, affinity_domain)
     DECL_FIELD(PARTITION_TYPE, partition_type)
     DECL_FIELD(REFERENCE_COUNT, device_reference_count)
+    DECL_FIELD(SVM_CAPABILITIES, svm_capabilities)
+    DECL_FIELD(PREFERRED_PLATFORM_ATOMIC_ALIGNMENT, preferred_platform_atomic_alignment)
+    DECL_FIELD(PREFERRED_GLOBAL_ATOMIC_ALIGNMENT, preferred_global_atomic_alignment)
+    DECL_FIELD(PREFERRED_LOCAL_ATOMIC_ALIGNMENT, preferred_local_atomic_alignment)
     DECL_FIELD(IMAGE_PITCH_ALIGNMENT, image_pitch_alignment)
     DECL_FIELD(IMAGE_BASE_ADDRESS_ALIGNMENT, image_base_address_alignment)
-    DECL_FIELD(SVM_CAPABILITIES, svm_capabilities)
 
     case CL_DRIVER_VERSION:
       if (param_value_size_ret) {
diff --git a/src/cl_device_id.h b/src/cl_device_id.h
index 6341362..fd75933 100644
--- a/src/cl_device_id.h
+++ b/src/cl_device_id.h
@@ -53,9 +53,13 @@ struct _cl_device_id {
   cl_uint  address_bits;
   size_t   max_mem_alloc_size;
   cl_device_svm_capabilities  svm_capabilities;
+  cl_uint preferred_platform_atomic_alignment;
+  cl_uint preferred_global_atomic_alignment;
+  cl_uint preferred_local_atomic_alignment;
   cl_bool  image_support;
   cl_uint  max_read_image_args;
   cl_uint  max_write_image_args;
+  cl_uint  max_read_write_image_args;
   size_t   image2d_max_width;
   size_t   image_max_array_size;
   size_t   image2d_max_height;
@@ -76,6 +80,8 @@ struct _cl_device_id {
   cl_ulong global_mem_size;
   cl_ulong max_constant_buffer_size;
   cl_uint  max_constant_args;
+  size_t  max_global_variable_size;
+  size_t  global_variable_preferred_total_size;
   cl_device_local_mem_type local_mem_type;
   cl_ulong local_mem_size;
   cl_ulong scratch_mem_size;
@@ -88,6 +94,12 @@ struct _cl_device_id {
   cl_bool  linker_available;
   cl_device_exec_capabilities execution_capabilities;
   cl_command_queue_properties queue_properties;
+  cl_command_queue_properties queue_on_host_properties;
+  cl_command_queue_properties queue_on_device_properties;
+  cl_uint queue_on_device_preferred_size;
+  cl_uint queue_on_device_max_size;
+  cl_uint max_on_device_queues;
+  cl_uint max_on_device_events;
   cl_platform_id platform;
   size_t printf_buffer_size;
   cl_bool interop_user_sync;
@@ -119,8 +131,8 @@ struct _cl_device_id {
   cl_device_partition_property partition_type[3];
   cl_uint      device_reference_count;
   uint32_t atomic_test_result;
-  uint32_t image_pitch_alignment;
-  uint32_t image_base_address_alignment;
+  cl_uint image_pitch_alignment;
+  cl_uint image_base_address_alignment;
 };
 
 /* Get a device from the given platform */
diff --git a/src/cl_gt_device.h b/src/cl_gt_device.h
index cf48b6d..7e66c14 100644
--- a/src/cl_gt_device.h
+++ b/src/cl_gt_device.h
@@ -40,11 +40,15 @@
 .native_vector_width_double = 2,
 .native_vector_width_half = 8,
 .preferred_wg_sz_mul = 16,
-.address_bits = 32,
+.address_bits = 64,
 .svm_capabilities = CL_DEVICE_SVM_COARSE_GRAIN_BUFFER,
+.preferred_platform_atomic_alignment = 0,
+.preferred_global_atomic_alignment = 0,
+.preferred_local_atomic_alignment = 0,
 .image_support = CL_TRUE,
 .max_read_image_args = BTI_MAX_READ_IMAGE_ARGS,
 .max_write_image_args = BTI_MAX_WRITE_IMAGE_ARGS,
+.max_read_write_image_args = BTI_MAX_WRITE_IMAGE_ARGS,
 .image_max_array_size = 2048,
 .image2d_max_width = 8192,
 .image2d_max_height = 8192,
@@ -59,6 +63,8 @@
 .global_mem_cache_type = CL_READ_WRITE_CACHE,
 .max_constant_buffer_size = 128 * 1024 * 1024,
 .max_constant_args = 8,
+.max_global_variable_size = 64 * 1024,
+.global_variable_preferred_total_size = 64 * 1024,
 .error_correction_support = CL_FALSE,
 #ifdef HAS_USERPTR
 .host_unified_memory = CL_TRUE,
@@ -72,6 +78,12 @@
 .linker_available = CL_TRUE,
 .execution_capabilities = CL_EXEC_KERNEL | CL_EXEC_NATIVE_KERNEL,
 .queue_properties = CL_QUEUE_PROFILING_ENABLE,
+.queue_on_host_properties = CL_QUEUE_PROFILING_ENABLE,
+.queue_on_device_properties = CL_QUEUE_PROFILING_ENABLE,
+.queue_on_device_preferred_size = 16 * 1024,
+.queue_on_device_max_size = 256 * 1024,
+.max_on_device_queues = 1,
+.max_on_device_events = 1024,
 .platform = NULL, /* == intel_platform (set when requested) */
 /* IEEE 754, XXX does IVB support CL_FP_CORRECTLY_ROUNDED_DIVIDE_SQRT? */
 .single_fp_config = CL_FP_INF_NAN | CL_FP_ROUND_TO_NEAREST , /* IEEE 754. */
-- 
2.5.0



More information about the Beignet mailing list