[igt-dev] [PATCH i-g-t v4 2/3] lib/intel_compute: Update intel_compute to run on specified engine
Kamil Konieczny
kamil.konieczny at linux.intel.com
Thu Dec 7 11:56:18 UTC 2023
Hi Niranjana,
On 2023-12-06 at 12:00:54 -0800, Niranjana Vishwanathapura wrote:
> With CCS_MODE setting, available compute slices can be assigned
> to specific compute engines. Update intel_compute library to
> be able to run compute kernel on specified compute or render
> engine.
>
> Signed-off-by: Niranjana Vishwanathapura <niranjana.vishwanathapura at intel.com>
> Reviewed-by: Zbigniew Kempczyński <zbigniew.kempczynski at intel.com>
> ---
> lib/intel_compute.c | 85 ++++++++++++++++++++++++++++++++-------------
> lib/intel_compute.h | 3 ++
> 2 files changed, 63 insertions(+), 25 deletions(-)
>
> diff --git a/lib/intel_compute.c b/lib/intel_compute.c
> index 0beab471b..79dffc50e 100644
> --- a/lib/intel_compute.c
> +++ b/lib/intel_compute.c
> @@ -16,7 +16,6 @@
> #include "intel_compute.h"
> #include "lib/igt_syncobj.h"
> #include "lib/intel_reg.h"
> -#include "xe_drm.h"
> #include "xe/xe_ioctl.h"
> #include "xe/xe_query.h"
> #include "xehp_media.h"
> @@ -64,7 +63,8 @@ struct bo_execenv {
> struct drm_i915_gem_exec_object2 *obj;
> };
>
> -static void bo_execenv_create(int fd, struct bo_execenv *execenv)
> +static void bo_execenv_create(int fd, struct bo_execenv *execenv,
> + struct drm_xe_engine_class_instance *eci)
> {
> igt_assert(execenv);
>
> @@ -73,18 +73,24 @@ static void bo_execenv_create(int fd, struct bo_execenv *execenv)
> execenv->driver = get_intel_driver(fd);
>
> if (execenv->driver == INTEL_DRIVER_XE) {
> - uint16_t engine_class;
> - uint32_t devid = intel_get_drm_devid(fd);
> - const struct intel_device_info *info = intel_get_device_info(devid);
> -
> - if (info->graphics_ver >= 12 && info->graphics_rel < 60)
> - engine_class = DRM_XE_ENGINE_CLASS_RENDER;
> - else
> - engine_class = DRM_XE_ENGINE_CLASS_COMPUTE;
> -
> execenv->vm = xe_vm_create(fd, DRM_XE_VM_CREATE_FLAG_ASYNC_DEFAULT, 0);
> - execenv->exec_queue = xe_exec_queue_create_class(fd, execenv->vm,
> - engine_class);
> +
> + if (eci) {
> + execenv->exec_queue = xe_exec_queue_create(fd, execenv->vm,
> + eci, 0);
> + } else {
> + uint16_t engine_class;
> + uint32_t devid = intel_get_drm_devid(fd);
> + const struct intel_device_info *info = intel_get_device_info(devid);
> +
> + if (info->graphics_ver >= 12 && info->graphics_rel < 60)
> + engine_class = DRM_XE_ENGINE_CLASS_RENDER;
> + else
> + engine_class = DRM_XE_ENGINE_CLASS_COMPUTE;
> +
> + execenv->exec_queue = xe_exec_queue_create_class(fd, execenv->vm,
> + engine_class);
> + }
> }
> }
>
> @@ -588,9 +594,11 @@ static void dg1_compute_exec_compute(uint32_t *addr_bo_buffer_batch,
> * @fd: file descriptor of the opened DRM device
> * @kernel: GPU Kernel binary to be executed
> * @size: size of @kernel.
> + * @eci: engine class instance
> */
> static void compute_exec(int fd, const unsigned char *kernel,
> - unsigned int size)
> + unsigned int size,
> + struct drm_xe_engine_class_instance *eci)
> {
> #define BO_DICT_ENTRIES 7
> struct bo_dict_entry bo_dict[BO_DICT_ENTRIES] = {
> @@ -619,7 +627,7 @@ static void compute_exec(int fd, const unsigned char *kernel,
> float *dinput;
> uint16_t devid = intel_get_drm_devid(fd);
>
> - bo_execenv_create(fd, &execenv);
> + bo_execenv_create(fd, &execenv, eci);
>
> /* Sets Kernel size */
> bo_dict[0].size = ALIGN(size, 0x1000);
> @@ -865,9 +873,11 @@ static void xehp_compute_exec_compute(uint32_t *addr_bo_buffer_batch,
> * @fd: file descriptor of the opened DRM device
> * @kernel: GPU Kernel binary to be executed
> * @size: size of @kernel.
> + * @eci: engine class instance
> */
> static void xehp_compute_exec(int fd, const unsigned char *kernel,
> - unsigned int size)
> + unsigned int size,
> + struct drm_xe_engine_class_instance *eci)
> {
> #define XEHP_BO_DICT_ENTRIES 9
> struct bo_dict_entry bo_dict[XEHP_BO_DICT_ENTRIES] = {
> @@ -897,7 +907,7 @@ static void xehp_compute_exec(int fd, const unsigned char *kernel,
> struct bo_execenv execenv;
> float *dinput;
>
> - bo_execenv_create(fd, &execenv);
> + bo_execenv_create(fd, &execenv, eci);
>
> /* Sets Kernel size */
> bo_dict[0].size = ALIGN(size, 0x1000);
> @@ -1079,9 +1089,11 @@ static void xehpc_compute_exec_compute(uint32_t *addr_bo_buffer_batch,
> * @fd: file descriptor of the opened DRM device
> * @kernel: GPU Kernel binary to be executed
> * @size: size of @kernel.
> + * @eci: engine class instance
> */
> static void xehpc_compute_exec(int fd, const unsigned char *kernel,
> - unsigned int size)
> + unsigned int size,
> + struct drm_xe_engine_class_instance *eci)
> {
> #define XEHPC_BO_DICT_ENTRIES 6
> struct bo_dict_entry bo_dict[XEHPC_BO_DICT_ENTRIES] = {
> @@ -1102,7 +1114,7 @@ static void xehpc_compute_exec(int fd, const unsigned char *kernel,
> struct bo_execenv execenv;
> float *dinput;
>
> - bo_execenv_create(fd, &execenv);
> + bo_execenv_create(fd, &execenv, eci);
>
> /* Sets Kernel size */
> bo_dict[0].size = ALIGN(size, 0x1000);
> @@ -1261,7 +1273,8 @@ static void xe2lpg_compute_exec_compute(uint32_t *addr_bo_buffer_batch,
> * @size: size of @kernel.
> */
> static void xe2lpg_compute_exec(int fd, const unsigned char *kernel,
> - unsigned int size)
> + unsigned int size,
> + struct drm_xe_engine_class_instance *eci)
> {
> #define XE2_BO_DICT_ENTRIES 10
> struct bo_dict_entry bo_dict[XE2_BO_DICT_ENTRIES] = {
> @@ -1296,7 +1309,7 @@ static void xe2lpg_compute_exec(int fd, const unsigned char *kernel,
> struct bo_execenv execenv;
> float *dinput;
>
> - bo_execenv_create(fd, &execenv);
> + bo_execenv_create(fd, &execenv, eci);
>
> /* Sets Kernel size */
> bo_dict[0].size = ALIGN(size, 0x1000);
> @@ -1356,7 +1369,8 @@ static void xe2lpg_compute_exec(int fd, const unsigned char *kernel,
> static const struct {
> unsigned int ip_ver;
> void (*compute_exec)(int fd, const unsigned char *kernel,
> - unsigned int size);
> + unsigned int size,
> + struct drm_xe_engine_class_instance *eci);
> uint32_t compat;
> } intel_compute_batches[] = {
> {
> @@ -1386,7 +1400,8 @@ static const struct {
> },
> };
>
> -bool run_intel_compute_kernel(int fd)
> +static bool __run_intel_compute_kernel(int fd,
> + struct drm_xe_engine_class_instance *eci)
> {
> unsigned int ip_ver = intel_graphics_ver(intel_get_drm_devid(fd));
> unsigned int batch;
> @@ -1397,8 +1412,10 @@ bool run_intel_compute_kernel(int fd)
> if (ip_ver == intel_compute_batches[batch].ip_ver)
> break;
> }
> - if (batch == ARRAY_SIZE(intel_compute_batches))
> + if (batch == ARRAY_SIZE(intel_compute_batches)) {
> + igt_debug("GPU version 0x%x not supported\n", ip_ver);
> return false;
> + }
>
> if (!(COMPAT_DRIVER_FLAG(driver) & intel_compute_batches[batch].compat)) {
> igt_debug("Driver is not supported: flags %x & %x\n",
> @@ -1416,7 +1433,25 @@ bool run_intel_compute_kernel(int fd)
> return 1;
>
> intel_compute_batches[batch].compute_exec(fd, kernels->kernel,
> - kernels->size);
> + kernels->size, eci);
>
> return true;
> }
> +
> +bool run_intel_compute_kernel(int fd)
> +{
> + return __run_intel_compute_kernel(fd, NULL);
> +}
> +
> +bool run_intel_compute_kernel_on_engine(int fd,
> + struct drm_xe_engine_class_instance *eci)
> +{
> + if (eci->engine_class != DRM_XE_ENGINE_CLASS_COMPUTE &&
> + eci->engine_class != DRM_XE_ENGINE_CLASS_RENDER) {
> + igt_debug("%s engine class not supported\n",
> + xe_engine_class_string(eci->engine_class));
> + return false;
> + }
> +
> + return __run_intel_compute_kernel(fd, eci);
> +}
> diff --git a/lib/intel_compute.h b/lib/intel_compute.h
> index ba153f064..5d81c3d62 100644
> --- a/lib/intel_compute.h
> +++ b/lib/intel_compute.h
> @@ -9,6 +9,8 @@
> #ifndef INTEL_COMPUTE_H
> #define INTEL_COMPUTE_H
>
> +#include "xe_drm.h"
With this include, it looks like an Xe-only header.
> +
> /*
> * OpenCL Kernels are generated using:
> *
> @@ -28,5 +30,6 @@ struct intel_compute_kernels {
> extern const struct intel_compute_kernels intel_compute_square_kernels[];
>
> bool run_intel_compute_kernel(int fd);
> +bool run_intel_compute_kernel_on_engine(int fd, struct drm_xe_engine_class_instance *eci);
What about using void * here?
>
> #endif /* INTEL_COMPUTE_H */
> --
> 2.21.0.rc0.32.g243a4c7e27
-- ^^
Please update your git to at least 2.3x or 2.4x (the current latest is 2.43.0).
Regards,
Kamil
More information about the igt-dev
mailing list