[igt-dev] [PATCH i-g-t 10/12] lib/intel_blt: Extend blitter library to support xe driver
Zbigniew Kempczyński
zbigniew.kempczynski at intel.com
Tue Jul 4 09:01:02 UTC 2023
Use already written for i915 blitter library in xe development.
Add appropriate code paths which are unique for those drivers.
Signed-off-by: Zbigniew Kempczyński <zbigniew.kempczynski at intel.com>
---
lib/intel_blt.c | 257 ++++++++++++++++++++++++++++++++----------------
lib/intel_blt.h | 2 +-
2 files changed, 171 insertions(+), 88 deletions(-)
diff --git a/lib/intel_blt.c b/lib/intel_blt.c
index f2f86e4947..43fda14583 100644
--- a/lib/intel_blt.c
+++ b/lib/intel_blt.c
@@ -9,9 +9,13 @@
#include <malloc.h>
#include <cairo.h>
#include "drm.h"
-#include "igt.h"
#include "i915/gem_create.h"
+#include "igt.h"
+#include "igt_syncobj.h"
#include "intel_blt.h"
+#include "xe/xe_ioctl.h"
+#include "xe/xe_query.h"
+#include "xe/xe_util.h"
#define BITRANGE(start, end) (end - start + 1)
#define GET_CMDS_INFO(__fd) intel_get_cmds_info(intel_get_drm_devid(__fd))
@@ -468,24 +472,41 @@ static int __special_mode(const struct blt_copy_data *blt)
return SM_NONE;
}
-static int __memory_type(uint32_t region)
+static int __memory_type(int fd, enum intel_driver driver, uint32_t region)
{
- igt_assert_f(IS_DEVICE_MEMORY_REGION(region) ||
- IS_SYSTEM_MEMORY_REGION(region),
- "Invalid region: %x\n", region);
+ if (driver == INTEL_DRIVER_I915) {
+ igt_assert_f(IS_DEVICE_MEMORY_REGION(region) ||
+ IS_SYSTEM_MEMORY_REGION(region),
+ "Invalid region: %x\n", region);
+ } else {
+ igt_assert_f(XE_IS_VRAM_MEMORY_REGION(fd, region) ||
+ XE_IS_SYSMEM_MEMORY_REGION(fd, region),
+ "Invalid region: %x\n", region);
+ }
- if (IS_DEVICE_MEMORY_REGION(region))
+ if (driver == INTEL_DRIVER_I915 && IS_DEVICE_MEMORY_REGION(region))
return TM_LOCAL_MEM;
+ else if (driver == INTEL_DRIVER_XE && XE_IS_VRAM_MEMORY_REGION(fd, region))
+ return TM_LOCAL_MEM;
+
return TM_SYSTEM_MEM;
}
-static enum blt_aux_mode __aux_mode(const struct blt_copy_object *obj)
+static enum blt_aux_mode __aux_mode(int fd,
+ enum intel_driver driver,
+ const struct blt_copy_object *obj)
{
- if (obj->compression == COMPRESSION_ENABLED) {
+
+ if (driver == INTEL_DRIVER_I915 && obj->compression == COMPRESSION_ENABLED) {
igt_assert_f(IS_DEVICE_MEMORY_REGION(obj->region),
"XY_BLOCK_COPY_BLT supports compression "
"on device memory only\n");
return AM_AUX_CCS_E;
+ } else if (driver == INTEL_DRIVER_XE && obj->compression == COMPRESSION_ENABLED) {
+ igt_assert_f(XE_IS_VRAM_MEMORY_REGION(fd, obj->region),
+ "XY_BLOCK_COPY_BLT supports compression "
+ "on device memory only\n");
+ return AM_AUX_CCS_E;
}
return AM_AUX_NONE;
@@ -508,9 +529,9 @@ static void fill_data(struct gen12_block_copy_data *data,
data->dw00.length = extended_command ? 20 : 10;
if (__special_mode(blt) == SM_FULL_RESOLVE)
- data->dw01.dst_aux_mode = __aux_mode(&blt->src);
+ data->dw01.dst_aux_mode = __aux_mode(blt->fd, blt->driver, &blt->src);
else
- data->dw01.dst_aux_mode = __aux_mode(&blt->dst);
+ data->dw01.dst_aux_mode = __aux_mode(blt->fd, blt->driver, &blt->dst);
data->dw01.dst_pitch = blt->dst.pitch - 1;
data->dw01.dst_mocs = blt->dst.mocs;
@@ -531,13 +552,13 @@ static void fill_data(struct gen12_block_copy_data *data,
data->dw06.dst_x_offset = blt->dst.x_offset;
data->dw06.dst_y_offset = blt->dst.y_offset;
- data->dw06.dst_target_memory = __memory_type(blt->dst.region);
+ data->dw06.dst_target_memory = __memory_type(blt->fd, blt->driver, blt->dst.region);
data->dw07.src_x1 = blt->src.x1;
data->dw07.src_y1 = blt->src.y1;
data->dw08.src_pitch = blt->src.pitch - 1;
- data->dw08.src_aux_mode = __aux_mode(&blt->src);
+ data->dw08.src_aux_mode = __aux_mode(blt->fd, blt->driver, &blt->src);
data->dw08.src_mocs = blt->src.mocs;
data->dw08.src_compression = blt->src.compression;
data->dw08.src_tiling = __block_tiling(blt->src.tiling);
@@ -550,7 +571,7 @@ static void fill_data(struct gen12_block_copy_data *data,
data->dw11.src_x_offset = blt->src.x_offset;
data->dw11.src_y_offset = blt->src.y_offset;
- data->dw11.src_target_memory = __memory_type(blt->src.region);
+ data->dw11.src_target_memory = __memory_type(blt->fd, blt->driver, blt->src.region);
}
static void fill_data_ext(struct gen12_block_copy_data_ext *dext,
@@ -739,7 +760,10 @@ uint64_t emit_blt_block_copy(int fd,
igt_assert_f(ahnd, "block-copy supports softpin only\n");
igt_assert_f(blt, "block-copy requires data to do blit\n");
- alignment = gem_detect_safe_alignment(fd);
+ if (blt->driver == INTEL_DRIVER_XE)
+ alignment = xe_get_default_alignment(fd);
+ else
+ alignment = gem_detect_safe_alignment(fd);
src_offset = get_offset(ahnd, blt->src.handle, blt->src.size, alignment)
+ blt->src.plane_offset;
dst_offset = get_offset(ahnd, blt->dst.handle, blt->dst.size, alignment)
@@ -748,8 +772,11 @@ uint64_t emit_blt_block_copy(int fd,
fill_data(&data, blt, src_offset, dst_offset, ext);
- bb = gem_mmap__device_coherent(fd, blt->bb.handle, 0, blt->bb.size,
- PROT_READ | PROT_WRITE);
+ if (blt->driver == INTEL_DRIVER_XE)
+ bb = xe_bo_map(fd, blt->bb.handle, blt->bb.size);
+ else
+ bb = gem_mmap__device_coherent(fd, blt->bb.handle, 0, blt->bb.size,
+ PROT_READ | PROT_WRITE);
igt_assert(bb_pos + sizeof(data) < blt->bb.size);
memcpy(bb + bb_pos, &data, sizeof(data));
@@ -812,29 +839,38 @@ int blt_block_copy(int fd,
igt_assert_f(ahnd, "block-copy supports softpin only\n");
igt_assert_f(blt, "block-copy requires data to do blit\n");
+ igt_assert_neq(blt->driver, 0);
- alignment = gem_detect_safe_alignment(fd);
+ if (blt->driver == INTEL_DRIVER_XE)
+ alignment = xe_get_default_alignment(fd);
+ else
+ alignment = gem_detect_safe_alignment(fd);
src_offset = get_offset(ahnd, blt->src.handle, blt->src.size, alignment);
dst_offset = get_offset(ahnd, blt->dst.handle, blt->dst.size, alignment);
bb_offset = get_offset(ahnd, blt->bb.handle, blt->bb.size, alignment);
emit_blt_block_copy(fd, ahnd, blt, ext, 0, true);
- obj[0].offset = CANONICAL(dst_offset);
- obj[1].offset = CANONICAL(src_offset);
- obj[2].offset = CANONICAL(bb_offset);
- obj[0].handle = blt->dst.handle;
- obj[1].handle = blt->src.handle;
- obj[2].handle = blt->bb.handle;
- obj[0].flags = EXEC_OBJECT_PINNED | EXEC_OBJECT_WRITE |
- EXEC_OBJECT_SUPPORTS_48B_ADDRESS;
- obj[1].flags = EXEC_OBJECT_PINNED | EXEC_OBJECT_SUPPORTS_48B_ADDRESS;
- obj[2].flags = EXEC_OBJECT_PINNED | EXEC_OBJECT_SUPPORTS_48B_ADDRESS;
- execbuf.buffer_count = 3;
- execbuf.buffers_ptr = to_user_pointer(obj);
- execbuf.rsvd1 = ctx ? ctx->id : 0;
- execbuf.flags = e ? e->flags : I915_EXEC_BLT;
- ret = __gem_execbuf(fd, &execbuf);
+ if (blt->driver == INTEL_DRIVER_XE) {
+ intel_ctx_xe_exec(ctx, ahnd, CANONICAL(bb_offset));
+ } else {
+ obj[0].offset = CANONICAL(dst_offset);
+ obj[1].offset = CANONICAL(src_offset);
+ obj[2].offset = CANONICAL(bb_offset);
+ obj[0].handle = blt->dst.handle;
+ obj[1].handle = blt->src.handle;
+ obj[2].handle = blt->bb.handle;
+ obj[0].flags = EXEC_OBJECT_PINNED | EXEC_OBJECT_WRITE |
+ EXEC_OBJECT_SUPPORTS_48B_ADDRESS;
+ obj[1].flags = EXEC_OBJECT_PINNED | EXEC_OBJECT_SUPPORTS_48B_ADDRESS;
+ obj[2].flags = EXEC_OBJECT_PINNED | EXEC_OBJECT_SUPPORTS_48B_ADDRESS;
+ execbuf.buffer_count = 3;
+ execbuf.buffers_ptr = to_user_pointer(obj);
+ execbuf.rsvd1 = ctx ? ctx->id : 0;
+ execbuf.flags = e ? e->flags : I915_EXEC_BLT;
+
+ ret = __gem_execbuf(fd, &execbuf);
+ }
return ret;
}
@@ -950,7 +986,10 @@ uint64_t emit_blt_ctrl_surf_copy(int fd,
igt_assert_f(ahnd, "ctrl-surf-copy supports softpin only\n");
igt_assert_f(surf, "ctrl-surf-copy requires data to do ctrl-surf-copy blit\n");
- alignment = max_t(uint64_t, gem_detect_safe_alignment(fd), 1ull << 16);
+ if (surf->driver == INTEL_DRIVER_XE)
+ alignment = max_t(uint64_t, xe_get_default_alignment(fd), 1ull << 16);
+ else
+ alignment = max_t(uint64_t, gem_detect_safe_alignment(fd), 1ull << 16);
data.dw00.client = 0x2;
data.dw00.opcode = 0x48;
@@ -973,8 +1012,11 @@ uint64_t emit_blt_ctrl_surf_copy(int fd,
data.dw04.dst_address_hi = dst_offset >> 32;
data.dw04.dst_mocs = surf->dst.mocs;
- bb = gem_mmap__device_coherent(fd, surf->bb.handle, 0, surf->bb.size,
- PROT_READ | PROT_WRITE);
+ if (surf->driver == INTEL_DRIVER_XE)
+ bb = xe_bo_map(fd, surf->bb.handle, surf->bb.size);
+ else
+ bb = gem_mmap__device_coherent(fd, surf->bb.handle, 0, surf->bb.size,
+ PROT_READ | PROT_WRITE);
igt_assert(bb_pos + sizeof(data) < surf->bb.size);
memcpy(bb + bb_pos, &data, sizeof(data));
@@ -1002,7 +1044,7 @@ uint64_t emit_blt_ctrl_surf_copy(int fd,
/**
* blt_ctrl_surf_copy:
- * @fd: drm fd
+ * @blt: bldrm fd
* @ctx: intel_ctx_t context
* @e: blitter engine for @ctx
* @ahnd: allocator handle
@@ -1026,32 +1068,41 @@ int blt_ctrl_surf_copy(int fd,
igt_assert_f(ahnd, "ctrl-surf-copy supports softpin only\n");
igt_assert_f(surf, "ctrl-surf-copy requires data to do ctrl-surf-copy blit\n");
+ igt_assert_neq(surf->driver, 0);
+
+ if (surf->driver == INTEL_DRIVER_XE)
+ alignment = max_t(uint64_t, xe_get_default_alignment(fd), 1ull << 16);
+ else
+ alignment = max_t(uint64_t, gem_detect_safe_alignment(fd), 1ull << 16);
- alignment = max_t(uint64_t, gem_detect_safe_alignment(fd), 1ull << 16);
src_offset = get_offset(ahnd, surf->src.handle, surf->src.size, alignment);
dst_offset = get_offset(ahnd, surf->dst.handle, surf->dst.size, alignment);
bb_offset = get_offset(ahnd, surf->bb.handle, surf->bb.size, alignment);
emit_blt_ctrl_surf_copy(fd, ahnd, surf, 0, true);
- obj[0].offset = CANONICAL(dst_offset);
- obj[1].offset = CANONICAL(src_offset);
- obj[2].offset = CANONICAL(bb_offset);
- obj[0].handle = surf->dst.handle;
- obj[1].handle = surf->src.handle;
- obj[2].handle = surf->bb.handle;
- obj[0].flags = EXEC_OBJECT_PINNED | EXEC_OBJECT_WRITE |
- EXEC_OBJECT_SUPPORTS_48B_ADDRESS;
- obj[1].flags = EXEC_OBJECT_PINNED | EXEC_OBJECT_SUPPORTS_48B_ADDRESS;
- obj[2].flags = EXEC_OBJECT_PINNED | EXEC_OBJECT_SUPPORTS_48B_ADDRESS;
- execbuf.buffer_count = 3;
- execbuf.buffers_ptr = to_user_pointer(obj);
- execbuf.flags = e ? e->flags : I915_EXEC_BLT;
- execbuf.rsvd1 = ctx ? ctx->id : 0;
- gem_execbuf(fd, &execbuf);
- put_offset(ahnd, surf->dst.handle);
- put_offset(ahnd, surf->src.handle);
- put_offset(ahnd, surf->bb.handle);
+ if (surf->driver == INTEL_DRIVER_XE) {
+ intel_ctx_xe_exec(ctx, ahnd, CANONICAL(bb_offset));
+ } else {
+ obj[0].offset = CANONICAL(dst_offset);
+ obj[1].offset = CANONICAL(src_offset);
+ obj[2].offset = CANONICAL(bb_offset);
+ obj[0].handle = surf->dst.handle;
+ obj[1].handle = surf->src.handle;
+ obj[2].handle = surf->bb.handle;
+ obj[0].flags = EXEC_OBJECT_PINNED | EXEC_OBJECT_WRITE |
+ EXEC_OBJECT_SUPPORTS_48B_ADDRESS;
+ obj[1].flags = EXEC_OBJECT_PINNED | EXEC_OBJECT_SUPPORTS_48B_ADDRESS;
+ obj[2].flags = EXEC_OBJECT_PINNED | EXEC_OBJECT_SUPPORTS_48B_ADDRESS;
+ execbuf.buffer_count = 3;
+ execbuf.buffers_ptr = to_user_pointer(obj);
+ execbuf.flags = e ? e->flags : I915_EXEC_BLT;
+ execbuf.rsvd1 = ctx ? ctx->id : 0;
+ gem_execbuf(fd, &execbuf);
+ put_offset(ahnd, surf->dst.handle);
+ put_offset(ahnd, surf->src.handle);
+ put_offset(ahnd, surf->bb.handle);
+ }
return 0;
}
@@ -1208,7 +1259,10 @@ uint64_t emit_blt_fast_copy(int fd,
uint32_t bbe = MI_BATCH_BUFFER_END;
uint32_t *bb;
- alignment = gem_detect_safe_alignment(fd);
+ if (blt->driver == INTEL_DRIVER_XE)
+ alignment = xe_get_default_alignment(fd);
+ else
+ alignment = gem_detect_safe_alignment(fd);
data.dw00.client = 0x2;
data.dw00.opcode = 0x42;
@@ -1218,8 +1272,8 @@ uint64_t emit_blt_fast_copy(int fd,
data.dw01.dst_pitch = blt->dst.pitch;
data.dw01.color_depth = __fast_color_depth(blt->color_depth);
- data.dw01.dst_memory = __memory_type(blt->dst.region);
- data.dw01.src_memory = __memory_type(blt->src.region);
+ data.dw01.dst_memory = __memory_type(blt->fd, blt->driver, blt->dst.region);
+ data.dw01.src_memory = __memory_type(blt->fd, blt->driver, blt->src.region);
data.dw01.dst_type_y = __new_tile_y_type(blt->dst.tiling) ? 1 : 0;
data.dw01.src_type_y = __new_tile_y_type(blt->src.tiling) ? 1 : 0;
@@ -1246,8 +1300,11 @@ uint64_t emit_blt_fast_copy(int fd,
data.dw08.src_address_lo = src_offset;
data.dw09.src_address_hi = src_offset >> 32;
- bb = gem_mmap__device_coherent(fd, blt->bb.handle, 0, blt->bb.size,
- PROT_READ | PROT_WRITE);
+ if (blt->driver == INTEL_DRIVER_XE)
+ bb = xe_bo_map(fd, blt->bb.handle, blt->bb.size);
+ else
+ bb = gem_mmap__device_coherent(fd, blt->bb.handle, 0, blt->bb.size,
+ PROT_READ | PROT_WRITE);
igt_assert(bb_pos + sizeof(data) < blt->bb.size);
memcpy(bb + bb_pos, &data, sizeof(data));
@@ -1297,7 +1354,14 @@ int blt_fast_copy(int fd,
uint64_t dst_offset, src_offset, bb_offset, alignment;
int ret;
- alignment = gem_detect_safe_alignment(fd);
+ igt_assert_f(ahnd, "fast-copy supports softpin only\n");
+ igt_assert_f(blt, "fast-copy requires data to do fast-copy blit\n");
+ igt_assert_neq(blt->driver, 0);
+
+ if (blt->driver == INTEL_DRIVER_XE)
+ alignment = xe_get_default_alignment(fd);
+ else
+ alignment = gem_detect_safe_alignment(fd);
src_offset = get_offset(ahnd, blt->src.handle, blt->src.size, alignment);
dst_offset = get_offset(ahnd, blt->dst.handle, blt->dst.size, alignment);
@@ -1305,24 +1369,28 @@ int blt_fast_copy(int fd,
emit_blt_fast_copy(fd, ahnd, blt, 0, true);
- obj[0].offset = CANONICAL(dst_offset);
- obj[1].offset = CANONICAL(src_offset);
- obj[2].offset = CANONICAL(bb_offset);
- obj[0].handle = blt->dst.handle;
- obj[1].handle = blt->src.handle;
- obj[2].handle = blt->bb.handle;
- obj[0].flags = EXEC_OBJECT_PINNED | EXEC_OBJECT_WRITE |
- EXEC_OBJECT_SUPPORTS_48B_ADDRESS;
- obj[1].flags = EXEC_OBJECT_PINNED | EXEC_OBJECT_SUPPORTS_48B_ADDRESS;
- obj[2].flags = EXEC_OBJECT_PINNED | EXEC_OBJECT_SUPPORTS_48B_ADDRESS;
- execbuf.buffer_count = 3;
- execbuf.buffers_ptr = to_user_pointer(obj);
- execbuf.rsvd1 = ctx ? ctx->id : 0;
- execbuf.flags = e ? e->flags : I915_EXEC_BLT;
- ret = __gem_execbuf(fd, &execbuf);
- put_offset(ahnd, blt->dst.handle);
- put_offset(ahnd, blt->src.handle);
- put_offset(ahnd, blt->bb.handle);
+ if (blt->driver == INTEL_DRIVER_XE) {
+ intel_ctx_xe_exec(ctx, ahnd, CANONICAL(bb_offset));
+ } else {
+ obj[0].offset = CANONICAL(dst_offset);
+ obj[1].offset = CANONICAL(src_offset);
+ obj[2].offset = CANONICAL(bb_offset);
+ obj[0].handle = blt->dst.handle;
+ obj[1].handle = blt->src.handle;
+ obj[2].handle = blt->bb.handle;
+ obj[0].flags = EXEC_OBJECT_PINNED | EXEC_OBJECT_WRITE |
+ EXEC_OBJECT_SUPPORTS_48B_ADDRESS;
+ obj[1].flags = EXEC_OBJECT_PINNED | EXEC_OBJECT_SUPPORTS_48B_ADDRESS;
+ obj[2].flags = EXEC_OBJECT_PINNED | EXEC_OBJECT_SUPPORTS_48B_ADDRESS;
+ execbuf.buffer_count = 3;
+ execbuf.buffers_ptr = to_user_pointer(obj);
+ execbuf.rsvd1 = ctx ? ctx->id : 0;
+ execbuf.flags = e ? e->flags : I915_EXEC_BLT;
+ ret = __gem_execbuf(fd, &execbuf);
+ put_offset(ahnd, blt->dst.handle);
+ put_offset(ahnd, blt->src.handle);
+ put_offset(ahnd, blt->bb.handle);
+ }
return ret;
}
@@ -1366,16 +1434,26 @@ blt_create_object(const struct blt_copy_data *blt, uint32_t region,
obj = calloc(1, sizeof(*obj));
obj->size = size;
- igt_assert(__gem_create_in_memory_regions(blt->fd, &handle,
- &size, region) == 0);
+
+ if (blt->driver == INTEL_DRIVER_XE) {
+ size = ALIGN(size, xe_get_default_alignment(blt->fd));
+ handle = xe_bo_create_flags(blt->fd, 0, size, region);
+ } else {
+ igt_assert(__gem_create_in_memory_regions(blt->fd, &handle,
+ &size, region) == 0);
+ }
blt_set_object(obj, handle, size, region, mocs, tiling,
compression, compression_type);
blt_set_geom(obj, stride, 0, 0, width, height, 0, 0);
- if (create_mapping)
- obj->ptr = gem_mmap__device_coherent(blt->fd, handle, 0, size,
- PROT_READ | PROT_WRITE);
+ if (create_mapping) {
+ if (blt->driver == INTEL_DRIVER_XE)
+ obj->ptr = xe_bo_map(blt->fd, handle, size);
+ else
+ obj->ptr = gem_mmap__device_coherent(blt->fd, handle, 0, size,
+ PROT_READ | PROT_WRITE);
+ }
return obj;
}
@@ -1518,14 +1596,19 @@ void blt_surface_to_png(int fd, uint32_t run_id, const char *fileid,
int format;
int stride = obj->tiling ? obj->pitch * 4 : obj->pitch;
char filename[FILENAME_MAX];
+ bool is_xe;
snprintf(filename, FILENAME_MAX-1, "%d-%s-%s-%ux%u-%s.png",
run_id, fileid, blt_tiling_name(obj->tiling), width, height,
obj->compression ? "compressed" : "uncompressed");
- if (!map)
- map = gem_mmap__device_coherent(fd, obj->handle, 0,
- obj->size, PROT_READ);
+ if (!map) {
+ if (is_xe)
+ map = xe_bo_map(fd, obj->handle, obj->size);
+ else
+ map = gem_mmap__device_coherent(fd, obj->handle, 0,
+ obj->size, PROT_READ);
+ }
format = CAIRO_FORMAT_RGB24;
surface = cairo_image_surface_create_for_data(map,
format, width, height,
diff --git a/lib/intel_blt.h b/lib/intel_blt.h
index 7516ce8ac7..944e2b4ae7 100644
--- a/lib/intel_blt.h
+++ b/lib/intel_blt.h
@@ -8,7 +8,7 @@
/**
* SECTION:intel_blt
- * @short_description: i915 blitter library
+ * @short_description: i915/xe blitter library
* @title: Blitter library
* @include: intel_blt.h
*
--
2.34.1
More information about the igt-dev
mailing list