[igt-dev] [PATCH i-g-t 1/2] lib: Apply x/y offsets to GPGPU fill
Christoph Manszewski
christoph.manszewski at intel.com
Fri Jun 9 09:37:18 UTC 2023
Actually honour the caller-provided destination region and pass the x/y
offsets to the thread group.
Signed-off-by: Chris Wilson <chris.p.wilson at intel.com>
Signed-off-by: Christoph Manszewski <christoph.manszewski at intel.com>
---
lib/gpgpu_fill.c | 4 +---
lib/gpu_cmds.c | 29 +++++++++++++++--------------
lib/gpu_cmds.h | 1 +
3 files changed, 17 insertions(+), 17 deletions(-)
diff --git a/lib/gpgpu_fill.c b/lib/gpgpu_fill.c
index d854fbf7..eed82187 100644
--- a/lib/gpgpu_fill.c
+++ b/lib/gpgpu_fill.c
@@ -315,8 +315,6 @@ __xehp_gpgpu_fillfunc(int i915,
{
struct intel_bb *ibb;
struct xehp_interface_descriptor_data idd;
- (void) x;
- (void) y;
ibb = intel_bb_create(i915, PAGE_SIZE);
intel_bb_add_intel_buf(ibb, buf, true);
@@ -335,7 +333,7 @@ __xehp_gpgpu_fillfunc(int i915,
xehp_emit_state_compute_mode(ibb);
xehp_emit_state_binding_table_pool_alloc(ibb);
xehp_emit_cfe_state(ibb, THREADS);
- xehp_emit_compute_walk(ibb, width, height, &idd, color);
+ xehp_emit_compute_walk(ibb, x, y, width, height, &idd, color);
intel_bb_out(ibb, MI_BATCH_BUFFER_END);
intel_bb_ptr_align(ibb, 32);
diff --git a/lib/gpu_cmds.c b/lib/gpu_cmds.c
index 1f321ae4..aecba928 100644
--- a/lib/gpu_cmds.c
+++ b/lib/gpu_cmds.c
@@ -636,10 +636,10 @@ gen7_emit_gpgpu_walk(struct intel_bb *ibb,
* Then thread group X = width / 16 (aligned to 16)
* thread group Y = height;
*/
- x_dim = (width + 15) / 16;
- y_dim = height;
+ x_dim = (x + width + 15) / 16;
+ y_dim = y + height;
- tmp = width & 15;
+ tmp = (x + width) & 15;
if (tmp == 0)
right_mask = (1 << 16) - 1;
else
@@ -657,11 +657,11 @@ gen7_emit_gpgpu_walk(struct intel_bb *ibb,
0); /* width:1 */
/* thread group X */
- intel_bb_out(ibb, 0);
+ intel_bb_out(ibb, x / 16);
intel_bb_out(ibb, x_dim);
/* thread group Y */
- intel_bb_out(ibb, 0);
+ intel_bb_out(ibb, y);
intel_bb_out(ibb, y_dim);
/* thread group Z */
@@ -693,10 +693,10 @@ gen8_emit_gpgpu_walk(struct intel_bb *ibb,
* Then thread group X = width / 16 (aligned to 16)
* thread group Y = height;
*/
- x_dim = (width + 15) / 16;
- y_dim = height;
+ x_dim = (x + width + 15) / 16;
+ y_dim = y + height;
- tmp = width & 15;
+ tmp = (x + width) & 15;
if (tmp == 0)
right_mask = (1 << 16) - 1;
else
@@ -715,12 +715,12 @@ gen8_emit_gpgpu_walk(struct intel_bb *ibb,
0); /* width:1 */
/* thread group X */
- intel_bb_out(ibb, 0);
+ intel_bb_out(ibb, x / 16);
intel_bb_out(ibb, 0);
intel_bb_out(ibb, x_dim);
/* thread group Y */
- intel_bb_out(ibb, 0);
+ intel_bb_out(ibb, y);
intel_bb_out(ibb, 0);
intel_bb_out(ibb, y_dim);
@@ -948,6 +948,7 @@ xehp_emit_state_base_address(struct intel_bb *ibb)
void
xehp_emit_compute_walk(struct intel_bb *ibb,
+ unsigned int x, unsigned int y,
unsigned int width, unsigned int height,
struct xehp_interface_descriptor_data *pidd,
uint8_t color)
@@ -965,8 +966,8 @@ xehp_emit_compute_walk(struct intel_bb *ibb,
* Then thread group X = width / 16 (aligned to 16)
* thread group Y = height;
*/
- x_dim = (width + 15) / 16;
- y_dim = height;
+ x_dim = (x + width + 15) / 16;
+ y_dim = y + height;
intel_bb_out(ibb, XEHP_COMPUTE_WALKER | 0x25);
@@ -994,8 +995,8 @@ xehp_emit_compute_walk(struct intel_bb *ibb,
intel_bb_out(ibb, 1); //dw9
/* group id x/y/z */
- intel_bb_out(ibb, 0); //dw10
- intel_bb_out(ibb, 0); //dw11
+ intel_bb_out(ibb, x / 16); //dw10
+ intel_bb_out(ibb, y); //dw11
intel_bb_out(ibb, 0); //dw12
/* partition id / partition size */
diff --git a/lib/gpu_cmds.h b/lib/gpu_cmds.h
index 92cbbde9..b7ed64f8 100644
--- a/lib/gpu_cmds.h
+++ b/lib/gpu_cmds.h
@@ -138,6 +138,7 @@ xehp_emit_state_base_address(struct intel_bb *ibb);
void
xehp_emit_compute_walk(struct intel_bb *ibb,
+ unsigned int x, unsigned int y,
unsigned int width, unsigned int height,
struct xehp_interface_descriptor_data *pidd,
uint8_t color);
--
2.40.1
More information about the igt-dev
mailing list