[igt-dev] [PATCH i-g-t 3/3] tests/gem_ccs: Add block-multicopy subtest

Karolina Stolarek karolina.stolarek at intel.com
Thu Dec 15 11:47:37 UTC 2022



On 15.12.2022 12:00, Zbigniew Kempczyński wrote:
> On Thu, Dec 15, 2022 at 09:42:56AM +0100, Karolina Stolarek wrote:
>> On 14.12.2022 20:57, Zbigniew Kempczyński wrote:
>>> On Tue, Dec 13, 2022 at 04:40:38PM +0100, Karolina Stolarek wrote:
>>>> On 12.12.2022 13:50, Zbigniew Kempczyński wrote:
>>>>> Exercise sequence of blits packed in single batch. It may reveal
>>>>> flushing/decompressing/detiling problems during execution.
>>>>> multicopy-inplace version differs from copy-inplace version with
>>>>> additional blit to same tiling format during decompression to separate
>>>>> problems visible in decompressing/detiling in one step.
>>>>>
>>>>> Signed-off-by: Zbigniew Kempczyński <zbigniew.kempczynski at intel.com>
>>>>> ---
>>>>>     tests/i915/gem_ccs.c | 262 ++++++++++++++++++++++++++++++++++++++++---
>>>>>     1 file changed, 246 insertions(+), 16 deletions(-)
>>>>>
>>>>> diff --git a/tests/i915/gem_ccs.c b/tests/i915/gem_ccs.c
>>>>> index 4ecb3e36ac..6b5f199ec7 100644
>>>>> --- a/tests/i915/gem_ccs.c
>>>>> +++ b/tests/i915/gem_ccs.c
>>>>> @@ -262,6 +262,119 @@ static void surf_copy(int i915,
>>>>>     	gem_close(i915, ccs);
>>>>>     }
>>>>> +struct blt_copy3_data {
>>>>> +	int i915;
>>>>> +	struct blt_copy_object src;
>>>>> +	struct blt_copy_object mid;
>>>>> +	struct blt_copy_object dst;
>>>>> +	struct blt_copy_object final;
>>>>> +	struct blt_copy_batch bb;
>>>>> +	enum blt_color_depth color_depth;
>>>>> +
>>>>> +	/* debug stuff */
>>>>> +	bool print_bb;
>>>>> +};
>>>>> +
>>>>> +struct blt_block_copy3_data_ext {
>>>>> +	struct blt_block_copy_object_ext src;
>>>>> +	struct blt_block_copy_object_ext mid;
>>>>> +	struct blt_block_copy_object_ext dst;
>>>>> +	struct blt_block_copy_object_ext final;
>>>>> +};
>>>>> +
>>>>> +#define FILL_OBJ(_idx, _handle, _offset, _flags) do { \
>>>>> +	obj[(_idx)].handle = (_handle); \
>>>>> +	obj[(_idx)].offset = (_offset); \
>>>>> +	obj[(_idx)++].flags = EXEC_OBJECT_PINNED | \
>>>>> +			      EXEC_OBJECT_SUPPORTS_48B_ADDRESS | (_flags) ; \
>>>>> +} while (0)
>>>>> +
>>>>
>>>> I'm not sure if we want to have a macro with a hidden side effect. "i++"
>>>> after each statement isn't pretty either, so I'm on the fence with this one.
>>>
>>> I'm aware this has side effect, but this makes main code more clear as it
>>> is not interlaced with var++ between the lines. I think reader who knows
>>> how execbuf objs works will notice there's some implicit increment in the
>>> macro.
>>
>> When I first read the code, I thought "why do we keep using the same i for
>> different objects?", and then looked at this definition. Or we could call
>> FILL_OBJ(++i, ...), but it's not pretty either.
> 
> This will execute increment 3 times here.

Argh, you're right, silly me


Karolina

> --
> Zbigniew
> 
>>
>>>
>>>>
>>>>> +static int blt_block_copy3(int i915,
>>>>> +			   const intel_ctx_t *ctx,
>>>>> +			   const struct intel_execution_engine2 *e,
>>>>> +			   uint64_t ahnd,
>>>>> +			   const struct blt_copy3_data *blt3,
>>>>> +			   const struct blt_block_copy3_data_ext *ext3)
>>>>> +{
>>>>> +	struct drm_i915_gem_execbuffer2 execbuf = {};
>>>>> +	struct drm_i915_gem_exec_object2 obj[5] = {};
>>>>> +	struct blt_copy_data blt0;
>>>>> +	struct blt_block_copy_data_ext ext0;
>>>>> +	uint64_t src_offset, mid_offset, dst_offset, final_offset, bb_offset, alignment;
>>>>> +	uint64_t bb_pos = 0;
>>>>> +	uint32_t *bb;
>>>>> +	int i, ret;
>>>>> +
>>>>> +	igt_assert_f(ahnd, "block-copy3 supports softpin only\n");
>>>>> +	igt_assert_f(blt3, "block-copy3 requires data to do blit\n");
>>>>> +
>>>>> +	alignment = gem_detect_safe_alignment(i915);
>>>>> +	src_offset = get_offset(ahnd, blt3->src.handle, blt3->src.size, alignment);
>>>>> +	mid_offset = get_offset(ahnd, blt3->mid.handle, blt3->mid.size, alignment);
>>>>> +	dst_offset = get_offset(ahnd, blt3->dst.handle, blt3->dst.size, alignment);
>>>>> +	final_offset = get_offset(ahnd, blt3->final.handle, blt3->final.size, alignment);
>>>>> +	bb_offset = get_offset(ahnd, blt3->bb.handle, blt3->bb.size, alignment);
>>>>> +
>>>>> +	igt_debug("src: %lx, mid: %lx, dst: %lx, final: %lx, bb: %lx, align: %lx\n",
>>>>> +		  src_offset, mid_offset, dst_offset, final_offset, bb_offset, alignment);
>>>>> +
>>>>> +	/* First blit src -> mid */
>>>>> +	memset(&blt0, 0, sizeof(blt0));
>>>>> +	blt0.src = blt3->src;
>>>>> +	blt0.dst = blt3->mid;
>>>>> +	blt0.bb = blt3->bb;
>>>>> +	blt0.color_depth = blt3->color_depth;
>>>>> +	blt0.print_bb = blt3->print_bb;
>>>>> +	ext0.src = ext3->src;
>>>>> +	ext0.dst = ext3->mid;
>>>>> +	bb_pos = emit_blt_block_copy(i915, ahnd, &blt0, &ext0, bb_pos, false);
>>>>> +
>>>>> +	/* Second blit mid -> dst */
>>>>> +	memset(&blt0, 0, sizeof(blt0));
>>>>> +	blt0.src = blt3->mid;
>>>>> +	blt0.dst = blt3->dst;
>>>>> +	blt0.bb = blt3->bb;
>>>>> +	blt0.color_depth = blt3->color_depth;
>>>>> +	blt0.print_bb = blt3->print_bb;
>>>>> +	ext0.src = ext3->mid;
>>>>> +	ext0.dst = ext3->dst;
>>>>> +	bb_pos = emit_blt_block_copy(i915, ahnd, &blt0, &ext0, bb_pos, false);
>>>>> +
>>>>> +	/* Third blit dst -> final */
>>>>> +	memset(&blt0, 0, sizeof(blt0));
>>>>> +	blt0.src = blt3->dst;
>>>>> +	blt0.dst = blt3->final;
>>>>> +	blt0.bb = blt3->bb;
>>>>> +	blt0.color_depth = blt3->color_depth;
>>>>> +	blt0.print_bb = blt3->print_bb;
>>>>> +	ext0.src = ext3->dst;
>>>>> +	ext0.dst = ext3->final;
>>>>> +	bb_pos = emit_blt_block_copy(i915, ahnd, &blt0, &ext0, bb_pos, true);
>>>>> +
>>>>> +	i = 0;
>>>>> +	FILL_OBJ(i, blt3->src.handle, CANONICAL(src_offset), 0);
>>>>> +	FILL_OBJ(i, blt3->mid.handle, CANONICAL(mid_offset), EXEC_OBJECT_WRITE);
>>>>> +	if (mid_offset != dst_offset)
>>>>> +		FILL_OBJ(i, blt3->dst.handle, CANONICAL(dst_offset), EXEC_OBJECT_WRITE);
>>>>> +	FILL_OBJ(i, blt3->final.handle, CANONICAL(final_offset), 0);
>>>>> +	FILL_OBJ(i, blt3->bb.handle, CANONICAL(bb_offset), 0);
>>>>> +
>>>>> +	execbuf.buffer_count = i;
>>>>> +
>>>>> +	for (int __i = 0; __i < i; __i++)
>>>>> +		igt_debug("obj[%d].offset: %llx, handle: %u\n",
>>>>> +			  __i, (long long) obj[__i].offset, obj[__i].handle);
>>>>> +	execbuf.buffers_ptr = to_user_pointer(obj);
>>>>> +	execbuf.rsvd1 = ctx ? ctx->id : 0;
>>>>> +	execbuf.flags = e ? e->flags : I915_EXEC_BLT;
>>>>> +	ret = __gem_execbuf(i915, &execbuf);
>>>>> +
>>>>> +	gem_sync(i915, blt3->bb.handle);
>>>>> +	munmap(bb, blt3->bb.size);
>>>>> +
>>>>> +	return ret;
>>>>> +}
>>>>> +
>>>>>     static void block_copy(int i915,
>>>>>     		       const intel_ctx_t *ctx,
>>>>>     		       const struct intel_execution_engine2 *e,
>>>>> @@ -380,10 +493,100 @@ static void block_copy(int i915,
>>>>>     	igt_assert_f(!result, "source and destination surfaces differs!\n");
>>>>>     }
>>>>> +static void block_multicopy(int i915,
>>>>> +			    const intel_ctx_t *ctx,
>>>>> +			    const struct intel_execution_engine2 *e,
>>>>> +			    uint32_t region1, uint32_t region2,
>>>>> +			    enum blt_tiling mid_tiling,
>>>>> +			    const struct test_config *config)
>>>>> +{
>>>>> +	struct blt_copy3_data blt3 = {};
>>>>> +	struct blt_block_copy3_data_ext ext3 = {}, *pext3 = &ext3;
>>>>> +	struct blt_copy_object *src, *mid, *dst, *final;
>>>>> +	const uint32_t bpp = 32;
>>>>> +	uint64_t bb_size = 4096;
>>>>> +	uint64_t ahnd = get_reloc_ahnd(i915, ctx->id);
>>>>> +	uint32_t run_id = mid_tiling;
>>>>> +	uint32_t mid_region = region2, bb;
>>>>> +	uint32_t width = param.width, height = param.height;
>>>>> +	enum blt_compression mid_compression = config->compression;
>>>>> +	int mid_compression_format = param.compression_format;
>>>>> +	enum blt_compression_type comp_type = COMPRESSION_TYPE_3D;
>>>>> +	uint8_t uc_mocs = intel_get_uc_mocs(i915);
>>>>> +	int result;
>>>>> +
>>>>> +	igt_assert(__gem_create_in_memory_regions(i915, &bb, &bb_size, region1) == 0);
>>>>> +
>>>>> +	if (!blt_supports_compression(i915))
>>>>> +		pext3 = NULL;
>>>>> +
>>>>> +	src = create_object(i915, region1, width, height, bpp, uc_mocs,
>>>>> +			    T_LINEAR, COMPRESSION_DISABLED, comp_type, true);
>>>>> +	mid = create_object(i915, mid_region, width, height, bpp, uc_mocs,
>>>>> +			    mid_tiling, mid_compression, comp_type, true);
>>>>> +	dst = create_object(i915, region1, width, height, bpp, uc_mocs,
>>>>> +			    mid_tiling, COMPRESSION_DISABLED, comp_type, true);
>>>>> +	final = create_object(i915, region1, width, height, bpp, uc_mocs,
>>>>> +			    T_LINEAR, COMPRESSION_DISABLED, comp_type, true);
>>>>> +	igt_assert(src->size == dst->size);
>>>>> +	PRINT_SURFACE_INFO("src", src);
>>>>> +	PRINT_SURFACE_INFO("mid", mid);
>>>>> +	PRINT_SURFACE_INFO("dst", dst);
>>>>> +	PRINT_SURFACE_INFO("final", final);
>>>>> +
>>>>> +	blt_surface_fill_rect(i915, src, width, height);
>>>>> +
>>>>> +	memset(&blt3, 0, sizeof(blt3));
>>>>> +	blt3.color_depth = CD_32bit;
>>>>> +	blt3.print_bb = param.print_bb;
>>>>> +	set_blt_object(&blt3.src, src);
>>>>> +	set_blt_object(&blt3.mid, mid);
>>>>> +	set_blt_object(&blt3.dst, dst);
>>>>> +	set_blt_object(&blt3.final, final);
>>>>> +
>>>>> +	if (config->inplace) {
>>>>> +		set_object(&blt3.dst, mid->handle, dst->size, mid->region, mid->mocs,
>>>>> +			   mid_tiling, COMPRESSION_DISABLED, comp_type);
>>>>> +		blt3.dst.ptr = mid->ptr;
>>>>> +	}
>>>>> +
>>>>> +	set_object_ext(&ext3.src, 0, width, height, SURFACE_TYPE_2D);
>>>>> +	set_object_ext(&ext3.mid, mid_compression_format, width, height, SURFACE_TYPE_2D);
>>>>> +	set_object_ext(&ext3.dst, 0, width, height, SURFACE_TYPE_2D);
>>>>> +	set_object_ext(&ext3.final, 0, width, height, SURFACE_TYPE_2D);
>>>>> +	set_batch(&blt3.bb, bb, bb_size, region1);
>>>>> +
>>>>> +	blt_block_copy3(i915, ctx, e, ahnd, &blt3, pext3);
>>>>> +	gem_sync(i915, blt3.final.handle);
>>>>> +
>>>>> +	WRITE_PNG(i915, run_id, "src", &blt3.src, width, height);
>>>>> +	if (!config->inplace)
>>>>> +		WRITE_PNG(i915, run_id, "mid", &blt3.mid, width, height);
>>>>> +	WRITE_PNG(i915, run_id, "dst", &blt3.dst, width, height);
>>>>> +	WRITE_PNG(i915, run_id, "final", &blt3.final, width, height);
>>>>> +
>>>>> +	result = memcmp(src->ptr, blt3.final.ptr, src->size);
>>>>> +
>>>>> +	destroy_object(i915, src);
>>>>> +	destroy_object(i915, mid);
>>>>> +	destroy_object(i915, dst);
>>>>> +	destroy_object(i915, final);
>>>>> +	gem_close(i915, bb);
>>>>> +	put_ahnd(ahnd);
>>>>> +
>>>>> +	igt_assert_f(!result, "source and destination surfaces differs!\n");
>>>>> +}
>>>>> +
>>>>> +enum copy_func {
>>>>> +	BLOCK_COPY,
>>>>> +	BLOCK_MULTICOPY,
>>>>> +};
>>>>> +
>>>>
>>>> I was thinking if we need a simple case here (i.e. one emit, src->dst)
>>>
>>> What tiling you want to blit? linear -> linear? linear -> tileN? How to
>>> verify it works? fmt1 -> fmt2 -> fmt1 is equal to fmt1 -> fmt2 (detile
>>> fmt2 -> linear on cpu).
>>>
>>> At the moment we don't verify middle surface, only assume src == dst
>>> is fine with middle blit.
>>
>> I thought about linear->linear in the beginning, but maybe it would make
>> more sense to wait for predicates that can check the middle layer and work
>> with different tilings. It can stay like this for now.
>>
>> Many thanks,
>> Karolina
>>
>>>
>>> --
>>> Zbigniew
>>>
>>>>
>>>>>     static void block_copy_test(int i915,
>>>>>     			    const struct test_config *config,
>>>>>     			    const intel_ctx_t *ctx,
>>>>> -			    struct igt_collection *set)
>>>>> +			    struct igt_collection *set,
>>>>> +			    enum copy_func copy_function)
>>>>>     {
>>>>>     	struct igt_collection *regions;
>>>>>     	const struct intel_execution_engine2 *e;
>>>>> @@ -415,15 +618,27 @@ static void block_copy_test(int i915,
>>>>>     					continue;
>>>>>     				regtxt = memregion_dynamic_subtest_name(regions);
>>>>> -				igt_dynamic_f("%s-%s-compfmt%d-%s",
>>>>> -					      blt_tiling_name(tiling),
>>>>> -					      config->compression ?
>>>>> -						      "compressed" : "uncompressed",
>>>>> -					      param.compression_format, regtxt) {
>>>>> -					block_copy(i915, ctx, e,
>>>>> -						   region1, region2,
>>>>> -						   tiling, config);
>>>>> -				}
>>>>> +
>>>>> +				if (copy_function == BLOCK_COPY)
>>>>> +					igt_dynamic_f("%s-%s-compfmt%d-%s",
>>>>> +						      blt_tiling_name(tiling),
>>>>> +						      config->compression ?
>>>>> +							      "compressed" : "uncompressed",
>>>>> +						      param.compression_format, regtxt) {
>>>>> +						block_copy(i915, ctx, e,
>>>>> +							   region1, region2,
>>>>> +							   tiling, config);
>>>>> +					}
>>>>> +				else if (copy_function == BLOCK_MULTICOPY)
>>>>> +					igt_dynamic_f("%s-%s-compfmt%d-%s-multicopy",
>>>>> +						      blt_tiling_name(tiling),
>>>>> +						      config->compression ?
>>>>> +							      "compressed" : "uncompressed",
>>>>> +						      param.compression_format, regtxt) {
>>>>> +						block_multicopy(i915, ctx, e,
>>>>> +								region1, region2,
>>>>> +								tiling, config);
>>>>> +					}
>>>>
>>>> We could avoid repetition to some extent if we had introduced a macro that
>>>> accepts a function pointer and/or some config data. But I don't feel
>>>> strongly about it, just putting it out there.
>>>>
>>>> Many thanks,
>>>> Karolina
>>>>
>>>>>     				free(regtxt);
>>>>>     			}
>>>>>     		}
>>>>> @@ -506,14 +721,21 @@ igt_main_args("bf:pst:W:H:", NULL, help_str, opt_handler, NULL)
>>>>>     	igt_subtest_with_dynamic("block-copy-uncompressed") {
>>>>>     		struct test_config config = {};
>>>>> -		block_copy_test(i915, &config, ctx, set);
>>>>> +		block_copy_test(i915, &config, ctx, set, BLOCK_COPY);
>>>>>     	}
>>>>>     	igt_describe("Check block-copy flatccs compressed blit");
>>>>>     	igt_subtest_with_dynamic("block-copy-compressed") {
>>>>>     		struct test_config config = { .compression = true };
>>>>> -		block_copy_test(i915, &config, ctx, set);
>>>>> +		block_copy_test(i915, &config, ctx, set, BLOCK_COPY);
>>>>> +	}
>>>>> +
>>>>> +	igt_describe("Check block-multicopy flatccs compressed blit");
>>>>> +	igt_subtest_with_dynamic("block-multicopy-compressed") {
>>>>> +		struct test_config config = { .compression = true };
>>>>> +
>>>>> +		block_copy_test(i915, &config, ctx, set, BLOCK_MULTICOPY);
>>>>>     	}
>>>>>     	igt_describe("Check block-copy flatccs inplace decompression blit");
>>>>> @@ -521,7 +743,15 @@ igt_main_args("bf:pst:W:H:", NULL, help_str, opt_handler, NULL)
>>>>>     		struct test_config config = { .compression = true,
>>>>>     					      .inplace = true };
>>>>> -		block_copy_test(i915, &config, ctx, set);
>>>>> +		block_copy_test(i915, &config, ctx, set, BLOCK_COPY);
>>>>> +	}
>>>>> +
>>>>> +	igt_describe("Check block-multicopy flatccs inplace decompression blit");
>>>>> +	igt_subtest_with_dynamic("block-multicopy-inplace") {
>>>>> +		struct test_config config = { .compression = true,
>>>>> +					      .inplace = true };
>>>>> +
>>>>> +		block_copy_test(i915, &config, ctx, set, BLOCK_MULTICOPY);
>>>>>     	}
>>>>>     	igt_describe("Check flatccs data can be copied from/to surface");
>>>>> @@ -529,7 +759,7 @@ igt_main_args("bf:pst:W:H:", NULL, help_str, opt_handler, NULL)
>>>>>     		struct test_config config = { .compression = true,
>>>>>     					      .surfcopy = true };
>>>>> -		block_copy_test(i915, &config, ctx, set);
>>>>> +		block_copy_test(i915, &config, ctx, set, BLOCK_COPY);
>>>>>     	}
>>>>>     	igt_describe("Check flatccs data are physically tagged and visible"
>>>>> @@ -539,7 +769,7 @@ igt_main_args("bf:pst:W:H:", NULL, help_str, opt_handler, NULL)
>>>>>     					      .surfcopy = true,
>>>>>     					      .new_ctx = true };
>>>>> -		block_copy_test(i915, &config, ctx, set);
>>>>> +		block_copy_test(i915, &config, ctx, set, BLOCK_COPY);
>>>>>     	}
>>>>>     	igt_describe("Check flatccs data persists after suspend / resume (S0)");
>>>>> @@ -548,7 +778,7 @@ igt_main_args("bf:pst:W:H:", NULL, help_str, opt_handler, NULL)
>>>>>     					      .surfcopy = true,
>>>>>     					      .suspend_resume = true };
>>>>> -		block_copy_test(i915, &config, ctx, set);
>>>>> +		block_copy_test(i915, &config, ctx, set, BLOCK_COPY);
>>>>>     	}
>>>>>     	igt_fixture {


More information about the igt-dev mailing list