[igt-dev] [PATCH i-g-t 01/15] perf_pmu: Support multi-tile in rc6 subtest

Tvrtko Ursulin tvrtko.ursulin at linux.intel.com
Fri May 12 12:14:37 UTC 2023


On 12/05/2023 03:28, Dixit, Ashutosh wrote:
> On Fri, 05 May 2023 17:55:14 -0700, Umesh Nerlige Ramappa wrote:
>>
> 
> Hi Umesh/Tvrtko,
> 
>> From: Tvrtko Ursulin <tvrtko.ursulin at intel.com>
>>
>> Teach test how to wake up a particular tile and make it iterate all of
>> them using dynamic subtests.
>>
>> v2: Finalize SHIFT to 60. Drop FIXME from i915_drm.h
>>
>> Signed-off-by: Tvrtko Ursulin <tvrtko.ursulin at intel.com>
>> Signed-off-by: Umesh Nerlige Ramappa <umesh.nerlige.ramappa at intel.com>
>> ---
>>   include/drm-uapi/i915_drm.h | 17 ++++++++++++++-
>>   tests/i915/perf_pmu.c       | 41 ++++++++++++++++++++++++++-----------
>>   2 files changed, 45 insertions(+), 13 deletions(-)
>>
>> diff --git a/include/drm-uapi/i915_drm.h b/include/drm-uapi/i915_drm.h
>> index a0876ee41..e164ad014 100644
>> --- a/include/drm-uapi/i915_drm.h
>> +++ b/include/drm-uapi/i915_drm.h
>> @@ -280,7 +280,16 @@ enum drm_i915_pmu_engine_sample {
>>   #define I915_PMU_ENGINE_SEMA(class, instance) \
>> 	__I915_PMU_ENGINE(class, instance, I915_SAMPLE_SEMA)
>>
>> -#define __I915_PMU_OTHER(x) (__I915_PMU_ENGINE(0xff, 0xff, 0xf) + 1 + (x))
>> +/*
>> + * Top 4 bits of every non-engine counter are GT id.
>> + */
>> +#define __I915_PMU_GT_SHIFT (60)
>> +
>> +#define ___I915_PMU_OTHER(gt, x) \
>> +	(((__u64)__I915_PMU_ENGINE(0xff, 0xff, 0xf) + 1 + (x)) | \
>> +	((__u64)(gt) << __I915_PMU_GT_SHIFT))
>> +
>> +#define __I915_PMU_OTHER(x) ___I915_PMU_OTHER(0, x)
> 
> Typically we don't modify include/drm-uapi/i915_drm.h directly, it is
> sync'd with the kernel.
> 
> So maybe let's add the above to lib/i915/i915_drm_local.h.
> 
>>
>>   #define I915_PMU_ACTUAL_FREQUENCY	__I915_PMU_OTHER(0)
>>   #define I915_PMU_REQUESTED_FREQUENCY	__I915_PMU_OTHER(1)
>> @@ -290,6 +299,12 @@ enum drm_i915_pmu_engine_sample {
>>
>>   #define I915_PMU_LAST /* Deprecated - do not use */ I915_PMU_RC6_RESIDENCY
>>
>> +#define __I915_PMU_ACTUAL_FREQUENCY(gt)		___I915_PMU_OTHER(gt, 0)
>> +#define __I915_PMU_REQUESTED_FREQUENCY(gt)	___I915_PMU_OTHER(gt, 1)
>> +#define __I915_PMU_INTERRUPTS(gt)		___I915_PMU_OTHER(gt, 2)
>> +#define __I915_PMU_RC6_RESIDENCY(gt)		___I915_PMU_OTHER(gt, 3)
>> +#define __I915_PMU_SOFTWARE_GT_AWAKE_TIME(gt)	___I915_PMU_OTHER(gt, 4)
>> +
>>   /* Each region is a minimum of 16k, and there are at most 255 of them.
>>    */
>>   #define I915_NR_TEX_REGIONS 255	/* table size 2k - maximum due to use
>> diff --git a/tests/i915/perf_pmu.c b/tests/i915/perf_pmu.c
>> index c5f083bbd..97ad09d76 100644
>> --- a/tests/i915/perf_pmu.c
>> +++ b/tests/i915/perf_pmu.c
>> @@ -1707,8 +1707,16 @@ static bool wait_for_suspended(int gem_fd)
>> 	return suspended;
>>   }
>>
>> +static int open_forcewake_handle(int fd, unsigned int gt)
>> +{
>> +	if (getenv("IGT_NO_FORCEWAKE"))
>> +		return -1;
>> +
>> +	return igt_debugfs_gt_open(fd, gt, "forcewake_user", O_WRONLY);
>> +}
> 
> Let's create a new function igt_open_forcewake_gt_handle() below
> igt_open_forcewake_handle() in lib/igt_gt.c and add this code there so the
> code can be shared.

Typically we'd move to lib/ only when there are 2-3 callers, so that it is
clear the helper is useful. Don't know, I am okay either way.

>> +
>>   static void
>> -test_rc6(int gem_fd, unsigned int flags)
>> +test_rc6(int gem_fd, unsigned int gt, unsigned int flags)
>>   {
>> 	int64_t duration_ns = 2e9;
>> 	uint64_t idle, busy, prev, ts[2];
>> @@ -1717,7 +1725,7 @@ test_rc6(int gem_fd, unsigned int flags)
>>
>> 	gem_quiescent_gpu(gem_fd);
>>
>> -	fd = open_pmu(gem_fd, I915_PMU_RC6_RESIDENCY);
>> +	fd = open_pmu(gem_fd, __I915_PMU_RC6_RESIDENCY(gt));
>>
>> 	if (flags & TEST_RUNTIME_PM) {
>> 		drmModeRes *res;
>> @@ -1784,8 +1792,8 @@ test_rc6(int gem_fd, unsigned int flags)
>> 	assert_within_epsilon(idle - prev, ts[1] - ts[0], tolerance);
>>
>> 	/* Wake up device and check no RC6. */
>> -	fw = igt_open_forcewake_handle(gem_fd);
>> -	igt_assert(fw >= 0);
>> +	fw = open_forcewake_handle(gem_fd, gt);
>> +	igt_require(fw >= 0);
> 
> Why not igt_assert?

It was probably to support running the test on old kernels, although I
am not sure we have been disciplined enough with this requirement
recently.

>> 	usleep(1e3); /* wait for the rc6 cycle counter to stop ticking */
>>
>> 	prev = pmu_read_single(fd);
>> @@ -2174,12 +2182,17 @@ static void pmu_read(int i915)
>> 		for_each_if((e)->class == I915_ENGINE_CLASS_RENDER) \
>> 			igt_dynamic_f("%s", e->name)
>>
>> +#define for_each_gt(i915, gtid, tmp) \
>> +	for ((gtid) = 0; \
>> +	     ((tmp) = igt_sysfs_gt_open((i915), (gtid))) != -1; \
>> +	     close(tmp), (gtid)++)
> 
> Use i915_for_each_gt from lib/ here.

Yeah, I guess these patches predate much of the IGT code that has since
been added upstream to support multi-tile. Shrug.

Regards,

Tvrtko

> 
> Thanks.
> --
> Ashutosh
> 
>> +
>>   igt_main
>>   {
>> 	const struct intel_execution_engine2 *e;
>> 	unsigned int num_engines = 0;
>> 	const intel_ctx_t *ctx = NULL;
>> -	int fd = -1;
>> +	int gt, tmp, fd = -1;
>>
>> 	/**
>> 	 * All PMU should be accompanied by a test.
>> @@ -2396,17 +2409,21 @@ igt_main
>> 	/**
>> 	 * Test RC6 residency reporting.
>> 	 */
>> -	igt_subtest("rc6")
>> -		test_rc6(fd, 0);
>> +	igt_subtest_with_dynamic("rc6") {
>> +		for_each_gt(fd, gt, tmp) {
>> +			igt_dynamic_f("gt%u", gt)
>> +				test_rc6(fd, gt, 0);
>>
>> -	igt_subtest("rc6-runtime-pm")
>> -		test_rc6(fd, TEST_RUNTIME_PM);
>> +			igt_dynamic_f("runtime-pm-gt%u", gt)
>> +				test_rc6(fd, gt, TEST_RUNTIME_PM);
>>
>> -	igt_subtest("rc6-runtime-pm-long")
>> -		test_rc6(fd, TEST_RUNTIME_PM | FLAG_LONG);
>> +			igt_dynamic_f("runtime-pm-long-gt%u", gt)
>> +				test_rc6(fd, gt, TEST_RUNTIME_PM | FLAG_LONG);
>> +		}
>> +	}
>>
>> 	igt_subtest("rc6-suspend")
>> -		test_rc6(fd, TEST_S3);
>> +		test_rc6(fd, 0, TEST_S3);
>>
>> 	/**
>> 	 * Test GT wakeref tracking (similar to RC0, opposite of RC6)
>> --
>> 2.34.1
>>


More information about the igt-dev mailing list