[Intel-gfx] [PATCH] drm/i915/guc/slpc: Add a new SLPC selftest

Dixit, Ashutosh ashutosh.dixit at intel.com
Wed Jun 22 20:32:51 UTC 2022


On Fri, 10 Jun 2022 16:47:12 -0700, Vinay Belgaumkar wrote:
>
> This test will validate we can achieve actual frequency of RP0. Pcode
> grants frequencies based on what GuC is requesting. However, thermal
> throttling can limit what is being granted. Add a test to request for
> max, but don't fail the test if RP0 is not granted due to throttle
> reasons.
>
> Also optimize the selftest by using a common run_test function to avoid
> code duplication.

The refactoring does change the order of operations (changing the freq vs
spawning the spinner) but should be fine I think.

> Rename the "clamp" tests to vary_max_freq and vary_min_freq.

Either is ok, but maybe "clamp" names were ok I think since they verify req
freq is clamped at min/max.

>
> v2: Fix compile warning
>
> Fixes 8ee2c227822e ("drm/i915/guc/slpc: Add SLPC selftest")
> Signed-off-by: Vinay Belgaumkar <vinay.belgaumkar at intel.com>
> ---
>  drivers/gpu/drm/i915/gt/selftest_slpc.c | 323 ++++++++++++------------
>  1 file changed, 158 insertions(+), 165 deletions(-)
>
> diff --git a/drivers/gpu/drm/i915/gt/selftest_slpc.c b/drivers/gpu/drm/i915/gt/selftest_slpc.c
> index b768cea5943d..099129aae9a5 100644
> --- a/drivers/gpu/drm/i915/gt/selftest_slpc.c
> +++ b/drivers/gpu/drm/i915/gt/selftest_slpc.c
> @@ -8,6 +8,11 @@
>  #define delay_for_h2g() usleep_range(H2G_DELAY, H2G_DELAY + 10000)
>  #define FREQUENCY_REQ_UNIT	DIV_ROUND_CLOSEST(GT_FREQUENCY_MULTIPLIER, \
>						  GEN9_FREQ_SCALER)
> +enum test_type {
> +	VARY_MIN,
> +	VARY_MAX,
> +	MAX_GRANTED
> +};
>
>  static int slpc_set_min_freq(struct intel_guc_slpc *slpc, u32 freq)
>  {
> @@ -36,147 +41,120 @@ static int slpc_set_max_freq(struct intel_guc_slpc *slpc, u32 freq)
>	return ret;
>  }
>
> -static int live_slpc_clamp_min(void *arg)
> +static int vary_max_freq(struct intel_guc_slpc *slpc, struct intel_rps *rps,
> +		  u32 *max_act_freq)

Please run checkpatch, indentation seems off.

>  {
> -	struct drm_i915_private *i915 = arg;
> -	struct intel_gt *gt = to_gt(i915);
> -	struct intel_guc_slpc *slpc = &gt->uc.guc.slpc;
> -	struct intel_rps *rps = &gt->rps;
> -	struct intel_engine_cs *engine;
> -	enum intel_engine_id id;
> -	struct igt_spinner spin;
> +	u32 step, max_freq, req_freq;
> +	u32 act_freq;
>	u32 slpc_min_freq, slpc_max_freq;
>	int err = 0;
>
> -	if (!intel_uc_uses_guc_slpc(&gt->uc))
> -		return 0;
> -
> -	if (igt_spinner_init(&spin, gt))
> -		return -ENOMEM;
> +	slpc_min_freq = slpc->min_freq;
> +	slpc_max_freq = slpc->rp0_freq;

nit but we don't really need such variables since we don't change their
values, we should just use slpc->min_freq, slpc->rp0_freq directly. I'd
change this in all places in this patch.

>
> -	if (intel_guc_slpc_get_max_freq(slpc, &slpc_max_freq)) {
> -		pr_err("Could not get SLPC max freq\n");
> -		return -EIO;
> -	}
> -
> -	if (intel_guc_slpc_get_min_freq(slpc, &slpc_min_freq)) {
> -		pr_err("Could not get SLPC min freq\n");
> -		return -EIO;

Why do we need these two function calls? Can't we just use slpc->rp0_freq
and slpc->min_freq as we are doing in the vary_min/max_freq() functions
above?

Also, as mentioned below I think here we should just do:

        slpc_set_max_freq(slpc, slpc->rp0_freq);
        slpc_set_min_freq(slpc, slpc->min_freq);

to restore freq to a known state before starting the test (just in case a
previous test changed the values).

> -	}
> -
> -	if (slpc_min_freq == slpc_max_freq) {
> -		pr_err("Min/Max are fused to the same value\n");
> -		return -EINVAL;

What if they are actually equal? I think basically the max/min freq test
loops will just not be entered (so effectively the tests will just
skip). The granted freq test will be fine. So I think we can just delete
this if statement?

(It is showing deleted above in the patch but is in the new code somewhere
too).

> -	}
> -
> -	intel_gt_pm_wait_for_idle(gt);
> -	intel_gt_pm_get(gt);
> -	for_each_engine(engine, gt, id) {
> -		struct i915_request *rq;
> -		u32 step, min_freq, req_freq;
> -		u32 act_freq, max_act_freq;
> -
> -		if (!intel_engine_can_store_dword(engine))
> -			continue;
> +	/* Go from max to min in 5 steps */
> +	step = (slpc_max_freq - slpc_min_freq) / NUM_STEPS;
> +	*max_act_freq = slpc_min_freq;
> +	for (max_freq = slpc_max_freq; max_freq > slpc_min_freq;
> +				max_freq -= step) {
> +		err = slpc_set_max_freq(slpc, max_freq);
> +		if (err)
> +			break;
>
> -		/* Go from min to max in 5 steps */
> -		step = (slpc_max_freq - slpc_min_freq) / NUM_STEPS;
> -		max_act_freq = slpc_min_freq;
> -		for (min_freq = slpc_min_freq; min_freq < slpc_max_freq;
> -					min_freq += step) {
> -			err = slpc_set_min_freq(slpc, min_freq);
> -			if (err)
> -				break;
> -
> -			st_engine_heartbeat_disable(engine);
> -
> -			rq = igt_spinner_create_request(&spin,
> -							engine->kernel_context,
> -							MI_NOOP);
> -			if (IS_ERR(rq)) {
> -				err = PTR_ERR(rq);
> -				st_engine_heartbeat_enable(engine);
> -				break;
> -			}
> +		req_freq = intel_rps_read_punit_req_frequency(rps);
>
> -			i915_request_add(rq);
> +		/* GuC requests freq in multiples of 50/3 MHz */
> +		if (req_freq > (max_freq + FREQUENCY_REQ_UNIT)) {
> +			pr_err("SWReq is %d, should be at most %d\n", req_freq,
> +				max_freq + FREQUENCY_REQ_UNIT);
> +			err = -EINVAL;

Probably a nit but check can be (so should we be checking both high and low
limits?):
		if (req_freq > (max_freq + FREQUENCY_REQ_UNIT) ||
		    req_freq < (slpc_min_freq - FREQUENCY_REQ_UNIT))

Though if we do this we'd need to change the pr_err() or have two separate
if statements. Not sure if it's worth it but thought I'll mention it.

> +static int vary_min_freq(struct intel_guc_slpc *slpc, struct intel_rps *rps,
> +		  u32 *max_act_freq)
> +{
> +	u32 step, min_freq, req_freq;
> +	u32 act_freq;
> +	u32 slpc_min_freq, slpc_max_freq;
> +	int err = 0;
>
> -			act_freq =  intel_rps_read_actual_frequency(rps);
> -			if (act_freq > max_act_freq)
> -				max_act_freq = act_freq;
> +	slpc_min_freq = slpc->min_freq;
> +	slpc_max_freq = slpc->rp0_freq;
>
> -			igt_spinner_end(&spin);
> -			st_engine_heartbeat_enable(engine);
> -		}
> +	/* Go from min to max in 5 steps */
> +	step = (slpc_max_freq - slpc_min_freq) / NUM_STEPS;
> +	*max_act_freq = slpc_min_freq;
> +	for (min_freq = slpc_min_freq; min_freq < slpc_max_freq;
> +				min_freq += step) {
> +		err = slpc_set_min_freq(slpc, min_freq);
> +		if (err)
> +			break;
>
> -		pr_info("Max actual frequency for %s was %d\n",
> -			engine->name, max_act_freq);
> +		req_freq = intel_rps_read_punit_req_frequency(rps);
>
> -		/* Actual frequency should rise above min */
> -		if (max_act_freq == slpc_min_freq) {

Nit again. This check is somewhere in the new code but I think a better
check is

		if (max_act_freq <= slpc_min_freq)

just in case the act freq for whatever reason falls below
slpc_min_freq. Even if we know this is impossible (bugs make the impossible
possible).

> -			pr_err("Actual freq did not rise above min\n");
> +		/* GuC requests freq in multiples of 50/3 MHz */
> +		if (req_freq < (min_freq - FREQUENCY_REQ_UNIT)) {
> +			pr_err("SWReq is %d, should be at least %d\n", req_freq,
> +				min_freq - FREQUENCY_REQ_UNIT);
>			err = -EINVAL;

Again nit as above, but check can be:
		if (req_freq < (min_freq - FREQUENCY_REQ_UNIT) ||
		    req_freq > (slpc_max_freq + FREQUENCY_REQ_UNIT)) {

>		}
>
> +		act_freq =  intel_rps_read_actual_frequency(rps);
> +		if (act_freq > *max_act_freq)
> +			*max_act_freq = act_freq;
> +
>		if (err)
>			break;
>	}
>
> -	/* Restore min/max frequencies */
> -	slpc_set_max_freq(slpc, slpc_max_freq);
> -	slpc_set_min_freq(slpc, slpc_min_freq);
> +	return err;
> +}
>
> -	if (igt_flush_test(gt->i915))
> -		err = -EIO;
> +static int max_granted_freq(struct intel_guc_slpc *slpc, struct intel_rps *rps, u32 *max_act_freq)
> +{
> +	struct intel_gt *gt = rps_to_gt(rps);
> +	u32 perf_limit_reasons;
> +	int err = 0;
>
> -	intel_gt_pm_put(gt);
> -	igt_spinner_fini(&spin);
> -	intel_gt_pm_wait_for_idle(gt);
> +	err = slpc_set_min_freq(slpc, slpc->rp0_freq);
> +	if (err)
> +		return err;
> +
> +	*max_act_freq =  intel_rps_read_actual_frequency(rps);
> +	if (!(*max_act_freq == slpc->rp0_freq)) {
> +		/* Check if there was some throttling by pcode */
> +		perf_limit_reasons = intel_uncore_read(gt->uncore, GT0_PERF_LIMIT_REASONS);
> +
> +		/* If not, this is an error */
> +		if (perf_limit_reasons && GT0_PERF_LIMIT_REASONS_MASK) {
> +			pr_err("Pcode did not grant max freq\n");
> +			err = -EINVAL;

Looks incorrect, probably something like:
		if (!(perf_limit_reasons & GT0_PERF_LIMIT_REASONS_MASK))

> +		}
> +	}
>
>	return err;
>  }
>
> -static int live_slpc_clamp_max(void *arg)
> +static int run_test(struct intel_gt *gt, int test_type)
>  {
> -	struct drm_i915_private *i915 = arg;
> -	struct intel_gt *gt = to_gt(i915);
> -	struct intel_guc_slpc *slpc;
> -	struct intel_rps *rps;
> +	struct intel_guc_slpc *slpc = &gt->uc.guc.slpc;
> +	struct intel_rps *rps = &gt->rps;
>	struct intel_engine_cs *engine;
>	enum intel_engine_id id;
>	struct igt_spinner spin;
> -	int err = 0;
>	u32 slpc_min_freq, slpc_max_freq;
> -
> -	slpc = &gt->uc.guc.slpc;
> -	rps = &gt->rps;
> +	int err = 0;
>
>	if (!intel_uc_uses_guc_slpc(&gt->uc))
>		return 0;
> @@ -203,69 +181,56 @@ static int live_slpc_clamp_max(void *arg)
>	intel_gt_pm_get(gt);
>	for_each_engine(engine, gt, id) {
>		struct i915_request *rq;
> -		u32 max_freq, req_freq;
> -		u32 act_freq, max_act_freq;
> -		u32 step;
> +		u32 max_act_freq;
>
>		if (!intel_engine_can_store_dword(engine))
>			continue;
>
> -		/* Go from max to min in 5 steps */
> -		step = (slpc_max_freq - slpc_min_freq) / NUM_STEPS;
> -		max_act_freq = slpc_min_freq;
> -		for (max_freq = slpc_max_freq; max_freq > slpc_min_freq;
> -					max_freq -= step) {
> -			err = slpc_set_max_freq(slpc, max_freq);
> -			if (err)
> -				break;
> -
> -			st_engine_heartbeat_disable(engine);
> -
> -			rq = igt_spinner_create_request(&spin,
> -							engine->kernel_context,
> -							MI_NOOP);
> -			if (IS_ERR(rq)) {
> -				st_engine_heartbeat_enable(engine);
> -				err = PTR_ERR(rq);
> -				break;
> -			}
> +		st_engine_heartbeat_disable(engine);
>
> -			i915_request_add(rq);
> +		rq = igt_spinner_create_request(&spin,
> +						engine->kernel_context,
> +						MI_NOOP);
> +		if (IS_ERR(rq)) {
> +			err = PTR_ERR(rq);
> +			st_engine_heartbeat_enable(engine);
> +			break;
> +		}
>
> -			if (!igt_wait_for_spinner(&spin, rq)) {
> -				pr_err("%s: SLPC spinner did not start\n",
> -				       engine->name);
> -				igt_spinner_end(&spin);
> -				st_engine_heartbeat_enable(engine);
> -				intel_gt_set_wedged(engine->gt);
> -				err = -EIO;
> -				break;
> -			}
> +		i915_request_add(rq);
> +
> +		if (!igt_wait_for_spinner(&spin, rq)) {
> +			pr_err("%s: Spinner did not start\n",
> +			       engine->name);
> +			igt_spinner_end(&spin);
> +			st_engine_heartbeat_enable(engine);
> +			intel_gt_set_wedged(engine->gt);
> +			err = -EIO;
> +			break;
> +		}
>
> -			delay_for_h2g();
> +		switch (test_type) {
>
> -			/* Verify that SWREQ indeed was set to specific value */
> -			req_freq = intel_rps_read_punit_req_frequency(rps);
> +		case VARY_MIN:
> +			err = vary_min_freq(slpc, rps, &max_act_freq);
> +			break;
> +
> +		case VARY_MAX:
> +			err = vary_max_freq(slpc, rps, &max_act_freq);
> +			break;
>
> -			/* GuC requests freq in multiples of 50/3 MHz */
> -			if (req_freq > (max_freq + FREQUENCY_REQ_UNIT)) {
> -				pr_err("SWReq is %d, should be at most %d\n", req_freq,
> -				       max_freq + FREQUENCY_REQ_UNIT);
> +		case MAX_GRANTED:
> +			/* Media engines have a different RP0 */
> +			if ((engine->class == VIDEO_DECODE_CLASS) ||
> +			    (engine->class == VIDEO_ENHANCEMENT_CLASS)) {
>				igt_spinner_end(&spin);
>				st_engine_heartbeat_enable(engine);
> -				err = -EINVAL;
> -				break;
> +				err = 0;
> +				continue;

I think it's preferable to move this media engine code out of the main loop
into max_granted_freq() function if possible (maybe by faking max_act_freq
if needed)?

>			}
>
> -			act_freq =  intel_rps_read_actual_frequency(rps);
> -			if (act_freq > max_act_freq)
> -				max_act_freq = act_freq;
> -
> -			st_engine_heartbeat_enable(engine);
> -			igt_spinner_end(&spin);
> -
> -			if (err)
> -				break;
> +			err = max_granted_freq(slpc, rps, &max_act_freq);
> +			break;
>		}
>
>		pr_info("Max actual frequency for %s was %d\n",
> @@ -277,31 +242,59 @@ static int live_slpc_clamp_max(void *arg)
>			err = -EINVAL;
>		}
>
> -		if (igt_flush_test(gt->i915)) {
> -			err = -EIO;
> -			break;
> -		}
> +		igt_spinner_end(&spin);
> +		st_engine_heartbeat_enable(engine);
>
>		if (err)
>			break;
>	}
>
> -	/* Restore min/max freq */
> +	/* Restore min/max frequencies */
>	slpc_set_max_freq(slpc, slpc_max_freq);
>	slpc_set_min_freq(slpc, slpc_min_freq);

As mentioned above maybe we should restore at the beginning of the test too
(before the for_each_engine() loop) to start from a known state?

Anyway here maybe get rid of the variables and:

        slpc_set_max_freq(slpc, slpc->rp0_freq);
        slpc_set_min_freq(slpc, slpc->min_freq);

Thanks.
--
Ashutosh


More information about the Intel-gfx mailing list