[Intel-gfx] [PATCH 2/6] drm/i915: Store CS timestamp frequency in Hz
Lionel Landwerlin
lionel.g.landwerlin at intel.com
Wed May 13 15:08:03 UTC 2020
On 02/03/2020 16:39, Ville Syrjala wrote:
> From: Ville Syrjälä <ville.syrjala at linux.intel.com>
>
> kHz isn't accurate enough for storing the CS timestamp
> frequency on some of the platforms. Store the value
> in Hz instead.
>
> Cc: Lionel Landwerlin <lionel.g.landwerlin at intel.com>
> Signed-off-by: Ville Syrjälä <ville.syrjala at linux.intel.com>
Probably the only patch in this series where I'm qualified to review :)
Reviewed-by: Lionel Landwerlin <lionel.g.landwerlin at intel.com>
> ---
> drivers/gpu/drm/i915/i915_debugfs.c | 6 ++--
> drivers/gpu/drm/i915/i915_getparam.c | 2 +-
> drivers/gpu/drm/i915/i915_perf.c | 12 ++++----
> drivers/gpu/drm/i915/intel_device_info.c | 34 +++++++++++-----------
> drivers/gpu/drm/i915/intel_device_info.h | 2 +-
> drivers/gpu/drm/i915/selftests/i915_perf.c | 4 +--
> 6 files changed, 30 insertions(+), 30 deletions(-)
>
> diff --git a/drivers/gpu/drm/i915/i915_debugfs.c b/drivers/gpu/drm/i915/i915_debugfs.c
> index 8f2525e4ce0f..c0e54c500017 100644
> --- a/drivers/gpu/drm/i915/i915_debugfs.c
> +++ b/drivers/gpu/drm/i915/i915_debugfs.c
> @@ -1790,8 +1790,8 @@ static int i915_engine_info(struct seq_file *m, void *unused)
> seq_printf(m, "GT awake? %s [%d]\n",
> yesno(dev_priv->gt.awake),
> atomic_read(&dev_priv->gt.wakeref.count));
> - seq_printf(m, "CS timestamp frequency: %u kHz\n",
> - RUNTIME_INFO(dev_priv)->cs_timestamp_frequency_khz);
> + seq_printf(m, "CS timestamp frequency: %u Hz\n",
> + RUNTIME_INFO(dev_priv)->cs_timestamp_frequency_hz);
>
> p = drm_seq_file_printer(m);
> for_each_uabi_engine(engine, dev_priv)
> @@ -1890,7 +1890,7 @@ static int
> i915_perf_noa_delay_set(void *data, u64 val)
> {
> struct drm_i915_private *i915 = data;
> - const u32 clk = RUNTIME_INFO(i915)->cs_timestamp_frequency_khz;
> + const u32 clk = RUNTIME_INFO(i915)->cs_timestamp_frequency_hz / 1000;
>
> /*
> * This would lead to infinite waits as we're doing timestamp
> diff --git a/drivers/gpu/drm/i915/i915_getparam.c b/drivers/gpu/drm/i915/i915_getparam.c
> index 54fce81d5724..d042644b9cd2 100644
> --- a/drivers/gpu/drm/i915/i915_getparam.c
> +++ b/drivers/gpu/drm/i915/i915_getparam.c
> @@ -153,7 +153,7 @@ int i915_getparam_ioctl(struct drm_device *dev, void *data,
> return -ENODEV;
> break;
> case I915_PARAM_CS_TIMESTAMP_FREQUENCY:
> - value = 1000 * RUNTIME_INFO(i915)->cs_timestamp_frequency_khz;
> + value = RUNTIME_INFO(i915)->cs_timestamp_frequency_hz;
> break;
> case I915_PARAM_MMAP_GTT_COHERENT:
> value = INTEL_INFO(i915)->has_coherent_ggtt;
> diff --git a/drivers/gpu/drm/i915/i915_perf.c b/drivers/gpu/drm/i915/i915_perf.c
> index 716fe6e4e56c..a2f98fb08bf1 100644
> --- a/drivers/gpu/drm/i915/i915_perf.c
> +++ b/drivers/gpu/drm/i915/i915_perf.c
> @@ -1668,8 +1668,8 @@ static int alloc_noa_wait(struct i915_perf_stream *stream)
> struct i915_vma *vma;
> const u64 delay_ticks = 0xffffffffffffffff -
> DIV_ROUND_UP_ULL(atomic64_read(&stream->perf->noa_programming_delay) *
> - RUNTIME_INFO(i915)->cs_timestamp_frequency_khz,
> - 1000000);
> + RUNTIME_INFO(i915)->cs_timestamp_frequency_hz,
> + 1000000000);
> const u32 base = stream->engine->mmio_base;
> #define CS_GPR(x) GEN8_RING_CS_GPR(base, x)
> u32 *batch, *ts0, *cs, *jump;
> @@ -3466,8 +3466,8 @@ i915_perf_open_ioctl_locked(struct i915_perf *perf,
>
> static u64 oa_exponent_to_ns(struct i915_perf *perf, int exponent)
> {
> - return div_u64(1000000 * (2ULL << exponent),
> - RUNTIME_INFO(perf->i915)->cs_timestamp_frequency_khz);
> + return div_u64(1000000000 * (2ULL << exponent),
> + RUNTIME_INFO(perf->i915)->cs_timestamp_frequency_hz);
> }
>
> /**
> @@ -4359,8 +4359,8 @@ void i915_perf_init(struct drm_i915_private *i915)
> if (perf->ops.enable_metric_set) {
> mutex_init(&perf->lock);
>
> - oa_sample_rate_hard_limit = 1000 *
> - (RUNTIME_INFO(i915)->cs_timestamp_frequency_khz / 2);
> + oa_sample_rate_hard_limit =
> + RUNTIME_INFO(i915)->cs_timestamp_frequency_hz / 2;
>
> mutex_init(&perf->metrics_lock);
> idr_init(&perf->metrics_idr);
> diff --git a/drivers/gpu/drm/i915/intel_device_info.c b/drivers/gpu/drm/i915/intel_device_info.c
> index d7fe12734db8..32733535964d 100644
> --- a/drivers/gpu/drm/i915/intel_device_info.c
> +++ b/drivers/gpu/drm/i915/intel_device_info.c
> @@ -135,8 +135,8 @@ void intel_device_info_print_runtime(const struct intel_runtime_info *info,
> sseu_dump(&info->sseu, p);
>
> drm_printf(p, "rawclk rate: %u kHz\n", info->rawclk_freq);
> - drm_printf(p, "CS timestamp frequency: %u kHz\n",
> - info->cs_timestamp_frequency_khz);
> + drm_printf(p, "CS timestamp frequency: %u Hz\n",
> + info->cs_timestamp_frequency_hz);
> }
>
> static int sseu_eu_idx(const struct sseu_dev_info *sseu, int slice,
> @@ -677,12 +677,12 @@ static u32 read_reference_ts_freq(struct drm_i915_private *dev_priv)
>
> base_freq = ((ts_override & GEN9_TIMESTAMP_OVERRIDE_US_COUNTER_DIVIDER_MASK) >>
> GEN9_TIMESTAMP_OVERRIDE_US_COUNTER_DIVIDER_SHIFT) + 1;
> - base_freq *= 1000;
> + base_freq *= 1000000;
>
> frac_freq = ((ts_override &
> GEN9_TIMESTAMP_OVERRIDE_US_COUNTER_DENOMINATOR_MASK) >>
> GEN9_TIMESTAMP_OVERRIDE_US_COUNTER_DENOMINATOR_SHIFT);
> - frac_freq = 1000 / (frac_freq + 1);
> + frac_freq = 1000000 / (frac_freq + 1);
>
> return base_freq + frac_freq;
> }
> @@ -690,8 +690,8 @@ static u32 read_reference_ts_freq(struct drm_i915_private *dev_priv)
> static u32 gen10_get_crystal_clock_freq(struct drm_i915_private *dev_priv,
> u32 rpm_config_reg)
> {
> - u32 f19_2_mhz = 19200;
> - u32 f24_mhz = 24000;
> + u32 f19_2_mhz = 19200000;
> + u32 f24_mhz = 24000000;
> u32 crystal_clock = (rpm_config_reg &
> GEN9_RPM_CONFIG0_CRYSTAL_CLOCK_FREQ_MASK) >>
> GEN9_RPM_CONFIG0_CRYSTAL_CLOCK_FREQ_SHIFT;
> @@ -710,10 +710,10 @@ static u32 gen10_get_crystal_clock_freq(struct drm_i915_private *dev_priv,
> static u32 gen11_get_crystal_clock_freq(struct drm_i915_private *dev_priv,
> u32 rpm_config_reg)
> {
> - u32 f19_2_mhz = 19200;
> - u32 f24_mhz = 24000;
> - u32 f25_mhz = 25000;
> - u32 f38_4_mhz = 38400;
> + u32 f19_2_mhz = 19200000;
> + u32 f24_mhz = 24000000;
> + u32 f25_mhz = 25000000;
> + u32 f38_4_mhz = 38400000;
> u32 crystal_clock = (rpm_config_reg &
> GEN11_RPM_CONFIG0_CRYSTAL_CLOCK_FREQ_MASK) >>
> GEN11_RPM_CONFIG0_CRYSTAL_CLOCK_FREQ_SHIFT;
> @@ -735,9 +735,9 @@ static u32 gen11_get_crystal_clock_freq(struct drm_i915_private *dev_priv,
>
> static u32 read_timestamp_frequency(struct drm_i915_private *dev_priv)
> {
> - u32 f12_5_mhz = 12500;
> - u32 f19_2_mhz = 19200;
> - u32 f24_mhz = 24000;
> + u32 f12_5_mhz = 12500000;
> + u32 f19_2_mhz = 19200000;
> + u32 f24_mhz = 24000000;
>
> if (INTEL_GEN(dev_priv) <= 4) {
> /* PRMs say:
> @@ -746,7 +746,7 @@ static u32 read_timestamp_frequency(struct drm_i915_private *dev_priv)
> * hclks." (through the “Clocking Configuration”
> * (“CLKCFG”) MCHBAR register)
> */
> - return RUNTIME_INFO(dev_priv)->rawclk_freq / 16;
> + return RUNTIME_INFO(dev_priv)->rawclk_freq * 1000 / 16;
> } else if (INTEL_GEN(dev_priv) <= 8) {
> /* PRMs say:
> *
> @@ -1050,11 +1050,11 @@ void intel_device_info_runtime_init(struct drm_i915_private *dev_priv)
> drm_dbg(&dev_priv->drm, "rawclk rate: %d kHz\n", runtime->rawclk_freq);
>
> /* Initialize command stream timestamp frequency */
> - runtime->cs_timestamp_frequency_khz =
> + runtime->cs_timestamp_frequency_hz =
> read_timestamp_frequency(dev_priv);
> - if (runtime->cs_timestamp_frequency_khz) {
> + if (runtime->cs_timestamp_frequency_hz) {
> runtime->cs_timestamp_period_ns =
> - div_u64(1e6, runtime->cs_timestamp_frequency_khz);
> + div_u64(1e9, runtime->cs_timestamp_frequency_hz);
> drm_dbg(&dev_priv->drm,
> "CS timestamp wraparound in %lldms\n",
> div_u64(mul_u32_u32(runtime->cs_timestamp_period_ns,
> diff --git a/drivers/gpu/drm/i915/intel_device_info.h b/drivers/gpu/drm/i915/intel_device_info.h
> index 1ecb9df2de91..432e9c7c0fe7 100644
> --- a/drivers/gpu/drm/i915/intel_device_info.h
> +++ b/drivers/gpu/drm/i915/intel_device_info.h
> @@ -218,7 +218,7 @@ struct intel_runtime_info {
>
> u32 rawclk_freq;
>
> - u32 cs_timestamp_frequency_khz;
> + u32 cs_timestamp_frequency_hz;
> u32 cs_timestamp_period_ns;
>
> /* Media engine access to SFC per instance */
> diff --git a/drivers/gpu/drm/i915/selftests/i915_perf.c b/drivers/gpu/drm/i915/selftests/i915_perf.c
> index d1a1568c47ba..dea0c5dd2739 100644
> --- a/drivers/gpu/drm/i915/selftests/i915_perf.c
> +++ b/drivers/gpu/drm/i915/selftests/i915_perf.c
> @@ -180,8 +180,8 @@ static int live_noa_delay(void *arg)
>
> delay = intel_read_status_page(stream->engine, 0x102);
> delay -= intel_read_status_page(stream->engine, 0x100);
> - delay = div_u64(mul_u32_u32(delay, 1000 * 1000),
> - RUNTIME_INFO(i915)->cs_timestamp_frequency_khz);
> + delay = div_u64(mul_u32_u32(delay, 1000000000),
> + RUNTIME_INFO(i915)->cs_timestamp_frequency_hz);
> pr_info("GPU delay: %uns, expected %lluns\n",
> delay, expected);
>
More information about the Intel-gfx
mailing list