[Intel-gfx] [RFC 06/14] drm/i915/pmu: Only sample enabled samplers
Tvrtko Ursulin
tursulin at ursulin.net
Tue Jul 18 14:36:10 UTC 2017
From: Tvrtko Ursulin <tvrtko.ursulin at intel.com>
Save some execution time by not reading the MMIO registers
for the samplers which are not enabled.
Signed-off-by: Tvrtko Ursulin <tvrtko.ursulin at intel.com>
---
drivers/gpu/drm/i915/i915_pmu.c | 49 +++++++++++++++++++++++++++--------------
1 file changed, 33 insertions(+), 16 deletions(-)
diff --git a/drivers/gpu/drm/i915/i915_pmu.c b/drivers/gpu/drm/i915/i915_pmu.c
index d80e673477b5..4d61a1e72ee6 100644
--- a/drivers/gpu/drm/i915/i915_pmu.c
+++ b/drivers/gpu/drm/i915/i915_pmu.c
@@ -29,6 +29,14 @@ static const unsigned int user_engine_map[I915_NUM_ENGINES] = {
[I915_SAMPLE_VECS] = VECS,
};
+static bool grab_forcewake(struct drm_i915_private *i915, bool fw)
+{
+ if (!fw)
+ intel_uncore_forcewake_get(i915, FORCEWAKE_ALL);
+
+ return true;
+}
+
static void engines_sample(struct drm_i915_private *dev_priv)
{
struct intel_engine_cs *engine;
@@ -46,6 +54,7 @@ static void engines_sample(struct drm_i915_private *dev_priv)
for_each_engine(engine, dev_priv, id) {
unsigned int user_engine = engine_map[id];
+ u8 sample_mask;
u32 val;
if (WARN_ON_ONCE(id >= ARRAY_SIZE(engine_map)))
@@ -53,30 +62,38 @@ static void engines_sample(struct drm_i915_private *dev_priv)
else
user_engine = engine_map[id];
- if (!(dev_priv->pmu.enable &
- (ENGINE_SAMPLE_MASK << (ENGINE_SAMPLE_BITS * user_engine))))
+ sample_mask = (dev_priv->pmu.enable >>
+ (ENGINE_SAMPLE_BITS * user_engine)) &
+ ENGINE_SAMPLE_MASK;
+
+ if (!sample_mask)
continue;
if (i915_seqno_passed(intel_engine_get_seqno(engine),
intel_engine_last_submit(engine)))
continue;
- if (!fw) {
- intel_uncore_forcewake_get(dev_priv, FORCEWAKE_ALL);
- fw = true;
- }
-
- engine->pmu_sample[I915_SAMPLE_QUEUED] += PERIOD;
+ if (sample_mask & BIT(I915_SAMPLE_QUEUED))
+ engine->pmu_sample[I915_SAMPLE_QUEUED] += PERIOD;
- val = I915_READ_FW(RING_MI_MODE(engine->mmio_base));
- if (!(val & MODE_IDLE))
- engine->pmu_sample[I915_SAMPLE_BUSY] += PERIOD;
+ if (sample_mask & BIT(I915_SAMPLE_BUSY)) {
+ fw = grab_forcewake(dev_priv, fw);
+ val = I915_READ_FW(RING_MI_MODE(engine->mmio_base));
+ if (!(val & MODE_IDLE))
+ engine->pmu_sample[I915_SAMPLE_BUSY] += PERIOD;
+ }
- val = I915_READ_FW(RING_CTL(engine->mmio_base));
- if (val & RING_WAIT)
- engine->pmu_sample[I915_SAMPLE_WAIT] += PERIOD;
- if (val & RING_WAIT_SEMAPHORE)
- engine->pmu_sample[I915_SAMPLE_SEMA] += PERIOD;
+ if (sample_mask &
+ (BIT(I915_SAMPLE_WAIT) | BIT(I915_SAMPLE_SEMA))) {
+ fw = grab_forcewake(dev_priv, fw);
+ val = I915_READ_FW(RING_CTL(engine->mmio_base));
+ if ((sample_mask & BIT(I915_SAMPLE_WAIT)) &&
+ (val & RING_WAIT))
+ engine->pmu_sample[I915_SAMPLE_WAIT] += PERIOD;
+ if ((sample_mask & BIT(I915_SAMPLE_SEMA)) &&
+ (val & RING_WAIT_SEMAPHORE))
+ engine->pmu_sample[I915_SAMPLE_SEMA] += PERIOD;
+ }
}
if (fw)
--
2.9.4
More information about the Intel-gfx
mailing list