[Intel-gfx] [PATCH 3/4] drm/i915: Per-process stats work better when evaluated per-process

Ben Widawsky benjamin.widawsky at intel.com
Wed Mar 19 01:05:45 CET 2014


On Thu, Mar 13, 2014 at 11:57:00AM -0300, Rodrigo Vivi wrote:
> From: Chris Wilson <chris at chris-wilson.co.uk>
> 
> The idea of printing objects used by each process is to judge how each
> process is using them. This means that we need to evaluate whether the
> object is bound for that particular process, rather than just whether it
> is bound into the global GTT.
> 
> Signed-off-by: Chris Wilson <chris at chris-wilson.co.uk>
> Cc: Ben Widawsky <benjamin.widawsky at intel.com>
> Signed-off-by: Rodrigo Vivi <rodrigo.vivi at gmail.com>
> ---
>  drivers/gpu/drm/i915/i915_debugfs.c     | 34 ++++++++++++++++++++++++++-------
>  drivers/gpu/drm/i915/i915_drv.h         |  2 ++
>  drivers/gpu/drm/i915/i915_gem_context.c |  1 +
>  3 files changed, 30 insertions(+), 7 deletions(-)
> 
> diff --git a/drivers/gpu/drm/i915/i915_debugfs.c b/drivers/gpu/drm/i915/i915_debugfs.c
> index a90d31c..ed3965f 100644
> --- a/drivers/gpu/drm/i915/i915_debugfs.c
> +++ b/drivers/gpu/drm/i915/i915_debugfs.c
> @@ -299,28 +299,46 @@ static int i915_gem_stolen_list_info(struct seq_file *m, void *data)
>  } while (0)
>  
>  struct file_stats {
> +	struct drm_i915_file_private *file_priv;
>  	int count;
> -	size_t total, active, inactive, unbound;
> +	size_t total, global, active, inactive, unbound;
>  };
>  
>  static int per_file_stats(int id, void *ptr, void *data)
>  {
>  	struct drm_i915_gem_object *obj = ptr;
>  	struct file_stats *stats = data;
> +	struct i915_vma *vma;
>  
>  	stats->count++;
>  	stats->total += obj->base.size;
>  
> -	if (i915_gem_obj_ggtt_bound(obj)) {
> -		if (!list_empty(&obj->ring_list))
> +	list_for_each_entry(vma, &obj->vma_list, vma_link) {
> +		struct i915_hw_ppgtt *ppgtt;
> +
> +		if (!drm_mm_node_allocated(&vma->node))
> +			continue;
> +
> +		ppgtt = container_of(vma->vm, struct i915_hw_ppgtt, base);
> +		if (ppgtt->ctx == NULL) {
> +			stats->global += obj->base.size;
> +			continue;
> +		}

I'm not really clear how this is supposed to work for global. Can you
make me happy and change it to:

if (i915_is_ggtt(vma->vm))

> +
> +		if (ppgtt->ctx->file_priv != stats->file_priv)
> +			continue;
> +
> +		if (obj->ring) /* XXX per-vma statistic */
>  			stats->active += obj->base.size;

Doesn't active get counted too many times if multiple VMAs exist for the
same active object (not a new problem to this patch)?

>  		else
>  			stats->inactive += obj->base.size;
> -	} else {
> -		if (!list_empty(&obj->global_list))
> -			stats->unbound += obj->base.size;
> +
> +		return 0;
>  	}
>  
> +	if (!list_empty(&obj->global_list))
> +		stats->unbound += obj->base.size;
> +
>  	return 0;
>  }
>  
> @@ -411,6 +429,7 @@ static int i915_gem_object_info(struct seq_file *m, void* data)
>  		struct task_struct *task;
>  
>  		memset(&stats, 0, sizeof(stats));
> +		stats.file_priv = file->driver_priv;
>  		idr_for_each(&file->object_idr, per_file_stats, &stats);
>  		/*
>  		 * Although we have a valid reference on file->pid, that does
> @@ -420,12 +439,13 @@ static int i915_gem_object_info(struct seq_file *m, void* data)
>  		 */
>  		rcu_read_lock();
>  		task = pid_task(file->pid, PIDTYPE_PID);
> -		seq_printf(m, "%s: %u objects, %zu bytes (%zu active, %zu inactive, %zu unbound)\n",
> +		seq_printf(m, "%s: %u objects, %zu bytes (%zu active, %zu inactive, %zu global, %zu unbound)\n",
>  			   task ? task->comm : "<unknown>",
>  			   stats.count,
>  			   stats.total,
>  			   stats.active,
>  			   stats.inactive,
> +			   stats.global,
>  			   stats.unbound);
>  		rcu_read_unlock();
>  	}
> diff --git a/drivers/gpu/drm/i915/i915_drv.h b/drivers/gpu/drm/i915/i915_drv.h
> index 2a319ba..b76c6de 100644
> --- a/drivers/gpu/drm/i915/i915_drv.h
> +++ b/drivers/gpu/drm/i915/i915_drv.h
> @@ -721,6 +721,8 @@ struct i915_hw_ppgtt {
>  		dma_addr_t *gen8_pt_dma_addr[4];
>  	};
>  
> +	struct i915_hw_context *ctx;
> +
>  	int (*enable)(struct i915_hw_ppgtt *ppgtt);
>  	int (*switch_mm)(struct i915_hw_ppgtt *ppgtt,
>  			 struct intel_ring_buffer *ring,
> diff --git a/drivers/gpu/drm/i915/i915_gem_context.c b/drivers/gpu/drm/i915/i915_gem_context.c
> index ce41cff..1a94b07 100644
> --- a/drivers/gpu/drm/i915/i915_gem_context.c
> +++ b/drivers/gpu/drm/i915/i915_gem_context.c
> @@ -215,6 +215,7 @@ create_vm_for_ctx(struct drm_device *dev, struct i915_hw_context *ctx)
>  		return ERR_PTR(ret);
>  	}
>  
> +	ppgtt->ctx = ctx;
>  	return ppgtt;
>  }
>  
> -- 
> 1.8.5.3
> 

-- 
Ben Widawsky, Intel Open Source Technology Center



More information about the Intel-gfx mailing list