[Intel-gfx] [PATCH v8 13/13] drm/i915: add support for perf configuration queries
Chris Wilson
chris at chris-wilson.co.uk
Wed Jul 10 11:04:38 UTC 2019
Quoting Lionel Landwerlin (2019-07-09 13:33:51)
> Listing configurations at the moment is supported only through sysfs.
> This might cause issues for applications wanting to list
> configurations from a container where sysfs isn't available.
>
> This change adds a way to query the number of configurations and their
> content through the i915 query uAPI.
>
> v2: Fix sparse warnings (Lionel)
> Add support to query configuration using uuid (Lionel)
>
> v3: Fix some inconsistency in uapi header (Lionel)
> Fix unlocking when not locked issue (Lionel)
> Add debug messages (Lionel)
>
> v4: Fix missing unlock (Dan)
>
> Signed-off-by: Lionel Landwerlin <lionel.g.landwerlin at intel.com>
> ---
> drivers/gpu/drm/i915/i915_drv.h | 6 +
> drivers/gpu/drm/i915/i915_perf.c | 3 +
> drivers/gpu/drm/i915/i915_query.c | 277 ++++++++++++++++++++++++++++++
> include/uapi/drm/i915_drm.h | 65 ++++++-
> 4 files changed, 348 insertions(+), 3 deletions(-)
>
> diff --git a/drivers/gpu/drm/i915/i915_drv.h b/drivers/gpu/drm/i915/i915_drv.h
> index c72e7c746b57..28f0f490b7b1 100644
> --- a/drivers/gpu/drm/i915/i915_drv.h
> +++ b/drivers/gpu/drm/i915/i915_drv.h
> @@ -1729,6 +1729,12 @@ struct drm_i915_private {
> */
> struct list_head metrics_buffers;
>
> + /*
> + * Number of dynamic configurations, you need to hold
> + * dev_priv->perf.metrics_lock to access it.
> + */
> + u32 n_metrics;
> +
> /*
> * Lock associated with anything below within this structure
> * except exclusive_stream.
> diff --git a/drivers/gpu/drm/i915/i915_perf.c b/drivers/gpu/drm/i915/i915_perf.c
> index dfd9ed4f321e..9cd1362d6922 100644
> --- a/drivers/gpu/drm/i915/i915_perf.c
> +++ b/drivers/gpu/drm/i915/i915_perf.c
> @@ -3722,6 +3722,8 @@ int i915_perf_add_config_ioctl(struct drm_device *dev, void *data,
> goto sysfs_err;
> }
>
> + dev_priv->perf.n_metrics++;
> +
> mutex_unlock(&dev_priv->perf.metrics_lock);
>
> DRM_DEBUG("Added config %s id=%i\n", oa_config->uuid, oa_config->id);
> @@ -3782,6 +3784,7 @@ int i915_perf_remove_config_ioctl(struct drm_device *dev, void *data,
> &oa_config->sysfs_metric);
>
> idr_remove(&dev_priv->perf.metrics_idr, *arg);
> + dev_priv->perf.n_metrics--;
>
> mutex_unlock(&dev_priv->perf.metrics_lock);
>
> diff --git a/drivers/gpu/drm/i915/i915_query.c b/drivers/gpu/drm/i915/i915_query.c
> index 7b7016171057..74b632998d0e 100644
> --- a/drivers/gpu/drm/i915/i915_query.c
> +++ b/drivers/gpu/drm/i915/i915_query.c
> @@ -143,10 +143,287 @@ query_engine_info(struct drm_i915_private *i915,
> return len;
> }
>
> +static int can_copy_perf_config_registers_or_number(u32 user_n_regs,
> + u64 user_regs_ptr,
> + u32 kernel_n_regs)
> +{
> + /*
> + * We'll just put the number of registers, and won't copy the
> + * register.
> + */
> + if (user_n_regs == 0)
> + return 0;
> +
> + if (user_n_regs < kernel_n_regs)
> + return -EINVAL;
> +
> + if (!access_ok(u64_to_user_ptr(user_regs_ptr),
> + 2 * sizeof(u32) * kernel_n_regs))
> + return -EFAULT;
> +
> + return 0;
> +}
> +
> +static int copy_perf_config_registers_or_number(const struct i915_oa_reg *kernel_regs,
> + u32 kernel_n_regs,
> + u64 user_regs_ptr,
> + u32 *user_n_regs)
> +{
> + u32 r;
> +
> + if (*user_n_regs == 0) {
> + *user_n_regs = kernel_n_regs;
> + return 0;
> + }
> +
> + *user_n_regs = kernel_n_regs;
> +
> + for (r = 0; r < kernel_n_regs; r++) {
> + u32 __user *user_reg_ptr =
> + u64_to_user_ptr(user_regs_ptr + sizeof(u32) * r * 2);
> + u32 __user *user_val_ptr =
> + u64_to_user_ptr(user_regs_ptr + sizeof(u32) * r * 2 +
> + sizeof(u32));
> + int ret;
> +
> + ret = __put_user(i915_mmio_reg_offset(kernel_regs[r].addr),
> + user_reg_ptr);
> + if (ret)
> + return -EFAULT;
> +
> + ret = __put_user(kernel_regs[r].value, user_val_ptr);
> + if (ret)
> + return -EFAULT;
> + }
> +
> + return 0;
> +}
> +
> +static int query_perf_config_data(struct drm_i915_private *i915,
> + struct drm_i915_query_item *query_item,
> + bool use_uuid)
> +{
> + struct drm_i915_query_perf_config __user *user_query_config_ptr =
> + u64_to_user_ptr(query_item->data_ptr);
> + struct drm_i915_perf_oa_config __user *user_config_ptr =
> + u64_to_user_ptr(query_item->data_ptr +
> + sizeof(struct drm_i915_query_perf_config));
> + struct drm_i915_perf_oa_config user_config;
> + struct i915_oa_config *oa_config = NULL;
> + char uuid[UUID_STRING_LEN + 1];
> + u64 config_id;
> + u32 flags, total_size;
> + int ret;
> +
> + if (!i915->perf.initialized)
> + return -ENODEV;
> +
> + total_size = sizeof(struct drm_i915_query_perf_config) +
> + sizeof(struct drm_i915_perf_oa_config);
> +
> + if (query_item->length == 0)
> + return total_size;
> +
> + if (query_item->length < total_size) {
> + DRM_DEBUG("Invalid query config data item size=%u expected=%u\n",
> + query_item->length, total_size);
> + return -EINVAL;
> + }
> +
> + if (!access_ok(user_query_config_ptr, total_size))
> + return -EFAULT;
> +
> + if (__get_user(flags, &user_query_config_ptr->flags))
> + return -EFAULT;
> +
> + if (flags != 0)
> + return -EINVAL;
> +
> + if (use_uuid) {
> + BUILD_BUG_ON(sizeof(user_query_config_ptr->uuid) >= sizeof(uuid));
> +
> + memset(&uuid, 0, sizeof(uuid));
> + if (__copy_from_user(uuid, user_query_config_ptr->uuid,
> + sizeof(user_query_config_ptr->uuid)))
> + return -EFAULT;
> + } else {
> + if (__get_user(config_id, &user_query_config_ptr->config)) {
> + return -EFAULT;
> + }
> + }
> +
> + ret = mutex_lock_interruptible(&i915->perf.metrics_lock);
> + if (ret)
> + return ret;
> +
> + if (use_uuid) {
> + struct i915_oa_config *tmp;
> + int id;
> +
> + idr_for_each_entry(&i915->perf.metrics_idr, tmp, id) {
> + if (!strcmp(tmp->uuid, uuid)) {
> + kref_get(&tmp->ref);
> + oa_config = tmp;
Bah, was expecting oa_config = oa_config_get(tmp);
> + break;
> + }
Pray be small. A secondary hashtable would be trivial to add if
required.
> + }
> + } else {
> + ret = i915_perf_get_oa_config(i915, config_id, &oa_config, NULL);
> + }
> +
> + mutex_unlock(&i915->perf.metrics_lock);
> +
> + if (ret || !oa_config)
> + return -ENOENT;
> +
> + if (__copy_from_user(&user_config, user_config_ptr,
> + sizeof(user_config))) {
> + ret = -EFAULT;
> + goto out;
> + }
> +
> + ret = can_copy_perf_config_registers_or_number(user_config.n_boolean_regs,
> + user_config.boolean_regs_ptr,
> + oa_config->b_counter_regs_len);
> + if (ret)
> + goto out;
> +
> + ret = can_copy_perf_config_registers_or_number(user_config.n_flex_regs,
> + user_config.flex_regs_ptr,
> + oa_config->flex_regs_len);
> + if (ret)
> + goto out;
> +
> + ret = can_copy_perf_config_registers_or_number(user_config.n_mux_regs,
> + user_config.mux_regs_ptr,
> + oa_config->mux_regs_len);
> + if (ret)
> + goto out;
> +
> + ret = copy_perf_config_registers_or_number(oa_config->b_counter_regs,
> + oa_config->b_counter_regs_len,
> + user_config.boolean_regs_ptr,
> + &user_config.n_boolean_regs);
> + if (ret)
> + goto out;
> +
> + ret = copy_perf_config_registers_or_number(oa_config->flex_regs,
> + oa_config->flex_regs_len,
> + user_config.flex_regs_ptr,
> + &user_config.n_flex_regs);
> + if (ret)
> + goto out;
> +
> + ret = copy_perf_config_registers_or_number(oa_config->mux_regs,
> + oa_config->mux_regs_len,
> + user_config.mux_regs_ptr,
> + &user_config.n_mux_regs);
> + if (ret)
> + goto out;
> +
> + memcpy(user_config.uuid, oa_config->uuid, sizeof(user_config.uuid));
> +
> + if (__copy_to_user(user_config_ptr, &user_config,
> + sizeof(user_config))) {
> + ret = -EFAULT;
> + goto out;
> + }
> +
> + ret = total_size;
> +
> +out:
> + i915_oa_config_put(oa_config);
Much more comfortable with all the user access out from under the locks.
> +
> + return ret;
> +}
> +
> +static int query_perf_config_list(struct drm_i915_private *i915,
> + struct drm_i915_query_item *query_item)
> +{
> + struct drm_i915_query_perf_config __user *user_query_config_ptr =
> + u64_to_user_ptr(query_item->data_ptr);
> + struct i915_oa_config *oa_config;
> + u32 flags, total_size;
> + u64 n_configs;
> + int ret, id;
> +
> + if (!i915->perf.initialized)
> + return -ENODEV;
> +
> + /* Count the default test configuration */
> + n_configs = i915->perf.n_metrics + 1;
> + total_size = sizeof(struct drm_i915_query_perf_config) +
> + sizeof(u64) * n_configs;
> +
> + if (query_item->length == 0)
> + return total_size;
> +
> + if (query_item->length < total_size) {
> + DRM_DEBUG("Invalid query config list item size=%u expected=%u\n",
> + query_item->length, total_size);
> + return -EINVAL;
> + }
> +
> + if (!access_ok(user_query_config_ptr, total_size))
> + return -EFAULT;
> +
> + if (__get_user(flags, &user_query_config_ptr->flags))
> + return -EFAULT;
> +
> + if (flags != 0)
> + return -EINVAL;
> +
> + if (__put_user(n_configs, &user_query_config_ptr->config))
> + return -EFAULT;
> +
> + if (__put_user((u64)1ULL, &user_query_config_ptr->data[0]))
> + return -EFAULT;
> +
> + ret = mutex_lock_interruptible(&i915->perf.metrics_lock);
> + if (ret)
> + return ret;
> +
> + n_configs = 1;
> + idr_for_each_entry(&i915->perf.metrics_idr, oa_config, id) {
> + u64 __user *item =
> + u64_to_user_ptr(query_item->data_ptr +
> + sizeof(struct drm_i915_query_perf_config) +
> + n_configs * sizeof(u64));
> +
> + if (__put_user((u64)id, item)) {
Oh, that is a nuisance.
It would be easy to avoid the lock here by using a temporary kmalloc,
and this should not be a hot path...
(A stitch in time is worth nine :)
With a temporary copy,
Reviewed-by: Chris Wilson <chris at chris-wilson.co.uk>
Probably best to grab Tvrtko to see if he can spot potential issues with
i915_query usage.
-Chris
More information about the Intel-gfx
mailing list