[Intel-gfx] [PATCH v2 14/15] drm/i915: Use ttm mmap handling for ttm bo's.

Thomas Hellström thomas.hellstrom at linux.intel.com
Tue May 18 09:17:41 UTC 2021


On 5/18/21 10:27 AM, Thomas Hellström wrote:
> From: Maarten Lankhorst <maarten.lankhorst at linux.intel.com>
>
> Use the ttm handlers for servicing page faults, and vm_access.
>
> Signed-off-by: Maarten Lankhorst <maarten.lankhorst at linux.intel.com>

LGTM. Just need to make sure we don't forget about the caching.

Reviewed-by: Thomas Hellström <thomas.hellstrom at linux.intel.com>



> ---
>   drivers/gpu/drm/i915/gem/i915_gem_mman.c      |  17 ++-
>   drivers/gpu/drm/i915/gem/i915_gem_mman.h      |   2 +
>   .../gpu/drm/i915/gem/i915_gem_object_types.h  |   1 +
>   drivers/gpu/drm/i915/gem/i915_gem_ttm.c       | 105 +++++++++++++++++-
>   4 files changed, 118 insertions(+), 7 deletions(-)
>
> diff --git a/drivers/gpu/drm/i915/gem/i915_gem_mman.c b/drivers/gpu/drm/i915/gem/i915_gem_mman.c
> index 65db290efd16..2bf89349dde9 100644
> --- a/drivers/gpu/drm/i915/gem/i915_gem_mman.c
> +++ b/drivers/gpu/drm/i915/gem/i915_gem_mman.c
> @@ -19,6 +19,7 @@
>   #include "i915_gem_mman.h"
>   #include "i915_trace.h"
>   #include "i915_user_extensions.h"
> +#include "i915_gem_ttm.h"
>   #include "i915_vma.h"
>   
>   static inline bool
> @@ -789,7 +790,7 @@ i915_gem_mmap_offset_ioctl(struct drm_device *dev, void *data,
>   	return __assign_mmap_offset(file, args->handle, type, &args->offset);
>   }
>   
> -static void vm_open(struct vm_area_struct *vma)
> +void i915_gem_mmap_vm_open(struct vm_area_struct *vma)
>   {
>   	struct i915_mmap_offset *mmo = vma->vm_private_data;
>   	struct drm_i915_gem_object *obj = mmo->obj;
> @@ -798,7 +799,7 @@ static void vm_open(struct vm_area_struct *vma)
>   	i915_gem_object_get(obj);
>   }
>   
> -static void vm_close(struct vm_area_struct *vma)
> +void i915_gem_mmap_vm_close(struct vm_area_struct *vma)
>   {
>   	struct i915_mmap_offset *mmo = vma->vm_private_data;
>   	struct drm_i915_gem_object *obj = mmo->obj;
> @@ -810,15 +811,15 @@ static void vm_close(struct vm_area_struct *vma)
>   static const struct vm_operations_struct vm_ops_gtt = {
>   	.fault = vm_fault_gtt,
>   	.access = vm_access,
> -	.open = vm_open,
> -	.close = vm_close,
> +	.open = i915_gem_mmap_vm_open,
> +	.close = i915_gem_mmap_vm_close,
>   };
>   
>   static const struct vm_operations_struct vm_ops_cpu = {
>   	.fault = vm_fault_cpu,
>   	.access = vm_access,
> -	.open = vm_open,
> -	.close = vm_close,
> +	.open = i915_gem_mmap_vm_open,
> +	.close = i915_gem_mmap_vm_close,
>   };
>   
>   static int singleton_release(struct inode *inode, struct file *file)
> @@ -953,6 +954,10 @@ int i915_gem_mmap(struct file *filp, struct vm_area_struct *vma)
>   	}
>   	vma->vm_page_prot = pgprot_decrypted(vma->vm_page_prot);
>   
> +	/* override ops per-object if desired */
> +	if (obj->ops->mmap_ops)
> +		vma->vm_ops = obj->ops->mmap_ops;
> +
>   	return 0;
>   }
>   
> diff --git a/drivers/gpu/drm/i915/gem/i915_gem_mman.h b/drivers/gpu/drm/i915/gem/i915_gem_mman.h
> index efee9e0d2508..e5bd02a6db12 100644
> --- a/drivers/gpu/drm/i915/gem/i915_gem_mman.h
> +++ b/drivers/gpu/drm/i915/gem/i915_gem_mman.h
> @@ -28,5 +28,7 @@ void __i915_gem_object_release_mmap_gtt(struct drm_i915_gem_object *obj);
>   void i915_gem_object_release_mmap_gtt(struct drm_i915_gem_object *obj);
>   
>   void i915_gem_object_release_mmap_offset(struct drm_i915_gem_object *obj);
> +void i915_gem_mmap_vm_open(struct vm_area_struct *vma);
> +void i915_gem_mmap_vm_close(struct vm_area_struct *vma);
>   
>   #endif
> diff --git a/drivers/gpu/drm/i915/gem/i915_gem_object_types.h b/drivers/gpu/drm/i915/gem/i915_gem_object_types.h
> index b350765e1935..31d828e91cf4 100644
> --- a/drivers/gpu/drm/i915/gem/i915_gem_object_types.h
> +++ b/drivers/gpu/drm/i915/gem/i915_gem_object_types.h
> @@ -79,6 +79,7 @@ struct drm_i915_gem_object_ops {
>   	void (*delayed_free)(struct drm_i915_gem_object *obj);
>   	void (*release)(struct drm_i915_gem_object *obj);
>   
> +	const struct vm_operations_struct *mmap_ops;
>   	const char *name; /* friendly name for debug, e.g. lockdep classes */
>   };
>   
> diff --git a/drivers/gpu/drm/i915/gem/i915_gem_ttm.c b/drivers/gpu/drm/i915/gem/i915_gem_ttm.c
> index 790f5ec45c4d..fe9ac50b2470 100644
> --- a/drivers/gpu/drm/i915/gem/i915_gem_ttm.c
> +++ b/drivers/gpu/drm/i915/gem/i915_gem_ttm.c
> @@ -14,6 +14,7 @@
>   #include "gem/i915_gem_region.h"
>   #include "gem/i915_gem_ttm.h"
>   #include "gem/i915_gem_ttm_bo_util.h"
> +#include "gem/i915_gem_mman.h"
>   
>   #define I915_PL_LMEM0 TTM_PL_PRIV
>   #define I915_PL_SYSTEM TTM_PL_SYSTEM
> @@ -345,6 +346,44 @@ static int i915_ttm_move(struct ttm_buffer_object *bo, bool evict,
>   	return 0;
>   }
>   
> +static int i915_ttm_io_mem_reserve(struct ttm_device *bdev, struct ttm_resource *mem)
> +{
> +	if (mem->mem_type < I915_PL_LMEM0)
> +		return 0;
> +
> +	/* We may need to revisit this later, but this allows all caching to be used in mmap */
> +	mem->bus.caching = ttm_cached;
> +	mem->bus.is_iomem = true;
> +
> +	return 0;
> +}
> +
> +static unsigned long i915_ttm_io_mem_pfn(struct ttm_buffer_object *bo,
> +					 unsigned long page_offset)
> +{
> +	struct drm_i915_gem_object *obj = i915_ttm_to_gem(bo);
> +	struct sg_table *sgt = obj->ttm.cached_io_st;
> +	struct scatterlist *sg;
> +	unsigned int i;
> +
> +	GEM_WARN_ON(bo->ttm);
> +
> +	for_each_sgtable_dma_sg(sgt, sg, i) {
> +		unsigned long sg_max = sg->length >> PAGE_SHIFT;
> +
> +		if (page_offset < sg_max) {
> +			unsigned long base =
> +				obj->mm.region->iomap.base - obj->mm.region->region.start;
> +
> +			return ((base + sg_dma_address(sg)) >> PAGE_SHIFT) + page_offset;
> +		}
> +
> +		page_offset -= sg_max;
> +	}
> +	GEM_BUG_ON(1);
> +	return 0;
> +}
> +
>   struct ttm_device_funcs i915_ttm_bo_driver = {
>   	.ttm_tt_create = i915_ttm_tt_create,
>   	.ttm_tt_unpopulate = i915_ttm_tt_unpopulate,
> @@ -355,6 +394,8 @@ struct ttm_device_funcs i915_ttm_bo_driver = {
>   	.verify_access = NULL,
>   	.swap_notify = i915_ttm_swap_notify,
>   	.delete_mem_notify = i915_ttm_delete_mem_notify,
> +	.io_mem_reserve = i915_ttm_io_mem_reserve,
> +	.io_mem_pfn = i915_ttm_io_mem_pfn,
>   };
>   
>   static int i915_ttm_get_pages(struct drm_i915_gem_object *obj)
> @@ -454,7 +495,68 @@ static void i915_ttm_delayed_free(struct drm_i915_gem_object *obj)
>   	ttm_bo_put(i915_gem_to_ttm(obj));
>   }
>   
> -static const struct drm_i915_gem_object_ops i915_gem_ttm_obj_ops = {
> +static vm_fault_t vm_fault_ttm(struct vm_fault *vmf)
> +{
> +	struct vm_area_struct *area = vmf->vma;
> +	struct i915_mmap_offset *mmo = area->vm_private_data;
> +	struct drm_i915_gem_object *obj = mmo->obj;
> +	vm_fault_t ret;
> +
> +	/* Sanity check that we allow writing into this object */
> +	if (unlikely(i915_gem_object_is_readonly(obj) &&
> +		     area->vm_flags & VM_WRITE))
> +		return VM_FAULT_SIGBUS;
> +
> +	ret = ttm_bo_vm_reserve(i915_gem_to_ttm(obj), vmf);
> +	if (ret)
> +		return ret;
> +
> +	ret = ttm_bo_vm_fault_reserved(i915_gem_to_ttm(obj), vmf,
> +				       drm_vma_node_start(&mmo->vma_node),
> +				       vmf->vma->vm_page_prot,
> +				       TTM_BO_VM_NUM_PREFAULT, 1);
> +	if (ret == VM_FAULT_RETRY && !(vmf->flags & FAULT_FLAG_RETRY_NOWAIT))
> +		return ret;
> +
> +	dma_resv_unlock(obj->base.resv);
> +
> +	return ret;
> +}
> +
> +static int
> +vm_access_ttm(struct vm_area_struct *area, unsigned long addr,
> +	  void *buf, int len, int write)
> +{
> +	struct i915_mmap_offset *mmo = area->vm_private_data;
> +	struct drm_i915_gem_object *obj = mmo->obj;
> +	int err = 0;
> +
> +	if (i915_gem_object_is_readonly(obj) && write)
> +		return -EACCES;
> +
> +	addr -= area->vm_start;
> +	if (addr >= obj->base.size)
> +		return -EINVAL;
> +
> +	err = i915_gem_object_lock_interruptible(obj, NULL);
> +	if (err)
> +		return err;
> +
> +	len = ttm_bo_vm_access_reserved(i915_gem_to_ttm(obj), area,
> +					addr, buf, len, write);
> +	i915_gem_object_unlock(obj);
> +
> +	return len;
> +}
> +
> +static const struct vm_operations_struct vm_ops_ttm = {
> +	.fault = vm_fault_ttm,
> +	.access = vm_access_ttm,
> +	.open = i915_gem_mmap_vm_open,
> +	.close = i915_gem_mmap_vm_close,
> +};
> +
> +const struct drm_i915_gem_object_ops i915_gem_ttm_obj_ops = {
>   	.name = "i915_gem_object_ttm",
>   	.flags = I915_GEM_OBJECT_HAS_IOMEM,
>   
> @@ -463,6 +565,7 @@ static const struct drm_i915_gem_object_ops i915_gem_ttm_obj_ops = {
>   	.truncate = i915_ttm_purge,
>   	.adjust_lru = i915_ttm_adjust_lru,
>   	.delayed_free = i915_ttm_delayed_free,
> +	.mmap_ops = &vm_ops_ttm,
>   };
>   
>   void i915_ttm_bo_destroy(struct ttm_buffer_object *bo)


More information about the Intel-gfx mailing list