[Intel-gfx] [PATCH v5 2/6] drm/i915: Use the vma resource as argument for gtt binding / unbinding
Matthew Auld
matthew.auld at intel.com
Thu Jan 6 16:01:04 UTC 2022
On 04/01/2022 12:51, Thomas Hellström wrote:
> When introducing asynchronous unbinding, the vma itself may no longer
> be alive when the actual binding or unbinding takes place.
>
> Update the gtt i915_vma_ops accordingly to take a struct i915_vma_resource
> instead of a struct i915_vma for the bind_vma() and unbind_vma() ops.
> Similarly change the insert_entries() op for struct i915_address_space.
>
> Replace a couple of i915_vma_snapshot members with their newly introduced
> i915_vma_resource counterparts, since they have the same lifetime.
>
> Also make sure to avoid changing i915_vma::flags (in particular the
> bind flags) asynchronously. That should now only be done synchronously
> under the vm mutex.
>
> v2:
> - Update the vma_res::bound_flags when binding to the aliased ggtt
>
> Signed-off-by: Thomas Hellström <thomas.hellstrom at linux.intel.com>
> ---
> drivers/gpu/drm/i915/display/intel_dpt.c | 27 ++---
> .../gpu/drm/i915/gem/i915_gem_object_types.h | 27 +----
> .../gpu/drm/i915/gem/selftests/huge_pages.c | 37 +++----
> drivers/gpu/drm/i915/gt/gen6_ppgtt.c | 19 ++--
> drivers/gpu/drm/i915/gt/gen8_ppgtt.c | 37 +++----
> drivers/gpu/drm/i915/gt/intel_engine_cs.c | 4 +-
> drivers/gpu/drm/i915/gt/intel_ggtt.c | 70 ++++++-------
> drivers/gpu/drm/i915/gt/intel_gtt.h | 16 +--
> drivers/gpu/drm/i915/gt/intel_ppgtt.c | 22 +++--
> drivers/gpu/drm/i915/gt/uc/intel_uc_fw.c | 13 ++-
> drivers/gpu/drm/i915/gt/uc/intel_uc_fw.h | 2 +-
> drivers/gpu/drm/i915/i915_debugfs.c | 3 +-
> drivers/gpu/drm/i915/i915_gpu_error.c | 6 +-
> drivers/gpu/drm/i915/i915_vma.c | 24 ++++-
> drivers/gpu/drm/i915/i915_vma.h | 11 +--
> drivers/gpu/drm/i915/i915_vma_resource.c | 9 +-
> drivers/gpu/drm/i915/i915_vma_resource.h | 99 ++++++++++++++++++-
> drivers/gpu/drm/i915/i915_vma_snapshot.c | 4 -
> drivers/gpu/drm/i915/i915_vma_snapshot.h | 8 --
> drivers/gpu/drm/i915/selftests/i915_gem_gtt.c | 64 ++++++++----
> drivers/gpu/drm/i915/selftests/mock_gtt.c | 12 +--
> 21 files changed, 308 insertions(+), 206 deletions(-)
>
> diff --git a/drivers/gpu/drm/i915/display/intel_dpt.c b/drivers/gpu/drm/i915/display/intel_dpt.c
> index 8f674745e7e0..63a83d5f85a1 100644
> --- a/drivers/gpu/drm/i915/display/intel_dpt.c
> +++ b/drivers/gpu/drm/i915/display/intel_dpt.c
> @@ -48,7 +48,7 @@ static void dpt_insert_page(struct i915_address_space *vm,
> }
>
> static void dpt_insert_entries(struct i915_address_space *vm,
> - struct i915_vma *vma,
> + struct i915_vma_resource *vma_res,
> enum i915_cache_level level,
> u32 flags)
> {
> @@ -64,8 +64,8 @@ static void dpt_insert_entries(struct i915_address_space *vm,
> * not to allow the user to override access to a read only page.
> */
>
> - i = vma->node.start / I915_GTT_PAGE_SIZE;
> - for_each_sgt_daddr(addr, sgt_iter, vma->pages)
> + i = vma_res->start / I915_GTT_PAGE_SIZE;
> + for_each_sgt_daddr(addr, sgt_iter, vma_res->bi.pages)
> gen8_set_pte(&base[i++], pte_encode | addr);
> }
>
> @@ -76,35 +76,38 @@ static void dpt_clear_range(struct i915_address_space *vm,
>
> static void dpt_bind_vma(struct i915_address_space *vm,
> struct i915_vm_pt_stash *stash,
> - struct i915_vma *vma,
> + struct i915_vma_resource *vma_res,
> enum i915_cache_level cache_level,
> u32 flags)
> {
> - struct drm_i915_gem_object *obj = vma->obj;
> u32 pte_flags;
>
> + if (vma_res->bound_flags)
> + return;
> +
> /* Applicable to VLV (gen8+ do not support RO in the GGTT) */
> pte_flags = 0;
> - if (vma->vm->has_read_only && i915_gem_object_is_readonly(obj))
> + if (vm->has_read_only && vma_res->bi.readonly)
> pte_flags |= PTE_READ_ONLY;
> - if (i915_gem_object_is_lmem(obj))
> + if (vma_res->bi.lmem)
> pte_flags |= PTE_LM;
>
> - vma->vm->insert_entries(vma->vm, vma, cache_level, pte_flags);
> + vm->insert_entries(vm, vma_res, cache_level, pte_flags);
>
> - vma->page_sizes.gtt = I915_GTT_PAGE_SIZE;
> + vma_res->page_sizes_gtt = I915_GTT_PAGE_SIZE;
>
> /*
> * Without aliasing PPGTT there's no difference between
> * GLOBAL/LOCAL_BIND, it's all the same ptes. Hence unconditionally
> * upgrade to both bound if we bind either to avoid double-binding.
> */
> - atomic_or(I915_VMA_GLOBAL_BIND | I915_VMA_LOCAL_BIND, &vma->flags);
> + vma_res->bound_flags = I915_VMA_GLOBAL_BIND | I915_VMA_LOCAL_BIND;
> }
>
> -static void dpt_unbind_vma(struct i915_address_space *vm, struct i915_vma *vma)
> +static void dpt_unbind_vma(struct i915_address_space *vm,
> + struct i915_vma_resource *vma_res)
> {
> - vm->clear_range(vm, vma->node.start, vma->size);
> + vm->clear_range(vm, vma_res->start, vma_res->vma_size);
> }
>
> static void dpt_cleanup(struct i915_address_space *vm)
> diff --git a/drivers/gpu/drm/i915/gem/i915_gem_object_types.h b/drivers/gpu/drm/i915/gem/i915_gem_object_types.h
> index f9f7e44099fe..f99d260e0684 100644
> --- a/drivers/gpu/drm/i915/gem/i915_gem_object_types.h
> +++ b/drivers/gpu/drm/i915/gem/i915_gem_object_types.h
> @@ -15,6 +15,7 @@
>
> #include "i915_active.h"
> #include "i915_selftest.h"
> +#include "i915_vma_resource.h"
>
> struct drm_i915_gem_object;
> struct intel_fronbuffer;
> @@ -549,31 +550,7 @@ struct drm_i915_gem_object {
> struct sg_table *pages;
> void *mapping;
>
> - struct i915_page_sizes {
> - /**
> - * The sg mask of the pages sg_table. i.e the mask of
> - * of the lengths for each sg entry.
> - */
> - unsigned int phys;
> -
> - /**
> - * The gtt page sizes we are allowed to use given the
> - * sg mask and the supported page sizes. This will
> - * express the smallest unit we can use for the whole
> - * object, as well as the larger sizes we may be able
> - * to use opportunistically.
> - */
> - unsigned int sg;
> -
> - /**
> - * The actual gtt page size usage. Since we can have
> - * multiple vma associated with this object we need to
> - * prevent any trampling of state, hence a copy of this
> - * struct also lives in each vma, therefore the gtt
> - * value here should only be read/write through the vma.
> - */
> - unsigned int gtt;
> - } page_sizes;
> + struct i915_page_sizes page_sizes;
>
> I915_SELFTEST_DECLARE(unsigned int page_mask);
>
> diff --git a/drivers/gpu/drm/i915/gem/selftests/huge_pages.c b/drivers/gpu/drm/i915/gem/selftests/huge_pages.c
> index 11f0aa65f8a3..26f997c376a2 100644
> --- a/drivers/gpu/drm/i915/gem/selftests/huge_pages.c
> +++ b/drivers/gpu/drm/i915/gem/selftests/huge_pages.c
> @@ -370,9 +370,9 @@ static int igt_check_page_sizes(struct i915_vma *vma)
> err = -EINVAL;
> }
>
> - if (!HAS_PAGE_SIZES(i915, vma->page_sizes.gtt)) {
> + if (!HAS_PAGE_SIZES(i915, vma->resource->page_sizes_gtt)) {
> pr_err("unsupported page_sizes.gtt=%u, supported=%u\n",
> - vma->page_sizes.gtt & ~supported, supported);
> + vma->resource->page_sizes_gtt & ~supported, supported);
> err = -EINVAL;
> }
>
> @@ -403,15 +403,9 @@ static int igt_check_page_sizes(struct i915_vma *vma)
> if (i915_gem_object_is_lmem(obj) &&
> IS_ALIGNED(vma->node.start, SZ_2M) &&
> vma->page_sizes.sg & SZ_2M &&
> - vma->page_sizes.gtt < SZ_2M) {
> + vma->resource->page_sizes_gtt < SZ_2M) {
> pr_err("gtt pages mismatch for LMEM, expected 2M GTT pages, sg(%u), gtt(%u)\n",
> - vma->page_sizes.sg, vma->page_sizes.gtt);
> - err = -EINVAL;
> - }
> -
> - if (obj->mm.page_sizes.gtt) {
> - pr_err("obj->page_sizes.gtt(%u) should never be set\n",
> - obj->mm.page_sizes.gtt);
> + vma->page_sizes.sg, vma->resource->page_sizes_gtt);
> err = -EINVAL;
> }
>
> @@ -547,9 +541,9 @@ static int igt_mock_memory_region_huge_pages(void *arg)
> goto out_unpin;
> }
>
> - if (vma->page_sizes.gtt != page_size) {
> + if (vma->resource->page_sizes_gtt != page_size) {
> pr_err("%s page_sizes.gtt=%u, expected=%u\n",
> - __func__, vma->page_sizes.gtt,
> + __func__, vma->resource->page_sizes_gtt,
> page_size);
> err = -EINVAL;
> goto out_unpin;
> @@ -630,9 +624,9 @@ static int igt_mock_ppgtt_misaligned_dma(void *arg)
>
> err = igt_check_page_sizes(vma);
>
> - if (vma->page_sizes.gtt != page_size) {
> + if (vma->resource->page_sizes_gtt != page_size) {
> pr_err("page_sizes.gtt=%u, expected %u\n",
> - vma->page_sizes.gtt, page_size);
> + vma->resource->page_sizes_gtt, page_size);
> err = -EINVAL;
> }
>
> @@ -657,9 +651,10 @@ static int igt_mock_ppgtt_misaligned_dma(void *arg)
>
> err = igt_check_page_sizes(vma);
>
> - if (vma->page_sizes.gtt != I915_GTT_PAGE_SIZE_4K) {
> + if (vma->resource->page_sizes_gtt != I915_GTT_PAGE_SIZE_4K) {
> pr_err("page_sizes.gtt=%u, expected %llu\n",
> - vma->page_sizes.gtt, I915_GTT_PAGE_SIZE_4K);
> + vma->resource->page_sizes_gtt,
> + I915_GTT_PAGE_SIZE_4K);
> err = -EINVAL;
> }
>
> @@ -805,9 +800,9 @@ static int igt_mock_ppgtt_huge_fill(void *arg)
> }
> }
>
> - if (vma->page_sizes.gtt != expected_gtt) {
> + if (vma->resource->page_sizes_gtt != expected_gtt) {
> pr_err("gtt=%u, expected=%u, size=%zd, single=%s\n",
> - vma->page_sizes.gtt, expected_gtt,
> + vma->resource->page_sizes_gtt, expected_gtt,
> obj->base.size, yesno(!!single));
> err = -EINVAL;
> break;
> @@ -961,10 +956,10 @@ static int igt_mock_ppgtt_64K(void *arg)
> }
> }
>
> - if (vma->page_sizes.gtt != expected_gtt) {
> + if (vma->resource->page_sizes_gtt != expected_gtt) {
> pr_err("gtt=%u, expected=%u, i=%d, single=%s\n",
> - vma->page_sizes.gtt, expected_gtt, i,
> - yesno(!!single));
> + vma->resource->page_sizes_gtt,
> + expected_gtt, i, yesno(!!single));
> err = -EINVAL;
> goto out_vma_unpin;
> }
> diff --git a/drivers/gpu/drm/i915/gt/gen6_ppgtt.c b/drivers/gpu/drm/i915/gt/gen6_ppgtt.c
> index 6e9292918bfc..d657ffd6c86a 100644
> --- a/drivers/gpu/drm/i915/gt/gen6_ppgtt.c
> +++ b/drivers/gpu/drm/i915/gt/gen6_ppgtt.c
> @@ -104,17 +104,17 @@ static void gen6_ppgtt_clear_range(struct i915_address_space *vm,
> }
>
> static void gen6_ppgtt_insert_entries(struct i915_address_space *vm,
> - struct i915_vma *vma,
> + struct i915_vma_resource *vma_res,
> enum i915_cache_level cache_level,
> u32 flags)
> {
> struct i915_ppgtt *ppgtt = i915_vm_to_ppgtt(vm);
> struct i915_page_directory * const pd = ppgtt->pd;
> - unsigned int first_entry = vma->node.start / I915_GTT_PAGE_SIZE;
> + unsigned int first_entry = vma_res->start / I915_GTT_PAGE_SIZE;
> unsigned int act_pt = first_entry / GEN6_PTES;
> unsigned int act_pte = first_entry % GEN6_PTES;
> const u32 pte_encode = vm->pte_encode(0, cache_level, flags);
> - struct sgt_dma iter = sgt_dma(vma);
> + struct sgt_dma iter = sgt_dma(vma_res);
> gen6_pte_t *vaddr;
>
> GEM_BUG_ON(!pd->entry[act_pt]);
> @@ -140,7 +140,7 @@ static void gen6_ppgtt_insert_entries(struct i915_address_space *vm,
> }
> } while (1);
>
> - vma->page_sizes.gtt = I915_GTT_PAGE_SIZE;
> + vma_res->page_sizes_gtt = I915_GTT_PAGE_SIZE;
> }
>
> static void gen6_flush_pd(struct gen6_ppgtt *ppgtt, u64 start, u64 end)
> @@ -271,13 +271,13 @@ static void gen6_ppgtt_cleanup(struct i915_address_space *vm)
>
> static void pd_vma_bind(struct i915_address_space *vm,
> struct i915_vm_pt_stash *stash,
> - struct i915_vma *vma,
> + struct i915_vma_resource *vma_res,
> enum i915_cache_level cache_level,
> u32 unused)
> {
> struct i915_ggtt *ggtt = i915_vm_to_ggtt(vm);
> - struct gen6_ppgtt *ppgtt = vma->private;
> - u32 ggtt_offset = i915_ggtt_offset(vma) / I915_GTT_PAGE_SIZE;
> + struct gen6_ppgtt *ppgtt = vma_res->private;
> + u32 ggtt_offset = vma_res->start / I915_GTT_PAGE_SIZE;
>
> ppgtt->pp_dir = ggtt_offset * sizeof(gen6_pte_t) << 10;
> ppgtt->pd_addr = (gen6_pte_t __iomem *)ggtt->gsm + ggtt_offset;
> @@ -285,9 +285,10 @@ static void pd_vma_bind(struct i915_address_space *vm,
> gen6_flush_pd(ppgtt, 0, ppgtt->base.vm.total);
> }
>
> -static void pd_vma_unbind(struct i915_address_space *vm, struct i915_vma *vma)
> +static void pd_vma_unbind(struct i915_address_space *vm,
> + struct i915_vma_resource *vma_res)
> {
> - struct gen6_ppgtt *ppgtt = vma->private;
> + struct gen6_ppgtt *ppgtt = vma_res->private;
> struct i915_page_directory * const pd = ppgtt->base.pd;
> struct i915_page_table *pt;
> unsigned int pde;
> diff --git a/drivers/gpu/drm/i915/gt/gen8_ppgtt.c b/drivers/gpu/drm/i915/gt/gen8_ppgtt.c
> index b012c50f7ce7..c43e724afa9f 100644
> --- a/drivers/gpu/drm/i915/gt/gen8_ppgtt.c
> +++ b/drivers/gpu/drm/i915/gt/gen8_ppgtt.c
> @@ -453,20 +453,21 @@ gen8_ppgtt_insert_pte(struct i915_ppgtt *ppgtt,
> return idx;
> }
>
> -static void gen8_ppgtt_insert_huge(struct i915_vma *vma,
> +static void gen8_ppgtt_insert_huge(struct i915_address_space *vm,
> + struct i915_vma_resource *vma_res,
> struct sgt_dma *iter,
> enum i915_cache_level cache_level,
> u32 flags)
> {
> const gen8_pte_t pte_encode = gen8_pte_encode(0, cache_level, flags);
> unsigned int rem = sg_dma_len(iter->sg);
> - u64 start = vma->node.start;
> + u64 start = vma_res->start;
>
> - GEM_BUG_ON(!i915_vm_is_4lvl(vma->vm));
> + GEM_BUG_ON(!i915_vm_is_4lvl(vm));
>
> do {
> struct i915_page_directory * const pdp =
> - gen8_pdp_for_page_address(vma->vm, start);
> + gen8_pdp_for_page_address(vm, start);
> struct i915_page_directory * const pd =
> i915_pd_entry(pdp, __gen8_pte_index(start, 2));
> gen8_pte_t encode = pte_encode;
> @@ -475,7 +476,7 @@ static void gen8_ppgtt_insert_huge(struct i915_vma *vma,
> gen8_pte_t *vaddr;
> u16 index;
>
> - if (vma->page_sizes.sg & I915_GTT_PAGE_SIZE_2M &&
> + if (vma_res->bi.page_sizes.sg & I915_GTT_PAGE_SIZE_2M &&
> IS_ALIGNED(iter->dma, I915_GTT_PAGE_SIZE_2M) &&
> rem >= I915_GTT_PAGE_SIZE_2M &&
> !__gen8_pte_index(start, 0)) {
> @@ -492,7 +493,7 @@ static void gen8_ppgtt_insert_huge(struct i915_vma *vma,
> page_size = I915_GTT_PAGE_SIZE;
>
> if (!index &&
> - vma->page_sizes.sg & I915_GTT_PAGE_SIZE_64K &&
> + vma_res->bi.page_sizes.sg & I915_GTT_PAGE_SIZE_64K &&
> IS_ALIGNED(iter->dma, I915_GTT_PAGE_SIZE_64K) &&
> (IS_ALIGNED(rem, I915_GTT_PAGE_SIZE_64K) ||
> rem >= (I915_PDES - index) * I915_GTT_PAGE_SIZE))
> @@ -541,9 +542,9 @@ static void gen8_ppgtt_insert_huge(struct i915_vma *vma,
> */
> if (maybe_64K != -1 &&
> (index == I915_PDES ||
> - (i915_vm_has_scratch_64K(vma->vm) &&
> - !iter->sg && IS_ALIGNED(vma->node.start +
> - vma->node.size,
> + (i915_vm_has_scratch_64K(vm) &&
> + !iter->sg && IS_ALIGNED(vma_res->start +
> + vma_res->node_size,
> I915_GTT_PAGE_SIZE_2M)))) {
> vaddr = px_vaddr(pd);
> vaddr[maybe_64K] |= GEN8_PDE_IPS_64K;
> @@ -559,10 +560,10 @@ static void gen8_ppgtt_insert_huge(struct i915_vma *vma,
> * instead - which we detect as missing results during
> * selftests.
> */
> - if (I915_SELFTEST_ONLY(vma->vm->scrub_64K)) {
> + if (I915_SELFTEST_ONLY(vm->scrub_64K)) {
> u16 i;
>
> - encode = vma->vm->scratch[0]->encode;
> + encode = vm->scratch[0]->encode;
> vaddr = px_vaddr(i915_pt_entry(pd, maybe_64K));
>
> for (i = 1; i < index; i += 16)
> @@ -572,22 +573,22 @@ static void gen8_ppgtt_insert_huge(struct i915_vma *vma,
> }
> }
>
> - vma->page_sizes.gtt |= page_size;
> + vma_res->page_sizes_gtt |= page_size;
> } while (iter->sg && sg_dma_len(iter->sg));
> }
>
> static void gen8_ppgtt_insert(struct i915_address_space *vm,
> - struct i915_vma *vma,
> + struct i915_vma_resource *vma_res,
> enum i915_cache_level cache_level,
> u32 flags)
> {
> struct i915_ppgtt * const ppgtt = i915_vm_to_ppgtt(vm);
> - struct sgt_dma iter = sgt_dma(vma);
> + struct sgt_dma iter = sgt_dma(vma_res);
>
> - if (vma->page_sizes.sg > I915_GTT_PAGE_SIZE) {
> - gen8_ppgtt_insert_huge(vma, &iter, cache_level, flags);
> + if (vma_res->bi.page_sizes.sg > I915_GTT_PAGE_SIZE) {
> + gen8_ppgtt_insert_huge(vm, vma_res, &iter, cache_level, flags);
> } else {
> - u64 idx = vma->node.start >> GEN8_PTE_SHIFT;
> + u64 idx = vma_res->start >> GEN8_PTE_SHIFT;
>
> do {
> struct i915_page_directory * const pdp =
> @@ -597,7 +598,7 @@ static void gen8_ppgtt_insert(struct i915_address_space *vm,
> cache_level, flags);
> } while (idx);
>
> - vma->page_sizes.gtt = I915_GTT_PAGE_SIZE;
> + vma_res->page_sizes_gtt = I915_GTT_PAGE_SIZE;
> }
> }
>
> diff --git a/drivers/gpu/drm/i915/gt/intel_engine_cs.c b/drivers/gpu/drm/i915/gt/intel_engine_cs.c
> index 352254e001b4..74aa90587061 100644
> --- a/drivers/gpu/drm/i915/gt/intel_engine_cs.c
> +++ b/drivers/gpu/drm/i915/gt/intel_engine_cs.c
> @@ -1718,8 +1718,8 @@ static void print_request_ring(struct drm_printer *m, struct i915_request *rq)
> drm_printf(m,
> "[head %04x, postfix %04x, tail %04x, batch 0x%08x_%08x]:\n",
> rq->head, rq->postfix, rq->tail,
> - vsnap ? upper_32_bits(vsnap->gtt_offset) : ~0u,
> - vsnap ? lower_32_bits(vsnap->gtt_offset) : ~0u);
> + vsnap ? upper_32_bits(vsnap->vma_resource->start) : ~0u,
> + vsnap ? lower_32_bits(vsnap->vma_resource->start) : ~0u);
>
> size = rq->tail - rq->head;
> if (rq->tail < rq->head)
> diff --git a/drivers/gpu/drm/i915/gt/intel_ggtt.c b/drivers/gpu/drm/i915/gt/intel_ggtt.c
> index 5263dda7f8d5..0137b6af0973 100644
> --- a/drivers/gpu/drm/i915/gt/intel_ggtt.c
> +++ b/drivers/gpu/drm/i915/gt/intel_ggtt.c
> @@ -235,7 +235,7 @@ static void gen8_ggtt_insert_page(struct i915_address_space *vm,
> }
>
> static void gen8_ggtt_insert_entries(struct i915_address_space *vm,
> - struct i915_vma *vma,
> + struct i915_vma_resource *vma_res,
> enum i915_cache_level level,
> u32 flags)
> {
> @@ -252,10 +252,10 @@ static void gen8_ggtt_insert_entries(struct i915_address_space *vm,
> */
>
> gte = (gen8_pte_t __iomem *)ggtt->gsm;
> - gte += vma->node.start / I915_GTT_PAGE_SIZE;
> - end = gte + vma->node.size / I915_GTT_PAGE_SIZE;
> + gte += vma_res->start / I915_GTT_PAGE_SIZE;
> + end = gte + vma_res->node_size / I915_GTT_PAGE_SIZE;
>
> - for_each_sgt_daddr(addr, iter, vma->pages)
> + for_each_sgt_daddr(addr, iter, vma_res->bi.pages)
> gen8_set_pte(gte++, pte_encode | addr);
> GEM_BUG_ON(gte > end);
>
> @@ -292,7 +292,7 @@ static void gen6_ggtt_insert_page(struct i915_address_space *vm,
> * through the GMADR mapped BAR (i915->mm.gtt->gtt).
> */
> static void gen6_ggtt_insert_entries(struct i915_address_space *vm,
> - struct i915_vma *vma,
> + struct i915_vma_resource *vma_res,
> enum i915_cache_level level,
> u32 flags)
> {
> @@ -303,10 +303,10 @@ static void gen6_ggtt_insert_entries(struct i915_address_space *vm,
> dma_addr_t addr;
>
> gte = (gen6_pte_t __iomem *)ggtt->gsm;
> - gte += vma->node.start / I915_GTT_PAGE_SIZE;
> - end = gte + vma->node.size / I915_GTT_PAGE_SIZE;
> + gte += vma_res->start / I915_GTT_PAGE_SIZE;
> + end = gte + vma_res->node_size / I915_GTT_PAGE_SIZE;
>
> - for_each_sgt_daddr(addr, iter, vma->pages)
> + for_each_sgt_daddr(addr, iter, vma_res->bi.pages)
> iowrite32(vm->pte_encode(addr, level, flags), gte++);
> GEM_BUG_ON(gte > end);
>
> @@ -389,7 +389,7 @@ static void bxt_vtd_ggtt_insert_page__BKL(struct i915_address_space *vm,
>
> struct insert_entries {
> struct i915_address_space *vm;
> - struct i915_vma *vma;
> + struct i915_vma_resource *vma_res;
> enum i915_cache_level level;
> u32 flags;
> };
> @@ -398,18 +398,18 @@ static int bxt_vtd_ggtt_insert_entries__cb(void *_arg)
> {
> struct insert_entries *arg = _arg;
>
> - gen8_ggtt_insert_entries(arg->vm, arg->vma, arg->level, arg->flags);
> + gen8_ggtt_insert_entries(arg->vm, arg->vma_res, arg->level, arg->flags);
> bxt_vtd_ggtt_wa(arg->vm);
>
> return 0;
> }
>
> static void bxt_vtd_ggtt_insert_entries__BKL(struct i915_address_space *vm,
> - struct i915_vma *vma,
> + struct i915_vma_resource *vma_res,
> enum i915_cache_level level,
> u32 flags)
> {
> - struct insert_entries arg = { vm, vma, level, flags };
> + struct insert_entries arg = { vm, vma_res, level, flags };
>
> stop_machine(bxt_vtd_ggtt_insert_entries__cb, &arg, NULL);
> }
> @@ -448,14 +448,14 @@ static void i915_ggtt_insert_page(struct i915_address_space *vm,
> }
>
> static void i915_ggtt_insert_entries(struct i915_address_space *vm,
> - struct i915_vma *vma,
> + struct i915_vma_resource *vma_res,
> enum i915_cache_level cache_level,
> u32 unused)
> {
> unsigned int flags = (cache_level == I915_CACHE_NONE) ?
> AGP_USER_MEMORY : AGP_USER_CACHED_MEMORY;
>
> - intel_gtt_insert_sg_entries(vma->pages, vma->node.start >> PAGE_SHIFT,
> + intel_gtt_insert_sg_entries(vma_res->bi.pages, vma_res->start >> PAGE_SHIFT,
> flags);
> }
>
> @@ -467,30 +467,32 @@ static void i915_ggtt_clear_range(struct i915_address_space *vm,
>
> static void ggtt_bind_vma(struct i915_address_space *vm,
> struct i915_vm_pt_stash *stash,
> - struct i915_vma *vma,
> + struct i915_vma_resource *vma_res,
> enum i915_cache_level cache_level,
> u32 flags)
> {
> - struct drm_i915_gem_object *obj = vma->obj;
> u32 pte_flags;
>
> - if (i915_vma_is_bound(vma, ~flags & I915_VMA_BIND_MASK))
> + if (vma_res->bound_flags & (~flags & I915_VMA_BIND_MASK))
> return;
>
> + vma_res->bound_flags |= flags;
> +
> /* Applicable to VLV (gen8+ do not support RO in the GGTT) */
> pte_flags = 0;
> - if (i915_gem_object_is_readonly(obj))
> + if (vma_res->bi.readonly)
> pte_flags |= PTE_READ_ONLY;
> - if (i915_gem_object_is_lmem(obj))
> + if (vma_res->bi.lmem)
> pte_flags |= PTE_LM;
>
> - vm->insert_entries(vm, vma, cache_level, pte_flags);
> - vma->page_sizes.gtt = I915_GTT_PAGE_SIZE;
> + vm->insert_entries(vm, vma_res, cache_level, pte_flags);
> + vma_res->page_sizes_gtt = I915_GTT_PAGE_SIZE;
> }
>
> -static void ggtt_unbind_vma(struct i915_address_space *vm, struct i915_vma *vma)
> +static void ggtt_unbind_vma(struct i915_address_space *vm,
> + struct i915_vma_resource *vma_res)
> {
> - vm->clear_range(vm, vma->node.start, vma->size);
> + vm->clear_range(vm, vma_res->start, vma_res->vma_size);
> }
>
> static int ggtt_reserve_guc_top(struct i915_ggtt *ggtt)
> @@ -623,7 +625,7 @@ static int init_ggtt(struct i915_ggtt *ggtt)
>
> static void aliasing_gtt_bind_vma(struct i915_address_space *vm,
> struct i915_vm_pt_stash *stash,
> - struct i915_vma *vma,
> + struct i915_vma_resource *vma_res,
> enum i915_cache_level cache_level,
> u32 flags)
> {
> @@ -631,25 +633,27 @@ static void aliasing_gtt_bind_vma(struct i915_address_space *vm,
>
> /* Currently applicable only to VLV */
> pte_flags = 0;
> - if (i915_gem_object_is_readonly(vma->obj))
> + if (vma_res->bi.readonly)
> pte_flags |= PTE_READ_ONLY;
>
> if (flags & I915_VMA_LOCAL_BIND)
> ppgtt_bind_vma(&i915_vm_to_ggtt(vm)->alias->vm,
> - stash, vma, cache_level, flags);
> + stash, vma_res, cache_level, flags);
>
> if (flags & I915_VMA_GLOBAL_BIND)
> - vm->insert_entries(vm, vma, cache_level, pte_flags);
> + vm->insert_entries(vm, vma_res, cache_level, pte_flags);
> +
> + vma_res->bound_flags |= flags;
> }
>
> static void aliasing_gtt_unbind_vma(struct i915_address_space *vm,
> - struct i915_vma *vma)
> + struct i915_vma_resource *vma_res)
> {
> - if (i915_vma_is_bound(vma, I915_VMA_GLOBAL_BIND))
> - vm->clear_range(vm, vma->node.start, vma->size);
> + if (vma_res->bound_flags & I915_VMA_GLOBAL_BIND)
> + vm->clear_range(vm, vma_res->start, vma_res->vma_size);
>
> - if (i915_vma_is_bound(vma, I915_VMA_LOCAL_BIND))
> - ppgtt_unbind_vma(&i915_vm_to_ggtt(vm)->alias->vm, vma);
> + if (vma_res->bound_flags & I915_VMA_LOCAL_BIND)
> + ppgtt_unbind_vma(&i915_vm_to_ggtt(vm)->alias->vm, vma_res);
> }
>
> static int init_aliasing_ppgtt(struct i915_ggtt *ggtt)
> @@ -1280,7 +1284,7 @@ bool i915_ggtt_resume_vm(struct i915_address_space *vm)
> atomic_read(&vma->flags) & I915_VMA_BIND_MASK;
>
> GEM_BUG_ON(!was_bound);
> - vma->ops->bind_vma(vm, NULL, vma,
> + vma->ops->bind_vma(vm, NULL, vma->resource,
> obj ? obj->cache_level : 0,
> was_bound);
> if (obj) { /* only used during resume => exclusive access */
> diff --git a/drivers/gpu/drm/i915/gt/intel_gtt.h b/drivers/gpu/drm/i915/gt/intel_gtt.h
> index 177b42b935a1..676b839d1a34 100644
> --- a/drivers/gpu/drm/i915/gt/intel_gtt.h
> +++ b/drivers/gpu/drm/i915/gt/intel_gtt.h
> @@ -27,6 +27,7 @@
>
> #include "gt/intel_reset.h"
> #include "i915_selftest.h"
> +#include "i915_vma_resource.h"
> #include "i915_vma_types.h"
>
> #define I915_GFP_ALLOW_FAIL (GFP_KERNEL | __GFP_RETRY_MAYFAIL | __GFP_NOWARN)
> @@ -200,7 +201,7 @@ struct i915_vma_ops {
> /* Map an object into an address space with the given cache flags. */
> void (*bind_vma)(struct i915_address_space *vm,
> struct i915_vm_pt_stash *stash,
> - struct i915_vma *vma,
> + struct i915_vma_resource *vma_res,
> enum i915_cache_level cache_level,
> u32 flags);
> /*
> @@ -208,7 +209,8 @@ struct i915_vma_ops {
> * setting the valid PTE entries to a reserved scratch page.
> */
> void (*unbind_vma)(struct i915_address_space *vm,
> - struct i915_vma *vma);
> + struct i915_vma_resource *vma_res);
> +
> };
>
> struct i915_address_space {
> @@ -285,7 +287,7 @@ struct i915_address_space {
> enum i915_cache_level cache_level,
> u32 flags);
> void (*insert_entries)(struct i915_address_space *vm,
> - struct i915_vma *vma,
> + struct i915_vma_resource *vma_res,
> enum i915_cache_level cache_level,
> u32 flags);
> void (*cleanup)(struct i915_address_space *vm);
> @@ -600,11 +602,11 @@ void gen6_ggtt_invalidate(struct i915_ggtt *ggtt);
>
> void ppgtt_bind_vma(struct i915_address_space *vm,
> struct i915_vm_pt_stash *stash,
> - struct i915_vma *vma,
> + struct i915_vma_resource *vma_res,
> enum i915_cache_level cache_level,
> u32 flags);
> void ppgtt_unbind_vma(struct i915_address_space *vm,
> - struct i915_vma *vma);
> + struct i915_vma_resource *vma_res);
>
> void gtt_write_workarounds(struct intel_gt *gt);
>
> @@ -627,8 +629,8 @@ __vm_create_scratch_for_read_pinned(struct i915_address_space *vm, unsigned long
> static inline struct sgt_dma {
> struct scatterlist *sg;
> dma_addr_t dma, max;
> -} sgt_dma(struct i915_vma *vma) {
> - struct scatterlist *sg = vma->pages->sgl;
> +} sgt_dma(struct i915_vma_resource *vma_res) {
> + struct scatterlist *sg = vma_res->bi.pages->sgl;
> dma_addr_t addr = sg_dma_address(sg);
>
> return (struct sgt_dma){ sg, addr, addr + sg_dma_len(sg) };
> diff --git a/drivers/gpu/drm/i915/gt/intel_ppgtt.c b/drivers/gpu/drm/i915/gt/intel_ppgtt.c
> index 083b3090c69c..48e6e2f87700 100644
> --- a/drivers/gpu/drm/i915/gt/intel_ppgtt.c
> +++ b/drivers/gpu/drm/i915/gt/intel_ppgtt.c
> @@ -179,32 +179,34 @@ struct i915_ppgtt *i915_ppgtt_create(struct intel_gt *gt,
>
> void ppgtt_bind_vma(struct i915_address_space *vm,
> struct i915_vm_pt_stash *stash,
> - struct i915_vma *vma,
> + struct i915_vma_resource *vma_res,
> enum i915_cache_level cache_level,
> u32 flags)
> {
> u32 pte_flags;
>
> - if (!test_bit(I915_VMA_ALLOC_BIT, __i915_vma_flags(vma))) {
> - vm->allocate_va_range(vm, stash, vma->node.start, vma->size);
> - set_bit(I915_VMA_ALLOC_BIT, __i915_vma_flags(vma));
> + if (!vma_res->allocated) {
> + vm->allocate_va_range(vm, stash, vma_res->start,
> + vma_res->vma_size);
> + vma_res->allocated = true;
> }
>
> /* Applicable to VLV, and gen8+ */
> pte_flags = 0;
> - if (i915_gem_object_is_readonly(vma->obj))
> + if (vma_res->bi.readonly)
> pte_flags |= PTE_READ_ONLY;
> - if (i915_gem_object_is_lmem(vma->obj))
> + if (vma_res->bi.lmem)
> pte_flags |= PTE_LM;
>
> - vm->insert_entries(vm, vma, cache_level, pte_flags);
> + vm->insert_entries(vm, vma_res, cache_level, pte_flags);
> wmb();
> }
>
> -void ppgtt_unbind_vma(struct i915_address_space *vm, struct i915_vma *vma)
> +void ppgtt_unbind_vma(struct i915_address_space *vm,
> + struct i915_vma_resource *vma_res)
> {
> - if (test_and_clear_bit(I915_VMA_ALLOC_BIT, __i915_vma_flags(vma)))
Can we remove I915_VMA_ALLOC_BIT now that this uses vma_res->allocated? Or are there still other users?
> - vm->clear_range(vm, vma->node.start, vma->size);
> + if (vma_res->allocated)
> + vm->clear_range(vm, vma_res->start, vma_res->vma_size);
> }
>
> static unsigned long pd_count(u64 size, int shift)
> diff --git a/drivers/gpu/drm/i915/gt/uc/intel_uc_fw.c b/drivers/gpu/drm/i915/gt/uc/intel_uc_fw.c
> index a5af05bde6f2..777fc6f0ceff 100644
> --- a/drivers/gpu/drm/i915/gt/uc/intel_uc_fw.c
> +++ b/drivers/gpu/drm/i915/gt/uc/intel_uc_fw.c
> @@ -448,20 +448,19 @@ static void uc_fw_bind_ggtt(struct intel_uc_fw *uc_fw)
> {
> struct drm_i915_gem_object *obj = uc_fw->obj;
> struct i915_ggtt *ggtt = __uc_fw_to_gt(uc_fw)->ggtt;
> - struct i915_vma *dummy = &uc_fw->dummy;
> + struct i915_vma_resource *dummy = &uc_fw->dummy;
> u32 pte_flags = 0;
>
> - dummy->node.start = uc_fw_ggtt_offset(uc_fw);
> - dummy->node.size = obj->base.size;
> - dummy->pages = obj->mm.pages;
> - dummy->vm = &ggtt->vm;
> + dummy->start = uc_fw_ggtt_offset(uc_fw);
> + dummy->node_size = obj->base.size;
> + dummy->bi.pages = obj->mm.pages;
>
> GEM_BUG_ON(!i915_gem_object_has_pinned_pages(obj));
> - GEM_BUG_ON(dummy->node.size > ggtt->uc_fw.size);
> + GEM_BUG_ON(dummy->node_size > ggtt->uc_fw.size);
>
> /* uc_fw->obj cache domains were not controlled across suspend */
> if (i915_gem_object_has_struct_page(obj))
> - drm_clflush_sg(dummy->pages);
> + drm_clflush_sg(dummy->bi.pages);
>
> if (i915_gem_object_is_lmem(obj))
> pte_flags |= PTE_LM;
> diff --git a/drivers/gpu/drm/i915/gt/uc/intel_uc_fw.h b/drivers/gpu/drm/i915/gt/uc/intel_uc_fw.h
> index d9d1dc0b4cbb..3229018877d3 100644
> --- a/drivers/gpu/drm/i915/gt/uc/intel_uc_fw.h
> +++ b/drivers/gpu/drm/i915/gt/uc/intel_uc_fw.h
> @@ -85,7 +85,7 @@ struct intel_uc_fw {
> * threaded as it done during driver load (inherently single threaded)
> * or during a GT reset (mutex guarantees single threaded).
> */
> - struct i915_vma dummy;
> + struct i915_vma_resource dummy;
> struct i915_vma *rsa_data;
>
> /*
> diff --git a/drivers/gpu/drm/i915/i915_debugfs.c b/drivers/gpu/drm/i915/i915_debugfs.c
> index e0e052cdf8b8..f7d1feba5aa4 100644
> --- a/drivers/gpu/drm/i915/i915_debugfs.c
> +++ b/drivers/gpu/drm/i915/i915_debugfs.c
> @@ -170,7 +170,8 @@ i915_debugfs_describe_obj(struct seq_file *m, struct drm_i915_gem_object *obj)
> seq_printf(m, " (%s offset: %08llx, size: %08llx, pages: %s",
> stringify_vma_type(vma),
> vma->node.start, vma->node.size,
> - stringify_page_sizes(vma->page_sizes.gtt, NULL, 0));
> + stringify_page_sizes(vma->resource->page_sizes_gtt,
> + NULL, 0));
> if (i915_vma_is_ggtt(vma) || i915_vma_is_dpt(vma)) {
> switch (vma->ggtt_view.type) {
> case I915_GGTT_VIEW_NORMAL:
> diff --git a/drivers/gpu/drm/i915/i915_gpu_error.c b/drivers/gpu/drm/i915/i915_gpu_error.c
> index 5ae812d60abe..1af54ff374f9 100644
> --- a/drivers/gpu/drm/i915/i915_gpu_error.c
> +++ b/drivers/gpu/drm/i915/i915_gpu_error.c
> @@ -1040,9 +1040,9 @@ i915_vma_coredump_create(const struct intel_gt *gt,
> strcpy(dst->name, vsnap->name);
> dst->next = NULL;
>
> - dst->gtt_offset = vsnap->gtt_offset;
> - dst->gtt_size = vsnap->gtt_size;
> - dst->gtt_page_sizes = vsnap->page_sizes;
> + dst->gtt_offset = vsnap->vma_resource->start;
> + dst->gtt_size = vsnap->vma_resource->node_size;
> + dst->gtt_page_sizes = vsnap->vma_resource->page_sizes_gtt;
> dst->unused = 0;
>
> ret = -EINVAL;
> diff --git a/drivers/gpu/drm/i915/i915_vma.c b/drivers/gpu/drm/i915/i915_vma.c
> index 7097c5016431..1d4e448d22d9 100644
> --- a/drivers/gpu/drm/i915/i915_vma.c
> +++ b/drivers/gpu/drm/i915/i915_vma.c
> @@ -298,7 +298,7 @@ static void __vma_bind(struct dma_fence_work *work)
> struct i915_vma *vma = vw->vma;
>
> vma->ops->bind_vma(vw->vm, &vw->stash,
> - vma, vw->cache_level, vw->flags);
> + vma->resource, vw->cache_level, vw->flags);
> }
>
> static void __vma_release(struct dma_fence_work *work)
> @@ -375,6 +375,21 @@ static int i915_vma_verify_bind_complete(struct i915_vma *vma)
> #define i915_vma_verify_bind_complete(_vma) 0
> #endif
>
> +I915_SELFTEST_EXPORT void
> +i915_vma_resource_init_from_vma(struct i915_vma_resource *vma_res,
> + struct i915_vma *vma)
> +{
> + struct drm_i915_gem_object *obj = vma->obj;
> +
> + i915_vma_resource_init(vma_res, vma->pages, &vma->page_sizes,
> + i915_gem_object_is_readonly(obj),
> + i915_gem_object_is_lmem(obj),
> + vma->private,
> + vma->node.start,
> + vma->node.size,
> + vma->size);
> +}
> +
> /**
> * i915_vma_bind - Sets up PTEs for an VMA in it's corresponding address space.
> * @vma: VMA to map
> @@ -432,7 +447,7 @@ int i915_vma_bind(struct i915_vma *vma,
> GEM_WARN_ON(!vma_flags);
> kfree(vma_res);
> } else {
> - i915_vma_resource_init(vma_res);
> + i915_vma_resource_init_from_vma(vma_res, vma);
> vma->resource = vma_res;
> }
> trace_i915_vma_bind(vma, bind_flags);
> @@ -472,7 +487,8 @@ int i915_vma_bind(struct i915_vma *vma,
> if (ret)
> return ret;
> }
> - vma->ops->bind_vma(vma->vm, NULL, vma, cache_level, bind_flags);
> + vma->ops->bind_vma(vma->vm, NULL, vma->resource, cache_level,
> + bind_flags);
> }
>
> atomic_or(bind_flags, &vma->flags);
> @@ -1778,7 +1794,7 @@ void __i915_vma_evict(struct i915_vma *vma)
>
> if (likely(atomic_read(&vma->vm->open))) {
> trace_i915_vma_unbind(vma);
> - vma->ops->unbind_vma(vma->vm, vma);
> + vma->ops->unbind_vma(vma->vm, vma->resource);
> }
> atomic_and(~(I915_VMA_BIND_MASK | I915_VMA_ERROR | I915_VMA_GGTT_WRITE),
> &vma->flags);
> diff --git a/drivers/gpu/drm/i915/i915_vma.h b/drivers/gpu/drm/i915/i915_vma.h
> index de0f3e44cdfa..1df57ec832bd 100644
> --- a/drivers/gpu/drm/i915/i915_vma.h
> +++ b/drivers/gpu/drm/i915/i915_vma.h
> @@ -339,12 +339,6 @@ void __iomem *i915_vma_pin_iomap(struct i915_vma *vma);
> */
> void i915_vma_unpin_iomap(struct i915_vma *vma);
>
> -static inline struct page *i915_vma_first_page(struct i915_vma *vma)
> -{
> - GEM_BUG_ON(!vma->pages);
> - return sg_page(vma->pages->sgl);
> -}
> -
> /**
> * i915_vma_pin_fence - pin fencing state
> * @vma: vma to pin fencing for
> @@ -445,6 +439,11 @@ i915_vma_get_current_resource(struct i915_vma *vma)
> return i915_vma_resource_get(vma->resource);
> }
>
> +#if IS_ENABLED(CONFIG_DRM_I915_SELFTEST)
> +void i915_vma_resource_init_from_vma(struct i915_vma_resource *vma_res,
> + struct i915_vma *vma);
> +#endif
> +
> void i915_vma_module_exit(void);
> int i915_vma_module_init(void);
>
> diff --git a/drivers/gpu/drm/i915/i915_vma_resource.c b/drivers/gpu/drm/i915/i915_vma_resource.c
> index 833e987bed2a..c86db89ab5d2 100644
> --- a/drivers/gpu/drm/i915/i915_vma_resource.c
> +++ b/drivers/gpu/drm/i915/i915_vma_resource.c
> @@ -23,15 +23,12 @@ static struct dma_fence_ops unbind_fence_ops = {
> };
>
> /**
> - * i915_vma_resource_init - Initialize a vma resource.
> + * __i915_vma_resource_init - Initialize a vma resource.
> * @vma_res: The vma resource to initialize
> *
> - * Initializes a vma resource allocated using i915_vma_resource_alloc().
> - * The reason for having separate allocate and initialize function is that
> - * initialization may need to be performed from under a lock where
> - * allocation is not allowed.
> + * Initializes the private members of a vma resource.
> */
> -void i915_vma_resource_init(struct i915_vma_resource *vma_res)
> +void __i915_vma_resource_init(struct i915_vma_resource *vma_res)
> {
> spin_lock_init(&vma_res->lock);
> dma_fence_init(&vma_res->unbind_fence, &unbind_fence_ops,
> diff --git a/drivers/gpu/drm/i915/i915_vma_resource.h b/drivers/gpu/drm/i915/i915_vma_resource.h
> index 34744da23072..9872de58268b 100644
> --- a/drivers/gpu/drm/i915/i915_vma_resource.h
> +++ b/drivers/gpu/drm/i915/i915_vma_resource.h
> @@ -9,6 +9,25 @@
> #include <linux/dma-fence.h>
> #include <linux/refcount.h>
>
> +#include "i915_gem.h"
> +
> +struct i915_page_sizes {
> + /**
> + * The sg mask of the pages sg_table, i.e. the mask of
> + * the lengths for each sg entry.
> + */
> + unsigned int phys;
> +
> + /**
> + * The gtt page sizes we are allowed to use given the
> + * sg mask and the supported page sizes. This will
> + * express the smallest unit we can use for the whole
> + * object, as well as the larger sizes we may be able
> + * to use opportunistically.
> + */
> + unsigned int sg;
> +};
> +
> /**
> * struct i915_vma_resource - Snapshotted unbind information.
> * @unbind_fence: Fence to mark unbinding complete. Note that this fence
> @@ -20,6 +39,13 @@
> * @hold_count: Number of holders blocking the fence from finishing.
> * The vma itself is keeping a hold, which is released when unbind
> * is scheduled.
> + * @private: Bind backend private info.
> + * @start: Offset into the address space of bind range start.
> + * @node_size: Size of the allocated range manager node.
> + * @vma_size: Bind size.
> + * @page_sizes_gtt: Resulting page sizes from the bind operation.
> + * @bound_flags: Flags indicating binding status.
> + * @allocated: Backend private data. TODO: Should move into @private.
> *
> * The lifetime of a struct i915_vma_resource is from a binding request to
> * the actual possible asynchronous unbind has completed.
> @@ -29,6 +55,32 @@ struct i915_vma_resource {
> /* See above for description of the lock. */
> spinlock_t lock;
> refcount_t hold_count;
> +
> + /**
> + * struct i915_vma_bindinfo - Information needed for async bind
> + * only but that can be dropped after the bind has taken place.
> + * Consider making this a separate argument to the bind_vma
> + * op, coalescing with other arguments like vm, stash, cache_level
> + * and flags
> + * @pages: The pages sg-table.
> + * @page_sizes: Page sizes of the pages.
> + * @readonly: Whether the vma should be bound read-only.
> + * @lmem: Whether the vma points to lmem.
> + */
> + struct i915_vma_bindinfo {
> + struct sg_table *pages;
> + struct i915_page_sizes page_sizes;
> + bool readonly:1;
> + bool lmem:1;
> + } bi;
> +
> + void *private;
> + unsigned long start;
> + unsigned long node_size;
> + unsigned long vma_size;
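AFAIK these need to be u64, or at least node_size and start: the selftest
below stores BIT_ULL(size) in node_size and a u64 offset in start, so an
unsigned long would truncate them on 32-bit builds.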
Otherwise,
Reviewed-by: Matthew Auld <matthew.auld at intel.com>
> + u32 page_sizes_gtt;
> + u32 bound_flags;
> + bool allocated:1;
> };
>
> bool i915_vma_resource_hold(struct i915_vma_resource *vma_res,
> @@ -41,6 +93,8 @@ struct i915_vma_resource *i915_vma_resource_alloc(void);
>
> struct dma_fence *i915_vma_resource_unbind(struct i915_vma_resource *vma_res);
>
> +void __i915_vma_resource_init(struct i915_vma_resource *vma_res);
> +
> /**
> * i915_vma_resource_get - Take a reference on a vma resource
> * @vma_res: The vma resource on which to take a reference.
> @@ -63,8 +117,47 @@ static inline void i915_vma_resource_put(struct i915_vma_resource *vma_res)
> dma_fence_put(&vma_res->unbind_fence);
> }
>
> -#if IS_ENABLED(CONFIG_DRM_I915_SELFTEST)
> -void i915_vma_resource_init(struct i915_vma_resource *vma_res);
> -#endif
> +/**
> + * i915_vma_resource_init - Initialize a vma resource.
> + * @vma_res: The vma resource to initialize
> + * @pages: The pages sg-table.
> + * @page_sizes: Page sizes of the pages.
> + * @readonly: Whether the vma should be bound read-only.
> + * @lmem: Whether the vma points to lmem.
> + * @private: Bind backend private info.
> + * @start: Offset into the address space of bind range start.
> + * @node_size: Size of the allocated range manager node.
> + * @size: Bind size.
> + *
> + * Initializes a vma resource allocated using i915_vma_resource_alloc().
> + * The reason for having separate allocate and initialize function is that
> + * initialization may need to be performed from under a lock where
> + * allocation is not allowed.
> + */
> +static inline void i915_vma_resource_init(struct i915_vma_resource *vma_res,
> + struct sg_table *pages,
> + const struct i915_page_sizes *page_sizes,
> + bool readonly,
> + bool lmem,
> + void *private,
> + unsigned long start,
> + unsigned long node_size,
> + unsigned long size)
> +{
> + __i915_vma_resource_init(vma_res);
> + vma_res->bi.pages = pages;
> + vma_res->bi.page_sizes = *page_sizes;
> + vma_res->bi.readonly = readonly;
> + vma_res->bi.lmem = lmem;
> + vma_res->private = private;
> + vma_res->start = start;
> + vma_res->node_size = node_size;
> + vma_res->vma_size = size;
> +}
> +
> +static inline void i915_vma_resource_fini(struct i915_vma_resource *vma_res)
> +{
> + GEM_BUG_ON(refcount_read(&vma_res->hold_count) != 1);
> +}
>
> #endif
> diff --git a/drivers/gpu/drm/i915/i915_vma_snapshot.c b/drivers/gpu/drm/i915/i915_vma_snapshot.c
> index f7333c7a2f5e..69f62c1ca967 100644
> --- a/drivers/gpu/drm/i915/i915_vma_snapshot.c
> +++ b/drivers/gpu/drm/i915/i915_vma_snapshot.c
> @@ -24,11 +24,7 @@ void i915_vma_snapshot_init(struct i915_vma_snapshot *vsnap,
> assert_object_held(vma->obj);
>
> vsnap->name = name;
> - vsnap->size = vma->size;
> vsnap->obj_size = vma->obj->base.size;
> - vsnap->gtt_offset = vma->node.start;
> - vsnap->gtt_size = vma->node.size;
> - vsnap->page_sizes = vma->page_sizes.gtt;
> vsnap->pages = vma->pages;
> vsnap->pages_rsgt = NULL;
> vsnap->mr = NULL;
> diff --git a/drivers/gpu/drm/i915/i915_vma_snapshot.h b/drivers/gpu/drm/i915/i915_vma_snapshot.h
> index e74588dd676b..1b08ce9f8576 100644
> --- a/drivers/gpu/drm/i915/i915_vma_snapshot.h
> +++ b/drivers/gpu/drm/i915/i915_vma_snapshot.h
> @@ -23,31 +23,23 @@ struct sg_table;
>
> /**
> * struct i915_vma_snapshot - Snapshot of vma metadata.
> - * @size: The vma size in bytes.
> * @obj_size: The size of the underlying object in bytes.
> - * @gtt_offset: The gtt offset the vma is bound to.
> - * @gtt_size: The size in bytes allocated for the vma in the GTT.
> * @pages: The struct sg_table pointing to the pages bound.
> * @pages_rsgt: The refcounted sg_table holding the reference for @pages if any.
> * @mr: The memory region pointed for the pages bound.
> * @kref: Reference for this structure.
> * @vma_resource: Pointer to the vma resource representing the vma binding.
> - * @page_sizes: The vma GTT page sizes information.
> * @onstack: Whether the structure shouldn't be freed on final put.
> * @present: Whether the structure is present and initialized.
> */
> struct i915_vma_snapshot {
> const char *name;
> - size_t size;
> size_t obj_size;
> - size_t gtt_offset;
> - size_t gtt_size;
> struct sg_table *pages;
> struct i915_refct_sgt *pages_rsgt;
> struct intel_memory_region *mr;
> struct kref kref;
> struct i915_vma_resource *vma_resource;
> - u32 page_sizes;
> bool onstack:1;
> bool present:1;
> };
> diff --git a/drivers/gpu/drm/i915/selftests/i915_gem_gtt.c b/drivers/gpu/drm/i915/selftests/i915_gem_gtt.c
> index 54be880e55c3..70b5c47890b9 100644
> --- a/drivers/gpu/drm/i915/selftests/i915_gem_gtt.c
> +++ b/drivers/gpu/drm/i915/selftests/i915_gem_gtt.c
> @@ -239,11 +239,11 @@ static int lowlevel_hole(struct i915_address_space *vm,
> unsigned long end_time)
> {
> I915_RND_STATE(seed_prng);
> - struct i915_vma *mock_vma;
> + struct i915_vma_resource *mock_vma_res;
> unsigned int size;
>
> - mock_vma = kzalloc(sizeof(*mock_vma), GFP_KERNEL);
> - if (!mock_vma)
> + mock_vma_res = kzalloc(sizeof(*mock_vma_res), GFP_KERNEL);
> + if (!mock_vma_res)
> return -ENOMEM;
>
> /* Keep creating larger objects until one cannot fit into the hole */
> @@ -269,7 +269,7 @@ static int lowlevel_hole(struct i915_address_space *vm,
> break;
> } while (count >>= 1);
> if (!count) {
> - kfree(mock_vma);
> + kfree(mock_vma_res);
> return -ENOMEM;
> }
> GEM_BUG_ON(!order);
> @@ -343,12 +343,12 @@ static int lowlevel_hole(struct i915_address_space *vm,
> break;
> }
>
> - mock_vma->pages = obj->mm.pages;
> - mock_vma->node.size = BIT_ULL(size);
> - mock_vma->node.start = addr;
> + mock_vma_res->bi.pages = obj->mm.pages;
> + mock_vma_res->node_size = BIT_ULL(size);
> + mock_vma_res->start = addr;
>
> with_intel_runtime_pm(vm->gt->uncore->rpm, wakeref)
> - vm->insert_entries(vm, mock_vma,
> + vm->insert_entries(vm, mock_vma_res,
> I915_CACHE_NONE, 0);
> }
> count = n;
> @@ -371,7 +371,7 @@ static int lowlevel_hole(struct i915_address_space *vm,
> cleanup_freed_objects(vm->i915);
> }
>
> - kfree(mock_vma);
> + kfree(mock_vma_res);
> return 0;
> }
>
> @@ -1280,6 +1280,7 @@ static void track_vma_bind(struct i915_vma *vma)
> atomic_set(&vma->pages_count, I915_VMA_PAGES_ACTIVE);
> __i915_gem_object_pin_pages(obj);
> vma->pages = obj->mm.pages;
> + vma->resource->bi.pages = vma->pages;
>
> mutex_lock(&vma->vm->mutex);
> list_add_tail(&vma->vm_link, &vma->vm->bound_list);
> @@ -1354,7 +1355,7 @@ static int reserve_gtt_with_resource(struct i915_vma *vma, u64 offset)
> obj->cache_level,
> 0);
> if (!err) {
> - i915_vma_resource_init(vma_res);
> + i915_vma_resource_init_from_vma(vma_res, vma);
> vma->resource = vma_res;
> } else {
> kfree(vma_res);
> @@ -1533,7 +1534,7 @@ static int insert_gtt_with_resource(struct i915_vma *vma)
> err = i915_gem_gtt_insert(vm, &vma->node, obj->base.size, 0,
> obj->cache_level, 0, vm->total, 0);
> if (!err) {
> - i915_vma_resource_init(vma_res);
> + i915_vma_resource_init_from_vma(vma_res, vma);
> vma->resource = vma_res;
> } else {
> kfree(vma_res);
> @@ -1958,6 +1959,7 @@ static int igt_cs_tlb(void *arg)
> struct i915_vm_pt_stash stash = {};
> struct i915_request *rq;
> struct i915_gem_ww_ctx ww;
> + struct i915_vma_resource *vma_res;
> u64 offset;
>
> offset = igt_random_offset(&prng,
> @@ -1978,6 +1980,13 @@ static int igt_cs_tlb(void *arg)
> if (err)
> goto end;
>
> + vma_res = i915_vma_resource_alloc();
> + if (IS_ERR(vma_res)) {
> + i915_vma_put_pages(vma);
> + err = PTR_ERR(vma_res);
> + goto end;
> + }
> +
> i915_gem_ww_ctx_init(&ww, false);
> retry:
> err = i915_vm_lock_objects(vm, &ww);
> @@ -1999,33 +2008,41 @@ static int igt_cs_tlb(void *arg)
> goto retry;
> }
> i915_gem_ww_ctx_fini(&ww);
> - if (err)
> + if (err) {
> + kfree(vma_res);
> goto end;
> + }
>
> + i915_vma_resource_init_from_vma(vma_res, vma);
> /* Prime the TLB with the dummy pages */
> for (i = 0; i < count; i++) {
> - vma->node.start = offset + i * PAGE_SIZE;
> - vm->insert_entries(vm, vma, I915_CACHE_NONE, 0);
> + vma_res->start = offset + i * PAGE_SIZE;
> + vm->insert_entries(vm, vma_res, I915_CACHE_NONE,
> + 0);
>
> - rq = submit_batch(ce, vma->node.start);
> + rq = submit_batch(ce, vma_res->start);
> if (IS_ERR(rq)) {
> err = PTR_ERR(rq);
> + i915_vma_resource_fini(vma_res);
> + kfree(vma_res);
> goto end;
> }
> i915_request_put(rq);
> }
> -
> + i915_vma_resource_fini(vma_res);
> i915_vma_put_pages(vma);
>
> err = context_sync(ce);
> if (err) {
> pr_err("%s: dummy setup timed out\n",
> ce->engine->name);
> + kfree(vma_res);
> goto end;
> }
>
> vma = i915_vma_instance(act, vm, NULL);
> if (IS_ERR(vma)) {
> + kfree(vma_res);
> err = PTR_ERR(vma);
> goto end;
> }
> @@ -2033,19 +2050,22 @@ static int igt_cs_tlb(void *arg)
> i915_gem_object_lock(act, NULL);
> err = i915_vma_get_pages(vma);
> i915_gem_object_unlock(act);
> - if (err)
> + if (err) {
> + kfree(vma_res);
> goto end;
> + }
>
> + i915_vma_resource_init_from_vma(vma_res, vma);
> /* Replace the TLB with target batches */
> for (i = 0; i < count; i++) {
> struct i915_request *rq;
> u32 *cs = batch + i * 64 / sizeof(*cs);
> u64 addr;
>
> - vma->node.start = offset + i * PAGE_SIZE;
> - vm->insert_entries(vm, vma, I915_CACHE_NONE, 0);
> + vma_res->start = offset + i * PAGE_SIZE;
> + vm->insert_entries(vm, vma_res, I915_CACHE_NONE, 0);
>
> - addr = vma->node.start + i * 64;
> + addr = vma_res->start + i * 64;
> cs[4] = MI_NOOP;
> cs[6] = lower_32_bits(addr);
> cs[7] = upper_32_bits(addr);
> @@ -2054,6 +2074,8 @@ static int igt_cs_tlb(void *arg)
> rq = submit_batch(ce, addr);
> if (IS_ERR(rq)) {
> err = PTR_ERR(rq);
> + i915_vma_resource_fini(vma_res);
> + kfree(vma_res);
> goto end;
> }
>
> @@ -2070,6 +2092,8 @@ static int igt_cs_tlb(void *arg)
> }
> end_spin(batch, count - 1);
>
> + i915_vma_resource_fini(vma_res);
> + kfree(vma_res);
> i915_vma_put_pages(vma);
>
> err = context_sync(ce);
> diff --git a/drivers/gpu/drm/i915/selftests/mock_gtt.c b/drivers/gpu/drm/i915/selftests/mock_gtt.c
> index 1802baf80a17..d40519e3ca38 100644
> --- a/drivers/gpu/drm/i915/selftests/mock_gtt.c
> +++ b/drivers/gpu/drm/i915/selftests/mock_gtt.c
> @@ -33,23 +33,23 @@ static void mock_insert_page(struct i915_address_space *vm,
> }
>
> static void mock_insert_entries(struct i915_address_space *vm,
> - struct i915_vma *vma,
> + struct i915_vma_resource *vma_res,
> enum i915_cache_level level, u32 flags)
> {
> }
>
> static void mock_bind_ppgtt(struct i915_address_space *vm,
> struct i915_vm_pt_stash *stash,
> - struct i915_vma *vma,
> + struct i915_vma_resource *vma_res,
> enum i915_cache_level cache_level,
> u32 flags)
> {
> GEM_BUG_ON(flags & I915_VMA_GLOBAL_BIND);
> - set_bit(I915_VMA_LOCAL_BIND_BIT, __i915_vma_flags(vma));
> + vma_res->bound_flags |= flags;
> }
>
> static void mock_unbind_ppgtt(struct i915_address_space *vm,
> - struct i915_vma *vma)
> + struct i915_vma_resource *vma_res)
> {
> }
>
> @@ -93,14 +93,14 @@ struct i915_ppgtt *mock_ppgtt(struct drm_i915_private *i915, const char *name)
>
> static void mock_bind_ggtt(struct i915_address_space *vm,
> struct i915_vm_pt_stash *stash,
> - struct i915_vma *vma,
> + struct i915_vma_resource *vma_res,
> enum i915_cache_level cache_level,
> u32 flags)
> {
> }
>
> static void mock_unbind_ggtt(struct i915_address_space *vm,
> - struct i915_vma *vma)
> + struct i915_vma_resource *vma_res)
> {
> }
>
>
More information about the Intel-gfx
mailing list