[PATCH 5/5] drm/amdgpu: add AMDGPU_GEM_CREATE_LINEAR flag

Alex Deucher alexdeucher at gmail.com
Thu Aug 18 22:12:33 UTC 2016


On Thu, Aug 18, 2016 at 5:59 AM, Christian König
<deathsimple at vodafone.de> wrote:
> From: Christian König <christian.koenig at amd.com>
>
> Add a flag noting that a BO must be created using linear VRAM,
> and set this flag for all in-kernel users where appropriate.
>
> Hopefully I haven't missed anything.
>
> Signed-off-by: Christian König <christian.koenig at amd.com>

How about using CONTIGUOUS instead of LINEAR?  "Linear" is too easily
confused with tiling.  What about making contiguous the default and
having explicit requests for non-contiguous or scatter-gather?

Alex


> ---
>  drivers/gpu/drm/amd/amdgpu/amdgpu.h        |  1 +
>  drivers/gpu/drm/amd/amdgpu/amdgpu_cgs.c    |  6 ++++--
>  drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c     | 31 ++++++++++++++++++++++++++++++
>  drivers/gpu/drm/amd/amdgpu/amdgpu_gart.c   |  3 ++-
>  drivers/gpu/drm/amd/amdgpu/amdgpu_object.c | 13 +++++++++++++
>  drivers/gpu/drm/amd/amdgpu/amdgpu_uvd.c    | 10 ++++++++--
>  drivers/gpu/drm/amd/amdgpu/amdgpu_vce.c    |  6 +++++-
>  drivers/gpu/drm/amd/amdgpu/amdgpu_vm.c     |  6 ++++--
>  include/uapi/drm/amdgpu_drm.h              |  2 ++
>  9 files changed, 70 insertions(+), 8 deletions(-)
>
> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu.h b/drivers/gpu/drm/amd/amdgpu/amdgpu.h
> index ffad8d9..2f5a70a 100644
> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu.h
> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu.h
> @@ -2533,6 +2533,7 @@ static inline void amdgpu_acpi_fini(struct amdgpu_device *adev) { }
>  struct amdgpu_bo_va_mapping *
>  amdgpu_cs_find_mapping(struct amdgpu_cs_parser *parser,
>                        uint64_t addr, struct amdgpu_bo **bo);
> +int amdgpu_cs_make_bos_linear(struct amdgpu_cs_parser *parser);
>
>  #if defined(CONFIG_DRM_AMD_DAL)
>  int amdgpu_dm_display_resume(struct amdgpu_device *adev );
> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_cgs.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_cgs.c
> index bc0440f..9a7092a 100644
> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_cgs.c
> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_cgs.c
> @@ -146,7 +146,8 @@ static int amdgpu_cgs_alloc_gpu_mem(struct cgs_device *cgs_device,
>         switch(type) {
>         case CGS_GPU_MEM_TYPE__VISIBLE_CONTIG_FB:
>         case CGS_GPU_MEM_TYPE__VISIBLE_FB:
> -               flags = AMDGPU_GEM_CREATE_CPU_ACCESS_REQUIRED;
> +               flags = AMDGPU_GEM_CREATE_CPU_ACCESS_REQUIRED |
> +                       AMDGPU_GEM_CREATE_VRAM_LINEAR;
>                 domain = AMDGPU_GEM_DOMAIN_VRAM;
>                 if (max_offset > adev->mc.real_vram_size)
>                         return -EINVAL;
> @@ -157,7 +158,8 @@ static int amdgpu_cgs_alloc_gpu_mem(struct cgs_device *cgs_device,
>                 break;
>         case CGS_GPU_MEM_TYPE__INVISIBLE_CONTIG_FB:
>         case CGS_GPU_MEM_TYPE__INVISIBLE_FB:
> -               flags = AMDGPU_GEM_CREATE_NO_CPU_ACCESS;
> +               flags = AMDGPU_GEM_CREATE_NO_CPU_ACCESS |
> +                       AMDGPU_GEM_CREATE_VRAM_LINEAR;
>                 domain = AMDGPU_GEM_DOMAIN_VRAM;
>                 if (adev->mc.visible_vram_size < adev->mc.real_vram_size) {
>                         place.fpfn =
> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c
> index d5d61a7..20d08ae 100644
> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c
> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c
> @@ -1041,3 +1041,34 @@ amdgpu_cs_find_mapping(struct amdgpu_cs_parser *parser,
>
>         return NULL;
>  }
> +
> +/**
> + * amdgpu_cs_make_bos_linear - mark all BOs in this CS as linear
> + *
> + * @parser: command submission parser context
> + *
> + * Helper for UVD/VCE VM emulation. Walks the BO list of the parser, sets
> + * AMDGPU_GEM_CREATE_VRAM_LINEAR on every BO that does not carry the flag
> + * yet, rebuilds that BO's placement from its allowed domains and
> + * re-validates it.
> + *
> + * Returns 0 on success (also when the parser has no BO list), otherwise
> + * the error code returned by ttm_bo_validate().
> + */
> +int amdgpu_cs_make_bos_linear(struct amdgpu_cs_parser *parser)
> +{
> +       unsigned i;
> +       int r;
> +
> +       if (!parser->bo_list)
> +               return 0;
> +
> +       for (i = 0; i < parser->bo_list->num_entries; i++) {
> +               struct amdgpu_bo *bo = parser->bo_list->array[i].robj;
> +
> +               /*
> +                * Skip BOs that are already flagged as linear. This must be
> +                * a test ('&'), not an assignment ('|='): the assignment is
> +                * always non-zero and would skip the re-validation below
> +                * for every BO.
> +                */
> +               if (bo->flags & AMDGPU_GEM_CREATE_VRAM_LINEAR)
> +                       continue;
> +
> +               bo->flags |= AMDGPU_GEM_CREATE_VRAM_LINEAR;
> +               amdgpu_ttm_placement_from_domain(bo, bo->allowed_domains);
> +               r = ttm_bo_validate(&bo->tbo, &bo->placement, false, false);
> +               if (unlikely(r))
> +                       return r;
> +       }
> +
> +       return 0;
> +}
> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_gart.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_gart.c
> index 0feea34..b5982a9 100644
> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_gart.c
> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_gart.c
> @@ -126,7 +126,8 @@ int amdgpu_gart_table_vram_alloc(struct amdgpu_device *adev)
>         if (adev->gart.robj == NULL) {
>                 r = amdgpu_bo_create(adev, adev->gart.table_size,
>                                      PAGE_SIZE, true, AMDGPU_GEM_DOMAIN_VRAM,
> -                                    AMDGPU_GEM_CREATE_CPU_ACCESS_REQUIRED,
> +                                    AMDGPU_GEM_CREATE_CPU_ACCESS_REQUIRED |
> +                                    AMDGPU_GEM_CREATE_VRAM_LINEAR,
>                                      NULL, NULL, &adev->gart.robj);
>                 if (r) {
>                         return r;
> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_object.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_object.c
> index b8567d2..3945695 100644
> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_object.c
> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_object.c
> @@ -542,6 +542,8 @@ int amdgpu_bo_pin_restricted(struct amdgpu_bo *bo, u32 domain,
>
>                 return 0;
>         }
> +
> +       bo->flags |= AMDGPU_GEM_CREATE_VRAM_LINEAR;
>         amdgpu_ttm_placement_from_domain(bo, domain);
>         for (i = 0; i < bo->placement.num_placement; i++) {
>                 /* force to pin into visible video ram */
> @@ -777,6 +779,15 @@ int amdgpu_bo_fault_reserve_notify(struct ttm_buffer_object *bo)
>         if (bo->mem.mem_type != TTM_PL_VRAM)
>                 return 0;
>
> +       /* TODO: figure out how to map scattered VRAM to the CPU */
> +       if (!(abo->flags & AMDGPU_GEM_CREATE_VRAM_LINEAR)) {
> +               abo->flags |= AMDGPU_GEM_CREATE_VRAM_LINEAR;
> +               amdgpu_ttm_placement_from_domain(abo, AMDGPU_GEM_DOMAIN_VRAM);
> +               r = ttm_bo_validate(bo, &abo->placement, false, false);
> +               if (unlikely(r))
> +                       return r;
> +       }
> +
>         size = bo->mem.num_pages << PAGE_SHIFT;
>         offset = bo->mem.start << PAGE_SHIFT;
>         if ((offset + size) <= adev->mc.visible_vram_size)
> @@ -845,6 +856,8 @@ u64 amdgpu_bo_gpu_offset(struct amdgpu_bo *bo)
>         WARN_ON_ONCE(bo->tbo.mem.mem_type == TTM_PL_SYSTEM);
>         WARN_ON_ONCE(!ww_mutex_is_locked(&bo->tbo.resv->lock) &&
>                      !bo->pin_count);
> +       WARN_ON_ONCE(bo->tbo.mem.mem_type == TTM_PL_VRAM &&
> +                    !(bo->flags & AMDGPU_GEM_CREATE_VRAM_LINEAR));
>
>         return bo->tbo.offset;
>  }
> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_uvd.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_uvd.c
> index 533d702..a425d10 100644
> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_uvd.c
> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_uvd.c
> @@ -890,6 +890,10 @@ int amdgpu_uvd_ring_parse_cs(struct amdgpu_cs_parser *parser, uint32_t ib_idx)
>                 return -EINVAL;
>         }
>
> +       r = amdgpu_cs_make_bos_linear(parser);
> +       if (r)
> +               return r;
> +
>         ctx.parser = parser;
>         ctx.buf_sizes = buf_sizes;
>         ctx.ib_idx = ib_idx;
> @@ -1004,7 +1008,8 @@ int amdgpu_uvd_get_create_msg(struct amdgpu_ring *ring, uint32_t handle,
>
>         r = amdgpu_bo_create(adev, 1024, PAGE_SIZE, true,
>                              AMDGPU_GEM_DOMAIN_VRAM,
> -                            AMDGPU_GEM_CREATE_CPU_ACCESS_REQUIRED,
> +                            AMDGPU_GEM_CREATE_CPU_ACCESS_REQUIRED |
> +                            AMDGPU_GEM_CREATE_VRAM_LINEAR,
>                              NULL, NULL, &bo);
>         if (r)
>                 return r;
> @@ -1053,7 +1058,8 @@ int amdgpu_uvd_get_destroy_msg(struct amdgpu_ring *ring, uint32_t handle,
>
>         r = amdgpu_bo_create(adev, 1024, PAGE_SIZE, true,
>                              AMDGPU_GEM_DOMAIN_VRAM,
> -                            AMDGPU_GEM_CREATE_CPU_ACCESS_REQUIRED,
> +                            AMDGPU_GEM_CREATE_CPU_ACCESS_REQUIRED |
> +                            AMDGPU_GEM_CREATE_VRAM_LINEAR,
>                              NULL, NULL, &bo);
>         if (r)
>                 return r;
> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_vce.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_vce.c
> index 05865ce..9aa4458 100644
> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_vce.c
> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_vce.c
> @@ -634,7 +634,11 @@ int amdgpu_vce_ring_parse_cs(struct amdgpu_cs_parser *p, uint32_t ib_idx)
>         uint32_t allocated = 0;
>         uint32_t tmp, handle = 0;
>         uint32_t *size = &tmp;
> -       int i, r = 0, idx = 0;
> +       int i, r, idx = 0;
> +
> +       r = amdgpu_cs_make_bos_linear(p);
> +       if (r)
> +               return r;
>
>         while (idx < ib->length_dw) {
>                 uint32_t len = amdgpu_get_ib_value(p, ib_idx, idx);
> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_vm.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_vm.c
> index 0b92d36..cafbadb 100644
> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_vm.c
> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_vm.c
> @@ -1362,7 +1362,8 @@ int amdgpu_vm_bo_map(struct amdgpu_device *adev,
>                                      AMDGPU_GPU_PAGE_SIZE, true,
>                                      AMDGPU_GEM_DOMAIN_VRAM,
>                                      AMDGPU_GEM_CREATE_NO_CPU_ACCESS |
> -                                    AMDGPU_GEM_CREATE_SHADOW,
> +                                    AMDGPU_GEM_CREATE_SHADOW |
> +                                    AMDGPU_GEM_CREATE_VRAM_LINEAR,
>                                      NULL, resv, &pt);
>                 if (r)
>                         goto error_free;
> @@ -1562,7 +1563,8 @@ int amdgpu_vm_init(struct amdgpu_device *adev, struct amdgpu_vm *vm)
>         r = amdgpu_bo_create(adev, pd_size, align, true,
>                              AMDGPU_GEM_DOMAIN_VRAM,
>                              AMDGPU_GEM_CREATE_NO_CPU_ACCESS |
> -                            AMDGPU_GEM_CREATE_SHADOW,
> +                            AMDGPU_GEM_CREATE_SHADOW |
> +                            AMDGPU_GEM_CREATE_VRAM_LINEAR,
>                              NULL, NULL, &vm->page_directory);
>         if (r)
>                 goto error_free_sched_entity;
> diff --git a/include/uapi/drm/amdgpu_drm.h b/include/uapi/drm/amdgpu_drm.h
> index da2d3e1..1420c94 100644
> --- a/include/uapi/drm/amdgpu_drm.h
> +++ b/include/uapi/drm/amdgpu_drm.h
> @@ -79,6 +79,8 @@
>  #define AMDGPU_GEM_CREATE_VRAM_CLEARED         (1 << 3)
>  /* Flag that create shadow bo(GTT) while allocating vram bo */
>  #define AMDGPU_GEM_CREATE_SHADOW               (1 << 4)
> +/* Flag that the BO must be allocated using linear VRAM */
> +#define AMDGPU_GEM_CREATE_VRAM_LINEAR          (1 << 5)
>
>  struct drm_amdgpu_gem_create_in  {
>         /** the requested memory size */
> --
> 2.5.0
>
> _______________________________________________
> amd-gfx mailing list
> amd-gfx at lists.freedesktop.org
> https://lists.freedesktop.org/mailman/listinfo/amd-gfx


More information about the amd-gfx mailing list