[Intel-gfx] [PATCH] drm/i915: Simplify processing of the golden render context state
Mika Kuoppala
mika.kuoppala at linux.intel.com
Mon Jun 16 13:40:45 CEST 2014
Chris Wilson <chris at chris-wilson.co.uk> writes:
> Rewrite i915_gem_render_state.c for the purposes of clarity and
> compactness, in the process we can eliminate some dodgy math that did
> not handle 64bit addresses correctly.
>
> Signed-off-by: Chris Wilson <chris at chris-wilson.co.uk>
> Cc: Ville Syrjälä <ville.syrjala at linux.intel.com>
> Cc: Damien Lespiau <damien.lespiau at intel.com>
> Cc: Mika Kuoppala <mika.kuoppala at intel.com>
Reviewed-by: Mika Kuoppala <mika.kuoppala at intel.com>
> ---
> drivers/gpu/drm/i915/i915_gem_render_state.c | 161 +++++++++++---------------
> drivers/gpu/drm/i915/intel_renderstate.h | 2 -
> drivers/gpu/drm/i915/intel_renderstate_gen6.c | 1 +
> drivers/gpu/drm/i915/intel_renderstate_gen7.c | 1 +
> drivers/gpu/drm/i915/intel_renderstate_gen8.c | 1 +
> 5 files changed, 69 insertions(+), 97 deletions(-)
>
> diff --git a/drivers/gpu/drm/i915/i915_gem_render_state.c b/drivers/gpu/drm/i915/i915_gem_render_state.c
> index 3521f998a178..e60be3f552a6 100644
> --- a/drivers/gpu/drm/i915/i915_gem_render_state.c
> +++ b/drivers/gpu/drm/i915/i915_gem_render_state.c
> @@ -28,64 +28,13 @@
> #include "i915_drv.h"
> #include "intel_renderstate.h"
>
> -struct i915_render_state {
> +struct render_state {
> + const struct intel_renderstate_rodata *rodata;
> struct drm_i915_gem_object *obj;
> - unsigned long ggtt_offset;
> - void *batch;
> - u32 size;
> - u32 len;
> + u64 ggtt_offset;
> + int gen;
> };
>
> -static struct i915_render_state *render_state_alloc(struct drm_device *dev)
> -{
> - struct i915_render_state *so;
> - struct page *page;
> - int ret;
> -
> - so = kzalloc(sizeof(*so), GFP_KERNEL);
> - if (!so)
> - return ERR_PTR(-ENOMEM);
> -
> - so->obj = i915_gem_alloc_object(dev, 4096);
> - if (so->obj == NULL) {
> - ret = -ENOMEM;
> - goto free;
> - }
> - so->size = 4096;
> -
> - ret = i915_gem_obj_ggtt_pin(so->obj, 4096, 0);
> - if (ret)
> - goto free_gem;
> -
> - BUG_ON(so->obj->pages->nents != 1);
> - page = sg_page(so->obj->pages->sgl);
> -
> - so->batch = kmap(page);
> - if (!so->batch) {
> - ret = -ENOMEM;
> - goto unpin;
> - }
> -
> - so->ggtt_offset = i915_gem_obj_ggtt_offset(so->obj);
> -
> - return so;
> -unpin:
> - i915_gem_object_ggtt_unpin(so->obj);
> -free_gem:
> - drm_gem_object_unreference(&so->obj->base);
> -free:
> - kfree(so);
> - return ERR_PTR(ret);
> -}
> -
> -static void render_state_free(struct i915_render_state *so)
> -{
> - kunmap(so->batch);
> - i915_gem_object_ggtt_unpin(so->obj);
> - drm_gem_object_unreference(&so->obj->base);
> - kfree(so);
> -}
> -
> static const struct intel_renderstate_rodata *
> render_state_get_rodata(struct drm_device *dev, const int gen)
> {
> @@ -101,98 +50,120 @@ render_state_get_rodata(struct drm_device *dev, const int gen)
> return NULL;
> }
>
> -static int render_state_setup(const int gen,
> - const struct intel_renderstate_rodata *rodata,
> - struct i915_render_state *so)
> +static int render_state_init(struct render_state *so, struct drm_device *dev)
> {
> - const u64 goffset = i915_gem_obj_ggtt_offset(so->obj);
> - u32 reloc_index = 0;
> - u32 * const d = so->batch;
> - unsigned int i = 0;
> int ret;
>
> - if (!rodata || rodata->batch_items * 4 > so->size)
> + so->gen = INTEL_INFO(dev)->gen;
> + so->rodata = render_state_get_rodata(dev, so->gen);
> + if (so->rodata == NULL)
> + return 0;
> +
> + if (so->rodata->batch_items * 4 > 4096)
> return -EINVAL;
>
> + so->obj = i915_gem_alloc_object(dev, 4096);
> + if (so->obj == NULL)
> + return -ENOMEM;
> +
> + ret = i915_gem_obj_ggtt_pin(so->obj, 4096, 0);
> + if (ret)
> + goto free_gem;
> +
> + so->ggtt_offset = i915_gem_obj_ggtt_offset(so->obj);
> + return 0;
> +
> +free_gem:
> + drm_gem_object_unreference(&so->obj->base);
> + return ret;
> +}
> +
> +static int render_state_setup(struct render_state *so)
> +{
> + const struct intel_renderstate_rodata *rodata = so->rodata;
> + unsigned int i = 0, reloc_index = 0;
> + struct page *page;
> + u32 *d;
> + int ret;
> +
> ret = i915_gem_object_set_to_cpu_domain(so->obj, true);
> if (ret)
> return ret;
>
> + page = sg_page(so->obj->pages->sgl);
> + d = kmap(page);
> +
> while (i < rodata->batch_items) {
> u32 s = rodata->batch[i];
>
> - if (reloc_index < rodata->reloc_items &&
> - i * 4 == rodata->reloc[reloc_index]) {
> -
> - s += goffset & 0xffffffff;
> -
> - /* We keep batch offsets max 32bit */
> - if (gen >= 8) {
> + if (i * 4 == rodata->reloc[reloc_index]) {
> + u64 r = s + so->ggtt_offset;
> + s = lower_32_bits(r);
> + if (so->gen >= 8) {
> if (i + 1 >= rodata->batch_items ||
> rodata->batch[i + 1] != 0)
> return -EINVAL;
>
> - d[i] = s;
> - i++;
> - s = (goffset & 0xffffffff00000000ull) >> 32;
> + d[i++] = s;
> + s = upper_32_bits(r);
> }
>
> reloc_index++;
> }
>
> - d[i] = s;
> - i++;
> + d[i++] = s;
> }
> + kunmap(page);
>
> ret = i915_gem_object_set_to_gtt_domain(so->obj, false);
> if (ret)
> return ret;
>
> - if (rodata->reloc_items != reloc_index) {
> - DRM_ERROR("not all relocs resolved, %d out of %d\n",
> - reloc_index, rodata->reloc_items);
> + if (rodata->reloc[reloc_index] != -1) {
> + DRM_ERROR("only %d relocs resolved\n", reloc_index);
> return -EINVAL;
> }
>
> - so->len = rodata->batch_items * 4;
> -
> return 0;
> }
>
> +static void render_state_fini(struct render_state *so)
> +{
> + i915_gem_object_ggtt_unpin(so->obj);
> + drm_gem_object_unreference(&so->obj->base);
> +}
> +
> int i915_gem_render_state_init(struct intel_engine_cs *ring)
> {
> - const int gen = INTEL_INFO(ring->dev)->gen;
> - struct i915_render_state *so;
> - const struct intel_renderstate_rodata *rodata;
> + struct render_state so;
> int ret;
>
> if (WARN_ON(ring->id != RCS))
> return -ENOENT;
>
> - rodata = render_state_get_rodata(ring->dev, gen);
> - if (rodata == NULL)
> - return 0;
> + ret = render_state_init(&so, ring->dev);
> + if (ret)
> + return ret;
>
> - so = render_state_alloc(ring->dev);
> - if (IS_ERR(so))
> - return PTR_ERR(so);
> + if (so.rodata == NULL)
> + return 0;
>
> - ret = render_state_setup(gen, rodata, so);
> + ret = render_state_setup(&so);
> if (ret)
> goto out;
>
> ret = ring->dispatch_execbuffer(ring,
> - i915_gem_obj_ggtt_offset(so->obj),
> - so->len,
> + so.ggtt_offset,
> + so.rodata->batch_items * 4,
> I915_DISPATCH_SECURE);
> if (ret)
> goto out;
>
> - i915_vma_move_to_active(i915_gem_obj_to_ggtt(so->obj), ring);
> + i915_vma_move_to_active(i915_gem_obj_to_ggtt(so.obj), ring);
>
> - ret = __i915_add_request(ring, NULL, so->obj, NULL);
> + ret = __i915_add_request(ring, NULL, so.obj, NULL);
> /* __i915_add_request moves object to inactive if it fails */
> out:
> - render_state_free(so);
> + render_state_fini(&so);
> return ret;
> }
> diff --git a/drivers/gpu/drm/i915/intel_renderstate.h b/drivers/gpu/drm/i915/intel_renderstate.h
> index a5e783a9928a..fd4f66231d30 100644
> --- a/drivers/gpu/drm/i915/intel_renderstate.h
> +++ b/drivers/gpu/drm/i915/intel_renderstate.h
> @@ -28,7 +28,6 @@
>
> struct intel_renderstate_rodata {
> const u32 *reloc;
> - const u32 reloc_items;
> const u32 *batch;
> const u32 batch_items;
> };
> @@ -40,7 +39,6 @@ extern const struct intel_renderstate_rodata gen8_null_state;
> #define RO_RENDERSTATE(_g) \
> const struct intel_renderstate_rodata gen ## _g ## _null_state = { \
> .reloc = gen ## _g ## _null_state_relocs, \
> - .reloc_items = sizeof(gen ## _g ## _null_state_relocs)/4, \
> .batch = gen ## _g ## _null_state_batch, \
> .batch_items = sizeof(gen ## _g ## _null_state_batch)/4, \
> }
> diff --git a/drivers/gpu/drm/i915/intel_renderstate_gen6.c b/drivers/gpu/drm/i915/intel_renderstate_gen6.c
> index 740538ad0977..56c1429d8a60 100644
> --- a/drivers/gpu/drm/i915/intel_renderstate_gen6.c
> +++ b/drivers/gpu/drm/i915/intel_renderstate_gen6.c
> @@ -6,6 +6,7 @@ static const u32 gen6_null_state_relocs[] = {
> 0x0000002c,
> 0x000001e0,
> 0x000001e4,
> + -1,
> };
>
> static const u32 gen6_null_state_batch[] = {
> diff --git a/drivers/gpu/drm/i915/intel_renderstate_gen7.c b/drivers/gpu/drm/i915/intel_renderstate_gen7.c
> index 6fa7ff2a1298..419e35a7b0ff 100644
> --- a/drivers/gpu/drm/i915/intel_renderstate_gen7.c
> +++ b/drivers/gpu/drm/i915/intel_renderstate_gen7.c
> @@ -5,6 +5,7 @@ static const u32 gen7_null_state_relocs[] = {
> 0x00000010,
> 0x00000018,
> 0x000001ec,
> + -1,
> };
>
> static const u32 gen7_null_state_batch[] = {
> diff --git a/drivers/gpu/drm/i915/intel_renderstate_gen8.c b/drivers/gpu/drm/i915/intel_renderstate_gen8.c
> index 5c875615d42a..75ef1b5de45c 100644
> --- a/drivers/gpu/drm/i915/intel_renderstate_gen8.c
> +++ b/drivers/gpu/drm/i915/intel_renderstate_gen8.c
> @@ -5,6 +5,7 @@ static const u32 gen8_null_state_relocs[] = {
> 0x00000050,
> 0x00000060,
> 0x000003ec,
> + -1,
> };
>
> static const u32 gen8_null_state_batch[] = {
> --
> 2.0.0
More information about the Intel-gfx
mailing list