[igt-dev] [PATCH i-g-t] lib/rendercopy: Add gen4/5 rendercopy
Kalamarz, Lukasz
lukasz.kalamarz at intel.com
Wed Jun 13 10:35:56 UTC 2018
On Mon, 2018-06-11 at 19:14 +0300, Ville Syrjala wrote:
> From: Ville Syrjälä <ville.syrjala at linux.intel.com>
>
> Add rendercopy implementation for gen4/5. Basic structure
> copied from the gen6 implementation,
After refactoring some parts of the rendercopy libs, I don't like that
sentence :(
> and the gen4/5 specific
> bits were mostly lifted from sna.
>
> Signed-off-by: Ville Syrjälä <ville.syrjala at linux.intel.com>
> ---
> lib/Makefile.sources | 2 +
> lib/gen4_render.h | 628
> ++++++++++++++++++++++++++++++++++++++++++
> lib/intel_batchbuffer.c | 2 +
> lib/meson.build | 1 +
> lib/rendercopy.h | 5 +
> lib/rendercopy_gen4.c | 704
> ++++++++++++++++++++++++++++++++++++++++++++++++
> 6 files changed, 1342 insertions(+)
> create mode 100644 lib/gen4_render.h
> create mode 100644 lib/rendercopy_gen4.c
>
> diff --git a/lib/Makefile.sources b/lib/Makefile.sources
> index 042c1d3bb44a..e0ebd02c1661 100644
> --- a/lib/Makefile.sources
> +++ b/lib/Makefile.sources
> @@ -71,10 +71,12 @@ lib_source_list = \
> gen8_media.h \
> rendercopy_i915.c \
> rendercopy_i830.c \
> + gen4_render.h \
> gen6_render.h \
> gen7_render.h \
> gen8_render.h \
> gen9_render.h \
> + rendercopy_gen4.c \
> rendercopy_gen6.c \
> rendercopy_gen7.c \
> rendercopy_gen8.c \
> diff --git a/lib/gen4_render.h b/lib/gen4_render.h
> new file mode 100644
> index 000000000000..ab1158e3c6d2
> --- /dev/null
> +++ b/lib/gen4_render.h
Please keep in mind the refactoring of the genX_render libs introduced in
this patch series: https://patchwork.freedesktop.org/series/44624/
Could you check whether the registers defined here with a GEN4/5 prefix are
reimplemented in gen6_render? If so, maybe it would be a good idea to modify
those definitions rather than add more duplicated ones?
> @@ -0,0 +1,628 @@
> +#ifndef GEN4_RENDER_H
> +#define GEN4_RENDER_H
<snip>
> diff --git a/lib/rendercopy_gen4.c b/lib/rendercopy_gen4.c
> new file mode 100644
> index 000000000000..acd4be8de9da
> --- /dev/null
> +++ b/lib/rendercopy_gen4.c
> @@ -0,0 +1,704 @@
> +#include "rendercopy.h"
> +#include "intel_chipset.h"
> +#include "gen4_render.h"
> +#include "surfaceformat.h"
> +
> +#include <assert.h>
> +
> +#define VERTEX_SIZE (3*4)
> +
> +#define URB_VS_ENTRY_SIZE 1
> +#define URB_GS_ENTRY_SIZE 0
> +#define URB_CL_ENTRY_SIZE 0
> +#define URB_SF_ENTRY_SIZE 2
> +#define URB_CS_ENTRY_SIZE 1
> +
> +#define GEN4_GRF_BLOCKS(nreg) (((nreg) + 15) / 16 - 1)
> +#define SF_KERNEL_NUM_GRF 16
> +#define PS_KERNEL_NUM_GRF 32
> +
> +static const uint32_t gen4_sf_kernel_nomask[][4] = {
> + { 0x00400031, 0x20c01fbd, 0x0069002c, 0x01110001 },
> + { 0x00600001, 0x206003be, 0x00690060, 0x00000000 },
> + { 0x00600040, 0x20e077bd, 0x00690080, 0x006940a0 },
> + { 0x00600041, 0x202077be, 0x008d00e0, 0x000000c0 },
> + { 0x00600040, 0x20e077bd, 0x006900a0, 0x00694060 },
> + { 0x00600041, 0x204077be, 0x008d00e0, 0x000000c8 },
> + { 0x00600031, 0x20001fbc, 0x008d0000, 0x8640c800 },
> +};
> +
> +static const uint32_t gen5_sf_kernel_nomask[][4] = {
> + { 0x00400031, 0x20c01fbd, 0x1069002c, 0x02100001 },
> + { 0x00600001, 0x206003be, 0x00690060, 0x00000000 },
> + { 0x00600040, 0x20e077bd, 0x00690080, 0x006940a0 },
> + { 0x00600041, 0x202077be, 0x008d00e0, 0x000000c0 },
> + { 0x00600040, 0x20e077bd, 0x006900a0, 0x00694060 },
> + { 0x00600041, 0x204077be, 0x008d00e0, 0x000000c8 },
> + { 0x00600031, 0x20001fbc, 0x648d0000, 0x8808c800 },
> +};
> +
> +static const uint32_t gen4_ps_kernel_nomask_affine[][4] = {
> + { 0x00800040, 0x23c06d29, 0x00480028, 0x10101010 },
> + { 0x00800040, 0x23806d29, 0x0048002a, 0x11001100 },
> + { 0x00802040, 0x2100753d, 0x008d03c0, 0x00004020 },
> + { 0x00802040, 0x2140753d, 0x008d0380, 0x00004024 },
> + { 0x00802059, 0x200077bc, 0x00000060, 0x008d0100 },
> + { 0x00802048, 0x204077be, 0x00000064, 0x008d0140 },
> + { 0x00802059, 0x200077bc, 0x00000070, 0x008d0100 },
> + { 0x00802048, 0x208077be, 0x00000074, 0x008d0140 },
> + { 0x00600201, 0x20200022, 0x008d0000, 0x00000000 },
> + { 0x00000201, 0x20280062, 0x00000000, 0x00000000 },
> + { 0x01800031, 0x21801d09, 0x008d0000, 0x02580001 },
> + { 0x00600001, 0x204003be, 0x008d0180, 0x00000000 },
> + { 0x00601001, 0x20c003be, 0x008d01a0, 0x00000000 },
> + { 0x00600001, 0x206003be, 0x008d01c0, 0x00000000 },
> + { 0x00601001, 0x20e003be, 0x008d01e0, 0x00000000 },
> + { 0x00600001, 0x208003be, 0x008d0200, 0x00000000 },
> + { 0x00601001, 0x210003be, 0x008d0220, 0x00000000 },
> + { 0x00600001, 0x20a003be, 0x008d0240, 0x00000000 },
> + { 0x00601001, 0x212003be, 0x008d0260, 0x00000000 },
> + { 0x00600201, 0x202003be, 0x008d0020, 0x00000000 },
> + { 0x00800031, 0x20001d28, 0x008d0000, 0x85a04800 },
> +};
> +
> +static const uint32_t gen5_ps_kernel_nomask_affine[][4] = {
> + { 0x00800040, 0x23c06d29, 0x00480028, 0x10101010 },
> + { 0x00800040, 0x23806d29, 0x0048002a, 0x11001100 },
> + { 0x00802040, 0x2100753d, 0x008d03c0, 0x00004020 },
> + { 0x00802040, 0x2140753d, 0x008d0380, 0x00004024 },
> + { 0x00802059, 0x200077bc, 0x00000060, 0x008d0100 },
> + { 0x00802048, 0x204077be, 0x00000064, 0x008d0140 },
> + { 0x00802059, 0x200077bc, 0x00000070, 0x008d0100 },
> + { 0x00802048, 0x208077be, 0x00000074, 0x008d0140 },
> + { 0x01800031, 0x21801fa9, 0x208d0000, 0x0a8a0001 },
> + { 0x00802001, 0x304003be, 0x008d0180, 0x00000000 },
> + { 0x00802001, 0x306003be, 0x008d01c0, 0x00000000 },
> + { 0x00802001, 0x308003be, 0x008d0200, 0x00000000 },
> + { 0x00802001, 0x30a003be, 0x008d0240, 0x00000000 },
> + { 0x00600201, 0x202003be, 0x008d0020, 0x00000000 },
> + { 0x00800031, 0x20001d28, 0x548d0000, 0x94084800 },
> +};
> +
> +static uint32_t
> +batch_used(struct intel_batchbuffer *batch)
> +{
> + return batch->ptr - batch->buffer;
> +}
> +
> +static uint32_t
> +batch_round_upto(struct intel_batchbuffer *batch, uint32_t divisor)
> +{
> + uint32_t offset = batch_used(batch);
> + offset = (offset + divisor - 1) / divisor * divisor;
> + batch->ptr = batch->buffer + offset;
> + return offset;
> +}
Since the same functions are now used in two libs (gen4 and gen6), maybe
it would be worth moving them to intel_batchbuffer (as was done with the
previously copy/pasted functions)?
<snip>
----
Lukasz
More information about the igt-dev
mailing list