[Mesa-dev] [PATCH 15/31] i965/blorp/exec: Refactor to use blorp_context and a void *batch
Pohjolainen, Topi
topi.pohjolainen at gmail.com
Tue Aug 23 15:33:44 UTC 2016
On Fri, Aug 19, 2016 at 09:55:52AM -0700, Jason Ekstrand wrote:
> This gets rid of brw_context throughout the core of the state setup code.
> ---
> src/mesa/drivers/dri/i965/genX_blorp_exec.c | 332 +++++++++++++++-------------
> 1 file changed, 182 insertions(+), 150 deletions(-)
>
> diff --git a/src/mesa/drivers/dri/i965/genX_blorp_exec.c b/src/mesa/drivers/dri/i965/genX_blorp_exec.c
> index 288e384..8c15b16 100644
> --- a/src/mesa/drivers/dri/i965/genX_blorp_exec.c
> +++ b/src/mesa/drivers/dri/i965/genX_blorp_exec.c
> @@ -34,8 +34,11 @@
> #include "genxml/gen_macros.h"
>
> static void *
> -blorp_emit_dwords(struct brw_context *brw, unsigned n)
> +blorp_emit_dwords(struct blorp_context *blorp, void *batch, unsigned n)
> {
> + assert(blorp->driver_ctx == batch);
> + struct brw_context *brw = batch;
> +
> intel_batchbuffer_begin(brw, n, RENDER_RING);
> uint32_t *map = brw->batch.map_next;
> brw->batch.map_next += n;
> @@ -44,9 +47,12 @@ blorp_emit_dwords(struct brw_context *brw, unsigned n)
> }
>
> static uint64_t
> -blorp_emit_reloc(struct brw_context *brw, void *location,
> - struct blorp_address address, uint32_t delta)
> +blorp_emit_reloc(struct blorp_context *blorp, void *batch,
> + void *location, struct blorp_address address, uint32_t delta)
> {
> + assert(blorp->driver_ctx == batch);
> + struct brw_context *brw = batch;
> +
> uint32_t offset = (char *)location - (char *)brw->batch.map;
> if (brw->gen >= 8) {
> return intel_batchbuffer_reloc64(brw, address.buffer, offset,
> @@ -62,9 +68,11 @@ blorp_emit_reloc(struct brw_context *brw, void *location,
> }
>
> static void
> -blorp_surface_reloc(struct brw_context *brw, uint32_t ss_offset,
> +blorp_surface_reloc(struct blorp_context *blorp, uint32_t ss_offset,
> struct blorp_address address, uint32_t delta)
> {
> + struct brw_context *brw = blorp->driver_ctx;
> +
> drm_intel_bo_emit_reloc(brw->batch.bo, ss_offset,
> address.buffer, address.offset + delta,
> address.read_domains, address.write_domain);
> @@ -129,8 +137,12 @@ blorp_alloc_vertex_buffer(struct blorp_context *blorp, uint32_t size,
> }
>
> static void
> -blorp_emit_urb_config(struct brw_context *brw, unsigned vs_entry_size)
> +blorp_emit_urb_config(struct blorp_context *blorp, void *batch,
> + unsigned vs_entry_size)
> {
> + assert(blorp->driver_ctx == batch);
> + struct brw_context *brw = batch;
> +
> #if GEN_GEN >= 7
> if (!(brw->ctx.NewDriverState & (BRW_NEW_CONTEXT | BRW_NEW_URB_SIZE)) &&
> brw->urb.vsize >= vs_entry_size)
> @@ -145,26 +157,34 @@ blorp_emit_urb_config(struct brw_context *brw, unsigned vs_entry_size)
> }
>
> static void
> -blorp_emit_3dstate_multisample(struct brw_context *brw, unsigned samples)
> +blorp_emit_3dstate_multisample(struct blorp_context *blorp, void *batch,
> + unsigned samples)
> {
> + assert(blorp->driver_ctx == batch);
> #if GEN_GEN >= 8
> - gen8_emit_3dstate_multisample(brw, samples);
> + gen8_emit_3dstate_multisample(batch, samples);
> #else
> - gen6_emit_3dstate_multisample(brw, samples);
> + gen6_emit_3dstate_multisample(batch, samples);
> #endif
> }
>
> +struct blorp_batch {
> + struct blorp_context *blorp;
> + void *batch;
> +};
> +
> #define __gen_address_type struct blorp_address
> -#define __gen_user_data struct brw_context
> +#define __gen_user_data struct blorp_batch
>
> static uint64_t
> -__gen_combine_address(struct brw_context *brw, void *location,
> +__gen_combine_address(struct blorp_batch *batch, void *location,
> struct blorp_address address, uint32_t delta)
> {
> if (address.buffer == NULL) {
> return address.offset + delta;
> } else {
> - return blorp_emit_reloc(brw, location, address, delta);
> + return blorp_emit_reloc(batch->blorp, batch->batch,
> + location, address, delta);
> }
> }
>
> @@ -175,21 +195,22 @@ __gen_combine_address(struct brw_context *brw, void *location,
> #define _blorp_cmd_header(cmd) cmd ## _header
> #define _blorp_cmd_pack(cmd) cmd ## _pack
>
> -#define blorp_emit(brw, cmd, name) \
> - for (struct cmd name = { _blorp_cmd_header(cmd) }, \
> - *_dst = blorp_emit_dwords(brw, _blorp_cmd_length(cmd)); \
> - __builtin_expect(_dst != NULL, 1); \
> - _blorp_cmd_pack(cmd)(brw, (void *)_dst, &name), \
> +#define blorp_emit(batch, cmd, name) \
> + for (struct cmd name = { _blorp_cmd_header(cmd) }, \
> + *_dst = blorp_emit_dwords(batch.blorp, batch.batch, \
> + _blorp_cmd_length(cmd)); \
> + __builtin_expect(_dst != NULL, 1); \
> + _blorp_cmd_pack(cmd)(&batch, (void *)_dst, &name), \
> _dst = NULL)
>
> -#define blorp_emitn(batch, cmd, n) ({ \
> - uint32_t *_dw = blorp_emit_dwords(batch, n); \
> - struct cmd template = { \
> - _blorp_cmd_header(cmd), \
> - .DWordLength = n - _blorp_cmd_length_bias(cmd), \
> - }; \
> - _blorp_cmd_pack(cmd)(batch, _dw, &template); \
> - _dw + 1; /* Array starts at dw[1] */ \
> +#define blorp_emitn(batch, cmd, n) ({ \
> + uint32_t *_dw = blorp_emit_dwords(batch.blorp, batch.batch, n); \
> + struct cmd template = { \
> + _blorp_cmd_header(cmd), \
> + .DWordLength = n - _blorp_cmd_length_bias(cmd), \
> + }; \
> + _blorp_cmd_pack(cmd)(&batch, _dw, &template); \
> + _dw + 1; /* Array starts at dw[1] */ \
> })
>
> /* Once vertex fetcher has written full VUE entries with complete
> @@ -242,14 +263,15 @@ gen7_blorp_get_vs_entry_size(const struct brw_blorp_params *params)
> * valid.
> */
> static void
> -emit_urb_config(struct brw_context *brw,
> +emit_urb_config(struct blorp_batch batch,
> const struct brw_blorp_params *params)
> {
> - blorp_emit_urb_config(brw, gen7_blorp_get_vs_entry_size(params));
> + blorp_emit_urb_config(batch.blorp, batch.batch,
> + gen7_blorp_get_vs_entry_size(params));
> }
>
> static void
> -blorp_emit_vertex_data(struct brw_context *brw,
> +blorp_emit_vertex_data(struct blorp_batch batch,
> const struct brw_blorp_params *params,
> struct blorp_address *addr,
> uint32_t *size)
> @@ -260,13 +282,13 @@ blorp_emit_vertex_data(struct brw_context *brw,
> /* v2 */ (float)params->x0, (float)params->y0,
> };
>
> - void *data = blorp_alloc_vertex_buffer(&brw->blorp, sizeof(vertices), addr);
> + void *data = blorp_alloc_vertex_buffer(batch.blorp, sizeof(vertices), addr);
> memcpy(data, vertices, sizeof(vertices));
> *size = sizeof(vertices);
> }
>
> static void
> -blorp_emit_input_varying_data(struct brw_context *brw,
> +blorp_emit_input_varying_data(struct blorp_batch batch,
> const struct brw_blorp_params *params,
> struct blorp_address *addr,
> uint32_t *size)
> @@ -279,7 +301,7 @@ blorp_emit_input_varying_data(struct brw_context *brw,
> *size = num_varyings * vec4_size_in_bytes;
>
> const float *const inputs_src = (const float *)¶ms->wm_inputs;
> - float *inputs = blorp_alloc_vertex_buffer(&brw->blorp, *size, addr);
> + float *inputs = blorp_alloc_vertex_buffer(batch.blorp, *size, addr);
>
> /* Walk over the attribute slots, determine if the attribute is used by
> * the program and when necessary copy the values from the input storage to
> @@ -298,7 +320,7 @@ blorp_emit_input_varying_data(struct brw_context *brw,
> }
>
> static void
> -blorp_emit_vertex_buffers(struct brw_context *brw,
> +blorp_emit_vertex_buffers(struct blorp_batch batch,
> const struct brw_blorp_params *params)
> {
> struct GENX(VERTEX_BUFFER_STATE) vb[2];
> @@ -307,10 +329,10 @@ blorp_emit_vertex_buffers(struct brw_context *brw,
> unsigned num_buffers = 1;
>
> uint32_t size;
> - blorp_emit_vertex_data(brw, params, &vb[0].BufferStartingAddress, &size);
> + blorp_emit_vertex_data(batch, params, &vb[0].BufferStartingAddress, &size);
> vb[0].VertexBufferIndex = 0;
> vb[0].BufferPitch = 2 * sizeof(float);
> - vb[0].VertexBufferMOCS = brw->blorp.mocs.vb;
> + vb[0].VertexBufferMOCS = batch.blorp->mocs.vb;
> #if GEN_GEN >= 7
> vb[0].AddressModifyEnable = true;
> #endif
> @@ -323,11 +345,11 @@ blorp_emit_vertex_buffers(struct brw_context *brw,
> #endif
>
> if (params->wm_prog_data && params->wm_prog_data->num_varying_inputs) {
> - blorp_emit_input_varying_data(brw, params,
> + blorp_emit_input_varying_data(batch, params,
> &vb[1].BufferStartingAddress, &size);
> vb[1].VertexBufferIndex = 1;
> vb[1].BufferPitch = 0;
> - vb[1].VertexBufferMOCS = brw->blorp.mocs.vb;
> + vb[1].VertexBufferMOCS = batch.blorp->mocs.vb;
> #if GEN_GEN >= 7
> vb[1].AddressModifyEnable = true;
> #endif
> @@ -343,16 +365,16 @@ blorp_emit_vertex_buffers(struct brw_context *brw,
>
> const unsigned num_dwords =
> 1 + GENX(VERTEX_BUFFER_STATE_length) * num_buffers;
> - uint32_t *dw = blorp_emitn(brw, GENX(3DSTATE_VERTEX_BUFFERS), num_dwords);
> + uint32_t *dw = blorp_emitn(batch, GENX(3DSTATE_VERTEX_BUFFERS), num_dwords);
>
> for (unsigned i = 0; i < num_buffers; i++) {
> - GENX(VERTEX_BUFFER_STATE_pack)(brw, dw, &vb[i]);
> + GENX(VERTEX_BUFFER_STATE_pack)(&batch, dw, &vb[i]);
> dw += GENX(VERTEX_BUFFER_STATE_length);
> }
> }
>
> static void
> -blorp_emit_vertex_elements(struct brw_context *brw,
> +blorp_emit_vertex_elements(struct blorp_batch batch,
> const struct brw_blorp_params *params)
> {
> const unsigned num_varyings =
> @@ -437,31 +459,31 @@ blorp_emit_vertex_elements(struct brw_context *brw,
>
> const unsigned num_dwords =
> 1 + GENX(VERTEX_ELEMENT_STATE_length) * num_elements;
> - uint32_t *dw = blorp_emitn(brw, GENX(3DSTATE_VERTEX_ELEMENTS), num_dwords);
> + uint32_t *dw = blorp_emitn(batch, GENX(3DSTATE_VERTEX_ELEMENTS), num_dwords);
>
> for (unsigned i = 0; i < num_elements; i++) {
> - GENX(VERTEX_ELEMENT_STATE_pack)(brw, dw, &ve[i]);
> + GENX(VERTEX_ELEMENT_STATE_pack)(&batch, dw, &ve[i]);
> dw += GENX(VERTEX_ELEMENT_STATE_length);
> }
>
> #if GEN_GEN >= 8
> - blorp_emit(brw, GENX(3DSTATE_VF_SGVS), sgvs);
> + blorp_emit(batch, GENX(3DSTATE_VF_SGVS), sgvs);
>
> for (unsigned i = 0; i < num_elements; i++) {
> - blorp_emit(brw, GENX(3DSTATE_VF_INSTANCING), vf) {
> + blorp_emit(batch, GENX(3DSTATE_VF_INSTANCING), vf) {
> vf.VertexElementIndex = i;
> vf.InstancingEnable = false;
> }
> }
>
> - blorp_emit(brw, GENX(3DSTATE_VF_TOPOLOGY), topo) {
> + blorp_emit(batch, GENX(3DSTATE_VF_TOPOLOGY), topo) {
> topo.PrimitiveTopologyType = _3DPRIM_RECTLIST;
> }
> #endif
> }
>
> static void
> -blorp_emit_sf_config(struct brw_context *brw,
> +blorp_emit_sf_config(struct blorp_batch batch,
> const struct brw_blorp_params *params)
> {
> const struct brw_blorp_prog_data *prog_data = params->wm_prog_data;
> @@ -487,13 +509,13 @@ blorp_emit_sf_config(struct brw_context *brw,
>
> #if GEN_GEN >= 8
>
> - blorp_emit(brw, GENX(3DSTATE_SF), sf);
> + blorp_emit(batch, GENX(3DSTATE_SF), sf);
>
> - blorp_emit(brw, GENX(3DSTATE_RASTER), raster) {
> + blorp_emit(batch, GENX(3DSTATE_RASTER), raster) {
> raster.CullMode = CULLMODE_NONE;
> }
>
> - blorp_emit(brw, GENX(3DSTATE_SBE), sbe) {
> + blorp_emit(batch, GENX(3DSTATE_SBE), sbe) {
> sbe.VertexURBEntryReadOffset = BRW_SF_URB_ENTRY_READ_OFFSET;
> sbe.NumberofSFOutputAttributes = prog_data->num_varying_inputs;
> sbe.VertexURBEntryReadLength = brw_blorp_get_urb_length(prog_data);
> @@ -509,7 +531,7 @@ blorp_emit_sf_config(struct brw_context *brw,
>
> #elif GEN_GEN >= 7
>
> - blorp_emit(brw, GENX(3DSTATE_SF), sf) {
> + blorp_emit(batch, GENX(3DSTATE_SF), sf) {
> sf.FrontFaceFillMode = FILL_MODE_SOLID;
> sf.BackFaceFillMode = FILL_MODE_SOLID;
>
> @@ -521,7 +543,7 @@ blorp_emit_sf_config(struct brw_context *brw,
> #endif
> }
>
> - blorp_emit(brw, GENX(3DSTATE_SBE), sbe) {
> + blorp_emit(batch, GENX(3DSTATE_SBE), sbe) {
> sbe.VertexURBEntryReadOffset = BRW_SF_URB_ENTRY_READ_OFFSET;
> if (prog_data) {
> sbe.NumberofSFOutputAttributes = prog_data->num_varying_inputs;
> @@ -535,7 +557,7 @@ blorp_emit_sf_config(struct brw_context *brw,
>
> #else /* GEN_GEN <= 6 */
>
> - blorp_emit(brw, GENX(3DSTATE_SF), sf) {
> + blorp_emit(batch, GENX(3DSTATE_SF), sf) {
> sf.FrontFaceFillMode = FILL_MODE_SOLID;
> sf.BackFaceFillMode = FILL_MODE_SOLID;
>
> @@ -557,7 +579,7 @@ blorp_emit_sf_config(struct brw_context *brw,
> }
>
> static void
> -blorp_emit_ps_config(struct brw_context *brw,
> +blorp_emit_ps_config(struct blorp_batch batch,
> const struct brw_blorp_params *params)
> {
> const struct brw_blorp_prog_data *prog_data = params->wm_prog_data;
> @@ -573,9 +595,9 @@ blorp_emit_ps_config(struct brw_context *brw,
>
> #if GEN_GEN >= 8
>
> - blorp_emit(brw, GENX(3DSTATE_WM), wm);
> + blorp_emit(batch, GENX(3DSTATE_WM), wm);
>
> - blorp_emit(brw, GENX(3DSTATE_PS), ps) {
> + blorp_emit(batch, GENX(3DSTATE_PS), ps) {
> if (params->src.addr.buffer) {
> ps.SamplerCount = 1; /* Up to 4 samplers */
> ps.BindingTableEntryCount = 2;
> @@ -625,7 +647,7 @@ blorp_emit_ps_config(struct brw_context *brw,
> }
> }
>
> - blorp_emit(brw, GENX(3DSTATE_PS_EXTRA), psx) {
> + blorp_emit(batch, GENX(3DSTATE_PS_EXTRA), psx) {
> psx.PixelShaderValid = true;
>
> if (params->src.addr.buffer)
> @@ -639,7 +661,7 @@ blorp_emit_ps_config(struct brw_context *brw,
>
> #elif GEN_GEN >= 7
>
> - blorp_emit(brw, GENX(3DSTATE_WM), wm) {
> + blorp_emit(batch, GENX(3DSTATE_WM), wm) {
> switch (params->hiz_op) {
> case GEN6_HIZ_OP_DEPTH_CLEAR:
> wm.DepthBufferClear = true;
> @@ -673,8 +695,8 @@ blorp_emit_ps_config(struct brw_context *brw,
> }
> }
>
> - blorp_emit(brw, GENX(3DSTATE_PS), ps) {
> - ps.MaximumNumberofThreads = brw->max_wm_threads - 1;
> + blorp_emit(batch, GENX(3DSTATE_PS), ps) {
> + ps.MaximumNumberofThreads = batch.blorp->isl_dev->info->max_wm_threads - 1;
>
> #if GEN_IS_HASWELL
> ps.SampleMask = 1;
> @@ -716,8 +738,8 @@ blorp_emit_ps_config(struct brw_context *brw,
>
> #else /* GEN_GEN <= 6 */
>
> - blorp_emit(brw, GENX(3DSTATE_WM), wm) {
> - wm.MaximumNumberofThreads = brw->max_wm_threads - 1;
> + blorp_emit(batch, GENX(3DSTATE_WM), wm) {
> + wm.MaximumNumberofThreads = batch.blorp->isl_dev->info->max_wm_threads - 1;
>
> switch (params->hiz_op) {
> case GEN6_HIZ_OP_DEPTH_CLEAR:
> @@ -774,18 +796,16 @@ blorp_emit_ps_config(struct brw_context *brw,
>
>
> static void
> -blorp_emit_depth_stencil_config(struct brw_context *brw,
> +blorp_emit_depth_stencil_config(struct blorp_batch batch,
> const struct brw_blorp_params *params)
> {
> - brw_emit_depth_stall_flushes(brw);
> -
> #if GEN_GEN >= 7
> const uint32_t mocs = 1; /* GEN7_MOCS_L3 */
> #else
> const uint32_t mocs = 0;
> #endif
>
> - blorp_emit(brw, GENX(3DSTATE_DEPTH_BUFFER), db) {
> + blorp_emit(batch, GENX(3DSTATE_DEPTH_BUFFER), db) {
> switch (params->depth.surf.dim) {
> case ISL_SURF_DIM_1D:
> db.SurfaceType = SURFTYPE_1D;
> @@ -827,17 +847,17 @@ blorp_emit_depth_stencil_config(struct brw_context *brw,
> db.DepthBufferMOCS = mocs;
> }
>
> - blorp_emit(brw, GENX(3DSTATE_HIER_DEPTH_BUFFER), hiz) {
> + blorp_emit(batch, GENX(3DSTATE_HIER_DEPTH_BUFFER), hiz) {
> hiz.SurfacePitch = params->depth.aux_surf.row_pitch - 1;
> hiz.SurfaceBaseAddress = params->depth.aux_addr;
> hiz.HierarchicalDepthBufferMOCS = mocs;
> }
>
> - blorp_emit(brw, GENX(3DSTATE_STENCIL_BUFFER), sb);
> + blorp_emit(batch, GENX(3DSTATE_STENCIL_BUFFER), sb);
> }
>
> static uint32_t
> -blorp_emit_blend_state(struct brw_context *brw,
> +blorp_emit_blend_state(struct blorp_batch batch,
> const struct brw_blorp_params *params)
> {
> struct GENX(BLEND_STATE) blend;
> @@ -855,14 +875,14 @@ blorp_emit_blend_state(struct brw_context *brw,
> }
>
> uint32_t offset;
> - void *state = blorp_alloc_dynamic_state(&brw->blorp,
> + void *state = blorp_alloc_dynamic_state(batch.blorp,
> AUB_TRACE_BLEND_STATE,
> GENX(BLEND_STATE_length) * 4,
> 64, &offset);
> GENX(BLEND_STATE_pack)(NULL, state, &blend);
>
> #if GEN_GEN >= 7
> - blorp_emit(brw, GENX(3DSTATE_BLEND_STATE_POINTERS), sp) {
> + blorp_emit(batch, GENX(3DSTATE_BLEND_STATE_POINTERS), sp) {
> sp.BlendStatePointer = offset;
> #if GEN_GEN >= 8
> sp.BlendStatePointerValid = true;
> @@ -871,7 +891,7 @@ blorp_emit_blend_state(struct brw_context *brw,
> #endif
>
> #if GEN_GEN >= 8
> - blorp_emit(brw, GENX(3DSTATE_PS_BLEND), ps_blend) {
> + blorp_emit(batch, GENX(3DSTATE_PS_BLEND), ps_blend) {
> ps_blend.HasWriteableRT = true;
> }
> #endif
> @@ -880,18 +900,18 @@ blorp_emit_blend_state(struct brw_context *brw,
> }
>
> static uint32_t
> -blorp_emit_color_calc_state(struct brw_context *brw,
> +blorp_emit_color_calc_state(struct blorp_batch batch,
> const struct brw_blorp_params *params)
> {
> uint32_t offset;
> - void *state = blorp_alloc_dynamic_state(&brw->blorp,
> + void *state = blorp_alloc_dynamic_state(batch.blorp,
> AUB_TRACE_CC_STATE,
> GENX(COLOR_CALC_STATE_length) * 4,
> 64, &offset);
> memset(state, 0, GENX(COLOR_CALC_STATE_length) * 4);
>
> #if GEN_GEN >= 7
> - blorp_emit(brw, GENX(3DSTATE_CC_STATE_POINTERS), sp) {
> + blorp_emit(batch, GENX(3DSTATE_CC_STATE_POINTERS), sp) {
> sp.ColorCalcStatePointer = offset;
> #if GEN_GEN >= 8
> sp.ColorCalcStatePointerValid = true;
> @@ -903,13 +923,13 @@ blorp_emit_color_calc_state(struct brw_context *brw,
> }
>
> static uint32_t
> -blorp_emit_depth_stencil_state(struct brw_context *brw,
> +blorp_emit_depth_stencil_state(struct blorp_batch batch,
> const struct brw_blorp_params *params)
> {
> #if GEN_GEN >= 8
>
> /* On gen8+, DEPTH_STENCIL state is simply an instruction */
> - blorp_emit(brw, GENX(3DSTATE_WM_DEPTH_STENCIL), ds);
> + blorp_emit(batch, GENX(3DSTATE_WM_DEPTH_STENCIL), ds);
> return 0;
>
> #else /* GEN_GEN <= 7 */
> @@ -929,14 +949,14 @@ blorp_emit_depth_stencil_state(struct brw_context *brw,
> }
>
> uint32_t offset;
> - void *state = blorp_alloc_dynamic_state(&brw->blorp,
> + void *state = blorp_alloc_dynamic_state(batch.blorp,
> AUB_TRACE_DEPTH_STENCIL_STATE,
> GENX(DEPTH_STENCIL_STATE_length) * 4,
> 64, &offset);
> GENX(DEPTH_STENCIL_STATE_pack)(NULL, state, &ds);
>
> #if GEN_GEN >= 7
> - blorp_emit(brw, GENX(3DSTATE_DEPTH_STENCIL_STATE_POINTERS), sp) {
> + blorp_emit(batch, GENX(3DSTATE_DEPTH_STENCIL_STATE_POINTERS), sp) {
> sp.PointertoDEPTH_STENCIL_STATE = offset;
> }
> #endif
> @@ -961,12 +981,12 @@ static const struct surface_state_info surface_state_infos[] = {
> };
>
> static void
> -blorp_emit_surface_state(struct brw_context *brw,
> +blorp_emit_surface_state(struct blorp_context *blorp,
> const struct brw_blorp_surface_info *surface,
> uint32_t *state, uint32_t state_offset,
> bool is_render_target)
> {
> - const struct surface_state_info ss_info = surface_state_infos[brw->gen];
> + const struct surface_state_info ss_info = surface_state_infos[GEN_GEN];
>
> struct isl_surf surf = surface->surf;
>
> @@ -981,17 +1001,16 @@ blorp_emit_surface_state(struct brw_context *brw,
> if (aux_usage == ISL_AUX_USAGE_HIZ)
> aux_usage = ISL_AUX_USAGE_NONE;
>
> - const uint32_t mocs =
> - is_render_target ? brw->blorp.mocs.rb : brw->blorp.mocs.tex;
> + const uint32_t mocs = is_render_target ? blorp->mocs.rb : blorp->mocs.tex;
>
> - isl_surf_fill_state(&brw->isl_dev, state,
> + isl_surf_fill_state(blorp->isl_dev, state,
> .surf = &surf, .view = &surface->view,
> .aux_surf = &surface->aux_surf, .aux_usage = aux_usage,
> .mocs = mocs, .clear_color = surface->clear_color,
> .x_offset_sa = surface->tile_x_sa,
> .y_offset_sa = surface->tile_y_sa);
>
> - blorp_surface_reloc(brw, state_offset + ss_info.reloc_dw * 4,
> + blorp_surface_reloc(blorp, state_offset + ss_info.reloc_dw * 4,
> surface->addr, 0);
>
> if (aux_usage != ISL_AUX_USAGE_NONE) {
> @@ -1000,13 +1019,13 @@ blorp_emit_surface_state(struct brw_context *brw,
> * surface buffer addresses are always 4K page alinged.
> */
> assert((surface->aux_addr.offset & 0xfff) == 0);
> - blorp_surface_reloc(brw, state_offset + ss_info.aux_reloc_dw * 4,
> + blorp_surface_reloc(blorp, state_offset + ss_info.aux_reloc_dw * 4,
> surface->aux_addr, state[ss_info.aux_reloc_dw]);
> }
> }
>
> static void
> -blorp_emit_surface_states(struct brw_context *brw,
> +blorp_emit_surface_states(struct blorp_batch batch,
> const struct brw_blorp_params *params)
> {
> uint32_t bind_offset, *bind_map;
> @@ -1016,24 +1035,24 @@ blorp_emit_surface_states(struct brw_context *brw,
> const unsigned ss_align = GENX(RENDER_SURFACE_STATE_length) > 8 ? 64 : 32;
>
> unsigned num_surfaces = 1 + (params->src.addr.buffer != NULL);
> - blorp_alloc_binding_table(&brw->blorp, num_surfaces, ss_size, ss_align,
> + blorp_alloc_binding_table(batch.blorp, num_surfaces, ss_size, ss_align,
> &bind_offset, &bind_map, surface_maps);
>
> - blorp_emit_surface_state(brw, ¶ms->dst,
> + blorp_emit_surface_state(batch.blorp, ¶ms->dst,
> surface_maps[BLORP_RENDERBUFFER_BT_INDEX],
> bind_map[BLORP_RENDERBUFFER_BT_INDEX], true);
> if (params->src.addr.buffer) {
> - blorp_emit_surface_state(brw, ¶ms->src,
> + blorp_emit_surface_state(batch.blorp, ¶ms->src,
> surface_maps[BLORP_TEXTURE_BT_INDEX],
> bind_map[BLORP_TEXTURE_BT_INDEX], false);
> }
>
> #if GEN_GEN >= 7
> - blorp_emit(brw, GENX(3DSTATE_BINDING_TABLE_POINTERS_PS), bt) {
> + blorp_emit(batch, GENX(3DSTATE_BINDING_TABLE_POINTERS_PS), bt) {
> bt.PointertoPSBindingTable = bind_offset;
> }
> #else
> - blorp_emit(brw, GENX(3DSTATE_BINDING_TABLE_POINTERS), bt) {
> + blorp_emit(batch, GENX(3DSTATE_BINDING_TABLE_POINTERS), bt) {
> bt.PSBindingTableChange = true;
> bt.PointertoPSBindingTable = bind_offset;
> }
> @@ -1041,7 +1060,7 @@ blorp_emit_surface_states(struct brw_context *brw,
> }
>
> static void
> -blorp_emit_sampler_state(struct brw_context *brw,
> +blorp_emit_sampler_state(struct blorp_batch batch,
> const struct brw_blorp_params *params)
> {
> struct GENX(SAMPLER_STATE) sampler = {
> @@ -1064,18 +1083,18 @@ blorp_emit_sampler_state(struct brw_context *brw,
> };
>
> uint32_t offset;
> - void *state = blorp_alloc_dynamic_state(&brw->blorp,
> + void *state = blorp_alloc_dynamic_state(batch.blorp,
> AUB_TRACE_SAMPLER_STATE,
> GENX(SAMPLER_STATE_length) * 4,
> 32, &offset);
> GENX(SAMPLER_STATE_pack)(NULL, state, &sampler);
>
> #if GEN_GEN >= 7
> - blorp_emit(brw, GENX(3DSTATE_SAMPLER_STATE_POINTERS_PS), ssp) {
> + blorp_emit(batch, GENX(3DSTATE_SAMPLER_STATE_POINTERS_PS), ssp) {
> ssp.PointertoPSSamplerState = offset;
> }
> #else
> - blorp_emit(brw, GENX(3DSTATE_SAMPLER_STATE_POINTERS), ssp) {
> + blorp_emit(batch, GENX(3DSTATE_SAMPLER_STATE_POINTERS), ssp) {
> ssp.VSSamplerStateChange = true;
> ssp.GSSamplerStateChange = true;
> ssp.PSSamplerStateChange = true;
> @@ -1086,28 +1105,28 @@ blorp_emit_sampler_state(struct brw_context *brw,
>
> /* 3DSTATE_VIEWPORT_STATE_POINTERS */
> static void
> -blorp_emit_viewport_state(struct brw_context *brw,
> +blorp_emit_viewport_state(struct blorp_batch batch,
> const struct brw_blorp_params *params)
> {
> uint32_t cc_vp_offset;
>
> - void *state = blorp_alloc_dynamic_state(&brw->blorp,
> + void *state = blorp_alloc_dynamic_state(batch.blorp,
> AUB_TRACE_CC_VP_STATE,
> GENX(CC_VIEWPORT_length) * 4, 32,
> &cc_vp_offset);
>
> - GENX(CC_VIEWPORT_pack)(brw, state,
> + GENX(CC_VIEWPORT_pack)(&batch, state,
> &(struct GENX(CC_VIEWPORT)) {
> .MinimumDepth = 0.0,
> .MaximumDepth = 1.0,
> });
>
> #if GEN_GEN >= 7
> - blorp_emit(brw, GENX(3DSTATE_VIEWPORT_STATE_POINTERS_CC), vsp) {
> + blorp_emit(batch, GENX(3DSTATE_VIEWPORT_STATE_POINTERS_CC), vsp) {
> vsp.CCViewportPointer = cc_vp_offset;
> }
> #else
> - blorp_emit(brw, GENX(3DSTATE_VIEWPORT_STATE_POINTERS), vsp) {
> + blorp_emit(batch, GENX(3DSTATE_VIEWPORT_STATE_POINTERS), vsp) {
> vsp.CCViewportStateChange = true;
> vsp.PointertoCC_VIEWPORT = cc_vp_offset;
> }
> @@ -1124,35 +1143,29 @@ blorp_emit_viewport_state(struct brw_context *brw,
> *
> * This function alters no GL state.
> */
> -void
> -genX(blorp_exec)(struct brw_context *brw,
> - const struct brw_blorp_params *params)
> +static void
> +blorp_exec(struct blorp_context *blorp, void *batch_data,
> + const struct brw_blorp_params *params)
> {
> + struct blorp_batch batch = {
> + .blorp = blorp,
> + .batch = batch_data,
> + };
> +
I was sort of expecting the callers to provide an instance of blorp_batch
instead of separate blorp_context and void*. Not a big deal though.
I read half-way through more carefully and skimmed the rest. I don't think
this would even compile if you had an obvious mistake somewhere. So:
Reviewed-by: Topi Pohjolainen <topi.pohjolainen at intel.com>
> uint32_t blend_state_offset = 0;
> uint32_t color_calc_state_offset = 0;
> uint32_t depth_stencil_state_offset;
>
> -#if GEN_GEN == 6
> - /* Emit workaround flushes when we switch from drawing to blorping. */
> - brw_emit_post_sync_nonzero_flush(brw);
> -#endif
> -
> - brw_upload_state_base_address(brw);
> -
> -#if GEN_GEN >= 8
> - gen7_l3_state.emit(brw);
> -#endif
> -
> - blorp_emit_vertex_buffers(brw, params);
> - blorp_emit_vertex_elements(brw, params);
> + blorp_emit_vertex_buffers(batch, params);
> + blorp_emit_vertex_elements(batch, params);
>
> - emit_urb_config(brw, params);
> + emit_urb_config(batch, params);
>
> if (params->wm_prog_data) {
> - blend_state_offset = blorp_emit_blend_state(brw, params);
> - color_calc_state_offset = blorp_emit_color_calc_state(brw, params);
> + blend_state_offset = blorp_emit_blend_state(batch, params);
> + color_calc_state_offset = blorp_emit_color_calc_state(batch, params);
> }
> - depth_stencil_state_offset = blorp_emit_depth_stencil_state(brw, params);
> + depth_stencil_state_offset = blorp_emit_depth_stencil_state(batch, params);
>
> #if GEN_GEN <= 6
> /* 3DSTATE_CC_STATE_POINTERS
> @@ -1166,7 +1179,7 @@ genX(blorp_exec)(struct brw_context *brw,
> * gen7+. However, on gen6 and earlier, they're all lumpped together in
> * one CC_STATE_POINTERS packet so we have to emit that here.
> */
> - blorp_emit(brw, GENX(3DSTATE_CC_STATE_POINTERS), cc) {
> + blorp_emit(batch, GENX(3DSTATE_CC_STATE_POINTERS), cc) {
> cc.BLEND_STATEChange = true;
> cc.COLOR_CALC_STATEChange = true;
> cc.DEPTH_STENCIL_STATEChange = true;
> @@ -1180,26 +1193,24 @@ genX(blorp_exec)(struct brw_context *brw,
> (void)depth_stencil_state_offset;
> #endif
>
> - blorp_emit(brw, GENX(3DSTATE_CONSTANT_VS), vs);
> + blorp_emit(batch, GENX(3DSTATE_CONSTANT_VS), vs);
> #if GEN_GEN >= 7
> - blorp_emit(brw, GENX(3DSTATE_CONSTANT_HS), hs);
> - blorp_emit(brw, GENX(3DSTATE_CONSTANT_DS), DS);
> + blorp_emit(batch, GENX(3DSTATE_CONSTANT_HS), hs);
> + blorp_emit(batch, GENX(3DSTATE_CONSTANT_DS), DS);
> #endif
> - blorp_emit(brw, GENX(3DSTATE_CONSTANT_GS), gs);
> - blorp_emit(brw, GENX(3DSTATE_CONSTANT_PS), ps);
> -
> - if (brw->use_resource_streamer)
> - gen7_disable_hw_binding_tables(brw);
> + blorp_emit(batch, GENX(3DSTATE_CONSTANT_GS), gs);
> + blorp_emit(batch, GENX(3DSTATE_CONSTANT_PS), ps);
>
> if (params->wm_prog_data)
> - blorp_emit_surface_states(brw, params);
> + blorp_emit_surface_states(batch, params);
>
> if (params->src.addr.buffer)
> - blorp_emit_sampler_state(brw, params);
> + blorp_emit_sampler_state(batch, params);
>
> - blorp_emit_3dstate_multisample(brw, params->dst.surf.samples);
> + blorp_emit_3dstate_multisample(batch.blorp, batch.batch,
> + params->dst.surf.samples);
>
> - blorp_emit(brw, GENX(3DSTATE_SAMPLE_MASK), mask) {
> + blorp_emit(batch, GENX(3DSTATE_SAMPLE_MASK), mask) {
> mask.SampleMask = (1 << params->dst.surf.samples) - 1;
> }
>
> @@ -1213,35 +1224,33 @@ genX(blorp_exec)(struct brw_context *brw,
> *
> * We've already done one at the start of the BLORP operation.
> */
> - blorp_emit(brw, GENX(3DSTATE_VS), vs);
> + blorp_emit(batch, GENX(3DSTATE_VS), vs);
> #if GEN_GEN >= 7
> - blorp_emit(brw, GENX(3DSTATE_HS), hs);
> - blorp_emit(brw, GENX(3DSTATE_TE), te);
> - blorp_emit(brw, GENX(3DSTATE_DS), DS);
> - blorp_emit(brw, GENX(3DSTATE_STREAMOUT), so);
> + blorp_emit(batch, GENX(3DSTATE_HS), hs);
> + blorp_emit(batch, GENX(3DSTATE_TE), te);
> + blorp_emit(batch, GENX(3DSTATE_DS), DS);
> + blorp_emit(batch, GENX(3DSTATE_STREAMOUT), so);
> #endif
> - blorp_emit(brw, GENX(3DSTATE_GS), gs);
> + blorp_emit(batch, GENX(3DSTATE_GS), gs);
>
> - blorp_emit(brw, GENX(3DSTATE_CLIP), clip) {
> + blorp_emit(batch, GENX(3DSTATE_CLIP), clip) {
> clip.PerspectiveDivideDisable = true;
> }
>
> - blorp_emit_sf_config(brw, params);
> - blorp_emit_ps_config(brw, params);
> + blorp_emit_sf_config(batch, params);
> + blorp_emit_ps_config(batch, params);
>
> - blorp_emit_viewport_state(brw, params);
> + blorp_emit_viewport_state(batch, params);
>
> if (params->depth.addr.buffer) {
> - blorp_emit_depth_stencil_config(brw, params);
> + blorp_emit_depth_stencil_config(batch, params);
> } else {
> - brw_emit_depth_stall_flushes(brw);
> -
> - blorp_emit(brw, GENX(3DSTATE_DEPTH_BUFFER), db) {
> + blorp_emit(batch, GENX(3DSTATE_DEPTH_BUFFER), db) {
> db.SurfaceType = SURFTYPE_NULL;
> db.SurfaceFormat = D32_FLOAT;
> }
> - blorp_emit(brw, GENX(3DSTATE_HIER_DEPTH_BUFFER), hiz);
> - blorp_emit(brw, GENX(3DSTATE_STENCIL_BUFFER), sb);
> + blorp_emit(batch, GENX(3DSTATE_HIER_DEPTH_BUFFER), hiz);
> + blorp_emit(batch, GENX(3DSTATE_STENCIL_BUFFER), sb);
> }
>
> /* 3DSTATE_CLEAR_PARAMS
> @@ -1250,20 +1259,43 @@ genX(blorp_exec)(struct brw_context *brw,
> * [DevSNB] 3DSTATE_CLEAR_PARAMS packet must follow the DEPTH_BUFFER_STATE
> * packet when HiZ is enabled and the DEPTH_BUFFER_STATE changes.
> */
> - blorp_emit(brw, GENX(3DSTATE_CLEAR_PARAMS), clear) {
> + blorp_emit(batch, GENX(3DSTATE_CLEAR_PARAMS), clear) {
> clear.DepthClearValueValid = true;
> clear.DepthClearValue = params->depth.clear_color.u32[0];
> }
>
> - blorp_emit(brw, GENX(3DSTATE_DRAWING_RECTANGLE), rect) {
> + blorp_emit(batch, GENX(3DSTATE_DRAWING_RECTANGLE), rect) {
> rect.ClippedDrawingRectangleXMax = MAX2(params->x1, params->x0) - 1;
> rect.ClippedDrawingRectangleYMax = MAX2(params->y1, params->y0) - 1;
> }
>
> - blorp_emit(brw, GENX(3DPRIMITIVE), prim) {
> + blorp_emit(batch, GENX(3DPRIMITIVE), prim) {
> prim.VertexAccessType = SEQUENTIAL;
> prim.PrimitiveTopologyType = _3DPRIM_RECTLIST;
> prim.VertexCountPerInstance = 3;
> prim.InstanceCount = params->num_layers;
> }
> }
> +
> +void
> +genX(blorp_exec)(struct brw_context *brw,
> + const struct brw_blorp_params *params)
> +{
> +#if GEN_GEN == 6
> + /* Emit workaround flushes when we switch from drawing to blorping. */
> + brw_emit_post_sync_nonzero_flush(brw);
> +#endif
> +
> + brw_upload_state_base_address(brw);
> +
> +#if GEN_GEN >= 8
> + gen7_l3_state.emit(brw);
> +#endif
> +
> + if (brw->use_resource_streamer)
> + gen7_disable_hw_binding_tables(brw);
> +
> + brw_emit_depth_stall_flushes(brw);
> +
> + blorp_exec(&brw->blorp, brw, params);
> +}
> --
> 2.5.0.400.gff86faf
>
> _______________________________________________
> mesa-dev mailing list
> mesa-dev at lists.freedesktop.org
> https://lists.freedesktop.org/mailman/listinfo/mesa-dev
More information about the mesa-dev
mailing list