[Mesa-dev] [PATCH 1/3] i965: Move SOL PSIZ hacks from draw time to link time.
Rafael Antognolli
rafael.antognolli at intel.com
Wed May 31 17:09:48 UTC 2017
This series is
Reviewed-by: Rafael Antognolli <rafael.antognolli at intel.com>
On Wed, May 31, 2017 at 01:17:45AM -0700, Kenneth Graunke wrote:
> We can just update the gl_transform_feedback_info fields at link time
> to make the VUE header fields have the right location and component.
> Then we don't need to handle them specially at draw time, which is
> expensive.
> ---
> src/intel/compiler/gen6_gs_visitor.cpp | 13 +---------
> src/mesa/drivers/dri/i965/brw_link.cpp | 36 +++++++++++++++++++++++++++
> src/mesa/drivers/dri/i965/genX_state_upload.c | 26 +++----------------
> 3 files changed, 41 insertions(+), 34 deletions(-)
>
> Here are a few cleanups to the SO_DECL handling I wrote a few months ago
> while reading through the state upload code. Really, we should move the
> SO_DECL_LIST processing to link-time...there's no current API state in
> there. Ideally we could just memcpy it all to the batch at draw time...
>
> diff --git a/src/intel/compiler/gen6_gs_visitor.cpp b/src/intel/compiler/gen6_gs_visitor.cpp
> index fe9f834f0ce..66c69fb058f 100644
> --- a/src/intel/compiler/gen6_gs_visitor.cpp
> +++ b/src/intel/compiler/gen6_gs_visitor.cpp
> @@ -687,18 +687,7 @@ gen6_gs_visitor::xfb_program(unsigned vertex, unsigned num_verts)
> emit(MOV(dst_reg(this->vertex_output_offset), brw_imm_d(offset)));
> memcpy(data.reladdr, &this->vertex_output_offset, sizeof(src_reg));
> data.type = output_reg[varying][0].type;
> -
> - /* PSIZ, LAYER and VIEWPORT are packed in different channels of the
> - * same slot, so make sure we write the appropriate channel
> - */
> - if (varying == VARYING_SLOT_PSIZ)
> - data.swizzle = BRW_SWIZZLE_WWWW;
> - else if (varying == VARYING_SLOT_LAYER)
> - data.swizzle = BRW_SWIZZLE_YYYY;
> - else if (varying == VARYING_SLOT_VIEWPORT)
> - data.swizzle = BRW_SWIZZLE_ZZZZ;
> - else
> - data.swizzle = gs_prog_data->transform_feedback_swizzles[binding];
> + data.swizzle = gs_prog_data->transform_feedback_swizzles[binding];
>
> /* Write data */
> inst = emit(GS_OPCODE_SVB_WRITE, mrf_reg, data, sol_temp);
> diff --git a/src/mesa/drivers/dri/i965/brw_link.cpp b/src/mesa/drivers/dri/i965/brw_link.cpp
> index 57aaf6b9dc0..e9158c596c5 100644
> --- a/src/mesa/drivers/dri/i965/brw_link.cpp
> +++ b/src/mesa/drivers/dri/i965/brw_link.cpp
> @@ -28,6 +28,7 @@
> #include "compiler/glsl/ir_optimization.h"
> #include "compiler/glsl/program.h"
> #include "program/program.h"
> +#include "main/mtypes.h"
> #include "main/shaderapi.h"
> #include "main/shaderobj.h"
> #include "main/uniforms.h"
> @@ -176,6 +177,39 @@ unify_interfaces(struct shader_info **infos)
> }
> }
>
> +static void
> +update_xfb_info(struct gl_transform_feedback_info *xfb_info)
> +{
> + if (!xfb_info)
> + return;
> +
> + for (unsigned i = 0; i < xfb_info->NumOutputs; i++) {
> + struct gl_transform_feedback_output *output = &xfb_info->Outputs[i];
> +
> + /* The VUE header contains three scalar fields packed together:
> + * - gl_PointSize is stored in VARYING_SLOT_PSIZ.w
> + * - gl_Layer is stored in VARYING_SLOT_PSIZ.y
> + * - gl_ViewportIndex is stored in VARYING_SLOT_PSIZ.z
> + */
> + switch (output->OutputRegister) {
> + case VARYING_SLOT_LAYER:
> + assert(output->NumComponents == 1);
> + output->OutputRegister = VARYING_SLOT_PSIZ;
> + output->ComponentOffset = 1;
> + break;
> + case VARYING_SLOT_VIEWPORT:
> + assert(output->NumComponents == 1);
> + output->OutputRegister = VARYING_SLOT_PSIZ;
> + output->ComponentOffset = 2;
> + break;
> + case VARYING_SLOT_PSIZ:
> + assert(output->NumComponents == 1);
> + output->ComponentOffset = 3;
> + break;
> + }
> + }
> +}
> +
> extern "C" GLboolean
> brw_link_shader(struct gl_context *ctx, struct gl_shader_program *shProg)
> {
> @@ -199,6 +233,8 @@ brw_link_shader(struct gl_context *ctx, struct gl_shader_program *shProg)
> prog->ShadowSamplers = shader->shadow_samplers;
> _mesa_update_shader_textures_used(shProg, prog);
>
> + update_xfb_info(prog->sh.LinkedTransformFeedback);
> +
> bool debug_enabled =
> (INTEL_DEBUG & intel_debug_flag_for_shader_stage(shader->Stage));
>
> diff --git a/src/mesa/drivers/dri/i965/genX_state_upload.c b/src/mesa/drivers/dri/i965/genX_state_upload.c
> index 76d2ea887b1..a2ed2e72710 100644
> --- a/src/mesa/drivers/dri/i965/genX_state_upload.c
> +++ b/src/mesa/drivers/dri/i965/genX_state_upload.c
> @@ -3087,32 +3087,14 @@ genX(upload_3dstate_so_decl_list)(struct brw_context *brw,
> unsigned decl_buffer_slot = buffer;
> assert(stream_id < MAX_VERTEX_STREAMS);
>
> - /* gl_PointSize is stored in VARYING_SLOT_PSIZ.w
> - * gl_Layer is stored in VARYING_SLOT_PSIZ.y
> - * gl_ViewportIndex is stored in VARYING_SLOT_PSIZ.z
> - */
> - if (varying == VARYING_SLOT_PSIZ) {
> - assert(components == 1);
> - component_mask <<= 3;
> - } else if (varying == VARYING_SLOT_LAYER) {
> - assert(components == 1);
> - component_mask <<= 1;
> - } else if (varying == VARYING_SLOT_VIEWPORT) {
> - assert(components == 1);
> - component_mask <<= 2;
> - } else {
> - component_mask <<= linked_xfb_info->Outputs[i].ComponentOffset;
> - }
> + component_mask <<= linked_xfb_info->Outputs[i].ComponentOffset;
>
> buffer_mask[stream_id] |= 1 << buffer;
>
> + assert(vue_map->varying_to_slot[varying] >= 0);
> +
> decl.OutputBufferSlot = decl_buffer_slot;
> - if (varying == VARYING_SLOT_LAYER || varying == VARYING_SLOT_VIEWPORT) {
> - decl.RegisterIndex = vue_map->varying_to_slot[VARYING_SLOT_PSIZ];
> - } else {
> - assert(vue_map->varying_to_slot[varying] >= 0);
> - decl.RegisterIndex = vue_map->varying_to_slot[varying];
> - }
> + decl.RegisterIndex = vue_map->varying_to_slot[varying];
> decl.ComponentMask = component_mask;
>
> /* Mesa doesn't store entries for gl_SkipComponents in the Outputs[]
> --
> 2.13.0
>
> _______________________________________________
> mesa-dev mailing list
> mesa-dev at lists.freedesktop.org
> https://lists.freedesktop.org/mailman/listinfo/mesa-dev
More information about the mesa-dev
mailing list