[Mesa-dev] [PATCH 4/9] i965/fs: Lower gl_VertexID and friends to inputs at the NIR level
Alejandro Piñeiro
apinheiro at igalia.com
Fri May 5 07:20:15 UTC 2017
Reviewed-by: Alejandro Piñeiro <apinheiro at igalia.com>
On 05/05/17 04:11, Jason Ekstrand wrote:
> NIR calls these system values but they come in from the VF unit as
> vertex data. It's terribly convenient to just be able to treat them as
> such in the back-end.
> ---
> src/intel/compiler/brw_fs.h | 1 -
> src/intel/compiler/brw_fs_nir.cpp | 30 +--------------
> src/intel/compiler/brw_fs_visitor.cpp | 38 ------------------
> src/intel/compiler/brw_nir.c | 72 ++++++++++++++++++++++++++++++++++-
> 4 files changed, 71 insertions(+), 70 deletions(-)
>
> diff --git a/src/intel/compiler/brw_fs.h b/src/intel/compiler/brw_fs.h
> index e230b5e..6c8c027 100644
> --- a/src/intel/compiler/brw_fs.h
> +++ b/src/intel/compiler/brw_fs.h
> @@ -175,7 +175,6 @@ public:
> fs_reg *emit_samplepos_setup();
> fs_reg *emit_sampleid_setup();
> fs_reg *emit_samplemaskin_setup();
> - fs_reg *emit_vs_system_value(int location);
> void emit_interpolation_setup_gen4();
> void emit_interpolation_setup_gen6();
> void compute_sample_position(fs_reg dst, fs_reg int_sample_pos);
> diff --git a/src/intel/compiler/brw_fs_nir.cpp b/src/intel/compiler/brw_fs_nir.cpp
> index 3ab41df..d4ce753 100644
> --- a/src/intel/compiler/brw_fs_nir.cpp
> +++ b/src/intel/compiler/brw_fs_nir.cpp
> @@ -89,39 +89,11 @@ emit_system_values_block(nir_block *block, fs_visitor *v)
> unreachable("should be lowered by lower_vertex_id().");
>
> case nir_intrinsic_load_vertex_id_zero_base:
> - assert(v->stage == MESA_SHADER_VERTEX);
> - reg = &v->nir_system_values[SYSTEM_VALUE_VERTEX_ID_ZERO_BASE];
> - if (reg->file == BAD_FILE)
> - *reg = *v->emit_vs_system_value(SYSTEM_VALUE_VERTEX_ID_ZERO_BASE);
> - break;
> -
> case nir_intrinsic_load_base_vertex:
> - assert(v->stage == MESA_SHADER_VERTEX);
> - reg = &v->nir_system_values[SYSTEM_VALUE_BASE_VERTEX];
> - if (reg->file == BAD_FILE)
> - *reg = *v->emit_vs_system_value(SYSTEM_VALUE_BASE_VERTEX);
> - break;
> -
> case nir_intrinsic_load_instance_id:
> - assert(v->stage == MESA_SHADER_VERTEX);
> - reg = &v->nir_system_values[SYSTEM_VALUE_INSTANCE_ID];
> - if (reg->file == BAD_FILE)
> - *reg = *v->emit_vs_system_value(SYSTEM_VALUE_INSTANCE_ID);
> - break;
> -
> case nir_intrinsic_load_base_instance:
> - assert(v->stage == MESA_SHADER_VERTEX);
> - reg = &v->nir_system_values[SYSTEM_VALUE_BASE_INSTANCE];
> - if (reg->file == BAD_FILE)
> - *reg = *v->emit_vs_system_value(SYSTEM_VALUE_BASE_INSTANCE);
> - break;
> -
> case nir_intrinsic_load_draw_id:
> - assert(v->stage == MESA_SHADER_VERTEX);
> - reg = &v->nir_system_values[SYSTEM_VALUE_DRAW_ID];
> - if (reg->file == BAD_FILE)
> - *reg = *v->emit_vs_system_value(SYSTEM_VALUE_DRAW_ID);
> - break;
> + unreachable("should be lowered by brw_nir_lower_vs_inputs().");
>
> case nir_intrinsic_load_invocation_id:
> if (v->stage == MESA_SHADER_TESS_CTRL)
> diff --git a/src/intel/compiler/brw_fs_visitor.cpp b/src/intel/compiler/brw_fs_visitor.cpp
> index 7904434..b6524d2 100644
> --- a/src/intel/compiler/brw_fs_visitor.cpp
> +++ b/src/intel/compiler/brw_fs_visitor.cpp
> @@ -32,44 +32,6 @@
>
> using namespace brw;
>
> -fs_reg *
> -fs_visitor::emit_vs_system_value(int location)
> -{
> - fs_reg *reg = new(this->mem_ctx)
> - fs_reg(ATTR, 4 * _mesa_bitcount_64(nir->info->inputs_read),
> - BRW_REGISTER_TYPE_D);
> -
> - switch (location) {
> - case SYSTEM_VALUE_BASE_VERTEX:
> - reg->offset = 0;
> - break;
> - case SYSTEM_VALUE_BASE_INSTANCE:
> - reg->offset = REG_SIZE;
> - break;
> - case SYSTEM_VALUE_VERTEX_ID:
> - unreachable("should have been lowered");
> - case SYSTEM_VALUE_VERTEX_ID_ZERO_BASE:
> - reg->offset = 2 * REG_SIZE;
> - break;
> - case SYSTEM_VALUE_INSTANCE_ID:
> - reg->offset = 3 * REG_SIZE;
> - break;
> - case SYSTEM_VALUE_DRAW_ID:
> - if (nir->info->system_values_read &
> - (BITFIELD64_BIT(SYSTEM_VALUE_BASE_VERTEX) |
> - BITFIELD64_BIT(SYSTEM_VALUE_BASE_INSTANCE) |
> - BITFIELD64_BIT(SYSTEM_VALUE_VERTEX_ID_ZERO_BASE) |
> - BITFIELD64_BIT(SYSTEM_VALUE_INSTANCE_ID)))
> - reg->nr += 4;
> - reg->offset = 0;
> - break;
> - default:
> - unreachable("not reached");
> - }
> -
> - return reg;
> -}
> -
> /* Sample from the MCS surface attached to this multisample texture. */
> fs_reg
> fs_visitor::emit_mcs_fetch(const fs_reg &coordinate, unsigned components,
> diff --git a/src/intel/compiler/brw_nir.c b/src/intel/compiler/brw_nir.c
> index 7248594..556782e 100644
> --- a/src/intel/compiler/brw_nir.c
> +++ b/src/intel/compiler/brw_nir.c
> @@ -259,18 +259,81 @@ brw_nir_lower_vs_inputs(nir_shader *nir,
> if (!is_scalar)
> return;
>
> + const bool has_svgs =
> + nir->info->system_values_read &
> + (BITFIELD64_BIT(SYSTEM_VALUE_BASE_VERTEX) |
> + BITFIELD64_BIT(SYSTEM_VALUE_BASE_INSTANCE) |
> + BITFIELD64_BIT(SYSTEM_VALUE_VERTEX_ID_ZERO_BASE) |
> + BITFIELD64_BIT(SYSTEM_VALUE_INSTANCE_ID));
> +
> + const unsigned num_inputs = _mesa_bitcount_64(nir->info->inputs_read);
> +
> nir_foreach_function(function, nir) {
> if (!function->impl)
> continue;
>
> + nir_builder b;
> + nir_builder_init(&b, function->impl);
> +
> nir_foreach_block(block, function->impl) {
> - nir_foreach_instr(instr, block) {
> + nir_foreach_instr_safe(instr, block) {
> if (instr->type != nir_instr_type_intrinsic)
> continue;
>
> nir_intrinsic_instr *intrin = nir_instr_as_intrinsic(instr);
>
> - if (intrin->intrinsic == nir_intrinsic_load_input) {
> + switch (intrin->intrinsic) {
> + case nir_intrinsic_load_base_vertex:
> + case nir_intrinsic_load_base_instance:
> + case nir_intrinsic_load_vertex_id_zero_base:
> + case nir_intrinsic_load_instance_id:
> + case nir_intrinsic_load_draw_id: {
> + b.cursor = nir_after_instr(&intrin->instr);
> +
> + /* gl_VertexID and friends are stored by the VF as the last
> + * vertex element. We convert them to load_input intrinsics at
> + * the right location.
> + */
> + nir_intrinsic_instr *load =
> + nir_intrinsic_instr_create(nir, nir_intrinsic_load_input);
> + load->src[0] = nir_src_for_ssa(nir_imm_int(&b, 0));
> +
> + nir_intrinsic_set_base(load, num_inputs);
> + switch (intrin->intrinsic) {
> + case nir_intrinsic_load_base_vertex:
> + nir_intrinsic_set_component(load, 0);
> + break;
> + case nir_intrinsic_load_base_instance:
> + nir_intrinsic_set_component(load, 1);
> + break;
> + case nir_intrinsic_load_vertex_id_zero_base:
> + nir_intrinsic_set_component(load, 2);
> + break;
> + case nir_intrinsic_load_instance_id:
> + nir_intrinsic_set_component(load, 3);
> + break;
> + case nir_intrinsic_load_draw_id:
> + /* gl_DrawID is stored right after gl_VertexID and friends
> + * if any of them exist.
> + */
> + nir_intrinsic_set_base(load, num_inputs + has_svgs);
> + nir_intrinsic_set_component(load, 0);
> + break;
> + default:
> + unreachable("Invalid SVGS intrinsic");
> + }
> +
> + load->num_components = 1;
> + nir_ssa_dest_init(&load->instr, &load->dest, 1, 32, NULL);
> + nir_builder_instr_insert(&b, &load->instr);
> +
> + nir_ssa_def_rewrite_uses(&intrin->dest.ssa,
> + nir_src_for_ssa(&load->dest.ssa));
> + nir_instr_remove(&intrin->instr);
> + break;
> + }
> +
> + case nir_intrinsic_load_input: {
> /* Attributes come in a contiguous block, ordered by their
> * gl_vert_attrib value. That means we can compute the slot
> * number for an attribute by masking out the enabled attributes
> @@ -280,6 +343,11 @@ brw_nir_lower_vs_inputs(nir_shader *nir,
> int slot = _mesa_bitcount_64(nir->info->inputs_read &
> BITFIELD64_MASK(attr));
> nir_intrinsic_set_base(intrin, slot);
> + break;
> + }
> +
> + default:
> + break; /* Nothing to do */
> }
> }
> }
More information about the mesa-dev
mailing list