[Mesa-dev] [PATCH v5 40/70] nir: Implement __intrinsic_load_ssbo
Samuel Iglesias Gonsálvez
siglesias at igalia.com
Mon Sep 21 02:03:41 PDT 2015
On 19/09/15 00:30, Kristian Høgsberg wrote:
> On Thu, Sep 10, 2015 at 03:35:56PM +0200, Iago Toral Quiroga wrote:
>> v2:
>> - Fix ssbo loads with boolean variables.
>>
>> Reviewed-by: Connor Abbott <connor.w.abbott at intel.com>
>> ---
>> src/glsl/nir/glsl_to_nir.cpp | 80 ++++++++++++++++++++++++++++++++-
>> src/glsl/nir/nir_intrinsics.h | 2 +-
>> src/glsl/nir/nir_lower_phis_to_scalar.c | 2 +
>> 3 files changed, 81 insertions(+), 3 deletions(-)
>>
>> diff --git a/src/glsl/nir/glsl_to_nir.cpp b/src/glsl/nir/glsl_to_nir.cpp
>> index 6f1e20a..cb7b196 100644
>> --- a/src/glsl/nir/glsl_to_nir.cpp
>> +++ b/src/glsl/nir/glsl_to_nir.cpp
>> @@ -646,11 +646,14 @@ nir_visitor::visit(ir_call *ir)
>> op = nir_intrinsic_image_size;
>> } else if (strcmp(ir->callee_name(), "__intrinsic_store_ssbo") == 0) {
>> op = nir_intrinsic_store_ssbo;
>> + } else if (strcmp(ir->callee_name(), "__intrinsic_load_ssbo") == 0) {
>> + op = nir_intrinsic_load_ssbo;
>> } else {
>> unreachable("not reached");
>> }
>>
>> nir_intrinsic_instr *instr = nir_intrinsic_instr_create(shader, op);
>> + nir_alu_instr *load_ssbo_compare;
>>
>> switch (op) {
>> case nir_intrinsic_atomic_counter_read_var:
>> @@ -776,11 +779,75 @@ nir_visitor::visit(ir_call *ir)
>> instr->src[1] = evaluate_rvalue(block);
>> break;
>> }
>> + case nir_intrinsic_load_ssbo: {
>> + exec_node *param = ir->actual_parameters.get_head();
>> + ir_rvalue *block = ((ir_instruction *)param)->as_rvalue();
>> +
>> + param = param->get_next();
>> + ir_rvalue *offset = ((ir_instruction *)param)->as_rvalue();
>> +
>> + /* Check if we need the indirect version */
>> + ir_constant *const_offset = offset->as_constant();
>> + if (!const_offset) {
>> + op = nir_intrinsic_load_ssbo_indirect;
>> + ralloc_free(instr);
>> + instr = nir_intrinsic_instr_create(shader, op);
>> + instr->src[1] = evaluate_rvalue(offset);
>> + instr->const_index[0] = 0;
>> + } else {
>> + instr->const_index[0] = const_offset->value.u[0];
>> + }
>> +
>> + instr->src[0] = evaluate_rvalue(block);
>> +
>> + const glsl_type *type = ir->return_deref->var->type;
>> + instr->num_components = type->vector_elements;
>> +
>> + /* Setup destination register */
>> + nir_ssa_dest_init(&instr->instr, &instr->dest,
>> + type->vector_elements, NULL);
>> +
>> + /* Insert the created nir instruction now since in the case of boolean
>> + * result we will need to emit another instruction after it
>> + */
>> + nir_instr_insert_after_cf_list(this->cf_node_list, &instr->instr);
>
> I'd prefer moving this insert into the GLSL_TYPE_BOOL condition below...
>
>> + /*
>> + * In SSBO/UBO's, a true boolean value is any non-zero value, but we
>> + * consider a true boolean to be ~0. Fix this up with a != 0
>> + * comparison.
>> + */
>> + if (type->base_type == GLSL_TYPE_BOOL) {
>
> ... that is, here...
>
>> + nir_load_const_instr *const_zero =
>> + nir_load_const_instr_create(shader, 1);
>> + const_zero->value.u[0] = 0;
>> + nir_instr_insert_after_cf_list(this->cf_node_list,
>> + &const_zero->instr);
>> +
>> + load_ssbo_compare = nir_alu_instr_create(shader, nir_op_ine);
>
> and then, insteed of introducing and using 'load_ssbo_compare' here,
> re-use 'instr' for the compare instruction...
>
I see why you suggest these changes but I don't like them:
instr is a pointer to nir_instrinsic_instr, while the compare
instruction is a nir_alu_instr*, so although we are lucky because some
fields are at the same offsets for both struct base addresses(*), this
could change in the future.
Even if I introduce load_ssbo_compare and, after setting it up, assign
'instr' with load_ssbo_compare pointer value to save some changes done
later, this would work now but it is not guaranteed to work in the future.
Sam
(*) For example:
load_ssbo_compare->dest.dest.ssa and instr->dest.ssa
>> + load_ssbo_compare->src[0].src.is_ssa = true;
>> + load_ssbo_compare->src[0].src.ssa = &instr->dest.ssa;
>> + load_ssbo_compare->src[1].src.is_ssa = true;
>> + load_ssbo_compare->src[1].src.ssa = &const_zero->def;
>> + for (unsigned i = 0; i < type->vector_elements; i++)
>> + load_ssbo_compare->src[1].swizzle[i] = 0;
>> + nir_ssa_dest_init(&load_ssbo_compare->instr,
>> + &load_ssbo_compare->dest.dest,
>> + type->vector_elements, NULL);
>> + load_ssbo_compare->dest.write_mask = (1 << type->vector_elements) - 1;
>> + nir_instr_insert_after_cf_list(this->cf_node_list,
>> + &load_ssbo_compare->instr);
>> + }
>> +
>> + break;
>> + }
>> default:
>> unreachable("not reached");
>> }
>>
>> - nir_instr_insert_after_cf_list(this->cf_node_list, &instr->instr);
>> + /* nir_intrinsic_load_ssbo{_indirect} were already emitted */
>> + if (op != nir_intrinsic_load_ssbo && op != nir_intrinsic_load_ssbo_indirect)
>> + nir_instr_insert_after_cf_list(this->cf_node_list, &instr->instr);
>>
>
> That way we don't need anything special here for ssbo_load...
>
>> if (ir->return_deref) {
>> nir_intrinsic_instr *store_instr =
>> @@ -789,7 +856,16 @@ nir_visitor::visit(ir_call *ir)
>>
>> store_instr->variables[0] =
>> evaluate_deref(&store_instr->instr, ir->return_deref);
>> - store_instr->src[0] = nir_src_for_ssa(&instr->dest.ssa);
>> +
>> + /* If nir_intrinsic_load_ssbo{_indirect} is loading a boolean variable,
>> + * the value is on load_ssbo_compare's dest. Use it instead.
>> + */
>> + if ((op == nir_intrinsic_load_ssbo || op == nir_intrinsic_load_ssbo_indirect) &&
>> + ir->return_deref->var->type->base_type == GLSL_TYPE_BOOL) {
>> + store_instr->src[0] = nir_src_for_ssa(&load_ssbo_compare->dest.dest.ssa);
>> + } else {
>> + store_instr->src[0] = nir_src_for_ssa(&instr->dest.ssa);
>> + }
>
> nor here.
>
>> nir_instr_insert_after_cf_list(this->cf_node_list,
>> &store_instr->instr);
>> diff --git a/src/glsl/nir/nir_intrinsics.h b/src/glsl/nir/nir_intrinsics.h
>> index 38f22c1..53066c6 100644
>> --- a/src/glsl/nir/nir_intrinsics.h
>> +++ b/src/glsl/nir/nir_intrinsics.h
>> @@ -174,7 +174,7 @@ SYSTEM_VALUE(invocation_id, 1)
>> LOAD(uniform, 0, 2, NIR_INTRINSIC_CAN_ELIMINATE | NIR_INTRINSIC_CAN_REORDER)
>> LOAD(ubo, 1, 1, NIR_INTRINSIC_CAN_ELIMINATE | NIR_INTRINSIC_CAN_REORDER)
>> LOAD(input, 0, 1, NIR_INTRINSIC_CAN_ELIMINATE | NIR_INTRINSIC_CAN_REORDER)
>> -/* LOAD(ssbo, 1, 0) */
>> +LOAD(ssbo, 1, 1, NIR_INTRINSIC_CAN_ELIMINATE)
>>
>> /*
>> * Stores work the same way as loads, except now the first register input is
>> diff --git a/src/glsl/nir/nir_lower_phis_to_scalar.c b/src/glsl/nir/nir_lower_phis_to_scalar.c
>> index 739170d..bdb7e6a 100644
>> --- a/src/glsl/nir/nir_lower_phis_to_scalar.c
>> +++ b/src/glsl/nir/nir_lower_phis_to_scalar.c
>> @@ -94,6 +94,8 @@ is_phi_src_scalarizable(nir_phi_src *src,
>> case nir_intrinsic_load_uniform_indirect:
>> case nir_intrinsic_load_ubo:
>> case nir_intrinsic_load_ubo_indirect:
>> + case nir_intrinsic_load_ssbo:
>> + case nir_intrinsic_load_ssbo_indirect:
>> case nir_intrinsic_load_input:
>> case nir_intrinsic_load_input_indirect:
>> return true;
>> --
>> 1.9.1
>>
>
More information about the mesa-dev
mailing list