[Mesa-dev] [PATCH 1/2] i965/clip: Add support for gl_ClipVertex

Chris Forbes chrisf at ijw.co.nz
Sun Jun 9 15:00:41 PDT 2013


I started out with predicated moves, but since this is about to go
away again anyway when I do ClipDistance support, I went with the
clearer option. No real perf impact.

-- Chris

On Thu, Jun 6, 2013 at 6:05 PM, Kenneth Graunke <kenneth at whitecape.org> wrote:
> On 06/05/2013 03:50 PM, Chris Forbes wrote:
>>
>> When clipping against a user clip plane, and gl_ClipVertex is provided
>> in the vertex, use it instead of hpos.
>>
>> Signed-off-by: Chris Forbes <chrisf at ijw.co.nz>
>> ---
>>   src/mesa/drivers/dri/i965/brw_clip.h     |  1 +
>>   src/mesa/drivers/dri/i965/brw_clip_tri.c | 44
>> +++++++++++++++++++++++++++++---
>>   2 files changed, 41 insertions(+), 4 deletions(-)
>>
>> diff --git a/src/mesa/drivers/dri/i965/brw_clip.h
>> b/src/mesa/drivers/dri/i965/brw_clip.h
>> index c6581ad..a0d5d93 100644
>> --- a/src/mesa/drivers/dri/i965/brw_clip.h
>> +++ b/src/mesa/drivers/dri/i965/brw_clip.h
>> @@ -100,6 +100,7 @@ struct brw_clip_compile {
>>         struct brw_reg plane_equation;
>>
>>         struct brw_reg ff_sync;
>> +      struct brw_reg vertex_src_mask;
>>      } reg;
>>
>>      /* Number of registers storing VUE data */
>> diff --git a/src/mesa/drivers/dri/i965/brw_clip_tri.c
>> b/src/mesa/drivers/dri/i965/brw_clip_tri.c
>> index 05959f6..5491ca8 100644
>> --- a/src/mesa/drivers/dri/i965/brw_clip_tri.c
>> +++ b/src/mesa/drivers/dri/i965/brw_clip_tri.c
>> @@ -119,6 +119,9 @@ void brw_clip_tri_alloc_regs( struct brw_clip_compile
>> *c,
>>         i++;
>>      }
>>
>> +   c->reg.vertex_src_mask = retype(brw_vec1_grf(i, 0),
>> BRW_REGISTER_TYPE_UD);
>> +   i++;
>> +
>>      if (intel->needs_ff_sync) {
>>         c->reg.ff_sync = retype(brw_vec1_grf(i, 0), BRW_REGISTER_TYPE_UD);
>>         i++;
>> @@ -219,6 +222,31 @@ void brw_clip_tri_flat_shade( struct brw_clip_compile
>> *c )
>>   }
>>
>>
>> +static inline void
>> +load_vertex_pos(struct brw_clip_compile *c, struct brw_indirect vtx,
>> +                struct brw_reg dst,
>> +                GLuint hpos_offset, GLuint clip_offset)
>> +{
>> +   struct brw_compile *p = &c->func;
>> +
>> +   /*
>> +    * Roughly:
>> +    * dst = (vertex_src_mask & 1) ? src.clipvertex : src.hpos;
>> +    */
>> +
>> +   brw_set_conditionalmod(p, BRW_CONDITIONAL_NZ);
>> +   brw_AND(p, vec1(brw_null_reg()), c->reg.vertex_src_mask,
>> brw_imm_ud(1));
>> +   brw_IF(p, BRW_EXECUTE_1);
>> +   {
>> +      brw_MOV(p, dst, deref_4f(vtx, clip_offset));
>> +   }
>> +   brw_ELSE(p);
>> +   {
>> +      brw_MOV(p, dst, deref_4f(vtx, hpos_offset));
>> +   }
>> +   brw_ENDIF(p);
>
>
> I wonder, is it possible to use SEL here?  Or failing that, predicated
> moves?  If not, no worries...the rest of the code is pretty well littered
> with IFs already.
>
> I second Paul's request for additional comments.  Other than that, this
> looks like a nice fix!  Somehow I imagined it would be harder.
>
> Both patches are:
> Reviewed-by: Kenneth Graunke <kenneth at whitecape.org>
>
> Thanks for doing this, Chris!
>
>
>> +}
>> +
>>
>>   /* Use mesa's clipping algorithms, translated to GEN4 assembly.
>>    */
>> @@ -233,13 +261,17 @@ void brw_clip_tri( struct brw_clip_compile *c )
>>      struct brw_indirect outlist_ptr = brw_indirect(5, 0);
>>      struct brw_indirect freelist_ptr = brw_indirect(6, 0);
>>      GLuint hpos_offset = brw_varying_to_offset(&c->vue_map,
>> VARYING_SLOT_POS);
>> -
>> +   GLuint clipvert_offset = brw_clip_have_varying(c,
>> VARYING_SLOT_CLIP_VERTEX)
>> +      ? brw_varying_to_offset(&c->vue_map, VARYING_SLOT_CLIP_VERTEX)
>> +      : hpos_offset;
>> +
>>      brw_MOV(p, get_addr_reg(vtxPrev),     brw_address(c->reg.vertex[2])
>> );
>>      brw_MOV(p, get_addr_reg(plane_ptr),   brw_clip_plane0_address(c));
>>      brw_MOV(p, get_addr_reg(inlist_ptr),  brw_address(c->reg.inlist));
>>      brw_MOV(p, get_addr_reg(outlist_ptr), brw_address(c->reg.outlist));
>>
>>      brw_MOV(p, get_addr_reg(freelist_ptr), brw_address(c->reg.vertex[3])
>> );
>> +   brw_MOV(p, c->reg.vertex_src_mask, brw_imm_ud(0xfc0));
>>
>>      brw_DO(p, BRW_EXECUTE_1);
>>      {
>> @@ -269,15 +301,17 @@ void brw_clip_tri( struct brw_clip_compile *c )
>>              */
>>             brw_MOV(p, get_addr_reg(vtx), deref_1uw(inlist_ptr, 0));
>>
>> +            load_vertex_pos(c, vtxPrev, vec4(c->reg.dpPrev), hpos_offset,
>> clipvert_offset);
>>             /* IS_NEGATIVE(prev) */
>>             brw_set_conditionalmod(p, BRW_CONDITIONAL_L);
>> -           brw_DP4(p, vec4(c->reg.dpPrev), deref_4f(vtxPrev,
>> hpos_offset), c->reg.plane_equation);
>> +           brw_DP4(p, vec4(c->reg.dpPrev), vec4(c->reg.dpPrev),
>> c->reg.plane_equation);
>>             brw_IF(p, BRW_EXECUTE_1);
>>             {
>> +               load_vertex_pos(c, vtx, vec4(c->reg.dp), hpos_offset,
>> clipvert_offset);
>>                /* IS_POSITIVE(next)
>>                 */
>>                brw_set_conditionalmod(p, BRW_CONDITIONAL_GE);
>> -              brw_DP4(p, vec4(c->reg.dp), deref_4f(vtx, hpos_offset),
>> c->reg.plane_equation);
>> +              brw_DP4(p, vec4(c->reg.dp), vec4(c->reg.dp),
>> c->reg.plane_equation);
>>                brw_IF(p, BRW_EXECUTE_1);
>>                {
>>
>> @@ -316,10 +350,11 @@ void brw_clip_tri( struct brw_clip_compile *c )
>>                brw_ADD(p, get_addr_reg(outlist_ptr),
>> get_addr_reg(outlist_ptr), brw_imm_uw(sizeof(short)));
>>                brw_ADD(p, c->reg.nr_verts, c->reg.nr_verts,
>> brw_imm_ud(1));
>>
>> +               load_vertex_pos(c, vtx, vec4(c->reg.dp), hpos_offset,
>> clipvert_offset);
>>                /* IS_NEGATIVE(next)
>>                 */
>>                brw_set_conditionalmod(p, BRW_CONDITIONAL_L);
>> -              brw_DP4(p, vec4(c->reg.dp), deref_4f(vtx, hpos_offset),
>> c->reg.plane_equation);
>> +              brw_DP4(p, vec4(c->reg.dp), vec4(c->reg.dp),
>> c->reg.plane_equation);
>>                brw_IF(p, BRW_EXECUTE_1);
>>                {
>>                   /* Going out of bounds.  Avoid division by zero as we
>> @@ -392,6 +427,7 @@ void brw_clip_tri( struct brw_clip_compile *c )
>>          */
>>         brw_set_conditionalmod(p, BRW_CONDITIONAL_NZ);
>>         brw_SHR(p, c->reg.planemask, c->reg.planemask, brw_imm_ud(1));
>> +      brw_SHR(p, c->reg.vertex_src_mask, c->reg.vertex_src_mask,
>> brw_imm_ud(1));
>>      }
>>      brw_WHILE(p);
>>   }
>>
>


More information about the mesa-dev mailing list