[Mesa-dev] [PATCH v3 08/44] i965: Implement programming of the L3 configuration.
Samuel Iglesias Gonsálvez
siglesias at igalia.com
Tue Dec 1 05:21:12 PST 2015
Reviewed-by: Samuel Iglesias Gonsálvez <siglesias at igalia.com>
On 01/12/15 09:19, Jordan Justen wrote:
> From: Francisco Jerez <currojerez at riseup.net>
>
> ---
> src/mesa/drivers/dri/i965/gen7_l3_state.c | 95 +++++++++++++++++++++++++++++++
> 1 file changed, 95 insertions(+)
>
> diff --git a/src/mesa/drivers/dri/i965/gen7_l3_state.c b/src/mesa/drivers/dri/i965/gen7_l3_state.c
> index 8765b11..108f3a8 100644
> --- a/src/mesa/drivers/dri/i965/gen7_l3_state.c
> +++ b/src/mesa/drivers/dri/i965/gen7_l3_state.c
> @@ -161,3 +161,98 @@ get_l3_way_size(const struct brw_device_info *devinfo)
> else
> return 8 * devinfo->num_slices;
> }
> +
> +/**
> + * Program the hardware to use the specified L3 configuration.
> + */
> +static void
> +setup_l3_config(struct brw_context *brw, const struct brw_l3_config *cfg)
> +{
> + const bool has_dc = cfg->n[L3P_DC] || cfg->n[L3P_ALL];
> + const bool has_is = cfg->n[L3P_IS] || cfg->n[L3P_RO] || cfg->n[L3P_ALL];
> + const bool has_c = cfg->n[L3P_C] || cfg->n[L3P_RO] || cfg->n[L3P_ALL];
> + const bool has_t = cfg->n[L3P_T] || cfg->n[L3P_RO] || cfg->n[L3P_ALL];
> + const bool has_slm = cfg->n[L3P_SLM];
> +
> + /* According to the hardware docs, the L3 partitioning can only be changed
> + * while the pipeline is completely drained and the caches are flushed,
> + * what involves a first PIPE_CONTROL flush which stalls the pipeline and
> + * initiates invalidation of the relevant caches...
> + */
> + brw_emit_pipe_control_flush(brw,
> + PIPE_CONTROL_TEXTURE_CACHE_INVALIDATE |
> + PIPE_CONTROL_CONST_CACHE_INVALIDATE |
> + PIPE_CONTROL_INSTRUCTION_INVALIDATE |
> + PIPE_CONTROL_DATA_CACHE_INVALIDATE |
> + PIPE_CONTROL_NO_WRITE |
> + PIPE_CONTROL_CS_STALL);
> +
> + /* ...followed by a second stalling flush which guarantees that
> + * invalidation is complete when the L3 configuration registers are
> + * modified.
> + */
> + brw_emit_pipe_control_flush(brw,
> + PIPE_CONTROL_DATA_CACHE_INVALIDATE |
> + PIPE_CONTROL_NO_WRITE |
> + PIPE_CONTROL_CS_STALL);
> +
> + if (brw->gen >= 8) {
> + assert(!cfg->n[L3P_IS] && !cfg->n[L3P_C] && !cfg->n[L3P_T]);
> +
> + BEGIN_BATCH(3);
> + OUT_BATCH(MI_LOAD_REGISTER_IMM | (3 - 2));
> +
> + /* Set up the L3 partitioning. */
> + OUT_BATCH(GEN8_L3CNTLREG);
> + OUT_BATCH((has_slm ? GEN8_L3CNTLREG_SLM_ENABLE : 0) |
> + SET_FIELD(cfg->n[L3P_URB], GEN8_L3CNTLREG_URB_ALLOC) |
> + SET_FIELD(cfg->n[L3P_RO], GEN8_L3CNTLREG_RO_ALLOC) |
> + SET_FIELD(cfg->n[L3P_DC], GEN8_L3CNTLREG_DC_ALLOC) |
> + SET_FIELD(cfg->n[L3P_ALL], GEN8_L3CNTLREG_ALL_ALLOC));
> +
> + ADVANCE_BATCH();
> +
> + } else {
> + assert(!cfg->n[L3P_ALL]);
> +
> + /* When enabled SLM only uses a portion of the L3 on half of the banks,
> + * the matching space on the remaining banks has to be allocated to a
> + * client (URB for all validated configurations) set to the
> + * lower-bandwidth 2-bank address hashing mode.
> + */
> + const bool urb_low_bw = has_slm && !brw->is_baytrail;
> + assert(!urb_low_bw || cfg->n[L3P_URB] == cfg->n[L3P_SLM]);
> +
> + /* Minimum number of ways that can be allocated to the URB. */
> + const unsigned n0_urb = (brw->is_baytrail ? 32 : 0);
> + assert(cfg->n[L3P_URB] >= n0_urb);
> +
> + BEGIN_BATCH(7);
> + OUT_BATCH(MI_LOAD_REGISTER_IMM | (7 - 2));
> +
> + /* Demote any clients with no ways assigned to LLC. */
> + OUT_BATCH(GEN7_L3SQCREG1);
> + OUT_BATCH((brw->is_haswell ? HSW_L3SQCREG1_SQGHPCI_DEFAULT :
> + brw->is_baytrail ? VLV_L3SQCREG1_SQGHPCI_DEFAULT :
> + IVB_L3SQCREG1_SQGHPCI_DEFAULT) |
> + (has_dc ? 0 : GEN7_L3SQCREG1_CONV_DC_UC) |
> + (has_is ? 0 : GEN7_L3SQCREG1_CONV_IS_UC) |
> + (has_c ? 0 : GEN7_L3SQCREG1_CONV_C_UC) |
> + (has_t ? 0 : GEN7_L3SQCREG1_CONV_T_UC));
> +
> + /* Set up the L3 partitioning. */
> + OUT_BATCH(GEN7_L3CNTLREG2);
> + OUT_BATCH((has_slm ? GEN7_L3CNTLREG2_SLM_ENABLE : 0) |
> + SET_FIELD(cfg->n[L3P_URB] - n0_urb, GEN7_L3CNTLREG2_URB_ALLOC) |
> + (urb_low_bw ? GEN7_L3CNTLREG2_URB_LOW_BW : 0) |
> + SET_FIELD(cfg->n[L3P_ALL], GEN7_L3CNTLREG2_ALL_ALLOC) |
> + SET_FIELD(cfg->n[L3P_RO], GEN7_L3CNTLREG2_RO_ALLOC) |
> + SET_FIELD(cfg->n[L3P_DC], GEN7_L3CNTLREG2_DC_ALLOC));
> + OUT_BATCH(GEN7_L3CNTLREG3);
> + OUT_BATCH(SET_FIELD(cfg->n[L3P_IS], GEN7_L3CNTLREG3_IS_ALLOC) |
> + SET_FIELD(cfg->n[L3P_C], GEN7_L3CNTLREG3_C_ALLOC) |
> + SET_FIELD(cfg->n[L3P_T], GEN7_L3CNTLREG3_T_ALLOC));
> +
> + ADVANCE_BATCH();
> + }
> +}
>
More information about the mesa-dev
mailing list