[Mesa-dev] [PATCH] nvc0: enable 32 textures on kepler+
Samuel Pitoiset
samuel.pitoiset at gmail.com
Tue May 24 08:05:48 UTC 2016
The idea sounds good to me, but this (1U << i) needs consistency in my
opinion. It's correct and avoid some compiler warnings (if the
corresponding flags are used) but we currently don't do that.
I would suggest to keep the (1 << i) for now, and maybe make a separate
patch which replaces 1 by 1U whenever it's possible. What do you think?
On 05/24/2016 06:23 AM, Ilia Mirkin wrote:
> For fermi, this likely will require use of linked tsc mode. However on
> bindless architectures, we can have as many as we want. As it stands,
> the AUX_TEX_INFO has 32 teture handles reserved.
>
> Signed-off-by: Ilia Mirkin <imirkin at alum.mit.edu>
> ---
> src/gallium/drivers/nouveau/nvc0/nvc0_context.h | 2 +-
> src/gallium/drivers/nouveau/nvc0/nvc0_screen.c | 4 ++--
> src/gallium/drivers/nouveau/nvc0/nvc0_tex.c | 12 ++++++------
> 3 files changed, 9 insertions(+), 9 deletions(-)
>
> diff --git a/src/gallium/drivers/nouveau/nvc0/nvc0_context.h b/src/gallium/drivers/nouveau/nvc0/nvc0_context.h
> index 436e912..5be78aa 100644
> --- a/src/gallium/drivers/nouveau/nvc0/nvc0_context.h
> +++ b/src/gallium/drivers/nouveau/nvc0/nvc0_context.h
> @@ -197,7 +197,7 @@ struct nvc0_context {
> uint32_t textures_coherent[6];
> struct nv50_tsc_entry *samplers[6][PIPE_MAX_SAMPLERS];
> unsigned num_samplers[6];
> - uint16_t samplers_dirty[6];
> + uint32_t samplers_dirty[6];
> bool seamless_cube_map;
>
> uint32_t tex_handles[6][PIPE_MAX_SAMPLERS]; /* for nve4 */
> diff --git a/src/gallium/drivers/nouveau/nvc0/nvc0_screen.c b/src/gallium/drivers/nouveau/nvc0/nvc0_screen.c
> index 7d692ea..4c47503 100644
> --- a/src/gallium/drivers/nouveau/nvc0/nvc0_screen.c
> +++ b/src/gallium/drivers/nouveau/nvc0/nvc0_screen.c
> @@ -369,9 +369,9 @@ nvc0_screen_get_shader_param(struct pipe_screen *pscreen, unsigned shader,
> case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
> return NVC0_MAX_BUFFERS;
> case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
> - return 16; /* would be 32 in linked (OpenGL-style) mode */
> + return (class_3d >= NVE4_3D_CLASS) ? 32 : 16;
> case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
> - return 16; /* XXX not sure if more are really safe */
> + return (class_3d >= NVE4_3D_CLASS) ? 32 : 16;
> case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
> return 32;
> case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
> diff --git a/src/gallium/drivers/nouveau/nvc0/nvc0_tex.c b/src/gallium/drivers/nouveau/nvc0/nvc0_tex.c
> index 2523c20..2c6f3eb 100644
> --- a/src/gallium/drivers/nouveau/nvc0/nvc0_tex.c
> +++ b/src/gallium/drivers/nouveau/nvc0/nvc0_tex.c
> @@ -446,7 +446,7 @@ nvc0_validate_tic(struct nvc0_context *nvc0, int s)
> for (i = 0; i < nvc0->num_textures[s]; ++i) {
> struct nv50_tic_entry *tic = nv50_tic_entry(nvc0->textures[s][i]);
> struct nv04_resource *res;
> - const bool dirty = !!(nvc0->textures_dirty[s] & (1 << i));
> + const bool dirty = !!(nvc0->textures_dirty[s] & (1U << i));
>
> if (!tic) {
> if (dirty)
> @@ -523,7 +523,7 @@ nve4_validate_tic(struct nvc0_context *nvc0, unsigned s)
> for (i = 0; i < nvc0->num_textures[s]; ++i) {
> struct nv50_tic_entry *tic = nv50_tic_entry(nvc0->textures[s][i]);
> struct nv04_resource *res;
> - const bool dirty = !!(nvc0->textures_dirty[s] & (1 << i));
> + const bool dirty = !!(nvc0->textures_dirty[s] & (1U << i));
>
> if (!tic) {
> nvc0->tex_handles[s][i] |= NVE4_TIC_ENTRY_INVALID;
> @@ -564,7 +564,7 @@ nve4_validate_tic(struct nvc0_context *nvc0, unsigned s)
> }
> for (; i < nvc0->state.num_textures[s]; ++i) {
> nvc0->tex_handles[s][i] |= NVE4_TIC_ENTRY_INVALID;
> - nvc0->textures_dirty[s] |= 1 << i;
> + nvc0->textures_dirty[s] |= 1U << i;
> }
>
> nvc0->state.num_textures[s] = nvc0->num_textures[s];
> @@ -593,7 +593,7 @@ void nvc0_validate_textures(struct nvc0_context *nvc0)
> bool
> nvc0_validate_tsc(struct nvc0_context *nvc0, int s)
> {
> - uint32_t commands[16];
> + uint32_t commands[32];
> struct nouveau_pushbuf *push = nvc0->base.pushbuf;
> unsigned i;
> unsigned n = 0;
> @@ -602,7 +602,7 @@ nvc0_validate_tsc(struct nvc0_context *nvc0, int s)
> for (i = 0; i < nvc0->num_samplers[s]; ++i) {
> struct nv50_tsc_entry *tsc = nv50_tsc_entry(nvc0->samplers[s][i]);
>
> - if (!(nvc0->samplers_dirty[s] & (1 << i)))
> + if (!(nvc0->samplers_dirty[s] & (1U << i)))
> continue;
> if (!tsc) {
> commands[n++] = (i << 4) | 0;
> @@ -676,7 +676,7 @@ nve4_validate_tsc(struct nvc0_context *nvc0, int s)
> }
> for (; i < nvc0->state.num_samplers[s]; ++i) {
> nvc0->tex_handles[s][i] |= NVE4_TSC_ENTRY_INVALID;
> - nvc0->samplers_dirty[s] |= 1 << i;
> + nvc0->samplers_dirty[s] |= 1U << i;
> }
>
> nvc0->state.num_samplers[s] = nvc0->num_samplers[s];
>
--
-Samuel
More information about the mesa-dev
mailing list