[PATCH] drm/radeon: allow CMASK and FMASK in the CS checker on r600-r700

Marek Olšák maraeo at gmail.com
Sun Aug 19 14:51:59 PDT 2012


Please can someone tell me if this patch will end up in kernel 3.6 or 3.7.

If it is merged in Linus's tree in the coming days, I'll try to
complete R600-R700 MSAA support (and therefore GL3.0) for Mesa 9.0.

Marek

On Sun, Aug 19, 2012 at 2:22 AM, Marek Olšák <maraeo at gmail.com> wrote:
> MSAA is impossible without them.
>
> Signed-off-by: Marek Olšák <maraeo at gmail.com>
> ---
>  drivers/gpu/drm/radeon/r600_cs.c     |   94 +++++++++++++++++++++++++++++-----
>  drivers/gpu/drm/radeon/r600d.h       |   17 ++++++
>  drivers/gpu/drm/radeon/radeon_drv.c  |    3 +-
>  drivers/gpu/drm/radeon/reg_srcs/r600 |    8 ---
>  4 files changed, 101 insertions(+), 21 deletions(-)
>
> diff --git a/drivers/gpu/drm/radeon/r600_cs.c b/drivers/gpu/drm/radeon/r600_cs.c
> index 3dab49c..1bec5b8 100644
> --- a/drivers/gpu/drm/radeon/r600_cs.c
> +++ b/drivers/gpu/drm/radeon/r600_cs.c
> @@ -47,13 +47,17 @@ struct r600_cs_track {
>         u32                     npipes;
>         /* value we track */
>         u32                     sq_config;
> +       u32                     log_nsamples;
>         u32                     nsamples;
>         u32                     cb_color_base_last[8];
>         struct radeon_bo        *cb_color_bo[8];
>         u64                     cb_color_bo_mc[8];
> -       u32                     cb_color_bo_offset[8];
> -       struct radeon_bo        *cb_color_frag_bo[8]; /* unused */
> -       struct radeon_bo        *cb_color_tile_bo[8]; /* unused */
> +       u64                     cb_color_bo_offset[8];
> +       struct radeon_bo        *cb_color_frag_bo[8];
> +       u64                     cb_color_frag_offset[8];
> +       struct radeon_bo        *cb_color_tile_bo[8];
> +       u64                     cb_color_tile_offset[8];
> +       u32                     cb_color_mask[8];
>         u32                     cb_color_info[8];
>         u32                     cb_color_view[8];
>         u32                     cb_color_size_idx[8]; /* unused */
> @@ -349,10 +353,6 @@ static int r600_cs_track_validate_cb(struct radeon_cs_parser *p, int i)
>         unsigned array_mode;
>         u32 format;
>
> -       if (G_0280A0_TILE_MODE(track->cb_color_info[i])) {
> -               dev_warn(p->dev, "FMASK or CMASK buffer are not supported by this kernel\n");
> -               return -EINVAL;
> -       }
>         size = radeon_bo_size(track->cb_color_bo[i]) - track->cb_color_bo_offset[i];
>         format = G_0280A0_FORMAT(track->cb_color_info[i]);
>         if (!r600_fmt_is_valid_color(format)) {
> @@ -441,7 +441,7 @@ static int r600_cs_track_validate_cb(struct radeon_cs_parser *p, int i)
>                          * broken userspace.
>                          */
>                 } else {
> -                       dev_warn(p->dev, "%s offset[%d] %d %d %d %lu too big (%d %d) (%d %d %d)\n",
> +                       dev_warn(p->dev, "%s offset[%d] %d %llu %d %lu too big (%d %d) (%d %d %d)\n",
>                                  __func__, i, array_mode,
>                                  track->cb_color_bo_offset[i], tmp,
>                                  radeon_bo_size(track->cb_color_bo[i]),
> @@ -458,6 +458,51 @@ static int r600_cs_track_validate_cb(struct radeon_cs_parser *p, int i)
>         tmp = S_028060_PITCH_TILE_MAX((pitch / 8) - 1) |
>                 S_028060_SLICE_TILE_MAX(slice_tile_max - 1);
>         ib[track->cb_color_size_idx[i]] = tmp;
> +
> +       /* FMASK/CMASK */
> +       switch (G_0280A0_TILE_MODE(track->cb_color_info[i])) {
> +       case V_0280A0_TILE_DISABLE:
> +               break;
> +       case V_0280A0_FRAG_ENABLE:
> +               if (track->nsamples > 1) {
> +                       uint32_t tile_max = G_028100_FMASK_TILE_MAX(track->cb_color_mask[i]);
> +                       /* the tile size is 8x8, but the size is in units of bits.
> +                        * for bytes, do just * 8. */
> +                       uint32_t bytes = track->nsamples * track->log_nsamples * 8 * (tile_max + 1);
> +
> +                       if (bytes + track->cb_color_frag_offset[i] >
> +                           radeon_bo_size(track->cb_color_frag_bo[i])) {
> +                               dev_warn(p->dev, "%s FMASK_TILE_MAX too large "
> +                                        "(tile_max=%u, bytes=%u, offset=%llu, bo_size=%lu)\n",
> +                                        __func__, tile_max, bytes,
> +                                        track->cb_color_frag_offset[i],
> +                                        radeon_bo_size(track->cb_color_frag_bo[i]));
> +                               return -EINVAL;
> +                       }
> +               }
> +               /* fall through */
> +       case V_0280A0_CLEAR_ENABLE:
> +       {
> +               uint32_t block_max = G_028100_CMASK_BLOCK_MAX(track->cb_color_mask[i]);
> +               /* One block = 128x128 pixels, one 8x8 tile has 4 bits..
> +                * (128*128) / (8*8) / 2 = 128 bytes per block. */
> +               uint32_t bytes = (block_max + 1) * 128;
> +
> +               if (bytes + track->cb_color_tile_offset[i] >
> +                   radeon_bo_size(track->cb_color_tile_bo[i])) {
> +                       dev_warn(p->dev, "%s CMASK_BLOCK_MAX too large "
> +                                "(block_max=%u, bytes=%u, offset=%llu, bo_size=%lu)\n",
> +                                __func__, block_max, bytes,
> +                                track->cb_color_tile_offset[i],
> +                                radeon_bo_size(track->cb_color_tile_bo[i]));
> +                       return -EINVAL;
> +               }
> +               break;
> +       }
> +       default:
> +               dev_warn(p->dev, "%s invalid tile mode\n", __func__);
> +               return -EINVAL;
> +       }
>         return 0;
>  }
>
> @@ -1231,6 +1276,7 @@ static int r600_cs_check_reg(struct radeon_cs_parser *p, u32 reg, u32 idx)
>                 break;
>         case R_028C04_PA_SC_AA_CONFIG:
>                 tmp = G_028C04_MSAA_NUM_SAMPLES(radeon_get_ib_value(p, idx));
> +               track->log_nsamples = tmp;
>                 track->nsamples = 1 << tmp;
>                 track->cb_dirty = true;
>                 break;
> @@ -1312,16 +1358,21 @@ static int r600_cs_check_reg(struct radeon_cs_parser *p, u32 reg, u32 idx)
>                                 dev_err(p->dev, "Broken old userspace ? no cb_color0_base supplied before trying to write 0x%08X\n", reg);
>                                 return -EINVAL;
>                         }
> -                       ib[idx] = track->cb_color_base_last[tmp];
>                         track->cb_color_frag_bo[tmp] = track->cb_color_bo[tmp];
> +                       track->cb_color_frag_offset[tmp] = track->cb_color_bo_offset[tmp];
> +                       ib[idx] = track->cb_color_base_last[tmp];
>                 } else {
>                         r = r600_cs_packet_next_reloc(p, &reloc);
>                         if (r) {
>                                 dev_err(p->dev, "bad SET_CONTEXT_REG 0x%04X\n", reg);
>                                 return -EINVAL;
>                         }
> -                       ib[idx] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
>                         track->cb_color_frag_bo[tmp] = reloc->robj;
> +                       track->cb_color_frag_offset[tmp] = (u64)ib[idx] << 8;
> +                       ib[idx] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
> +               }
> +               if (G_0280A0_TILE_MODE(track->cb_color_info[tmp])) {
> +                       track->cb_dirty = true;
>                 }
>                 break;
>         case R_0280C0_CB_COLOR0_TILE:
> @@ -1338,16 +1389,35 @@ static int r600_cs_check_reg(struct radeon_cs_parser *p, u32 reg, u32 idx)
>                                 dev_err(p->dev, "Broken old userspace ? no cb_color0_base supplied before trying to write 0x%08X\n", reg);
>                                 return -EINVAL;
>                         }
> -                       ib[idx] = track->cb_color_base_last[tmp];
>                         track->cb_color_tile_bo[tmp] = track->cb_color_bo[tmp];
> +                       track->cb_color_tile_offset[tmp] = track->cb_color_bo_offset[tmp];
> +                       ib[idx] = track->cb_color_base_last[tmp];
>                 } else {
>                         r = r600_cs_packet_next_reloc(p, &reloc);
>                         if (r) {
>                                 dev_err(p->dev, "bad SET_CONTEXT_REG 0x%04X\n", reg);
>                                 return -EINVAL;
>                         }
> -                       ib[idx] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
>                         track->cb_color_tile_bo[tmp] = reloc->robj;
> +                       track->cb_color_tile_offset[tmp] = (u64)ib[idx] << 8;
> +                       ib[idx] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
> +               }
> +               if (G_0280A0_TILE_MODE(track->cb_color_info[tmp])) {
> +                       track->cb_dirty = true;
> +               }
> +               break;
> +       case R_028100_CB_COLOR0_MASK:
> +       case R_028104_CB_COLOR1_MASK:
> +       case R_028108_CB_COLOR2_MASK:
> +       case R_02810C_CB_COLOR3_MASK:
> +       case R_028110_CB_COLOR4_MASK:
> +       case R_028114_CB_COLOR5_MASK:
> +       case R_028118_CB_COLOR6_MASK:
> +       case R_02811C_CB_COLOR7_MASK:
> +               tmp = (reg - R_028100_CB_COLOR0_MASK) / 4;
> +               track->cb_color_mask[tmp] = ib[idx];
> +               if (G_0280A0_TILE_MODE(track->cb_color_info[tmp])) {
> +                       track->cb_dirty = true;
>                 }
>                 break;
>         case CB_COLOR0_BASE:
> diff --git a/drivers/gpu/drm/radeon/r600d.h b/drivers/gpu/drm/radeon/r600d.h
> index fd328f4..bdb69a6 100644
> --- a/drivers/gpu/drm/radeon/r600d.h
> +++ b/drivers/gpu/drm/radeon/r600d.h
> @@ -92,6 +92,20 @@
>  #define R_028094_CB_COLOR5_VIEW                      0x028094
>  #define R_028098_CB_COLOR6_VIEW                      0x028098
>  #define R_02809C_CB_COLOR7_VIEW                      0x02809C
> +#define R_028100_CB_COLOR0_MASK                      0x028100
> +#define   S_028100_CMASK_BLOCK_MAX(x)                  (((x) & 0xFFF) << 0)
> +#define   G_028100_CMASK_BLOCK_MAX(x)                  (((x) >> 0) & 0xFFF)
> +#define   C_028100_CMASK_BLOCK_MAX                     0xFFFFF000
> +#define   S_028100_FMASK_TILE_MAX(x)                   (((x) & 0xFFFFF) << 12)
> +#define   G_028100_FMASK_TILE_MAX(x)                   (((x) >> 12) & 0xFFFFF)
> +#define   C_028100_FMASK_TILE_MAX                      0x00000FFF
> +#define R_028104_CB_COLOR1_MASK                      0x028104
> +#define R_028108_CB_COLOR2_MASK                      0x028108
> +#define R_02810C_CB_COLOR3_MASK                      0x02810C
> +#define R_028110_CB_COLOR4_MASK                      0x028110
> +#define R_028114_CB_COLOR5_MASK                      0x028114
> +#define R_028118_CB_COLOR6_MASK                      0x028118
> +#define R_02811C_CB_COLOR7_MASK                      0x02811C
>  #define CB_COLOR0_INFO                                  0x280a0
>  #      define CB_FORMAT(x)                             ((x) << 2)
>  #       define CB_ARRAY_MODE(x)                         ((x) << 8)
> @@ -1400,6 +1414,9 @@
>  #define   S_0280A0_TILE_MODE(x)                        (((x) & 0x3) << 18)
>  #define   G_0280A0_TILE_MODE(x)                        (((x) >> 18) & 0x3)
>  #define   C_0280A0_TILE_MODE                           0xFFF3FFFF
> +#define     V_0280A0_TILE_DISABLE                      0
> +#define     V_0280A0_CLEAR_ENABLE                      1
> +#define     V_0280A0_FRAG_ENABLE                       2
>  #define   S_0280A0_BLEND_CLAMP(x)                      (((x) & 0x1) << 20)
>  #define   G_0280A0_BLEND_CLAMP(x)                      (((x) >> 20) & 0x1)
>  #define   C_0280A0_BLEND_CLAMP                         0xFFEFFFFF
> diff --git a/drivers/gpu/drm/radeon/radeon_drv.c b/drivers/gpu/drm/radeon/radeon_drv.c
> index d7269f4..27d22d7 100644
> --- a/drivers/gpu/drm/radeon/radeon_drv.c
> +++ b/drivers/gpu/drm/radeon/radeon_drv.c
> @@ -62,9 +62,10 @@
>   *   2.18.0 - r600-eg: allow "invalid" DB formats
>   *   2.19.0 - r600-eg: MSAA textures
>   *   2.20.0 - r600-si: RADEON_INFO_TIMESTAMP query
> + *   2.21.0 - r600-r700: FMASK and CMASK
>   */
>  #define KMS_DRIVER_MAJOR       2
> -#define KMS_DRIVER_MINOR       20
> +#define KMS_DRIVER_MINOR       21
>  #define KMS_DRIVER_PATCHLEVEL  0
>  int radeon_driver_load_kms(struct drm_device *dev, unsigned long flags);
>  int radeon_driver_unload_kms(struct drm_device *dev);
> diff --git a/drivers/gpu/drm/radeon/reg_srcs/r600 b/drivers/gpu/drm/radeon/reg_srcs/r600
> index 5e659b0..f93e45d 100644
> --- a/drivers/gpu/drm/radeon/reg_srcs/r600
> +++ b/drivers/gpu/drm/radeon/reg_srcs/r600
> @@ -744,14 +744,6 @@ r600 0x9400
>  0x00028C38 CB_CLRCMP_DST
>  0x00028C3C CB_CLRCMP_MSK
>  0x00028C34 CB_CLRCMP_SRC
> -0x00028100 CB_COLOR0_MASK
> -0x00028104 CB_COLOR1_MASK
> -0x00028108 CB_COLOR2_MASK
> -0x0002810C CB_COLOR3_MASK
> -0x00028110 CB_COLOR4_MASK
> -0x00028114 CB_COLOR5_MASK
> -0x00028118 CB_COLOR6_MASK
> -0x0002811C CB_COLOR7_MASK
>  0x00028808 CB_COLOR_CONTROL
>  0x0002842C CB_FOG_BLUE
>  0x00028428 CB_FOG_GREEN
> --
> 1.7.9.5
>


More information about the dri-devel mailing list