[Mesa-dev] [PATCH v3] vl/dri3: use external texture as back buffers(v3)

Leo Liu leo.liu at amd.com
Fri Nov 4 19:54:04 UTC 2016



On 11/04/2016 02:45 PM, Nayan Deshmukh wrote:
> dri3 allows us to send handle of a texture directly to X
> so this patch allows a state tracker to directly send its
> texture to X to be used as back buffer and avoids extra
> copying
>
> v2: use clip width/height to display a portion of the surface
> v3: remove redundant variables, fix wrapping, rename variables
>      handle vaapi path
>
> Suggested-by: Leo Liu <leo.liu at amd.com>
> Signed-off-by: Nayan Deshmukh <nayan26deshmukh at gmail.com>
> ---
>   src/gallium/auxiliary/vl/vl_winsys.h      |   4 +
>   src/gallium/auxiliary/vl/vl_winsys_dri3.c | 117 ++++++++++++++++++++++++++----
>   2 files changed, 108 insertions(+), 13 deletions(-)
>
> diff --git a/src/gallium/auxiliary/vl/vl_winsys.h b/src/gallium/auxiliary/vl/vl_winsys.h
> index 26db9f2..908e9c6 100644
> --- a/src/gallium/auxiliary/vl/vl_winsys.h
> +++ b/src/gallium/auxiliary/vl/vl_winsys.h
> @@ -59,6 +59,10 @@ struct vl_screen
>      void *
>      (*get_private)(struct vl_screen *vscreen);
>   
> +   void
> +   (*set_back_texture_from_output)(struct vl_screen *vscreen, struct pipe_resource *buffer,
> +                         uint32_t width, uint32_t height);
> +
>      struct pipe_screen *pscreen;
>      struct pipe_loader_device *dev;
>   };
> diff --git a/src/gallium/auxiliary/vl/vl_winsys_dri3.c b/src/gallium/auxiliary/vl/vl_winsys_dri3.c
> index 2929928..9d0cd5a 100644
> --- a/src/gallium/auxiliary/vl/vl_winsys_dri3.c
> +++ b/src/gallium/auxiliary/vl/vl_winsys_dri3.c
> @@ -31,6 +31,7 @@
>   #include <X11/xshmfence.h>
>   #include <xcb/dri3.h>
>   #include <xcb/present.h>
> +#include <xcb/xfixes.h>
>   
>   #include "loader.h"
>   
> @@ -57,6 +58,7 @@ struct vl_dri3_buffer
>   
>      bool busy;
>      uint32_t width, height, pitch;
> +   uint32_t clip_width, clip_height;
>   };
>   
>   struct vl_dri3_screen
> @@ -71,6 +73,8 @@ struct vl_dri3_screen
>      xcb_special_event_t *special_event;
>   
>      struct pipe_context *pipe;
> +   struct pipe_resource *output_texture;
> +   uint32_t clip_width, clip_height;

Sorry, maybe I haven't explained clear enough on "combine", quick hack 
on top of this patch, just for your reference.

--- a/src/gallium/auxiliary/vl/vl_winsys_dri3.c
+++ b/src/gallium/auxiliary/vl/vl_winsys_dri3.c
@@ -58,7 +58,6 @@ struct vl_dri3_buffer

     bool busy;
     uint32_t width, height, pitch;
-   uint32_t clip_width, clip_height;
  };

  struct vl_dri3_screen
@@ -241,33 +240,23 @@ dri3_alloc_back_buffer(struct vl_dri3_screen *scrn)
     templ.format = PIPE_FORMAT_B8G8R8X8_UNORM;
     templ.target = PIPE_TEXTURE_2D;
     templ.last_level = 0;
-   if (scrn->output_texture) {
-      buffer->clip_width = (scrn->clip_width) ? scrn->clip_width :
-                           scrn->width;
-      buffer->clip_height = (scrn->clip_height) ? scrn->clip_height :
-                            scrn->height;
-      templ.width0 = scrn->output_texture->width0;
-      templ.height0 = scrn->output_texture->height0;
-   } else {
-       templ.width0 = scrn->width;
-       templ.height0 = scrn->height;
-       buffer->clip_width = scrn->width;
-       buffer->clip_height = scrn->height;
-   }
+   templ.width0 = (scrn->output_texture) ?
+         scrn->output_texture->width0 : scrn->width;
+   templ.height0 = (scrn->output_texture) ?
+         scrn->output_texture->height0 : scrn->height;
     templ.depth0 = 1;
     templ.array_size = 1;

     if (scrn->is_different_gpu) {
        buffer->texture = (scrn->output_texture) ? scrn->output_texture :
- scrn->base.pscreen->resource_create(scrn->base.pscreen,
- &templ);
+ scrn->base.pscreen->resource_create(scrn->base.pscreen, &templ);
        if (!buffer->texture)
           goto unmap_shm;

        templ.bind |= PIPE_BIND_SCANOUT | PIPE_BIND_SHARED |
                      PIPE_BIND_LINEAR;
-      buffer->linear_texture = 
scrn->base.pscreen->resource_create(scrn->base.pscreen,
- &templ);
+      buffer->linear_texture =
+ scrn->base.pscreen->resource_create(scrn->base.pscreen, &templ);
        pixmap_buffer_texture = buffer->linear_texture;

        if (!buffer->linear_texture)
@@ -275,8 +264,7 @@ dri3_alloc_back_buffer(struct vl_dri3_screen *scrn)
     } else {
        templ.bind |= PIPE_BIND_SCANOUT | PIPE_BIND_SHARED;
        buffer->texture = (scrn->output_texture) ? scrn->output_texture :
- scrn->base.pscreen->resource_create(scrn->base.pscreen,
- &templ);
+ scrn->base.pscreen->resource_create(scrn->base.pscreen, &templ);
        if (!buffer->texture)
           goto unmap_shm;
        pixmap_buffer_texture = buffer->texture;
@@ -373,15 +361,12 @@ dri3_get_back_buffer(struct vl_dri3_screen *scrn)
vl_compositor_reset_dirty_area(&scrn->dirty_areas[scrn->cur_back]);
        buffer = new_buffer;
        scrn->back_buffers[scrn->cur_back] = buffer;
-   } else if (scrn->output_texture) {
+   } else if (scrn->output_texture)
        /* In case of different gpu we can reuse the linear
         * texture so we only need to set the external
         * texture for copying
         */
        buffer->texture = scrn->output_texture;
-      buffer->clip_width = scrn->clip_width;
-      buffer->clip_height = scrn->clip_height;
-   }

>   
>      struct vl_dri3_buffer *back_buffers[BACK_BUFFER_NUM];
>      int cur_back;
> @@ -105,7 +109,8 @@ dri3_free_back_buffer(struct vl_dri3_screen *scrn,
>      xcb_free_pixmap(scrn->conn, buffer->pixmap);
>      xcb_sync_destroy_fence(scrn->conn, buffer->sync_fence);
>      xshmfence_unmap_shm(buffer->shm_fence);
> -   pipe_resource_reference(&buffer->texture, NULL);
> +   if (!scrn->output_texture)
> +      pipe_resource_reference(&buffer->texture, NULL);
>      if (buffer->linear_texture)
>          pipe_resource_reference(&buffer->linear_texture, NULL);
>      FREE(buffer);
> @@ -236,13 +241,25 @@ dri3_alloc_back_buffer(struct vl_dri3_screen *scrn)
>      templ.format = PIPE_FORMAT_B8G8R8X8_UNORM;
>      templ.target = PIPE_TEXTURE_2D;
>      templ.last_level = 0;
> -   templ.width0 = scrn->width;
> -   templ.height0 = scrn->height;
> +   if (scrn->output_texture) {
> +      buffer->clip_width = (scrn->clip_width) ? scrn->clip_width :
> +                           scrn->width;
> +      buffer->clip_height = (scrn->clip_height) ? scrn->clip_height :
> +                            scrn->height;
> +      templ.width0 = scrn->output_texture->width0;
> +      templ.height0 = scrn->output_texture->height0;
> +   } else {
> +       templ.width0 = scrn->width;
> +       templ.height0 = scrn->height;
> +       buffer->clip_width = scrn->width;
> +       buffer->clip_height = scrn->height;
> +   }
>      templ.depth0 = 1;
>      templ.array_size = 1;
>   
>      if (scrn->is_different_gpu) {
> -      buffer->texture = scrn->base.pscreen->resource_create(scrn->base.pscreen,
> +      buffer->texture = (scrn->output_texture) ? scrn->output_texture :
> +                        scrn->base.pscreen->resource_create(scrn->base.pscreen,
>                                                               &templ);
>         if (!buffer->texture)
>            goto unmap_shm;
> @@ -257,7 +274,8 @@ dri3_alloc_back_buffer(struct vl_dri3_screen *scrn)
>            goto no_linear_texture;
>      } else {
>         templ.bind |= PIPE_BIND_SCANOUT | PIPE_BIND_SHARED;
> -      buffer->texture = scrn->base.pscreen->resource_create(scrn->base.pscreen,
> +      buffer->texture = (scrn->output_texture) ? scrn->output_texture :
> +                        scrn->base.pscreen->resource_create(scrn->base.pscreen,
>                                                               &templ);
>         if (!buffer->texture)
>            goto unmap_shm;
> @@ -271,11 +289,14 @@ dri3_alloc_back_buffer(struct vl_dri3_screen *scrn)
>                                              usage);
>      buffer_fd = whandle.handle;
>      buffer->pitch = whandle.stride;
> +   buffer->width = templ.width0;
> +   buffer->height = templ.height0;
> +
>      xcb_dri3_pixmap_from_buffer(scrn->conn,
>                                  (pixmap = xcb_generate_id(scrn->conn)),
>                                  scrn->drawable,
>                                  0,
> -                               scrn->width, scrn->height, buffer->pitch,
> +                               buffer->width, buffer->height, buffer->pitch,
>                                  scrn->depth, 32,
>                                  buffer_fd);
>      xcb_dri3_fence_from_fd(scrn->conn,
> @@ -287,8 +308,6 @@ dri3_alloc_back_buffer(struct vl_dri3_screen *scrn)
>      buffer->pixmap = pixmap;
>      buffer->sync_fence = sync_fence;
>      buffer->shm_fence = shm_fence;
> -   buffer->width = scrn->width;
> -   buffer->height = scrn->height;
>   
>      xshmfence_trigger(buffer->shm_fence);
>   
> @@ -310,6 +329,7 @@ dri3_get_back_buffer(struct vl_dri3_screen *scrn)
>   {
>      struct vl_dri3_buffer *buffer;
>      struct pipe_resource *texture = NULL;
> +   bool allocate_new_buffer = false;
>   
>      assert(scrn);
>   
> @@ -318,8 +338,28 @@ dri3_get_back_buffer(struct vl_dri3_screen *scrn)
>         return NULL;
>      buffer = scrn->back_buffers[scrn->cur_back];
>   
> -   if (!buffer || buffer->width != scrn->width ||
> -       buffer->height != scrn->height) {
> +   /* This is normal case when our buffer is smaller
> +    * than the screen this will be same for external
> +    * texture
> +    */
> +   if (scrn->output_texture) {
> +      if (!buffer || buffer->width < scrn->width ||
> +          buffer->height < scrn->height)
> +         allocate_new_buffer = true;
> +   } else {
> +      if (!buffer || buffer->width != scrn->width ||
> +          buffer->height != scrn->height)
> +         allocate_new_buffer = true;
> +   }
> +

Any better ways?

> +   /* In case of a single gpu we need to get the
> +    * handle and pixmap for the texture that is set
> +    */
> +   if (buffer && scrn->output_texture &&
> +       !scrn->is_different_gpu)
> +      allocate_new_buffer = true;
> +

So now the normal case i.e. single gpu case have to allocate new buffers 
and have X extension calls on each frame, which are still very expensive.

Christian&Michel, any better ways ?

Regards,
Leo

> +   if (allocate_new_buffer) {
>         struct vl_dri3_buffer *new_buffer;
>   
>         new_buffer = dri3_alloc_back_buffer(scrn);
> @@ -329,9 +369,18 @@ dri3_get_back_buffer(struct vl_dri3_screen *scrn)
>         if (buffer)
>            dri3_free_back_buffer(scrn, buffer);
>   
> -      vl_compositor_reset_dirty_area(&scrn->dirty_areas[scrn->cur_back]);
> +      if (!scrn->output_texture)
> +         vl_compositor_reset_dirty_area(&scrn->dirty_areas[scrn->cur_back]);
>         buffer = new_buffer;
>         scrn->back_buffers[scrn->cur_back] = buffer;
> +   } else if (scrn->output_texture) {
> +      /* In case of different gpu we can reuse the linear
> +       * texture so we only need to set the external
> +       * texture for copying
> +       */
> +      buffer->texture = scrn->output_texture;
> +      buffer->clip_width = scrn->clip_width;
> +      buffer->clip_height = scrn->clip_height;
>      }
>   
>      pipe_resource_reference(&texture, buffer->texture);
> @@ -500,6 +549,8 @@ vl_dri3_flush_frontbuffer(struct pipe_screen *screen,
>      uint32_t options = XCB_PRESENT_OPTION_NONE;
>      struct vl_dri3_buffer *back;
>      struct pipe_box src_box;
> +   xcb_xfixes_region_t region;
> +   xcb_rectangle_t rectangle;
>   
>      back = scrn->back_buffers[scrn->cur_back];
>      if (!back)
> @@ -511,8 +562,16 @@ vl_dri3_flush_frontbuffer(struct pipe_screen *screen,
>               return;
>      }
>   
> +   rectangle.x = 0;
> +   rectangle.y = 0;
> +   rectangle.width = back->clip_width;
> +   rectangle.height = back->clip_height;
> +
> +   region = xcb_generate_id(scrn->conn);
> +   xcb_xfixes_create_region(scrn->conn, region, 2, &rectangle);
> +
>      if (scrn->is_different_gpu) {
> -      u_box_origin_2d(scrn->width, scrn->height, &src_box);
> +      u_box_origin_2d(back->width, back->height, &src_box);
>         scrn->pipe->resource_copy_region(scrn->pipe,
>                                          back->linear_texture,
>                                          0, 0, 0, 0,
> @@ -528,7 +587,7 @@ vl_dri3_flush_frontbuffer(struct pipe_screen *screen,
>                         scrn->drawable,
>                         back->pixmap,
>                         (uint32_t)(++scrn->send_sbc),
> -                      0, 0, 0, 0,
> +                      0, region, 0, 0,
>                         None, None,
>                         back->sync_fence,
>                         options,
> @@ -627,6 +686,20 @@ vl_dri3_screen_get_private(struct vl_screen *vscreen)
>   }
>   
>   static void
> +vl_dri3_screen_set_back_texture_from_output(struct vl_screen *vscreen,
> +                                            struct pipe_resource *buffer,
> +                                            uint32_t width, uint32_t height)
> +{
> +   struct vl_dri3_screen *scrn = (struct vl_dri3_screen *)vscreen;
> +
> +   assert(scrn);
> +
> +   scrn->output_texture = buffer;
> +   scrn->clip_width = width;
> +   scrn->clip_height = height;
> +}
> +
> +static void
>   vl_dri3_screen_destroy(struct vl_screen *vscreen)
>   {
>      struct vl_dri3_screen *scrn = (struct vl_dri3_screen *)vscreen;
> @@ -675,6 +748,9 @@ vl_dri3_screen_create(Display *display, int screen)
>      xcb_dri3_open_reply_t *open_reply;
>      xcb_get_geometry_cookie_t geom_cookie;
>      xcb_get_geometry_reply_t *geom_reply;
> +   xcb_xfixes_query_version_cookie_t xfixes_cookie;
> +   xcb_xfixes_query_version_reply_t *xfixes_reply;
> +   xcb_generic_error_t *error;
>      int fd;
>   
>      assert(display);
> @@ -689,12 +765,26 @@ vl_dri3_screen_create(Display *display, int screen)
>   
>      xcb_prefetch_extension_data(scrn->conn , &xcb_dri3_id);
>      xcb_prefetch_extension_data(scrn->conn, &xcb_present_id);
> +   xcb_prefetch_extension_data (scrn->conn, &xcb_xfixes_id);
>      extension = xcb_get_extension_data(scrn->conn, &xcb_dri3_id);
>      if (!(extension && extension->present))
>         goto free_screen;
>      extension = xcb_get_extension_data(scrn->conn, &xcb_present_id);
>      if (!(extension && extension->present))
>         goto free_screen;
> +   extension = xcb_get_extension_data(scrn->conn, &xcb_xfixes_id);
> +   if (!(extension && extension->present))
> +      goto free_screen;
> +
> +   xfixes_cookie = xcb_xfixes_query_version(scrn->conn, XCB_XFIXES_MAJOR_VERSION,
> +                                            XCB_XFIXES_MINOR_VERSION);
> +   xfixes_reply = xcb_xfixes_query_version_reply(scrn->conn, xfixes_cookie, &error);
> +   if (!xfixes_reply || error || xfixes_reply->major_version < 2) {
> +      free(error);
> +      free(xfixes_reply);
> +      goto free_screen;
> +   }
> +   free(xfixes_reply);
>   
>      open_cookie = xcb_dri3_open(scrn->conn, RootWindow(display, screen), None);
>      open_reply = xcb_dri3_open_reply(scrn->conn, open_cookie, NULL);
> @@ -744,6 +834,7 @@ vl_dri3_screen_create(Display *display, int screen)
>      scrn->base.set_next_timestamp = vl_dri3_screen_set_next_timestamp;
>      scrn->base.get_private = vl_dri3_screen_get_private;
>      scrn->base.pscreen->flush_frontbuffer = vl_dri3_flush_frontbuffer;
> +   scrn->base.set_back_texture_from_output = vl_dri3_screen_set_back_texture_from_output;
>   
>      return &scrn->base;
>   



More information about the mesa-dev mailing list