[igt-dev] [PATCH i-g-t v2 4/4] lib/igt_fb: Generalize the slow read from gtt mmap handling
Ville Syrjala
ville.syrjala at linux.intel.com
Fri Nov 2 19:37:31 UTC 2018
From: Ville Syrjälä <ville.syrjala at linux.intel.com>
Make the handling of slow gtt mmap reads generic, and extend it to
the pixman converter. Makes the pixman path a bit faster.
When testing just XRGB8888 and XBGR8888 on KBL:
$ time kms_plane --r pixel-format-pipe-A-planes
- real 0m18,757s
+ real 0m2,635s
v2: Use the original src buffer if the malloc fails (Chris)
    Drop the duplicated comment about things being slow
Cc: Chris Wilson <chris at chris-wilson.co.uk>
Cc: Maxime Ripard <maxime.ripard at bootlin.com>
Cc: Arkadiusz Hiler <arkadiusz.hiler at intel.com>
Cc: Juha-Pekka Heikkila <juhapekka.heikkila at gmail.com>
Cc: Maarten Lankhorst <maarten.lankhorst at linux.intel.com>
Signed-off-by: Ville Syrjälä <ville.syrjala at linux.intel.com>
---
lib/igt_fb.c | 61 +++++++++++++++++++++++++++++++++++++---------------
1 file changed, 44 insertions(+), 17 deletions(-)
diff --git a/lib/igt_fb.c b/lib/igt_fb.c
index 97310f70b635..01efd269714b 100644
--- a/lib/igt_fb.c
+++ b/lib/igt_fb.c
@@ -1506,6 +1506,7 @@ static void write_rgb(uint8_t *rgb24, const struct igt_vec4 *rgb)
struct fb_convert_buf {
void *ptr;
struct igt_fb *fb;
+ bool slow_reads;
};
struct fb_convert {
@@ -1513,6 +1514,34 @@ struct fb_convert {
struct fb_convert_buf src;
};
+static void *convert_src_get(const struct fb_convert *cvt)
+{
+ void *buf;
+
+ if (!cvt->src.slow_reads)
+ return cvt->src.ptr;
+
+ /*
+ * Reading from the BO is awfully slow because of lack of read caching,
+ * it's faster to copy the whole BO to a temporary buffer and convert
+ * from there.
+ */
+ buf = malloc(cvt->src.fb->size);
+ if (!buf)
+ return cvt->src.ptr;
+
+ igt_memcpy_from_wc(buf, cvt->src.ptr, cvt->src.fb->size);
+
+ return buf;
+}
+
+static void convert_src_put(const struct fb_convert *cvt,
+ void *src_buf)
+{
+ if (src_buf != cvt->src.ptr)
+ free(src_buf);
+}
+
static void convert_nv12_to_rgb24(struct fb_convert *cvt)
{
int i, j;
@@ -1520,19 +1549,14 @@ static void convert_nv12_to_rgb24(struct fb_convert *cvt)
uint8_t *rgb24 = cvt->dst.ptr;
unsigned int rgb24_stride = cvt->dst.fb->strides[0];
unsigned int planar_stride = cvt->src.fb->strides[0];
- uint8_t *buf = malloc(cvt->src.fb->size);
struct igt_mat4 m = igt_ycbcr_to_rgb_matrix(cvt->src.fb->color_encoding,
cvt->src.fb->color_range);
+ uint8_t *buf;
igt_assert(cvt->src.fb->drm_format == DRM_FORMAT_NV12 &&
cvt->dst.fb->drm_format == DRM_FORMAT_XRGB8888);
- /*
- * Reading from the BO is awfully slow because of lack of read caching,
- * it's faster to copy the whole BO to a temporary buffer and convert
- * from there.
- */
- igt_memcpy_from_wc(buf, cvt->src.ptr, cvt->src.fb->size);
+ buf = convert_src_get(cvt);
y = buf + cvt->src.fb->offsets[0];
uv = buf + cvt->src.fb->offsets[1];
@@ -1622,7 +1646,7 @@ static void convert_nv12_to_rgb24(struct fb_convert *cvt)
}
}
- free(buf);
+ convert_src_put(cvt, buf);
}
static void convert_rgb24_to_nv12(struct fb_convert *cvt)
@@ -1760,10 +1784,10 @@ static void convert_yuyv_to_rgb24(struct fb_convert *cvt)
uint8_t *rgb24 = cvt->dst.ptr;
unsigned int rgb24_stride = cvt->dst.fb->strides[0];
unsigned int yuyv_stride = cvt->src.fb->strides[0];
- uint8_t *buf = malloc(cvt->src.fb->size);
struct igt_mat4 m = igt_ycbcr_to_rgb_matrix(cvt->src.fb->color_encoding,
cvt->src.fb->color_range);
const unsigned char *swz = yuyv_swizzle(cvt->src.fb->drm_format);
+ uint8_t *buf;
igt_assert((cvt->src.fb->drm_format == DRM_FORMAT_YUYV ||
cvt->src.fb->drm_format == DRM_FORMAT_UYVY ||
@@ -1771,12 +1795,7 @@ static void convert_yuyv_to_rgb24(struct fb_convert *cvt)
cvt->src.fb->drm_format == DRM_FORMAT_VYUY) &&
cvt->dst.fb->drm_format == DRM_FORMAT_XRGB8888);
- /*
- * Reading from the BO is awfully slow because of lack of read caching,
- * it's faster to copy the whole BO to a temporary buffer and convert
- * from there.
- */
- igt_memcpy_from_wc(buf, cvt->src.ptr, cvt->src.fb->size);
+ buf = convert_src_get(cvt);
yuyv = buf;
for (i = 0; i < cvt->dst.fb->height; i++) {
@@ -1816,7 +1835,7 @@ static void convert_yuyv_to_rgb24(struct fb_convert *cvt)
yuyv += yuyv_stride;
}
- free(buf);
+ convert_src_put(cvt, buf);
}
static void convert_rgb24_to_yuyv(struct fb_convert *cvt)
@@ -1877,14 +1896,17 @@ static void convert_pixman(struct fb_convert *cvt)
pixman_format_code_t src_pixman = drm_format_to_pixman(cvt->src.fb->drm_format);
pixman_format_code_t dst_pixman = drm_format_to_pixman(cvt->dst.fb->drm_format);
pixman_image_t *dst_image, *src_image;
+ void *src_ptr;
igt_assert((src_pixman != PIXMAN_invalid) &&
(dst_pixman != PIXMAN_invalid));
+ src_ptr = convert_src_get(cvt);
+
src_image = pixman_image_create_bits(src_pixman,
cvt->src.fb->width,
cvt->src.fb->height,
- cvt->src.ptr,
+ src_ptr,
cvt->src.fb->strides[0]);
igt_assert(src_image);
@@ -1900,6 +1922,8 @@ static void convert_pixman(struct fb_convert *cvt)
cvt->dst.fb->width, cvt->dst.fb->height);
pixman_image_unref(dst_image);
pixman_image_unref(src_image);
+
+ convert_src_put(cvt, src_ptr);
}
static void fb_convert(struct fb_convert *cvt)
@@ -1991,6 +2015,9 @@ static void create_cairo_surface__convert(int fd, struct igt_fb *fb)
blit->base.linear.fb.gem_handle = 0;
blit->base.linear.map = map_bo(fd, fb);
igt_assert(blit->base.linear.map);
+
+ /* reading via gtt mmap is slow */
+ cvt.src.slow_reads = is_i915_device(fd);
}
cvt.dst.ptr = blit->shadow_ptr;
--
2.18.1
More information about the igt-dev
mailing list