[Intel-gfx] [PATCH] tests: Add gem_blt_copy_align test

Fri Dec 12 08:59:21 PST 2014

On 12 December 2014 at 16:53, Mika Kuoppala
<mika.kuoppala at linux.intel.com> wrote:
> Copy a block into destination object with varying dst/src offsets.
> Put guard area before and after the blit target to see that it didn't
> touch memory out of blit boundaries.
>
> References: https://bugs.freedesktop.org/show_bug.cgi?id=79053
> Cc: Chris Wilson <chris at chris-wilson.co.uk>
> Signed-off-by: Mika Kuoppala <mika.kuoppala at intel.com>
> ---
>  gem_blt_copy_align.c       | 230 +++++++++++++++++++++++++++++++++++++++++++

Did you mean to add this file?

>  tests/Makefile.sources     |   1 +
>  tests/gem_blt_copy_align.c | 237 +++++++++++++++++++++++++++++++++++++++++++++
>  3 files changed, 468 insertions(+)
>  create mode 100644 gem_blt_copy_align.c
>  create mode 100644 tests/gem_blt_copy_align.c

Please also add the test binary name to .gitignore and add a short
description of the test using the IGT_TEST_DESCRIPTION macro.

>
> diff --git a/gem_blt_copy_align.c b/gem_blt_copy_align.c
> new file mode 100644
> index 0000000..84693da
> --- /dev/null
> +++ b/gem_blt_copy_align.c
> @@ -0,0 +1,230 @@
> +/*
> + * Copyright © 2014 Intel Corporation
> + *
> + * Permission is hereby granted, free of charge, to any person obtaining a
> + * copy of this software and associated documentation files (the "Software"),
> + * to deal in the Software without restriction, including without limitation
> + * the rights to use, copy, modify, merge, publish, distribute, sublicense,
> + * and/or sell copies of the Software, and to permit persons to whom the
> + * Software is furnished to do so, subject to the following conditions:
> + *
> + * The above copyright notice and this permission notice (including the next
> + * paragraph) shall be included in all copies or substantial portions of the
> + * Software.
> + *
> + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
> + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
> + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
> + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
> + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
> + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
> + * IN THE SOFTWARE.
> + *
> + * Authors:
> + *    Chris Wilson <chris at chris-wilson.co.uk>
> + *    Mika Kuoppala <mika.kuoppala at intel.com>
> + *
> + */
> +
> +#include <stdio.h>
> +#include <string.h>
> +#include <stdint.h>
> +#include "i915_drm.h"
> +#include "intel_chipset.h"
> +#include "intel_reg.h"
> +#include "ioctl_wrappers.h"
> +#include "drm.h"
> +#include "drmtest.h"
> +
> +static int gen = 0;
> +
> +#define WIDTH 32
> +#define HEIGHT 32
> +
> +static uint32_t linear[WIDTH*HEIGHT];
> +
> +static void
> +copy_align(int fd,
> +          uint32_t dst, uint32_t dst_offset,
> +          uint32_t src, uint32_t src_offset,
> +          uint32_t w, uint32_t h)
> +{
> +       uint32_t batch[12];
> +       struct drm_i915_gem_relocation_entry reloc[2];
> +       struct drm_i915_gem_exec_object2 obj[3];
> +       struct drm_i915_gem_execbuffer2 exec;
> +       uint32_t handle;
> +       int i=0;
> +
> +       batch[i++] = XY_SRC_COPY_BLT_CMD |
> +               XY_SRC_COPY_BLT_WRITE_ALPHA |
> +               XY_SRC_COPY_BLT_WRITE_RGB;
> +       if (gen >= 8)
> +               batch[i - 1] |= 8;
> +       else
> +               batch[i - 1] |= 6;
> +
> +       batch[i++] = (3 << 24) | /* 32 bits */
> +               (0xcc << 16) | /* copy ROP */
> +               w * 4;
> +
> +       /* The >= gen8 blitter needs to have dst/src base
> +        * addresses aligned to 4k. So we need to handle the
> +        * offsets with with dst/src coordinates */
> +       batch[i++] = dst_offset; /* dst, x1,y2 */
> +       batch[i++] = ((h) << 16) | (w + dst_offset); /* dst x2,y2 */
> +       batch[i++] = 0;
> +       if (gen >= 8)
> +               batch[i++] = 0;
> +       batch[i++] = src_offset; /* src x1,y1 */
> +       batch[i++] = w * 4;
> +
> +#if 0
> +       /* Bspec says this should be aligned to quad with gen8 but it doesn't
> +          seem to matter */
> +       if (gen >= 8 && (w * 4) % 8)
> +               igt_warn("src pitch NOT aligned to quad\n");
> +#endif
> +
> +       batch[i++] = 0;
> +       if (gen >= 8)
> +               batch[i++] = 0;
> +
> +       batch[i++] = MI_BATCH_BUFFER_END;
> +       batch[i++] = MI_NOOP;
> +
> +       handle = gem_create(fd, 4096);
> +       gem_write(fd, handle, 0, batch, sizeof(batch));
> +
> +       reloc[0].target_handle = dst;
> +       reloc[0].delta = 0;
> +       reloc[0].offset = 4 * sizeof(batch[0]);
> +       reloc[0].presumed_offset = 0;
> +       reloc[0].read_domains = I915_GEM_DOMAIN_RENDER;
> +       reloc[0].write_domain = I915_GEM_DOMAIN_RENDER;
> +
> +       reloc[1].target_handle = src;
> +       reloc[1].delta = 0;
> +       reloc[1].offset = 7 * sizeof(batch[0]);
> +       if (gen >= 8)
> +               reloc[1].offset += sizeof(batch[0]);
> +       reloc[1].presumed_offset = 0;
> +       reloc[1].read_domains = I915_GEM_DOMAIN_RENDER;
> +       reloc[1].write_domain = 0;
> +
> +       memset(obj, 0, sizeof(obj));
> +       exec.buffer_count = 0;
> +       obj[exec.buffer_count++].handle = dst;
> +       if (src != dst)
> +               obj[exec.buffer_count++].handle = src;
> +       obj[exec.buffer_count].handle = handle;
> +       obj[exec.buffer_count].relocation_count = 2;
> +       obj[exec.buffer_count].relocs_ptr = (uintptr_t)reloc;
> +       exec.buffer_count++;
> +       exec.buffers_ptr = (uintptr_t)obj;
> +
> +       exec.batch_start_offset = 0;
> +       exec.batch_len = i * 4;
> +       exec.DR1 = exec.DR4 = 0;
> +       exec.num_cliprects = 0;
> +       exec.cliprects_ptr = 0;
> +       exec.flags = HAS_BLT_RING(intel_get_drm_devid(fd)) ? I915_EXEC_BLT : 0;
> +       i915_execbuffer2_set_context_id(exec, 0);
> +       exec.rsvd2 = 0;
> +
> +       gem_execbuf(fd, &exec);
> +
> +       gem_sync(fd, handle);
> +       gem_close(fd, handle);
> +}
> +
> +static bool area_ok(uint32_t *p, const int size, const uint32_t sval)
> +{
> +       int i;
> +
> +       for (i = 0; i < size; i++)
> +               if (p[i] != i + sval)
> +                       return false;
> +
> +       return true;
> +}
> +
> +static void
> +_test_destination_align(int fd,
> +                       const uint32_t dst_align, const uint32_t src_align,
> +                       const uint32_t w, const uint32_t h)
> +{
> +       const uint32_t size = sizeof(linear) / 4;
> +       const uint32_t guard_val = 0xdeadf00d;
> +       uint32_t *p;
> +       uint32_t h_dst;
> +       uint32_t h_src;
> +       int i;
> +       const int dwords = w * h;
> +
> +       igt_assert(dwords < size);
> +       p = linear;
> +
> +       h_src = gem_create(fd, size * 4);
> +       igt_assert(h_src != 0);
> +
> +       for (i = 0; i < size; i++)
> +               p[i] = i;
> +
> +       gem_write(fd, h_src, 0, p, size * 4);
> +       gem_read(fd, h_src, 0, p, size * 4);
> +
> +       igt_assert(area_ok(p, size, 0));
> +
> +       h_dst = gem_create(fd, size * 4);
> +       igt_assert(h_dst != 0);
> +
> +       for (i = 0; i < size; i++)
> +               p[i] = guard_val + i;
> +
> +       gem_write(fd, h_dst, 0, p, size * 4);
> +       gem_read(fd, h_dst, 0, p, size * 4);
> +
> +       igt_assert(area_ok(p, size, guard_val));
> +
> +       copy_align(fd, h_dst, dst_align, h_src, src_align, w, h);
> +       gem_read(fd, h_dst, 0, p, size * 4);
> +
> +       igt_assert(area_ok(p, dst_align, guard_val));
> +       igt_assert(area_ok(p + dst_align, dwords, src_align));
> +       igt_assert(area_ok(p + dwords + dst_align,
> +                          size - dwords - dst_align,
> +                          guard_val + dwords + dst_align));
> +
> +       gem_close(fd, h_src);
> +       gem_close(fd, h_dst);
> +}
> +
> +static void test_destination_align(int fd,
> +                                  int dst_align, int src_align,
> +                                  int max_w, int max_h)
> +{
> +       int i, j, w, h;
> +
> +       for (i = 0; i <= src_align; i++)
> +               for (j = 0; j <= dst_align; j++)
> +                       for (h = 1; h <= max_h; h ++)
> +                               for (w = 1; w <= max_w; w++)
> +                                       _test_destination_align(fd, j, i, w, h);
> +}
> +
> +igt_simple_main
> +{
> +       int fd = -1;
> +
> +       igt_skip_on_simulation();
> +
> +       igt_fixture {
> +               fd = drm_open_any();
> +               igt_assert(fd >= 0);
> +
> +               gen = intel_gen(intel_get_drm_devid(fd));
> +       }
> +
> +       test_destination_align(fd, 16, 16, 16, 16);
> +}
> diff --git a/tests/Makefile.sources b/tests/Makefile.sources
> index 967dc8f..acc32be 100644
> --- a/tests/Makefile.sources
> +++ b/tests/Makefile.sources
> @@ -119,6 +119,7 @@ TESTS_progs = \
>         gem_render_copy \
>         gem_render_linear_blits \
>         gem_render_tiled_blits \
> +       gem_blt_copy_align \
>         gem_ring_sync_copy \
>         gem_ring_sync_loop \
>         gem_multi_bsd_sync_loop \
> diff --git a/tests/gem_blt_copy_align.c b/tests/gem_blt_copy_align.c
> new file mode 100644
> index 0000000..de3ea21
> --- /dev/null
> +++ b/tests/gem_blt_copy_align.c
> @@ -0,0 +1,237 @@
> +/*
> + * Copyright © 2014 Intel Corporation
> + *
> + * Permission is hereby granted, free of charge, to any person obtaining a
> + * copy of this software and associated documentation files (the "Software"),
> + * to deal in the Software without restriction, including without limitation
> + * the rights to use, copy, modify, merge, publish, distribute, sublicense,
> + * and/or sell copies of the Software, and to permit persons to whom the
> + * Software is furnished to do so, subject to the following conditions:
> + *
> + * The above copyright notice and this permission notice (including the next
> + * paragraph) shall be included in all copies or substantial portions of the
> + * Software.
> + *
> + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
> + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
> + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
> + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
> + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
> + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
> + * IN THE SOFTWARE.
> + *
> + * Authors:
> + *    Chris Wilson <chris at chris-wilson.co.uk>
> + *    Mika Kuoppala <mika.kuoppala at intel.com>
> + *
> + */
> +
> +#include <stdio.h>
> +#include <string.h>
> +#include <stdint.h>
> +#include "i915_drm.h"
> +#include "intel_chipset.h"
> +#include "intel_reg.h"
> +#include "ioctl_wrappers.h"
> +#include "drm.h"
> +#include "drmtest.h"
> +
> +static int gen = 0;
> +
> +#define WIDTH 32
> +#define HEIGHT 32
> +
> +static uint32_t linear[WIDTH * HEIGHT];
> +
> +static void
> +copy_align(int fd,
> +          uint32_t dst, uint32_t dst_offset,
> +          uint32_t src, uint32_t src_offset,
> +          uint32_t w, uint32_t h)
> +{
> +       uint32_t batch[12];
> +       struct drm_i915_gem_relocation_entry reloc[2];
> +       struct drm_i915_gem_exec_object2 obj[3];
> +       struct drm_i915_gem_execbuffer2 exec;
> +       uint32_t handle;
> +       int i=0;
> +
> +       batch[i++] = XY_SRC_COPY_BLT_CMD |
> +               XY_SRC_COPY_BLT_WRITE_ALPHA |
> +               XY_SRC_COPY_BLT_WRITE_RGB;
> +       if (gen >= 8)
> +               batch[i - 1] |= 8;
> +       else
> +               batch[i - 1] |= 6;
> +
> +       batch[i++] = (3 << 24) | /* 32 bits */
> +               (0xcc << 16) | /* copy ROP */
> +               w * 4;
> +
> +       /* The >= gen8 blitter needs to have dst/src base
> +        * addresses aligned to 4k. So we need to handle the
> +        * offsets with with dst/src coordinates */
> +
> +       batch[i++] = dst_offset; /* dst, x1,y2 */
> +       batch[i++] = ((h) << 16) | (w + dst_offset); /* dst x2,y2 */
> +       batch[i++] = 0;
> +       if (gen >= 8)
> +               batch[i++] = 0;
> +       batch[i++] = src_offset; /* src x1,y1 */
> +       batch[i++] = w * 4;
> +
> +#if 0
> +       /* Bspec says this should be aligned to quad with gen8 but it doesn't
> +          seem to matter on */
> +       if (gen >= 8 && (w * 4) % 8)
> +               igt_warn("src pitch NOT aligned to quad\n");
> +#endif
> +
> +       batch[i++] = 0;
> +       if (gen >= 8)
> +               batch[i++] = 0;
> +
> +       batch[i++] = MI_BATCH_BUFFER_END;
> +       batch[i++] = MI_NOOP;
> +
> +       handle = gem_create(fd, 4096);
> +       gem_write(fd, handle, 0, batch, sizeof(batch));
> +
> +       reloc[0].target_handle = dst;
> +       reloc[0].delta = 0;
> +       reloc[0].offset = 4 * sizeof(batch[0]);
> +       reloc[0].presumed_offset = 0;
> +       reloc[0].read_domains = I915_GEM_DOMAIN_RENDER;
> +       reloc[0].write_domain = I915_GEM_DOMAIN_RENDER;
> +
> +       reloc[1].target_handle = src;
> +       reloc[1].delta = 0;
> +       reloc[1].offset = 7 * sizeof(batch[0]);
> +       if (gen >= 8)
> +               reloc[1].offset += sizeof(batch[0]);
> +       reloc[1].presumed_offset = 0;
> +       reloc[1].read_domains = I915_GEM_DOMAIN_RENDER;
> +       reloc[1].write_domain = 0;
> +
> +       memset(obj, 0, sizeof(obj));
> +       exec.buffer_count = 0;
> +       obj[exec.buffer_count++].handle = dst;
> +       if (src != dst)
> +               obj[exec.buffer_count++].handle = src;
> +       obj[exec.buffer_count].handle = handle;
> +       obj[exec.buffer_count].relocation_count = 2;
> +       obj[exec.buffer_count].relocs_ptr = (uintptr_t)reloc;
> +       exec.buffer_count++;
> +       exec.buffers_ptr = (uintptr_t)obj;
> +
> +       exec.batch_start_offset = 0;
> +       exec.batch_len = i * 4;
> +       exec.DR1 = exec.DR4 = 0;
> +       exec.num_cliprects = 0;
> +       exec.cliprects_ptr = 0;
> +       exec.flags = HAS_BLT_RING(intel_get_drm_devid(fd)) ? I915_EXEC_BLT : 0;
> +       i915_execbuffer2_set_context_id(exec, 0);
> +       exec.rsvd2 = 0;
> +
> +       gem_execbuf(fd, &exec);
> +
> +       gem_sync(fd, handle);
> +       gem_close(fd, handle);
> +}
> +
> +static bool area_ok(uint32_t *p, const int start,
> +                   const int size, const uint32_t sval)
> +{
> +       int i;
> +
> +       for (i = start; i < start + size; i++)
> +               if (p[i] != i - start + sval) {
> +                       igt_info("%d: 0x%08x differs from assumed 0x%08x\n",
> +                                i, p[i], i + sval);
> +                       return false;
> +               }
> +
> +       return true;
> +}
> +
> +static void
> +_test_destination_align(int fd,
> +                       const uint32_t dst_align, const uint32_t src_align,
> +                       const uint32_t w, const uint32_t h)
> +{
> +       const uint32_t size = sizeof(linear) / 4;
> +       const uint32_t guard_val = 0xdeadf00d;
> +       const int copy_len = h * w;
> +       const int src_len = copy_len + src_align;
> +       const int dst_tail = 2 * 16 + 3;
> +       const int dst_total = dst_align + src_len + dst_tail;
> +       uint32_t *p;
> +       uint32_t h_dst;
> +       uint32_t h_src;
> +       int i;
> +
> +       igt_assert(src_len < size);
> +       p = linear;
> +
> +       h_src = gem_create(fd, src_len * 4);
> +       igt_assert(h_src != 0);
> +
> +       for (i = 0; i < src_len; i++)
> +               p[i] = i;
> +
> +       gem_write(fd, h_src, 0, p, src_len * 4);
> +       gem_read(fd, h_src, 0, p, src_len * 4);
> +       igt_assert(area_ok(p, 0, src_len, 0));
> +
> +       h_dst = gem_create(fd, dst_total * 4);
> +       igt_assert(h_dst != 0);
> +
> +       for (i = 0; i < dst_total; i++)
> +               p[i] = guard_val + i;
> +
> +       gem_write(fd, h_dst, 0, p, dst_total * 4);
> +       gem_read(fd, h_dst, 0, p, dst_total * 4);
> +
> +       igt_assert(area_ok(p, 0, dst_total, guard_val));
> +
> +       copy_align(fd, h_dst, dst_align, h_src, src_align, w, h);
> +       gem_read(fd, h_dst, 0, p, dst_total * 4);
> +
> +       igt_assert(area_ok(p, 0, dst_align, guard_val));
> +       igt_assert(area_ok(p, dst_align, copy_len, src_align));
> +       igt_assert(area_ok(p, copy_len + dst_align,
> +                          dst_total - copy_len - dst_align,
> +                          guard_val + copy_len + dst_align));
> +
> +       gem_close(fd, h_src);
> +       gem_close(fd, h_dst);
> +}
> +
> +static void test_destination_align(int fd,
> +                                  int dst_align, int src_align,
> +                                  int max_w, int max_h)
> +{
> +       int i, j, w, h;
> +
> +       for (i = 0; i <= src_align; i++)
> +               for (j = 0; j <= dst_align; j++)
> +                       for (h = 1; h <= max_h; h ++)
> +                               for (w = 1; w <= max_w; w++)
> +                                       _test_destination_align(fd, j, i, w, h);
> +}
> +
> +igt_simple_main
> +{
> +       int fd = -1;
> +
> +       igt_skip_on_simulation();
> +
> +       igt_fixture {
> +               fd = drm_open_any();
> +               igt_assert(fd >= 0);
> +
> +               gen = intel_gen(intel_get_drm_devid(fd));
> +       }
> +
> +       test_destination_align(fd, 17, 17, 17, 17);
> +}
> --
> 1.9.1