[Intel-gfx] [PATCH i-g-t] test/gem_mocs_settings: Testing MOCS register settings
Peter Antoine
peter.antoine at intel.com
Mon Apr 4 13:43:08 UTC 2016
The MOCS registers were added in Gen9 and define the caching policy.
The registers are split into two sets. The first set controls the
EDRAM policy and have a set for each engine, the second set controls
the L3 policy. The two sets use the same index.
The RCS registers and the L3CC registers are stored in the RCS context.
The test checks that the registers are correct by checking the values by
directly reading them via MMIO, then again it tests them by reading them
from within a batch buffer. RCS engine is tested last as it programs the
registers via a batch buffer and this will invalidate the test for
workloads that don't use the render ring or don't run a render batch
first.
Signed-off-by: Peter Antoine <peter.antoine at intel.com>
---
tests/Makefile.sources | 1 +
tests/gem_mocs_settings.c | 408 ++++++++++++++++++++++++++++++++++++++++++++++
2 files changed, 409 insertions(+)
create mode 100644 tests/gem_mocs_settings.c
diff --git a/tests/Makefile.sources b/tests/Makefile.sources
index 43f232f..d483c9e 100644
--- a/tests/Makefile.sources
+++ b/tests/Makefile.sources
@@ -148,6 +148,7 @@ TESTS_progs = \
gem_lut_handle \
gem_mmap_offset_exhaustion \
gem_media_fill \
+ gem_mocs_settings \
gem_gpgpu_fill \
gem_pin \
gem_reg_read \
diff --git a/tests/gem_mocs_settings.c b/tests/gem_mocs_settings.c
new file mode 100644
index 0000000..7db64c1
--- /dev/null
+++ b/tests/gem_mocs_settings.c
@@ -0,0 +1,408 @@
+/*
+ * Copyright © 2016 Intel Corporation
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice (including the next
+ * paragraph) shall be included in all copies or substantial portions of the
+ * Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
+ * IN THE SOFTWARE.
+ *
+ */
+
+/** @file gem_mocs_settings.c
+ *
+ * Check that the MOCs cache settings are valid.
+ */
+
+#include "igt.h"
+#include "igt_gt.h"
+
+#define MAX_NUMBER_MOCS_REGISTERS (64)
+
+enum {
+ NONE,
+ RESET,
+ SUSPEND,
+ HIBERNATE
+};
+
+#define GEN9_LNCFCMOCS0 (0xB020) /* L3 Cache Control base */
+#define GEN9_GFX_MOCS_0 (0xc800) /* Graphics MOCS base register*/
+#define GEN9_MFX0_MOCS_0 (0xc900) /* Media 0 MOCS base register*/
+#define GEN9_MFX1_MOCS_0 (0xcA00) /* Media 1 MOCS base register*/
+#define GEN9_VEBOX_MOCS_0 (0xcB00) /* Video MOCS base register*/
+#define GEN9_BLT_MOCS_0 (0xcc00) /* Blitter MOCS base register*/
+
+#define ENGINE_GFX (I915_EXEC_RENDER)
+#define ENGINE_MFX0 (I915_EXEC_BSD)
+#define ENGINE_MFX0_ALT (I915_EXEC_BSD | 1 << 13)
+#define ENGINE_MFX1 (I915_EXEC_BSD | 2 << 13)
+#define ENGINE_BLT (I915_EXEC_BLT)
+#define ENGINE_VEBOX (I915_EXEC_VEBOX)
+
+struct mocs_entry {
+ uint32_t control_value;
+ uint16_t l3cc_value;
+};
+
+struct mocs_table {
+ uint32_t size;
+ const struct mocs_entry *table;
+};
+
+static const struct mocs_entry skylake_mocs_table[] = {
+ { 0x00000009, 0x0010 },
+ { 0x00000038, 0x0030 },
+ { 0x0000003b, 0x0030 },
+};
+
+static const struct mocs_entry broxton_mocs_table[] = {
+ { 0x00000009, 0x0010 },
+ { 0x00000038, 0x0030 },
+ { 0x0000003b, 0x0030 },
+};
+
+static bool get_mocs_settings(uint32_t devid, struct mocs_table *table)
+{
+ bool result = false;
+
+ if (IS_SKYLAKE(devid) || IS_KABYLAKE(devid)) {
+ table->size = ARRAY_SIZE(skylake_mocs_table);
+ table->table = skylake_mocs_table;
+ result = true;
+ } else if (IS_BROXTON(devid)) {
+ table->size = ARRAY_SIZE(broxton_mocs_table);
+ table->table = broxton_mocs_table;
+ result = true;
+ }
+
+ return result;
+}
+
+static uint32_t get_engine_base(uint32_t engine)
+{
+ uint32_t result = 0;
+
+ switch(engine) {
+ case ENGINE_MFX0:
+ case ENGINE_MFX0_ALT: result = GEN9_MFX0_MOCS_0; break;
+ case ENGINE_GFX: result = GEN9_GFX_MOCS_0; break;
+ case ENGINE_MFX1: result = GEN9_MFX1_MOCS_0; break;
+ case ENGINE_BLT: result = GEN9_BLT_MOCS_0; break;
+ case ENGINE_VEBOX: result = GEN9_VEBOX_MOCS_0; break;
+ default:
+ igt_fail(-1);
+ }
+
+ return result;
+}
+
+static uint32_t get_mocs_register_value(int fd, uint64_t offset, uint32_t index)
+{
+ uint32_t regid = offset + (index * 4);
+
+ igt_assert(index < MAX_NUMBER_MOCS_REGISTERS);
+
+ return intel_register_read(regid);
+}
+
+static void test_mocs_control_values(int fd, uint32_t engine)
+{
+ int i;
+ uint32_t devid = intel_get_drm_devid(fd);
+ uint32_t engine_base = get_engine_base(engine);
+ struct mocs_table table;
+
+ igt_assert(get_mocs_settings(devid, &table));
+
+ for (i = 0; i < table.size; i++)
+ igt_assert_eq(get_mocs_register_value(fd, engine_base, i),
+ table.table[i].control_value);
+}
+
+static void test_mocs_l3cc_values(int fd)
+{
+ int i;
+ uint32_t reg_values[MAX_NUMBER_MOCS_REGISTERS/2];
+ struct mocs_table table;
+
+ for (i = 0; i < MAX_NUMBER_MOCS_REGISTERS / 2; i++)
+ reg_values[i] = intel_register_read(GEN9_LNCFCMOCS0 + (i * 4));
+
+ igt_assert(get_mocs_settings(intel_get_drm_devid(fd), &table));
+
+ for (i = 0; i < table.size / 2; i++) {
+ igt_assert_eq((reg_values[i] & 0xffff),
+ table.table[i * 2].l3cc_value);
+ igt_assert_eq((reg_values[i] >> 16),
+ table.table[i * 2 + 1].l3cc_value);
+ }
+
+ if (table.size & 1)
+ igt_assert_eq((reg_values[i] & 0xffff),
+ table.table[i * 2].l3cc_value);
+}
+
+static void test_mocs_values(int fd)
+{
+ const struct intel_execution_engine *e;
+
+ for (e = intel_execution_engines; e->name; e++)
+ if (e->exec_id != I915_EXEC_DEFAULT &&
+ gem_has_ring(fd, e->exec_id | e->flags))
+ test_mocs_control_values(fd, e->exec_id | e->flags);
+
+ test_mocs_l3cc_values(fd);
+}
+
+#define MI_STORE_REGISTER_MEM_64_BIT_ADDR ((0x24 << 23) | 2)
+
+static int create_read_batch(struct drm_i915_gem_relocation_entry *reloc,
+ uint32_t *batch,
+ uint32_t dst_handle,
+ uint32_t size,
+ uint32_t reg_base)
+{
+ unsigned int index;
+ unsigned int offset = 0;
+
+ for (index = 0, offset = 0; index < size; index++, offset += 4)
+ {
+ batch[offset] = MI_STORE_REGISTER_MEM_64_BIT_ADDR;
+ batch[offset+1] = reg_base + (index * sizeof(uint32_t));
+ batch[offset+2] = index * sizeof(uint32_t); /* reloc */
+ batch[offset+3] = 0;
+
+ reloc[index].offset = (offset + 2) * sizeof(uint32_t);
+ reloc[index].delta = index * sizeof(uint32_t);
+ reloc[index].target_handle = dst_handle;
+ }
+
+ batch[offset++] = MI_BATCH_BUFFER_END;
+ batch[offset++] = 0;
+
+ return offset * sizeof(uint32_t);
+}
+
+static void do_read_registers(int fd,
+ uint32_t ctx_id,
+ uint32_t dst_handle,
+ uint32_t reg_base,
+ uint32_t size,
+ uint32_t engine_id)
+{
+ struct drm_i915_gem_execbuffer2 execbuf;
+ struct drm_i915_gem_exec_object2 gem_exec[2];
+ struct drm_i915_gem_relocation_entry reloc[MAX_NUMBER_MOCS_REGISTERS];
+ uint32_t batch[MAX_NUMBER_MOCS_REGISTERS * 4 + 4];
+ uint32_t handle = gem_create(fd, 4096);
+
+ memset(reloc, 0, sizeof(reloc));
+
+ memset(&gem_exec, 0, sizeof(gem_exec));
+ gem_exec[0].handle = dst_handle;
+ gem_set_domain(fd, dst_handle, I915_GEM_DOMAIN_CPU, 0);
+
+ gem_exec[1].handle = handle;
+ gem_exec[1].relocation_count = size;
+ gem_exec[1].relocs_ptr = (uintptr_t) reloc;
+
+ memset(&execbuf, 0, sizeof(execbuf));
+ execbuf.buffers_ptr = (uintptr_t)gem_exec;
+ execbuf.buffer_count = 2;
+
+ execbuf.batch_len = create_read_batch(reloc,
+ batch,
+ dst_handle,
+ size,
+ reg_base);
+
+ gem_write(fd, handle, 0, batch, execbuf.batch_len);
+
+ if (ctx_id != 0)
+ i915_execbuffer2_set_context_id(execbuf, ctx_id);
+
+ execbuf.flags = I915_EXEC_SECURE | engine_id;
+
+ gem_execbuf(fd, &execbuf);
+ gem_sync(fd, handle);
+
+ gem_close(fd, handle);
+}
+
+static void check_control_registers(int fd,
+ const struct intel_execution_engine *engine,
+ uint32_t ctx_id,
+ bool use_default)
+{
+ uint32_t dst_handle = gem_create(fd, 4096);
+ uint32_t reg_base = get_engine_base(engine->exec_id | engine->flags);
+ uint32_t *read_regs;
+ struct mocs_table table;
+ igt_assert(get_mocs_settings(intel_get_drm_devid(fd), &table));
+
+ if (reg_base == GEN9_GFX_MOCS_0 && !use_default)
+ do_read_registers(fd,
+ ctx_id,
+ dst_handle,
+ reg_base,
+ table.size,
+ engine->exec_id | engine->flags);
+ else
+ do_read_registers(fd,
+ 0,
+ dst_handle,
+ reg_base,
+ table.size,
+ engine->exec_id | engine->flags);
+
+ read_regs = gem_mmap__gtt(fd, dst_handle, 4096, PROT_READ);
+
+ for (int index = 0; index < table.size; index++)
+ igt_assert_eq(read_regs[index],
+ table.table[index].control_value);
+
+ gem_close(fd, dst_handle);
+}
+
+static void check_l3cc_registers(int fd,
+ const struct intel_execution_engine *engine,
+ uint32_t ctx_id,
+ bool use_default)
+{
+ struct mocs_table table;
+ uint32_t dst_handle = gem_create(fd, 4096);
+ uint32_t *read_regs;
+ int index;
+
+ igt_assert(get_mocs_settings(intel_get_drm_devid(fd), &table));
+
+ if (use_default)
+ do_read_registers(fd,
+ 0,
+ dst_handle,
+ GEN9_LNCFCMOCS0,
+ (table.size + 1) / 2,
+ engine->exec_id | engine->flags);
+ else
+ do_read_registers(fd,
+ ctx_id,
+ dst_handle,
+ GEN9_LNCFCMOCS0,
+ (table.size + 1) / 2,
+ engine->exec_id | engine->flags);
+
+ read_regs = gem_mmap__gtt(fd, dst_handle, 4096, PROT_READ);
+
+ for (index = 0; index < table.size / 2; index++) {
+ igt_assert_eq(read_regs[index] & 0xffff,
+ table.table[index * 2].l3cc_value);
+ igt_assert_eq(read_regs[index] >> 16,
+ table.table[index * 2 + 1].l3cc_value);
+ }
+
+ if (table.size & 0x01)
+ igt_assert_eq(read_regs[index] & 0xffff,
+ table.table[index * 2].l3cc_value);
+
+ gem_close(fd, dst_handle);
+}
+
+static void test_context_mocs_values(int fd,
+ const struct intel_execution_engine *engine,
+ bool use_default)
+{
+ uint32_t ctx_id = 0;
+
+ igt_info("Testing Engine: %s%s\n",
+ engine->name,
+ use_default ? " (default context)" : "");
+
+ if (!use_default)
+ ctx_id = gem_context_create(fd);
+
+ check_control_registers(fd, engine, ctx_id, use_default);
+ check_l3cc_registers(fd, engine, ctx_id, use_default);
+
+ if (!use_default)
+ gem_context_destroy(fd, ctx_id);
+}
+
+static void run_test(int fd, unsigned mode)
+{
+ const int gen = intel_gen(intel_get_drm_devid(fd));
+ const struct intel_execution_engine *e;
+
+ igt_require(gen >= 9);
+
+ test_mocs_values(fd);
+
+ switch(mode) {
+ case NONE: break;
+ case RESET: igt_force_gpu_reset(); break;
+ case SUSPEND: igt_system_suspend_autoresume(); break;
+ case HIBERNATE: igt_system_hibernate_autoresume(); break;
+ };
+
+ /*
+ * Do render after other engines as older versions of code will
+ * cause the RCS context to program the registers and the test
+ * becomes invalid
+ */
+ for (e = intel_execution_engines; e->name; e++)
+ if (e->exec_id != I915_EXEC_DEFAULT &&
+ e->exec_id != I915_EXEC_RENDER &&
+ gem_has_ring(fd, e->exec_id | e->flags))
+ test_context_mocs_values(fd, e, true);
+
+ for (e = intel_execution_engines; e->name; e++)
+ if (e->exec_id == I915_EXEC_RENDER &&
+ gem_has_ring(fd, e->exec_id | e->flags)) {
+ test_context_mocs_values(fd, e, true);
+ test_context_mocs_values(fd, e, false);
+ }
+
+ test_mocs_values(fd);
+}
+
+igt_main
+{
+ int fd;
+ struct pci_device *pci_dev;
+
+ igt_fixture {
+ fd = drm_open_driver_master(DRIVER_INTEL);
+ pci_dev = intel_get_pci_device();
+ igt_require(pci_dev);
+
+ intel_register_access_init(pci_dev, 0);
+ }
+
+ igt_subtest("mocs-settings")
+ run_test(fd, NONE);
+
+ igt_subtest("mocs-reset")
+ run_test(fd, RESET);
+
+ igt_subtest("mocs-suspend")
+ run_test(fd, SUSPEND);
+
+ igt_subtest("mocs-hibernate")
+ run_test(fd, HIBERNATE);
+
+ igt_fixture
+ close(fd);
+}
--
1.9.1
More information about the Intel-gfx
mailing list