[Mesa-dev] [PATCH 24/33] anv: Add initial blorp support
Pohjolainen, Topi
topi.pohjolainen at gmail.com
Sat Sep 3 17:46:52 UTC 2016
On Wed, Aug 31, 2016 at 02:22:43PM -0700, Jason Ekstrand wrote:
> ---
> src/intel/vulkan/Makefile.am | 1 +
> src/intel/vulkan/Makefile.sources | 5 +
> src/intel/vulkan/anv_blorp.c | 120 +++++++++++++++++
> src/intel/vulkan/anv_device.c | 4 +
> src/intel/vulkan/anv_genX.h | 3 +
> src/intel/vulkan/anv_private.h | 6 +
> src/intel/vulkan/genX_blorp_exec.c | 259 +++++++++++++++++++++++++++++++++++++
> 7 files changed, 398 insertions(+)
> create mode 100644 src/intel/vulkan/anv_blorp.c
> create mode 100644 src/intel/vulkan/genX_blorp_exec.c
I couldn't see anything obvious in any of the hooks and if you were missing
a hook entirely it shouldn't even compile:
Reviewed-by: Topi Pohjolainen <topi.pohjolainen at intel.com>
>
> diff --git a/src/intel/vulkan/Makefile.am b/src/intel/vulkan/Makefile.am
> index 2d20de9..03c863a 100644
> --- a/src/intel/vulkan/Makefile.am
> +++ b/src/intel/vulkan/Makefile.am
> @@ -119,6 +119,7 @@ VULKAN_LIB_DEPS += \
> $(top_builddir)/src/util/libmesautil.la \
> $(top_builddir)/src/intel/common/libintel_common.la \
> $(top_builddir)/src/intel/isl/libisl.la \
> + $(top_builddir)/src/intel/blorp/libblorp.la \
> $(PER_GEN_LIBS) \
> $(PTHREAD_LIBS) \
> $(DLOPEN_LIBS) \
> diff --git a/src/intel/vulkan/Makefile.sources b/src/intel/vulkan/Makefile.sources
> index 8b4b97f..e384235 100644
> --- a/src/intel/vulkan/Makefile.sources
> +++ b/src/intel/vulkan/Makefile.sources
> @@ -22,6 +22,7 @@
> VULKAN_FILES := \
> anv_allocator.c \
> anv_batch_chain.c \
> + anv_blorp.c \
> anv_cmd_buffer.c \
> anv_descriptor_set.c \
> anv_device.c \
> @@ -73,6 +74,7 @@ VULKAN_GENERATED_FILES := \
>
> GEN7_FILES := \
> genX_cmd_buffer.c \
> + genX_blorp_exec.c \
> genX_pipeline.c \
> gen7_cmd_buffer.c \
> gen7_pipeline.c \
> @@ -80,6 +82,7 @@ GEN7_FILES := \
>
> GEN75_FILES := \
> genX_cmd_buffer.c \
> + genX_blorp_exec.c \
> genX_pipeline.c \
> gen7_cmd_buffer.c \
> gen7_pipeline.c \
> @@ -87,6 +90,7 @@ GEN75_FILES := \
>
> GEN8_FILES := \
> genX_cmd_buffer.c \
> + genX_blorp_exec.c \
> genX_pipeline.c \
> gen8_cmd_buffer.c \
> gen8_pipeline.c \
> @@ -94,6 +98,7 @@ GEN8_FILES := \
>
> GEN9_FILES := \
> genX_cmd_buffer.c \
> + genX_blorp_exec.c \
> genX_pipeline.c \
> gen8_cmd_buffer.c \
> gen8_pipeline.c \
> diff --git a/src/intel/vulkan/anv_blorp.c b/src/intel/vulkan/anv_blorp.c
> new file mode 100644
> index 0000000..d047bcd
> --- /dev/null
> +++ b/src/intel/vulkan/anv_blorp.c
> @@ -0,0 +1,120 @@
> +/*
> + * Copyright © 2016 Intel Corporation
> + *
> + * Permission is hereby granted, free of charge, to any person obtaining a
> + * copy of this software and associated documentation files (the "Software"),
> + * to deal in the Software without restriction, including without limitation
> + * the rights to use, copy, modify, merge, publish, distribute, sublicense,
> + * and/or sell copies of the Software, and to permit persons to whom the
> + * Software is furnished to do so, subject to the following conditions:
> + *
> + * The above copyright notice and this permission notice (including the next
> + * paragraph) shall be included in all copies or substantial portions of the
> + * Software.
> + *
> + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
> + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
> + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
> + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
> + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
> + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
> + * IN THE SOFTWARE.
> + */
> +
> +#include "anv_private.h"
> +
> +static bool
> +lookup_blorp_shader(struct blorp_context *blorp,
> + const void *key, uint32_t key_size,
> + uint32_t *kernel_out, void *prog_data_out)
> +{
> + struct anv_device *device = blorp->driver_ctx;
> +
> + /* The blorp cache must be a real cache */
> + assert(device->blorp_shader_cache.cache);
> +
> + struct anv_shader_bin *bin =
> + anv_pipeline_cache_search(&device->blorp_shader_cache, key, key_size);
> + if (!bin)
> + return false;
> +
> + /* The cache already has a reference and it's not going anywhere so there
> + * is no need to hold a second reference.
> + */
> + anv_shader_bin_unref(device, bin);
> +
> + *kernel_out = bin->kernel.offset;
> + *(const struct brw_stage_prog_data **)prog_data_out =
> + anv_shader_bin_get_prog_data(bin);
> +
> + return true;
> +}
> +
> +static void
> +upload_blorp_shader(struct blorp_context *blorp,
> + const void *key, uint32_t key_size,
> + const void *kernel, uint32_t kernel_size,
> + const void *prog_data, uint32_t prog_data_size,
> + uint32_t *kernel_out, void *prog_data_out)
> +{
> + struct anv_device *device = blorp->driver_ctx;
> +
> + /* The blorp cache must be a real cache */
> + assert(device->blorp_shader_cache.cache);
> +
> + struct anv_pipeline_bind_map bind_map = {
> + .surface_count = 0,
> + .sampler_count = 0,
> + };
> +
> + struct anv_shader_bin *bin =
> + anv_pipeline_cache_upload_kernel(&device->blorp_shader_cache,
> + key, key_size, kernel, kernel_size,
> + prog_data, prog_data_size, &bind_map);
> +
> + /* The cache already has a reference and it's not going anywhere so there
> + * is no need to hold a second reference.
> + */
> + anv_shader_bin_unref(device, bin);
> +
> + *kernel_out = bin->kernel.offset;
> + *(const struct brw_stage_prog_data **)prog_data_out =
> + anv_shader_bin_get_prog_data(bin);
> +}
> +
> +void
> +anv_device_init_blorp(struct anv_device *device)
> +{
> + anv_pipeline_cache_init(&device->blorp_shader_cache, device, true);
> + blorp_init(&device->blorp, device, &device->isl_dev);
> + device->blorp.compiler = device->instance->physicalDevice.compiler;
> + device->blorp.mocs.tex = device->default_mocs;
> + device->blorp.mocs.rb = device->default_mocs;
> + device->blorp.mocs.vb = device->default_mocs;
> + device->blorp.lookup_shader = lookup_blorp_shader;
> + device->blorp.upload_shader = upload_blorp_shader;
> + switch (device->info.gen) {
> + case 7:
> + if (device->info.is_haswell) {
> + device->blorp.exec = gen75_blorp_exec;
> + } else {
> + device->blorp.exec = gen7_blorp_exec;
> + }
> + break;
> + case 8:
> + device->blorp.exec = gen8_blorp_exec;
> + break;
> + case 9:
> + device->blorp.exec = gen9_blorp_exec;
> + break;
> + default:
> + unreachable("Unknown hardware generation");
> + }
> +}
> +
> +void
> +anv_device_finish_blorp(struct anv_device *device)
> +{
> + blorp_finish(&device->blorp);
> + anv_pipeline_cache_finish(&device->blorp_shader_cache);
> +}
> diff --git a/src/intel/vulkan/anv_device.c b/src/intel/vulkan/anv_device.c
> index 7317493..e66f812 100644
> --- a/src/intel/vulkan/anv_device.c
> +++ b/src/intel/vulkan/anv_device.c
> @@ -918,6 +918,8 @@ VkResult anv_CreateDevice(
> if (result != VK_SUCCESS)
> goto fail_fd;
>
> + anv_device_init_blorp(device);
> +
> anv_device_init_border_colors(device);
>
> *pDevice = anv_device_to_handle(device);
> @@ -940,6 +942,8 @@ void anv_DestroyDevice(
>
> anv_queue_finish(&device->queue);
>
> + anv_device_finish_blorp(device);
> +
> anv_device_finish_meta(device);
>
> #ifdef HAVE_VALGRIND
> diff --git a/src/intel/vulkan/anv_genX.h b/src/intel/vulkan/anv_genX.h
> index ccf4357..02e79c2 100644
> --- a/src/intel/vulkan/anv_genX.h
> +++ b/src/intel/vulkan/anv_genX.h
> @@ -72,3 +72,6 @@ genX(compute_pipeline_create)(VkDevice _device,
> const VkComputePipelineCreateInfo *pCreateInfo,
> const VkAllocationCallbacks *alloc,
> VkPipeline *pPipeline);
> +
> +void genX(blorp_exec)(struct blorp_batch *batch,
> + const struct blorp_params *params);
> diff --git a/src/intel/vulkan/anv_private.h b/src/intel/vulkan/anv_private.h
> index 5ef81d9..816a081 100644
> --- a/src/intel/vulkan/anv_private.h
> +++ b/src/intel/vulkan/anv_private.h
> @@ -41,6 +41,7 @@
> #endif
>
> #include "common/gen_device_info.h"
> +#include "blorp/blorp.h"
> #include "brw_compiler.h"
> #include "util/macros.h"
> #include "util/list.h"
> @@ -709,6 +710,9 @@ struct anv_device {
>
> struct anv_meta_state meta_state;
>
> + struct anv_pipeline_cache blorp_shader_cache;
> + struct blorp_context blorp;
> +
> struct anv_state border_colors;
>
> struct anv_queue queue;
> @@ -722,6 +726,8 @@ struct anv_device {
>
> void anv_device_get_cache_uuid(void *uuid);
>
> +void anv_device_init_blorp(struct anv_device *device);
> +void anv_device_finish_blorp(struct anv_device *device);
>
> void* anv_gem_mmap(struct anv_device *device,
> uint32_t gem_handle, uint64_t offset, uint64_t size, uint32_t flags);
> diff --git a/src/intel/vulkan/genX_blorp_exec.c b/src/intel/vulkan/genX_blorp_exec.c
> new file mode 100644
> index 0000000..833b94a
> --- /dev/null
> +++ b/src/intel/vulkan/genX_blorp_exec.c
> @@ -0,0 +1,259 @@
> +/*
> + * Copyright © 2016 Intel Corporation
> + *
> + * Permission is hereby granted, free of charge, to any person obtaining a
> + * copy of this software and associated documentation files (the "Software"),
> + * to deal in the Software without restriction, including without limitation
> + * the rights to use, copy, modify, merge, publish, distribute, sublicense,
> + * and/or sell copies of the Software, and to permit persons to whom the
> + * Software is furnished to do so, subject to the following conditions:
> + *
> + * The above copyright notice and this permission notice (including the next
> + * paragraph) shall be included in all copies or substantial portions of the
> + * Software.
> + *
> + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
> + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
> + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
> + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
> + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
> + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
> + * IN THE SOFTWARE.
> + */
> +
> +#include <assert.h>
> +
> +#include "anv_private.h"
> +#include "genX_multisample.h"
> +
> +/* These are defined in anv_private.h and blorp_genX_exec.h */
> +#undef __gen_address_type
> +#undef __gen_user_data
> +#undef __gen_combine_address
> +
> +#include "common/gen_l3_config.h"
> +#include "blorp/blorp_genX_exec.h"
> +
> +static void *
> +blorp_emit_dwords(struct blorp_batch *batch, unsigned n)
> +{
> + struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
> + return anv_batch_emit_dwords(&cmd_buffer->batch, n);
> +}
> +
> +static uint64_t
> +blorp_emit_reloc(struct blorp_batch *batch,
> + void *location, struct blorp_address address, uint32_t delta)
> +{
> + struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
> + assert(cmd_buffer->batch.start <= location &&
> + location < cmd_buffer->batch.end);
> + return anv_batch_emit_reloc(&cmd_buffer->batch, location,
> + address.buffer, address.offset + delta);
> +}
> +
> +static void
> +blorp_surface_reloc(struct blorp_batch *batch, uint32_t ss_offset,
> + struct blorp_address address, uint32_t delta)
> +{
> + struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
> + anv_reloc_list_add(&cmd_buffer->surface_relocs, &cmd_buffer->pool->alloc,
> + ss_offset, address.buffer, address.offset + delta);
> +}
> +
> +static void *
> +blorp_alloc_dynamic_state(struct blorp_batch *batch,
> + enum aub_state_struct_type type,
> + uint32_t size,
> + uint32_t alignment,
> + uint32_t *offset)
> +{
> + struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
> +
> + struct anv_state state =
> + anv_cmd_buffer_alloc_dynamic_state(cmd_buffer, size, alignment);
> +
> + *offset = state.offset;
> + return state.map;
> +}
> +
> +static void
> +blorp_alloc_binding_table(struct blorp_batch *batch, unsigned num_entries,
> + unsigned state_size, unsigned state_alignment,
> + uint32_t *bt_offset,
> + uint32_t *surface_offsets, void **surface_maps)
> +{
> + struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
> +
> + uint32_t state_offset;
> + struct anv_state bt_state =
> + anv_cmd_buffer_alloc_binding_table(cmd_buffer, num_entries,
> + &state_offset);
> + if (bt_state.map == NULL) {
> + /* We ran out of space. Grab a new binding table block. */
> + VkResult result = anv_cmd_buffer_new_binding_table_block(cmd_buffer);
> + assert(result == VK_SUCCESS);
> +
> + /* Re-emit state base addresses so we get the new surface state base
> + * address before we start emitting binding tables etc.
> + */
> + anv_cmd_buffer_emit_state_base_address(cmd_buffer);
> +
> + bt_state = anv_cmd_buffer_alloc_binding_table(cmd_buffer, num_entries,
> + &state_offset);
> + assert(bt_state.map != NULL);
> + }
> +
> + uint32_t *bt_map = bt_state.map;
> + *bt_offset = bt_state.offset;
> +
> + for (unsigned i = 0; i < num_entries; i++) {
> + struct anv_state surface_state =
> + anv_cmd_buffer_alloc_surface_state(cmd_buffer);
> + bt_map[i] = surface_state.offset + state_offset;
> + surface_offsets[i] = surface_state.offset;
> + surface_maps[i] = surface_state.map;
> + }
> +}
> +
> +static void *
> +blorp_alloc_vertex_buffer(struct blorp_batch *batch, uint32_t size,
> + struct blorp_address *addr)
> +{
> + struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
> + struct anv_state vb_state =
> + anv_cmd_buffer_alloc_dynamic_state(cmd_buffer, size, 16);
> +
> + *addr = (struct blorp_address) {
> + .buffer = &cmd_buffer->device->dynamic_state_block_pool.bo,
> + .offset = vb_state.offset,
> + };
> +
> + return vb_state.map;
> +}
> +
> +static void
> +blorp_emit_urb_config(struct blorp_batch *batch, unsigned vs_entry_size)
> +{
> + struct anv_device *device = batch->blorp->driver_ctx;
> + struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
> +
> + genX(emit_urb_setup)(device, &cmd_buffer->batch,
> + VK_SHADER_STAGE_VERTEX_BIT |
> + VK_SHADER_STAGE_FRAGMENT_BIT,
> + vs_entry_size, 0,
> + cmd_buffer->state.current_l3_config);
> +}
> +
> +static void
> +blorp_emit_3dstate_multisample(struct blorp_batch *batch, unsigned samples)
> +{
> + blorp_emit(batch, GENX(3DSTATE_MULTISAMPLE), ms) {
> + ms.NumberofMultisamples = __builtin_ffs(samples) - 1;
> +
> +#if GEN_GEN >= 8
> + /* The PRM says that this bit is valid only for DX9:
> + *
> + * SW can choose to set this bit only for DX9 API. DX10/OGL API's
> + * should not have any effect by setting or not setting this bit.
> + */
> + ms.PixelPositionOffsetEnable = false;
> + ms.PixelLocation = CENTER;
> +#else
> + ms.PixelLocation = PIXLOC_CENTER;
> +
> + switch (samples) {
> + case 1:
> + SAMPLE_POS_1X(ms.Sample);
> + break;
> + case 2:
> + SAMPLE_POS_2X(ms.Sample);
> + break;
> + case 4:
> + SAMPLE_POS_4X(ms.Sample);
> + break;
> + case 8:
> + SAMPLE_POS_8X(ms.Sample);
> + break;
> + default:
> + break;
> + }
> +#endif
> + }
> +}
> +
> +void genX(blorp_exec)(struct blorp_batch *batch,
> + const struct blorp_params *params);
> +
> +void
> +genX(blorp_exec)(struct blorp_batch *batch,
> + const struct blorp_params *params)
> +{
> + struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
> +
> + if (!cmd_buffer->state.current_l3_config) {
> + const struct gen_l3_config *cfg =
> + gen_get_default_l3_config(&cmd_buffer->device->info);
> + genX(cmd_buffer_config_l3)(cmd_buffer, cfg);
> + }
> +
> + if (cmd_buffer->state.current_pipeline != _3D) {
> +#if GEN_GEN <= 7
> + /* From "BXML » GT » MI » vol1a GPU Overview » [Instruction]
> + * PIPELINE_SELECT [DevBWR+]":
> + *
> + * Project: DEVSNB+
> + *
> + * Software must ensure all the write caches are flushed through a
> + * stalling PIPE_CONTROL command followed by another PIPE_CONTROL
> + * command to invalidate read only caches prior to programming
> + * MI_PIPELINE_SELECT command to change the Pipeline Select Mode.
> + */
> + blorp_emit(batch, GENX(PIPE_CONTROL), pc) {
> + pc.RenderTargetCacheFlushEnable = true;
> + pc.DepthCacheFlushEnable = true;
> + pc.DCFlushEnable = true;
> + pc.PostSyncOperation = NoWrite;
> + pc.CommandStreamerStallEnable = true;
> + }
> +
> + blorp_emit(batch, GENX(PIPE_CONTROL), pc) {
> + pc.TextureCacheInvalidationEnable = true;
> + pc.ConstantCacheInvalidationEnable = true;
> + pc.StateCacheInvalidationEnable = true;
> + pc.InstructionCacheInvalidateEnable = true;
> + pc.PostSyncOperation = NoWrite;
> + }
> +#endif
> +
> + blorp_emit(batch, GENX(PIPELINE_SELECT), ps) {
> +#if GEN_GEN >= 9
> + ps.MaskBits = 3;
> +#endif
> + ps.PipelineSelection = _3D;
> + }
> +
> + cmd_buffer->state.current_pipeline = _3D;
> + }
> +
> + blorp_exec(batch, params);
> +
> + /* BLORP sets DRAWING_RECTANGLE but we always want it set to the maximum.
> + * Since we set it once at driver init and never again, we have to set it
> + * back after invoking blorp.
> + *
> + * TODO: BLORP should assume a max drawing rectangle
> + */
> + blorp_emit(batch, GENX(3DSTATE_DRAWING_RECTANGLE), rect) {
> + rect.ClippedDrawingRectangleYMin = 0;
> + rect.ClippedDrawingRectangleXMin = 0;
> + rect.ClippedDrawingRectangleYMax = UINT16_MAX;
> + rect.ClippedDrawingRectangleXMax = UINT16_MAX;
> + rect.DrawingRectangleOriginY = 0;
> + rect.DrawingRectangleOriginX = 0;
> + }
> +
> + cmd_buffer->state.vb_dirty = ~0;
> + cmd_buffer->state.dirty = ~0;
> + cmd_buffer->state.push_constants_dirty = ~0;
> +}
> --
> 2.5.0.400.gff86faf
>
> _______________________________________________
> mesa-dev mailing list
> mesa-dev at lists.freedesktop.org
> https://lists.freedesktop.org/mailman/listinfo/mesa-dev
More information about the mesa-dev
mailing list