[Mesa-dev] [PATCH 24/33] anv: Add initial blorp support

Pohjolainen, Topi topi.pohjolainen at gmail.com
Sat Sep 3 17:46:52 UTC 2016


On Wed, Aug 31, 2016 at 02:22:43PM -0700, Jason Ekstrand wrote:
> ---
>  src/intel/vulkan/Makefile.am       |   1 +
>  src/intel/vulkan/Makefile.sources  |   5 +
>  src/intel/vulkan/anv_blorp.c       | 120 +++++++++++++++++
>  src/intel/vulkan/anv_device.c      |   4 +
>  src/intel/vulkan/anv_genX.h        |   3 +
>  src/intel/vulkan/anv_private.h     |   6 +
>  src/intel/vulkan/genX_blorp_exec.c | 259 +++++++++++++++++++++++++++++++++++++
>  7 files changed, 398 insertions(+)
>  create mode 100644 src/intel/vulkan/anv_blorp.c
>  create mode 100644 src/intel/vulkan/genX_blorp_exec.c

I couldn't see anything obviously wrong in any of the hooks, and if a hook
were missing entirely the code wouldn't even compile:

Reviewed-by: Topi Pohjolainen <topi.pohjolainen at intel.com>

> 
> diff --git a/src/intel/vulkan/Makefile.am b/src/intel/vulkan/Makefile.am
> index 2d20de9..03c863a 100644
> --- a/src/intel/vulkan/Makefile.am
> +++ b/src/intel/vulkan/Makefile.am
> @@ -119,6 +119,7 @@ VULKAN_LIB_DEPS += \
>  	$(top_builddir)/src/util/libmesautil.la \
>  	$(top_builddir)/src/intel/common/libintel_common.la \
>  	$(top_builddir)/src/intel/isl/libisl.la \
> +	$(top_builddir)/src/intel/blorp/libblorp.la \
>  	$(PER_GEN_LIBS) \
>  	$(PTHREAD_LIBS) \
>  	$(DLOPEN_LIBS) \
> diff --git a/src/intel/vulkan/Makefile.sources b/src/intel/vulkan/Makefile.sources
> index 8b4b97f..e384235 100644
> --- a/src/intel/vulkan/Makefile.sources
> +++ b/src/intel/vulkan/Makefile.sources
> @@ -22,6 +22,7 @@
>  VULKAN_FILES := \
>  	anv_allocator.c \
>  	anv_batch_chain.c \
> +	anv_blorp.c \
>  	anv_cmd_buffer.c \
>  	anv_descriptor_set.c \
>  	anv_device.c \
> @@ -73,6 +74,7 @@ VULKAN_GENERATED_FILES := \
>  
>  GEN7_FILES := \
>  	genX_cmd_buffer.c \
> +	genX_blorp_exec.c \
>  	genX_pipeline.c \
>  	gen7_cmd_buffer.c \
>  	gen7_pipeline.c \
> @@ -80,6 +82,7 @@ GEN7_FILES := \
>  
>  GEN75_FILES := \
>  	genX_cmd_buffer.c \
> +	genX_blorp_exec.c \
>  	genX_pipeline.c \
>  	gen7_cmd_buffer.c \
>  	gen7_pipeline.c \
> @@ -87,6 +90,7 @@ GEN75_FILES := \
>  
>  GEN8_FILES := \
>  	genX_cmd_buffer.c \
> +	genX_blorp_exec.c \
>  	genX_pipeline.c \
>  	gen8_cmd_buffer.c \
>  	gen8_pipeline.c \
> @@ -94,6 +98,7 @@ GEN8_FILES := \
>  
>  GEN9_FILES := \
>  	genX_cmd_buffer.c \
> +	genX_blorp_exec.c \
>  	genX_pipeline.c \
>  	gen8_cmd_buffer.c \
>  	gen8_pipeline.c \
> diff --git a/src/intel/vulkan/anv_blorp.c b/src/intel/vulkan/anv_blorp.c
> new file mode 100644
> index 0000000..d047bcd
> --- /dev/null
> +++ b/src/intel/vulkan/anv_blorp.c
> @@ -0,0 +1,120 @@
> +/*
> + * Copyright © 2016 Intel Corporation
> + *
> + * Permission is hereby granted, free of charge, to any person obtaining a
> + * copy of this software and associated documentation files (the "Software"),
> + * to deal in the Software without restriction, including without limitation
> + * the rights to use, copy, modify, merge, publish, distribute, sublicense,
> + * and/or sell copies of the Software, and to permit persons to whom the
> + * Software is furnished to do so, subject to the following conditions:
> + *
> + * The above copyright notice and this permission notice (including the next
> + * paragraph) shall be included in all copies or substantial portions of the
> + * Software.
> + *
> + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
> + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
> + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
> + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
> + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
> + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
> + * IN THE SOFTWARE.
> + */
> +
> +#include "anv_private.h"
> +
> +static bool
> +lookup_blorp_shader(struct blorp_context *blorp,
> +                    const void *key, uint32_t key_size,
> +                    uint32_t *kernel_out, void *prog_data_out)
> +{
> +   struct anv_device *device = blorp->driver_ctx;
> +
> +   /* The blorp cache must be a real cache */
> +   assert(device->blorp_shader_cache.cache);
> +
> +   struct anv_shader_bin *bin =
> +      anv_pipeline_cache_search(&device->blorp_shader_cache, key, key_size);
> +   if (!bin)
> +      return false;
> +
> +   /* The cache already has a reference and it's not going anywhere so there
> +    * is no need to hold a second reference.
> +    */
> +   anv_shader_bin_unref(device, bin);
> +
> +   *kernel_out = bin->kernel.offset;
> +   *(const struct brw_stage_prog_data **)prog_data_out =
> +      anv_shader_bin_get_prog_data(bin);
> +
> +   return true;
> +}
> +
> +static void
> +upload_blorp_shader(struct blorp_context *blorp,
> +                    const void *key, uint32_t key_size,
> +                    const void *kernel, uint32_t kernel_size,
> +                    const void *prog_data, uint32_t prog_data_size,
> +                    uint32_t *kernel_out, void *prog_data_out)
> +{
> +   struct anv_device *device = blorp->driver_ctx;
> +
> +   /* The blorp cache must be a real cache */
> +   assert(device->blorp_shader_cache.cache);
> +
> +   struct anv_pipeline_bind_map bind_map = {
> +      .surface_count = 0,
> +      .sampler_count = 0,
> +   };
> +
> +   struct anv_shader_bin *bin =
> +      anv_pipeline_cache_upload_kernel(&device->blorp_shader_cache,
> +                                       key, key_size, kernel, kernel_size,
> +                                       prog_data, prog_data_size, &bind_map);
> +
> +   /* The cache already has a reference and it's not going anywhere so there
> +    * is no need to hold a second reference.
> +    */
> +   anv_shader_bin_unref(device, bin);
> +
> +   *kernel_out = bin->kernel.offset;
> +   *(const struct brw_stage_prog_data **)prog_data_out =
> +      anv_shader_bin_get_prog_data(bin);
> +}
> +
> +void
> +anv_device_init_blorp(struct anv_device *device)
> +{
> +   anv_pipeline_cache_init(&device->blorp_shader_cache, device, true);
> +   blorp_init(&device->blorp, device, &device->isl_dev);
> +   device->blorp.compiler = device->instance->physicalDevice.compiler;
> +   device->blorp.mocs.tex = device->default_mocs;
> +   device->blorp.mocs.rb = device->default_mocs;
> +   device->blorp.mocs.vb = device->default_mocs;
> +   device->blorp.lookup_shader = lookup_blorp_shader;
> +   device->blorp.upload_shader = upload_blorp_shader;
> +   switch (device->info.gen) {
> +   case 7:
> +      if (device->info.is_haswell) {
> +         device->blorp.exec = gen75_blorp_exec;
> +      } else {
> +         device->blorp.exec = gen7_blorp_exec;
> +      }
> +      break;
> +   case 8:
> +      device->blorp.exec = gen8_blorp_exec;
> +      break;
> +   case 9:
> +      device->blorp.exec = gen9_blorp_exec;
> +      break;
> +   default:
> +      unreachable("Unknown hardware generation");
> +   }
> +}
> +
> +void
> +anv_device_finish_blorp(struct anv_device *device)
> +{
> +   blorp_finish(&device->blorp);
> +   anv_pipeline_cache_finish(&device->blorp_shader_cache);
> +}
> diff --git a/src/intel/vulkan/anv_device.c b/src/intel/vulkan/anv_device.c
> index 7317493..e66f812 100644
> --- a/src/intel/vulkan/anv_device.c
> +++ b/src/intel/vulkan/anv_device.c
> @@ -918,6 +918,8 @@ VkResult anv_CreateDevice(
>     if (result != VK_SUCCESS)
>        goto fail_fd;
>  
> +   anv_device_init_blorp(device);
> +
>     anv_device_init_border_colors(device);
>  
>     *pDevice = anv_device_to_handle(device);
> @@ -940,6 +942,8 @@ void anv_DestroyDevice(
>  
>     anv_queue_finish(&device->queue);
>  
> +   anv_device_finish_blorp(device);
> +
>     anv_device_finish_meta(device);
>  
>  #ifdef HAVE_VALGRIND
> diff --git a/src/intel/vulkan/anv_genX.h b/src/intel/vulkan/anv_genX.h
> index ccf4357..02e79c2 100644
> --- a/src/intel/vulkan/anv_genX.h
> +++ b/src/intel/vulkan/anv_genX.h
> @@ -72,3 +72,6 @@ genX(compute_pipeline_create)(VkDevice _device,
>                                const VkComputePipelineCreateInfo *pCreateInfo,
>                                const VkAllocationCallbacks *alloc,
>                                VkPipeline *pPipeline);
> +
> +void genX(blorp_exec)(struct blorp_batch *batch,
> +                      const struct blorp_params *params);
> diff --git a/src/intel/vulkan/anv_private.h b/src/intel/vulkan/anv_private.h
> index 5ef81d9..816a081 100644
> --- a/src/intel/vulkan/anv_private.h
> +++ b/src/intel/vulkan/anv_private.h
> @@ -41,6 +41,7 @@
>  #endif
>  
>  #include "common/gen_device_info.h"
> +#include "blorp/blorp.h"
>  #include "brw_compiler.h"
>  #include "util/macros.h"
>  #include "util/list.h"
> @@ -709,6 +710,9 @@ struct anv_device {
>  
>      struct anv_meta_state                       meta_state;
>  
> +    struct anv_pipeline_cache                   blorp_shader_cache;
> +    struct blorp_context                        blorp;
> +
>      struct anv_state                            border_colors;
>  
>      struct anv_queue                            queue;
> @@ -722,6 +726,8 @@ struct anv_device {
>  
>  void anv_device_get_cache_uuid(void *uuid);
>  
> +void anv_device_init_blorp(struct anv_device *device);
> +void anv_device_finish_blorp(struct anv_device *device);
>  
>  void* anv_gem_mmap(struct anv_device *device,
>                     uint32_t gem_handle, uint64_t offset, uint64_t size, uint32_t flags);
> diff --git a/src/intel/vulkan/genX_blorp_exec.c b/src/intel/vulkan/genX_blorp_exec.c
> new file mode 100644
> index 0000000..833b94a
> --- /dev/null
> +++ b/src/intel/vulkan/genX_blorp_exec.c
> @@ -0,0 +1,259 @@
> +/*
> + * Copyright © 2016 Intel Corporation
> + *
> + * Permission is hereby granted, free of charge, to any person obtaining a
> + * copy of this software and associated documentation files (the "Software"),
> + * to deal in the Software without restriction, including without limitation
> + * the rights to use, copy, modify, merge, publish, distribute, sublicense,
> + * and/or sell copies of the Software, and to permit persons to whom the
> + * Software is furnished to do so, subject to the following conditions:
> + *
> + * The above copyright notice and this permission notice (including the next
> + * paragraph) shall be included in all copies or substantial portions of the
> + * Software.
> + *
> + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
> + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
> + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
> + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
> + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
> + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
> + * IN THE SOFTWARE.
> + */
> +
> +#include <assert.h>
> +
> +#include "anv_private.h"
> +#include "genX_multisample.h"
> +
> +/* These are defined in anv_private.h and blorp_genX_exec.h */
> +#undef __gen_address_type
> +#undef __gen_user_data
> +#undef __gen_combine_address
> +
> +#include "common/gen_l3_config.h"
> +#include "blorp/blorp_genX_exec.h"
> +
> +static void *
> +blorp_emit_dwords(struct blorp_batch *batch, unsigned n)
> +{
> +   struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
> +   return anv_batch_emit_dwords(&cmd_buffer->batch, n);
> +}
> +
> +static uint64_t
> +blorp_emit_reloc(struct blorp_batch *batch,
> +                 void *location, struct blorp_address address, uint32_t delta)
> +{
> +   struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
> +   assert(cmd_buffer->batch.start <= location &&
> +          location < cmd_buffer->batch.end);
> +   return anv_batch_emit_reloc(&cmd_buffer->batch, location,
> +                               address.buffer, address.offset + delta);
> +}
> +
> +static void
> +blorp_surface_reloc(struct blorp_batch *batch, uint32_t ss_offset,
> +                    struct blorp_address address, uint32_t delta)
> +{
> +   struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
> +   anv_reloc_list_add(&cmd_buffer->surface_relocs, &cmd_buffer->pool->alloc,
> +                      ss_offset, address.buffer, address.offset + delta);
> +}
> +
> +static void *
> +blorp_alloc_dynamic_state(struct blorp_batch *batch,
> +                          enum aub_state_struct_type type,
> +                          uint32_t size,
> +                          uint32_t alignment,
> +                          uint32_t *offset)
> +{
> +   struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
> +
> +   struct anv_state state =
> +      anv_cmd_buffer_alloc_dynamic_state(cmd_buffer, size, alignment);
> +
> +   *offset = state.offset;
> +   return state.map;
> +}
> +
> +static void
> +blorp_alloc_binding_table(struct blorp_batch *batch, unsigned num_entries,
> +                          unsigned state_size, unsigned state_alignment,
> +                          uint32_t *bt_offset,
> +                          uint32_t *surface_offsets, void **surface_maps)
> +{
> +   struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
> +
> +   uint32_t state_offset;
> +   struct anv_state bt_state =
> +      anv_cmd_buffer_alloc_binding_table(cmd_buffer, num_entries,
> +                                         &state_offset);
> +   if (bt_state.map == NULL) {
> +      /* We ran out of space.  Grab a new binding table block. */
> +      VkResult result = anv_cmd_buffer_new_binding_table_block(cmd_buffer);
> +      assert(result == VK_SUCCESS);
> +
> +      /* Re-emit state base addresses so we get the new surface state base
> +       * address before we start emitting binding tables etc.
> +       */
> +      anv_cmd_buffer_emit_state_base_address(cmd_buffer);
> +
> +      bt_state = anv_cmd_buffer_alloc_binding_table(cmd_buffer, num_entries,
> +                                                    &state_offset);
> +      assert(bt_state.map != NULL);
> +   }
> +
> +   uint32_t *bt_map = bt_state.map;
> +   *bt_offset = bt_state.offset;
> +
> +   for (unsigned i = 0; i < num_entries; i++) {
> +      struct anv_state surface_state =
> +         anv_cmd_buffer_alloc_surface_state(cmd_buffer);
> +      bt_map[i] = surface_state.offset + state_offset;
> +      surface_offsets[i] = surface_state.offset;
> +      surface_maps[i] = surface_state.map;
> +   }
> +}
> +
> +static void *
> +blorp_alloc_vertex_buffer(struct blorp_batch *batch, uint32_t size,
> +                          struct blorp_address *addr)
> +{
> +   struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
> +   struct anv_state vb_state =
> +      anv_cmd_buffer_alloc_dynamic_state(cmd_buffer, size, 16);
> +
> +   *addr = (struct blorp_address) {
> +      .buffer = &cmd_buffer->device->dynamic_state_block_pool.bo,
> +      .offset = vb_state.offset,
> +   };
> +
> +   return vb_state.map;
> +}
> +
> +static void
> +blorp_emit_urb_config(struct blorp_batch *batch, unsigned vs_entry_size)
> +{
> +   struct anv_device *device = batch->blorp->driver_ctx;
> +   struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
> +
> +   genX(emit_urb_setup)(device, &cmd_buffer->batch,
> +                        VK_SHADER_STAGE_VERTEX_BIT |
> +                        VK_SHADER_STAGE_FRAGMENT_BIT,
> +                        vs_entry_size, 0,
> +                        cmd_buffer->state.current_l3_config);
> +}
> +
> +static void
> +blorp_emit_3dstate_multisample(struct blorp_batch *batch, unsigned samples)
> +{
> +   blorp_emit(batch, GENX(3DSTATE_MULTISAMPLE), ms) {
> +      ms.NumberofMultisamples       = __builtin_ffs(samples) - 1;
> +
> +#if GEN_GEN >= 8
> +      /* The PRM says that this bit is valid only for DX9:
> +       *
> +       *    SW can choose to set this bit only for DX9 API. DX10/OGL API's
> +       *    should not have any effect by setting or not setting this bit.
> +       */
> +      ms.PixelPositionOffsetEnable  = false;
> +      ms.PixelLocation              = CENTER;
> +#else
> +      ms.PixelLocation              = PIXLOC_CENTER;
> +
> +      switch (samples) {
> +      case 1:
> +         SAMPLE_POS_1X(ms.Sample);
> +         break;
> +      case 2:
> +         SAMPLE_POS_2X(ms.Sample);
> +         break;
> +      case 4:
> +         SAMPLE_POS_4X(ms.Sample);
> +         break;
> +      case 8:
> +         SAMPLE_POS_8X(ms.Sample);
> +         break;
> +      default:
> +         break;
> +      }
> +#endif
> +   }
> +}
> +
> +void genX(blorp_exec)(struct blorp_batch *batch,
> +                      const struct blorp_params *params);
> +
> +void
> +genX(blorp_exec)(struct blorp_batch *batch,
> +                 const struct blorp_params *params)
> +{
> +   struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
> +
> +   if (!cmd_buffer->state.current_l3_config) {
> +      const struct gen_l3_config *cfg =
> +         gen_get_default_l3_config(&cmd_buffer->device->info);
> +      genX(cmd_buffer_config_l3)(cmd_buffer, cfg);
> +   }
> +
> +   if (cmd_buffer->state.current_pipeline != _3D) {
> +#if GEN_GEN <= 7
> +      /* From "BXML » GT » MI » vol1a GPU Overview » [Instruction]
> +       * PIPELINE_SELECT [DevBWR+]":
> +       *
> +       *   Project: DEVSNB+
> +       *
> +       *   Software must ensure all the write caches are flushed through a
> +       *   stalling PIPE_CONTROL command followed by another PIPE_CONTROL
> +       *   command to invalidate read only caches prior to programming
> +       *   MI_PIPELINE_SELECT command to change the Pipeline Select Mode.
> +       */
> +      blorp_emit(batch, GENX(PIPE_CONTROL), pc) {
> +         pc.RenderTargetCacheFlushEnable  = true;
> +         pc.DepthCacheFlushEnable         = true;
> +         pc.DCFlushEnable                 = true;
> +         pc.PostSyncOperation             = NoWrite;
> +         pc.CommandStreamerStallEnable    = true;
> +      }
> +
> +      blorp_emit(batch, GENX(PIPE_CONTROL), pc) {
> +         pc.TextureCacheInvalidationEnable   = true;
> +         pc.ConstantCacheInvalidationEnable  = true;
> +         pc.StateCacheInvalidationEnable     = true;
> +         pc.InstructionCacheInvalidateEnable = true;
> +         pc.PostSyncOperation                = NoWrite;
> +      }
> +#endif
> +
> +      blorp_emit(batch, GENX(PIPELINE_SELECT), ps) {
> +#if GEN_GEN >= 9
> +         ps.MaskBits = 3;
> +#endif
> +         ps.PipelineSelection = _3D;
> +      }
> +
> +      cmd_buffer->state.current_pipeline = _3D;
> +   }
> +
> +   blorp_exec(batch, params);
> +
> +   /* BLORP sets DRAWING_RECTANGLE but we always want it set to the maximum.
> +    * Since we set it once at driver init and never again, we have to set it
> +    * back after invoking blorp.
> +    *
> +    * TODO: BLORP should assume a max drawing rectangle
> +    */
> +   blorp_emit(batch, GENX(3DSTATE_DRAWING_RECTANGLE), rect) {
> +      rect.ClippedDrawingRectangleYMin = 0;
> +      rect.ClippedDrawingRectangleXMin = 0;
> +      rect.ClippedDrawingRectangleYMax = UINT16_MAX;
> +      rect.ClippedDrawingRectangleXMax = UINT16_MAX;
> +      rect.DrawingRectangleOriginY = 0;
> +      rect.DrawingRectangleOriginX = 0;
> +   }
> +
> +   cmd_buffer->state.vb_dirty = ~0;
> +   cmd_buffer->state.dirty = ~0;
> +   cmd_buffer->state.push_constants_dirty = ~0;
> +}
> -- 
> 2.5.0.400.gff86faf
> 
> _______________________________________________
> mesa-dev mailing list
> mesa-dev at lists.freedesktop.org
> https://lists.freedesktop.org/mailman/listinfo/mesa-dev


More information about the mesa-dev mailing list