Mesa (main): radv: implement optimized MSAA copies using FMASK

GitLab Mirror gitlab-mirror at kemper.freedesktop.org
Wed Nov 24 08:55:14 UTC 2021


Module: Mesa
Branch: main
Commit: deb4685df39dbfcfb79389f259958f18441e7231
URL:    http://cgit.freedesktop.org/mesa/mesa/commit/?id=deb4685df39dbfcfb79389f259958f18441e7231

Author: Samuel Pitoiset <samuel.pitoiset at gmail.com>
Date:   Fri Aug 20 16:19:40 2021 +0200

radv: implement optimized MSAA copies using FMASK

Signed-off-by: Samuel Pitoiset <samuel.pitoiset at gmail.com>
Reviewed-by: Bas Nieuwenhuizen <bas at basnieuwenhuizen.nl>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/12555>

---

 src/amd/vulkan/meson.build            |   1 +
 src/amd/vulkan/radv_meta.c            |   7 +
 src/amd/vulkan/radv_meta.h            |   9 +
 src/amd/vulkan/radv_meta_copy.c       |   6 +-
 src/amd/vulkan/radv_meta_fmask_copy.c | 366 ++++++++++++++++++++++++++++++++++
 src/amd/vulkan/radv_private.h         |   5 +
 6 files changed, 393 insertions(+), 1 deletion(-)

diff --git a/src/amd/vulkan/meson.build b/src/amd/vulkan/meson.build
index 7bb76bf73bf..d81660366a3 100644
--- a/src/amd/vulkan/meson.build
+++ b/src/amd/vulkan/meson.build
@@ -62,6 +62,7 @@ libradv_files = files(
   'radv_meta_dcc_retile.c',
   'radv_meta_decompress.c',
   'radv_meta_fast_clear.c',
+  'radv_meta_fmask_copy.c',
   'radv_meta_fmask_expand.c',
   'radv_meta_resolve.c',
   'radv_meta_resolve_cs.c',
diff --git a/src/amd/vulkan/radv_meta.c b/src/amd/vulkan/radv_meta.c
index d45e812b75c..3d6423bb7c0 100644
--- a/src/amd/vulkan/radv_meta.c
+++ b/src/amd/vulkan/radv_meta.c
@@ -491,8 +491,14 @@ radv_device_init_meta(struct radv_device *device)
    if (result != VK_SUCCESS)
       goto fail_accel_struct_build;
 
+   result = radv_device_init_meta_fmask_copy_state(device);
+   if (result != VK_SUCCESS)
+      goto fail_fmask_copy;
+
    return VK_SUCCESS;
 
+fail_fmask_copy:
+   radv_device_finish_accel_struct_build_state(device);
 fail_accel_struct_build:
    radv_device_finish_meta_fmask_expand_state(device);
 fail_fmask_expand:
@@ -541,6 +547,7 @@ radv_device_finish_meta(struct radv_device *device)
    radv_device_finish_meta_fmask_expand_state(device);
    radv_device_finish_meta_dcc_retile_state(device);
    radv_device_finish_meta_copy_vrs_htile_state(device);
+   radv_device_finish_meta_fmask_copy_state(device);
 
    radv_store_meta_pipeline(device);
    radv_pipeline_cache_finish(&device->meta_state.cache);
diff --git a/src/amd/vulkan/radv_meta.h b/src/amd/vulkan/radv_meta.h
index efba51a4ecd..cf8221ff6a8 100644
--- a/src/amd/vulkan/radv_meta.h
+++ b/src/amd/vulkan/radv_meta.h
@@ -130,6 +130,9 @@ void radv_device_finish_meta_resolve_compute_state(struct radv_device *device);
 VkResult radv_device_init_meta_resolve_fragment_state(struct radv_device *device, bool on_demand);
 void radv_device_finish_meta_resolve_fragment_state(struct radv_device *device);
 
+VkResult radv_device_init_meta_fmask_copy_state(struct radv_device *device);
+void radv_device_finish_meta_fmask_copy_state(struct radv_device *device);
+
 VkResult radv_device_init_meta_fmask_expand_state(struct radv_device *device);
 void radv_device_finish_meta_fmask_expand_state(struct radv_device *device);
 
@@ -223,6 +226,12 @@ void radv_copy_vrs_htile(struct radv_cmd_buffer *cmd_buffer, struct radv_image *
                          VkExtent2D *extent, struct radv_image *dst_image,
                          struct radv_buffer *htile_buffer, bool read_htile_value);
 
+bool radv_can_use_fmask_copy(struct radv_cmd_buffer *cmd_buffer,
+                             const struct radv_image *src_image, const struct radv_image *dst_image,
+                             unsigned num_rects, const struct radv_meta_blit2d_rect *rects);
+void radv_fmask_copy(struct radv_cmd_buffer *cmd_buffer, struct radv_meta_blit2d_surf *src,
+                     struct radv_meta_blit2d_surf *dst);
+
 void radv_meta_resolve_compute_image(struct radv_cmd_buffer *cmd_buffer,
                                      struct radv_image *src_image, VkFormat src_format,
                                      VkImageLayout src_image_layout, struct radv_image *dest_image,
diff --git a/src/amd/vulkan/radv_meta_copy.c b/src/amd/vulkan/radv_meta_copy.c
index b9b45750625..aed65196c3b 100644
--- a/src/amd/vulkan/radv_meta_copy.c
+++ b/src/amd/vulkan/radv_meta_copy.c
@@ -535,7 +535,11 @@ copy_image(struct radv_cmd_buffer *cmd_buffer, struct radv_image *src_image,
          if (cs) {
             radv_meta_image_to_image_cs(cmd_buffer, &b_src, &b_dst, 1, &rect);
          } else {
-            radv_meta_blit2d(cmd_buffer, &b_src, NULL, &b_dst, 1, &rect);
+            if (radv_can_use_fmask_copy(cmd_buffer, b_src.image, b_dst.image, 1, &rect)) {
+               radv_fmask_copy(cmd_buffer, &b_src, &b_dst);
+            } else {
+               radv_meta_blit2d(cmd_buffer, &b_src, NULL, &b_dst, 1, &rect);
+            }
          }
 
          b_src.layer++;
diff --git a/src/amd/vulkan/radv_meta_fmask_copy.c b/src/amd/vulkan/radv_meta_fmask_copy.c
new file mode 100644
index 00000000000..da19b0d37c8
--- /dev/null
+++ b/src/amd/vulkan/radv_meta_fmask_copy.c
@@ -0,0 +1,366 @@
+/*
+ * Copyright © 2021 Valve Corporation
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice (including the next
+ * paragraph) shall be included in all copies or substantial portions of the
+ * Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
+ * IN THE SOFTWARE.
+ */
+#include "nir/nir_builder.h"
+#include "radv_meta.h"
+/* Build a compute shader copying, per pixel, fragments 0..max index in the fragment mask. */
+static nir_shader *
+build_fmask_copy_compute_shader(struct radv_device *dev, int samples)
+{
+   const struct glsl_type *sampler_type = glsl_sampler_type(GLSL_SAMPLER_DIM_MS, false, false, GLSL_TYPE_FLOAT);
+   const struct glsl_type *img_type = glsl_image_type(GLSL_SAMPLER_DIM_MS, false, GLSL_TYPE_FLOAT);
+   /* 'samples' is embedded in the shader name and bounds the fragment-mask scan below. */
+   nir_builder b = nir_builder_init_simple_shader(MESA_SHADER_COMPUTE, NULL, "meta_fmask_copy_cs_-%d", samples);
+
+   b.shader->info.workgroup_size[0] = 8; /* 8x8x1 invocations per workgroup */
+   b.shader->info.workgroup_size[1] = 8;
+   b.shader->info.workgroup_size[2] = 1;
+
+   nir_variable *input_img = nir_variable_create(b.shader, nir_var_uniform, sampler_type, "s_tex");
+   input_img->data.descriptor_set = 0;
+   input_img->data.binding = 0; /* multisampled source, read through texture ops */
+
+   nir_variable *output_img = nir_variable_create(b.shader, nir_var_uniform, img_type, "out_img");
+   output_img->data.descriptor_set = 0;
+   output_img->data.binding = 1; /* multisampled destination, written as an image */
+
+   nir_ssa_def *invoc_id = nir_load_local_invocation_id(&b);
+   nir_ssa_def *wg_id = nir_load_workgroup_id(&b, 32);
+   nir_ssa_def *block_size =
+      nir_imm_ivec3(&b, b.shader->info.workgroup_size[0], b.shader->info.workgroup_size[1],
+                    b.shader->info.workgroup_size[2]);
+
+   nir_ssa_def *global_id = nir_iadd(&b, nir_imul(&b, wg_id, block_size), invoc_id);
+
+   /* Source coords are (x, y); the store takes a vec4, so its z/w are left undefined. */
+   nir_ssa_def *src_coord = nir_channels(&b, global_id, 0x3);
+   nir_ssa_def *dst_coord = nir_vec4(&b, nir_channel(&b, src_coord, 0),
+                                         nir_channel(&b, src_coord, 1),
+                                         nir_ssa_undef(&b, 1, 32),
+                                         nir_ssa_undef(&b, 1, 32));
+
+   nir_ssa_def *input_img_deref = &nir_build_deref_var(&b, input_img)->dest.ssa;
+
+   /* Fetch this pixel's fragment mask as a single 32-bit unsigned value. */
+   nir_tex_instr *frag_mask_fetch = nir_tex_instr_create(b.shader, 3);
+   frag_mask_fetch->sampler_dim = GLSL_SAMPLER_DIM_MS;
+   frag_mask_fetch->op = nir_texop_fragment_mask_fetch_amd;
+   frag_mask_fetch->src[0].src_type = nir_tex_src_coord;
+   frag_mask_fetch->src[0].src = nir_src_for_ssa(src_coord);
+   frag_mask_fetch->src[1].src_type = nir_tex_src_lod;
+   frag_mask_fetch->src[1].src = nir_src_for_ssa(nir_imm_int(&b, 0));
+   frag_mask_fetch->src[2].src_type = nir_tex_src_texture_deref;
+   frag_mask_fetch->src[2].src = nir_src_for_ssa(input_img_deref);
+   frag_mask_fetch->dest_type = nir_type_uint32;
+   frag_mask_fetch->is_array = false;
+   frag_mask_fetch->coord_components = 2;
+
+   nir_ssa_dest_init(&frag_mask_fetch->instr, &frag_mask_fetch->dest, 1, 32, "frag_mask_fetch");
+   nir_builder_instr_insert(&b, &frag_mask_fetch->instr);
+
+   nir_ssa_def *frag_mask = &frag_mask_fetch->dest.ssa;
+
+   /* Find the highest fragment index in the mask (one 4-bit field per sample). */
+   nir_ssa_def *max_sample_index = nir_imm_int(&b, 0);
+   for (uint32_t s = 0; s < samples; s++) {
+      /* max_sample_index = MAX2(max_sample_index, (frag_mask >> (s * 4)) & 0xf) */
+      max_sample_index = nir_umax(&b, max_sample_index,
+                              nir_ubitfield_extract(&b, frag_mask, nir_imm_int(&b, 4 * s),
+                                                    nir_imm_int(&b, 4)));
+   }
+
+   nir_variable *counter = nir_local_variable_create(b.impl, glsl_int_type(), "counter");
+   nir_store_var(&b, counter, nir_imm_int(&b, 0), 0x1); /* start at fragment 0 */
+
+   nir_loop *loop = nir_push_loop(&b);
+   {
+      nir_ssa_def *sample_id = nir_load_var(&b, counter);
+      /* Read fragment 'sample_id' of the source pixel. */
+      nir_tex_instr *frag_fetch = nir_tex_instr_create(b.shader, 4);
+      frag_fetch->sampler_dim = GLSL_SAMPLER_DIM_MS;
+      frag_fetch->op = nir_texop_fragment_fetch_amd;
+      frag_fetch->src[0].src_type = nir_tex_src_coord;
+      frag_fetch->src[0].src = nir_src_for_ssa(src_coord);
+      frag_fetch->src[1].src_type = nir_tex_src_lod;
+      frag_fetch->src[1].src = nir_src_for_ssa(nir_imm_int(&b, 0));
+      frag_fetch->src[2].src_type = nir_tex_src_texture_deref;
+      frag_fetch->src[2].src = nir_src_for_ssa(input_img_deref);
+      frag_fetch->src[3].src_type = nir_tex_src_ms_index;
+      frag_fetch->src[3].src = nir_src_for_ssa(sample_id);
+      frag_fetch->dest_type = nir_type_uint32;
+      frag_fetch->is_array = false;
+      frag_fetch->coord_components = 2;
+
+      nir_ssa_dest_init(&frag_fetch->instr, &frag_fetch->dest, 4, 32, "frag_fetch");
+      nir_builder_instr_insert(&b, &frag_fetch->instr);
+      /* Store it at the same coordinates and sample index in the destination. */
+      nir_ssa_def *outval = &frag_fetch->dest.ssa;
+      nir_image_deref_store(&b, &nir_build_deref_var(&b, output_img)->dest.ssa, dst_coord,
+                            sample_id, outval, nir_imm_int(&b, 0),
+                            .image_dim = GLSL_SAMPLER_DIM_MS);
+      /* NOTE(review): presumably advances 'counter' and breaks at max_sample_index - confirm. */
+      radv_break_on_count(&b, counter, max_sample_index);
+   }
+   nir_pop_loop(&b, loop);
+
+   return b.shader;
+}
+/* Destroy the pipeline layout, descriptor set layout and pipelines of the FMASK copy path. */
+void
+radv_device_finish_meta_fmask_copy_state(struct radv_device *device)
+{
+   struct radv_meta_state *state = &device->meta_state;
+   /* Also called when init fails midway, so some handles may never have been created. */
+   radv_DestroyPipelineLayout(radv_device_to_handle(device), state->fmask_copy.p_layout,
+                              &state->alloc);
+   radv_DestroyDescriptorSetLayout(radv_device_to_handle(device), state->fmask_copy.ds_layout,
+                                   &state->alloc);
+
+   for (uint32_t i = 0; i < MAX_SAMPLES_LOG2; ++i) {
+      radv_DestroyPipeline(radv_device_to_handle(device), state->fmask_copy.pipeline[i], &state->alloc);
+   }
+}
+/* Create the compute pipeline for one sample count from a freshly built NIR shader. */
+static VkResult
+create_fmask_copy_pipeline(struct radv_device *device, int samples, VkPipeline *pipeline)
+{
+   struct radv_meta_state *state = &device->meta_state;
+   nir_shader *cs = build_fmask_copy_compute_shader(device, samples);
+   VkResult result;
+   /* Returns radv_CreateComputePipelines()'s result; the handle is written to *pipeline. */
+   VkPipelineShaderStageCreateInfo pipeline_shader_stage = {
+      .sType = VK_STRUCTURE_TYPE_PIPELINE_SHADER_STAGE_CREATE_INFO,
+      .stage = VK_SHADER_STAGE_COMPUTE_BIT,
+      .module = vk_shader_module_handle_from_nir(cs),
+      .pName = "main",
+      .pSpecializationInfo = NULL,
+   };
+
+   VkComputePipelineCreateInfo vk_pipeline_info = {
+      .sType = VK_STRUCTURE_TYPE_COMPUTE_PIPELINE_CREATE_INFO,
+      .stage = pipeline_shader_stage,
+      .flags = 0,
+      .layout = state->fmask_copy.p_layout,
+   };
+
+   result = radv_CreateComputePipelines(radv_device_to_handle(device),
+                                        radv_pipeline_cache_to_handle(&state->cache), 1,
+                                        &vk_pipeline_info, NULL, pipeline);
+   ralloc_free(cs); /* freed on both success and failure */
+   return result;
+}
+/* Create the descriptor set layout, pipeline layout and pipelines used by radv_fmask_copy(). */
+VkResult
+radv_device_init_meta_fmask_copy_state(struct radv_device *device)
+{
+   VkResult result;
+   /* Push-descriptor set: binding 0 is a sampled image, binding 1 is a storage image. */
+   VkDescriptorSetLayoutCreateInfo ds_create_info = {
+      .sType = VK_STRUCTURE_TYPE_DESCRIPTOR_SET_LAYOUT_CREATE_INFO,
+      .flags = VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR,
+      .bindingCount = 2,
+      .pBindings = (VkDescriptorSetLayoutBinding[]){
+         {.binding = 0,
+          .descriptorType = VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE,
+          .descriptorCount = 1,
+          .stageFlags = VK_SHADER_STAGE_COMPUTE_BIT,
+          .pImmutableSamplers = NULL},
+         {.binding = 1,
+          .descriptorType = VK_DESCRIPTOR_TYPE_STORAGE_IMAGE,
+          .descriptorCount = 1,
+          .stageFlags = VK_SHADER_STAGE_COMPUTE_BIT,
+          .pImmutableSamplers = NULL},
+      }};
+
+   result = radv_CreateDescriptorSetLayout(radv_device_to_handle(device), &ds_create_info,
+                                           &device->meta_state.alloc,
+                                           &device->meta_state.fmask_copy.ds_layout);
+   if (result != VK_SUCCESS)
+      goto fail;
+
+   VkPipelineLayoutCreateInfo pl_create_info = {
+      .sType = VK_STRUCTURE_TYPE_PIPELINE_LAYOUT_CREATE_INFO,
+      .setLayoutCount = 1,
+      .pSetLayouts = &device->meta_state.fmask_copy.ds_layout,
+      .pushConstantRangeCount = 0,
+      .pPushConstantRanges = NULL
+   };
+
+   result =
+      radv_CreatePipelineLayout(radv_device_to_handle(device), &pl_create_info,
+                                &device->meta_state.alloc, &device->meta_state.fmask_copy.p_layout);
+   if (result != VK_SUCCESS)
+      goto fail;
+   /* pipeline[i] is built for images with (1 << i) samples. */
+   for (uint32_t i = 0; i < MAX_SAMPLES_LOG2; i++) {
+      uint32_t samples = 1 << i;
+      result = create_fmask_copy_pipeline(device, samples, &device->meta_state.fmask_copy.pipeline[i]);
+      if (result != VK_SUCCESS)
+         goto fail;
+   }
+
+   return VK_SUCCESS;
+fail:
+   radv_device_finish_meta_fmask_copy_state(device); /* release anything created above */
+   return result;
+}
+/* Copy the source image's FMASK+CMASK bytes over the destination's with one buffer copy. */
+static void
+radv_fixup_copy_dst_metadata(struct radv_cmd_buffer *cmd_buffer, const struct radv_image *src_image,
+                             const struct radv_image *dst_image)
+{
+   uint64_t src_offset, dst_offset, size;
+   /* Both images must have equal metadata sizes, and CMASK must directly follow FMASK. */
+   assert(src_image->planes[0].surface.cmask_size == dst_image->planes[0].surface.cmask_size &&
+          src_image->planes[0].surface.fmask_size == dst_image->planes[0].surface.fmask_size);
+   assert(src_image->planes[0].surface.fmask_offset + src_image->planes[0].surface.fmask_size ==
+          src_image->planes[0].surface.cmask_offset &&
+          dst_image->planes[0].surface.fmask_offset + dst_image->planes[0].surface.fmask_size ==
+          dst_image->planes[0].surface.cmask_offset);
+
+   /* One contiguous range starting at fmask_offset covers FMASK and then CMASK. */
+   size = src_image->planes[0].surface.cmask_size + src_image->planes[0].surface.fmask_size;
+   src_offset = src_image->planes[0].surface.fmask_offset;
+   dst_offset = dst_image->planes[0].surface.fmask_offset;
+   /* NOTE(review): offsets are surface-relative; confirm no image offset within the BO applies. */
+   radv_copy_buffer(cmd_buffer, src_image->bo, dst_image->bo, src_offset, dst_offset, size);
+}
+/* Return true only when every restriction of the FMASK copy path listed below is met. */
+bool
+radv_can_use_fmask_copy(struct radv_cmd_buffer *cmd_buffer,
+                        const struct radv_image *src_image, const struct radv_image *dst_image,
+                        unsigned num_rects, const struct radv_meta_blit2d_rect *rects)
+{
+   /* TODO: Test on pre GFX10 chips. */
+   if (cmd_buffer->device->physical_device->rad_info.chip_class < GFX10)
+      return false;
+
+   /* TODO: Add support for layers. */
+   if (src_image->info.array_size != 1 || dst_image->info.array_size != 1)
+      return false;
+
+   /* Source/destination images must have FMASK. */
+   if (!radv_image_has_fmask(src_image) || !radv_image_has_fmask(dst_image))
+      return false;
+
+   /* Source/destination images must have identical TC-compat mode. */
+   if (radv_image_is_tc_compat_cmask(src_image) != radv_image_is_tc_compat_cmask(dst_image))
+      return false;
+
+   /* The region must be a whole image copy: one rect at offset 0 covering the full source. */
+   if (num_rects != 1 ||
+       (rects[0].src_x || rects[0].src_y || rects[0].dst_x || rects[0].dst_y ||
+        rects[0].width != src_image->info.width || rects[0].height != src_image->info.height))
+      return false;
+
+   /* Source/destination images must have identical size. */
+   if (src_image->info.width != dst_image->info.width ||
+       src_image->info.height != dst_image->info.height)
+      return false;
+
+   /* Source/destination images must have identical FMASK tile swizzle and swizzle mode. */
+   if (src_image->planes[0].surface.fmask_tile_swizzle !=
+       dst_image->planes[0].surface.fmask_tile_swizzle ||
+       src_image->planes[0].surface.u.gfx9.color.fmask_swizzle_mode !=
+       dst_image->planes[0].surface.u.gfx9.color.fmask_swizzle_mode)
+      return false;
+   /* NOTE(review): sample counts and formats are not compared here - confirm callers ensure it. */
+   return true;
+}
+/* Copy an MSAA image with the FMASK copy compute shader, then copy its FMASK/CMASK metadata. */
+void
+radv_fmask_copy(struct radv_cmd_buffer *cmd_buffer, struct radv_meta_blit2d_surf *src,
+                struct radv_meta_blit2d_surf *dst)
+{
+   struct radv_device *device = cmd_buffer->device;
+   struct radv_image_view src_iview, dst_iview;
+   uint32_t samples = src->image->info.samples;
+   uint32_t samples_log2 = ffs(samples) - 1;
+   /* Pipelines are indexed by ffs(samples) - 1, taken from the source image's sample count. */
+   radv_CmdBindPipeline(radv_cmd_buffer_to_handle(cmd_buffer), VK_PIPELINE_BIND_POINT_COMPUTE,
+                        cmd_buffer->device->meta_state.fmask_copy.pipeline[samples_log2]);
+   /* Both views select mip level 0 and array layer 0; formats go through vk_format_no_srgb(). */
+   radv_image_view_init(&src_iview, device,
+                        &(VkImageViewCreateInfo){
+                           .sType = VK_STRUCTURE_TYPE_IMAGE_VIEW_CREATE_INFO,
+                           .image = radv_image_to_handle(src->image),
+                           .viewType = radv_meta_get_view_type(src->image),
+                           .format = vk_format_no_srgb(src->image->vk_format),
+                           .subresourceRange =
+                              {
+                                 .aspectMask = src->aspect_mask,
+                                 .baseMipLevel = 0,
+                                 .levelCount = 1,
+                                 .baseArrayLayer = 0,
+                                 .layerCount = 1,
+                              },
+                        },
+                        NULL);
+
+   radv_image_view_init(&dst_iview, device,
+                        &(VkImageViewCreateInfo){
+                           .sType = VK_STRUCTURE_TYPE_IMAGE_VIEW_CREATE_INFO,
+                           .image = radv_image_to_handle(dst->image),
+                           .viewType = radv_meta_get_view_type(dst->image),
+                           .format = vk_format_no_srgb(dst->image->vk_format),
+                           .subresourceRange =
+                              {
+                                 .aspectMask = dst->aspect_mask,
+                                 .baseMipLevel = 0,
+                                 .levelCount = 1,
+                                 .baseArrayLayer = 0,
+                                 .layerCount = 1,
+                              },
+                        },
+                        NULL);
+   /* Binding 0: source view (sampled image); binding 1: destination view (storage image). */
+   radv_meta_push_descriptor_set(
+      cmd_buffer, VK_PIPELINE_BIND_POINT_COMPUTE,
+      cmd_buffer->device->meta_state.fmask_copy.p_layout, 0, /* set */
+      2,                                                     /* descriptorWriteCount */
+      (VkWriteDescriptorSet[]){{.sType = VK_STRUCTURE_TYPE_WRITE_DESCRIPTOR_SET,
+                                .dstBinding = 0,
+                                .dstArrayElement = 0,
+                                .descriptorCount = 1,
+                                .descriptorType = VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE,
+                                .pImageInfo =
+                                   (VkDescriptorImageInfo[]){
+                                      {.sampler = VK_NULL_HANDLE,
+                                       .imageView = radv_image_view_to_handle(&src_iview),
+                                       .imageLayout = VK_IMAGE_LAYOUT_GENERAL},
+                                   }},
+                               {.sType = VK_STRUCTURE_TYPE_WRITE_DESCRIPTOR_SET,
+                                .dstBinding = 1,
+                                .dstArrayElement = 0,
+                                .descriptorCount = 1,
+                                .descriptorType = VK_DESCRIPTOR_TYPE_STORAGE_IMAGE,
+                                .pImageInfo = (VkDescriptorImageInfo[]){
+                                   {.sampler = VK_NULL_HANDLE,
+                                    .imageView = radv_image_view_to_handle(&dst_iview),
+                                    .imageLayout = VK_IMAGE_LAYOUT_GENERAL},
+                                }}});
+   /* The dispatch is sized by the source image's width and height. */
+   radv_unaligned_dispatch(cmd_buffer, src->image->info.width, src->image->info.height, 1);
+
+   /* Fixup destination image metadata by copying CMASK/FMASK from the source image. */
+   radv_fixup_copy_dst_metadata(cmd_buffer, src->image, dst->image);
+}
diff --git a/src/amd/vulkan/radv_private.h b/src/amd/vulkan/radv_private.h
index 770bf55c033..693a85774f7 100644
--- a/src/amd/vulkan/radv_private.h
+++ b/src/amd/vulkan/radv_private.h
@@ -538,6 +538,11 @@ struct radv_meta_state {
       VkDescriptorSetLayout img_ds_layout;
       VkPipeline pipeline;
    } cleari_r32g32b32;
+   struct {
+      VkPipelineLayout p_layout;
+      VkDescriptorSetLayout ds_layout;
+      VkPipeline pipeline[MAX_SAMPLES_LOG2];
+   } fmask_copy;
 
    struct {
       VkPipelineLayout p_layout;



More information about the mesa-commit mailing list