[Mesa-dev] [PATCH 4/4] radv/gfx10: use the correct target machine for Wave32

Bas Nieuwenhuizen bas at basnieuwenhuizen.nl
Thu Aug 1 14:15:07 UTC 2019


Reviewed-by (r-b) for patches 1, 2, and 4.

On Thu, Aug 1, 2019 at 10:40 AM Samuel Pitoiset
<samuel.pitoiset at gmail.com> wrote:
>
> Signed-off-by: Samuel Pitoiset <samuel.pitoiset at gmail.com>
> ---
>  src/amd/vulkan/radv_llvm_helper.cpp | 30 +++++++++++++++++++++--------
>  src/amd/vulkan/radv_shader.c        |  3 ++-
>  src/amd/vulkan/radv_shader_helper.h |  3 ++-
>  3 files changed, 26 insertions(+), 10 deletions(-)
>
> diff --git a/src/amd/vulkan/radv_llvm_helper.cpp b/src/amd/vulkan/radv_llvm_helper.cpp
> index 2b14ddcf184..612548e4219 100644
> --- a/src/amd/vulkan/radv_llvm_helper.cpp
> +++ b/src/amd/vulkan/radv_llvm_helper.cpp
> @@ -28,8 +28,10 @@
>  class radv_llvm_per_thread_info {
>  public:
>         radv_llvm_per_thread_info(enum radeon_family arg_family,
> -                               enum ac_target_machine_options arg_tm_options)
> -               : family(arg_family), tm_options(arg_tm_options), passes(NULL) {}
> +                               enum ac_target_machine_options arg_tm_options,
> +                               unsigned arg_wave_size)
> +               : family(arg_family), tm_options(arg_tm_options),
> +                 wave_size(arg_wave_size), passes(NULL), passes_wave32(NULL) {}
>
>         ~radv_llvm_per_thread_info()
>         {
> @@ -47,19 +49,28 @@ public:
>                 if (!passes)
>                         return false;
>
> +               if (llvm_info.tm_wave32) {
> +                       passes_wave32 = ac_create_llvm_passes(llvm_info.tm_wave32);
> +                       if (!passes_wave32)
> +                               return false;
> +               }
> +
>                 return true;
>         }
>
>         bool compile_to_memory_buffer(LLVMModuleRef module,
>                                       char **pelf_buffer, size_t *pelf_size)
>         {
> -               return ac_compile_module_to_elf(passes, module, pelf_buffer, pelf_size);
> +               struct ac_compiler_passes *p = wave_size == 32 ? passes_wave32 : passes;
> +               return ac_compile_module_to_elf(p, module, pelf_buffer, pelf_size);
>         }
>
>         bool is_same(enum radeon_family arg_family,
> -                    enum ac_target_machine_options arg_tm_options) {
> +                    enum ac_target_machine_options arg_tm_options,
> +                    unsigned arg_wave_size) {
>                 if (arg_family == family &&
> -                   arg_tm_options == tm_options)
> +                   arg_tm_options == tm_options &&
> +                   arg_wave_size == wave_size)
>                         return true;
>                 return false;
>         }
> @@ -67,7 +78,9 @@ public:
>  private:
>         enum radeon_family family;
>         enum ac_target_machine_options tm_options;
> +       unsigned wave_size;
>         struct ac_compiler_passes *passes;
> +       struct ac_compiler_passes *passes_wave32;
>  };
>
>  /* we have to store a linked list per thread due to the possiblity of multiple gpus being required */
> @@ -99,17 +112,18 @@ bool radv_compile_to_elf(struct ac_llvm_compiler *info,
>  bool radv_init_llvm_compiler(struct ac_llvm_compiler *info,
>                              bool thread_compiler,
>                              enum radeon_family family,
> -                            enum ac_target_machine_options tm_options)
> +                            enum ac_target_machine_options tm_options,
> +                            unsigned wave_size)
>  {
>         if (thread_compiler) {
>                 for (auto &I : radv_llvm_per_thread_list) {
> -                       if (I.is_same(family, tm_options)) {
> +                       if (I.is_same(family, tm_options, wave_size)) {
>                                 *info = I.llvm_info;
>                                 return true;
>                         }
>                 }
>
> -               radv_llvm_per_thread_list.emplace_back(family, tm_options);
> +               radv_llvm_per_thread_list.emplace_back(family, tm_options, wave_size);
>                 radv_llvm_per_thread_info &tinfo = radv_llvm_per_thread_list.back();
>
>                 if (!tinfo.init()) {
> diff --git a/src/amd/vulkan/radv_shader.c b/src/amd/vulkan/radv_shader.c
> index f0ab2d5e467..5e3b1378a14 100644
> --- a/src/amd/vulkan/radv_shader.c
> +++ b/src/amd/vulkan/radv_shader.c
> @@ -1163,7 +1163,8 @@ shader_variant_compile(struct radv_device *device,
>         radv_init_llvm_once();
>         radv_init_llvm_compiler(&ac_llvm,
>                                 thread_compiler,
> -                               chip_family, tm_options);
> +                               chip_family, tm_options,
> +                               radv_get_shader_wave_size(device->physical_device, stage));
>         if (gs_copy_shader) {
>                 assert(shader_count == 1);
>                 radv_compile_gs_copy_shader(&ac_llvm, *shaders, &binary,
> diff --git a/src/amd/vulkan/radv_shader_helper.h b/src/amd/vulkan/radv_shader_helper.h
> index d9dace0b495..c64d2df676b 100644
> --- a/src/amd/vulkan/radv_shader_helper.h
> +++ b/src/amd/vulkan/radv_shader_helper.h
> @@ -29,7 +29,8 @@ extern "C" {
>  bool radv_init_llvm_compiler(struct ac_llvm_compiler *info,
>                              bool thread_compiler,
>                              enum radeon_family family,
> -                            enum ac_target_machine_options tm_options);
> +                            enum ac_target_machine_options tm_options,
> +                            unsigned wave_size);
>  void radv_destroy_llvm_compiler(struct ac_llvm_compiler *info,
>                                 bool thread_compiler);
>
> --
> 2.22.0
>
> _______________________________________________
> mesa-dev mailing list
> mesa-dev at lists.freedesktop.org
> https://lists.freedesktop.org/mailman/listinfo/mesa-dev


More information about the mesa-dev mailing list