Mesa (staging/20.0): radeonsi: skip vs output optimizations for some outputs

GitLab Mirror gitlab-mirror at kemper.freedesktop.org
Thu Apr 23 05:32:25 UTC 2020


Module: Mesa
Branch: staging/20.0
Commit: d160bd3cf030981397c16f10df0c1a860008b1c4
URL:    http://cgit.freedesktop.org/mesa/mesa/commit/?id=d160bd3cf030981397c16f10df0c1a860008b1c4

Author: Pierre-Eric Pelloux-Prayer <pierre-eric.pelloux-prayer at amd.com>
Date:   Tue Apr 14 18:04:35 2020 +0200

radeonsi: skip vs output optimizations for some outputs

If PT_SPRITE_TEX is enabled, PS inputs are overridden at runtime, so
we can't apply the VS output optimization.

Closes: https://gitlab.freedesktop.org/mesa/mesa/-/issues/2747
Fixes: 3ec9975555d ("radeonsi: eliminate trivial constant VS outputs")
Reviewed-by: Marek Olšák <marek.olsak at amd.com>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/4559>
(cherry picked from commit 17acff01a00109c87d59b9d876fc735dd5fbe3d1)

---

 .pick_status.json                        |  4 ++--
 src/amd/llvm/ac_llvm_build.c             |  4 ++++
 src/amd/llvm/ac_llvm_build.h             |  1 +
 src/amd/vulkan/radv_nir_to_llvm.c        |  2 +-
 src/gallium/drivers/radeonsi/si_shader.c | 11 +++++++++++
 5 files changed, 19 insertions(+), 3 deletions(-)

diff --git a/.pick_status.json b/.pick_status.json
index 1f82998eed6..f0344e50a06 100644
--- a/.pick_status.json
+++ b/.pick_status.json
@@ -1291,7 +1291,7 @@
         "description": "radeonsi: skip vs output optimizations for some outputs",
         "nominated": true,
         "nomination_type": 1,
-        "resolution": 0,
+        "resolution": 1,
         "master_sha": null,
         "because_sha": "3ec9975555d1cc5365413ad9062f412904f944a3"
     },
@@ -25730,4 +25730,4 @@
         "master_sha": null,
         "because_sha": null
     }
-]
\ No newline at end of file
+]
diff --git a/src/amd/llvm/ac_llvm_build.c b/src/amd/llvm/ac_llvm_build.c
index 4b2331a524a..d78110ba820 100644
--- a/src/amd/llvm/ac_llvm_build.c
+++ b/src/amd/llvm/ac_llvm_build.c
@@ -3081,6 +3081,7 @@ void ac_optimize_vs_outputs(struct ac_llvm_context *ctx,
 			    LLVMValueRef main_fn,
 			    uint8_t *vs_output_param_offset,
 			    uint32_t num_outputs,
+			    uint32_t skip_output_mask,
 			    uint8_t *num_param_exports)
 {
 	LLVMBasicBlockRef bb;
@@ -3124,6 +3125,9 @@ void ac_optimize_vs_outputs(struct ac_llvm_context *ctx,
 
 			target -= V_008DFC_SQ_EXP_PARAM;
 
+			if ((1u << target) & skip_output_mask)
+				continue;
+
 			/* Parse the instruction. */
 			memset(&exp, 0, sizeof(exp));
 			exp.offset = target;
diff --git a/src/amd/llvm/ac_llvm_build.h b/src/amd/llvm/ac_llvm_build.h
index e08ab656f9c..4a65f117b21 100644
--- a/src/amd/llvm/ac_llvm_build.h
+++ b/src/amd/llvm/ac_llvm_build.h
@@ -605,6 +605,7 @@ void ac_optimize_vs_outputs(struct ac_llvm_context *ac,
 			    LLVMValueRef main_fn,
 			    uint8_t *vs_output_param_offset,
 			    uint32_t num_outputs,
+			    uint32_t skip_output_mask,
 			    uint8_t *num_param_exports);
 void ac_init_exec_full_mask(struct ac_llvm_context *ctx);
 
diff --git a/src/amd/vulkan/radv_nir_to_llvm.c b/src/amd/vulkan/radv_nir_to_llvm.c
index 64288be58bb..49065cdbe5b 100644
--- a/src/amd/vulkan/radv_nir_to_llvm.c
+++ b/src/amd/vulkan/radv_nir_to_llvm.c
@@ -3831,7 +3831,7 @@ ac_nir_eliminate_const_vs_outputs(struct radv_shader_context *ctx)
 	ac_optimize_vs_outputs(&ctx->ac,
 			       ctx->main_function,
 			       outinfo->vs_output_param_offset,
-			       VARYING_SLOT_MAX,
+			       VARYING_SLOT_MAX, 0,
 			       &outinfo->param_exports);
 }
 
diff --git a/src/gallium/drivers/radeonsi/si_shader.c b/src/gallium/drivers/radeonsi/si_shader.c
index fa35489ea50..0e62bf261fb 100644
--- a/src/gallium/drivers/radeonsi/si_shader.c
+++ b/src/gallium/drivers/radeonsi/si_shader.c
@@ -1369,6 +1369,7 @@ static void si_optimize_vs_outputs(struct si_shader_context *ctx)
 {
 	struct si_shader *shader = ctx->shader;
 	struct si_shader_info *info = &shader->selector->info;
+	unsigned skip_vs_optim_mask = 0;
 
 	if ((ctx->type != PIPE_SHADER_VERTEX &&
 	     ctx->type != PIPE_SHADER_TESS_EVAL) ||
@@ -1376,10 +1377,20 @@ static void si_optimize_vs_outputs(struct si_shader_context *ctx)
 	    shader->key.as_es)
 		return;
 
+	/* Optimizing these outputs is not possible, since they might be overriden
+	* at runtime with S_028644_PT_SPRITE_TEX. */
+	for (int i = 0; i < info->num_outputs; i++) {
+		if (info->output_semantic_name[i] == TGSI_SEMANTIC_PCOORD ||
+		  info->output_semantic_name[i] == TGSI_SEMANTIC_TEXCOORD) {
+			 skip_vs_optim_mask |= 1u << shader->info.vs_output_param_offset[i];
+		}
+	}
+
 	ac_optimize_vs_outputs(&ctx->ac,
 			       ctx->main_fn,
 			       shader->info.vs_output_param_offset,
 			       info->num_outputs,
+			       skip_vs_optim_mask,
 			       &shader->info.nr_param_exports);
 }
 



More information about the mesa-commit mailing list