Mesa (main): aco: Implement byte and lane permute intrinsics.
GitLab Mirror
gitlab-mirror at kemper.freedesktop.org
Wed Jun 9 17:25:49 UTC 2021
Module: Mesa
Branch: main
Commit: ce141e4c5f2297e5f7c9afbdd3f4c1beee449544
URL: http://cgit.freedesktop.org/mesa/mesa/commit/?id=ce141e4c5f2297e5f7c9afbdd3f4c1beee449544
Author: Timur Kristóf <timur.kristof at gmail.com>
Date: Fri May 28 21:57:43 2021 +0200
aco: Implement byte and lane permute intrinsics.
Signed-off-by: Timur Kristóf <timur.kristof at gmail.com>
Reviewed-by: Tony Wasserka <tony.wasserka at gmx.de>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/11072>
---
src/amd/compiler/aco_instruction_selection.cpp | 25 ++++++++++++++++++++++
.../compiler/aco_instruction_selection_setup.cpp | 2 ++
2 files changed, 27 insertions(+)
diff --git a/src/amd/compiler/aco_instruction_selection.cpp b/src/amd/compiler/aco_instruction_selection.cpp
index 40a1687c226..c06bdb1b1fb 100644
--- a/src/amd/compiler/aco_instruction_selection.cpp
+++ b/src/amd/compiler/aco_instruction_selection.cpp
@@ -8387,6 +8387,31 @@ void visit_intrinsic(isel_context *ctx, nir_intrinsic_instr *instr)
emit_wqm(bld, wqm_tmp, dst);
break;
}
+ case nir_intrinsic_byte_permute_amd: {
+ Temp dst = get_ssa_temp(ctx, &instr->dest.ssa);
+ assert(dst.regClass() == v1);
+ assert(ctx->program->chip_class >= GFX8);
+ bld.vop3(aco_opcode::v_perm_b32, Definition(dst),
+ get_ssa_temp(ctx, instr->src[0].ssa),
+ as_vgpr(ctx, get_ssa_temp(ctx, instr->src[1].ssa)),
+ as_vgpr(ctx, get_ssa_temp(ctx, instr->src[2].ssa)));
+ break;
+ }
+ case nir_intrinsic_lane_permute_16_amd: {
+ Temp src = get_ssa_temp(ctx, instr->src[0].ssa);
+ Temp dst = get_ssa_temp(ctx, &instr->dest.ssa);
+ assert(ctx->program->chip_class >= GFX10);
+
+ if (src.regClass() == s1) {
+ bld.copy(Definition(dst), src);
+ } else if (dst.regClass() == v1 && src.regClass() == v1) {
+ bld.vop3(aco_opcode::v_permlane16_b32, Definition(dst), src,
+ bld.as_uniform(get_ssa_temp(ctx, instr->src[1].ssa)), bld.as_uniform(get_ssa_temp(ctx, instr->src[2].ssa)));
+ } else {
+ isel_err(&instr->instr, "Unimplemented lane_permute_16_amd");
+ }
+ break;
+ }
case nir_intrinsic_load_helper_invocation:
case nir_intrinsic_is_helper_invocation: {
/* load_helper() after demote() get lowered to is_helper().
diff --git a/src/amd/compiler/aco_instruction_selection_setup.cpp b/src/amd/compiler/aco_instruction_selection_setup.cpp
index f7cebe0579f..7141bbf2c93 100644
--- a/src/amd/compiler/aco_instruction_selection_setup.cpp
+++ b/src/amd/compiler/aco_instruction_selection_setup.cpp
@@ -772,6 +772,8 @@ void init_context(isel_context *ctx, nir_shader *shader)
case nir_intrinsic_load_tess_coord:
case nir_intrinsic_write_invocation_amd:
case nir_intrinsic_mbcnt_amd:
+ case nir_intrinsic_byte_permute_amd:
+ case nir_intrinsic_lane_permute_16_amd:
case nir_intrinsic_load_instance_id:
case nir_intrinsic_ssbo_atomic_add:
case nir_intrinsic_ssbo_atomic_imin:
More information about the mesa-commit mailing list