[Mesa-dev] [PATCH 2/2] radeonsi: implement TGSI_OPCODE_BFI (v2)
Tom Stellard
tom at stellard.net
Mon Mar 16 06:22:21 PDT 2015
On Sun, Mar 15, 2015 at 07:59:52PM +0100, Marek Olšák wrote:
> From: Marek Olšák <marek.olsak at amd.com>
>
> v2: Don't use the intrinsics, the shader backend can recognize these
> patterns and generates optimal code automatically.
Reviewed-by: Tom Stellard <thomas.stellard at amd.com>
> ---
> .../drivers/radeon/radeon_setup_tgsi_llvm.c | 34 ++++++++++++++++++++++
> 1 file changed, 34 insertions(+)
>
> diff --git a/src/gallium/drivers/radeon/radeon_setup_tgsi_llvm.c b/src/gallium/drivers/radeon/radeon_setup_tgsi_llvm.c
> index 0034b56..d89e2b4 100644
> --- a/src/gallium/drivers/radeon/radeon_setup_tgsi_llvm.c
> +++ b/src/gallium/drivers/radeon/radeon_setup_tgsi_llvm.c
> @@ -1234,6 +1234,39 @@ build_tgsi_intrinsic_nomem(
> build_tgsi_intrinsic(action, bld_base, emit_data, LLVMReadNoneAttribute);
> }
>
> +static void emit_bfi(const struct lp_build_tgsi_action * action,
> + struct lp_build_tgsi_context * bld_base,
> + struct lp_build_emit_data * emit_data)
> +{
> + struct gallivm_state *gallivm = bld_base->base.gallivm;
> + LLVMBuilderRef builder = gallivm->builder;
> + LLVMValueRef bfi_args[3];
> +
> + // Calculate the bitmask: (((1 << src3) - 1) << src2
> + bfi_args[0] = LLVMBuildShl(builder,
> + LLVMBuildSub(builder,
> + LLVMBuildShl(builder,
> + bld_base->int_bld.one,
> + emit_data->args[3], ""),
> + bld_base->int_bld.one, ""),
> + emit_data->args[2], "");
> +
> + bfi_args[1] = LLVMBuildShl(builder, emit_data->args[1],
> + emit_data->args[2], "");
> +
> + bfi_args[2] = emit_data->args[0];
> +
> + /* Calculate:
> + * (arg0 & arg1) | (~arg0 & arg2) = arg2 ^ (arg0 & (arg1 ^ arg2)
> + * Use the right-hand side, which the LLVM backend can convert to V_BFI.
> + */
> + emit_data->output[emit_data->chan] =
> + LLVMBuildXor(builder, bfi_args[2],
> + LLVMBuildAnd(builder, bfi_args[0],
> + LLVMBuildXor(builder, bfi_args[1], bfi_args[2],
> + ""), ""), "");
> +}
> +
> /* this is ffs in C */
> static void emit_lsb(const struct lp_build_tgsi_action * action,
> struct lp_build_tgsi_context * bld_base,
> @@ -1381,6 +1414,7 @@ void radeon_llvm_context_init(struct radeon_llvm_context * ctx)
> bld_base->op_actions[TGSI_OPCODE_ABS].intr_name = "fabs";
> bld_base->op_actions[TGSI_OPCODE_AND].emit = emit_and;
> bld_base->op_actions[TGSI_OPCODE_ARL].emit = emit_arl;
> + bld_base->op_actions[TGSI_OPCODE_BFI].emit = emit_bfi;
> bld_base->op_actions[TGSI_OPCODE_BGNLOOP].emit = bgnloop_emit;
> bld_base->op_actions[TGSI_OPCODE_BREV].emit = build_tgsi_intrinsic_nomem;
> bld_base->op_actions[TGSI_OPCODE_BREV].intr_name = "llvm.AMDGPU.brev";
> --
> 2.1.0
>
> _______________________________________________
> mesa-dev mailing list
> mesa-dev at lists.freedesktop.org
> http://lists.freedesktop.org/mailman/listinfo/mesa-dev
More information about the mesa-dev
mailing list