[Mesa-dev] [PATCH] swr/rast: fix intrinsic/function for LLVM 7 compatibility

Cherniak, Bruce bruce.cherniak at intel.com
Tue Oct 16 12:51:18 UTC 2018


Reviewed-by: Bruce Cherniak <bruce.cherniak at intel.com>

> On Oct 15, 2018, at 9:53 AM, Alok Hota <alok.hota at intel.com> wrote:
> 
> Converted from the x86 VFMADDPS intrinsic to the generic LLVM fmuladd
> intrinsic, and removed createInstructionSimplifierPass. Both the x86
> intrinsic and the pass were removed in LLVM 7.0.0.
> 
> These changes combine patches we received from the community with our
> own internal patches.
> ---
> .../swr/rasterizer/codegen/gen_llvm_ir_macros.py      |  2 +-
> .../drivers/swr/rasterizer/jitter/blend_jit.cpp       |  1 -
> .../drivers/swr/rasterizer/jitter/builder_misc.cpp    | 11 ++---------
> .../drivers/swr/rasterizer/jitter/fetch_jit.cpp       |  1 -
> .../rasterizer/jitter/functionpasses/lower_x86.cpp    |  1 -
> .../drivers/swr/rasterizer/jitter/streamout_jit.cpp   |  1 -
> 6 files changed, 3 insertions(+), 14 deletions(-)
> 
> diff --git a/src/gallium/drivers/swr/rasterizer/codegen/gen_llvm_ir_macros.py b/src/gallium/drivers/swr/rasterizer/codegen/gen_llvm_ir_macros.py
> index 2e7f1a88a0..d34e88d1bc 100644
> --- a/src/gallium/drivers/swr/rasterizer/codegen/gen_llvm_ir_macros.py
> +++ b/src/gallium/drivers/swr/rasterizer/codegen/gen_llvm_ir_macros.py
> @@ -57,7 +57,6 @@ intrinsics = [
>     ['VHSUBPS',     ['a', 'b'], 'a'],
>     ['VPTESTC',     ['a', 'b'], 'mInt32Ty'],
>     ['VPTESTZ',     ['a', 'b'], 'mInt32Ty'],
> -    ['VFMADDPS',    ['a', 'b', 'c'], 'a'],
>     ['VPHADDD',     ['a', 'b'], 'a'],
>     ['PDEP32',      ['a', 'b'], 'a'],
>     ['RDTSC',       [], 'mInt64Ty'],
> @@ -71,6 +70,7 @@ llvm_intrinsics = [
>     ['STACKRESTORE', 'stackrestore', ['a'], []],
>     ['VMINPS', 'minnum', ['a', 'b'], ['a']],
>     ['VMAXPS', 'maxnum', ['a', 'b'], ['a']],
> +    ['VFMADDPS', 'fmuladd', ['a', 'b', 'c'], ['a']],
>     ['DEBUGTRAP', 'debugtrap', [], []],
>     ['POPCNT', 'ctpop', ['a'], ['a']],
>     ['LOG2', 'log2', ['a'], ['a']],
> diff --git a/src/gallium/drivers/swr/rasterizer/jitter/blend_jit.cpp b/src/gallium/drivers/swr/rasterizer/jitter/blend_jit.cpp
> index f89c502db7..d5328c8e4e 100644
> --- a/src/gallium/drivers/swr/rasterizer/jitter/blend_jit.cpp
> +++ b/src/gallium/drivers/swr/rasterizer/jitter/blend_jit.cpp
> @@ -870,7 +870,6 @@ struct BlendJit : public Builder
>         passes.add(createCFGSimplificationPass());
>         passes.add(createEarlyCSEPass());
>         passes.add(createInstructionCombiningPass());
> -        passes.add(createInstructionSimplifierPass());
>         passes.add(createConstantPropagationPass());
>         passes.add(createSCCPPass());
>         passes.add(createAggressiveDCEPass());
> diff --git a/src/gallium/drivers/swr/rasterizer/jitter/builder_misc.cpp b/src/gallium/drivers/swr/rasterizer/jitter/builder_misc.cpp
> index 4116dad443..26d8688f5e 100644
> --- a/src/gallium/drivers/swr/rasterizer/jitter/builder_misc.cpp
> +++ b/src/gallium/drivers/swr/rasterizer/jitter/builder_misc.cpp
> @@ -755,15 +755,8 @@ namespace SwrJit
>     Value* Builder::FMADDPS(Value* a, Value* b, Value* c)
>     {
>         Value* vOut;
> -        // use FMADs if available
> -        if (JM()->mArch.AVX2())
> -        {
> -            vOut = VFMADDPS(a, b, c);
> -        }
> -        else
> -        {
> -            vOut = FADD(FMUL(a, b), c);
> -        }
> +        // This maps to LLVM fmuladd intrinsic
> +        vOut = VFMADDPS(a, b, c);
>         return vOut;
>     }
> 
> diff --git a/src/gallium/drivers/swr/rasterizer/jitter/fetch_jit.cpp b/src/gallium/drivers/swr/rasterizer/jitter/fetch_jit.cpp
> index b4d326ebdc..3ad0fabe81 100644
> --- a/src/gallium/drivers/swr/rasterizer/jitter/fetch_jit.cpp
> +++ b/src/gallium/drivers/swr/rasterizer/jitter/fetch_jit.cpp
> @@ -294,7 +294,6 @@ Function* FetchJit::Create(const FETCH_COMPILE_STATE& fetchState)
>     optPasses.add(createCFGSimplificationPass());
>     optPasses.add(createEarlyCSEPass());
>     optPasses.add(createInstructionCombiningPass());
> -    optPasses.add(createInstructionSimplifierPass());
>     optPasses.add(createConstantPropagationPass());
>     optPasses.add(createSCCPPass());
>     optPasses.add(createAggressiveDCEPass());
> diff --git a/src/gallium/drivers/swr/rasterizer/jitter/functionpasses/lower_x86.cpp b/src/gallium/drivers/swr/rasterizer/jitter/functionpasses/lower_x86.cpp
> index 7605823c04..c34959d35e 100644
> --- a/src/gallium/drivers/swr/rasterizer/jitter/functionpasses/lower_x86.cpp
> +++ b/src/gallium/drivers/swr/rasterizer/jitter/functionpasses/lower_x86.cpp
> @@ -76,7 +76,6 @@ namespace SwrJit
>         {"meta.intrinsic.VCVTPS2PH", Intrinsic::x86_vcvtps2ph_256},
>         {"meta.intrinsic.VPTESTC", Intrinsic::x86_avx_ptestc_256},
>         {"meta.intrinsic.VPTESTZ", Intrinsic::x86_avx_ptestz_256},
> -        {"meta.intrinsic.VFMADDPS", Intrinsic::x86_fma_vfmadd_ps_256},
>         {"meta.intrinsic.VPHADDD", Intrinsic::x86_avx2_phadd_d},
>         {"meta.intrinsic.PDEP32", Intrinsic::x86_bmi_pdep_32},
>         {"meta.intrinsic.RDTSC", Intrinsic::x86_rdtsc},
> diff --git a/src/gallium/drivers/swr/rasterizer/jitter/streamout_jit.cpp b/src/gallium/drivers/swr/rasterizer/jitter/streamout_jit.cpp
> index 8f86af2a4b..11ad36521b 100644
> --- a/src/gallium/drivers/swr/rasterizer/jitter/streamout_jit.cpp
> +++ b/src/gallium/drivers/swr/rasterizer/jitter/streamout_jit.cpp
> @@ -306,7 +306,6 @@ struct StreamOutJit : public Builder
>         passes.add(createCFGSimplificationPass());
>         passes.add(createEarlyCSEPass());
>         passes.add(createInstructionCombiningPass());
> -        passes.add(createInstructionSimplifierPass());
>         passes.add(createConstantPropagationPass());
>         passes.add(createSCCPPass());
>         passes.add(createAggressiveDCEPass());
> -- 
> 2.17.1
> 
> _______________________________________________
> mesa-dev mailing list
> mesa-dev at lists.freedesktop.org
> https://lists.freedesktop.org/mailman/listinfo/mesa-dev



More information about the mesa-dev mailing list