[Mesa-dev] [PATCH v2 6/8] nvc0/ir: add a lowering pass for surfaces on Fermi
Ilia Mirkin
imirkin at alum.mit.edu
Mon May 16 19:22:43 UTC 2016
Reviewed-by: Ilia Mirkin <imirkin at alum.mit.edu>
On Mon, May 16, 2016 at 3:10 PM, Samuel Pitoiset
<samuel.pitoiset at gmail.com> wrote:
> v2: - remove one useless setSrc() call because moveSources() handles it
> - make sure the format doesn't mismatch only when it's != FMT_NONE
>
> Signed-off-by: Samuel Pitoiset <samuel.pitoiset at gmail.com>
> ---
> .../nouveau/codegen/nv50_ir_lowering_nvc0.cpp | 116 +++++++++++++++++++++
> .../nouveau/codegen/nv50_ir_lowering_nvc0.h | 2 +
> 2 files changed, 118 insertions(+)
>
> diff --git a/src/gallium/drivers/nouveau/codegen/nv50_ir_lowering_nvc0.cpp b/src/gallium/drivers/nouveau/codegen/nv50_ir_lowering_nvc0.cpp
> index 1068c21..fe3b9a4 100644
> --- a/src/gallium/drivers/nouveau/codegen/nv50_ir_lowering_nvc0.cpp
> +++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_lowering_nvc0.cpp
> @@ -1982,6 +1982,120 @@ NVC0LoweringPass::handleSurfaceOpNVE4(TexInstruction *su)
> su->sType = (su->tex.target == TEX_TARGET_BUFFER) ? TYPE_U32 : TYPE_U8;
> }
>
> +void
> +NVC0LoweringPass::processSurfaceCoordsNVC0(TexInstruction *su)
> +{
> + const int idx = su->tex.r;
> + const int dim = su->tex.target.getDim();
> + const int arg = dim + (su->tex.target.isArray() || su->tex.target.isCube());
> + const uint16_t base = idx * NVE4_SU_INFO__STRIDE;
> + int c;
> + Value *zero = bld.mkImm(0);
> + Value *src[3];
> + Value *v;
> + Value *ind = NULL;
> +
> + if (su->tex.rIndirectSrc >= 0) {
> + // FIXME: out of bounds
> + assert(su->tex.r == 0);
> + ind = bld.mkOp2v(OP_SHL, TYPE_U32, bld.getSSA(),
> + su->getIndirectR(), bld.mkImm(6));
> + }
> +
> + // get surface coordinates
> + for (c = 0; c < arg; ++c)
> + src[c] = su->getSrc(c);
> + for (; c < 3; ++c)
> + src[c] = zero;
> +
> + // calculate pixel offset
> + if (su->op == OP_SULDP || su->op == OP_SUREDP) {
> + v = loadSuInfo32(ind, base + NVE4_SU_INFO_BSIZE);
> + su->setSrc(0, bld.mkOp2v(OP_MUL, TYPE_U32, bld.getSSA(), src[0], v));
> + }
> +
> + // add array layer offset
> + if (su->tex.target.isArray() || su->tex.target.isCube()) {
> + v = loadSuInfo32(ind, base + NVE4_SU_INFO_ARRAY);
> + assert(dim > 1);
> + su->setSrc(2, bld.mkOp2v(OP_MUL, TYPE_U32, bld.getSSA(), src[2], v));
> + }
> +
> + // prevent read fault when the image is not actually bound
> + CmpInstruction *pred =
> + bld.mkCmp(OP_SET, CC_EQ, TYPE_U32, bld.getSSA(1, FILE_PREDICATE),
> + TYPE_U32, bld.mkImm(0),
> + loadSuInfo32(ind, base + NVE4_SU_INFO_ADDR));
> + if (su->tex.format) {
> + const TexInstruction::ImgFormatDesc *format = su->tex.format;
> + int blockwidth = format->bits[0] + format->bits[1] +
> + format->bits[2] + format->bits[3];
> +
> + if (format->components != 0) {
> + // make sure that the format doesn't mismatch when it's not FMT_NONE
> + bld.mkCmp(OP_SET_OR, CC_NE, TYPE_U32, pred->getDef(0),
> + TYPE_U32, bld.loadImm(NULL, blockwidth / 8),
> + loadSuInfo32(ind, base + NVE4_SU_INFO_BSIZE),
> + pred->getDef(0));
> + }
> + }
> + su->setPredicate(CC_NOT_P, pred->getDef(0));
> +}
> +
> +void
> +NVC0LoweringPass::handleSurfaceOpNVC0(TexInstruction *su)
> +{
> + if (su->tex.target == TEX_TARGET_1D_ARRAY) {
> + /* As 1d arrays also need 3 coordinates, switching to TEX_TARGET_2D_ARRAY
> + * will simplify the lowering pass and the texture constraints. */
> + su->moveSources(1, 1);
> + su->setSrc(1, bld.loadImm(NULL, 0));
> + su->tex.target = TEX_TARGET_2D_ARRAY;
> + }
> +
> + processSurfaceCoordsNVC0(su);
> +
> + if (su->op == OP_SULDP)
> + convertSurfaceFormat(su);
> +
> + if (su->op == OP_SUREDB || su->op == OP_SUREDP) {
> + const int dim = su->tex.target.getDim();
> + const int arg = dim + (su->tex.target.isArray() || su->tex.target.isCube());
> + LValue *addr = bld.getSSA(8);
> + Value *def = su->getDef(0);
> +
> + su->op = OP_SULEA;
> +
> + // Set the destination to the address
> + su->dType = TYPE_U64;
> + su->setDef(0, addr);
> + su->setDef(1, su->getPredicate());
> +
> + bld.setPosition(su, true);
> +
> + // Perform the atomic op
> + Instruction *red = bld.mkOp(OP_ATOM, su->sType, bld.getSSA());
> + red->subOp = su->subOp;
> + red->setSrc(0, bld.mkSymbol(FILE_MEMORY_GLOBAL, 0, su->sType, 0));
> + red->setSrc(1, su->getSrc(arg));
> + if (red->subOp == NV50_IR_SUBOP_ATOM_CAS)
> + red->setSrc(2, su->getSrc(arg + 1));
> + red->setIndirect(0, 0, addr);
> +
> + // make sure to initialize dst value when the atomic operation is not
> + // performed
> + Instruction *mov = bld.mkMov(bld.getSSA(), bld.loadImm(NULL, 0));
> +
> + assert(su->cc == CC_NOT_P);
> + red->setPredicate(su->cc, su->getPredicate());
> + mov->setPredicate(CC_P, su->getPredicate());
> +
> + bld.mkOp2(OP_UNION, TYPE_U32, def, red->getDef(0), mov->getDef(0));
> +
> + handleCasExch(red, false);
> + }
> +}
> +
> bool
> NVC0LoweringPass::handleWRSV(Instruction *i)
> {
> @@ -2455,6 +2569,8 @@ NVC0LoweringPass::visit(Instruction *i)
> case OP_SUREDP:
> if (targ->getChipset() >= NVISA_GK104_CHIPSET)
> handleSurfaceOpNVE4(i->asTex());
> + else
> + handleSurfaceOpNVC0(i->asTex());
> break;
> case OP_SUQ:
> handleSUQ(i->asTex());
> diff --git a/src/gallium/drivers/nouveau/codegen/nv50_ir_lowering_nvc0.h b/src/gallium/drivers/nouveau/codegen/nv50_ir_lowering_nvc0.h
> index c007e09..2321956 100644
> --- a/src/gallium/drivers/nouveau/codegen/nv50_ir_lowering_nvc0.h
> +++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_lowering_nvc0.h
> @@ -106,6 +106,7 @@ protected:
> bool handleATOM(Instruction *);
> bool handleCasExch(Instruction *, bool needCctl);
> void handleSurfaceOpNVE4(TexInstruction *);
> + void handleSurfaceOpNVC0(TexInstruction *);
> void handleSharedATOM(Instruction *);
> void handleSharedATOMNVE4(Instruction *);
> void handleLDST(Instruction *);
> @@ -138,6 +139,7 @@ private:
>
> void adjustCoordinatesMS(TexInstruction *);
> void processSurfaceCoordsNVE4(TexInstruction *);
> + void processSurfaceCoordsNVC0(TexInstruction *);
> void convertSurfaceFormat(TexInstruction *);
>
> protected:
> --
> 2.8.2
>
> _______________________________________________
> mesa-dev mailing list
> mesa-dev at lists.freedesktop.org
> https://lists.freedesktop.org/mailman/listinfo/mesa-dev
More information about the mesa-dev
mailing list