[Mesa-dev] [PATCH v2 1/7] nv50/ir: add nv50_ir_prog_info_out
Mark Menzynski
mmenzyns at redhat.com
Fri Feb 21 12:19:56 UTC 2020
From: Karol Herbst <kherbst at redhat.com>
Split the output-relevant fields out of the nv50_ir_prog_info struct into
a new nv50_ir_prog_info_out struct, in order to have a cleaner separation
between the input and the output of the compilation.
Signed-off-by: Karol Herbst <kherbst at redhat.com>
---
.../drivers/nouveau/codegen/nv50_ir.cpp | 49 ++--
src/gallium/drivers/nouveau/codegen/nv50_ir.h | 9 +-
.../drivers/nouveau/codegen/nv50_ir_driver.h | 117 +++++---
.../nouveau/codegen/nv50_ir_from_common.cpp | 14 +-
.../nouveau/codegen/nv50_ir_from_common.h | 3 +-
.../nouveau/codegen/nv50_ir_from_nir.cpp | 204 +++++++-------
.../nouveau/codegen/nv50_ir_from_tgsi.cpp | 256 +++++++++---------
.../nouveau/codegen/nv50_ir_lowering_nvc0.cpp | 6 +-
.../nouveau/codegen/nv50_ir_target.cpp | 2 +-
.../drivers/nouveau/codegen/nv50_ir_target.h | 5 +-
.../nouveau/codegen/nv50_ir_target_nv50.cpp | 17 +-
.../nouveau/codegen/nv50_ir_target_nv50.h | 3 +-
.../drivers/nouveau/nouveau_compiler.c | 9 +-
.../drivers/nouveau/nv50/nv50_program.c | 61 +++--
.../drivers/nouveau/nvc0/nvc0_program.c | 89 +++---
15 files changed, 450 insertions(+), 394 deletions(-)
diff --git a/src/gallium/drivers/nouveau/codegen/nv50_ir.cpp b/src/gallium/drivers/nouveau/codegen/nv50_ir.cpp
index c65853578f6..c2c5956874a 100644
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir.cpp
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir.cpp
@@ -1241,15 +1241,18 @@ void Program::releaseValue(Value *value)
extern "C" {
static void
-nv50_ir_init_prog_info(struct nv50_ir_prog_info *info)
+nv50_ir_init_prog_info(struct nv50_ir_prog_info *info,
+ struct nv50_ir_prog_info_out *info_out)
{
+ info_out->target = info->target;
+ info_out->type = info->type;
if (info->type == PIPE_SHADER_TESS_CTRL || info->type == PIPE_SHADER_TESS_EVAL) {
- info->prop.tp.domain = PIPE_PRIM_MAX;
- info->prop.tp.outputPrim = PIPE_PRIM_MAX;
+ info_out->prop.tp.domain = PIPE_PRIM_MAX;
+ info_out->prop.tp.outputPrim = PIPE_PRIM_MAX;
}
if (info->type == PIPE_SHADER_GEOMETRY) {
- info->prop.gp.instanceCount = 1;
- info->prop.gp.maxVertices = 1;
+ info_out->prop.gp.instanceCount = 1;
+ info_out->prop.gp.maxVertices = 1;
}
if (info->type == PIPE_SHADER_COMPUTE) {
info->prop.cp.numThreads[0] =
@@ -1257,23 +1260,26 @@ nv50_ir_init_prog_info(struct nv50_ir_prog_info *info)
info->prop.cp.numThreads[2] = 1;
}
info->io.pointSize = 0xff;
- info->io.instanceId = 0xff;
- info->io.vertexId = 0xff;
- info->io.edgeFlagIn = 0xff;
- info->io.edgeFlagOut = 0xff;
- info->io.fragDepth = 0xff;
- info->io.sampleMask = 0xff;
+ info_out->bin.smemSize = info->bin.smemSize;
+ info_out->io.genUserClip = info->io.genUserClip;
+ info_out->io.instanceId = 0xff;
+ info_out->io.vertexId = 0xff;
+ info_out->io.edgeFlagIn = 0xff;
+ info_out->io.edgeFlagOut = 0xff;
+ info_out->io.fragDepth = 0xff;
+ info_out->io.sampleMask = 0xff;
info->io.backFaceColor[0] = info->io.backFaceColor[1] = 0xff;
}
int
-nv50_ir_generate_code(struct nv50_ir_prog_info *info)
+nv50_ir_generate_code(struct nv50_ir_prog_info *info,
+ struct nv50_ir_prog_info_out *info_out)
{
int ret = 0;
nv50_ir::Program::Type type;
- nv50_ir_init_prog_info(info);
+ nv50_ir_init_prog_info(info, info_out);
#define PROG_TYPE_CASE(a, b) \
case PIPE_SHADER_##a: type = nv50_ir::Program::TYPE_##b; break
@@ -1301,15 +1307,16 @@ nv50_ir_generate_code(struct nv50_ir_prog_info *info)
return -1;
}
prog->driver = info;
+ prog->driver_out = info_out;
prog->dbgFlags = info->dbgFlags;
prog->optLevel = info->optLevel;
switch (info->bin.sourceRep) {
case PIPE_SHADER_IR_NIR:
- ret = prog->makeFromNIR(info) ? 0 : -2;
+ ret = prog->makeFromNIR(info, info_out) ? 0 : -2;
break;
case PIPE_SHADER_IR_TGSI:
- ret = prog->makeFromTGSI(info) ? 0 : -2;
+ ret = prog->makeFromTGSI(info, info_out) ? 0 : -2;
break;
default:
ret = -1;
@@ -1320,7 +1327,7 @@ nv50_ir_generate_code(struct nv50_ir_prog_info *info)
if (prog->dbgFlags & NV50_IR_DEBUG_VERBOSE)
prog->print();
- targ->parseDriverInfo(info);
+ targ->parseDriverInfo(info, info_out);
prog->getTarget()->runLegalizePass(prog, nv50_ir::CG_STAGE_PRE_SSA);
prog->convertToSSA();
@@ -1342,7 +1349,7 @@ nv50_ir_generate_code(struct nv50_ir_prog_info *info)
prog->optimizePostRA(info->optLevel);
- if (!prog->emitBinary(info)) {
+ if (!prog->emitBinary(info_out)) {
ret = -5;
goto out;
}
@@ -1350,10 +1357,10 @@ nv50_ir_generate_code(struct nv50_ir_prog_info *info)
out:
INFO_DBG(prog->dbgFlags, VERBOSE, "nv50_ir_generate_code: ret = %i\n", ret);
- info->bin.maxGPR = prog->maxGPR;
- info->bin.code = prog->code;
- info->bin.codeSize = prog->binSize;
- info->bin.tlsSpace = prog->tlsSize;
+ info_out->bin.maxGPR = prog->maxGPR;
+ info_out->bin.code = prog->code;
+ info_out->bin.codeSize = prog->binSize;
+ info_out->bin.tlsSpace = prog->tlsSize;
delete prog;
nv50_ir::Target::destroy(targ);
diff --git a/src/gallium/drivers/nouveau/codegen/nv50_ir.h b/src/gallium/drivers/nouveau/codegen/nv50_ir.h
index d2200fc4ea9..78eb3437800 100644
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir.h
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir.h
@@ -1286,13 +1286,15 @@ public:
inline void del(Function *fn, int& id) { allFuncs.remove(id); }
inline void add(Value *rval, int& id) { allRValues.insert(rval, id); }
- bool makeFromNIR(struct nv50_ir_prog_info *);
- bool makeFromTGSI(struct nv50_ir_prog_info *);
+ bool makeFromNIR(struct nv50_ir_prog_info *,
+ struct nv50_ir_prog_info_out *);
+ bool makeFromTGSI(struct nv50_ir_prog_info *,
+ struct nv50_ir_prog_info_out *);
bool convertToSSA();
bool optimizeSSA(int level);
bool optimizePostRA(int level);
bool registerAllocation();
- bool emitBinary(struct nv50_ir_prog_info *);
+ bool emitBinary(struct nv50_ir_prog_info_out *);
const Target *getTarget() const { return target; }
@@ -1328,6 +1330,7 @@ public:
void *targetPriv; // e.g. to carry information between passes
const struct nv50_ir_prog_info *driver; // for driver configuration
+ const struct nv50_ir_prog_info_out *driver_out; // compilation output (binary and metadata) for the driver
void releaseInstruction(Instruction *);
void releaseValue(Value *);
diff --git a/src/gallium/drivers/nouveau/codegen/nv50_ir_driver.h b/src/gallium/drivers/nouveau/codegen/nv50_ir_driver.h
index 55cc4c609f0..dab1ce030cb 100644
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_driver.h
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_driver.h
@@ -75,6 +75,9 @@ struct nv50_ir_prog_symbol
#define NVISA_GM107_CHIPSET 0x110
#define NVISA_GM200_CHIPSET 0x120
+struct nv50_ir_prog_info_out;
+
+/* used for the input data and the assignSlots interface */
struct nv50_ir_prog_info
{
uint16_t target; /* chipset (0x50, 0x84, 0xc0, ...) */
@@ -86,15 +89,78 @@ struct nv50_ir_prog_info
bool omitLineNum; /* only used for printing the prog when dbgFlags is set */
struct {
- int16_t maxGPR; /* may be -1 if none used */
int16_t maxOutput;
+ uint32_t smemSize; /* required shared memory per block */
+ uint8_t sourceRep; /* PIPE_SHADER_IR_* */
+ const void *source;
+ } bin;
+
+ struct {
+ uint32_t *buf; /* for IMMEDIATE_ARRAY */
+ uint16_t bufSize; /* size of immediate array */
+ uint16_t count; /* count of inline immediates */
+ uint32_t *data; /* inline immediate data */
+ uint8_t *type; /* for each vec4 (128 bit) */
+ } immd;
+
+ union {
+ struct {
+ uint32_t inputMask[4]; /* mask of attributes read (1 bit per scalar) */
+ } vp;
+ struct {
+ uint8_t inputPrim;
+ } gp;
+ struct {
+ bool persampleInvocation;
+ } fp;
+ struct {
+ uint32_t inputOffset; /* base address for user args */
+ uint32_t sharedOffset; /* reserved space in s[] */
+ uint32_t gridInfoBase; /* base address for NTID,NCTAID */
+ uint16_t numThreads[3]; /* max number of threads */
+ } cp;
+ } prop;
+
+ struct {
+ int8_t genUserClip; /* request user clip planes for ClipVertex */
+ uint8_t auxCBSlot; /* driver constant buffer slot */
+ uint16_t ucpBase; /* base address for UCPs */
+ uint16_t drawInfoBase; /* base address for draw parameters */
+ uint16_t alphaRefBase; /* base address for alpha test values */
+ uint8_t pointSize; /* output index for PointSize */
+ int8_t viewportId; /* output index of ViewportIndex */
+ uint8_t backFaceColor[2]; /* input/output indices of back face colour */
+ bool mul_zero_wins; /* program wants for x*0 = 0 */
+ bool nv50styleSurfaces; /* generate gX[] access for raw buffers */
+ uint16_t texBindBase; /* base address for tex handles (nve4) */
+ uint16_t fbtexBindBase; /* base address for fbtex handle (nve4) */
+ uint16_t suInfoBase; /* base address for surface info (nve4) */
+ uint16_t bindlessBase; /* base address for bindless image info (nve4) */
+ uint16_t bufInfoBase; /* base address for buffer info */
+ uint16_t sampleInfoBase; /* base address for sample positions */
+ uint8_t msInfoCBSlot; /* cX[] used for multisample info */
+ uint16_t msInfoBase; /* base address for multisample info */
+ uint16_t uboInfoBase; /* base address for compute UBOs (gk104+) */
+ } io;
+
+ /* driver callback to assign input/output locations */
+ int (*assignSlots)(struct nv50_ir_prog_info_out *);
+};
+
+/* the produced binary with metadata */
+struct nv50_ir_prog_info_out
+{
+ uint16_t target; /* chipset (0x50, 0x84, 0xc0, ...) */
+
+ uint8_t type; /* PIPE_SHADER */
+
+ struct {
+ int16_t maxGPR; /* may be -1 if none used */
uint32_t tlsSpace; /* required local memory per thread */
uint32_t smemSize; /* required shared memory per block */
uint32_t *code;
uint32_t codeSize;
uint32_t instructions;
- uint8_t sourceRep; /* PIPE_SHADER_IR_* */
- const void *source;
void *relocData;
void *fixupData;
} bin;
@@ -107,17 +173,8 @@ struct nv50_ir_prog_info
uint8_t numPatchConstants; /* also included in numInputs/numOutputs */
uint8_t numSysVals;
- struct {
- uint32_t *buf; /* for IMMEDIATE_ARRAY */
- uint16_t bufSize; /* size of immediate array */
- uint16_t count; /* count of inline immediates */
- uint32_t *data; /* inline immediate data */
- uint8_t *type; /* for each vec4 (128 bit) */
- } immd;
-
union {
struct {
- uint32_t inputMask[4]; /* mask of attributes read (1 bit per scalar) */
bool usesDrawParameters;
} vp;
struct {
@@ -128,7 +185,6 @@ struct nv50_ir_prog_info
uint8_t outputPrim; /* PIPE_PRIM_{TRIANGLES,LINES,POINTS} */
} tp;
struct {
- uint8_t inputPrim;
uint8_t outputPrim;
unsigned instanceCount;
unsigned maxVertices;
@@ -138,57 +194,29 @@ struct nv50_ir_prog_info
bool writesDepth;
bool earlyFragTests;
bool postDepthCoverage;
- bool separateFragData;
bool usesDiscard;
- bool persampleInvocation;
bool usesSampleMaskIn;
bool readsFramebuffer;
bool readsSampleLocations;
+ bool separateFragData;
} fp;
- struct {
- uint32_t inputOffset; /* base address for user args */
- uint32_t sharedOffset; /* reserved space in s[] */
- uint32_t gridInfoBase; /* base address for NTID,NCTAID */
- uint16_t numThreads[3]; /* max number of threads */
- } cp;
} prop;
- uint8_t numBarriers;
-
struct {
uint8_t clipDistances; /* number of clip distance outputs */
uint8_t cullDistances; /* number of cull distance outputs */
int8_t genUserClip; /* request user clip planes for ClipVertex */
- uint8_t auxCBSlot; /* driver constant buffer slot */
- uint16_t ucpBase; /* base address for UCPs */
- uint16_t drawInfoBase; /* base address for draw parameters */
- uint16_t alphaRefBase; /* base address for alpha test values */
- uint8_t pointSize; /* output index for PointSize */
uint8_t instanceId; /* system value index of InstanceID */
uint8_t vertexId; /* system value index of VertexID */
uint8_t edgeFlagIn;
uint8_t edgeFlagOut;
- int8_t viewportId; /* output index of ViewportIndex */
uint8_t fragDepth; /* output index of FragDepth */
uint8_t sampleMask; /* output index of SampleMask */
- uint8_t backFaceColor[2]; /* input/output indices of back face colour */
uint8_t globalAccess; /* 1 for read, 2 for wr, 3 for rw */
bool fp64; /* program uses fp64 math */
- bool mul_zero_wins; /* program wants for x*0 = 0 */
- bool nv50styleSurfaces; /* generate gX[] access for raw buffers */
- uint16_t texBindBase; /* base address for tex handles (nve4) */
- uint16_t fbtexBindBase; /* base address for fbtex handle (nve4) */
- uint16_t suInfoBase; /* base address for surface info (nve4) */
- uint16_t bindlessBase; /* base address for bindless image info (nve4) */
- uint16_t bufInfoBase; /* base address for buffer info */
- uint16_t sampleInfoBase; /* base address for sample positions */
- uint8_t msInfoCBSlot; /* cX[] used for multisample info */
- uint16_t msInfoBase; /* base address for multisample info */
- uint16_t uboInfoBase; /* base address for compute UBOs (gk104+) */
} io;
- /* driver callback to assign input/output locations */
- int (*assignSlots)(struct nv50_ir_prog_info *);
+ uint8_t numBarriers;
void *driverPriv;
};
@@ -197,7 +225,8 @@ struct nv50_ir_prog_info
extern "C" {
#endif
-extern int nv50_ir_generate_code(struct nv50_ir_prog_info *);
+extern int nv50_ir_generate_code(struct nv50_ir_prog_info *,
+ struct nv50_ir_prog_info_out *);
extern void nv50_ir_relocate_code(void *relocData, uint32_t *code,
uint32_t codePos,
diff --git a/src/gallium/drivers/nouveau/codegen/nv50_ir_from_common.cpp b/src/gallium/drivers/nouveau/codegen/nv50_ir_from_common.cpp
index 0ad6087e588..0a70c6881cc 100644
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_from_common.cpp
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_from_common.cpp
@@ -24,9 +24,11 @@
namespace nv50_ir {
-ConverterCommon::ConverterCommon(Program *prog, nv50_ir_prog_info *info)
+ConverterCommon::ConverterCommon(Program *prog, nv50_ir_prog_info *info,
+ nv50_ir_prog_info_out *info_out)
: BuildUtil(prog),
- info(info) {}
+ info(info),
+ info_out(info_out) {}
ConverterCommon::Subroutine *
ConverterCommon::getSubroutine(unsigned ip)
@@ -82,7 +84,7 @@ ConverterCommon::handleUserClipPlanes()
int n, i, c;
for (c = 0; c < 4; ++c) {
- for (i = 0; i < info->io.genUserClip; ++i) {
+ for (i = 0; i < info_out->io.genUserClip; ++i) {
Symbol *sym = mkSymbol(FILE_MEMORY_CONST, info->io.auxCBSlot,
TYPE_F32, info->io.ucpBase + i * 16 + c * 4);
Value *ucp = mkLoadv(TYPE_F32, sym, NULL);
@@ -93,13 +95,13 @@ ConverterCommon::handleUserClipPlanes()
}
}
- const int first = info->numOutputs - (info->io.genUserClip + 3) / 4;
+ const int first = info_out->numOutputs - (info_out->io.genUserClip + 3) / 4;
- for (i = 0; i < info->io.genUserClip; ++i) {
+ for (i = 0; i < info_out->io.genUserClip; ++i) {
n = i / 4 + first;
c = i % 4;
Symbol *sym =
- mkSymbol(FILE_SHADER_OUTPUT, 0, TYPE_F32, info->out[n].slot[c] * 4);
+ mkSymbol(FILE_SHADER_OUTPUT, 0, TYPE_F32, info_out->out[n].slot[c] * 4);
mkStore(OP_EXPORT, TYPE_F32, sym, NULL, res[i]);
}
}
diff --git a/src/gallium/drivers/nouveau/codegen/nv50_ir_from_common.h b/src/gallium/drivers/nouveau/codegen/nv50_ir_from_common.h
index e44eea86a90..a144ca23af0 100644
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_from_common.h
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_from_common.h
@@ -28,7 +28,7 @@ namespace nv50_ir {
class ConverterCommon : public BuildUtil
{
public:
- ConverterCommon(Program *, nv50_ir_prog_info *);
+ ConverterCommon(Program *, nv50_ir_prog_info *, nv50_ir_prog_info_out *);
protected:
struct Subroutine
{
@@ -50,6 +50,7 @@ protected:
} sub;
struct nv50_ir_prog_info *info;
+ struct nv50_ir_prog_info_out *info_out;
Value *fragCoord[4];
Value *clipVtx[4];
Value *outBase; // base address of vertex out patch (for TCP)
diff --git a/src/gallium/drivers/nouveau/codegen/nv50_ir_from_nir.cpp b/src/gallium/drivers/nouveau/codegen/nv50_ir_from_nir.cpp
index bd78b76f384..cf5f3d6d7e7 100644
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_from_nir.cpp
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_from_nir.cpp
@@ -62,7 +62,7 @@ type_size(const struct glsl_type *type, bool bindless)
class Converter : public ConverterCommon
{
public:
- Converter(Program *, nir_shader *, nv50_ir_prog_info *);
+ Converter(Program *, nir_shader *, nv50_ir_prog_info *, nv50_ir_prog_info_out *);
bool run();
private:
@@ -184,8 +184,9 @@ private:
};
};
-Converter::Converter(Program *prog, nir_shader *nir, nv50_ir_prog_info *info)
- : ConverterCommon(prog, info),
+Converter::Converter(Program *prog, nir_shader *nir, nv50_ir_prog_info *info,
+ nv50_ir_prog_info_out *info_out)
+ : ConverterCommon(prog, info, info_out),
nir(nir),
curLoopDepth(0),
clipVertexOutput(-1)
@@ -934,8 +935,8 @@ bool Converter::assignSlots() {
unsigned index;
info->io.viewportId = -1;
- info->numInputs = 0;
- info->numOutputs = 0;
+ info_out->numInputs = 0;
+ info_out->numOutputs = 0;
// we have to fixup the uniform locations for arrays
unsigned numImages = 0;
@@ -947,31 +948,31 @@ bool Converter::assignSlots() {
numImages += type->is_array() ? type->arrays_of_arrays_size() : 1;
}
- info->numSysVals = 0;
+ info_out->numSysVals = 0;
for (uint8_t i = 0; i < SYSTEM_VALUE_MAX; ++i) {
if (!(nir->info.system_values_read & 1ull << i))
continue;
- info->sv[info->numSysVals].sn = tgsi_get_sysval_semantic(i);
- info->sv[info->numSysVals].si = 0;
- info->sv[info->numSysVals].input = 0; // TODO inferSysValDirection(sn);
+ info_out->sv[info_out->numSysVals].sn = tgsi_get_sysval_semantic(i);
+ info_out->sv[info_out->numSysVals].si = 0;
+ info_out->sv[info_out->numSysVals].input = 0; // TODO inferSysValDirection(sn);
switch (i) {
case SYSTEM_VALUE_INSTANCE_ID:
- info->io.instanceId = info->numSysVals;
+ info_out->io.instanceId = info_out->numSysVals;
break;
case SYSTEM_VALUE_TESS_LEVEL_INNER:
case SYSTEM_VALUE_TESS_LEVEL_OUTER:
- info->sv[info->numSysVals].patch = 1;
+ info_out->sv[info_out->numSysVals].patch = 1;
break;
case SYSTEM_VALUE_VERTEX_ID:
- info->io.vertexId = info->numSysVals;
+ info_out->io.vertexId = info_out->numSysVals;
break;
default:
break;
}
- info->numSysVals += 1;
+ info_out->numSysVals += 1;
}
if (prog->getType() == Program::TYPE_COMPUTE)
@@ -998,7 +999,7 @@ bool Converter::assignSlots() {
tgsi_get_gl_varying_semantic((gl_varying_slot)slot, true,
&name, &index);
for (uint16_t i = 0; i < slots; ++i) {
- setInterpolate(&info->in[vary + i], var->data.interpolation,
+ setInterpolate(&info_out->in[vary + i], var->data.interpolation,
var->data.centroid | var->data.sample, name);
}
break;
@@ -1011,13 +1012,13 @@ bool Converter::assignSlots() {
tgsi_get_gl_varying_semantic((gl_varying_slot)slot, true,
&name, &index);
if (var->data.patch && name == TGSI_SEMANTIC_PATCH)
- info->numPatchConstants = MAX2(info->numPatchConstants, index + slots);
+ info_out->numPatchConstants = MAX2(info_out->numPatchConstants, index + slots);
break;
case Program::TYPE_VERTEX:
vert_attrib_to_tgsi_semantic((gl_vert_attrib)slot, &name, &index);
switch (name) {
case TGSI_SEMANTIC_EDGEFLAG:
- info->io.edgeFlagIn = vary;
+ info_out->io.edgeFlagIn = vary;
break;
default:
break;
@@ -1029,19 +1030,19 @@ bool Converter::assignSlots() {
}
for (uint16_t i = 0u; i < slots; ++i, ++vary) {
- info->in[vary].id = vary;
- info->in[vary].patch = var->data.patch;
- info->in[vary].sn = name;
- info->in[vary].si = index + i;
+ info_out->in[vary].id = vary;
+ info_out->in[vary].patch = var->data.patch;
+ info_out->in[vary].sn = name;
+ info_out->in[vary].si = index + i;
if (glsl_base_type_is_64bit(type->without_array()->base_type))
if (i & 0x1)
- info->in[vary].mask |= (((1 << (comp * 2)) - 1) << (frac * 2) >> 0x4);
+ info_out->in[vary].mask |= (((1 << (comp * 2)) - 1) << (frac * 2) >> 0x4);
else
- info->in[vary].mask |= (((1 << (comp * 2)) - 1) << (frac * 2) & 0xf);
+ info_out->in[vary].mask |= (((1 << (comp * 2)) - 1) << (frac * 2) & 0xf);
else
- info->in[vary].mask |= ((1 << comp) - 1) << frac;
+ info_out->in[vary].mask |= ((1 << comp) - 1) << frac;
}
- info->numInputs = std::max<uint8_t>(info->numInputs, vary);
+ info_out->numInputs = std::max<uint8_t>(info_out->numInputs, vary);
}
nir_foreach_variable(var, &nir->outputs) {
@@ -1066,18 +1067,18 @@ bool Converter::assignSlots() {
switch (name) {
case TGSI_SEMANTIC_COLOR:
if (!var->data.fb_fetch_output)
- info->prop.fp.numColourResults++;
- info->prop.fp.separateFragData = true;
+ info_out->prop.fp.numColourResults++;
+ info_out->prop.fp.separateFragData = true;
// sometimes we get FRAG_RESULT_DATAX with data.index 0
// sometimes we get FRAG_RESULT_DATA0 with data.index X
index = index == 0 ? var->data.index : index;
break;
case TGSI_SEMANTIC_POSITION:
- info->io.fragDepth = vary;
- info->prop.fp.writesDepth = true;
+ info_out->io.fragDepth = vary;
+ info_out->prop.fp.writesDepth = true;
break;
case TGSI_SEMANTIC_SAMPLEMASK:
- info->io.sampleMask = vary;
+ info_out->io.sampleMask = vary;
break;
default:
break;
@@ -1092,17 +1093,17 @@ bool Converter::assignSlots() {
if (var->data.patch && name != TGSI_SEMANTIC_TESSINNER &&
name != TGSI_SEMANTIC_TESSOUTER)
- info->numPatchConstants = MAX2(info->numPatchConstants, index + slots);
+ info_out->numPatchConstants = MAX2(info_out->numPatchConstants, index + slots);
switch (name) {
case TGSI_SEMANTIC_CLIPDIST:
- info->io.genUserClip = -1;
+ info_out->io.genUserClip = -1;
break;
case TGSI_SEMANTIC_CLIPVERTEX:
clipVertexOutput = vary;
break;
case TGSI_SEMANTIC_EDGEFLAG:
- info->io.edgeFlagOut = vary;
+ info_out->io.edgeFlagOut = vary;
break;
case TGSI_SEMANTIC_POSITION:
if (clipVertexOutput < 0)
@@ -1118,39 +1119,39 @@ bool Converter::assignSlots() {
}
for (uint16_t i = 0u; i < slots; ++i, ++vary) {
- info->out[vary].id = vary;
- info->out[vary].patch = var->data.patch;
- info->out[vary].sn = name;
- info->out[vary].si = index + i;
+ info_out->out[vary].id = vary;
+ info_out->out[vary].patch = var->data.patch;
+ info_out->out[vary].sn = name;
+ info_out->out[vary].si = index + i;
if (glsl_base_type_is_64bit(type->without_array()->base_type))
if (i & 0x1)
- info->out[vary].mask |= (((1 << (comp * 2)) - 1) << (frac * 2) >> 0x4);
+ info_out->out[vary].mask |= (((1 << (comp * 2)) - 1) << (frac * 2) >> 0x4);
else
- info->out[vary].mask |= (((1 << (comp * 2)) - 1) << (frac * 2) & 0xf);
+ info_out->out[vary].mask |= (((1 << (comp * 2)) - 1) << (frac * 2) & 0xf);
else
- info->out[vary].mask |= ((1 << comp) - 1) << frac;
+ info_out->out[vary].mask |= ((1 << comp) - 1) << frac;
if (nir->info.outputs_read & 1ull << slot)
- info->out[vary].oread = 1;
+ info_out->out[vary].oread = 1;
}
- info->numOutputs = std::max<uint8_t>(info->numOutputs, vary);
+ info_out->numOutputs = std::max<uint8_t>(info_out->numOutputs, vary);
}
- if (info->io.genUserClip > 0) {
- info->io.clipDistances = info->io.genUserClip;
+ if (info_out->io.genUserClip > 0) {
+ info_out->io.clipDistances = info_out->io.genUserClip;
- const unsigned int nOut = (info->io.genUserClip + 3) / 4;
+ const unsigned int nOut = (info_out->io.genUserClip + 3) / 4;
for (unsigned int n = 0; n < nOut; ++n) {
- unsigned int i = info->numOutputs++;
- info->out[i].id = i;
- info->out[i].sn = TGSI_SEMANTIC_CLIPDIST;
- info->out[i].si = n;
- info->out[i].mask = ((1 << info->io.clipDistances) - 1) >> (n * 4);
+ unsigned int i = info_out->numOutputs++;
+ info_out->out[i].id = i;
+ info_out->out[i].sn = TGSI_SEMANTIC_CLIPDIST;
+ info_out->out[i].si = n;
+ info_out->out[i].mask = ((1 << info_out->io.clipDistances) - 1) >> (n * 4);
}
}
- return info->assignSlots(info) == 0;
+ return info->assignSlots(info_out) == 0;
}
uint32_t
@@ -1200,7 +1201,7 @@ Converter::getSlotAddress(nir_intrinsic_instr *insn, uint8_t idx, uint8_t slot)
assert(!input || idx < PIPE_MAX_SHADER_INPUTS);
assert(input || idx < PIPE_MAX_SHADER_OUTPUTS);
- const nv50_ir_varying *vary = input ? info->in : info->out;
+ const nv50_ir_varying *vary = input ? info_out->in : info_out->out;
return vary[idx].slot[slot] * 4;
}
@@ -1258,63 +1259,63 @@ Converter::storeTo(nir_intrinsic_instr *insn, DataFile file, operation op,
}
mkStore(op, TYPE_U32, mkSymbol(file, 0, TYPE_U32, address), indirect0,
- split[0])->perPatch = info->out[idx].patch;
+ split[0])->perPatch = info_out->out[idx].patch;
mkStore(op, TYPE_U32, mkSymbol(file, 0, TYPE_U32, address + 4), indirect0,
- split[1])->perPatch = info->out[idx].patch;
+ split[1])->perPatch = info_out->out[idx].patch;
} else {
if (op == OP_EXPORT)
src = mkMov(getSSA(size), src, ty)->getDef(0);
mkStore(op, ty, mkSymbol(file, 0, ty, address), indirect0,
- src)->perPatch = info->out[idx].patch;
+ src)->perPatch = info_out->out[idx].patch;
}
}
bool
Converter::parseNIR()
{
- info->bin.tlsSpace = 0;
- info->io.clipDistances = nir->info.clip_distance_array_size;
- info->io.cullDistances = nir->info.cull_distance_array_size;
+ info_out->bin.tlsSpace = 0;
+ info_out->io.clipDistances = nir->info.clip_distance_array_size;
+ info_out->io.cullDistances = nir->info.cull_distance_array_size;
switch(prog->getType()) {
case Program::TYPE_COMPUTE:
info->prop.cp.numThreads[0] = nir->info.cs.local_size[0];
info->prop.cp.numThreads[1] = nir->info.cs.local_size[1];
info->prop.cp.numThreads[2] = nir->info.cs.local_size[2];
- info->bin.smemSize = nir->info.cs.shared_size;
+ info_out->bin.smemSize = nir->info.cs.shared_size;
break;
case Program::TYPE_FRAGMENT:
- info->prop.fp.earlyFragTests = nir->info.fs.early_fragment_tests;
+ info_out->prop.fp.earlyFragTests = nir->info.fs.early_fragment_tests;
info->prop.fp.persampleInvocation =
(nir->info.system_values_read & SYSTEM_BIT_SAMPLE_ID) ||
(nir->info.system_values_read & SYSTEM_BIT_SAMPLE_POS);
- info->prop.fp.postDepthCoverage = nir->info.fs.post_depth_coverage;
- info->prop.fp.readsSampleLocations =
+ info_out->prop.fp.postDepthCoverage = nir->info.fs.post_depth_coverage;
+ info_out->prop.fp.readsSampleLocations =
(nir->info.system_values_read & SYSTEM_BIT_SAMPLE_POS);
- info->prop.fp.usesDiscard = nir->info.fs.uses_discard;
- info->prop.fp.usesSampleMaskIn =
+ info_out->prop.fp.usesDiscard = nir->info.fs.uses_discard;
+ info_out->prop.fp.usesSampleMaskIn =
!!(nir->info.system_values_read & SYSTEM_BIT_SAMPLE_MASK_IN);
break;
case Program::TYPE_GEOMETRY:
info->prop.gp.inputPrim = nir->info.gs.input_primitive;
- info->prop.gp.instanceCount = nir->info.gs.invocations;
- info->prop.gp.maxVertices = nir->info.gs.vertices_out;
- info->prop.gp.outputPrim = nir->info.gs.output_primitive;
+ info_out->prop.gp.instanceCount = nir->info.gs.invocations;
+ info_out->prop.gp.maxVertices = nir->info.gs.vertices_out;
+ info_out->prop.gp.outputPrim = nir->info.gs.output_primitive;
break;
case Program::TYPE_TESSELLATION_CONTROL:
case Program::TYPE_TESSELLATION_EVAL:
if (nir->info.tess.primitive_mode == GL_ISOLINES)
- info->prop.tp.domain = GL_LINES;
+ info_out->prop.tp.domain = GL_LINES;
else
- info->prop.tp.domain = nir->info.tess.primitive_mode;
- info->prop.tp.outputPatchSize = nir->info.tess.tcs_vertices_out;
- info->prop.tp.outputPrim =
+ info_out->prop.tp.domain = nir->info.tess.primitive_mode;
+ info_out->prop.tp.outputPatchSize = nir->info.tess.tcs_vertices_out;
+ info_out->prop.tp.outputPrim =
nir->info.tess.point_mode ? PIPE_PRIM_POINTS : PIPE_PRIM_TRIANGLES;
- info->prop.tp.partitioning = (nir->info.tess.spacing + 1) % 3;
- info->prop.tp.winding = !nir->info.tess.ccw;
+ info_out->prop.tp.partitioning = (nir->info.tess.spacing + 1) % 3;
+ info_out->prop.tp.winding = !nir->info.tess.ccw;
break;
case Program::TYPE_VERTEX:
- info->prop.vp.usesDrawParameters =
+ info_out->prop.vp.usesDrawParameters =
(nir->info.system_values_read & BITFIELD64_BIT(SYSTEM_VALUE_BASE_VERTEX)) ||
(nir->info.system_values_read & BITFIELD64_BIT(SYSTEM_VALUE_BASE_INSTANCE)) ||
(nir->info.system_values_read & BITFIELD64_BIT(SYSTEM_VALUE_DRAW_ID));
@@ -1340,7 +1341,7 @@ Converter::visit(nir_function *function)
setPosition(entry, true);
- if (info->io.genUserClip > 0) {
+ if (info_out->io.genUserClip > 0) {
for (int c = 0; c < 4; ++c)
clipVtx[c] = getScratch();
}
@@ -1367,8 +1368,8 @@ Converter::visit(nir_function *function)
// TODO: packed variables would be nice, but MemoryOpt fails
// replace 4 with reg->num_components
uint32_t size = 4 * reg->num_array_elems * (reg->bit_size / 8);
- regToLmemOffset[reg->index] = info->bin.tlsSpace;
- info->bin.tlsSpace += size;
+ regToLmemOffset[reg->index] = info_out->bin.tlsSpace;
+ info_out->bin.tlsSpace += size;
}
}
@@ -1383,7 +1384,7 @@ Converter::visit(nir_function *function)
if ((prog->getType() == Program::TYPE_VERTEX ||
prog->getType() == Program::TYPE_TESSELLATION_EVAL)
- && info->io.genUserClip > 0)
+ && info_out->io.genUserClip > 0)
handleUserClipPlanes();
// TODO: for non main function this needs to be a OP_RETURN
@@ -1643,7 +1644,7 @@ Converter::visit(nir_intrinsic_instr *insn)
Value *src = getSrc(&insn->src[0], i);
switch (prog->getType()) {
case Program::TYPE_FRAGMENT: {
- if (info->out[idx].sn == TGSI_SEMANTIC_POSITION) {
+ if (info_out->out[idx].sn == TGSI_SEMANTIC_POSITION) {
// TGSI uses a different interface than NIR, TGSI stores that
// value in the z component, NIR in X
offset += 2;
@@ -1653,7 +1654,7 @@ Converter::visit(nir_intrinsic_instr *insn)
}
case Program::TYPE_GEOMETRY:
case Program::TYPE_VERTEX: {
- if (info->io.genUserClip > 0 && idx == (uint32_t)clipVertexOutput) {
+ if (info_out->io.genUserClip > 0 && idx == (uint32_t)clipVertexOutput) {
mkMov(clipVtx[i], src);
src = clipVtx[i];
}
@@ -1700,7 +1701,7 @@ Converter::visit(nir_intrinsic_instr *insn)
texi->tex.r = 0xffff;
texi->tex.s = 0xffff;
- info->prop.fp.readsFramebuffer = true;
+ info_out->prop.fp.readsFramebuffer = true;
break;
}
@@ -1711,7 +1712,7 @@ Converter::visit(nir_intrinsic_instr *insn)
uint32_t mode = 0;
uint32_t idx = getIndirect(insn, op == nir_intrinsic_load_interpolated_input ? 1 : 0, 0, indirect);
- nv50_ir_varying& vary = input ? info->in[idx] : info->out[idx];
+ nv50_ir_varying& vary = input ? info_out->in[idx] : info_out->out[idx];
// see load_barycentric_* handling
if (prog->getType() == Program::TYPE_FRAGMENT) {
@@ -1804,7 +1805,7 @@ Converter::visit(nir_intrinsic_instr *insn)
} else if (op == nir_intrinsic_load_barycentric_pixel) {
mode = NV50_IR_INTERP_DEFAULT;
} else if (op == nir_intrinsic_load_barycentric_at_sample) {
- info->prop.fp.readsSampleLocations = true;
+ info_out->prop.fp.readsSampleLocations = true;
mkOp1(OP_PIXLD, TYPE_U32, newDefs[0], getSrc(&insn->src[0], 0))->subOp = NV50_IR_SUBOP_PIXLD_OFFSET;
mode = NV50_IR_INTERP_OFFSET;
} else {
@@ -1934,7 +1935,7 @@ Converter::visit(nir_intrinsic_instr *insn)
for (uint8_t i = 0u; i < insn->num_components; ++i) {
uint32_t address = getSlotAddress(insn, idx, i);
loadFrom(FILE_SHADER_INPUT, 0, dType, newDefs[i], address, 0,
- indirectOffset, vtxBase, info->in[idx].patch);
+ indirectOffset, vtxBase, info_out->in[idx].patch);
}
break;
}
@@ -1957,12 +1958,12 @@ Converter::visit(nir_intrinsic_instr *insn)
for (uint8_t i = 0u; i < insn->num_components; ++i) {
uint32_t address = getSlotAddress(insn, idx, i);
loadFrom(FILE_SHADER_OUTPUT, 0, dType, newDefs[i], address, 0,
- indirectOffset, vtxBase, info->in[idx].patch);
+ indirectOffset, vtxBase, info_out->in[idx].patch);
}
break;
}
case nir_intrinsic_emit_vertex:
- if (info->io.genUserClip > 0)
+ if (info_out->io.genUserClip > 0)
handleUserClipPlanes();
// fallthrough
case nir_intrinsic_end_primitive: {
@@ -2009,7 +2010,7 @@ Converter::visit(nir_intrinsic_instr *insn)
mkStore(OP_STORE, sType, sym, indirectOffset, getSrc(&insn->src[0], i))
->setIndirect(0, 1, indirectBuffer);
}
- info->io.globalAccess |= 0x2;
+ info_out->io.globalAccess |= 0x2;
break;
}
case nir_intrinsic_load_ssbo: {
@@ -2024,7 +2025,7 @@ Converter::visit(nir_intrinsic_instr *insn)
loadFrom(FILE_MEMORY_BUFFER, buffer, dType, newDefs[i], offset, i,
indirectOffset, indirectBuffer);
- info->io.globalAccess |= 0x1;
+ info_out->io.globalAccess |= 0x1;
break;
}
case nir_intrinsic_shared_atomic_add:
@@ -2075,7 +2076,7 @@ Converter::visit(nir_intrinsic_instr *insn)
atom->setIndirect(0, 1, indirectBuffer);
atom->subOp = getSubOp(op);
- info->io.globalAccess |= 0x2;
+ info_out->io.globalAccess |= 0x2;
break;
}
case nir_intrinsic_global_atomic_add:
@@ -2099,7 +2100,7 @@ Converter::visit(nir_intrinsic_instr *insn)
atom->setIndirect(0, 0, address);
atom->subOp = getSubOp(op);
- info->io.globalAccess |= 0x2;
+ info_out->io.globalAccess |= 0x2;
break;
}
case nir_intrinsic_bindless_image_atomic_add:
@@ -2147,16 +2148,16 @@ Converter::visit(nir_intrinsic_instr *insn)
case nir_intrinsic_bindless_image_atomic_xor:
ty = getDType(insn);
mask = 0x1;
- info->io.globalAccess |= 0x2;
+ info_out->io.globalAccess |= 0x2;
break;
case nir_intrinsic_bindless_image_load:
ty = TYPE_U32;
- info->io.globalAccess |= 0x1;
+ info_out->io.globalAccess |= 0x1;
break;
case nir_intrinsic_bindless_image_store:
ty = TYPE_U32;
mask = 0xf;
- info->io.globalAccess |= 0x2;
+ info_out->io.globalAccess |= 0x2;
break;
case nir_intrinsic_bindless_image_samples:
mask = 0x8;
@@ -2253,16 +2254,16 @@ Converter::visit(nir_intrinsic_instr *insn)
case nir_intrinsic_image_deref_atomic_xor:
ty = getDType(insn);
mask = 0x1;
- info->io.globalAccess |= 0x2;
+ info_out->io.globalAccess |= 0x2;
break;
case nir_intrinsic_image_deref_load:
ty = TYPE_U32;
- info->io.globalAccess |= 0x1;
+ info_out->io.globalAccess |= 0x1;
break;
case nir_intrinsic_image_deref_store:
ty = TYPE_U32;
mask = 0xf;
- info->io.globalAccess |= 0x2;
+ info_out->io.globalAccess |= 0x2;
break;
case nir_intrinsic_image_deref_samples:
mask = 0x8;
@@ -2335,7 +2336,7 @@ Converter::visit(nir_intrinsic_instr *insn)
}
case nir_intrinsic_control_barrier: {
// TODO: add flag to shader_info
- info->numBarriers = 1;
+ info_out->numBarriers = 1;
Instruction *bar = mkOp2(OP_BAR, TYPE_U32, NULL, mkImm(0), mkImm(0));
bar->fixed = 1;
bar->subOp = NV50_IR_SUBOP_BAR_SYNC;
@@ -2370,7 +2371,7 @@ Converter::visit(nir_intrinsic_instr *insn)
for (auto i = 0u; i < insn->num_components; ++i)
loadFrom(FILE_MEMORY_GLOBAL, 0, dType, newDefs[i], offset, i, indirectOffset);
- info->io.globalAccess |= 0x1;
+ info_out->io.globalAccess |= 0x1;
break;
}
case nir_intrinsic_store_global: {
@@ -2394,7 +2395,7 @@ Converter::visit(nir_intrinsic_instr *insn)
}
}
- info->io.globalAccess |= 0x2;
+ info_out->io.globalAccess |= 0x2;
break;
}
default:
@@ -3271,16 +3272,17 @@ Converter::run()
namespace nv50_ir {
bool
-Program::makeFromNIR(struct nv50_ir_prog_info *info)
+Program::makeFromNIR(struct nv50_ir_prog_info *info,
+ struct nv50_ir_prog_info_out *info_out)
{
nir_shader *nir = (nir_shader*)info->bin.source;
- Converter converter(this, nir, info);
+ Converter converter(this, nir, info, info_out);
bool result = converter.run();
if (!result)
return result;
LoweringHelper lowering;
lowering.run(this);
- tlsSize = info->bin.tlsSpace;
+ tlsSize = info_out->bin.tlsSpace;
return result;
}
diff --git a/src/gallium/drivers/nouveau/codegen/nv50_ir_from_tgsi.cpp b/src/gallium/drivers/nouveau/codegen/nv50_ir_from_tgsi.cpp
index da9df42e232..c2322f3856a 100644
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_from_tgsi.cpp
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_from_tgsi.cpp
@@ -986,7 +986,7 @@ bool Instruction::checkDstSrcAliasing() const
class Source
{
public:
- Source(struct nv50_ir_prog_info *);
+ Source(struct nv50_ir_prog_info *, struct nv50_ir_prog_info_out *);
~Source();
public:
@@ -998,6 +998,7 @@ public:
struct tgsi_full_instruction *insns;
const struct tgsi_token *tokens;
struct nv50_ir_prog_info *info;
+ struct nv50_ir_prog_info_out *info_out;
nv50_ir::DynArray tempArrays;
nv50_ir::DynArray immdArrays;
@@ -1047,7 +1048,8 @@ private:
inline bool isEdgeFlagPassthrough(const Instruction&) const;
};
-Source::Source(struct nv50_ir_prog_info *prog) : info(prog)
+Source::Source(struct nv50_ir_prog_info *prog, struct nv50_ir_prog_info_out *info_out)
+: info(prog), info_out(info_out)
{
tokens = (const struct tgsi_token *)info->bin.source;
@@ -1088,16 +1090,16 @@ bool Source::scanSource()
info->immd.bufSize = 0;
- info->numInputs = scan.file_max[TGSI_FILE_INPUT] + 1;
- info->numOutputs = scan.file_max[TGSI_FILE_OUTPUT] + 1;
- info->numSysVals = scan.file_max[TGSI_FILE_SYSTEM_VALUE] + 1;
+ info_out->numInputs = scan.file_max[TGSI_FILE_INPUT] + 1;
+ info_out->numOutputs = scan.file_max[TGSI_FILE_OUTPUT] + 1;
+ info_out->numSysVals = scan.file_max[TGSI_FILE_SYSTEM_VALUE] + 1;
if (info->type == PIPE_SHADER_FRAGMENT) {
- info->prop.fp.writesDepth = scan.writes_z;
- info->prop.fp.usesDiscard = scan.uses_kill || info->io.alphaRefBase;
+ info_out->prop.fp.writesDepth = scan.writes_z;
+ info_out->prop.fp.usesDiscard = scan.uses_kill || info->io.alphaRefBase;
} else
if (info->type == PIPE_SHADER_GEOMETRY) {
- info->prop.gp.instanceCount = 1; // default value
+ info_out->prop.gp.instanceCount = 1; // default value
}
info->io.viewportId = -1;
@@ -1138,43 +1140,43 @@ bool Source::scanSource()
indirectTempOffsets.insert(std::make_pair(*it, tempBase - info.first));
tempBase += info.second;
}
- info->bin.tlsSpace += tempBase * 16;
+ info_out->bin.tlsSpace += tempBase * 16;
}
- if (info->io.genUserClip > 0) {
- info->io.clipDistances = info->io.genUserClip;
+ if (info_out->io.genUserClip > 0) {
+ info_out->io.clipDistances = info_out->io.genUserClip;
- const unsigned int nOut = (info->io.genUserClip + 3) / 4;
+ const unsigned int nOut = (info_out->io.genUserClip + 3) / 4;
for (unsigned int n = 0; n < nOut; ++n) {
- unsigned int i = info->numOutputs++;
- info->out[i].id = i;
- info->out[i].sn = TGSI_SEMANTIC_CLIPDIST;
- info->out[i].si = n;
- info->out[i].mask = ((1 << info->io.clipDistances) - 1) >> (n * 4);
+ unsigned int i = info_out->numOutputs++;
+ info_out->out[i].id = i;
+ info_out->out[i].sn = TGSI_SEMANTIC_CLIPDIST;
+ info_out->out[i].si = n;
+ info_out->out[i].mask = ((1 << info_out->io.clipDistances) - 1) >> (n * 4);
}
}
- return info->assignSlots(info) == 0;
+ return info->assignSlots(info_out) == 0;
}
void Source::scanProperty(const struct tgsi_full_property *prop)
{
switch (prop->Property.PropertyName) {
case TGSI_PROPERTY_GS_OUTPUT_PRIM:
- info->prop.gp.outputPrim = prop->u[0].Data;
+ info_out->prop.gp.outputPrim = prop->u[0].Data;
break;
case TGSI_PROPERTY_GS_INPUT_PRIM:
info->prop.gp.inputPrim = prop->u[0].Data;
break;
case TGSI_PROPERTY_GS_MAX_OUTPUT_VERTICES:
- info->prop.gp.maxVertices = prop->u[0].Data;
+ info_out->prop.gp.maxVertices = prop->u[0].Data;
break;
case TGSI_PROPERTY_GS_INVOCATIONS:
- info->prop.gp.instanceCount = prop->u[0].Data;
+ info_out->prop.gp.instanceCount = prop->u[0].Data;
break;
case TGSI_PROPERTY_FS_COLOR0_WRITES_ALL_CBUFS:
- info->prop.fp.separateFragData = true;
+ info_out->prop.fp.separateFragData = true;
break;
case TGSI_PROPERTY_FS_COORD_ORIGIN:
case TGSI_PROPERTY_FS_COORD_PIXEL_CENTER:
@@ -1182,25 +1184,25 @@ void Source::scanProperty(const struct tgsi_full_property *prop)
// we don't care
break;
case TGSI_PROPERTY_VS_PROHIBIT_UCPS:
- info->io.genUserClip = -1;
+ info_out->io.genUserClip = -1;
break;
case TGSI_PROPERTY_TCS_VERTICES_OUT:
- info->prop.tp.outputPatchSize = prop->u[0].Data;
+ info_out->prop.tp.outputPatchSize = prop->u[0].Data;
break;
case TGSI_PROPERTY_TES_PRIM_MODE:
- info->prop.tp.domain = prop->u[0].Data;
+ info_out->prop.tp.domain = prop->u[0].Data;
break;
case TGSI_PROPERTY_TES_SPACING:
- info->prop.tp.partitioning = prop->u[0].Data;
+ info_out->prop.tp.partitioning = prop->u[0].Data;
break;
case TGSI_PROPERTY_TES_VERTEX_ORDER_CW:
- info->prop.tp.winding = prop->u[0].Data;
+ info_out->prop.tp.winding = prop->u[0].Data;
break;
case TGSI_PROPERTY_TES_POINT_MODE:
if (prop->u[0].Data)
- info->prop.tp.outputPrim = PIPE_PRIM_POINTS;
+ info_out->prop.tp.outputPrim = PIPE_PRIM_POINTS;
else
- info->prop.tp.outputPrim = PIPE_PRIM_TRIANGLES; /* anything but points */
+ info_out->prop.tp.outputPrim = PIPE_PRIM_TRIANGLES; /* anything but points */
break;
case TGSI_PROPERTY_CS_FIXED_BLOCK_WIDTH:
info->prop.cp.numThreads[0] = prop->u[0].Data;
@@ -1212,19 +1214,19 @@ void Source::scanProperty(const struct tgsi_full_property *prop)
info->prop.cp.numThreads[2] = prop->u[0].Data;
break;
case TGSI_PROPERTY_NUM_CLIPDIST_ENABLED:
- info->io.clipDistances = prop->u[0].Data;
+ info_out->io.clipDistances = prop->u[0].Data;
break;
case TGSI_PROPERTY_NUM_CULLDIST_ENABLED:
- info->io.cullDistances = prop->u[0].Data;
+ info_out->io.cullDistances = prop->u[0].Data;
break;
case TGSI_PROPERTY_NEXT_SHADER:
/* Do not need to know the next shader stage. */
break;
case TGSI_PROPERTY_FS_EARLY_DEPTH_STENCIL:
- info->prop.fp.earlyFragTests = prop->u[0].Data;
+ info_out->prop.fp.earlyFragTests = prop->u[0].Data;
break;
case TGSI_PROPERTY_FS_POST_DEPTH_COVERAGE:
- info->prop.fp.postDepthCoverage = prop->u[0].Data;
+ info_out->prop.fp.postDepthCoverage = prop->u[0].Data;
break;
case TGSI_PROPERTY_MUL_ZERO_WINS:
info->io.mul_zero_wins = prop->u[0].Data;
@@ -1292,37 +1294,37 @@ bool Source::scanDeclaration(const struct tgsi_full_declaration *decl)
if (info->type == PIPE_SHADER_VERTEX) {
// all vertex attributes are equal
for (i = first; i <= last; ++i) {
- info->in[i].sn = TGSI_SEMANTIC_GENERIC;
- info->in[i].si = i;
+ info_out->in[i].sn = TGSI_SEMANTIC_GENERIC;
+ info_out->in[i].si = i;
}
} else {
for (i = first; i <= last; ++i, ++si) {
- info->in[i].id = i;
- info->in[i].sn = sn;
- info->in[i].si = si;
+ info_out->in[i].id = i;
+ info_out->in[i].sn = sn;
+ info_out->in[i].si = si;
if (info->type == PIPE_SHADER_FRAGMENT) {
// translate interpolation mode
switch (decl->Interp.Interpolate) {
case TGSI_INTERPOLATE_CONSTANT:
- info->in[i].flat = 1;
+ info_out->in[i].flat = 1;
break;
case TGSI_INTERPOLATE_COLOR:
- info->in[i].sc = 1;
+ info_out->in[i].sc = 1;
break;
case TGSI_INTERPOLATE_LINEAR:
- info->in[i].linear = 1;
+ info_out->in[i].linear = 1;
break;
default:
break;
}
if (decl->Interp.Location)
- info->in[i].centroid = 1;
+ info_out->in[i].centroid = 1;
}
if (sn == TGSI_SEMANTIC_PATCH)
- info->in[i].patch = 1;
+ info_out->in[i].patch = 1;
if (sn == TGSI_SEMANTIC_PATCH)
- info->numPatchConstants = MAX2(info->numPatchConstants, si + 1);
+ info_out->numPatchConstants = MAX2(info_out->numPatchConstants, si + 1);
}
}
break;
@@ -1331,77 +1333,77 @@ bool Source::scanDeclaration(const struct tgsi_full_declaration *decl)
switch (sn) {
case TGSI_SEMANTIC_POSITION:
if (info->type == PIPE_SHADER_FRAGMENT)
- info->io.fragDepth = i;
+ info_out->io.fragDepth = i;
else
if (clipVertexOutput < 0)
clipVertexOutput = i;
break;
case TGSI_SEMANTIC_COLOR:
if (info->type == PIPE_SHADER_FRAGMENT)
- info->prop.fp.numColourResults++;
+ info_out->prop.fp.numColourResults++;
break;
case TGSI_SEMANTIC_EDGEFLAG:
- info->io.edgeFlagOut = i;
+ info_out->io.edgeFlagOut = i;
break;
case TGSI_SEMANTIC_CLIPVERTEX:
clipVertexOutput = i;
break;
case TGSI_SEMANTIC_CLIPDIST:
- info->io.genUserClip = -1;
+ info_out->io.genUserClip = -1;
break;
case TGSI_SEMANTIC_SAMPLEMASK:
- info->io.sampleMask = i;
+ info_out->io.sampleMask = i;
break;
case TGSI_SEMANTIC_VIEWPORT_INDEX:
info->io.viewportId = i;
break;
case TGSI_SEMANTIC_PATCH:
- info->numPatchConstants = MAX2(info->numPatchConstants, si + 1);
+ info_out->numPatchConstants = MAX2(info_out->numPatchConstants, si + 1);
/* fallthrough */
case TGSI_SEMANTIC_TESSOUTER:
case TGSI_SEMANTIC_TESSINNER:
- info->out[i].patch = 1;
+ info_out->out[i].patch = 1;
break;
default:
break;
}
- info->out[i].id = i;
- info->out[i].sn = sn;
- info->out[i].si = si;
+ info_out->out[i].id = i;
+ info_out->out[i].sn = sn;
+ info_out->out[i].si = si;
}
break;
case TGSI_FILE_SYSTEM_VALUE:
switch (sn) {
case TGSI_SEMANTIC_INSTANCEID:
- info->io.instanceId = first;
+ info_out->io.instanceId = first;
break;
case TGSI_SEMANTIC_VERTEXID:
- info->io.vertexId = first;
+ info_out->io.vertexId = first;
break;
case TGSI_SEMANTIC_BASEVERTEX:
case TGSI_SEMANTIC_BASEINSTANCE:
case TGSI_SEMANTIC_DRAWID:
- info->prop.vp.usesDrawParameters = true;
+ info_out->prop.vp.usesDrawParameters = true;
break;
case TGSI_SEMANTIC_SAMPLEID:
case TGSI_SEMANTIC_SAMPLEPOS:
info->prop.fp.persampleInvocation = true;
break;
case TGSI_SEMANTIC_SAMPLEMASK:
- info->prop.fp.usesSampleMaskIn = true;
+ info_out->prop.fp.usesSampleMaskIn = true;
break;
default:
break;
}
for (i = first; i <= last; ++i, ++si) {
- info->sv[i].sn = sn;
- info->sv[i].si = si;
- info->sv[i].input = inferSysValDirection(sn);
+ info_out->sv[i].sn = sn;
+ info_out->sv[i].si = si;
+ info_out->sv[i].input = inferSysValDirection(sn);
switch (sn) {
case TGSI_SEMANTIC_TESSOUTER:
case TGSI_SEMANTIC_TESSINNER:
- info->sv[i].patch = 1;
+ info_out->sv[i].patch = 1;
break;
}
}
@@ -1451,7 +1453,7 @@ bool Source::scanDeclaration(const struct tgsi_full_declaration *decl)
inline bool Source::isEdgeFlagPassthrough(const Instruction& insn) const
{
return insn.getOpcode() == TGSI_OPCODE_MOV &&
- insn.getDst(0).getIndex(0) == info->io.edgeFlagOut &&
+ insn.getDst(0).getIndex(0) == info_out->io.edgeFlagOut &&
insn.getSrc(0).getFile() == TGSI_FILE_INPUT;
}
@@ -1467,22 +1469,22 @@ void Source::scanInstructionSrc(const Instruction& insn,
if (src.isIndirect(0)) {
// We don't know which one is accessed, just mark everything for
// reading. This is an extremely unlikely occurrence.
- for (unsigned i = 0; i < info->numOutputs; ++i)
- info->out[i].oread = 1;
+ for (unsigned i = 0; i < info_out->numOutputs; ++i)
+ info_out->out[i].oread = 1;
} else {
- info->out[src.getIndex(0)].oread = 1;
+ info_out->out[src.getIndex(0)].oread = 1;
}
}
if (src.getFile() == TGSI_FILE_SYSTEM_VALUE) {
- if (info->sv[src.getIndex(0)].sn == TGSI_SEMANTIC_SAMPLEPOS)
- info->prop.fp.readsSampleLocations = true;
+ if (info_out->sv[src.getIndex(0)].sn == TGSI_SEMANTIC_SAMPLEPOS)
+ info_out->prop.fp.readsSampleLocations = true;
}
if (src.getFile() != TGSI_FILE_INPUT)
return;
if (src.isIndirect(0)) {
- for (unsigned i = 0; i < info->numInputs; ++i)
- info->in[i].mask = 0xf;
+ for (unsigned i = 0; i < info_out->numInputs; ++i)
+ info_out->in[i].mask = 0xf;
} else {
const int i = src.getIndex(0);
for (unsigned c = 0; c < 4; ++c) {
@@ -1490,16 +1492,16 @@ void Source::scanInstructionSrc(const Instruction& insn,
continue;
int k = src.getSwizzle(c);
if (k <= TGSI_SWIZZLE_W)
- info->in[i].mask |= 1 << k;
+ info_out->in[i].mask |= 1 << k;
}
- switch (info->in[i].sn) {
+ switch (info_out->in[i].sn) {
case TGSI_SEMANTIC_PSIZE:
case TGSI_SEMANTIC_PRIMID:
case TGSI_SEMANTIC_FOG:
- info->in[i].mask &= 0x1;
+ info_out->in[i].mask &= 0x1;
break;
case TGSI_SEMANTIC_PCOORD:
- info->in[i].mask &= 0x3;
+ info_out->in[i].mask &= 0x3;
break;
default:
break;
@@ -1512,47 +1514,47 @@ bool Source::scanInstruction(const struct tgsi_full_instruction *inst)
Instruction insn(inst);
if (insn.getOpcode() == TGSI_OPCODE_BARRIER)
- info->numBarriers = 1;
+ info_out->numBarriers = 1;
if (insn.getOpcode() == TGSI_OPCODE_FBFETCH)
- info->prop.fp.readsFramebuffer = true;
+ info_out->prop.fp.readsFramebuffer = true;
if (insn.getOpcode() == TGSI_OPCODE_INTERP_SAMPLE)
- info->prop.fp.readsSampleLocations = true;
+ info_out->prop.fp.readsSampleLocations = true;
if (insn.getOpcode() == TGSI_OPCODE_DEMOTE)
- info->prop.fp.usesDiscard = true;
+ info_out->prop.fp.usesDiscard = true;
if (insn.dstCount()) {
Instruction::DstRegister dst = insn.getDst(0);
if (insn.getOpcode() == TGSI_OPCODE_STORE &&
dst.getFile() != TGSI_FILE_MEMORY) {
- info->io.globalAccess |= 0x2;
+ info_out->io.globalAccess |= 0x2;
if (dst.getFile() == TGSI_FILE_INPUT) {
// TODO: Handle indirect somehow?
const int i = dst.getIndex(0);
- info->in[i].mask |= 1;
+ info_out->in[i].mask |= 1;
}
}
if (dst.getFile() == TGSI_FILE_OUTPUT) {
if (dst.isIndirect(0))
- for (unsigned i = 0; i < info->numOutputs; ++i)
- info->out[i].mask = 0xf;
+ for (unsigned i = 0; i < info_out->numOutputs; ++i)
+ info_out->out[i].mask = 0xf;
else
- info->out[dst.getIndex(0)].mask |= dst.getMask();
+ info_out->out[dst.getIndex(0)].mask |= dst.getMask();
- if (info->out[dst.getIndex(0)].sn == TGSI_SEMANTIC_PSIZE ||
- info->out[dst.getIndex(0)].sn == TGSI_SEMANTIC_PRIMID ||
- info->out[dst.getIndex(0)].sn == TGSI_SEMANTIC_LAYER ||
- info->out[dst.getIndex(0)].sn == TGSI_SEMANTIC_VIEWPORT_INDEX ||
- info->out[dst.getIndex(0)].sn == TGSI_SEMANTIC_FOG)
- info->out[dst.getIndex(0)].mask &= 1;
+ if (info_out->out[dst.getIndex(0)].sn == TGSI_SEMANTIC_PSIZE ||
+ info_out->out[dst.getIndex(0)].sn == TGSI_SEMANTIC_PRIMID ||
+ info_out->out[dst.getIndex(0)].sn == TGSI_SEMANTIC_LAYER ||
+ info_out->out[dst.getIndex(0)].sn == TGSI_SEMANTIC_VIEWPORT_INDEX ||
+ info_out->out[dst.getIndex(0)].sn == TGSI_SEMANTIC_FOG)
+ info_out->out[dst.getIndex(0)].mask &= 1;
if (isEdgeFlagPassthrough(insn))
- info->io.edgeFlagIn = insn.getSrc(0).getIndex(0);
+ info_out->io.edgeFlagIn = insn.getSrc(0).getIndex(0);
} else
if (dst.getFile() == TGSI_FILE_TEMPORARY) {
if (dst.isIndirect(0))
@@ -1562,7 +1564,7 @@ bool Source::scanInstruction(const struct tgsi_full_instruction *inst)
dst.getFile() == TGSI_FILE_IMAGE ||
(dst.getFile() == TGSI_FILE_MEMORY &&
memoryFiles[dst.getIndex(0)].mem_type == TGSI_MEMORY_TYPE_GLOBAL)) {
- info->io.globalAccess |= 0x2;
+ info_out->io.globalAccess |= 0x2;
}
}
@@ -1585,7 +1587,7 @@ bool Source::scanInstruction(const struct tgsi_full_instruction *inst)
case TGSI_OPCODE_ATOMDEC_WRAP:
case TGSI_OPCODE_ATOMINC_WRAP:
case TGSI_OPCODE_LOAD:
- info->io.globalAccess |= (insn.getOpcode() == TGSI_OPCODE_LOAD) ?
+ info_out->io.globalAccess |= (insn.getOpcode() == TGSI_OPCODE_LOAD) ?
0x1 : 0x2;
break;
}
@@ -1630,7 +1632,7 @@ using namespace nv50_ir;
class Converter : public ConverterCommon
{
public:
- Converter(Program *, const tgsi::Source *);
+ Converter(Program *, const tgsi::Source *, nv50_ir_prog_info_out *);
~Converter();
bool run();
@@ -1789,13 +1791,13 @@ Converter::makeSym(uint tgsiFile, int fileIdx, int idx, int c, uint32_t address)
if (idx >= 0) {
if (sym->reg.file == FILE_SHADER_INPUT)
- sym->setOffset(info->in[idx].slot[c] * 4);
+ sym->setOffset(info_out->in[idx].slot[c] * 4);
else
if (sym->reg.file == FILE_SHADER_OUTPUT)
- sym->setOffset(info->out[idx].slot[c] * 4);
+ sym->setOffset(info_out->out[idx].slot[c] * 4);
else
if (sym->reg.file == FILE_SYSTEM_VALUE)
- sym->setSV(tgsi::translateSysVal(info->sv[idx].sn), c);
+ sym->setSV(tgsi::translateSysVal(info_out->sv[idx].sn), c);
else
sym->setOffset(address);
} else {
@@ -1810,7 +1812,7 @@ Converter::interpolate(tgsi::Instruction::SrcRegister src, int c, Value *ptr)
operation op;
// XXX: no way to know interpolation mode if we don't know what's accessed
- const uint8_t mode = translateInterpMode(&info->in[ptr ? 0 :
+ const uint8_t mode = translateInterpMode(&info_out->in[ptr ? 0 :
src.getIndex(0)], op);
Instruction *insn = new_Instruction(func, op, TYPE_F32);
@@ -2022,12 +2024,12 @@ Converter::fetchSrc(tgsi::Instruction::SrcRegister src, int c, Value *ptr)
case TGSI_FILE_INPUT:
if (prog->getType() == Program::TYPE_FRAGMENT) {
// don't load masked inputs, won't be assigned a slot
- if (!ptr && !(info->in[idx].mask & (1 << swz)))
+ if (!ptr && !(info_out->in[idx].mask & (1 << swz)))
return loadImm(NULL, swz == TGSI_SWIZZLE_W ? 1.0f : 0.0f);
return interpolate(src, c, shiftAddress(ptr));
} else
if (prog->getType() == Program::TYPE_GEOMETRY) {
- if (!ptr && info->in[idx].sn == TGSI_SEMANTIC_PRIMID)
+ if (!ptr && info_out->in[idx].sn == TGSI_SEMANTIC_PRIMID)
return mkOp1v(OP_RDSV, TYPE_U32, getSSA(), mkSysVal(SV_PRIMITIVE_ID, 0));
// XXX: This is going to be a problem with scalar arrays, i.e. when
// we cannot assume that the address is given in units of vec4.
@@ -2038,24 +2040,24 @@ Converter::fetchSrc(tgsi::Instruction::SrcRegister src, int c, Value *ptr)
return mkLoadv(TYPE_U32, srcToSym(src, c), ptr);
}
ld = mkLoad(TYPE_U32, getSSA(), srcToSym(src, c), shiftAddress(ptr));
- ld->perPatch = info->in[idx].patch;
+ ld->perPatch = info_out->in[idx].patch;
return ld->getDef(0);
case TGSI_FILE_OUTPUT:
assert(prog->getType() == Program::TYPE_TESSELLATION_CONTROL);
ld = mkLoad(TYPE_U32, getSSA(), srcToSym(src, c), shiftAddress(ptr));
- ld->perPatch = info->out[idx].patch;
+ ld->perPatch = info_out->out[idx].patch;
return ld->getDef(0);
case TGSI_FILE_SYSTEM_VALUE:
assert(!ptr);
- if (info->sv[idx].sn == TGSI_SEMANTIC_THREAD_ID &&
+ if (info_out->sv[idx].sn == TGSI_SEMANTIC_THREAD_ID &&
info->prop.cp.numThreads[swz] == 1)
return loadImm(NULL, 0u);
- if (isSubGroupMask(info->sv[idx].sn) && swz > 0)
+ if (isSubGroupMask(info_out->sv[idx].sn) && swz > 0)
return loadImm(NULL, 0u);
- if (info->sv[idx].sn == TGSI_SEMANTIC_SUBGROUP_SIZE)
+ if (info_out->sv[idx].sn == TGSI_SEMANTIC_SUBGROUP_SIZE)
return loadImm(NULL, 32u);
ld = mkOp1(OP_RDSV, TYPE_U32, getSSA(), srcToSym(src, c));
- ld->perPatch = info->sv[idx].patch;
+ ld->perPatch = info_out->sv[idx].patch;
return ld->getDef(0);
case TGSI_FILE_TEMPORARY: {
int arrayid = src.getArrayId();
@@ -2110,7 +2112,7 @@ Converter::storeDst(int d, int c, Value *val)
if (dst.isIndirect(0))
ptr = shiftAddress(fetchSrc(dst.getIndirect(0), 0, NULL));
- if (info->io.genUserClip > 0 &&
+ if (info_out->io.genUserClip > 0 &&
dst.getFile() == TGSI_FILE_OUTPUT &&
!dst.isIndirect(0) && dst.getIndex(0) == code->clipVertexOutput) {
mkMov(clipVtx[c], val);
@@ -2134,16 +2136,16 @@ Converter::storeDst(const tgsi::Instruction::DstRegister dst, int c,
} else
if (f == TGSI_FILE_OUTPUT && prog->getType() != Program::TYPE_FRAGMENT) {
- if (ptr || (info->out[idx].mask & (1 << c))) {
+ if (ptr || (info_out->out[idx].mask & (1 << c))) {
/* Save the viewport index into a scratch register so that it can be
exported at EMIT time */
- if (info->out[idx].sn == TGSI_SEMANTIC_VIEWPORT_INDEX &&
+ if (info_out->out[idx].sn == TGSI_SEMANTIC_VIEWPORT_INDEX &&
prog->getType() == Program::TYPE_GEOMETRY &&
viewport != NULL)
mkOp1(OP_MOV, TYPE_U32, viewport, val);
else
mkStore(OP_EXPORT, TYPE_U32, dstToSym(dst, c), ptr, val)->perPatch =
- info->out[idx].patch;
+ info_out->out[idx].patch;
}
} else
if (f == TGSI_FILE_TEMPORARY ||
@@ -3024,7 +3026,7 @@ Converter::handleINTERP(Value *dst[4])
// We can assume that the fixed index will point to an input of the same
// interpolation type in case of an indirect.
// TODO: Make use of ArrayID.
- linear = info->in[src.getIndex(0)].linear;
+ linear = info_out->in[src.getIndex(0)].linear;
if (linear) {
op = OP_LINTERP;
mode = NV50_IR_INTERP_LINEAR;
@@ -3518,11 +3520,11 @@ Converter::handleInstruction(const struct tgsi_full_instruction *insn)
/* export the saved viewport index */
if (viewport != NULL) {
Symbol *vpSym = mkSymbol(FILE_SHADER_OUTPUT, 0, TYPE_U32,
- info->out[info->io.viewportId].slot[0] * 4);
+ info_out->out[info->io.viewportId].slot[0] * 4);
mkStore(OP_EXPORT, TYPE_U32, vpSym, NULL, viewport);
}
/* handle user clip planes for each emitted vertex */
- if (info->io.genUserClip > 0)
+ if (info_out->io.genUserClip > 0)
handleUserClipPlanes();
/* fallthrough */
case TGSI_OPCODE_ENDPRIM:
@@ -3531,7 +3533,7 @@ Converter::handleInstruction(const struct tgsi_full_instruction *insn)
unsigned int stream = tgsi.getSrc(0).getValueU32(0, info);
if (stream && op == OP_RESTART)
break;
- if (info->prop.gp.maxVertices == 0)
+ if (info_out->prop.gp.maxVertices == 0)
break;
src0 = mkImm(stream);
mkOp1(op, TYPE_U32, NULL, src0)->fixed = 1;
@@ -3700,7 +3702,7 @@ Converter::handleInstruction(const struct tgsi_full_instruction *insn)
exportOutputs();
if ((prog->getType() == Program::TYPE_VERTEX ||
prog->getType() == Program::TYPE_TESSELLATION_EVAL
- ) && info->io.genUserClip > 0)
+ ) && info_out->io.genUserClip > 0)
handleUserClipPlanes();
mkOp(OP_EXIT, TYPE_NONE, NULL)->terminator = 1;
}
@@ -4148,9 +4150,9 @@ void
Converter::exportOutputs()
{
if (info->io.alphaRefBase) {
- for (unsigned int i = 0; i < info->numOutputs; ++i) {
- if (info->out[i].sn != TGSI_SEMANTIC_COLOR ||
- info->out[i].si != 0)
+ for (unsigned int i = 0; i < info_out->numOutputs; ++i) {
+ if (info_out->out[i].sn != TGSI_SEMANTIC_COLOR ||
+ info_out->out[i].si != 0)
continue;
const unsigned int c = 3;
if (!oData.exists(sub.cur->values, i, c))
@@ -4169,15 +4171,15 @@ Converter::exportOutputs()
}
}
- for (unsigned int i = 0; i < info->numOutputs; ++i) {
+ for (unsigned int i = 0; i < info_out->numOutputs; ++i) {
for (unsigned int c = 0; c < 4; ++c) {
if (!oData.exists(sub.cur->values, i, c))
continue;
Symbol *sym = mkSymbol(FILE_SHADER_OUTPUT, 0, TYPE_F32,
- info->out[i].slot[c] * 4);
+ info_out->out[i].slot[c] * 4);
Value *val = oData.load(sub.cur->values, i, c, NULL);
if (val) {
- if (info->out[i].sn == TGSI_SEMANTIC_POSITION)
+ if (info_out->out[i].sn == TGSI_SEMANTIC_POSITION)
mkOp1(OP_SAT, TYPE_F32, val, val);
mkStore(OP_EXPORT, TYPE_F32, sym, NULL, val);
}
@@ -4185,7 +4187,8 @@ Converter::exportOutputs()
}
}
-Converter::Converter(Program *ir, const tgsi::Source *code) : ConverterCommon(ir, code->info),
+Converter::Converter(Program *ir, const tgsi::Source *code, nv50_ir_prog_info_out *info_out)
+: ConverterCommon(ir, code->info, info_out),
code(code),
tgsi(NULL),
tData(this), lData(this), aData(this), oData(this)
@@ -4286,7 +4289,7 @@ Converter::run()
setPosition(entry, true);
sub.cur = getSubroutine(prog->main);
- if (info->io.genUserClip > 0) {
+ if (info_out->io.genUserClip > 0) {
for (int c = 0; c < 4; ++c)
clipVtx[c] = getScratch();
}
@@ -4329,14 +4332,15 @@ Converter::run()
namespace nv50_ir {
bool
-Program::makeFromTGSI(struct nv50_ir_prog_info *info)
+Program::makeFromTGSI(struct nv50_ir_prog_info *info,
+ struct nv50_ir_prog_info_out *info_out)
{
- tgsi::Source src(info);
+ tgsi::Source src(info, info_out);
if (!src.scanSource())
return false;
- tlsSize = info->bin.tlsSpace;
+ tlsSize = info_out->bin.tlsSpace;
- Converter builder(this, &src);
+ Converter builder(this, &src, info_out);
return builder.run();
}
diff --git a/src/gallium/drivers/nouveau/codegen/nv50_ir_lowering_nvc0.cpp b/src/gallium/drivers/nouveau/codegen/nv50_ir_lowering_nvc0.cpp
index a60881000fe..9fe0cb0dced 100644
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_lowering_nvc0.cpp
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_lowering_nvc0.cpp
@@ -2808,7 +2808,7 @@ NVC0LoweringPass::readTessCoord(LValue *dst, int c)
y = dst;
} else {
assert(c == 2);
- if (prog->driver->prop.tp.domain != PIPE_PRIM_TRIANGLES) {
+ if (prog->driver_out->prop.tp.domain != PIPE_PRIM_TRIANGLES) {
bld.mkMov(dst, bld.loadImm(NULL, 0));
return;
}
@@ -2917,7 +2917,7 @@ NVC0LoweringPass::handleRDSV(Instruction *i)
ld->subOp = NV50_IR_SUBOP_PIXLD_SAMPLEID;
Value *offset = calculateSampleOffset(sampleID);
- assert(prog->driver->prop.fp.readsSampleLocations);
+ assert(prog->driver_out->prop.fp.readsSampleLocations);
if (targ->getChipset() >= NVISA_GM200_CHIPSET) {
bld.mkLoad(TYPE_F32,
@@ -3152,7 +3152,7 @@ NVC0LoweringPass::handlePIXLD(Instruction *i)
if (targ->getChipset() < NVISA_GM200_CHIPSET)
return;
- assert(prog->driver->prop.fp.readsSampleLocations);
+ assert(prog->driver_out->prop.fp.readsSampleLocations);
bld.mkLoad(TYPE_F32,
i->getDef(0),
diff --git a/src/gallium/drivers/nouveau/codegen/nv50_ir_target.cpp b/src/gallium/drivers/nouveau/codegen/nv50_ir_target.cpp
index 0af79e9d50a..a0b9436845c 100644
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_target.cpp
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_target.cpp
@@ -344,7 +344,7 @@ CodeEmitter::prepareEmission(BasicBlock *bb)
}
bool
-Program::emitBinary(struct nv50_ir_prog_info *info)
+Program::emitBinary(struct nv50_ir_prog_info_out *info)
{
CodeEmitter *emit = target->getCodeEmitter(progType);
diff --git a/src/gallium/drivers/nouveau/codegen/nv50_ir_target.h b/src/gallium/drivers/nouveau/codegen/nv50_ir_target.h
index afeca14d7d1..cc64a51d25e 100644
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_target.h
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_target.h
@@ -173,8 +173,9 @@ public:
// The address chosen is supplied to the relocation routine.
virtual void getBuiltinCode(const uint32_t **code, uint32_t *size) const = 0;
- virtual void parseDriverInfo(const struct nv50_ir_prog_info *info) {
- if (info->type == PIPE_SHADER_COMPUTE) {
+ virtual void parseDriverInfo(const struct nv50_ir_prog_info *info,
+ const struct nv50_ir_prog_info_out *info_out) {
+ if (info_out->type == PIPE_SHADER_COMPUTE) {
threads = info->prop.cp.numThreads[0] *
info->prop.cp.numThreads[1] *
info->prop.cp.numThreads[2];
diff --git a/src/gallium/drivers/nouveau/codegen/nv50_ir_target_nv50.cpp b/src/gallium/drivers/nouveau/codegen/nv50_ir_target_nv50.cpp
index ec94590a3f8..1b57959cdc5 100644
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_target_nv50.cpp
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_target_nv50.cpp
@@ -584,15 +584,16 @@ recordLocation(uint16_t *locs, uint8_t *masks,
}
void
-TargetNV50::parseDriverInfo(const struct nv50_ir_prog_info *info)
+TargetNV50::parseDriverInfo(const struct nv50_ir_prog_info *info,
+ const struct nv50_ir_prog_info_out *info_out)
{
unsigned int i;
- for (i = 0; i < info->numOutputs; ++i)
- recordLocation(sysvalLocation, NULL, &info->out[i]);
- for (i = 0; i < info->numInputs; ++i)
- recordLocation(sysvalLocation, &wposMask, &info->in[i]);
- for (i = 0; i < info->numSysVals; ++i)
- recordLocation(sysvalLocation, NULL, &info->sv[i]);
+ for (i = 0; i < info_out->numOutputs; ++i)
+ recordLocation(sysvalLocation, NULL, &info_out->out[i]);
+ for (i = 0; i < info_out->numInputs; ++i)
+ recordLocation(sysvalLocation, &wposMask, &info_out->in[i]);
+ for (i = 0; i < info_out->numSysVals; ++i)
+ recordLocation(sysvalLocation, NULL, &info_out->sv[i]);
if (sysvalLocation[SV_POSITION] >= 0x200) {
// not assigned by driver, but we need it internally
@@ -600,7 +601,7 @@ TargetNV50::parseDriverInfo(const struct nv50_ir_prog_info *info)
sysvalLocation[SV_POSITION] = 0;
}
- Target::parseDriverInfo(info);
+ Target::parseDriverInfo(info, info_out);
}
} // namespace nv50_ir
diff --git a/src/gallium/drivers/nouveau/codegen/nv50_ir_target_nv50.h b/src/gallium/drivers/nouveau/codegen/nv50_ir_target_nv50.h
index 00243d7958e..caf66b269db 100644
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_target_nv50.h
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_target_nv50.h
@@ -42,7 +42,8 @@ public:
virtual void getBuiltinCode(const uint32_t **code, uint32_t *size) const;
- virtual void parseDriverInfo(const struct nv50_ir_prog_info *);
+ virtual void parseDriverInfo(const struct nv50_ir_prog_info *,
+ const struct nv50_ir_prog_info_out *);
virtual bool insnCanLoad(const Instruction *insn, int s,
const Instruction *ld) const;
diff --git a/src/gallium/drivers/nouveau/nouveau_compiler.c b/src/gallium/drivers/nouveau/nouveau_compiler.c
index f2c175661be..cf4b0995145 100644
--- a/src/gallium/drivers/nouveau/nouveau_compiler.c
+++ b/src/gallium/drivers/nouveau/nouveau_compiler.c
@@ -75,7 +75,7 @@ nv30_codegen(int chipset, int type, struct tgsi_token tokens[],
}
static int
-dummy_assign_slots(struct nv50_ir_prog_info *info)
+dummy_assign_slots(struct nv50_ir_prog_info_out *info)
{
unsigned i, n, c;
@@ -105,6 +105,7 @@ static int
nouveau_codegen(int chipset, int type, struct tgsi_token tokens[],
unsigned *size, unsigned **code) {
struct nv50_ir_prog_info info = {0};
+ struct nv50_ir_prog_info_out info_out = {0};
int ret;
info.type = type;
@@ -124,14 +125,14 @@ nouveau_codegen(int chipset, int type, struct tgsi_token tokens[],
info.dbgFlags = debug_get_num_option("NV50_PROG_DEBUG", 0);
info.omitLineNum = debug_get_num_option("NV50_PROG_DEBUG_OMIT_LINENUM", 0);
- ret = nv50_ir_generate_code(&info);
+ ret = nv50_ir_generate_code(&info, &info_out);
if (ret) {
_debug_printf("Error compiling program: %d\n", ret);
return ret;
}
- *size = info.bin.codeSize;
- *code = info.bin.code;
+ *size = info_out.bin.codeSize;
+ *code = info_out.bin.code;
return 0;
}
diff --git a/src/gallium/drivers/nouveau/nv50/nv50_program.c b/src/gallium/drivers/nouveau/nv50/nv50_program.c
index 58c0463f1a2..a3f3054cbaa 100644
--- a/src/gallium/drivers/nouveau/nv50/nv50_program.c
+++ b/src/gallium/drivers/nouveau/nv50/nv50_program.c
@@ -38,7 +38,7 @@ bitcount4(const uint32_t val)
}
static int
-nv50_vertprog_assign_slots(struct nv50_ir_prog_info *info)
+nv50_vertprog_assign_slots(struct nv50_ir_prog_info_out *info)
{
struct nv50_program *prog = (struct nv50_program *)info->driverPriv;
unsigned i, n, c;
@@ -140,7 +140,7 @@ nv50_vertprog_assign_slots(struct nv50_ir_prog_info *info)
}
static int
-nv50_fragprog_assign_slots(struct nv50_ir_prog_info *info)
+nv50_fragprog_assign_slots(struct nv50_ir_prog_info_out *info)
{
struct nv50_program *prog = (struct nv50_program *)info->driverPriv;
unsigned i, n, m, c;
@@ -249,7 +249,7 @@ nv50_fragprog_assign_slots(struct nv50_ir_prog_info *info)
}
static int
-nv50_program_assign_varying_slots(struct nv50_ir_prog_info *info)
+nv50_program_assign_varying_slots(struct nv50_ir_prog_info_out *info)
{
switch (info->type) {
case PIPE_SHADER_VERTEX:
@@ -266,7 +266,7 @@ nv50_program_assign_varying_slots(struct nv50_ir_prog_info *info)
}
static struct nv50_stream_output_state *
-nv50_program_create_strmout_state(const struct nv50_ir_prog_info *info,
+nv50_program_create_strmout_state(const struct nv50_ir_prog_info_out *info,
const struct pipe_stream_output_info *pso)
{
struct nv50_stream_output_state *so;
@@ -350,10 +350,8 @@ nv50_program_translate(struct nv50_program *prog, uint16_t chipset,
return false;
}
- info->bin.smemSize = prog->cp.smem_size;
info->io.auxCBSlot = 15;
info->io.ucpBase = NV50_CB_AUX_UCP_OFFSET;
- info->io.genUserClip = prog->vp.clpd_nr;
if (prog->fp.alphatest)
info->io.alphaRefBase = NV50_CB_AUX_ALPHATEST_OFFSET;
@@ -376,8 +374,6 @@ nv50_program_translate(struct nv50_program *prog, uint16_t chipset,
if (prog->type == PIPE_SHADER_COMPUTE)
info->prop.cp.inputOffset = 0x10;
- info->driverPriv = prog;
-
#ifndef NDEBUG
info->optLevel = debug_get_num_option("NV50_PROG_OPTIMIZE", 3);
info->dbgFlags = debug_get_num_option("NV50_PROG_DEBUG", 0);
@@ -386,39 +382,44 @@ nv50_program_translate(struct nv50_program *prog, uint16_t chipset,
info->optLevel = 3;
#endif
- ret = nv50_ir_generate_code(info);
+ struct nv50_ir_prog_info_out info_out = {};
+ /* these fields might be overwritten by the compiler */
+ info_out.bin.smemSize = prog->cp.smem_size;
+ info_out.io.genUserClip = prog->vp.clpd_nr;
+ info_out.driverPriv = prog;
+ ret = nv50_ir_generate_code(info, &info_out);
if (ret) {
NOUVEAU_ERR("shader translation failed: %i\n", ret);
goto out;
}
- prog->code = info->bin.code;
- prog->code_size = info->bin.codeSize;
- prog->fixups = info->bin.relocData;
- prog->interps = info->bin.fixupData;
- prog->max_gpr = MAX2(4, (info->bin.maxGPR >> 1) + 1);
- prog->tls_space = info->bin.tlsSpace;
- prog->cp.smem_size = info->bin.smemSize;
+ prog->code = info_out.bin.code;
+ prog->code_size = info_out.bin.codeSize;
+ prog->fixups = info_out.bin.relocData;
+ prog->interps = info_out.bin.fixupData;
+ prog->max_gpr = MAX2(4, (info_out.bin.maxGPR >> 1) + 1);
+ prog->tls_space = info_out.bin.tlsSpace;
+ prog->cp.smem_size = info_out.bin.smemSize;
prog->mul_zero_wins = info->io.mul_zero_wins;
- prog->vp.need_vertex_id = info->io.vertexId < PIPE_MAX_SHADER_INPUTS;
+ prog->vp.need_vertex_id = info_out.io.vertexId < PIPE_MAX_SHADER_INPUTS;
- prog->vp.clip_enable = (1 << info->io.clipDistances) - 1;
+ prog->vp.clip_enable = (1 << info_out.io.clipDistances) - 1;
prog->vp.cull_enable =
- ((1 << info->io.cullDistances) - 1) << info->io.clipDistances;
+ ((1 << info_out.io.cullDistances) - 1) << info_out.io.clipDistances;
prog->vp.clip_mode = 0;
- for (i = 0; i < info->io.cullDistances; ++i)
- prog->vp.clip_mode |= 1 << ((info->io.clipDistances + i) * 4);
+ for (i = 0; i < info_out.io.cullDistances; ++i)
+ prog->vp.clip_mode |= 1 << ((info_out.io.clipDistances + i) * 4);
if (prog->type == PIPE_SHADER_FRAGMENT) {
- if (info->prop.fp.writesDepth) {
+ if (info_out.prop.fp.writesDepth) {
prog->fp.flags[0] |= NV50_3D_FP_CONTROL_EXPORTS_Z;
prog->fp.flags[1] = 0x11;
}
- if (info->prop.fp.usesDiscard)
+ if (info_out.prop.fp.usesDiscard)
prog->fp.flags[0] |= NV50_3D_FP_CONTROL_USES_KIL;
} else
if (prog->type == PIPE_SHADER_GEOMETRY) {
- switch (info->prop.gp.outputPrim) {
+ switch (info_out.prop.gp.outputPrim) {
case PIPE_PRIM_LINE_STRIP:
prog->gp.prim_type = NV50_3D_GP_OUTPUT_PRIMITIVE_TYPE_LINE_STRIP;
break;
@@ -427,22 +428,22 @@ nv50_program_translate(struct nv50_program *prog, uint16_t chipset,
break;
case PIPE_PRIM_POINTS:
default:
- assert(info->prop.gp.outputPrim == PIPE_PRIM_POINTS);
+ assert(info_out.prop.gp.outputPrim == PIPE_PRIM_POINTS);
prog->gp.prim_type = NV50_3D_GP_OUTPUT_PRIMITIVE_TYPE_POINTS;
break;
}
- prog->gp.vert_count = CLAMP(info->prop.gp.maxVertices, 1, 1024);
+ prog->gp.vert_count = CLAMP(info_out.prop.gp.maxVertices, 1, 1024);
}
if (prog->pipe.stream_output.num_outputs)
- prog->so = nv50_program_create_strmout_state(info,
+ prog->so = nv50_program_create_strmout_state(&info_out,
&prog->pipe.stream_output);
pipe_debug_message(debug, SHADER_INFO,
"type: %d, local: %d, shared: %d, gpr: %d, inst: %d, bytes: %d",
- prog->type, info->bin.tlsSpace, info->bin.smemSize,
- prog->max_gpr, info->bin.instructions,
- info->bin.codeSize);
+ prog->type, info_out.bin.tlsSpace, info_out.bin.smemSize,
+ prog->max_gpr, info_out.bin.instructions,
+ info_out.bin.codeSize);
out:
if (info->bin.sourceRep == PIPE_SHADER_IR_NIR)
diff --git a/src/gallium/drivers/nouveau/nvc0/nvc0_program.c b/src/gallium/drivers/nouveau/nvc0/nvc0_program.c
index 3e982dbeec7..1a5073292e8 100644
--- a/src/gallium/drivers/nouveau/nvc0/nvc0_program.c
+++ b/src/gallium/drivers/nouveau/nvc0/nvc0_program.c
@@ -90,7 +90,7 @@ nvc0_shader_output_address(unsigned sn, unsigned si)
}
static int
-nvc0_vp_assign_input_slots(struct nv50_ir_prog_info *info)
+nvc0_vp_assign_input_slots(struct nv50_ir_prog_info_out *info)
{
unsigned i, c, n;
@@ -114,7 +114,7 @@ nvc0_vp_assign_input_slots(struct nv50_ir_prog_info *info)
}
static int
-nvc0_sp_assign_input_slots(struct nv50_ir_prog_info *info)
+nvc0_sp_assign_input_slots(struct nv50_ir_prog_info_out *info)
{
unsigned offset;
unsigned i, c;
@@ -130,7 +130,7 @@ nvc0_sp_assign_input_slots(struct nv50_ir_prog_info *info)
}
static int
-nvc0_fp_assign_output_slots(struct nv50_ir_prog_info *info)
+nvc0_fp_assign_output_slots(struct nv50_ir_prog_info_out *info)
{
unsigned count = info->prop.fp.numColourResults * 4;
unsigned i, c;
@@ -163,7 +163,7 @@ nvc0_fp_assign_output_slots(struct nv50_ir_prog_info *info)
}
static int
-nvc0_sp_assign_output_slots(struct nv50_ir_prog_info *info)
+nvc0_sp_assign_output_slots(struct nv50_ir_prog_info_out *info)
{
unsigned offset;
unsigned i, c;
@@ -179,7 +179,7 @@ nvc0_sp_assign_output_slots(struct nv50_ir_prog_info *info)
}
static int
-nvc0_program_assign_varying_slots(struct nv50_ir_prog_info *info)
+nvc0_program_assign_varying_slots(struct nv50_ir_prog_info_out *info)
{
int ret;
@@ -211,7 +211,7 @@ nvc0_vtgp_hdr_update_oread(struct nvc0_program *vp, uint8_t slot)
/* Common part of header generation for VP, TCP, TEP and GP. */
static int
-nvc0_vtgp_gen_header(struct nvc0_program *vp, struct nv50_ir_prog_info *info)
+nvc0_vtgp_gen_header(struct nvc0_program *vp, struct nv50_ir_prog_info_out *info)
{
unsigned i, c, a;
@@ -276,7 +276,7 @@ nvc0_vtgp_gen_header(struct nvc0_program *vp, struct nv50_ir_prog_info *info)
}
static int
-nvc0_vp_gen_header(struct nvc0_program *vp, struct nv50_ir_prog_info *info)
+nvc0_vp_gen_header(struct nvc0_program *vp, struct nv50_ir_prog_info_out *info)
{
vp->hdr[0] = 0x20061 | (1 << 10);
vp->hdr[4] = 0xff000;
@@ -285,7 +285,7 @@ nvc0_vp_gen_header(struct nvc0_program *vp, struct nv50_ir_prog_info *info)
}
static void
-nvc0_tp_get_tess_mode(struct nvc0_program *tp, struct nv50_ir_prog_info *info)
+nvc0_tp_get_tess_mode(struct nvc0_program *tp, struct nv50_ir_prog_info_out *info)
{
if (info->prop.tp.outputPrim == PIPE_PRIM_MAX) {
tp->tp.tess_mode = ~0;
@@ -339,7 +339,7 @@ nvc0_tp_get_tess_mode(struct nvc0_program *tp, struct nv50_ir_prog_info *info)
}
static int
-nvc0_tcp_gen_header(struct nvc0_program *tcp, struct nv50_ir_prog_info *info)
+nvc0_tcp_gen_header(struct nvc0_program *tcp, struct nv50_ir_prog_info_out *info)
{
unsigned opcs = 6; /* output patch constants (at least the TessFactors) */
@@ -370,7 +370,7 @@ nvc0_tcp_gen_header(struct nvc0_program *tcp, struct nv50_ir_prog_info *info)
}
static int
-nvc0_tep_gen_header(struct nvc0_program *tep, struct nv50_ir_prog_info *info)
+nvc0_tep_gen_header(struct nvc0_program *tep, struct nv50_ir_prog_info_out *info)
{
tep->hdr[0] = 0x20061 | (3 << 10);
tep->hdr[4] = 0xff000;
@@ -385,7 +385,7 @@ nvc0_tep_gen_header(struct nvc0_program *tep, struct nv50_ir_prog_info *info)
}
static int
-nvc0_gp_gen_header(struct nvc0_program *gp, struct nv50_ir_prog_info *info)
+nvc0_gp_gen_header(struct nvc0_program *gp, struct nv50_ir_prog_info_out *info)
{
gp->hdr[0] = 0x20061 | (4 << 10);
@@ -430,7 +430,7 @@ nvc0_hdr_interp_mode(const struct nv50_ir_varying *var)
}
static int
-nvc0_fp_gen_header(struct nvc0_program *fp, struct nv50_ir_prog_info *info)
+nvc0_fp_gen_header(struct nvc0_program *fp, struct nv50_ir_prog_info_out *info)
{
unsigned i, c, a, m;
@@ -507,7 +507,7 @@ nvc0_fp_gen_header(struct nvc0_program *fp, struct nv50_ir_prog_info *info)
}
static struct nvc0_transform_feedback_state *
-nvc0_program_create_tfb_state(const struct nv50_ir_prog_info *info,
+nvc0_program_create_tfb_state(const struct nv50_ir_prog_info_out *info,
const struct pipe_stream_output_info *pso)
{
struct nvc0_transform_feedback_state *tfb;
@@ -571,6 +571,7 @@ nvc0_program_translate(struct nvc0_program *prog, uint16_t chipset,
struct pipe_debug_callback *debug)
{
struct nv50_ir_prog_info *info;
+ struct nv50_ir_prog_info_out info_out = {};
int ret;
info = CALLOC_STRUCT(nv50_ir_prog_info);
@@ -603,8 +604,6 @@ nvc0_program_translate(struct nvc0_program *prog, uint16_t chipset,
info->optLevel = 3;
#endif
- info->bin.smemSize = prog->cp.smem_size;
- info->io.genUserClip = prog->vp.num_ucps;
info->io.auxCBSlot = 15;
info->io.msInfoCBSlot = 15;
info->io.ucpBase = NVC0_CB_AUX_UCP_INFO;
@@ -631,42 +630,46 @@ nvc0_program_translate(struct nvc0_program *prog, uint16_t chipset,
info->assignSlots = nvc0_program_assign_varying_slots;
- ret = nv50_ir_generate_code(info);
+ /* these fields might be overwritten by the compiler */
+ info_out.bin.smemSize = prog->cp.smem_size;
+ info_out.io.genUserClip = prog->vp.num_ucps;
+
+ ret = nv50_ir_generate_code(info, &info_out);
if (ret) {
NOUVEAU_ERR("shader translation failed: %i\n", ret);
goto out;
}
- prog->code = info->bin.code;
- prog->code_size = info->bin.codeSize;
- prog->relocs = info->bin.relocData;
- prog->fixups = info->bin.fixupData;
- prog->num_gprs = MAX2(4, (info->bin.maxGPR + 1));
- prog->cp.smem_size = info->bin.smemSize;
- prog->num_barriers = info->numBarriers;
+ prog->code = info_out.bin.code;
+ prog->code_size = info_out.bin.codeSize;
+ prog->relocs = info_out.bin.relocData;
+ prog->fixups = info_out.bin.fixupData;
+ prog->num_gprs = MAX2(4, (info_out.bin.maxGPR + 1));
+ prog->cp.smem_size = info_out.bin.smemSize;
+ prog->num_barriers = info_out.numBarriers;
- prog->vp.need_vertex_id = info->io.vertexId < PIPE_MAX_SHADER_INPUTS;
- prog->vp.need_draw_parameters = info->prop.vp.usesDrawParameters;
+ prog->vp.need_vertex_id = info_out.io.vertexId < PIPE_MAX_SHADER_INPUTS;
+ prog->vp.need_draw_parameters = info_out.prop.vp.usesDrawParameters;
- if (info->io.edgeFlagOut < PIPE_MAX_ATTRIBS)
- info->out[info->io.edgeFlagOut].mask = 0; /* for headergen */
- prog->vp.edgeflag = info->io.edgeFlagIn;
+ if (info_out.io.edgeFlagOut < PIPE_MAX_ATTRIBS)
+ info_out.out[info_out.io.edgeFlagOut].mask = 0; /* for headergen */
+ prog->vp.edgeflag = info_out.io.edgeFlagIn;
switch (prog->type) {
case PIPE_SHADER_VERTEX:
- ret = nvc0_vp_gen_header(prog, info);
+ ret = nvc0_vp_gen_header(prog, &info_out);
break;
case PIPE_SHADER_TESS_CTRL:
- ret = nvc0_tcp_gen_header(prog, info);
+ ret = nvc0_tcp_gen_header(prog, &info_out);
break;
case PIPE_SHADER_TESS_EVAL:
- ret = nvc0_tep_gen_header(prog, info);
+ ret = nvc0_tep_gen_header(prog, &info_out);
break;
case PIPE_SHADER_GEOMETRY:
- ret = nvc0_gp_gen_header(prog, info);
+ ret = nvc0_gp_gen_header(prog, &info_out);
break;
case PIPE_SHADER_FRAGMENT:
- ret = nvc0_fp_gen_header(prog, info);
+ ret = nvc0_fp_gen_header(prog, &info_out);
break;
case PIPE_SHADER_COMPUTE:
break;
@@ -678,10 +681,10 @@ nvc0_program_translate(struct nvc0_program *prog, uint16_t chipset,
if (ret)
goto out;
- if (info->bin.tlsSpace) {
- assert(info->bin.tlsSpace < (1 << 24));
+ if (info_out.bin.tlsSpace) {
+ assert(info_out.bin.tlsSpace < (1 << 24));
prog->hdr[0] |= 1 << 26;
- prog->hdr[1] |= align(info->bin.tlsSpace, 0x10); /* l[] size */
+ prog->hdr[1] |= align(info_out.bin.tlsSpace, 0x10); /* l[] size */
prog->need_tls = true;
}
/* TODO: factor 2 only needed where joinat/precont is used,
@@ -693,22 +696,22 @@ nvc0_program_translate(struct nvc0_program *prog, uint16_t chipset,
prog->need_tls = true;
}
*/
- if (info->io.globalAccess)
+ if (info_out.io.globalAccess)
prog->hdr[0] |= 1 << 26;
- if (info->io.globalAccess & 0x2)
+ if (info_out.io.globalAccess & 0x2)
prog->hdr[0] |= 1 << 16;
- if (info->io.fp64)
+ if (info_out.io.fp64)
prog->hdr[0] |= 1 << 27;
if (prog->pipe.stream_output.num_outputs)
- prog->tfb = nvc0_program_create_tfb_state(info,
+ prog->tfb = nvc0_program_create_tfb_state(&info_out,
&prog->pipe.stream_output);
pipe_debug_message(debug, SHADER_INFO,
"type: %d, local: %d, shared: %d, gpr: %d, inst: %d, bytes: %d",
- prog->type, info->bin.tlsSpace, info->bin.smemSize,
- prog->num_gprs, info->bin.instructions,
- info->bin.codeSize);
+ prog->type, info_out.bin.tlsSpace, info_out.bin.smemSize,
+ prog->num_gprs, info_out.bin.instructions,
+ info_out.bin.codeSize);
#ifndef NDEBUG
if (debug_get_option("NV50_PROG_CHIPSET", NULL) && info->dbgFlags)
--
2.21.1
More information about the mesa-dev mailing list