nv50_program.c revision 6d0f7ea95475009ee17862786469f7b9a34a797f
1f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_context.h"
2f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_defines.h"
3f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_state.h"
4f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_inlines.h"
5f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
6f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_shader_tokens.h"
7f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "tgsi/util/tgsi_parse.h"
8f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "tgsi/util/tgsi_util.h"
9f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
10f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "nv50_context.h"
11f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "nv50_state.h"
12f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
13f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#define NV50_SU_MAX_TEMP 64
14f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
159a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs/* ARL - gallium craps itself on progs/vp/arl.txt
1621e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs *
1721e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs * MSB - Like MAD, but MUL+SUB
1821e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs * 	- Fuck it off, introduce a way to negate args for ops that
1921e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs * 	  support it.
2021e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs *
21ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs * Look into inlining IMMD for ops other than MOV (make it general?)
2233e4d30d50344be26398a51365bea1be37487403Ben Skeggs * 	- Maybe even relax restrictions a bit, can't do P_RESULT + P_IMMD,
2333e4d30d50344be26398a51365bea1be37487403Ben Skeggs * 	  but can emit to P_TEMP first - then MOV later. NVIDIA does this
24ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs *
25ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs * Verify half-insns work where expected - and force disable them where they
26ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs * don't work - MUL has it forcibly disabled atm as it fixes POW..
27afcaeaa0e4dc3ced40621c76304a2c0c5a3ab403Ben Skeggs *
28afcaeaa0e4dc3ced40621c76304a2c0c5a3ab403Ben Skeggs * FUCK! watch dst==src vectors, can overwrite components that are needed.
29afcaeaa0e4dc3ced40621c76304a2c0c5a3ab403Ben Skeggs * 	ie. SUB R0, R0.yzxw, R0
30776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs *
316d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs * MOV dst, -src
326d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs * 	"delta" tmp, -src (0xa0000204,0xe4004780 - delta r0, -r0)
336d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs * 	mov dst, tmp
346d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs *
35b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs * Things to check with renouveau:
36b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs * 	FP attr/result assignment - how?
376d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs * 		attrib
386d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs * 			- 0x16bc maps vp output onto fp hpos
396d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs * 			- 0x16c0 maps vp output onto fp col0
406d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs * 		result
416d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs * 			- colr always 0-3
426d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs * 			- depr always 4
436d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs * 0x16bc->0x16e8 --> some binding between vp/fp regs
446d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs * 0x16b8 --> VP output count
456d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs *
466d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs * 0x1298 --> "MOV rcol.x, fcol.y" "MOV depr, fcol.y" = 0x00000005
476d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs * 	      "MOV rcol.x, fcol.y" = 0x00000004
486d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs * 0x19a8 --> as above but 0x00000100 and 0x00000000
496d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs * 	- 0x00100000 used when KIL used
506d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs * 0x196c --> as above but 0x00000011 and 0x00000000
516d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs *
526d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs * 0x1988 --> 0xXXNNNNNN
536d0f7ea95475009ee17862786469f7b9a34a797fBen Skeggs * 	- XX == FP high something
5421e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs */
/* One shader register as tracked by the code generator. */
struct nv50_reg {
	/* Register file this entry lives in. */
	enum {
		P_TEMP,		/* temporary; backed by a slot in nv50_pc.r_temp[] */
		P_ATTR,		/* shader input attribute */
		P_RESULT,	/* shader output */
		P_CONST,	/* constant-buffer value */
		P_IMMD		/* immediate stored in nv50_pc.immd_buf */
	} type;
	/* -1 for registers created by alloc_temp()/alloc_immd(). */
	int index;

	/* Hardware slot. alloc_reg() treats a negative value on a P_TEMP as
	 * "no slot assigned yet". */
	int hw;
	/* Presumably a "negate this operand" flag; it is not read anywhere
	 * in the visible part of the file -- TODO confirm. */
	int neg;
};
68f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
69f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstruct nv50_pc {
70f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_program *p;
71f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
72f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	/* hw resources */
73f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *r_temp[NV50_SU_MAX_TEMP];
74f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
75f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	/* tgsi resources */
76f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *temp;
77f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int temp_nr;
78f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *attr;
79f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int attr_nr;
80f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *result;
81f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int result_nr;
82f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *param;
83f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int param_nr;
84f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *immd;
85f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	float *immd_buf;
86f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int immd_nr;
872a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
8852a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	struct nv50_reg *temp_temp[8];
892a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	unsigned temp_temp_nr;
90f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs};
91f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
92f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic void
93f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsalloc_reg(struct nv50_pc *pc, struct nv50_reg *reg)
94f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
95f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int i;
96f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
978ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	if (reg->type != P_TEMP)
98f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return;
99f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1008ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	if (reg->hw >= 0) {
1018ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		/*XXX: do this here too to catch FP temp-as-attr usage..
1028ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		 *     not clean, but works */
1038ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		if (pc->p->cfg.high_temp < (reg->hw + 1))
1048ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			pc->p->cfg.high_temp = reg->hw + 1;
1058ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		return;
1068ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	}
1078ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
108f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (i = 0; i < NV50_SU_MAX_TEMP; i++) {
109f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!(pc->r_temp[i])) {
110f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			pc->r_temp[i] = reg;
111f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			reg->hw = i;
1128ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			if (pc->p->cfg.high_temp < (i + 1))
1138ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				pc->p->cfg.high_temp = i + 1;
114f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			return;
115f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
116f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
117f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
118f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	assert(0);
119f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
120f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
121f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic struct nv50_reg *
122f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsalloc_temp(struct nv50_pc *pc, struct nv50_reg *dst)
123f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
124f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *r;
125f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int i;
126f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
127f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (dst && dst->type == P_TEMP && dst->hw == -1)
128f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return dst;
129f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
130f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (i = 0; i < NV50_SU_MAX_TEMP; i++) {
131f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->r_temp[i]) {
132f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r = CALLOC_STRUCT(nv50_reg);
133f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r->type = P_TEMP;
134f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r->index = -1;
135f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r->hw = i;
136f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			pc->r_temp[i] = r;
137f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			return r;
138f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
139f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
140f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
141f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	assert(0);
142f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return NULL;
143f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
144f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
145f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic void
146f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsfree_temp(struct nv50_pc *pc, struct nv50_reg *r)
147f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
148f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (r->index == -1) {
149f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		FREE(pc->r_temp[r->hw]);
150f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->r_temp[r->hw] = NULL;
151f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
152f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
153f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
154f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic struct nv50_reg *
1552a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggstemp_temp(struct nv50_pc *pc)
1562a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
15752a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	if (pc->temp_temp_nr >= 8)
1582a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		assert(0);
1592a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
1602a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	pc->temp_temp[pc->temp_temp_nr] = alloc_temp(pc, NULL);
1612a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	return pc->temp_temp[pc->temp_temp_nr++];
1622a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
1632a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
1642a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
1652a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggskill_temp_temp(struct nv50_pc *pc)
1662a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
1672a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	int i;
1682a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
1692a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	for (i = 0; i < pc->temp_temp_nr; i++)
1702a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		free_temp(pc, pc->temp_temp[i]);
1712a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	pc->temp_temp_nr = 0;
1722a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
1732a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
17433e4d30d50344be26398a51365bea1be37487403Ben Skeggsstatic int
17533e4d30d50344be26398a51365bea1be37487403Ben Skeggsctor_immd(struct nv50_pc *pc, float x, float y, float z, float w)
17633e4d30d50344be26398a51365bea1be37487403Ben Skeggs{
17733e4d30d50344be26398a51365bea1be37487403Ben Skeggs	pc->immd_buf = realloc(pc->immd_buf, (pc->immd_nr + 1) * 4 *
17833e4d30d50344be26398a51365bea1be37487403Ben Skeggs					     sizeof(float));
17933e4d30d50344be26398a51365bea1be37487403Ben Skeggs	pc->immd_buf[(pc->immd_nr * 4) + 0] = x;
180686bc00c05094e8678747c111a6a70ad4b7063e3Ben Skeggs	pc->immd_buf[(pc->immd_nr * 4) + 1] = y;
181686bc00c05094e8678747c111a6a70ad4b7063e3Ben Skeggs	pc->immd_buf[(pc->immd_nr * 4) + 2] = z;
182686bc00c05094e8678747c111a6a70ad4b7063e3Ben Skeggs	pc->immd_buf[(pc->immd_nr * 4) + 3] = w;
18333e4d30d50344be26398a51365bea1be37487403Ben Skeggs
18433e4d30d50344be26398a51365bea1be37487403Ben Skeggs	return pc->immd_nr++;
18533e4d30d50344be26398a51365bea1be37487403Ben Skeggs}
18633e4d30d50344be26398a51365bea1be37487403Ben Skeggs
18733e4d30d50344be26398a51365bea1be37487403Ben Skeggsstatic struct nv50_reg *
18833e4d30d50344be26398a51365bea1be37487403Ben Skeggsalloc_immd(struct nv50_pc *pc, float f)
18933e4d30d50344be26398a51365bea1be37487403Ben Skeggs{
19033e4d30d50344be26398a51365bea1be37487403Ben Skeggs	struct nv50_reg *r = CALLOC_STRUCT(nv50_reg);
19133e4d30d50344be26398a51365bea1be37487403Ben Skeggs	unsigned hw;
19233e4d30d50344be26398a51365bea1be37487403Ben Skeggs
19301e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	hw = ctor_immd(pc, f, 0, 0, 0) * 4;
19433e4d30d50344be26398a51365bea1be37487403Ben Skeggs	r->type = P_IMMD;
19533e4d30d50344be26398a51365bea1be37487403Ben Skeggs	r->hw = hw;
19633e4d30d50344be26398a51365bea1be37487403Ben Skeggs	r->index = -1;
19733e4d30d50344be26398a51365bea1be37487403Ben Skeggs	return r;
19833e4d30d50344be26398a51365bea1be37487403Ben Skeggs}
19933e4d30d50344be26398a51365bea1be37487403Ben Skeggs
20055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic void
20155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsemit(struct nv50_pc *pc, unsigned *inst)
20255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
20355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	struct nv50_program *p = pc->p;
20455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
205bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (inst[0] & 1) {
206bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		p->insns_nr += 2;
207bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		p->insns = realloc(p->insns, sizeof(unsigned) * p->insns_nr);
208bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		memcpy(p->insns + (p->insns_nr - 2), inst, sizeof(unsigned)*2);
209bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	} else {
210bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		p->insns_nr += 1;
211bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		p->insns = realloc(p->insns, sizeof(unsigned) * p->insns_nr);
212bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		memcpy(p->insns + (p->insns_nr - 1), inst, sizeof(unsigned));
213bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	}
21455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
21555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
21655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void set_long(struct nv50_pc *, unsigned *);
21755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
21855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic boolean
21955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsis_long(unsigned *inst)
22055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
22155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (inst[0] & 1)
22255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		return TRUE;
22355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	return FALSE;
22455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
22555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
22655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic boolean
22755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsis_immd(unsigned *inst)
22855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
22955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (is_long(inst) && (inst[1] & 3) == 3)
23055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		return TRUE;
23155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	return FALSE;
23255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
23355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
23455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
23555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsset_pred(struct nv50_pc *pc, unsigned pred, unsigned idx, unsigned *inst)
23655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
23755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_long(pc, inst);
23855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] &= ~((0x1f << 7) | (0x3 << 12));
23955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] |= (pred << 7) | (idx << 12);
24055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
24155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
24255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
24355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsset_pred_wr(struct nv50_pc *pc, unsigned on, unsigned idx, unsigned *inst)
24455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
24555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_long(pc, inst);
24655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] &= ~((0x3 << 4) | (1 << 6));
24755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] |= (idx << 4) | (on << 6);
24855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
24955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
25055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
25155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsset_long(struct nv50_pc *pc, unsigned *inst)
25255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
25355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (is_long(inst))
25455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		return;
25555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
25655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[0] |= 1;
25755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_pred(pc, 0xf, 0, inst);
25855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_pred_wr(pc, 0, 0, inst);
25955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
26055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
26155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
26255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsset_dst(struct nv50_pc *pc, struct nv50_reg *dst, unsigned *inst)
26355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
26455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (dst->type == P_RESULT) {
26555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		set_long(pc, inst);
26655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[1] |= 0x00000008;
26755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	}
26855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
26955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	alloc_reg(pc, dst);
27055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[0] |= (dst->hw << 2);
27155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
27255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
27355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
27455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsset_immd(struct nv50_pc *pc, struct nv50_reg *imm, unsigned *inst)
27555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
27655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	unsigned val = fui(pc->immd_buf[imm->hw]); /* XXX */
27755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
27855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_long(pc, inst);
27955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	/*XXX: can't be predicated - bits overlap.. catch cases where both
28055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	 *     are required and avoid them. */
28155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_pred(pc, 0, 0, inst);
28255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_pred_wr(pc, 0, 0, inst);
28355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
28455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] |= 0x00000002 | 0x00000001;
28555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[0] |= (val & 0x3f) << 16;
28655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] |= (val >> 6) << 2;
28755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
28855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
28955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic void
2908ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggsemit_interp(struct nv50_pc *pc, struct nv50_reg *dst,
2918ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	    struct nv50_reg *src, struct nv50_reg *iv, boolean noperspective)
2928ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs{
2938ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	unsigned inst[2] = { 0, 0 };
2948ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
2958ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	inst[0] |= 0x80000000;
2968ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	set_dst(pc, dst, inst);
2978ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	alloc_reg(pc, iv);
2988ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	inst[0] |= (iv->hw << 9);
2998ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	alloc_reg(pc, src);
3008ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	inst[0] |= (src->hw << 16);
3018ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	if (noperspective)
3028ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		inst[0] |= (1 << 25);
3038ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
3048ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	emit(pc, inst);
3058ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs}
3068ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
3078ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggsstatic void
3082a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsset_cseg(struct nv50_pc *pc, struct nv50_reg *src, unsigned *inst)
3092a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
3102a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	set_long(pc, inst);
3112a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_IMMD) {
3122a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		inst[1] |= (NV50_CB_PMISC << 22);
3132a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else {
314b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs		if (pc->p->type == PIPE_SHADER_VERTEX)
3152a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			inst[1] |= (NV50_CB_PVP << 22);
3162a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		else
3172a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			inst[1] |= (NV50_CB_PFP << 22);
3182a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
3192a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
3202a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3212a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
32255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsemit_mov(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
32355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
32455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	unsigned inst[2] = { 0, 0 };
32555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
32655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[0] |= 0x10000000;
32755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
32855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_dst(pc, dst, inst);
32955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
33055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (dst->type != P_RESULT && src->type == P_IMMD) {
33155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		set_immd(pc, src, inst);
33255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		/*XXX: 32-bit, but steals part of "half" reg space - need to
33355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		 *     catch and handle this case if/when we do half-regs
33455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		 */
33555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[0] |= 0x00008000;
33655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	} else
33755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (src->type == P_IMMD || src->type == P_CONST) {
33855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		set_long(pc, inst);
3392a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		set_cseg(pc, src, inst);
34055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[0] |= (src->hw << 9);
34155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[1] |= 0x20000000; /* src0 const? */
34255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	} else {
34355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		if (src->type == P_ATTR) {
34455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs			set_long(pc, inst);
34555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs			inst[1] |= 0x00200000;
34655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		}
34755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
34855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		alloc_reg(pc, src);
34955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[0] |= (src->hw << 9);
35055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	}
35155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
35255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	/* We really should support "half" instructions here at some point,
35355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	 * but I don't feel confident enough about them yet.
35455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	 */
35555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_long(pc, inst);
35655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (is_long(inst) && !is_immd(inst)) {
35755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[1] |= 0x04000000; /* 32-bit */
35855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[1] |= 0x0003c000; /* "subsubop" 0xf == mov */
35955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	}
36055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
36155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	emit(pc, inst);
36255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
36355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
364f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic boolean
3652a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggscheck_swap_src_0_1(struct nv50_pc *pc,
3662a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		   struct nv50_reg **s0, struct nv50_reg **s1)
3672a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
3682a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	struct nv50_reg *src0 = *s0, *src1 = *s1;
3692a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3702a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src0->type == P_CONST) {
3712a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		if (src1->type != P_CONST) {
3722a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s0 = src1;
3732a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s1 = src0;
3742a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			return TRUE;
3752a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		}
3762a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
3772a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src1->type == P_ATTR) {
3782a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		if (src0->type != P_ATTR) {
3792a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s0 = src1;
3802a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s1 = src0;
3812a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			return TRUE;
3822a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		}
3832a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
3842a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3852a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	return FALSE;
3862a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
3872a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3882a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
3892a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsset_src_0(struct nv50_pc *pc, struct nv50_reg *src, unsigned *inst)
3902a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
3912a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_ATTR) {
3922a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		set_long(pc, inst);
3932a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		inst[1] |= 0x00200000;
3942a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
3952a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_CONST || src->type == P_IMMD) {
3962a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		struct nv50_reg *temp = temp_temp(pc);
3972a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3982a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mov(pc, temp, src);
3992a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		src = temp;
4002a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
4012a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4022a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	alloc_reg(pc, src);
4032a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	inst[0] |= (src->hw << 9);
4042a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
4052a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4062a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
4072a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsset_src_1(struct nv50_pc *pc, struct nv50_reg *src, unsigned *inst)
4082a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
4092a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_ATTR) {
4102a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		struct nv50_reg *temp = temp_temp(pc);
4112a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4122a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mov(pc, temp, src);
4132a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		src = temp;
4142a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
4152a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_CONST || src->type == P_IMMD) {
41634a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs		assert(!(inst[0] & 0x00800000));
41734a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs		if (inst[0] & 0x01000000) {
41834a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			struct nv50_reg *temp = temp_temp(pc);
41934a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs
42034a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			emit_mov(pc, temp, src);
42134a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			src = temp;
42234a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs		} else {
42334a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			set_cseg(pc, src, inst);
42434a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			inst[0] |= 0x00800000;
42534a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs		}
4262a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
4272a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4282a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	alloc_reg(pc, src);
4292a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	inst[0] |= (src->hw << 16);
4302a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
4312a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4322a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
4332a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsset_src_2(struct nv50_pc *pc, struct nv50_reg *src, unsigned *inst)
4342a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
4352a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	set_long(pc, inst);
4362a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4372a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_ATTR) {
4382a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		struct nv50_reg *temp = temp_temp(pc);
4392a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4402a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mov(pc, temp, src);
4412a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		src = temp;
4422a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
4432a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_CONST || src->type == P_IMMD) {
44434a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs		assert(!(inst[0] & 0x01000000));
44534a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs		if (inst[0] & 0x00800000) {
44634a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			struct nv50_reg *temp = temp_temp(pc);
44734a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs
44834a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			emit_mov(pc, temp, src);
44934a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			src = temp;
45034a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs		} else {
45134a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			set_cseg(pc, src, inst);
45234a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			inst[0] |= 0x01000000;
45334a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs		}
4542a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
4552a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4562a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	alloc_reg(pc, src);
4572a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	inst[1] |= (src->hw << 14);
4582a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
4592a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/* Emit dst = src0 * src1.
 *
 * Uses opcode bits 0xc0000000 in the first word and is always encoded as a
 * long instruction.
 */
static void
emit_mul(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
	 struct nv50_reg *src1)
{
	unsigned op[2] = { 0xc0000000, 0 };

	set_long(pc, op);

	/* Give check_swap_src_0_1() the chance to exchange the operands;
	 * its result is not needed here.
	 */
	check_swap_src_0_1(pc, &src0, &src1);

	set_dst(pc, dst, op);
	set_src_0(pc, src0, op);
	set_src_1(pc, src1, op);

	emit(pc, op);
}
4762a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/* Emit dst = src0 + src1 (opcode bits 0xb0000000).
 *
 * The instruction is not forced long here.  If encoding the destination or
 * the first source left it in long form, the second operand goes through
 * set_src_2(); otherwise it goes through set_src_1().
 */
static void
emit_add(struct nv50_pc *pc, struct nv50_reg *dst,
	 struct nv50_reg *src0, struct nv50_reg *src1)
{
	unsigned op[2] = { 0xb0000000, 0 };

	check_swap_src_0_1(pc, &src0, &src1);
	set_dst(pc, dst, op);
	set_src_0(pc, src0, op);

	if (!is_long(op))
		set_src_1(pc, src1, op);
	else
		set_src_2(pc, src1, op);

	emit(pc, op);
}
49552a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs
/* Emit a two-operand instruction from the 0xb0000000 opcode group whose
 * exact operation is selected by `sub`, stored in inst[1] from bit 29 up.
 *
 * NOTE(review): emit_lit() uses sub 4 and then sub 5 to clamp a value
 * between a lower and an upper bound, so 4 looks like max and 5 like min;
 * confirm against the ISA notes.
 */
static void
emit_minmax(struct nv50_pc *pc, unsigned sub, struct nv50_reg *dst,
	    struct nv50_reg *src0, struct nv50_reg *src1)
{
	unsigned op[2] = { 0, 0 };

	/* Always a long instruction: the sub-op lives in the second word. */
	set_long(pc, op);
	op[0] |= 0xb0000000;
	op[1] |= sub << 29;

	check_swap_src_0_1(pc, &src0, &src1);
	set_dst(pc, dst, op);
	set_src_0(pc, src0, op);
	set_src_1(pc, src1, op);

	emit(pc, op);
}
5132a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/* Emit dst = src0 - src1, built on the add opcode (0xb0000000) in long
 * form with a modifier bit in inst[1].
 *
 * Which modifier bit is used depends on whether check_swap_src_0_1()
 * reports that it exchanged the operands: 0x04000000 if it did,
 * 0x08000000 otherwise.
 * NOTE(review): presumably these negate the first and the second encoded
 * operand respectively, so the subtraction keeps its meaning after a swap.
 */
static void
emit_sub(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
	 struct nv50_reg *src1)
{
	unsigned op[2] = { 0xb0000000, 0 };
	unsigned modifier;

	set_long(pc, op);

	modifier = check_swap_src_0_1(pc, &src0, &src1) ? 0x04000000
							: 0x08000000;
	op[1] |= modifier;

	set_dst(pc, dst, op);
	set_src_0(pc, src0, op);
	set_src_2(pc, src1, op);

	emit(pc, op);
}
5342a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/* Emit dst = src0 * src1 + src2 (opcode bits 0xe0000000).
 *
 * Only the two multiplicands are offered to check_swap_src_0_1(); the
 * addend is always encoded through set_src_2(), which also puts the
 * instruction into long form.
 */
static void
emit_mad(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
	 struct nv50_reg *src1, struct nv50_reg *src2)
{
	unsigned op[2] = { 0xe0000000, 0 };

	check_swap_src_0_1(pc, &src0, &src1);

	set_dst(pc, dst, op);
	set_src_0(pc, src0, op);
	set_src_1(pc, src1, op);
	set_src_2(pc, src2, op);

	emit(pc, op);
}
5512a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/* Emit dst = src0 * src1 - src2.
 *
 * Same encoding as emit_mad() (opcode bits 0xe0000000), in long form, with
 * bit 0x08000000 of inst[1] set to turn the add into a subtract.
 */
static void
emit_msb(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
	 struct nv50_reg *src1, struct nv50_reg *src2)
{
	unsigned op[2] = { 0xe0000000, 0 };

	set_long(pc, op);
	op[1] |= 0x08000000; /* src0 * src1 - src2 */

	check_swap_src_0_1(pc, &src0, &src1);

	set_dst(pc, dst, op);
	set_src_0(pc, src0, op);
	set_src_1(pc, src1, op);
	set_src_2(pc, src2, op);

	emit(pc, op);
}
57021e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs
/* Emit a single-operand instruction from the 0x90000000 opcode group.
 *
 * `sub` selects the operation.  Sub-op 0 needs no second word, so the
 * instruction is left as is; any other value forces the long form and is
 * stored in inst[1] from bit 29 up.
 */
static void
emit_flop(struct nv50_pc *pc, unsigned sub,
	  struct nv50_reg *dst, struct nv50_reg *src)
{
	unsigned op[2] = { 0x90000000, 0 };

	if (sub != 0) {
		set_long(pc, op);
		op[1] |= sub << 29;
	}

	set_dst(pc, dst, op);
	set_src_0(pc, src, op);

	emit(pc, op);
}
5882a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/* Emit the "pre-ex2" instruction: dst = preex2(src).
 *
 * emit_pow() issues this immediately before the sub-op 6 flop, so it
 * prepares the argument for that instruction.  The encoding uses opcode
 * bits 0xb0000000, long form, with sub-op 6 and bit 0x00004000 in the
 * second word.
 */
static void
emit_preex2(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
{
	unsigned inst[2] = { 0, 0 };

	inst[0] |= 0xb0000000;

	set_dst(pc, dst, inst);
	set_src_0(pc, src, inst);
	set_long(pc, inst);
	/* Unsigned literal: 6 << 29 does not fit in a signed int, so
	 * shifting the plain int constant is undefined behaviour.
	 */
	inst[1] |= (6u << 29) | 0x00004000;

	emit(pc, inst);
}
603faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs
604bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs/*XXX: inaccurate results.. why? */
605bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs#define ALLOW_SET_SWAP 0
606bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
607bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggsstatic void
608bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggsemit_set(struct nv50_pc *pc, unsigned c_op, struct nv50_reg *dst,
609bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 struct nv50_reg *src0, struct nv50_reg *src1)
610bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs{
611bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	unsigned inst[2] = { 0, 0 };
612bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs#if ALLOW_SET_SWAP
613bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	unsigned inv_cop[8] = { 0, 6, 2, 4, 3, 5, 1, 7 };
614bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs#endif
615bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	struct nv50_reg *rdst;
616bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
617bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs#if ALLOW_SET_SWAP
618bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	assert(c_op <= 7);
619bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (check_swap_src_0_1(pc, &src0, &src1))
620bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		c_op = inv_cop[c_op];
621bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs#endif
622bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
623bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	rdst = dst;
624bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (dst->type != P_TEMP)
625bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		dst = alloc_temp(pc, NULL);
626bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
627bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	/* set.u32 */
628bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_long(pc, inst);
629bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[0] |= 0xb0000000;
630bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[1] |= (3 << 29);
631bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[1] |= (c_op << 14);
632bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	/*XXX: breaks things, .u32 by default?
633bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 *     decuda will disasm as .u16 and use .lo/.hi regs, but this
634bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 *     doesn't seem to match what the hw actually does.
635bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[1] |= 0x04000000; << breaks things.. .u32 by default?
636bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 */
637bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_dst(pc, dst, inst);
638bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_src_0(pc, src0, inst);
639bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_src_1(pc, src1, inst);
640bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	emit(pc, inst);
641bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
642bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	/* cvt.f32.u32 */
643bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[0] = 0xa0000001;
644bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[1] = 0x64014780;
645bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_dst(pc, rdst, inst);
646bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_src_0(pc, dst, inst);
647bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	emit(pc, inst);
648bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
649bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (dst != rdst)
650bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		free_temp(pc, dst);
651bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs}
652d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggs
/* Emit dst = floor(src), implemented with the cvt instruction.
 *
 * NOTE(review): the rounding field is labelled ".rn" below, as in the
 * original code; confirm that this value really selects round-down.
 */
static void
emit_flr(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
{
	unsigned inst[2] = { 0, 0 };

	inst[0] = 0xa0000000; /* cvt */
	set_long(pc, inst);
	/* Unsigned literal: 6 << 29 does not fit in a signed int, so
	 * shifting the plain int constant is undefined behaviour.
	 */
	inst[1] |= (6u << 29); /* cvt */
	inst[1] |= 0x08000000; /* integer mode */
	inst[1] |= 0x04000000; /* 32 bit */
	inst[1] |= ((0x1 << 3)) << 14; /* .rn */
	inst[1] |= (1 << 14); /* src .f32 */
	set_dst(pc, dst, inst);
	set_src_0(pc, src, inst);

	emit(pc, inst);
}
670b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs
671faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggsstatic void
672faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggsemit_pow(struct nv50_pc *pc, struct nv50_reg *dst,
673faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	 struct nv50_reg *v, struct nv50_reg *e)
674faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs{
675faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	struct nv50_reg *temp = alloc_temp(pc, NULL);
676faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs
677faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	emit_flop(pc, 3, temp, v);
678faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	emit_mul(pc, temp, temp, e);
679faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	emit_preex2(pc, temp, temp);
680faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	emit_flop(pc, 6, dst, temp);
681faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs
682faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	free_temp(pc, temp);
683faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs}
684faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs
/* Emit dst = |src|, implemented as a cvt instruction (32 bit, .f32
 * source) with the .abs modifier set.
 */
static void
emit_abs(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
{
	unsigned inst[2] = { 0, 0 };

	inst[0] = 0xa0000000; /* cvt */
	set_long(pc, inst);
	/* Unsigned literal: 6 << 29 does not fit in a signed int, so
	 * shifting the plain int constant is undefined behaviour.
	 */
	inst[1] |= (6u << 29); /* cvt */
	inst[1] |= 0x04000000; /* 32 bit */
	inst[1] |= (1 << 14); /* src .f32 */
	inst[1] |= ((1 << 6) << 14); /* .abs */
	set_dst(pc, dst, inst);
	set_src_0(pc, src, inst);

	emit(pc, inst);
}
701fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
70201e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggsstatic void
70301e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggsemit_lit(struct nv50_pc *pc, struct nv50_reg **dst, struct nv50_reg **src)
70401e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs{
70501e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	struct nv50_reg *one = alloc_immd(pc, 1.0);
70601e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	struct nv50_reg *zero = alloc_immd(pc, 0.0);
70701e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	struct nv50_reg *neg128 = alloc_immd(pc, -127.999999);
70801e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	struct nv50_reg *pos128 = alloc_immd(pc,  127.999999);
70901e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	struct nv50_reg *tmp[4];
71001e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
71101e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	emit_mov(pc, dst[0], one);
71201e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	emit_mov(pc, dst[3], one);
71301e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
71401e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	tmp[0] = temp_temp(pc);
71501e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	emit_minmax(pc, 4, dst[1], src[0], zero);
71601e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	set_pred_wr(pc, 1, 0, &pc->p->insns[pc->p->insns_nr - 2]);
71701e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
71801e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	tmp[1] = temp_temp(pc);
71901e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	emit_minmax(pc, 4, tmp[1], src[1], zero);
72001e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
72101e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	tmp[3] = temp_temp(pc);
72201e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	emit_minmax(pc, 4, tmp[3], src[3], neg128);
72301e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	emit_minmax(pc, 5, tmp[3], tmp[3], pos128);
72401e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
72501e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	emit_pow(pc, dst[2], tmp[1], tmp[3]);
72601e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	emit_mov(pc, dst[2], zero);
72701e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	set_pred(pc, 3, 0, &pc->p->insns[pc->p->insns_nr - 2]);
72801e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs}
72901e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
730fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggsstatic struct nv50_reg *
731fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggstgsi_dst(struct nv50_pc *pc, int c, const struct tgsi_full_dst_register *dst)
732fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs{
733fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	switch (dst->DstRegister.File) {
734fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_FILE_TEMPORARY:
735fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		return &pc->temp[dst->DstRegister.Index * 4 + c];
736fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_FILE_OUTPUT:
737fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		return &pc->result[dst->DstRegister.Index * 4 + c];
738fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_FILE_NULL:
739fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		return NULL;
740fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	default:
741fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
742fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	}
743fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
744fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	return NULL;
745fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs}
746fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
747fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggsstatic struct nv50_reg *
748fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggstgsi_src(struct nv50_pc *pc, int chan, const struct tgsi_full_src_register *src)
749fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs{
750fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	struct nv50_reg *r = NULL;
751fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	struct nv50_reg *temp;
752fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	unsigned c;
753fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
754fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	c = tgsi_util_get_full_src_register_extswizzle(src, chan);
755fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	switch (c) {
756fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_X:
757fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_Y:
758fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_Z:
759fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_W:
760fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		switch (src->SrcRegister.File) {
761fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		case TGSI_FILE_INPUT:
762fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			r = &pc->attr[src->SrcRegister.Index * 4 + c];
763fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			break;
764fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		case TGSI_FILE_TEMPORARY:
765fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			r = &pc->temp[src->SrcRegister.Index * 4 + c];
766fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			break;
767fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		case TGSI_FILE_CONSTANT:
768fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			r = &pc->param[src->SrcRegister.Index * 4 + c];
769fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			break;
770fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		case TGSI_FILE_IMMEDIATE:
771fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			r = &pc->immd[src->SrcRegister.Index * 4 + c];
772fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			break;
773fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		default:
774fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			assert(0);
775fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			break;
776fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		}
777fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
778fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_ZERO:
779fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		r = alloc_immd(pc, 0.0);
780fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
781fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_ONE:
782fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		r = alloc_immd(pc, 1.0);
783fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
784fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	default:
785fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		assert(0);
786fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
787fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	}
788fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
789fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	switch (tgsi_util_get_full_src_register_sign_mode(src, chan)) {
790fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_UTIL_SIGN_KEEP:
791fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
792fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_UTIL_SIGN_CLEAR:
793fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		temp = temp_temp(pc);
794fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		emit_abs(pc, temp, r);
795fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		r = temp;
796fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
797fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	default:
798fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		assert(0);
799fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
800fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	}
801fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
802fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	return r;
803fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs}
804fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
8052a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic boolean
806f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_tx_insn(struct nv50_pc *pc, const union tgsi_full_token *tok)
807f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
808f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	const struct tgsi_full_instruction *inst = &tok->FullInstruction;
809688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	struct nv50_reg *rdst[4], *dst[4], *src[3][4], *temp;
810688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	unsigned mask, sat;
811f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int i, c;
812f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
813f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	NOUVEAU_ERR("insn %p\n", tok);
814f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
815f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	mask = inst->FullDstRegisters[0].DstRegister.WriteMask;
816688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	sat = inst->Instruction.Saturate == TGSI_SAT_ZERO_ONE;
817f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
818f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (c = 0; c < 4; c++) {
819f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (mask & (1 << c))
820f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			dst[c] = tgsi_dst(pc, c, &inst->FullDstRegisters[0]);
821f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		else
822f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			dst[c] = NULL;
823f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
824f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
825f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (i = 0; i < inst->Instruction.NumSrcRegs; i++) {
826f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (c = 0; c < 4; c++)
827f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			src[i][c] = tgsi_src(pc, c, &inst->FullSrcRegisters[i]);
828f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
829f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
830688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	if (sat) {
831688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs		for (c = 0; c < 4; c++) {
832688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			rdst[c] = dst[c];
833688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			dst[c] = temp_temp(pc);
834688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs		}
835688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	}
836688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs
837f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	switch (inst->Instruction.Opcode) {
83868091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs	case TGSI_OPCODE_ABS:
83968091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs		for (c = 0; c < 4; c++) {
840fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			if (!(mask & (1 << c)))
841fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs				continue;
842fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			emit_abs(pc, dst[c], src[0][c]);
84368091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs		}
84468091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs		break;
8452a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_ADD:
8467df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8477df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8487df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
8492a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_add(pc, dst[c], src[0][c], src[1][c]);
8507df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
8512a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
8522a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_COS:
8537df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8547df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8557df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
8562a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_flop(pc, 5, dst[c], src[0][c]);
8577df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
8582a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
8592a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_DP3:
8602a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		temp = alloc_temp(pc, NULL);
8612a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mul(pc, temp, src[0][0], src[1][0]);
8622a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][1], src[1][1], temp);
8632a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][2], src[1][2], temp);
8647df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8657df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8667df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
8672a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mov(pc, dst[c], temp);
8687df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
8692a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		free_temp(pc, temp);
8702a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
8712a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_DP4:
8722a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		temp = alloc_temp(pc, NULL);
8732a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mul(pc, temp, src[0][0], src[1][0]);
8742a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][1], src[1][1], temp);
8752a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][2], src[1][2], temp);
8762a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][3], src[1][3], temp);
8777df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8787df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8797df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
8802a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mov(pc, dst[c], temp);
8817df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
8822a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		free_temp(pc, temp);
8832a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
88421e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	case TGSI_OPCODE_DPH:
88521e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		temp = alloc_temp(pc, NULL);
88621e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mul(pc, temp, src[0][0], src[1][0]);
88721e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mad(pc, temp, src[0][1], src[1][1], temp);
88821e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mad(pc, temp, src[0][2], src[1][2], temp);
88921e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_add(pc, temp, src[1][3], temp);
89021e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		for (c = 0; c < 4; c++) {
89121e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs			if (!(mask & (1 << c)))
89221e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs				continue;
89321e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs			emit_mov(pc, dst[c], temp);
89421e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		}
89521e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		free_temp(pc, temp);
89621e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		break;
89733e4d30d50344be26398a51365bea1be37487403Ben Skeggs	case TGSI_OPCODE_DST:
89833e4d30d50344be26398a51365bea1be37487403Ben Skeggs	{
89933e4d30d50344be26398a51365bea1be37487403Ben Skeggs		struct nv50_reg *one = alloc_immd(pc, 1.0);
9009a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 0))
9019a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mov(pc, dst[0], one);
9029a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 1))
9039a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mul(pc, dst[1], src[0][1], src[1][1]);
9049a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 2))
9059a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mov(pc, dst[2], src[0][2]);
9069a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 3))
9079a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mov(pc, dst[3], src[1][3]);
90833e4d30d50344be26398a51365bea1be37487403Ben Skeggs		FREE(one);
90933e4d30d50344be26398a51365bea1be37487403Ben Skeggs	}
91033e4d30d50344be26398a51365bea1be37487403Ben Skeggs		break;
9112a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_EX2:
912fbf4027dd9b279ec159906dcad134f71e34aaec8Ben Skeggs		temp = alloc_temp(pc, NULL);
9137df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9147df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9157df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
916d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggs			emit_preex2(pc, temp, src[0][c]);
917fbf4027dd9b279ec159906dcad134f71e34aaec8Ben Skeggs			emit_flop(pc, 6, dst[c], temp);
9187df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
919fbf4027dd9b279ec159906dcad134f71e34aaec8Ben Skeggs		free_temp(pc, temp);
9202a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
921b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs	case TGSI_OPCODE_FLR:
922b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		for (c = 0; c < 4; c++) {
923b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			if (!(mask & (1 << c)))
924b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs				continue;
925b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			emit_flr(pc, dst[c], src[0][c]);
926b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		}
927b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		break;
928b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs	case TGSI_OPCODE_FRC:
929b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		temp = alloc_temp(pc, NULL);
930b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		for (c = 0; c < 4; c++) {
931b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			if (!(mask & (1 << c)))
932b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs				continue;
933b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			emit_flr(pc, temp, src[0][c]);
934b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			emit_sub(pc, dst[c], src[0][c], temp);
935b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		}
936b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		free_temp(pc, temp);
937b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		break;
93801e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	case TGSI_OPCODE_LIT:
9399a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		/*XXX: writemask */
94001e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs		emit_lit(pc, &dst[0], &src[0][0]);
94101e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs		break;
9422a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_LG2:
9437df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9447df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9457df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
9462a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_flop(pc, 3, dst[c], src[0][c]);
9477df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
9482a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
9492a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_MAD:
9507df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9517df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9527df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
9532a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mad(pc, dst[c], src[0][c], src[1][c], src[2][c]);
9547df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
9552a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
95652a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	case TGSI_OPCODE_MAX:
9577df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9587df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9597df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
96052a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs			emit_minmax(pc, 4, dst[c], src[0][c], src[1][c]);
9617df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
96252a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs		break;
96352a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	case TGSI_OPCODE_MIN:
9647df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9657df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9667df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
96752a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs			emit_minmax(pc, 5, dst[c], src[0][c], src[1][c]);
9687df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
96952a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs		break;
970f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_OPCODE_MOV:
9717df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9727df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9737df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
97455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs			emit_mov(pc, dst[c], src[0][c]);
9757df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
97638ce697e5942550888c28bd4859ca2a92f247bf7Ben Skeggs		break;
9772a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_MUL:
9787df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9797df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9807df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
9812a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mul(pc, dst[c], src[0][c], src[1][c]);
9827df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
9832a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
984ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs	case TGSI_OPCODE_POW:
985ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		temp = alloc_temp(pc, NULL);
986faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs		emit_pow(pc, temp, src[0][0], src[1][0]);
987ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		for (c = 0; c < 4; c++) {
988ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs			if (!(mask & (1 << c)))
989ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs				continue;
990ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs			emit_mov(pc, dst[c], temp);
991ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		}
992ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		free_temp(pc, temp);
993ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		break;
9942a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_RCP:
9957df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9967df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9977df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
9982a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_flop(pc, 0, dst[c], src[0][c]);
9997df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
10002a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
10012a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_RSQ:
10027df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
10037df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
10047df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
10052a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_flop(pc, 2, dst[c], src[0][c]);
10067df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
10072a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
1008bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	case TGSI_OPCODE_SGE:
1009bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		for (c = 0; c < 4; c++) {
1010bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			if (!(mask & (1 << c)))
1011bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs				continue;
1012bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			emit_set(pc, 6, dst[c], src[0][c], src[1][c]);
1013bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		}
1014bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		break;
10152a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_SIN:
10167df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
10177df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
10187df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
10192a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_flop(pc, 4, dst[c], src[0][c]);
10207df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
10212a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
1022bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	case TGSI_OPCODE_SLT:
1023bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		for (c = 0; c < 4; c++) {
1024bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			if (!(mask & (1 << c)))
1025bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs				continue;
1026bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			emit_set(pc, 1, dst[c], src[0][c], src[1][c]);
1027bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		}
1028bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		break;
10292a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_SUB:
10307df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
10317df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
10327df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
10332a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_sub(pc, dst[c], src[0][c], src[1][c]);
10347df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
10352a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
103621e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	case TGSI_OPCODE_XPD:
103721e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		temp = alloc_temp(pc, NULL);
10389a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 0)) {
10399a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mul(pc, temp, src[0][2], src[1][1]);
10409a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_msb(pc, dst[0], src[0][1], src[1][2], temp);
10419a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		}
10429a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 1)) {
10439a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mul(pc, temp, src[0][0], src[1][2]);
10449a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_msb(pc, dst[1], src[0][2], src[1][0], temp);
10459a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		}
10469a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 2)) {
10479a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mul(pc, temp, src[0][1], src[1][0]);
10489a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_msb(pc, dst[2], src[0][0], src[1][1], temp);
10499a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		}
105021e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		free_temp(pc, temp);
105121e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		break;
1052f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_OPCODE_END:
1053f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		break;
1054f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	default:
1055f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		NOUVEAU_ERR("invalid opcode %d\n", inst->Instruction.Opcode);
1056f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return FALSE;
1057f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1058f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1059688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	if (sat) {
1060688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs		for (c = 0; c < 4; c++) {
1061688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			unsigned inst[2] = { 0, 0 };
1062688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs
1063688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			if (!(mask & (1 << c)))
1064688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs				continue;
1065688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs
1066688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			inst[0] = 0xa0000000; /* cvt */
1067688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			set_long(pc, inst);
1068688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			inst[1] |= (6 << 29); /* cvt */
1069688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			inst[1] |= 0x04000000; /* 32 bit */
1070688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			inst[1] |= (1 << 14); /* src .f32 */
1071688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			inst[1] |= ((1 << 5) << 14); /* .sat */
1072688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			set_dst(pc, rdst[c], inst);
1073688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			set_src_0(pc, dst[c], inst);
1074688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			emit(pc, inst);
1075688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs		}
1076688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	}
1077688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs
107852a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	kill_temp_temp(pc);
1079f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return TRUE;
1080f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1081f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1082f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic boolean
1083f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_tx_prep(struct nv50_pc *pc)
1084f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1085f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct tgsi_parse_context p;
1086f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	boolean ret = FALSE;
1087f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	unsigned i, c;
1088f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1089f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_init(&p, pc->p->pipe.tokens);
1090f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	while (!tgsi_parse_end_of_tokens(&p)) {
1091f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		const union tgsi_full_token *tok = &p.FullToken;
1092f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1093f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		tgsi_parse_token(&p);
1094f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		switch (tok->Token.Type) {
1095f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_IMMEDIATE:
1096f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		{
1097f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			const struct tgsi_full_immediate *imm =
1098f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				&p.FullToken.FullImmediate;
1099f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
110033e4d30d50344be26398a51365bea1be37487403Ben Skeggs			ctor_immd(pc, imm->u.ImmediateFloat32[0].Float,
110133e4d30d50344be26398a51365bea1be37487403Ben Skeggs				      imm->u.ImmediateFloat32[1].Float,
110233e4d30d50344be26398a51365bea1be37487403Ben Skeggs				      imm->u.ImmediateFloat32[2].Float,
110333e4d30d50344be26398a51365bea1be37487403Ben Skeggs				      imm->u.ImmediateFloat32[3].Float);
1104f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1105f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1106f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_DECLARATION:
1107f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		{
1108f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			const struct tgsi_full_declaration *d;
1109f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			unsigned last;
1110f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1111f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			d = &p.FullToken.FullDeclaration;
1112f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			last = d->u.DeclarationRange.Last;
1113f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1114f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			switch (d->Declaration.File) {
1115f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_TEMPORARY:
1116f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->temp_nr < (last + 1))
1117f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->temp_nr = last + 1;
1118f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
1119f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_OUTPUT:
1120f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->result_nr < (last + 1))
1121f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->result_nr = last + 1;
1122f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
1123f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_INPUT:
1124f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->attr_nr < (last + 1))
1125f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->attr_nr = last + 1;
1126f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
1127f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_CONSTANT:
1128f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->param_nr < (last + 1))
1129f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->param_nr = last + 1;
1130f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
1131f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			default:
1132f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				NOUVEAU_ERR("bad decl file %d\n",
1133f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					    d->Declaration.File);
1134f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				goto out_err;
1135f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1136f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1137f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1138f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_INSTRUCTION:
1139f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1140f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		default:
1141f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1142f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1143f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1144f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1145f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	NOUVEAU_ERR("%d temps\n", pc->temp_nr);
1146f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->temp_nr) {
1147f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->temp = calloc(pc->temp_nr * 4, sizeof(struct nv50_reg));
1148f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->temp)
1149f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1150f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1151f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->temp_nr; i++) {
1152f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1153f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->temp[i*4+c].type = P_TEMP;
1154f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->temp[i*4+c].hw = -1;
1155f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->temp[i*4+c].index = i;
1156f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1157f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1158f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1159f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1160f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	NOUVEAU_ERR("%d attrib regs\n", pc->attr_nr);
1161f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->attr_nr) {
11628ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		struct nv50_reg *iv = NULL, *tmp = NULL;
1163f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		int aid = 0;
1164f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1165f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->attr = calloc(pc->attr_nr * 4, sizeof(struct nv50_reg));
1166f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->attr)
1167f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1168f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1169b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs		if (pc->p->type == PIPE_SHADER_FRAGMENT) {
11708ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			iv = alloc_temp(pc, NULL);
11718ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			aid++;
11728ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		}
11738ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
1174f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->attr_nr; i++) {
11758ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			struct nv50_reg *a = &pc->attr[i*4];
11768ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
1177f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1178b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs				if (pc->p->type == PIPE_SHADER_FRAGMENT) {
11798ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					struct nv50_reg *at =
11808ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs						alloc_temp(pc, NULL);
11818ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].type = at->type;
11828ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].hw = at->hw;
11838ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].index = at->index;
11848ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				} else {
11858ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->p->cfg.vp.attr[aid/32] |=
11868ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs						(1 << (aid % 32));
11878ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].type = P_ATTR;
11888ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].hw = aid++;
11898ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].index = i;
11908ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				}
1191f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
11928ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
1193b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs			if (pc->p->type != PIPE_SHADER_FRAGMENT)
11948ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				continue;
11958ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
11968ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			emit_interp(pc, iv, iv, iv, FALSE);
11978ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			tmp = alloc_temp(pc, NULL);
1198713ef6ccd2590bd866598bb6d4f646e9ec29ba78Ben Skeggs			emit_flop(pc, 0, tmp, iv);
11998ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			emit_interp(pc, &a[0], &a[0], tmp, TRUE);
12008ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			emit_interp(pc, &a[1], &a[1], tmp, TRUE);
12018ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			emit_interp(pc, &a[2], &a[2], tmp, TRUE);
12028ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			emit_interp(pc, &a[3], &a[3], tmp, TRUE);
12038ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			free_temp(pc, tmp);
1204f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
12058ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
12068ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		if (iv)
12078ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			free_temp(pc, iv);
1208f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1209f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1210f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	NOUVEAU_ERR("%d result regs\n", pc->result_nr);
1211f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->result_nr) {
1212f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		int rid = 0;
1213f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1214f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->result = calloc(pc->result_nr * 4, sizeof(struct nv50_reg));
1215f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->result)
1216f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1217f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1218f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->result_nr; i++) {
1219f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1220b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs				if (pc->p->type == PIPE_SHADER_FRAGMENT) {
12218ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->result[i*4+c].type = P_TEMP;
1222776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs					pc->result[i*4+c].hw = -1;
1223776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs				} else {
12248ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->result[i*4+c].type = P_RESULT;
1225776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs					pc->result[i*4+c].hw = rid++;
1226776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs				}
1227f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->result[i*4+c].index = i;
1228f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1229f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1230f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1231f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1232f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	NOUVEAU_ERR("%d param regs\n", pc->param_nr);
1233f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->param_nr) {
1234f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		int rid = 0;
1235f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1236f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->param = calloc(pc->param_nr * 4, sizeof(struct nv50_reg));
1237f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->param)
1238f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1239f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1240f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->param_nr; i++) {
1241f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1242f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->param[i*4+c].type = P_CONST;
1243f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->param[i*4+c].hw = rid++;
1244f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->param[i*4+c].index = i;
1245f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1246f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1247f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1248f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1249f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->immd_nr) {
1250716c1cd2ecbc1e86c0fd747c9fa9e095ded5fd5dBen Skeggs		int rid = 0;
1251f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1252f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->immd = calloc(pc->immd_nr * 4, sizeof(struct nv50_reg));
1253f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->immd)
1254f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1255f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1256f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->immd_nr; i++) {
1257f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1258f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->immd[i*4+c].type = P_IMMD;
1259f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->immd[i*4+c].hw = rid++;
1260f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->immd[i*4+c].index = i;
1261f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1262f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1263f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1264f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1265f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	ret = TRUE;
1266f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsout_err:
1267f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_free(&p);
1268f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return ret;
1269f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1270f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1271f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic boolean
1272f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_tx(struct nv50_program *p)
1273f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1274f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct tgsi_parse_context parse;
1275f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_pc *pc;
1276f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	boolean ret;
1277f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1278f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	pc = CALLOC_STRUCT(nv50_pc);
1279f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (!pc)
1280f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return FALSE;
1281f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	pc->p = p;
12828ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	pc->p->cfg.high_temp = 4;
1283f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1284f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	ret = nv50_program_tx_prep(pc);
1285f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (ret == FALSE)
1286f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		goto out_cleanup;
1287f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1288f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_init(&parse, pc->p->pipe.tokens);
1289f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	while (!tgsi_parse_end_of_tokens(&parse)) {
1290f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		const union tgsi_full_token *tok = &parse.FullToken;
1291f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1292f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		tgsi_parse_token(&parse);
1293f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1294f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		switch (tok->Token.Type) {
1295f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_INSTRUCTION:
1296f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			ret = nv50_program_tx_insn(pc, tok);
1297f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			if (ret == FALSE)
1298f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				goto out_err;
1299f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1300f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		default:
1301f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1302f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1303f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1304f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1305b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs	if (p->type == PIPE_SHADER_FRAGMENT) {
1306776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs		struct nv50_reg out;
1307776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs
1308776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs		out.type = P_TEMP;
1309776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs		for (out.hw = 0; out.hw < pc->result_nr * 4; out.hw++)
1310776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs			emit_mov(pc, &out, &pc->result[out.hw]);
1311776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs	}
1312776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs
1313f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->immd_nr = pc->immd_nr * 4;
1314f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->immd = pc->immd_buf;
1315f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1316f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsout_err:
1317f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_free(&parse);
1318f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1319f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsout_cleanup:
1320f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return ret;
1321f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1322f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1323f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic void
1324f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_validate(struct nv50_context *nv50, struct nv50_program *p)
1325f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1326e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	int i;
1327e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs
1328e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	if (nv50_program_tx(p) == FALSE)
1329e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs		assert(0);
1330e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	/* *not* sufficient, it's fine if last inst is long and
1331e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	 * NOT immd - otherwise it's fucked fucked fucked */
1332e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	p->insns[p->insns_nr - 1] |= 0x00000001;
1333f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1334b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs	if (p->type == PIPE_SHADER_VERTEX) {
13352a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	for (i = 0; i < p->insns_nr; i++)
13362a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		NOUVEAU_ERR("VP0x%08x\n", p->insns[i]);
13372a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else {
1338e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	for (i = 0; i < p->insns_nr; i++)
13392a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		NOUVEAU_ERR("FP0x%08x\n", p->insns[i]);
13402a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
1341f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1342f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->translated = TRUE;
1343f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1344f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
134522e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsstatic void
134622e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsnv50_program_validate_data(struct nv50_context *nv50, struct nv50_program *p)
134722e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs{
134822e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	int i;
134922e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
135022e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	for (i = 0; i < p->immd_nr; i++) {
135122e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs		BEGIN_RING(tesla, 0x0f00, 2);
135222e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs		OUT_RING  ((NV50_CB_PMISC << 16) | (i << 8));
135322e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs		OUT_RING  (fui(p->immd[i]));
135422e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	}
135522e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs}
135622e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
135722e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsstatic void
135822e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsnv50_program_validate_code(struct nv50_context *nv50, struct nv50_program *p)
135922e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs{
136022e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	struct pipe_winsys *ws = nv50->pipe.winsys;
136122e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	void *map;
136222e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
136322e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	if (!p->buffer)
136422e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs		p->buffer = ws->buffer_create(ws, 0x100, 0, p->insns_nr * 4);
136522e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	map = ws->buffer_map(ws, p->buffer, PIPE_BUFFER_USAGE_CPU_WRITE);
136622e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	memcpy(map, p->insns, p->insns_nr * 4);
136722e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	ws->buffer_unmap(ws, p->buffer);
136822e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs}
136922e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
1370f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsvoid
1371f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_vertprog_validate(struct nv50_context *nv50)
1372f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1373f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_grobj *tesla = nv50->screen->tesla;
1374f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_program *p = nv50->vertprog;
1375f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_stateobj *so;
1376f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1377f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (!p->translated) {
1378f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		nv50_program_validate(nv50, p);
1379f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!p->translated)
1380f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			assert(0);
1381f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1382f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
138322e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	nv50_program_validate_data(nv50, p);
138422e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	nv50_program_validate_code(nv50, p);
1385f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1386f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so = so_new(11, 2);
1387f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, NV50TCL_VP_ADDRESS_HIGH, 2);
1388f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1389f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_HIGH, 0, 0);
1390f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1391f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_LOW, 0, 0);
1392f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, 0x1650, 2);
1393f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, p->cfg.vp.attr[0]);
1394f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, p->cfg.vp.attr[1]);
1395f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, 0x16ac, 2);
1396f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, 8);
13978ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_data  (so, p->cfg.high_temp);
1398f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, 0x140c, 1);
1399f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, 0); /* program start offset */
1400f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_emit(nv50->screen->nvws, so);
1401f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_ref(NULL, &so);
1402f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1403f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1404f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsvoid
1405f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_fragprog_validate(struct nv50_context *nv50)
1406f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1407f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_grobj *tesla = nv50->screen->tesla;
1408f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_program *p = nv50->fragprog;
1409f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_stateobj *so;
1410f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1411f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (!p->translated) {
1412f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		nv50_program_validate(nv50, p);
1413f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!p->translated)
1414f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			assert(0);
1415f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1416f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
141755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	nv50_program_validate_data(nv50, p);
141855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	nv50_program_validate_code(nv50, p);
1419f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
14208ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so = so_new(7, 2);
1421f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, NV50TCL_FP_ADDRESS_HIGH, 2);
1422f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1423f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_HIGH, 0, 0);
1424f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1425f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_LOW, 0, 0);
14268ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_method(so, tesla, 0x198c, 1);
14278ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_data  (so, p->cfg.high_temp);
14288ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_method(so, tesla, 0x1414, 1);
14298ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_data  (so, 0); /* program start offset */
1430f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_emit(nv50->screen->nvws, so);
1431f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_ref(NULL, &so);
1432f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1433f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1434f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsvoid
1435f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_destroy(struct nv50_context *nv50, struct nv50_program *p)
1436f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1437f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct pipe_winsys *ws = nv50->pipe.winsys;
1438f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1439f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (p->insns_nr) {
1440f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (p->insns)
1441f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			FREE(p->insns);
1442f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		p->insns_nr = 0;
1443f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1444f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1445f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (p->buffer)
1446f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pipe_buffer_reference(ws, &p->buffer, NULL);
1447f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1448f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->translated = 0;
1449f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1450f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1451