nv50_program.c revision afcaeaa0e4dc3ced40621c76304a2c0c5a3ab403
1f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_context.h"
2f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_defines.h"
3f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_state.h"
4f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_inlines.h"
5f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
6f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_shader_tokens.h"
7f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "tgsi/util/tgsi_parse.h"
8f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "tgsi/util/tgsi_util.h"
9f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
10f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "nv50_context.h"
11f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "nv50_state.h"
12f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
13f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#define NV50_SU_MAX_TEMP 64
14f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
/* TODO / known issues:
 *
 * ARL - gallium fails on progs/vp/arl.txt
 *
 * MSB - Like MAD, but MUL+SUB
 * 	- Drop it as a separate op; instead introduce a way to negate args
 * 	  for ops that support it.
 *
 * Look into inlining IMMD for ops other than MOV (make it general?)
 * 	- Maybe even relax restrictions a bit: can't do P_RESULT + P_IMMD,
 * 	  but can emit to P_TEMP first, then MOV later. NVIDIA does this.
 *
 * What happens if src1 and src2 are both consts? Needs handling.
 *
 * Verify half-insns work where expected, and force-disable them where they
 * don't work. MUL has them forcibly disabled at the moment as that fixes POW.
 *
 * Watch out for dst == src vectors: an op can overwrite components that
 * are still needed by later components of the same op,
 * 	e.g. SUB R0, R0.yzxw, R0
 */
/*
 * One shader register as seen by the assembler in this file.
 */
struct nv50_reg {
	/* Register file the register belongs to. */
	enum {
		P_TEMP,		/* hardware temporary, allocated by alloc_reg() */
		P_ATTR,		/* shader input */
		P_RESULT,	/* shader output */
		P_CONST,	/* constant buffer entry */
		P_IMMD		/* immediate stored in nv50_pc::immd_buf */
	} type;

	/* -1 for registers created by alloc_temp()/alloc_immd(); other
	 * values are assigned outside this part of the file (presumably the
	 * TGSI register index - confirm against the caller). */
	int index;

	/* For P_TEMP: hardware temp slot, or -1 while unassigned.
	 * For P_IMMD: element offset into nv50_pc::immd_buf. */
	int hw;

	/* NOTE(review): presumably a "negate this operand" flag; not used
	 * in the code visible here - confirm. */
	int neg;
};
46f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
47f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstruct nv50_pc {
48f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_program *p;
49f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
50f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	/* hw resources */
51f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *r_temp[NV50_SU_MAX_TEMP];
52f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
53f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	/* tgsi resources */
54f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *temp;
55f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int temp_nr;
56f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *attr;
57f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int attr_nr;
58f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *result;
59f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int result_nr;
60f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *param;
61f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int param_nr;
62f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *immd;
63f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	float *immd_buf;
64f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int immd_nr;
652a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
6652a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	struct nv50_reg *temp_temp[8];
672a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	unsigned temp_temp_nr;
68f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs};
69f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
70f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic void
71f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsalloc_reg(struct nv50_pc *pc, struct nv50_reg *reg)
72f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
73f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int i;
74f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
758ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	if (reg->type != P_TEMP)
76f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return;
77f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
788ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	if (reg->hw >= 0) {
798ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		/*XXX: do this here too to catch FP temp-as-attr usage..
808ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		 *     not clean, but works */
818ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		if (pc->p->cfg.high_temp < (reg->hw + 1))
828ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			pc->p->cfg.high_temp = reg->hw + 1;
838ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		return;
848ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	}
858ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
86f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (i = 0; i < NV50_SU_MAX_TEMP; i++) {
87f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!(pc->r_temp[i])) {
88f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			pc->r_temp[i] = reg;
89f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			reg->hw = i;
908ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			if (pc->p->cfg.high_temp < (i + 1))
918ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				pc->p->cfg.high_temp = i + 1;
92f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			return;
93f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
94f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
95f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
96f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	assert(0);
97f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
98f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
99f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic struct nv50_reg *
100f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsalloc_temp(struct nv50_pc *pc, struct nv50_reg *dst)
101f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
102f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *r;
103f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int i;
104f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
105f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (dst && dst->type == P_TEMP && dst->hw == -1)
106f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return dst;
107f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
108f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (i = 0; i < NV50_SU_MAX_TEMP; i++) {
109f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->r_temp[i]) {
110f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r = CALLOC_STRUCT(nv50_reg);
111f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r->type = P_TEMP;
112f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r->index = -1;
113f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r->hw = i;
114f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			pc->r_temp[i] = r;
115f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			return r;
116f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
117f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
118f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
119f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	assert(0);
120f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return NULL;
121f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
122f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
123f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic void
124f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsfree_temp(struct nv50_pc *pc, struct nv50_reg *r)
125f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
126f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (r->index == -1) {
127f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		FREE(pc->r_temp[r->hw]);
128f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->r_temp[r->hw] = NULL;
129f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
130f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
131f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
132f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic struct nv50_reg *
1332a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggstemp_temp(struct nv50_pc *pc)
1342a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
13552a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	if (pc->temp_temp_nr >= 8)
1362a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		assert(0);
1372a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
1382a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	pc->temp_temp[pc->temp_temp_nr] = alloc_temp(pc, NULL);
1392a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	return pc->temp_temp[pc->temp_temp_nr++];
1402a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
1412a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
1422a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
1432a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggskill_temp_temp(struct nv50_pc *pc)
1442a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
1452a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	int i;
1462a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
1472a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	for (i = 0; i < pc->temp_temp_nr; i++)
1482a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		free_temp(pc, pc->temp_temp[i]);
1492a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	pc->temp_temp_nr = 0;
1502a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
1512a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
15233e4d30d50344be26398a51365bea1be37487403Ben Skeggsstatic int
15333e4d30d50344be26398a51365bea1be37487403Ben Skeggsctor_immd(struct nv50_pc *pc, float x, float y, float z, float w)
15433e4d30d50344be26398a51365bea1be37487403Ben Skeggs{
15533e4d30d50344be26398a51365bea1be37487403Ben Skeggs	pc->immd_buf = realloc(pc->immd_buf, (pc->immd_nr + 1) * 4 *
15633e4d30d50344be26398a51365bea1be37487403Ben Skeggs					     sizeof(float));
15733e4d30d50344be26398a51365bea1be37487403Ben Skeggs	pc->immd_buf[(pc->immd_nr * 4) + 0] = x;
158686bc00c05094e8678747c111a6a70ad4b7063e3Ben Skeggs	pc->immd_buf[(pc->immd_nr * 4) + 1] = y;
159686bc00c05094e8678747c111a6a70ad4b7063e3Ben Skeggs	pc->immd_buf[(pc->immd_nr * 4) + 2] = z;
160686bc00c05094e8678747c111a6a70ad4b7063e3Ben Skeggs	pc->immd_buf[(pc->immd_nr * 4) + 3] = w;
16133e4d30d50344be26398a51365bea1be37487403Ben Skeggs
16233e4d30d50344be26398a51365bea1be37487403Ben Skeggs	return pc->immd_nr++;
16333e4d30d50344be26398a51365bea1be37487403Ben Skeggs}
16433e4d30d50344be26398a51365bea1be37487403Ben Skeggs
16533e4d30d50344be26398a51365bea1be37487403Ben Skeggsstatic struct nv50_reg *
16633e4d30d50344be26398a51365bea1be37487403Ben Skeggsalloc_immd(struct nv50_pc *pc, float f)
16733e4d30d50344be26398a51365bea1be37487403Ben Skeggs{
16833e4d30d50344be26398a51365bea1be37487403Ben Skeggs	struct nv50_reg *r = CALLOC_STRUCT(nv50_reg);
16933e4d30d50344be26398a51365bea1be37487403Ben Skeggs	unsigned hw;
17033e4d30d50344be26398a51365bea1be37487403Ben Skeggs
17101e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	hw = ctor_immd(pc, f, 0, 0, 0) * 4;
17233e4d30d50344be26398a51365bea1be37487403Ben Skeggs	r->type = P_IMMD;
17333e4d30d50344be26398a51365bea1be37487403Ben Skeggs	r->hw = hw;
17433e4d30d50344be26398a51365bea1be37487403Ben Skeggs	r->index = -1;
17533e4d30d50344be26398a51365bea1be37487403Ben Skeggs	return r;
17633e4d30d50344be26398a51365bea1be37487403Ben Skeggs}
17733e4d30d50344be26398a51365bea1be37487403Ben Skeggs
17855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic void
17955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsemit(struct nv50_pc *pc, unsigned *inst)
18055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
18155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	struct nv50_program *p = pc->p;
18255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
183bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (inst[0] & 1) {
184bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		p->insns_nr += 2;
185bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		p->insns = realloc(p->insns, sizeof(unsigned) * p->insns_nr);
186bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		memcpy(p->insns + (p->insns_nr - 2), inst, sizeof(unsigned)*2);
187bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	} else {
188bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		p->insns_nr += 1;
189bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		p->insns = realloc(p->insns, sizeof(unsigned) * p->insns_nr);
190bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		memcpy(p->insns + (p->insns_nr - 1), inst, sizeof(unsigned));
191bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	}
19255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
19355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
19455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void set_long(struct nv50_pc *, unsigned *);
19555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
19655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic boolean
19755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsis_long(unsigned *inst)
19855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
19955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (inst[0] & 1)
20055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		return TRUE;
20155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	return FALSE;
20255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
20355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
20455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic boolean
20555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsis_immd(unsigned *inst)
20655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
20755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (is_long(inst) && (inst[1] & 3) == 3)
20855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		return TRUE;
20955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	return FALSE;
21055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
21155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
21255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
21355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsset_pred(struct nv50_pc *pc, unsigned pred, unsigned idx, unsigned *inst)
21455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
21555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_long(pc, inst);
21655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] &= ~((0x1f << 7) | (0x3 << 12));
21755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] |= (pred << 7) | (idx << 12);
21855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
21955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
22055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
22155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsset_pred_wr(struct nv50_pc *pc, unsigned on, unsigned idx, unsigned *inst)
22255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
22355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_long(pc, inst);
22455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] &= ~((0x3 << 4) | (1 << 6));
22555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] |= (idx << 4) | (on << 6);
22655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
22755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
22855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
22955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsset_long(struct nv50_pc *pc, unsigned *inst)
23055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
23155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (is_long(inst))
23255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		return;
23355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
23455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[0] |= 1;
23555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_pred(pc, 0xf, 0, inst);
23655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_pred_wr(pc, 0, 0, inst);
23755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
23855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
23955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
24055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsset_dst(struct nv50_pc *pc, struct nv50_reg *dst, unsigned *inst)
24155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
24255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (dst->type == P_RESULT) {
24355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		set_long(pc, inst);
24455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[1] |= 0x00000008;
24555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	}
24655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
24755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	alloc_reg(pc, dst);
24855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[0] |= (dst->hw << 2);
24955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
25055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
25155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
25255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsset_immd(struct nv50_pc *pc, struct nv50_reg *imm, unsigned *inst)
25355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
25455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	unsigned val = fui(pc->immd_buf[imm->hw]); /* XXX */
25555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
25655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_long(pc, inst);
25755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	/*XXX: can't be predicated - bits overlap.. catch cases where both
25855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	 *     are required and avoid them. */
25955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_pred(pc, 0, 0, inst);
26055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_pred_wr(pc, 0, 0, inst);
26155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
26255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] |= 0x00000002 | 0x00000001;
26355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[0] |= (val & 0x3f) << 16;
26455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] |= (val >> 6) << 2;
26555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
26655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
26755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic void
2688ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggsemit_interp(struct nv50_pc *pc, struct nv50_reg *dst,
2698ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	    struct nv50_reg *src, struct nv50_reg *iv, boolean noperspective)
2708ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs{
2718ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	unsigned inst[2] = { 0, 0 };
2728ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
2738ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	inst[0] |= 0x80000000;
2748ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	set_dst(pc, dst, inst);
2758ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	alloc_reg(pc, iv);
2768ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	inst[0] |= (iv->hw << 9);
2778ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	alloc_reg(pc, src);
2788ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	inst[0] |= (src->hw << 16);
2798ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	if (noperspective)
2808ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		inst[0] |= (1 << 25);
2818ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
2828ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	emit(pc, inst);
2838ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs}
2848ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
2858ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggsstatic void
2862a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsset_cseg(struct nv50_pc *pc, struct nv50_reg *src, unsigned *inst)
2872a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
2882a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	set_long(pc, inst);
2892a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_IMMD) {
2902a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		inst[1] |= (NV50_CB_PMISC << 22);
2912a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else {
2922a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		if (pc->p->type == NV50_PROG_VERTEX)
2932a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			inst[1] |= (NV50_CB_PVP << 22);
2942a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		else
2952a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			inst[1] |= (NV50_CB_PFP << 22);
2962a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
2972a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
2982a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
2992a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
30055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsemit_mov(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
30155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
30255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	unsigned inst[2] = { 0, 0 };
30355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
30455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[0] |= 0x10000000;
30555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
30655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_dst(pc, dst, inst);
30755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
30855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (dst->type != P_RESULT && src->type == P_IMMD) {
30955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		set_immd(pc, src, inst);
31055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		/*XXX: 32-bit, but steals part of "half" reg space - need to
31155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		 *     catch and handle this case if/when we do half-regs
31255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		 */
31355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[0] |= 0x00008000;
31455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	} else
31555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (src->type == P_IMMD || src->type == P_CONST) {
31655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		set_long(pc, inst);
3172a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		set_cseg(pc, src, inst);
31855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[0] |= (src->hw << 9);
31955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[1] |= 0x20000000; /* src0 const? */
32055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	} else {
32155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		if (src->type == P_ATTR) {
32255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs			set_long(pc, inst);
32355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs			inst[1] |= 0x00200000;
32455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		}
32555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
32655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		alloc_reg(pc, src);
32755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[0] |= (src->hw << 9);
32855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	}
32955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
33055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	/* We really should support "half" instructions here at some point,
33155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	 * but I don't feel confident enough about them yet.
33255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	 */
33355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_long(pc, inst);
33455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (is_long(inst) && !is_immd(inst)) {
33555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[1] |= 0x04000000; /* 32-bit */
33655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[1] |= 0x0003c000; /* "subsubop" 0xf == mov */
33755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	}
33855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
33955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	emit(pc, inst);
34055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
34155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
342f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic boolean
3432a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggscheck_swap_src_0_1(struct nv50_pc *pc,
3442a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		   struct nv50_reg **s0, struct nv50_reg **s1)
3452a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
3462a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	struct nv50_reg *src0 = *s0, *src1 = *s1;
3472a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3482a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src0->type == P_CONST) {
3492a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		if (src1->type != P_CONST) {
3502a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s0 = src1;
3512a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s1 = src0;
3522a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			return TRUE;
3532a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		}
3542a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
3552a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src1->type == P_ATTR) {
3562a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		if (src0->type != P_ATTR) {
3572a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s0 = src1;
3582a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s1 = src0;
3592a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			return TRUE;
3602a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		}
3612a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
3622a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3632a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	return FALSE;
3642a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
3652a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3662a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
3672a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsset_src_0(struct nv50_pc *pc, struct nv50_reg *src, unsigned *inst)
3682a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
3692a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_ATTR) {
3702a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		set_long(pc, inst);
3712a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		inst[1] |= 0x00200000;
3722a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
3732a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_CONST || src->type == P_IMMD) {
3742a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		struct nv50_reg *temp = temp_temp(pc);
3752a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3762a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mov(pc, temp, src);
3772a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		src = temp;
3782a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
3792a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3802a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	alloc_reg(pc, src);
3812a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	inst[0] |= (src->hw << 9);
3822a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
3832a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3842a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
3852a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsset_src_1(struct nv50_pc *pc, struct nv50_reg *src, unsigned *inst)
3862a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
3872a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_ATTR) {
3882a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		struct nv50_reg *temp = temp_temp(pc);
3892a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3902a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mov(pc, temp, src);
3912a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		src = temp;
3922a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
3932a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_CONST || src->type == P_IMMD) {
3942a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		set_cseg(pc, src, inst);
3952a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		inst[0] |= 0x00800000;
3962a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
3972a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3982a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	alloc_reg(pc, src);
3992a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	inst[0] |= (src->hw << 16);
4002a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
4012a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4022a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
4032a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsset_src_2(struct nv50_pc *pc, struct nv50_reg *src, unsigned *inst)
4042a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
4052a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	set_long(pc, inst);
4062a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4072a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_ATTR) {
4082a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		struct nv50_reg *temp = temp_temp(pc);
4092a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4102a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mov(pc, temp, src);
4112a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		src = temp;
4122a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
4132a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_CONST || src->type == P_IMMD) {
4142a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		set_cseg(pc, src, inst);
4152a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		inst[0] |= 0x01000000;
4162a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
4172a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4182a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	alloc_reg(pc, src);
4192a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	inst[1] |= (src->hw << 14);
4202a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
4212a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/*
 * Emit dst = src0 * src1 (opcode bits 0xc0000000).
 *
 * The long encoding is forced for MUL; per the notes at the top of the
 * file, half instructions are disabled here because that fixes POW.  The
 * operands may be exchanged by check_swap_src_0_1() before encoding.
 */
static void
emit_mul(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
	 struct nv50_reg *src1)
{
	unsigned inst[2] = { 0xc0000000, 0 };

	set_long(pc, inst);

	check_swap_src_0_1(pc, &src0, &src1);

	set_dst(pc, dst, inst);
	set_src_0(pc, src0, inst);
	set_src_1(pc, src1, inst);

	emit(pc, inst);
}
4382a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/*
 * Emit an add: dst = src0 + src1.
 *
 * Unlike the other arithmetic emitters this one does not force the long
 * encoding up front; it asks is_long() after dst/src0 have been encoded
 * and picks the slot for the second operand accordingly.
 */
static void
emit_add(struct nv50_pc *pc, struct nv50_reg *dst,
	 struct nv50_reg *src0, struct nv50_reg *src1)
{
	unsigned code[2] = { 0xb0000000, 0 };	/* opcode bits for add */

	check_swap_src_0_1(pc, &src0, &src1);
	set_dst(pc, dst, code);
	set_src_0(pc, src0, code);

	/* short form takes the operand in slot 1, long form in slot 2 */
	if (!is_long(code))
		set_src_1(pc, src1, code);
	else
		set_src_2(pc, src1, code);

	emit(pc, code);
}
45752a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs
/*
 * Emit a min/max style instruction selected by 'sub'.
 *
 * 'sub' is placed in the top three bits of the second instruction word.
 * emit_lit() in this file uses sub 4 to clamp from below and sub 5 to
 * clamp from above, so 4 is presumably max and 5 presumably min.
 */
static void
emit_minmax(struct nv50_pc *pc, unsigned sub, struct nv50_reg *dst,
	    struct nv50_reg *src0, struct nv50_reg *src1)
{
	unsigned code[2] = { 0, 0 };

	/* always a long instruction; opcode bits are ORed in afterwards */
	set_long(pc, code);
	code[0] |= 0xb0000000;
	code[1] |= sub << 29;

	check_swap_src_0_1(pc, &src0, &src1);
	set_dst(pc, dst, code);
	set_src_0(pc, src0, code);
	set_src_1(pc, src1, code);

	emit(pc, code);
}
4752a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/*
 * Emit a subtract: dst = src0 - src1.
 *
 * This reuses the add opcode with one of two modifier bits set in the
 * second word. Which bit is chosen depends on whether
 * check_swap_src_0_1() exchanged the operands: 0x04000000 when it did,
 * 0x08000000 when it did not (presumably "negate slot 0" and "negate
 * slot 2" respectively, so the result stays src0 - src1 either way).
 */
static void
emit_sub(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
	 struct nv50_reg *src1)
{
	unsigned code[2] = { 0xb0000000, 0 };
	unsigned neg_bit;

	set_long(pc, code);

	neg_bit = check_swap_src_0_1(pc, &src0, &src1) ? 0x04000000
						       : 0x08000000;
	code[1] |= neg_bit;

	set_dst(pc, dst, code);
	set_src_0(pc, src0, code);
	/* the second operand always goes in source slot 2 here */
	set_src_2(pc, src1, code);

	emit(pc, code);
}
4962a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/*
 * Emit a multiply-add: dst = src0 * src1 + src2.
 *
 * Only the two multiplicands are candidates for swapping; src2 always
 * lands in source slot 2.
 */
static void
emit_mad(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
	 struct nv50_reg *src1, struct nv50_reg *src2)
{
	unsigned code[2] = { 0xe0000000, 0 };	/* opcode bits for mad */

	check_swap_src_0_1(pc, &src0, &src1);
	set_dst(pc, dst, code);
	set_src_0(pc, src0, code);
	set_src_1(pc, src1, code);
	set_src_2(pc, src2, code);

	emit(pc, code);
}
5132a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/*
 * Emit a multiply-subtract: dst = src0 * src1 - src2.
 *
 * Same opcode as emit_mad(), forced long, with modifier bit 0x08000000
 * set in the second word to turn the add into a subtract.
 */
static void
emit_msb(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
	 struct nv50_reg *src1, struct nv50_reg *src2)
{
	unsigned code[2] = { 0xe0000000, 0 };

	set_long(pc, code);
	code[1] |= 0x08000000;	/* src0 * src1 - src2 */

	check_swap_src_0_1(pc, &src0, &src1);
	set_dst(pc, dst, code);
	set_src_0(pc, src0, code);
	set_src_1(pc, src1, code);
	set_src_2(pc, src2, code);

	emit(pc, code);
}
53221e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs
/*
 * Emit a single-operand "flop" instruction selected by 'sub'.
 *
 * sub == 0 keeps the instruction in whatever form the operand encoders
 * leave it; any other value forces the long form and stores 'sub' in the
 * top three bits of the second word. Callers in this file pass 5 for
 * COS, 6 for EX2 and 3 inside emit_pow().
 */
static void
emit_flop(struct nv50_pc *pc, unsigned sub,
	  struct nv50_reg *dst, struct nv50_reg *src)
{
	unsigned code[2] = { 0x90000000, 0 };

	if (sub != 0) {
		set_long(pc, code);
		code[1] |= sub << 29;
	}

	set_dst(pc, dst, code);
	set_src_0(pc, src, code);

	emit(pc, code);
}
5502a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/*
 * Emit the "pre-ex2" instruction: the step run on the operand before the
 * ex2 flop (the EX2 opcode handler and emit_pow() both issue this
 * immediately before emit_flop(pc, 6, ...)).
 *
 * pc:  program being built
 * dst: destination register
 * src: source register
 */
static void
emit_preex2(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
{
	unsigned inst[2] = { 0, 0 };

	inst[0] |= 0xb0000000;

	set_dst(pc, dst, inst);
	set_src_0(pc, src, inst);
	set_long(pc, inst);
	/* 6 << 29 does not fit in a signed int; shift an unsigned literal
	 * so the expression is well defined.
	 */
	inst[1] |= (6u << 29) | 0x00004000;

	emit(pc, inst);
}
565faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs
566bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs/*XXX: inaccurate results.. why? */
567bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs#define ALLOW_SET_SWAP 0
568bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
569bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggsstatic void
570bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggsemit_set(struct nv50_pc *pc, unsigned c_op, struct nv50_reg *dst,
571bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 struct nv50_reg *src0, struct nv50_reg *src1)
572bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs{
573bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	unsigned inst[2] = { 0, 0 };
574bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs#if ALLOW_SET_SWAP
575bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	unsigned inv_cop[8] = { 0, 6, 2, 4, 3, 5, 1, 7 };
576bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs#endif
577bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	struct nv50_reg *rdst;
578bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
579bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs#if ALLOW_SET_SWAP
580bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	assert(c_op <= 7);
581bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (check_swap_src_0_1(pc, &src0, &src1))
582bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		c_op = inv_cop[c_op];
583bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs#endif
584bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
585bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	rdst = dst;
586bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (dst->type != P_TEMP)
587bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		dst = alloc_temp(pc, NULL);
588bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
589bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	/* set.u32 */
590bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_long(pc, inst);
591bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[0] |= 0xb0000000;
592bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[1] |= (3 << 29);
593bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[1] |= (c_op << 14);
594bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	/*XXX: breaks things, .u32 by default?
595bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 *     decuda will disasm as .u16 and use .lo/.hi regs, but this
596bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 *     doesn't seem to match what the hw actually does.
597bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[1] |= 0x04000000; << breaks things.. .u32 by default?
598bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 */
599bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_dst(pc, dst, inst);
600bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_src_0(pc, src0, inst);
601bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_src_1(pc, src1, inst);
602bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	emit(pc, inst);
603bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
604bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	/* cvt.f32.u32 */
605bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[0] = 0xa0000001;
606bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[1] = 0x64014780;
607bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_dst(pc, rdst, inst);
608bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_src_0(pc, dst, inst);
609bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	emit(pc, inst);
610bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
611bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (dst != rdst)
612bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		free_temp(pc, dst);
613bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs}
614d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggs
/*
 * Emit a floor: dst = floor(src), implemented with the cvt instruction.
 *
 * pc:  program being built
 * dst: destination register
 * src: source register
 */
static void
emit_flr(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
{
	unsigned inst[2] = { 0, 0 };

	inst[0] = 0xa0000000; /* cvt */
	set_long(pc, inst);
	/* 6 << 29 does not fit in a signed int; shift an unsigned literal
	 * so the expression is well defined.
	 */
	inst[1] |= (6u << 29); /* cvt */
	inst[1] |= 0x08000000; /* integer mode */
	inst[1] |= 0x04000000; /* 32 bit */
	inst[1] |= ((0x1 << 3)) << 14; /* .rn */
	inst[1] |= (1 << 14); /* src .f32 */
	set_dst(pc, dst, inst);
	set_src_0(pc, src, inst);

	emit(pc, inst);
}
632b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs
633faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggsstatic void
634faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggsemit_pow(struct nv50_pc *pc, struct nv50_reg *dst,
635faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	 struct nv50_reg *v, struct nv50_reg *e)
636faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs{
637faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	struct nv50_reg *temp = alloc_temp(pc, NULL);
638faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs
639faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	emit_flop(pc, 3, temp, v);
640faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	emit_mul(pc, temp, temp, e);
641faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	emit_preex2(pc, temp, temp);
642faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	emit_flop(pc, 6, dst, temp);
643faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs
644faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	free_temp(pc, temp);
645faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs}
646faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs
/*
 * Emit an absolute value: dst = |src|, implemented with the cvt
 * instruction and its .abs modifier.
 *
 * pc:  program being built
 * dst: destination register
 * src: source register
 */
static void
emit_abs(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
{
	unsigned inst[2] = { 0, 0 };

	inst[0] = 0xa0000000; /* cvt */
	set_long(pc, inst);
	/* 6 << 29 does not fit in a signed int; shift an unsigned literal
	 * so the expression is well defined.
	 */
	inst[1] |= (6u << 29); /* cvt */
	inst[1] |= 0x04000000; /* 32 bit */
	inst[1] |= (1 << 14); /* src .f32 */
	inst[1] |= ((1 << 6) << 14); /* .abs */
	set_dst(pc, dst, inst);
	set_src_0(pc, src, inst);

	emit(pc, inst);
}
663fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
66401e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggsstatic void
66501e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggsemit_lit(struct nv50_pc *pc, struct nv50_reg **dst, struct nv50_reg **src)
66601e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs{
66701e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	struct nv50_reg *one = alloc_immd(pc, 1.0);
66801e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	struct nv50_reg *zero = alloc_immd(pc, 0.0);
66901e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	struct nv50_reg *neg128 = alloc_immd(pc, -127.999999);
67001e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	struct nv50_reg *pos128 = alloc_immd(pc,  127.999999);
67101e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	struct nv50_reg *tmp[4];
67201e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
67301e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	emit_mov(pc, dst[0], one);
67401e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	emit_mov(pc, dst[3], one);
67501e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
67601e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	tmp[0] = temp_temp(pc);
67701e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	emit_minmax(pc, 4, dst[1], src[0], zero);
67801e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	set_pred_wr(pc, 1, 0, &pc->p->insns[pc->p->insns_nr - 2]);
67901e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
68001e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	tmp[1] = temp_temp(pc);
68101e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	emit_minmax(pc, 4, tmp[1], src[1], zero);
68201e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
68301e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	tmp[3] = temp_temp(pc);
68401e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	emit_minmax(pc, 4, tmp[3], src[3], neg128);
68501e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	emit_minmax(pc, 5, tmp[3], tmp[3], pos128);
68601e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
68701e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	emit_pow(pc, dst[2], tmp[1], tmp[3]);
68801e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	emit_mov(pc, dst[2], zero);
68901e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	set_pred(pc, 3, 0, &pc->p->insns[pc->p->insns_nr - 2]);
69001e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs}
69101e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
692fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggsstatic struct nv50_reg *
693fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggstgsi_dst(struct nv50_pc *pc, int c, const struct tgsi_full_dst_register *dst)
694fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs{
695fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	switch (dst->DstRegister.File) {
696fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_FILE_TEMPORARY:
697fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		return &pc->temp[dst->DstRegister.Index * 4 + c];
698fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_FILE_OUTPUT:
699fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		return &pc->result[dst->DstRegister.Index * 4 + c];
700fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_FILE_NULL:
701fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		return NULL;
702fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	default:
703fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
704fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	}
705fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
706fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	return NULL;
707fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs}
708fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
709fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggsstatic struct nv50_reg *
710fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggstgsi_src(struct nv50_pc *pc, int chan, const struct tgsi_full_src_register *src)
711fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs{
712fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	struct nv50_reg *r = NULL;
713fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	struct nv50_reg *temp;
714fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	unsigned c;
715fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
716fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	c = tgsi_util_get_full_src_register_extswizzle(src, chan);
717fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	switch (c) {
718fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_X:
719fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_Y:
720fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_Z:
721fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_W:
722fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		switch (src->SrcRegister.File) {
723fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		case TGSI_FILE_INPUT:
724fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			r = &pc->attr[src->SrcRegister.Index * 4 + c];
725fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			break;
726fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		case TGSI_FILE_TEMPORARY:
727fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			r = &pc->temp[src->SrcRegister.Index * 4 + c];
728fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			break;
729fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		case TGSI_FILE_CONSTANT:
730fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			r = &pc->param[src->SrcRegister.Index * 4 + c];
731fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			break;
732fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		case TGSI_FILE_IMMEDIATE:
733fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			r = &pc->immd[src->SrcRegister.Index * 4 + c];
734fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			break;
735fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		default:
736fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			assert(0);
737fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			break;
738fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		}
739fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
740fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_ZERO:
741fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		r = alloc_immd(pc, 0.0);
742fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
743fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_ONE:
744fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		r = alloc_immd(pc, 1.0);
745fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
746fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	default:
747fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		assert(0);
748fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
749fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	}
750fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
751fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	switch (tgsi_util_get_full_src_register_sign_mode(src, chan)) {
752fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_UTIL_SIGN_KEEP:
753fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
754fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_UTIL_SIGN_CLEAR:
755fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		temp = temp_temp(pc);
756fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		emit_abs(pc, temp, r);
757fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		r = temp;
758fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
759fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	default:
760fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		assert(0);
761fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
762fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	}
763fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
764fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	return r;
765fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs}
766fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
7672a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic boolean
768f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_tx_insn(struct nv50_pc *pc, const union tgsi_full_token *tok)
769f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
770f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	const struct tgsi_full_instruction *inst = &tok->FullInstruction;
771688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	struct nv50_reg *rdst[4], *dst[4], *src[3][4], *temp;
772688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	unsigned mask, sat;
773f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int i, c;
774f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
775f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	NOUVEAU_ERR("insn %p\n", tok);
776f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
777f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	mask = inst->FullDstRegisters[0].DstRegister.WriteMask;
778688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	sat = inst->Instruction.Saturate == TGSI_SAT_ZERO_ONE;
779f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
780f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (c = 0; c < 4; c++) {
781f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (mask & (1 << c))
782f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			dst[c] = tgsi_dst(pc, c, &inst->FullDstRegisters[0]);
783f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		else
784f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			dst[c] = NULL;
785f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
786f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
787f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (i = 0; i < inst->Instruction.NumSrcRegs; i++) {
788f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (c = 0; c < 4; c++)
789f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			src[i][c] = tgsi_src(pc, c, &inst->FullSrcRegisters[i]);
790f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
791f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
792688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	if (sat) {
793688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs		for (c = 0; c < 4; c++) {
794688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			rdst[c] = dst[c];
795688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			dst[c] = temp_temp(pc);
796688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs		}
797688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	}
798688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs
799f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	switch (inst->Instruction.Opcode) {
80068091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs	case TGSI_OPCODE_ABS:
80168091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs		for (c = 0; c < 4; c++) {
802fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			if (!(mask & (1 << c)))
803fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs				continue;
804fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			emit_abs(pc, dst[c], src[0][c]);
80568091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs		}
80668091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs		break;
8072a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_ADD:
8087df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8097df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8107df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
8112a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_add(pc, dst[c], src[0][c], src[1][c]);
8127df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
8132a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
8142a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_COS:
8157df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8167df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8177df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
8182a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_flop(pc, 5, dst[c], src[0][c]);
8197df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
8202a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
8212a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_DP3:
8222a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		temp = alloc_temp(pc, NULL);
8232a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mul(pc, temp, src[0][0], src[1][0]);
8242a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][1], src[1][1], temp);
8252a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][2], src[1][2], temp);
8267df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8277df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8287df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
8292a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mov(pc, dst[c], temp);
8307df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
8312a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		free_temp(pc, temp);
8322a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
8332a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_DP4:
8342a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		temp = alloc_temp(pc, NULL);
8352a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mul(pc, temp, src[0][0], src[1][0]);
8362a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][1], src[1][1], temp);
8372a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][2], src[1][2], temp);
8382a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][3], src[1][3], temp);
8397df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8407df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8417df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
8422a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mov(pc, dst[c], temp);
8437df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
8442a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		free_temp(pc, temp);
8452a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
84621e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	case TGSI_OPCODE_DPH:
84721e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		temp = alloc_temp(pc, NULL);
84821e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mul(pc, temp, src[0][0], src[1][0]);
84921e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mad(pc, temp, src[0][1], src[1][1], temp);
85021e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mad(pc, temp, src[0][2], src[1][2], temp);
85121e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_add(pc, temp, src[1][3], temp);
85221e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		for (c = 0; c < 4; c++) {
85321e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs			if (!(mask & (1 << c)))
85421e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs				continue;
85521e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs			emit_mov(pc, dst[c], temp);
85621e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		}
85721e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		free_temp(pc, temp);
85821e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		break;
85933e4d30d50344be26398a51365bea1be37487403Ben Skeggs	case TGSI_OPCODE_DST:
86033e4d30d50344be26398a51365bea1be37487403Ben Skeggs	{
86133e4d30d50344be26398a51365bea1be37487403Ben Skeggs		struct nv50_reg *one = alloc_immd(pc, 1.0);
8629a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 0))
8639a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mov(pc, dst[0], one);
8649a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 1))
8659a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mul(pc, dst[1], src[0][1], src[1][1]);
8669a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 2))
8679a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mov(pc, dst[2], src[0][2]);
8689a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 3))
8699a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mov(pc, dst[3], src[1][3]);
87033e4d30d50344be26398a51365bea1be37487403Ben Skeggs		FREE(one);
87133e4d30d50344be26398a51365bea1be37487403Ben Skeggs	}
87233e4d30d50344be26398a51365bea1be37487403Ben Skeggs		break;
8732a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_EX2:
874fbf4027dd9b279ec159906dcad134f71e34aaec8Ben Skeggs		temp = alloc_temp(pc, NULL);
8757df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8767df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8777df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
878d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggs			emit_preex2(pc, temp, src[0][c]);
879fbf4027dd9b279ec159906dcad134f71e34aaec8Ben Skeggs			emit_flop(pc, 6, dst[c], temp);
8807df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
881fbf4027dd9b279ec159906dcad134f71e34aaec8Ben Skeggs		free_temp(pc, temp);
8822a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
883b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs	case TGSI_OPCODE_FLR:
884b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		for (c = 0; c < 4; c++) {
885b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			if (!(mask & (1 << c)))
886b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs				continue;
887b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			emit_flr(pc, dst[c], src[0][c]);
888b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		}
889b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		break;
890b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs	case TGSI_OPCODE_FRC:
891b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		temp = alloc_temp(pc, NULL);
892b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		for (c = 0; c < 4; c++) {
893b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			if (!(mask & (1 << c)))
894b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs				continue;
895b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			emit_flr(pc, temp, src[0][c]);
896b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			emit_sub(pc, dst[c], src[0][c], temp);
897b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		}
898b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		free_temp(pc, temp);
899b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		break;
90001e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	case TGSI_OPCODE_LIT:
9019a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		/*XXX: writemask */
90201e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs		emit_lit(pc, &dst[0], &src[0][0]);
90301e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs		break;
9042a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_LG2:
9057df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9067df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9077df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
9082a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_flop(pc, 3, dst[c], src[0][c]);
9097df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
9102a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
9112a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_MAD:
9127df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9137df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9147df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
9152a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mad(pc, dst[c], src[0][c], src[1][c], src[2][c]);
9167df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
9172a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
91852a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	case TGSI_OPCODE_MAX:
9197df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9207df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9217df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
92252a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs			emit_minmax(pc, 4, dst[c], src[0][c], src[1][c]);
9237df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
92452a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs		break;
92552a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	case TGSI_OPCODE_MIN:
9267df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9277df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9287df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
92952a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs			emit_minmax(pc, 5, dst[c], src[0][c], src[1][c]);
9307df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
93152a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs		break;
932f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_OPCODE_MOV:
9337df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9347df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9357df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
93655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs			emit_mov(pc, dst[c], src[0][c]);
9377df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
93838ce697e5942550888c28bd4859ca2a92f247bf7Ben Skeggs		break;
9392a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_MUL:
9407df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9417df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9427df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
9432a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mul(pc, dst[c], src[0][c], src[1][c]);
9447df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
9452a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
946ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs	case TGSI_OPCODE_POW:
947ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		temp = alloc_temp(pc, NULL);
948faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs		emit_pow(pc, temp, src[0][0], src[1][0]);
949ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		for (c = 0; c < 4; c++) {
950ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs			if (!(mask & (1 << c)))
951ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs				continue;
952ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs			emit_mov(pc, dst[c], temp);
953ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		}
954ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		free_temp(pc, temp);
955ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		break;
9562a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_RCP:
9577df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9587df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9597df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
9602a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_flop(pc, 0, dst[c], src[0][c]);
9617df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
9622a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
9632a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_RSQ:
9647df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9657df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9667df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
9672a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_flop(pc, 2, dst[c], src[0][c]);
9687df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
9692a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
970bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	case TGSI_OPCODE_SGE:
971bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		for (c = 0; c < 4; c++) {
972bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			if (!(mask & (1 << c)))
973bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs				continue;
974bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			emit_set(pc, 6, dst[c], src[0][c], src[1][c]);
975bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		}
976bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		break;
9772a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_SIN:
9787df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9797df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9807df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
9812a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_flop(pc, 4, dst[c], src[0][c]);
9827df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
9832a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
984bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	case TGSI_OPCODE_SLT:
985bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		for (c = 0; c < 4; c++) {
986bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			if (!(mask & (1 << c)))
987bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs				continue;
988bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			emit_set(pc, 1, dst[c], src[0][c], src[1][c]);
989bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		}
990bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		break;
9912a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_SUB:
9927df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9937df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9947df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
9952a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_sub(pc, dst[c], src[0][c], src[1][c]);
9967df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
9972a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
99821e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	case TGSI_OPCODE_XPD:
99921e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		temp = alloc_temp(pc, NULL);
10009a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 0)) {
10019a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mul(pc, temp, src[0][2], src[1][1]);
10029a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_msb(pc, dst[0], src[0][1], src[1][2], temp);
10039a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		}
10049a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 1)) {
10059a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mul(pc, temp, src[0][0], src[1][2]);
10069a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_msb(pc, dst[1], src[0][2], src[1][0], temp);
10079a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		}
10089a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 2)) {
10099a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mul(pc, temp, src[0][1], src[1][0]);
10109a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_msb(pc, dst[2], src[0][0], src[1][1], temp);
10119a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		}
101221e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		free_temp(pc, temp);
101321e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		break;
1014f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_OPCODE_END:
1015f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		break;
1016f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	default:
1017f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		NOUVEAU_ERR("invalid opcode %d\n", inst->Instruction.Opcode);
1018f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return FALSE;
1019f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1020f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1021688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	if (sat) {
1022688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs		for (c = 0; c < 4; c++) {
1023688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			unsigned inst[2] = { 0, 0 };
1024688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs
1025688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			if (!(mask & (1 << c)))
1026688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs				continue;
1027688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs
1028688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			inst[0] = 0xa0000000; /* cvt */
1029688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			set_long(pc, inst);
1030688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			inst[1] |= (6 << 29); /* cvt */
1031688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			inst[1] |= 0x04000000; /* 32 bit */
1032688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			inst[1] |= (1 << 14); /* src .f32 */
1033688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			inst[1] |= ((1 << 5) << 14); /* .sat */
1034688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			set_dst(pc, rdst[c], inst);
1035688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			set_src_0(pc, dst[c], inst);
1036688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			emit(pc, inst);
1037688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs		}
1038688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	}
1039688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs
104052a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	kill_temp_temp(pc);
1041f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return TRUE;
1042f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1043f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1044f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic boolean
1045f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_tx_prep(struct nv50_pc *pc)
1046f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1047f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct tgsi_parse_context p;
1048f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	boolean ret = FALSE;
1049f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	unsigned i, c;
1050f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1051f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_init(&p, pc->p->pipe.tokens);
1052f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	while (!tgsi_parse_end_of_tokens(&p)) {
1053f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		const union tgsi_full_token *tok = &p.FullToken;
1054f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1055f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		tgsi_parse_token(&p);
1056f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		switch (tok->Token.Type) {
1057f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_IMMEDIATE:
1058f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		{
1059f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			const struct tgsi_full_immediate *imm =
1060f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				&p.FullToken.FullImmediate;
1061f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
106233e4d30d50344be26398a51365bea1be37487403Ben Skeggs			ctor_immd(pc, imm->u.ImmediateFloat32[0].Float,
106333e4d30d50344be26398a51365bea1be37487403Ben Skeggs				      imm->u.ImmediateFloat32[1].Float,
106433e4d30d50344be26398a51365bea1be37487403Ben Skeggs				      imm->u.ImmediateFloat32[2].Float,
106533e4d30d50344be26398a51365bea1be37487403Ben Skeggs				      imm->u.ImmediateFloat32[3].Float);
1066f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1067f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1068f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_DECLARATION:
1069f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		{
1070f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			const struct tgsi_full_declaration *d;
1071f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			unsigned last;
1072f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1073f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			d = &p.FullToken.FullDeclaration;
1074f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			last = d->u.DeclarationRange.Last;
1075f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1076f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			switch (d->Declaration.File) {
1077f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_TEMPORARY:
1078f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->temp_nr < (last + 1))
1079f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->temp_nr = last + 1;
1080f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
1081f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_OUTPUT:
1082f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->result_nr < (last + 1))
1083f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->result_nr = last + 1;
1084f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
1085f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_INPUT:
1086f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->attr_nr < (last + 1))
1087f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->attr_nr = last + 1;
1088f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
1089f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_CONSTANT:
1090f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->param_nr < (last + 1))
1091f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->param_nr = last + 1;
1092f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
1093f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			default:
1094f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				NOUVEAU_ERR("bad decl file %d\n",
1095f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					    d->Declaration.File);
1096f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				goto out_err;
1097f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1098f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1099f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1100f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_INSTRUCTION:
1101f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1102f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		default:
1103f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1104f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1105f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1106f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1107f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	NOUVEAU_ERR("%d temps\n", pc->temp_nr);
1108f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->temp_nr) {
1109f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->temp = calloc(pc->temp_nr * 4, sizeof(struct nv50_reg));
1110f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->temp)
1111f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1112f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1113f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->temp_nr; i++) {
1114f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1115f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->temp[i*4+c].type = P_TEMP;
1116f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->temp[i*4+c].hw = -1;
1117f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->temp[i*4+c].index = i;
1118f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1119f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1120f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1121f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1122f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	NOUVEAU_ERR("%d attrib regs\n", pc->attr_nr);
1123f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->attr_nr) {
11248ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		struct nv50_reg *iv = NULL, *tmp = NULL;
1125f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		int aid = 0;
1126f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1127f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->attr = calloc(pc->attr_nr * 4, sizeof(struct nv50_reg));
1128f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->attr)
1129f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1130f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
11318ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		if (pc->p->type == NV50_PROG_FRAGMENT) {
11328ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			iv = alloc_temp(pc, NULL);
11338ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			aid++;
11348ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		}
11358ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
1136f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->attr_nr; i++) {
11378ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			struct nv50_reg *a = &pc->attr[i*4];
11388ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
1139f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
11408ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				if (pc->p->type == NV50_PROG_FRAGMENT) {
11418ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					struct nv50_reg *at =
11428ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs						alloc_temp(pc, NULL);
11438ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].type = at->type;
11448ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].hw = at->hw;
11458ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].index = at->index;
11468ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				} else {
11478ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->p->cfg.vp.attr[aid/32] |=
11488ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs						(1 << (aid % 32));
11498ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].type = P_ATTR;
11508ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].hw = aid++;
11518ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].index = i;
11528ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				}
1153f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
11548ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
11558ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			if (pc->p->type != NV50_PROG_FRAGMENT)
11568ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				continue;
11578ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
11588ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			emit_interp(pc, iv, iv, iv, FALSE);
11598ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			tmp = alloc_temp(pc, NULL);
11608ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			{
11618ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				unsigned inst[2] = { 0, 0 };
11628ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				inst[0]  = 0x90000000;
11638ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				inst[0] |= (tmp->hw << 2);
11648ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				emit(pc, inst);
11658ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			}
11668ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			emit_interp(pc, &a[0], &a[0], tmp, TRUE);
11678ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			emit_interp(pc, &a[1], &a[1], tmp, TRUE);
11688ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			emit_interp(pc, &a[2], &a[2], tmp, TRUE);
11698ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			emit_interp(pc, &a[3], &a[3], tmp, TRUE);
11708ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			free_temp(pc, tmp);
1171f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
11728ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
11738ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		if (iv)
11748ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			free_temp(pc, iv);
1175f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1176f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1177f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	NOUVEAU_ERR("%d result regs\n", pc->result_nr);
1178f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->result_nr) {
1179f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		int rid = 0;
1180f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1181f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->result = calloc(pc->result_nr * 4, sizeof(struct nv50_reg));
1182f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->result)
1183f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1184f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1185f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->result_nr; i++) {
1186f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
11878ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				if (pc->p->type == NV50_PROG_FRAGMENT)
11888ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->result[i*4+c].type = P_TEMP;
11898ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				else
11908ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->result[i*4+c].type = P_RESULT;
1191f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->result[i*4+c].hw = rid++;
1192f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->result[i*4+c].index = i;
1193f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1194f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1195f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1196f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1197f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	NOUVEAU_ERR("%d param regs\n", pc->param_nr);
1198f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->param_nr) {
1199f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		int rid = 0;
1200f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1201f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->param = calloc(pc->param_nr * 4, sizeof(struct nv50_reg));
1202f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->param)
1203f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1204f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1205f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->param_nr; i++) {
1206f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1207f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->param[i*4+c].type = P_CONST;
1208f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->param[i*4+c].hw = rid++;
1209f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->param[i*4+c].index = i;
1210f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1211f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1212f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1213f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1214f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->immd_nr) {
1215716c1cd2ecbc1e86c0fd747c9fa9e095ded5fd5dBen Skeggs		int rid = 0;
1216f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1217f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->immd = calloc(pc->immd_nr * 4, sizeof(struct nv50_reg));
1218f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->immd)
1219f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1220f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1221f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->immd_nr; i++) {
1222f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1223f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->immd[i*4+c].type = P_IMMD;
1224f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->immd[i*4+c].hw = rid++;
1225f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->immd[i*4+c].index = i;
1226f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1227f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1228f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1229f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1230f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	ret = TRUE;
1231f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsout_err:
1232f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_free(&p);
1233f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return ret;
1234f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1235f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1236f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic boolean
1237f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_tx(struct nv50_program *p)
1238f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1239f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct tgsi_parse_context parse;
1240f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_pc *pc;
1241f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	boolean ret;
1242f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1243f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	pc = CALLOC_STRUCT(nv50_pc);
1244f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (!pc)
1245f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return FALSE;
1246f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	pc->p = p;
12478ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	pc->p->cfg.high_temp = 4;
1248f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1249f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	ret = nv50_program_tx_prep(pc);
1250f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (ret == FALSE)
1251f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		goto out_cleanup;
1252f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1253f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_init(&parse, pc->p->pipe.tokens);
1254f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	while (!tgsi_parse_end_of_tokens(&parse)) {
1255f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		const union tgsi_full_token *tok = &parse.FullToken;
1256f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1257f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		tgsi_parse_token(&parse);
1258f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1259f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		switch (tok->Token.Type) {
1260f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_INSTRUCTION:
1261f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			ret = nv50_program_tx_insn(pc, tok);
1262f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			if (ret == FALSE)
1263f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				goto out_err;
1264f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1265f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		default:
1266f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1267f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1268f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1269f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1270f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->immd_nr = pc->immd_nr * 4;
1271f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->immd = pc->immd_buf;
1272f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1273f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsout_err:
1274f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_free(&parse);
1275f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1276f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsout_cleanup:
1277f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return ret;
1278f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1279f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1280f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic void
1281f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_validate(struct nv50_context *nv50, struct nv50_program *p)
1282f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1283e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	int i;
1284e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs
1285e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	if (nv50_program_tx(p) == FALSE)
1286e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs		assert(0);
1287e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	/* *not* sufficient, it's fine if last inst is long and
1288e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	 * NOT immd - otherwise it's fucked fucked fucked */
1289e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	p->insns[p->insns_nr - 1] |= 0x00000001;
1290f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
12912a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (p->type == NV50_PROG_VERTEX) {
12922a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	for (i = 0; i < p->insns_nr; i++)
12932a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		NOUVEAU_ERR("VP0x%08x\n", p->insns[i]);
12942a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else {
1295e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	for (i = 0; i < p->insns_nr; i++)
12962a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		NOUVEAU_ERR("FP0x%08x\n", p->insns[i]);
12972a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
1298f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1299f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->translated = TRUE;
1300f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1301f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
130222e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsstatic void
130322e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsnv50_program_validate_data(struct nv50_context *nv50, struct nv50_program *p)
130422e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs{
130522e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	int i;
130622e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
130722e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	for (i = 0; i < p->immd_nr; i++) {
130822e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs		BEGIN_RING(tesla, 0x0f00, 2);
130922e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs		OUT_RING  ((NV50_CB_PMISC << 16) | (i << 8));
131022e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs		OUT_RING  (fui(p->immd[i]));
131122e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	}
131222e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs}
131322e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
131422e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsstatic void
131522e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsnv50_program_validate_code(struct nv50_context *nv50, struct nv50_program *p)
131622e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs{
131722e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	struct pipe_winsys *ws = nv50->pipe.winsys;
131822e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	void *map;
131922e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
132022e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	if (!p->buffer)
132122e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs		p->buffer = ws->buffer_create(ws, 0x100, 0, p->insns_nr * 4);
132222e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	map = ws->buffer_map(ws, p->buffer, PIPE_BUFFER_USAGE_CPU_WRITE);
132322e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	memcpy(map, p->insns, p->insns_nr * 4);
132422e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	ws->buffer_unmap(ws, p->buffer);
132522e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs}
132622e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
1327f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsvoid
1328f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_vertprog_validate(struct nv50_context *nv50)
1329f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1330f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_grobj *tesla = nv50->screen->tesla;
1331f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_program *p = nv50->vertprog;
1332f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_stateobj *so;
1333f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1334f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (!p->translated) {
1335f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		nv50_program_validate(nv50, p);
1336f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!p->translated)
1337f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			assert(0);
1338f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1339f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
134022e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	nv50_program_validate_data(nv50, p);
134122e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	nv50_program_validate_code(nv50, p);
1342f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1343f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so = so_new(11, 2);
1344f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, NV50TCL_VP_ADDRESS_HIGH, 2);
1345f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1346f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_HIGH, 0, 0);
1347f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1348f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_LOW, 0, 0);
1349f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, 0x1650, 2);
1350f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, p->cfg.vp.attr[0]);
1351f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, p->cfg.vp.attr[1]);
1352f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, 0x16ac, 2);
1353f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, 8);
13548ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_data  (so, p->cfg.high_temp);
1355f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, 0x140c, 1);
1356f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, 0); /* program start offset */
1357f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_emit(nv50->screen->nvws, so);
1358f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_ref(NULL, &so);
1359f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1360f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1361f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsvoid
1362f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_fragprog_validate(struct nv50_context *nv50)
1363f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1364f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_grobj *tesla = nv50->screen->tesla;
1365f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_program *p = nv50->fragprog;
1366f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_stateobj *so;
1367f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1368f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (!p->translated) {
1369f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		nv50_program_validate(nv50, p);
1370f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!p->translated)
1371f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			assert(0);
1372f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1373f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
137455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	nv50_program_validate_data(nv50, p);
137555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	nv50_program_validate_code(nv50, p);
1376f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
13778ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so = so_new(7, 2);
1378f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, NV50TCL_FP_ADDRESS_HIGH, 2);
1379f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1380f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_HIGH, 0, 0);
1381f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1382f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_LOW, 0, 0);
13838ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_method(so, tesla, 0x198c, 1);
13848ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_data  (so, p->cfg.high_temp);
13858ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_method(so, tesla, 0x1414, 1);
13868ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_data  (so, 0); /* program start offset */
1387f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_emit(nv50->screen->nvws, so);
1388f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_ref(NULL, &so);
1389f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1390f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1391f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsvoid
1392f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_destroy(struct nv50_context *nv50, struct nv50_program *p)
1393f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1394f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct pipe_winsys *ws = nv50->pipe.winsys;
1395f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1396f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (p->insns_nr) {
1397f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (p->insns)
1398f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			FREE(p->insns);
1399f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		p->insns_nr = 0;
1400f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1401f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1402f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (p->buffer)
1403f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pipe_buffer_reference(ws, &p->buffer, NULL);
1404f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1405f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->translated = 0;
1406f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1407f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1408