nv50_program.c revision b4f7463585071236d633e4c857dbbdf67b03dc94
1f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_context.h"
2f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_defines.h"
3f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_state.h"
4f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_inlines.h"
5f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
6f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_shader_tokens.h"
7f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "tgsi/util/tgsi_parse.h"
8f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "tgsi/util/tgsi_util.h"
9f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
10f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "nv50_context.h"
11f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "nv50_state.h"
12f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
13f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#define NV50_SU_MAX_TEMP 64
14f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
/* ABS
 * ARL
 * DST - const(1.0)
 * LIT
 * POW
 * SWZ
 *
 * MSB - Like MAD, but MUL+SUB
 * 	- Drop it; instead introduce a way to negate args for ops that
 * 	  support it.
 *
 * Need the ability to specify driver IMMD values, like nv40 constant()
 *
 * Look into inlining IMMD for ops other than MOV
 */
/* A single scalar register as tracked by the code generator.  The TGSI
 * lookup helpers index arrays of these with (register index * 4 + component),
 * so each entry describes one component.
 */
struct nv50_reg {
	/* Which register file the value belongs to. */
	enum {
		P_TEMP,
		P_ATTR,
		P_RESULT,
		P_CONST,
		P_IMMD
	} type;

	/* alloc_temp() stores -1 here for the scratch registers it creates;
	 * free_temp() only releases registers whose index is -1.
	 */
	int index;

	/* Hardware slot/offset encoded into instructions.  For a P_TEMP,
	 * -1 means "no slot assigned yet" (alloc_reg() then picks one).
	 * set_immd() uses it as an index into nv50_pc::immd_buf.
	 */
	int hw;

	/* NOTE(review): not referenced in the visible part of this file;
	 * presumably a "negate this source" flag - confirm against users.
	 */
	int neg;
};
43f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
44f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstruct nv50_pc {
45f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_program *p;
46f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
47f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	/* hw resources */
48f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *r_temp[NV50_SU_MAX_TEMP];
49f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
50f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	/* tgsi resources */
51f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *temp;
52f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int temp_nr;
53f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *attr;
54f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int attr_nr;
55f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *result;
56f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int result_nr;
57f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *param;
58f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int param_nr;
59f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *immd;
60f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	float *immd_buf;
61f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int immd_nr;
622a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
6352a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	struct nv50_reg *temp_temp[8];
642a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	unsigned temp_temp_nr;
65f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs};
66f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
67f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic void
68f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsalloc_reg(struct nv50_pc *pc, struct nv50_reg *reg)
69f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
70f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int i;
71f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
728ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	if (reg->type != P_TEMP)
73f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return;
74f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
758ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	if (reg->hw >= 0) {
768ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		/*XXX: do this here too to catch FP temp-as-attr usage..
778ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		 *     not clean, but works */
788ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		if (pc->p->cfg.high_temp < (reg->hw + 1))
798ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			pc->p->cfg.high_temp = reg->hw + 1;
808ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		return;
818ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	}
828ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
83f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (i = 0; i < NV50_SU_MAX_TEMP; i++) {
84f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!(pc->r_temp[i])) {
85f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			pc->r_temp[i] = reg;
86f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			reg->hw = i;
878ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			if (pc->p->cfg.high_temp < (i + 1))
888ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				pc->p->cfg.high_temp = i + 1;
89f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			return;
90f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
91f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
92f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
93f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	assert(0);
94f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
95f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
96f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic struct nv50_reg *
97f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsalloc_temp(struct nv50_pc *pc, struct nv50_reg *dst)
98f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
99f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *r;
100f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int i;
101f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
102f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (dst && dst->type == P_TEMP && dst->hw == -1)
103f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return dst;
104f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
105f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (i = 0; i < NV50_SU_MAX_TEMP; i++) {
106f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->r_temp[i]) {
107f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r = CALLOC_STRUCT(nv50_reg);
108f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r->type = P_TEMP;
109f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r->index = -1;
110f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r->hw = i;
111f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			pc->r_temp[i] = r;
112f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			return r;
113f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
114f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
115f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
116f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	assert(0);
117f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return NULL;
118f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
119f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
120f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic void
121f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsfree_temp(struct nv50_pc *pc, struct nv50_reg *r)
122f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
123f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (r->index == -1) {
124f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		FREE(pc->r_temp[r->hw]);
125f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->r_temp[r->hw] = NULL;
126f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
127f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
128f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
129f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic struct nv50_reg *
1302a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggstemp_temp(struct nv50_pc *pc)
1312a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
13252a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	if (pc->temp_temp_nr >= 8)
1332a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		assert(0);
1342a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
1352a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	pc->temp_temp[pc->temp_temp_nr] = alloc_temp(pc, NULL);
1362a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	return pc->temp_temp[pc->temp_temp_nr++];
1372a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
1382a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
1392a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
1402a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggskill_temp_temp(struct nv50_pc *pc)
1412a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
1422a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	int i;
1432a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
1442a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	for (i = 0; i < pc->temp_temp_nr; i++)
1452a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		free_temp(pc, pc->temp_temp[i]);
1462a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	pc->temp_temp_nr = 0;
1472a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
1482a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
1492a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic struct nv50_reg *
150f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggstgsi_dst(struct nv50_pc *pc, int c, const struct tgsi_full_dst_register *dst)
151f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
152f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	switch (dst->DstRegister.File) {
153f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_FILE_TEMPORARY:
154f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return &pc->temp[dst->DstRegister.Index * 4 + c];
155f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_FILE_OUTPUT:
156f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return &pc->result[dst->DstRegister.Index * 4 + c];
157f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_FILE_NULL:
158f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return NULL;
159f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	default:
160f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		break;
161f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
162f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
163f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return NULL;
164f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
165f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
166f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic struct nv50_reg *
167f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggstgsi_src(struct nv50_pc *pc, int c, const struct tgsi_full_src_register *src)
168f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
169f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	/* Handle swizzling */
170f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	switch (c) {
171f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case 0: c = src->SrcRegister.SwizzleX; break;
172f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case 1: c = src->SrcRegister.SwizzleY; break;
173f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case 2: c = src->SrcRegister.SwizzleZ; break;
174f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case 3: c = src->SrcRegister.SwizzleW; break;
175f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	default:
176f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		assert(0);
177f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
178f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
179f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	switch (src->SrcRegister.File) {
180f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_FILE_INPUT:
181f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return &pc->attr[src->SrcRegister.Index * 4 + c];
182f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_FILE_TEMPORARY:
183f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return &pc->temp[src->SrcRegister.Index * 4 + c];
184f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_FILE_CONSTANT:
185f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return &pc->param[src->SrcRegister.Index * 4 + c];
186f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_FILE_IMMEDIATE:
187f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return &pc->immd[src->SrcRegister.Index * 4 + c];
188f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	default:
189f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		break;
190f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
191f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
192f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return NULL;
193f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
194f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
19555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic void
19655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsemit(struct nv50_pc *pc, unsigned *inst)
19755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
19855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	struct nv50_program *p = pc->p;
19955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
200bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (inst[0] & 1) {
201bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		p->insns_nr += 2;
202bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		p->insns = realloc(p->insns, sizeof(unsigned) * p->insns_nr);
203bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		memcpy(p->insns + (p->insns_nr - 2), inst, sizeof(unsigned)*2);
204bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	} else {
205bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		p->insns_nr += 1;
206bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		p->insns = realloc(p->insns, sizeof(unsigned) * p->insns_nr);
207bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		memcpy(p->insns + (p->insns_nr - 1), inst, sizeof(unsigned));
208bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	}
20955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
21055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
21155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void set_long(struct nv50_pc *, unsigned *);
21255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
21355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic boolean
21455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsis_long(unsigned *inst)
21555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
21655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (inst[0] & 1)
21755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		return TRUE;
21855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	return FALSE;
21955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
22055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
22155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic boolean
22255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsis_immd(unsigned *inst)
22355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
22455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (is_long(inst) && (inst[1] & 3) == 3)
22555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		return TRUE;
22655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	return FALSE;
22755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
22855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
22955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
23055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsset_pred(struct nv50_pc *pc, unsigned pred, unsigned idx, unsigned *inst)
23155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
23255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_long(pc, inst);
23355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] &= ~((0x1f << 7) | (0x3 << 12));
23455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] |= (pred << 7) | (idx << 12);
23555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
23655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
23755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
23855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsset_pred_wr(struct nv50_pc *pc, unsigned on, unsigned idx, unsigned *inst)
23955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
24055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_long(pc, inst);
24155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] &= ~((0x3 << 4) | (1 << 6));
24255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] |= (idx << 4) | (on << 6);
24355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
24455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
24555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
24655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsset_long(struct nv50_pc *pc, unsigned *inst)
24755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
24855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (is_long(inst))
24955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		return;
25055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
25155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[0] |= 1;
25255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_pred(pc, 0xf, 0, inst);
25355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_pred_wr(pc, 0, 0, inst);
25455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
25555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
25655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
25755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsset_dst(struct nv50_pc *pc, struct nv50_reg *dst, unsigned *inst)
25855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
25955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (dst->type == P_RESULT) {
26055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		set_long(pc, inst);
26155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[1] |= 0x00000008;
26255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	}
26355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
26455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	alloc_reg(pc, dst);
26555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[0] |= (dst->hw << 2);
26655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
26755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
26855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
26955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsset_immd(struct nv50_pc *pc, struct nv50_reg *imm, unsigned *inst)
27055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
27155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	unsigned val = fui(pc->immd_buf[imm->hw]); /* XXX */
27255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
27355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_long(pc, inst);
27455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	/*XXX: can't be predicated - bits overlap.. catch cases where both
27555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	 *     are required and avoid them. */
27655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_pred(pc, 0, 0, inst);
27755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_pred_wr(pc, 0, 0, inst);
27855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
27955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] |= 0x00000002 | 0x00000001;
28055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[0] |= (val & 0x3f) << 16;
28155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] |= (val >> 6) << 2;
28255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
28355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
28455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic void
2858ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggsemit_interp(struct nv50_pc *pc, struct nv50_reg *dst,
2868ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	    struct nv50_reg *src, struct nv50_reg *iv, boolean noperspective)
2878ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs{
2888ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	unsigned inst[2] = { 0, 0 };
2898ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
2908ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	inst[0] |= 0x80000000;
2918ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	set_dst(pc, dst, inst);
2928ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	alloc_reg(pc, iv);
2938ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	inst[0] |= (iv->hw << 9);
2948ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	alloc_reg(pc, src);
2958ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	inst[0] |= (src->hw << 16);
2968ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	if (noperspective)
2978ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		inst[0] |= (1 << 25);
2988ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
2998ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	emit(pc, inst);
3008ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs}
3018ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
3028ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggsstatic void
3032a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsset_cseg(struct nv50_pc *pc, struct nv50_reg *src, unsigned *inst)
3042a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
3052a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	set_long(pc, inst);
3062a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_IMMD) {
3072a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		inst[1] |= (NV50_CB_PMISC << 22);
3082a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else {
3092a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		if (pc->p->type == NV50_PROG_VERTEX)
3102a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			inst[1] |= (NV50_CB_PVP << 22);
3112a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		else
3122a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			inst[1] |= (NV50_CB_PFP << 22);
3132a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
3142a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
3152a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3162a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
31755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsemit_mov(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
31855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
31955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	unsigned inst[2] = { 0, 0 };
32055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
32155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[0] |= 0x10000000;
32255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
32355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_dst(pc, dst, inst);
32455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
32555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (dst->type != P_RESULT && src->type == P_IMMD) {
32655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		set_immd(pc, src, inst);
32755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		/*XXX: 32-bit, but steals part of "half" reg space - need to
32855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		 *     catch and handle this case if/when we do half-regs
32955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		 */
33055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[0] |= 0x00008000;
33155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	} else
33255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (src->type == P_IMMD || src->type == P_CONST) {
33355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		set_long(pc, inst);
3342a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		set_cseg(pc, src, inst);
33555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[0] |= (src->hw << 9);
33655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[1] |= 0x20000000; /* src0 const? */
33755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	} else {
33855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		if (src->type == P_ATTR) {
33955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs			set_long(pc, inst);
34055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs			inst[1] |= 0x00200000;
34155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		}
34255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
34355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		alloc_reg(pc, src);
34455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[0] |= (src->hw << 9);
34555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	}
34655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
34755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	/* We really should support "half" instructions here at some point,
34855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	 * but I don't feel confident enough about them yet.
34955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	 */
35055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_long(pc, inst);
35155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (is_long(inst) && !is_immd(inst)) {
35255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[1] |= 0x04000000; /* 32-bit */
35355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[1] |= 0x0003c000; /* "subsubop" 0xf == mov */
35455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	}
35555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
35655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	emit(pc, inst);
35755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
35855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
359f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic boolean
3602a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggscheck_swap_src_0_1(struct nv50_pc *pc,
3612a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		   struct nv50_reg **s0, struct nv50_reg **s1)
3622a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
3632a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	struct nv50_reg *src0 = *s0, *src1 = *s1;
3642a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3652a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src0->type == P_CONST) {
3662a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		if (src1->type != P_CONST) {
3672a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s0 = src1;
3682a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s1 = src0;
3692a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			return TRUE;
3702a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		}
3712a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
3722a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src1->type == P_ATTR) {
3732a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		if (src0->type != P_ATTR) {
3742a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s0 = src1;
3752a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s1 = src0;
3762a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			return TRUE;
3772a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		}
3782a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
3792a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3802a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	return FALSE;
3812a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
3822a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3832a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
3842a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsset_src_0(struct nv50_pc *pc, struct nv50_reg *src, unsigned *inst)
3852a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
3862a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_ATTR) {
3872a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		set_long(pc, inst);
3882a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		inst[1] |= 0x00200000;
3892a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
3902a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_CONST || src->type == P_IMMD) {
3912a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		struct nv50_reg *temp = temp_temp(pc);
3922a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3932a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mov(pc, temp, src);
3942a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		src = temp;
3952a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
3962a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3972a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	alloc_reg(pc, src);
3982a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	inst[0] |= (src->hw << 9);
3992a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
4002a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4012a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
4022a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsset_src_1(struct nv50_pc *pc, struct nv50_reg *src, unsigned *inst)
4032a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
4042a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_ATTR) {
4052a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		struct nv50_reg *temp = temp_temp(pc);
4062a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4072a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mov(pc, temp, src);
4082a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		src = temp;
4092a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
4102a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_CONST || src->type == P_IMMD) {
4112a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		set_cseg(pc, src, inst);
4122a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		inst[0] |= 0x00800000;
4132a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
4142a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4152a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	alloc_reg(pc, src);
4162a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	inst[0] |= (src->hw << 16);
4172a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
4182a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4192a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
4202a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsset_src_2(struct nv50_pc *pc, struct nv50_reg *src, unsigned *inst)
4212a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
4222a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	set_long(pc, inst);
4232a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4242a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_ATTR) {
4252a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		struct nv50_reg *temp = temp_temp(pc);
4262a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4272a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mov(pc, temp, src);
4282a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		src = temp;
4292a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
4302a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_CONST || src->type == P_IMMD) {
4312a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		set_cseg(pc, src, inst);
4322a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		inst[0] |= 0x01000000;
4332a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
4342a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4352a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	alloc_reg(pc, src);
4362a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	inst[1] |= (src->hw << 14);
4372a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
4382a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/* Emit dst = src0 * src1 (opcode bits 0xc0000000).
 *
 * The sources may be exchanged by check_swap_src_0_1() before encoding so
 * that each lands in an operand position that can read its register file.
 */
static void
emit_mul(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
	 struct nv50_reg *src1)
{
	unsigned op[2] = { 0xc0000000, 0 };

	check_swap_src_0_1(pc, &src0, &src1);

	set_dst(pc, dst, op);
	set_src_0(pc, src0, op);
	set_src_1(pc, src1, op);

	emit(pc, op);
}
4542a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/*
 * Emit an add: dst = src0 + src1.
 *
 * If encoding dst/src0 turned the instruction into its long form, the
 * second operand is encoded through set_src_2(); otherwise it goes through
 * set_src_1().
 */
static void
emit_add(struct nv50_pc *pc, struct nv50_reg *dst,
	 struct nv50_reg *src0, struct nv50_reg *src1)
{
	/* 0xb0000000 is the opcode value this function places in word 0. */
	unsigned code[2] = { 0xb0000000, 0 };

	check_swap_src_0_1(pc, &src0, &src1);

	set_dst(pc, dst, code);
	set_src_0(pc, src0, code);

	if (!is_long(code)) {
		set_src_1(pc, src1, code);
	} else {
		set_src_2(pc, src1, code);
	}

	emit(pc, code);
}
47352a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs
/*
 * Emit a min/max style operation selected by 'sub'.
 *
 * The instruction is always long; 'sub' is written at bit 29 of inst[1].
 * Callers in this file pass 4 for TGSI MAX and 5 for TGSI MIN.
 */
static void
emit_minmax(struct nv50_pc *pc, unsigned sub, struct nv50_reg *dst,
	    struct nv50_reg *src0, struct nv50_reg *src1)
{
	unsigned code[2] = { 0, 0 };

	set_long(pc, code);
	code[0] |= 0xb0000000;
	code[1] |= (sub << 29);

	/* Operand order does not matter for min/max, so swapping is fine. */
	check_swap_src_0_1(pc, &src0, &src1);

	set_dst(pc, dst, code);
	set_src_0(pc, src0, code);
	set_src_1(pc, src1, code);

	emit(pc, code);
}
4912a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/*
 * Emit a subtract: dst = src0 - src1.
 *
 * Built on the same 0xb0000000 opcode as emit_add(), in long form, with one
 * of two bits set in inst[1] depending on whether check_swap_src_0_1()
 * exchanged the operands: 0x04000000 when they were swapped, 0x08000000
 * when they were not (presumably per-operand negate flags, so that the
 * original src1 is the one subtracted either way).
 */
static void
emit_sub(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
	 struct nv50_reg *src1)
{
	unsigned code[2] = { 0xb0000000, 0 };
	unsigned negate;

	set_long(pc, code);

	negate = check_swap_src_0_1(pc, &src0, &src1) ? 0x04000000
						      : 0x08000000;
	code[1] |= negate;

	set_dst(pc, dst, code);
	set_src_0(pc, src0, code);
	set_src_2(pc, src1, code);

	emit(pc, code);
}
5122a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/*
 * Emit a multiply-add: dst = src0 * src1 + src2.
 *
 * Only the two multiplicands are candidates for swapping; src2 is always
 * encoded through set_src_2().
 */
static void
emit_mad(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
	 struct nv50_reg *src1, struct nv50_reg *src2)
{
	/* 0xe0000000 is the opcode value this function places in word 0. */
	unsigned code[2] = { 0xe0000000, 0 };

	check_swap_src_0_1(pc, &src0, &src1);

	set_dst(pc, dst, code);
	set_src_0(pc, src0, code);
	set_src_1(pc, src1, code);
	set_src_2(pc, src2, code);

	emit(pc, code);
}
5292a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
5302a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
53121e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggsemit_msb(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
53221e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	 struct nv50_reg *src1, struct nv50_reg *src2)
53321e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs{
53421e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	unsigned inst[2] = { 0, 0 };
53521e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs
53621e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	inst[0] |= 0xe0000000;
53721e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	set_long(pc, inst);
53821e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	inst[1] |= 0x08000000; /* src0 * src1 - src2 */
53921e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs
54021e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	check_swap_src_0_1(pc, &src0, &src1);
54121e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	set_dst(pc, dst, inst);
54221e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	set_src_0(pc, src0, inst);
54321e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	set_src_1(pc, src1, inst);
54421e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	set_src_2(pc, src2, inst);
54521e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs
54621e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	emit(pc, inst);
54721e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs}
54821e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs
54921e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggsstatic void
5502a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsemit_flop(struct nv50_pc *pc, unsigned sub,
5512a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	  struct nv50_reg *dst, struct nv50_reg *src)
5522a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
5532a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	unsigned inst[2] = { 0, 0 };
5542a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
5552a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	inst[0] |= 0x90000000;
55652a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	if (sub) {
55752a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs		set_long(pc, inst);
55852a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs		inst[1] |= (sub << 29);
55952a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	}
5602a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
5612a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	set_dst(pc, dst, inst);
5622a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	set_src_0(pc, src, inst);
5632a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
5642a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	emit(pc, inst);
5652a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
5662a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/*
 * Emit the preparation step that the EX2 translation issues before
 * emit_flop(pc, 6, ...).
 *
 * Uses opcode 0xb0000000 in long form with sub-operation 6 at bit 29 and
 * bit 0x00004000 set in inst[1].
 */
static void
emit_preex2(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
{
	unsigned code[2] = { 0xb0000000, 0 };

	set_dst(pc, dst, code);
	set_src_0(pc, src, code);

	/* Long form is requested only after the operands are encoded. */
	set_long(pc, code);
	code[1] |= (6 << 29) | 0x00004000;

	emit(pc, code);
}
581bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs/*XXX: inaccurate results.. why? */
582bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs#define ALLOW_SET_SWAP 0
583bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
584bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggsstatic void
585bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggsemit_set(struct nv50_pc *pc, unsigned c_op, struct nv50_reg *dst,
586bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 struct nv50_reg *src0, struct nv50_reg *src1)
587bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs{
588bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	unsigned inst[2] = { 0, 0 };
589bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs#if ALLOW_SET_SWAP
590bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	unsigned inv_cop[8] = { 0, 6, 2, 4, 3, 5, 1, 7 };
591bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs#endif
592bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	struct nv50_reg *rdst;
593bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
594bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs#if ALLOW_SET_SWAP
595bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	assert(c_op <= 7);
596bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (check_swap_src_0_1(pc, &src0, &src1))
597bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		c_op = inv_cop[c_op];
598bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs#endif
599bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
600bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	rdst = dst;
601bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (dst->type != P_TEMP)
602bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		dst = alloc_temp(pc, NULL);
603bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
604bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	/* set.u32 */
605bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_long(pc, inst);
606bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[0] |= 0xb0000000;
607bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[1] |= (3 << 29);
608bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[1] |= (c_op << 14);
609bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	/*XXX: breaks things, .u32 by default?
610bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 *     decuda will disasm as .u16 and use .lo/.hi regs, but this
611bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 *     doesn't seem to match what the hw actually does.
612bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[1] |= 0x04000000; << breaks things.. .u32 by default?
613bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 */
614bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_dst(pc, dst, inst);
615bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_src_0(pc, src0, inst);
616bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_src_1(pc, src1, inst);
617bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	emit(pc, inst);
618bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
619bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	/* cvt.f32.u32 */
620bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[0] = 0xa0000001;
621bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[1] = 0x64014780;
622bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_dst(pc, rdst, inst);
623bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_src_0(pc, dst, inst);
624bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	emit(pc, inst);
625bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
626bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (dst != rdst)
627bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		free_temp(pc, dst);
628bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs}
629d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggs
/*
 * Emit the cvt instruction used to implement TGSI FLR (and the first step
 * of FRC): dst receives src converted in "integer mode".
 *
 * The opcode is stored in inst[0] *before* set_long() is called.  Doing it
 * the other way round with a plain assignment discards whatever set_long()
 * wrote into inst[0], so the instruction would no longer be marked long
 * even though all of its modifier bits live in inst[1].
 */
static void
emit_flr(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
{
	unsigned inst[2] = { 0, 0 };

	inst[0] = 0xa0000000; /* cvt */
	set_long(pc, inst);
	inst[1] |= (6 << 29); /* cvt */
	inst[1] |= 0x08000000; /* integer mode */
	inst[1] |= 0x04000000; /* 32 bit */
	inst[1] |= ((0x1 << 3)) << 14; /* .rn */
	inst[1] |= (1 << 14); /* src .f32 */
	set_dst(pc, dst, inst);
	set_src_0(pc, src, inst);

	emit(pc, inst);
}
647b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs
6482a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic boolean
649f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_tx_insn(struct nv50_pc *pc, const union tgsi_full_token *tok)
650f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
651f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	const struct tgsi_full_instruction *inst = &tok->FullInstruction;
6522a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	struct nv50_reg *dst[4], *src[3][4], *temp;
653f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	unsigned mask;
654f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int i, c;
655f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
656f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	NOUVEAU_ERR("insn %p\n", tok);
657f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
658f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	mask = inst->FullDstRegisters[0].DstRegister.WriteMask;
659f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
660f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (c = 0; c < 4; c++) {
661f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (mask & (1 << c))
662f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			dst[c] = tgsi_dst(pc, c, &inst->FullDstRegisters[0]);
663f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		else
664f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			dst[c] = NULL;
665f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
666f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
667f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (i = 0; i < inst->Instruction.NumSrcRegs; i++) {
668f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (c = 0; c < 4; c++)
669f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			src[i][c] = tgsi_src(pc, c, &inst->FullSrcRegisters[i]);
670f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
671f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
672f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	switch (inst->Instruction.Opcode) {
6732a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_ADD:
6747df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
6757df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
6767df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
6772a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_add(pc, dst[c], src[0][c], src[1][c]);
6787df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
6792a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
6802a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_COS:
6817df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
6827df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
6837df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
6842a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_flop(pc, 5, dst[c], src[0][c]);
6857df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
6862a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
6872a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_DP3:
6882a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		temp = alloc_temp(pc, NULL);
6892a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mul(pc, temp, src[0][0], src[1][0]);
6902a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][1], src[1][1], temp);
6912a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][2], src[1][2], temp);
6927df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
6937df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
6947df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
6952a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mov(pc, dst[c], temp);
6967df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
6972a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		free_temp(pc, temp);
6982a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
6992a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_DP4:
7002a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		temp = alloc_temp(pc, NULL);
7012a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mul(pc, temp, src[0][0], src[1][0]);
7022a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][1], src[1][1], temp);
7032a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][2], src[1][2], temp);
7042a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][3], src[1][3], temp);
7057df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
7067df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
7077df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
7082a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mov(pc, dst[c], temp);
7097df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
7102a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		free_temp(pc, temp);
7112a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
71221e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	case TGSI_OPCODE_DPH:
71321e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		temp = alloc_temp(pc, NULL);
71421e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mul(pc, temp, src[0][0], src[1][0]);
71521e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mad(pc, temp, src[0][1], src[1][1], temp);
71621e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mad(pc, temp, src[0][2], src[1][2], temp);
71721e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_add(pc, temp, src[1][3], temp);
71821e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		for (c = 0; c < 4; c++) {
71921e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs			if (!(mask & (1 << c)))
72021e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs				continue;
72121e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs			emit_mov(pc, dst[c], temp);
72221e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		}
72321e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		free_temp(pc, temp);
72421e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		break;
7252a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_EX2:
726fbf4027dd9b279ec159906dcad134f71e34aaec8Ben Skeggs		temp = alloc_temp(pc, NULL);
7277df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
7287df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
7297df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
730d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggs			emit_preex2(pc, temp, src[0][c]);
731fbf4027dd9b279ec159906dcad134f71e34aaec8Ben Skeggs			emit_flop(pc, 6, dst[c], temp);
7327df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
733fbf4027dd9b279ec159906dcad134f71e34aaec8Ben Skeggs		free_temp(pc, temp);
7342a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
735b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs	case TGSI_OPCODE_FLR:
736b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		for (c = 0; c < 4; c++) {
737b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			if (!(mask & (1 << c)))
738b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs				continue;
739b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			emit_flr(pc, dst[c], src[0][c]);
740b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		}
741b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		break;
742b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs	case TGSI_OPCODE_FRC:
743b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		temp = alloc_temp(pc, NULL);
744b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		for (c = 0; c < 4; c++) {
745b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			if (!(mask & (1 << c)))
746b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs				continue;
747b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			emit_flr(pc, temp, src[0][c]);
748b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			emit_sub(pc, dst[c], src[0][c], temp);
749b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		}
750b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		free_temp(pc, temp);
751b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		break;
7522a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_LG2:
7537df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
7547df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
7557df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
7562a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_flop(pc, 3, dst[c], src[0][c]);
7577df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
7582a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
7592a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_MAD:
7607df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
7617df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
7627df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
7632a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mad(pc, dst[c], src[0][c], src[1][c], src[2][c]);
7647df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
7652a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
76652a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	case TGSI_OPCODE_MAX:
7677df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
7687df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
7697df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
77052a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs			emit_minmax(pc, 4, dst[c], src[0][c], src[1][c]);
7717df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
77252a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs		break;
77352a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	case TGSI_OPCODE_MIN:
7747df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
7757df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
7767df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
77752a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs			emit_minmax(pc, 5, dst[c], src[0][c], src[1][c]);
7787df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
77952a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs		break;
780f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_OPCODE_MOV:
7817df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
7827df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
7837df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
78455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs			emit_mov(pc, dst[c], src[0][c]);
7857df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
78638ce697e5942550888c28bd4859ca2a92f247bf7Ben Skeggs		break;
7872a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_MUL:
7887df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
7897df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
7907df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
7912a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mul(pc, dst[c], src[0][c], src[1][c]);
7927df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
7932a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
7942a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_RCP:
7957df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
7967df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
7977df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
7982a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_flop(pc, 0, dst[c], src[0][c]);
7997df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
8002a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
8012a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_RSQ:
8027df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8037df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8047df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
8052a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_flop(pc, 2, dst[c], src[0][c]);
8067df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
8072a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
808bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	case TGSI_OPCODE_SGE:
809bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		for (c = 0; c < 4; c++) {
810bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			if (!(mask & (1 << c)))
811bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs				continue;
812bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			emit_set(pc, 6, dst[c], src[0][c], src[1][c]);
813bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		}
814bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		break;
8152a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_SIN:
8167df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8177df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8187df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
8192a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_flop(pc, 4, dst[c], src[0][c]);
8207df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
8212a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
822bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	case TGSI_OPCODE_SLT:
823bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		for (c = 0; c < 4; c++) {
824bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			if (!(mask & (1 << c)))
825bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs				continue;
826bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			emit_set(pc, 1, dst[c], src[0][c], src[1][c]);
827bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		}
828bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		break;
8292a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_SUB:
8307df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8317df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8327df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
8332a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_sub(pc, dst[c], src[0][c], src[1][c]);
8347df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
8352a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
83621e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	case TGSI_OPCODE_XPD:
83721e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		temp = alloc_temp(pc, NULL);
83821e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mul(pc, temp, src[0][2], src[1][1]);
83921e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_msb(pc, dst[0], src[0][1], src[1][2], temp);
84021e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mul(pc, temp, src[0][0], src[1][2]);
84121e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_msb(pc, dst[1], src[0][2], src[1][0], temp);
84221e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mul(pc, temp, src[0][1], src[1][0]);
84321e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_msb(pc, dst[2], src[0][0], src[1][1], temp);
84421e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		free_temp(pc, temp);
84521e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		break;
846f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_OPCODE_END:
847f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		break;
848f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	default:
849f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		NOUVEAU_ERR("invalid opcode %d\n", inst->Instruction.Opcode);
850f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return FALSE;
851f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
852f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
85352a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	kill_temp_temp(pc);
854f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return TRUE;
855f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
856f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
857f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic boolean
858f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_tx_prep(struct nv50_pc *pc)
859f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
860f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct tgsi_parse_context p;
861f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	boolean ret = FALSE;
862f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	unsigned i, c;
863f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
864f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_init(&p, pc->p->pipe.tokens);
865f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	while (!tgsi_parse_end_of_tokens(&p)) {
866f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		const union tgsi_full_token *tok = &p.FullToken;
867f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
868f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		tgsi_parse_token(&p);
869f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		switch (tok->Token.Type) {
870f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_IMMEDIATE:
871f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		{
872f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			const struct tgsi_full_immediate *imm =
873f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				&p.FullToken.FullImmediate;
874f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
875f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			pc->immd_nr++;
876f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			pc->immd_buf = realloc(pc->immd_buf, 4 * pc->immd_nr *
877f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs							     sizeof(float));
878f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			pc->immd_buf[4 * (pc->immd_nr - 1) + 0] =
879f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				imm->u.ImmediateFloat32[0].Float;
880f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			pc->immd_buf[4 * (pc->immd_nr - 1) + 1] =
881f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				imm->u.ImmediateFloat32[1].Float;
882f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			pc->immd_buf[4 * (pc->immd_nr - 1) + 2] =
883f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				imm->u.ImmediateFloat32[2].Float;
884f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			pc->immd_buf[4 * (pc->immd_nr - 1) + 3] =
885f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				imm->u.ImmediateFloat32[3].Float;
886f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
887f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
888f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_DECLARATION:
889f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		{
890f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			const struct tgsi_full_declaration *d;
891f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			unsigned last;
892f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
893f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			d = &p.FullToken.FullDeclaration;
894f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			last = d->u.DeclarationRange.Last;
895f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
896f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			switch (d->Declaration.File) {
897f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_TEMPORARY:
898f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->temp_nr < (last + 1))
899f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->temp_nr = last + 1;
900f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
901f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_OUTPUT:
902f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->result_nr < (last + 1))
903f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->result_nr = last + 1;
904f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
905f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_INPUT:
906f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->attr_nr < (last + 1))
907f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->attr_nr = last + 1;
908f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
909f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_CONSTANT:
910f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->param_nr < (last + 1))
911f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->param_nr = last + 1;
912f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
913f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			default:
914f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				NOUVEAU_ERR("bad decl file %d\n",
915f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					    d->Declaration.File);
916f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				goto out_err;
917f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
918f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
919f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
920f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_INSTRUCTION:
921f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
922f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		default:
923f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
924f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
925f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
926f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
927f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	NOUVEAU_ERR("%d temps\n", pc->temp_nr);
928f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->temp_nr) {
929f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->temp = calloc(pc->temp_nr * 4, sizeof(struct nv50_reg));
930f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->temp)
931f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
932f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
933f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->temp_nr; i++) {
934f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
935f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->temp[i*4+c].type = P_TEMP;
936f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->temp[i*4+c].hw = -1;
937f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->temp[i*4+c].index = i;
938f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
939f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
940f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
941f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
942f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	NOUVEAU_ERR("%d attrib regs\n", pc->attr_nr);
943f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->attr_nr) {
9448ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		struct nv50_reg *iv = NULL, *tmp = NULL;
945f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		int aid = 0;
946f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
947f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->attr = calloc(pc->attr_nr * 4, sizeof(struct nv50_reg));
948f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->attr)
949f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
950f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
9518ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		if (pc->p->type == NV50_PROG_FRAGMENT) {
9528ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			iv = alloc_temp(pc, NULL);
9538ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			aid++;
9548ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		}
9558ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
956f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->attr_nr; i++) {
9578ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			struct nv50_reg *a = &pc->attr[i*4];
9588ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
959f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
9608ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				if (pc->p->type == NV50_PROG_FRAGMENT) {
9618ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					struct nv50_reg *at =
9628ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs						alloc_temp(pc, NULL);
9638ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].type = at->type;
9648ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].hw = at->hw;
9658ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].index = at->index;
9668ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				} else {
9678ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->p->cfg.vp.attr[aid/32] |=
9688ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs						(1 << (aid % 32));
9698ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].type = P_ATTR;
9708ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].hw = aid++;
9718ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].index = i;
9728ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				}
973f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
9748ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
9758ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			if (pc->p->type != NV50_PROG_FRAGMENT)
9768ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				continue;
9778ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
9788ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			emit_interp(pc, iv, iv, iv, FALSE);
9798ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			tmp = alloc_temp(pc, NULL);
9808ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			{
9818ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				unsigned inst[2] = { 0, 0 };
9828ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				inst[0]  = 0x90000000;
9838ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				inst[0] |= (tmp->hw << 2);
9848ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				emit(pc, inst);
9858ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			}
9868ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			emit_interp(pc, &a[0], &a[0], tmp, TRUE);
9878ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			emit_interp(pc, &a[1], &a[1], tmp, TRUE);
9888ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			emit_interp(pc, &a[2], &a[2], tmp, TRUE);
9898ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			emit_interp(pc, &a[3], &a[3], tmp, TRUE);
9908ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			free_temp(pc, tmp);
991f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
9928ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
9938ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		if (iv)
9948ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			free_temp(pc, iv);
995f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
996f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
997f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	NOUVEAU_ERR("%d result regs\n", pc->result_nr);
998f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->result_nr) {
999f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		int rid = 0;
1000f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1001f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->result = calloc(pc->result_nr * 4, sizeof(struct nv50_reg));
1002f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->result)
1003f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1004f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1005f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->result_nr; i++) {
1006f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
10078ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				if (pc->p->type == NV50_PROG_FRAGMENT)
10088ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->result[i*4+c].type = P_TEMP;
10098ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				else
10108ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->result[i*4+c].type = P_RESULT;
1011f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->result[i*4+c].hw = rid++;
1012f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->result[i*4+c].index = i;
1013f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1014f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1015f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1016f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1017f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	NOUVEAU_ERR("%d param regs\n", pc->param_nr);
1018f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->param_nr) {
1019f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		int rid = 0;
1020f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1021f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->param = calloc(pc->param_nr * 4, sizeof(struct nv50_reg));
1022f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->param)
1023f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1024f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1025f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->param_nr; i++) {
1026f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1027f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->param[i*4+c].type = P_CONST;
1028f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->param[i*4+c].hw = rid++;
1029f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->param[i*4+c].index = i;
1030f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1031f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1032f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1033f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1034f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->immd_nr) {
1035716c1cd2ecbc1e86c0fd747c9fa9e095ded5fd5dBen Skeggs		int rid = 0;
1036f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1037f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->immd = calloc(pc->immd_nr * 4, sizeof(struct nv50_reg));
1038f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->immd)
1039f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1040f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1041f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->immd_nr; i++) {
1042f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1043f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->immd[i*4+c].type = P_IMMD;
1044f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->immd[i*4+c].hw = rid++;
1045f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->immd[i*4+c].index = i;
1046f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1047f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1048f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1049f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1050f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	ret = TRUE;
1051f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsout_err:
1052f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_free(&p);
1053f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return ret;
1054f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1055f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1056f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic boolean
1057f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_tx(struct nv50_program *p)
1058f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1059f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct tgsi_parse_context parse;
1060f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_pc *pc;
1061f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	boolean ret;
1062f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1063f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	pc = CALLOC_STRUCT(nv50_pc);
1064f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (!pc)
1065f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return FALSE;
1066f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	pc->p = p;
10678ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	pc->p->cfg.high_temp = 4;
1068f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1069f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	ret = nv50_program_tx_prep(pc);
1070f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (ret == FALSE)
1071f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		goto out_cleanup;
1072f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1073f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_init(&parse, pc->p->pipe.tokens);
1074f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	while (!tgsi_parse_end_of_tokens(&parse)) {
1075f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		const union tgsi_full_token *tok = &parse.FullToken;
1076f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1077f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		tgsi_parse_token(&parse);
1078f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1079f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		switch (tok->Token.Type) {
1080f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_INSTRUCTION:
1081f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			ret = nv50_program_tx_insn(pc, tok);
1082f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			if (ret == FALSE)
1083f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				goto out_err;
1084f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1085f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		default:
1086f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1087f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1088f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1089f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1090f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->immd_nr = pc->immd_nr * 4;
1091f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->immd = pc->immd_buf;
1092f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1093f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsout_err:
1094f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_free(&parse);
1095f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1096f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsout_cleanup:
1097f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return ret;
1098f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1099f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1100f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic void
1101f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_validate(struct nv50_context *nv50, struct nv50_program *p)
1102f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1103e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	int i;
1104e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs
1105e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	if (nv50_program_tx(p) == FALSE)
1106e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs		assert(0);
1107e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	/* *not* sufficient, it's fine if last inst is long and
1108e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	 * NOT immd - otherwise it's fucked fucked fucked */
1109e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	p->insns[p->insns_nr - 1] |= 0x00000001;
1110f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
11112a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (p->type == NV50_PROG_VERTEX) {
11122a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	for (i = 0; i < p->insns_nr; i++)
11132a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		NOUVEAU_ERR("VP0x%08x\n", p->insns[i]);
11142a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else {
1115e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	for (i = 0; i < p->insns_nr; i++)
11162a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		NOUVEAU_ERR("FP0x%08x\n", p->insns[i]);
11172a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
1118f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1119f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->translated = TRUE;
1120f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1121f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
112222e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsstatic void
112322e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsnv50_program_validate_data(struct nv50_context *nv50, struct nv50_program *p)
112422e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs{
112522e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	int i;
112622e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
112722e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	for (i = 0; i < p->immd_nr; i++) {
112822e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs		BEGIN_RING(tesla, 0x0f00, 2);
112922e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs		OUT_RING  ((NV50_CB_PMISC << 16) | (i << 8));
113022e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs		OUT_RING  (fui(p->immd[i]));
113122e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	}
113222e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs}
113322e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
113422e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsstatic void
113522e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsnv50_program_validate_code(struct nv50_context *nv50, struct nv50_program *p)
113622e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs{
113722e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	struct pipe_winsys *ws = nv50->pipe.winsys;
113822e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	void *map;
113922e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
114022e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	if (!p->buffer)
114122e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs		p->buffer = ws->buffer_create(ws, 0x100, 0, p->insns_nr * 4);
114222e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	map = ws->buffer_map(ws, p->buffer, PIPE_BUFFER_USAGE_CPU_WRITE);
114322e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	memcpy(map, p->insns, p->insns_nr * 4);
114422e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	ws->buffer_unmap(ws, p->buffer);
114522e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs}
114622e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
1147f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsvoid
1148f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_vertprog_validate(struct nv50_context *nv50)
1149f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1150f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_grobj *tesla = nv50->screen->tesla;
1151f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_program *p = nv50->vertprog;
1152f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_stateobj *so;
1153f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1154f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (!p->translated) {
1155f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		nv50_program_validate(nv50, p);
1156f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!p->translated)
1157f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			assert(0);
1158f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1159f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
116022e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	nv50_program_validate_data(nv50, p);
116122e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	nv50_program_validate_code(nv50, p);
1162f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1163f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so = so_new(11, 2);
1164f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, NV50TCL_VP_ADDRESS_HIGH, 2);
1165f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1166f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_HIGH, 0, 0);
1167f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1168f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_LOW, 0, 0);
1169f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, 0x1650, 2);
1170f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, p->cfg.vp.attr[0]);
1171f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, p->cfg.vp.attr[1]);
1172f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, 0x16ac, 2);
1173f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, 8);
11748ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_data  (so, p->cfg.high_temp);
1175f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, 0x140c, 1);
1176f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, 0); /* program start offset */
1177f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_emit(nv50->screen->nvws, so);
1178f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_ref(NULL, &so);
1179f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1180f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1181f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsvoid
1182f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_fragprog_validate(struct nv50_context *nv50)
1183f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1184f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_grobj *tesla = nv50->screen->tesla;
1185f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_program *p = nv50->fragprog;
1186f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_stateobj *so;
1187f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1188f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (!p->translated) {
1189f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		nv50_program_validate(nv50, p);
1190f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!p->translated)
1191f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			assert(0);
1192f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1193f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
119455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	nv50_program_validate_data(nv50, p);
119555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	nv50_program_validate_code(nv50, p);
1196f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
11978ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so = so_new(7, 2);
1198f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, NV50TCL_FP_ADDRESS_HIGH, 2);
1199f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1200f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_HIGH, 0, 0);
1201f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1202f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_LOW, 0, 0);
12038ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_method(so, tesla, 0x198c, 1);
12048ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_data  (so, p->cfg.high_temp);
12058ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_method(so, tesla, 0x1414, 1);
12068ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_data  (so, 0); /* program start offset */
1207f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_emit(nv50->screen->nvws, so);
1208f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_ref(NULL, &so);
1209f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1210f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1211f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsvoid
1212f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_destroy(struct nv50_context *nv50, struct nv50_program *p)
1213f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1214f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct pipe_winsys *ws = nv50->pipe.winsys;
1215f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1216f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (p->insns_nr) {
1217f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (p->insns)
1218f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			FREE(p->insns);
1219f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		p->insns_nr = 0;
1220f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1221f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1222f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (p->buffer)
1223f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pipe_buffer_reference(ws, &p->buffer, NULL);
1224f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1225f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->translated = 0;
1226f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1227f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1228