nv50_program.c revision ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69
1f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_context.h"
2f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_defines.h"
3f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_state.h"
4f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_inlines.h"
5f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
6f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_shader_tokens.h"
7f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "tgsi/util/tgsi_parse.h"
8f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "tgsi/util/tgsi_util.h"
9f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
10f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "nv50_context.h"
11f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "nv50_state.h"
12f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
13f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#define NV50_SU_MAX_TEMP 64
14f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
/* ARL
 * LIT - other buggery
 *
 * MSB - Like MAD, but MUL+SUB
 * 	- Drop it as a separate op; introduce a way to negate args for ops
 * 	  that support it.
 *
 * Look into inlining IMMD for ops other than MOV (make it general?)
 * 	- Maybe even relax restrictions a bit: can't do P_RESULT + P_IMMD,
 * 	  but can emit to P_TEMP first, then MOV later. NVIDIA does this.
 *
 * Verify half-insns work where expected, and force-disable them where they
 * don't work. MUL has them forcibly disabled at the moment as that fixes POW.
 */
/* A single scalar register operand as tracked by the code generator. */
struct nv50_reg {
	/* Register file the operand lives in. */
	enum {
		P_TEMP,
		P_ATTR,
		P_RESULT,
		P_CONST,
		P_IMMD
	} type;

	/* -1 for registers created on the fly by alloc_temp()/alloc_immd();
	 * free_temp() only releases registers whose index is -1. */
	int index;

	/* Hardware slot.  For P_TEMP a negative value means "no slot assigned
	 * yet" (see alloc_reg()); for P_IMMD it indexes pc->immd_buf (see
	 * set_immd()). */
	int hw;

	/* NOTE(review): presumably a "negate this operand" flag -- it is not
	 * referenced in this part of the file, confirm against its users. */
	int neg;
};
42f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
43f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstruct nv50_pc {
44f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_program *p;
45f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
46f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	/* hw resources */
47f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *r_temp[NV50_SU_MAX_TEMP];
48f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
49f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	/* tgsi resources */
50f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *temp;
51f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int temp_nr;
52f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *attr;
53f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int attr_nr;
54f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *result;
55f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int result_nr;
56f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *param;
57f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int param_nr;
58f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *immd;
59f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	float *immd_buf;
60f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int immd_nr;
612a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
6252a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	struct nv50_reg *temp_temp[8];
632a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	unsigned temp_temp_nr;
64f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs};
65f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
66f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic void
67f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsalloc_reg(struct nv50_pc *pc, struct nv50_reg *reg)
68f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
69f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int i;
70f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
718ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	if (reg->type != P_TEMP)
72f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return;
73f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
748ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	if (reg->hw >= 0) {
758ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		/*XXX: do this here too to catch FP temp-as-attr usage..
768ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		 *     not clean, but works */
778ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		if (pc->p->cfg.high_temp < (reg->hw + 1))
788ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			pc->p->cfg.high_temp = reg->hw + 1;
798ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		return;
808ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	}
818ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
82f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (i = 0; i < NV50_SU_MAX_TEMP; i++) {
83f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!(pc->r_temp[i])) {
84f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			pc->r_temp[i] = reg;
85f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			reg->hw = i;
868ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			if (pc->p->cfg.high_temp < (i + 1))
878ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				pc->p->cfg.high_temp = i + 1;
88f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			return;
89f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
90f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
91f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
92f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	assert(0);
93f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
94f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
95f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic struct nv50_reg *
96f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsalloc_temp(struct nv50_pc *pc, struct nv50_reg *dst)
97f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
98f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *r;
99f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int i;
100f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
101f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (dst && dst->type == P_TEMP && dst->hw == -1)
102f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return dst;
103f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
104f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (i = 0; i < NV50_SU_MAX_TEMP; i++) {
105f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->r_temp[i]) {
106f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r = CALLOC_STRUCT(nv50_reg);
107f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r->type = P_TEMP;
108f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r->index = -1;
109f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r->hw = i;
110f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			pc->r_temp[i] = r;
111f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			return r;
112f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
113f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
114f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
115f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	assert(0);
116f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return NULL;
117f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
118f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
119f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic void
120f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsfree_temp(struct nv50_pc *pc, struct nv50_reg *r)
121f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
122f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (r->index == -1) {
123f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		FREE(pc->r_temp[r->hw]);
124f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->r_temp[r->hw] = NULL;
125f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
126f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
127f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
128f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic struct nv50_reg *
1292a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggstemp_temp(struct nv50_pc *pc)
1302a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
13152a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	if (pc->temp_temp_nr >= 8)
1322a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		assert(0);
1332a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
1342a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	pc->temp_temp[pc->temp_temp_nr] = alloc_temp(pc, NULL);
1352a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	return pc->temp_temp[pc->temp_temp_nr++];
1362a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
1372a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
1382a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
1392a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggskill_temp_temp(struct nv50_pc *pc)
1402a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
1412a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	int i;
1422a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
1432a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	for (i = 0; i < pc->temp_temp_nr; i++)
1442a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		free_temp(pc, pc->temp_temp[i]);
1452a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	pc->temp_temp_nr = 0;
1462a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
1472a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
14833e4d30d50344be26398a51365bea1be37487403Ben Skeggsstatic int
14933e4d30d50344be26398a51365bea1be37487403Ben Skeggsctor_immd(struct nv50_pc *pc, float x, float y, float z, float w)
15033e4d30d50344be26398a51365bea1be37487403Ben Skeggs{
15133e4d30d50344be26398a51365bea1be37487403Ben Skeggs	pc->immd_buf = realloc(pc->immd_buf, (pc->immd_nr + 1) * 4 *
15233e4d30d50344be26398a51365bea1be37487403Ben Skeggs					     sizeof(float));
15333e4d30d50344be26398a51365bea1be37487403Ben Skeggs	pc->immd_buf[(pc->immd_nr * 4) + 0] = x;
15433e4d30d50344be26398a51365bea1be37487403Ben Skeggs	pc->immd_buf[(pc->immd_nr * 4) + 1] = x;
15533e4d30d50344be26398a51365bea1be37487403Ben Skeggs	pc->immd_buf[(pc->immd_nr * 4) + 2] = x;
15633e4d30d50344be26398a51365bea1be37487403Ben Skeggs	pc->immd_buf[(pc->immd_nr * 4) + 3] = x;
15733e4d30d50344be26398a51365bea1be37487403Ben Skeggs
15833e4d30d50344be26398a51365bea1be37487403Ben Skeggs	return pc->immd_nr++;
15933e4d30d50344be26398a51365bea1be37487403Ben Skeggs}
16033e4d30d50344be26398a51365bea1be37487403Ben Skeggs
16133e4d30d50344be26398a51365bea1be37487403Ben Skeggsstatic struct nv50_reg *
16233e4d30d50344be26398a51365bea1be37487403Ben Skeggsalloc_immd(struct nv50_pc *pc, float f)
16333e4d30d50344be26398a51365bea1be37487403Ben Skeggs{
16433e4d30d50344be26398a51365bea1be37487403Ben Skeggs	struct nv50_reg *r = CALLOC_STRUCT(nv50_reg);
16533e4d30d50344be26398a51365bea1be37487403Ben Skeggs	unsigned hw;
16633e4d30d50344be26398a51365bea1be37487403Ben Skeggs
16733e4d30d50344be26398a51365bea1be37487403Ben Skeggs	hw = ctor_immd(pc, f, 0, 0, 0);
16833e4d30d50344be26398a51365bea1be37487403Ben Skeggs	r->type = P_IMMD;
16933e4d30d50344be26398a51365bea1be37487403Ben Skeggs	r->hw = hw;
17033e4d30d50344be26398a51365bea1be37487403Ben Skeggs	r->index = -1;
17133e4d30d50344be26398a51365bea1be37487403Ben Skeggs	return r;
17233e4d30d50344be26398a51365bea1be37487403Ben Skeggs}
17333e4d30d50344be26398a51365bea1be37487403Ben Skeggs
1742a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic struct nv50_reg *
175f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggstgsi_dst(struct nv50_pc *pc, int c, const struct tgsi_full_dst_register *dst)
176f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
177f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	switch (dst->DstRegister.File) {
178f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_FILE_TEMPORARY:
179f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return &pc->temp[dst->DstRegister.Index * 4 + c];
180f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_FILE_OUTPUT:
181f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return &pc->result[dst->DstRegister.Index * 4 + c];
182f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_FILE_NULL:
183f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return NULL;
184f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	default:
185f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		break;
186f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
187f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
188f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return NULL;
189f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
190f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
191f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic struct nv50_reg *
19234abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggstgsi_src(struct nv50_pc *pc, int chan, const struct tgsi_full_src_register *src)
193f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
19434abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs	struct nv50_reg *r = NULL;
19534abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs	unsigned c;
19634abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs
19734abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs	c = tgsi_util_get_full_src_register_extswizzle(src, chan);
198f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	switch (c) {
19934abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs	case TGSI_EXTSWIZZLE_X:
20034abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs	case TGSI_EXTSWIZZLE_Y:
20134abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs	case TGSI_EXTSWIZZLE_Z:
20234abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs	case TGSI_EXTSWIZZLE_W:
20334abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs		switch (src->SrcRegister.File) {
20434abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs		case TGSI_FILE_INPUT:
20534abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs			r = &pc->attr[src->SrcRegister.Index * 4 + c];
20634abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs			break;
20734abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs		case TGSI_FILE_TEMPORARY:
20834abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs			r = &pc->temp[src->SrcRegister.Index * 4 + c];
20934abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs			break;
21034abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs		case TGSI_FILE_CONSTANT:
21134abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs			r = &pc->param[src->SrcRegister.Index * 4 + c];
21234abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs			break;
21334abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs		case TGSI_FILE_IMMEDIATE:
21434abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs			r = &pc->immd[src->SrcRegister.Index * 4 + c];
21534abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs			break;
21634abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs		default:
21734abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs			assert(0);
21834abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs			break;
21934abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs		}
22034abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs		break;
22134abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs	case TGSI_EXTSWIZZLE_ZERO:
22234abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs		r = alloc_immd(pc, 0.0);
22334abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs		break;
22434abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs	case TGSI_EXTSWIZZLE_ONE:
22534abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs		r = alloc_immd(pc, 1.0);
22634abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs		break;
227f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	default:
228f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		assert(0);
22934abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs		break;
230f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
231f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
23234abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs	switch (tgsi_util_get_full_src_register_sign_mode(src, chan)) {
23334abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs	case TGSI_UTIL_SIGN_KEEP:
23434abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs		break;
235f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	default:
23634abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs		assert(0);
237f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		break;
238f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
239f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
24034abb858e2aaef2c1a066a7cdb3e0376d6c9f6bdBen Skeggs	return r;
241f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
242f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
24355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic void
24455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsemit(struct nv50_pc *pc, unsigned *inst)
24555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
24655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	struct nv50_program *p = pc->p;
24755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
248bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (inst[0] & 1) {
249bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		p->insns_nr += 2;
250bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		p->insns = realloc(p->insns, sizeof(unsigned) * p->insns_nr);
251bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		memcpy(p->insns + (p->insns_nr - 2), inst, sizeof(unsigned)*2);
252bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	} else {
253bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		p->insns_nr += 1;
254bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		p->insns = realloc(p->insns, sizeof(unsigned) * p->insns_nr);
255bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		memcpy(p->insns + (p->insns_nr - 1), inst, sizeof(unsigned));
256bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	}
25755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
25855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
25955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void set_long(struct nv50_pc *, unsigned *);
26055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
26155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic boolean
26255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsis_long(unsigned *inst)
26355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
26455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (inst[0] & 1)
26555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		return TRUE;
26655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	return FALSE;
26755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
26855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
26955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic boolean
27055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsis_immd(unsigned *inst)
27155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
27255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (is_long(inst) && (inst[1] & 3) == 3)
27355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		return TRUE;
27455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	return FALSE;
27555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
27655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
27755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
27855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsset_pred(struct nv50_pc *pc, unsigned pred, unsigned idx, unsigned *inst)
27955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
28055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_long(pc, inst);
28155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] &= ~((0x1f << 7) | (0x3 << 12));
28255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] |= (pred << 7) | (idx << 12);
28355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
28455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
28555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
28655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsset_pred_wr(struct nv50_pc *pc, unsigned on, unsigned idx, unsigned *inst)
28755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
28855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_long(pc, inst);
28955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] &= ~((0x3 << 4) | (1 << 6));
29055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] |= (idx << 4) | (on << 6);
29155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
29255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
29355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
29455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsset_long(struct nv50_pc *pc, unsigned *inst)
29555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
29655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (is_long(inst))
29755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		return;
29855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
29955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[0] |= 1;
30055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_pred(pc, 0xf, 0, inst);
30155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_pred_wr(pc, 0, 0, inst);
30255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
30355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
30455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
30555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsset_dst(struct nv50_pc *pc, struct nv50_reg *dst, unsigned *inst)
30655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
30755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (dst->type == P_RESULT) {
30855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		set_long(pc, inst);
30955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[1] |= 0x00000008;
31055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	}
31155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
31255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	alloc_reg(pc, dst);
31355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[0] |= (dst->hw << 2);
31455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
31555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
31655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
31755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsset_immd(struct nv50_pc *pc, struct nv50_reg *imm, unsigned *inst)
31855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
31955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	unsigned val = fui(pc->immd_buf[imm->hw]); /* XXX */
32055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
32155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_long(pc, inst);
32255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	/*XXX: can't be predicated - bits overlap.. catch cases where both
32355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	 *     are required and avoid them. */
32455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_pred(pc, 0, 0, inst);
32555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_pred_wr(pc, 0, 0, inst);
32655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
32755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] |= 0x00000002 | 0x00000001;
32855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[0] |= (val & 0x3f) << 16;
32955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[1] |= (val >> 6) << 2;
33055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
33155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
33255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic void
3338ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggsemit_interp(struct nv50_pc *pc, struct nv50_reg *dst,
3348ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	    struct nv50_reg *src, struct nv50_reg *iv, boolean noperspective)
3358ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs{
3368ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	unsigned inst[2] = { 0, 0 };
3378ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
3388ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	inst[0] |= 0x80000000;
3398ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	set_dst(pc, dst, inst);
3408ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	alloc_reg(pc, iv);
3418ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	inst[0] |= (iv->hw << 9);
3428ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	alloc_reg(pc, src);
3438ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	inst[0] |= (src->hw << 16);
3448ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	if (noperspective)
3458ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		inst[0] |= (1 << 25);
3468ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
3478ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	emit(pc, inst);
3488ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs}
3498ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
3508ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggsstatic void
3512a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsset_cseg(struct nv50_pc *pc, struct nv50_reg *src, unsigned *inst)
3522a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
3532a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	set_long(pc, inst);
3542a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_IMMD) {
3552a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		inst[1] |= (NV50_CB_PMISC << 22);
3562a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else {
3572a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		if (pc->p->type == NV50_PROG_VERTEX)
3582a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			inst[1] |= (NV50_CB_PVP << 22);
3592a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		else
3602a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			inst[1] |= (NV50_CB_PFP << 22);
3612a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
3622a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
3632a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3642a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
36555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsemit_mov(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
36655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
36755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	unsigned inst[2] = { 0, 0 };
36855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
36955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	inst[0] |= 0x10000000;
37055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
37155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_dst(pc, dst, inst);
37255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
37355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (dst->type != P_RESULT && src->type == P_IMMD) {
37455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		set_immd(pc, src, inst);
37555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		/*XXX: 32-bit, but steals part of "half" reg space - need to
37655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		 *     catch and handle this case if/when we do half-regs
37755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		 */
37855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[0] |= 0x00008000;
37955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	} else
38055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (src->type == P_IMMD || src->type == P_CONST) {
38155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		set_long(pc, inst);
3822a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		set_cseg(pc, src, inst);
38355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[0] |= (src->hw << 9);
38455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[1] |= 0x20000000; /* src0 const? */
38555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	} else {
38655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		if (src->type == P_ATTR) {
38755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs			set_long(pc, inst);
38855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs			inst[1] |= 0x00200000;
38955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		}
39055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
39155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		alloc_reg(pc, src);
39255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[0] |= (src->hw << 9);
39355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	}
39455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
39555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	/* We really should support "half" instructions here at some point,
39655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	 * but I don't feel confident enough about them yet.
39755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	 */
39855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	set_long(pc, inst);
39955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (is_long(inst) && !is_immd(inst)) {
40055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[1] |= 0x04000000; /* 32-bit */
40155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		inst[1] |= 0x0003c000; /* "subsubop" 0xf == mov */
40255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	}
40355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
40455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	emit(pc, inst);
40555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
40655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
407f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic boolean
4082a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggscheck_swap_src_0_1(struct nv50_pc *pc,
4092a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		   struct nv50_reg **s0, struct nv50_reg **s1)
4102a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
4112a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	struct nv50_reg *src0 = *s0, *src1 = *s1;
4122a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4132a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src0->type == P_CONST) {
4142a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		if (src1->type != P_CONST) {
4152a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s0 = src1;
4162a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s1 = src0;
4172a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			return TRUE;
4182a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		}
4192a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
4202a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src1->type == P_ATTR) {
4212a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		if (src0->type != P_ATTR) {
4222a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s0 = src1;
4232a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s1 = src0;
4242a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			return TRUE;
4252a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		}
4262a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
4272a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4282a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	return FALSE;
4292a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
4302a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4312a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
4322a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsset_src_0(struct nv50_pc *pc, struct nv50_reg *src, unsigned *inst)
4332a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
4342a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_ATTR) {
4352a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		set_long(pc, inst);
4362a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		inst[1] |= 0x00200000;
4372a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
4382a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_CONST || src->type == P_IMMD) {
4392a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		struct nv50_reg *temp = temp_temp(pc);
4402a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4412a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mov(pc, temp, src);
4422a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		src = temp;
4432a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
4442a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4452a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	alloc_reg(pc, src);
4462a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	inst[0] |= (src->hw << 9);
4472a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
4482a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4492a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
4502a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsset_src_1(struct nv50_pc *pc, struct nv50_reg *src, unsigned *inst)
4512a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
4522a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_ATTR) {
4532a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		struct nv50_reg *temp = temp_temp(pc);
4542a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4552a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mov(pc, temp, src);
4562a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		src = temp;
4572a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
4582a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_CONST || src->type == P_IMMD) {
4592a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		set_cseg(pc, src, inst);
4602a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		inst[0] |= 0x00800000;
4612a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
4622a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4632a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	alloc_reg(pc, src);
4642a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	inst[0] |= (src->hw << 16);
4652a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
4662a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4672a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
4682a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsset_src_2(struct nv50_pc *pc, struct nv50_reg *src, unsigned *inst)
4692a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
4702a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	set_long(pc, inst);
4712a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4722a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_ATTR) {
4732a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		struct nv50_reg *temp = temp_temp(pc);
4742a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4752a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mov(pc, temp, src);
4762a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		src = temp;
4772a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
4782a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_CONST || src->type == P_IMMD) {
4792a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		set_cseg(pc, src, inst);
4802a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		inst[0] |= 0x01000000;
4812a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
4822a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4832a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	alloc_reg(pc, src);
4842a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	inst[1] |= (src->hw << 14);
4852a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
4862a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/*
 * Emit a multiply: dst = src0 * src1.
 *
 * The instruction is built with 0xc0000000 in the first word and has
 * set_long() applied. The two sources may be exchanged by
 * check_swap_src_0_1() before they are encoded; the swap result is
 * ignored here.
 */
static void
emit_mul(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
	 struct nv50_reg *src1)
{
	unsigned code[2] = { 0xc0000000, 0 };

	set_long(pc, code);

	check_swap_src_0_1(pc, &src0, &src1);
	set_dst(pc, dst, code);
	set_src_0(pc, src0, code);
	set_src_1(pc, src1, code);

	emit(pc, code);
}
5032a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/*
 * Emit an add: dst = src0 + src1.
 *
 * The instruction is built with 0xb0000000 in the first word. After the
 * destination and first source are encoded, the second operand goes
 * through set_src_2() if is_long() reports true at that point, and
 * through set_src_1() otherwise.
 *
 * NOTE(review): if set_src_1() itself makes the instruction long (for
 * example through set_cseg() for a constant operand), the operand would
 * already have been placed in the source-1 field - confirm whether that
 * case can occur and whether it is encoded correctly.
 */
static void
emit_add(struct nv50_pc *pc, struct nv50_reg *dst,
	 struct nv50_reg *src0, struct nv50_reg *src1)
{
	unsigned code[2] = { 0xb0000000, 0 };

	check_swap_src_0_1(pc, &src0, &src1);
	set_dst(pc, dst, code);
	set_src_0(pc, src0, code);

	if (!is_long(code))
		set_src_1(pc, src1, code);
	else
		set_src_2(pc, src1, code);

	emit(pc, code);
}
52252a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs
/*
 * Emit a min/max style instruction on src0 and src1, writing dst.
 *
 * 'sub' is placed at bit 29 of the second instruction word; callers in
 * this file pass 4 for TGSI_OPCODE_MAX and 5 for TGSI_OPCODE_MIN. The
 * sources may be exchanged by check_swap_src_0_1() before encoding.
 */
static void
emit_minmax(struct nv50_pc *pc, unsigned sub, struct nv50_reg *dst,
	    struct nv50_reg *src0, struct nv50_reg *src1)
{
	unsigned code[2] = { 0, 0 };

	/* set_long() runs on the still-empty instruction, as before. */
	set_long(pc, code);
	code[0] |= 0xb0000000;
	code[1] |= (sub << 29);

	check_swap_src_0_1(pc, &src0, &src1);
	set_dst(pc, dst, code);
	set_src_0(pc, src0, code);
	set_src_1(pc, src1, code);

	emit(pc, code);
}
5402a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/*
 * Emit a subtract: dst = src0 - src1.
 *
 * The instruction is built with 0xb0000000 in the first word and
 * set_long() applied. Because subtraction is not commutative, the result
 * of check_swap_src_0_1() selects the modifier bit in the second word:
 * 0x04000000 when the sources were exchanged, 0x08000000 when they were
 * not (presumably these negate the first or the second encoded operand
 * respectively - confirm against the ISA).
 *
 * The second operand is always encoded with set_src_2().
 */
static void
emit_sub(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
	 struct nv50_reg *src1)
{
	unsigned code[2] = { 0xb0000000, 0 };

	set_long(pc, code);
	code[1] |= check_swap_src_0_1(pc, &src0, &src1) ? 0x04000000
							: 0x08000000;

	set_dst(pc, dst, code);
	set_src_0(pc, src0, code);
	set_src_2(pc, src1, code);

	emit(pc, code);
}
5612a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/*
 * Emit a multiply-add: dst = src0 * src1 + src2.
 *
 * The instruction is built with 0xe0000000 in the first word. Only the
 * two multiplicands are candidates for exchange by check_swap_src_0_1();
 * src2 is always encoded with set_src_2().
 */
static void
emit_mad(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
	 struct nv50_reg *src1, struct nv50_reg *src2)
{
	unsigned code[2] = { 0xe0000000, 0 };

	check_swap_src_0_1(pc, &src0, &src1);
	set_dst(pc, dst, code);
	set_src_0(pc, src0, code);
	set_src_1(pc, src1, code);
	set_src_2(pc, src2, code);

	emit(pc, code);
}
5782a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/*
 * Emit a multiply-subtract: dst = src0 * src1 - src2.
 *
 * Same encoding as emit_mad() (0xe0000000 in the first word), with
 * set_long() applied and 0x08000000 set in the second word to turn the
 * addition into a subtraction. Only the two multiplicands are candidates
 * for exchange by check_swap_src_0_1().
 */
static void
emit_msb(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
	 struct nv50_reg *src1, struct nv50_reg *src2)
{
	unsigned code[2] = { 0xe0000000, 0 };

	set_long(pc, code);
	code[1] |= 0x08000000; /* src0 * src1 - src2 */

	check_swap_src_0_1(pc, &src0, &src1);
	set_dst(pc, dst, code);
	set_src_0(pc, src0, code);
	set_src_1(pc, src1, code);
	set_src_2(pc, src2, code);

	emit(pc, code);
}
59721e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs
/*
 * Emit a single-source instruction from the 0x90000000 opcode group:
 * dst = op(src).
 *
 * 'sub' selects the operation. When it is non-zero, set_long() is
 * applied and 'sub' is stored at bit 29 of the second word; when it is
 * zero, no long-form request is made here. Callers in this file pass 3
 * for LG2, 5 for COS and 6 for the EX2 step.
 */
static void
emit_flop(struct nv50_pc *pc, unsigned sub,
	  struct nv50_reg *dst, struct nv50_reg *src)
{
	unsigned code[2] = { 0x90000000, 0 };

	if (sub != 0) {
		set_long(pc, code);
		code[1] |= (sub << 29);
	}

	set_dst(pc, dst, code);
	set_src_0(pc, src, code);

	emit(pc, code);
}
6152a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
/*
 * Emit the instruction that callers in this file run on an operand before
 * feeding it to emit_flop(pc, 6, ...) (the EX2 and POW paths).
 *
 * The instruction is built with 0xb0000000 in the first word; after the
 * destination and source are encoded, set_long() is applied and the
 * second word gets sub-opcode 6 at bit 29 plus 0x00004000.
 */
static void
emit_preex2(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
{
	unsigned inst[2] = { 0, 0 };

	inst[0] |= 0xb0000000;

	set_dst(pc, dst, inst);
	set_src_0(pc, src, inst);
	set_long(pc, inst);
	/*
	 * Unsigned literal: 6 << 29 does not fit in a signed int, so the
	 * plain-int shift would be undefined behaviour.
	 */
	inst[1] |= (6u << 29) | 0x00004000;

	emit(pc, inst);
}
/* XXX: letting emit_set() swap its sources (and invert the condition code to
 *      match) gives inaccurate results for a reason not yet understood, so
 *      the swap is compiled out. */
631bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs#define ALLOW_SET_SWAP 0
632bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
633bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggsstatic void
634bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggsemit_set(struct nv50_pc *pc, unsigned c_op, struct nv50_reg *dst,
635bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 struct nv50_reg *src0, struct nv50_reg *src1)
636bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs{
637bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	unsigned inst[2] = { 0, 0 };
638bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs#if ALLOW_SET_SWAP
639bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	unsigned inv_cop[8] = { 0, 6, 2, 4, 3, 5, 1, 7 };
640bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs#endif
641bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	struct nv50_reg *rdst;
642bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
643bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs#if ALLOW_SET_SWAP
644bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	assert(c_op <= 7);
645bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (check_swap_src_0_1(pc, &src0, &src1))
646bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		c_op = inv_cop[c_op];
647bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs#endif
648bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
649bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	rdst = dst;
650bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (dst->type != P_TEMP)
651bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		dst = alloc_temp(pc, NULL);
652bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
653bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	/* set.u32 */
654bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_long(pc, inst);
655bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[0] |= 0xb0000000;
656bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[1] |= (3 << 29);
657bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[1] |= (c_op << 14);
658bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	/*XXX: breaks things, .u32 by default?
659bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 *     decuda will disasm as .u16 and use .lo/.hi regs, but this
660bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 *     doesn't seem to match what the hw actually does.
661bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[1] |= 0x04000000; << breaks things.. .u32 by default?
662bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 */
663bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_dst(pc, dst, inst);
664bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_src_0(pc, src0, inst);
665bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_src_1(pc, src1, inst);
666bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	emit(pc, inst);
667bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
668bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	/* cvt.f32.u32 */
669bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[0] = 0xa0000001;
670bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[1] = 0x64014780;
671bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_dst(pc, rdst, inst);
672bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	set_src_0(pc, dst, inst);
673bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	emit(pc, inst);
674bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
675bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (dst != rdst)
676bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		free_temp(pc, dst);
677bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs}
678d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggs
/*
 * Emit the cvt instruction used for TGSI_OPCODE_FLR: dst = floor(src).
 *
 * The instruction is a long-form cvt (0xa0000000, sub-opcode 6 at bit 29
 * of the second word) with the integer-mode, 32-bit, rounding and
 * .f32-source modifier bits set as annotated below.
 */
static void
emit_flr(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
{
	unsigned inst[2] = { 0, 0 };

	inst[0] = 0xa0000000; /* cvt */
	set_long(pc, inst);
	/*
	 * Unsigned literal: 6 << 29 does not fit in a signed int, so the
	 * plain-int shift would be undefined behaviour.
	 */
	inst[1] |= (6u << 29); /* cvt */
	inst[1] |= 0x08000000; /* integer mode */
	inst[1] |= 0x04000000; /* 32 bit */
	inst[1] |= ((0x1 << 3)) << 14; /* .rn */
	inst[1] |= (1 << 14); /* src .f32 */
	set_dst(pc, dst, inst);
	set_src_0(pc, src, inst);

	emit(pc, inst);
}
696b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs
6972a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic boolean
698f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_tx_insn(struct nv50_pc *pc, const union tgsi_full_token *tok)
699f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
700f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	const struct tgsi_full_instruction *inst = &tok->FullInstruction;
701688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	struct nv50_reg *rdst[4], *dst[4], *src[3][4], *temp;
702688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	unsigned mask, sat;
703f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int i, c;
704f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
705f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	NOUVEAU_ERR("insn %p\n", tok);
706f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
707f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	mask = inst->FullDstRegisters[0].DstRegister.WriteMask;
708688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	sat = inst->Instruction.Saturate == TGSI_SAT_ZERO_ONE;
709f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
710f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (c = 0; c < 4; c++) {
711f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (mask & (1 << c))
712f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			dst[c] = tgsi_dst(pc, c, &inst->FullDstRegisters[0]);
713f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		else
714f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			dst[c] = NULL;
715f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
716f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
717f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (i = 0; i < inst->Instruction.NumSrcRegs; i++) {
718f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (c = 0; c < 4; c++)
719f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			src[i][c] = tgsi_src(pc, c, &inst->FullSrcRegisters[i]);
720f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
721f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
722688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	if (sat) {
723688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs		for (c = 0; c < 4; c++) {
724688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			rdst[c] = dst[c];
725688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			dst[c] = temp_temp(pc);
726688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs		}
727688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	}
728688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs
729f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	switch (inst->Instruction.Opcode) {
73068091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs	case TGSI_OPCODE_ABS:
73168091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs		for (c = 0; c < 4; c++) {
73268091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs			unsigned inst[2] = { 0, 0 };
73368091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs
73468091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs			inst[0] = 0xa0000000; /* cvt */
735688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			set_long(pc, inst);
73668091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs			inst[1] |= (6 << 29); /* cvt */
73768091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs			inst[1] |= 0x04000000; /* 32 bit */
73868091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs			inst[1] |= (1 << 14); /* src .f32 */
73968091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs			inst[1] |= ((1 << 6) << 14); /* .abs */
74068091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs			set_dst(pc, dst[c], inst);
74168091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs			set_src_0(pc, src[0][c], inst);
74268091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs			emit(pc, inst);
74368091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs		}
74468091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs		break;
7452a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_ADD:
7467df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
7477df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
7487df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
7492a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_add(pc, dst[c], src[0][c], src[1][c]);
7507df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
7512a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
7522a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_COS:
7537df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
7547df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
7557df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
7562a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_flop(pc, 5, dst[c], src[0][c]);
7577df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
7582a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
7592a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_DP3:
7602a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		temp = alloc_temp(pc, NULL);
7612a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mul(pc, temp, src[0][0], src[1][0]);
7622a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][1], src[1][1], temp);
7632a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][2], src[1][2], temp);
7647df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
7657df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
7667df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
7672a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mov(pc, dst[c], temp);
7687df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
7692a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		free_temp(pc, temp);
7702a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
7712a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_DP4:
7722a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		temp = alloc_temp(pc, NULL);
7732a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mul(pc, temp, src[0][0], src[1][0]);
7742a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][1], src[1][1], temp);
7752a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][2], src[1][2], temp);
7762a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][3], src[1][3], temp);
7777df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
7787df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
7797df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
7802a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mov(pc, dst[c], temp);
7817df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
7822a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		free_temp(pc, temp);
7832a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
78421e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	case TGSI_OPCODE_DPH:
78521e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		temp = alloc_temp(pc, NULL);
78621e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mul(pc, temp, src[0][0], src[1][0]);
78721e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mad(pc, temp, src[0][1], src[1][1], temp);
78821e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mad(pc, temp, src[0][2], src[1][2], temp);
78921e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_add(pc, temp, src[1][3], temp);
79021e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		for (c = 0; c < 4; c++) {
79121e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs			if (!(mask & (1 << c)))
79221e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs				continue;
79321e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs			emit_mov(pc, dst[c], temp);
79421e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		}
79521e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		free_temp(pc, temp);
79621e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		break;
79733e4d30d50344be26398a51365bea1be37487403Ben Skeggs	case TGSI_OPCODE_DST:
79833e4d30d50344be26398a51365bea1be37487403Ben Skeggs	{
79933e4d30d50344be26398a51365bea1be37487403Ben Skeggs		struct nv50_reg *one = alloc_immd(pc, 1.0);
80033e4d30d50344be26398a51365bea1be37487403Ben Skeggs		emit_mov(pc, dst[0], one);
80133e4d30d50344be26398a51365bea1be37487403Ben Skeggs		emit_mul(pc, dst[1], src[0][1], src[1][1]);
80233e4d30d50344be26398a51365bea1be37487403Ben Skeggs		emit_mov(pc, dst[2], src[0][2]);
80333e4d30d50344be26398a51365bea1be37487403Ben Skeggs		emit_mov(pc, dst[3], src[1][3]);
80433e4d30d50344be26398a51365bea1be37487403Ben Skeggs		FREE(one);
80533e4d30d50344be26398a51365bea1be37487403Ben Skeggs	}
80633e4d30d50344be26398a51365bea1be37487403Ben Skeggs		break;
8072a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_EX2:
808fbf4027dd9b279ec159906dcad134f71e34aaec8Ben Skeggs		temp = alloc_temp(pc, NULL);
8097df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8107df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8117df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
812d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggs			emit_preex2(pc, temp, src[0][c]);
813fbf4027dd9b279ec159906dcad134f71e34aaec8Ben Skeggs			emit_flop(pc, 6, dst[c], temp);
8147df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
815fbf4027dd9b279ec159906dcad134f71e34aaec8Ben Skeggs		free_temp(pc, temp);
8162a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
817b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs	case TGSI_OPCODE_FLR:
818b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		for (c = 0; c < 4; c++) {
819b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			if (!(mask & (1 << c)))
820b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs				continue;
821b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			emit_flr(pc, dst[c], src[0][c]);
822b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		}
823b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		break;
824b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs	case TGSI_OPCODE_FRC:
825b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		temp = alloc_temp(pc, NULL);
826b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		for (c = 0; c < 4; c++) {
827b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			if (!(mask & (1 << c)))
828b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs				continue;
829b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			emit_flr(pc, temp, src[0][c]);
830b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			emit_sub(pc, dst[c], src[0][c], temp);
831b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		}
832b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		free_temp(pc, temp);
833b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		break;
8342a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_LG2:
8357df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8367df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8377df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
8382a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_flop(pc, 3, dst[c], src[0][c]);
8397df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
8402a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
8412a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_MAD:
8427df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8437df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8447df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
8452a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mad(pc, dst[c], src[0][c], src[1][c], src[2][c]);
8467df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
8472a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
84852a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	case TGSI_OPCODE_MAX:
8497df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8507df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8517df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
85252a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs			emit_minmax(pc, 4, dst[c], src[0][c], src[1][c]);
8537df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
85452a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs		break;
85552a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	case TGSI_OPCODE_MIN:
8567df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8577df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8587df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
85952a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs			emit_minmax(pc, 5, dst[c], src[0][c], src[1][c]);
8607df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
86152a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs		break;
862f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_OPCODE_MOV:
8637df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8647df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8657df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
86655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs			emit_mov(pc, dst[c], src[0][c]);
8677df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
86838ce697e5942550888c28bd4859ca2a92f247bf7Ben Skeggs		break;
8692a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_MUL:
8707df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8717df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8727df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
8732a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mul(pc, dst[c], src[0][c], src[1][c]);
8747df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
8752a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
876ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs	case TGSI_OPCODE_POW:
877ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		temp = alloc_temp(pc, NULL);
878ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		emit_flop(pc, 3, temp, src[0][0]);
879ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		emit_mul(pc, temp, temp, src[1][0]);
880ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		emit_preex2(pc, temp, temp);
881ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		emit_flop(pc, 6, temp, temp);
882ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		for (c = 0; c < 4; c++) {
883ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs			if (!(mask & (1 << c)))
884ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs				continue;
885ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs			emit_mov(pc, dst[c], temp);
886ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		}
887ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		free_temp(pc, temp);
888ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		break;
8892a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_RCP:
8907df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8917df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8927df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
8932a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_flop(pc, 0, dst[c], src[0][c]);
8947df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
8952a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
8962a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_RSQ:
8977df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
8987df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
8997df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
9002a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_flop(pc, 2, dst[c], src[0][c]);
9017df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
9022a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
903bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	case TGSI_OPCODE_SGE:
904bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		for (c = 0; c < 4; c++) {
905bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			if (!(mask & (1 << c)))
906bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs				continue;
907bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			emit_set(pc, 6, dst[c], src[0][c], src[1][c]);
908bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		}
909bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		break;
9102a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_SIN:
9117df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9127df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9137df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
9142a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_flop(pc, 4, dst[c], src[0][c]);
9157df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
9162a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
917bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	case TGSI_OPCODE_SLT:
918bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		for (c = 0; c < 4; c++) {
919bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			if (!(mask & (1 << c)))
920bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs				continue;
921bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			emit_set(pc, 1, dst[c], src[0][c], src[1][c]);
922bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		}
923bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		break;
9242a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_SUB:
9257df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9267df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9277df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
9282a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_sub(pc, dst[c], src[0][c], src[1][c]);
9297df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
9302a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
93121e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	case TGSI_OPCODE_XPD:
93221e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		temp = alloc_temp(pc, NULL);
93321e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mul(pc, temp, src[0][2], src[1][1]);
93421e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_msb(pc, dst[0], src[0][1], src[1][2], temp);
93521e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mul(pc, temp, src[0][0], src[1][2]);
93621e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_msb(pc, dst[1], src[0][2], src[1][0], temp);
93721e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mul(pc, temp, src[0][1], src[1][0]);
93821e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_msb(pc, dst[2], src[0][0], src[1][1], temp);
93921e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		free_temp(pc, temp);
94021e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		break;
941f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_OPCODE_END:
942f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		break;
943f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	default:
944f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		NOUVEAU_ERR("invalid opcode %d\n", inst->Instruction.Opcode);
945f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return FALSE;
946f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
947f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
948688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	if (sat) {
949688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs		for (c = 0; c < 4; c++) {
950688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			unsigned inst[2] = { 0, 0 };
951688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs
952688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			if (!(mask & (1 << c)))
953688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs				continue;
954688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs
955688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			inst[0] = 0xa0000000; /* cvt */
956688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			set_long(pc, inst);
957688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			inst[1] |= (6 << 29); /* cvt */
958688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			inst[1] |= 0x04000000; /* 32 bit */
959688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			inst[1] |= (1 << 14); /* src .f32 */
960688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			inst[1] |= ((1 << 5) << 14); /* .sat */
961688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			set_dst(pc, rdst[c], inst);
962688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			set_src_0(pc, dst[c], inst);
963688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			emit(pc, inst);
964688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs		}
965688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	}
966688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs
96752a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	kill_temp_temp(pc);
968f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return TRUE;
969f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
970f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
971f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic boolean
972f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_tx_prep(struct nv50_pc *pc)
973f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
974f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct tgsi_parse_context p;
975f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	boolean ret = FALSE;
976f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	unsigned i, c;
977f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
978f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_init(&p, pc->p->pipe.tokens);
979f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	while (!tgsi_parse_end_of_tokens(&p)) {
980f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		const union tgsi_full_token *tok = &p.FullToken;
981f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
982f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		tgsi_parse_token(&p);
983f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		switch (tok->Token.Type) {
984f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_IMMEDIATE:
985f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		{
986f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			const struct tgsi_full_immediate *imm =
987f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				&p.FullToken.FullImmediate;
988f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
98933e4d30d50344be26398a51365bea1be37487403Ben Skeggs			ctor_immd(pc, imm->u.ImmediateFloat32[0].Float,
99033e4d30d50344be26398a51365bea1be37487403Ben Skeggs				      imm->u.ImmediateFloat32[1].Float,
99133e4d30d50344be26398a51365bea1be37487403Ben Skeggs				      imm->u.ImmediateFloat32[2].Float,
99233e4d30d50344be26398a51365bea1be37487403Ben Skeggs				      imm->u.ImmediateFloat32[3].Float);
993f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
994f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
995f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_DECLARATION:
996f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		{
997f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			const struct tgsi_full_declaration *d;
998f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			unsigned last;
999f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1000f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			d = &p.FullToken.FullDeclaration;
1001f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			last = d->u.DeclarationRange.Last;
1002f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1003f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			switch (d->Declaration.File) {
1004f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_TEMPORARY:
1005f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->temp_nr < (last + 1))
1006f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->temp_nr = last + 1;
1007f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
1008f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_OUTPUT:
1009f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->result_nr < (last + 1))
1010f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->result_nr = last + 1;
1011f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
1012f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_INPUT:
1013f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->attr_nr < (last + 1))
1014f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->attr_nr = last + 1;
1015f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
1016f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_CONSTANT:
1017f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->param_nr < (last + 1))
1018f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->param_nr = last + 1;
1019f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
1020f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			default:
1021f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				NOUVEAU_ERR("bad decl file %d\n",
1022f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					    d->Declaration.File);
1023f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				goto out_err;
1024f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1025f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1026f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1027f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_INSTRUCTION:
1028f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1029f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		default:
1030f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1031f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1032f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1033f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1034f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	NOUVEAU_ERR("%d temps\n", pc->temp_nr);
1035f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->temp_nr) {
1036f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->temp = calloc(pc->temp_nr * 4, sizeof(struct nv50_reg));
1037f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->temp)
1038f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1039f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1040f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->temp_nr; i++) {
1041f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1042f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->temp[i*4+c].type = P_TEMP;
1043f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->temp[i*4+c].hw = -1;
1044f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->temp[i*4+c].index = i;
1045f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1046f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1047f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1048f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1049f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	NOUVEAU_ERR("%d attrib regs\n", pc->attr_nr);
1050f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->attr_nr) {
10518ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		struct nv50_reg *iv = NULL, *tmp = NULL;
1052f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		int aid = 0;
1053f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1054f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->attr = calloc(pc->attr_nr * 4, sizeof(struct nv50_reg));
1055f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->attr)
1056f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1057f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
10588ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		if (pc->p->type == NV50_PROG_FRAGMENT) {
10598ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			iv = alloc_temp(pc, NULL);
10608ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			aid++;
10618ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		}
10628ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
1063f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->attr_nr; i++) {
10648ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			struct nv50_reg *a = &pc->attr[i*4];
10658ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
1066f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
10678ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				if (pc->p->type == NV50_PROG_FRAGMENT) {
10688ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					struct nv50_reg *at =
10698ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs						alloc_temp(pc, NULL);
10708ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].type = at->type;
10718ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].hw = at->hw;
10728ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].index = at->index;
10738ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				} else {
10748ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->p->cfg.vp.attr[aid/32] |=
10758ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs						(1 << (aid % 32));
10768ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].type = P_ATTR;
10778ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].hw = aid++;
10788ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].index = i;
10798ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				}
1080f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
10818ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
10828ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			if (pc->p->type != NV50_PROG_FRAGMENT)
10838ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				continue;
10848ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
10858ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			emit_interp(pc, iv, iv, iv, FALSE);
10868ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			tmp = alloc_temp(pc, NULL);
10878ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			{
10888ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				unsigned inst[2] = { 0, 0 };
10898ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				inst[0]  = 0x90000000;
10908ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				inst[0] |= (tmp->hw << 2);
10918ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				emit(pc, inst);
10928ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			}
10938ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			emit_interp(pc, &a[0], &a[0], tmp, TRUE);
10948ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			emit_interp(pc, &a[1], &a[1], tmp, TRUE);
10958ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			emit_interp(pc, &a[2], &a[2], tmp, TRUE);
10968ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			emit_interp(pc, &a[3], &a[3], tmp, TRUE);
10978ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			free_temp(pc, tmp);
1098f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
10998ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
11008ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		if (iv)
11018ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			free_temp(pc, iv);
1102f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1103f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1104f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	NOUVEAU_ERR("%d result regs\n", pc->result_nr);
1105f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->result_nr) {
1106f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		int rid = 0;
1107f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1108f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->result = calloc(pc->result_nr * 4, sizeof(struct nv50_reg));
1109f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->result)
1110f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1111f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1112f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->result_nr; i++) {
1113f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
11148ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				if (pc->p->type == NV50_PROG_FRAGMENT)
11158ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->result[i*4+c].type = P_TEMP;
11168ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				else
11178ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->result[i*4+c].type = P_RESULT;
1118f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->result[i*4+c].hw = rid++;
1119f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->result[i*4+c].index = i;
1120f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1121f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1122f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1123f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1124f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	NOUVEAU_ERR("%d param regs\n", pc->param_nr);
1125f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->param_nr) {
1126f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		int rid = 0;
1127f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1128f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->param = calloc(pc->param_nr * 4, sizeof(struct nv50_reg));
1129f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->param)
1130f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1131f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1132f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->param_nr; i++) {
1133f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1134f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->param[i*4+c].type = P_CONST;
1135f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->param[i*4+c].hw = rid++;
1136f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->param[i*4+c].index = i;
1137f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1138f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1139f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1140f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1141f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->immd_nr) {
1142716c1cd2ecbc1e86c0fd747c9fa9e095ded5fd5dBen Skeggs		int rid = 0;
1143f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1144f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->immd = calloc(pc->immd_nr * 4, sizeof(struct nv50_reg));
1145f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->immd)
1146f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1147f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1148f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->immd_nr; i++) {
1149f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1150f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->immd[i*4+c].type = P_IMMD;
1151f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->immd[i*4+c].hw = rid++;
1152f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->immd[i*4+c].index = i;
1153f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1154f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1155f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1156f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1157f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	ret = TRUE;
1158f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsout_err:
1159f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_free(&p);
1160f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return ret;
1161f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1162f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1163f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic boolean
1164f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_tx(struct nv50_program *p)
1165f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1166f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct tgsi_parse_context parse;
1167f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_pc *pc;
1168f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	boolean ret;
1169f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1170f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	pc = CALLOC_STRUCT(nv50_pc);
1171f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (!pc)
1172f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return FALSE;
1173f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	pc->p = p;
11748ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	pc->p->cfg.high_temp = 4;
1175f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1176f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	ret = nv50_program_tx_prep(pc);
1177f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (ret == FALSE)
1178f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		goto out_cleanup;
1179f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1180f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_init(&parse, pc->p->pipe.tokens);
1181f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	while (!tgsi_parse_end_of_tokens(&parse)) {
1182f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		const union tgsi_full_token *tok = &parse.FullToken;
1183f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1184f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		tgsi_parse_token(&parse);
1185f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1186f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		switch (tok->Token.Type) {
1187f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_INSTRUCTION:
1188f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			ret = nv50_program_tx_insn(pc, tok);
1189f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			if (ret == FALSE)
1190f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				goto out_err;
1191f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1192f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		default:
1193f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1194f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1195f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1196f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1197f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->immd_nr = pc->immd_nr * 4;
1198f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->immd = pc->immd_buf;
1199f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1200f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsout_err:
1201f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_free(&parse);
1202f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1203f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsout_cleanup:
1204f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return ret;
1205f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1206f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1207f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic void
1208f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_validate(struct nv50_context *nv50, struct nv50_program *p)
1209f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1210e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	int i;
1211e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs
1212e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	if (nv50_program_tx(p) == FALSE)
1213e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs		assert(0);
1214e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	/* *not* sufficient, it's fine if last inst is long and
1215e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	 * NOT immd - otherwise it's fucked fucked fucked */
1216e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	p->insns[p->insns_nr - 1] |= 0x00000001;
1217f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
12182a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (p->type == NV50_PROG_VERTEX) {
12192a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	for (i = 0; i < p->insns_nr; i++)
12202a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		NOUVEAU_ERR("VP0x%08x\n", p->insns[i]);
12212a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else {
1222e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	for (i = 0; i < p->insns_nr; i++)
12232a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		NOUVEAU_ERR("FP0x%08x\n", p->insns[i]);
12242a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
1225f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1226f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->translated = TRUE;
1227f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1228f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
122922e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsstatic void
123022e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsnv50_program_validate_data(struct nv50_context *nv50, struct nv50_program *p)
123122e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs{
123222e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	int i;
123322e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
123422e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	for (i = 0; i < p->immd_nr; i++) {
123522e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs		BEGIN_RING(tesla, 0x0f00, 2);
123622e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs		OUT_RING  ((NV50_CB_PMISC << 16) | (i << 8));
123722e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs		OUT_RING  (fui(p->immd[i]));
123822e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	}
123922e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs}
124022e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
124122e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsstatic void
124222e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsnv50_program_validate_code(struct nv50_context *nv50, struct nv50_program *p)
124322e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs{
124422e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	struct pipe_winsys *ws = nv50->pipe.winsys;
124522e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	void *map;
124622e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
124722e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	if (!p->buffer)
124822e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs		p->buffer = ws->buffer_create(ws, 0x100, 0, p->insns_nr * 4);
124922e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	map = ws->buffer_map(ws, p->buffer, PIPE_BUFFER_USAGE_CPU_WRITE);
125022e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	memcpy(map, p->insns, p->insns_nr * 4);
125122e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	ws->buffer_unmap(ws, p->buffer);
125222e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs}
125322e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
1254f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsvoid
1255f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_vertprog_validate(struct nv50_context *nv50)
1256f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1257f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_grobj *tesla = nv50->screen->tesla;
1258f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_program *p = nv50->vertprog;
1259f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_stateobj *so;
1260f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1261f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (!p->translated) {
1262f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		nv50_program_validate(nv50, p);
1263f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!p->translated)
1264f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			assert(0);
1265f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1266f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
126722e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	nv50_program_validate_data(nv50, p);
126822e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	nv50_program_validate_code(nv50, p);
1269f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1270f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so = so_new(11, 2);
1271f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, NV50TCL_VP_ADDRESS_HIGH, 2);
1272f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1273f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_HIGH, 0, 0);
1274f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1275f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_LOW, 0, 0);
1276f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, 0x1650, 2);
1277f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, p->cfg.vp.attr[0]);
1278f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, p->cfg.vp.attr[1]);
1279f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, 0x16ac, 2);
1280f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, 8);
12818ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_data  (so, p->cfg.high_temp);
1282f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, 0x140c, 1);
1283f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, 0); /* program start offset */
1284f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_emit(nv50->screen->nvws, so);
1285f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_ref(NULL, &so);
1286f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1287f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1288f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsvoid
1289f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_fragprog_validate(struct nv50_context *nv50)
1290f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1291f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_grobj *tesla = nv50->screen->tesla;
1292f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_program *p = nv50->fragprog;
1293f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_stateobj *so;
1294f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1295f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (!p->translated) {
1296f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		nv50_program_validate(nv50, p);
1297f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!p->translated)
1298f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			assert(0);
1299f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1300f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
130155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	nv50_program_validate_data(nv50, p);
130255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	nv50_program_validate_code(nv50, p);
1303f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
13048ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so = so_new(7, 2);
1305f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, NV50TCL_FP_ADDRESS_HIGH, 2);
1306f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1307f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_HIGH, 0, 0);
1308f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1309f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_LOW, 0, 0);
13108ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_method(so, tesla, 0x198c, 1);
13118ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_data  (so, p->cfg.high_temp);
13128ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_method(so, tesla, 0x1414, 1);
13138ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_data  (so, 0); /* program start offset */
1314f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_emit(nv50->screen->nvws, so);
1315f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_ref(NULL, &so);
1316f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1317f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1318f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsvoid
1319f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_destroy(struct nv50_context *nv50, struct nv50_program *p)
1320f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1321f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct pipe_winsys *ws = nv50->pipe.winsys;
1322f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1323f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (p->insns_nr) {
1324f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (p->insns)
1325f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			FREE(p->insns);
1326f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		p->insns_nr = 0;
1327f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1328f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1329f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (p->buffer)
1330f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pipe_buffer_reference(ws, &p->buffer, NULL);
1331f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1332f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->translated = 0;
1333f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1334f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1335