nv50_program.c revision e002ad77398fbe14a0efbd91824c3325ca09b4c1
1f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_context.h"
2f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_defines.h"
3f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_state.h"
4f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_inlines.h"
5f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
6f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_shader_tokens.h"
7f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "tgsi/util/tgsi_parse.h"
8f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "tgsi/util/tgsi_util.h"
9f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
10f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "nv50_context.h"
11f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
12f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#define NV50_SU_MAX_TEMP 64
13aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs#define NV50_PROGRAM_DUMP
14f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
/* ARL - gallium fails on progs/vp/arl.txt
 *
 * MSB - Like MAD, but MUL+SUB
 * 	- Drop it as a separate op; instead introduce a way to negate args
 * 	  for ops that support it.
 *
 * Look into inlining IMMD for ops other than MOV (make it general?)
 * 	- Maybe even relax restrictions a bit, can't do P_RESULT + P_IMMD,
 * 	  but can emit to P_TEMP first - then MOV later. NVIDIA does this
 *
 * In ops such as ADD it's possible to construct a bad opcode in the !is_long()
 * case, if the emit_src() causes the inst to suddenly become long.
 *
 * Verify half-insns work where expected - and force disable them where they
 * don't work - MUL has it forcibly disabled atm as it fixes POW..
 *
 * WARNING: watch dst==src vectors, can overwrite components that are needed.
 * 	ie. SUB R0, R0.yzxw, R0
 *
 * Things to check with renouveau:
 * 	FP attr/result assignment - how?
 * 		attrib
 * 			- 0x16bc maps vp output onto fp hpos
 * 			- 0x16c0 maps vp output onto fp col0
 * 		result
 * 			- colr always 0-3
 * 			- depr always 4
 * 0x16bc->0x16e8 --> some binding between vp/fp regs
 * 0x16b8 --> VP output count
 *
 * 0x1298 --> "MOV rcol.x, fcol.y" "MOV depr, fcol.y" = 0x00000005
 * 	      "MOV rcol.x, fcol.y" = 0x00000004
 * 0x19a8 --> as above but 0x00000100 and 0x00000000
 * 	- 0x00100000 used when KIL used
 * 0x196c --> as above but 0x00000011 and 0x00000000
 *
 * 0x1988 --> 0xXXNNNNNN
 * 	- XX == FP high something
 */
/* One register operand as tracked by the code generator. */
struct nv50_reg {
	/* Register file the operand belongs to. */
	enum { P_TEMP, P_ATTR, P_RESULT, P_CONST, P_IMMD } type;

	/* Source-level index; the allocators in this file store -1 here for
	 * registers they create themselves (scratch temps, immediates). */
	int index;

	/* Hardware slot. For P_TEMP, -1 means "not assigned yet"; for P_IMMD
	 * it is an offset into the immediate buffer. */
	int hw;

	/* NOTE(review): presumably a "negate this operand" flag - it is not
	 * used in the part of the file visible here; confirm against users. */
	int neg;
};
67f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
68f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstruct nv50_pc {
69f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_program *p;
70f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
71f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	/* hw resources */
72f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *r_temp[NV50_SU_MAX_TEMP];
73f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
74f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	/* tgsi resources */
75f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *temp;
76f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int temp_nr;
77f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *attr;
78f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int attr_nr;
79f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *result;
80f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int result_nr;
81f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *param;
82f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int param_nr;
83f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *immd;
84f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	float *immd_buf;
85f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int immd_nr;
862a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
8721e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs	struct nv50_reg *temp_temp[16];
882a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	unsigned temp_temp_nr;
89f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs};
90f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
91f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic void
92f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsalloc_reg(struct nv50_pc *pc, struct nv50_reg *reg)
93f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
94f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int i;
95f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
96fea0b1651677444fc6c135e1a4b8ab6463a9fdf9Ben Skeggs	if (reg->type == P_RESULT) {
97fea0b1651677444fc6c135e1a4b8ab6463a9fdf9Ben Skeggs		if (pc->p->cfg.high_result < (reg->hw + 1))
98fea0b1651677444fc6c135e1a4b8ab6463a9fdf9Ben Skeggs			pc->p->cfg.high_result = reg->hw + 1;
99fea0b1651677444fc6c135e1a4b8ab6463a9fdf9Ben Skeggs	}
100fea0b1651677444fc6c135e1a4b8ab6463a9fdf9Ben Skeggs
1018ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	if (reg->type != P_TEMP)
102f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return;
103f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1048ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	if (reg->hw >= 0) {
1058ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		/*XXX: do this here too to catch FP temp-as-attr usage..
1068ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		 *     not clean, but works */
1078ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		if (pc->p->cfg.high_temp < (reg->hw + 1))
1088ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			pc->p->cfg.high_temp = reg->hw + 1;
1098ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		return;
1108ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	}
1118ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
112f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (i = 0; i < NV50_SU_MAX_TEMP; i++) {
113f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!(pc->r_temp[i])) {
114f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			pc->r_temp[i] = reg;
115f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			reg->hw = i;
1168ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			if (pc->p->cfg.high_temp < (i + 1))
1178ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				pc->p->cfg.high_temp = i + 1;
118f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			return;
119f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
120f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
121f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
122f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	assert(0);
123f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
124f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
125f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic struct nv50_reg *
126f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsalloc_temp(struct nv50_pc *pc, struct nv50_reg *dst)
127f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
128f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *r;
129f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int i;
130f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
131f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (dst && dst->type == P_TEMP && dst->hw == -1)
132f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return dst;
133f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
134f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (i = 0; i < NV50_SU_MAX_TEMP; i++) {
135f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->r_temp[i]) {
136f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r = CALLOC_STRUCT(nv50_reg);
137f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r->type = P_TEMP;
138f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r->index = -1;
139f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r->hw = i;
140f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			pc->r_temp[i] = r;
141f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			return r;
142f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
143f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
144f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
145f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	assert(0);
146f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return NULL;
147f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
148f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
149f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic void
150f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsfree_temp(struct nv50_pc *pc, struct nv50_reg *r)
151f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
152f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (r->index == -1) {
153619549a6377a58d54c9cf55f8863beed56b09566Ben Skeggs		unsigned hw = r->hw;
154619549a6377a58d54c9cf55f8863beed56b09566Ben Skeggs
155619549a6377a58d54c9cf55f8863beed56b09566Ben Skeggs		FREE(pc->r_temp[hw]);
156619549a6377a58d54c9cf55f8863beed56b09566Ben Skeggs		pc->r_temp[hw] = NULL;
157f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
158f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
159f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
160f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic struct nv50_reg *
1612a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggstemp_temp(struct nv50_pc *pc)
1622a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
16321e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs	if (pc->temp_temp_nr >= 16)
1642a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		assert(0);
1652a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
1662a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	pc->temp_temp[pc->temp_temp_nr] = alloc_temp(pc, NULL);
1672a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	return pc->temp_temp[pc->temp_temp_nr++];
1682a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
1692a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
1702a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
1712a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggskill_temp_temp(struct nv50_pc *pc)
1722a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
1732a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	int i;
1742a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
1752a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	for (i = 0; i < pc->temp_temp_nr; i++)
1762a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		free_temp(pc, pc->temp_temp[i]);
1772a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	pc->temp_temp_nr = 0;
1782a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
1792a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
18033e4d30d50344be26398a51365bea1be37487403Ben Skeggsstatic int
18133e4d30d50344be26398a51365bea1be37487403Ben Skeggsctor_immd(struct nv50_pc *pc, float x, float y, float z, float w)
18233e4d30d50344be26398a51365bea1be37487403Ben Skeggs{
18333e4d30d50344be26398a51365bea1be37487403Ben Skeggs	pc->immd_buf = realloc(pc->immd_buf, (pc->immd_nr + 1) * 4 *
18433e4d30d50344be26398a51365bea1be37487403Ben Skeggs					     sizeof(float));
18533e4d30d50344be26398a51365bea1be37487403Ben Skeggs	pc->immd_buf[(pc->immd_nr * 4) + 0] = x;
186686bc00c05094e8678747c111a6a70ad4b7063e3Ben Skeggs	pc->immd_buf[(pc->immd_nr * 4) + 1] = y;
187686bc00c05094e8678747c111a6a70ad4b7063e3Ben Skeggs	pc->immd_buf[(pc->immd_nr * 4) + 2] = z;
188686bc00c05094e8678747c111a6a70ad4b7063e3Ben Skeggs	pc->immd_buf[(pc->immd_nr * 4) + 3] = w;
18933e4d30d50344be26398a51365bea1be37487403Ben Skeggs
19033e4d30d50344be26398a51365bea1be37487403Ben Skeggs	return pc->immd_nr++;
19133e4d30d50344be26398a51365bea1be37487403Ben Skeggs}
19233e4d30d50344be26398a51365bea1be37487403Ben Skeggs
19333e4d30d50344be26398a51365bea1be37487403Ben Skeggsstatic struct nv50_reg *
19433e4d30d50344be26398a51365bea1be37487403Ben Skeggsalloc_immd(struct nv50_pc *pc, float f)
19533e4d30d50344be26398a51365bea1be37487403Ben Skeggs{
19633e4d30d50344be26398a51365bea1be37487403Ben Skeggs	struct nv50_reg *r = CALLOC_STRUCT(nv50_reg);
19733e4d30d50344be26398a51365bea1be37487403Ben Skeggs	unsigned hw;
19833e4d30d50344be26398a51365bea1be37487403Ben Skeggs
19901e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	hw = ctor_immd(pc, f, 0, 0, 0) * 4;
20033e4d30d50344be26398a51365bea1be37487403Ben Skeggs	r->type = P_IMMD;
20133e4d30d50344be26398a51365bea1be37487403Ben Skeggs	r->hw = hw;
20233e4d30d50344be26398a51365bea1be37487403Ben Skeggs	r->index = -1;
20333e4d30d50344be26398a51365bea1be37487403Ben Skeggs	return r;
20433e4d30d50344be26398a51365bea1be37487403Ben Skeggs}
20533e4d30d50344be26398a51365bea1be37487403Ben Skeggs
20640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsstatic struct nv50_program_exec *
20740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsexec(struct nv50_pc *pc)
20840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs{
20940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = CALLOC_STRUCT(nv50_program_exec);
21040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs
2111c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs	e->param.index = -1;
21240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	return e;
21340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs}
21440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs
21555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic void
21640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsemit(struct nv50_pc *pc, struct nv50_program_exec *e)
21755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
21855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	struct nv50_program *p = pc->p;
21955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
22040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	if (p->exec_tail)
22140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		p->exec_tail->next = e;
22240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	if (!p->exec_head)
22340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		p->exec_head = e;
22440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	p->exec_tail = e;
22540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	p->exec_size += (e->inst[0] & 1) ? 2 : 1;
22655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
22755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
22840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsstatic INLINE void set_long(struct nv50_pc *, struct nv50_program_exec *);
22955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
23055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic boolean
23140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsis_long(struct nv50_program_exec *e)
23255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
23340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	if (e->inst[0] & 1)
23455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		return TRUE;
23555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	return FALSE;
23655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
23755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
23855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic boolean
23940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsis_immd(struct nv50_program_exec *e)
24055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
24140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	if (is_long(e) && (e->inst[1] & 3) == 3)
24255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		return TRUE;
24355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	return FALSE;
24455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
24555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
24655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
24740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsset_pred(struct nv50_pc *pc, unsigned pred, unsigned idx,
24840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	 struct nv50_program_exec *e)
24955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
25040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
25140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] &= ~((0x1f << 7) | (0x3 << 12));
25240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (pred << 7) | (idx << 12);
25355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
25455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
25555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
25640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsset_pred_wr(struct nv50_pc *pc, unsigned on, unsigned idx,
25740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	    struct nv50_program_exec *e)
25855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
25940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
26040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] &= ~((0x3 << 4) | (1 << 6));
26140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (idx << 4) | (on << 6);
26255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
26355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
26455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
26540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsset_long(struct nv50_pc *pc, struct nv50_program_exec *e)
26655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
26740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	if (is_long(e))
26855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		return;
26955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
27040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 1;
27140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_pred(pc, 0xf, 0, e);
27240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_pred_wr(pc, 0, 0, e);
27355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
27455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
27555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
27640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsset_dst(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_program_exec *e)
27755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
27855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (dst->type == P_RESULT) {
27940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		set_long(pc, e);
28040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[1] |= 0x00000008;
28155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	}
28255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
28355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	alloc_reg(pc, dst);
28440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= (dst->hw << 2);
28555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
28655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
28755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
28840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsset_immd(struct nv50_pc *pc, struct nv50_reg *imm, struct nv50_program_exec *e)
28955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
29055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	unsigned val = fui(pc->immd_buf[imm->hw]); /* XXX */
29155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
29240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
29355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	/*XXX: can't be predicated - bits overlap.. catch cases where both
29455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	 *     are required and avoid them. */
29540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_pred(pc, 0, 0, e);
29640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_pred_wr(pc, 0, 0, e);
29755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
29840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= 0x00000002 | 0x00000001;
29940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= (val & 0x3f) << 16;
30040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (val >> 6) << 2;
30155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
30255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
30355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic void
3048ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggsemit_interp(struct nv50_pc *pc, struct nv50_reg *dst,
3055a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs	    struct nv50_reg *src, struct nv50_reg *iv)
3068ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs{
30740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
3088ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
30940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0x80000000;
31040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
3118ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	alloc_reg(pc, src);
31240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= (src->hw << 16);
3135a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs	if (iv) {
31440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[0] |= (1 << 25);
3155a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs		alloc_reg(pc, iv);
3165a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs		e->inst[0] |= (iv->hw << 9);
3175a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs	}
3188ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
31940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
3208ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs}
3218ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
3228ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggsstatic void
3231c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggsset_data(struct nv50_pc *pc, struct nv50_reg *src, unsigned m, unsigned s,
3241c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs	 struct nv50_program_exec *e)
3252a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
32640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
327aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs#if 1
328aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	e->inst[1] |= (1 << 22);
329aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs#else
3302a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_IMMD) {
33140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[1] |= (NV50_CB_PMISC << 22);
3322a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else {
333b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs		if (pc->p->type == PIPE_SHADER_VERTEX)
33440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e->inst[1] |= (NV50_CB_PVP << 22);
3352a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		else
33640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e->inst[1] |= (NV50_CB_PFP << 22);
3372a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
338aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs#endif
3391c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs
3401c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs	e->param.index = src->hw;
3411c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs	e->param.shift = s;
3421c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs	e->param.mask = m << (s % 32);
3432a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
3442a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3452a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
34655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsemit_mov(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
34755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
34840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
34955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
35040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0x10000000;
35155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
35240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
35355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
354da66b8a2f4c3c052ad71b2b6d5a845c2fd267c6eBen Skeggs	if (0 && dst->type != P_RESULT && src->type == P_IMMD) {
35540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		set_immd(pc, src, e);
35655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		/*XXX: 32-bit, but steals part of "half" reg space - need to
35755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		 *     catch and handle this case if/when we do half-regs
35855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		 */
35940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[0] |= 0x00008000;
36055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	} else
36155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (src->type == P_IMMD || src->type == P_CONST) {
36240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		set_long(pc, e);
3631c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs		set_data(pc, src, 0x7f, 9, e);
36440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[1] |= 0x20000000; /* src0 const? */
36555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	} else {
36655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		if (src->type == P_ATTR) {
36740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			set_long(pc, e);
36840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e->inst[1] |= 0x00200000;
36955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		}
37055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
37155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		alloc_reg(pc, src);
37240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[0] |= (src->hw << 9);
37355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	}
37455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
37555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	/* We really should support "half" instructions here at some point,
37655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	 * but I don't feel confident enough about them yet.
37755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	 */
37840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
37940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	if (is_long(e) && !is_immd(e)) {
38040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[1] |= 0x04000000; /* 32-bit */
38140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[1] |= 0x0003c000; /* "subsubop" 0xf == mov */
38255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	}
38355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
38440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
38555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
38655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
387f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic boolean
3882a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggscheck_swap_src_0_1(struct nv50_pc *pc,
3892a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		   struct nv50_reg **s0, struct nv50_reg **s1)
3902a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
3912a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	struct nv50_reg *src0 = *s0, *src1 = *s1;
3922a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3932a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src0->type == P_CONST) {
3942a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		if (src1->type != P_CONST) {
3952a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s0 = src1;
3962a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s1 = src0;
3972a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			return TRUE;
3982a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		}
3992a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
4002a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src1->type == P_ATTR) {
4012a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		if (src0->type != P_ATTR) {
4022a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s0 = src1;
4032a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s1 = src0;
4042a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			return TRUE;
4052a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		}
4062a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
4072a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4082a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	return FALSE;
4092a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
4102a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4112a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
41240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsset_src_0(struct nv50_pc *pc, struct nv50_reg *src, struct nv50_program_exec *e)
4132a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
4142a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_ATTR) {
41540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		set_long(pc, e);
41640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[1] |= 0x00200000;
4172a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
4182a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_CONST || src->type == P_IMMD) {
4192a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		struct nv50_reg *temp = temp_temp(pc);
4202a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4212a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mov(pc, temp, src);
4222a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		src = temp;
4232a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
4242a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4252a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	alloc_reg(pc, src);
42640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= (src->hw << 9);
4272a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
4282a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4292a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
43040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsset_src_1(struct nv50_pc *pc, struct nv50_reg *src, struct nv50_program_exec *e)
4312a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
4322a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_ATTR) {
4332a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		struct nv50_reg *temp = temp_temp(pc);
4342a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4352a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mov(pc, temp, src);
4362a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		src = temp;
4372a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
4382a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_CONST || src->type == P_IMMD) {
43940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		assert(!(e->inst[0] & 0x00800000));
44040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		if (e->inst[0] & 0x01000000) {
44134a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			struct nv50_reg *temp = temp_temp(pc);
44234a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs
44334a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			emit_mov(pc, temp, src);
44434a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			src = temp;
44534a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs		} else {
4461c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs			set_data(pc, src, 0x7f, 16, e);
44740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e->inst[0] |= 0x00800000;
44834a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs		}
4492a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
4502a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4512a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	alloc_reg(pc, src);
45240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= (src->hw << 16);
4532a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
4542a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4552a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
45640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsset_src_2(struct nv50_pc *pc, struct nv50_reg *src, struct nv50_program_exec *e)
4572a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
45840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
4592a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4602a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_ATTR) {
4612a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		struct nv50_reg *temp = temp_temp(pc);
4622a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4632a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mov(pc, temp, src);
4642a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		src = temp;
4652a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
4662a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_CONST || src->type == P_IMMD) {
46740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		assert(!(e->inst[0] & 0x01000000));
46840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		if (e->inst[0] & 0x00800000) {
46934a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			struct nv50_reg *temp = temp_temp(pc);
47034a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs
47134a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			emit_mov(pc, temp, src);
47234a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			src = temp;
47334a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs		} else {
4741c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs			set_data(pc, src, 0x7f, 32+14, e);
47540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e->inst[0] |= 0x01000000;
47634a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs		}
4772a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
4782a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4792a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	alloc_reg(pc, src);
48040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (src->hw << 14);
4812a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
4822a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4832a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
4842a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsemit_mul(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
4852a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	 struct nv50_reg *src1)
4862a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
48740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
4882a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
48940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0xc0000000;
49040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
4912a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4922a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	check_swap_src_0_1(pc, &src0, &src1);
49340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
49440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src0, e);
49540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_1(pc, src1, e);
4962a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
49740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
4982a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
4992a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
5002a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
50152a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggsemit_add(struct nv50_pc *pc, struct nv50_reg *dst,
50252a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	 struct nv50_reg *src0, struct nv50_reg *src1)
5032a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
50440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
5052a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
50640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0xb0000000;
5072a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
5082a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	check_swap_src_0_1(pc, &src0, &src1);
50940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
51040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src0, e);
51140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	if (is_long(e))
51240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		set_src_2(pc, src1, e);
51352a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	else
51440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		set_src_1(pc, src1, e);
51552a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs
51640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
51752a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs}
51852a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs
51952a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggsstatic void
52052a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggsemit_minmax(struct nv50_pc *pc, unsigned sub, struct nv50_reg *dst,
52152a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	    struct nv50_reg *src0, struct nv50_reg *src1)
52252a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs{
52340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
52452a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs
52540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
52640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0xb0000000;
52740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (sub << 29);
52852a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs
52952a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	check_swap_src_0_1(pc, &src0, &src1);
53040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
53140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src0, e);
53240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_1(pc, src1, e);
5332a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
53440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
5352a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
5362a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
5372a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
5382a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsemit_sub(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
5392a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	 struct nv50_reg *src1)
5402a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
54140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
5422a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
54340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0xb0000000;
5442a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
54540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
5462a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (check_swap_src_0_1(pc, &src0, &src1))
54740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[1] |= 0x04000000;
5482a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	else
54940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[1] |= 0x08000000;
5502a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
55140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
55240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src0, e);
55340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_2(pc, src1, e);
5542a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
55540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
5562a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
5572a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
5582a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
5592a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsemit_mad(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
5602a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	 struct nv50_reg *src1, struct nv50_reg *src2)
5612a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
56240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
5632a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
56440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0xe0000000;
5652a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
5662a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	check_swap_src_0_1(pc, &src0, &src1);
56740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
56840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src0, e);
56940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_1(pc, src1, e);
57040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_2(pc, src2, e);
5712a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
57240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
5732a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
5742a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
5752a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
57621e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggsemit_msb(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
57721e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	 struct nv50_reg *src1, struct nv50_reg *src2)
57821e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs{
57940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
58021e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs
58140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0xe0000000;
58240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
58340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= 0x08000000; /* src0 * src1 - src2 */
58421e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs
58521e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	check_swap_src_0_1(pc, &src0, &src1);
58640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
58740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src0, e);
58840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_1(pc, src1, e);
58940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_2(pc, src2, e);
59021e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs
59140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
59221e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs}
59321e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs
59421e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggsstatic void
5952a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsemit_flop(struct nv50_pc *pc, unsigned sub,
5962a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	  struct nv50_reg *dst, struct nv50_reg *src)
5972a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
59840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
5992a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
60040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0x90000000;
60152a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	if (sub) {
60240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		set_long(pc, e);
60340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[1] |= (sub << 29);
60452a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	}
6052a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
60640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
60740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src, e);
6082a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
60940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
6102a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
6112a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
612d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggsstatic void
613d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggsemit_preex2(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
614d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggs{
61540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
616d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggs
61740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0xb0000000;
618d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggs
61940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
62040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src, e);
62140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
62240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (6 << 29) | 0x00004000;
623d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggs
62440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
625d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggs}
626faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs
627bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggsstatic void
6287b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggsemit_precossin(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
6297b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs{
63040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
6317b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs
63240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0xb0000000;
6337b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs
63440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
63540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src, e);
63640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
63740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (6 << 29);
6387b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs
63940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
6407b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs}
6417b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs
6427b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggsstatic void
643bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggsemit_set(struct nv50_pc *pc, unsigned c_op, struct nv50_reg *dst,
644bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 struct nv50_reg *src0, struct nv50_reg *src1)
645bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs{
64640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
64751ea3aae03154046316b814053f7493bdb10c853Ben Skeggs	unsigned inv_cop[8] = { 0, 4, 2, 6, 1, 5, 3, 7 };
648bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	struct nv50_reg *rdst;
649bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
650bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	assert(c_op <= 7);
651bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (check_swap_src_0_1(pc, &src0, &src1))
652bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		c_op = inv_cop[c_op];
653bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
654bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	rdst = dst;
655bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (dst->type != P_TEMP)
656bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		dst = alloc_temp(pc, NULL);
657bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
658bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	/* set.u32 */
65940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
66040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0xb0000000;
66140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (3 << 29);
66240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (c_op << 14);
663bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	/*XXX: breaks things, .u32 by default?
664bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 *     decuda will disasm as .u16 and use .lo/.hi regs, but this
665bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 *     doesn't seem to match what the hw actually does.
666bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[1] |= 0x04000000; << breaks things.. .u32 by default?
667bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 */
66840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
66940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src0, e);
67040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_1(pc, src1, e);
67140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
672bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
673bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	/* cvt.f32.u32 */
67440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e = exec(pc);
67540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] = 0xa0000001;
67640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] = 0x64014780;
67740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, rdst, e);
67840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, dst, e);
67940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
680bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
681bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (dst != rdst)
682bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		free_temp(pc, dst);
683bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs}
684d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggs
685b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggsstatic void
686b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggsemit_flr(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
687b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs{
68840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
68940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs
69040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] = 0xa0000000; /* cvt */
69140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
69240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (6 << 29); /* cvt */
69340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= 0x08000000; /* integer mode */
69440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= 0x04000000; /* 32 bit */
69540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= ((0x1 << 3)) << 14; /* .rn */
69640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (1 << 14); /* src .f32 */
69740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
69840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src, e);
69940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs
70040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
701b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs}
702b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs
703faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggsstatic void
704faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggsemit_pow(struct nv50_pc *pc, struct nv50_reg *dst,
705faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	 struct nv50_reg *v, struct nv50_reg *e)
706faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs{
707faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	struct nv50_reg *temp = alloc_temp(pc, NULL);
708faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs
709faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	emit_flop(pc, 3, temp, v);
710faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	emit_mul(pc, temp, temp, e);
711faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	emit_preex2(pc, temp, temp);
712faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	emit_flop(pc, 6, dst, temp);
713faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs
714faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	free_temp(pc, temp);
715faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs}
716faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs
717fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggsstatic void
718fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggsemit_abs(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
719fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs{
72040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
72140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs
72240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] = 0xa0000000; /* cvt */
72340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
72440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (6 << 29); /* cvt */
72540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= 0x04000000; /* 32 bit */
72640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (1 << 14); /* src .f32 */
72740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= ((1 << 6) << 14); /* .abs */
72840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
72940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src, e);
73040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs
73140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
732fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs}
733fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
73401e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggsstatic void
7357b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggsemit_lit(struct nv50_pc *pc, struct nv50_reg **dst, unsigned mask,
7367b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs	 struct nv50_reg **src)
73701e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs{
73801e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	struct nv50_reg *one = alloc_immd(pc, 1.0);
73901e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	struct nv50_reg *zero = alloc_immd(pc, 0.0);
74001e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	struct nv50_reg *neg128 = alloc_immd(pc, -127.999999);
74101e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	struct nv50_reg *pos128 = alloc_immd(pc,  127.999999);
74201e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	struct nv50_reg *tmp[4];
74301e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
7447b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs	if (mask & (1 << 0))
7457b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_mov(pc, dst[0], one);
7467b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs
7477b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs	if (mask & (1 << 3))
7487b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_mov(pc, dst[3], one);
7497b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs
7507b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs	if (mask & (3 << 1)) {
7517b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		if (mask & (1 << 1))
7527b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs			tmp[0] = dst[1];
7537b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		else
7547b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs			tmp[0] = temp_temp(pc);
7557b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_minmax(pc, 4, tmp[0], src[0], zero);
7567b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs	}
75701e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
7587b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs	if (mask & (1 << 2)) {
75940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		set_pred_wr(pc, 1, 0, pc->p->exec_tail);
76001e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
7617b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		tmp[1] = temp_temp(pc);
7627b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_minmax(pc, 4, tmp[1], src[1], zero);
76301e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
7647b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		tmp[3] = temp_temp(pc);
7657b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_minmax(pc, 4, tmp[3], src[3], neg128);
7667b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_minmax(pc, 5, tmp[3], tmp[3], pos128);
76701e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
7687b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_pow(pc, dst[2], tmp[1], tmp[3]);
7697b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_mov(pc, dst[2], zero);
77040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		set_pred(pc, 3, 0, pc->p->exec_tail);
7717b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs	}
77201e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs}
77301e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
77431f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggsstatic void
77531f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggsemit_neg(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
77631f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs{
77740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
77831f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs
77940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
78040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0xa0000000; /* delta */
78140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (7 << 29); /* delta */
78240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= 0x04000000; /* negate arg0? probably not */
78340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (1 << 14); /* src .f32 */
78440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
78540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src, e);
78631f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs
78740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
78831f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs}
78931f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs
790fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggsstatic struct nv50_reg *
791fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggstgsi_dst(struct nv50_pc *pc, int c, const struct tgsi_full_dst_register *dst)
792fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs{
793fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	switch (dst->DstRegister.File) {
794fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_FILE_TEMPORARY:
795fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		return &pc->temp[dst->DstRegister.Index * 4 + c];
796fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_FILE_OUTPUT:
797fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		return &pc->result[dst->DstRegister.Index * 4 + c];
798fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_FILE_NULL:
799fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		return NULL;
800fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	default:
801fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
802fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	}
803fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
804fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	return NULL;
805fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs}
806fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
807fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggsstatic struct nv50_reg *
808fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggstgsi_src(struct nv50_pc *pc, int chan, const struct tgsi_full_src_register *src)
809fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs{
810fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	struct nv50_reg *r = NULL;
811fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	struct nv50_reg *temp;
812fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	unsigned c;
813fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
814fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	c = tgsi_util_get_full_src_register_extswizzle(src, chan);
815fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	switch (c) {
816fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_X:
817fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_Y:
818fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_Z:
819fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_W:
820fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		switch (src->SrcRegister.File) {
821fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		case TGSI_FILE_INPUT:
822fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			r = &pc->attr[src->SrcRegister.Index * 4 + c];
823fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			break;
824fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		case TGSI_FILE_TEMPORARY:
825fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			r = &pc->temp[src->SrcRegister.Index * 4 + c];
826fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			break;
827fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		case TGSI_FILE_CONSTANT:
828fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			r = &pc->param[src->SrcRegister.Index * 4 + c];
829fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			break;
830fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		case TGSI_FILE_IMMEDIATE:
831fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			r = &pc->immd[src->SrcRegister.Index * 4 + c];
832fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			break;
833c0ed6a871cd3513e17a1fab960f5626485ffed13Ben Skeggs		case TGSI_FILE_SAMPLER:
834c0ed6a871cd3513e17a1fab960f5626485ffed13Ben Skeggs			break;
835fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		default:
836fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			assert(0);
837fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			break;
838fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		}
839fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
840fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_ZERO:
841fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		r = alloc_immd(pc, 0.0);
842fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
843fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_ONE:
844fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		r = alloc_immd(pc, 1.0);
845fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
846fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	default:
847fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		assert(0);
848fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
849fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	}
850fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
851fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	switch (tgsi_util_get_full_src_register_sign_mode(src, chan)) {
852fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_UTIL_SIGN_KEEP:
853fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
854fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_UTIL_SIGN_CLEAR:
855fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		temp = temp_temp(pc);
856fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		emit_abs(pc, temp, r);
857fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		r = temp;
858fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
85931f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs	case TGSI_UTIL_SIGN_TOGGLE:
86031f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs		temp = temp_temp(pc);
86131f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs		emit_neg(pc, temp, r);
86231f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs		r = temp;
86331f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs		break;
86431f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs	case TGSI_UTIL_SIGN_SET:
86531f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs		temp = temp_temp(pc);
86631f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs		emit_abs(pc, temp, r);
86731f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs		emit_neg(pc, temp, r);
86831f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs		r = temp;
86931f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs		break;
870fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	default:
871fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		assert(0);
872fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
873fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	}
874fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
875fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	return r;
876fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs}
877fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
8782a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic boolean
879f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_tx_insn(struct nv50_pc *pc, const union tgsi_full_token *tok)
880f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
881f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	const struct tgsi_full_instruction *inst = &tok->FullInstruction;
882688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	struct nv50_reg *rdst[4], *dst[4], *src[3][4], *temp;
883688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	unsigned mask, sat;
884f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int i, c;
885f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
886f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	mask = inst->FullDstRegisters[0].DstRegister.WriteMask;
887688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	sat = inst->Instruction.Saturate == TGSI_SAT_ZERO_ONE;
888f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
889f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (c = 0; c < 4; c++) {
890f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (mask & (1 << c))
891f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			dst[c] = tgsi_dst(pc, c, &inst->FullDstRegisters[0]);
892f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		else
893f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			dst[c] = NULL;
894f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
895f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
896f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (i = 0; i < inst->Instruction.NumSrcRegs; i++) {
897f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (c = 0; c < 4; c++)
898f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			src[i][c] = tgsi_src(pc, c, &inst->FullSrcRegisters[i]);
899f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
900f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
901688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	if (sat) {
902688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs		for (c = 0; c < 4; c++) {
903688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			rdst[c] = dst[c];
904688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			dst[c] = temp_temp(pc);
905688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs		}
906688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	}
907688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs
908f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	switch (inst->Instruction.Opcode) {
90968091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs	case TGSI_OPCODE_ABS:
91068091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs		for (c = 0; c < 4; c++) {
911fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			if (!(mask & (1 << c)))
912fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs				continue;
913fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			emit_abs(pc, dst[c], src[0][c]);
91468091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs		}
91568091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs		break;
9162a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_ADD:
9177df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9187df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9197df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
9202a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_add(pc, dst[c], src[0][c], src[1][c]);
9217df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
9222a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
9232a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_COS:
9247b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		temp = alloc_temp(pc, NULL);
9257b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_precossin(pc, temp, src[0][0]);
9267b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_flop(pc, 5, temp, temp);
9277df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9287df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9297df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
9307b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs			emit_mov(pc, dst[c], temp);
9317df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
9322a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
9332a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_DP3:
9342a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		temp = alloc_temp(pc, NULL);
9352a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mul(pc, temp, src[0][0], src[1][0]);
9362a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][1], src[1][1], temp);
9372a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][2], src[1][2], temp);
9387df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9397df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9407df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
9412a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mov(pc, dst[c], temp);
9427df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
9432a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		free_temp(pc, temp);
9442a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
9452a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_DP4:
9462a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		temp = alloc_temp(pc, NULL);
9472a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mul(pc, temp, src[0][0], src[1][0]);
9482a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][1], src[1][1], temp);
9492a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][2], src[1][2], temp);
9502a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][3], src[1][3], temp);
9517df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9527df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9537df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
9542a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mov(pc, dst[c], temp);
9557df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
9562a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		free_temp(pc, temp);
9572a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
95821e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	case TGSI_OPCODE_DPH:
95921e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		temp = alloc_temp(pc, NULL);
96021e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mul(pc, temp, src[0][0], src[1][0]);
96121e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mad(pc, temp, src[0][1], src[1][1], temp);
96221e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mad(pc, temp, src[0][2], src[1][2], temp);
96321e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_add(pc, temp, src[1][3], temp);
96421e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		for (c = 0; c < 4; c++) {
96521e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs			if (!(mask & (1 << c)))
96621e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs				continue;
96721e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs			emit_mov(pc, dst[c], temp);
96821e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		}
96921e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		free_temp(pc, temp);
97021e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		break;
97133e4d30d50344be26398a51365bea1be37487403Ben Skeggs	case TGSI_OPCODE_DST:
97233e4d30d50344be26398a51365bea1be37487403Ben Skeggs	{
97333e4d30d50344be26398a51365bea1be37487403Ben Skeggs		struct nv50_reg *one = alloc_immd(pc, 1.0);
9749a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 0))
9759a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mov(pc, dst[0], one);
9769a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 1))
9779a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mul(pc, dst[1], src[0][1], src[1][1]);
9789a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 2))
9799a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mov(pc, dst[2], src[0][2]);
9809a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 3))
9819a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mov(pc, dst[3], src[1][3]);
98233e4d30d50344be26398a51365bea1be37487403Ben Skeggs		FREE(one);
98333e4d30d50344be26398a51365bea1be37487403Ben Skeggs	}
98433e4d30d50344be26398a51365bea1be37487403Ben Skeggs		break;
9852a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_EX2:
986fbf4027dd9b279ec159906dcad134f71e34aaec8Ben Skeggs		temp = alloc_temp(pc, NULL);
9877b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_preex2(pc, temp, src[0][0]);
9887b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_flop(pc, 6, temp, temp);
9897df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
9907df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
9917df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
9927b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs			emit_mov(pc, dst[c], temp);
9937df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
994fbf4027dd9b279ec159906dcad134f71e34aaec8Ben Skeggs		free_temp(pc, temp);
9952a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
996b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs	case TGSI_OPCODE_FLR:
997b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		for (c = 0; c < 4; c++) {
998b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			if (!(mask & (1 << c)))
999b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs				continue;
1000b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			emit_flr(pc, dst[c], src[0][c]);
1001b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		}
1002b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		break;
1003b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs	case TGSI_OPCODE_FRC:
1004b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		temp = alloc_temp(pc, NULL);
1005b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		for (c = 0; c < 4; c++) {
1006b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			if (!(mask & (1 << c)))
1007b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs				continue;
1008b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			emit_flr(pc, temp, src[0][c]);
1009b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			emit_sub(pc, dst[c], src[0][c], temp);
1010b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		}
1011b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		free_temp(pc, temp);
1012b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		break;
101301e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	case TGSI_OPCODE_LIT:
10147b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_lit(pc, &dst[0], mask, &src[0][0]);
101501e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs		break;
10162a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_LG2:
10177b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		temp = alloc_temp(pc, NULL);
10187b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_flop(pc, 3, temp, src[0][0]);
10197df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
10207df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
10217df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
10227b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs			emit_mov(pc, dst[c], temp);
10237df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
10242a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
102521e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs	case TGSI_OPCODE_LRP:
102621e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs		for (c = 0; c < 4; c++) {
102721e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs			if (!(mask & (1 << c)))
102821e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs				continue;
102921e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs			/*XXX: we can do better than this */
103021e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs			temp = alloc_temp(pc, NULL);
103121e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs			emit_neg(pc, temp, src[0][c]);
103221e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs			emit_mad(pc, temp, temp, src[2][c], src[2][c]);
103321e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs			emit_mad(pc, dst[c], src[0][c], src[1][c], temp);
103421e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs			free_temp(pc, temp);
103521e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs		}
103621e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs		break;
10372a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_MAD:
10387df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
10397df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
10407df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
10412a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mad(pc, dst[c], src[0][c], src[1][c], src[2][c]);
10427df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
10432a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
104452a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	case TGSI_OPCODE_MAX:
10457df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
10467df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
10477df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
104852a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs			emit_minmax(pc, 4, dst[c], src[0][c], src[1][c]);
10497df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
105052a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs		break;
105152a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	case TGSI_OPCODE_MIN:
10527df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
10537df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
10547df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
105552a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs			emit_minmax(pc, 5, dst[c], src[0][c], src[1][c]);
10567df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
105752a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs		break;
1058f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_OPCODE_MOV:
10597df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
10607df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
10617df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
106255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs			emit_mov(pc, dst[c], src[0][c]);
10637df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
106438ce697e5942550888c28bd4859ca2a92f247bf7Ben Skeggs		break;
10652a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_MUL:
10667df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
10677df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
10687df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
10692a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mul(pc, dst[c], src[0][c], src[1][c]);
10707df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
10712a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
1072ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs	case TGSI_OPCODE_POW:
1073ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		temp = alloc_temp(pc, NULL);
1074faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs		emit_pow(pc, temp, src[0][0], src[1][0]);
1075ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		for (c = 0; c < 4; c++) {
1076ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs			if (!(mask & (1 << c)))
1077ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs				continue;
1078ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs			emit_mov(pc, dst[c], temp);
1079ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		}
1080ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		free_temp(pc, temp);
1081ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		break;
10822a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_RCP:
10837df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
10847df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
10857df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
10867b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs			emit_flop(pc, 0, dst[c], src[0][0]);
10877df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
10882a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
10892a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_RSQ:
10907df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
10917df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
10927df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
10937b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs			emit_flop(pc, 2, dst[c], src[0][0]);
10947df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
10952a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
10967b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs	case TGSI_OPCODE_SCS:
10977b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		temp = alloc_temp(pc, NULL);
10987b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_precossin(pc, temp, src[0][0]);
10997b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		if (mask & (1 << 0))
11007b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs			emit_flop(pc, 5, dst[0], temp);
11017b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		if (mask & (1 << 1))
11027b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs			emit_flop(pc, 4, dst[1], temp);
11037b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		break;
1104bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	case TGSI_OPCODE_SGE:
1105bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		for (c = 0; c < 4; c++) {
1106bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			if (!(mask & (1 << c)))
1107bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs				continue;
1108bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			emit_set(pc, 6, dst[c], src[0][c], src[1][c]);
1109bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		}
1110bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		break;
11112a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_SIN:
11127b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		temp = alloc_temp(pc, NULL);
11137b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_precossin(pc, temp, src[0][0]);
11147b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_flop(pc, 4, temp, temp);
11157df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
11167df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
11177df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
11187b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs			emit_mov(pc, dst[c], temp);
11197df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
11202a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
1121bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	case TGSI_OPCODE_SLT:
1122bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		for (c = 0; c < 4; c++) {
1123bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			if (!(mask & (1 << c)))
1124bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs				continue;
1125bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			emit_set(pc, 1, dst[c], src[0][c], src[1][c]);
1126bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		}
1127bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		break;
11282a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_SUB:
11297df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
11307df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
11317df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
11322a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_sub(pc, dst[c], src[0][c], src[1][c]);
11337df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
11342a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
1135c0ed6a871cd3513e17a1fab960f5626485ffed13Ben Skeggs	case TGSI_OPCODE_TEX:
1136431504b99cd55948522e86a249e656e78598ddbdBen Skeggs		{
1137fd7412a7f1beab8b81ce307b1054331eee102e8bBen Skeggs			struct nv50_reg *t0, *t1, *t2, *t3;
1138431504b99cd55948522e86a249e656e78598ddbdBen Skeggs			struct nv50_program_exec *e;
1139431504b99cd55948522e86a249e656e78598ddbdBen Skeggs
1140431504b99cd55948522e86a249e656e78598ddbdBen Skeggs			t0 = alloc_temp(pc, NULL);
1141431504b99cd55948522e86a249e656e78598ddbdBen Skeggs			t0 = alloc_temp(pc, NULL);
1142431504b99cd55948522e86a249e656e78598ddbdBen Skeggs			t1 = alloc_temp(pc, NULL);
1143fd7412a7f1beab8b81ce307b1054331eee102e8bBen Skeggs			t2 = alloc_temp(pc, NULL);
1144fd7412a7f1beab8b81ce307b1054331eee102e8bBen Skeggs			t3 = alloc_temp(pc, NULL);
1145431504b99cd55948522e86a249e656e78598ddbdBen Skeggs			emit_mov(pc, t0, src[0][0]);
1146431504b99cd55948522e86a249e656e78598ddbdBen Skeggs			emit_mov(pc, t1, src[0][1]);
1147431504b99cd55948522e86a249e656e78598ddbdBen Skeggs
1148431504b99cd55948522e86a249e656e78598ddbdBen Skeggs			e = exec(pc);
11495a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs			e->inst[0] = 0xf6400000;
1150fd7412a7f1beab8b81ce307b1054331eee102e8bBen Skeggs			set_long(pc, e);
1151fd7412a7f1beab8b81ce307b1054331eee102e8bBen Skeggs			e->inst[1] |= 0x0000c004;
1152431504b99cd55948522e86a249e656e78598ddbdBen Skeggs			set_dst(pc, t0, e);
1153431504b99cd55948522e86a249e656e78598ddbdBen Skeggs			emit(pc, e);
1154fd7412a7f1beab8b81ce307b1054331eee102e8bBen Skeggs
1155fd7412a7f1beab8b81ce307b1054331eee102e8bBen Skeggs			if (mask & (1 << 0)) emit_mov(pc, dst[0], t0);
1156fd7412a7f1beab8b81ce307b1054331eee102e8bBen Skeggs			if (mask & (1 << 1)) emit_mov(pc, dst[1], t1);
1157fd7412a7f1beab8b81ce307b1054331eee102e8bBen Skeggs			if (mask & (1 << 2)) emit_mov(pc, dst[2], t2);
1158fd7412a7f1beab8b81ce307b1054331eee102e8bBen Skeggs			if (mask & (1 << 3)) emit_mov(pc, dst[3], t3);
1159fd7412a7f1beab8b81ce307b1054331eee102e8bBen Skeggs
1160431504b99cd55948522e86a249e656e78598ddbdBen Skeggs			free_temp(pc, t0);
1161431504b99cd55948522e86a249e656e78598ddbdBen Skeggs			free_temp(pc, t1);
1162fd7412a7f1beab8b81ce307b1054331eee102e8bBen Skeggs			free_temp(pc, t2);
1163fd7412a7f1beab8b81ce307b1054331eee102e8bBen Skeggs			free_temp(pc, t3);
1164431504b99cd55948522e86a249e656e78598ddbdBen Skeggs		}
1165c0ed6a871cd3513e17a1fab960f5626485ffed13Ben Skeggs		break;
116621e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	case TGSI_OPCODE_XPD:
116721e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		temp = alloc_temp(pc, NULL);
11689a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 0)) {
11699a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mul(pc, temp, src[0][2], src[1][1]);
11709a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_msb(pc, dst[0], src[0][1], src[1][2], temp);
11719a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		}
11729a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 1)) {
11739a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mul(pc, temp, src[0][0], src[1][2]);
11749a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_msb(pc, dst[1], src[0][2], src[1][0], temp);
11759a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		}
11769a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 2)) {
11779a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mul(pc, temp, src[0][1], src[1][0]);
11789a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_msb(pc, dst[2], src[0][0], src[1][1], temp);
11799a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		}
118021e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		free_temp(pc, temp);
118121e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		break;
1182f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_OPCODE_END:
1183f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		break;
1184f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	default:
1185f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		NOUVEAU_ERR("invalid opcode %d\n", inst->Instruction.Opcode);
1186f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return FALSE;
1187f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1188f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1189688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	if (sat) {
1190688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs		for (c = 0; c < 4; c++) {
119140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			struct nv50_program_exec *e;
1192688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs
1193688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			if (!(mask & (1 << c)))
1194688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs				continue;
119540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e = exec(pc);
119640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs
119740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e->inst[0] = 0xa0000000; /* cvt */
119840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			set_long(pc, e);
119940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e->inst[1] |= (6 << 29); /* cvt */
120040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e->inst[1] |= 0x04000000; /* 32 bit */
120140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e->inst[1] |= (1 << 14); /* src .f32 */
120240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e->inst[1] |= ((1 << 5) << 14); /* .sat */
120340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			set_dst(pc, rdst[c], e);
120440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			set_src_0(pc, dst[c], e);
120540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			emit(pc, e);
1206688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs		}
1207688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	}
1208688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs
120952a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	kill_temp_temp(pc);
1210f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return TRUE;
1211f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1212f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1213f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic boolean
1214f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_tx_prep(struct nv50_pc *pc)
1215f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1216f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct tgsi_parse_context p;
1217f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	boolean ret = FALSE;
1218f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	unsigned i, c;
1219f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1220f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_init(&p, pc->p->pipe.tokens);
1221f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	while (!tgsi_parse_end_of_tokens(&p)) {
1222f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		const union tgsi_full_token *tok = &p.FullToken;
1223f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1224f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		tgsi_parse_token(&p);
1225f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		switch (tok->Token.Type) {
1226f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_IMMEDIATE:
1227f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		{
1228f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			const struct tgsi_full_immediate *imm =
1229f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				&p.FullToken.FullImmediate;
1230f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
123133e4d30d50344be26398a51365bea1be37487403Ben Skeggs			ctor_immd(pc, imm->u.ImmediateFloat32[0].Float,
123233e4d30d50344be26398a51365bea1be37487403Ben Skeggs				      imm->u.ImmediateFloat32[1].Float,
123333e4d30d50344be26398a51365bea1be37487403Ben Skeggs				      imm->u.ImmediateFloat32[2].Float,
123433e4d30d50344be26398a51365bea1be37487403Ben Skeggs				      imm->u.ImmediateFloat32[3].Float);
1235f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1236f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1237f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_DECLARATION:
1238f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		{
1239f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			const struct tgsi_full_declaration *d;
1240f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			unsigned last;
1241f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1242f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			d = &p.FullToken.FullDeclaration;
1243f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			last = d->u.DeclarationRange.Last;
1244f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1245f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			switch (d->Declaration.File) {
1246f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_TEMPORARY:
1247f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->temp_nr < (last + 1))
1248f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->temp_nr = last + 1;
1249f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
1250f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_OUTPUT:
1251f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->result_nr < (last + 1))
1252f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->result_nr = last + 1;
1253f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
1254f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_INPUT:
1255f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->attr_nr < (last + 1))
1256f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->attr_nr = last + 1;
1257f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
1258f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_CONSTANT:
1259f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->param_nr < (last + 1))
1260f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->param_nr = last + 1;
1261f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
1262c0ed6a871cd3513e17a1fab960f5626485ffed13Ben Skeggs			case TGSI_FILE_SAMPLER:
1263c0ed6a871cd3513e17a1fab960f5626485ffed13Ben Skeggs				break;
1264f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			default:
1265f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				NOUVEAU_ERR("bad decl file %d\n",
1266f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					    d->Declaration.File);
1267f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				goto out_err;
1268f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1269f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1270f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1271f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_INSTRUCTION:
1272f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1273f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		default:
1274f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1275f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1276f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1277f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1278f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->temp_nr) {
1279f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->temp = calloc(pc->temp_nr * 4, sizeof(struct nv50_reg));
1280f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->temp)
1281f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1282f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1283f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->temp_nr; i++) {
1284f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1285f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->temp[i*4+c].type = P_TEMP;
1286f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->temp[i*4+c].hw = -1;
1287f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->temp[i*4+c].index = i;
1288f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1289f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1290f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1291f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1292f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->attr_nr) {
1293fa5cd63f96d2b69ded48d40b9cb7e57c147f7332Ben Skeggs		struct nv50_reg *iv = NULL;
1294f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		int aid = 0;
1295f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1296f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->attr = calloc(pc->attr_nr * 4, sizeof(struct nv50_reg));
1297f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->attr)
1298f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1299f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1300b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs		if (pc->p->type == PIPE_SHADER_FRAGMENT) {
13018ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			iv = alloc_temp(pc, NULL);
13025a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs			emit_interp(pc, iv, iv, NULL);
1303fa5cd63f96d2b69ded48d40b9cb7e57c147f7332Ben Skeggs			emit_flop(pc, 0, iv, iv);
13048ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			aid++;
13058ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		}
13068ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
1307f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->attr_nr; i++) {
13088ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			struct nv50_reg *a = &pc->attr[i*4];
13098ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
1310f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1311b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs				if (pc->p->type == PIPE_SHADER_FRAGMENT) {
13128ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					struct nv50_reg *at =
13138ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs						alloc_temp(pc, NULL);
13148ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].type = at->type;
13158ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].hw = at->hw;
13168ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].index = at->index;
13178ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				} else {
13188ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->p->cfg.vp.attr[aid/32] |=
13198ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs						(1 << (aid % 32));
13208ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].type = P_ATTR;
13218ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].hw = aid++;
13228ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].index = i;
13238ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				}
1324f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
13258ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
1326b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs			if (pc->p->type != PIPE_SHADER_FRAGMENT)
13278ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				continue;
13288ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
13295a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs			emit_interp(pc, &a[0], &a[0], iv);
13305a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs			emit_interp(pc, &a[1], &a[1], iv);
13315a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs			emit_interp(pc, &a[2], &a[2], iv);
13325a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs			emit_interp(pc, &a[3], &a[3], iv);
1333f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
13348ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
13358ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		if (iv)
13368ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			free_temp(pc, iv);
1337f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1338f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1339f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->result_nr) {
1340f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		int rid = 0;
1341f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1342f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->result = calloc(pc->result_nr * 4, sizeof(struct nv50_reg));
1343f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->result)
1344f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1345f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1346f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->result_nr; i++) {
1347f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1348b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs				if (pc->p->type == PIPE_SHADER_FRAGMENT) {
13498ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->result[i*4+c].type = P_TEMP;
1350776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs					pc->result[i*4+c].hw = -1;
1351776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs				} else {
13528ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->result[i*4+c].type = P_RESULT;
1353776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs					pc->result[i*4+c].hw = rid++;
1354776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs				}
1355f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->result[i*4+c].index = i;
1356f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1357f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1358f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1359f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1360f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->param_nr) {
1361f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		int rid = 0;
1362f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1363f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->param = calloc(pc->param_nr * 4, sizeof(struct nv50_reg));
1364f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->param)
1365f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1366f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1367f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->param_nr; i++) {
1368f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1369f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->param[i*4+c].type = P_CONST;
1370f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->param[i*4+c].hw = rid++;
1371f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->param[i*4+c].index = i;
1372f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1373f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1374f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1375f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1376f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->immd_nr) {
1377aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs		int rid = pc->param_nr * 4;
1378f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1379f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pc->immd = calloc(pc->immd_nr * 4, sizeof(struct nv50_reg));
1380f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->immd)
1381f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1382f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1383f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->immd_nr; i++) {
1384f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1385f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->immd[i*4+c].type = P_IMMD;
1386f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->immd[i*4+c].hw = rid++;
1387f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->immd[i*4+c].index = i;
1388f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1389f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1390f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1391f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1392f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	ret = TRUE;
1393f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsout_err:
1394f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_free(&p);
1395f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return ret;
1396f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1397f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1398f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic boolean
1399f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_tx(struct nv50_program *p)
1400f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1401f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct tgsi_parse_context parse;
1402f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_pc *pc;
1403f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	boolean ret;
1404f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1405f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	pc = CALLOC_STRUCT(nv50_pc);
1406f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (!pc)
1407f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return FALSE;
1408f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	pc->p = p;
14098ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	pc->p->cfg.high_temp = 4;
1410f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1411f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	ret = nv50_program_tx_prep(pc);
1412f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (ret == FALSE)
1413f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		goto out_cleanup;
1414f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1415f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_init(&parse, pc->p->pipe.tokens);
1416f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	while (!tgsi_parse_end_of_tokens(&parse)) {
1417f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		const union tgsi_full_token *tok = &parse.FullToken;
1418f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1419f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		tgsi_parse_token(&parse);
1420f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1421f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		switch (tok->Token.Type) {
1422f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_INSTRUCTION:
1423f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			ret = nv50_program_tx_insn(pc, tok);
1424f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			if (ret == FALSE)
1425f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				goto out_err;
1426f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1427f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		default:
1428f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1429f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1430f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1431f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1432b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs	if (p->type == PIPE_SHADER_FRAGMENT) {
1433776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs		struct nv50_reg out;
1434776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs
1435776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs		out.type = P_TEMP;
1436776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs		for (out.hw = 0; out.hw < pc->result_nr * 4; out.hw++)
1437776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs			emit_mov(pc, &out, &pc->result[out.hw]);
1438776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs	}
1439776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs
144040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	assert(is_long(pc->p->exec_tail) && !is_immd(pc->p->exec_head));
144140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	pc->p->exec_tail->inst[1] |= 0x00000001;
144240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs
1443aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	p->param_nr = pc->param_nr * 4;
1444f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->immd_nr = pc->immd_nr * 4;
1445f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->immd = pc->immd_buf;
1446f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1447f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsout_err:
1448f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_free(&parse);
1449f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1450f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsout_cleanup:
1451f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return ret;
1452f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1453f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1454f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic void
1455f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_validate(struct nv50_context *nv50, struct nv50_program *p)
1456f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1457e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	if (nv50_program_tx(p) == FALSE)
1458e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs		assert(0);
1459f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->translated = TRUE;
1460f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1461f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
146222e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsstatic void
1463ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggsnv50_program_upload_data(struct nv50_context *nv50, float *map,
1464ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs			 unsigned start, unsigned count)
1465ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs{
1466ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs	while (count) {
1467ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs		unsigned nr = count > 2047 ? 2047 : count;
1468ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs
1469ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs		BEGIN_RING(tesla, 0x00000f00, 1);
1470ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs		OUT_RING  ((NV50_CB_PMISC << 0) | (start << 8));
1471ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs		BEGIN_RING(tesla, 0x40000f04, nr);
1472ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs		OUT_RINGp (map, nr);
1473ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs
1474ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs		map += nr;
1475ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs		start += nr;
1476ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs		count -= nr;
1477ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs	}
1478ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs}
1479ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs
1480ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggsstatic void
148122e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsnv50_program_validate_data(struct nv50_context *nv50, struct nv50_program *p)
148222e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs{
1483aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	struct nouveau_winsys *nvws = nv50->screen->nvws;
1484aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	struct pipe_winsys *ws = nv50->pipe.winsys;
1485aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	unsigned nr = p->param_nr + p->immd_nr;
148622e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
1487aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	if (!p->data && nr) {
1488aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs		struct nouveau_resource *heap = nv50->screen->vp_data_heap;
1489aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs
1490aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs		if (nvws->res_alloc(heap, nr, p, &p->data)) {
1491aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs			while (heap->next && heap->size < nr) {
1492aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs				struct nv50_program *evict = heap->next->priv;
1493aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs				nvws->res_free(&evict->data);
1494aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs			}
1495aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs
1496aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs			if (nvws->res_alloc(heap, nr, p, &p->data))
1497aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs				assert(0);
1498aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs		}
1499aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	}
1500aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs
1501aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	if (p->param_nr) {
1502aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs		float *map = ws->buffer_map(ws, nv50->constbuf[p->type],
1503aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs					    PIPE_BUFFER_USAGE_CPU_READ);
1504ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs		nv50_program_upload_data(nv50, map, p->data->start,
1505ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs					 p->param_nr);
1506aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs		ws->buffer_unmap(ws, nv50->constbuf[p->type]);
1507aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	}
1508aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs
1509ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs	if (p->immd_nr) {
1510ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs		nv50_program_upload_data(nv50, p->immd,
1511ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs					 p->data->start + p->param_nr,
1512ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs					 p->immd_nr);
151322e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	}
151422e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs}
151522e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
151622e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsstatic void
151722e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsnv50_program_validate_code(struct nv50_context *nv50, struct nv50_program *p)
151822e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs{
151922e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	struct pipe_winsys *ws = nv50->pipe.winsys;
152040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e;
1521cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	struct nouveau_stateobj *so;
1522cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	const unsigned flags = NOUVEAU_BO_VRAM | NOUVEAU_BO_WR;
1523cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	unsigned start, count, *up, *ptr;
1524f700d6be6335a4d4394296891f783687b6f2d4f2Ben Skeggs	boolean upload = FALSE;
152522e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
1526f700d6be6335a4d4394296891f783687b6f2d4f2Ben Skeggs	if (!p->buffer) {
152740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		p->buffer = ws->buffer_create(ws, 0x100, 0, p->exec_size * 4);
1528f700d6be6335a4d4394296891f783687b6f2d4f2Ben Skeggs		upload = TRUE;
1529f700d6be6335a4d4394296891f783687b6f2d4f2Ben Skeggs	}
153040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs
1531aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	if (p->data && p->data->start != p->data_start) {
1532aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs		for (e = p->exec_head; e; e = e->next) {
1533ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs			unsigned ei, ci;
1534ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs
1535aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs			if (e->param.index < 0)
1536aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs				continue;
1537ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs			ei = e->param.shift >> 5;
1538ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs			ci = e->param.index + p->data->start;
1539ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs
1540ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs			e->inst[ei] &= ~e->param.mask;
1541ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs			e->inst[ei] |= (ci << e->param.shift);
15421c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs		}
15431c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs
1544aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs		p->data_start = p->data->start;
1545f700d6be6335a4d4394296891f783687b6f2d4f2Ben Skeggs		upload = TRUE;
1546aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	}
1547aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs
1548f700d6be6335a4d4394296891f783687b6f2d4f2Ben Skeggs	if (!upload)
1549f700d6be6335a4d4394296891f783687b6f2d4f2Ben Skeggs		return FALSE;
1550f700d6be6335a4d4394296891f783687b6f2d4f2Ben Skeggs
1551cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	up = ptr = MALLOC(p->exec_size * 4);
1552aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	for (e = p->exec_head; e; e = e->next) {
1553cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		*(ptr++) = e->inst[0];
1554cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		if (is_long(e))
1555cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs			*(ptr++) = e->inst[1];
1556cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	}
1557cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs
1558e002ad77398fbe14a0efbd91824c3325ca09b4c1Ben Skeggs	so = so_new(4,2);
1559cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	so_method(so, nv50->screen->tesla, 0x1280, 3);
1560cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	so_reloc (so, p->buffer, 0, flags | NOUVEAU_BO_HIGH, 0, 0);
1561cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	so_reloc (so, p->buffer, 0, flags | NOUVEAU_BO_LOW, 0, 0);
1562cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	so_data  (so, (NV50_CB_PUPLOAD << 16) | 0x0800); //(p->exec_size * 4));
1563cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs
1564cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	start = 0; count = p->exec_size;
1565cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	while (count) {
1566cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		struct nouveau_winsys *nvws = nv50->screen->nvws;
1567cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		unsigned nr;
1568cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs
1569cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		so_emit(nvws, so);
1570cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs
1571cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		nr = MIN2(count, 2047);
1572cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		nr = MIN2(nvws->channel->pushbuf->remaining, nr);
1573cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		if (nvws->channel->pushbuf->remaining < (nr + 3)) {
1574cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs			FIRE_RING(NULL);
1575cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs			continue;
1576aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs		}
1577cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs
1578cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		BEGIN_RING(tesla, 0x0f00, 1);
1579cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		OUT_RING  ((start << 8) | NV50_CB_PUPLOAD);
1580cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		BEGIN_RING(tesla, 0x40000f04, nr);
1581cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		OUT_RINGp (up + start, nr);
1582cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs
1583cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		start += nr;
1584cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		count -= nr;
158540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	}
1586cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs
1587cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	FREE(up);
1588cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	so_ref(NULL, &so);
158922e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs}
159022e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
1591f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsvoid
1592f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_vertprog_validate(struct nv50_context *nv50)
1593f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1594f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_grobj *tesla = nv50->screen->tesla;
1595f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_program *p = nv50->vertprog;
1596f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_stateobj *so;
1597f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1598f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (!p->translated) {
1599f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		nv50_program_validate(nv50, p);
1600f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!p->translated)
1601f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			assert(0);
1602f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1603f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
160422e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	nv50_program_validate_data(nv50, p);
160522e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	nv50_program_validate_code(nv50, p);
1606f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1607e002ad77398fbe14a0efbd91824c3325ca09b4c1Ben Skeggs	so = so_new(13, 2);
1608f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, NV50TCL_VP_ADDRESS_HIGH, 2);
1609f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1610f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_HIGH, 0, 0);
1611f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1612f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_LOW, 0, 0);
1613f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, 0x1650, 2);
1614f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, p->cfg.vp.attr[0]);
1615f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, p->cfg.vp.attr[1]);
1616fea0b1651677444fc6c135e1a4b8ab6463a9fdf9Ben Skeggs	so_method(so, tesla, 0x16b8, 1);
1617fea0b1651677444fc6c135e1a4b8ab6463a9fdf9Ben Skeggs	so_data  (so, p->cfg.high_result);
1618f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, 0x16ac, 2);
1619bcbe6baac37915563bc120ad558cd930bc1ddec1Ben Skeggs	so_data  (so, p->cfg.high_result); //8);
16208ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_data  (so, p->cfg.high_temp);
1621f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, 0x140c, 1);
1622f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, 0); /* program start offset */
1623bb9efb5534a652878161e28bd73039eff5b11014Ben Skeggs	so_ref(so, &nv50->state.vertprog);
1624f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1625f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1626f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsvoid
1627f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_fragprog_validate(struct nv50_context *nv50)
1628f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1629f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_grobj *tesla = nv50->screen->tesla;
1630f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_program *p = nv50->fragprog;
1631f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_stateobj *so;
1632f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1633f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (!p->translated) {
1634f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		nv50_program_validate(nv50, p);
1635f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!p->translated)
1636f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			assert(0);
1637f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1638f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
163955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	nv50_program_validate_data(nv50, p);
164055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	nv50_program_validate_code(nv50, p);
1641f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1642585ae74d87f3d04a4b5b7c068b865292afd1a16bBen Skeggs	so = so_new(64, 2);
1643f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, NV50TCL_FP_ADDRESS_HIGH, 2);
1644f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1645f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_HIGH, 0, 0);
1646f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1647f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_LOW, 0, 0);
1648585ae74d87f3d04a4b5b7c068b865292afd1a16bBen Skeggs	so_method(so, tesla, 0x1904, 4);
1649585ae74d87f3d04a4b5b7c068b865292afd1a16bBen Skeggs	so_data  (so, 0x01040404); /* p: 0x01000404 */
1650585ae74d87f3d04a4b5b7c068b865292afd1a16bBen Skeggs	so_data  (so, 0x00000004);
1651585ae74d87f3d04a4b5b7c068b865292afd1a16bBen Skeggs	so_data  (so, 0x00000000);
1652585ae74d87f3d04a4b5b7c068b865292afd1a16bBen Skeggs	so_data  (so, 0x00000000);
1653fea0b1651677444fc6c135e1a4b8ab6463a9fdf9Ben Skeggs	so_method(so, tesla, 0x16bc, 3); /*XXX: fixme */
1654585ae74d87f3d04a4b5b7c068b865292afd1a16bBen Skeggs	so_data  (so, 0x03020100);
1655585ae74d87f3d04a4b5b7c068b865292afd1a16bBen Skeggs	so_data  (so, 0x07060504);
1656fea0b1651677444fc6c135e1a4b8ab6463a9fdf9Ben Skeggs	so_data  (so, 0x0b0a0908);
1657585ae74d87f3d04a4b5b7c068b865292afd1a16bBen Skeggs	so_method(so, tesla, 0x1988, 2);
1658bcbe6baac37915563bc120ad558cd930bc1ddec1Ben Skeggs	so_data  (so, 0x08080408); //0x08040404); /* p: 0x0f000401 */
16598ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_data  (so, p->cfg.high_temp);
16608ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_method(so, tesla, 0x1414, 1);
16618ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_data  (so, 0); /* program start offset */
1662bb9efb5534a652878161e28bd73039eff5b11014Ben Skeggs	so_ref(so, &nv50->state.fragprog);
1663f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1664f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1665f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsvoid
1666f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_destroy(struct nv50_context *nv50, struct nv50_program *p)
1667f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1668f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct pipe_winsys *ws = nv50->pipe.winsys;
1669f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
167040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	while (p->exec_head) {
167140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		struct nv50_program_exec *e = p->exec_head;
167240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs
167340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		p->exec_head = e->next;
167440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		FREE(e);
1675f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
167640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	p->exec_tail = NULL;
167740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	p->exec_size = 0;
1678f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1679f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (p->buffer)
1680f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		pipe_buffer_reference(ws, &p->buffer, NULL);
1681f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1682f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->translated = 0;
1683f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1684f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1685