nv50_program.c revision 4a7cf8f66ff5d7e15ae7f8f5542f27bc72c68709
/*
 * Copyright 2008 Ben Skeggs
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
 * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF
 * OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */

22857a3294a959015bf893241199f7fd7f7882a6abBen Skeggs
23f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_context.h"
24f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_defines.h"
25f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_state.h"
26f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_inlines.h"
27f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
28f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "pipe/p_shader_tokens.h"
29fda01b584715c05696a0e6768fda669ef1eb5f3bBen Skeggs#include "tgsi/tgsi_parse.h"
30fda01b584715c05696a0e6768fda669ef1eb5f3bBen Skeggs#include "tgsi/tgsi_util.h"
31f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
32f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#include "nv50_context.h"
33f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
34f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs#define NV50_SU_MAX_TEMP 64
35b01d0077af9d93c582e5f53ebd358ac8148b22dfBen Skeggs//#define NV50_PROGRAM_DUMP
36f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
/* ARL - gallium fails on progs/vp/arl.txt
 *
 * MSB - Like MAD, but MUL+SUB
 * 	- Drop it as a separate op; introduce a way to negate args for ops
 * 	  that support it.
 *
 * Look into inlining IMMD for ops other than MOV (make it general?)
 * 	- Maybe even relax restrictions a bit, can't do P_RESULT + P_IMMD,
 * 	  but can emit to P_TEMP first - then MOV later. NVIDIA does this
 *
 * In ops such as ADD it's possible to construct a bad opcode in the !is_long()
 * case, if the emit_src() causes the inst to suddenly become long.
 *
 * Verify half-insns work where expected - and force disable them where they
 * don't work - MUL has it forcibly disabled atm as it fixes POW..
 *
 * WARNING: watch dst==src vectors, can overwrite components that are needed.
 * 	ie. SUB R0, R0.yzxw, R0
 *
 * Things to check with renouveau:
 * 	FP attr/result assignment - how?
 * 		attrib
 * 			- 0x16bc maps vp output onto fp hpos
 * 			- 0x16c0 maps vp output onto fp col0
 * 		result
 * 			- colr always 0-3
 * 			- depr always 4
 * 0x16bc->0x16e8 --> some binding between vp/fp regs
 * 0x16b8 --> VP output count
 *
 * 0x1298 --> "MOV rcol.x, fcol.y" "MOV depr, fcol.y" = 0x00000005
 * 	      "MOV rcol.x, fcol.y" = 0x00000004
 * 0x19a8 --> as above but 0x00000100 and 0x00000000
 * 	- 0x00100000 used when KIL used
 * 0x196c --> as above but 0x00000011 and 0x00000000
 *
 * 0x1988 --> 0xXXNNNNNN
 * 	- XX == FP high something
 */
/*
 * A single scalar operand handled by the code generator.
 */
struct nv50_reg {
	/* Which register file / operand class this entry belongs to. */
	enum {
		P_TEMP   = 0,
		P_ATTR   = 1,
		P_RESULT = 2,
		P_CONST  = 3,
		P_IMMD   = 4
	} type;

	/* -1 marks registers created internally by alloc_temp(),
	 * alloc_temp4() and alloc_immd(); free_temp() only releases those. */
	int index;

	/* Hardware slot. For P_TEMP, -1 means "not assigned yet" (see
	 * alloc_reg()); for P_IMMD it is an offset into nv50_pc::immd_buf. */
	int hw;

	/* NOTE(review): presumably a "negate this source" flag - it is not
	 * read anywhere in the visible part of the file; confirm at users. */
	int neg;
};
89f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
90f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstruct nv50_pc {
91f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_program *p;
92f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
93f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	/* hw resources */
94f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *r_temp[NV50_SU_MAX_TEMP];
95f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
96f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	/* tgsi resources */
97f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *temp;
98f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int temp_nr;
99f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *attr;
100f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int attr_nr;
101f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *result;
102f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int result_nr;
103f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *param;
104f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int param_nr;
105f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *immd;
106f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	float *immd_buf;
107f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int immd_nr;
1082a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
10921e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs	struct nv50_reg *temp_temp[16];
1102a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	unsigned temp_temp_nr;
111f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs};
112f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
113f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic void
114f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsalloc_reg(struct nv50_pc *pc, struct nv50_reg *reg)
115f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
116f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int i;
117f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
118fea0b1651677444fc6c135e1a4b8ab6463a9fdf9Ben Skeggs	if (reg->type == P_RESULT) {
119fea0b1651677444fc6c135e1a4b8ab6463a9fdf9Ben Skeggs		if (pc->p->cfg.high_result < (reg->hw + 1))
120fea0b1651677444fc6c135e1a4b8ab6463a9fdf9Ben Skeggs			pc->p->cfg.high_result = reg->hw + 1;
121fea0b1651677444fc6c135e1a4b8ab6463a9fdf9Ben Skeggs	}
122fea0b1651677444fc6c135e1a4b8ab6463a9fdf9Ben Skeggs
1238ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	if (reg->type != P_TEMP)
124f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return;
125f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1268ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	if (reg->hw >= 0) {
1278ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		/*XXX: do this here too to catch FP temp-as-attr usage..
1288ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		 *     not clean, but works */
1298ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		if (pc->p->cfg.high_temp < (reg->hw + 1))
1308ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			pc->p->cfg.high_temp = reg->hw + 1;
1318ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		return;
1328ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	}
1338ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
134f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (i = 0; i < NV50_SU_MAX_TEMP; i++) {
135f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!(pc->r_temp[i])) {
136f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			pc->r_temp[i] = reg;
137f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			reg->hw = i;
1388ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			if (pc->p->cfg.high_temp < (i + 1))
1398ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				pc->p->cfg.high_temp = i + 1;
140f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			return;
141f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
142f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
143f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
144f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	assert(0);
145f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
146f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
147f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic struct nv50_reg *
148f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsalloc_temp(struct nv50_pc *pc, struct nv50_reg *dst)
149f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
150f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_reg *r;
151f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int i;
152f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
153f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (dst && dst->type == P_TEMP && dst->hw == -1)
154f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return dst;
155f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
156f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (i = 0; i < NV50_SU_MAX_TEMP; i++) {
157f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->r_temp[i]) {
158f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r = CALLOC_STRUCT(nv50_reg);
159f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r->type = P_TEMP;
160f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r->index = -1;
161f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			r->hw = i;
162f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			pc->r_temp[i] = r;
163f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			return r;
164f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
165f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
166f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
167f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	assert(0);
168f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return NULL;
169f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
170f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
171f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic void
172f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsfree_temp(struct nv50_pc *pc, struct nv50_reg *r)
173f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
174f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (r->index == -1) {
175619549a6377a58d54c9cf55f8863beed56b09566Ben Skeggs		unsigned hw = r->hw;
176619549a6377a58d54c9cf55f8863beed56b09566Ben Skeggs
177619549a6377a58d54c9cf55f8863beed56b09566Ben Skeggs		FREE(pc->r_temp[hw]);
178619549a6377a58d54c9cf55f8863beed56b09566Ben Skeggs		pc->r_temp[hw] = NULL;
179f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
180f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
181f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1823f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggsstatic int
1833f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggsalloc_temp4(struct nv50_pc *pc, struct nv50_reg *dst[4], int idx)
1843f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs{
1853f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs	int i;
1863f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs
1873f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs	if ((idx + 4) >= NV50_SU_MAX_TEMP)
1883f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs		return 1;
1893f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs
1903f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs	if (pc->r_temp[idx] || pc->r_temp[idx + 1] ||
1913f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs	    pc->r_temp[idx + 2] || pc->r_temp[idx + 3])
1923f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs		return alloc_temp4(pc, dst, idx + 1);
1933f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs
1943f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs	for (i = 0; i < 4; i++) {
1953f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs		dst[i] = CALLOC_STRUCT(nv50_reg);
1963f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs		dst[i]->type = P_TEMP;
1973f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs		dst[i]->index = -1;
1983f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs		dst[i]->hw = idx + i;
1993f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs		pc->r_temp[idx + i] = dst[i];
2003f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs	}
2013f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs
2023f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs	return 0;
2033f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs}
2043f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs
/*
 * Release the four registers in reg[0..3] via free_temp(), in order.
 */
static void
free_temp4(struct nv50_pc *pc, struct nv50_reg *reg[4])
{
	int k = 0;

	while (k < 4) {
		free_temp(pc, reg[k]);
		k++;
	}
}
2133f66b72fdb4834c5211305698d22806eac80aa35Ben Skeggs
214f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic struct nv50_reg *
2152a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggstemp_temp(struct nv50_pc *pc)
2162a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
21721e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs	if (pc->temp_temp_nr >= 16)
2182a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		assert(0);
2192a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
2202a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	pc->temp_temp[pc->temp_temp_nr] = alloc_temp(pc, NULL);
2212a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	return pc->temp_temp[pc->temp_temp_nr++];
2222a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
2232a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
2242a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
2252a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggskill_temp_temp(struct nv50_pc *pc)
2262a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
2272a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	int i;
2282a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
2292a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	for (i = 0; i < pc->temp_temp_nr; i++)
2302a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		free_temp(pc, pc->temp_temp[i]);
2312a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	pc->temp_temp_nr = 0;
2322a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
2332a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
23433e4d30d50344be26398a51365bea1be37487403Ben Skeggsstatic int
23533e4d30d50344be26398a51365bea1be37487403Ben Skeggsctor_immd(struct nv50_pc *pc, float x, float y, float z, float w)
23633e4d30d50344be26398a51365bea1be37487403Ben Skeggs{
237861629d1fd4a1d256c913470c33d9522e83d615dBen Skeggs	pc->immd_buf = REALLOC(pc->immd_buf, (pc->immd_nr * r * sizeof(float)),
238861629d1fd4a1d256c913470c33d9522e83d615dBen Skeggs			       (pc->immd_nr + 1) * 4 * sizeof(float));
23933e4d30d50344be26398a51365bea1be37487403Ben Skeggs	pc->immd_buf[(pc->immd_nr * 4) + 0] = x;
240686bc00c05094e8678747c111a6a70ad4b7063e3Ben Skeggs	pc->immd_buf[(pc->immd_nr * 4) + 1] = y;
241686bc00c05094e8678747c111a6a70ad4b7063e3Ben Skeggs	pc->immd_buf[(pc->immd_nr * 4) + 2] = z;
242686bc00c05094e8678747c111a6a70ad4b7063e3Ben Skeggs	pc->immd_buf[(pc->immd_nr * 4) + 3] = w;
24333e4d30d50344be26398a51365bea1be37487403Ben Skeggs
24433e4d30d50344be26398a51365bea1be37487403Ben Skeggs	return pc->immd_nr++;
24533e4d30d50344be26398a51365bea1be37487403Ben Skeggs}
24633e4d30d50344be26398a51365bea1be37487403Ben Skeggs
24733e4d30d50344be26398a51365bea1be37487403Ben Skeggsstatic struct nv50_reg *
24833e4d30d50344be26398a51365bea1be37487403Ben Skeggsalloc_immd(struct nv50_pc *pc, float f)
24933e4d30d50344be26398a51365bea1be37487403Ben Skeggs{
25033e4d30d50344be26398a51365bea1be37487403Ben Skeggs	struct nv50_reg *r = CALLOC_STRUCT(nv50_reg);
25133e4d30d50344be26398a51365bea1be37487403Ben Skeggs	unsigned hw;
25233e4d30d50344be26398a51365bea1be37487403Ben Skeggs
25301e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	hw = ctor_immd(pc, f, 0, 0, 0) * 4;
25433e4d30d50344be26398a51365bea1be37487403Ben Skeggs	r->type = P_IMMD;
25533e4d30d50344be26398a51365bea1be37487403Ben Skeggs	r->hw = hw;
25633e4d30d50344be26398a51365bea1be37487403Ben Skeggs	r->index = -1;
25733e4d30d50344be26398a51365bea1be37487403Ben Skeggs	return r;
25833e4d30d50344be26398a51365bea1be37487403Ben Skeggs}
25933e4d30d50344be26398a51365bea1be37487403Ben Skeggs
26040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsstatic struct nv50_program_exec *
26140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsexec(struct nv50_pc *pc)
26240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs{
26340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = CALLOC_STRUCT(nv50_program_exec);
26440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs
2651c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs	e->param.index = -1;
26640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	return e;
26740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs}
26840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs
26955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic void
27040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsemit(struct nv50_pc *pc, struct nv50_program_exec *e)
27155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
27255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	struct nv50_program *p = pc->p;
27355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
27440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	if (p->exec_tail)
27540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		p->exec_tail->next = e;
27640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	if (!p->exec_head)
27740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		p->exec_head = e;
27840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	p->exec_tail = e;
27940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	p->exec_size += (e->inst[0] & 1) ? 2 : 1;
28055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
28155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
/* Forward declaration: set_pred() and set_pred_wr() call set_long(), which
 * is defined after them. */
static INLINE void set_long(struct nv50_pc *, struct nv50_program_exec *);
28355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
28455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic boolean
28540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsis_long(struct nv50_program_exec *e)
28655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
28740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	if (e->inst[0] & 1)
28855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		return TRUE;
28955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	return FALSE;
29055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
29155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
29255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic boolean
29340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsis_immd(struct nv50_program_exec *e)
29455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
29540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	if (is_long(e) && (e->inst[1] & 3) == 3)
29655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		return TRUE;
29755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	return FALSE;
29855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
29955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
30055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
30140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsset_pred(struct nv50_pc *pc, unsigned pred, unsigned idx,
30240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	 struct nv50_program_exec *e)
30355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
30440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
30540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] &= ~((0x1f << 7) | (0x3 << 12));
30640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (pred << 7) | (idx << 12);
30755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
30855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
30955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
31040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsset_pred_wr(struct nv50_pc *pc, unsigned on, unsigned idx,
31140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	    struct nv50_program_exec *e)
31255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
31340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
31440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] &= ~((0x3 << 4) | (1 << 6));
31540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (idx << 4) | (on << 6);
31655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
31755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
31855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
31940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsset_long(struct nv50_pc *pc, struct nv50_program_exec *e)
32055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
32140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	if (is_long(e))
32255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		return;
32355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
32440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 1;
32540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_pred(pc, 0xf, 0, e);
32640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_pred_wr(pc, 0, 0, e);
32755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
32855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
32955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
33040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsset_dst(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_program_exec *e)
33155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
33255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (dst->type == P_RESULT) {
33340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		set_long(pc, e);
33440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[1] |= 0x00000008;
33555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	}
33655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
33755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	alloc_reg(pc, dst);
33840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= (dst->hw << 2);
33955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
34055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
34155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic INLINE void
34240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsset_immd(struct nv50_pc *pc, struct nv50_reg *imm, struct nv50_program_exec *e)
34355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
34455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	unsigned val = fui(pc->immd_buf[imm->hw]); /* XXX */
34555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
34640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
34755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	/*XXX: can't be predicated - bits overlap.. catch cases where both
34855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	 *     are required and avoid them. */
34940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_pred(pc, 0, 0, e);
35040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_pred_wr(pc, 0, 0, e);
35155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
35240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= 0x00000002 | 0x00000001;
35340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= (val & 0x3f) << 16;
35440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (val >> 6) << 2;
35555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
35655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
35755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsstatic void
3588ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggsemit_interp(struct nv50_pc *pc, struct nv50_reg *dst,
3595a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs	    struct nv50_reg *src, struct nv50_reg *iv)
3608ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs{
36140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
3628ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
36340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0x80000000;
36440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
3658ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	alloc_reg(pc, src);
36640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= (src->hw << 16);
3675a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs	if (iv) {
36840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[0] |= (1 << 25);
3695a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs		alloc_reg(pc, iv);
3705a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs		e->inst[0] |= (iv->hw << 9);
3715a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs	}
3728ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
37340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
3748ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs}
3758ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
3768ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggsstatic void
3771c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggsset_data(struct nv50_pc *pc, struct nv50_reg *src, unsigned m, unsigned s,
3781c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs	 struct nv50_program_exec *e)
3792a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
38040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
381aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs#if 1
382aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	e->inst[1] |= (1 << 22);
383aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs#else
3842a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_IMMD) {
38540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[1] |= (NV50_CB_PMISC << 22);
3862a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else {
387b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs		if (pc->p->type == PIPE_SHADER_VERTEX)
38840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e->inst[1] |= (NV50_CB_PVP << 22);
3892a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		else
39040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e->inst[1] |= (NV50_CB_PFP << 22);
3912a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
392aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs#endif
3931c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs
3941c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs	e->param.index = src->hw;
3951c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs	e->param.shift = s;
3961c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs	e->param.mask = m << (s % 32);
3972a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
3982a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
3992a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
40055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggsemit_mov(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
40155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs{
40240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
40355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
40440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0x10000000;
40555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
40640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
40755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
408da66b8a2f4c3c052ad71b2b6d5a845c2fd267c6eBen Skeggs	if (0 && dst->type != P_RESULT && src->type == P_IMMD) {
40940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		set_immd(pc, src, e);
41055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		/*XXX: 32-bit, but steals part of "half" reg space - need to
41155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		 *     catch and handle this case if/when we do half-regs
41255b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		 */
41340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[0] |= 0x00008000;
41455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	} else
41555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	if (src->type == P_IMMD || src->type == P_CONST) {
41640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		set_long(pc, e);
4171c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs		set_data(pc, src, 0x7f, 9, e);
41840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[1] |= 0x20000000; /* src0 const? */
41955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	} else {
42055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		if (src->type == P_ATTR) {
42140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			set_long(pc, e);
42240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e->inst[1] |= 0x00200000;
42355b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		}
42455b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
42555b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs		alloc_reg(pc, src);
42640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[0] |= (src->hw << 9);
42755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	}
42855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
42955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	/* We really should support "half" instructions here at some point,
43055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	 * but I don't feel confident enough about them yet.
43155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	 */
43240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
43340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	if (is_long(e) && !is_immd(e)) {
43440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[1] |= 0x04000000; /* 32-bit */
43540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[1] |= 0x0003c000; /* "subsubop" 0xf == mov */
43655b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	}
43755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
43840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
43955b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs}
44055b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs
4414a7cf8f66ff5d7e15ae7f8f5542f27bc72c68709Christoph Bumillerstatic INLINE void
4424a7cf8f66ff5d7e15ae7f8f5542f27bc72c68709Christoph Bumilleremit_mov_immdval(struct nv50_pc *pc, struct nv50_reg *dst, float f)
4434a7cf8f66ff5d7e15ae7f8f5542f27bc72c68709Christoph Bumiller{
4444a7cf8f66ff5d7e15ae7f8f5542f27bc72c68709Christoph Bumiller	struct nv50_reg *imm = alloc_immd(pc, f);
4454a7cf8f66ff5d7e15ae7f8f5542f27bc72c68709Christoph Bumiller	emit_mov(pc, dst, imm);
4464a7cf8f66ff5d7e15ae7f8f5542f27bc72c68709Christoph Bumiller	FREE(imm);
4474a7cf8f66ff5d7e15ae7f8f5542f27bc72c68709Christoph Bumiller}
4484a7cf8f66ff5d7e15ae7f8f5542f27bc72c68709Christoph Bumiller
449f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic boolean
4502a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggscheck_swap_src_0_1(struct nv50_pc *pc,
4512a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		   struct nv50_reg **s0, struct nv50_reg **s1)
4522a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
4532a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	struct nv50_reg *src0 = *s0, *src1 = *s1;
4542a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4552a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src0->type == P_CONST) {
4562a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		if (src1->type != P_CONST) {
4572a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s0 = src1;
4582a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s1 = src0;
4592a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			return TRUE;
4602a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		}
4612a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
4622a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src1->type == P_ATTR) {
4632a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		if (src0->type != P_ATTR) {
4642a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s0 = src1;
4652a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			*s1 = src0;
4662a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			return TRUE;
4672a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		}
4682a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
4692a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4702a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	return FALSE;
4712a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
4722a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4732a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
47440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsset_src_0(struct nv50_pc *pc, struct nv50_reg *src, struct nv50_program_exec *e)
4752a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
4762a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_ATTR) {
47740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		set_long(pc, e);
47840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[1] |= 0x00200000;
4792a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
4802a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_CONST || src->type == P_IMMD) {
4812a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		struct nv50_reg *temp = temp_temp(pc);
4822a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4832a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mov(pc, temp, src);
4842a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		src = temp;
4852a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
4862a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4872a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	alloc_reg(pc, src);
48840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= (src->hw << 9);
4892a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
4902a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4912a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
49240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsset_src_1(struct nv50_pc *pc, struct nv50_reg *src, struct nv50_program_exec *e)
4932a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
4942a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_ATTR) {
4952a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		struct nv50_reg *temp = temp_temp(pc);
4962a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
4972a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mov(pc, temp, src);
4982a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		src = temp;
4992a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
5002a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_CONST || src->type == P_IMMD) {
50140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		assert(!(e->inst[0] & 0x00800000));
50240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		if (e->inst[0] & 0x01000000) {
50334a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			struct nv50_reg *temp = temp_temp(pc);
50434a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs
50534a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			emit_mov(pc, temp, src);
50634a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			src = temp;
50734a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs		} else {
5081c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs			set_data(pc, src, 0x7f, 16, e);
50940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e->inst[0] |= 0x00800000;
51034a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs		}
5112a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
5122a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
5132a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	alloc_reg(pc, src);
51440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= (src->hw << 16);
5152a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
5162a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
5172a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
51840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggsset_src_2(struct nv50_pc *pc, struct nv50_reg *src, struct nv50_program_exec *e)
5192a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
52040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
5212a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
5222a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_ATTR) {
5232a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		struct nv50_reg *temp = temp_temp(pc);
5242a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
5252a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mov(pc, temp, src);
5262a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		src = temp;
5272a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	} else
5282a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (src->type == P_CONST || src->type == P_IMMD) {
52940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		assert(!(e->inst[0] & 0x01000000));
53040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		if (e->inst[0] & 0x00800000) {
53134a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			struct nv50_reg *temp = temp_temp(pc);
53234a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs
53334a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			emit_mov(pc, temp, src);
53434a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs			src = temp;
53534a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs		} else {
5361c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs			set_data(pc, src, 0x7f, 32+14, e);
53740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e->inst[0] |= 0x01000000;
53834a039ae7b158cacb5b20d91067e9d6458d30a56Ben Skeggs		}
5392a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	}
5402a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
5412a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	alloc_reg(pc, src);
54240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (src->hw << 14);
5432a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
5442a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
5452a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
5462a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsemit_mul(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
5472a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	 struct nv50_reg *src1)
5482a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
54940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
5502a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
55140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0xc0000000;
55240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
5532a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
5542a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	check_swap_src_0_1(pc, &src0, &src1);
55540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
55640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src0, e);
55740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_1(pc, src1, e);
5582a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
55940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
5602a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
5612a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
5622a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
56352a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggsemit_add(struct nv50_pc *pc, struct nv50_reg *dst,
56452a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	 struct nv50_reg *src0, struct nv50_reg *src1)
5652a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
56640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
5672a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
56840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0xb0000000;
5692a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
5702a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	check_swap_src_0_1(pc, &src0, &src1);
57140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
57240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src0, e);
57340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	if (is_long(e))
57440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		set_src_2(pc, src1, e);
57552a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	else
57640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		set_src_1(pc, src1, e);
57752a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs
57840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
57952a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs}
58052a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs
58152a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggsstatic void
58252a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggsemit_minmax(struct nv50_pc *pc, unsigned sub, struct nv50_reg *dst,
58352a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	    struct nv50_reg *src0, struct nv50_reg *src1)
58452a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs{
58540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
58652a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs
58740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
58840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0xb0000000;
58940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (sub << 29);
59052a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs
59152a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	check_swap_src_0_1(pc, &src0, &src1);
59240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
59340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src0, e);
59440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_1(pc, src1, e);
5952a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
59640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
5972a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
5982a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
5992a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
6002a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsemit_sub(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
6012a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	 struct nv50_reg *src1)
6022a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
60340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
6042a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
60540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0xb0000000;
6062a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
60740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
6082a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	if (check_swap_src_0_1(pc, &src0, &src1))
60940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[1] |= 0x04000000;
6102a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	else
61140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[1] |= 0x08000000;
6122a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
61340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
61440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src0, e);
61540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_2(pc, src1, e);
6162a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
61740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
6182a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
6192a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
6202a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
6212a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsemit_mad(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
6222a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	 struct nv50_reg *src1, struct nv50_reg *src2)
6232a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
62440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
6252a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
62640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0xe0000000;
6272a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
6282a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	check_swap_src_0_1(pc, &src0, &src1);
62940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
63040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src0, e);
63140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_1(pc, src1, e);
63240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_2(pc, src2, e);
6332a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
63440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
6352a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
6362a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
6372a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic void
63821e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggsemit_msb(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src0,
63921e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	 struct nv50_reg *src1, struct nv50_reg *src2)
64021e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs{
64140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
64221e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs
64340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0xe0000000;
64440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
64540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= 0x08000000; /* src0 * src1 - src2 */
64621e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs
64721e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	check_swap_src_0_1(pc, &src0, &src1);
64840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
64940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src0, e);
65040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_1(pc, src1, e);
65140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_2(pc, src2, e);
65221e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs
65340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
65421e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs}
65521e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs
65621e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggsstatic void
6572a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsemit_flop(struct nv50_pc *pc, unsigned sub,
6582a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	  struct nv50_reg *dst, struct nv50_reg *src)
6592a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs{
66040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
6612a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
66240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0x90000000;
66352a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	if (sub) {
66440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		set_long(pc, e);
66540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		e->inst[1] |= (sub << 29);
66652a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	}
6672a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
66840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
66940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src, e);
6702a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
67140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
6722a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs}
6732a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs
674d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggsstatic void
675d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggsemit_preex2(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
676d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggs{
67740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
678d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggs
67940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0xb0000000;
680d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggs
68140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
68240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src, e);
68340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
68440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (6 << 29) | 0x00004000;
685d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggs
68640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
687d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggs}
688faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs
689bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggsstatic void
6907b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggsemit_precossin(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
6917b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs{
69240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
6937b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs
69440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0xb0000000;
6957b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs
69640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
69740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src, e);
69840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
69940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (6 << 29);
7007b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs
70140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
7027b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs}
7037b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs
7047b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggsstatic void
705bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggsemit_set(struct nv50_pc *pc, unsigned c_op, struct nv50_reg *dst,
706bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 struct nv50_reg *src0, struct nv50_reg *src1)
707bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs{
70840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
70951ea3aae03154046316b814053f7493bdb10c853Ben Skeggs	unsigned inv_cop[8] = { 0, 4, 2, 6, 1, 5, 3, 7 };
710bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	struct nv50_reg *rdst;
711bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
712bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	assert(c_op <= 7);
713bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (check_swap_src_0_1(pc, &src0, &src1))
714bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		c_op = inv_cop[c_op];
715bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
716bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	rdst = dst;
717bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (dst->type != P_TEMP)
718bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		dst = alloc_temp(pc, NULL);
719bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
720bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	/* set.u32 */
72140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
72240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0xb0000000;
72340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (3 << 29);
72440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (c_op << 14);
725bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	/*XXX: breaks things, .u32 by default?
726bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 *     decuda will disasm as .u16 and use .lo/.hi regs, but this
727bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 *     doesn't seem to match what the hw actually does.
728bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	inst[1] |= 0x04000000; << breaks things.. .u32 by default?
729bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	 */
73040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
73140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src0, e);
73240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_1(pc, src1, e);
73340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
734bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
735bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	/* cvt.f32.u32 */
73640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e = exec(pc);
73740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] = 0xa0000001;
73840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] = 0x64014780;
73940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, rdst, e);
74040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, dst, e);
74140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
742bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs
743bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	if (dst != rdst)
744bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		free_temp(pc, dst);
745bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs}
746d69f33423087fc054181c60724f4bcbe29195e08Ben Skeggs
747b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggsstatic void
748b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggsemit_flr(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
749b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs{
75040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
75140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs
75240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] = 0xa0000000; /* cvt */
75340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
75440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (6 << 29); /* cvt */
75540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= 0x08000000; /* integer mode */
75640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= 0x04000000; /* 32 bit */
75740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= ((0x1 << 3)) << 14; /* .rn */
75840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (1 << 14); /* src .f32 */
75940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
76040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src, e);
76140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs
76240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
763b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs}
764b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs
765faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggsstatic void
766faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggsemit_pow(struct nv50_pc *pc, struct nv50_reg *dst,
767faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	 struct nv50_reg *v, struct nv50_reg *e)
768faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs{
769faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	struct nv50_reg *temp = alloc_temp(pc, NULL);
770faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs
771faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	emit_flop(pc, 3, temp, v);
772faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	emit_mul(pc, temp, temp, e);
773faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	emit_preex2(pc, temp, temp);
774faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	emit_flop(pc, 6, dst, temp);
775faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs
776faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs	free_temp(pc, temp);
777faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs}
778faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs
779fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggsstatic void
780fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggsemit_abs(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
781fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs{
78240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
78340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs
78440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] = 0xa0000000; /* cvt */
78540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
78640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (6 << 29); /* cvt */
78740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= 0x04000000; /* 32 bit */
78840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (1 << 14); /* src .f32 */
78940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= ((1 << 6) << 14); /* .abs */
79040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
79140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src, e);
79240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs
79340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
794fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs}
795fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
79601e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggsstatic void
7977b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggsemit_lit(struct nv50_pc *pc, struct nv50_reg **dst, unsigned mask,
7987b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs	 struct nv50_reg **src)
79901e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs{
80001e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	struct nv50_reg *one = alloc_immd(pc, 1.0);
80101e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	struct nv50_reg *zero = alloc_immd(pc, 0.0);
80201e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	struct nv50_reg *neg128 = alloc_immd(pc, -127.999999);
80301e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	struct nv50_reg *pos128 = alloc_immd(pc,  127.999999);
80401e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	struct nv50_reg *tmp[4];
80501e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
8067b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs	if (mask & (1 << 0))
8077b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_mov(pc, dst[0], one);
8087b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs
8097b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs	if (mask & (1 << 3))
8107b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_mov(pc, dst[3], one);
8117b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs
8127b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs	if (mask & (3 << 1)) {
8137b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		if (mask & (1 << 1))
8147b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs			tmp[0] = dst[1];
8157b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		else
8167b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs			tmp[0] = temp_temp(pc);
8177b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_minmax(pc, 4, tmp[0], src[0], zero);
8187b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs	}
81901e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
8207b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs	if (mask & (1 << 2)) {
82140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		set_pred_wr(pc, 1, 0, pc->p->exec_tail);
82201e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
8237b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		tmp[1] = temp_temp(pc);
8247b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_minmax(pc, 4, tmp[1], src[1], zero);
82501e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
8267b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		tmp[3] = temp_temp(pc);
8277b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_minmax(pc, 4, tmp[3], src[3], neg128);
8287b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_minmax(pc, 5, tmp[3], tmp[3], pos128);
82901e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
8307b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_pow(pc, dst[2], tmp[1], tmp[3]);
8317b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_mov(pc, dst[2], zero);
83240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		set_pred(pc, 3, 0, pc->p->exec_tail);
8337b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs	}
8349417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller
8359417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller	FREE(pos128);
8369417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller	FREE(neg128);
8379417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller	FREE(zero);
8389417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller	FREE(one);
83901e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs}
84001e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs
84131f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggsstatic void
84231f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggsemit_neg(struct nv50_pc *pc, struct nv50_reg *dst, struct nv50_reg *src)
84331f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs{
84440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e = exec(pc);
84531f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs
84640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_long(pc, e);
84740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[0] |= 0xa0000000; /* delta */
84840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (7 << 29); /* delta */
84940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= 0x04000000; /* negate arg0? probably not */
85040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	e->inst[1] |= (1 << 14); /* src .f32 */
85140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_dst(pc, dst, e);
85240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	set_src_0(pc, src, e);
85331f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs
85440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	emit(pc, e);
85531f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs}
85631f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs
857d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggsstatic void
858d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggsemit_kil(struct nv50_pc *pc, struct nv50_reg *src)
859d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs{
860d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs	struct nv50_program_exec *e;
861d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs	const int r_pred = 1;
862d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs
863d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs	/* Sets predicate reg ? */
864d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs	e = exec(pc);
865d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs	e->inst[0] = 0xa00001fd;
866d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs	e->inst[1] = 0xc4014788;
867d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs	set_src_0(pc, src, e);
868d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs	set_pred_wr(pc, 1, r_pred, e);
869d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs	emit(pc, e);
870d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs
871d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs	/* This is probably KILP */
872d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs	e = exec(pc);
873d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs	e->inst[0] = 0x000001fe;
874d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs	set_long(pc, e);
875d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs	set_pred(pc, 1 /* LT? */, r_pred, e);
876d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs	emit(pc, e);
877d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs}
878d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs
879fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggsstatic struct nv50_reg *
880fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggstgsi_dst(struct nv50_pc *pc, int c, const struct tgsi_full_dst_register *dst)
881fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs{
882fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	switch (dst->DstRegister.File) {
883fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_FILE_TEMPORARY:
884fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		return &pc->temp[dst->DstRegister.Index * 4 + c];
885fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_FILE_OUTPUT:
886fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		return &pc->result[dst->DstRegister.Index * 4 + c];
887fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_FILE_NULL:
888fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		return NULL;
889fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	default:
890fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
891fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	}
892fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
893fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	return NULL;
894fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs}
895fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
896fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggsstatic struct nv50_reg *
897fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggstgsi_src(struct nv50_pc *pc, int chan, const struct tgsi_full_src_register *src)
898fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs{
899fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	struct nv50_reg *r = NULL;
900fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	struct nv50_reg *temp;
9019417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller	unsigned sgn, c;
9029417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller
9039417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller	sgn = tgsi_util_get_full_src_register_sign_mode(src, chan);
904fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
905fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	c = tgsi_util_get_full_src_register_extswizzle(src, chan);
906fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	switch (c) {
907fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_X:
908fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_Y:
909fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_Z:
910fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_W:
911fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		switch (src->SrcRegister.File) {
912fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		case TGSI_FILE_INPUT:
913fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			r = &pc->attr[src->SrcRegister.Index * 4 + c];
914fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			break;
915fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		case TGSI_FILE_TEMPORARY:
916fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			r = &pc->temp[src->SrcRegister.Index * 4 + c];
917fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			break;
918fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		case TGSI_FILE_CONSTANT:
919fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			r = &pc->param[src->SrcRegister.Index * 4 + c];
920fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			break;
921fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		case TGSI_FILE_IMMEDIATE:
922fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			r = &pc->immd[src->SrcRegister.Index * 4 + c];
923fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			break;
924c0ed6a871cd3513e17a1fab960f5626485ffed13Ben Skeggs		case TGSI_FILE_SAMPLER:
925c0ed6a871cd3513e17a1fab960f5626485ffed13Ben Skeggs			break;
926fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		default:
927fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			assert(0);
928fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			break;
929fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		}
930fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
931fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_ZERO:
932fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		r = alloc_immd(pc, 0.0);
9339417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		return r;
934fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_EXTSWIZZLE_ONE:
9359417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		if (sgn == TGSI_UTIL_SIGN_TOGGLE || sgn == TGSI_UTIL_SIGN_SET)
9369417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller			return alloc_immd(pc, -1.0);
9379417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		return alloc_immd(pc, 1.0);
938fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	default:
939fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		assert(0);
940fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
941fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	}
942fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
9439417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller	switch (sgn) {
944fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_UTIL_SIGN_KEEP:
945fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
946fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	case TGSI_UTIL_SIGN_CLEAR:
947fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		temp = temp_temp(pc);
948fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		emit_abs(pc, temp, r);
949fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		r = temp;
950fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
95131f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs	case TGSI_UTIL_SIGN_TOGGLE:
95231f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs		temp = temp_temp(pc);
95331f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs		emit_neg(pc, temp, r);
95431f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs		r = temp;
95531f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs		break;
95631f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs	case TGSI_UTIL_SIGN_SET:
95731f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs		temp = temp_temp(pc);
95831f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs		emit_abs(pc, temp, r);
95931f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs		emit_neg(pc, temp, r);
96031f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs		r = temp;
96131f6a24b59b0ac18e04336d2e3cbaa643358c88aBen Skeggs		break;
962fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	default:
963fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		assert(0);
964fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs		break;
965fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	}
966fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
967fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs	return r;
968fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs}
969fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs
9702a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggsstatic boolean
971f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_tx_insn(struct nv50_pc *pc, const union tgsi_full_token *tok)
972f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
973f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	const struct tgsi_full_instruction *inst = &tok->FullInstruction;
974688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	struct nv50_reg *rdst[4], *dst[4], *src[3][4], *temp;
975cd5d3fde13e424373feac9098453ed0ca7f6e4ebBen Skeggs	unsigned mask, sat, unit;
976f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	int i, c;
977f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
978f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	mask = inst->FullDstRegisters[0].DstRegister.WriteMask;
979688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	sat = inst->Instruction.Saturate == TGSI_SAT_ZERO_ONE;
980f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
981f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (c = 0; c < 4; c++) {
982f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (mask & (1 << c))
983f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			dst[c] = tgsi_dst(pc, c, &inst->FullDstRegisters[0]);
984f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		else
985f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			dst[c] = NULL;
9869417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		rdst[c] = NULL;
9879417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		src[0][c] = NULL;
9889417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		src[1][c] = NULL;
9899417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		src[2][c] = NULL;
990f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
991f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
992f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	for (i = 0; i < inst->Instruction.NumSrcRegs; i++) {
9935069bfed29bcee2c89c36c74c6d65d388eb7792eZack Rusin		const struct tgsi_full_src_register *fs = &inst->FullSrcRegisters[i];
994cd5d3fde13e424373feac9098453ed0ca7f6e4ebBen Skeggs
995cd5d3fde13e424373feac9098453ed0ca7f6e4ebBen Skeggs		if (fs->SrcRegister.File == TGSI_FILE_SAMPLER)
996cd5d3fde13e424373feac9098453ed0ca7f6e4ebBen Skeggs			unit = fs->SrcRegister.Index;
997cd5d3fde13e424373feac9098453ed0ca7f6e4ebBen Skeggs
998f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (c = 0; c < 4; c++)
999cd5d3fde13e424373feac9098453ed0ca7f6e4ebBen Skeggs			src[i][c] = tgsi_src(pc, c, fs);
1000f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1001f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1002688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	if (sat) {
1003688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs		for (c = 0; c < 4; c++) {
1004688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			rdst[c] = dst[c];
1005688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			dst[c] = temp_temp(pc);
1006688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs		}
1007688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	}
1008688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs
1009f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	switch (inst->Instruction.Opcode) {
101068091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs	case TGSI_OPCODE_ABS:
101168091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs		for (c = 0; c < 4; c++) {
1012fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			if (!(mask & (1 << c)))
1013fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs				continue;
1014fe90cc509f75772ce202930c934bade1d4b116c8Ben Skeggs			emit_abs(pc, dst[c], src[0][c]);
101568091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs		}
101668091b0c89310c309b668c9d6d80640dc6040ab7Ben Skeggs		break;
10172a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_ADD:
10187df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
10197df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
10207df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
10212a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_add(pc, dst[c], src[0][c], src[1][c]);
10227df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
10232a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
10242a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_COS:
10259417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		temp = temp_temp(pc);
10267b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_precossin(pc, temp, src[0][0]);
10277b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_flop(pc, 5, temp, temp);
10287df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
10297df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
10307df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
10317b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs			emit_mov(pc, dst[c], temp);
10327df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
10332a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
10342a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_DP3:
10359417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		temp = temp_temp(pc);
10362a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mul(pc, temp, src[0][0], src[1][0]);
10372a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][1], src[1][1], temp);
10382a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][2], src[1][2], temp);
10397df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
10407df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
10417df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
10422a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mov(pc, dst[c], temp);
10437df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
10442a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
10452a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_DP4:
10469417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		temp = temp_temp(pc);
10472a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mul(pc, temp, src[0][0], src[1][0]);
10482a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][1], src[1][1], temp);
10492a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][2], src[1][2], temp);
10502a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		emit_mad(pc, temp, src[0][3], src[1][3], temp);
10517df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
10527df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
10537df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
10542a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mov(pc, dst[c], temp);
10557df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
10562a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
105721e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	case TGSI_OPCODE_DPH:
10589417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		temp = temp_temp(pc);
105921e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mul(pc, temp, src[0][0], src[1][0]);
106021e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mad(pc, temp, src[0][1], src[1][1], temp);
106121e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_mad(pc, temp, src[0][2], src[1][2], temp);
106221e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		emit_add(pc, temp, src[1][3], temp);
106321e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		for (c = 0; c < 4; c++) {
106421e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs			if (!(mask & (1 << c)))
106521e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs				continue;
106621e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs			emit_mov(pc, dst[c], temp);
106721e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		}
106821e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		break;
106933e4d30d50344be26398a51365bea1be37487403Ben Skeggs	case TGSI_OPCODE_DST:
107033e4d30d50344be26398a51365bea1be37487403Ben Skeggs	{
107133e4d30d50344be26398a51365bea1be37487403Ben Skeggs		struct nv50_reg *one = alloc_immd(pc, 1.0);
10729a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 0))
10739a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mov(pc, dst[0], one);
10749a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 1))
10759a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mul(pc, dst[1], src[0][1], src[1][1]);
10769a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 2))
10779a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mov(pc, dst[2], src[0][2]);
10789a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 3))
10799a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mov(pc, dst[3], src[1][3]);
108033e4d30d50344be26398a51365bea1be37487403Ben Skeggs		FREE(one);
108133e4d30d50344be26398a51365bea1be37487403Ben Skeggs	}
108233e4d30d50344be26398a51365bea1be37487403Ben Skeggs		break;
10832a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_EX2:
10849417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		temp = temp_temp(pc);
10857b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_preex2(pc, temp, src[0][0]);
10867b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_flop(pc, 6, temp, temp);
10877df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
10887df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
10897df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
10907b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs			emit_mov(pc, dst[c], temp);
10917df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
10922a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
1093b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs	case TGSI_OPCODE_FLR:
1094b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		for (c = 0; c < 4; c++) {
1095b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			if (!(mask & (1 << c)))
1096b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs				continue;
1097b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			emit_flr(pc, dst[c], src[0][c]);
1098b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		}
1099b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		break;
1100b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs	case TGSI_OPCODE_FRC:
11019417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		temp = temp_temp(pc);
1102b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		for (c = 0; c < 4; c++) {
1103b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			if (!(mask & (1 << c)))
1104b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs				continue;
1105b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			emit_flr(pc, temp, src[0][c]);
1106b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs			emit_sub(pc, dst[c], src[0][c], temp);
1107b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		}
1108b4f7463585071236d633e4c857dbbdf67b03dc94Ben Skeggs		break;
1109d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs	case TGSI_OPCODE_KIL:
1110d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs		emit_kil(pc, src[0][0]);
1111d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs		emit_kil(pc, src[0][1]);
1112d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs		emit_kil(pc, src[0][2]);
1113d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs		emit_kil(pc, src[0][3]);
1114d2442016afdc5e3b12b04d912f005ab183f7b8ffBen Skeggs		break;
111501e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs	case TGSI_OPCODE_LIT:
11167b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_lit(pc, &dst[0], mask, &src[0][0]);
111701e36eb531dfb4b1b3fd38d3fc00c6770833b5eaBen Skeggs		break;
11182a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_LG2:
11199417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		temp = temp_temp(pc);
11207b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_flop(pc, 3, temp, src[0][0]);
11217df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
11227df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
11237df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
11247b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs			emit_mov(pc, dst[c], temp);
11257df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
11262a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
112721e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs	case TGSI_OPCODE_LRP:
1128229992d2812581ffae24d69a5a983d2c8441f720Christoph Bumiller		temp = temp_temp(pc);
112921e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs		for (c = 0; c < 4; c++) {
113021e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs			if (!(mask & (1 << c)))
113121e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs				continue;
1132229992d2812581ffae24d69a5a983d2c8441f720Christoph Bumiller			emit_sub(pc, temp, src[1][c], src[2][c]);
1133229992d2812581ffae24d69a5a983d2c8441f720Christoph Bumiller			emit_mad(pc, dst[c], temp, src[0][c], src[2][c]);
113421e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs		}
113521e688e0a3faeef18b07c4d860bd71cc6e3ddf4aBen Skeggs		break;
11362a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_MAD:
11377df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
11387df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
11397df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
11402a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mad(pc, dst[c], src[0][c], src[1][c], src[2][c]);
11417df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
11422a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
114352a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	case TGSI_OPCODE_MAX:
11447df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
11457df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
11467df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
114752a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs			emit_minmax(pc, 4, dst[c], src[0][c], src[1][c]);
11487df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
114952a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs		break;
115052a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	case TGSI_OPCODE_MIN:
11517df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
11527df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
11537df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
115452a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs			emit_minmax(pc, 5, dst[c], src[0][c], src[1][c]);
11557df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
115652a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs		break;
1157f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_OPCODE_MOV:
11587df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
11597df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
11607df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
116155b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs			emit_mov(pc, dst[c], src[0][c]);
11627df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
116338ce697e5942550888c28bd4859ca2a92f247bf7Ben Skeggs		break;
11642a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_MUL:
11657df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
11667df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
11677df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
11682a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_mul(pc, dst[c], src[0][c], src[1][c]);
11697df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
11702a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
1171ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs	case TGSI_OPCODE_POW:
11729417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		temp = temp_temp(pc);
1173faa1c02546db00f69c66db18076b5b0ac86d7138Ben Skeggs		emit_pow(pc, temp, src[0][0], src[1][0]);
1174ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		for (c = 0; c < 4; c++) {
1175ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs			if (!(mask & (1 << c)))
1176ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs				continue;
1177ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs			emit_mov(pc, dst[c], temp);
1178ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		}
1179ea4b09cbcbd9db82648ab30f18c0f46a66ab9f69Ben Skeggs		break;
11802a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_RCP:
11817df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
11827df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
11837df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
11847b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs			emit_flop(pc, 0, dst[c], src[0][0]);
11857df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
11862a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
11872a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_RSQ:
11887df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
11897df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
11907df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
11917b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs			emit_flop(pc, 2, dst[c], src[0][0]);
11927df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
11932a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
11947b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs	case TGSI_OPCODE_SCS:
11959417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		temp = temp_temp(pc);
11967b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_precossin(pc, temp, src[0][0]);
11977b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		if (mask & (1 << 0))
11987b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs			emit_flop(pc, 5, dst[0], temp);
11997b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		if (mask & (1 << 1))
12007b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs			emit_flop(pc, 4, dst[1], temp);
12014a7cf8f66ff5d7e15ae7f8f5542f27bc72c68709Christoph Bumiller		if (mask & (1 << 2))
12024a7cf8f66ff5d7e15ae7f8f5542f27bc72c68709Christoph Bumiller			emit_mov_immdval(pc, dst[2], 0.0);
12034a7cf8f66ff5d7e15ae7f8f5542f27bc72c68709Christoph Bumiller		if (mask & (1 << 3))
12044a7cf8f66ff5d7e15ae7f8f5542f27bc72c68709Christoph Bumiller			emit_mov_immdval(pc, dst[3], 1.0);
12057b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		break;
1206bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	case TGSI_OPCODE_SGE:
1207bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		for (c = 0; c < 4; c++) {
1208bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			if (!(mask & (1 << c)))
1209bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs				continue;
1210bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			emit_set(pc, 6, dst[c], src[0][c], src[1][c]);
1211bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		}
1212bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		break;
12132a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_SIN:
12149417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		temp = temp_temp(pc);
12157b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_precossin(pc, temp, src[0][0]);
12167b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs		emit_flop(pc, 4, temp, temp);
12177df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
12187df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
12197df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
12207b7df34781844c39998d60bbb60880d960da3fb1Ben Skeggs			emit_mov(pc, dst[c], temp);
12217df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
12222a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
1223bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs	case TGSI_OPCODE_SLT:
1224bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		for (c = 0; c < 4; c++) {
1225bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			if (!(mask & (1 << c)))
1226bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs				continue;
1227bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs			emit_set(pc, 1, dst[c], src[0][c], src[1][c]);
1228bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		}
1229bdd31c20abb27665ca701a5a46e29d4cfa71f679Ben Skeggs		break;
12302a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs	case TGSI_OPCODE_SUB:
12317df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		for (c = 0; c < 4; c++) {
12327df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs			if (!(mask & (1 << c)))
12337df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs				continue;
12342a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs			emit_sub(pc, dst[c], src[0][c], src[1][c]);
12357df7f7bb99441ed8e2fba2840e0459e72691f272Ben Skeggs		}
12362a1fb44d75364f2492a1ae5d232218a92b8ca807Ben Skeggs		break;
1237c0ed6a871cd3513e17a1fab960f5626485ffed13Ben Skeggs	case TGSI_OPCODE_TEX:
12385696267efd6f85d79f5fe511d1a066a17c4d1cccBen Skeggs	case TGSI_OPCODE_TXP:
12390d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs	{
12400d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs		struct nv50_reg *t[4];
12410d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs		struct nv50_program_exec *e;
1242431504b99cd55948522e86a249e656e78598ddbdBen Skeggs
12430d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs		alloc_temp4(pc, t, 0);
12440d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs		emit_mov(pc, t[0], src[0][0]);
12450d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs		emit_mov(pc, t[1], src[0][1]);
1246431504b99cd55948522e86a249e656e78598ddbdBen Skeggs
12470d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs		e = exec(pc);
12480d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs		e->inst[0] = 0xf6400000;
1249cd5d3fde13e424373feac9098453ed0ca7f6e4ebBen Skeggs		e->inst[0] |= (unit << 9);
12500d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs		set_long(pc, e);
12510d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs		e->inst[1] |= 0x0000c004;
12520d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs		set_dst(pc, t[0], e);
12530d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs		emit(pc, e);
1254fd7412a7f1beab8b81ce307b1054331eee102e8bBen Skeggs
12550d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs		if (mask & (1 << 0)) emit_mov(pc, dst[0], t[0]);
12560d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs		if (mask & (1 << 1)) emit_mov(pc, dst[1], t[1]);
12570d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs		if (mask & (1 << 2)) emit_mov(pc, dst[2], t[2]);
12580d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs		if (mask & (1 << 3)) emit_mov(pc, dst[3], t[3]);
1259fd7412a7f1beab8b81ce307b1054331eee102e8bBen Skeggs
12600d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs		free_temp4(pc, t);
12610d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs	}
1262c0ed6a871cd3513e17a1fab960f5626485ffed13Ben Skeggs		break;
126321e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs	case TGSI_OPCODE_XPD:
12649417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		temp = temp_temp(pc);
12659a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 0)) {
12669a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mul(pc, temp, src[0][2], src[1][1]);
12679a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_msb(pc, dst[0], src[0][1], src[1][2], temp);
12689a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		}
12699a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 1)) {
12709a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mul(pc, temp, src[0][0], src[1][2]);
12719a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_msb(pc, dst[1], src[0][2], src[1][0], temp);
12729a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		}
12739a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		if (mask & (1 << 2)) {
12749a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_mul(pc, temp, src[0][1], src[1][0]);
12759a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs			emit_msb(pc, dst[2], src[0][0], src[1][1], temp);
12769a37a56c8ab8c64bdadb1e1e807f885d6a5e3121Ben Skeggs		}
12774a7cf8f66ff5d7e15ae7f8f5542f27bc72c68709Christoph Bumiller		if (mask & (1 << 3))
12784a7cf8f66ff5d7e15ae7f8f5542f27bc72c68709Christoph Bumiller			emit_mov_immdval(pc, dst[3], 1.0);
127921e18e2b74d71c93af06ef4c603ca371c4614237Ben Skeggs		break;
1280f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	case TGSI_OPCODE_END:
1281f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		break;
1282f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	default:
1283f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		NOUVEAU_ERR("invalid opcode %d\n", inst->Instruction.Opcode);
1284f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return FALSE;
1285f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1286f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1287688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	if (sat) {
1288688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs		for (c = 0; c < 4; c++) {
128940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			struct nv50_program_exec *e;
1290688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs
1291688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs			if (!(mask & (1 << c)))
1292688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs				continue;
129340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e = exec(pc);
129440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs
129540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e->inst[0] = 0xa0000000; /* cvt */
129640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			set_long(pc, e);
129740137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e->inst[1] |= (6 << 29); /* cvt */
129840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e->inst[1] |= 0x04000000; /* 32 bit */
129940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e->inst[1] |= (1 << 14); /* src .f32 */
130040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			e->inst[1] |= ((1 << 5) << 14); /* .sat */
130140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			set_dst(pc, rdst[c], e);
130240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			set_src_0(pc, dst[c], e);
130340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs			emit(pc, e);
1304688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs		}
1305688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs	}
1306688064236ba8b5997014493eb6c6e3fe0739813eBen Skeggs
13079417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller	for (i = 0; i < inst->Instruction.NumSrcRegs; i++) {
13089417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		for (c = 0; c < 4; c++) {
13099417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller			if (!src[i][c])
13109417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller				continue;
13119417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller			if (src[i][c]->index == -1 && src[i][c]->type == P_IMMD)
13129417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller				FREE(src[i][c]);
13139417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		}
13149417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller	}
13159417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller
131652a69196c1680ff16d1ad1fc88e5869bc6055d00Ben Skeggs	kill_temp_temp(pc);
1317f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return TRUE;
1318f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1319f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
/*
 * Preparation pass run before instruction translation.
 *
 * Walks every TGSI token once: immediates are handed to ctor_immd(), and
 * for each declaration the highest declared index (Last + 1) is recorded
 * per register file in pc->temp_nr / result_nr / attr_nr / param_nr.
 * Afterwards the per-file nv50_reg arrays are allocated (four components
 * per register) and initialised.
 *
 * pc->immd_nr is only read here; presumably ctor_immd() maintains it --
 * confirm against its definition.
 *
 * Returns TRUE on success, FALSE on an unknown declaration file or when an
 * array allocation fails.  The parse context is always released.
 */
1320f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic boolean
1321f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_tx_prep(struct nv50_pc *pc)
1322f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1323f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct tgsi_parse_context p;
1324f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	boolean ret = FALSE;
1325f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	unsigned i, c;
1326f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
	/* Scan all tokens: collect immediates and size each register file. */
1327f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_init(&p, pc->p->pipe.tokens);
1328f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	while (!tgsi_parse_end_of_tokens(&p)) {
1329f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		const union tgsi_full_token *tok = &p.FullToken;
1330f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1331f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		tgsi_parse_token(&p);
1332f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		switch (tok->Token.Type) {
1333f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_IMMEDIATE:
1334f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		{
1335f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			const struct tgsi_full_immediate *imm =
1336f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				&p.FullToken.FullImmediate;
1337f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
			/* All four float components are always passed on. */
133833e4d30d50344be26398a51365bea1be37487403Ben Skeggs			ctor_immd(pc, imm->u.ImmediateFloat32[0].Float,
133933e4d30d50344be26398a51365bea1be37487403Ben Skeggs				      imm->u.ImmediateFloat32[1].Float,
134033e4d30d50344be26398a51365bea1be37487403Ben Skeggs				      imm->u.ImmediateFloat32[2].Float,
134133e4d30d50344be26398a51365bea1be37487403Ben Skeggs				      imm->u.ImmediateFloat32[3].Float);
1342f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1343f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1344f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_DECLARATION:
1345f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		{
1346f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			const struct tgsi_full_declaration *d;
1347f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			unsigned last;
1348f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1349f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			d = &p.FullToken.FullDeclaration;
1350bf94027fdde51aed476e9bfdd4326aa9040440b0Ben Skeggs			last = d->DeclarationRange.Last;
1351f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
			/* Grow the matching register count to cover 'last'. */
1352f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			switch (d->Declaration.File) {
1353f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_TEMPORARY:
1354f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->temp_nr < (last + 1))
1355f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->temp_nr = last + 1;
1356f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
1357f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_OUTPUT:
1358f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->result_nr < (last + 1))
1359f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->result_nr = last + 1;
1360f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
1361f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_INPUT:
1362f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->attr_nr < (last + 1))
1363f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->attr_nr = last + 1;
1364f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
1365f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			case TGSI_FILE_CONSTANT:
1366f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				if (pc->param_nr < (last + 1))
1367f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					pc->param_nr = last + 1;
1368f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				break;
			/* Sampler declarations are accepted but need no bookkeeping here. */
1369c0ed6a871cd3513e17a1fab960f5626485ffed13Ben Skeggs			case TGSI_FILE_SAMPLER:
1370c0ed6a871cd3513e17a1fab960f5626485ffed13Ben Skeggs				break;
1371f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			default:
1372f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				NOUVEAU_ERR("bad decl file %d\n",
1373f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs					    d->Declaration.File);
1374f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				goto out_err;
1375f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1376f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1377f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
		/* Instructions are handled by the later translation pass. */
1378f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_INSTRUCTION:
1379f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1380f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		default:
1381f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1382f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1383f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1384f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
	/*
	 * Temporaries: type P_TEMP, hw = -1 (presumably "no hardware register
	 * assigned yet" -- confirm against the register allocator).
	 */
1385f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->temp_nr) {
1386861629d1fd4a1d256c913470c33d9522e83d615dBen Skeggs		pc->temp = CALLOC(pc->temp_nr * 4, sizeof(struct nv50_reg));
1387f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->temp)
1388f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1389f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1390f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->temp_nr; i++) {
1391f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1392f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->temp[i*4+c].type = P_TEMP;
1393f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->temp[i*4+c].hw = -1;
1394f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->temp[i*4+c].index = i;
1395f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1396f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1397f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1398f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
	/* Inputs: handled differently for fragment and non-fragment programs. */
1399f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->attr_nr) {
1400fa5cd63f96d2b69ded48d40b9cb7e57c147f7332Ben Skeggs		struct nv50_reg *iv = NULL;
1401f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		int aid = 0;
1402f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1403861629d1fd4a1d256c913470c33d9522e83d615dBen Skeggs		pc->attr = CALLOC(pc->attr_nr * 4, sizeof(struct nv50_reg));
1404f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->attr)
1405f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1406f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
		/*
		 * Fragment programs: iv is a scratch temp filled by emit_interp()
		 * and then run through emit_flop() op 0; it is passed as the last
		 * argument of every per-component emit_interp() below (presumably
		 * the 1/w perspective factor -- confirm against those helpers).
		 * NOTE(review): alloc_temp()'s result is used without a NULL check.
		 * aid is only consumed in the non-fragment branch below, so the
		 * increment here has no visible effect in this function.
		 */
1407b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs		if (pc->p->type == PIPE_SHADER_FRAGMENT) {
14088ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			iv = alloc_temp(pc, NULL);
14095a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs			emit_interp(pc, iv, iv, NULL);
1410fa5cd63f96d2b69ded48d40b9cb7e57c147f7332Ben Skeggs			emit_flop(pc, 0, iv, iv);
14118ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			aid++;
14128ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		}
14138ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
1414f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->attr_nr; i++) {
14158ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			struct nv50_reg *a = &pc->attr[i*4];
14168ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
1417f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
					/*
					 * Fragment: the attribute slot becomes a copy of a
					 * freshly allocated temp (type, hw and index).
					 * NOTE(review): 'at' is dereferenced without a
					 * NULL check.
					 */
1418b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs				if (pc->p->type == PIPE_SHADER_FRAGMENT) {
14198ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					struct nv50_reg *at =
14208ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs						alloc_temp(pc, NULL);
14218ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].type = at->type;
14228ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].hw = at->hw;
14238ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].index = at->index;
14248ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				} else {
					/*
					 * Otherwise: sequential attribute id, with the
					 * matching bit set in the cfg.vp.attr bitmask.
					 */
14258ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->p->cfg.vp.attr[aid/32] |=
14268ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs						(1 << (aid % 32));
14278ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].type = P_ATTR;
14288ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].hw = aid++;
14298ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->attr[i*4+c].index = i;
14308ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				}
1431f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
14328ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
1433b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs			if (pc->p->type != PIPE_SHADER_FRAGMENT)
14348ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs				continue;
14358ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
			/* Fragment only: interpolate each component in place using iv. */
14365a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs			emit_interp(pc, &a[0], &a[0], iv);
14375a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs			emit_interp(pc, &a[1], &a[1], iv);
14385a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs			emit_interp(pc, &a[2], &a[2], iv);
14395a3ea9ee59ac586955f7784eb25e7fd70d0c8882Ben Skeggs			emit_interp(pc, &a[3], &a[3], iv);
1440f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
14418ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs
14428ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs		if (iv)
14438ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs			free_temp(pc, iv);
1444f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1445f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
	/*
	 * Outputs: fragment programs get P_TEMP registers with hw = -1, other
	 * program types get P_RESULT registers with sequential hw ids.
	 */
1446f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->result_nr) {
1447f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		int rid = 0;
1448f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1449861629d1fd4a1d256c913470c33d9522e83d615dBen Skeggs		pc->result = CALLOC(pc->result_nr * 4, sizeof(struct nv50_reg));
1450f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->result)
1451f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1452f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1453f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->result_nr; i++) {
1454f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1455b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs				if (pc->p->type == PIPE_SHADER_FRAGMENT) {
14568ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->result[i*4+c].type = P_TEMP;
1457776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs					pc->result[i*4+c].hw = -1;
1458776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs				} else {
14598ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs					pc->result[i*4+c].type = P_RESULT;
1460776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs					pc->result[i*4+c].hw = rid++;
1461776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs				}
1462f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->result[i*4+c].index = i;
1463f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1464f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1465f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1466f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
	/* Constants: P_CONST registers numbered sequentially from 0. */
1467f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->param_nr) {
1468f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		int rid = 0;
1469f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1470861629d1fd4a1d256c913470c33d9522e83d615dBen Skeggs		pc->param = CALLOC(pc->param_nr * 4, sizeof(struct nv50_reg));
1471f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->param)
1472f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1473f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1474f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->param_nr; i++) {
1475f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1476f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->param[i*4+c].type = P_CONST;
1477f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->param[i*4+c].hw = rid++;
1478f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->param[i*4+c].index = i;
1479f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1480f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1481f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1482f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
	/*
	 * Immediates: P_IMMD registers numbered directly after the
	 * pc->param_nr * 4 constant slots.
	 */
1483f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (pc->immd_nr) {
1484aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs		int rid = pc->param_nr * 4;
1485f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1486861629d1fd4a1d256c913470c33d9522e83d615dBen Skeggs		pc->immd = CALLOC(pc->immd_nr * 4, sizeof(struct nv50_reg));
1487f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!pc->immd)
1488f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			goto out_err;
1489f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1490f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		for (i = 0; i < pc->immd_nr; i++) {
1491f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			for (c = 0; c < 4; c++) {
1492f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->immd[i*4+c].type = P_IMMD;
1493f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->immd[i*4+c].hw = rid++;
1494f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				pc->immd[i*4+c].index = i;
1495f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			}
1496f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1497f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1498f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1499f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	ret = TRUE;
	/*
	 * Arrays allocated above are not released here on failure; the caller
	 * nv50_program_tx() frees them through free_nv50_pc().
	 */
1500f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsout_err:
1501f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_free(&p);
1502f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return ret;
1503f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1504f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
/*
 * Release a translation context and the register arrays hanging off it.
 *
 * Frees pc->immd, pc->param, pc->result, pc->attr and pc->temp when set,
 * then every pc->r_temp[] entry whose index is -1, and finally pc itself.
 * pc->immd_buf is not freed here; nv50_program_tx() copies that pointer
 * into the program on success.
 * NOTE(review): on a failed translation nothing visible here releases
 * pc->immd_buf -- confirm whether that path leaks.
 */
15059417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumillerstatic void
15069417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumillerfree_nv50_pc(struct nv50_pc *pc)
15079417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller{
15089417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller	unsigned i;
15099417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller
15109417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller	if (pc->immd)
15119417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		FREE(pc->immd);
15129417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller	if (pc->param)
15139417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		FREE(pc->param);
15149417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller	if (pc->result)
15159417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		FREE(pc->result);
15169417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller	if (pc->attr)
15179417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		FREE(pc->attr);
15189417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller	if (pc->temp)
15199417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		FREE(pc->temp);
15209417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller
	/*
	 * Only r_temp entries with index == -1 are freed individually
	 * (presumably those are the heap-allocated ones, the others pointing
	 * into the arrays released above -- confirm against alloc_temp).
	 */
15219417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller	for (i = 0; i < NV50_SU_MAX_TEMP; i++) {
15229417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		/* deallocate fragment program attributes */
15239417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller		if (pc->r_temp[i] && pc->r_temp[i]->index == -1)
15249417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller			FREE(pc->r_temp[i]);
15259417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller	}
15269417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller
15279417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller	FREE(pc);
15289417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller}
15299417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller
/*
 * Translate the TGSI token stream of program p.
 *
 * Allocates a temporary nv50_pc context, runs nv50_program_tx_prep(), then
 * feeds every instruction token to nv50_program_tx_insn().  For fragment
 * programs a final run of moves copies each result component into the
 * P_TEMP register whose hw number equals the component's position.  On
 * success the constant/immediate counts and the immediate buffer pointer
 * are stored in p.
 *
 * Returns TRUE on success, FALSE if the context cannot be allocated or if
 * the preparation pass or any instruction translation fails.  The context
 * is always released through free_nv50_pc() before returning.
 */
1530f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic boolean
1531f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_tx(struct nv50_program *p)
1532f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1533f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct tgsi_parse_context parse;
1534f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_pc *pc;
1535f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	boolean ret;
1536f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1537f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	pc = CALLOC_STRUCT(nv50_pc);
1538f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (!pc)
1539f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		return FALSE;
1540f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	pc->p = p;
15418ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	pc->p->cfg.high_temp = 4;
1542f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
	/*
	 * A failed preparation pass jumps past out_err because 'parse' has
	 * not been initialised yet and must not be freed.
	 */
1543f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	ret = nv50_program_tx_prep(pc);
1544f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (ret == FALSE)
1545f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		goto out_cleanup;
1546f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
	/* Second walk over the tokens: only instruction tokens are translated. */
1547f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_init(&parse, pc->p->pipe.tokens);
1548f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	while (!tgsi_parse_end_of_tokens(&parse)) {
1549f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		const union tgsi_full_token *tok = &parse.FullToken;
1550f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1551f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		tgsi_parse_token(&parse);
1552f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1553f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		switch (tok->Token.Type) {
1554f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		case TGSI_TOKEN_TYPE_INSTRUCTION:
1555f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			ret = nv50_program_tx_insn(pc, tok);
1556f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			if (ret == FALSE)
1557f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs				goto out_err;
1558f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1559f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		default:
1560f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			break;
1561f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		}
1562f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1563f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
	/*
	 * Fragment programs: move result component n into P_TEMP hw register n.
	 * NOTE(review): only out.type and out.hw are initialised; confirm that
	 * emit_mov() reads no other field of the destination register.
	 */
1564b5bbf09c42a9d563984fad875ced5c4814033a3dBen Skeggs	if (p->type == PIPE_SHADER_FRAGMENT) {
1565776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs		struct nv50_reg out;
1566776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs
1567776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs		out.type = P_TEMP;
1568776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs		for (out.hw = 0; out.hw < pc->result_nr * 4; out.hw++)
1569776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs			emit_mov(pc, &out, &pc->result[out.hw]);
1570776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs	}
1571776e9581d16fc0fd28058fbcd879756fd5d40b96Ben Skeggs
	/*
	 * Set bit 0 in the second word of the last instruction (presumably the
	 * end-of-program marker -- confirm against the hardware docs).
	 * NOTE(review): the assertion tests exec_tail for is_long() but
	 * exec_head for is_immd(); exec_tail may have been intended for both.
	 * It also dereferences exec_tail, which is assumed to be non-NULL.
	 */
157240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	assert(is_long(pc->p->exec_tail) && !is_immd(pc->p->exec_head));
157340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	pc->p->exec_tail->inst[1] |= 0x00000001;
157440137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs
	/*
	 * Counts are stored per component (registers * 4).  The immediate
	 * buffer pointer is handed to p; free_nv50_pc() does not free it.
	 */
1575aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	p->param_nr = pc->param_nr * 4;
1576f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->immd_nr = pc->immd_nr * 4;
1577f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->immd = pc->immd_buf;
1578f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1579f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsout_err:
1580f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	tgsi_parse_free(&parse);
1581f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1582f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsout_cleanup:
15839417582f39788476e1039df3f1bdf681686fb7b4Christoph Bumiller	free_nv50_pc(pc);
1584f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	return ret;
1585f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1586f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
/*
 * Translate program p and mark it as translated.
 *
 * The nv50 argument is not used in this function.
 * NOTE(review): a translation failure is only caught by assert(0); when
 * assertions are compiled out (NDEBUG) p->translated is still set to TRUE
 * after a failed translation.
 */
1587f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsstatic void
1588f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_validate(struct nv50_context *nv50, struct nv50_program *p)
1589f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1590e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs	if (nv50_program_tx(p) == FALSE)
1591e55964099b0d47dea80920765daac09b9e2a61a7Ben Skeggs		assert(0);
1592f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->translated = TRUE;
1593f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1594f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
/*
 * Push 'count' values from 'map' to the hardware through the channel's
 * ring, beginning at offset 'start'.
 *
 * The data is sent in chunks of at most 2047 values.  Each chunk is
 * preceded by method 0x0f00 carrying NV50_CB_PMISC combined with the
 * current start offset shifted left by 8, followed by method 0x40000f04
 * with the chunk's values.  (The exact meaning of the two method numbers
 * is not visible here -- presumably buffer/offset select and a
 * non-incrementing data port; confirm against the hardware docs.)
 */
159522e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsstatic void
1596ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggsnv50_program_upload_data(struct nv50_context *nv50, float *map,
1597ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs			 unsigned start, unsigned count)
1598ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs{
159975f0b38d9ea4a7318b0d661712dda15e24707395Ben Skeggs	struct nouveau_channel *chan = nv50->screen->nvws->channel;
160075f0b38d9ea4a7318b0d661712dda15e24707395Ben Skeggs	struct nouveau_grobj *tesla = nv50->screen->tesla;
160175f0b38d9ea4a7318b0d661712dda15e24707395Ben Skeggs
1602ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs	while (count) {
		/* Cap each packet at 2047 values. */
1603ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs		unsigned nr = count > 2047 ? 2047 : count;
1604ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs
160575f0b38d9ea4a7318b0d661712dda15e24707395Ben Skeggs		BEGIN_RING(chan, tesla, 0x00000f00, 1);
160675f0b38d9ea4a7318b0d661712dda15e24707395Ben Skeggs		OUT_RING  (chan, (NV50_CB_PMISC << 0) | (start << 8));
160775f0b38d9ea4a7318b0d661712dda15e24707395Ben Skeggs		BEGIN_RING(chan, tesla, 0x40000f04, nr);
160875f0b38d9ea4a7318b0d661712dda15e24707395Ben Skeggs		OUT_RINGp (chan, map, nr);
1609ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs
		/* Advance source pointer and destination offset past this chunk. */
1610ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs		map += nr;
1611ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs		start += nr;
1612ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs		count -= nr;
1613ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs	}
1614ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs}
1615ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs
/*
 * Make sure program p has a data allocation and upload its constants and
 * immediates into it.
 *
 * If p has no allocation yet and needs param_nr + immd_nr slots, space is
 * requested from the screen's vp_data_heap.  When the first request fails,
 * other entries in the heap are released until the heap reports enough
 * room, and the request is retried.  Constants are read from the mapped
 * constant buffer for p->type and written at p->data->start; immediates
 * follow directly after them.
 */
1616ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggsstatic void
161722e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsnv50_program_validate_data(struct nv50_context *nv50, struct nv50_program *p)
161822e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs{
1619aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	struct nouveau_winsys *nvws = nv50->screen->nvws;
1620aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	struct pipe_winsys *ws = nv50->pipe.winsys;
1621aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	unsigned nr = p->param_nr + p->immd_nr;
162222e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
1623aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	if (!p->data && nr) {
1624aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs		struct nouveau_resource *heap = nv50->screen->vp_data_heap;
1625aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs
		/* A non-zero return from res_alloc is treated as failure. */
1626aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs		if (nvws->res_alloc(heap, nr, p, &p->data)) {
			/*
			 * Evict the program owning the next heap entry until the
			 * heap's size field reaches nr or no entry is left.
			 */
1627aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs			while (heap->next && heap->size < nr) {
1628aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs				struct nv50_program *evict = heap->next->priv;
1629aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs				nvws->res_free(&evict->data);
1630aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs			}
1631aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs
			/*
			 * NOTE(review): a second failure is only caught by assert(0);
			 * with assertions compiled out p->data may not be valid when
			 * it is dereferenced below.
			 */
1632aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs			if (nvws->res_alloc(heap, nr, p, &p->data))
1633aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs				assert(0);
1634aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs		}
1635aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	}
1636aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs
	/*
	 * Upload the constants from the constant buffer bound for p->type.
	 * NOTE(review): the buffer_map() result is passed on without a NULL
	 * check.
	 */
1637aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	if (p->param_nr) {
1638aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs		float *map = ws->buffer_map(ws, nv50->constbuf[p->type],
1639aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs					    PIPE_BUFFER_USAGE_CPU_READ);
1640ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs		nv50_program_upload_data(nv50, map, p->data->start,
1641ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs					 p->param_nr);
1642aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs		ws->buffer_unmap(ws, nv50->constbuf[p->type]);
1643aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	}
1644aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs
	/* Immediates are placed right after the param_nr constant slots. */
1645ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs	if (p->immd_nr) {
1646ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs		nv50_program_upload_data(nv50, p->immd,
1647ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs					 p->data->start + p->param_nr,
1648ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs					 p->immd_nr);
164922e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	}
165022e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs}
165122e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
165222e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsstatic void
165322e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggsnv50_program_validate_code(struct nv50_context *nv50, struct nv50_program *p)
165422e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs{
165575f0b38d9ea4a7318b0d661712dda15e24707395Ben Skeggs	struct nouveau_channel *chan = nv50->screen->nvws->channel;
165675f0b38d9ea4a7318b0d661712dda15e24707395Ben Skeggs	struct nouveau_grobj *tesla = nv50->screen->tesla;
16575e27cd46c04a9e7b5904cc014bffd0f4daae31feMichel Dänzer	struct pipe_screen *screen = nv50->pipe.screen;
165840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	struct nv50_program_exec *e;
1659cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	struct nouveau_stateobj *so;
1660cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	const unsigned flags = NOUVEAU_BO_VRAM | NOUVEAU_BO_WR;
1661cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	unsigned start, count, *up, *ptr;
1662f700d6be6335a4d4394296891f783687b6f2d4f2Ben Skeggs	boolean upload = FALSE;
166322e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
1664f700d6be6335a4d4394296891f783687b6f2d4f2Ben Skeggs	if (!p->buffer) {
16655e27cd46c04a9e7b5904cc014bffd0f4daae31feMichel Dänzer		p->buffer = screen->buffer_create(screen, 0x100, 0, p->exec_size * 4);
1666f700d6be6335a4d4394296891f783687b6f2d4f2Ben Skeggs		upload = TRUE;
1667f700d6be6335a4d4394296891f783687b6f2d4f2Ben Skeggs	}
166840137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs
1669aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	if (p->data && p->data->start != p->data_start) {
1670aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs		for (e = p->exec_head; e; e = e->next) {
1671ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs			unsigned ei, ci;
1672ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs
1673aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs			if (e->param.index < 0)
1674aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs				continue;
1675ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs			ei = e->param.shift >> 5;
1676ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs			ci = e->param.index + p->data->start;
1677ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs
1678ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs			e->inst[ei] &= ~e->param.mask;
1679ab3d55e2e3578db8deba84dcf47a024071486bd8Ben Skeggs			e->inst[ei] |= (ci << e->param.shift);
16801c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs		}
16811c7489bd7e5391136d0f2e68b467de89eb2d2bfcBen Skeggs
1682aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs		p->data_start = p->data->start;
1683f700d6be6335a4d4394296891f783687b6f2d4f2Ben Skeggs		upload = TRUE;
1684aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	}
1685aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs
1686f700d6be6335a4d4394296891f783687b6f2d4f2Ben Skeggs	if (!upload)
1687bf94027fdde51aed476e9bfdd4326aa9040440b0Ben Skeggs		return;
1688f700d6be6335a4d4394296891f783687b6f2d4f2Ben Skeggs
1689b01d0077af9d93c582e5f53ebd358ac8148b22dfBen Skeggs#ifdef NV50_PROGRAM_DUMP
16900d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs	NOUVEAU_ERR("-------\n");
1691aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs	for (e = p->exec_head; e; e = e->next) {
16920d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs		NOUVEAU_ERR("0x%08x\n", e->inst[0]);
16930d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs		if (is_long(e))
16940d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs			NOUVEAU_ERR("0x%08x\n", e->inst[1]);
1695b01d0077af9d93c582e5f53ebd358ac8148b22dfBen Skeggs	}
1696b01d0077af9d93c582e5f53ebd358ac8148b22dfBen Skeggs#endif
16970d54770cabbe034b0f07ab1b211c374d92ce19d4Ben Skeggs
1698b01d0077af9d93c582e5f53ebd358ac8148b22dfBen Skeggs	up = ptr = MALLOC(p->exec_size * 4);
1699b01d0077af9d93c582e5f53ebd358ac8148b22dfBen Skeggs	for (e = p->exec_head; e; e = e->next) {
1700cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		*(ptr++) = e->inst[0];
1701cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		if (is_long(e))
1702cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs			*(ptr++) = e->inst[1];
1703cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	}
1704cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs
1705e002ad77398fbe14a0efbd91824c3325ca09b4c1Ben Skeggs	so = so_new(4,2);
1706cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	so_method(so, nv50->screen->tesla, 0x1280, 3);
1707cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	so_reloc (so, p->buffer, 0, flags | NOUVEAU_BO_HIGH, 0, 0);
1708cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	so_reloc (so, p->buffer, 0, flags | NOUVEAU_BO_LOW, 0, 0);
1709cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	so_data  (so, (NV50_CB_PUPLOAD << 16) | 0x0800); //(p->exec_size * 4));
1710cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs
1711cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	start = 0; count = p->exec_size;
1712cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	while (count) {
1713cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		struct nouveau_winsys *nvws = nv50->screen->nvws;
1714cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		unsigned nr;
1715cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs
1716cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		so_emit(nvws, so);
1717cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs
1718cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		nr = MIN2(count, 2047);
1719cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		nr = MIN2(nvws->channel->pushbuf->remaining, nr);
1720cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		if (nvws->channel->pushbuf->remaining < (nr + 3)) {
172175f0b38d9ea4a7318b0d661712dda15e24707395Ben Skeggs			FIRE_RING(chan);
1722cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs			continue;
1723aea1669ff221f97682f0be6a60632e40c2739d09Ben Skeggs		}
1724cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs
172575f0b38d9ea4a7318b0d661712dda15e24707395Ben Skeggs		BEGIN_RING(chan, tesla, 0x0f00, 1);
172675f0b38d9ea4a7318b0d661712dda15e24707395Ben Skeggs		OUT_RING  (chan, (start << 8) | NV50_CB_PUPLOAD);
172775f0b38d9ea4a7318b0d661712dda15e24707395Ben Skeggs		BEGIN_RING(chan, tesla, 0x40000f04, nr);
172875f0b38d9ea4a7318b0d661712dda15e24707395Ben Skeggs		OUT_RINGp (chan, up + start, nr);
1729cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs
1730cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		start += nr;
1731cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs		count -= nr;
173240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	}
1733cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs
1734cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	FREE(up);
1735cae38d0fcc6c936d3a4dc25ca2dbef3d106d05a5Ben Skeggs	so_ref(NULL, &so);
173622e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs}
173722e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs
1738f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsvoid
1739f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_vertprog_validate(struct nv50_context *nv50)
1740f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1741f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_grobj *tesla = nv50->screen->tesla;
1742f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_program *p = nv50->vertprog;
1743f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_stateobj *so;
1744f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1745f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (!p->translated) {
1746f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		nv50_program_validate(nv50, p);
1747f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!p->translated)
1748f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			assert(0);
1749f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1750f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
175122e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	nv50_program_validate_data(nv50, p);
175222e0acc466947b203574c88f4964f61ef46ae3fdBen Skeggs	nv50_program_validate_code(nv50, p);
1753f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1754e002ad77398fbe14a0efbd91824c3325ca09b4c1Ben Skeggs	so = so_new(13, 2);
1755f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, NV50TCL_VP_ADDRESS_HIGH, 2);
1756f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1757f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_HIGH, 0, 0);
1758f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1759f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_LOW, 0, 0);
1760f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, 0x1650, 2);
1761f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, p->cfg.vp.attr[0]);
1762f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, p->cfg.vp.attr[1]);
1763fea0b1651677444fc6c135e1a4b8ab6463a9fdf9Ben Skeggs	so_method(so, tesla, 0x16b8, 1);
1764fea0b1651677444fc6c135e1a4b8ab6463a9fdf9Ben Skeggs	so_data  (so, p->cfg.high_result);
1765f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, 0x16ac, 2);
1766bcbe6baac37915563bc120ad558cd930bc1ddec1Ben Skeggs	so_data  (so, p->cfg.high_result); //8);
17678ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_data  (so, p->cfg.high_temp);
1768f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, 0x140c, 1);
1769f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_data  (so, 0); /* program start offset */
1770bb9efb5534a652878161e28bd73039eff5b11014Ben Skeggs	so_ref(so, &nv50->state.vertprog);
1771ca95d71a4bc63e2ea45abf9096a3da802819ef92Ben Skeggs	so_ref(NULL, &so);
1772f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1773f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1774f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsvoid
1775f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_fragprog_validate(struct nv50_context *nv50)
1776f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
1777f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_grobj *tesla = nv50->screen->tesla;
1778f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nv50_program *p = nv50->fragprog;
1779f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	struct nouveau_stateobj *so;
1780f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1781f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (!p->translated) {
1782f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		nv50_program_validate(nv50, p);
1783f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		if (!p->translated)
1784f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs			assert(0);
1785f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
1786f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
178755b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	nv50_program_validate_data(nv50, p);
178855b2fe1047b37d0d86641a252e1c745111030393Ben Skeggs	nv50_program_validate_code(nv50, p);
1789f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1790585ae74d87f3d04a4b5b7c068b865292afd1a16bBen Skeggs	so = so_new(64, 2);
1791f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_method(so, tesla, NV50TCL_FP_ADDRESS_HIGH, 2);
1792f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1793f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_HIGH, 0, 0);
1794f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	so_reloc (so, p->buffer, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD |
1795f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs		  NOUVEAU_BO_LOW, 0, 0);
1796585ae74d87f3d04a4b5b7c068b865292afd1a16bBen Skeggs	so_method(so, tesla, 0x1904, 4);
17978337c78d91612d615a1368ee8ee188d80574fad4Ben Skeggs	so_data  (so, 0x00040404); /* p: 0x01000404 */
1798585ae74d87f3d04a4b5b7c068b865292afd1a16bBen Skeggs	so_data  (so, 0x00000004);
1799585ae74d87f3d04a4b5b7c068b865292afd1a16bBen Skeggs	so_data  (so, 0x00000000);
1800585ae74d87f3d04a4b5b7c068b865292afd1a16bBen Skeggs	so_data  (so, 0x00000000);
1801fea0b1651677444fc6c135e1a4b8ab6463a9fdf9Ben Skeggs	so_method(so, tesla, 0x16bc, 3); /*XXX: fixme */
1802585ae74d87f3d04a4b5b7c068b865292afd1a16bBen Skeggs	so_data  (so, 0x03020100);
1803585ae74d87f3d04a4b5b7c068b865292afd1a16bBen Skeggs	so_data  (so, 0x07060504);
1804fea0b1651677444fc6c135e1a4b8ab6463a9fdf9Ben Skeggs	so_data  (so, 0x0b0a0908);
1805585ae74d87f3d04a4b5b7c068b865292afd1a16bBen Skeggs	so_method(so, tesla, 0x1988, 2);
1806bcbe6baac37915563bc120ad558cd930bc1ddec1Ben Skeggs	so_data  (so, 0x08080408); //0x08040404); /* p: 0x0f000401 */
18078ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_data  (so, p->cfg.high_temp);
18088ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_method(so, tesla, 0x1414, 1);
18098ec6415e9fcf876c67bc1624f3eb7dd7624b7791Ben Skeggs	so_data  (so, 0); /* program start offset */
1810bb9efb5534a652878161e28bd73039eff5b11014Ben Skeggs	so_ref(so, &nv50->state.fragprog);
1811ca95d71a4bc63e2ea45abf9096a3da802819ef92Ben Skeggs	so_ref(NULL, &so);
1812f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1813f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1814f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsvoid
1815f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggsnv50_program_destroy(struct nv50_context *nv50, struct nv50_program *p)
1816f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs{
181700b15c9f40944d94aa28a441edd7ebb51577d9baBen Skeggs	struct pipe_screen *pscreen = nv50->pipe.screen;
1818f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
181940137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	while (p->exec_head) {
182040137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		struct nv50_program_exec *e = p->exec_head;
182140137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs
182240137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		p->exec_head = e->next;
182340137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs		FREE(e);
1824f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	}
182540137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	p->exec_tail = NULL;
182640137ea2631a0c8158f99ae30ca90ed038b72076Ben Skeggs	p->exec_size = 0;
1827f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1828f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	if (p->buffer)
18295e27cd46c04a9e7b5904cc014bffd0f4daae31feMichel Dänzer		pipe_buffer_reference(&p->buffer, NULL);
1830f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
18317c745de74997e859d7e2640092bda9ad900e28a9Ben Skeggs	nv50->screen->nvws->res_free(&p->data);
18327c745de74997e859d7e2640092bda9ad900e28a9Ben Skeggs
1833f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs	p->translated = 0;
1834f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs}
1835f722fd937db2f3cacf1947d538c66528fd16eb89Ben Skeggs
1836