1/*
2 * Copyright 2010 Jerome Glisse <glisse@freedesktop.org>
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * on the rights to use, copy, modify, merge, publish, distribute, sub
8 * license, and/or sell copies of the Software, and to permit persons to whom
9 * the Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE.
22 */
23#ifndef R600_ASM_H
24#define R600_ASM_H
25
26#include "r600.h"
27
28struct r600_vertex_element;
29struct r600_context;
30
31struct r600_bytecode_alu_src {
32	unsigned			sel;
33	unsigned			chan;
34	unsigned			neg;
35	unsigned			abs;
36	unsigned			rel;
37	unsigned			kc_bank;
38	uint32_t			value;
39};
40
41struct r600_bytecode_alu_dst {
42	unsigned			sel;
43	unsigned			chan;
44	unsigned			clamp;
45	unsigned			write;
46	unsigned			rel;
47};
48
49struct r600_bytecode_alu {
50	struct list_head		list;
51	struct r600_bytecode_alu_src		src[3];
52	struct r600_bytecode_alu_dst		dst;
53	unsigned			inst;
54	unsigned			last;
55	unsigned			is_op3;
56	unsigned			execute_mask;
57	unsigned			update_pred;
58	unsigned			pred_sel;
59	unsigned			bank_swizzle;
60	unsigned			bank_swizzle_force;
61	unsigned			omod;
62	unsigned                        index_mode;
63};
64
65struct r600_bytecode_tex {
66	struct list_head		list;
67	unsigned			inst;
68	unsigned			resource_id;
69	unsigned			src_gpr;
70	unsigned			src_rel;
71	unsigned			dst_gpr;
72	unsigned			dst_rel;
73	unsigned			dst_sel_x;
74	unsigned			dst_sel_y;
75	unsigned			dst_sel_z;
76	unsigned			dst_sel_w;
77	unsigned			lod_bias;
78	unsigned			coord_type_x;
79	unsigned			coord_type_y;
80	unsigned			coord_type_z;
81	unsigned			coord_type_w;
82	unsigned			offset_x;
83	unsigned			offset_y;
84	unsigned			offset_z;
85	unsigned			sampler_id;
86	unsigned			src_sel_x;
87	unsigned			src_sel_y;
88	unsigned			src_sel_z;
89	unsigned			src_sel_w;
90};
91
92struct r600_bytecode_vtx {
93	struct list_head		list;
94	unsigned			inst;
95	unsigned			fetch_type;
96	unsigned			buffer_id;
97	unsigned			src_gpr;
98	unsigned			src_sel_x;
99	unsigned			mega_fetch_count;
100	unsigned			dst_gpr;
101	unsigned			dst_sel_x;
102	unsigned			dst_sel_y;
103	unsigned			dst_sel_z;
104	unsigned			dst_sel_w;
105	unsigned			use_const_fields;
106	unsigned			data_format;
107	unsigned			num_format_all;
108	unsigned			format_comp_all;
109	unsigned			srf_mode_all;
110	unsigned			offset;
111	unsigned			endian;
112};
113
114struct r600_bytecode_output {
115	unsigned			array_base;
116	unsigned			array_size;
117	unsigned			comp_mask;
118	unsigned			type;
119	unsigned			end_of_program;
120
121	/* CF_INST. This is already bit-shifted and only needs to be or'd for bytecode. */
122	unsigned			inst;
123
124	unsigned			elem_size;
125	unsigned			gpr;
126	unsigned			swizzle_x;
127	unsigned			swizzle_y;
128	unsigned			swizzle_z;
129	unsigned			swizzle_w;
130	unsigned			burst_count;
131	unsigned			barrier;
132};
133
134struct r600_bytecode_kcache {
135	unsigned			bank;
136	unsigned			mode;
137	unsigned			addr;
138};
139
140/* A value of CF_NATIVE in r600_bytecode_cf::inst means that this instruction
141 * has already been encoded, and the encoding has been stored in
142 * r600_bytecode::isa.  This is used by the LLVM backend to emit CF instructions
143 * e.g. RAT_WRITE_* that can't be properly represented by struct
144 * r600_bytecode_cf.
145 */
146#define CF_NATIVE ~0
147
148struct r600_bytecode_cf {
149	struct list_head		list;
150
151	/* CF_INST. This is already bit-shifted and only needs to be or'd for bytecode. */
152	unsigned			inst;
153
154	unsigned			addr;
155	unsigned			ndw;
156	unsigned			id;
157	unsigned			cond;
158	unsigned			pop_count;
159	unsigned			cf_addr; /* control flow addr */
160	struct r600_bytecode_kcache		kcache[4];
161	unsigned			r6xx_uses_waterfall;
162	unsigned			eg_alu_extended;
163	struct list_head		alu;
164	struct list_head		tex;
165	struct list_head		vtx;
166	struct r600_bytecode_output		output;
167	struct r600_bytecode_alu		*curr_bs_head;
168	struct r600_bytecode_alu		*prev_bs_head;
169	struct r600_bytecode_alu		*prev2_bs_head;
170	unsigned isa[2];
171};
172
173#define FC_NONE				0
174#define FC_IF				1
175#define FC_LOOP				2
176#define FC_REP				3
177#define FC_PUSH_VPM			4
178#define FC_PUSH_WQM			5
179
180struct r600_cf_stack_entry {
181	int				type;
182	struct r600_bytecode_cf		*start;
183	struct r600_bytecode_cf		**mid; /* used to store the else point */
184	int				num_mid;
185};
186
187#define SQ_MAX_CALL_DEPTH 0x00000020
188struct r600_cf_callstack {
189	unsigned			fc_sp_before_entry;
190	int				sub_desc_index;
191	int				current;
192	int				max;
193};
194
195#define AR_HANDLE_NORMAL 0
196#define AR_HANDLE_RV6XX 1 /* except RV670 */
197
198
199struct r600_bytecode {
200	enum chip_class			chip_class;
201	int				type;
202	struct list_head		cf;
203	struct r600_bytecode_cf		*cf_last;
204	unsigned			ndw;
205	unsigned			ncf;
206	unsigned			ngpr;
207	unsigned			nstack;
208	unsigned			nresource;
209	unsigned			force_add_cf;
210	uint32_t			*bytecode;
211	uint32_t			fc_sp;
212	struct r600_cf_stack_entry	fc_stack[32];
213	unsigned			call_sp;
214	struct r600_cf_callstack	callstack[SQ_MAX_CALL_DEPTH];
215	unsigned	ar_loaded;
216	unsigned	ar_reg;
217	unsigned        ar_handling;
218	unsigned        r6xx_nop_after_rel_dst;
219};
220
221/* eg_asm.c */
222int eg_bytecode_cf_build(struct r600_bytecode *bc, struct r600_bytecode_cf *cf);
223
224/* r600_asm.c */
225void r600_bytecode_init(struct r600_bytecode *bc, enum chip_class chip_class, enum radeon_family family);
226void r600_bytecode_clear(struct r600_bytecode *bc);
227int r600_bytecode_add_alu(struct r600_bytecode *bc, const struct r600_bytecode_alu *alu);
228int r600_bytecode_add_vtx(struct r600_bytecode *bc, const struct r600_bytecode_vtx *vtx);
229int r600_bytecode_add_tex(struct r600_bytecode *bc, const struct r600_bytecode_tex *tex);
230int r600_bytecode_add_output(struct r600_bytecode *bc, const struct r600_bytecode_output *output);
231int r600_bytecode_build(struct r600_bytecode *bc);
232int r600_bytecode_add_cfinst(struct r600_bytecode *bc, int inst);
233int r600_bytecode_add_alu_type(struct r600_bytecode *bc, const struct r600_bytecode_alu *alu, int type);
234void r600_bytecode_special_constants(uint32_t value, unsigned *sel, unsigned *neg);
235void r600_bytecode_dump(struct r600_bytecode *bc);
236
237int cm_bytecode_add_cf_end(struct r600_bytecode *bc);
238
239int r600_vertex_elements_build_fetch_shader(struct r600_context *rctx, struct r600_vertex_element *ve);
240
241/* r700_asm.c */
242void r700_bytecode_cf_vtx_build(uint32_t *bytecode, const struct r600_bytecode_cf *cf);
243int r700_bytecode_alu_build(struct r600_bytecode *bc, struct r600_bytecode_alu *alu, unsigned id);
244
245#endif
246