i915_state_emit.c revision 287c94ea4987033f9c99a2f91c5750c9083504ca
1/**************************************************************************
2 *
3 * Copyright 2003 Tungsten Graphics, Inc., Cedar Park, Texas.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28
29#include "i915_reg.h"
30#include "i915_context.h"
31#include "i915_batch.h"
32#include "i915_reg.h"
33#include "i915_resource.h"
34
35#include "pipe/p_context.h"
36#include "pipe/p_defines.h"
37
38static unsigned translate_format( enum pipe_format format )
39{
40   switch (format) {
41   case PIPE_FORMAT_B8G8R8A8_UNORM:
42      return COLOR_BUF_ARGB8888;
43   case PIPE_FORMAT_B5G6R5_UNORM:
44      return COLOR_BUF_RGB565;
45   default:
46      assert(0);
47      return 0;
48   }
49}
50
51static unsigned translate_depth_format( enum pipe_format zformat )
52{
53   switch (zformat) {
54   case PIPE_FORMAT_Z24_UNORM_S8_USCALED:
55      return DEPTH_FRMT_24_FIXED_8_OTHER;
56   case PIPE_FORMAT_Z16_UNORM:
57      return DEPTH_FRMT_16_FIXED;
58   default:
59      assert(0);
60      return 0;
61   }
62}
63
64
65/**
66 * Examine framebuffer state to determine width, height.
67 */
68static boolean
69framebuffer_size(const struct pipe_framebuffer_state *fb,
70                 uint *width, uint *height)
71{
72   if (fb->cbufs[0]) {
73      *width = fb->cbufs[0]->width;
74      *height = fb->cbufs[0]->height;
75      return TRUE;
76   }
77   else if (fb->zsbuf) {
78      *width = fb->zsbuf->width;
79      *height = fb->zsbuf->height;
80      return TRUE;
81   }
82   else {
83      *width = *height = 0;
84      return FALSE;
85   }
86}
87
88
89/* Push the state into the sarea and/or texture memory.
90 */
91void
92i915_emit_hardware_state(struct i915_context *i915 )
93{
94   /* XXX: there must be an easier way */
95   const unsigned dwords = ( 14 +
96                             7 +
97                             I915_MAX_DYNAMIC +
98                             8 +
99                             2 + I915_TEX_UNITS*3 +
100                             2 + I915_TEX_UNITS*3 +
101                             2 + I915_MAX_CONSTANT*4 +
102#if 0
103                             i915->current.program_len +
104#else
105                             i915->fs->program_len +
106#endif
107                             6
108                           ) * 3/2; /* plus 50% margin */
109   const unsigned relocs = ( I915_TEX_UNITS +
110                             3
111                           ) * 3/2; /* plus 50% margin */
112
113#if 0
114   debug_printf("i915_emit_hardware_state: %d dwords, %d relocs\n", dwords, relocs);
115#endif
116
117   if(!BEGIN_BATCH(dwords, relocs)) {
118      FLUSH_BATCH(NULL);
119      assert(BEGIN_BATCH(dwords, relocs));
120   }
121
122   /* 14 dwords, 0 relocs */
123   if (i915->hardware_dirty & I915_HW_INVARIENT)
124   {
125      OUT_BATCH(_3DSTATE_AA_CMD |
126                AA_LINE_ECAAR_WIDTH_ENABLE |
127                AA_LINE_ECAAR_WIDTH_1_0 |
128                AA_LINE_REGION_WIDTH_ENABLE | AA_LINE_REGION_WIDTH_1_0);
129
130      OUT_BATCH(_3DSTATE_DFLT_DIFFUSE_CMD);
131      OUT_BATCH(0);
132
133      OUT_BATCH(_3DSTATE_DFLT_SPEC_CMD);
134      OUT_BATCH(0);
135
136      OUT_BATCH(_3DSTATE_DFLT_Z_CMD);
137      OUT_BATCH(0);
138
139      OUT_BATCH(_3DSTATE_COORD_SET_BINDINGS |
140                CSB_TCB(0, 0) |
141                CSB_TCB(1, 1) |
142                CSB_TCB(2, 2) |
143                CSB_TCB(3, 3) |
144                CSB_TCB(4, 4) |
145                CSB_TCB(5, 5) |
146                CSB_TCB(6, 6) |
147                CSB_TCB(7, 7));
148
149      OUT_BATCH(_3DSTATE_RASTER_RULES_CMD |
150                ENABLE_POINT_RASTER_RULE |
151                OGL_POINT_RASTER_RULE |
152                ENABLE_LINE_STRIP_PROVOKE_VRTX |
153                ENABLE_TRI_FAN_PROVOKE_VRTX |
154                LINE_STRIP_PROVOKE_VRTX(1) |
155                TRI_FAN_PROVOKE_VRTX(2) |
156                ENABLE_TEXKILL_3D_4D |
157                TEXKILL_4D);
158
159      /* Need to initialize this to zero.
160       */
161      OUT_BATCH(_3DSTATE_LOAD_STATE_IMMEDIATE_1 | I1_LOAD_S(3) | (0));
162      OUT_BATCH(0);
163
164      OUT_BATCH(_3DSTATE_DEPTH_SUBRECT_DISABLE);
165
166      /* disable indirect state for now
167       */
168      OUT_BATCH(_3DSTATE_LOAD_INDIRECT | 0);
169      OUT_BATCH(0);
170   }
171
172   /* 7 dwords, 1 relocs */
173   if (i915->hardware_dirty & I915_HW_IMMEDIATE)
174   {
175      OUT_BATCH(_3DSTATE_LOAD_STATE_IMMEDIATE_1 |
176                I1_LOAD_S(0) |
177                I1_LOAD_S(1) |
178                I1_LOAD_S(2) |
179                I1_LOAD_S(4) |
180                I1_LOAD_S(5) |
181                I1_LOAD_S(6) |
182                (5));
183
184      if(i915->vbo)
185         OUT_RELOC(i915->vbo,
186                   I915_USAGE_VERTEX,
187                   i915->current.immediate[I915_IMMEDIATE_S0]);
188      else
189         /* FIXME: we should not do this */
190         OUT_BATCH(0);
191      OUT_BATCH(i915->current.immediate[I915_IMMEDIATE_S1]);
192      OUT_BATCH(i915->current.immediate[I915_IMMEDIATE_S2]);
193      OUT_BATCH(i915->current.immediate[I915_IMMEDIATE_S4]);
194      OUT_BATCH(i915->current.immediate[I915_IMMEDIATE_S5]);
195      OUT_BATCH(i915->current.immediate[I915_IMMEDIATE_S6]);
196   }
197
198   /* I915_MAX_DYNAMIC dwords, 0 relocs */
199   if (i915->hardware_dirty & I915_HW_DYNAMIC)
200   {
201      int i;
202      for (i = 0; i < I915_MAX_DYNAMIC; i++) {
203         OUT_BATCH(i915->current.dynamic[i]);
204      }
205   }
206
207   /* 8 dwords, 2 relocs */
208   if (i915->hardware_dirty & I915_HW_STATIC)
209   {
210      struct pipe_surface *cbuf_surface = i915->framebuffer.cbufs[0];
211      struct pipe_surface *depth_surface = i915->framebuffer.zsbuf;
212
213      if (cbuf_surface) {
214         unsigned ctile = BUF_3D_USE_FENCE;
215         struct i915_texture *tex = i915_texture(cbuf_surface->texture);
216         assert(tex);
217
218         if (tex && tex->sw_tiled) {
219            ctile = BUF_3D_TILED_SURFACE;
220         }
221
222         OUT_BATCH(_3DSTATE_BUF_INFO_CMD);
223
224         OUT_BATCH(BUF_3D_ID_COLOR_BACK |
225                   BUF_3D_PITCH(tex->stride) |  /* pitch in bytes */
226                   ctile);
227
228         OUT_RELOC(tex->buffer,
229                   I915_USAGE_RENDER,
230                   cbuf_surface->offset);
231      }
232
233      /* What happens if no zbuf??
234       */
235      if (depth_surface) {
236         unsigned ztile = BUF_3D_USE_FENCE;
237         struct i915_texture *tex = i915_texture(depth_surface->texture);
238         assert(tex);
239
240         if (tex && tex->sw_tiled) {
241            ztile = BUF_3D_TILED_SURFACE;
242         }
243
244         OUT_BATCH(_3DSTATE_BUF_INFO_CMD);
245
246         assert(tex);
247         OUT_BATCH(BUF_3D_ID_DEPTH |
248                   BUF_3D_PITCH(tex->stride) |  /* pitch in bytes */
249                   ztile);
250
251         OUT_RELOC(tex->buffer,
252                   I915_USAGE_RENDER,
253                   depth_surface->offset);
254      }
255
256      {
257         unsigned cformat, zformat = 0;
258
259         if (cbuf_surface)
260            cformat = cbuf_surface->format;
261         else
262            cformat = PIPE_FORMAT_B8G8R8A8_UNORM; /* arbitrary */
263         cformat = translate_format(cformat);
264
265         if (depth_surface)
266            zformat = translate_depth_format( i915->framebuffer.zsbuf->format );
267
268         OUT_BATCH(_3DSTATE_DST_BUF_VARS_CMD);
269         OUT_BATCH(DSTORG_HORT_BIAS(0x8) | /* .5 */
270                   DSTORG_VERT_BIAS(0x8) | /* .5 */
271                   LOD_PRECLAMP_OGL |
272                   TEX_DEFAULT_COLOR_OGL |
273                   cformat |
274                   zformat );
275      }
276   }
277
278#if 01
279      /* texture images */
280      /* 2 + I915_TEX_UNITS*3 dwords, I915_TEX_UNITS relocs */
281      if (i915->hardware_dirty & (I915_HW_MAP | I915_HW_SAMPLER))
282      {
283         const uint nr = i915->current.sampler_enable_nr;
284         if (nr) {
285            const uint enabled = i915->current.sampler_enable_flags;
286            uint unit;
287            uint count = 0;
288            OUT_BATCH(_3DSTATE_MAP_STATE | (3 * nr));
289            OUT_BATCH(enabled);
290            for (unit = 0; unit < I915_TEX_UNITS; unit++) {
291               if (enabled & (1 << unit)) {
292                  struct i915_texture *texture = i915_texture(i915->fragment_sampler_views[unit]->texture);
293                  struct i915_winsys_buffer *buf = texture->buffer;
294                  uint offset = 0;
295                  assert(buf);
296
297                  count++;
298
299                  OUT_RELOC(buf, I915_USAGE_SAMPLER, offset);
300                  OUT_BATCH(i915->current.texbuffer[unit][0]); /* MS3 */
301                  OUT_BATCH(i915->current.texbuffer[unit][1]); /* MS4 */
302               }
303            }
304            assert(count == nr);
305         }
306      }
307#endif
308
309#if 01
310   /* samplers */
311   /* 2 + I915_TEX_UNITS*3 dwords, 0 relocs */
312   if (i915->hardware_dirty & I915_HW_SAMPLER)
313   {
314      if (i915->current.sampler_enable_nr) {
315         int i;
316
317         OUT_BATCH( _3DSTATE_SAMPLER_STATE |
318                    (3 * i915->current.sampler_enable_nr) );
319
320         OUT_BATCH( i915->current.sampler_enable_flags );
321
322         for (i = 0; i < I915_TEX_UNITS; i++) {
323            if (i915->current.sampler_enable_flags & (1<<i)) {
324               OUT_BATCH( i915->current.sampler[i][0] );
325               OUT_BATCH( i915->current.sampler[i][1] );
326               OUT_BATCH( i915->current.sampler[i][2] );
327            }
328         }
329      }
330   }
331#endif
332
333   /* constants */
334   /* 2 + I915_MAX_CONSTANT*4 dwords, 0 relocs */
335   if (i915->hardware_dirty & I915_HW_PROGRAM)
336   {
337      /* Collate the user-defined constants with the fragment shader's
338       * immediates according to the constant_flags[] array.
339       */
340      const uint nr = i915->fs->num_constants;
341      if (nr) {
342         uint i;
343
344         OUT_BATCH( _3DSTATE_PIXEL_SHADER_CONSTANTS | (nr * 4) );
345         OUT_BATCH( (1 << (nr - 1)) | ((1 << (nr - 1)) - 1) );
346
347         for (i = 0; i < nr; i++) {
348            const uint *c;
349            if (i915->fs->constant_flags[i] == I915_CONSTFLAG_USER) {
350               /* grab user-defined constant */
351               c = (uint *) i915->current.constants[PIPE_SHADER_FRAGMENT][i];
352            }
353            else {
354               /* emit program constant */
355               c = (uint *) i915->fs->constants[i];
356            }
357#if 0 /* debug */
358            {
359               float *f = (float *) c;
360               printf("Const %2d: %f %f %f %f %s\n", i, f[0], f[1], f[2], f[3],
361                      (i915->fs->constant_flags[i] == I915_CONSTFLAG_USER
362                       ? "user" : "immediate"));
363            }
364#endif
365            OUT_BATCH(*c++);
366            OUT_BATCH(*c++);
367            OUT_BATCH(*c++);
368            OUT_BATCH(*c++);
369         }
370      }
371   }
372
373   /* Fragment program */
374   /* i915->current.program_len dwords, 0 relocs */
375   if (i915->hardware_dirty & I915_HW_PROGRAM)
376   {
377      uint i;
378      /* we should always have, at least, a pass-through program */
379      assert(i915->fs->program_len > 0);
380      for (i = 0; i < i915->fs->program_len; i++) {
381         OUT_BATCH(i915->fs->program[i]);
382      }
383   }
384
385   /* drawing surface size */
386   /* 6 dwords, 0 relocs */
387   {
388      uint w, h;
389      boolean k = framebuffer_size(&i915->framebuffer, &w, &h);
390      (void)k;
391      assert(k);
392
393      OUT_BATCH(_3DSTATE_DRAW_RECT_CMD);
394      OUT_BATCH(0);
395      OUT_BATCH(0);
396      OUT_BATCH(((w - 1) & 0xffff) | ((h - 1) << 16));
397      OUT_BATCH(0);
398      OUT_BATCH(0);
399   }
400
401
402   i915->hardware_dirty = 0;
403}
404