intel_span.c revision da2816a45e6e3a33246a341fee72e6f893f315d9
1/**************************************************************************
2 *
3 * Copyright 2003 Tungsten Graphics, Inc., Cedar Park, Texas.
4 * Copyright 2011 Intel Corporation
5 * All Rights Reserved.
6 *
7 * Permission is hereby granted, free of charge, to any person obtaining a
8 * copy of this software and associated documentation files (the
9 * "Software"), to deal in the Software without restriction, including
10 * without limitation the rights to use, copy, modify, merge, publish,
11 * distribute, sub license, and/or sell copies of the Software, and to
12 * permit persons to whom the Software is furnished to do so, subject to
13 * the following conditions:
14 *
15 * The above copyright notice and this permission notice (including the
16 * next paragraph) shall be included in all copies or substantial portions
17 * of the Software.
18 *
19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
20 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
21 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
22 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
23 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
24 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
25 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 *
27 * Authors:
28 *     Chad Versace <chad@chad-versace.us>
29 *
30 **************************************************************************/
31
32#include <stdbool.h>
33#include <stdint.h>
34#include "main/glheader.h"
35#include "main/macros.h"
36#include "main/mtypes.h"
37#include "main/colormac.h"
38#include "main/renderbuffer.h"
39
40#include "intel_buffers.h"
41#include "intel_fbo.h"
42#include "intel_mipmap_tree.h"
43#include "intel_screen.h"
44#include "intel_span.h"
45#include "intel_regions.h"
46#include "intel_tex.h"
47
48#include "swrast/swrast.h"
49
50static void
51intel_set_span_functions(struct intel_context *intel,
52			 struct gl_renderbuffer *rb);
53
54#undef DBG
55#define DBG 0
56
57#define LOCAL_VARS							\
58   struct intel_renderbuffer *irb = intel_renderbuffer(rb);		\
59   int minx = 0, miny = 0;						\
60   int maxx = rb->Width;						\
61   int maxy = rb->Height;						\
62   int pitch = rb->RowStride * irb->mt->region->cpp;			\
63   void *buf = rb->Data;						\
64   GLuint p;								\
65   (void) p;
66
67#define HW_CLIPLOOP()
68#define HW_ENDCLIPLOOP()
69
70#define Y_FLIP(_y) (_y)
71
72#define HW_LOCK()
73
74#define HW_UNLOCK()
75
76/* r5g6b5 color span and pixel functions */
77#define SPANTMP_PIXEL_FMT GL_RGB
78#define SPANTMP_PIXEL_TYPE GL_UNSIGNED_SHORT_5_6_5
79#define TAG(x) intel_##x##_RGB565
80#define TAG2(x,y) intel_##x##y_RGB565
81#include "spantmp2.h"
82
83/* a4r4g4b4 color span and pixel functions */
84#define SPANTMP_PIXEL_FMT GL_BGRA
85#define SPANTMP_PIXEL_TYPE GL_UNSIGNED_SHORT_4_4_4_4_REV
86#define TAG(x) intel_##x##_ARGB4444
87#define TAG2(x,y) intel_##x##y_ARGB4444
88#include "spantmp2.h"
89
90/* a1r5g5b5 color span and pixel functions */
91#define SPANTMP_PIXEL_FMT GL_BGRA
92#define SPANTMP_PIXEL_TYPE GL_UNSIGNED_SHORT_1_5_5_5_REV
93#define TAG(x) intel_##x##_ARGB1555
94#define TAG2(x,y) intel_##x##y##_ARGB1555
95#include "spantmp2.h"
96
97/* a8r8g8b8 color span and pixel functions */
98#define SPANTMP_PIXEL_FMT GL_BGRA
99#define SPANTMP_PIXEL_TYPE GL_UNSIGNED_INT_8_8_8_8_REV
100#define TAG(x) intel_##x##_ARGB8888
101#define TAG2(x,y) intel_##x##y##_ARGB8888
102#include "spantmp2.h"
103
104/* x8r8g8b8 color span and pixel functions */
105#define SPANTMP_PIXEL_FMT GL_BGR
106#define SPANTMP_PIXEL_TYPE GL_UNSIGNED_INT_8_8_8_8_REV
107#define TAG(x) intel_##x##_xRGB8888
108#define TAG2(x,y) intel_##x##y##_xRGB8888
109#include "spantmp2.h"
110
111/* a8 color span and pixel functions */
112#define SPANTMP_PIXEL_FMT GL_ALPHA
113#define SPANTMP_PIXEL_TYPE GL_UNSIGNED_BYTE
114#define TAG(x) intel_##x##_A8
115#define TAG2(x,y) intel_##x##y##_A8
116#include "spantmp2.h"
117
118/**
119 * \brief Get pointer offset into stencil buffer.
120 *
121 * The stencil buffer is W tiled. Since the GTT is incapable of W fencing, we
122 * must decode the tile's layout in software.
123 *
124 * See
125 *   - PRM, 2011 Sandy Bridge, Volume 1, Part 2, Section 4.5.2.1 W-Major Tile
126 *     Format.
127 *   - PRM, 2011 Sandy Bridge, Volume 1, Part 2, Section 4.5.3 Tiling Algorithm
128 *
129 * Even though the returned offset is always positive, the return type is
130 * signed due to
131 *    commit e8b1c6d6f55f5be3bef25084fdd8b6127517e137
132 *    mesa: Fix return type of  _mesa_get_format_bytes() (#37351)
133 */
134intptr_t
135intel_offset_S8(uint32_t stride, uint32_t x, uint32_t y)
136{
137   uint32_t tile_size = 4096;
138   uint32_t tile_width = 64;
139   uint32_t tile_height = 64;
140   uint32_t row_size = 64 * stride;
141
142   uint32_t tile_x = x / tile_width;
143   uint32_t tile_y = y / tile_height;
144
145   /* The byte's address relative to the tile's base addres. */
146   uint32_t byte_x = x % tile_width;
147   uint32_t byte_y = y % tile_height;
148
149   uintptr_t u = tile_y * row_size
150               + tile_x * tile_size
151               + 512 * (byte_x / 8)
152               +  64 * (byte_y / 8)
153               +  32 * ((byte_y / 4) % 2)
154               +  16 * ((byte_x / 4) % 2)
155               +   8 * ((byte_y / 2) % 2)
156               +   4 * ((byte_x / 2) % 2)
157               +   2 * (byte_y % 2)
158               +   1 * (byte_x % 2);
159
160   /*
161    * Errata for Gen5:
162    *
163    * An additional offset is needed which is not documented in the PRM.
164    *
165    * if ((byte_x / 8) % 2 == 1) {
166    *    if ((byte_y / 8) % 2) == 0) {
167    *       u += 64;
168    *    } else {
169    *       u -= 64;
170    *    }
171    * }
172    *
173    * The offset is expressed more tersely as
174    * u += ((int) x & 0x8) * (8 - (((int) y & 0x8) << 1));
175    */
176
177   return u;
178}
179
180void
181intel_renderbuffer_map(struct intel_context *intel, struct gl_renderbuffer *rb)
182{
183   struct gl_context *ctx = &intel->ctx;
184   struct intel_renderbuffer *irb = intel_renderbuffer(rb);
185   GLubyte *map;
186   int stride;
187
188   if (!irb)
189      return;
190
191   if (rb->Data) {
192      /* Renderbuffer is already mapped. This usually happens when a single
193       * buffer is attached to the framebuffer's depth and stencil attachment
194       * points.
195       */
196      return;
197   }
198
199   ctx->Driver.MapRenderbuffer(ctx, rb, 0, 0, rb->Width, rb->Height,
200			       GL_MAP_READ_BIT | GL_MAP_WRITE_BIT,
201			       &map, &stride);
202   rb->Data = map;
203   rb->RowStride = stride / _mesa_get_format_bytes(rb->Format);
204
205   intel_set_span_functions(intel, rb);
206}
207
208void
209intel_renderbuffer_unmap(struct intel_context *intel,
210			 struct gl_renderbuffer *rb)
211{
212   struct gl_context *ctx = &intel->ctx;
213   struct intel_renderbuffer *irb = intel_renderbuffer(rb);
214
215   if (!irb)
216      return;
217
218   if (!rb->Data) {
219      /* Renderbuffer is already unmapped. This usually happens when a single
220       * buffer is attached to the framebuffer's depth and stencil attachment
221       * points.
222       */
223      return;
224   }
225
226   ctx->Driver.UnmapRenderbuffer(ctx, rb);
227
228   rb->GetRow = NULL;
229   rb->PutRow = NULL;
230   rb->Data = NULL;
231   rb->RowStride = 0;
232}
233
234static void
235intel_framebuffer_map(struct intel_context *intel, struct gl_framebuffer *fb)
236{
237   int i;
238
239   for (i = 0; i < BUFFER_COUNT; i++) {
240      intel_renderbuffer_map(intel, fb->Attachment[i].Renderbuffer);
241   }
242
243   intel_check_front_buffer_rendering(intel);
244}
245
246static void
247intel_framebuffer_unmap(struct intel_context *intel, struct gl_framebuffer *fb)
248{
249   int i;
250
251   for (i = 0; i < BUFFER_COUNT; i++) {
252      intel_renderbuffer_unmap(intel, fb->Attachment[i].Renderbuffer);
253   }
254}
255
256/**
257 * Prepare for software rendering.  Map current read/draw framebuffers'
258 * renderbuffes and all currently bound texture objects.
259 *
260 * Old note: Moved locking out to get reasonable span performance.
261 */
262void
263intelSpanRenderStart(struct gl_context * ctx)
264{
265   struct intel_context *intel = intel_context(ctx);
266   GLuint i;
267
268   intel_flush(&intel->ctx);
269   intel_prepare_render(intel);
270
271   for (i = 0; i < ctx->Const.MaxTextureImageUnits; i++) {
272      if (ctx->Texture.Unit[i]._ReallyEnabled) {
273         struct gl_texture_object *texObj = ctx->Texture.Unit[i]._Current;
274
275         intel_finalize_mipmap_tree(intel, i);
276         intel_tex_map_images(intel, intel_texture_object(texObj),
277                              GL_MAP_READ_BIT | GL_MAP_WRITE_BIT);
278      }
279   }
280
281   intel_framebuffer_map(intel, ctx->DrawBuffer);
282   if (ctx->ReadBuffer != ctx->DrawBuffer) {
283      intel_framebuffer_map(intel, ctx->ReadBuffer);
284   }
285}
286
287/**
288 * Called when done software rendering.  Unmap the buffers we mapped in
289 * the above function.
290 */
291void
292intelSpanRenderFinish(struct gl_context * ctx)
293{
294   struct intel_context *intel = intel_context(ctx);
295   GLuint i;
296
297   _swrast_flush(ctx);
298
299   for (i = 0; i < ctx->Const.MaxTextureImageUnits; i++) {
300      if (ctx->Texture.Unit[i]._ReallyEnabled) {
301         struct gl_texture_object *texObj = ctx->Texture.Unit[i]._Current;
302         intel_tex_unmap_images(intel, intel_texture_object(texObj));
303      }
304   }
305
306   intel_framebuffer_unmap(intel, ctx->DrawBuffer);
307   if (ctx->ReadBuffer != ctx->DrawBuffer) {
308      intel_framebuffer_unmap(intel, ctx->ReadBuffer);
309   }
310}
311
312
313void
314intelInitSpanFuncs(struct gl_context * ctx)
315{
316   struct swrast_device_driver *swdd = _swrast_GetDeviceDriverReference(ctx);
317   swdd->SpanRenderStart = intelSpanRenderStart;
318   swdd->SpanRenderFinish = intelSpanRenderFinish;
319}
320
321void
322intel_map_vertex_shader_textures(struct gl_context *ctx)
323{
324   struct intel_context *intel = intel_context(ctx);
325   int i;
326
327   if (ctx->VertexProgram._Current == NULL)
328      return;
329
330   for (i = 0; i < ctx->Const.MaxTextureImageUnits; i++) {
331      if (ctx->Texture.Unit[i]._ReallyEnabled &&
332	  ctx->VertexProgram._Current->Base.TexturesUsed[i] != 0) {
333         struct gl_texture_object *texObj = ctx->Texture.Unit[i]._Current;
334
335         intel_tex_map_images(intel, intel_texture_object(texObj),
336                              GL_MAP_READ_BIT | GL_MAP_WRITE_BIT);
337      }
338   }
339}
340
341void
342intel_unmap_vertex_shader_textures(struct gl_context *ctx)
343{
344   struct intel_context *intel = intel_context(ctx);
345   int i;
346
347   if (ctx->VertexProgram._Current == NULL)
348      return;
349
350   for (i = 0; i < ctx->Const.MaxTextureImageUnits; i++) {
351      if (ctx->Texture.Unit[i]._ReallyEnabled &&
352	  ctx->VertexProgram._Current->Base.TexturesUsed[i] != 0) {
353         struct gl_texture_object *texObj = ctx->Texture.Unit[i]._Current;
354
355         intel_tex_unmap_images(intel, intel_texture_object(texObj));
356      }
357   }
358}
359
360typedef void (*span_init_func)(struct gl_renderbuffer *rb);
361
362static span_init_func intel_span_init_funcs[MESA_FORMAT_COUNT] =
363{
364   [MESA_FORMAT_A8] = intel_InitPointers_A8,
365   [MESA_FORMAT_RGB565] = intel_InitPointers_RGB565,
366   [MESA_FORMAT_ARGB4444] = intel_InitPointers_ARGB4444,
367   [MESA_FORMAT_ARGB1555] = intel_InitPointers_ARGB1555,
368   [MESA_FORMAT_XRGB8888] = intel_InitPointers_xRGB8888,
369   [MESA_FORMAT_ARGB8888] = intel_InitPointers_ARGB8888,
370   [MESA_FORMAT_SARGB8] = intel_InitPointers_ARGB8888,
371   [MESA_FORMAT_Z16] = _mesa_set_renderbuffer_accessors,
372   [MESA_FORMAT_X8_Z24] = _mesa_set_renderbuffer_accessors,
373   [MESA_FORMAT_S8_Z24] = _mesa_set_renderbuffer_accessors,
374   [MESA_FORMAT_S8] = _mesa_set_renderbuffer_accessors,
375   [MESA_FORMAT_R8] = _mesa_set_renderbuffer_accessors,
376   [MESA_FORMAT_RG88] = _mesa_set_renderbuffer_accessors,
377   [MESA_FORMAT_R16] = _mesa_set_renderbuffer_accessors,
378   [MESA_FORMAT_RG1616] = _mesa_set_renderbuffer_accessors,
379   [MESA_FORMAT_RGBA_FLOAT32] = _mesa_set_renderbuffer_accessors,
380   [MESA_FORMAT_RG_FLOAT32] = _mesa_set_renderbuffer_accessors,
381   [MESA_FORMAT_R_FLOAT32] = _mesa_set_renderbuffer_accessors,
382   [MESA_FORMAT_INTENSITY_FLOAT32] = _mesa_set_renderbuffer_accessors,
383   [MESA_FORMAT_LUMINANCE_FLOAT32] = _mesa_set_renderbuffer_accessors,
384};
385
386bool
387intel_span_supports_format(gl_format format)
388{
389   /* Rendering to/from integer textures will be done using MapRenderbuffer,
390    * rather than coding up new paths through GetRow/PutRow(), so claim support
391    * for those formats in here for now.
392    */
393   return (intel_span_init_funcs[format] != NULL ||
394	   _mesa_is_format_integer_color(format));
395}
396
397/**
398 * Plug in appropriate span read/write functions for the given renderbuffer.
399 * These are used for the software fallbacks.
400 */
401static void
402intel_set_span_functions(struct intel_context *intel,
403			 struct gl_renderbuffer *rb)
404{
405   struct intel_renderbuffer *irb = (struct intel_renderbuffer *) rb;
406
407   assert(intel_span_init_funcs[irb->Base.Format]);
408   intel_span_init_funcs[irb->Base.Format](rb);
409
410   if (rb->DataType == GL_NONE) {
411      _mesa_problem(NULL,
412		    "renderbuffer format %s is missing "
413		    "intel_mesa_format_to_rb_datatype() support.",
414		    _mesa_get_format_name(rb->Format));
415   }
416}
417