intel_span.c revision da2816a45e6e3a33246a341fee72e6f893f315d9
1/************************************************************************** 2 * 3 * Copyright 2003 Tungsten Graphics, Inc., Cedar Park, Texas. 4 * Copyright 2011 Intel Corporation 5 * All Rights Reserved. 6 * 7 * Permission is hereby granted, free of charge, to any person obtaining a 8 * copy of this software and associated documentation files (the 9 * "Software"), to deal in the Software without restriction, including 10 * without limitation the rights to use, copy, modify, merge, publish, 11 * distribute, sub license, and/or sell copies of the Software, and to 12 * permit persons to whom the Software is furnished to do so, subject to 13 * the following conditions: 14 * 15 * The above copyright notice and this permission notice (including the 16 * next paragraph) shall be included in all copies or substantial portions 17 * of the Software. 18 * 19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS 20 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 21 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. 22 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR 23 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, 24 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE 25 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. 26 * 27 * Authors: 28 * Chad Versace <chad@chad-versace.us> 29 * 30 **************************************************************************/ 31 32#include <stdbool.h> 33#include <stdint.h> 34#include "main/glheader.h" 35#include "main/macros.h" 36#include "main/mtypes.h" 37#include "main/colormac.h" 38#include "main/renderbuffer.h" 39 40#include "intel_buffers.h" 41#include "intel_fbo.h" 42#include "intel_mipmap_tree.h" 43#include "intel_screen.h" 44#include "intel_span.h" 45#include "intel_regions.h" 46#include "intel_tex.h" 47 48#include "swrast/swrast.h" 49 50static void 51intel_set_span_functions(struct intel_context *intel, 52 struct gl_renderbuffer *rb); 53 54#undef DBG 55#define DBG 0 56 57#define LOCAL_VARS \ 58 struct intel_renderbuffer *irb = intel_renderbuffer(rb); \ 59 int minx = 0, miny = 0; \ 60 int maxx = rb->Width; \ 61 int maxy = rb->Height; \ 62 int pitch = rb->RowStride * irb->mt->region->cpp; \ 63 void *buf = rb->Data; \ 64 GLuint p; \ 65 (void) p; 66 67#define HW_CLIPLOOP() 68#define HW_ENDCLIPLOOP() 69 70#define Y_FLIP(_y) (_y) 71 72#define HW_LOCK() 73 74#define HW_UNLOCK() 75 76/* r5g6b5 color span and pixel functions */ 77#define SPANTMP_PIXEL_FMT GL_RGB 78#define SPANTMP_PIXEL_TYPE GL_UNSIGNED_SHORT_5_6_5 79#define TAG(x) intel_##x##_RGB565 80#define TAG2(x,y) intel_##x##y_RGB565 81#include "spantmp2.h" 82 83/* a4r4g4b4 color span and pixel functions */ 84#define SPANTMP_PIXEL_FMT GL_BGRA 85#define SPANTMP_PIXEL_TYPE GL_UNSIGNED_SHORT_4_4_4_4_REV 86#define TAG(x) intel_##x##_ARGB4444 87#define TAG2(x,y) intel_##x##y_ARGB4444 88#include "spantmp2.h" 89 90/* a1r5g5b5 color span and pixel functions */ 91#define SPANTMP_PIXEL_FMT GL_BGRA 92#define SPANTMP_PIXEL_TYPE GL_UNSIGNED_SHORT_1_5_5_5_REV 93#define TAG(x) intel_##x##_ARGB1555 94#define TAG2(x,y) intel_##x##y##_ARGB1555 95#include "spantmp2.h" 96 97/* a8r8g8b8 color span and pixel functions */ 98#define SPANTMP_PIXEL_FMT GL_BGRA 99#define SPANTMP_PIXEL_TYPE GL_UNSIGNED_INT_8_8_8_8_REV 100#define TAG(x) intel_##x##_ARGB8888 101#define TAG2(x,y) intel_##x##y##_ARGB8888 102#include "spantmp2.h" 103 104/* x8r8g8b8 color span and pixel functions */ 105#define SPANTMP_PIXEL_FMT GL_BGR 106#define SPANTMP_PIXEL_TYPE GL_UNSIGNED_INT_8_8_8_8_REV 107#define TAG(x) intel_##x##_xRGB8888 108#define TAG2(x,y) intel_##x##y##_xRGB8888 109#include "spantmp2.h" 110 111/* a8 color span and pixel functions */ 112#define SPANTMP_PIXEL_FMT GL_ALPHA 113#define SPANTMP_PIXEL_TYPE GL_UNSIGNED_BYTE 114#define TAG(x) intel_##x##_A8 115#define TAG2(x,y) intel_##x##y##_A8 116#include "spantmp2.h" 117 118/** 119 * \brief Get pointer offset into stencil buffer. 120 * 121 * The stencil buffer is W tiled. Since the GTT is incapable of W fencing, we 122 * must decode the tile's layout in software. 123 * 124 * See 125 * - PRM, 2011 Sandy Bridge, Volume 1, Part 2, Section 4.5.2.1 W-Major Tile 126 * Format. 127 * - PRM, 2011 Sandy Bridge, Volume 1, Part 2, Section 4.5.3 Tiling Algorithm 128 * 129 * Even though the returned offset is always positive, the return type is 130 * signed due to 131 * commit e8b1c6d6f55f5be3bef25084fdd8b6127517e137 132 * mesa: Fix return type of _mesa_get_format_bytes() (#37351) 133 */ 134intptr_t 135intel_offset_S8(uint32_t stride, uint32_t x, uint32_t y) 136{ 137 uint32_t tile_size = 4096; 138 uint32_t tile_width = 64; 139 uint32_t tile_height = 64; 140 uint32_t row_size = 64 * stride; 141 142 uint32_t tile_x = x / tile_width; 143 uint32_t tile_y = y / tile_height; 144 145 /* The byte's address relative to the tile's base addres. */ 146 uint32_t byte_x = x % tile_width; 147 uint32_t byte_y = y % tile_height; 148 149 uintptr_t u = tile_y * row_size 150 + tile_x * tile_size 151 + 512 * (byte_x / 8) 152 + 64 * (byte_y / 8) 153 + 32 * ((byte_y / 4) % 2) 154 + 16 * ((byte_x / 4) % 2) 155 + 8 * ((byte_y / 2) % 2) 156 + 4 * ((byte_x / 2) % 2) 157 + 2 * (byte_y % 2) 158 + 1 * (byte_x % 2); 159 160 /* 161 * Errata for Gen5: 162 * 163 * An additional offset is needed which is not documented in the PRM. 164 * 165 * if ((byte_x / 8) % 2 == 1) { 166 * if ((byte_y / 8) % 2) == 0) { 167 * u += 64; 168 * } else { 169 * u -= 64; 170 * } 171 * } 172 * 173 * The offset is expressed more tersely as 174 * u += ((int) x & 0x8) * (8 - (((int) y & 0x8) << 1)); 175 */ 176 177 return u; 178} 179 180void 181intel_renderbuffer_map(struct intel_context *intel, struct gl_renderbuffer *rb) 182{ 183 struct gl_context *ctx = &intel->ctx; 184 struct intel_renderbuffer *irb = intel_renderbuffer(rb); 185 GLubyte *map; 186 int stride; 187 188 if (!irb) 189 return; 190 191 if (rb->Data) { 192 /* Renderbuffer is already mapped. This usually happens when a single 193 * buffer is attached to the framebuffer's depth and stencil attachment 194 * points. 195 */ 196 return; 197 } 198 199 ctx->Driver.MapRenderbuffer(ctx, rb, 0, 0, rb->Width, rb->Height, 200 GL_MAP_READ_BIT | GL_MAP_WRITE_BIT, 201 &map, &stride); 202 rb->Data = map; 203 rb->RowStride = stride / _mesa_get_format_bytes(rb->Format); 204 205 intel_set_span_functions(intel, rb); 206} 207 208void 209intel_renderbuffer_unmap(struct intel_context *intel, 210 struct gl_renderbuffer *rb) 211{ 212 struct gl_context *ctx = &intel->ctx; 213 struct intel_renderbuffer *irb = intel_renderbuffer(rb); 214 215 if (!irb) 216 return; 217 218 if (!rb->Data) { 219 /* Renderbuffer is already unmapped. This usually happens when a single 220 * buffer is attached to the framebuffer's depth and stencil attachment 221 * points. 222 */ 223 return; 224 } 225 226 ctx->Driver.UnmapRenderbuffer(ctx, rb); 227 228 rb->GetRow = NULL; 229 rb->PutRow = NULL; 230 rb->Data = NULL; 231 rb->RowStride = 0; 232} 233 234static void 235intel_framebuffer_map(struct intel_context *intel, struct gl_framebuffer *fb) 236{ 237 int i; 238 239 for (i = 0; i < BUFFER_COUNT; i++) { 240 intel_renderbuffer_map(intel, fb->Attachment[i].Renderbuffer); 241 } 242 243 intel_check_front_buffer_rendering(intel); 244} 245 246static void 247intel_framebuffer_unmap(struct intel_context *intel, struct gl_framebuffer *fb) 248{ 249 int i; 250 251 for (i = 0; i < BUFFER_COUNT; i++) { 252 intel_renderbuffer_unmap(intel, fb->Attachment[i].Renderbuffer); 253 } 254} 255 256/** 257 * Prepare for software rendering. Map current read/draw framebuffers' 258 * renderbuffes and all currently bound texture objects. 259 * 260 * Old note: Moved locking out to get reasonable span performance. 261 */ 262void 263intelSpanRenderStart(struct gl_context * ctx) 264{ 265 struct intel_context *intel = intel_context(ctx); 266 GLuint i; 267 268 intel_flush(&intel->ctx); 269 intel_prepare_render(intel); 270 271 for (i = 0; i < ctx->Const.MaxTextureImageUnits; i++) { 272 if (ctx->Texture.Unit[i]._ReallyEnabled) { 273 struct gl_texture_object *texObj = ctx->Texture.Unit[i]._Current; 274 275 intel_finalize_mipmap_tree(intel, i); 276 intel_tex_map_images(intel, intel_texture_object(texObj), 277 GL_MAP_READ_BIT | GL_MAP_WRITE_BIT); 278 } 279 } 280 281 intel_framebuffer_map(intel, ctx->DrawBuffer); 282 if (ctx->ReadBuffer != ctx->DrawBuffer) { 283 intel_framebuffer_map(intel, ctx->ReadBuffer); 284 } 285} 286 287/** 288 * Called when done software rendering. Unmap the buffers we mapped in 289 * the above function. 290 */ 291void 292intelSpanRenderFinish(struct gl_context * ctx) 293{ 294 struct intel_context *intel = intel_context(ctx); 295 GLuint i; 296 297 _swrast_flush(ctx); 298 299 for (i = 0; i < ctx->Const.MaxTextureImageUnits; i++) { 300 if (ctx->Texture.Unit[i]._ReallyEnabled) { 301 struct gl_texture_object *texObj = ctx->Texture.Unit[i]._Current; 302 intel_tex_unmap_images(intel, intel_texture_object(texObj)); 303 } 304 } 305 306 intel_framebuffer_unmap(intel, ctx->DrawBuffer); 307 if (ctx->ReadBuffer != ctx->DrawBuffer) { 308 intel_framebuffer_unmap(intel, ctx->ReadBuffer); 309 } 310} 311 312 313void 314intelInitSpanFuncs(struct gl_context * ctx) 315{ 316 struct swrast_device_driver *swdd = _swrast_GetDeviceDriverReference(ctx); 317 swdd->SpanRenderStart = intelSpanRenderStart; 318 swdd->SpanRenderFinish = intelSpanRenderFinish; 319} 320 321void 322intel_map_vertex_shader_textures(struct gl_context *ctx) 323{ 324 struct intel_context *intel = intel_context(ctx); 325 int i; 326 327 if (ctx->VertexProgram._Current == NULL) 328 return; 329 330 for (i = 0; i < ctx->Const.MaxTextureImageUnits; i++) { 331 if (ctx->Texture.Unit[i]._ReallyEnabled && 332 ctx->VertexProgram._Current->Base.TexturesUsed[i] != 0) { 333 struct gl_texture_object *texObj = ctx->Texture.Unit[i]._Current; 334 335 intel_tex_map_images(intel, intel_texture_object(texObj), 336 GL_MAP_READ_BIT | GL_MAP_WRITE_BIT); 337 } 338 } 339} 340 341void 342intel_unmap_vertex_shader_textures(struct gl_context *ctx) 343{ 344 struct intel_context *intel = intel_context(ctx); 345 int i; 346 347 if (ctx->VertexProgram._Current == NULL) 348 return; 349 350 for (i = 0; i < ctx->Const.MaxTextureImageUnits; i++) { 351 if (ctx->Texture.Unit[i]._ReallyEnabled && 352 ctx->VertexProgram._Current->Base.TexturesUsed[i] != 0) { 353 struct gl_texture_object *texObj = ctx->Texture.Unit[i]._Current; 354 355 intel_tex_unmap_images(intel, intel_texture_object(texObj)); 356 } 357 } 358} 359 360typedef void (*span_init_func)(struct gl_renderbuffer *rb); 361 362static span_init_func intel_span_init_funcs[MESA_FORMAT_COUNT] = 363{ 364 [MESA_FORMAT_A8] = intel_InitPointers_A8, 365 [MESA_FORMAT_RGB565] = intel_InitPointers_RGB565, 366 [MESA_FORMAT_ARGB4444] = intel_InitPointers_ARGB4444, 367 [MESA_FORMAT_ARGB1555] = intel_InitPointers_ARGB1555, 368 [MESA_FORMAT_XRGB8888] = intel_InitPointers_xRGB8888, 369 [MESA_FORMAT_ARGB8888] = intel_InitPointers_ARGB8888, 370 [MESA_FORMAT_SARGB8] = intel_InitPointers_ARGB8888, 371 [MESA_FORMAT_Z16] = _mesa_set_renderbuffer_accessors, 372 [MESA_FORMAT_X8_Z24] = _mesa_set_renderbuffer_accessors, 373 [MESA_FORMAT_S8_Z24] = _mesa_set_renderbuffer_accessors, 374 [MESA_FORMAT_S8] = _mesa_set_renderbuffer_accessors, 375 [MESA_FORMAT_R8] = _mesa_set_renderbuffer_accessors, 376 [MESA_FORMAT_RG88] = _mesa_set_renderbuffer_accessors, 377 [MESA_FORMAT_R16] = _mesa_set_renderbuffer_accessors, 378 [MESA_FORMAT_RG1616] = _mesa_set_renderbuffer_accessors, 379 [MESA_FORMAT_RGBA_FLOAT32] = _mesa_set_renderbuffer_accessors, 380 [MESA_FORMAT_RG_FLOAT32] = _mesa_set_renderbuffer_accessors, 381 [MESA_FORMAT_R_FLOAT32] = _mesa_set_renderbuffer_accessors, 382 [MESA_FORMAT_INTENSITY_FLOAT32] = _mesa_set_renderbuffer_accessors, 383 [MESA_FORMAT_LUMINANCE_FLOAT32] = _mesa_set_renderbuffer_accessors, 384}; 385 386bool 387intel_span_supports_format(gl_format format) 388{ 389 /* Rendering to/from integer textures will be done using MapRenderbuffer, 390 * rather than coding up new paths through GetRow/PutRow(), so claim support 391 * for those formats in here for now. 392 */ 393 return (intel_span_init_funcs[format] != NULL || 394 _mesa_is_format_integer_color(format)); 395} 396 397/** 398 * Plug in appropriate span read/write functions for the given renderbuffer. 399 * These are used for the software fallbacks. 400 */ 401static void 402intel_set_span_functions(struct intel_context *intel, 403 struct gl_renderbuffer *rb) 404{ 405 struct intel_renderbuffer *irb = (struct intel_renderbuffer *) rb; 406 407 assert(intel_span_init_funcs[irb->Base.Format]); 408 intel_span_init_funcs[irb->Base.Format](rb); 409 410 if (rb->DataType == GL_NONE) { 411 _mesa_problem(NULL, 412 "renderbuffer format %s is missing " 413 "intel_mesa_format_to_rb_datatype() support.", 414 _mesa_get_format_name(rb->Format)); 415 } 416} 417