r300_screen.c revision 3d13b081c72626acba6b9a25baec740c60dfafe1
1/*
2 * Copyright 2008 Corbin Simpson <MostAwesomeDude@gmail.com>
3 * Copyright 2010 Marek Olšák <maraeo@gmail.com>
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * on the rights to use, copy, modify, merge, publish, distribute, sub
9 * license, and/or sell copies of the Software, and to permit persons to whom
10 * the Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
20 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
21 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
22 * USE OR OTHER DEALINGS IN THE SOFTWARE. */
23
24#include "util/u_format.h"
25#include "util/u_format_s3tc.h"
26#include "util/u_memory.h"
27#include "os/os_time.h"
28#include "vl/vl_decoder.h"
29#include "vl/vl_video_buffer.h"
30
31#include "r300_context.h"
32#include "r300_texture.h"
33#include "r300_screen_buffer.h"
34#include "r300_state_inlines.h"
35#include "r300_public.h"
36
37#include "draw/draw_context.h"
38
39/* Return the identifier behind whom the brave coders responsible for this
40 * amalgamation of code, sweat, and duct tape, routinely obscure their names.
41 *
42 * ...I should have just put "Corbin Simpson", but I'm not that cool.
43 *
44 * (Or egotistical. Yet.) */
45static const char* r300_get_vendor(struct pipe_screen* pscreen)
46{
47    return "X.Org R300 Project";
48}
49
50static const char* chip_families[] = {
51    "ATI R300",
52    "ATI R350",
53    "ATI RV350",
54    "ATI RV370",
55    "ATI RV380",
56    "ATI RS400",
57    "ATI RC410",
58    "ATI RS480",
59    "ATI R420",
60    "ATI R423",
61    "ATI R430",
62    "ATI R480",
63    "ATI R481",
64    "ATI RV410",
65    "ATI RS600",
66    "ATI RS690",
67    "ATI RS740",
68    "ATI RV515",
69    "ATI R520",
70    "ATI RV530",
71    "ATI R580",
72    "ATI RV560",
73    "ATI RV570"
74};
75
76static const char* r300_get_name(struct pipe_screen* pscreen)
77{
78    struct r300_screen* r300screen = r300_screen(pscreen);
79
80    return chip_families[r300screen->caps.family];
81}
82
83static int r300_get_param(struct pipe_screen* pscreen, enum pipe_cap param)
84{
85    struct r300_screen* r300screen = r300_screen(pscreen);
86    boolean is_r500 = r300screen->caps.is_r500;
87
88    switch (param) {
89        /* Supported features (boolean caps). */
90        case PIPE_CAP_NPOT_TEXTURES:
91        case PIPE_CAP_TWO_SIDED_STENCIL:
92        case PIPE_CAP_GLSL:
93            /* I'll be frank. This is a lie.
94             *
95             * We don't truly support GLSL on any of this driver's chipsets.
96             * To be fair, no chipset supports the full GLSL specification
97             * to the best of our knowledge, but some of the less esoteric
98             * features are still missing here.
99             *
100             * Rather than cripple ourselves intentionally, I'm going to set
101             * this flag, and as Gallium's interface continues to change, I
102             * hope that this single monolithic GLSL enable can slowly get
103             * split down into many different pieces and the state tracker
104             * will handle fallbacks transparently, like it should.
105             *
106             * ~ C.
107             */
108        case PIPE_CAP_ANISOTROPIC_FILTER:
109        case PIPE_CAP_POINT_SPRITE:
110        case PIPE_CAP_OCCLUSION_QUERY:
111        case PIPE_CAP_TEXTURE_SHADOW_MAP:
112        case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
113        case PIPE_CAP_BLEND_EQUATION_SEPARATE:
114        case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
115        case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
116        case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
117        case PIPE_CAP_CONDITIONAL_RENDER:
118            return 1;
119
120        /* r300 cannot do swizzling of compressed textures. Supported otherwise. */
121        case PIPE_CAP_TEXTURE_SWIZZLE:
122            return util_format_s3tc_enabled ? r300screen->caps.dxtc_swizzle : 1;
123
124        /* Supported on r500 only. */
125        case PIPE_CAP_FRAGMENT_COLOR_CLAMP_CONTROL:
126        case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
127        case PIPE_CAP_SM3:
128            return is_r500 ? 1 : 0;
129
130        /* Unsupported features. */
131        case PIPE_CAP_TIMER_QUERY:
132        case PIPE_CAP_DUAL_SOURCE_BLEND:
133        case PIPE_CAP_INDEP_BLEND_ENABLE:
134        case PIPE_CAP_INDEP_BLEND_FUNC:
135        case PIPE_CAP_DEPTH_CLAMP:
136        case PIPE_CAP_DEPTHSTENCIL_CLEAR_SEPARATE:
137        case PIPE_CAP_SHADER_STENCIL_EXPORT:
138        case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
139        case PIPE_CAP_TGSI_INSTANCEID:
140        case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
141        case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
142        case PIPE_CAP_SEAMLESS_CUBE_MAP:
143        case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
144        case PIPE_CAP_SCALED_RESOLVE:
145        case PIPE_CAP_MIN_TEXEL_OFFSET:
146        case PIPE_CAP_MAX_TEXEL_OFFSET:
147            return 0;
148
149        /* SWTCL-only features. */
150        case PIPE_CAP_STREAM_OUTPUT:
151        case PIPE_CAP_PRIMITIVE_RESTART:
152            return !r300screen->caps.has_tcl;
153
154        /* Texturing. */
155        case PIPE_CAP_MAX_COMBINED_SAMPLERS:
156            return r300screen->caps.num_tex_units;
157        case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
158        case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
159        case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
160            /* 13 == 4096, 12 == 2048 */
161            return is_r500 ? 13 : 12;
162
163        /* Render targets. */
164        case PIPE_CAP_MAX_RENDER_TARGETS:
165            return 4;
166
167        default:
168            debug_printf("r300: Warning: Unknown CAP %d in get_param.\n",
169                         param);
170            return 0;
171    }
172}
173
174static int r300_get_shader_param(struct pipe_screen *pscreen, unsigned shader, enum pipe_shader_cap param)
175{
176   struct r300_screen* r300screen = r300_screen(pscreen);
177   boolean is_r400 = r300screen->caps.is_r400;
178   boolean is_r500 = r300screen->caps.is_r500;
179
180   switch (shader)
181    {
182    case PIPE_SHADER_FRAGMENT:
183        switch (param)
184        {
185        case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
186            return is_r500 || is_r400 ? 512 : 96;
187        case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
188            return is_r500 || is_r400 ? 512 : 64;
189        case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
190            return is_r500 || is_r400 ? 512 : 32;
191        case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
192            return is_r500 ? 511 : 4;
193        case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
194            return is_r500 ? 64 : 0; /* Actually unlimited on r500. */
195            /* Fragment shader limits. */
196        case PIPE_SHADER_CAP_MAX_INPUTS:
197            /* 2 colors + 8 texcoords are always supported
198             * (minus fog and wpos).
199             *
200             * R500 has the ability to turn 3rd and 4th color into
201             * additional texcoords but there is no two-sided color
202             * selection then. However the facing bit can be used instead. */
203            return 10;
204        case PIPE_SHADER_CAP_MAX_CONSTS:
205            return is_r500 ? 256 : 32;
206        case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
207            return 1;
208        case PIPE_SHADER_CAP_MAX_TEMPS:
209            return is_r500 ? 128 : is_r400 ? 64 : 32;
210        case PIPE_SHADER_CAP_MAX_ADDRS:
211            return 0;
212        case PIPE_SHADER_CAP_MAX_PREDS:
213            return is_r500 ? 1 : 0;
214        case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
215        case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
216        case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
217        case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
218        case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
219        case PIPE_SHADER_CAP_SUBROUTINES:
220        case PIPE_SHADER_CAP_INTEGERS:
221            return 0;
222        case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
223           return r300screen->caps.num_tex_units;
224        }
225        break;
226    case PIPE_SHADER_VERTEX:
227        if (!r300screen->caps.has_tcl) {
228            return draw_get_shader_param(shader, param);
229        }
230
231        switch (param)
232        {
233        case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
234        case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
235            return is_r500 ? 1024 : 256;
236        case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
237        case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
238            return 0;
239        case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
240            return is_r500 ? 4 : 0; /* For loops; not sure about conditionals. */
241        case PIPE_SHADER_CAP_MAX_INPUTS:
242            return 16;
243        case PIPE_SHADER_CAP_MAX_CONSTS:
244            return 256;
245        case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
246            return 1;
247        case PIPE_SHADER_CAP_MAX_TEMPS:
248            return 32;
249        case PIPE_SHADER_CAP_MAX_ADDRS:
250            return 1; /* XXX guessed */
251        case PIPE_SHADER_CAP_MAX_PREDS:
252            return is_r500 ? 4 : 0; /* XXX guessed. */
253        case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
254            return 1;
255        case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
256        case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
257        case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
258        case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
259        case PIPE_SHADER_CAP_SUBROUTINES:
260        case PIPE_SHADER_CAP_INTEGERS:
261        case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
262            return 0;
263        }
264        break;
265    default:
266        break;
267    }
268    return 0;
269}
270
271static float r300_get_paramf(struct pipe_screen* pscreen, enum pipe_cap param)
272{
273    struct r300_screen* r300screen = r300_screen(pscreen);
274
275    switch (param) {
276        case PIPE_CAP_MAX_LINE_WIDTH:
277        case PIPE_CAP_MAX_LINE_WIDTH_AA:
278        case PIPE_CAP_MAX_POINT_WIDTH:
279        case PIPE_CAP_MAX_POINT_WIDTH_AA:
280            /* The maximum dimensions of the colorbuffer are our practical
281             * rendering limits. 2048 pixels should be enough for anybody. */
282            if (r300screen->caps.is_r500) {
283                return 4096.0f;
284            } else if (r300screen->caps.is_r400) {
285                return 4021.0f;
286            } else {
287                return 2560.0f;
288            }
289        case PIPE_CAP_MAX_TEXTURE_ANISOTROPY:
290            return 16.0f;
291        case PIPE_CAP_MAX_TEXTURE_LOD_BIAS:
292            return 16.0f;
293        case PIPE_CAP_GUARD_BAND_LEFT:
294        case PIPE_CAP_GUARD_BAND_TOP:
295        case PIPE_CAP_GUARD_BAND_RIGHT:
296        case PIPE_CAP_GUARD_BAND_BOTTOM:
297            /* XXX I don't know what these should be but the least we can do is
298             * silence the potential error message */
299            return 0.0f;
300        default:
301            debug_printf("r300: Warning: Unknown CAP %d in get_paramf.\n",
302                         param);
303            return 0.0f;
304    }
305}
306
307static int r300_get_video_param(struct pipe_screen *screen,
308				enum pipe_video_profile profile,
309				enum pipe_video_cap param)
310{
311   switch (param) {
312      case PIPE_VIDEO_CAP_SUPPORTED:
313         return vl_profile_supported(screen, profile);
314      case PIPE_VIDEO_CAP_NPOT_TEXTURES:
315         return 0;
316      case PIPE_VIDEO_CAP_MAX_WIDTH:
317      case PIPE_VIDEO_CAP_MAX_HEIGHT:
318         return vl_video_buffer_max_size(screen);
319      case PIPE_VIDEO_CAP_NUM_BUFFERS_DESIRED:
320         return vl_num_buffers_desired(screen, profile);
321      default:
322         return 0;
323   }
324}
325
326static boolean r300_is_format_supported(struct pipe_screen* screen,
327                                        enum pipe_format format,
328                                        enum pipe_texture_target target,
329                                        unsigned sample_count,
330                                        unsigned usage)
331{
332    uint32_t retval = 0;
333    boolean drm_2_8_0 = r300_screen(screen)->info.drm_minor >= 8;
334    boolean is_r500 = r300_screen(screen)->caps.is_r500;
335    boolean is_r400 = r300_screen(screen)->caps.is_r400;
336    boolean is_color2101010 = format == PIPE_FORMAT_R10G10B10A2_UNORM ||
337                              format == PIPE_FORMAT_R10G10B10X2_SNORM ||
338                              format == PIPE_FORMAT_B10G10R10A2_UNORM ||
339                              format == PIPE_FORMAT_R10SG10SB10SA2U_NORM;
340    boolean is_ati1n = format == PIPE_FORMAT_RGTC1_UNORM ||
341                       format == PIPE_FORMAT_RGTC1_SNORM ||
342                       format == PIPE_FORMAT_LATC1_UNORM ||
343                       format == PIPE_FORMAT_LATC1_SNORM;
344    boolean is_ati2n = format == PIPE_FORMAT_RGTC2_UNORM ||
345                       format == PIPE_FORMAT_RGTC2_SNORM ||
346                       format == PIPE_FORMAT_LATC2_UNORM ||
347                       format == PIPE_FORMAT_LATC2_SNORM;
348    boolean is_x16f_xy16f = format == PIPE_FORMAT_R16_FLOAT ||
349                            format == PIPE_FORMAT_R16G16_FLOAT ||
350                            format == PIPE_FORMAT_A16_FLOAT ||
351                            format == PIPE_FORMAT_L16_FLOAT ||
352                            format == PIPE_FORMAT_L16A16_FLOAT ||
353                            format == PIPE_FORMAT_I16_FLOAT;
354    boolean is_half_float = format == PIPE_FORMAT_R16_FLOAT ||
355                            format == PIPE_FORMAT_R16G16_FLOAT ||
356                            format == PIPE_FORMAT_R16G16B16_FLOAT ||
357                            format == PIPE_FORMAT_R16G16B16A16_FLOAT;
358
359    if (!util_format_is_supported(format, usage))
360       return FALSE;
361
362    /* Check multisampling support. */
363    switch (sample_count) {
364        case 0:
365        case 1:
366            break;
367        case 2:
368        case 3:
369        case 4:
370        case 6:
371            return FALSE;
372#if 0
373            if (usage != PIPE_BIND_RENDER_TARGET ||
374                !util_format_is_rgba8_variant(
375                    util_format_description(format))) {
376                return FALSE;
377            }
378#endif
379            break;
380        default:
381            return FALSE;
382    }
383
384    /* Check sampler format support. */
385    if ((usage & PIPE_BIND_SAMPLER_VIEW) &&
386        /* ATI1N is r5xx-only. */
387        (is_r500 || !is_ati1n) &&
388        /* ATI2N is supported on r4xx-r5xx. */
389        (is_r400 || is_r500 || !is_ati2n) &&
390        /* R16F and RG16F texture support was added in as late as DRM 2.8.0 */
391        (drm_2_8_0 || !is_x16f_xy16f) &&
392        r300_is_sampler_format_supported(format)) {
393        retval |= PIPE_BIND_SAMPLER_VIEW;
394    }
395
396    /* Check colorbuffer format support. */
397    if ((usage & (PIPE_BIND_RENDER_TARGET |
398                  PIPE_BIND_DISPLAY_TARGET |
399                  PIPE_BIND_SCANOUT |
400                  PIPE_BIND_SHARED)) &&
401        /* 2101010 cannot be rendered to on non-r5xx. */
402        (!is_color2101010 || (is_r500 && drm_2_8_0)) &&
403        r300_is_colorbuffer_format_supported(format)) {
404        retval |= usage &
405            (PIPE_BIND_RENDER_TARGET |
406             PIPE_BIND_DISPLAY_TARGET |
407             PIPE_BIND_SCANOUT |
408             PIPE_BIND_SHARED);
409    }
410
411    /* Check depth-stencil format support. */
412    if (usage & PIPE_BIND_DEPTH_STENCIL &&
413        r300_is_zs_format_supported(format)) {
414        retval |= PIPE_BIND_DEPTH_STENCIL;
415    }
416
417    /* Check vertex buffer format support. */
418    if (usage & PIPE_BIND_VERTEX_BUFFER &&
419        /* Half float is supported on >= RV350. */
420        (is_r400 || is_r500 || !is_half_float) &&
421        r300_translate_vertex_data_type(format) != R300_INVALID_FORMAT) {
422        retval |= PIPE_BIND_VERTEX_BUFFER;
423    }
424
425    /* Transfers are always supported. */
426    if (usage & PIPE_BIND_TRANSFER_READ)
427        retval |= PIPE_BIND_TRANSFER_READ;
428    if (usage & PIPE_BIND_TRANSFER_WRITE)
429        retval |= PIPE_BIND_TRANSFER_WRITE;
430
431    return retval == usage;
432}
433
434static void r300_destroy_screen(struct pipe_screen* pscreen)
435{
436    struct r300_screen* r300screen = r300_screen(pscreen);
437    struct radeon_winsys *rws = radeon_winsys(pscreen);
438
439    util_slab_destroy(&r300screen->pool_buffers);
440    pipe_mutex_destroy(r300screen->num_contexts_mutex);
441
442    if (rws)
443      rws->destroy(rws);
444
445    FREE(r300screen);
446}
447
448static void r300_fence_reference(struct pipe_screen *screen,
449                                 struct pipe_fence_handle **ptr,
450                                 struct pipe_fence_handle *fence)
451{
452    pb_reference((struct pb_buffer**)ptr,
453                             (struct pb_buffer*)fence);
454}
455
456static boolean r300_fence_signalled(struct pipe_screen *screen,
457                                    struct pipe_fence_handle *fence)
458{
459    struct radeon_winsys *rws = r300_screen(screen)->rws;
460    struct pb_buffer *rfence = (struct pb_buffer*)fence;
461
462    return !rws->buffer_is_busy(rfence, RADEON_USAGE_READWRITE);
463}
464
465static boolean r300_fence_finish(struct pipe_screen *screen,
466                                 struct pipe_fence_handle *fence,
467                                 uint64_t timeout)
468{
469    struct radeon_winsys *rws = r300_screen(screen)->rws;
470    struct pb_buffer *rfence = (struct pb_buffer*)fence;
471
472    if (timeout != PIPE_TIMEOUT_INFINITE) {
473        int64_t start_time = os_time_get();
474
475        /* Convert to microseconds. */
476        timeout /= 1000;
477
478        /* Wait in a loop. */
479        while (rws->buffer_is_busy(rfence, RADEON_USAGE_READWRITE)) {
480            if (os_time_get() - start_time >= timeout) {
481                return FALSE;
482            }
483            os_time_sleep(10);
484        }
485        return TRUE;
486    }
487
488    rws->buffer_wait(rfence, RADEON_USAGE_READWRITE);
489    return TRUE;
490}
491
492struct pipe_screen* r300_screen_create(struct radeon_winsys *rws)
493{
494    struct r300_screen *r300screen = CALLOC_STRUCT(r300_screen);
495
496    if (!r300screen) {
497        FREE(r300screen);
498        return NULL;
499    }
500
501    rws->query_info(rws, &r300screen->info);
502
503    r300_init_debug(r300screen);
504    r300_parse_chipset(r300screen->info.pci_id, &r300screen->caps);
505
506    if (SCREEN_DBG_ON(r300screen, DBG_NO_ZMASK))
507        r300screen->caps.zmask_ram = 0;
508    if (SCREEN_DBG_ON(r300screen, DBG_NO_HIZ))
509        r300screen->caps.hiz_ram = 0;
510
511    if (r300screen->info.drm_minor < 8)
512        r300screen->caps.has_us_format = FALSE;
513
514    pipe_mutex_init(r300screen->num_contexts_mutex);
515
516    util_slab_create(&r300screen->pool_buffers,
517                     sizeof(struct r300_resource), 64,
518                     UTIL_SLAB_SINGLETHREADED);
519
520    r300screen->rws = rws;
521    r300screen->screen.winsys = (struct pipe_winsys*)rws;
522    r300screen->screen.destroy = r300_destroy_screen;
523    r300screen->screen.get_name = r300_get_name;
524    r300screen->screen.get_vendor = r300_get_vendor;
525    r300screen->screen.get_param = r300_get_param;
526    r300screen->screen.get_shader_param = r300_get_shader_param;
527    r300screen->screen.get_paramf = r300_get_paramf;
528    r300screen->screen.get_video_param = r300_get_video_param;
529    r300screen->screen.is_format_supported = r300_is_format_supported;
530    r300screen->screen.is_video_format_supported = vl_video_buffer_is_format_supported;
531    r300screen->screen.context_create = r300_create_context;
532    r300screen->screen.fence_reference = r300_fence_reference;
533    r300screen->screen.fence_signalled = r300_fence_signalled;
534    r300screen->screen.fence_finish = r300_fence_finish;
535
536    r300_init_screen_resource_functions(r300screen);
537
538    util_format_s3tc_init();
539
540    return &r300screen->screen;
541}
542