r300_screen.c revision 684d74e0009c01773e13f476676c0c575f73c615
1/*
2 * Copyright 2008 Corbin Simpson <MostAwesomeDude@gmail.com>
3 * Copyright 2010 Marek Olšák <maraeo@gmail.com>
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * on the rights to use, copy, modify, merge, publish, distribute, sub
9 * license, and/or sell copies of the Software, and to permit persons to whom
10 * the Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
20 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
21 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
22 * USE OR OTHER DEALINGS IN THE SOFTWARE. */
23
24#include "util/u_format.h"
25#include "util/u_format_s3tc.h"
26#include "util/u_memory.h"
27#include "os/os_time.h"
28#include "vl/vl_decoder.h"
29#include "vl/vl_video_buffer.h"
30
31#include "r300_context.h"
32#include "r300_texture.h"
33#include "r300_screen_buffer.h"
34#include "r300_state_inlines.h"
35#include "r300_public.h"
36
37#include "draw/draw_context.h"
38
/* Report the vendor string for this driver.
 *
 * The screen argument is not consulted: every r300 screen answers with the
 * same collective project name rather than the name of any single author. */
static const char* r300_get_vendor(struct pipe_screen* pscreen)
{
    static const char vendor_name[] = "X.Org R300 Project";

    (void)pscreen;
    return vendor_name;
}
49
/* Human-readable chip names. r300_get_name() indexes this table with the
 * family value stored in the screen's caps, so the order of the entries is
 * significant (presumably it mirrors the chip family enumeration declared
 * elsewhere -- keep the two in sync when adding a chip).
 *
 * Both the strings and the pointers to them are const: the table is pure
 * read-only lookup data and must never be modified at run time. */
static const char* const chip_families[] = {
    "ATI R300",
    "ATI R350",
    "ATI RV350",
    "ATI RV370",
    "ATI RV380",
    "ATI RS400",
    "ATI RC410",
    "ATI RS480",
    "ATI R420",
    "ATI R423",
    "ATI R430",
    "ATI R480",
    "ATI R481",
    "ATI RV410",
    "ATI RS600",
    "ATI RS690",
    "ATI RS740",
    "ATI RV515",
    "ATI R520",
    "ATI RV530",
    "ATI R580",
    "ATI RV560",
    "ATI RV570"
};
75
76static const char* r300_get_name(struct pipe_screen* pscreen)
77{
78    struct r300_screen* r300screen = r300_screen(pscreen);
79
80    return chip_families[r300screen->caps.family];
81}
82
83static int r300_get_param(struct pipe_screen* pscreen, enum pipe_cap param)
84{
85    struct r300_screen* r300screen = r300_screen(pscreen);
86    boolean is_r500 = r300screen->caps.is_r500;
87
88    switch (param) {
89        /* Supported features (boolean caps). */
90        case PIPE_CAP_NPOT_TEXTURES:
91        case PIPE_CAP_TWO_SIDED_STENCIL:
92        case PIPE_CAP_ANISOTROPIC_FILTER:
93        case PIPE_CAP_POINT_SPRITE:
94        case PIPE_CAP_OCCLUSION_QUERY:
95        case PIPE_CAP_TEXTURE_SHADOW_MAP:
96        case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
97        case PIPE_CAP_BLEND_EQUATION_SEPARATE:
98        case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
99        case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
100        case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
101        case PIPE_CAP_CONDITIONAL_RENDER:
102        case PIPE_CAP_TEXTURE_BARRIER:
103            return 1;
104
105        /* r300 cannot do swizzling of compressed textures. Supported otherwise. */
106        case PIPE_CAP_TEXTURE_SWIZZLE:
107            return util_format_s3tc_enabled ? r300screen->caps.dxtc_swizzle : 1;
108
109        /* Supported on r500 only. */
110        case PIPE_CAP_FRAGMENT_COLOR_CLAMP_CONTROL:
111        case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
112        case PIPE_CAP_SM3:
113            return is_r500 ? 1 : 0;
114
115        /* Unsupported features. */
116        case PIPE_CAP_TIMER_QUERY:
117        case PIPE_CAP_DUAL_SOURCE_BLEND:
118        case PIPE_CAP_INDEP_BLEND_ENABLE:
119        case PIPE_CAP_INDEP_BLEND_FUNC:
120        case PIPE_CAP_DEPTH_CLAMP:
121        case PIPE_CAP_DEPTHSTENCIL_CLEAR_SEPARATE:
122        case PIPE_CAP_SHADER_STENCIL_EXPORT:
123        case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
124        case PIPE_CAP_TGSI_INSTANCEID:
125        case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
126        case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
127        case PIPE_CAP_SEAMLESS_CUBE_MAP:
128        case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
129        case PIPE_CAP_SCALED_RESOLVE:
130        case PIPE_CAP_MIN_TEXEL_OFFSET:
131        case PIPE_CAP_MAX_TEXEL_OFFSET:
132        case PIPE_CAP_STREAM_OUTPUT:
133            return 0;
134
135        /* SWTCL-only features. */
136        case PIPE_CAP_PRIMITIVE_RESTART:
137            return !r300screen->caps.has_tcl;
138
139        /* Texturing. */
140        case PIPE_CAP_MAX_COMBINED_SAMPLERS:
141            return r300screen->caps.num_tex_units;
142        case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
143        case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
144        case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
145            /* 13 == 4096, 12 == 2048 */
146            return is_r500 ? 13 : 12;
147
148        /* Render targets. */
149        case PIPE_CAP_MAX_RENDER_TARGETS:
150            return 4;
151    }
152    return 0;
153}
154
155static int r300_get_shader_param(struct pipe_screen *pscreen, unsigned shader, enum pipe_shader_cap param)
156{
157   struct r300_screen* r300screen = r300_screen(pscreen);
158   boolean is_r400 = r300screen->caps.is_r400;
159   boolean is_r500 = r300screen->caps.is_r500;
160
161   switch (shader) {
162    case PIPE_SHADER_FRAGMENT:
163        switch (param)
164        {
165        case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
166            return is_r500 || is_r400 ? 512 : 96;
167        case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
168            return is_r500 || is_r400 ? 512 : 64;
169        case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
170            return is_r500 || is_r400 ? 512 : 32;
171        case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
172            return is_r500 ? 511 : 4;
173        case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
174            return is_r500 ? 64 : 0; /* Actually unlimited on r500. */
175            /* Fragment shader limits. */
176        case PIPE_SHADER_CAP_MAX_INPUTS:
177            /* 2 colors + 8 texcoords are always supported
178             * (minus fog and wpos).
179             *
180             * R500 has the ability to turn 3rd and 4th color into
181             * additional texcoords but there is no two-sided color
182             * selection then. However the facing bit can be used instead. */
183            return 10;
184        case PIPE_SHADER_CAP_MAX_CONSTS:
185            return is_r500 ? 256 : 32;
186        case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
187            return 1;
188        case PIPE_SHADER_CAP_MAX_TEMPS:
189            return is_r500 ? 128 : is_r400 ? 64 : 32;
190        case PIPE_SHADER_CAP_MAX_ADDRS:
191            return 0;
192        case PIPE_SHADER_CAP_MAX_PREDS:
193            return is_r500 ? 1 : 0;
194        case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
195        case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
196        case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
197        case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
198        case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
199        case PIPE_SHADER_CAP_SUBROUTINES:
200        case PIPE_SHADER_CAP_INTEGERS:
201            return 0;
202        case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
203           return r300screen->caps.num_tex_units;
204        }
205        break;
206    case PIPE_SHADER_VERTEX:
207        switch (param)
208        {
209        case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
210            return 0;
211        default:;
212        }
213
214        if (!r300screen->caps.has_tcl) {
215            return draw_get_shader_param(shader, param);
216        }
217
218        switch (param)
219        {
220        case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
221        case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
222            return is_r500 ? 1024 : 256;
223        case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
224        case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
225            return 0;
226        case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
227            return is_r500 ? 4 : 0; /* For loops; not sure about conditionals. */
228        case PIPE_SHADER_CAP_MAX_INPUTS:
229            return 16;
230        case PIPE_SHADER_CAP_MAX_CONSTS:
231            return 256;
232        case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
233            return 1;
234        case PIPE_SHADER_CAP_MAX_TEMPS:
235            return 32;
236        case PIPE_SHADER_CAP_MAX_ADDRS:
237            return 1; /* XXX guessed */
238        case PIPE_SHADER_CAP_MAX_PREDS:
239            return is_r500 ? 4 : 0; /* XXX guessed. */
240        case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
241            return 1;
242        case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
243        case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
244        case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
245        case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
246        case PIPE_SHADER_CAP_SUBROUTINES:
247        case PIPE_SHADER_CAP_INTEGERS:
248            return 0;
249        }
250        break;
251    }
252    return 0;
253}
254
255static float r300_get_paramf(struct pipe_screen* pscreen,
256                             enum pipe_capf param)
257{
258    struct r300_screen* r300screen = r300_screen(pscreen);
259
260    switch (param) {
261        case PIPE_CAPF_MAX_LINE_WIDTH:
262        case PIPE_CAPF_MAX_LINE_WIDTH_AA:
263        case PIPE_CAPF_MAX_POINT_WIDTH:
264        case PIPE_CAPF_MAX_POINT_WIDTH_AA:
265            /* The maximum dimensions of the colorbuffer are our practical
266             * rendering limits. 2048 pixels should be enough for anybody. */
267            if (r300screen->caps.is_r500) {
268                return 4096.0f;
269            } else if (r300screen->caps.is_r400) {
270                return 4021.0f;
271            } else {
272                return 2560.0f;
273            }
274        case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
275            return 16.0f;
276        case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
277            return 16.0f;
278        case PIPE_CAPF_GUARD_BAND_LEFT:
279        case PIPE_CAPF_GUARD_BAND_TOP:
280        case PIPE_CAPF_GUARD_BAND_RIGHT:
281        case PIPE_CAPF_GUARD_BAND_BOTTOM:
282            /* XXX I don't know what these should be but the least we can do is
283             * silence the potential error message */
284            return 0.0f;
285        default:
286            debug_printf("r300: Warning: Unknown CAP %d in get_paramf.\n",
287                         param);
288            return 0.0f;
289    }
290}
291
292static int r300_get_video_param(struct pipe_screen *screen,
293				enum pipe_video_profile profile,
294				enum pipe_video_cap param)
295{
296   switch (param) {
297      case PIPE_VIDEO_CAP_SUPPORTED:
298         return vl_profile_supported(screen, profile);
299      case PIPE_VIDEO_CAP_NPOT_TEXTURES:
300         return 0;
301      case PIPE_VIDEO_CAP_MAX_WIDTH:
302      case PIPE_VIDEO_CAP_MAX_HEIGHT:
303         return vl_video_buffer_max_size(screen);
304      case PIPE_VIDEO_CAP_NUM_BUFFERS_DESIRED:
305         return vl_num_buffers_desired(screen, profile);
306      default:
307         return 0;
308   }
309}
310
311static boolean r300_is_format_supported(struct pipe_screen* screen,
312                                        enum pipe_format format,
313                                        enum pipe_texture_target target,
314                                        unsigned sample_count,
315                                        unsigned usage)
316{
317    uint32_t retval = 0;
318    boolean drm_2_8_0 = r300_screen(screen)->info.drm_minor >= 8;
319    boolean is_r500 = r300_screen(screen)->caps.is_r500;
320    boolean is_r400 = r300_screen(screen)->caps.is_r400;
321    boolean is_color2101010 = format == PIPE_FORMAT_R10G10B10A2_UNORM ||
322                              format == PIPE_FORMAT_R10G10B10X2_SNORM ||
323                              format == PIPE_FORMAT_B10G10R10A2_UNORM ||
324                              format == PIPE_FORMAT_R10SG10SB10SA2U_NORM;
325    boolean is_ati1n = format == PIPE_FORMAT_RGTC1_UNORM ||
326                       format == PIPE_FORMAT_RGTC1_SNORM ||
327                       format == PIPE_FORMAT_LATC1_UNORM ||
328                       format == PIPE_FORMAT_LATC1_SNORM;
329    boolean is_ati2n = format == PIPE_FORMAT_RGTC2_UNORM ||
330                       format == PIPE_FORMAT_RGTC2_SNORM ||
331                       format == PIPE_FORMAT_LATC2_UNORM ||
332                       format == PIPE_FORMAT_LATC2_SNORM;
333    boolean is_x16f_xy16f = format == PIPE_FORMAT_R16_FLOAT ||
334                            format == PIPE_FORMAT_R16G16_FLOAT ||
335                            format == PIPE_FORMAT_A16_FLOAT ||
336                            format == PIPE_FORMAT_L16_FLOAT ||
337                            format == PIPE_FORMAT_L16A16_FLOAT ||
338                            format == PIPE_FORMAT_I16_FLOAT;
339    boolean is_half_float = format == PIPE_FORMAT_R16_FLOAT ||
340                            format == PIPE_FORMAT_R16G16_FLOAT ||
341                            format == PIPE_FORMAT_R16G16B16_FLOAT ||
342                            format == PIPE_FORMAT_R16G16B16A16_FLOAT;
343    boolean is_fixed = format == PIPE_FORMAT_R32_FIXED ||
344                       format == PIPE_FORMAT_R32G32_FIXED ||
345                       format == PIPE_FORMAT_R32G32B32_FIXED ||
346                       format == PIPE_FORMAT_R32G32B32A32_FIXED;
347
348    if (!util_format_is_supported(format, usage))
349       return FALSE;
350
351    /* Check multisampling support. */
352    switch (sample_count) {
353        case 0:
354        case 1:
355            break;
356        case 2:
357        case 3:
358        case 4:
359        case 6:
360            return FALSE;
361#if 0
362            if (usage != PIPE_BIND_RENDER_TARGET ||
363                !util_format_is_rgba8_variant(
364                    util_format_description(format))) {
365                return FALSE;
366            }
367#endif
368            break;
369        default:
370            return FALSE;
371    }
372
373    /* Check sampler format support. */
374    if ((usage & PIPE_BIND_SAMPLER_VIEW) &&
375        /* ATI1N is r5xx-only. */
376        (is_r500 || !is_ati1n) &&
377        /* ATI2N is supported on r4xx-r5xx. */
378        (is_r400 || is_r500 || !is_ati2n) &&
379        /* R16F and RG16F texture support was added in as late as DRM 2.8.0 */
380        (drm_2_8_0 || !is_x16f_xy16f) &&
381        r300_is_sampler_format_supported(format)) {
382        retval |= PIPE_BIND_SAMPLER_VIEW;
383    }
384
385    /* Check colorbuffer format support. */
386    if ((usage & (PIPE_BIND_RENDER_TARGET |
387                  PIPE_BIND_DISPLAY_TARGET |
388                  PIPE_BIND_SCANOUT |
389                  PIPE_BIND_SHARED)) &&
390        /* 2101010 cannot be rendered to on non-r5xx. */
391        (!is_color2101010 || (is_r500 && drm_2_8_0)) &&
392        r300_is_colorbuffer_format_supported(format)) {
393        retval |= usage &
394            (PIPE_BIND_RENDER_TARGET |
395             PIPE_BIND_DISPLAY_TARGET |
396             PIPE_BIND_SCANOUT |
397             PIPE_BIND_SHARED);
398    }
399
400    /* Check depth-stencil format support. */
401    if (usage & PIPE_BIND_DEPTH_STENCIL &&
402        r300_is_zs_format_supported(format)) {
403        retval |= PIPE_BIND_DEPTH_STENCIL;
404    }
405
406    /* Check vertex buffer format support. */
407    if (usage & PIPE_BIND_VERTEX_BUFFER &&
408        /* Half float is supported on >= R400. */
409        (is_r400 || is_r500 || !is_half_float) &&
410        /* We have a fallback for FIXED. */
411        (is_fixed || r300_translate_vertex_data_type(format) != R300_INVALID_FORMAT)) {
412        retval |= PIPE_BIND_VERTEX_BUFFER;
413    }
414
415    /* Transfers are always supported. */
416    if (usage & PIPE_BIND_TRANSFER_READ)
417        retval |= PIPE_BIND_TRANSFER_READ;
418    if (usage & PIPE_BIND_TRANSFER_WRITE)
419        retval |= PIPE_BIND_TRANSFER_WRITE;
420
421    return retval == usage;
422}
423
424static void r300_destroy_screen(struct pipe_screen* pscreen)
425{
426    struct r300_screen* r300screen = r300_screen(pscreen);
427    struct radeon_winsys *rws = radeon_winsys(pscreen);
428
429    util_slab_destroy(&r300screen->pool_buffers);
430    pipe_mutex_destroy(r300screen->num_contexts_mutex);
431
432    if (rws)
433      rws->destroy(rws);
434
435    FREE(r300screen);
436}
437
/* Make *ptr refer to `fence`.
 *
 * Fence handles are treated as pb_buffer objects here, so the update is
 * handed to pb_reference() after casting both arguments. */
static void r300_fence_reference(struct pipe_screen *screen,
                                 struct pipe_fence_handle **ptr,
                                 struct pipe_fence_handle *fence)
{
    struct pb_buffer **dst = (struct pb_buffer**)ptr;
    struct pb_buffer *src = (struct pb_buffer*)fence;

    pb_reference(dst, src);
}
445
446static boolean r300_fence_signalled(struct pipe_screen *screen,
447                                    struct pipe_fence_handle *fence)
448{
449    struct radeon_winsys *rws = r300_screen(screen)->rws;
450    struct pb_buffer *rfence = (struct pb_buffer*)fence;
451
452    return !rws->buffer_is_busy(rfence, RADEON_USAGE_READWRITE);
453}
454
455static boolean r300_fence_finish(struct pipe_screen *screen,
456                                 struct pipe_fence_handle *fence,
457                                 uint64_t timeout)
458{
459    struct radeon_winsys *rws = r300_screen(screen)->rws;
460    struct pb_buffer *rfence = (struct pb_buffer*)fence;
461
462    if (timeout != PIPE_TIMEOUT_INFINITE) {
463        int64_t start_time = os_time_get();
464
465        /* Convert to microseconds. */
466        timeout /= 1000;
467
468        /* Wait in a loop. */
469        while (rws->buffer_is_busy(rfence, RADEON_USAGE_READWRITE)) {
470            if (os_time_get() - start_time >= timeout) {
471                return FALSE;
472            }
473            os_time_sleep(10);
474        }
475        return TRUE;
476    }
477
478    rws->buffer_wait(rfence, RADEON_USAGE_READWRITE);
479    return TRUE;
480}
481
482struct pipe_screen* r300_screen_create(struct radeon_winsys *rws)
483{
484    struct r300_screen *r300screen = CALLOC_STRUCT(r300_screen);
485
486    if (!r300screen) {
487        FREE(r300screen);
488        return NULL;
489    }
490
491    rws->query_info(rws, &r300screen->info);
492
493    r300_init_debug(r300screen);
494    r300_parse_chipset(r300screen->info.pci_id, &r300screen->caps);
495
496    if (SCREEN_DBG_ON(r300screen, DBG_NO_ZMASK))
497        r300screen->caps.zmask_ram = 0;
498    if (SCREEN_DBG_ON(r300screen, DBG_NO_HIZ))
499        r300screen->caps.hiz_ram = 0;
500
501    if (r300screen->info.drm_minor < 8)
502        r300screen->caps.has_us_format = FALSE;
503
504    pipe_mutex_init(r300screen->num_contexts_mutex);
505
506    util_slab_create(&r300screen->pool_buffers,
507                     sizeof(struct r300_resource), 64,
508                     UTIL_SLAB_SINGLETHREADED);
509
510    r300screen->rws = rws;
511    r300screen->screen.winsys = (struct pipe_winsys*)rws;
512    r300screen->screen.destroy = r300_destroy_screen;
513    r300screen->screen.get_name = r300_get_name;
514    r300screen->screen.get_vendor = r300_get_vendor;
515    r300screen->screen.get_param = r300_get_param;
516    r300screen->screen.get_shader_param = r300_get_shader_param;
517    r300screen->screen.get_paramf = r300_get_paramf;
518    r300screen->screen.get_video_param = r300_get_video_param;
519    r300screen->screen.is_format_supported = r300_is_format_supported;
520    r300screen->screen.is_video_format_supported = vl_video_buffer_is_format_supported;
521    r300screen->screen.context_create = r300_create_context;
522    r300screen->screen.fence_reference = r300_fence_reference;
523    r300screen->screen.fence_signalled = r300_fence_signalled;
524    r300screen->screen.fence_finish = r300_fence_finish;
525
526    r300_init_screen_resource_functions(r300screen);
527
528    util_format_s3tc_init();
529
530    return &r300screen->screen;
531}
532