r300_screen.c revision dc4c821f0817a3db716f965692fb701079f66340
1/*
2 * Copyright 2008 Corbin Simpson <MostAwesomeDude@gmail.com>
3 * Copyright 2010 Marek Olšák <maraeo@gmail.com>
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * on the rights to use, copy, modify, merge, publish, distribute, sub
9 * license, and/or sell copies of the Software, and to permit persons to whom
10 * the Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
20 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
21 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
22 * USE OR OTHER DEALINGS IN THE SOFTWARE. */
23
24#include "util/u_format.h"
25#include "util/u_format_s3tc.h"
26#include "util/u_memory.h"
27#include "os/os_time.h"
28#include "vl/vl_decoder.h"
29#include "vl/vl_video_buffer.h"
30
31#include "r300_context.h"
32#include "r300_texture.h"
33#include "r300_screen_buffer.h"
34#include "r300_state_inlines.h"
35#include "r300_public.h"
36
37#include "draw/draw_context.h"
38
39/* Return the identifier behind whom the brave coders responsible for this
40 * amalgamation of code, sweat, and duct tape, routinely obscure their names.
41 *
42 * ...I should have just put "Corbin Simpson", but I'm not that cool.
43 *
44 * (Or egotistical. Yet.) */
static const char* r300_get_vendor(struct pipe_screen* pscreen)
{
    /* The vendor string does not depend on the screen it is queried on. */
    static const char vendor[] = "X.Org R300 Project";

    return vendor;
}
49
/* Human-readable chip names, looked up by r300_get_name() using the
 * screen's caps.family value as the index.
 *
 * NOTE(review): the entry order presumably has to match the enum that
 * defines caps.family -- confirm before inserting or reordering entries.
 *
 * The table is never modified, so both the strings and the pointers to
 * them are const. */
static const char* const chip_families[] = {
    "ATI R300",
    "ATI R350",
    "ATI RV350",
    "ATI RV370",
    "ATI RV380",
    "ATI RS400",
    "ATI RC410",
    "ATI RS480",
    "ATI R420",
    "ATI R423",
    "ATI R430",
    "ATI R480",
    "ATI R481",
    "ATI RV410",
    "ATI RS600",
    "ATI RS690",
    "ATI RS740",
    "ATI RV515",
    "ATI R520",
    "ATI RV530",
    "ATI R580",
    "ATI RV560",
    "ATI RV570"
};
75
76static const char* r300_get_name(struct pipe_screen* pscreen)
77{
78    struct r300_screen* r300screen = r300_screen(pscreen);
79
80    return chip_families[r300screen->caps.family];
81}
82
83static int r300_get_param(struct pipe_screen* pscreen, enum pipe_cap param)
84{
85    struct r300_screen* r300screen = r300_screen(pscreen);
86    boolean is_r500 = r300screen->caps.is_r500;
87
88    switch (param) {
89        /* Supported features (boolean caps). */
90        case PIPE_CAP_NPOT_TEXTURES:
91        case PIPE_CAP_TWO_SIDED_STENCIL:
92        case PIPE_CAP_ANISOTROPIC_FILTER:
93        case PIPE_CAP_POINT_SPRITE:
94        case PIPE_CAP_OCCLUSION_QUERY:
95        case PIPE_CAP_TEXTURE_SHADOW_MAP:
96        case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
97        case PIPE_CAP_BLEND_EQUATION_SEPARATE:
98        case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
99        case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
100        case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
101        case PIPE_CAP_CONDITIONAL_RENDER:
102        case PIPE_CAP_TEXTURE_BARRIER:
103        case PIPE_CAP_TGSI_CAN_COMPACT_VARYINGS:
104        case PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS:
105            return 1;
106
107        /* r300 cannot do swizzling of compressed textures. Supported otherwise. */
108        case PIPE_CAP_TEXTURE_SWIZZLE:
109            return util_format_s3tc_enabled ? r300screen->caps.dxtc_swizzle : 1;
110
111        /* Supported on r500 only. */
112        case PIPE_CAP_FRAGMENT_COLOR_CLAMP_CONTROL:
113        case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
114        case PIPE_CAP_SM3:
115            return is_r500 ? 1 : 0;
116
117        /* Unsupported features. */
118        case PIPE_CAP_TIMER_QUERY:
119        case PIPE_CAP_DUAL_SOURCE_BLEND:
120        case PIPE_CAP_INDEP_BLEND_ENABLE:
121        case PIPE_CAP_INDEP_BLEND_FUNC:
122        case PIPE_CAP_DEPTH_CLIP_DISABLE:
123        case PIPE_CAP_DEPTHSTENCIL_CLEAR_SEPARATE:
124        case PIPE_CAP_SHADER_STENCIL_EXPORT:
125        case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
126        case PIPE_CAP_TGSI_INSTANCEID:
127        case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
128        case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
129        case PIPE_CAP_SEAMLESS_CUBE_MAP:
130        case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
131        case PIPE_CAP_SCALED_RESOLVE:
132        case PIPE_CAP_MIN_TEXEL_OFFSET:
133        case PIPE_CAP_MAX_TEXEL_OFFSET:
134        case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
135        case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:
136        case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:
137        case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
138            return 0;
139
140        /* SWTCL-only features. */
141        case PIPE_CAP_PRIMITIVE_RESTART:
142            return !r300screen->caps.has_tcl;
143
144        /* Texturing. */
145        case PIPE_CAP_MAX_COMBINED_SAMPLERS:
146            return r300screen->caps.num_tex_units;
147        case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
148        case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
149        case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
150            /* 13 == 4096, 12 == 2048 */
151            return is_r500 ? 13 : 12;
152
153        /* Render targets. */
154        case PIPE_CAP_MAX_RENDER_TARGETS:
155            return 4;
156    }
157    return 0;
158}
159
160static int r300_get_shader_param(struct pipe_screen *pscreen, unsigned shader, enum pipe_shader_cap param)
161{
162   struct r300_screen* r300screen = r300_screen(pscreen);
163   boolean is_r400 = r300screen->caps.is_r400;
164   boolean is_r500 = r300screen->caps.is_r500;
165
166   switch (shader) {
167    case PIPE_SHADER_FRAGMENT:
168        switch (param)
169        {
170        case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
171            return is_r500 || is_r400 ? 512 : 96;
172        case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
173            return is_r500 || is_r400 ? 512 : 64;
174        case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
175            return is_r500 || is_r400 ? 512 : 32;
176        case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
177            return is_r500 ? 511 : 4;
178        case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
179            return is_r500 ? 64 : 0; /* Actually unlimited on r500. */
180            /* Fragment shader limits. */
181        case PIPE_SHADER_CAP_MAX_INPUTS:
182            /* 2 colors + 8 texcoords are always supported
183             * (minus fog and wpos).
184             *
185             * R500 has the ability to turn 3rd and 4th color into
186             * additional texcoords but there is no two-sided color
187             * selection then. However the facing bit can be used instead. */
188            return 10;
189        case PIPE_SHADER_CAP_MAX_CONSTS:
190            return is_r500 ? 256 : 32;
191        case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
192            return 1;
193        case PIPE_SHADER_CAP_MAX_TEMPS:
194            return is_r500 ? 128 : is_r400 ? 64 : 32;
195        case PIPE_SHADER_CAP_MAX_PREDS:
196            return is_r500 ? 1 : 0;
197        case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
198           return r300screen->caps.num_tex_units;
199        case PIPE_SHADER_CAP_MAX_ADDRS:
200        case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
201        case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
202        case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
203        case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
204        case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
205        case PIPE_SHADER_CAP_SUBROUTINES:
206        case PIPE_SHADER_CAP_INTEGERS:
207        case PIPE_SHADER_CAP_OUTPUT_READ:
208            return 0;
209        }
210        break;
211    case PIPE_SHADER_VERTEX:
212        switch (param)
213        {
214        case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
215            return 0;
216        default:;
217        }
218
219        if (!r300screen->caps.has_tcl) {
220            return draw_get_shader_param(shader, param);
221        }
222
223        switch (param)
224        {
225        case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
226        case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
227            return is_r500 ? 1024 : 256;
228        case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
229            return is_r500 ? 4 : 0; /* For loops; not sure about conditionals. */
230        case PIPE_SHADER_CAP_MAX_INPUTS:
231            return 16;
232        case PIPE_SHADER_CAP_MAX_CONSTS:
233            return 256;
234        case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
235            return 1;
236        case PIPE_SHADER_CAP_MAX_TEMPS:
237            return 32;
238        case PIPE_SHADER_CAP_MAX_ADDRS:
239            return 1; /* XXX guessed */
240        case PIPE_SHADER_CAP_MAX_PREDS:
241            return is_r500 ? 4 : 0; /* XXX guessed. */
242        case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
243            return 1;
244        case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
245        case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
246        case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
247        case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
248        case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
249        case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
250        case PIPE_SHADER_CAP_SUBROUTINES:
251        case PIPE_SHADER_CAP_INTEGERS:
252        case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
253        case PIPE_SHADER_CAP_OUTPUT_READ:
254            return 0;
255        }
256        break;
257    }
258    return 0;
259}
260
261static float r300_get_paramf(struct pipe_screen* pscreen,
262                             enum pipe_capf param)
263{
264    struct r300_screen* r300screen = r300_screen(pscreen);
265
266    switch (param) {
267        case PIPE_CAPF_MAX_LINE_WIDTH:
268        case PIPE_CAPF_MAX_LINE_WIDTH_AA:
269        case PIPE_CAPF_MAX_POINT_WIDTH:
270        case PIPE_CAPF_MAX_POINT_WIDTH_AA:
271            /* The maximum dimensions of the colorbuffer are our practical
272             * rendering limits. 2048 pixels should be enough for anybody. */
273            if (r300screen->caps.is_r500) {
274                return 4096.0f;
275            } else if (r300screen->caps.is_r400) {
276                return 4021.0f;
277            } else {
278                return 2560.0f;
279            }
280        case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
281            return 16.0f;
282        case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
283            return 16.0f;
284        case PIPE_CAPF_GUARD_BAND_LEFT:
285        case PIPE_CAPF_GUARD_BAND_TOP:
286        case PIPE_CAPF_GUARD_BAND_RIGHT:
287        case PIPE_CAPF_GUARD_BAND_BOTTOM:
288            /* XXX I don't know what these should be but the least we can do is
289             * silence the potential error message */
290            return 0.0f;
291        default:
292            debug_printf("r300: Warning: Unknown CAP %d in get_paramf.\n",
293                         param);
294            return 0.0f;
295    }
296}
297
298static int r300_get_video_param(struct pipe_screen *screen,
299				enum pipe_video_profile profile,
300				enum pipe_video_cap param)
301{
302   switch (param) {
303      case PIPE_VIDEO_CAP_SUPPORTED:
304         return vl_profile_supported(screen, profile);
305      case PIPE_VIDEO_CAP_NPOT_TEXTURES:
306         return 0;
307      case PIPE_VIDEO_CAP_MAX_WIDTH:
308      case PIPE_VIDEO_CAP_MAX_HEIGHT:
309         return vl_video_buffer_max_size(screen);
310      default:
311         return 0;
312   }
313}
314
315static boolean r300_is_format_supported(struct pipe_screen* screen,
316                                        enum pipe_format format,
317                                        enum pipe_texture_target target,
318                                        unsigned sample_count,
319                                        unsigned usage)
320{
321    uint32_t retval = 0;
322    boolean drm_2_8_0 = r300_screen(screen)->info.drm_minor >= 8;
323    boolean is_r500 = r300_screen(screen)->caps.is_r500;
324    boolean is_r400 = r300_screen(screen)->caps.is_r400;
325    boolean is_color2101010 = format == PIPE_FORMAT_R10G10B10A2_UNORM ||
326                              format == PIPE_FORMAT_R10G10B10X2_SNORM ||
327                              format == PIPE_FORMAT_B10G10R10A2_UNORM ||
328                              format == PIPE_FORMAT_R10SG10SB10SA2U_NORM;
329    boolean is_ati1n = format == PIPE_FORMAT_RGTC1_UNORM ||
330                       format == PIPE_FORMAT_RGTC1_SNORM ||
331                       format == PIPE_FORMAT_LATC1_UNORM ||
332                       format == PIPE_FORMAT_LATC1_SNORM;
333    boolean is_ati2n = format == PIPE_FORMAT_RGTC2_UNORM ||
334                       format == PIPE_FORMAT_RGTC2_SNORM ||
335                       format == PIPE_FORMAT_LATC2_UNORM ||
336                       format == PIPE_FORMAT_LATC2_SNORM;
337    boolean is_x16f_xy16f = format == PIPE_FORMAT_R16_FLOAT ||
338                            format == PIPE_FORMAT_R16G16_FLOAT ||
339                            format == PIPE_FORMAT_A16_FLOAT ||
340                            format == PIPE_FORMAT_L16_FLOAT ||
341                            format == PIPE_FORMAT_L16A16_FLOAT ||
342                            format == PIPE_FORMAT_I16_FLOAT;
343    boolean is_half_float = format == PIPE_FORMAT_R16_FLOAT ||
344                            format == PIPE_FORMAT_R16G16_FLOAT ||
345                            format == PIPE_FORMAT_R16G16B16_FLOAT ||
346                            format == PIPE_FORMAT_R16G16B16A16_FLOAT;
347    boolean is_fixed = format == PIPE_FORMAT_R32_FIXED ||
348                       format == PIPE_FORMAT_R32G32_FIXED ||
349                       format == PIPE_FORMAT_R32G32B32_FIXED ||
350                       format == PIPE_FORMAT_R32G32B32A32_FIXED;
351
352    if (!util_format_is_supported(format, usage))
353       return FALSE;
354
355    /* Check multisampling support. */
356    switch (sample_count) {
357        case 0:
358        case 1:
359            break;
360        case 2:
361        case 3:
362        case 4:
363        case 6:
364            return FALSE;
365#if 0
366            if (usage != PIPE_BIND_RENDER_TARGET ||
367                !util_format_is_rgba8_variant(
368                    util_format_description(format))) {
369                return FALSE;
370            }
371#endif
372            break;
373        default:
374            return FALSE;
375    }
376
377    /* Check sampler format support. */
378    if ((usage & PIPE_BIND_SAMPLER_VIEW) &&
379        /* ATI1N is r5xx-only. */
380        (is_r500 || !is_ati1n) &&
381        /* ATI2N is supported on r4xx-r5xx. */
382        (is_r400 || is_r500 || !is_ati2n) &&
383        /* R16F and RG16F texture support was added in as late as DRM 2.8.0 */
384        (drm_2_8_0 || !is_x16f_xy16f) &&
385        r300_is_sampler_format_supported(format)) {
386        retval |= PIPE_BIND_SAMPLER_VIEW;
387    }
388
389    /* Check colorbuffer format support. */
390    if ((usage & (PIPE_BIND_RENDER_TARGET |
391                  PIPE_BIND_DISPLAY_TARGET |
392                  PIPE_BIND_SCANOUT |
393                  PIPE_BIND_SHARED)) &&
394        /* 2101010 cannot be rendered to on non-r5xx. */
395        (!is_color2101010 || (is_r500 && drm_2_8_0)) &&
396        r300_is_colorbuffer_format_supported(format)) {
397        retval |= usage &
398            (PIPE_BIND_RENDER_TARGET |
399             PIPE_BIND_DISPLAY_TARGET |
400             PIPE_BIND_SCANOUT |
401             PIPE_BIND_SHARED);
402    }
403
404    /* Check depth-stencil format support. */
405    if (usage & PIPE_BIND_DEPTH_STENCIL &&
406        r300_is_zs_format_supported(format)) {
407        retval |= PIPE_BIND_DEPTH_STENCIL;
408    }
409
410    /* Check vertex buffer format support. */
411    if (usage & PIPE_BIND_VERTEX_BUFFER &&
412        /* Half float is supported on >= R400. */
413        (is_r400 || is_r500 || !is_half_float) &&
414        /* We have a fallback for FIXED. */
415        (is_fixed || r300_translate_vertex_data_type(format) != R300_INVALID_FORMAT)) {
416        retval |= PIPE_BIND_VERTEX_BUFFER;
417    }
418
419    /* Transfers are always supported. */
420    if (usage & PIPE_BIND_TRANSFER_READ)
421        retval |= PIPE_BIND_TRANSFER_READ;
422    if (usage & PIPE_BIND_TRANSFER_WRITE)
423        retval |= PIPE_BIND_TRANSFER_WRITE;
424
425    return retval == usage;
426}
427
428static void r300_destroy_screen(struct pipe_screen* pscreen)
429{
430    struct r300_screen* r300screen = r300_screen(pscreen);
431    struct radeon_winsys *rws = radeon_winsys(pscreen);
432
433    util_slab_destroy(&r300screen->pool_buffers);
434    pipe_mutex_destroy(r300screen->num_contexts_mutex);
435
436    if (rws)
437      rws->destroy(rws);
438
439    FREE(r300screen);
440}
441
/* Points *ptr at `fence` through pb_reference(); fence handles are
 * treated as pb_buffer objects here. */
static void r300_fence_reference(struct pipe_screen *screen,
                                 struct pipe_fence_handle **ptr,
                                 struct pipe_fence_handle *fence)
{
    struct pb_buffer **dst = (struct pb_buffer**)ptr;
    struct pb_buffer *src = (struct pb_buffer*)fence;

    pb_reference(dst, src);
}
449
450static boolean r300_fence_signalled(struct pipe_screen *screen,
451                                    struct pipe_fence_handle *fence)
452{
453    struct radeon_winsys *rws = r300_screen(screen)->rws;
454    struct pb_buffer *rfence = (struct pb_buffer*)fence;
455
456    return !rws->buffer_is_busy(rfence, RADEON_USAGE_READWRITE);
457}
458
459static boolean r300_fence_finish(struct pipe_screen *screen,
460                                 struct pipe_fence_handle *fence,
461                                 uint64_t timeout)
462{
463    struct radeon_winsys *rws = r300_screen(screen)->rws;
464    struct pb_buffer *rfence = (struct pb_buffer*)fence;
465
466    if (timeout != PIPE_TIMEOUT_INFINITE) {
467        int64_t start_time = os_time_get();
468
469        /* Convert to microseconds. */
470        timeout /= 1000;
471
472        /* Wait in a loop. */
473        while (rws->buffer_is_busy(rfence, RADEON_USAGE_READWRITE)) {
474            if (os_time_get() - start_time >= timeout) {
475                return FALSE;
476            }
477            os_time_sleep(10);
478        }
479        return TRUE;
480    }
481
482    rws->buffer_wait(rfence, RADEON_USAGE_READWRITE);
483    return TRUE;
484}
485
486struct pipe_screen* r300_screen_create(struct radeon_winsys *rws)
487{
488    struct r300_screen *r300screen = CALLOC_STRUCT(r300_screen);
489
490    if (!r300screen) {
491        FREE(r300screen);
492        return NULL;
493    }
494
495    rws->query_info(rws, &r300screen->info);
496
497    r300_init_debug(r300screen);
498    r300_parse_chipset(r300screen->info.pci_id, &r300screen->caps);
499
500    if (SCREEN_DBG_ON(r300screen, DBG_NO_ZMASK))
501        r300screen->caps.zmask_ram = 0;
502    if (SCREEN_DBG_ON(r300screen, DBG_NO_HIZ))
503        r300screen->caps.hiz_ram = 0;
504
505    if (r300screen->info.drm_minor < 8)
506        r300screen->caps.has_us_format = FALSE;
507
508    pipe_mutex_init(r300screen->num_contexts_mutex);
509
510    util_slab_create(&r300screen->pool_buffers,
511                     sizeof(struct r300_resource), 64,
512                     UTIL_SLAB_SINGLETHREADED);
513
514    r300screen->rws = rws;
515    r300screen->screen.winsys = (struct pipe_winsys*)rws;
516    r300screen->screen.destroy = r300_destroy_screen;
517    r300screen->screen.get_name = r300_get_name;
518    r300screen->screen.get_vendor = r300_get_vendor;
519    r300screen->screen.get_param = r300_get_param;
520    r300screen->screen.get_shader_param = r300_get_shader_param;
521    r300screen->screen.get_paramf = r300_get_paramf;
522    r300screen->screen.get_video_param = r300_get_video_param;
523    r300screen->screen.is_format_supported = r300_is_format_supported;
524    r300screen->screen.is_video_format_supported = vl_video_buffer_is_format_supported;
525    r300screen->screen.context_create = r300_create_context;
526    r300screen->screen.fence_reference = r300_fence_reference;
527    r300screen->screen.fence_signalled = r300_fence_signalled;
528    r300screen->screen.fence_finish = r300_fence_finish;
529
530    r300_init_screen_resource_functions(r300screen);
531
532    util_format_s3tc_init();
533
534    return &r300screen->screen;
535}
536