r300_screen.c revision ae272a92a17510493392d7d7dd4937786af415ec
1/*
2 * Copyright 2008 Corbin Simpson <MostAwesomeDude@gmail.com>
3 * Copyright 2010 Marek Olšák <maraeo@gmail.com>
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * on the rights to use, copy, modify, merge, publish, distribute, sub
9 * license, and/or sell copies of the Software, and to permit persons to whom
10 * the Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
20 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
21 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
22 * USE OR OTHER DEALINGS IN THE SOFTWARE. */
23
24#include "util/u_format.h"
25#include "util/u_format_s3tc.h"
26#include "util/u_memory.h"
27#include "os/os_time.h"
28#include "vl/vl_decoder.h"
29#include "vl/vl_video_buffer.h"
30
31#include "r300_context.h"
32#include "r300_texture.h"
33#include "r300_screen_buffer.h"
34#include "r300_state_inlines.h"
35#include "r300_public.h"
36
37#include "draw/draw_context.h"
38
/* Report the vendor string of this driver.
 *
 * The screen argument is not consulted: every r300 screen answers with the
 * same project name instead of naming an individual author. */
static const char* r300_get_vendor(struct pipe_screen* pscreen)
{
    static const char vendor[] = "X.Org R300 Project";

    (void)pscreen;
    return vendor;
}
49
/* Human-readable chip names, looked up by r300_get_name() with the family
 * value stored in the screen caps. The position of each entry is therefore
 * significant: entries must not be reordered, inserted or removed without
 * keeping the family numbering in step. */
static const char* chip_families[] = {
    "ATI R300",  "ATI R350",  "ATI RV350", "ATI RV370", "ATI RV380",
    "ATI RS400", "ATI RC410", "ATI RS480",
    "ATI R420",  "ATI R423",  "ATI R430",  "ATI R480",  "ATI R481",
    "ATI RV410",
    "ATI RS600", "ATI RS690", "ATI RS740",
    "ATI RV515", "ATI R520",  "ATI RV530", "ATI R580",  "ATI RV560",
    "ATI RV570"
};
75
76static const char* r300_get_name(struct pipe_screen* pscreen)
77{
78    struct r300_screen* r300screen = r300_screen(pscreen);
79
80    return chip_families[r300screen->caps.family];
81}
82
83static int r300_get_param(struct pipe_screen* pscreen, enum pipe_cap param)
84{
85    struct r300_screen* r300screen = r300_screen(pscreen);
86    boolean is_r500 = r300screen->caps.is_r500;
87
88    switch (param) {
89        /* Supported features (boolean caps). */
90        case PIPE_CAP_NPOT_TEXTURES:
91        case PIPE_CAP_TWO_SIDED_STENCIL:
92        case PIPE_CAP_GLSL:
93            /* I'll be frank. This is a lie.
94             *
95             * We don't truly support GLSL on any of this driver's chipsets.
96             * To be fair, no chipset supports the full GLSL specification
97             * to the best of our knowledge, but some of the less esoteric
98             * features are still missing here.
99             *
100             * Rather than cripple ourselves intentionally, I'm going to set
101             * this flag, and as Gallium's interface continues to change, I
102             * hope that this single monolithic GLSL enable can slowly get
103             * split down into many different pieces and the state tracker
104             * will handle fallbacks transparently, like it should.
105             *
106             * ~ C.
107             */
108        case PIPE_CAP_ANISOTROPIC_FILTER:
109        case PIPE_CAP_POINT_SPRITE:
110        case PIPE_CAP_OCCLUSION_QUERY:
111        case PIPE_CAP_TEXTURE_SHADOW_MAP:
112        case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
113        case PIPE_CAP_BLEND_EQUATION_SEPARATE:
114        case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
115        case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
116        case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
117        case PIPE_CAP_CONDITIONAL_RENDER:
118        case PIPE_CAP_TEXTURE_BARRIER:
119            return 1;
120
121        /* r300 cannot do swizzling of compressed textures. Supported otherwise. */
122        case PIPE_CAP_TEXTURE_SWIZZLE:
123            return util_format_s3tc_enabled ? r300screen->caps.dxtc_swizzle : 1;
124
125        /* Supported on r500 only. */
126        case PIPE_CAP_FRAGMENT_COLOR_CLAMP_CONTROL:
127        case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
128        case PIPE_CAP_SM3:
129            return is_r500 ? 1 : 0;
130
131        /* Unsupported features. */
132        case PIPE_CAP_TIMER_QUERY:
133        case PIPE_CAP_DUAL_SOURCE_BLEND:
134        case PIPE_CAP_INDEP_BLEND_ENABLE:
135        case PIPE_CAP_INDEP_BLEND_FUNC:
136        case PIPE_CAP_DEPTH_CLAMP:
137        case PIPE_CAP_DEPTHSTENCIL_CLEAR_SEPARATE:
138        case PIPE_CAP_SHADER_STENCIL_EXPORT:
139        case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
140        case PIPE_CAP_TGSI_INSTANCEID:
141        case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
142        case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
143        case PIPE_CAP_SEAMLESS_CUBE_MAP:
144        case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
145        case PIPE_CAP_SCALED_RESOLVE:
146        case PIPE_CAP_MIN_TEXEL_OFFSET:
147        case PIPE_CAP_MAX_TEXEL_OFFSET:
148        case PIPE_CAP_STREAM_OUTPUT:
149            return 0;
150
151        /* SWTCL-only features. */
152        case PIPE_CAP_PRIMITIVE_RESTART:
153            return !r300screen->caps.has_tcl;
154
155        /* Texturing. */
156        case PIPE_CAP_MAX_COMBINED_SAMPLERS:
157            return r300screen->caps.num_tex_units;
158        case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
159        case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
160        case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
161            /* 13 == 4096, 12 == 2048 */
162            return is_r500 ? 13 : 12;
163
164        /* Render targets. */
165        case PIPE_CAP_MAX_RENDER_TARGETS:
166            return 4;
167
168        default:
169            debug_printf("r300: Warning: Unknown CAP %d in get_param.\n",
170                         param);
171            return 0;
172    }
173}
174
175static int r300_get_shader_param(struct pipe_screen *pscreen, unsigned shader, enum pipe_shader_cap param)
176{
177   struct r300_screen* r300screen = r300_screen(pscreen);
178   boolean is_r400 = r300screen->caps.is_r400;
179   boolean is_r500 = r300screen->caps.is_r500;
180
181   switch (shader)
182    {
183    case PIPE_SHADER_FRAGMENT:
184        switch (param)
185        {
186        case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
187            return is_r500 || is_r400 ? 512 : 96;
188        case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
189            return is_r500 || is_r400 ? 512 : 64;
190        case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
191            return is_r500 || is_r400 ? 512 : 32;
192        case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
193            return is_r500 ? 511 : 4;
194        case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
195            return is_r500 ? 64 : 0; /* Actually unlimited on r500. */
196            /* Fragment shader limits. */
197        case PIPE_SHADER_CAP_MAX_INPUTS:
198            /* 2 colors + 8 texcoords are always supported
199             * (minus fog and wpos).
200             *
201             * R500 has the ability to turn 3rd and 4th color into
202             * additional texcoords but there is no two-sided color
203             * selection then. However the facing bit can be used instead. */
204            return 10;
205        case PIPE_SHADER_CAP_MAX_CONSTS:
206            return is_r500 ? 256 : 32;
207        case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
208            return 1;
209        case PIPE_SHADER_CAP_MAX_TEMPS:
210            return is_r500 ? 128 : is_r400 ? 64 : 32;
211        case PIPE_SHADER_CAP_MAX_ADDRS:
212            return 0;
213        case PIPE_SHADER_CAP_MAX_PREDS:
214            return is_r500 ? 1 : 0;
215        case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
216        case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
217        case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
218        case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
219        case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
220        case PIPE_SHADER_CAP_SUBROUTINES:
221        case PIPE_SHADER_CAP_INTEGERS:
222            return 0;
223        case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
224           return r300screen->caps.num_tex_units;
225        }
226        break;
227    case PIPE_SHADER_VERTEX:
228        switch (param)
229        {
230        case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
231            return 0;
232        default:;
233        }
234
235        if (!r300screen->caps.has_tcl) {
236            return draw_get_shader_param(shader, param);
237        }
238
239        switch (param)
240        {
241        case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
242        case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
243            return is_r500 ? 1024 : 256;
244        case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
245        case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
246            return 0;
247        case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
248            return is_r500 ? 4 : 0; /* For loops; not sure about conditionals. */
249        case PIPE_SHADER_CAP_MAX_INPUTS:
250            return 16;
251        case PIPE_SHADER_CAP_MAX_CONSTS:
252            return 256;
253        case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
254            return 1;
255        case PIPE_SHADER_CAP_MAX_TEMPS:
256            return 32;
257        case PIPE_SHADER_CAP_MAX_ADDRS:
258            return 1; /* XXX guessed */
259        case PIPE_SHADER_CAP_MAX_PREDS:
260            return is_r500 ? 4 : 0; /* XXX guessed. */
261        case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
262            return 1;
263        case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
264        case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
265        case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
266        case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
267        case PIPE_SHADER_CAP_SUBROUTINES:
268        case PIPE_SHADER_CAP_INTEGERS:
269            return 0;
270        default:;
271        }
272        break;
273    }
274    return 0;
275}
276
277static float r300_get_paramf(struct pipe_screen* pscreen, enum pipe_cap param)
278{
279    struct r300_screen* r300screen = r300_screen(pscreen);
280
281    switch (param) {
282        case PIPE_CAP_MAX_LINE_WIDTH:
283        case PIPE_CAP_MAX_LINE_WIDTH_AA:
284        case PIPE_CAP_MAX_POINT_WIDTH:
285        case PIPE_CAP_MAX_POINT_WIDTH_AA:
286            /* The maximum dimensions of the colorbuffer are our practical
287             * rendering limits. 2048 pixels should be enough for anybody. */
288            if (r300screen->caps.is_r500) {
289                return 4096.0f;
290            } else if (r300screen->caps.is_r400) {
291                return 4021.0f;
292            } else {
293                return 2560.0f;
294            }
295        case PIPE_CAP_MAX_TEXTURE_ANISOTROPY:
296            return 16.0f;
297        case PIPE_CAP_MAX_TEXTURE_LOD_BIAS:
298            return 16.0f;
299        case PIPE_CAP_GUARD_BAND_LEFT:
300        case PIPE_CAP_GUARD_BAND_TOP:
301        case PIPE_CAP_GUARD_BAND_RIGHT:
302        case PIPE_CAP_GUARD_BAND_BOTTOM:
303            /* XXX I don't know what these should be but the least we can do is
304             * silence the potential error message */
305            return 0.0f;
306        default:
307            debug_printf("r300: Warning: Unknown CAP %d in get_paramf.\n",
308                         param);
309            return 0.0f;
310    }
311}
312
313static int r300_get_video_param(struct pipe_screen *screen,
314				enum pipe_video_profile profile,
315				enum pipe_video_cap param)
316{
317   switch (param) {
318      case PIPE_VIDEO_CAP_SUPPORTED:
319         return vl_profile_supported(screen, profile);
320      case PIPE_VIDEO_CAP_NPOT_TEXTURES:
321         return 0;
322      case PIPE_VIDEO_CAP_MAX_WIDTH:
323      case PIPE_VIDEO_CAP_MAX_HEIGHT:
324         return vl_video_buffer_max_size(screen);
325      case PIPE_VIDEO_CAP_NUM_BUFFERS_DESIRED:
326         return vl_num_buffers_desired(screen, profile);
327      default:
328         return 0;
329   }
330}
331
332static boolean r300_is_format_supported(struct pipe_screen* screen,
333                                        enum pipe_format format,
334                                        enum pipe_texture_target target,
335                                        unsigned sample_count,
336                                        unsigned usage)
337{
338    uint32_t retval = 0;
339    boolean drm_2_8_0 = r300_screen(screen)->info.drm_minor >= 8;
340    boolean is_r500 = r300_screen(screen)->caps.is_r500;
341    boolean is_r400 = r300_screen(screen)->caps.is_r400;
342    boolean is_color2101010 = format == PIPE_FORMAT_R10G10B10A2_UNORM ||
343                              format == PIPE_FORMAT_R10G10B10X2_SNORM ||
344                              format == PIPE_FORMAT_B10G10R10A2_UNORM ||
345                              format == PIPE_FORMAT_R10SG10SB10SA2U_NORM;
346    boolean is_ati1n = format == PIPE_FORMAT_RGTC1_UNORM ||
347                       format == PIPE_FORMAT_RGTC1_SNORM ||
348                       format == PIPE_FORMAT_LATC1_UNORM ||
349                       format == PIPE_FORMAT_LATC1_SNORM;
350    boolean is_ati2n = format == PIPE_FORMAT_RGTC2_UNORM ||
351                       format == PIPE_FORMAT_RGTC2_SNORM ||
352                       format == PIPE_FORMAT_LATC2_UNORM ||
353                       format == PIPE_FORMAT_LATC2_SNORM;
354    boolean is_x16f_xy16f = format == PIPE_FORMAT_R16_FLOAT ||
355                            format == PIPE_FORMAT_R16G16_FLOAT ||
356                            format == PIPE_FORMAT_A16_FLOAT ||
357                            format == PIPE_FORMAT_L16_FLOAT ||
358                            format == PIPE_FORMAT_L16A16_FLOAT ||
359                            format == PIPE_FORMAT_I16_FLOAT;
360    boolean is_half_float = format == PIPE_FORMAT_R16_FLOAT ||
361                            format == PIPE_FORMAT_R16G16_FLOAT ||
362                            format == PIPE_FORMAT_R16G16B16_FLOAT ||
363                            format == PIPE_FORMAT_R16G16B16A16_FLOAT;
364
365    if (!util_format_is_supported(format, usage))
366       return FALSE;
367
368    /* Check multisampling support. */
369    switch (sample_count) {
370        case 0:
371        case 1:
372            break;
373        case 2:
374        case 3:
375        case 4:
376        case 6:
377            return FALSE;
378#if 0
379            if (usage != PIPE_BIND_RENDER_TARGET ||
380                !util_format_is_rgba8_variant(
381                    util_format_description(format))) {
382                return FALSE;
383            }
384#endif
385            break;
386        default:
387            return FALSE;
388    }
389
390    /* Check sampler format support. */
391    if ((usage & PIPE_BIND_SAMPLER_VIEW) &&
392        /* ATI1N is r5xx-only. */
393        (is_r500 || !is_ati1n) &&
394        /* ATI2N is supported on r4xx-r5xx. */
395        (is_r400 || is_r500 || !is_ati2n) &&
396        /* R16F and RG16F texture support was added in as late as DRM 2.8.0 */
397        (drm_2_8_0 || !is_x16f_xy16f) &&
398        r300_is_sampler_format_supported(format)) {
399        retval |= PIPE_BIND_SAMPLER_VIEW;
400    }
401
402    /* Check colorbuffer format support. */
403    if ((usage & (PIPE_BIND_RENDER_TARGET |
404                  PIPE_BIND_DISPLAY_TARGET |
405                  PIPE_BIND_SCANOUT |
406                  PIPE_BIND_SHARED)) &&
407        /* 2101010 cannot be rendered to on non-r5xx. */
408        (!is_color2101010 || (is_r500 && drm_2_8_0)) &&
409        r300_is_colorbuffer_format_supported(format)) {
410        retval |= usage &
411            (PIPE_BIND_RENDER_TARGET |
412             PIPE_BIND_DISPLAY_TARGET |
413             PIPE_BIND_SCANOUT |
414             PIPE_BIND_SHARED);
415    }
416
417    /* Check depth-stencil format support. */
418    if (usage & PIPE_BIND_DEPTH_STENCIL &&
419        r300_is_zs_format_supported(format)) {
420        retval |= PIPE_BIND_DEPTH_STENCIL;
421    }
422
423    /* Check vertex buffer format support. */
424    if (usage & PIPE_BIND_VERTEX_BUFFER &&
425        /* Half float is supported on >= RV350. */
426        (is_r400 || is_r500 || !is_half_float) &&
427        r300_translate_vertex_data_type(format) != R300_INVALID_FORMAT) {
428        retval |= PIPE_BIND_VERTEX_BUFFER;
429    }
430
431    /* Transfers are always supported. */
432    if (usage & PIPE_BIND_TRANSFER_READ)
433        retval |= PIPE_BIND_TRANSFER_READ;
434    if (usage & PIPE_BIND_TRANSFER_WRITE)
435        retval |= PIPE_BIND_TRANSFER_WRITE;
436
437    return retval == usage;
438}
439
440static void r300_destroy_screen(struct pipe_screen* pscreen)
441{
442    struct r300_screen* r300screen = r300_screen(pscreen);
443    struct radeon_winsys *rws = radeon_winsys(pscreen);
444
445    util_slab_destroy(&r300screen->pool_buffers);
446    pipe_mutex_destroy(r300screen->num_contexts_mutex);
447
448    if (rws)
449      rws->destroy(rws);
450
451    FREE(r300screen);
452}
453
/* Make *ptr reference the given fence.
 *
 * Fence handles are treated as pb_buffer pointers here, so the work is
 * handed to pb_reference. */
static void r300_fence_reference(struct pipe_screen *screen,
                                 struct pipe_fence_handle **ptr,
                                 struct pipe_fence_handle *fence)
{
    struct pb_buffer **dst = (struct pb_buffer**)ptr;
    struct pb_buffer *src = (struct pb_buffer*)fence;

    pb_reference(dst, src);
}
461
462static boolean r300_fence_signalled(struct pipe_screen *screen,
463                                    struct pipe_fence_handle *fence)
464{
465    struct radeon_winsys *rws = r300_screen(screen)->rws;
466    struct pb_buffer *rfence = (struct pb_buffer*)fence;
467
468    return !rws->buffer_is_busy(rfence, RADEON_USAGE_READWRITE);
469}
470
471static boolean r300_fence_finish(struct pipe_screen *screen,
472                                 struct pipe_fence_handle *fence,
473                                 uint64_t timeout)
474{
475    struct radeon_winsys *rws = r300_screen(screen)->rws;
476    struct pb_buffer *rfence = (struct pb_buffer*)fence;
477
478    if (timeout != PIPE_TIMEOUT_INFINITE) {
479        int64_t start_time = os_time_get();
480
481        /* Convert to microseconds. */
482        timeout /= 1000;
483
484        /* Wait in a loop. */
485        while (rws->buffer_is_busy(rfence, RADEON_USAGE_READWRITE)) {
486            if (os_time_get() - start_time >= timeout) {
487                return FALSE;
488            }
489            os_time_sleep(10);
490        }
491        return TRUE;
492    }
493
494    rws->buffer_wait(rfence, RADEON_USAGE_READWRITE);
495    return TRUE;
496}
497
498struct pipe_screen* r300_screen_create(struct radeon_winsys *rws)
499{
500    struct r300_screen *r300screen = CALLOC_STRUCT(r300_screen);
501
502    if (!r300screen) {
503        FREE(r300screen);
504        return NULL;
505    }
506
507    rws->query_info(rws, &r300screen->info);
508
509    r300_init_debug(r300screen);
510    r300_parse_chipset(r300screen->info.pci_id, &r300screen->caps);
511
512    if (SCREEN_DBG_ON(r300screen, DBG_NO_ZMASK))
513        r300screen->caps.zmask_ram = 0;
514    if (SCREEN_DBG_ON(r300screen, DBG_NO_HIZ))
515        r300screen->caps.hiz_ram = 0;
516
517    if (r300screen->info.drm_minor < 8)
518        r300screen->caps.has_us_format = FALSE;
519
520    pipe_mutex_init(r300screen->num_contexts_mutex);
521
522    util_slab_create(&r300screen->pool_buffers,
523                     sizeof(struct r300_resource), 64,
524                     UTIL_SLAB_SINGLETHREADED);
525
526    r300screen->rws = rws;
527    r300screen->screen.winsys = (struct pipe_winsys*)rws;
528    r300screen->screen.destroy = r300_destroy_screen;
529    r300screen->screen.get_name = r300_get_name;
530    r300screen->screen.get_vendor = r300_get_vendor;
531    r300screen->screen.get_param = r300_get_param;
532    r300screen->screen.get_shader_param = r300_get_shader_param;
533    r300screen->screen.get_paramf = r300_get_paramf;
534    r300screen->screen.get_video_param = r300_get_video_param;
535    r300screen->screen.is_format_supported = r300_is_format_supported;
536    r300screen->screen.is_video_format_supported = vl_video_buffer_is_format_supported;
537    r300screen->screen.context_create = r300_create_context;
538    r300screen->screen.fence_reference = r300_fence_reference;
539    r300screen->screen.fence_signalled = r300_fence_signalled;
540    r300screen->screen.fence_finish = r300_fence_finish;
541
542    r300_init_screen_resource_functions(r300screen);
543
544    util_format_s3tc_init();
545
546    return &r300screen->screen;
547}
548