1/*
2 * Copyright 2008 Ben Skeggs
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
21 */
22
23#include "pipe/p_state.h"
24#include "pipe/p_defines.h"
25#include "util/u_inlines.h"
26#include "util/u_format.h"
27
28#include "nv50/nv50_context.h"
29#include "nv50/nv50_resource.h"
30
31uint32_t
32nv50_tex_choose_tile_dims_helper(unsigned nx, unsigned ny, unsigned nz,
33                                 bool is_3d)
34{
35   uint32_t tile_mode = 0x000;
36
37   if (ny > 64) tile_mode = 0x040; /* height 128 tiles */
38   else
39   if (ny > 32) tile_mode = 0x030; /* height 64 tiles */
40   else
41   if (ny > 16) tile_mode = 0x020; /* height 32 tiles */
42   else
43   if (ny >  8) tile_mode = 0x010; /* height 16 tiles */
44
45   if (!is_3d)
46      return tile_mode;
47   else
48      if (tile_mode > 0x020)
49         tile_mode = 0x020;
50
51   if (nz > 16 && tile_mode < 0x020)
52      return tile_mode | 0x500; /* depth 32 tiles */
53   if (nz > 8) return tile_mode | 0x400; /* depth 16 tiles */
54   if (nz > 4) return tile_mode | 0x300; /* depth 8 tiles */
55   if (nz > 2) return tile_mode | 0x200; /* depth 4 tiles */
56   if (nz > 1) return tile_mode | 0x100; /* depth 2 tiles */
57
58   return tile_mode;
59}
60
61static uint32_t
62nv50_tex_choose_tile_dims(unsigned nx, unsigned ny, unsigned nz, bool is_3d)
63{
64   return nv50_tex_choose_tile_dims_helper(nx, ny * 2, nz, is_3d);
65}
66
67static uint32_t
68nv50_mt_choose_storage_type(struct nv50_miptree *mt, bool compressed)
69{
70   const unsigned ms = util_logbase2(mt->base.base.nr_samples);
71   uint32_t tile_flags;
72
73   if (unlikely(mt->base.base.flags & NOUVEAU_RESOURCE_FLAG_LINEAR))
74      return 0;
75   if (unlikely(mt->base.base.bind & PIPE_BIND_CURSOR))
76      return 0;
77
78   switch (mt->base.base.format) {
79   case PIPE_FORMAT_Z16_UNORM:
80      tile_flags = 0x6c + ms;
81      break;
82   case PIPE_FORMAT_X8Z24_UNORM:
83   case PIPE_FORMAT_S8X24_UINT:
84   case PIPE_FORMAT_S8_UINT_Z24_UNORM:
85      tile_flags = 0x18 + ms;
86      break;
87   case PIPE_FORMAT_X24S8_UINT:
88   case PIPE_FORMAT_Z24X8_UNORM:
89   case PIPE_FORMAT_Z24_UNORM_S8_UINT:
90      tile_flags = 0x128 + ms;
91      break;
92   case PIPE_FORMAT_Z32_FLOAT:
93      tile_flags = 0x40 + ms;
94      break;
95   case PIPE_FORMAT_X32_S8X24_UINT:
96   case PIPE_FORMAT_Z32_FLOAT_S8X24_UINT:
97      tile_flags = 0x60 + ms;
98      break;
99   default:
100      /* Most color formats don't work with compression. */
101      compressed = false;
102      /* fallthrough */
103   case PIPE_FORMAT_R8G8B8A8_UNORM:
104   case PIPE_FORMAT_R8G8B8A8_SRGB:
105   case PIPE_FORMAT_R8G8B8X8_UNORM:
106   case PIPE_FORMAT_R8G8B8X8_SRGB:
107   case PIPE_FORMAT_B8G8R8A8_UNORM:
108   case PIPE_FORMAT_B8G8R8A8_SRGB:
109   case PIPE_FORMAT_B8G8R8X8_UNORM:
110   case PIPE_FORMAT_B8G8R8X8_SRGB:
111   case PIPE_FORMAT_R10G10B10A2_UNORM:
112   case PIPE_FORMAT_B10G10R10A2_UNORM:
113   case PIPE_FORMAT_R16G16B16A16_FLOAT:
114   case PIPE_FORMAT_R16G16B16X16_FLOAT:
115   case PIPE_FORMAT_R11G11B10_FLOAT:
116      switch (util_format_get_blocksizebits(mt->base.base.format)) {
117      case 128:
118         assert(ms < 3);
119         tile_flags = 0x74;
120         break;
121      case 64:
122         switch (ms) {
123         case 2: tile_flags = 0xfc; break;
124         case 3: tile_flags = 0xfd; break;
125         default:
126            tile_flags = 0x70;
127            break;
128         }
129         break;
130      case 32:
131         if (mt->base.base.bind & PIPE_BIND_SCANOUT) {
132            assert(ms == 0);
133            tile_flags = 0x7a;
134         } else {
135            switch (ms) {
136            case 2: tile_flags = 0xf8; break;
137            case 3: tile_flags = 0xf9; break;
138            default:
139               tile_flags = 0x70;
140               break;
141            }
142         }
143         break;
144      case 16:
145      case 8:
146         tile_flags = 0x70;
147         break;
148      default:
149         return 0;
150      }
151      if (mt->base.base.bind & PIPE_BIND_CURSOR)
152         tile_flags = 0;
153   }
154
155   if (!compressed)
156      tile_flags &= ~0x180;
157
158   return tile_flags;
159}
160
161void
162nv50_miptree_destroy(struct pipe_screen *pscreen, struct pipe_resource *pt)
163{
164   struct nv50_miptree *mt = nv50_miptree(pt);
165
166   if (mt->base.fence && mt->base.fence->state < NOUVEAU_FENCE_STATE_FLUSHED)
167      nouveau_fence_work(mt->base.fence, nouveau_fence_unref_bo, mt->base.bo);
168   else
169      nouveau_bo_ref(NULL, &mt->base.bo);
170
171   nouveau_fence_ref(NULL, &mt->base.fence);
172   nouveau_fence_ref(NULL, &mt->base.fence_wr);
173
174   NOUVEAU_DRV_STAT(nouveau_screen(pscreen), tex_obj_current_count, -1);
175   NOUVEAU_DRV_STAT(nouveau_screen(pscreen), tex_obj_current_bytes,
176                    -(uint64_t)mt->total_size);
177
178   FREE(mt);
179}
180
181boolean
182nv50_miptree_get_handle(struct pipe_screen *pscreen,
183                        struct pipe_resource *pt,
184                        struct winsys_handle *whandle)
185{
186   struct nv50_miptree *mt = nv50_miptree(pt);
187   unsigned stride;
188
189   if (!mt || !mt->base.bo)
190      return false;
191
192   stride = mt->level[0].pitch;
193
194   return nouveau_screen_bo_get_handle(pscreen,
195                                       mt->base.bo,
196                                       stride,
197                                       whandle);
198}
199
200const struct u_resource_vtbl nv50_miptree_vtbl =
201{
202   nv50_miptree_get_handle,         /* get_handle */
203   nv50_miptree_destroy,            /* resource_destroy */
204   nv50_miptree_transfer_map,       /* transfer_map */
205   u_default_transfer_flush_region, /* transfer_flush_region */
206   nv50_miptree_transfer_unmap,     /* transfer_unmap */
207};
208
209static inline bool
210nv50_miptree_init_ms_mode(struct nv50_miptree *mt)
211{
212   switch (mt->base.base.nr_samples) {
213   case 8:
214      mt->ms_mode = NV50_3D_MULTISAMPLE_MODE_MS8;
215      mt->ms_x = 2;
216      mt->ms_y = 1;
217      break;
218   case 4:
219      mt->ms_mode = NV50_3D_MULTISAMPLE_MODE_MS4;
220      mt->ms_x = 1;
221      mt->ms_y = 1;
222      break;
223   case 2:
224      mt->ms_mode = NV50_3D_MULTISAMPLE_MODE_MS2;
225      mt->ms_x = 1;
226      break;
227   case 1:
228   case 0:
229      mt->ms_mode = NV50_3D_MULTISAMPLE_MODE_MS1;
230      break;
231   default:
232      NOUVEAU_ERR("invalid nr_samples: %u\n", mt->base.base.nr_samples);
233      return false;
234   }
235   return true;
236}
237
238bool
239nv50_miptree_init_layout_linear(struct nv50_miptree *mt, unsigned pitch_align)
240{
241   struct pipe_resource *pt = &mt->base.base;
242   const unsigned blocksize = util_format_get_blocksize(pt->format);
243   unsigned h = pt->height0;
244
245   if (util_format_is_depth_or_stencil(pt->format))
246      return false;
247
248   if ((pt->last_level > 0) || (pt->depth0 > 1) || (pt->array_size > 1))
249      return false;
250   if (mt->ms_x | mt->ms_y)
251      return false;
252
253   mt->level[0].pitch = align(pt->width0 * blocksize, pitch_align);
254
255   /* Account for very generous prefetch (allocate size as if tiled). */
256   h = MAX2(h, 8);
257   h = util_next_power_of_two(h);
258
259   mt->total_size = mt->level[0].pitch * h;
260
261   return true;
262}
263
264static void
265nv50_miptree_init_layout_video(struct nv50_miptree *mt)
266{
267   const struct pipe_resource *pt = &mt->base.base;
268   const unsigned blocksize = util_format_get_blocksize(pt->format);
269
270   assert(pt->last_level == 0);
271   assert(mt->ms_x == 0 && mt->ms_y == 0);
272   assert(!util_format_is_compressed(pt->format));
273
274   mt->layout_3d = pt->target == PIPE_TEXTURE_3D;
275
276   mt->level[0].tile_mode = 0x20;
277   mt->level[0].pitch = align(pt->width0 * blocksize, 64);
278   mt->total_size = align(pt->height0, 16) * mt->level[0].pitch * (mt->layout_3d ? pt->depth0 : 1);
279
280   if (pt->array_size > 1) {
281      mt->layer_stride = align(mt->total_size, NV50_TILE_SIZE(0x20));
282      mt->total_size = mt->layer_stride * pt->array_size;
283   }
284}
285
286static void
287nv50_miptree_init_layout_tiled(struct nv50_miptree *mt)
288{
289   struct pipe_resource *pt = &mt->base.base;
290   unsigned w, h, d, l;
291   const unsigned blocksize = util_format_get_blocksize(pt->format);
292
293   mt->layout_3d = pt->target == PIPE_TEXTURE_3D;
294
295   w = pt->width0 << mt->ms_x;
296   h = pt->height0 << mt->ms_y;
297
298   /* For 3D textures, a mipmap is spanned by all the layers, for array
299    * textures and cube maps, each layer contains its own mipmaps.
300    */
301   d = mt->layout_3d ? pt->depth0 : 1;
302
303   for (l = 0; l <= pt->last_level; ++l) {
304      struct nv50_miptree_level *lvl = &mt->level[l];
305      unsigned tsx, tsy, tsz;
306      unsigned nbx = util_format_get_nblocksx(pt->format, w);
307      unsigned nby = util_format_get_nblocksy(pt->format, h);
308
309      lvl->offset = mt->total_size;
310
311      lvl->tile_mode = nv50_tex_choose_tile_dims(nbx, nby, d, mt->layout_3d);
312
313      tsx = NV50_TILE_SIZE_X(lvl->tile_mode); /* x is tile row pitch in bytes */
314      tsy = NV50_TILE_SIZE_Y(lvl->tile_mode);
315      tsz = NV50_TILE_SIZE_Z(lvl->tile_mode);
316
317      lvl->pitch = align(nbx * blocksize, tsx);
318
319      mt->total_size += lvl->pitch * align(nby, tsy) * align(d, tsz);
320
321      w = u_minify(w, 1);
322      h = u_minify(h, 1);
323      d = u_minify(d, 1);
324   }
325
326   if (pt->array_size > 1) {
327      mt->layer_stride = align(mt->total_size,
328                               NV50_TILE_SIZE(mt->level[0].tile_mode));
329      mt->total_size = mt->layer_stride * pt->array_size;
330   }
331}
332
333struct pipe_resource *
334nv50_miptree_create(struct pipe_screen *pscreen,
335                    const struct pipe_resource *templ)
336{
337   struct nouveau_device *dev = nouveau_screen(pscreen)->device;
338   struct nouveau_drm *drm = nouveau_screen(pscreen)->drm;
339   struct nv50_miptree *mt = CALLOC_STRUCT(nv50_miptree);
340   struct pipe_resource *pt = &mt->base.base;
341   bool compressed = drm->version >= 0x01000101;
342   int ret;
343   union nouveau_bo_config bo_config;
344   uint32_t bo_flags;
345
346   if (!mt)
347      return NULL;
348
349   mt->base.vtbl = &nv50_miptree_vtbl;
350   *pt = *templ;
351   pipe_reference_init(&pt->reference, 1);
352   pt->screen = pscreen;
353
354   if (pt->bind & PIPE_BIND_LINEAR)
355      pt->flags |= NOUVEAU_RESOURCE_FLAG_LINEAR;
356
357   bo_config.nv50.memtype = nv50_mt_choose_storage_type(mt, compressed);
358
359   if (!nv50_miptree_init_ms_mode(mt)) {
360      FREE(mt);
361      return NULL;
362   }
363
364   if (unlikely(pt->flags & NV50_RESOURCE_FLAG_VIDEO)) {
365      nv50_miptree_init_layout_video(mt);
366      if (pt->flags & NV50_RESOURCE_FLAG_NOALLOC) {
367         /* BO allocation done by client */
368         return pt;
369      }
370   } else
371   if (bo_config.nv50.memtype != 0) {
372      nv50_miptree_init_layout_tiled(mt);
373   } else
374   if (!nv50_miptree_init_layout_linear(mt, 64)) {
375      FREE(mt);
376      return NULL;
377   }
378   bo_config.nv50.tile_mode = mt->level[0].tile_mode;
379
380   if (!bo_config.nv50.memtype && (pt->bind & PIPE_BIND_SHARED))
381      mt->base.domain = NOUVEAU_BO_GART;
382   else
383      mt->base.domain = NV_VRAM_DOMAIN(nouveau_screen(pscreen));
384
385   bo_flags = mt->base.domain | NOUVEAU_BO_NOSNOOP;
386   if (mt->base.base.bind & (PIPE_BIND_CURSOR | PIPE_BIND_DISPLAY_TARGET))
387      bo_flags |= NOUVEAU_BO_CONTIG;
388
389   ret = nouveau_bo_new(dev, bo_flags, 4096, mt->total_size, &bo_config,
390                        &mt->base.bo);
391   if (ret) {
392      FREE(mt);
393      return NULL;
394   }
395   mt->base.address = mt->base.bo->offset;
396
397   return pt;
398}
399
400struct pipe_resource *
401nv50_miptree_from_handle(struct pipe_screen *pscreen,
402                         const struct pipe_resource *templ,
403                         struct winsys_handle *whandle)
404{
405   struct nv50_miptree *mt;
406   unsigned stride;
407
408   /* only supports 2D, non-mipmapped textures for the moment */
409   if ((templ->target != PIPE_TEXTURE_2D &&
410        templ->target != PIPE_TEXTURE_RECT) ||
411       templ->last_level != 0 ||
412       templ->depth0 != 1 ||
413       templ->array_size > 1)
414      return NULL;
415
416   mt = CALLOC_STRUCT(nv50_miptree);
417   if (!mt)
418      return NULL;
419
420   mt->base.bo = nouveau_screen_bo_from_handle(pscreen, whandle, &stride);
421   if (mt->base.bo == NULL) {
422      FREE(mt);
423      return NULL;
424   }
425   mt->base.domain = mt->base.bo->flags & NOUVEAU_BO_APER;
426   mt->base.address = mt->base.bo->offset;
427
428   mt->base.base = *templ;
429   mt->base.vtbl = &nv50_miptree_vtbl;
430   pipe_reference_init(&mt->base.base.reference, 1);
431   mt->base.base.screen = pscreen;
432   mt->level[0].pitch = stride;
433   mt->level[0].offset = 0;
434   mt->level[0].tile_mode = mt->base.bo->config.nv50.tile_mode;
435
436   NOUVEAU_DRV_STAT(nouveau_screen(pscreen), tex_obj_current_count, 1);
437
438   /* no need to adjust bo reference count */
439   return &mt->base.base;
440}
441
442
443/* Offset of zslice @z from start of level @l. */
444inline unsigned
445nv50_mt_zslice_offset(const struct nv50_miptree *mt, unsigned l, unsigned z)
446{
447   const struct pipe_resource *pt = &mt->base.base;
448
449   unsigned tds = NV50_TILE_SHIFT_Z(mt->level[l].tile_mode);
450   unsigned ths = NV50_TILE_SHIFT_Y(mt->level[l].tile_mode);
451
452   unsigned nby = util_format_get_nblocksy(pt->format,
453                                           u_minify(pt->height0, l));
454
455   /* to next 2D tile slice within a 3D tile */
456   unsigned stride_2d = NV50_TILE_SIZE_2D(mt->level[l].tile_mode);
457
458   /* to slice in the next (in z direction) 3D tile */
459   unsigned stride_3d = (align(nby, (1 << ths)) * mt->level[l].pitch) << tds;
460
461   return (z & ((1 << tds) - 1)) * stride_2d + (z >> tds) * stride_3d;
462}
463
464/* Surface functions.
465 */
466
467struct nv50_surface *
468nv50_surface_from_miptree(struct nv50_miptree *mt,
469                          const struct pipe_surface *templ)
470{
471   struct pipe_surface *ps;
472   struct nv50_surface *ns = CALLOC_STRUCT(nv50_surface);
473   if (!ns)
474      return NULL;
475   ps = &ns->base;
476
477   pipe_reference_init(&ps->reference, 1);
478   pipe_resource_reference(&ps->texture, &mt->base.base);
479
480   ps->format = templ->format;
481   ps->writable = templ->writable;
482   ps->u.tex.level = templ->u.tex.level;
483   ps->u.tex.first_layer = templ->u.tex.first_layer;
484   ps->u.tex.last_layer = templ->u.tex.last_layer;
485
486   ns->width = u_minify(mt->base.base.width0, ps->u.tex.level);
487   ns->height = u_minify(mt->base.base.height0, ps->u.tex.level);
488   ns->depth = ps->u.tex.last_layer - ps->u.tex.first_layer + 1;
489   ns->offset = mt->level[templ->u.tex.level].offset;
490
491   /* comment says there are going to be removed, but they're used by the st */
492   ps->width = ns->width;
493   ps->height = ns->height;
494
495   ns->width <<= mt->ms_x;
496   ns->height <<= mt->ms_y;
497
498   return ns;
499}
500
501struct pipe_surface *
502nv50_miptree_surface_new(struct pipe_context *pipe,
503                         struct pipe_resource *pt,
504                         const struct pipe_surface *templ)
505{
506   struct nv50_miptree *mt = nv50_miptree(pt);
507   struct nv50_surface *ns = nv50_surface_from_miptree(mt, templ);
508   if (!ns)
509      return NULL;
510   ns->base.context = pipe;
511
512   if (ns->base.u.tex.first_layer) {
513      const unsigned l = ns->base.u.tex.level;
514      const unsigned z = ns->base.u.tex.first_layer;
515
516      if (mt->layout_3d) {
517         ns->offset += nv50_mt_zslice_offset(mt, l, z);
518
519         /* TODO: switch to depth 1 tiles; but actually this shouldn't happen */
520         if (ns->depth > 1 &&
521             (z & (NV50_TILE_SIZE_Z(mt->level[l].tile_mode) - 1)))
522            NOUVEAU_ERR("Creating unsupported 3D surface !\n");
523      } else {
524         ns->offset += mt->layer_stride * z;
525      }
526   }
527
528   return &ns->base;
529}
530