radeon_drm_bo.c revision 6ccab620a0e7364ab6c0d902b3ddf58ee988f7fa
1#define _FILE_OFFSET_BITS 64 2#include "radeon_drm_cs.h" 3 4#include "util/u_hash_table.h" 5#include "util/u_memory.h" 6#include "util/u_simple_list.h" 7#include "os/os_thread.h" 8 9#include "state_tracker/drm_driver.h" 10 11#include <sys/ioctl.h> 12#include <sys/mman.h> 13#include <xf86drm.h> 14#include <errno.h> 15 16#define RADEON_BO_FLAGS_MACRO_TILE 1 17#define RADEON_BO_FLAGS_MICRO_TILE 2 18#define RADEON_BO_FLAGS_MICRO_TILE_SQUARE 0x20 19 20extern const struct pb_vtbl radeon_bo_vtbl; 21 22 23static INLINE struct radeon_bo *radeon_bo(struct pb_buffer *bo) 24{ 25 assert(bo->vtbl == &radeon_bo_vtbl); 26 return (struct radeon_bo *)bo; 27} 28 29struct radeon_bomgr { 30 /* Base class. */ 31 struct pb_manager base; 32 33 /* Winsys. */ 34 struct radeon_drm_winsys *rws; 35 36 /* List of buffer handles and its mutex. */ 37 struct util_hash_table *bo_handles; 38 pipe_mutex bo_handles_mutex; 39}; 40 41static INLINE struct radeon_bomgr *radeon_bomgr(struct pb_manager *mgr) 42{ 43 return (struct radeon_bomgr *)mgr; 44} 45 46static struct radeon_bo *get_radeon_bo(struct pb_buffer *_buf) 47{ 48 struct radeon_bo *bo = NULL; 49 50 if (_buf->vtbl == &radeon_bo_vtbl) { 51 bo = radeon_bo(_buf); 52 } else { 53 struct pb_buffer *base_buf; 54 pb_size offset; 55 pb_get_base_buffer(_buf, &base_buf, &offset); 56 57 if (base_buf->vtbl == &radeon_bo_vtbl) 58 bo = radeon_bo(base_buf); 59 } 60 61 return bo; 62} 63 64void radeon_bo_unref(struct radeon_bo *bo) 65{ 66 struct drm_gem_close args = {}; 67 68 if (!p_atomic_dec_zero(&bo->cref)) 69 return; 70 71 if (bo->name) { 72 pipe_mutex_lock(bo->mgr->bo_handles_mutex); 73 util_hash_table_remove(bo->mgr->bo_handles, 74 (void*)(uintptr_t)bo->name); 75 pipe_mutex_unlock(bo->mgr->bo_handles_mutex); 76 } 77 78 if (bo->ptr) 79 munmap(bo->ptr, bo->size); 80 81 /* Close object. */ 82 args.handle = bo->handle; 83 drmIoctl(bo->mgr->rws->fd, DRM_IOCTL_GEM_CLOSE, &args); 84 FREE(bo); 85} 86 87static void radeon_bo_wait(struct r300_winsys_bo *_buf) 88{ 89 struct radeon_bo *bo = get_radeon_bo(pb_buffer(_buf)); 90 struct drm_radeon_gem_wait_idle args = {}; 91 92 args.handle = bo->handle; 93 while (drmCommandWriteRead(bo->mgr->rws->fd, DRM_RADEON_GEM_WAIT_IDLE, 94 &args, sizeof(args)) == -EBUSY); 95} 96 97static boolean radeon_bo_is_busy(struct r300_winsys_bo *_buf) 98{ 99 struct radeon_bo *bo = get_radeon_bo(pb_buffer(_buf)); 100 struct drm_radeon_gem_busy args = {}; 101 102 args.handle = bo->handle; 103 return drmCommandWriteRead(bo->mgr->rws->fd, DRM_RADEON_GEM_BUSY, 104 &args, sizeof(args)) != 0; 105} 106 107static void radeon_bo_destroy(struct pb_buffer *_buf) 108{ 109 struct radeon_bo *bo = radeon_bo(_buf); 110 111 radeon_bo_unref(bo); 112} 113 114static unsigned get_pb_usage_from_transfer_flags(enum pipe_transfer_usage usage) 115{ 116 unsigned res = 0; 117 118 if (usage & PIPE_TRANSFER_READ) 119 res |= PB_USAGE_CPU_READ; 120 121 if (usage & PIPE_TRANSFER_WRITE) 122 res |= PB_USAGE_CPU_WRITE; 123 124 if (usage & PIPE_TRANSFER_DONTBLOCK) 125 res |= PB_USAGE_DONTBLOCK; 126 127 if (usage & PIPE_TRANSFER_UNSYNCHRONIZED) 128 res |= PB_USAGE_UNSYNCHRONIZED; 129 130 return res; 131} 132 133static void *radeon_bo_map_internal(struct pb_buffer *_buf, 134 unsigned flags, void *flush_ctx) 135{ 136 struct radeon_bo *bo = radeon_bo(_buf); 137 struct radeon_drm_cs *cs = flush_ctx; 138 struct drm_radeon_gem_mmap args = {}; 139 140 if (flags & PB_USAGE_DONTBLOCK) { 141 /* Note how we use radeon_bo_is_referenced_by_cs here. There are 142 * basically two places this map function can be called from: 143 * - pb_map 144 * - create_buffer (in the buffer reuse case) 145 * 146 * Since pb managers are per-winsys managers, not per-context managers, 147 * and we shouldn't reuse buffers if they are in-use in any context, 148 * we simply ask: is this buffer referenced by *any* CS? 149 * 150 * The problem with buffer_create is that it comes from pipe_screen, 151 * so we have no CS to look at, though luckily the following code 152 * is sufficient to tell whether the buffer is in use. */ 153 if (_buf->base.usage & RADEON_PB_USAGE_CACHE) { 154 if (radeon_bo_is_referenced_by_any_cs(bo)) 155 return NULL; 156 } 157 158 if (cs && radeon_bo_is_referenced_by_cs(cs, bo)) { 159 cs->flush_cs(cs->flush_data); 160 return NULL; /* It's very unlikely that the buffer is not busy. */ 161 } 162 163 if (radeon_bo_is_busy((struct r300_winsys_bo*)bo)) { 164 return NULL; 165 } 166 } 167 168 /* If it's not unsynchronized bo_map, flush CS if needed and then wait. */ 169 if (!(flags & PB_USAGE_UNSYNCHRONIZED)) { 170 if (cs && radeon_bo_is_referenced_by_cs(cs, bo)) { 171 cs->flush_cs(cs->flush_data); 172 } 173 174 radeon_bo_wait((struct r300_winsys_bo*)bo); 175 } 176 177 /* Map buffer if it's not already mapped. */ 178 /* XXX We may get a race in bo->ptr. */ 179 if (!bo->ptr) { 180 void *ptr; 181 182 args.handle = bo->handle; 183 args.offset = 0; 184 args.size = (uint64_t)bo->size; 185 if (drmCommandWriteRead(bo->mgr->rws->fd, 186 DRM_RADEON_GEM_MMAP, 187 &args, 188 sizeof(args))) { 189 fprintf(stderr, "radeon: gem_mmap failed: %p 0x%08X\n", 190 bo, bo->handle); 191 return NULL; 192 } 193 ptr = mmap(0, args.size, PROT_READ|PROT_WRITE, MAP_SHARED, 194 bo->mgr->rws->fd, args.addr_ptr); 195 if (ptr == MAP_FAILED) { 196 fprintf(stderr, "radeon: mmap failed, errno: %i\n", errno); 197 return NULL; 198 } 199 bo->ptr = ptr; 200 } 201 202 return bo->ptr; 203} 204 205static void radeon_bo_unmap_internal(struct pb_buffer *_buf) 206{ 207 /* NOP */ 208} 209 210static void radeon_bo_get_base_buffer(struct pb_buffer *buf, 211 struct pb_buffer **base_buf, 212 unsigned *offset) 213{ 214 *base_buf = buf; 215 *offset = 0; 216} 217 218static enum pipe_error radeon_bo_validate(struct pb_buffer *_buf, 219 struct pb_validate *vl, 220 unsigned flags) 221{ 222 /* Always pinned */ 223 return PIPE_OK; 224} 225 226static void radeon_bo_fence(struct pb_buffer *buf, 227 struct pipe_fence_handle *fence) 228{ 229} 230 231const struct pb_vtbl radeon_bo_vtbl = { 232 radeon_bo_destroy, 233 radeon_bo_map_internal, 234 radeon_bo_unmap_internal, 235 radeon_bo_validate, 236 radeon_bo_fence, 237 radeon_bo_get_base_buffer, 238}; 239 240static struct pb_buffer *radeon_bomgr_create_bo(struct pb_manager *_mgr, 241 pb_size size, 242 const struct pb_desc *desc) 243{ 244 struct radeon_bomgr *mgr = radeon_bomgr(_mgr); 245 struct radeon_drm_winsys *rws = mgr->rws; 246 struct radeon_bo *bo; 247 struct drm_radeon_gem_create args = {}; 248 249 args.size = size; 250 args.alignment = desc->alignment; 251 args.initial_domain = 252 (desc->usage & RADEON_PB_USAGE_DOMAIN_GTT ? 253 RADEON_GEM_DOMAIN_GTT : 0) | 254 (desc->usage & RADEON_PB_USAGE_DOMAIN_VRAM ? 255 RADEON_GEM_DOMAIN_VRAM : 0); 256 257 if (drmCommandWriteRead(rws->fd, DRM_RADEON_GEM_CREATE, 258 &args, sizeof(args))) { 259 fprintf(stderr, "Failed to allocate :\n"); 260 fprintf(stderr, " size : %d bytes\n", size); 261 fprintf(stderr, " alignment : %d bytes\n", desc->alignment); 262 fprintf(stderr, " domains : %d\n", args.initial_domain); 263 return NULL; 264 } 265 266 bo = CALLOC_STRUCT(radeon_bo); 267 if (!bo) 268 return NULL; 269 270 pipe_reference_init(&bo->base.base.reference, 1); 271 bo->base.base.alignment = desc->alignment; 272 bo->base.base.usage = desc->usage; 273 bo->base.base.size = size; 274 bo->base.vtbl = &radeon_bo_vtbl; 275 bo->mgr = mgr; 276 bo->handle = args.handle; 277 bo->size = size; 278 279 radeon_bo_ref(bo); 280 return &bo->base; 281} 282 283static void radeon_bomgr_flush(struct pb_manager *mgr) 284{ 285 /* NOP */ 286} 287 288static void radeon_bomgr_destroy(struct pb_manager *_mgr) 289{ 290 struct radeon_bomgr *mgr = radeon_bomgr(_mgr); 291 util_hash_table_destroy(mgr->bo_handles); 292 pipe_mutex_destroy(mgr->bo_handles_mutex); 293 FREE(mgr); 294} 295 296static unsigned handle_hash(void *key) 297{ 298 return (unsigned)key; 299} 300 301static int handle_compare(void *key1, void *key2) 302{ 303 return !((int)key1 == (int)key2); 304} 305 306struct pb_manager *radeon_bomgr_create(struct radeon_drm_winsys *rws) 307{ 308 struct radeon_bomgr *mgr; 309 310 mgr = CALLOC_STRUCT(radeon_bomgr); 311 if (!mgr) 312 return NULL; 313 314 mgr->base.destroy = radeon_bomgr_destroy; 315 mgr->base.create_buffer = radeon_bomgr_create_bo; 316 mgr->base.flush = radeon_bomgr_flush; 317 318 mgr->rws = rws; 319 mgr->bo_handles = util_hash_table_create(handle_hash, handle_compare); 320 pipe_mutex_init(mgr->bo_handles_mutex); 321 return &mgr->base; 322} 323 324static void *radeon_bo_map(struct r300_winsys_bo *buf, 325 struct r300_winsys_cs *cs, 326 enum pipe_transfer_usage usage) 327{ 328 struct pb_buffer *_buf = pb_buffer(buf); 329 330 return pb_map(_buf, get_pb_usage_from_transfer_flags(usage), cs); 331} 332 333static void radeon_bo_get_tiling(struct r300_winsys_bo *_buf, 334 enum r300_buffer_tiling *microtiled, 335 enum r300_buffer_tiling *macrotiled) 336{ 337 struct radeon_bo *bo = get_radeon_bo(pb_buffer(_buf)); 338 struct drm_radeon_gem_set_tiling args = {}; 339 340 args.handle = bo->handle; 341 342 drmCommandWriteRead(bo->mgr->rws->fd, 343 DRM_RADEON_GEM_GET_TILING, 344 &args, 345 sizeof(args)); 346 347 *microtiled = R300_BUFFER_LINEAR; 348 *macrotiled = R300_BUFFER_LINEAR; 349 if (args.tiling_flags & RADEON_BO_FLAGS_MICRO_TILE) 350 *microtiled = R300_BUFFER_TILED; 351 352 if (args.tiling_flags & RADEON_BO_FLAGS_MACRO_TILE) 353 *macrotiled = R300_BUFFER_TILED; 354} 355 356static void radeon_bo_set_tiling(struct r300_winsys_bo *_buf, 357 enum r300_buffer_tiling microtiled, 358 enum r300_buffer_tiling macrotiled, 359 uint32_t pitch) 360{ 361 struct radeon_bo *bo = get_radeon_bo(pb_buffer(_buf)); 362 struct drm_radeon_gem_set_tiling args = {}; 363 364 if (microtiled == R300_BUFFER_TILED) 365 args.tiling_flags |= RADEON_BO_FLAGS_MICRO_TILE; 366 else if (microtiled == R300_BUFFER_SQUARETILED) 367 args.tiling_flags |= RADEON_BO_FLAGS_MICRO_TILE_SQUARE; 368 369 if (macrotiled == R300_BUFFER_TILED) 370 args.tiling_flags |= RADEON_BO_FLAGS_MACRO_TILE; 371 372 args.handle = bo->handle; 373 args.pitch = pitch; 374 375 drmCommandWriteRead(bo->mgr->rws->fd, 376 DRM_RADEON_GEM_SET_TILING, 377 &args, 378 sizeof(args)); 379} 380 381static struct r300_winsys_cs_handle *radeon_drm_get_cs_handle( 382 struct r300_winsys_bo *_buf) 383{ 384 /* return radeon_bo. */ 385 return (struct r300_winsys_cs_handle*) 386 get_radeon_bo(pb_buffer(_buf)); 387} 388 389static unsigned get_pb_usage_from_create_flags(unsigned bind, unsigned usage, 390 enum r300_buffer_domain domain) 391{ 392 unsigned res = 0; 393 394 if (bind & (PIPE_BIND_VERTEX_BUFFER | PIPE_BIND_INDEX_BUFFER)) 395 res |= RADEON_PB_USAGE_CACHE; 396 397 if (domain & R300_DOMAIN_GTT) 398 res |= RADEON_PB_USAGE_DOMAIN_GTT; 399 400 if (domain & R300_DOMAIN_VRAM) 401 res |= RADEON_PB_USAGE_DOMAIN_VRAM; 402 403 return res; 404} 405 406static struct r300_winsys_bo * 407radeon_winsys_bo_create(struct r300_winsys_screen *rws, 408 unsigned size, 409 unsigned alignment, 410 unsigned bind, 411 unsigned usage, 412 enum r300_buffer_domain domain) 413{ 414 struct radeon_drm_winsys *ws = radeon_drm_winsys(rws); 415 struct pb_desc desc; 416 struct pb_manager *provider; 417 struct pb_buffer *buffer; 418 419 memset(&desc, 0, sizeof(desc)); 420 desc.alignment = alignment; 421 desc.usage = get_pb_usage_from_create_flags(bind, usage, domain); 422 423 /* Assign a buffer manager. */ 424 if (bind & (PIPE_BIND_VERTEX_BUFFER | PIPE_BIND_INDEX_BUFFER)) 425 provider = ws->cman; 426 else 427 provider = ws->kman; 428 429 buffer = provider->create_buffer(provider, size, &desc); 430 if (!buffer) 431 return NULL; 432 433 return (struct r300_winsys_bo*)buffer; 434} 435 436static struct r300_winsys_bo *radeon_winsys_bo_from_handle(struct r300_winsys_screen *rws, 437 struct winsys_handle *whandle, 438 unsigned *stride, 439 unsigned *size) 440{ 441 struct radeon_drm_winsys *ws = radeon_drm_winsys(rws); 442 struct radeon_bo *bo; 443 struct radeon_bomgr *mgr = radeon_bomgr(ws->kman); 444 struct drm_gem_open open_arg = {}; 445 446 /* We must maintain a list of pairs <handle, bo>, so that we always return 447 * the same BO for one particular handle. If we didn't do that and created 448 * more than one BO for the same handle and then relocated them in a CS, 449 * we would hit a deadlock in the kernel. 450 * 451 * The list of pairs is guarded by a mutex, of course. */ 452 pipe_mutex_lock(mgr->bo_handles_mutex); 453 454 /* First check if there already is an existing bo for the handle. */ 455 bo = util_hash_table_get(mgr->bo_handles, (void*)(uintptr_t)whandle->handle); 456 if (bo) { 457 /* Increase the refcount. */ 458 struct pb_buffer *b = NULL; 459 pb_reference(&b, &bo->base); 460 goto done; 461 } 462 463 /* There isn't, create a new one. */ 464 bo = CALLOC_STRUCT(radeon_bo); 465 if (!bo) { 466 goto fail; 467 } 468 469 /* Open the BO. */ 470 open_arg.name = whandle->handle; 471 if (drmIoctl(ws->fd, DRM_IOCTL_GEM_OPEN, &open_arg)) { 472 goto fail; 473 } 474 bo->handle = open_arg.handle; 475 bo->size = open_arg.size; 476 bo->name = whandle->handle; 477 radeon_bo_ref(bo); 478 479 /* Initialize it. */ 480 pipe_reference_init(&bo->base.base.reference, 1); 481 bo->base.base.alignment = 0; 482 bo->base.base.usage = PB_USAGE_GPU_WRITE | PB_USAGE_GPU_READ; 483 bo->base.base.size = bo->size; 484 bo->base.vtbl = &radeon_bo_vtbl; 485 bo->mgr = mgr; 486 487 util_hash_table_set(mgr->bo_handles, (void*)(uintptr_t)whandle->handle, bo); 488 489done: 490 pipe_mutex_unlock(mgr->bo_handles_mutex); 491 492 if (stride) 493 *stride = whandle->stride; 494 if (size) 495 *size = bo->base.base.size; 496 497 return (struct r300_winsys_bo*)bo; 498 499fail: 500 pipe_mutex_unlock(mgr->bo_handles_mutex); 501 return NULL; 502} 503 504static boolean radeon_winsys_bo_get_handle(struct r300_winsys_bo *buffer, 505 unsigned stride, 506 struct winsys_handle *whandle) 507{ 508 struct drm_gem_flink flink = {}; 509 struct radeon_bo *bo = get_radeon_bo(pb_buffer(buffer)); 510 whandle->stride = stride; 511 512 513 if (whandle->type == DRM_API_HANDLE_TYPE_SHARED) { 514 if (!bo->flinked) { 515 flink.handle = bo->handle; 516 517 if (ioctl(bo->mgr->rws->fd, DRM_IOCTL_GEM_FLINK, &flink)) { 518 return FALSE; 519 } 520 521 bo->flinked = TRUE; 522 bo->flink = flink.name; 523 } 524 whandle->handle = bo->flink; 525 } else if (whandle->type == DRM_API_HANDLE_TYPE_KMS) { 526 whandle->handle = bo->handle; 527 } 528 return TRUE; 529} 530 531void radeon_bomgr_init_functions(struct radeon_drm_winsys *ws) 532{ 533 ws->base.buffer_get_cs_handle = radeon_drm_get_cs_handle; 534 ws->base.buffer_set_tiling = radeon_bo_set_tiling; 535 ws->base.buffer_get_tiling = radeon_bo_get_tiling; 536 ws->base.buffer_map = radeon_bo_map; 537 ws->base.buffer_unmap = pb_unmap; 538 ws->base.buffer_wait = radeon_bo_wait; 539 ws->base.buffer_is_busy = radeon_bo_is_busy; 540 ws->base.buffer_create = radeon_winsys_bo_create; 541 ws->base.buffer_from_handle = radeon_winsys_bo_from_handle; 542 ws->base.buffer_get_handle = radeon_winsys_bo_get_handle; 543} 544