vmwgfx_execbuf.c revision 97a875cbdf89a4638eea57c2b456c7cc4e3e8b21
1/**************************************************************************
2 *
3 * Copyright © 2009 VMware, Inc., Palo Alto, CA., USA
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
19 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
20 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
21 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
22 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
23 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
24 * USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28#include "vmwgfx_drv.h"
29#include "vmwgfx_reg.h"
30#include <drm/ttm/ttm_bo_api.h>
31#include <drm/ttm/ttm_placement.h>
32
33#define VMW_RES_HT_ORDER 12
34
35/**
36 * struct vmw_resource_relocation - Relocation info for resources
37 *
38 * @head: List head for the software context's relocation list.
39 * @res: Non-ref-counted pointer to the resource.
40 * @offset: Offset, in units of 4-byte entries, into the command buffer where the
41 * id that needs fixup is located.
42 */
43struct vmw_resource_relocation {
44	struct list_head head;
45	const struct vmw_resource *res;
46	unsigned long offset;
47};
48
49/**
50 * struct vmw_resource_val_node - Validation info for resources
51 *
52 * @head: List head for the software context's resource list.
53 * @hash: Hash entry for quick resource to val_node lookup.
54 * @res: Ref-counted pointer to the resource.
55 * @switch_backup: Boolean whether to switch backup buffer on unreserve.
56 * @new_backup: Refcounted pointer to the new backup buffer.
57 * @new_backup_offset: New backup buffer offset if @new_backup is non-NULL.
58 * @first_usage: Set to true the first time the resource is referenced in
59 * the command stream.
60 * @no_buffer_needed: Resources do not need to allocate buffer backup on
61 * reservation. The command stream will provide one.
62 */
63struct vmw_resource_val_node {
64	struct list_head head;
65	struct drm_hash_item hash;
66	struct vmw_resource *res;
67	struct vmw_dma_buffer *new_backup;
68	unsigned long new_backup_offset;
69	bool first_usage;
70	bool no_buffer_needed;
71};
72
73/**
74 * vmw_resource_list_unreserve - unreserve resources previously reserved for
75 * command submission.
76 *
77 * @list: List of resources to unreserve.
78 * @backoff: Whether command submission failed.
79 */
80static void vmw_resource_list_unreserve(struct list_head *list,
81					bool backoff)
82{
83	struct vmw_resource_val_node *val;
84
85	list_for_each_entry(val, list, head) {
86		struct vmw_resource *res = val->res;
87		struct vmw_dma_buffer *new_backup =
88			backoff ? NULL : val->new_backup;
89
90		vmw_resource_unreserve(res, new_backup,
91			val->new_backup_offset);
92		vmw_dmabuf_unreference(&val->new_backup);
93	}
94}
95
96
97/**
98 * vmw_resource_val_add - Add a resource to the software context's
99 * resource list if it's not already on it.
100 *
101 * @sw_context: Pointer to the software context.
102 * @res: Pointer to the resource.
103 * @p_node: On successful return, points to a valid pointer to a
104 * struct vmw_resource_val_node, if non-NULL on entry.
105 */
106static int vmw_resource_val_add(struct vmw_sw_context *sw_context,
107				struct vmw_resource *res,
108				struct vmw_resource_val_node **p_node)
109{
110	struct vmw_resource_val_node *node;
111	struct drm_hash_item *hash;
112	int ret;
113
114	if (likely(drm_ht_find_item(&sw_context->res_ht, (unsigned long) res,
115				    &hash) == 0)) {
116		node = container_of(hash, struct vmw_resource_val_node, hash);
117		node->first_usage = false;
118		if (unlikely(p_node != NULL))
119			*p_node = node;
120		return 0;
121	}
122
123	node = kzalloc(sizeof(*node), GFP_KERNEL);
124	if (unlikely(node == NULL)) {
125		DRM_ERROR("Failed to allocate a resource validation "
126			  "entry.\n");
127		return -ENOMEM;
128	}
129
130	node->hash.key = (unsigned long) res;
131	ret = drm_ht_insert_item(&sw_context->res_ht, &node->hash);
132	if (unlikely(ret != 0)) {
133		DRM_ERROR("Failed to initialize a resource validation "
134			  "entry.\n");
135		kfree(node);
136		return ret;
137	}
138	list_add_tail(&node->head, &sw_context->resource_list);
139	node->res = vmw_resource_reference(res);
140	node->first_usage = true;
141
142	if (unlikely(p_node != NULL))
143		*p_node = node;
144
145	return 0;
146}
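/*
 * Illustrative sketch (editor's addition, not driver code): the hash lookup
 * above is keyed on the resource pointer, so repeated references to the same
 * resource within one submission share a single validation node, and only
 * the first call sees first_usage == true:
 *
 *	struct vmw_resource_val_node *node;
 *
 *	vmw_resource_val_add(sw_context, res, &node);	node->first_usage == true
 *	vmw_resource_val_add(sw_context, res, &node);	node->first_usage == false
 */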
147
148/**
149 * vmw_resource_relocation_add - Add a relocation to the relocation list
150 *
151 * @list: Pointer to head of relocation list.
152 * @res: The resource.
153 * @offset: Offset into the command buffer currently being parsed where the
154 * id that needs fixup is located. Granularity is 4 bytes.
155 */
156static int vmw_resource_relocation_add(struct list_head *list,
157				       const struct vmw_resource *res,
158				       unsigned long offset)
159{
160	struct vmw_resource_relocation *rel;
161
162	rel = kmalloc(sizeof(*rel), GFP_KERNEL);
163	if (unlikely(rel == NULL)) {
164		DRM_ERROR("Failed to allocate a resource relocation.\n");
165		return -ENOMEM;
166	}
167
168	rel->res = res;
169	rel->offset = offset;
170	list_add_tail(&rel->head, list);
171
172	return 0;
173}
174
175/**
176 * vmw_resource_relocations_free - Free all relocations on a list
177 *
178 * @list: Pointer to the head of the relocation list.
179 */
180static void vmw_resource_relocations_free(struct list_head *list)
181{
182	struct vmw_resource_relocation *rel, *n;
183
184	list_for_each_entry_safe(rel, n, list, head) {
185		list_del(&rel->head);
186		kfree(rel);
187	}
188}
189
190/**
191 * vmw_resource_relocations_apply - Apply all relocations on a list
192 *
193 * @cb: Pointer to the start of the command buffer being patched. This need
194 * not be the same buffer as the one being parsed when the relocation
195 * list was built, but the contents must be the same modulo the
196 * resource ids.
197 * @list: Pointer to the head of the relocation list.
198 */
199static void vmw_resource_relocations_apply(uint32_t *cb,
200					   struct list_head *list)
201{
202	struct vmw_resource_relocation *rel;
203
204	list_for_each_entry(rel, list, head)
205		cb[rel->offset] = rel->res->id;
206}
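/*
 * Editor's sketch (illustrative, not driver code) of how the relocation list
 * is used. While parsing, a validator records where a resource id lives,
 * counted in 32-bit words from the start of the command stream:
 *
 *	uint32_t *id = &cmd->body.target.sid;
 *
 *	vmw_resource_relocation_add(&sw_context->res_relocations, res,
 *				    id - sw_context->buf_start);
 *
 * Once all commands have been checked and the stream has been copied into
 * its fifo reservation, the final device ids are patched in a single pass:
 *
 *	vmw_resource_relocations_apply(fifo_copy_of_commands,
 *				       &sw_context->res_relocations);
 *
 * which writes rel->res->id at cb[rel->offset] for every entry.
 */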
207
208static int vmw_cmd_invalid(struct vmw_private *dev_priv,
209			   struct vmw_sw_context *sw_context,
210			   SVGA3dCmdHeader *header)
211{
212	return capable(CAP_SYS_ADMIN) ? : -EINVAL;
213}
214
215static int vmw_cmd_ok(struct vmw_private *dev_priv,
216		      struct vmw_sw_context *sw_context,
217		      SVGA3dCmdHeader *header)
218{
219	return 0;
220}
221
222/**
223 * vmw_bo_to_validate_list - add a bo to a validate list
224 *
225 * @sw_context: The software context used for this command submission batch.
226 * @bo: The buffer object to add.
227 * @p_val_node: If non-NULL, will be updated with the validate node number
228 * on return.
229 *
230 * Returns -EINVAL if the limit on the number of buffer objects per command
231 * submission is reached.
232 */
233static int vmw_bo_to_validate_list(struct vmw_sw_context *sw_context,
234				   struct ttm_buffer_object *bo,
235				   uint32_t *p_val_node)
236{
237	uint32_t val_node;
238	struct vmw_validate_buffer *vval_buf;
239	struct ttm_validate_buffer *val_buf;
240	struct drm_hash_item *hash;
241	int ret;
242
243	if (likely(drm_ht_find_item(&sw_context->res_ht, (unsigned long) bo,
244				    &hash) == 0)) {
245		vval_buf = container_of(hash, struct vmw_validate_buffer,
246					hash);
247		val_buf = &vval_buf->base;
248		val_node = vval_buf - sw_context->val_bufs;
249	} else {
250		val_node = sw_context->cur_val_buf;
251		if (unlikely(val_node >= VMWGFX_MAX_VALIDATIONS)) {
252			DRM_ERROR("Max number of DMA buffers per submission "
253				  "exceeded.\n");
254			return -EINVAL;
255		}
256		vval_buf = &sw_context->val_bufs[val_node];
257		vval_buf->hash.key = (unsigned long) bo;
258		ret = drm_ht_insert_item(&sw_context->res_ht, &vval_buf->hash);
259		if (unlikely(ret != 0)) {
260			DRM_ERROR("Failed to initialize a buffer validation "
261				  "entry.\n");
262			return ret;
263		}
264		++sw_context->cur_val_buf;
265		val_buf = &vval_buf->base;
266		val_buf->bo = ttm_bo_reference(bo);
267		val_buf->reserved = false;
268		list_add_tail(&val_buf->head, &sw_context->validate_nodes);
269	}
270
271	sw_context->fence_flags |= DRM_VMW_FENCE_FLAG_EXEC;
272
273	if (p_val_node)
274		*p_val_node = val_node;
275
276	return 0;
277}
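/*
 * Illustrative sketch (editor's addition): the hash lookup above is keyed on
 * the buffer object pointer, so adding the same bo twice returns the same
 * validate node index and creates only one entry on
 * sw_context->validate_nodes:
 *
 *	uint32_t idx1, idx2;
 *
 *	vmw_bo_to_validate_list(sw_context, bo, &idx1);
 *	vmw_bo_to_validate_list(sw_context, bo, &idx2);	idx1 == idx2 here
 *
 * The returned index is what vmw_translate_guest_ptr() stores in
 * reloc->index so that vmw_apply_relocations() can find the validated
 * buffer again.
 */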
278
279/**
280 * vmw_resources_reserve - Reserve all resources on the sw_context's
281 * resource list.
282 *
283 * @sw_context: Pointer to the software context.
284 *
285 * Note that since VMware's command submission is currently protected by
286 * the cmdbuf mutex, no fancy deadlock avoidance is required for resources,
287 * since only a single thread at a time will attempt this.
288 */
289static int vmw_resources_reserve(struct vmw_sw_context *sw_context)
290{
291	struct vmw_resource_val_node *val;
292	int ret;
293
294	list_for_each_entry(val, &sw_context->resource_list, head) {
295		struct vmw_resource *res = val->res;
296
297		ret = vmw_resource_reserve(res, val->no_buffer_needed);
298		if (unlikely(ret != 0))
299			return ret;
300
301		if (res->backup) {
302			struct ttm_buffer_object *bo = &res->backup->base;
303
304			ret = vmw_bo_to_validate_list
305				(sw_context, bo, NULL);
306
307			if (unlikely(ret != 0))
308				return ret;
309		}
310	}
311	return 0;
312}
313
314/**
315 * vmw_resources_validate - Validate all resources on the sw_context's
316 * resource list.
317 *
318 * @sw_context: Pointer to the software context.
319 *
320 * Before this function is called, all resource backup buffers must have
321 * been validated.
322 */
323static int vmw_resources_validate(struct vmw_sw_context *sw_context)
324{
325	struct vmw_resource_val_node *val;
326	int ret;
327
328	list_for_each_entry(val, &sw_context->resource_list, head) {
329		struct vmw_resource *res = val->res;
330
331		ret = vmw_resource_validate(res);
332		if (unlikely(ret != 0)) {
333			if (ret != -ERESTARTSYS)
334				DRM_ERROR("Failed to validate resource.\n");
335			return ret;
336		}
337	}
338	return 0;
339}
340
341/**
342 * vmw_cmd_res_check - Check that a resource is present and if so, put it
343 * on the resource validate list unless it's already there.
344 *
345 * @dev_priv: Pointer to a device private structure.
346 * @sw_context: Pointer to the software context.
347 * @res_type: Resource type.
348 * @converter: User-space visible type specific information.
349 * @id: Pointer to the location in the command buffer currently being
350 * parsed from where the user-space resource id handle is located.
351 */
352static int vmw_cmd_res_check(struct vmw_private *dev_priv,
353			     struct vmw_sw_context *sw_context,
354			     enum vmw_res_type res_type,
355			     const struct vmw_user_resource_conv *converter,
356			     uint32_t *id,
357			     struct vmw_resource_val_node **p_val)
358{
359	struct vmw_res_cache_entry *rcache =
360		&sw_context->res_cache[res_type];
361	struct vmw_resource *res;
362	struct vmw_resource_val_node *node;
363	int ret;
364
365	if (*id == SVGA3D_INVALID_ID)
366		return 0;
367
368	/*
369	 * Fastpath in case of repeated commands referencing the same
370	 * resource
371	 */
372
373	if (likely(rcache->valid && *id == rcache->handle)) {
374		const struct vmw_resource *res = rcache->res;
375
376		rcache->node->first_usage = false;
377		if (p_val)
378			*p_val = rcache->node;
379
380		return vmw_resource_relocation_add
381			(&sw_context->res_relocations, res,
382			 id - sw_context->buf_start);
383	}
384
385	ret = vmw_user_resource_lookup_handle(dev_priv,
386					      sw_context->tfile,
387					      *id,
388					      converter,
389					      &res);
390	if (unlikely(ret != 0)) {
391		DRM_ERROR("Could not find or use resource 0x%08x.\n",
392			  (unsigned) *id);
393		dump_stack();
394		return ret;
395	}
396
397	rcache->valid = true;
398	rcache->res = res;
399	rcache->handle = *id;
400
401	ret = vmw_resource_relocation_add(&sw_context->res_relocations,
402					  res,
403					  id - sw_context->buf_start);
404	if (unlikely(ret != 0))
405		goto out_no_reloc;
406
407	ret = vmw_resource_val_add(sw_context, res, &node);
408	if (unlikely(ret != 0))
409		goto out_no_reloc;
410
411	rcache->node = node;
412	if (p_val)
413		*p_val = node;
414	vmw_resource_unreference(&res);
415	return 0;
416
417out_no_reloc:
418	BUG_ON(sw_context->error_resource != NULL);
419	sw_context->error_resource = res;
420
421	return ret;
422}
423
424/**
425 * vmw_cmd_cid_check - Check a command header for valid context information.
426 *
427 * @dev_priv: Pointer to a device private structure.
428 * @sw_context: Pointer to the software context.
429 * @header: A command header with an embedded user-space context handle.
430 *
431 * Convenience function: Call vmw_cmd_res_check with the user-space context
432 * handle embedded in @header.
433 */
434static int vmw_cmd_cid_check(struct vmw_private *dev_priv,
435			     struct vmw_sw_context *sw_context,
436			     SVGA3dCmdHeader *header)
437{
438	struct vmw_cid_cmd {
439		SVGA3dCmdHeader header;
440		__le32 cid;
441	} *cmd;
442
443	cmd = container_of(header, struct vmw_cid_cmd, header);
444	return vmw_cmd_res_check(dev_priv, sw_context, vmw_res_context,
445				 user_context_converter, &cmd->cid, NULL);
446}
447
448static int vmw_cmd_set_render_target_check(struct vmw_private *dev_priv,
449					   struct vmw_sw_context *sw_context,
450					   SVGA3dCmdHeader *header)
451{
452	struct vmw_sid_cmd {
453		SVGA3dCmdHeader header;
454		SVGA3dCmdSetRenderTarget body;
455	} *cmd;
456	int ret;
457
458	ret = vmw_cmd_cid_check(dev_priv, sw_context, header);
459	if (unlikely(ret != 0))
460		return ret;
461
462	cmd = container_of(header, struct vmw_sid_cmd, header);
463	ret = vmw_cmd_res_check(dev_priv, sw_context, vmw_res_surface,
464				user_surface_converter,
465				&cmd->body.target.sid, NULL);
466	return ret;
467}
468
469static int vmw_cmd_surface_copy_check(struct vmw_private *dev_priv,
470				      struct vmw_sw_context *sw_context,
471				      SVGA3dCmdHeader *header)
472{
473	struct vmw_sid_cmd {
474		SVGA3dCmdHeader header;
475		SVGA3dCmdSurfaceCopy body;
476	} *cmd;
477	int ret;
478
479	cmd = container_of(header, struct vmw_sid_cmd, header);
480	ret = vmw_cmd_res_check(dev_priv, sw_context, vmw_res_surface,
481				user_surface_converter,
482				&cmd->body.src.sid, NULL);
483	if (unlikely(ret != 0))
484		return ret;
485	return vmw_cmd_res_check(dev_priv, sw_context, vmw_res_surface,
486				 user_surface_converter,
487				 &cmd->body.dest.sid, NULL);
488}
489
490static int vmw_cmd_stretch_blt_check(struct vmw_private *dev_priv,
491				     struct vmw_sw_context *sw_context,
492				     SVGA3dCmdHeader *header)
493{
494	struct vmw_sid_cmd {
495		SVGA3dCmdHeader header;
496		SVGA3dCmdSurfaceStretchBlt body;
497	} *cmd;
498	int ret;
499
500	cmd = container_of(header, struct vmw_sid_cmd, header);
501	ret = vmw_cmd_res_check(dev_priv, sw_context, vmw_res_surface,
502				user_surface_converter,
503				&cmd->body.src.sid, NULL);
504	if (unlikely(ret != 0))
505		return ret;
506	return vmw_cmd_res_check(dev_priv, sw_context, vmw_res_surface,
507				 user_surface_converter,
508				 &cmd->body.dest.sid, NULL);
509}
510
511static int vmw_cmd_blt_surf_screen_check(struct vmw_private *dev_priv,
512					 struct vmw_sw_context *sw_context,
513					 SVGA3dCmdHeader *header)
514{
515	struct vmw_sid_cmd {
516		SVGA3dCmdHeader header;
517		SVGA3dCmdBlitSurfaceToScreen body;
518	} *cmd;
519
520	cmd = container_of(header, struct vmw_sid_cmd, header);
521
522	if (unlikely(!sw_context->kernel)) {
523		DRM_ERROR("Kernel only SVGA3d command: %u.\n", cmd->header.id);
524		return -EPERM;
525	}
526
527	return vmw_cmd_res_check(dev_priv, sw_context, vmw_res_surface,
528				 user_surface_converter,
529				 &cmd->body.srcImage.sid, NULL);
530}
531
532static int vmw_cmd_present_check(struct vmw_private *dev_priv,
533				 struct vmw_sw_context *sw_context,
534				 SVGA3dCmdHeader *header)
535{
536	struct vmw_sid_cmd {
537		SVGA3dCmdHeader header;
538		SVGA3dCmdPresent body;
539	} *cmd;
540
541
542	cmd = container_of(header, struct vmw_sid_cmd, header);
543
544	if (unlikely(!sw_context->kernel)) {
545		DRM_ERROR("Kernel only SVGA3d command: %u.\n", cmd->header.id);
546		return -EPERM;
547	}
548
549	return vmw_cmd_res_check(dev_priv, sw_context, vmw_res_surface,
550				 user_surface_converter, &cmd->body.sid,
551				 NULL);
552}
553
554/**
555 * vmw_query_bo_switch_prepare - Prepare to switch pinned buffer for queries.
556 *
557 * @dev_priv: The device private structure.
558 * @new_query_bo: The new buffer holding query results.
559 * @sw_context: The software context used for this command submission.
560 *
561 * This function checks whether @new_query_bo is suitable for holding
562 * query results, and if another buffer currently is pinned for query
563 * results. If so, the function prepares the state of @sw_context for
564 * switching pinned buffers after successful submission of the current
565 * command batch.
566 */
567static int vmw_query_bo_switch_prepare(struct vmw_private *dev_priv,
568				       struct ttm_buffer_object *new_query_bo,
569				       struct vmw_sw_context *sw_context)
570{
571	struct vmw_res_cache_entry *ctx_entry =
572		&sw_context->res_cache[vmw_res_context];
573	int ret;
574
575	BUG_ON(!ctx_entry->valid);
576	sw_context->last_query_ctx = ctx_entry->res;
577
578	if (unlikely(new_query_bo != sw_context->cur_query_bo)) {
579
580		if (unlikely(new_query_bo->num_pages > 4)) {
581			DRM_ERROR("Query buffer too large.\n");
582			return -EINVAL;
583		}
584
585		if (unlikely(sw_context->cur_query_bo != NULL)) {
586			sw_context->needs_post_query_barrier = true;
587			ret = vmw_bo_to_validate_list(sw_context,
588						      sw_context->cur_query_bo,
589						      NULL);
590			if (unlikely(ret != 0))
591				return ret;
592		}
593		sw_context->cur_query_bo = new_query_bo;
594
595		ret = vmw_bo_to_validate_list(sw_context,
596					      dev_priv->dummy_query_bo,
597					      NULL);
598		if (unlikely(ret != 0))
599			return ret;
600
601	}
602
603	return 0;
604}
605
606
607/**
608 * vmw_query_bo_switch_commit - Finalize switching pinned query buffer
609 *
610 * @dev_priv: The device private structure.
611 * @sw_context: The software context used for this command submission batch.
612 *
613 * This function will check if we're switching query buffers, and will then,
614 * issue a dummy occlusion query wait used as a query barrier. When the fence
615 * object following that query wait has signaled, we are sure that all
616 * preceding queries have finished, and the old query buffer can be unpinned.
617 * However, since both the new query buffer and the old one are fenced with
618 * that fence, we can do an asynchronous unpin now, and be sure that the
619 * old query buffer won't be moved until the fence has signaled.
620 *
621 * As mentioned above, both the new and the old query buffers need to be fenced
622 * using a sequence emitted *after* calling this function.
623 */
624static void vmw_query_bo_switch_commit(struct vmw_private *dev_priv,
625				     struct vmw_sw_context *sw_context)
626{
627	/*
628	 * The validate list should still hold references to all
629	 * contexts here.
630	 */
631
632	if (sw_context->needs_post_query_barrier) {
633		struct vmw_res_cache_entry *ctx_entry =
634			&sw_context->res_cache[vmw_res_context];
635		struct vmw_resource *ctx;
636		int ret;
637
638		BUG_ON(!ctx_entry->valid);
639		ctx = ctx_entry->res;
640
641		ret = vmw_fifo_emit_dummy_query(dev_priv, ctx->id);
642
643		if (unlikely(ret != 0))
644			DRM_ERROR("Out of fifo space for dummy query.\n");
645	}
646
647	if (dev_priv->pinned_bo != sw_context->cur_query_bo) {
648		if (dev_priv->pinned_bo) {
649			vmw_bo_pin(dev_priv->pinned_bo, false);
650			ttm_bo_unref(&dev_priv->pinned_bo);
651		}
652
653		if (!sw_context->needs_post_query_barrier) {
654			vmw_bo_pin(sw_context->cur_query_bo, true);
655
656			/*
657			 * We pin also the dummy_query_bo buffer so that we
658			 * don't need to validate it when emitting
659			 * dummy queries in context destroy paths.
660			 */
661
662			vmw_bo_pin(dev_priv->dummy_query_bo, true);
663			dev_priv->dummy_query_bo_pinned = true;
664
665			BUG_ON(sw_context->last_query_ctx == NULL);
666			dev_priv->query_cid = sw_context->last_query_ctx->id;
667			dev_priv->query_cid_valid = true;
668			dev_priv->pinned_bo =
669				ttm_bo_reference(sw_context->cur_query_bo);
670		}
671	}
672}
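/*
 * Editor's note, an illustrative ordering sketch (it mirrors what
 * vmw_execbuf_process() does further down): the prepare side runs while the
 * command stream is still being checked, the commit side runs after the
 * stream has been committed to the fifo, and the fence is emitted after the
 * commit so that both the old and the new query buffer are protected by it:
 *
 *	vmw_query_bo_switch_prepare(dev_priv, &vmw_bo->base, sw_context);
 *		(called from vmw_cmd_end_query() during checking)
 *	vmw_fifo_commit(dev_priv, command_size);
 *	vmw_query_bo_switch_commit(dev_priv, sw_context);
 *	vmw_execbuf_fence_commands(file_priv, dev_priv, &fence, &handle);
 *	ttm_eu_fence_buffer_objects(&sw_context->validate_nodes, (void *) fence);
 */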
673
674/**
675 * vmw_translate_guest_pointer - Prepare to translate a user-space buffer
676 * handle to a valid SVGAGuestPtr
677 *
678 * @dev_priv: Pointer to a device private structure.
679 * @sw_context: The software context used for this command batch validation.
680 * @ptr: Pointer to the user-space handle to be translated.
681 * @vmw_bo_p: Points to a location that, on successful return, will carry
682 * a reference-counted pointer to the DMA buffer identified by the
683 * user-space handle in @ptr.
684 *
685 * This function saves information needed to translate a user-space buffer
686 * handle to a valid SVGAGuestPtr. The translation does not take place
687 * immediately, but during a call to vmw_apply_relocations().
688 * This function builds a relocation list and a list of buffers to validate.
689 * The former needs to be freed using either vmw_apply_relocations() or
690 * vmw_free_relocations(). The latter needs to be freed using
691 * vmw_clear_validations.
692 */
693static int vmw_translate_guest_ptr(struct vmw_private *dev_priv,
694				   struct vmw_sw_context *sw_context,
695				   SVGAGuestPtr *ptr,
696				   struct vmw_dma_buffer **vmw_bo_p)
697{
698	struct vmw_dma_buffer *vmw_bo = NULL;
699	struct ttm_buffer_object *bo;
700	uint32_t handle = ptr->gmrId;
701	struct vmw_relocation *reloc;
702	int ret;
703
704	ret = vmw_user_dmabuf_lookup(sw_context->tfile, handle, &vmw_bo);
705	if (unlikely(ret != 0)) {
706		DRM_ERROR("Could not find or use GMR region.\n");
707		return -EINVAL;
708	}
709	bo = &vmw_bo->base;
710
711	if (unlikely(sw_context->cur_reloc >= VMWGFX_MAX_RELOCATIONS)) {
712		DRM_ERROR("Max number of relocations per submission"
713			  " exceeded.\n");
714		ret = -EINVAL;
715		goto out_no_reloc;
716	}
717
718	reloc = &sw_context->relocs[sw_context->cur_reloc++];
719	reloc->location = ptr;
720
721	ret = vmw_bo_to_validate_list(sw_context, bo, &reloc->index);
722	if (unlikely(ret != 0))
723		goto out_no_reloc;
724
725	*vmw_bo_p = vmw_bo;
726	return 0;
727
728out_no_reloc:
729	vmw_dmabuf_unreference(&vmw_bo);
730	*vmw_bo_p = NULL;
731	return ret;
732}
733
734/**
735 * vmw_cmd_begin_query - validate a SVGA_3D_CMD_BEGIN_QUERY command.
736 *
737 * @dev_priv: Pointer to a device private struct.
738 * @sw_context: The software context used for this command submission.
739 * @header: Pointer to the command header in the command stream.
740 */
741static int vmw_cmd_begin_query(struct vmw_private *dev_priv,
742			       struct vmw_sw_context *sw_context,
743			       SVGA3dCmdHeader *header)
744{
745	struct vmw_begin_query_cmd {
746		SVGA3dCmdHeader header;
747		SVGA3dCmdBeginQuery q;
748	} *cmd;
749
750	cmd = container_of(header, struct vmw_begin_query_cmd,
751			   header);
752
753	return vmw_cmd_res_check(dev_priv, sw_context, vmw_res_context,
754				 user_context_converter, &cmd->q.cid,
755				 NULL);
756}
757
758/**
759 * vmw_cmd_end_query - validate a SVGA_3D_CMD_END_QUERY command.
760 *
761 * @dev_priv: Pointer to a device private struct.
762 * @sw_context: The software context used for this command submission.
763 * @header: Pointer to the command header in the command stream.
764 */
765static int vmw_cmd_end_query(struct vmw_private *dev_priv,
766			     struct vmw_sw_context *sw_context,
767			     SVGA3dCmdHeader *header)
768{
769	struct vmw_dma_buffer *vmw_bo;
770	struct vmw_query_cmd {
771		SVGA3dCmdHeader header;
772		SVGA3dCmdEndQuery q;
773	} *cmd;
774	int ret;
775
776	cmd = container_of(header, struct vmw_query_cmd, header);
777	ret = vmw_cmd_cid_check(dev_priv, sw_context, header);
778	if (unlikely(ret != 0))
779		return ret;
780
781	ret = vmw_translate_guest_ptr(dev_priv, sw_context,
782				      &cmd->q.guestResult,
783				      &vmw_bo);
784	if (unlikely(ret != 0))
785		return ret;
786
787	ret = vmw_query_bo_switch_prepare(dev_priv, &vmw_bo->base, sw_context);
788
789	vmw_dmabuf_unreference(&vmw_bo);
790	return ret;
791}
792
793/**
794 * vmw_cmd_wait_query - validate a SVGA_3D_CMD_WAIT_QUERY command.
795 *
796 * @dev_priv: Pointer to a device private struct.
797 * @sw_context: The software context used for this command submission.
798 * @header: Pointer to the command header in the command stream.
799 */
800static int vmw_cmd_wait_query(struct vmw_private *dev_priv,
801			      struct vmw_sw_context *sw_context,
802			      SVGA3dCmdHeader *header)
803{
804	struct vmw_dma_buffer *vmw_bo;
805	struct vmw_query_cmd {
806		SVGA3dCmdHeader header;
807		SVGA3dCmdWaitForQuery q;
808	} *cmd;
809	int ret;
810
811	cmd = container_of(header, struct vmw_query_cmd, header);
812	ret = vmw_cmd_cid_check(dev_priv, sw_context, header);
813	if (unlikely(ret != 0))
814		return ret;
815
816	ret = vmw_translate_guest_ptr(dev_priv, sw_context,
817				      &cmd->q.guestResult,
818				      &vmw_bo);
819	if (unlikely(ret != 0))
820		return ret;
821
822	vmw_dmabuf_unreference(&vmw_bo);
823	return 0;
824}
825
826static int vmw_cmd_dma(struct vmw_private *dev_priv,
827		       struct vmw_sw_context *sw_context,
828		       SVGA3dCmdHeader *header)
829{
830	struct vmw_dma_buffer *vmw_bo = NULL;
831	struct vmw_surface *srf = NULL;
832	struct vmw_dma_cmd {
833		SVGA3dCmdHeader header;
834		SVGA3dCmdSurfaceDMA dma;
835	} *cmd;
836	int ret;
837
838	cmd = container_of(header, struct vmw_dma_cmd, header);
839	ret = vmw_translate_guest_ptr(dev_priv, sw_context,
840				      &cmd->dma.guest.ptr,
841				      &vmw_bo);
842	if (unlikely(ret != 0))
843		return ret;
844
845	ret = vmw_cmd_res_check(dev_priv, sw_context, vmw_res_surface,
846				user_surface_converter, &cmd->dma.host.sid,
847				NULL);
848	if (unlikely(ret != 0)) {
849		if (unlikely(ret != -ERESTARTSYS))
850			DRM_ERROR("could not find surface for DMA.\n");
851		goto out_no_surface;
852	}
853
854	srf = vmw_res_to_srf(sw_context->res_cache[vmw_res_surface].res);
855
856	vmw_kms_cursor_snoop(srf, sw_context->tfile, &vmw_bo->base, header);
857
858out_no_surface:
859	vmw_dmabuf_unreference(&vmw_bo);
860	return ret;
861}
862
863static int vmw_cmd_draw(struct vmw_private *dev_priv,
864			struct vmw_sw_context *sw_context,
865			SVGA3dCmdHeader *header)
866{
867	struct vmw_draw_cmd {
868		SVGA3dCmdHeader header;
869		SVGA3dCmdDrawPrimitives body;
870	} *cmd;
871	SVGA3dVertexDecl *decl = (SVGA3dVertexDecl *)(
872		(unsigned long)header + sizeof(*cmd));
873	SVGA3dPrimitiveRange *range;
874	uint32_t i;
875	uint32_t maxnum;
876	int ret;
877
878	ret = vmw_cmd_cid_check(dev_priv, sw_context, header);
879	if (unlikely(ret != 0))
880		return ret;
881
882	cmd = container_of(header, struct vmw_draw_cmd, header);
883	maxnum = (header->size - sizeof(cmd->body)) / sizeof(*decl);
884
885	if (unlikely(cmd->body.numVertexDecls > maxnum)) {
886		DRM_ERROR("Illegal number of vertex declarations.\n");
887		return -EINVAL;
888	}
889
890	for (i = 0; i < cmd->body.numVertexDecls; ++i, ++decl) {
891		ret = vmw_cmd_res_check(dev_priv, sw_context, vmw_res_surface,
892					user_surface_converter,
893					&decl->array.surfaceId, NULL);
894		if (unlikely(ret != 0))
895			return ret;
896	}
897
898	maxnum = (header->size - sizeof(cmd->body) -
899		  cmd->body.numVertexDecls * sizeof(*decl)) / sizeof(*range);
900	if (unlikely(cmd->body.numRanges > maxnum)) {
901		DRM_ERROR("Illegal number of index ranges.\n");
902		return -EINVAL;
903	}
904
905	range = (SVGA3dPrimitiveRange *) decl;
906	for (i = 0; i < cmd->body.numRanges; ++i, ++range) {
907		ret = vmw_cmd_res_check(dev_priv, sw_context, vmw_res_surface,
908					user_surface_converter,
909					&range->indexArray.surfaceId, NULL);
910		if (unlikely(ret != 0))
911			return ret;
912	}
913	return 0;
914}
915
916
917static int vmw_cmd_tex_state(struct vmw_private *dev_priv,
918			     struct vmw_sw_context *sw_context,
919			     SVGA3dCmdHeader *header)
920{
921	struct vmw_tex_state_cmd {
922		SVGA3dCmdHeader header;
923		SVGA3dCmdSetTextureState state;
924	};
925
926	SVGA3dTextureState *last_state = (SVGA3dTextureState *)
927	  ((unsigned long) header + header->size + sizeof(header));
928	SVGA3dTextureState *cur_state = (SVGA3dTextureState *)
929		((unsigned long) header + sizeof(struct vmw_tex_state_cmd));
930	int ret;
931
932	ret = vmw_cmd_cid_check(dev_priv, sw_context, header);
933	if (unlikely(ret != 0))
934		return ret;
935
936	for (; cur_state < last_state; ++cur_state) {
937		if (likely(cur_state->name != SVGA3D_TS_BIND_TEXTURE))
938			continue;
939
940		ret = vmw_cmd_res_check(dev_priv, sw_context, vmw_res_surface,
941					user_surface_converter,
942					&cur_state->value, NULL);
943		if (unlikely(ret != 0))
944			return ret;
945	}
946
947	return 0;
948}
949
950static int vmw_cmd_check_define_gmrfb(struct vmw_private *dev_priv,
951				      struct vmw_sw_context *sw_context,
952				      void *buf)
953{
954	struct vmw_dma_buffer *vmw_bo;
955	int ret;
956
957	struct {
958		uint32_t header;
959		SVGAFifoCmdDefineGMRFB body;
960	} *cmd = buf;
961
962	ret = vmw_translate_guest_ptr(dev_priv, sw_context,
963				      &cmd->body.ptr,
964				      &vmw_bo);
965	if (unlikely(ret != 0))
966		return ret;
967
968	vmw_dmabuf_unreference(&vmw_bo);
969
970	return ret;
971}
972
973/**
974 * vmw_cmd_set_shader - Validate an SVGA_3D_CMD_SET_SHADER
975 * command
976 *
977 * @dev_priv: Pointer to a device private struct.
978 * @sw_context: The software context being used for this batch.
979 * @header: Pointer to the command header in the command stream.
980 */
981static int vmw_cmd_set_shader(struct vmw_private *dev_priv,
982			      struct vmw_sw_context *sw_context,
983			      SVGA3dCmdHeader *header)
984{
985	struct vmw_set_shader_cmd {
986		SVGA3dCmdHeader header;
987		SVGA3dCmdSetShader body;
988	} *cmd;
989	int ret;
990
991	cmd = container_of(header, struct vmw_set_shader_cmd,
992			   header);
993
994	ret = vmw_cmd_cid_check(dev_priv, sw_context, header);
995	if (unlikely(ret != 0))
996		return ret;
997
998	return 0;
999}
1000
1001static int vmw_cmd_check_not_3d(struct vmw_private *dev_priv,
1002				struct vmw_sw_context *sw_context,
1003				void *buf, uint32_t *size)
1004{
1005	uint32_t size_remaining = *size;
1006	uint32_t cmd_id;
1007
1008	cmd_id = le32_to_cpu(((uint32_t *)buf)[0]);
1009	switch (cmd_id) {
1010	case SVGA_CMD_UPDATE:
1011		*size = sizeof(uint32_t) + sizeof(SVGAFifoCmdUpdate);
1012		break;
1013	case SVGA_CMD_DEFINE_GMRFB:
1014		*size = sizeof(uint32_t) + sizeof(SVGAFifoCmdDefineGMRFB);
1015		break;
1016	case SVGA_CMD_BLIT_GMRFB_TO_SCREEN:
1017		*size = sizeof(uint32_t) + sizeof(SVGAFifoCmdBlitGMRFBToScreen);
1018		break;
1019	case SVGA_CMD_BLIT_SCREEN_TO_GMRFB:
1020		*size = sizeof(uint32_t) + sizeof(SVGAFifoCmdBlitScreenToGMRFB);
1021		break;
1022	default:
1023		DRM_ERROR("Unsupported SVGA command: %u.\n", cmd_id);
1024		return -EINVAL;
1025	}
1026
1027	if (*size > size_remaining) {
1028		DRM_ERROR("Invalid SVGA command (size mismatch):"
1029			  " %u.\n", cmd_id);
1030		return -EINVAL;
1031	}
1032
1033	if (unlikely(!sw_context->kernel)) {
1034		DRM_ERROR("Kernel only SVGA command: %u.\n", cmd_id);
1035		return -EPERM;
1036	}
1037
1038	if (cmd_id == SVGA_CMD_DEFINE_GMRFB)
1039		return vmw_cmd_check_define_gmrfb(dev_priv, sw_context, buf);
1040
1041	return 0;
1042}
1043
1044typedef int (*vmw_cmd_func) (struct vmw_private *,
1045			     struct vmw_sw_context *,
1046			     SVGA3dCmdHeader *);
1047
1048#define VMW_CMD_DEF(cmd, func) \
1049	[cmd - SVGA_3D_CMD_BASE] = func
1050
1051static vmw_cmd_func vmw_cmd_funcs[SVGA_3D_CMD_MAX] = {
1052	VMW_CMD_DEF(SVGA_3D_CMD_SURFACE_DEFINE, &vmw_cmd_invalid),
1053	VMW_CMD_DEF(SVGA_3D_CMD_SURFACE_DESTROY, &vmw_cmd_invalid),
1054	VMW_CMD_DEF(SVGA_3D_CMD_SURFACE_COPY, &vmw_cmd_surface_copy_check),
1055	VMW_CMD_DEF(SVGA_3D_CMD_SURFACE_STRETCHBLT, &vmw_cmd_stretch_blt_check),
1056	VMW_CMD_DEF(SVGA_3D_CMD_SURFACE_DMA, &vmw_cmd_dma),
1057	VMW_CMD_DEF(SVGA_3D_CMD_CONTEXT_DEFINE, &vmw_cmd_invalid),
1058	VMW_CMD_DEF(SVGA_3D_CMD_CONTEXT_DESTROY, &vmw_cmd_invalid),
1059	VMW_CMD_DEF(SVGA_3D_CMD_SETTRANSFORM, &vmw_cmd_cid_check),
1060	VMW_CMD_DEF(SVGA_3D_CMD_SETZRANGE, &vmw_cmd_cid_check),
1061	VMW_CMD_DEF(SVGA_3D_CMD_SETRENDERSTATE, &vmw_cmd_cid_check),
1062	VMW_CMD_DEF(SVGA_3D_CMD_SETRENDERTARGET,
1063		    &vmw_cmd_set_render_target_check),
1064	VMW_CMD_DEF(SVGA_3D_CMD_SETTEXTURESTATE, &vmw_cmd_tex_state),
1065	VMW_CMD_DEF(SVGA_3D_CMD_SETMATERIAL, &vmw_cmd_cid_check),
1066	VMW_CMD_DEF(SVGA_3D_CMD_SETLIGHTDATA, &vmw_cmd_cid_check),
1067	VMW_CMD_DEF(SVGA_3D_CMD_SETLIGHTENABLED, &vmw_cmd_cid_check),
1068	VMW_CMD_DEF(SVGA_3D_CMD_SETVIEWPORT, &vmw_cmd_cid_check),
1069	VMW_CMD_DEF(SVGA_3D_CMD_SETCLIPPLANE, &vmw_cmd_cid_check),
1070	VMW_CMD_DEF(SVGA_3D_CMD_CLEAR, &vmw_cmd_cid_check),
1071	VMW_CMD_DEF(SVGA_3D_CMD_PRESENT, &vmw_cmd_present_check),
1072	VMW_CMD_DEF(SVGA_3D_CMD_SHADER_DEFINE, &vmw_cmd_cid_check),
1073	VMW_CMD_DEF(SVGA_3D_CMD_SHADER_DESTROY, &vmw_cmd_cid_check),
1074	VMW_CMD_DEF(SVGA_3D_CMD_SET_SHADER, &vmw_cmd_set_shader),
1075	VMW_CMD_DEF(SVGA_3D_CMD_SET_SHADER_CONST, &vmw_cmd_cid_check),
1076	VMW_CMD_DEF(SVGA_3D_CMD_DRAW_PRIMITIVES, &vmw_cmd_draw),
1077	VMW_CMD_DEF(SVGA_3D_CMD_SETSCISSORRECT, &vmw_cmd_cid_check),
1078	VMW_CMD_DEF(SVGA_3D_CMD_BEGIN_QUERY, &vmw_cmd_begin_query),
1079	VMW_CMD_DEF(SVGA_3D_CMD_END_QUERY, &vmw_cmd_end_query),
1080	VMW_CMD_DEF(SVGA_3D_CMD_WAIT_FOR_QUERY, &vmw_cmd_wait_query),
1081	VMW_CMD_DEF(SVGA_3D_CMD_PRESENT_READBACK, &vmw_cmd_ok),
1082	VMW_CMD_DEF(SVGA_3D_CMD_BLIT_SURFACE_TO_SCREEN,
1083		    &vmw_cmd_blt_surf_screen_check),
1084	VMW_CMD_DEF(SVGA_3D_CMD_SURFACE_DEFINE_V2, &vmw_cmd_invalid),
1085	VMW_CMD_DEF(SVGA_3D_CMD_GENERATE_MIPMAPS, &vmw_cmd_invalid),
1086	VMW_CMD_DEF(SVGA_3D_CMD_ACTIVATE_SURFACE, &vmw_cmd_invalid),
1087	VMW_CMD_DEF(SVGA_3D_CMD_DEACTIVATE_SURFACE, &vmw_cmd_invalid),
1088};
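/*
 * Editor's note (illustrative): VMW_CMD_DEF places each validator at index
 * (cmd - SVGA_3D_CMD_BASE), which is exactly how vmw_cmd_check() below
 * dispatches after subtracting SVGA_3D_CMD_BASE from the header id, e.g.:
 *
 *	vmw_cmd_funcs[SVGA_3D_CMD_CLEAR - SVGA_3D_CMD_BASE] == &vmw_cmd_cid_check
 *
 * In-range ids without an entry are left NULL by the designated
 * initializers, so any new SVGA3D command must get an entry here before it
 * can be accepted.
 */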
1089
1090static int vmw_cmd_check(struct vmw_private *dev_priv,
1091			 struct vmw_sw_context *sw_context,
1092			 void *buf, uint32_t *size)
1093{
1094	uint32_t cmd_id;
1095	uint32_t size_remaining = *size;
1096	SVGA3dCmdHeader *header = (SVGA3dCmdHeader *) buf;
1097	int ret;
1098
1099	cmd_id = le32_to_cpu(((uint32_t *)buf)[0]);
1100	/* Handle any non-3D commands */
1101	if (unlikely(cmd_id < SVGA_CMD_MAX))
1102		return vmw_cmd_check_not_3d(dev_priv, sw_context, buf, size);
1103
1104
1105	cmd_id = le32_to_cpu(header->id);
1106	*size = le32_to_cpu(header->size) + sizeof(SVGA3dCmdHeader);
1107
1108	cmd_id -= SVGA_3D_CMD_BASE;
1109	if (unlikely(*size > size_remaining))
1110		goto out_err;
1111
1112	if (unlikely(cmd_id >= SVGA_3D_CMD_MAX - SVGA_3D_CMD_BASE))
1113		goto out_err;
1114
1115	ret = vmw_cmd_funcs[cmd_id](dev_priv, sw_context, header);
1116	if (unlikely(ret != 0))
1117		goto out_err;
1118
1119	return 0;
1120out_err:
1121	DRM_ERROR("Illegal / Invalid SVGA3D command: %d\n",
1122		  cmd_id + SVGA_3D_CMD_BASE);
1123	return -EINVAL;
1124}
1125
1126static int vmw_cmd_check_all(struct vmw_private *dev_priv,
1127			     struct vmw_sw_context *sw_context,
1128			     void *buf,
1129			     uint32_t size)
1130{
1131	int32_t cur_size = size;
1132	int ret;
1133
1134	sw_context->buf_start = buf;
1135
1136	while (cur_size > 0) {
1137		size = cur_size;
1138		ret = vmw_cmd_check(dev_priv, sw_context, buf, &size);
1139		if (unlikely(ret != 0))
1140			return ret;
1141		buf = (void *)((unsigned long) buf + size);
1142		cur_size -= size;
1143	}
1144
1145	if (unlikely(cur_size != 0)) {
1146		DRM_ERROR("Command verifier out of sync.\n");
1147		return -EINVAL;
1148	}
1149
1150	return 0;
1151}
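/*
 * Editor's sketch of the stream layout walked by the loop above (offsets
 * are illustrative). A submission is a tightly packed sequence of commands;
 * each iteration lets vmw_cmd_check() report how many bytes the current
 * command consumed and then advances by exactly that amount:
 *
 *	offset 0:	SVGA_CMD_DEFINE_GMRFB	size = 4 + sizeof(SVGAFifoCmdDefineGMRFB)
 *	offset A:	SVGA3dCmdHeader + body	size = header.size + sizeof(SVGA3dCmdHeader)
 *	offset B:	SVGA3dCmdHeader + body	...
 *
 * If a command overruns the submission, or the per-command sizes do not add
 * up to exactly the submitted length, the whole batch is rejected with
 * -EINVAL.
 */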
1152
1153static void vmw_free_relocations(struct vmw_sw_context *sw_context)
1154{
1155	sw_context->cur_reloc = 0;
1156}
1157
1158static void vmw_apply_relocations(struct vmw_sw_context *sw_context)
1159{
1160	uint32_t i;
1161	struct vmw_relocation *reloc;
1162	struct ttm_validate_buffer *validate;
1163	struct ttm_buffer_object *bo;
1164
1165	for (i = 0; i < sw_context->cur_reloc; ++i) {
1166		reloc = &sw_context->relocs[i];
1167		validate = &sw_context->val_bufs[reloc->index].base;
1168		bo = validate->bo;
1169		switch (bo->mem.mem_type) {
1170		case TTM_PL_VRAM:
1171			reloc->location->offset += bo->offset;
1172			reloc->location->gmrId = SVGA_GMR_FRAMEBUFFER;
1173			break;
1174		case VMW_PL_GMR:
1175			reloc->location->gmrId = bo->mem.start;
1176			break;
1177		default:
1178			BUG();
1179		}
1180	}
1181	vmw_free_relocations(sw_context);
1182}
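/*
 * Worked example (editor's addition, values are hypothetical): a
 * SVGAGuestPtr recorded by vmw_translate_guest_ptr() with offset 0x100 is
 * patched above according to where its buffer ended up after validation:
 *
 *	bo in VRAM at bo->offset 0x10000  ->  gmrId = SVGA_GMR_FRAMEBUFFER,
 *					      offset = 0x10100
 *	bo in GMR 7 (bo->mem.start == 7)  ->  gmrId = 7, offset = 0x100
 *
 * Any other placement is a driver bug, hence the BUG() above.
 */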
1183
1184/**
1185 * vmw_resource_list_unreference - Free up a resource list and unreference
1186 * all resources referenced by it.
1187 *
1188 * @list: The resource list.
1189 */
1190static void vmw_resource_list_unreference(struct list_head *list)
1191{
1192	struct vmw_resource_val_node *val, *val_next;
1193
1194	/*
1195	 * Drop references to resources held during command submission.
1196	 */
1197
1198	list_for_each_entry_safe(val, val_next, list, head) {
1199		list_del_init(&val->head);
1200		vmw_resource_unreference(&val->res);
1201		kfree(val);
1202	}
1203}
1204
1205static void vmw_clear_validations(struct vmw_sw_context *sw_context)
1206{
1207	struct vmw_validate_buffer *entry, *next;
1208	struct vmw_resource_val_node *val;
1209
1210	/*
1211	 * Drop references to DMA buffers held during command submission.
1212	 */
1213	list_for_each_entry_safe(entry, next, &sw_context->validate_nodes,
1214				 base.head) {
1215		list_del(&entry->base.head);
1216		ttm_bo_unref(&entry->base.bo);
1217		(void) drm_ht_remove_item(&sw_context->res_ht, &entry->hash);
1218		sw_context->cur_val_buf--;
1219	}
1220	BUG_ON(sw_context->cur_val_buf != 0);
1221
1222	list_for_each_entry(val, &sw_context->resource_list, head)
1223		(void) drm_ht_remove_item(&sw_context->res_ht, &val->hash);
1224}
1225
1226static int vmw_validate_single_buffer(struct vmw_private *dev_priv,
1227				      struct ttm_buffer_object *bo)
1228{
1229	int ret;
1230
1231
1232	/*
1233	 * Don't validate pinned buffers.
1234	 */
1235
1236	if (bo == dev_priv->pinned_bo ||
1237	    (bo == dev_priv->dummy_query_bo &&
1238	     dev_priv->dummy_query_bo_pinned))
1239		return 0;
1240
1241	/**
1242	 * Put BO in VRAM if there is space, otherwise as a GMR.
1243	 * If there is no space in VRAM and GMR ids are all used up,
1244	 * start evicting GMRs to make room. If the DMA buffer can't be
1245	 * used as a GMR, this will return -ENOMEM.
1246	 */
1247
1248	ret = ttm_bo_validate(bo, &vmw_vram_gmr_placement, true, false);
1249	if (likely(ret == 0 || ret == -ERESTARTSYS))
1250		return ret;
1251
1252	/**
1253	 * If that failed, try VRAM again, this time evicting
1254	 * previous contents.
1255	 */
1256
1257	DRM_INFO("Falling through to VRAM.\n");
1258	ret = ttm_bo_validate(bo, &vmw_vram_placement, true, false);
1259	return ret;
1260}
1261
1262
1263static int vmw_validate_buffers(struct vmw_private *dev_priv,
1264				struct vmw_sw_context *sw_context)
1265{
1266	struct vmw_validate_buffer *entry;
1267	int ret;
1268
1269	list_for_each_entry(entry, &sw_context->validate_nodes, base.head) {
1270		ret = vmw_validate_single_buffer(dev_priv, entry->base.bo);
1271		if (unlikely(ret != 0))
1272			return ret;
1273	}
1274	return 0;
1275}
1276
1277static int vmw_resize_cmd_bounce(struct vmw_sw_context *sw_context,
1278				 uint32_t size)
1279{
1280	if (likely(sw_context->cmd_bounce_size >= size))
1281		return 0;
1282
1283	if (sw_context->cmd_bounce_size == 0)
1284		sw_context->cmd_bounce_size = VMWGFX_CMD_BOUNCE_INIT_SIZE;
1285
1286	while (sw_context->cmd_bounce_size < size) {
1287		sw_context->cmd_bounce_size =
1288			PAGE_ALIGN(sw_context->cmd_bounce_size +
1289				   (sw_context->cmd_bounce_size >> 1));
1290	}
1291
1292	if (sw_context->cmd_bounce != NULL)
1293		vfree(sw_context->cmd_bounce);
1294
1295	sw_context->cmd_bounce = vmalloc(sw_context->cmd_bounce_size);
1296
1297	if (sw_context->cmd_bounce == NULL) {
1298		DRM_ERROR("Failed to allocate command bounce buffer.\n");
1299		sw_context->cmd_bounce_size = 0;
1300		return -ENOMEM;
1301	}
1302
1303	return 0;
1304}
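/*
 * Editor's note, a worked example of the growth policy above (numbers are
 * illustrative and assume a 32 KiB VMWGFX_CMD_BOUNCE_INIT_SIZE with 4 KiB
 * pages): to fit a 100000 byte command stream the bounce size grows
 * 32768 -> 49152 -> 73728 -> 110592, i.e. by roughly 1.5x per step and page
 * aligned, and the buffer is then reallocated once with vmalloc().
 */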
1305
1306/**
1307 * vmw_execbuf_fence_commands - create and submit a command stream fence
1308 *
1309 * Creates a fence object and submits a command stream marker.
1310 * If this fails for some reason, we sync the fifo and return a NULL fence.
1311 * It is then safe to fence buffers with a NULL pointer.
1312 *
1313 * If @p_handle is not NULL, @file_priv must also not be NULL, and a
1314 * user-space handle is created; otherwise no handle is created.
1315 */
1316
1317int vmw_execbuf_fence_commands(struct drm_file *file_priv,
1318			       struct vmw_private *dev_priv,
1319			       struct vmw_fence_obj **p_fence,
1320			       uint32_t *p_handle)
1321{
1322	uint32_t sequence;
1323	int ret;
1324	bool synced = false;
1325
1326	/* p_handle implies file_priv. */
1327	BUG_ON(p_handle != NULL && file_priv == NULL);
1328
1329	ret = vmw_fifo_send_fence(dev_priv, &sequence);
1330	if (unlikely(ret != 0)) {
1331		DRM_ERROR("Fence submission error. Syncing.\n");
1332		synced = true;
1333	}
1334
1335	if (p_handle != NULL)
1336		ret = vmw_user_fence_create(file_priv, dev_priv->fman,
1337					    sequence,
1338					    DRM_VMW_FENCE_FLAG_EXEC,
1339					    p_fence, p_handle);
1340	else
1341		ret = vmw_fence_create(dev_priv->fman, sequence,
1342				       DRM_VMW_FENCE_FLAG_EXEC,
1343				       p_fence);
1344
1345	if (unlikely(ret != 0 && !synced)) {
1346		(void) vmw_fallback_wait(dev_priv, false, false,
1347					 sequence, false,
1348					 VMW_FENCE_WAIT_TIMEOUT);
1349		*p_fence = NULL;
1350	}
1351
1352	return 0;
1353}
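/*
 * Editor's sketch of the two calling conventions (both appear later in this
 * file): with a user-space handle, or kernel-internal without one:
 *
 *	vmw_execbuf_fence_commands(file_priv, dev_priv, &fence, &handle);
 *	vmw_execbuf_fence_commands(NULL, dev_priv, &fence, NULL);
 *
 * The function itself always returns 0; a NULL *p_fence afterwards means
 * the fifo has already been synced, so buffers may safely be fenced with a
 * NULL pointer.
 */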
1354
1355/**
1356 * vmw_execbuf_copy_fence_user - copy fence object information to
1357 * user-space.
1358 *
1359 * @dev_priv: Pointer to a vmw_private struct.
1360 * @vmw_fp: Pointer to the struct vmw_fpriv representing the calling file.
1361 * @ret: Return value from fence object creation.
1362 * @user_fence_rep: User space address of a struct drm_vmw_fence_rep to
1363 * which the information should be copied.
1364 * @fence: Pointer to the fence object.
1365 * @fence_handle: User-space fence handle.
1366 *
1367 * This function copies fence information to user-space. If copying fails,
1368 * the user-space struct drm_vmw_fence_rep::error member is hopefully
1369 * left untouched, and if it's preloaded with an -EFAULT by user-space,
1370 * the error will hopefully be detected.
1371 * Also if copying fails, user-space will be unable to signal the fence
1372 * object so we wait for it immediately, and then unreference the
1373 * user-space reference.
1374 */
1375void
1376vmw_execbuf_copy_fence_user(struct vmw_private *dev_priv,
1377			    struct vmw_fpriv *vmw_fp,
1378			    int ret,
1379			    struct drm_vmw_fence_rep __user *user_fence_rep,
1380			    struct vmw_fence_obj *fence,
1381			    uint32_t fence_handle)
1382{
1383	struct drm_vmw_fence_rep fence_rep;
1384
1385	if (user_fence_rep == NULL)
1386		return;
1387
1388	memset(&fence_rep, 0, sizeof(fence_rep));
1389
1390	fence_rep.error = ret;
1391	if (ret == 0) {
1392		BUG_ON(fence == NULL);
1393
1394		fence_rep.handle = fence_handle;
1395		fence_rep.seqno = fence->seqno;
1396		vmw_update_seqno(dev_priv, &dev_priv->fifo);
1397		fence_rep.passed_seqno = dev_priv->last_read_seqno;
1398	}
1399
1400	/*
1401	 * copy_to_user errors will be detected by user space not
1402	 * seeing fence_rep::error filled in. Typically
1403	 * user-space would have pre-set that member to -EFAULT.
1404	 */
1405	ret = copy_to_user(user_fence_rep, &fence_rep,
1406			   sizeof(fence_rep));
1407
1408	/*
1409	 * User-space lost the fence object. We need to sync
1410	 * and unreference the handle.
1411	 */
1412	if (unlikely(ret != 0) && (fence_rep.error == 0)) {
1413		ttm_ref_object_base_unref(vmw_fp->tfile,
1414					  fence_handle, TTM_REF_USAGE);
1415		DRM_ERROR("Fence copy error. Syncing.\n");
1416		(void) vmw_fence_obj_wait(fence, fence->signal_mask,
1417					  false, false,
1418					  VMW_FENCE_WAIT_TIMEOUT);
1419	}
1420}
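/*
 * Editor's sketch of the user-space side of this contract (illustrative
 * pseudo-code; only the drm_vmw_fence_rep fields used above are assumed,
 * the ioctl invocation itself is hypothetical):
 *
 *	struct drm_vmw_fence_rep rep;
 *
 *	rep.error = -EFAULT;			pre-set, see the comment above
 *	arg.fence_rep = (unsigned long) &rep;
 *	ioctl(fd, DRM_IOCTL_VMW_EXECBUF, &arg);
 *	if (rep.error == 0)
 *		rep.handle and rep.seqno are valid and owned by user-space;
 *	else if (rep.error == -EFAULT)
 *		the copy back probably failed; the kernel has already waited
 *		on the fence and dropped the user-space reference.
 */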
1421
1422int vmw_execbuf_process(struct drm_file *file_priv,
1423			struct vmw_private *dev_priv,
1424			void __user *user_commands,
1425			void *kernel_commands,
1426			uint32_t command_size,
1427			uint64_t throttle_us,
1428			struct drm_vmw_fence_rep __user *user_fence_rep,
1429			struct vmw_fence_obj **out_fence)
1430{
1431	struct vmw_sw_context *sw_context = &dev_priv->ctx;
1432	struct vmw_fence_obj *fence = NULL;
1433	struct vmw_resource *error_resource;
1434	struct list_head resource_list;
1435	uint32_t handle;
1436	void *cmd;
1437	int ret;
1438
1439	ret = mutex_lock_interruptible(&dev_priv->cmdbuf_mutex);
1440	if (unlikely(ret != 0))
1441		return -ERESTARTSYS;
1442
1443	if (kernel_commands == NULL) {
1444		sw_context->kernel = false;
1445
1446		ret = vmw_resize_cmd_bounce(sw_context, command_size);
1447		if (unlikely(ret != 0))
1448			goto out_unlock;
1449
1450
1451		ret = copy_from_user(sw_context->cmd_bounce,
1452				     user_commands, command_size);
1453
1454		if (unlikely(ret != 0)) {
1455			ret = -EFAULT;
1456			DRM_ERROR("Failed copying commands.\n");
1457			goto out_unlock;
1458		}
1459		kernel_commands = sw_context->cmd_bounce;
1460	} else
1461		sw_context->kernel = true;
1462
1463	sw_context->tfile = vmw_fpriv(file_priv)->tfile;
1464	sw_context->cur_reloc = 0;
1465	sw_context->cur_val_buf = 0;
1466	sw_context->fence_flags = 0;
1467	INIT_LIST_HEAD(&sw_context->resource_list);
1468	sw_context->cur_query_bo = dev_priv->pinned_bo;
1469	sw_context->last_query_ctx = NULL;
1470	sw_context->needs_post_query_barrier = false;
1471	memset(sw_context->res_cache, 0, sizeof(sw_context->res_cache));
1472	INIT_LIST_HEAD(&sw_context->validate_nodes);
1473	INIT_LIST_HEAD(&sw_context->res_relocations);
1474	if (!sw_context->res_ht_initialized) {
1475		ret = drm_ht_create(&sw_context->res_ht, VMW_RES_HT_ORDER);
1476		if (unlikely(ret != 0))
1477			goto out_unlock;
1478		sw_context->res_ht_initialized = true;
1479	}
1480
1481	INIT_LIST_HEAD(&resource_list);
1482	ret = vmw_cmd_check_all(dev_priv, sw_context, kernel_commands,
1483				command_size);
1484	if (unlikely(ret != 0))
1485		goto out_err;
1486
1487	ret = vmw_resources_reserve(sw_context);
1488	if (unlikely(ret != 0))
1489		goto out_err;
1490
1491	ret = ttm_eu_reserve_buffers(&sw_context->validate_nodes);
1492	if (unlikely(ret != 0))
1493		goto out_err;
1494
1495	ret = vmw_validate_buffers(dev_priv, sw_context);
1496	if (unlikely(ret != 0))
1497		goto out_err;
1498
1499	ret = vmw_resources_validate(sw_context);
1500	if (unlikely(ret != 0))
1501		goto out_err;
1502
1503	if (throttle_us) {
1504		ret = vmw_wait_lag(dev_priv, &dev_priv->fifo.marker_queue,
1505				   throttle_us);
1506
1507		if (unlikely(ret != 0))
1508			goto out_err;
1509	}
1510
1511	cmd = vmw_fifo_reserve(dev_priv, command_size);
1512	if (unlikely(cmd == NULL)) {
1513		DRM_ERROR("Failed reserving fifo space for commands.\n");
1514		ret = -ENOMEM;
1515		goto out_err;
1516	}
1517
1518	vmw_apply_relocations(sw_context);
1519	memcpy(cmd, kernel_commands, command_size);
1520
1521	vmw_resource_relocations_apply(cmd, &sw_context->res_relocations);
1522	vmw_resource_relocations_free(&sw_context->res_relocations);
1523
1524	vmw_fifo_commit(dev_priv, command_size);
1525
1526	vmw_query_bo_switch_commit(dev_priv, sw_context);
1527	ret = vmw_execbuf_fence_commands(file_priv, dev_priv,
1528					 &fence,
1529					 (user_fence_rep) ? &handle : NULL);
1530	/*
1531	 * This error is harmless, because if fence submission fails,
1532	 * vmw_fifo_send_fence will sync. The error will be propagated to
1533	 * user-space in @fence_rep
1534	 */
1535
1536	if (ret != 0)
1537		DRM_ERROR("Fence submission error. Syncing.\n");
1538
1539	vmw_resource_list_unreserve(&sw_context->resource_list, false);
1540	ttm_eu_fence_buffer_objects(&sw_context->validate_nodes,
1541				    (void *) fence);
1542
1543	if (unlikely(dev_priv->pinned_bo != NULL &&
1544		     !dev_priv->query_cid_valid))
1545		__vmw_execbuf_release_pinned_bo(dev_priv, fence);
1546
1547	vmw_clear_validations(sw_context);
1548	vmw_execbuf_copy_fence_user(dev_priv, vmw_fpriv(file_priv), ret,
1549				    user_fence_rep, fence, handle);
1550
1551	/* Don't unreference when handing fence out */
1552	if (unlikely(out_fence != NULL)) {
1553		*out_fence = fence;
1554		fence = NULL;
1555	} else if (likely(fence != NULL)) {
1556		vmw_fence_obj_unreference(&fence);
1557	}
1558
1559	list_splice_init(&sw_context->resource_list, &resource_list);
1560	mutex_unlock(&dev_priv->cmdbuf_mutex);
1561
1562	/*
1563	 * Unreference resources outside of the cmdbuf_mutex to
1564	 * avoid deadlocks in resource destruction paths.
1565	 */
1566	vmw_resource_list_unreference(&resource_list);
1567
1568	return 0;
1569
1570out_err:
1571	vmw_resource_relocations_free(&sw_context->res_relocations);
1572	vmw_free_relocations(sw_context);
1573	ttm_eu_backoff_reservation(&sw_context->validate_nodes);
1574	vmw_resource_list_unreserve(&sw_context->resource_list, true);
1575	vmw_clear_validations(sw_context);
1576	if (unlikely(dev_priv->pinned_bo != NULL &&
1577		     !dev_priv->query_cid_valid))
1578		__vmw_execbuf_release_pinned_bo(dev_priv, NULL);
1579out_unlock:
1580	list_splice_init(&sw_context->resource_list, &resource_list);
1581	error_resource = sw_context->error_resource;
1582	sw_context->error_resource = NULL;
1583	mutex_unlock(&dev_priv->cmdbuf_mutex);
1584
1585	/*
1586	 * Unreference resources outside of the cmdbuf_mutex to
1587	 * avoid deadlocks in resource destruction paths.
1588	 */
1589	vmw_resource_list_unreference(&resource_list);
1590	if (unlikely(error_resource != NULL))
1591		vmw_resource_unreference(&error_resource);
1592
1593	return ret;
1594}
1595
1596/**
1597 * vmw_execbuf_unpin_panic - Idle the fifo and unpin the query buffer.
1598 *
1599 * @dev_priv: The device private structure.
1600 *
1601 * This function is called to idle the fifo and unpin the query buffer
1602 * if the normal way to do this hits an error, which should typically be
1603 * extremely rare.
1604 */
1605static void vmw_execbuf_unpin_panic(struct vmw_private *dev_priv)
1606{
1607	DRM_ERROR("Can't unpin query buffer. Trying to recover.\n");
1608
1609	(void) vmw_fallback_wait(dev_priv, false, true, 0, false, 10*HZ);
1610	vmw_bo_pin(dev_priv->pinned_bo, false);
1611	vmw_bo_pin(dev_priv->dummy_query_bo, false);
1612	dev_priv->dummy_query_bo_pinned = false;
1613}
1614
1615
1616/**
1617 * __vmw_execbuf_release_pinned_bo - Flush queries and unpin the pinned
1618 * query bo.
1619 *
1620 * @dev_priv: The device private structure.
1621 * @fence: If non-NULL should point to a struct vmw_fence_obj issued
1622 * _after_ a query barrier that flushes all queries touching the current
1623 * buffer pointed to by @dev_priv->pinned_bo
1624 *
1625 * This function should be used to unpin the pinned query bo, or
1626 * as a query barrier when we need to make sure that all queries have
1627 * finished before the next fifo command. (For example on hardware
1628 * context destructions where the hardware may otherwise leak unfinished
1629 * queries).
1630 *
1631 * This function does not return any failure codes, but makes attempts
1632 * to do safe unpinning in case of errors.
1633 *
1634 * The function will synchronize on the previous query barrier, and will
1635 * thus not finish until that barrier has executed.
1636 *
1637 * The @dev_priv->cmdbuf_mutex needs to be held by the current thread
1638 * before calling this function.
1639 */
1640void __vmw_execbuf_release_pinned_bo(struct vmw_private *dev_priv,
1641				     struct vmw_fence_obj *fence)
1642{
1643	int ret = 0;
1644	struct list_head validate_list;
1645	struct ttm_validate_buffer pinned_val, query_val;
1646	struct vmw_fence_obj *lfence = NULL;
1647
1648	if (dev_priv->pinned_bo == NULL)
1649		goto out_unlock;
1650
1651	INIT_LIST_HEAD(&validate_list);
1652
1653	pinned_val.bo = ttm_bo_reference(dev_priv->pinned_bo);
1654	list_add_tail(&pinned_val.head, &validate_list);
1655
1656	query_val.bo = ttm_bo_reference(dev_priv->dummy_query_bo);
1657	list_add_tail(&query_val.head, &validate_list);
1658
1659	do {
1660		ret = ttm_eu_reserve_buffers(&validate_list);
1661	} while (ret == -ERESTARTSYS);
1662
1663	if (unlikely(ret != 0)) {
1664		vmw_execbuf_unpin_panic(dev_priv);
1665		goto out_no_reserve;
1666	}
1667
1668	if (dev_priv->query_cid_valid) {
1669		BUG_ON(fence != NULL);
1670		ret = vmw_fifo_emit_dummy_query(dev_priv, dev_priv->query_cid);
1671		if (unlikely(ret != 0)) {
1672			vmw_execbuf_unpin_panic(dev_priv);
1673			goto out_no_emit;
1674		}
1675		dev_priv->query_cid_valid = false;
1676	}
1677
1678	vmw_bo_pin(dev_priv->pinned_bo, false);
1679	vmw_bo_pin(dev_priv->dummy_query_bo, false);
1680	dev_priv->dummy_query_bo_pinned = false;
1681
1682	if (fence == NULL) {
1683		(void) vmw_execbuf_fence_commands(NULL, dev_priv, &lfence,
1684						  NULL);
1685		fence = lfence;
1686	}
1687	ttm_eu_fence_buffer_objects(&validate_list, (void *) fence);
1688	if (lfence != NULL)
1689		vmw_fence_obj_unreference(&lfence);
1690
1691	ttm_bo_unref(&query_val.bo);
1692	ttm_bo_unref(&pinned_val.bo);
1693	ttm_bo_unref(&dev_priv->pinned_bo);
1694
1695out_unlock:
1696	return;
1697
1698out_no_emit:
1699	ttm_eu_backoff_reservation(&validate_list);
1700out_no_reserve:
1701	ttm_bo_unref(&query_val.bo);
1702	ttm_bo_unref(&pinned_val.bo);
1703	ttm_bo_unref(&dev_priv->pinned_bo);
1704}
1705
1706/**
1707 * vmw_execbuf_release_pinned_bo - Flush queries and unpin the pinned
1708 * query bo.
1709 *
1710 * @dev_priv: The device private structure.
1711 *
1712 * This function should be used to unpin the pinned query bo, or
1713 * as a query barrier when we need to make sure that all queries have
1714 * finished before the next fifo command. (For example on hardware
1715 * context destructions where the hardware may otherwise leak unfinished
1716 * queries).
1717 *
1718 * This function does not return any failure codes, but makes attempts
1719 * to do safe unpinning in case of errors.
1720 *
1721 * The function will synchronize on the previous query barrier, and will
1722 * thus not finish until that barrier has executed.
1723 */
1724void vmw_execbuf_release_pinned_bo(struct vmw_private *dev_priv)
1725{
1726	mutex_lock(&dev_priv->cmdbuf_mutex);
1727	if (dev_priv->query_cid_valid)
1728		__vmw_execbuf_release_pinned_bo(dev_priv, NULL);
1729	mutex_unlock(&dev_priv->cmdbuf_mutex);
1730}
1731
1732
1733int vmw_execbuf_ioctl(struct drm_device *dev, void *data,
1734		      struct drm_file *file_priv)
1735{
1736	struct vmw_private *dev_priv = vmw_priv(dev);
1737	struct drm_vmw_execbuf_arg *arg = (struct drm_vmw_execbuf_arg *)data;
1738	struct vmw_master *vmaster = vmw_master(file_priv->master);
1739	int ret;
1740
1741	/*
1742	 * This will allow us to extend the ioctl argument while
1743	 * maintaining backwards compatibility:
1744	 * We take different code paths depending on the value of
1745	 * arg->version.
1746	 */
1747
1748	if (unlikely(arg->version != DRM_VMW_EXECBUF_VERSION)) {
1749		DRM_ERROR("Incorrect execbuf version.\n");
1750		DRM_ERROR("You're running outdated experimental "
1751			  "vmwgfx user-space drivers.");
1752		return -EINVAL;
1753	}
1754
1755	ret = ttm_read_lock(&vmaster->lock, true);
1756	if (unlikely(ret != 0))
1757		return ret;
1758
1759	ret = vmw_execbuf_process(file_priv, dev_priv,
1760				  (void __user *)(unsigned long)arg->commands,
1761				  NULL, arg->command_size, arg->throttle_us,
1762				  (void __user *)(unsigned long)arg->fence_rep,
1763				  NULL);
1764
1765	if (unlikely(ret != 0))
1766		goto out_unlock;
1767
1768	vmw_kms_cursor_post_execbuf(dev_priv);
1769
1770out_unlock:
1771	ttm_read_unlock(&vmaster->lock);
1772	return ret;
1773}
1774