1 // SPDX-License-Identifier: GPL-2.0 OR MIT
2 /**************************************************************************
4 * Copyright 2009-2020 VMware, Inc., Palo Alto, CA., USA
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
19 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
20 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
21 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
22 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
23 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
24 * USE OR OTHER DEALINGS IN THE SOFTWARE.
26 **************************************************************************/
28 #include <linux/sched/signal.h>
30 #include <drm/ttm/ttm_placement.h>
32 #include "vmwgfx_drv.h"
/*
 * Command layout made of an SVGA3dCmdHeader followed by an
 * SVGA3dCmdDXTempSetContext body. In the visible code only its size is
 * used: vmw_local_fifo_commit() adds sizeof(struct vmw_temp_set_context)
 * to the byte count it commits.
 * NOTE(review): the closing brace of this definition is not visible in
 * this listing.
 */
34 struct vmw_temp_set_context {
35 SVGA3dCmdHeader header;
36 SVGA3dCmdDXTempSetContext body;
/*
 * vmw_supports_3d - Probe whether the device can be used for 3D.
 * @dev_priv: Pointer to device private structure.
 *
 * Tests SVGA_CAP_3D first. When SVGA_CAP_GBOBJECTS is advertised, the
 * function looks at dev_priv->has_mob and queries SVGA3D_DEVCAP_3D through
 * SVGA_REG_DEV_CAP. The remaining tests use FIFO state: the extended FIFO
 * capability, SVGA_FIFO_MIN compared with the offset of the 3D hardware
 * version register, the reported hardware version compared with
 * SVGA3D_HWVERSION_WS8_B1, and finally the active display unit.
 *
 * NOTE(review): the return statement belonging to each test is not visible
 * in this listing; confirm the result of every branch against the complete
 * file.
 */
39 bool vmw_supports_3d(struct vmw_private *dev_priv)
41 uint32_t fifo_min, hwversion;
42 const struct vmw_fifo_state *fifo = &dev_priv->fifo;
44 if (!(dev_priv->capabilities & SVGA_CAP_3D))
47 if (dev_priv->capabilities & SVGA_CAP_GBOBJECTS) {
50 if (!dev_priv->has_mob)
/* cap_lock is held across the write/read pair on SVGA_REG_DEV_CAP. */
53 spin_lock(&dev_priv->cap_lock);
54 vmw_write(dev_priv, SVGA_REG_DEV_CAP, SVGA3D_DEVCAP_3D);
55 result = vmw_read(dev_priv, SVGA_REG_DEV_CAP);
56 spin_unlock(&dev_priv->cap_lock);
61 if (!(dev_priv->capabilities & SVGA_CAP_EXTENDED_FIFO))
64 fifo_min = vmw_fifo_mem_read(dev_priv, SVGA_FIFO_MIN);
65 if (fifo_min <= SVGA_FIFO_3D_HWVERSION * sizeof(unsigned int))
/*
 * Read the revised hardware version register when the FIFO advertises
 * SVGA_FIFO_CAP_3D_HWVERSION_REVISED, otherwise the original register.
 */
68 hwversion = vmw_fifo_mem_read(dev_priv,
69 ((fifo->capabilities &
70 SVGA_FIFO_CAP_3D_HWVERSION_REVISED) ?
71 SVGA_FIFO_3D_HWVERSION_REVISED :
72 SVGA_FIFO_3D_HWVERSION));
77 if (hwversion < SVGA3D_HWVERSION_WS8_B1)
80 /* Legacy Display Unit does not support surfaces */
81 if (dev_priv->active_display_unit == vmw_du_legacy)
/*
 * vmw_fifo_have_pitchlock - Test the FIFO for the pitchlock capability.
 * @dev_priv: Pointer to device private structure.
 *
 * Checks SVGA_CAP_EXTENDED_FIFO in the device capabilities, then reads
 * SVGA_FIFO_CAPABILITIES from FIFO memory and tests
 * SVGA_FIFO_CAP_PITCHLOCK.
 *
 * NOTE(review): the declaration of caps and the return statements are not
 * visible in this listing.
 */
87 bool vmw_fifo_have_pitchlock(struct vmw_private *dev_priv)
91 if (!(dev_priv->capabilities & SVGA_CAP_EXTENDED_FIFO))
94 caps = vmw_fifo_mem_read(dev_priv, SVGA_FIFO_CAPABILITIES);
95 if (caps & SVGA_FIFO_CAP_PITCHLOCK)
/*
 * vmw_fifo_init - Set up the software FIFO state and program the device FIFO.
 * @dev_priv: Pointer to device private structure.
 * @fifo: FIFO state to initialize.
 *
 * Allocates the static bounce buffer (VMWGFX_FIFO_STATIC_SIZE bytes, from
 * vmalloc), resets the reservation bookkeeping, initializes fifo_mutex and
 * rwsem, logs the current mode, saves the ENABLE, CONFIG_DONE and TRACES
 * registers, programs the FIFO registers in FIFO memory, and finally seeds
 * marker_seq and the FIFO fence register from dev_priv->last_read_seqno.
 *
 * NOTE(review): local declarations, the handling of a failed vmalloc and
 * the return statements are not visible in this listing.
 */
101 int vmw_fifo_init(struct vmw_private *dev_priv, struct vmw_fifo_state *fifo)
107 fifo->static_buffer_size = VMWGFX_FIFO_STATIC_SIZE;
108 fifo->static_buffer = vmalloc(fifo->static_buffer_size);
109 if (unlikely(fifo->static_buffer == NULL))
112 fifo->dynamic_buffer = NULL;
113 fifo->reserved_size = 0;
114 fifo->using_bounce_buffer = false;
116 mutex_init(&fifo->fifo_mutex);
117 init_rwsem(&fifo->rwsem);
119 DRM_INFO("width %d\n", vmw_read(dev_priv, SVGA_REG_WIDTH));
120 DRM_INFO("height %d\n", vmw_read(dev_priv, SVGA_REG_HEIGHT));
121 DRM_INFO("bpp %d\n", vmw_read(dev_priv, SVGA_REG_BITS_PER_PIXEL));
/* Save the current register values; vmw_fifo_release() writes them back. */
123 dev_priv->enable_state = vmw_read(dev_priv, SVGA_REG_ENABLE);
124 dev_priv->config_done_state = vmw_read(dev_priv, SVGA_REG_CONFIG_DONE);
125 dev_priv->traces_state = vmw_read(dev_priv, SVGA_REG_TRACES);
127 vmw_write(dev_priv, SVGA_REG_ENABLE, SVGA_REG_ENABLE_ENABLE |
128 SVGA_REG_ENABLE_HIDE);
130 vmw_write(dev_priv, SVGA_REG_TRACES, 0);
/*
 * NOTE(review): the value of min used without SVGA_CAP_EXTENDED_FIFO, and
 * any adjustment applied to it before it is written below, is not visible
 * in this listing.
 */
133 if (dev_priv->capabilities & SVGA_CAP_EXTENDED_FIFO)
134 min = vmw_read(dev_priv, SVGA_REG_MEM_REGS);
/*
 * Program the FIFO bounds and start with NEXT_CMD and STOP both equal to
 * min and with BUSY cleared.
 */
140 vmw_fifo_mem_write(dev_priv, SVGA_FIFO_MIN, min);
141 vmw_fifo_mem_write(dev_priv, SVGA_FIFO_MAX, dev_priv->fifo_mem_size);
143 vmw_fifo_mem_write(dev_priv, SVGA_FIFO_NEXT_CMD, min);
144 vmw_fifo_mem_write(dev_priv, SVGA_FIFO_STOP, min);
145 vmw_fifo_mem_write(dev_priv, SVGA_FIFO_BUSY, 0);
148 vmw_write(dev_priv, SVGA_REG_CONFIG_DONE, 1);
/* Read the values back from FIFO memory after CONFIG_DONE was written. */
150 max = vmw_fifo_mem_read(dev_priv, SVGA_FIFO_MAX);
151 min = vmw_fifo_mem_read(dev_priv, SVGA_FIFO_MIN);
152 fifo->capabilities = vmw_fifo_mem_read(dev_priv, SVGA_FIFO_CAPABILITIES);
154 DRM_INFO("Fifo max 0x%08x min 0x%08x cap 0x%08x\n",
157 (unsigned int) fifo->capabilities);
159 atomic_set(&dev_priv->marker_seq, dev_priv->last_read_seqno);
160 vmw_fifo_mem_write(dev_priv, SVGA_FIFO_FENCE, dev_priv->last_read_seqno);
/*
 * vmw_fifo_ping_host - Notify the device through SVGA_REG_SYNC.
 * @dev_priv: Pointer to device private structure.
 * @reason: Value written to SVGA_REG_SYNC.
 *
 * The register is written only when cmpxchg() changes the SVGA_FIFO_BUSY
 * word in FIFO memory from 0 to 1; if the word was already non-zero no
 * register write is made.
 */
165 void vmw_fifo_ping_host(struct vmw_private *dev_priv, uint32_t reason)
167 u32 *fifo_mem = dev_priv->fifo_mem;
169 if (cmpxchg(fifo_mem + SVGA_FIFO_BUSY, 0, 1) == 0)
170 vmw_write(dev_priv, SVGA_REG_SYNC, reason);
/*
 * vmw_fifo_release - Quiesce the FIFO and undo vmw_fifo_init().
 * @dev_priv: Pointer to device private structure.
 * @fifo: FIFO state whose buffers are freed.
 *
 * Writes SVGA_SYNC_GENERIC to SVGA_REG_SYNC and loops while SVGA_REG_BUSY
 * reads non-zero, records the current SVGA_FIFO_FENCE value in
 * dev_priv->last_read_seqno, writes the saved CONFIG_DONE, ENABLE and
 * TRACES values back to the device, and frees the static and dynamic
 * bounce buffers, clearing the pointers afterwards.
 *
 * NOTE(review): the body of the busy-wait loop is not visible in this
 * listing.
 */
173 void vmw_fifo_release(struct vmw_private *dev_priv, struct vmw_fifo_state *fifo)
175 vmw_write(dev_priv, SVGA_REG_SYNC, SVGA_SYNC_GENERIC);
176 while (vmw_read(dev_priv, SVGA_REG_BUSY) != 0)
179 dev_priv->last_read_seqno = vmw_fifo_mem_read(dev_priv, SVGA_FIFO_FENCE);
/* Restore the register values that vmw_fifo_init() saved. */
181 vmw_write(dev_priv, SVGA_REG_CONFIG_DONE,
182 dev_priv->config_done_state);
183 vmw_write(dev_priv, SVGA_REG_ENABLE,
184 dev_priv->enable_state);
185 vmw_write(dev_priv, SVGA_REG_TRACES,
186 dev_priv->traces_state);
188 if (likely(fifo->static_buffer != NULL)) {
189 vfree(fifo->static_buffer);
190 fifo->static_buffer = NULL;
193 if (likely(fifo->dynamic_buffer != NULL)) {
194 vfree(fifo->dynamic_buffer);
195 fifo->dynamic_buffer = NULL;
/*
 * vmw_fifo_is_full - Test whether @bytes can currently be placed in the FIFO.
 * @dev_priv: Pointer to device private structure.
 * @bytes: Number of bytes the caller wants to submit.
 *
 * Reads MAX, NEXT_CMD, MIN and STOP from FIFO memory and returns true when
 * (max - next_cmd) + (stop - min) is less than or equal to @bytes. The
 * comparison is inclusive, so a sum exactly equal to @bytes is reported as
 * full.
 */
199 static bool vmw_fifo_is_full(struct vmw_private *dev_priv, uint32_t bytes)
201 uint32_t max = vmw_fifo_mem_read(dev_priv, SVGA_FIFO_MAX);
202 uint32_t next_cmd = vmw_fifo_mem_read(dev_priv, SVGA_FIFO_NEXT_CMD);
203 uint32_t min = vmw_fifo_mem_read(dev_priv, SVGA_FIFO_MIN);
204 uint32_t stop = vmw_fifo_mem_read(dev_priv, SVGA_FIFO_STOP);
206 return ((max - next_cmd) + (stop - min) <= bytes);
/*
 * vmw_fifo_wait_noirq - Wait for FIFO space without the FIFO progress
 * interrupt.
 * @dev_priv: Pointer to device private structure.
 * @bytes: Number of bytes that must fit in the FIFO.
 * @interruptible: Selects TASK_INTERRUPTIBLE rather than
 * TASK_UNINTERRUPTIBLE and enables the pending-signal check.
 * @timeout: Timeout in jiffies, added to the current jiffies value to form
 * the deadline.
 *
 * Waits on dev_priv->fifo_queue until vmw_fifo_is_full() reports false,
 * the deadline passes (logged as "SVGA device lockup.") or, for
 * interruptible waits, a signal is pending. On exit the wait entry is
 * removed and all other waiters on fifo_queue are woken.
 *
 * NOTE(review): the loop construct, the sleep call between checks and the
 * values assigned to the return code are not visible in this listing.
 */
209 static int vmw_fifo_wait_noirq(struct vmw_private *dev_priv,
210 uint32_t bytes, bool interruptible,
211 unsigned long timeout)
214 unsigned long end_jiffies = jiffies + timeout;
217 DRM_INFO("Fifo wait noirq.\n");
220 prepare_to_wait(&dev_priv->fifo_queue, &__wait,
222 TASK_INTERRUPTIBLE : TASK_UNINTERRUPTIBLE);
223 if (!vmw_fifo_is_full(dev_priv, bytes))
225 if (time_after_eq(jiffies, end_jiffies)) {
227 DRM_ERROR("SVGA device lockup.\n");
231 if (interruptible && signal_pending(current)) {
236 finish_wait(&dev_priv->fifo_queue, &__wait);
237 wake_up_all(&dev_priv->fifo_queue);
238 DRM_INFO("Fifo noirq exit.\n");
/*
 * vmw_fifo_wait - Wait until @bytes fit in the FIFO.
 * @dev_priv: Pointer to device private structure.
 * @bytes: Number of bytes that must fit in the FIFO.
 * @interruptible: Whether the wait may be interrupted by a signal.
 * @timeout: Timeout in jiffies passed to the wait primitives.
 *
 * If the FIFO is not full nothing is waited for. Otherwise the host is
 * pinged with SVGA_SYNC_FIFOFULL. Devices without SVGA_CAP_IRQMASK use
 * vmw_fifo_wait_noirq(); all others register a waiter for
 * SVGA_IRQFLAG_FIFO_PROGRESS, sleep on dev_priv->fifo_queue until
 * vmw_fifo_is_full() reports false or the timeout expires, and remove the
 * waiter again.
 *
 * NOTE(review): the return statements and the translation of the wait
 * result (ret == 0, ret > 0) into the return code are not visible in this
 * listing.
 */
242 static int vmw_fifo_wait(struct vmw_private *dev_priv,
243 uint32_t bytes, bool interruptible,
244 unsigned long timeout)
248 if (likely(!vmw_fifo_is_full(dev_priv, bytes)))
251 vmw_fifo_ping_host(dev_priv, SVGA_SYNC_FIFOFULL);
252 if (!(dev_priv->capabilities & SVGA_CAP_IRQMASK))
253 return vmw_fifo_wait_noirq(dev_priv, bytes,
254 interruptible, timeout);
256 vmw_generic_waiter_add(dev_priv, SVGA_IRQFLAG_FIFO_PROGRESS,
257 &dev_priv->fifo_queue_waiters);
/*
 * Two variants of the same wait follow; presumably selected by
 * interruptible, but the selecting condition is not visible here.
 */
260 ret = wait_event_interruptible_timeout
261 (dev_priv->fifo_queue,
262 !vmw_fifo_is_full(dev_priv, bytes), timeout);
264 ret = wait_event_timeout
265 (dev_priv->fifo_queue,
266 !vmw_fifo_is_full(dev_priv, bytes), timeout);
268 if (unlikely(ret == 0))
270 else if (likely(ret > 0))
273 vmw_generic_waiter_remove(dev_priv, SVGA_IRQFLAG_FIFO_PROGRESS,
274 &dev_priv->fifo_queue_waiters);
280 * Reserve @bytes number of bytes in the fifo.
282 * This function will return NULL (error) on two conditions:
283 * If it times out waiting for fifo space, or if @bytes is larger than the
284 * available fifo space.
287 * Pointer to the fifo, or null on error (possible hardware hang).
/*
 * Reserve space for a command of the requested size, either directly in
 * FIFO memory or in a bounce buffer.
 *
 * fifo_mutex is taken at the start. In the visible code it is released
 * either at the end of this function, right after reserved_size is cleared,
 * or by vmw_local_fifo_commit().
 *
 * When the reservation can be made in place and either the FIFO has
 * SVGA_FIFO_CAP_RESERVE or the request is at most one 32-bit word, a
 * pointer into FIFO memory is returned. Otherwise a bounce buffer is
 * returned: the preallocated static buffer for requests smaller than
 * static_buffer_size, else a buffer from vmalloc().
 *
 * NOTE(review): many lines of this function (loop construct, else
 * branches, goto targets, arguments of the wait calls and return values on
 * failure) are not visible in this listing; the summary above covers only
 * what can be read here.
 */
289 static void *vmw_local_fifo_reserve(struct vmw_private *dev_priv,
292 struct vmw_fifo_state *fifo_state = &dev_priv->fifo;
293 u32 *fifo_mem = dev_priv->fifo_mem;
297 uint32_t reserveable = fifo_state->capabilities & SVGA_FIFO_CAP_RESERVE;
300 mutex_lock(&fifo_state->fifo_mutex);
301 max = vmw_fifo_mem_read(dev_priv, SVGA_FIFO_MAX);
302 min = vmw_fifo_mem_read(dev_priv, SVGA_FIFO_MIN);
303 next_cmd = vmw_fifo_mem_read(dev_priv, SVGA_FIFO_NEXT_CMD);
/* A request of max - min bytes or more is treated as unlikely. */
305 if (unlikely(bytes >= (max - min)))
/* A previous reservation must have been committed before a new one. */
308 BUG_ON(fifo_state->reserved_size != 0);
309 BUG_ON(fifo_state->dynamic_buffer != NULL);
311 fifo_state->reserved_size = bytes;
314 uint32_t stop = vmw_fifo_mem_read(dev_priv, SVGA_FIFO_STOP);
315 bool need_bounce = false;
316 bool reserve_in_place = false;
/*
 * next_cmd >= stop: the request fits in place when it ends before max, or
 * exactly at max while stop is above min.
 */
318 if (next_cmd >= stop) {
319 if (likely((next_cmd + bytes < max ||
320 (next_cmd + bytes == max && stop > min))))
321 reserve_in_place = true;
323 else if (vmw_fifo_is_full(dev_priv, bytes)) {
324 ret = vmw_fifo_wait(dev_priv, bytes,
326 if (unlikely(ret != 0))
/*
 * Second case (presumably next_cmd < stop; the else line is not visible):
 * the request fits in place only when it ends strictly before stop.
 */
333 if (likely((next_cmd + bytes < stop)))
334 reserve_in_place = true;
336 ret = vmw_fifo_wait(dev_priv, bytes,
338 if (unlikely(ret != 0))
343 if (reserve_in_place) {
344 if (reserveable || bytes <= sizeof(uint32_t)) {
345 fifo_state->using_bounce_buffer = false;
348 vmw_fifo_mem_write(dev_priv,
351 return (void __force *) (fifo_mem +
/* Bounce-buffer path: the data is copied into the FIFO at commit time. */
359 fifo_state->using_bounce_buffer = true;
360 if (bytes < fifo_state->static_buffer_size)
361 return fifo_state->static_buffer;
363 fifo_state->dynamic_buffer = vmalloc(bytes);
364 if (!fifo_state->dynamic_buffer)
366 return fifo_state->dynamic_buffer;
/* Drop the reservation and release the mutex taken at the top. */
371 fifo_state->reserved_size = 0;
372 mutex_unlock(&fifo_state->fifo_mutex);
/*
 * vmw_cmd_ctx_reserve - Reserve command space for a given context id.
 * @dev_priv: Pointer to device private structure.
 * @bytes: Number of bytes to reserve.
 *
 * Reserves through vmw_cmdbuf_reserve() on dev_priv->cman, or through
 * vmw_local_fifo_reserve() when ctx_id equals SVGA3D_INVALID_ID. The
 * remaining case triggers a WARN ("Command buffer has not been
 * allocated."). The result is then checked with IS_ERR_OR_NULL().
 *
 * NOTE(review): the ctx_id parameter declaration, the condition selecting
 * the command-buffer path and the return statements are not visible in
 * this listing.
 */
377 void *vmw_cmd_ctx_reserve(struct vmw_private *dev_priv, uint32_t bytes,
383 ret = vmw_cmdbuf_reserve(dev_priv->cman, bytes,
384 ctx_id, false, NULL);
385 else if (ctx_id == SVGA3D_INVALID_ID)
386 ret = vmw_local_fifo_reserve(dev_priv, bytes);
388 WARN(1, "Command buffer has not been allocated.\n");
391 if (IS_ERR_OR_NULL(ret))
/*
 * vmw_fifo_res_copy - Copy a bounce buffer into the FIFO with memcpy.
 * @fifo_state: FIFO state holding the bounce buffers.
 * @vmw: Pointer to device private structure.
 * @max: Value read from SVGA_FIFO_MAX by the caller.
 * @min: Value read from SVGA_FIFO_MIN by the caller.
 * @bytes: Number of bytes to copy.
 *
 * The source is the dynamic buffer when one is allocated, otherwise the
 * static buffer. @bytes is written to SVGA_FIFO_RESERVED first. The data
 * is then copied in two pieces: chunk_size bytes at next_cmd, and the
 * remainder at min. Offsets are shifted right by two because fifo_mem and
 * buffer are arrays of 32-bit words.
 *
 * NOTE(review): the next_cmd parameter line, the declaration of rest and
 * the statement executed when bytes < chunk_size are not visible in this
 * listing.
 */
397 static void vmw_fifo_res_copy(struct vmw_fifo_state *fifo_state,
398 struct vmw_private *vmw,
400 uint32_t max, uint32_t min, uint32_t bytes)
402 u32 *fifo_mem = vmw->fifo_mem;
403 uint32_t chunk_size = max - next_cmd;
405 uint32_t *buffer = (fifo_state->dynamic_buffer != NULL) ?
406 fifo_state->dynamic_buffer : fifo_state->static_buffer;
408 if (bytes < chunk_size)
411 vmw_fifo_mem_write(vmw, SVGA_FIFO_RESERVED, bytes);
413 memcpy(fifo_mem + (next_cmd >> 2), buffer, chunk_size);
414 rest = bytes - chunk_size;
416 memcpy(fifo_mem + (min >> 2), buffer + (chunk_size >> 2), rest);
/*
 * vmw_fifo_slow_copy - Copy a bounce buffer into the FIFO word by word.
 * @fifo_state: FIFO state holding the bounce buffers.
 * @vmw: Pointer to device private structure.
 * @max: Value read from SVGA_FIFO_MAX by the caller.
 * @min: Value read from SVGA_FIFO_MIN by the caller.
 * @bytes: Number of bytes to copy.
 *
 * The source is the dynamic buffer when one is allocated, otherwise the
 * static buffer. Each 32-bit word is written at next_cmd, next_cmd is
 * advanced by one word, SVGA_FIFO_NEXT_CMD is updated, and bytes is
 * decreased by the word size.
 *
 * NOTE(review): the next_cmd parameter line, the loop construct and the
 * statement executed when next_cmd reaches max are not visible in this
 * listing.
 */
419 static void vmw_fifo_slow_copy(struct vmw_fifo_state *fifo_state,
420 struct vmw_private *vmw,
422 uint32_t max, uint32_t min, uint32_t bytes)
424 uint32_t *buffer = (fifo_state->dynamic_buffer != NULL) ?
425 fifo_state->dynamic_buffer : fifo_state->static_buffer;
428 vmw_fifo_mem_write(vmw, (next_cmd >> 2), *buffer++);
429 next_cmd += sizeof(uint32_t);
430 if (unlikely(next_cmd == max))
433 vmw_fifo_mem_write(vmw, SVGA_FIFO_NEXT_CMD, next_cmd);
435 bytes -= sizeof(uint32_t);
/*
 * vmw_local_fifo_commit - Commit a reservation made by
 * vmw_local_fifo_reserve().
 * @dev_priv: Pointer to device private structure.
 * @bytes: Number of bytes to commit; must be a multiple of four and must
 * not exceed the reserved size (both enforced with BUG_ON).
 *
 * Clears the reservation, copies bounce-buffer contents into the FIFO via
 * vmw_fifo_res_copy() or vmw_fifo_slow_copy(), frees a dynamic bounce
 * buffer if one was used, updates SVGA_FIFO_NEXT_CMD and clears
 * SVGA_FIFO_RESERVED under the write side of fifo_state->rwsem, pings the
 * host with SVGA_SYNC_GENERIC, and releases fifo_mutex.
 *
 * NOTE(review): several conditions are not visible in this listing,
 * including the one guarding the sizeof(struct vmw_temp_set_context)
 * addition, the choice between the two copy helpers, and the advance and
 * wrap test for next_cmd.
 */
439 static void vmw_local_fifo_commit(struct vmw_private *dev_priv, uint32_t bytes)
441 struct vmw_fifo_state *fifo_state = &dev_priv->fifo;
442 uint32_t next_cmd = vmw_fifo_mem_read(dev_priv, SVGA_FIFO_NEXT_CMD);
443 uint32_t max = vmw_fifo_mem_read(dev_priv, SVGA_FIFO_MAX);
444 uint32_t min = vmw_fifo_mem_read(dev_priv, SVGA_FIFO_MIN);
445 bool reserveable = fifo_state->capabilities & SVGA_FIFO_CAP_RESERVE;
448 bytes += sizeof(struct vmw_temp_set_context);
450 fifo_state->dx = false;
451 BUG_ON((bytes & 3) != 0);
452 BUG_ON(bytes > fifo_state->reserved_size);
454 fifo_state->reserved_size = 0;
456 if (fifo_state->using_bounce_buffer) {
458 vmw_fifo_res_copy(fifo_state, dev_priv,
459 next_cmd, max, min, bytes);
461 vmw_fifo_slow_copy(fifo_state, dev_priv,
462 next_cmd, max, min, bytes);
/* The dynamic bounce buffer is single-use; free it once copied. */
464 if (fifo_state->dynamic_buffer) {
465 vfree(fifo_state->dynamic_buffer);
466 fifo_state->dynamic_buffer = NULL;
471 down_write(&fifo_state->rwsem);
472 if (fifo_state->using_bounce_buffer || reserveable) {
/* Subtracting the FIFO size (max - min) wraps next_cmd around. */
475 next_cmd -= max - min;
477 vmw_fifo_mem_write(dev_priv, SVGA_FIFO_NEXT_CMD, next_cmd);
481 vmw_fifo_mem_write(dev_priv, SVGA_FIFO_RESERVED, 0);
483 up_write(&fifo_state->rwsem);
484 vmw_fifo_ping_host(dev_priv, SVGA_SYNC_GENERIC);
/* Releases the mutex that vmw_local_fifo_reserve() acquired. */
485 mutex_unlock(&fifo_state->fifo_mutex);
/*
 * vmw_cmd_commit - Commit previously reserved command space.
 * @dev_priv: Pointer to device private structure.
 * @bytes: Number of bytes to commit.
 *
 * Commits through vmw_cmdbuf_commit() on dev_priv->cman with its last
 * argument false, or through vmw_local_fifo_commit().
 *
 * NOTE(review): the condition choosing between the two paths is not
 * visible in this listing.
 */
488 void vmw_cmd_commit(struct vmw_private *dev_priv, uint32_t bytes)
491 vmw_cmdbuf_commit(dev_priv->cman, bytes, NULL, false);
493 vmw_local_fifo_commit(dev_priv, bytes);
498 * vmw_cmd_commit_flush - Commit fifo space and flush any buffered commands.
500 * @dev_priv: Pointer to device private structure.
501 * @bytes: Number of bytes to commit.
/*
 * Same two paths as vmw_cmd_commit(), except that vmw_cmdbuf_commit() is
 * called with its last argument true. The local FIFO path is identical.
 * NOTE(review): the condition choosing between the two paths is not
 * visible in this listing.
 */
503 void vmw_cmd_commit_flush(struct vmw_private *dev_priv, uint32_t bytes)
506 vmw_cmdbuf_commit(dev_priv->cman, bytes, NULL, true);
508 vmw_local_fifo_commit(dev_priv, bytes);
512 * vmw_cmd_flush - Flush any buffered commands and make sure command processing
515 * @dev_priv: Pointer to device private structure.
516 * @interruptible: Whether to wait interruptible if function needs to sleep.
/*
 * Delegates to vmw_cmdbuf_cur_flush() on dev_priv->cman, passing
 * interruptible through, and returns its result.
 * NOTE(review): any condition guarding this call, and the return value
 * used when the call is skipped, are not visible in this listing.
 */
518 int vmw_cmd_flush(struct vmw_private *dev_priv, bool interruptible)
523 return vmw_cmdbuf_cur_flush(dev_priv->cman, interruptible);
/*
 * vmw_cmd_send_fence - Allocate a new sequence number and emit a fence.
 * @dev_priv: Pointer to device private structure.
 * @seqno: Output; receives the sequence number associated with the fence.
 *
 * Reserves room for one 32-bit command id plus a struct
 * svga_fifo_cmd_fence. If the reservation fails, *seqno is set to the
 * current marker_seq and vmw_fallback_wait() is called with it. Otherwise
 * marker_seq is incremented until the result is non-zero, so 0 is never
 * handed out as a sequence number. Without SVGA_FIFO_CAP_FENCE a zero-byte
 * commit is made; with it, SVGA_CMD_FENCE and the sequence number are
 * written, committed with flush, and vmw_update_seqno() is called.
 *
 * NOTE(review): the declaration of fm, the return statements and the
 * remaining arguments of vmw_fallback_wait() are not visible in this
 * listing.
 */
528 int vmw_cmd_send_fence(struct vmw_private *dev_priv, uint32_t *seqno)
530 struct vmw_fifo_state *fifo_state = &dev_priv->fifo;
531 struct svga_fifo_cmd_fence *cmd_fence;
534 uint32_t bytes = sizeof(u32) + sizeof(*cmd_fence);
536 fm = VMW_CMD_RESERVE(dev_priv, bytes);
537 if (unlikely(fm == NULL)) {
538 *seqno = atomic_read(&dev_priv->marker_seq);
540 (void)vmw_fallback_wait(dev_priv, false, true, *seqno,
546 *seqno = atomic_add_return(1, &dev_priv->marker_seq);
547 } while (*seqno == 0);
549 if (!(fifo_state->capabilities & SVGA_FIFO_CAP_FENCE)) {
552 * Don't request hardware to send a fence. The
553 * waiting code in vmwgfx_irq.c will emulate this.
556 vmw_cmd_commit(dev_priv, 0);
560 *fm++ = SVGA_CMD_FENCE;
561 cmd_fence = (struct svga_fifo_cmd_fence *) fm;
562 cmd_fence->fence = *seqno;
563 vmw_cmd_commit_flush(dev_priv, bytes);
564 vmw_update_seqno(dev_priv, fifo_state);
571 * vmw_fifo_emit_dummy_legacy_query - emits a dummy query to the fifo using
572 * legacy query commands.
574 * @dev_priv: The device private structure.
575 * @cid: The hardware context id used for the query.
577 * See the vmw_cmd_emit_dummy_query documentation.
/*
 * Builds an SVGA_3D_CMD_WAIT_FOR_QUERY command of type
 * SVGA3D_QUERYTYPE_OCCLUSION whose guest result points at
 * dev_priv->dummy_query_bo, then commits it. For a buffer in TTM_PL_VRAM
 * the result is addressed through SVGA_GMR_FRAMEBUFFER at the page offset
 * of the buffer; otherwise bo->mem.start is used as the GMR id with
 * offset 0.
 * NOTE(review): the cid parameter line, the assignment of the context id
 * into the command body and the return statements are not visible in this
 * listing.
 */
579 static int vmw_fifo_emit_dummy_legacy_query(struct vmw_private *dev_priv,
583 * A query wait without a preceding query end will
584 * actually finish all queries for this cid
585 * without writing to the query result structure.
588 struct ttm_buffer_object *bo = &dev_priv->dummy_query_bo->base;
590 SVGA3dCmdHeader header;
591 SVGA3dCmdWaitForQuery body;
594 cmd = VMW_CMD_RESERVE(dev_priv, sizeof(*cmd));
595 if (unlikely(cmd == NULL))
598 cmd->header.id = SVGA_3D_CMD_WAIT_FOR_QUERY;
/* The header size covers the body only, not the header itself. */
599 cmd->header.size = sizeof(cmd->body);
601 cmd->body.type = SVGA3D_QUERYTYPE_OCCLUSION;
603 if (bo->mem.mem_type == TTM_PL_VRAM) {
604 cmd->body.guestResult.gmrId = SVGA_GMR_FRAMEBUFFER;
605 cmd->body.guestResult.offset = bo->mem.start << PAGE_SHIFT;
607 cmd->body.guestResult.gmrId = bo->mem.start;
608 cmd->body.guestResult.offset = 0;
611 vmw_cmd_commit(dev_priv, sizeof(*cmd));
617 * vmw_fifo_emit_dummy_gb_query - emits a dummy query to the fifo using
618 * guest-backed resource query commands.
620 * @dev_priv: The device private structure.
621 * @cid: The hardware context id used for the query.
623 * See the vmw_cmd_emit_dummy_query documentation.
/*
 * Builds an SVGA_3D_CMD_WAIT_FOR_GB_QUERY command of type
 * SVGA3D_QUERYTYPE_OCCLUSION whose result location is the MOB backing
 * dev_priv->dummy_query_bo (mobid taken from bo->mem.start, offset 0),
 * then commits it. The buffer must be placed in VMW_PL_MOB; anything else
 * hits BUG_ON.
 * NOTE(review): the cid parameter line, the assignment of the context id
 * into the command body and the return statements are not visible in this
 * listing.
 */
625 static int vmw_fifo_emit_dummy_gb_query(struct vmw_private *dev_priv,
629 * A query wait without a preceding query end will
630 * actually finish all queries for this cid
631 * without writing to the query result structure.
634 struct ttm_buffer_object *bo = &dev_priv->dummy_query_bo->base;
636 SVGA3dCmdHeader header;
637 SVGA3dCmdWaitForGBQuery body;
640 cmd = VMW_CMD_RESERVE(dev_priv, sizeof(*cmd));
641 if (unlikely(cmd == NULL))
644 cmd->header.id = SVGA_3D_CMD_WAIT_FOR_GB_QUERY;
/* The header size covers the body only, not the header itself. */
645 cmd->header.size = sizeof(cmd->body);
647 cmd->body.type = SVGA3D_QUERYTYPE_OCCLUSION;
648 BUG_ON(bo->mem.mem_type != VMW_PL_MOB);
649 cmd->body.mobid = bo->mem.start;
650 cmd->body.offset = 0;
652 vmw_cmd_commit(dev_priv, sizeof(*cmd));
659 * vmw_cmd_emit_dummy_query - emits a dummy query to the fifo using
660 * appropriate resource query commands.
662 * @dev_priv: The device private structure.
663 * @cid: The hardware context id used for the query.
665 * This function is used to emit a dummy occlusion query with
666 * no primitives rendered between query begin and query end.
667 * It's used to provide a query barrier, in order to know that when
668 * this query is finished, all preceding queries are also finished.
670 * A Query results structure should have been initialized at the start
671 * of the dev_priv->dummy_query_bo buffer object. And that buffer object
672 * must also be either reserved or pinned when this function is called.
674 * Returns -ENOMEM on failure to reserve fifo space.
/*
 * Dispatches on dev_priv->has_mob: the guest-backed variant
 * vmw_fifo_emit_dummy_gb_query() is used when it is set, the legacy
 * variant vmw_fifo_emit_dummy_legacy_query() otherwise. The result of the
 * chosen helper is returned unchanged.
 * NOTE(review): the cid parameter line is not visible in this listing.
 */
676 int vmw_cmd_emit_dummy_query(struct vmw_private *dev_priv,
679 if (dev_priv->has_mob)
680 return vmw_fifo_emit_dummy_gb_query(dev_priv, cid);
682 return vmw_fifo_emit_dummy_legacy_query(dev_priv, cid);