2 * Copyright 2014 Advanced Micro Devices, Inc.
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
25 #include <linux/firmware.h>
28 #include "amdgpu_uvd.h"
30 #include "uvd/uvd_6_0_d.h"
31 #include "uvd/uvd_6_0_sh_mask.h"
32 #include "oss/oss_2_0_d.h"
33 #include "oss/oss_2_0_sh_mask.h"
34 #include "smu/smu_7_1_3_d.h"
35 #include "smu/smu_7_1_3_sh_mask.h"
36 #include "bif/bif_5_1_d.h"
37 #include "gmc/gmc_8_1_d.h"
40 static void uvd_v6_0_set_ring_funcs(struct amdgpu_device *adev);
41 static void uvd_v6_0_set_irq_funcs(struct amdgpu_device *adev);
42 static int uvd_v6_0_start(struct amdgpu_device *adev);
43 static void uvd_v6_0_stop(struct amdgpu_device *adev);
44 static void uvd_v6_0_set_sw_clock_gating(struct amdgpu_device *adev);
47 * uvd_v6_0_ring_get_rptr - get read pointer
49 * @ring: amdgpu_ring pointer
51 * Returns the current hardware read pointer
53 static uint32_t uvd_v6_0_ring_get_rptr(struct amdgpu_ring *ring)
55 struct amdgpu_device *adev = ring->adev;
57 return RREG32(mmUVD_RBC_RB_RPTR);
61 * uvd_v6_0_ring_get_wptr - get write pointer
63 * @ring: amdgpu_ring pointer
65 * Returns the current hardware write pointer
67 static uint32_t uvd_v6_0_ring_get_wptr(struct amdgpu_ring *ring)
69 struct amdgpu_device *adev = ring->adev;
71 return RREG32(mmUVD_RBC_RB_WPTR);
75 * uvd_v6_0_ring_set_wptr - set write pointer
77 * @ring: amdgpu_ring pointer
79 * Commits the write pointer to the hardware
81 static void uvd_v6_0_ring_set_wptr(struct amdgpu_ring *ring)
83 struct amdgpu_device *adev = ring->adev;
85 WREG32(mmUVD_RBC_RB_WPTR, ring->wptr);
88 static int uvd_v6_0_early_init(void *handle)
90 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
92 uvd_v6_0_set_ring_funcs(adev);
93 uvd_v6_0_set_irq_funcs(adev);
98 static int uvd_v6_0_sw_init(void *handle)
100 struct amdgpu_ring *ring;
102 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
105 r = amdgpu_irq_add_id(adev, 124, &adev->uvd.irq);
109 r = amdgpu_uvd_sw_init(adev);
113 r = amdgpu_uvd_resume(adev);
117 ring = &adev->uvd.ring;
118 sprintf(ring->name, "uvd");
119 r = amdgpu_ring_init(adev, ring, 512, PACKET0(mmUVD_NO_OP, 0), 0xf,
120 &adev->uvd.irq, 0, AMDGPU_RING_TYPE_UVD);
125 static int uvd_v6_0_sw_fini(void *handle)
128 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
130 r = amdgpu_uvd_suspend(adev);
134 r = amdgpu_uvd_sw_fini(adev);
142 * uvd_v6_0_hw_init - start and test UVD block
144 * @adev: amdgpu_device pointer
146 * Initialize the hardware, boot up the VCPU and do some testing
148 static int uvd_v6_0_hw_init(void *handle)
150 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
151 struct amdgpu_ring *ring = &adev->uvd.ring;
155 r = uvd_v6_0_start(adev);
160 r = amdgpu_ring_test_ring(ring);
166 r = amdgpu_ring_alloc(ring, 10);
168 DRM_ERROR("amdgpu: ring failed to lock UVD ring (%d).\n", r);
172 tmp = PACKET0(mmUVD_SEMA_WAIT_FAULT_TIMEOUT_CNTL, 0);
173 amdgpu_ring_write(ring, tmp);
174 amdgpu_ring_write(ring, 0xFFFFF);
176 tmp = PACKET0(mmUVD_SEMA_WAIT_INCOMPLETE_TIMEOUT_CNTL, 0);
177 amdgpu_ring_write(ring, tmp);
178 amdgpu_ring_write(ring, 0xFFFFF);
180 tmp = PACKET0(mmUVD_SEMA_SIGNAL_INCOMPLETE_TIMEOUT_CNTL, 0);
181 amdgpu_ring_write(ring, tmp);
182 amdgpu_ring_write(ring, 0xFFFFF);
184 /* Clear timeout status bits */
185 amdgpu_ring_write(ring, PACKET0(mmUVD_SEMA_TIMEOUT_STATUS, 0));
186 amdgpu_ring_write(ring, 0x8);
188 amdgpu_ring_write(ring, PACKET0(mmUVD_SEMA_CNTL, 0));
189 amdgpu_ring_write(ring, 3);
191 amdgpu_ring_commit(ring);
195 DRM_INFO("UVD initialized successfully.\n");
201 * uvd_v6_0_hw_fini - stop the hardware block
203 * @adev: amdgpu_device pointer
205 * Stop the UVD block, mark ring as not ready any more
207 static int uvd_v6_0_hw_fini(void *handle)
209 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
210 struct amdgpu_ring *ring = &adev->uvd.ring;
218 static int uvd_v6_0_suspend(void *handle)
221 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
223 r = uvd_v6_0_hw_fini(adev);
227 /* Skip this for APU for now */
228 if (!(adev->flags & AMD_IS_APU)) {
229 r = amdgpu_uvd_suspend(adev);
237 static int uvd_v6_0_resume(void *handle)
240 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
242 /* Skip this for APU for now */
243 if (!(adev->flags & AMD_IS_APU)) {
244 r = amdgpu_uvd_resume(adev);
248 r = uvd_v6_0_hw_init(adev);
256 * uvd_v6_0_mc_resume - memory controller programming
258 * @adev: amdgpu_device pointer
260 * Let the UVD memory controller know it's offsets
262 static void uvd_v6_0_mc_resume(struct amdgpu_device *adev)
267 /* programm memory controller bits 0-27 */
268 WREG32(mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
269 lower_32_bits(adev->uvd.gpu_addr));
270 WREG32(mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
271 upper_32_bits(adev->uvd.gpu_addr));
273 offset = AMDGPU_UVD_FIRMWARE_OFFSET;
274 size = AMDGPU_GPU_PAGE_ALIGN(adev->uvd.fw->size + 4);
275 WREG32(mmUVD_VCPU_CACHE_OFFSET0, offset >> 3);
276 WREG32(mmUVD_VCPU_CACHE_SIZE0, size);
279 size = AMDGPU_UVD_HEAP_SIZE;
280 WREG32(mmUVD_VCPU_CACHE_OFFSET1, offset >> 3);
281 WREG32(mmUVD_VCPU_CACHE_SIZE1, size);
284 size = AMDGPU_UVD_STACK_SIZE +
285 (AMDGPU_UVD_SESSION_SIZE * adev->uvd.max_handles);
286 WREG32(mmUVD_VCPU_CACHE_OFFSET2, offset >> 3);
287 WREG32(mmUVD_VCPU_CACHE_SIZE2, size);
289 WREG32(mmUVD_UDEC_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
290 WREG32(mmUVD_UDEC_DB_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
291 WREG32(mmUVD_UDEC_DBW_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
293 WREG32(mmUVD_GP_SCRATCH4, adev->uvd.max_handles);
297 static void cz_set_uvd_clock_gating_branches(struct amdgpu_device *adev,
302 data = RREG32(mmUVD_CGC_GATE);
303 data1 = RREG32(mmUVD_SUVD_CGC_GATE);
305 data |= UVD_CGC_GATE__SYS_MASK |
306 UVD_CGC_GATE__UDEC_MASK |
307 UVD_CGC_GATE__MPEG2_MASK |
308 UVD_CGC_GATE__RBC_MASK |
309 UVD_CGC_GATE__LMI_MC_MASK |
310 UVD_CGC_GATE__IDCT_MASK |
311 UVD_CGC_GATE__MPRD_MASK |
312 UVD_CGC_GATE__MPC_MASK |
313 UVD_CGC_GATE__LBSI_MASK |
314 UVD_CGC_GATE__LRBBM_MASK |
315 UVD_CGC_GATE__UDEC_RE_MASK |
316 UVD_CGC_GATE__UDEC_CM_MASK |
317 UVD_CGC_GATE__UDEC_IT_MASK |
318 UVD_CGC_GATE__UDEC_DB_MASK |
319 UVD_CGC_GATE__UDEC_MP_MASK |
320 UVD_CGC_GATE__WCB_MASK |
321 UVD_CGC_GATE__VCPU_MASK |
322 UVD_CGC_GATE__SCPU_MASK;
323 data1 |= UVD_SUVD_CGC_GATE__SRE_MASK |
324 UVD_SUVD_CGC_GATE__SIT_MASK |
325 UVD_SUVD_CGC_GATE__SMP_MASK |
326 UVD_SUVD_CGC_GATE__SCM_MASK |
327 UVD_SUVD_CGC_GATE__SDB_MASK |
328 UVD_SUVD_CGC_GATE__SRE_H264_MASK |
329 UVD_SUVD_CGC_GATE__SRE_HEVC_MASK |
330 UVD_SUVD_CGC_GATE__SIT_H264_MASK |
331 UVD_SUVD_CGC_GATE__SIT_HEVC_MASK |
332 UVD_SUVD_CGC_GATE__SCM_H264_MASK |
333 UVD_SUVD_CGC_GATE__SCM_HEVC_MASK |
334 UVD_SUVD_CGC_GATE__SDB_H264_MASK |
335 UVD_SUVD_CGC_GATE__SDB_HEVC_MASK;
337 data &= ~(UVD_CGC_GATE__SYS_MASK |
338 UVD_CGC_GATE__UDEC_MASK |
339 UVD_CGC_GATE__MPEG2_MASK |
340 UVD_CGC_GATE__RBC_MASK |
341 UVD_CGC_GATE__LMI_MC_MASK |
342 UVD_CGC_GATE__LMI_UMC_MASK |
343 UVD_CGC_GATE__IDCT_MASK |
344 UVD_CGC_GATE__MPRD_MASK |
345 UVD_CGC_GATE__MPC_MASK |
346 UVD_CGC_GATE__LBSI_MASK |
347 UVD_CGC_GATE__LRBBM_MASK |
348 UVD_CGC_GATE__UDEC_RE_MASK |
349 UVD_CGC_GATE__UDEC_CM_MASK |
350 UVD_CGC_GATE__UDEC_IT_MASK |
351 UVD_CGC_GATE__UDEC_DB_MASK |
352 UVD_CGC_GATE__UDEC_MP_MASK |
353 UVD_CGC_GATE__WCB_MASK |
354 UVD_CGC_GATE__VCPU_MASK |
355 UVD_CGC_GATE__SCPU_MASK);
356 data1 &= ~(UVD_SUVD_CGC_GATE__SRE_MASK |
357 UVD_SUVD_CGC_GATE__SIT_MASK |
358 UVD_SUVD_CGC_GATE__SMP_MASK |
359 UVD_SUVD_CGC_GATE__SCM_MASK |
360 UVD_SUVD_CGC_GATE__SDB_MASK |
361 UVD_SUVD_CGC_GATE__SRE_H264_MASK |
362 UVD_SUVD_CGC_GATE__SRE_HEVC_MASK |
363 UVD_SUVD_CGC_GATE__SIT_H264_MASK |
364 UVD_SUVD_CGC_GATE__SIT_HEVC_MASK |
365 UVD_SUVD_CGC_GATE__SCM_H264_MASK |
366 UVD_SUVD_CGC_GATE__SCM_HEVC_MASK |
367 UVD_SUVD_CGC_GATE__SDB_H264_MASK |
368 UVD_SUVD_CGC_GATE__SDB_HEVC_MASK);
370 WREG32(mmUVD_CGC_GATE, data);
371 WREG32(mmUVD_SUVD_CGC_GATE, data1);
376 * uvd_v6_0_start - start UVD block
378 * @adev: amdgpu_device pointer
380 * Setup and start the UVD block
382 static int uvd_v6_0_start(struct amdgpu_device *adev)
384 struct amdgpu_ring *ring = &adev->uvd.ring;
385 uint32_t rb_bufsz, tmp;
386 uint32_t lmi_swap_cntl;
387 uint32_t mp_swap_cntl;
391 WREG32_P(mmUVD_POWER_STATUS, 0, ~UVD_POWER_STATUS__UVD_PG_MODE_MASK);
393 /* disable byte swapping */
397 uvd_v6_0_mc_resume(adev);
399 /* disable clock gating */
400 WREG32_FIELD(UVD_CGC_CTRL, DYN_CLOCK_MODE, 0);
402 /* disable interupt */
403 WREG32_FIELD(UVD_MASTINT_EN, VCPU_EN, 0);
405 /* stall UMC and register bus before resetting VCPU */
406 WREG32_FIELD(UVD_LMI_CTRL2, STALL_ARB_UMC, 1);
409 /* put LMI, VCPU, RBC etc... into reset */
410 WREG32(mmUVD_SOFT_RESET,
411 UVD_SOFT_RESET__LMI_SOFT_RESET_MASK |
412 UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK |
413 UVD_SOFT_RESET__LBSI_SOFT_RESET_MASK |
414 UVD_SOFT_RESET__RBC_SOFT_RESET_MASK |
415 UVD_SOFT_RESET__CSM_SOFT_RESET_MASK |
416 UVD_SOFT_RESET__CXW_SOFT_RESET_MASK |
417 UVD_SOFT_RESET__TAP_SOFT_RESET_MASK |
418 UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK);
421 /* take UVD block out of reset */
422 WREG32_FIELD(SRBM_SOFT_RESET, SOFT_RESET_UVD, 0);
425 /* initialize UVD memory controller */
426 WREG32(mmUVD_LMI_CTRL,
427 (0x40 << UVD_LMI_CTRL__WRITE_CLEAN_TIMER__SHIFT) |
428 UVD_LMI_CTRL__WRITE_CLEAN_TIMER_EN_MASK |
429 UVD_LMI_CTRL__DATA_COHERENCY_EN_MASK |
430 UVD_LMI_CTRL__VCPU_DATA_COHERENCY_EN_MASK |
431 UVD_LMI_CTRL__REQ_MODE_MASK |
432 UVD_LMI_CTRL__DISABLE_ON_FWV_FAIL_MASK);
435 /* swap (8 in 32) RB and IB */
439 WREG32(mmUVD_LMI_SWAP_CNTL, lmi_swap_cntl);
440 WREG32(mmUVD_MP_SWAP_CNTL, mp_swap_cntl);
442 WREG32(mmUVD_MPC_SET_MUXA0, 0x40c2040);
443 WREG32(mmUVD_MPC_SET_MUXA1, 0x0);
444 WREG32(mmUVD_MPC_SET_MUXB0, 0x40c2040);
445 WREG32(mmUVD_MPC_SET_MUXB1, 0x0);
446 WREG32(mmUVD_MPC_SET_ALU, 0);
447 WREG32(mmUVD_MPC_SET_MUX, 0x88);
449 /* take all subblocks out of reset, except VCPU */
450 WREG32(mmUVD_SOFT_RESET, UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
453 /* enable VCPU clock */
454 WREG32(mmUVD_VCPU_CNTL, UVD_VCPU_CNTL__CLK_EN_MASK);
457 WREG32_FIELD(UVD_LMI_CTRL2, STALL_ARB_UMC, 0);
459 /* boot up the VCPU */
460 WREG32(mmUVD_SOFT_RESET, 0);
463 for (i = 0; i < 10; ++i) {
466 for (j = 0; j < 100; ++j) {
467 status = RREG32(mmUVD_STATUS);
476 DRM_ERROR("UVD not responding, trying to reset the VCPU!!!\n");
477 WREG32_FIELD(UVD_SOFT_RESET, VCPU_SOFT_RESET, 1);
479 WREG32_FIELD(UVD_SOFT_RESET, VCPU_SOFT_RESET, 0);
485 DRM_ERROR("UVD not responding, giving up!!!\n");
488 /* enable master interrupt */
489 WREG32_P(mmUVD_MASTINT_EN,
490 (UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK),
491 ~(UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK));
493 /* clear the bit 4 of UVD_STATUS */
494 WREG32_P(mmUVD_STATUS, 0, ~(2 << UVD_STATUS__VCPU_REPORT__SHIFT));
496 /* force RBC into idle state */
497 rb_bufsz = order_base_2(ring->ring_size);
498 tmp = REG_SET_FIELD(0, UVD_RBC_RB_CNTL, RB_BUFSZ, rb_bufsz);
499 tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_BLKSZ, 1);
500 tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_FETCH, 1);
501 tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_WPTR_POLL_EN, 0);
502 tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_UPDATE, 1);
503 tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_RPTR_WR_EN, 1);
504 WREG32(mmUVD_RBC_RB_CNTL, tmp);
506 /* set the write pointer delay */
507 WREG32(mmUVD_RBC_RB_WPTR_CNTL, 0);
509 /* set the wb address */
510 WREG32(mmUVD_RBC_RB_RPTR_ADDR, (upper_32_bits(ring->gpu_addr) >> 2));
512 /* programm the RB_BASE for ring buffer */
513 WREG32(mmUVD_LMI_RBC_RB_64BIT_BAR_LOW,
514 lower_32_bits(ring->gpu_addr));
515 WREG32(mmUVD_LMI_RBC_RB_64BIT_BAR_HIGH,
516 upper_32_bits(ring->gpu_addr));
518 /* Initialize the ring buffer's read and write pointers */
519 WREG32(mmUVD_RBC_RB_RPTR, 0);
521 ring->wptr = RREG32(mmUVD_RBC_RB_RPTR);
522 WREG32(mmUVD_RBC_RB_WPTR, ring->wptr);
524 WREG32_FIELD(UVD_RBC_RB_CNTL, RB_NO_FETCH, 0);
530 * uvd_v6_0_stop - stop UVD block
532 * @adev: amdgpu_device pointer
536 static void uvd_v6_0_stop(struct amdgpu_device *adev)
538 /* force RBC into idle state */
539 WREG32(mmUVD_RBC_RB_CNTL, 0x11010101);
541 /* Stall UMC and register bus before resetting VCPU */
542 WREG32_P(mmUVD_LMI_CTRL2, 1 << 8, ~(1 << 8));
545 /* put VCPU into reset */
546 WREG32(mmUVD_SOFT_RESET, UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
549 /* disable VCPU clock */
550 WREG32(mmUVD_VCPU_CNTL, 0x0);
552 /* Unstall UMC and register bus */
553 WREG32_P(mmUVD_LMI_CTRL2, 0, ~(1 << 8));
557 * uvd_v6_0_ring_emit_fence - emit an fence & trap command
559 * @ring: amdgpu_ring pointer
560 * @fence: fence to emit
562 * Write a fence and a trap command to the ring.
564 static void uvd_v6_0_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq,
567 WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
569 amdgpu_ring_write(ring, PACKET0(mmUVD_CONTEXT_ID, 0));
570 amdgpu_ring_write(ring, seq);
571 amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
572 amdgpu_ring_write(ring, addr & 0xffffffff);
573 amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
574 amdgpu_ring_write(ring, upper_32_bits(addr) & 0xff);
575 amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
576 amdgpu_ring_write(ring, 0);
578 amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
579 amdgpu_ring_write(ring, 0);
580 amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
581 amdgpu_ring_write(ring, 0);
582 amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
583 amdgpu_ring_write(ring, 2);
587 * uvd_v6_0_ring_emit_hdp_flush - emit an hdp flush
589 * @ring: amdgpu_ring pointer
591 * Emits an hdp flush.
593 static void uvd_v6_0_ring_emit_hdp_flush(struct amdgpu_ring *ring)
595 amdgpu_ring_write(ring, PACKET0(mmHDP_MEM_COHERENCY_FLUSH_CNTL, 0));
596 amdgpu_ring_write(ring, 0);
600 * uvd_v6_0_ring_hdp_invalidate - emit an hdp invalidate
602 * @ring: amdgpu_ring pointer
604 * Emits an hdp invalidate.
606 static void uvd_v6_0_ring_emit_hdp_invalidate(struct amdgpu_ring *ring)
608 amdgpu_ring_write(ring, PACKET0(mmHDP_DEBUG0, 0));
609 amdgpu_ring_write(ring, 1);
613 * uvd_v6_0_ring_test_ring - register write test
615 * @ring: amdgpu_ring pointer
617 * Test if we can successfully write to the context register
619 static int uvd_v6_0_ring_test_ring(struct amdgpu_ring *ring)
621 struct amdgpu_device *adev = ring->adev;
626 WREG32(mmUVD_CONTEXT_ID, 0xCAFEDEAD);
627 r = amdgpu_ring_alloc(ring, 3);
629 DRM_ERROR("amdgpu: cp failed to lock ring %d (%d).\n",
633 amdgpu_ring_write(ring, PACKET0(mmUVD_CONTEXT_ID, 0));
634 amdgpu_ring_write(ring, 0xDEADBEEF);
635 amdgpu_ring_commit(ring);
636 for (i = 0; i < adev->usec_timeout; i++) {
637 tmp = RREG32(mmUVD_CONTEXT_ID);
638 if (tmp == 0xDEADBEEF)
643 if (i < adev->usec_timeout) {
644 DRM_INFO("ring test on %d succeeded in %d usecs\n",
647 DRM_ERROR("amdgpu: ring %d test failed (0x%08X)\n",
655 * uvd_v6_0_ring_emit_ib - execute indirect buffer
657 * @ring: amdgpu_ring pointer
658 * @ib: indirect buffer to execute
660 * Write ring commands to execute the indirect buffer
662 static void uvd_v6_0_ring_emit_ib(struct amdgpu_ring *ring,
663 struct amdgpu_ib *ib,
664 unsigned vm_id, bool ctx_switch)
666 amdgpu_ring_write(ring, PACKET0(mmUVD_LMI_RBC_IB_VMID, 0));
667 amdgpu_ring_write(ring, vm_id);
669 amdgpu_ring_write(ring, PACKET0(mmUVD_LMI_RBC_IB_64BIT_BAR_LOW, 0));
670 amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
671 amdgpu_ring_write(ring, PACKET0(mmUVD_LMI_RBC_IB_64BIT_BAR_HIGH, 0));
672 amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
673 amdgpu_ring_write(ring, PACKET0(mmUVD_RBC_IB_SIZE, 0));
674 amdgpu_ring_write(ring, ib->length_dw);
677 static void uvd_v6_0_ring_emit_vm_flush(struct amdgpu_ring *ring,
678 unsigned vm_id, uint64_t pd_addr)
683 reg = mmVM_CONTEXT0_PAGE_TABLE_BASE_ADDR + vm_id;
685 reg = mmVM_CONTEXT8_PAGE_TABLE_BASE_ADDR + vm_id - 8;
687 amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
688 amdgpu_ring_write(ring, reg << 2);
689 amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
690 amdgpu_ring_write(ring, pd_addr >> 12);
691 amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
692 amdgpu_ring_write(ring, 0x8);
694 amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
695 amdgpu_ring_write(ring, mmVM_INVALIDATE_REQUEST << 2);
696 amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
697 amdgpu_ring_write(ring, 1 << vm_id);
698 amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
699 amdgpu_ring_write(ring, 0x8);
701 amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
702 amdgpu_ring_write(ring, mmVM_INVALIDATE_REQUEST << 2);
703 amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
704 amdgpu_ring_write(ring, 0);
705 amdgpu_ring_write(ring, PACKET0(mmUVD_GP_SCRATCH8, 0));
706 amdgpu_ring_write(ring, 1 << vm_id); /* mask */
707 amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
708 amdgpu_ring_write(ring, 0xC);
711 static void uvd_v6_0_ring_emit_pipeline_sync(struct amdgpu_ring *ring)
713 uint32_t seq = ring->fence_drv.sync_seq;
714 uint64_t addr = ring->fence_drv.gpu_addr;
716 amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
717 amdgpu_ring_write(ring, lower_32_bits(addr));
718 amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
719 amdgpu_ring_write(ring, upper_32_bits(addr));
720 amdgpu_ring_write(ring, PACKET0(mmUVD_GP_SCRATCH8, 0));
721 amdgpu_ring_write(ring, 0xffffffff); /* mask */
722 amdgpu_ring_write(ring, PACKET0(mmUVD_GP_SCRATCH9, 0));
723 amdgpu_ring_write(ring, seq);
724 amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
725 amdgpu_ring_write(ring, 0xE);
728 static unsigned uvd_v6_0_ring_get_emit_ib_size(struct amdgpu_ring *ring)
731 8; /* uvd_v6_0_ring_emit_ib */
734 static unsigned uvd_v6_0_ring_get_dma_frame_size(struct amdgpu_ring *ring)
737 2 + /* uvd_v6_0_ring_emit_hdp_flush */
738 2 + /* uvd_v6_0_ring_emit_hdp_invalidate */
739 10 + /* uvd_v6_0_ring_emit_pipeline_sync */
740 14; /* uvd_v6_0_ring_emit_fence x1 no user fence */
743 static unsigned uvd_v6_0_ring_get_dma_frame_size_vm(struct amdgpu_ring *ring)
746 2 + /* uvd_v6_0_ring_emit_hdp_flush */
747 2 + /* uvd_v6_0_ring_emit_hdp_invalidate */
748 10 + /* uvd_v6_0_ring_emit_pipeline_sync */
749 20 + /* uvd_v6_0_ring_emit_vm_flush */
750 14 + 14; /* uvd_v6_0_ring_emit_fence x2 vm fence */
753 static bool uvd_v6_0_is_idle(void *handle)
755 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
757 return !(RREG32(mmSRBM_STATUS) & SRBM_STATUS__UVD_BUSY_MASK);
760 static int uvd_v6_0_wait_for_idle(void *handle)
763 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
765 for (i = 0; i < adev->usec_timeout; i++) {
766 if (uvd_v6_0_is_idle(handle))
772 #define AMDGPU_UVD_STATUS_BUSY_MASK 0xfd
773 static int uvd_v6_0_check_soft_reset(void *handle)
775 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
776 u32 srbm_soft_reset = 0;
777 u32 tmp = RREG32(mmSRBM_STATUS);
779 if (REG_GET_FIELD(tmp, SRBM_STATUS, UVD_RQ_PENDING) ||
780 REG_GET_FIELD(tmp, SRBM_STATUS, UVD_BUSY) ||
781 (RREG32(mmUVD_STATUS) & AMDGPU_UVD_STATUS_BUSY_MASK))
782 srbm_soft_reset = REG_SET_FIELD(srbm_soft_reset, SRBM_SOFT_RESET, SOFT_RESET_UVD, 1);
784 if (srbm_soft_reset) {
785 adev->ip_block_status[AMD_IP_BLOCK_TYPE_UVD].hang = true;
786 adev->uvd.srbm_soft_reset = srbm_soft_reset;
788 adev->ip_block_status[AMD_IP_BLOCK_TYPE_UVD].hang = false;
789 adev->uvd.srbm_soft_reset = 0;
793 static int uvd_v6_0_pre_soft_reset(void *handle)
795 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
797 if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_UVD].hang)
804 static int uvd_v6_0_soft_reset(void *handle)
806 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
809 if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_UVD].hang)
811 srbm_soft_reset = adev->uvd.srbm_soft_reset;
813 if (srbm_soft_reset) {
816 tmp = RREG32(mmSRBM_SOFT_RESET);
817 tmp |= srbm_soft_reset;
818 dev_info(adev->dev, "SRBM_SOFT_RESET=0x%08X\n", tmp);
819 WREG32(mmSRBM_SOFT_RESET, tmp);
820 tmp = RREG32(mmSRBM_SOFT_RESET);
824 tmp &= ~srbm_soft_reset;
825 WREG32(mmSRBM_SOFT_RESET, tmp);
826 tmp = RREG32(mmSRBM_SOFT_RESET);
828 /* Wait a little for things to settle down */
835 static int uvd_v6_0_post_soft_reset(void *handle)
837 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
839 if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_UVD].hang)
844 return uvd_v6_0_start(adev);
847 static int uvd_v6_0_set_interrupt_state(struct amdgpu_device *adev,
848 struct amdgpu_irq_src *source,
850 enum amdgpu_interrupt_state state)
856 static int uvd_v6_0_process_interrupt(struct amdgpu_device *adev,
857 struct amdgpu_irq_src *source,
858 struct amdgpu_iv_entry *entry)
860 DRM_DEBUG("IH: UVD TRAP\n");
861 amdgpu_fence_process(&adev->uvd.ring);
865 static void uvd_v6_0_set_sw_clock_gating(struct amdgpu_device *adev)
867 uint32_t data, data1, data2, suvd_flags;
869 data = RREG32(mmUVD_CGC_CTRL);
870 data1 = RREG32(mmUVD_SUVD_CGC_GATE);
871 data2 = RREG32(mmUVD_SUVD_CGC_CTRL);
873 data &= ~(UVD_CGC_CTRL__CLK_OFF_DELAY_MASK |
874 UVD_CGC_CTRL__CLK_GATE_DLY_TIMER_MASK);
876 suvd_flags = UVD_SUVD_CGC_GATE__SRE_MASK |
877 UVD_SUVD_CGC_GATE__SIT_MASK |
878 UVD_SUVD_CGC_GATE__SMP_MASK |
879 UVD_SUVD_CGC_GATE__SCM_MASK |
880 UVD_SUVD_CGC_GATE__SDB_MASK;
882 data |= UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK |
883 (1 << REG_FIELD_SHIFT(UVD_CGC_CTRL, CLK_GATE_DLY_TIMER)) |
884 (4 << REG_FIELD_SHIFT(UVD_CGC_CTRL, CLK_OFF_DELAY));
886 data &= ~(UVD_CGC_CTRL__UDEC_RE_MODE_MASK |
887 UVD_CGC_CTRL__UDEC_CM_MODE_MASK |
888 UVD_CGC_CTRL__UDEC_IT_MODE_MASK |
889 UVD_CGC_CTRL__UDEC_DB_MODE_MASK |
890 UVD_CGC_CTRL__UDEC_MP_MODE_MASK |
891 UVD_CGC_CTRL__SYS_MODE_MASK |
892 UVD_CGC_CTRL__UDEC_MODE_MASK |
893 UVD_CGC_CTRL__MPEG2_MODE_MASK |
894 UVD_CGC_CTRL__REGS_MODE_MASK |
895 UVD_CGC_CTRL__RBC_MODE_MASK |
896 UVD_CGC_CTRL__LMI_MC_MODE_MASK |
897 UVD_CGC_CTRL__LMI_UMC_MODE_MASK |
898 UVD_CGC_CTRL__IDCT_MODE_MASK |
899 UVD_CGC_CTRL__MPRD_MODE_MASK |
900 UVD_CGC_CTRL__MPC_MODE_MASK |
901 UVD_CGC_CTRL__LBSI_MODE_MASK |
902 UVD_CGC_CTRL__LRBBM_MODE_MASK |
903 UVD_CGC_CTRL__WCB_MODE_MASK |
904 UVD_CGC_CTRL__VCPU_MODE_MASK |
905 UVD_CGC_CTRL__JPEG_MODE_MASK |
906 UVD_CGC_CTRL__SCPU_MODE_MASK |
907 UVD_CGC_CTRL__JPEG2_MODE_MASK);
908 data2 &= ~(UVD_SUVD_CGC_CTRL__SRE_MODE_MASK |
909 UVD_SUVD_CGC_CTRL__SIT_MODE_MASK |
910 UVD_SUVD_CGC_CTRL__SMP_MODE_MASK |
911 UVD_SUVD_CGC_CTRL__SCM_MODE_MASK |
912 UVD_SUVD_CGC_CTRL__SDB_MODE_MASK);
915 WREG32(mmUVD_CGC_CTRL, data);
916 WREG32(mmUVD_CGC_GATE, 0);
917 WREG32(mmUVD_SUVD_CGC_GATE, data1);
918 WREG32(mmUVD_SUVD_CGC_CTRL, data2);
922 static void uvd_v6_0_set_hw_clock_gating(struct amdgpu_device *adev)
924 uint32_t data, data1, cgc_flags, suvd_flags;
926 data = RREG32(mmUVD_CGC_GATE);
927 data1 = RREG32(mmUVD_SUVD_CGC_GATE);
929 cgc_flags = UVD_CGC_GATE__SYS_MASK |
930 UVD_CGC_GATE__UDEC_MASK |
931 UVD_CGC_GATE__MPEG2_MASK |
932 UVD_CGC_GATE__RBC_MASK |
933 UVD_CGC_GATE__LMI_MC_MASK |
934 UVD_CGC_GATE__IDCT_MASK |
935 UVD_CGC_GATE__MPRD_MASK |
936 UVD_CGC_GATE__MPC_MASK |
937 UVD_CGC_GATE__LBSI_MASK |
938 UVD_CGC_GATE__LRBBM_MASK |
939 UVD_CGC_GATE__UDEC_RE_MASK |
940 UVD_CGC_GATE__UDEC_CM_MASK |
941 UVD_CGC_GATE__UDEC_IT_MASK |
942 UVD_CGC_GATE__UDEC_DB_MASK |
943 UVD_CGC_GATE__UDEC_MP_MASK |
944 UVD_CGC_GATE__WCB_MASK |
945 UVD_CGC_GATE__VCPU_MASK |
946 UVD_CGC_GATE__SCPU_MASK |
947 UVD_CGC_GATE__JPEG_MASK |
948 UVD_CGC_GATE__JPEG2_MASK;
950 suvd_flags = UVD_SUVD_CGC_GATE__SRE_MASK |
951 UVD_SUVD_CGC_GATE__SIT_MASK |
952 UVD_SUVD_CGC_GATE__SMP_MASK |
953 UVD_SUVD_CGC_GATE__SCM_MASK |
954 UVD_SUVD_CGC_GATE__SDB_MASK;
959 WREG32(mmUVD_CGC_GATE, data);
960 WREG32(mmUVD_SUVD_CGC_GATE, data1);
964 static void uvd_v6_set_bypass_mode(struct amdgpu_device *adev, bool enable)
966 u32 tmp = RREG32_SMC(ixGCK_DFS_BYPASS_CNTL);
969 tmp |= (GCK_DFS_BYPASS_CNTL__BYPASSDCLK_MASK |
970 GCK_DFS_BYPASS_CNTL__BYPASSVCLK_MASK);
972 tmp &= ~(GCK_DFS_BYPASS_CNTL__BYPASSDCLK_MASK |
973 GCK_DFS_BYPASS_CNTL__BYPASSVCLK_MASK);
975 WREG32_SMC(ixGCK_DFS_BYPASS_CNTL, tmp);
978 static int uvd_v6_0_set_clockgating_state(void *handle,
979 enum amd_clockgating_state state)
981 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
983 if (adev->asic_type == CHIP_FIJI ||
984 adev->asic_type == CHIP_POLARIS10)
985 uvd_v6_set_bypass_mode(adev, state == AMD_CG_STATE_GATE ? true : false);
987 if (!(adev->cg_flags & AMD_CG_SUPPORT_UVD_MGCG))
990 if (state == AMD_CG_STATE_GATE) {
991 /* disable HW gating and enable Sw gating */
992 uvd_v6_0_set_sw_clock_gating(adev);
994 /* wait for STATUS to clear */
995 if (uvd_v6_0_wait_for_idle(handle))
998 /* enable HW gates because UVD is idle */
999 /* uvd_v6_0_set_hw_clock_gating(adev); */
1005 static int uvd_v6_0_set_powergating_state(void *handle,
1006 enum amd_powergating_state state)
1008 /* This doesn't actually powergate the UVD block.
1009 * That's done in the dpm code via the SMC. This
1010 * just re-inits the block as necessary. The actual
1011 * gating still happens in the dpm code. We should
1012 * revisit this when there is a cleaner line between
1013 * the smc and the hw blocks
1015 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1017 if (!(adev->pg_flags & AMD_PG_SUPPORT_UVD))
1020 WREG32(mmUVD_POWER_STATUS, UVD_POWER_STATUS__UVD_PG_EN_MASK);
1022 if (state == AMD_PG_STATE_GATE) {
1023 uvd_v6_0_stop(adev);
1026 return uvd_v6_0_start(adev);
1030 const struct amd_ip_funcs uvd_v6_0_ip_funcs = {
1032 .early_init = uvd_v6_0_early_init,
1034 .sw_init = uvd_v6_0_sw_init,
1035 .sw_fini = uvd_v6_0_sw_fini,
1036 .hw_init = uvd_v6_0_hw_init,
1037 .hw_fini = uvd_v6_0_hw_fini,
1038 .suspend = uvd_v6_0_suspend,
1039 .resume = uvd_v6_0_resume,
1040 .is_idle = uvd_v6_0_is_idle,
1041 .wait_for_idle = uvd_v6_0_wait_for_idle,
1042 .check_soft_reset = uvd_v6_0_check_soft_reset,
1043 .pre_soft_reset = uvd_v6_0_pre_soft_reset,
1044 .soft_reset = uvd_v6_0_soft_reset,
1045 .post_soft_reset = uvd_v6_0_post_soft_reset,
1046 .set_clockgating_state = uvd_v6_0_set_clockgating_state,
1047 .set_powergating_state = uvd_v6_0_set_powergating_state,
1050 static const struct amdgpu_ring_funcs uvd_v6_0_ring_phys_funcs = {
1051 .get_rptr = uvd_v6_0_ring_get_rptr,
1052 .get_wptr = uvd_v6_0_ring_get_wptr,
1053 .set_wptr = uvd_v6_0_ring_set_wptr,
1054 .parse_cs = amdgpu_uvd_ring_parse_cs,
1055 .emit_ib = uvd_v6_0_ring_emit_ib,
1056 .emit_fence = uvd_v6_0_ring_emit_fence,
1057 .emit_hdp_flush = uvd_v6_0_ring_emit_hdp_flush,
1058 .emit_hdp_invalidate = uvd_v6_0_ring_emit_hdp_invalidate,
1059 .test_ring = uvd_v6_0_ring_test_ring,
1060 .test_ib = amdgpu_uvd_ring_test_ib,
1061 .insert_nop = amdgpu_ring_insert_nop,
1062 .pad_ib = amdgpu_ring_generic_pad_ib,
1063 .begin_use = amdgpu_uvd_ring_begin_use,
1064 .end_use = amdgpu_uvd_ring_end_use,
1065 .get_emit_ib_size = uvd_v6_0_ring_get_emit_ib_size,
1066 .get_dma_frame_size = uvd_v6_0_ring_get_dma_frame_size,
1069 static const struct amdgpu_ring_funcs uvd_v6_0_ring_vm_funcs = {
1070 .get_rptr = uvd_v6_0_ring_get_rptr,
1071 .get_wptr = uvd_v6_0_ring_get_wptr,
1072 .set_wptr = uvd_v6_0_ring_set_wptr,
1074 .emit_ib = uvd_v6_0_ring_emit_ib,
1075 .emit_fence = uvd_v6_0_ring_emit_fence,
1076 .emit_vm_flush = uvd_v6_0_ring_emit_vm_flush,
1077 .emit_pipeline_sync = uvd_v6_0_ring_emit_pipeline_sync,
1078 .emit_hdp_flush = uvd_v6_0_ring_emit_hdp_flush,
1079 .emit_hdp_invalidate = uvd_v6_0_ring_emit_hdp_invalidate,
1080 .test_ring = uvd_v6_0_ring_test_ring,
1081 .test_ib = amdgpu_uvd_ring_test_ib,
1082 .insert_nop = amdgpu_ring_insert_nop,
1083 .pad_ib = amdgpu_ring_generic_pad_ib,
1084 .begin_use = amdgpu_uvd_ring_begin_use,
1085 .end_use = amdgpu_uvd_ring_end_use,
1086 .get_emit_ib_size = uvd_v6_0_ring_get_emit_ib_size,
1087 .get_dma_frame_size = uvd_v6_0_ring_get_dma_frame_size_vm,
1090 static void uvd_v6_0_set_ring_funcs(struct amdgpu_device *adev)
1092 if (adev->asic_type >= CHIP_POLARIS10) {
1093 adev->uvd.ring.funcs = &uvd_v6_0_ring_vm_funcs;
1094 DRM_INFO("UVD is enabled in VM mode\n");
1096 adev->uvd.ring.funcs = &uvd_v6_0_ring_phys_funcs;
1097 DRM_INFO("UVD is enabled in physical mode\n");
1101 static const struct amdgpu_irq_src_funcs uvd_v6_0_irq_funcs = {
1102 .set = uvd_v6_0_set_interrupt_state,
1103 .process = uvd_v6_0_process_interrupt,
1106 static void uvd_v6_0_set_irq_funcs(struct amdgpu_device *adev)
1108 adev->uvd.irq.num_types = 1;
1109 adev->uvd.irq.funcs = &uvd_v6_0_irq_funcs;