2 * Copyright 2016 Advanced Micro Devices, Inc.
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
24 #include <linux/firmware.h>
27 #include "amdgpu_vcn.h"
30 #include "soc15_common.h"
32 #include "vcn/vcn_1_0_offset.h"
33 #include "vcn/vcn_1_0_sh_mask.h"
34 #include "hdp/hdp_4_0_offset.h"
35 #include "mmhub/mmhub_9_1_offset.h"
36 #include "mmhub/mmhub_9_1_sh_mask.h"
38 #include "ivsrcid/vcn/irqsrcs_vcn_1_0.h"
40 static int vcn_v1_0_stop(struct amdgpu_device *adev);
41 static void vcn_v1_0_set_dec_ring_funcs(struct amdgpu_device *adev);
42 static void vcn_v1_0_set_enc_ring_funcs(struct amdgpu_device *adev);
43 static void vcn_v1_0_set_jpeg_ring_funcs(struct amdgpu_device *adev);
44 static void vcn_v1_0_set_irq_funcs(struct amdgpu_device *adev);
45 static void vcn_v1_0_jpeg_ring_set_patch_ring(struct amdgpu_ring *ring, uint32_t ptr);
48 * vcn_v1_0_early_init - set function pointers
50 * @handle: amdgpu_device pointer
52 * Set ring and irq function pointers
54 static int vcn_v1_0_early_init(void *handle)
56 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
58 adev->vcn.num_enc_rings = 2;
60 vcn_v1_0_set_dec_ring_funcs(adev);
61 vcn_v1_0_set_enc_ring_funcs(adev);
62 vcn_v1_0_set_jpeg_ring_funcs(adev);
63 vcn_v1_0_set_irq_funcs(adev);
69 * vcn_v1_0_sw_init - sw init for VCN block
71 * @handle: amdgpu_device pointer
73 * Load firmware and sw initialization
75 static int vcn_v1_0_sw_init(void *handle)
77 struct amdgpu_ring *ring;
79 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
82 r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_VCN, VCN_1_0__SRCID__UVD_SYSTEM_MESSAGE_INTERRUPT, &adev->vcn.irq);
87 for (i = 0; i < adev->vcn.num_enc_rings; ++i) {
88 r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_VCN, i + VCN_1_0__SRCID__UVD_ENC_GENERAL_PURPOSE,
95 r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_VCN, 126, &adev->vcn.irq);
99 r = amdgpu_vcn_sw_init(adev);
103 if (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) {
104 const struct common_firmware_header *hdr;
105 hdr = (const struct common_firmware_header *)adev->vcn.fw->data;
106 adev->firmware.ucode[AMDGPU_UCODE_ID_VCN].ucode_id = AMDGPU_UCODE_ID_VCN;
107 adev->firmware.ucode[AMDGPU_UCODE_ID_VCN].fw = adev->vcn.fw;
108 adev->firmware.fw_size +=
109 ALIGN(le32_to_cpu(hdr->ucode_size_bytes), PAGE_SIZE);
110 DRM_INFO("PSP loading VCN firmware\n");
113 r = amdgpu_vcn_resume(adev);
117 ring = &adev->vcn.ring_dec;
118 sprintf(ring->name, "vcn_dec");
119 r = amdgpu_ring_init(adev, ring, 512, &adev->vcn.irq, 0);
123 for (i = 0; i < adev->vcn.num_enc_rings; ++i) {
124 ring = &adev->vcn.ring_enc[i];
125 sprintf(ring->name, "vcn_enc%d", i);
126 r = amdgpu_ring_init(adev, ring, 512, &adev->vcn.irq, 0);
131 ring = &adev->vcn.ring_jpeg;
132 sprintf(ring->name, "vcn_jpeg");
133 r = amdgpu_ring_init(adev, ring, 512, &adev->vcn.irq, 0);
141 * vcn_v1_0_sw_fini - sw fini for VCN block
143 * @handle: amdgpu_device pointer
145 * VCN suspend and free up sw allocation
147 static int vcn_v1_0_sw_fini(void *handle)
150 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
152 r = amdgpu_vcn_suspend(adev);
156 r = amdgpu_vcn_sw_fini(adev);
162 * vcn_v1_0_hw_init - start and test VCN block
164 * @handle: amdgpu_device pointer
166 * Initialize the hardware, boot up the VCPU and do some testing
168 static int vcn_v1_0_hw_init(void *handle)
170 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
171 struct amdgpu_ring *ring = &adev->vcn.ring_dec;
175 r = amdgpu_ring_test_ring(ring);
181 for (i = 0; i < adev->vcn.num_enc_rings; ++i) {
182 ring = &adev->vcn.ring_enc[i];
184 r = amdgpu_ring_test_ring(ring);
191 ring = &adev->vcn.ring_jpeg;
193 r = amdgpu_ring_test_ring(ring);
201 DRM_INFO("VCN decode and encode initialized successfully.\n");
207 * vcn_v1_0_hw_fini - stop the hardware block
209 * @handle: amdgpu_device pointer
211 * Stop the VCN block, mark ring as not ready any more
213 static int vcn_v1_0_hw_fini(void *handle)
215 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
216 struct amdgpu_ring *ring = &adev->vcn.ring_dec;
218 if (RREG32_SOC15(VCN, 0, mmUVD_STATUS))
227 * vcn_v1_0_suspend - suspend VCN block
229 * @handle: amdgpu_device pointer
231 * HW fini and suspend VCN block
233 static int vcn_v1_0_suspend(void *handle)
236 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
238 r = vcn_v1_0_hw_fini(adev);
242 r = amdgpu_vcn_suspend(adev);
248 * vcn_v1_0_resume - resume VCN block
250 * @handle: amdgpu_device pointer
252 * Resume firmware and hw init VCN block
254 static int vcn_v1_0_resume(void *handle)
257 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
259 r = amdgpu_vcn_resume(adev);
263 r = vcn_v1_0_hw_init(adev);
269 * vcn_v1_0_mc_resume - memory controller programming
271 * @adev: amdgpu_device pointer
273 * Let the VCN memory controller know its offsets
275 static void vcn_v1_0_mc_resume(struct amdgpu_device *adev)
277 uint32_t size = AMDGPU_GPU_PAGE_ALIGN(adev->vcn.fw->size + 4);
280 if (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) {
281 WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
282 (adev->firmware.ucode[AMDGPU_UCODE_ID_VCN].tmr_mc_addr_lo));
283 WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
284 (adev->firmware.ucode[AMDGPU_UCODE_ID_VCN].tmr_mc_addr_hi));
285 WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET0, 0);
288 WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
289 lower_32_bits(adev->vcn.gpu_addr));
290 WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
291 upper_32_bits(adev->vcn.gpu_addr));
293 WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET0,
294 AMDGPU_UVD_FIRMWARE_OFFSET >> 3);
297 WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_SIZE0, size);
299 WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_LOW,
300 lower_32_bits(adev->vcn.gpu_addr + offset));
301 WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_HIGH,
302 upper_32_bits(adev->vcn.gpu_addr + offset));
303 WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET1, 0);
304 WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_SIZE1, AMDGPU_VCN_HEAP_SIZE);
306 WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_LOW,
307 lower_32_bits(adev->vcn.gpu_addr + offset + AMDGPU_VCN_HEAP_SIZE));
308 WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_HIGH,
309 upper_32_bits(adev->vcn.gpu_addr + offset + AMDGPU_VCN_HEAP_SIZE));
310 WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET2, 0);
311 WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_SIZE2,
312 AMDGPU_VCN_STACK_SIZE + (AMDGPU_VCN_SESSION_SIZE * 40));
314 WREG32_SOC15(UVD, 0, mmUVD_UDEC_ADDR_CONFIG,
315 adev->gfx.config.gb_addr_config);
316 WREG32_SOC15(UVD, 0, mmUVD_UDEC_DB_ADDR_CONFIG,
317 adev->gfx.config.gb_addr_config);
318 WREG32_SOC15(UVD, 0, mmUVD_UDEC_DBW_ADDR_CONFIG,
319 adev->gfx.config.gb_addr_config);
323 * vcn_v1_0_disable_clock_gating - disable VCN clock gating
325 * @adev: amdgpu_device pointer
326 * @sw: enable SW clock gating
328 * Disable clock gating for VCN block
330 static void vcn_v1_0_disable_clock_gating(struct amdgpu_device *adev)
334 /* JPEG disable CGC */
335 data = RREG32_SOC15(VCN, 0, mmJPEG_CGC_CTRL);
337 if (adev->cg_flags & AMD_CG_SUPPORT_VCN_MGCG)
338 data |= 1 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
340 data &= ~JPEG_CGC_CTRL__DYN_CLOCK_MODE_MASK;
342 data |= 1 << JPEG_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
343 data |= 4 << JPEG_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
344 WREG32_SOC15(VCN, 0, mmJPEG_CGC_CTRL, data);
346 data = RREG32_SOC15(VCN, 0, mmJPEG_CGC_GATE);
347 data &= ~(JPEG_CGC_GATE__JPEG_MASK | JPEG_CGC_GATE__JPEG2_MASK);
348 WREG32_SOC15(VCN, 0, mmJPEG_CGC_GATE, data);
350 /* UVD disable CGC */
351 data = RREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL);
352 if (adev->cg_flags & AMD_CG_SUPPORT_VCN_MGCG)
353 data |= 1 << UVD_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
355 data &= ~ UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK;
357 data |= 1 << UVD_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
358 data |= 4 << UVD_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
359 WREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL, data);
361 data = RREG32_SOC15(VCN, 0, mmUVD_CGC_GATE);
362 data &= ~(UVD_CGC_GATE__SYS_MASK
363 | UVD_CGC_GATE__UDEC_MASK
364 | UVD_CGC_GATE__MPEG2_MASK
365 | UVD_CGC_GATE__REGS_MASK
366 | UVD_CGC_GATE__RBC_MASK
367 | UVD_CGC_GATE__LMI_MC_MASK
368 | UVD_CGC_GATE__LMI_UMC_MASK
369 | UVD_CGC_GATE__IDCT_MASK
370 | UVD_CGC_GATE__MPRD_MASK
371 | UVD_CGC_GATE__MPC_MASK
372 | UVD_CGC_GATE__LBSI_MASK
373 | UVD_CGC_GATE__LRBBM_MASK
374 | UVD_CGC_GATE__UDEC_RE_MASK
375 | UVD_CGC_GATE__UDEC_CM_MASK
376 | UVD_CGC_GATE__UDEC_IT_MASK
377 | UVD_CGC_GATE__UDEC_DB_MASK
378 | UVD_CGC_GATE__UDEC_MP_MASK
379 | UVD_CGC_GATE__WCB_MASK
380 | UVD_CGC_GATE__VCPU_MASK
381 | UVD_CGC_GATE__SCPU_MASK);
382 WREG32_SOC15(VCN, 0, mmUVD_CGC_GATE, data);
384 data = RREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL);
385 data &= ~(UVD_CGC_CTRL__UDEC_RE_MODE_MASK
386 | UVD_CGC_CTRL__UDEC_CM_MODE_MASK
387 | UVD_CGC_CTRL__UDEC_IT_MODE_MASK
388 | UVD_CGC_CTRL__UDEC_DB_MODE_MASK
389 | UVD_CGC_CTRL__UDEC_MP_MODE_MASK
390 | UVD_CGC_CTRL__SYS_MODE_MASK
391 | UVD_CGC_CTRL__UDEC_MODE_MASK
392 | UVD_CGC_CTRL__MPEG2_MODE_MASK
393 | UVD_CGC_CTRL__REGS_MODE_MASK
394 | UVD_CGC_CTRL__RBC_MODE_MASK
395 | UVD_CGC_CTRL__LMI_MC_MODE_MASK
396 | UVD_CGC_CTRL__LMI_UMC_MODE_MASK
397 | UVD_CGC_CTRL__IDCT_MODE_MASK
398 | UVD_CGC_CTRL__MPRD_MODE_MASK
399 | UVD_CGC_CTRL__MPC_MODE_MASK
400 | UVD_CGC_CTRL__LBSI_MODE_MASK
401 | UVD_CGC_CTRL__LRBBM_MODE_MASK
402 | UVD_CGC_CTRL__WCB_MODE_MASK
403 | UVD_CGC_CTRL__VCPU_MODE_MASK
404 | UVD_CGC_CTRL__SCPU_MODE_MASK);
405 WREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL, data);
408 data = RREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_GATE);
409 data |= (UVD_SUVD_CGC_GATE__SRE_MASK
410 | UVD_SUVD_CGC_GATE__SIT_MASK
411 | UVD_SUVD_CGC_GATE__SMP_MASK
412 | UVD_SUVD_CGC_GATE__SCM_MASK
413 | UVD_SUVD_CGC_GATE__SDB_MASK
414 | UVD_SUVD_CGC_GATE__SRE_H264_MASK
415 | UVD_SUVD_CGC_GATE__SRE_HEVC_MASK
416 | UVD_SUVD_CGC_GATE__SIT_H264_MASK
417 | UVD_SUVD_CGC_GATE__SIT_HEVC_MASK
418 | UVD_SUVD_CGC_GATE__SCM_H264_MASK
419 | UVD_SUVD_CGC_GATE__SCM_HEVC_MASK
420 | UVD_SUVD_CGC_GATE__SDB_H264_MASK
421 | UVD_SUVD_CGC_GATE__SDB_HEVC_MASK
422 | UVD_SUVD_CGC_GATE__SCLR_MASK
423 | UVD_SUVD_CGC_GATE__UVD_SC_MASK
424 | UVD_SUVD_CGC_GATE__ENT_MASK
425 | UVD_SUVD_CGC_GATE__SIT_HEVC_DEC_MASK
426 | UVD_SUVD_CGC_GATE__SIT_HEVC_ENC_MASK
427 | UVD_SUVD_CGC_GATE__SITE_MASK
428 | UVD_SUVD_CGC_GATE__SRE_VP9_MASK
429 | UVD_SUVD_CGC_GATE__SCM_VP9_MASK
430 | UVD_SUVD_CGC_GATE__SIT_VP9_DEC_MASK
431 | UVD_SUVD_CGC_GATE__SDB_VP9_MASK
432 | UVD_SUVD_CGC_GATE__IME_HEVC_MASK);
433 WREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_GATE, data);
435 data = RREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_CTRL);
436 data &= ~(UVD_SUVD_CGC_CTRL__SRE_MODE_MASK
437 | UVD_SUVD_CGC_CTRL__SIT_MODE_MASK
438 | UVD_SUVD_CGC_CTRL__SMP_MODE_MASK
439 | UVD_SUVD_CGC_CTRL__SCM_MODE_MASK
440 | UVD_SUVD_CGC_CTRL__SDB_MODE_MASK
441 | UVD_SUVD_CGC_CTRL__SCLR_MODE_MASK
442 | UVD_SUVD_CGC_CTRL__UVD_SC_MODE_MASK
443 | UVD_SUVD_CGC_CTRL__ENT_MODE_MASK
444 | UVD_SUVD_CGC_CTRL__IME_MODE_MASK
445 | UVD_SUVD_CGC_CTRL__SITE_MODE_MASK);
446 WREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_CTRL, data);
450 * vcn_v1_0_enable_clock_gating - enable VCN clock gating
452 * @adev: amdgpu_device pointer
453 * @sw: enable SW clock gating
455 * Enable clock gating for VCN block
457 static void vcn_v1_0_enable_clock_gating(struct amdgpu_device *adev)
461 /* enable JPEG CGC */
462 data = RREG32_SOC15(VCN, 0, mmJPEG_CGC_CTRL);
463 if (adev->cg_flags & AMD_CG_SUPPORT_VCN_MGCG)
464 data |= 1 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
466 data |= 0 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
467 data |= 1 << JPEG_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
468 data |= 4 << JPEG_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
469 WREG32_SOC15(VCN, 0, mmJPEG_CGC_CTRL, data);
471 data = RREG32_SOC15(VCN, 0, mmJPEG_CGC_GATE);
472 data |= (JPEG_CGC_GATE__JPEG_MASK | JPEG_CGC_GATE__JPEG2_MASK);
473 WREG32_SOC15(VCN, 0, mmJPEG_CGC_GATE, data);
476 data = RREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL);
477 if (adev->cg_flags & AMD_CG_SUPPORT_VCN_MGCG)
478 data |= 1 << UVD_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
480 data |= 0 << UVD_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
481 data |= 1 << UVD_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
482 data |= 4 << UVD_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
483 WREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL, data);
485 data = RREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL);
486 data |= (UVD_CGC_CTRL__UDEC_RE_MODE_MASK
487 | UVD_CGC_CTRL__UDEC_CM_MODE_MASK
488 | UVD_CGC_CTRL__UDEC_IT_MODE_MASK
489 | UVD_CGC_CTRL__UDEC_DB_MODE_MASK
490 | UVD_CGC_CTRL__UDEC_MP_MODE_MASK
491 | UVD_CGC_CTRL__SYS_MODE_MASK
492 | UVD_CGC_CTRL__UDEC_MODE_MASK
493 | UVD_CGC_CTRL__MPEG2_MODE_MASK
494 | UVD_CGC_CTRL__REGS_MODE_MASK
495 | UVD_CGC_CTRL__RBC_MODE_MASK
496 | UVD_CGC_CTRL__LMI_MC_MODE_MASK
497 | UVD_CGC_CTRL__LMI_UMC_MODE_MASK
498 | UVD_CGC_CTRL__IDCT_MODE_MASK
499 | UVD_CGC_CTRL__MPRD_MODE_MASK
500 | UVD_CGC_CTRL__MPC_MODE_MASK
501 | UVD_CGC_CTRL__LBSI_MODE_MASK
502 | UVD_CGC_CTRL__LRBBM_MODE_MASK
503 | UVD_CGC_CTRL__WCB_MODE_MASK
504 | UVD_CGC_CTRL__VCPU_MODE_MASK
505 | UVD_CGC_CTRL__SCPU_MODE_MASK);
506 WREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL, data);
508 data = RREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_CTRL);
509 data |= (UVD_SUVD_CGC_CTRL__SRE_MODE_MASK
510 | UVD_SUVD_CGC_CTRL__SIT_MODE_MASK
511 | UVD_SUVD_CGC_CTRL__SMP_MODE_MASK
512 | UVD_SUVD_CGC_CTRL__SCM_MODE_MASK
513 | UVD_SUVD_CGC_CTRL__SDB_MODE_MASK
514 | UVD_SUVD_CGC_CTRL__SCLR_MODE_MASK
515 | UVD_SUVD_CGC_CTRL__UVD_SC_MODE_MASK
516 | UVD_SUVD_CGC_CTRL__ENT_MODE_MASK
517 | UVD_SUVD_CGC_CTRL__IME_MODE_MASK
518 | UVD_SUVD_CGC_CTRL__SITE_MODE_MASK);
519 WREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_CTRL, data);
522 static void vcn_1_0_disable_static_power_gating(struct amdgpu_device *adev)
527 if (adev->pg_flags & AMD_PG_SUPPORT_VCN) {
528 data = (1 << UVD_PGFSM_CONFIG__UVDM_PWR_CONFIG__SHIFT
529 | 1 << UVD_PGFSM_CONFIG__UVDU_PWR_CONFIG__SHIFT
530 | 2 << UVD_PGFSM_CONFIG__UVDF_PWR_CONFIG__SHIFT
531 | 2 << UVD_PGFSM_CONFIG__UVDC_PWR_CONFIG__SHIFT
532 | 2 << UVD_PGFSM_CONFIG__UVDB_PWR_CONFIG__SHIFT
533 | 2 << UVD_PGFSM_CONFIG__UVDIL_PWR_CONFIG__SHIFT
534 | 2 << UVD_PGFSM_CONFIG__UVDIR_PWR_CONFIG__SHIFT
535 | 2 << UVD_PGFSM_CONFIG__UVDTD_PWR_CONFIG__SHIFT
536 | 2 << UVD_PGFSM_CONFIG__UVDTE_PWR_CONFIG__SHIFT
537 | 2 << UVD_PGFSM_CONFIG__UVDE_PWR_CONFIG__SHIFT
538 | 2 << UVD_PGFSM_CONFIG__UVDW_PWR_CONFIG__SHIFT);
540 WREG32_SOC15(VCN, 0, mmUVD_PGFSM_CONFIG, data);
541 SOC15_WAIT_ON_RREG(VCN, 0, mmUVD_PGFSM_STATUS, UVD_PGFSM_STATUS__UVDM_UVDU_PWR_ON, 0xFFFFFF, ret);
543 data = (1 << UVD_PGFSM_CONFIG__UVDM_PWR_CONFIG__SHIFT
544 | 1 << UVD_PGFSM_CONFIG__UVDU_PWR_CONFIG__SHIFT
545 | 1 << UVD_PGFSM_CONFIG__UVDF_PWR_CONFIG__SHIFT
546 | 1 << UVD_PGFSM_CONFIG__UVDC_PWR_CONFIG__SHIFT
547 | 1 << UVD_PGFSM_CONFIG__UVDB_PWR_CONFIG__SHIFT
548 | 1 << UVD_PGFSM_CONFIG__UVDIL_PWR_CONFIG__SHIFT
549 | 1 << UVD_PGFSM_CONFIG__UVDIR_PWR_CONFIG__SHIFT
550 | 1 << UVD_PGFSM_CONFIG__UVDTD_PWR_CONFIG__SHIFT
551 | 1 << UVD_PGFSM_CONFIG__UVDTE_PWR_CONFIG__SHIFT
552 | 1 << UVD_PGFSM_CONFIG__UVDE_PWR_CONFIG__SHIFT
553 | 1 << UVD_PGFSM_CONFIG__UVDW_PWR_CONFIG__SHIFT);
554 WREG32_SOC15(VCN, 0, mmUVD_PGFSM_CONFIG, data);
555 SOC15_WAIT_ON_RREG(VCN, 0, mmUVD_PGFSM_STATUS, 0, 0xFFFFFFFF, ret);
558 /* polling UVD_PGFSM_STATUS to confirm UVDM_PWR_STATUS, UVDU_PWR_STATUS are 0 (power on) */
560 data = RREG32_SOC15(VCN, 0, mmUVD_POWER_STATUS);
562 if (adev->pg_flags & AMD_PG_SUPPORT_VCN)
563 data |= UVD_PGFSM_CONFIG__UVDM_UVDU_PWR_ON | UVD_POWER_STATUS__UVD_PG_EN_MASK;
565 WREG32_SOC15(VCN, 0, mmUVD_POWER_STATUS, data);
568 static void vcn_1_0_enable_static_power_gating(struct amdgpu_device *adev)
573 if (adev->pg_flags & AMD_PG_SUPPORT_VCN) {
574 /* Before power off, this indicator has to be turned on */
575 data = RREG32_SOC15(VCN, 0, mmUVD_POWER_STATUS);
576 data &= ~UVD_POWER_STATUS__UVD_POWER_STATUS_MASK;
577 data |= UVD_POWER_STATUS__UVD_POWER_STATUS_TILES_OFF;
578 WREG32_SOC15(VCN, 0, mmUVD_POWER_STATUS, data);
581 data = (2 << UVD_PGFSM_CONFIG__UVDM_PWR_CONFIG__SHIFT
582 | 2 << UVD_PGFSM_CONFIG__UVDU_PWR_CONFIG__SHIFT
583 | 2 << UVD_PGFSM_CONFIG__UVDF_PWR_CONFIG__SHIFT
584 | 2 << UVD_PGFSM_CONFIG__UVDC_PWR_CONFIG__SHIFT
585 | 2 << UVD_PGFSM_CONFIG__UVDB_PWR_CONFIG__SHIFT
586 | 2 << UVD_PGFSM_CONFIG__UVDIL_PWR_CONFIG__SHIFT
587 | 2 << UVD_PGFSM_CONFIG__UVDIR_PWR_CONFIG__SHIFT
588 | 2 << UVD_PGFSM_CONFIG__UVDTD_PWR_CONFIG__SHIFT
589 | 2 << UVD_PGFSM_CONFIG__UVDTE_PWR_CONFIG__SHIFT
590 | 2 << UVD_PGFSM_CONFIG__UVDE_PWR_CONFIG__SHIFT
591 | 2 << UVD_PGFSM_CONFIG__UVDW_PWR_CONFIG__SHIFT);
593 WREG32_SOC15(VCN, 0, mmUVD_PGFSM_CONFIG, data);
595 data = (2 << UVD_PGFSM_STATUS__UVDM_PWR_STATUS__SHIFT
596 | 2 << UVD_PGFSM_STATUS__UVDU_PWR_STATUS__SHIFT
597 | 2 << UVD_PGFSM_STATUS__UVDF_PWR_STATUS__SHIFT
598 | 2 << UVD_PGFSM_STATUS__UVDC_PWR_STATUS__SHIFT
599 | 2 << UVD_PGFSM_STATUS__UVDB_PWR_STATUS__SHIFT
600 | 2 << UVD_PGFSM_STATUS__UVDIL_PWR_STATUS__SHIFT
601 | 2 << UVD_PGFSM_STATUS__UVDIR_PWR_STATUS__SHIFT
602 | 2 << UVD_PGFSM_STATUS__UVDTD_PWR_STATUS__SHIFT
603 | 2 << UVD_PGFSM_STATUS__UVDTE_PWR_STATUS__SHIFT
604 | 2 << UVD_PGFSM_STATUS__UVDE_PWR_STATUS__SHIFT
605 | 2 << UVD_PGFSM_STATUS__UVDW_PWR_STATUS__SHIFT);
606 SOC15_WAIT_ON_RREG(VCN, 0, mmUVD_PGFSM_STATUS, data, 0xFFFFFFFF, ret);
611 * vcn_v1_0_start - start VCN block
613 * @adev: amdgpu_device pointer
615 * Setup and start the VCN block
617 static int vcn_v1_0_start(struct amdgpu_device *adev)
619 struct amdgpu_ring *ring = &adev->vcn.ring_dec;
620 uint32_t rb_bufsz, tmp;
621 uint32_t lmi_swap_cntl;
624 /* disable byte swapping */
627 vcn_1_0_disable_static_power_gating(adev);
628 /* disable clock gating */
629 vcn_v1_0_disable_clock_gating(adev);
631 vcn_v1_0_mc_resume(adev);
633 /* disable interrupt */
634 WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_MASTINT_EN), 0,
635 ~UVD_MASTINT_EN__VCPU_EN_MASK);
637 /* stall UMC and register bus before resetting VCPU */
638 WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2),
639 UVD_LMI_CTRL2__STALL_ARB_UMC_MASK,
640 ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
643 /* put LMI, VCPU, RBC etc... into reset */
644 WREG32_SOC15(UVD, 0, mmUVD_SOFT_RESET,
645 UVD_SOFT_RESET__LMI_SOFT_RESET_MASK |
646 UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK |
647 UVD_SOFT_RESET__LBSI_SOFT_RESET_MASK |
648 UVD_SOFT_RESET__RBC_SOFT_RESET_MASK |
649 UVD_SOFT_RESET__CSM_SOFT_RESET_MASK |
650 UVD_SOFT_RESET__CXW_SOFT_RESET_MASK |
651 UVD_SOFT_RESET__TAP_SOFT_RESET_MASK |
652 UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK);
655 /* initialize VCN memory controller */
656 WREG32_SOC15(UVD, 0, mmUVD_LMI_CTRL,
657 (0x40 << UVD_LMI_CTRL__WRITE_CLEAN_TIMER__SHIFT) |
658 UVD_LMI_CTRL__WRITE_CLEAN_TIMER_EN_MASK |
659 UVD_LMI_CTRL__DATA_COHERENCY_EN_MASK |
660 UVD_LMI_CTRL__VCPU_DATA_COHERENCY_EN_MASK |
661 UVD_LMI_CTRL__REQ_MODE_MASK |
665 /* swap (8 in 32) RB and IB */
668 WREG32_SOC15(UVD, 0, mmUVD_LMI_SWAP_CNTL, lmi_swap_cntl);
670 WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUXA0, 0x40c2040);
671 WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUXA1, 0x0);
672 WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUXB0, 0x40c2040);
673 WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUXB1, 0x0);
674 WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_ALU, 0);
675 WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUX, 0x88);
677 /* take all subblocks out of reset, except VCPU */
678 WREG32_SOC15(UVD, 0, mmUVD_SOFT_RESET,
679 UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
682 /* enable VCPU clock */
683 WREG32_SOC15(UVD, 0, mmUVD_VCPU_CNTL,
684 UVD_VCPU_CNTL__CLK_EN_MASK);
687 WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2), 0,
688 ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
690 /* boot up the VCPU */
691 WREG32_SOC15(UVD, 0, mmUVD_SOFT_RESET, 0);
694 for (i = 0; i < 10; ++i) {
697 for (j = 0; j < 100; ++j) {
698 status = RREG32_SOC15(UVD, 0, mmUVD_STATUS);
707 DRM_ERROR("VCN decode not responding, trying to reset the VCPU!!!\n");
708 WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET),
709 UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK,
710 ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
712 WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET), 0,
713 ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
719 DRM_ERROR("VCN decode not responding, giving up!!!\n");
722 /* enable master interrupt */
723 WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_MASTINT_EN),
724 (UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK),
725 ~(UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK));
727 /* clear bit 4 of UVD_STATUS */
728 WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_STATUS), 0,
729 ~(2 << UVD_STATUS__VCPU_REPORT__SHIFT));
731 /* force RBC into idle state */
732 rb_bufsz = order_base_2(ring->ring_size);
733 tmp = REG_SET_FIELD(0, UVD_RBC_RB_CNTL, RB_BUFSZ, rb_bufsz);
734 tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_BLKSZ, 1);
735 tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_FETCH, 1);
736 tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_WPTR_POLL_EN, 0);
737 tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_UPDATE, 1);
738 tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_RPTR_WR_EN, 1);
739 WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_CNTL, tmp);
741 /* set the write pointer delay */
742 WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR_CNTL, 0);
744 /* set the wb address */
745 WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR_ADDR,
746 (upper_32_bits(ring->gpu_addr) >> 2));
748 /* program the RB_BASE for ring buffer */
749 WREG32_SOC15(UVD, 0, mmUVD_LMI_RBC_RB_64BIT_BAR_LOW,
750 lower_32_bits(ring->gpu_addr));
751 WREG32_SOC15(UVD, 0, mmUVD_LMI_RBC_RB_64BIT_BAR_HIGH,
752 upper_32_bits(ring->gpu_addr));
754 /* Initialize the ring buffer's read and write pointers */
755 WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR, 0);
757 ring->wptr = RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR);
758 WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR,
759 lower_32_bits(ring->wptr));
761 WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_RBC_RB_CNTL), 0,
762 ~UVD_RBC_RB_CNTL__RB_NO_FETCH_MASK);
764 ring = &adev->vcn.ring_enc[0];
765 WREG32_SOC15(UVD, 0, mmUVD_RB_RPTR, lower_32_bits(ring->wptr));
766 WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR, lower_32_bits(ring->wptr));
767 WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_LO, ring->gpu_addr);
768 WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_HI, upper_32_bits(ring->gpu_addr));
769 WREG32_SOC15(UVD, 0, mmUVD_RB_SIZE, ring->ring_size / 4);
771 ring = &adev->vcn.ring_enc[1];
772 WREG32_SOC15(UVD, 0, mmUVD_RB_RPTR2, lower_32_bits(ring->wptr));
773 WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR2, lower_32_bits(ring->wptr));
774 WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_LO2, ring->gpu_addr);
775 WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_HI2, upper_32_bits(ring->gpu_addr));
776 WREG32_SOC15(UVD, 0, mmUVD_RB_SIZE2, ring->ring_size / 4);
778 ring = &adev->vcn.ring_jpeg;
779 WREG32_SOC15(UVD, 0, mmUVD_LMI_JRBC_RB_VMID, 0);
780 WREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_CNTL, (0x00000001L | 0x00000002L));
781 WREG32_SOC15(UVD, 0, mmUVD_LMI_JRBC_RB_64BIT_BAR_LOW, lower_32_bits(ring->gpu_addr));
782 WREG32_SOC15(UVD, 0, mmUVD_LMI_JRBC_RB_64BIT_BAR_HIGH, upper_32_bits(ring->gpu_addr));
783 WREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_RPTR, 0);
784 WREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_WPTR, 0);
785 WREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_CNTL, 0x00000002L);
787 /* initialize wptr */
788 ring->wptr = RREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_WPTR);
790 /* copy patch commands to the jpeg ring */
791 vcn_v1_0_jpeg_ring_set_patch_ring(ring,
792 (ring->wptr + ring->max_dw * amdgpu_sched_hw_submission));
798 * vcn_v1_0_stop - stop VCN block
800 * @adev: amdgpu_device pointer
804 static int vcn_v1_0_stop(struct amdgpu_device *adev)
806 /* force RBC into idle state */
807 WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_CNTL, 0x11010101);
809 /* Stall UMC and register bus before resetting VCPU */
810 WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2),
811 UVD_LMI_CTRL2__STALL_ARB_UMC_MASK,
812 ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
815 /* put VCPU into reset */
816 WREG32_SOC15(UVD, 0, mmUVD_SOFT_RESET,
817 UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
820 /* disable VCPU clock */
821 WREG32_SOC15(UVD, 0, mmUVD_VCPU_CNTL, 0x0);
823 /* Unstall UMC and register bus */
824 WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2), 0,
825 ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
827 WREG32_SOC15(VCN, 0, mmUVD_STATUS, 0);
829 vcn_v1_0_enable_clock_gating(adev);
830 vcn_1_0_enable_static_power_gating(adev);
834 static bool vcn_v1_0_is_idle(void *handle)
836 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
838 return (RREG32_SOC15(VCN, 0, mmUVD_STATUS) == 0x2);
841 static int vcn_v1_0_wait_for_idle(void *handle)
843 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
846 SOC15_WAIT_ON_RREG(VCN, 0, mmUVD_STATUS, 0x2, 0x2, ret);
851 static int vcn_v1_0_set_clockgating_state(void *handle,
852 enum amd_clockgating_state state)
854 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
855 bool enable = (state == AMD_CG_STATE_GATE) ? true : false;
858 /* wait for STATUS to clear */
859 if (vcn_v1_0_is_idle(handle))
861 vcn_v1_0_enable_clock_gating(adev);
863 /* disable HW gating and enable SW gating */
864 vcn_v1_0_disable_clock_gating(adev);
870 * vcn_v1_0_dec_ring_get_rptr - get read pointer
872 * @ring: amdgpu_ring pointer
874 * Returns the current hardware read pointer
876 static uint64_t vcn_v1_0_dec_ring_get_rptr(struct amdgpu_ring *ring)
878 struct amdgpu_device *adev = ring->adev;
880 return RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR);
884 * vcn_v1_0_dec_ring_get_wptr - get write pointer
886 * @ring: amdgpu_ring pointer
888 * Returns the current hardware write pointer
890 static uint64_t vcn_v1_0_dec_ring_get_wptr(struct amdgpu_ring *ring)
892 struct amdgpu_device *adev = ring->adev;
894 return RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR);
898 * vcn_v1_0_dec_ring_set_wptr - set write pointer
900 * @ring: amdgpu_ring pointer
902 * Commits the write pointer to the hardware
904 static void vcn_v1_0_dec_ring_set_wptr(struct amdgpu_ring *ring)
906 struct amdgpu_device *adev = ring->adev;
908 WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR, lower_32_bits(ring->wptr));
912 * vcn_v1_0_dec_ring_insert_start - insert a start command
914 * @ring: amdgpu_ring pointer
916 * Write a start command to the ring.
918 static void vcn_v1_0_dec_ring_insert_start(struct amdgpu_ring *ring)
920 struct amdgpu_device *adev = ring->adev;
922 amdgpu_ring_write(ring,
923 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
924 amdgpu_ring_write(ring, 0);
925 amdgpu_ring_write(ring,
926 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
927 amdgpu_ring_write(ring, VCN_DEC_CMD_PACKET_START << 1);
931 * vcn_v1_0_dec_ring_insert_end - insert an end command
933 * @ring: amdgpu_ring pointer
935 * Write an end command to the ring.
937 static void vcn_v1_0_dec_ring_insert_end(struct amdgpu_ring *ring)
939 struct amdgpu_device *adev = ring->adev;
941 amdgpu_ring_write(ring,
942 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
943 amdgpu_ring_write(ring, VCN_DEC_CMD_PACKET_END << 1);
947 * vcn_v1_0_dec_ring_emit_fence - emit a fence & trap command
949 * @ring: amdgpu_ring pointer
950 * @fence: fence to emit
952 * Write a fence and a trap command to the ring.
954 static void vcn_v1_0_dec_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq,
957 struct amdgpu_device *adev = ring->adev;
959 WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
961 amdgpu_ring_write(ring,
962 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_CONTEXT_ID), 0));
963 amdgpu_ring_write(ring, seq);
964 amdgpu_ring_write(ring,
965 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
966 amdgpu_ring_write(ring, addr & 0xffffffff);
967 amdgpu_ring_write(ring,
968 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1), 0));
969 amdgpu_ring_write(ring, upper_32_bits(addr) & 0xff);
970 amdgpu_ring_write(ring,
971 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
972 amdgpu_ring_write(ring, VCN_DEC_CMD_FENCE << 1);
974 amdgpu_ring_write(ring,
975 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
976 amdgpu_ring_write(ring, 0);
977 amdgpu_ring_write(ring,
978 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1), 0));
979 amdgpu_ring_write(ring, 0);
980 amdgpu_ring_write(ring,
981 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
982 amdgpu_ring_write(ring, VCN_DEC_CMD_TRAP << 1);
986 * vcn_v1_0_dec_ring_emit_ib - execute indirect buffer
988 * @ring: amdgpu_ring pointer
989 * @ib: indirect buffer to execute
991 * Write ring commands to execute the indirect buffer
993 static void vcn_v1_0_dec_ring_emit_ib(struct amdgpu_ring *ring,
994 struct amdgpu_ib *ib,
995 unsigned vmid, bool ctx_switch)
997 struct amdgpu_device *adev = ring->adev;
999 amdgpu_ring_write(ring,
1000 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_RBC_IB_VMID), 0));
1001 amdgpu_ring_write(ring, vmid);
1003 amdgpu_ring_write(ring,
1004 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_RBC_IB_64BIT_BAR_LOW), 0));
1005 amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
1006 amdgpu_ring_write(ring,
1007 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_RBC_IB_64BIT_BAR_HIGH), 0));
1008 amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
1009 amdgpu_ring_write(ring,
1010 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_RBC_IB_SIZE), 0));
1011 amdgpu_ring_write(ring, ib->length_dw);
1014 static void vcn_v1_0_dec_ring_emit_reg_wait(struct amdgpu_ring *ring,
1015 uint32_t reg, uint32_t val,
1018 struct amdgpu_device *adev = ring->adev;
1020 amdgpu_ring_write(ring,
1021 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
1022 amdgpu_ring_write(ring, reg << 2);
1023 amdgpu_ring_write(ring,
1024 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1), 0));
1025 amdgpu_ring_write(ring, val);
1026 amdgpu_ring_write(ring,
1027 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GP_SCRATCH8), 0));
1028 amdgpu_ring_write(ring, mask);
1029 amdgpu_ring_write(ring,
1030 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
1031 amdgpu_ring_write(ring, VCN_DEC_CMD_REG_READ_COND_WAIT << 1);
1034 static void vcn_v1_0_dec_ring_emit_vm_flush(struct amdgpu_ring *ring,
1035 unsigned vmid, uint64_t pd_addr)
1037 struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
1038 uint32_t data0, data1, mask;
1040 pd_addr = amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
1042 /* wait for register write */
1043 data0 = hub->ctx0_ptb_addr_lo32 + vmid * 2;
1044 data1 = lower_32_bits(pd_addr);
1046 vcn_v1_0_dec_ring_emit_reg_wait(ring, data0, data1, mask);
1049 static void vcn_v1_0_dec_ring_emit_wreg(struct amdgpu_ring *ring,
1050 uint32_t reg, uint32_t val)
1052 struct amdgpu_device *adev = ring->adev;
1054 amdgpu_ring_write(ring,
1055 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
1056 amdgpu_ring_write(ring, reg << 2);
1057 amdgpu_ring_write(ring,
1058 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1), 0));
1059 amdgpu_ring_write(ring, val);
1060 amdgpu_ring_write(ring,
1061 PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
1062 amdgpu_ring_write(ring, VCN_DEC_CMD_WRITE_REG << 1);
1066 * vcn_v1_0_enc_ring_get_rptr - get enc read pointer
1068 * @ring: amdgpu_ring pointer
1070 * Returns the current hardware enc read pointer
1072 static uint64_t vcn_v1_0_enc_ring_get_rptr(struct amdgpu_ring *ring)
1074 struct amdgpu_device *adev = ring->adev;
1076 if (ring == &adev->vcn.ring_enc[0])
1077 return RREG32_SOC15(UVD, 0, mmUVD_RB_RPTR);
1079 return RREG32_SOC15(UVD, 0, mmUVD_RB_RPTR2);
1083 * vcn_v1_0_enc_ring_get_wptr - get enc write pointer
1085 * @ring: amdgpu_ring pointer
1087 * Returns the current hardware enc write pointer
1089 static uint64_t vcn_v1_0_enc_ring_get_wptr(struct amdgpu_ring *ring)
1091 struct amdgpu_device *adev = ring->adev;
1093 if (ring == &adev->vcn.ring_enc[0])
1094 return RREG32_SOC15(UVD, 0, mmUVD_RB_WPTR);
1096 return RREG32_SOC15(UVD, 0, mmUVD_RB_WPTR2);
1100 * vcn_v1_0_enc_ring_set_wptr - set enc write pointer
1102 * @ring: amdgpu_ring pointer
1104 * Commits the enc write pointer to the hardware
1106 static void vcn_v1_0_enc_ring_set_wptr(struct amdgpu_ring *ring)
1108 struct amdgpu_device *adev = ring->adev;
1110 if (ring == &adev->vcn.ring_enc[0])
1111 WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR,
1112 lower_32_bits(ring->wptr));
1114 WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR2,
1115 lower_32_bits(ring->wptr));
1119 * vcn_v1_0_enc_ring_emit_fence - emit an enc fence & trap command
1121 * @ring: amdgpu_ring pointer
1122 * @fence: fence to emit
1124 * Write enc a fence and a trap command to the ring.
1126 static void vcn_v1_0_enc_ring_emit_fence(struct amdgpu_ring *ring, u64 addr,
1127 u64 seq, unsigned flags)
1129 WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
1131 amdgpu_ring_write(ring, VCN_ENC_CMD_FENCE);
1132 amdgpu_ring_write(ring, addr);
1133 amdgpu_ring_write(ring, upper_32_bits(addr));
1134 amdgpu_ring_write(ring, seq);
1135 amdgpu_ring_write(ring, VCN_ENC_CMD_TRAP);
1138 static void vcn_v1_0_enc_ring_insert_end(struct amdgpu_ring *ring)
1140 amdgpu_ring_write(ring, VCN_ENC_CMD_END);
1144 * vcn_v1_0_enc_ring_emit_ib - enc execute indirect buffer
1146 * @ring: amdgpu_ring pointer
1147 * @ib: indirect buffer to execute
1149 * Write enc ring commands to execute the indirect buffer
1151 static void vcn_v1_0_enc_ring_emit_ib(struct amdgpu_ring *ring,
1152 struct amdgpu_ib *ib, unsigned int vmid, bool ctx_switch)
1154 amdgpu_ring_write(ring, VCN_ENC_CMD_IB);
1155 amdgpu_ring_write(ring, vmid);
1156 amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
1157 amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
1158 amdgpu_ring_write(ring, ib->length_dw);
1161 static void vcn_v1_0_enc_ring_emit_reg_wait(struct amdgpu_ring *ring,
1162 uint32_t reg, uint32_t val,
1165 amdgpu_ring_write(ring, VCN_ENC_CMD_REG_WAIT);
1166 amdgpu_ring_write(ring, reg << 2);
1167 amdgpu_ring_write(ring, mask);
1168 amdgpu_ring_write(ring, val);
1171 static void vcn_v1_0_enc_ring_emit_vm_flush(struct amdgpu_ring *ring,
1172 unsigned int vmid, uint64_t pd_addr)
1174 struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
1176 pd_addr = amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
1178 /* wait for reg writes */
1179 vcn_v1_0_enc_ring_emit_reg_wait(ring, hub->ctx0_ptb_addr_lo32 + vmid * 2,
1180 lower_32_bits(pd_addr), 0xffffffff);
1183 static void vcn_v1_0_enc_ring_emit_wreg(struct amdgpu_ring *ring,
1184 uint32_t reg, uint32_t val)
1186 amdgpu_ring_write(ring, VCN_ENC_CMD_REG_WRITE);
1187 amdgpu_ring_write(ring, reg << 2);
1188 amdgpu_ring_write(ring, val);
1193 * vcn_v1_0_jpeg_ring_get_rptr - get read pointer
1195 * @ring: amdgpu_ring pointer
1197 * Returns the current hardware read pointer
1199 static uint64_t vcn_v1_0_jpeg_ring_get_rptr(struct amdgpu_ring *ring)
1201 struct amdgpu_device *adev = ring->adev;
1203 return RREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_RPTR);
1207 * vcn_v1_0_jpeg_ring_get_wptr - get write pointer
1209 * @ring: amdgpu_ring pointer
1211 * Returns the current hardware write pointer
1213 static uint64_t vcn_v1_0_jpeg_ring_get_wptr(struct amdgpu_ring *ring)
1215 struct amdgpu_device *adev = ring->adev;
1217 return RREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_WPTR);
1221 * vcn_v1_0_jpeg_ring_set_wptr - set write pointer
1223 * @ring: amdgpu_ring pointer
1225 * Commits the write pointer to the hardware
1227 static void vcn_v1_0_jpeg_ring_set_wptr(struct amdgpu_ring *ring)
1229 struct amdgpu_device *adev = ring->adev;
1231 WREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_WPTR, lower_32_bits(ring->wptr));
1235 * vcn_v1_0_jpeg_ring_insert_start - insert a start command
1237 * @ring: amdgpu_ring pointer
1239 * Write a start command to the ring.
1241 static void vcn_v1_0_jpeg_ring_insert_start(struct amdgpu_ring *ring)
1243 struct amdgpu_device *adev = ring->adev;
1245 amdgpu_ring_write(ring,
1246 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_EXTERNAL_REG_BASE), 0, 0, PACKETJ_TYPE0));
1247 amdgpu_ring_write(ring, 0x68e04);
1249 amdgpu_ring_write(ring, PACKETJ(0, 0, 0, PACKETJ_TYPE0));
1250 amdgpu_ring_write(ring, 0x80010000);
1254 * vcn_v1_0_jpeg_ring_insert_end - insert a end command
1256 * @ring: amdgpu_ring pointer
1258 * Write a end command to the ring.
1260 static void vcn_v1_0_jpeg_ring_insert_end(struct amdgpu_ring *ring)
1262 struct amdgpu_device *adev = ring->adev;
1264 amdgpu_ring_write(ring,
1265 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_EXTERNAL_REG_BASE), 0, 0, PACKETJ_TYPE0));
1266 amdgpu_ring_write(ring, 0x68e04);
1268 amdgpu_ring_write(ring, PACKETJ(0, 0, 0, PACKETJ_TYPE0));
1269 amdgpu_ring_write(ring, 0x00010000);
1273 * vcn_v1_0_jpeg_ring_emit_fence - emit an fence & trap command
1275 * @ring: amdgpu_ring pointer
1276 * @fence: fence to emit
1278 * Write a fence and a trap command to the ring.
1280 static void vcn_v1_0_jpeg_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq,
1283 struct amdgpu_device *adev = ring->adev;
1285 WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
1287 amdgpu_ring_write(ring,
1288 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JPEG_GPCOM_DATA0), 0, 0, PACKETJ_TYPE0));
1289 amdgpu_ring_write(ring, seq);
1291 amdgpu_ring_write(ring,
1292 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JPEG_GPCOM_DATA1), 0, 0, PACKETJ_TYPE0));
1293 amdgpu_ring_write(ring, seq);
1295 amdgpu_ring_write(ring,
1296 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_RB_MEM_WR_64BIT_BAR_LOW), 0, 0, PACKETJ_TYPE0));
1297 amdgpu_ring_write(ring, lower_32_bits(addr));
1299 amdgpu_ring_write(ring,
1300 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_RB_MEM_WR_64BIT_BAR_HIGH), 0, 0, PACKETJ_TYPE0));
1301 amdgpu_ring_write(ring, upper_32_bits(addr));
1303 amdgpu_ring_write(ring,
1304 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JPEG_GPCOM_CMD), 0, 0, PACKETJ_TYPE0));
1305 amdgpu_ring_write(ring, 0x8);
1307 amdgpu_ring_write(ring,
1308 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JPEG_GPCOM_CMD), 0, PACKETJ_CONDITION_CHECK0, PACKETJ_TYPE4));
1309 amdgpu_ring_write(ring, 0);
1311 amdgpu_ring_write(ring,
1312 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_COND_RD_TIMER), 0, 0, PACKETJ_TYPE0));
1313 amdgpu_ring_write(ring, 0x01400200);
1315 amdgpu_ring_write(ring,
1316 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_REF_DATA), 0, 0, PACKETJ_TYPE0));
1317 amdgpu_ring_write(ring, seq);
1319 amdgpu_ring_write(ring,
1320 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_LOW), 0, 0, PACKETJ_TYPE0));
1321 amdgpu_ring_write(ring, lower_32_bits(addr));
1323 amdgpu_ring_write(ring,
1324 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_HIGH), 0, 0, PACKETJ_TYPE0));
1325 amdgpu_ring_write(ring, upper_32_bits(addr));
1327 amdgpu_ring_write(ring,
1328 PACKETJ(0, 0, PACKETJ_CONDITION_CHECK3, PACKETJ_TYPE2));
1329 amdgpu_ring_write(ring, 0xffffffff);
1331 amdgpu_ring_write(ring,
1332 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_EXTERNAL_REG_BASE), 0, 0, PACKETJ_TYPE0));
1333 amdgpu_ring_write(ring, 0x3fbc);
1335 amdgpu_ring_write(ring,
1336 PACKETJ(0, 0, 0, PACKETJ_TYPE0));
1337 amdgpu_ring_write(ring, 0x1);
1341 * vcn_v1_0_jpeg_ring_emit_ib - execute indirect buffer
1343 * @ring: amdgpu_ring pointer
1344 * @ib: indirect buffer to execute
1346 * Write ring commands to execute the indirect buffer.
1348 static void vcn_v1_0_jpeg_ring_emit_ib(struct amdgpu_ring *ring,
1349 struct amdgpu_ib *ib,
1350 unsigned vmid, bool ctx_switch)
1352 struct amdgpu_device *adev = ring->adev;
1354 amdgpu_ring_write(ring,
1355 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_IB_VMID), 0, 0, PACKETJ_TYPE0));
1356 amdgpu_ring_write(ring, (vmid | (vmid << 4)));
1358 amdgpu_ring_write(ring,
1359 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JPEG_VMID), 0, 0, PACKETJ_TYPE0));
1360 amdgpu_ring_write(ring, (vmid | (vmid << 4)));
1362 amdgpu_ring_write(ring,
1363 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_IB_64BIT_BAR_LOW), 0, 0, PACKETJ_TYPE0));
1364 amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
1366 amdgpu_ring_write(ring,
1367 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_IB_64BIT_BAR_HIGH), 0, 0, PACKETJ_TYPE0));
1368 amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
1370 amdgpu_ring_write(ring,
1371 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_IB_SIZE), 0, 0, PACKETJ_TYPE0));
1372 amdgpu_ring_write(ring, ib->length_dw);
1374 amdgpu_ring_write(ring,
1375 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_LOW), 0, 0, PACKETJ_TYPE0));
1376 amdgpu_ring_write(ring, lower_32_bits(ring->gpu_addr));
1378 amdgpu_ring_write(ring,
1379 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_HIGH), 0, 0, PACKETJ_TYPE0));
1380 amdgpu_ring_write(ring, upper_32_bits(ring->gpu_addr));
1382 amdgpu_ring_write(ring,
1383 PACKETJ(0, 0, PACKETJ_CONDITION_CHECK0, PACKETJ_TYPE2));
1384 amdgpu_ring_write(ring, 0);
1386 amdgpu_ring_write(ring,
1387 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_COND_RD_TIMER), 0, 0, PACKETJ_TYPE0));
1388 amdgpu_ring_write(ring, 0x01400200);
1390 amdgpu_ring_write(ring,
1391 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_REF_DATA), 0, 0, PACKETJ_TYPE0));
1392 amdgpu_ring_write(ring, 0x2);
1394 amdgpu_ring_write(ring,
1395 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_STATUS), 0, PACKETJ_CONDITION_CHECK3, PACKETJ_TYPE3));
1396 amdgpu_ring_write(ring, 0x2);
1399 static void vcn_v1_0_jpeg_ring_emit_reg_wait(struct amdgpu_ring *ring,
1400 uint32_t reg, uint32_t val,
1403 struct amdgpu_device *adev = ring->adev;
1404 uint32_t reg_offset = (reg << 2);
1406 amdgpu_ring_write(ring,
1407 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_COND_RD_TIMER), 0, 0, PACKETJ_TYPE0));
1408 amdgpu_ring_write(ring, 0x01400200);
1410 amdgpu_ring_write(ring,
1411 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_REF_DATA), 0, 0, PACKETJ_TYPE0));
1412 amdgpu_ring_write(ring, val);
1414 amdgpu_ring_write(ring,
1415 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_EXTERNAL_REG_BASE), 0, 0, PACKETJ_TYPE0));
1416 if (((reg_offset >= 0x1f800) && (reg_offset <= 0x21fff)) ||
1417 ((reg_offset >= 0x1e000) && (reg_offset <= 0x1e1ff))) {
1418 amdgpu_ring_write(ring, 0);
1419 amdgpu_ring_write(ring,
1420 PACKETJ((reg_offset >> 2), 0, 0, PACKETJ_TYPE3));
1422 amdgpu_ring_write(ring, reg_offset);
1423 amdgpu_ring_write(ring,
1424 PACKETJ(0, 0, 0, PACKETJ_TYPE3));
1426 amdgpu_ring_write(ring, mask);
1429 static void vcn_v1_0_jpeg_ring_emit_vm_flush(struct amdgpu_ring *ring,
1430 unsigned vmid, uint64_t pd_addr)
1432 struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
1433 uint32_t data0, data1, mask;
1435 pd_addr = amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
1437 /* wait for register write */
1438 data0 = hub->ctx0_ptb_addr_lo32 + vmid * 2;
1439 data1 = lower_32_bits(pd_addr);
1441 vcn_v1_0_jpeg_ring_emit_reg_wait(ring, data0, data1, mask);
1444 static void vcn_v1_0_jpeg_ring_emit_wreg(struct amdgpu_ring *ring,
1445 uint32_t reg, uint32_t val)
1447 struct amdgpu_device *adev = ring->adev;
1448 uint32_t reg_offset = (reg << 2);
1450 amdgpu_ring_write(ring,
1451 PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_EXTERNAL_REG_BASE), 0, 0, PACKETJ_TYPE0));
1452 if (((reg_offset >= 0x1f800) && (reg_offset <= 0x21fff)) ||
1453 ((reg_offset >= 0x1e000) && (reg_offset <= 0x1e1ff))) {
1454 amdgpu_ring_write(ring, 0);
1455 amdgpu_ring_write(ring,
1456 PACKETJ((reg_offset >> 2), 0, 0, PACKETJ_TYPE0));
1458 amdgpu_ring_write(ring, reg_offset);
1459 amdgpu_ring_write(ring,
1460 PACKETJ(0, 0, 0, PACKETJ_TYPE0));
1462 amdgpu_ring_write(ring, val);
1465 static void vcn_v1_0_jpeg_ring_nop(struct amdgpu_ring *ring, uint32_t count)
1469 WARN_ON(ring->wptr % 2 || count % 2);
1471 for (i = 0; i < count / 2; i++) {
1472 amdgpu_ring_write(ring, PACKETJ(0, 0, 0, PACKETJ_TYPE6));
1473 amdgpu_ring_write(ring, 0);
1477 static void vcn_v1_0_jpeg_ring_patch_wreg(struct amdgpu_ring *ring, uint32_t *ptr, uint32_t reg_offset, uint32_t val)
1479 struct amdgpu_device *adev = ring->adev;
1480 ring->ring[(*ptr)++] = PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_EXTERNAL_REG_BASE), 0, 0, PACKETJ_TYPE0);
1481 if (((reg_offset >= 0x1f800) && (reg_offset <= 0x21fff)) ||
1482 ((reg_offset >= 0x1e000) && (reg_offset <= 0x1e1ff))) {
1483 ring->ring[(*ptr)++] = 0;
1484 ring->ring[(*ptr)++] = PACKETJ((reg_offset >> 2), 0, 0, PACKETJ_TYPE0);
1486 ring->ring[(*ptr)++] = reg_offset;
1487 ring->ring[(*ptr)++] = PACKETJ(0, 0, 0, PACKETJ_TYPE0);
1489 ring->ring[(*ptr)++] = val;
/*
 * Writes a fixed, numbered sequence of JPEG ring packets ("1st" .. "23rd")
 * directly into ring->ring[] starting at index ptr: register writes via
 * vcn_v1_0_jpeg_ring_patch_wreg(), TYPE2 packets, a conditional register
 * read and TYPE6 no-op packets.
 *
 * NOTE(review): this view of the function is incomplete. The embedded line
 * numbering skips lines (e.g. 1519, 1525, 1531-1533, 1558, 1564), so the
 * assignments that set 'val' and 'mask' for steps 6, 7, 8, 22 and 23, the
 * closing braces of both loops and the '} else {' of the conditional are
 * not visible. Restore them from the authoritative source before building.
 */
1492 static void vcn_v1_0_jpeg_ring_set_patch_ring(struct amdgpu_ring *ring, uint32_t ptr)
1494 struct amdgpu_device *adev = ring->adev;
1496 uint32_t reg, reg_offset, val, mask, i;
1498 // 1st: program mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_LOW
1499 reg = SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_LOW);
1500 reg_offset = (reg << 2);
1501 val = lower_32_bits(ring->gpu_addr);
1502 vcn_v1_0_jpeg_ring_patch_wreg(ring, &ptr, reg_offset, val);
1504 // 2nd: program mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_HIGH
1505 reg = SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_HIGH);
1506 reg_offset = (reg << 2);
1507 val = upper_32_bits(ring->gpu_addr);
1508 vcn_v1_0_jpeg_ring_patch_wreg(ring, &ptr, reg_offset, val);
1510 // 3rd to 5th: issue MEM_READ commands
/* three two-dword TYPE2 packets (i = 0..2) */
1511 for (i = 0; i <= 2; i++) {
1512 ring->ring[ptr++] = PACKETJ(0, 0, 0, PACKETJ_TYPE2);
1513 ring->ring[ptr++] = 0;
1516 // 6th: program mmUVD_JRBC_RB_CNTL register to enable NO_FETCH and RPTR write ability
1517 reg = SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_CNTL);
1518 reg_offset = (reg << 2);
/* NOTE(review): the 'val = ...' assignment for this step is not visible here */
1520 vcn_v1_0_jpeg_ring_patch_wreg(ring, &ptr, reg_offset, val);
1522 // 7th: program mmUVD_JRBC_RB_REF_DATA
1523 reg = SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_REF_DATA);
1524 reg_offset = (reg << 2);
/* NOTE(review): the 'val = ...' assignment for this step is not visible here */
1526 vcn_v1_0_jpeg_ring_patch_wreg(ring, &ptr, reg_offset, val);
1528 // 8th: issue conditional register read mmUVD_JRBC_RB_CNTL
1529 reg = SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_CNTL);
1530 reg_offset = (reg << 2);
/* NOTE(review): the 'val' and 'mask' assignments for this step are not visible here */
1534 ring->ring[ptr++] = PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_COND_RD_TIMER), 0, 0, PACKETJ_TYPE0);
1535 ring->ring[ptr++] = 0x01400200;
1536 ring->ring[ptr++] = PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_REF_DATA), 0, 0, PACKETJ_TYPE0);
1537 ring->ring[ptr++] = val;
1538 ring->ring[ptr++] = PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_EXTERNAL_REG_BASE), 0, 0, PACKETJ_TYPE0);
/* same offset-range test used by the jpeg emit_wreg/emit_reg_wait helpers */
1539 if (((reg_offset >= 0x1f800) && (reg_offset <= 0x21fff)) ||
1540 ((reg_offset >= 0x1e000) && (reg_offset <= 0x1e1ff))) {
1541 ring->ring[ptr++] = 0;
1542 ring->ring[ptr++] = PACKETJ((reg_offset >> 2), 0, 0, PACKETJ_TYPE3);
1544 ring->ring[ptr++] = reg_offset;
1545 ring->ring[ptr++] = PACKETJ(0, 0, 0, PACKETJ_TYPE3);
1547 ring->ring[ptr++] = mask;
1549 //9th to 21st: insert no-op
/* thirteen two-dword TYPE6 packets (i = 0..12) */
1550 for (i = 0; i <= 12; i++) {
1551 ring->ring[ptr++] = PACKETJ(0, 0, 0, PACKETJ_TYPE6);
1552 ring->ring[ptr++] = 0;
1555 //22nd: reset mmUVD_JRBC_RB_RPTR
1556 reg = SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_RPTR);
1557 reg_offset = (reg << 2);
/* NOTE(review): the 'val = ...' assignment for this step is not visible here */
1559 vcn_v1_0_jpeg_ring_patch_wreg(ring, &ptr, reg_offset, val);
1561 //23rd: program mmUVD_JRBC_RB_CNTL to disable no_fetch
1562 reg = SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_CNTL);
1563 reg_offset = (reg << 2);
/* NOTE(review): the 'val = ...' assignment for this step is not visible here */
1565 vcn_v1_0_jpeg_ring_patch_wreg(ring, &ptr, reg_offset, val);
/*
 * Interrupt-state callback, installed as the .set hook of
 * vcn_v1_0_irq_funcs.
 *
 * NOTE(review): only part of the signature is visible here. The embedded
 * numbering skips 1570 (a parameter between 'source' and 'state') and
 * 1572-1575 (the whole body), so what this function does cannot be
 * determined from this view.
 */
1568 static int vcn_v1_0_set_interrupt_state(struct amdgpu_device *adev,
1569 struct amdgpu_irq_src *source,
1571 enum amdgpu_interrupt_state state)
/*
 * Interrupt handler, installed as the .process hook of vcn_v1_0_irq_funcs.
 * Logs a debug message, then switches on entry->src_id and runs fence
 * processing for the decode ring, encode ring 0, encode ring 1 or the JPEG
 * ring; an error with src_id and src_data[0] is logged on the remaining path.
 *
 * NOTE(review): the case labels, 'break' statements, 'default:' label and
 * the return statement are not visible in this view (the embedded numbering
 * skips those lines), so which src_id maps to which ring cannot be read
 * off here.
 */
1576 static int vcn_v1_0_process_interrupt(struct amdgpu_device *adev,
1577 struct amdgpu_irq_src *source,
1578 struct amdgpu_iv_entry *entry)
1580 DRM_DEBUG("IH: VCN TRAP\n");
1582 switch (entry->src_id) {
1584 amdgpu_fence_process(&adev->vcn.ring_dec);
1587 amdgpu_fence_process(&adev->vcn.ring_enc[0]);
1590 amdgpu_fence_process(&adev->vcn.ring_enc[1]);
1593 amdgpu_fence_process(&adev->vcn.ring_jpeg);
1596 DRM_ERROR("Unhandled interrupt: %d %d\n",
1597 entry->src_id, entry->src_data[0]);
1604 static void vcn_v1_0_dec_ring_insert_nop(struct amdgpu_ring *ring, uint32_t count)
1606 struct amdgpu_device *adev = ring->adev;
1609 WARN_ON(ring->wptr % 2 || count % 2);
1611 for (i = 0; i < count / 2; i++) {
1612 amdgpu_ring_write(ring, PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_NO_OP), 0));
1613 amdgpu_ring_write(ring, 0);
1617 static int vcn_v1_0_set_powergating_state(void *handle,
1618 enum amd_powergating_state state)
1620 /* This doesn't actually powergate the VCN block.
1621 * That's done in the dpm code via the SMC. This
1622 * just re-inits the block as necessary. The actual
1623 * gating still happens in the dpm code. We should
1624 * revisit this when there is a cleaner line between
1625 * the smc and the hw blocks
1627 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1629 if (state == AMD_PG_STATE_GATE)
1630 return vcn_v1_0_stop(adev);
1632 return vcn_v1_0_start(adev);
/*
 * IP-block callback table for VCN 1.0: init/fini, suspend/resume, idle
 * checks and clock/power-gating hooks. The four soft-reset hooks are
 * explicitly NULL.
 *
 * NOTE(review): the embedded numbering skips 1636, 1638 and 1653, so some
 * initializer lines and the closing '};' are not visible in this view.
 */
1635 static const struct amd_ip_funcs vcn_v1_0_ip_funcs = {
1637 .early_init = vcn_v1_0_early_init,
1639 .sw_init = vcn_v1_0_sw_init,
1640 .sw_fini = vcn_v1_0_sw_fini,
1641 .hw_init = vcn_v1_0_hw_init,
1642 .hw_fini = vcn_v1_0_hw_fini,
1643 .suspend = vcn_v1_0_suspend,
1644 .resume = vcn_v1_0_resume,
1645 .is_idle = vcn_v1_0_is_idle,
1646 .wait_for_idle = vcn_v1_0_wait_for_idle,
1647 .check_soft_reset = NULL /* vcn_v1_0_check_soft_reset */,
1648 .pre_soft_reset = NULL /* vcn_v1_0_pre_soft_reset */,
1649 .soft_reset = NULL /* vcn_v1_0_soft_reset */,
1650 .post_soft_reset = NULL /* vcn_v1_0_post_soft_reset */,
1651 .set_clockgating_state = vcn_v1_0_set_clockgating_state,
1652 .set_powergating_state = vcn_v1_0_set_powergating_state,
/*
 * Ring callback table for the VCN 1.0 decode ring (VM mode, MMHUB).
 *
 * NOTE(review): the embedded numbering skips 1657, 1663 and 1669, so some
 * initializer lines are not visible; the '6 + 6 + ...' expression below has
 * lost its designator and its final term. The closing '};' is also missing.
 */
1655 static const struct amdgpu_ring_funcs vcn_v1_0_dec_ring_vm_funcs = {
1656 .type = AMDGPU_RING_TYPE_VCN_DEC,
1658 .support_64bit_ptrs = false,
1659 .vmhub = AMDGPU_MMHUB,
1660 .get_rptr = vcn_v1_0_dec_ring_get_rptr,
1661 .get_wptr = vcn_v1_0_dec_ring_get_wptr,
1662 .set_wptr = vcn_v1_0_dec_ring_set_wptr,
/* dword budget, summed from the per-operation sizes named in the comments */
1664 6 + 6 + /* hdp invalidate / flush */
1665 SOC15_FLUSH_GPU_TLB_NUM_WREG * 6 +
1666 SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 8 +
1667 8 + /* vcn_v1_0_dec_ring_emit_vm_flush */
1668 14 + 14 + /* vcn_v1_0_dec_ring_emit_fence x2 vm fence */
1670 .emit_ib_size = 8, /* vcn_v1_0_dec_ring_emit_ib */
1671 .emit_ib = vcn_v1_0_dec_ring_emit_ib,
1672 .emit_fence = vcn_v1_0_dec_ring_emit_fence,
1673 .emit_vm_flush = vcn_v1_0_dec_ring_emit_vm_flush,
1674 .test_ring = amdgpu_vcn_dec_ring_test_ring,
1675 .test_ib = amdgpu_vcn_dec_ring_test_ib,
1676 .insert_nop = vcn_v1_0_dec_ring_insert_nop,
1677 .insert_start = vcn_v1_0_dec_ring_insert_start,
1678 .insert_end = vcn_v1_0_dec_ring_insert_end,
1679 .pad_ib = amdgpu_ring_generic_pad_ib,
1680 .begin_use = amdgpu_vcn_ring_begin_use,
1681 .end_use = amdgpu_vcn_ring_end_use,
1682 .emit_wreg = vcn_v1_0_dec_ring_emit_wreg,
1683 .emit_reg_wait = vcn_v1_0_dec_ring_emit_reg_wait,
1684 .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
/*
 * Ring callback table for the VCN 1.0 encode rings (VM mode, MMHUB).
 * Padding uses the generic amdgpu_ring_insert_nop() with VCN_ENC_CMD_NO_OP.
 *
 * NOTE(review): the embedded numbering skips 1689 and 1696, so some
 * initializer lines are not visible; the size expression below has lost its
 * designator. The closing '};' is also missing.
 */
1687 static const struct amdgpu_ring_funcs vcn_v1_0_enc_ring_vm_funcs = {
1688 .type = AMDGPU_RING_TYPE_VCN_ENC,
1690 .nop = VCN_ENC_CMD_NO_OP,
1691 .support_64bit_ptrs = false,
1692 .vmhub = AMDGPU_MMHUB,
1693 .get_rptr = vcn_v1_0_enc_ring_get_rptr,
1694 .get_wptr = vcn_v1_0_enc_ring_get_wptr,
1695 .set_wptr = vcn_v1_0_enc_ring_set_wptr,
/* dword budget, summed from the per-operation sizes named in the comments */
1697 SOC15_FLUSH_GPU_TLB_NUM_WREG * 3 +
1698 SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 4 +
1699 4 + /* vcn_v1_0_enc_ring_emit_vm_flush */
1700 5 + 5 + /* vcn_v1_0_enc_ring_emit_fence x2 vm fence */
1701 1, /* vcn_v1_0_enc_ring_insert_end */
1702 .emit_ib_size = 5, /* vcn_v1_0_enc_ring_emit_ib */
1703 .emit_ib = vcn_v1_0_enc_ring_emit_ib,
1704 .emit_fence = vcn_v1_0_enc_ring_emit_fence,
1705 .emit_vm_flush = vcn_v1_0_enc_ring_emit_vm_flush,
1706 .test_ring = amdgpu_vcn_enc_ring_test_ring,
1707 .test_ib = amdgpu_vcn_enc_ring_test_ib,
1708 .insert_nop = amdgpu_ring_insert_nop,
1709 .insert_end = vcn_v1_0_enc_ring_insert_end,
1710 .pad_ib = amdgpu_ring_generic_pad_ib,
1711 .begin_use = amdgpu_vcn_ring_begin_use,
1712 .end_use = amdgpu_vcn_ring_end_use,
1713 .emit_wreg = vcn_v1_0_enc_ring_emit_wreg,
1714 .emit_reg_wait = vcn_v1_0_enc_ring_emit_reg_wait,
1715 .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
/*
 * Ring callback table for the VCN 1.0 JPEG ring (VM mode, MMHUB).
 *
 * NOTE(review): the embedded numbering skips 1720, 1724, 1728 and 1734, so
 * some initializer lines are not visible; the '6 + 6 + ...' expression below
 * has lost its designator and its final term. The closing '};' is also
 * missing.
 * NOTE(review): the size comments below name vcn_v1_0_dec_ring_* functions
 * although this table installs the jpeg variants; the comments look copied
 * from the decode table - confirm the numbers against the jpeg emit
 * functions.
 */
1718 static const struct amdgpu_ring_funcs vcn_v1_0_jpeg_ring_vm_funcs = {
1719 .type = AMDGPU_RING_TYPE_VCN_JPEG,
1721 .nop = PACKET0(0x81ff, 0),
1722 .support_64bit_ptrs = false,
1723 .vmhub = AMDGPU_MMHUB,
1725 .get_rptr = vcn_v1_0_jpeg_ring_get_rptr,
1726 .get_wptr = vcn_v1_0_jpeg_ring_get_wptr,
1727 .set_wptr = vcn_v1_0_jpeg_ring_set_wptr,
1729 6 + 6 + /* hdp invalidate / flush */
1730 SOC15_FLUSH_GPU_TLB_NUM_WREG * 6 +
1731 SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 8 +
1732 8 + /* vcn_v1_0_dec_ring_emit_vm_flush */
1733 14 + 14 + /* vcn_v1_0_dec_ring_emit_fence x2 vm fence */
1735 .emit_ib_size = 22, /* vcn_v1_0_dec_ring_emit_ib */
1736 .emit_ib = vcn_v1_0_jpeg_ring_emit_ib,
1737 .emit_fence = vcn_v1_0_jpeg_ring_emit_fence,
1738 .emit_vm_flush = vcn_v1_0_jpeg_ring_emit_vm_flush,
1739 .test_ring = amdgpu_vcn_jpeg_ring_test_ring,
1740 .test_ib = amdgpu_vcn_jpeg_ring_test_ib,
1741 .insert_nop = vcn_v1_0_jpeg_ring_nop,
1742 .insert_start = vcn_v1_0_jpeg_ring_insert_start,
1743 .insert_end = vcn_v1_0_jpeg_ring_insert_end,
1744 .pad_ib = amdgpu_ring_generic_pad_ib,
1745 .begin_use = amdgpu_vcn_ring_begin_use,
1746 .end_use = amdgpu_vcn_ring_end_use,
1747 .emit_wreg = vcn_v1_0_jpeg_ring_emit_wreg,
1748 .emit_reg_wait = vcn_v1_0_jpeg_ring_emit_reg_wait,
1751 static void vcn_v1_0_set_dec_ring_funcs(struct amdgpu_device *adev)
1753 adev->vcn.ring_dec.funcs = &vcn_v1_0_dec_ring_vm_funcs;
1754 DRM_INFO("VCN decode is enabled in VM mode\n");
1757 static void vcn_v1_0_set_enc_ring_funcs(struct amdgpu_device *adev)
1761 for (i = 0; i < adev->vcn.num_enc_rings; ++i)
1762 adev->vcn.ring_enc[i].funcs = &vcn_v1_0_enc_ring_vm_funcs;
1764 DRM_INFO("VCN encode is enabled in VM mode\n");
1767 static void vcn_v1_0_set_jpeg_ring_funcs(struct amdgpu_device *adev)
1769 adev->vcn.ring_jpeg.funcs = &vcn_v1_0_jpeg_ring_vm_funcs;
1770 DRM_INFO("VCN jpeg decode is enabled in VM mode\n");
1773 static const struct amdgpu_irq_src_funcs vcn_v1_0_irq_funcs = {
1774 .set = vcn_v1_0_set_interrupt_state,
1775 .process = vcn_v1_0_process_interrupt,
1778 static void vcn_v1_0_set_irq_funcs(struct amdgpu_device *adev)
1780 adev->vcn.irq.num_types = adev->vcn.num_enc_rings + 1;
1781 adev->vcn.irq.funcs = &vcn_v1_0_irq_funcs;
/*
 * Exported IP block descriptor for VCN 1.0; binds the VCN block type to
 * vcn_v1_0_ip_funcs.
 *
 * NOTE(review): the embedded numbering skips 1785 and 1787-1789, and nothing
 * follows 1790, so the opening brace, further fields and the closing '};'
 * are not visible in this view.
 */
1784 const struct amdgpu_ip_block_version vcn_v1_0_ip_block =
1786 .type = AMD_IP_BLOCK_TYPE_VCN,
1790 .funcs = &vcn_v1_0_ip_funcs,