/*
 * Copyright 2019 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 */
25 #include "amdgpu_jpeg.h"
28 #include "jpeg_v2_0.h"
30 #include "vcn/vcn_2_5_offset.h"
31 #include "vcn/vcn_2_5_sh_mask.h"
32 #include "ivsrcid/vcn/irqsrcs_vcn_2_0.h"
34 #define mmUVD_JPEG_PITCH_INTERNAL_OFFSET 0x401f
36 #define JPEG25_MAX_HW_INSTANCES_ARCTURUS 2
/* Forward declarations for helpers that are defined later in this file. */
static void jpeg_v2_5_set_dec_ring_funcs(struct amdgpu_device *adev);
static void jpeg_v2_5_set_irq_funcs(struct amdgpu_device *adev);
static int jpeg_v2_5_set_powergating_state(void *handle,
				enum amd_powergating_state state);
43 static int amdgpu_ih_clientid_jpeg[] = {
44 SOC15_IH_CLIENTID_VCN,
45 SOC15_IH_CLIENTID_VCN1
49 * jpeg_v2_5_early_init - set function pointers
51 * @handle: amdgpu_device pointer
53 * Set ring and irq function pointers
55 static int jpeg_v2_5_early_init(void *handle)
57 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
61 adev->jpeg.num_jpeg_inst = JPEG25_MAX_HW_INSTANCES_ARCTURUS;
62 for (i = 0; i < adev->jpeg.num_jpeg_inst; i++) {
63 harvest = RREG32_SOC15(JPEG, i, mmCC_UVD_HARVESTING);
64 if (harvest & CC_UVD_HARVESTING__UVD_DISABLE_MASK)
65 adev->jpeg.harvest_config |= 1 << i;
67 if (adev->jpeg.harvest_config == (AMDGPU_JPEG_HARVEST_JPEG0 |
68 AMDGPU_JPEG_HARVEST_JPEG1))
71 jpeg_v2_5_set_dec_ring_funcs(adev);
72 jpeg_v2_5_set_irq_funcs(adev);
78 * jpeg_v2_5_sw_init - sw init for JPEG block
80 * @handle: amdgpu_device pointer
82 * Load firmware and sw initialization
84 static int jpeg_v2_5_sw_init(void *handle)
86 struct amdgpu_ring *ring;
88 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
90 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
91 if (adev->jpeg.harvest_config & (1 << i))
95 r = amdgpu_irq_add_id(adev, amdgpu_ih_clientid_jpeg[i],
96 VCN_2_0__SRCID__JPEG_DECODE, &adev->jpeg.inst[i].irq);
101 r = amdgpu_jpeg_sw_init(adev);
105 r = amdgpu_jpeg_resume(adev);
109 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
110 if (adev->jpeg.harvest_config & (1 << i))
113 ring = &adev->jpeg.inst[i].ring_dec;
114 ring->use_doorbell = true;
115 ring->doorbell_index = (adev->doorbell_index.vcn.vcn_ring0_1 << 1) + 1 + 8 * i;
116 sprintf(ring->name, "jpeg_dec_%d", i);
117 r = amdgpu_ring_init(adev, ring, 512, &adev->jpeg.inst[i].irq,
118 0, AMDGPU_RING_PRIO_DEFAULT);
122 adev->jpeg.internal.jpeg_pitch = mmUVD_JPEG_PITCH_INTERNAL_OFFSET;
123 adev->jpeg.inst[i].external.jpeg_pitch = SOC15_REG_OFFSET(JPEG, i, mmUVD_JPEG_PITCH);
/**
 * jpeg_v2_5_sw_fini - sw fini for JPEG block
 *
 * @handle: amdgpu_device pointer
 *
 * JPEG suspend and free up sw allocation.
 *
 * Returns 0 on success; if the suspend step fails its error is returned and
 * the sw teardown is not attempted.
 */
static int jpeg_v2_5_sw_fini(void *handle)
{
	int r;
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

	r = amdgpu_jpeg_suspend(adev);
	if (r)
		return r;

	r = amdgpu_jpeg_sw_fini(adev);

	return r;
}
151 * jpeg_v2_5_hw_init - start and test JPEG block
153 * @handle: amdgpu_device pointer
156 static int jpeg_v2_5_hw_init(void *handle)
158 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
159 struct amdgpu_ring *ring;
162 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
163 if (adev->jpeg.harvest_config & (1 << i))
166 ring = &adev->jpeg.inst[i].ring_dec;
167 adev->nbio.funcs->vcn_doorbell_range(adev, ring->use_doorbell,
168 (adev->doorbell_index.vcn.vcn_ring0_1 << 1) + 8 * i, i);
170 r = amdgpu_ring_test_helper(ring);
175 DRM_INFO("JPEG decode initialized successfully.\n");
181 * jpeg_v2_5_hw_fini - stop the hardware block
183 * @handle: amdgpu_device pointer
185 * Stop the JPEG block, mark ring as not ready any more
187 static int jpeg_v2_5_hw_fini(void *handle)
189 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
190 struct amdgpu_ring *ring;
193 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
194 if (adev->jpeg.harvest_config & (1 << i))
197 ring = &adev->jpeg.inst[i].ring_dec;
198 if (adev->jpeg.cur_state != AMD_PG_STATE_GATE &&
199 RREG32_SOC15(JPEG, i, mmUVD_JRBC_STATUS))
200 jpeg_v2_5_set_powergating_state(adev, AMD_PG_STATE_GATE);
202 ring->sched.ready = false;
/**
 * jpeg_v2_5_suspend - suspend JPEG block
 *
 * @handle: amdgpu_device pointer
 *
 * HW fini and suspend JPEG block.
 *
 * Returns 0 on success or the error of the first failing step.
 */
static int jpeg_v2_5_suspend(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
	int r;

	r = jpeg_v2_5_hw_fini(adev);
	if (r)
		return r;

	r = amdgpu_jpeg_suspend(adev);

	return r;
}
/**
 * jpeg_v2_5_resume - resume JPEG block
 *
 * @handle: amdgpu_device pointer
 *
 * Resume firmware and hw init JPEG block.
 *
 * Returns 0 on success or the error of the first failing step.
 */
static int jpeg_v2_5_resume(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
	int r;

	r = amdgpu_jpeg_resume(adev);
	if (r)
		return r;

	r = jpeg_v2_5_hw_init(adev);

	return r;
}
250 static void jpeg_v2_5_disable_clock_gating(struct amdgpu_device* adev, int inst)
254 data = RREG32_SOC15(JPEG, inst, mmJPEG_CGC_CTRL);
255 if (adev->cg_flags & AMD_CG_SUPPORT_JPEG_MGCG)
256 data |= 1 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
258 data &= ~JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
260 data |= 1 << JPEG_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
261 data |= 4 << JPEG_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
262 WREG32_SOC15(JPEG, inst, mmJPEG_CGC_CTRL, data);
264 data = RREG32_SOC15(JPEG, inst, mmJPEG_CGC_GATE);
265 data &= ~(JPEG_CGC_GATE__JPEG_DEC_MASK
266 | JPEG_CGC_GATE__JPEG2_DEC_MASK
267 | JPEG_CGC_GATE__JMCIF_MASK
268 | JPEG_CGC_GATE__JRBBM_MASK);
269 WREG32_SOC15(JPEG, inst, mmJPEG_CGC_GATE, data);
271 data = RREG32_SOC15(JPEG, inst, mmJPEG_CGC_CTRL);
272 data &= ~(JPEG_CGC_CTRL__JPEG_DEC_MODE_MASK
273 | JPEG_CGC_CTRL__JPEG2_DEC_MODE_MASK
274 | JPEG_CGC_CTRL__JMCIF_MODE_MASK
275 | JPEG_CGC_CTRL__JRBBM_MODE_MASK);
276 WREG32_SOC15(JPEG, inst, mmJPEG_CGC_CTRL, data);
279 static void jpeg_v2_5_enable_clock_gating(struct amdgpu_device* adev, int inst)
283 data = RREG32_SOC15(JPEG, inst, mmJPEG_CGC_GATE);
284 data |= (JPEG_CGC_GATE__JPEG_DEC_MASK
285 |JPEG_CGC_GATE__JPEG2_DEC_MASK
286 |JPEG_CGC_GATE__JPEG_ENC_MASK
287 |JPEG_CGC_GATE__JMCIF_MASK
288 |JPEG_CGC_GATE__JRBBM_MASK);
289 WREG32_SOC15(JPEG, inst, mmJPEG_CGC_GATE, data);
293 * jpeg_v2_5_start - start JPEG block
295 * @adev: amdgpu_device pointer
297 * Setup and start the JPEG block
299 static int jpeg_v2_5_start(struct amdgpu_device *adev)
301 struct amdgpu_ring *ring;
304 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
305 if (adev->jpeg.harvest_config & (1 << i))
308 ring = &adev->jpeg.inst[i].ring_dec;
309 /* disable anti hang mechanism */
310 WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmUVD_JPEG_POWER_STATUS), 0,
311 ~UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_MASK);
313 /* JPEG disable CGC */
314 jpeg_v2_5_disable_clock_gating(adev, i);
316 /* MJPEG global tiling registers */
317 WREG32_SOC15(JPEG, i, mmJPEG_DEC_GFX8_ADDR_CONFIG,
318 adev->gfx.config.gb_addr_config);
319 WREG32_SOC15(JPEG, i, mmJPEG_DEC_GFX10_ADDR_CONFIG,
320 adev->gfx.config.gb_addr_config);
322 /* enable JMI channel */
323 WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmUVD_JMI_CNTL), 0,
324 ~UVD_JMI_CNTL__SOFT_RESET_MASK);
326 /* enable System Interrupt for JRBC */
327 WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmJPEG_SYS_INT_EN),
328 JPEG_SYS_INT_EN__DJRBC_MASK,
329 ~JPEG_SYS_INT_EN__DJRBC_MASK);
331 WREG32_SOC15(JPEG, i, mmUVD_LMI_JRBC_RB_VMID, 0);
332 WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_CNTL, (0x00000001L | 0x00000002L));
333 WREG32_SOC15(JPEG, i, mmUVD_LMI_JRBC_RB_64BIT_BAR_LOW,
334 lower_32_bits(ring->gpu_addr));
335 WREG32_SOC15(JPEG, i, mmUVD_LMI_JRBC_RB_64BIT_BAR_HIGH,
336 upper_32_bits(ring->gpu_addr));
337 WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_RPTR, 0);
338 WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_WPTR, 0);
339 WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_CNTL, 0x00000002L);
340 WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_SIZE, ring->ring_size / 4);
341 ring->wptr = RREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_WPTR);
348 * jpeg_v2_5_stop - stop JPEG block
350 * @adev: amdgpu_device pointer
352 * stop the JPEG block
354 static int jpeg_v2_5_stop(struct amdgpu_device *adev)
358 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
359 if (adev->jpeg.harvest_config & (1 << i))
363 WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmUVD_JMI_CNTL),
364 UVD_JMI_CNTL__SOFT_RESET_MASK,
365 ~UVD_JMI_CNTL__SOFT_RESET_MASK);
367 jpeg_v2_5_enable_clock_gating(adev, i);
369 /* enable anti hang mechanism */
370 WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmUVD_JPEG_POWER_STATUS),
371 UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_MASK,
372 ~UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_MASK);
379 * jpeg_v2_5_dec_ring_get_rptr - get read pointer
381 * @ring: amdgpu_ring pointer
383 * Returns the current hardware read pointer
385 static uint64_t jpeg_v2_5_dec_ring_get_rptr(struct amdgpu_ring *ring)
387 struct amdgpu_device *adev = ring->adev;
389 return RREG32_SOC15(JPEG, ring->me, mmUVD_JRBC_RB_RPTR);
393 * jpeg_v2_5_dec_ring_get_wptr - get write pointer
395 * @ring: amdgpu_ring pointer
397 * Returns the current hardware write pointer
399 static uint64_t jpeg_v2_5_dec_ring_get_wptr(struct amdgpu_ring *ring)
401 struct amdgpu_device *adev = ring->adev;
403 if (ring->use_doorbell)
404 return adev->wb.wb[ring->wptr_offs];
406 return RREG32_SOC15(JPEG, ring->me, mmUVD_JRBC_RB_WPTR);
410 * jpeg_v2_5_dec_ring_set_wptr - set write pointer
412 * @ring: amdgpu_ring pointer
414 * Commits the write pointer to the hardware
416 static void jpeg_v2_5_dec_ring_set_wptr(struct amdgpu_ring *ring)
418 struct amdgpu_device *adev = ring->adev;
420 if (ring->use_doorbell) {
421 adev->wb.wb[ring->wptr_offs] = lower_32_bits(ring->wptr);
422 WDOORBELL32(ring->doorbell_index, lower_32_bits(ring->wptr));
424 WREG32_SOC15(JPEG, ring->me, mmUVD_JRBC_RB_WPTR, lower_32_bits(ring->wptr));
428 static bool jpeg_v2_5_is_idle(void *handle)
430 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
433 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
434 if (adev->jpeg.harvest_config & (1 << i))
437 ret &= (((RREG32_SOC15(JPEG, i, mmUVD_JRBC_STATUS) &
438 UVD_JRBC_STATUS__RB_JOB_DONE_MASK) ==
439 UVD_JRBC_STATUS__RB_JOB_DONE_MASK));
445 static int jpeg_v2_5_wait_for_idle(void *handle)
447 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
450 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
451 if (adev->jpeg.harvest_config & (1 << i))
454 ret = SOC15_WAIT_ON_RREG(JPEG, i, mmUVD_JRBC_STATUS,
455 UVD_JRBC_STATUS__RB_JOB_DONE_MASK,
456 UVD_JRBC_STATUS__RB_JOB_DONE_MASK);
464 static int jpeg_v2_5_set_clockgating_state(void *handle,
465 enum amd_clockgating_state state)
467 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
468 bool enable = (state == AMD_CG_STATE_GATE);
471 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
472 if (adev->jpeg.harvest_config & (1 << i))
476 if (!jpeg_v2_5_is_idle(handle))
478 jpeg_v2_5_enable_clock_gating(adev, i);
480 jpeg_v2_5_disable_clock_gating(adev, i);
487 static int jpeg_v2_5_set_powergating_state(void *handle,
488 enum amd_powergating_state state)
490 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
493 if(state == adev->jpeg.cur_state)
496 if (state == AMD_PG_STATE_GATE)
497 ret = jpeg_v2_5_stop(adev);
499 ret = jpeg_v2_5_start(adev);
502 adev->jpeg.cur_state = state;
507 static int jpeg_v2_5_set_interrupt_state(struct amdgpu_device *adev,
508 struct amdgpu_irq_src *source,
510 enum amdgpu_interrupt_state state)
515 static int jpeg_v2_5_process_interrupt(struct amdgpu_device *adev,
516 struct amdgpu_irq_src *source,
517 struct amdgpu_iv_entry *entry)
519 uint32_t ip_instance;
521 switch (entry->client_id) {
522 case SOC15_IH_CLIENTID_VCN:
525 case SOC15_IH_CLIENTID_VCN1:
529 DRM_ERROR("Unhandled client id: %d\n", entry->client_id);
533 DRM_DEBUG("IH: JPEG TRAP\n");
535 switch (entry->src_id) {
536 case VCN_2_0__SRCID__JPEG_DECODE:
537 amdgpu_fence_process(&adev->jpeg.inst[ip_instance].ring_dec);
540 DRM_ERROR("Unhandled interrupt: %d %d\n",
541 entry->src_id, entry->src_data[0]);
548 static const struct amd_ip_funcs jpeg_v2_5_ip_funcs = {
550 .early_init = jpeg_v2_5_early_init,
552 .sw_init = jpeg_v2_5_sw_init,
553 .sw_fini = jpeg_v2_5_sw_fini,
554 .hw_init = jpeg_v2_5_hw_init,
555 .hw_fini = jpeg_v2_5_hw_fini,
556 .suspend = jpeg_v2_5_suspend,
557 .resume = jpeg_v2_5_resume,
558 .is_idle = jpeg_v2_5_is_idle,
559 .wait_for_idle = jpeg_v2_5_wait_for_idle,
560 .check_soft_reset = NULL,
561 .pre_soft_reset = NULL,
563 .post_soft_reset = NULL,
564 .set_clockgating_state = jpeg_v2_5_set_clockgating_state,
565 .set_powergating_state = jpeg_v2_5_set_powergating_state,
568 static const struct amdgpu_ring_funcs jpeg_v2_5_dec_ring_vm_funcs = {
569 .type = AMDGPU_RING_TYPE_VCN_JPEG,
571 .vmhub = AMDGPU_MMHUB_1,
572 .get_rptr = jpeg_v2_5_dec_ring_get_rptr,
573 .get_wptr = jpeg_v2_5_dec_ring_get_wptr,
574 .set_wptr = jpeg_v2_5_dec_ring_set_wptr,
576 SOC15_FLUSH_GPU_TLB_NUM_WREG * 6 +
577 SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 8 +
578 8 + /* jpeg_v2_5_dec_ring_emit_vm_flush */
579 18 + 18 + /* jpeg_v2_5_dec_ring_emit_fence x2 vm fence */
581 .emit_ib_size = 22, /* jpeg_v2_5_dec_ring_emit_ib */
582 .emit_ib = jpeg_v2_0_dec_ring_emit_ib,
583 .emit_fence = jpeg_v2_0_dec_ring_emit_fence,
584 .emit_vm_flush = jpeg_v2_0_dec_ring_emit_vm_flush,
585 .test_ring = amdgpu_jpeg_dec_ring_test_ring,
586 .test_ib = amdgpu_jpeg_dec_ring_test_ib,
587 .insert_nop = jpeg_v2_0_dec_ring_nop,
588 .insert_start = jpeg_v2_0_dec_ring_insert_start,
589 .insert_end = jpeg_v2_0_dec_ring_insert_end,
590 .pad_ib = amdgpu_ring_generic_pad_ib,
591 .begin_use = amdgpu_jpeg_ring_begin_use,
592 .end_use = amdgpu_jpeg_ring_end_use,
593 .emit_wreg = jpeg_v2_0_dec_ring_emit_wreg,
594 .emit_reg_wait = jpeg_v2_0_dec_ring_emit_reg_wait,
595 .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
598 static void jpeg_v2_5_set_dec_ring_funcs(struct amdgpu_device *adev)
602 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
603 if (adev->jpeg.harvest_config & (1 << i))
606 adev->jpeg.inst[i].ring_dec.funcs = &jpeg_v2_5_dec_ring_vm_funcs;
607 adev->jpeg.inst[i].ring_dec.me = i;
608 DRM_INFO("JPEG(%d) JPEG decode is enabled in VM mode\n", i);
612 static const struct amdgpu_irq_src_funcs jpeg_v2_5_irq_funcs = {
613 .set = jpeg_v2_5_set_interrupt_state,
614 .process = jpeg_v2_5_process_interrupt,
617 static void jpeg_v2_5_set_irq_funcs(struct amdgpu_device *adev)
621 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
622 if (adev->jpeg.harvest_config & (1 << i))
625 adev->jpeg.inst[i].irq.num_types = 1;
626 adev->jpeg.inst[i].irq.funcs = &jpeg_v2_5_irq_funcs;
630 const struct amdgpu_ip_block_version jpeg_v2_5_ip_block =
632 .type = AMD_IP_BLOCK_TYPE_JPEG,
636 .funcs = &jpeg_v2_5_ip_funcs,