1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24#include "amdgpu.h"
25#include "amdgpu_jpeg.h"
26#include "soc15.h"
27#include "soc15d.h"
28#include "jpeg_v2_0.h"
29
30#include "vcn/vcn_2_5_offset.h"
31#include "vcn/vcn_2_5_sh_mask.h"
32#include "ivsrcid/vcn/irqsrcs_vcn_2_0.h"
33
34#define mmUVD_JPEG_PITCH_INTERNAL_OFFSET 0x401f
35
36#define JPEG25_MAX_HW_INSTANCES_ARCTURUS 2
37
38static void jpeg_v2_5_set_dec_ring_funcs(struct amdgpu_device *adev);
39static void jpeg_v2_5_set_irq_funcs(struct amdgpu_device *adev);
40static int jpeg_v2_5_set_powergating_state(void *handle,
41 enum amd_powergating_state state);
42
43static int amdgpu_ih_clientid_jpeg[] = {
44 SOC15_IH_CLIENTID_VCN,
45 SOC15_IH_CLIENTID_VCN1
46};
47
48
49
50
51
52
53
54
55static int jpeg_v2_5_early_init(void *handle)
56{
57 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
58 if (adev->asic_type == CHIP_ARCTURUS) {
59 u32 harvest;
60 int i;
61
62 adev->jpeg.num_jpeg_inst = JPEG25_MAX_HW_INSTANCES_ARCTURUS;
63 for (i = 0; i < adev->jpeg.num_jpeg_inst; i++) {
64 harvest = RREG32_SOC15(JPEG, i, mmCC_UVD_HARVESTING);
65 if (harvest & CC_UVD_HARVESTING__UVD_DISABLE_MASK)
66 adev->jpeg.harvest_config |= 1 << i;
67 }
68
69 if (adev->jpeg.harvest_config == (AMDGPU_JPEG_HARVEST_JPEG0 |
70 AMDGPU_JPEG_HARVEST_JPEG1))
71 return -ENOENT;
72 } else
73 adev->jpeg.num_jpeg_inst = 1;
74
75 jpeg_v2_5_set_dec_ring_funcs(adev);
76 jpeg_v2_5_set_irq_funcs(adev);
77
78 return 0;
79}
80
81
82
83
84
85
86
87
88static int jpeg_v2_5_sw_init(void *handle)
89{
90 struct amdgpu_ring *ring;
91 int i, r;
92 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
93
94 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
95 if (adev->jpeg.harvest_config & (1 << i))
96 continue;
97
98
99 r = amdgpu_irq_add_id(adev, amdgpu_ih_clientid_jpeg[i],
100 VCN_2_0__SRCID__JPEG_DECODE, &adev->jpeg.inst[i].irq);
101 if (r)
102 return r;
103 }
104
105 r = amdgpu_jpeg_sw_init(adev);
106 if (r)
107 return r;
108
109 r = amdgpu_jpeg_resume(adev);
110 if (r)
111 return r;
112
113 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
114 if (adev->jpeg.harvest_config & (1 << i))
115 continue;
116
117 ring = &adev->jpeg.inst[i].ring_dec;
118 ring->use_doorbell = true;
119 ring->doorbell_index = (adev->doorbell_index.vcn.vcn_ring0_1 << 1) + 1 + 8 * i;
120 sprintf(ring->name, "jpeg_dec_%d", i);
121 r = amdgpu_ring_init(adev, ring, 512, &adev->jpeg.inst[i].irq,
122 0, AMDGPU_RING_PRIO_DEFAULT);
123 if (r)
124 return r;
125
126 adev->jpeg.internal.jpeg_pitch = mmUVD_JPEG_PITCH_INTERNAL_OFFSET;
127 adev->jpeg.inst[i].external.jpeg_pitch = SOC15_REG_OFFSET(JPEG, i, mmUVD_JPEG_PITCH);
128 }
129
130 return 0;
131}
132
133
134
135
136
137
138
139
140static int jpeg_v2_5_sw_fini(void *handle)
141{
142 int r;
143 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
144
145 r = amdgpu_jpeg_suspend(adev);
146 if (r)
147 return r;
148
149 r = amdgpu_jpeg_sw_fini(adev);
150
151 return r;
152}
153
154
155
156
157
158
159
160static int jpeg_v2_5_hw_init(void *handle)
161{
162 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
163 struct amdgpu_ring *ring;
164 int i, r;
165
166 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
167 if (adev->jpeg.harvest_config & (1 << i))
168 continue;
169
170 ring = &adev->jpeg.inst[i].ring_dec;
171 adev->nbio.funcs->vcn_doorbell_range(adev, ring->use_doorbell,
172 (adev->doorbell_index.vcn.vcn_ring0_1 << 1) + 8 * i, i);
173
174 r = amdgpu_ring_test_helper(ring);
175 if (r)
176 return r;
177 }
178
179 DRM_INFO("JPEG decode initialized successfully.\n");
180
181 return 0;
182}
183
184
185
186
187
188
189
190
191static int jpeg_v2_5_hw_fini(void *handle)
192{
193 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
194 struct amdgpu_ring *ring;
195 int i;
196
197 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
198 if (adev->jpeg.harvest_config & (1 << i))
199 continue;
200
201 ring = &adev->jpeg.inst[i].ring_dec;
202 if (adev->jpeg.cur_state != AMD_PG_STATE_GATE &&
203 RREG32_SOC15(JPEG, i, mmUVD_JRBC_STATUS))
204 jpeg_v2_5_set_powergating_state(adev, AMD_PG_STATE_GATE);
205
206 ring->sched.ready = false;
207 }
208
209 return 0;
210}
211
212
213
214
215
216
217
218
219static int jpeg_v2_5_suspend(void *handle)
220{
221 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
222 int r;
223
224 r = jpeg_v2_5_hw_fini(adev);
225 if (r)
226 return r;
227
228 r = amdgpu_jpeg_suspend(adev);
229
230 return r;
231}
232
233
234
235
236
237
238
239
240static int jpeg_v2_5_resume(void *handle)
241{
242 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
243 int r;
244
245 r = amdgpu_jpeg_resume(adev);
246 if (r)
247 return r;
248
249 r = jpeg_v2_5_hw_init(adev);
250
251 return r;
252}
253
254static void jpeg_v2_5_disable_clock_gating(struct amdgpu_device* adev, int inst)
255{
256 uint32_t data;
257
258 data = RREG32_SOC15(JPEG, inst, mmJPEG_CGC_CTRL);
259 if (adev->cg_flags & AMD_CG_SUPPORT_JPEG_MGCG)
260 data |= 1 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
261 else
262 data &= ~JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
263
264 data |= 1 << JPEG_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
265 data |= 4 << JPEG_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
266 WREG32_SOC15(JPEG, inst, mmJPEG_CGC_CTRL, data);
267
268 data = RREG32_SOC15(JPEG, inst, mmJPEG_CGC_GATE);
269 data &= ~(JPEG_CGC_GATE__JPEG_DEC_MASK
270 | JPEG_CGC_GATE__JPEG2_DEC_MASK
271 | JPEG_CGC_GATE__JMCIF_MASK
272 | JPEG_CGC_GATE__JRBBM_MASK);
273 WREG32_SOC15(JPEG, inst, mmJPEG_CGC_GATE, data);
274
275 data = RREG32_SOC15(JPEG, inst, mmJPEG_CGC_CTRL);
276 data &= ~(JPEG_CGC_CTRL__JPEG_DEC_MODE_MASK
277 | JPEG_CGC_CTRL__JPEG2_DEC_MODE_MASK
278 | JPEG_CGC_CTRL__JMCIF_MODE_MASK
279 | JPEG_CGC_CTRL__JRBBM_MODE_MASK);
280 WREG32_SOC15(JPEG, inst, mmJPEG_CGC_CTRL, data);
281}
282
283static void jpeg_v2_5_enable_clock_gating(struct amdgpu_device* adev, int inst)
284{
285 uint32_t data;
286
287 data = RREG32_SOC15(JPEG, inst, mmJPEG_CGC_GATE);
288 data |= (JPEG_CGC_GATE__JPEG_DEC_MASK
289 |JPEG_CGC_GATE__JPEG2_DEC_MASK
290 |JPEG_CGC_GATE__JPEG_ENC_MASK
291 |JPEG_CGC_GATE__JMCIF_MASK
292 |JPEG_CGC_GATE__JRBBM_MASK);
293 WREG32_SOC15(JPEG, inst, mmJPEG_CGC_GATE, data);
294}
295
296
297
298
299
300
301
302
303static int jpeg_v2_5_start(struct amdgpu_device *adev)
304{
305 struct amdgpu_ring *ring;
306 int i;
307
308 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
309 if (adev->jpeg.harvest_config & (1 << i))
310 continue;
311
312 ring = &adev->jpeg.inst[i].ring_dec;
313
314 WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmUVD_JPEG_POWER_STATUS), 0,
315 ~UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_MASK);
316
317
318 jpeg_v2_5_disable_clock_gating(adev, i);
319
320
321 WREG32_SOC15(JPEG, i, mmJPEG_DEC_GFX8_ADDR_CONFIG,
322 adev->gfx.config.gb_addr_config);
323 WREG32_SOC15(JPEG, i, mmJPEG_DEC_GFX10_ADDR_CONFIG,
324 adev->gfx.config.gb_addr_config);
325
326
327 WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmUVD_JMI_CNTL), 0,
328 ~UVD_JMI_CNTL__SOFT_RESET_MASK);
329
330
331 WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmJPEG_SYS_INT_EN),
332 JPEG_SYS_INT_EN__DJRBC_MASK,
333 ~JPEG_SYS_INT_EN__DJRBC_MASK);
334
335 WREG32_SOC15(JPEG, i, mmUVD_LMI_JRBC_RB_VMID, 0);
336 WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_CNTL, (0x00000001L | 0x00000002L));
337 WREG32_SOC15(JPEG, i, mmUVD_LMI_JRBC_RB_64BIT_BAR_LOW,
338 lower_32_bits(ring->gpu_addr));
339 WREG32_SOC15(JPEG, i, mmUVD_LMI_JRBC_RB_64BIT_BAR_HIGH,
340 upper_32_bits(ring->gpu_addr));
341 WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_RPTR, 0);
342 WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_WPTR, 0);
343 WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_CNTL, 0x00000002L);
344 WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_SIZE, ring->ring_size / 4);
345 ring->wptr = RREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_WPTR);
346 }
347
348 return 0;
349}
350
351
352
353
354
355
356
357
358static int jpeg_v2_5_stop(struct amdgpu_device *adev)
359{
360 int i;
361
362 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
363 if (adev->jpeg.harvest_config & (1 << i))
364 continue;
365
366
367 WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmUVD_JMI_CNTL),
368 UVD_JMI_CNTL__SOFT_RESET_MASK,
369 ~UVD_JMI_CNTL__SOFT_RESET_MASK);
370
371 jpeg_v2_5_enable_clock_gating(adev, i);
372
373
374 WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmUVD_JPEG_POWER_STATUS),
375 UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_MASK,
376 ~UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_MASK);
377 }
378
379 return 0;
380}
381
382
383
384
385
386
387
388
389static uint64_t jpeg_v2_5_dec_ring_get_rptr(struct amdgpu_ring *ring)
390{
391 struct amdgpu_device *adev = ring->adev;
392
393 return RREG32_SOC15(JPEG, ring->me, mmUVD_JRBC_RB_RPTR);
394}
395
396
397
398
399
400
401
402
403static uint64_t jpeg_v2_5_dec_ring_get_wptr(struct amdgpu_ring *ring)
404{
405 struct amdgpu_device *adev = ring->adev;
406
407 if (ring->use_doorbell)
408 return adev->wb.wb[ring->wptr_offs];
409 else
410 return RREG32_SOC15(JPEG, ring->me, mmUVD_JRBC_RB_WPTR);
411}
412
413
414
415
416
417
418
419
420static void jpeg_v2_5_dec_ring_set_wptr(struct amdgpu_ring *ring)
421{
422 struct amdgpu_device *adev = ring->adev;
423
424 if (ring->use_doorbell) {
425 adev->wb.wb[ring->wptr_offs] = lower_32_bits(ring->wptr);
426 WDOORBELL32(ring->doorbell_index, lower_32_bits(ring->wptr));
427 } else {
428 WREG32_SOC15(JPEG, ring->me, mmUVD_JRBC_RB_WPTR, lower_32_bits(ring->wptr));
429 }
430}
431
432static bool jpeg_v2_5_is_idle(void *handle)
433{
434 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
435 int i, ret = 1;
436
437 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
438 if (adev->jpeg.harvest_config & (1 << i))
439 continue;
440
441 ret &= (((RREG32_SOC15(JPEG, i, mmUVD_JRBC_STATUS) &
442 UVD_JRBC_STATUS__RB_JOB_DONE_MASK) ==
443 UVD_JRBC_STATUS__RB_JOB_DONE_MASK));
444 }
445
446 return ret;
447}
448
449static int jpeg_v2_5_wait_for_idle(void *handle)
450{
451 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
452 int i, ret;
453
454 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
455 if (adev->jpeg.harvest_config & (1 << i))
456 continue;
457
458 ret = SOC15_WAIT_ON_RREG(JPEG, i, mmUVD_JRBC_STATUS,
459 UVD_JRBC_STATUS__RB_JOB_DONE_MASK,
460 UVD_JRBC_STATUS__RB_JOB_DONE_MASK);
461 if (ret)
462 return ret;
463 }
464
465 return 0;
466}
467
468static int jpeg_v2_5_set_clockgating_state(void *handle,
469 enum amd_clockgating_state state)
470{
471 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
472 bool enable = (state == AMD_CG_STATE_GATE);
473 int i;
474
475 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
476 if (adev->jpeg.harvest_config & (1 << i))
477 continue;
478
479 if (enable) {
480 if (!jpeg_v2_5_is_idle(handle))
481 return -EBUSY;
482 jpeg_v2_5_enable_clock_gating(adev, i);
483 } else {
484 jpeg_v2_5_disable_clock_gating(adev, i);
485 }
486 }
487
488 return 0;
489}
490
491static int jpeg_v2_5_set_powergating_state(void *handle,
492 enum amd_powergating_state state)
493{
494 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
495 int ret;
496
497 if(state == adev->jpeg.cur_state)
498 return 0;
499
500 if (state == AMD_PG_STATE_GATE)
501 ret = jpeg_v2_5_stop(adev);
502 else
503 ret = jpeg_v2_5_start(adev);
504
505 if(!ret)
506 adev->jpeg.cur_state = state;
507
508 return ret;
509}
510
511static int jpeg_v2_5_set_interrupt_state(struct amdgpu_device *adev,
512 struct amdgpu_irq_src *source,
513 unsigned type,
514 enum amdgpu_interrupt_state state)
515{
516 return 0;
517}
518
519static int jpeg_v2_5_process_interrupt(struct amdgpu_device *adev,
520 struct amdgpu_irq_src *source,
521 struct amdgpu_iv_entry *entry)
522{
523 uint32_t ip_instance;
524
525 switch (entry->client_id) {
526 case SOC15_IH_CLIENTID_VCN:
527 ip_instance = 0;
528 break;
529 case SOC15_IH_CLIENTID_VCN1:
530 ip_instance = 1;
531 break;
532 default:
533 DRM_ERROR("Unhandled client id: %d\n", entry->client_id);
534 return 0;
535 }
536
537 DRM_DEBUG("IH: JPEG TRAP\n");
538
539 switch (entry->src_id) {
540 case VCN_2_0__SRCID__JPEG_DECODE:
541 amdgpu_fence_process(&adev->jpeg.inst[ip_instance].ring_dec);
542 break;
543 default:
544 DRM_ERROR("Unhandled interrupt: %d %d\n",
545 entry->src_id, entry->src_data[0]);
546 break;
547 }
548
549 return 0;
550}
551
552static const struct amd_ip_funcs jpeg_v2_5_ip_funcs = {
553 .name = "jpeg_v2_5",
554 .early_init = jpeg_v2_5_early_init,
555 .late_init = NULL,
556 .sw_init = jpeg_v2_5_sw_init,
557 .sw_fini = jpeg_v2_5_sw_fini,
558 .hw_init = jpeg_v2_5_hw_init,
559 .hw_fini = jpeg_v2_5_hw_fini,
560 .suspend = jpeg_v2_5_suspend,
561 .resume = jpeg_v2_5_resume,
562 .is_idle = jpeg_v2_5_is_idle,
563 .wait_for_idle = jpeg_v2_5_wait_for_idle,
564 .check_soft_reset = NULL,
565 .pre_soft_reset = NULL,
566 .soft_reset = NULL,
567 .post_soft_reset = NULL,
568 .set_clockgating_state = jpeg_v2_5_set_clockgating_state,
569 .set_powergating_state = jpeg_v2_5_set_powergating_state,
570};
571
572static const struct amdgpu_ring_funcs jpeg_v2_5_dec_ring_vm_funcs = {
573 .type = AMDGPU_RING_TYPE_VCN_JPEG,
574 .align_mask = 0xf,
575 .vmhub = AMDGPU_MMHUB_1,
576 .get_rptr = jpeg_v2_5_dec_ring_get_rptr,
577 .get_wptr = jpeg_v2_5_dec_ring_get_wptr,
578 .set_wptr = jpeg_v2_5_dec_ring_set_wptr,
579 .emit_frame_size =
580 SOC15_FLUSH_GPU_TLB_NUM_WREG * 6 +
581 SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 8 +
582 8 +
583 18 + 18 +
584 8 + 16,
585 .emit_ib_size = 22,
586 .emit_ib = jpeg_v2_0_dec_ring_emit_ib,
587 .emit_fence = jpeg_v2_0_dec_ring_emit_fence,
588 .emit_vm_flush = jpeg_v2_0_dec_ring_emit_vm_flush,
589 .test_ring = amdgpu_jpeg_dec_ring_test_ring,
590 .test_ib = amdgpu_jpeg_dec_ring_test_ib,
591 .insert_nop = jpeg_v2_0_dec_ring_nop,
592 .insert_start = jpeg_v2_0_dec_ring_insert_start,
593 .insert_end = jpeg_v2_0_dec_ring_insert_end,
594 .pad_ib = amdgpu_ring_generic_pad_ib,
595 .begin_use = amdgpu_jpeg_ring_begin_use,
596 .end_use = amdgpu_jpeg_ring_end_use,
597 .emit_wreg = jpeg_v2_0_dec_ring_emit_wreg,
598 .emit_reg_wait = jpeg_v2_0_dec_ring_emit_reg_wait,
599 .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
600};
601
602static void jpeg_v2_5_set_dec_ring_funcs(struct amdgpu_device *adev)
603{
604 int i;
605
606 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
607 if (adev->jpeg.harvest_config & (1 << i))
608 continue;
609
610 adev->jpeg.inst[i].ring_dec.funcs = &jpeg_v2_5_dec_ring_vm_funcs;
611 adev->jpeg.inst[i].ring_dec.me = i;
612 DRM_INFO("JPEG(%d) JPEG decode is enabled in VM mode\n", i);
613 }
614}
615
616static const struct amdgpu_irq_src_funcs jpeg_v2_5_irq_funcs = {
617 .set = jpeg_v2_5_set_interrupt_state,
618 .process = jpeg_v2_5_process_interrupt,
619};
620
621static void jpeg_v2_5_set_irq_funcs(struct amdgpu_device *adev)
622{
623 int i;
624
625 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
626 if (adev->jpeg.harvest_config & (1 << i))
627 continue;
628
629 adev->jpeg.inst[i].irq.num_types = 1;
630 adev->jpeg.inst[i].irq.funcs = &jpeg_v2_5_irq_funcs;
631 }
632}
633
634const struct amdgpu_ip_block_version jpeg_v2_5_ip_block =
635{
636 .type = AMD_IP_BLOCK_TYPE_JPEG,
637 .major = 2,
638 .minor = 5,
639 .rev = 0,
640 .funcs = &jpeg_v2_5_ip_funcs,
641};
642