Loading...
1/*
2 * Copyright 2019 Advanced Micro Devices, Inc.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
21 *
22 */
23
24#include "amdgpu.h"
25#include "amdgpu_jpeg.h"
26#include "soc15.h"
27#include "soc15d.h"
28#include "jpeg_v2_0.h"
29#include "jpeg_v2_5.h"
30
31#include "vcn/vcn_2_5_offset.h"
32#include "vcn/vcn_2_5_sh_mask.h"
33#include "ivsrcid/vcn/irqsrcs_vcn_2_0.h"
34
35#define mmUVD_JPEG_PITCH_INTERNAL_OFFSET 0x401f
36
37#define JPEG25_MAX_HW_INSTANCES_ARCTURUS 2
38
39static void jpeg_v2_5_set_dec_ring_funcs(struct amdgpu_device *adev);
40static void jpeg_v2_5_set_irq_funcs(struct amdgpu_device *adev);
41static int jpeg_v2_5_set_powergating_state(void *handle,
42 enum amd_powergating_state state);
43static void jpeg_v2_5_set_ras_funcs(struct amdgpu_device *adev);
44
45static int amdgpu_ih_clientid_jpeg[] = {
46 SOC15_IH_CLIENTID_VCN,
47 SOC15_IH_CLIENTID_VCN1
48};
49
50/**
51 * jpeg_v2_5_early_init - set function pointers
52 *
53 * @handle: amdgpu_device pointer
54 *
55 * Set ring and irq function pointers
56 */
57static int jpeg_v2_5_early_init(void *handle)
58{
59 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
60 u32 harvest;
61 int i;
62
63 adev->jpeg.num_jpeg_rings = 1;
64 adev->jpeg.num_jpeg_inst = JPEG25_MAX_HW_INSTANCES_ARCTURUS;
65 for (i = 0; i < adev->jpeg.num_jpeg_inst; i++) {
66 harvest = RREG32_SOC15(JPEG, i, mmCC_UVD_HARVESTING);
67 if (harvest & CC_UVD_HARVESTING__UVD_DISABLE_MASK)
68 adev->jpeg.harvest_config |= 1 << i;
69 }
70 if (adev->jpeg.harvest_config == (AMDGPU_JPEG_HARVEST_JPEG0 |
71 AMDGPU_JPEG_HARVEST_JPEG1))
72 return -ENOENT;
73
74 jpeg_v2_5_set_dec_ring_funcs(adev);
75 jpeg_v2_5_set_irq_funcs(adev);
76 jpeg_v2_5_set_ras_funcs(adev);
77
78 return 0;
79}
80
81/**
82 * jpeg_v2_5_sw_init - sw init for JPEG block
83 *
84 * @handle: amdgpu_device pointer
85 *
86 * Load firmware and sw initialization
87 */
88static int jpeg_v2_5_sw_init(void *handle)
89{
90 struct amdgpu_ring *ring;
91 int i, r;
92 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
93
94 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
95 if (adev->jpeg.harvest_config & (1 << i))
96 continue;
97
98 /* JPEG TRAP */
99 r = amdgpu_irq_add_id(adev, amdgpu_ih_clientid_jpeg[i],
100 VCN_2_0__SRCID__JPEG_DECODE, &adev->jpeg.inst[i].irq);
101 if (r)
102 return r;
103
104 /* JPEG DJPEG POISON EVENT */
105 r = amdgpu_irq_add_id(adev, amdgpu_ih_clientid_jpeg[i],
106 VCN_2_6__SRCID_DJPEG0_POISON, &adev->jpeg.inst[i].ras_poison_irq);
107 if (r)
108 return r;
109
110 /* JPEG EJPEG POISON EVENT */
111 r = amdgpu_irq_add_id(adev, amdgpu_ih_clientid_jpeg[i],
112 VCN_2_6__SRCID_EJPEG0_POISON, &adev->jpeg.inst[i].ras_poison_irq);
113 if (r)
114 return r;
115 }
116
117 r = amdgpu_jpeg_sw_init(adev);
118 if (r)
119 return r;
120
121 r = amdgpu_jpeg_resume(adev);
122 if (r)
123 return r;
124
125 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
126 if (adev->jpeg.harvest_config & (1 << i))
127 continue;
128
129 ring = adev->jpeg.inst[i].ring_dec;
130 ring->use_doorbell = true;
131 if (amdgpu_ip_version(adev, UVD_HWIP, 0) == IP_VERSION(2, 5, 0))
132 ring->vm_hub = AMDGPU_MMHUB1(0);
133 else
134 ring->vm_hub = AMDGPU_MMHUB0(0);
135 ring->doorbell_index = (adev->doorbell_index.vcn.vcn_ring0_1 << 1) + 1 + 8 * i;
136 sprintf(ring->name, "jpeg_dec_%d", i);
137 r = amdgpu_ring_init(adev, ring, 512, &adev->jpeg.inst[i].irq,
138 0, AMDGPU_RING_PRIO_DEFAULT, NULL);
139 if (r)
140 return r;
141
142 adev->jpeg.internal.jpeg_pitch[0] = mmUVD_JPEG_PITCH_INTERNAL_OFFSET;
143 adev->jpeg.inst[i].external.jpeg_pitch[0] = SOC15_REG_OFFSET(JPEG, i, mmUVD_JPEG_PITCH);
144 }
145
146 r = amdgpu_jpeg_ras_sw_init(adev);
147 if (r)
148 return r;
149
150 return 0;
151}
152
153/**
154 * jpeg_v2_5_sw_fini - sw fini for JPEG block
155 *
156 * @handle: amdgpu_device pointer
157 *
158 * JPEG suspend and free up sw allocation
159 */
160static int jpeg_v2_5_sw_fini(void *handle)
161{
162 int r;
163 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
164
165 r = amdgpu_jpeg_suspend(adev);
166 if (r)
167 return r;
168
169 r = amdgpu_jpeg_sw_fini(adev);
170
171 return r;
172}
173
174/**
175 * jpeg_v2_5_hw_init - start and test JPEG block
176 *
177 * @handle: amdgpu_device pointer
178 *
179 */
180static int jpeg_v2_5_hw_init(void *handle)
181{
182 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
183 struct amdgpu_ring *ring;
184 int i, r;
185
186 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
187 if (adev->jpeg.harvest_config & (1 << i))
188 continue;
189
190 ring = adev->jpeg.inst[i].ring_dec;
191 adev->nbio.funcs->vcn_doorbell_range(adev, ring->use_doorbell,
192 (adev->doorbell_index.vcn.vcn_ring0_1 << 1) + 8 * i, i);
193
194 r = amdgpu_ring_test_helper(ring);
195 if (r)
196 return r;
197 }
198
199 DRM_INFO("JPEG decode initialized successfully.\n");
200
201 return 0;
202}
203
204/**
205 * jpeg_v2_5_hw_fini - stop the hardware block
206 *
207 * @handle: amdgpu_device pointer
208 *
209 * Stop the JPEG block, mark ring as not ready any more
210 */
211static int jpeg_v2_5_hw_fini(void *handle)
212{
213 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
214 int i;
215
216 cancel_delayed_work_sync(&adev->vcn.idle_work);
217
218 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
219 if (adev->jpeg.harvest_config & (1 << i))
220 continue;
221
222 if (adev->jpeg.cur_state != AMD_PG_STATE_GATE &&
223 RREG32_SOC15(JPEG, i, mmUVD_JRBC_STATUS))
224 jpeg_v2_5_set_powergating_state(adev, AMD_PG_STATE_GATE);
225
226 if (amdgpu_ras_is_supported(adev, AMDGPU_RAS_BLOCK__JPEG))
227 amdgpu_irq_put(adev, &adev->jpeg.inst[i].ras_poison_irq, 0);
228 }
229
230 return 0;
231}
232
233/**
234 * jpeg_v2_5_suspend - suspend JPEG block
235 *
236 * @handle: amdgpu_device pointer
237 *
238 * HW fini and suspend JPEG block
239 */
240static int jpeg_v2_5_suspend(void *handle)
241{
242 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
243 int r;
244
245 r = jpeg_v2_5_hw_fini(adev);
246 if (r)
247 return r;
248
249 r = amdgpu_jpeg_suspend(adev);
250
251 return r;
252}
253
254/**
255 * jpeg_v2_5_resume - resume JPEG block
256 *
257 * @handle: amdgpu_device pointer
258 *
259 * Resume firmware and hw init JPEG block
260 */
261static int jpeg_v2_5_resume(void *handle)
262{
263 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
264 int r;
265
266 r = amdgpu_jpeg_resume(adev);
267 if (r)
268 return r;
269
270 r = jpeg_v2_5_hw_init(adev);
271
272 return r;
273}
274
275static void jpeg_v2_5_disable_clock_gating(struct amdgpu_device *adev, int inst)
276{
277 uint32_t data;
278
279 data = RREG32_SOC15(JPEG, inst, mmJPEG_CGC_CTRL);
280 if (adev->cg_flags & AMD_CG_SUPPORT_JPEG_MGCG)
281 data |= 1 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
282 else
283 data &= ~JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
284
285 data |= 1 << JPEG_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
286 data |= 4 << JPEG_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
287 WREG32_SOC15(JPEG, inst, mmJPEG_CGC_CTRL, data);
288
289 data = RREG32_SOC15(JPEG, inst, mmJPEG_CGC_GATE);
290 data &= ~(JPEG_CGC_GATE__JPEG_DEC_MASK
291 | JPEG_CGC_GATE__JPEG2_DEC_MASK
292 | JPEG_CGC_GATE__JMCIF_MASK
293 | JPEG_CGC_GATE__JRBBM_MASK);
294 WREG32_SOC15(JPEG, inst, mmJPEG_CGC_GATE, data);
295
296 data = RREG32_SOC15(JPEG, inst, mmJPEG_CGC_CTRL);
297 data &= ~(JPEG_CGC_CTRL__JPEG_DEC_MODE_MASK
298 | JPEG_CGC_CTRL__JPEG2_DEC_MODE_MASK
299 | JPEG_CGC_CTRL__JMCIF_MODE_MASK
300 | JPEG_CGC_CTRL__JRBBM_MODE_MASK);
301 WREG32_SOC15(JPEG, inst, mmJPEG_CGC_CTRL, data);
302}
303
304static void jpeg_v2_5_enable_clock_gating(struct amdgpu_device *adev, int inst)
305{
306 uint32_t data;
307
308 data = RREG32_SOC15(JPEG, inst, mmJPEG_CGC_GATE);
309 data |= (JPEG_CGC_GATE__JPEG_DEC_MASK
310 |JPEG_CGC_GATE__JPEG2_DEC_MASK
311 |JPEG_CGC_GATE__JPEG_ENC_MASK
312 |JPEG_CGC_GATE__JMCIF_MASK
313 |JPEG_CGC_GATE__JRBBM_MASK);
314 WREG32_SOC15(JPEG, inst, mmJPEG_CGC_GATE, data);
315}
316
317/**
318 * jpeg_v2_5_start - start JPEG block
319 *
320 * @adev: amdgpu_device pointer
321 *
322 * Setup and start the JPEG block
323 */
324static int jpeg_v2_5_start(struct amdgpu_device *adev)
325{
326 struct amdgpu_ring *ring;
327 int i;
328
329 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
330 if (adev->jpeg.harvest_config & (1 << i))
331 continue;
332
333 ring = adev->jpeg.inst[i].ring_dec;
334 /* disable anti hang mechanism */
335 WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmUVD_JPEG_POWER_STATUS), 0,
336 ~UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_MASK);
337
338 /* JPEG disable CGC */
339 jpeg_v2_5_disable_clock_gating(adev, i);
340
341 /* MJPEG global tiling registers */
342 WREG32_SOC15(JPEG, i, mmJPEG_DEC_GFX8_ADDR_CONFIG,
343 adev->gfx.config.gb_addr_config);
344 WREG32_SOC15(JPEG, i, mmJPEG_DEC_GFX10_ADDR_CONFIG,
345 adev->gfx.config.gb_addr_config);
346
347 /* enable JMI channel */
348 WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmUVD_JMI_CNTL), 0,
349 ~UVD_JMI_CNTL__SOFT_RESET_MASK);
350
351 /* enable System Interrupt for JRBC */
352 WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmJPEG_SYS_INT_EN),
353 JPEG_SYS_INT_EN__DJRBC_MASK,
354 ~JPEG_SYS_INT_EN__DJRBC_MASK);
355
356 WREG32_SOC15(JPEG, i, mmUVD_LMI_JRBC_RB_VMID, 0);
357 WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_CNTL, (0x00000001L | 0x00000002L));
358 WREG32_SOC15(JPEG, i, mmUVD_LMI_JRBC_RB_64BIT_BAR_LOW,
359 lower_32_bits(ring->gpu_addr));
360 WREG32_SOC15(JPEG, i, mmUVD_LMI_JRBC_RB_64BIT_BAR_HIGH,
361 upper_32_bits(ring->gpu_addr));
362 WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_RPTR, 0);
363 WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_WPTR, 0);
364 WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_CNTL, 0x00000002L);
365 WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_SIZE, ring->ring_size / 4);
366 ring->wptr = RREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_WPTR);
367 }
368
369 return 0;
370}
371
372/**
373 * jpeg_v2_5_stop - stop JPEG block
374 *
375 * @adev: amdgpu_device pointer
376 *
377 * stop the JPEG block
378 */
379static int jpeg_v2_5_stop(struct amdgpu_device *adev)
380{
381 int i;
382
383 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
384 if (adev->jpeg.harvest_config & (1 << i))
385 continue;
386
387 /* reset JMI */
388 WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmUVD_JMI_CNTL),
389 UVD_JMI_CNTL__SOFT_RESET_MASK,
390 ~UVD_JMI_CNTL__SOFT_RESET_MASK);
391
392 jpeg_v2_5_enable_clock_gating(adev, i);
393
394 /* enable anti hang mechanism */
395 WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmUVD_JPEG_POWER_STATUS),
396 UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_MASK,
397 ~UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_MASK);
398 }
399
400 return 0;
401}
402
403/**
404 * jpeg_v2_5_dec_ring_get_rptr - get read pointer
405 *
406 * @ring: amdgpu_ring pointer
407 *
408 * Returns the current hardware read pointer
409 */
410static uint64_t jpeg_v2_5_dec_ring_get_rptr(struct amdgpu_ring *ring)
411{
412 struct amdgpu_device *adev = ring->adev;
413
414 return RREG32_SOC15(JPEG, ring->me, mmUVD_JRBC_RB_RPTR);
415}
416
417/**
418 * jpeg_v2_5_dec_ring_get_wptr - get write pointer
419 *
420 * @ring: amdgpu_ring pointer
421 *
422 * Returns the current hardware write pointer
423 */
424static uint64_t jpeg_v2_5_dec_ring_get_wptr(struct amdgpu_ring *ring)
425{
426 struct amdgpu_device *adev = ring->adev;
427
428 if (ring->use_doorbell)
429 return *ring->wptr_cpu_addr;
430 else
431 return RREG32_SOC15(JPEG, ring->me, mmUVD_JRBC_RB_WPTR);
432}
433
434/**
435 * jpeg_v2_5_dec_ring_set_wptr - set write pointer
436 *
437 * @ring: amdgpu_ring pointer
438 *
439 * Commits the write pointer to the hardware
440 */
441static void jpeg_v2_5_dec_ring_set_wptr(struct amdgpu_ring *ring)
442{
443 struct amdgpu_device *adev = ring->adev;
444
445 if (ring->use_doorbell) {
446 *ring->wptr_cpu_addr = lower_32_bits(ring->wptr);
447 WDOORBELL32(ring->doorbell_index, lower_32_bits(ring->wptr));
448 } else {
449 WREG32_SOC15(JPEG, ring->me, mmUVD_JRBC_RB_WPTR, lower_32_bits(ring->wptr));
450 }
451}
452
453/**
454 * jpeg_v2_6_dec_ring_insert_start - insert a start command
455 *
456 * @ring: amdgpu_ring pointer
457 *
458 * Write a start command to the ring.
459 */
460static void jpeg_v2_6_dec_ring_insert_start(struct amdgpu_ring *ring)
461{
462 amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
463 0, 0, PACKETJ_TYPE0));
464 amdgpu_ring_write(ring, 0x6aa04); /* PCTL0_MMHUB_DEEPSLEEP_IB */
465
466 amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
467 0, 0, PACKETJ_TYPE0));
468 amdgpu_ring_write(ring, 0x80000000 | (1 << (ring->me * 2 + 14)));
469}
470
471/**
472 * jpeg_v2_6_dec_ring_insert_end - insert a end command
473 *
474 * @ring: amdgpu_ring pointer
475 *
476 * Write a end command to the ring.
477 */
478static void jpeg_v2_6_dec_ring_insert_end(struct amdgpu_ring *ring)
479{
480 amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
481 0, 0, PACKETJ_TYPE0));
482 amdgpu_ring_write(ring, 0x6aa04); /* PCTL0_MMHUB_DEEPSLEEP_IB */
483
484 amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
485 0, 0, PACKETJ_TYPE0));
486 amdgpu_ring_write(ring, (1 << (ring->me * 2 + 14)));
487}
488
489static bool jpeg_v2_5_is_idle(void *handle)
490{
491 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
492 int i, ret = 1;
493
494 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
495 if (adev->jpeg.harvest_config & (1 << i))
496 continue;
497
498 ret &= (((RREG32_SOC15(JPEG, i, mmUVD_JRBC_STATUS) &
499 UVD_JRBC_STATUS__RB_JOB_DONE_MASK) ==
500 UVD_JRBC_STATUS__RB_JOB_DONE_MASK));
501 }
502
503 return ret;
504}
505
506static int jpeg_v2_5_wait_for_idle(void *handle)
507{
508 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
509 int i, ret;
510
511 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
512 if (adev->jpeg.harvest_config & (1 << i))
513 continue;
514
515 ret = SOC15_WAIT_ON_RREG(JPEG, i, mmUVD_JRBC_STATUS,
516 UVD_JRBC_STATUS__RB_JOB_DONE_MASK,
517 UVD_JRBC_STATUS__RB_JOB_DONE_MASK);
518 if (ret)
519 return ret;
520 }
521
522 return 0;
523}
524
525static int jpeg_v2_5_set_clockgating_state(void *handle,
526 enum amd_clockgating_state state)
527{
528 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
529 bool enable = (state == AMD_CG_STATE_GATE);
530 int i;
531
532 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
533 if (adev->jpeg.harvest_config & (1 << i))
534 continue;
535
536 if (enable) {
537 if (!jpeg_v2_5_is_idle(handle))
538 return -EBUSY;
539 jpeg_v2_5_enable_clock_gating(adev, i);
540 } else {
541 jpeg_v2_5_disable_clock_gating(adev, i);
542 }
543 }
544
545 return 0;
546}
547
548static int jpeg_v2_5_set_powergating_state(void *handle,
549 enum amd_powergating_state state)
550{
551 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
552 int ret;
553
554 if (state == adev->jpeg.cur_state)
555 return 0;
556
557 if (state == AMD_PG_STATE_GATE)
558 ret = jpeg_v2_5_stop(adev);
559 else
560 ret = jpeg_v2_5_start(adev);
561
562 if (!ret)
563 adev->jpeg.cur_state = state;
564
565 return ret;
566}
567
568static int jpeg_v2_5_set_interrupt_state(struct amdgpu_device *adev,
569 struct amdgpu_irq_src *source,
570 unsigned type,
571 enum amdgpu_interrupt_state state)
572{
573 return 0;
574}
575
576static int jpeg_v2_6_set_ras_interrupt_state(struct amdgpu_device *adev,
577 struct amdgpu_irq_src *source,
578 unsigned int type,
579 enum amdgpu_interrupt_state state)
580{
581 return 0;
582}
583
584static int jpeg_v2_5_process_interrupt(struct amdgpu_device *adev,
585 struct amdgpu_irq_src *source,
586 struct amdgpu_iv_entry *entry)
587{
588 uint32_t ip_instance;
589
590 switch (entry->client_id) {
591 case SOC15_IH_CLIENTID_VCN:
592 ip_instance = 0;
593 break;
594 case SOC15_IH_CLIENTID_VCN1:
595 ip_instance = 1;
596 break;
597 default:
598 DRM_ERROR("Unhandled client id: %d\n", entry->client_id);
599 return 0;
600 }
601
602 DRM_DEBUG("IH: JPEG TRAP\n");
603
604 switch (entry->src_id) {
605 case VCN_2_0__SRCID__JPEG_DECODE:
606 amdgpu_fence_process(adev->jpeg.inst[ip_instance].ring_dec);
607 break;
608 default:
609 DRM_ERROR("Unhandled interrupt: %d %d\n",
610 entry->src_id, entry->src_data[0]);
611 break;
612 }
613
614 return 0;
615}
616
617static const struct amd_ip_funcs jpeg_v2_5_ip_funcs = {
618 .name = "jpeg_v2_5",
619 .early_init = jpeg_v2_5_early_init,
620 .late_init = NULL,
621 .sw_init = jpeg_v2_5_sw_init,
622 .sw_fini = jpeg_v2_5_sw_fini,
623 .hw_init = jpeg_v2_5_hw_init,
624 .hw_fini = jpeg_v2_5_hw_fini,
625 .suspend = jpeg_v2_5_suspend,
626 .resume = jpeg_v2_5_resume,
627 .is_idle = jpeg_v2_5_is_idle,
628 .wait_for_idle = jpeg_v2_5_wait_for_idle,
629 .check_soft_reset = NULL,
630 .pre_soft_reset = NULL,
631 .soft_reset = NULL,
632 .post_soft_reset = NULL,
633 .set_clockgating_state = jpeg_v2_5_set_clockgating_state,
634 .set_powergating_state = jpeg_v2_5_set_powergating_state,
635};
636
637static const struct amd_ip_funcs jpeg_v2_6_ip_funcs = {
638 .name = "jpeg_v2_6",
639 .early_init = jpeg_v2_5_early_init,
640 .late_init = NULL,
641 .sw_init = jpeg_v2_5_sw_init,
642 .sw_fini = jpeg_v2_5_sw_fini,
643 .hw_init = jpeg_v2_5_hw_init,
644 .hw_fini = jpeg_v2_5_hw_fini,
645 .suspend = jpeg_v2_5_suspend,
646 .resume = jpeg_v2_5_resume,
647 .is_idle = jpeg_v2_5_is_idle,
648 .wait_for_idle = jpeg_v2_5_wait_for_idle,
649 .check_soft_reset = NULL,
650 .pre_soft_reset = NULL,
651 .soft_reset = NULL,
652 .post_soft_reset = NULL,
653 .set_clockgating_state = jpeg_v2_5_set_clockgating_state,
654 .set_powergating_state = jpeg_v2_5_set_powergating_state,
655};
656
657static const struct amdgpu_ring_funcs jpeg_v2_5_dec_ring_vm_funcs = {
658 .type = AMDGPU_RING_TYPE_VCN_JPEG,
659 .align_mask = 0xf,
660 .get_rptr = jpeg_v2_5_dec_ring_get_rptr,
661 .get_wptr = jpeg_v2_5_dec_ring_get_wptr,
662 .set_wptr = jpeg_v2_5_dec_ring_set_wptr,
663 .emit_frame_size =
664 SOC15_FLUSH_GPU_TLB_NUM_WREG * 6 +
665 SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 8 +
666 8 + /* jpeg_v2_5_dec_ring_emit_vm_flush */
667 18 + 18 + /* jpeg_v2_5_dec_ring_emit_fence x2 vm fence */
668 8 + 16,
669 .emit_ib_size = 22, /* jpeg_v2_5_dec_ring_emit_ib */
670 .emit_ib = jpeg_v2_0_dec_ring_emit_ib,
671 .emit_fence = jpeg_v2_0_dec_ring_emit_fence,
672 .emit_vm_flush = jpeg_v2_0_dec_ring_emit_vm_flush,
673 .test_ring = amdgpu_jpeg_dec_ring_test_ring,
674 .test_ib = amdgpu_jpeg_dec_ring_test_ib,
675 .insert_nop = jpeg_v2_0_dec_ring_nop,
676 .insert_start = jpeg_v2_0_dec_ring_insert_start,
677 .insert_end = jpeg_v2_0_dec_ring_insert_end,
678 .pad_ib = amdgpu_ring_generic_pad_ib,
679 .begin_use = amdgpu_jpeg_ring_begin_use,
680 .end_use = amdgpu_jpeg_ring_end_use,
681 .emit_wreg = jpeg_v2_0_dec_ring_emit_wreg,
682 .emit_reg_wait = jpeg_v2_0_dec_ring_emit_reg_wait,
683 .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
684};
685
686static const struct amdgpu_ring_funcs jpeg_v2_6_dec_ring_vm_funcs = {
687 .type = AMDGPU_RING_TYPE_VCN_JPEG,
688 .align_mask = 0xf,
689 .get_rptr = jpeg_v2_5_dec_ring_get_rptr,
690 .get_wptr = jpeg_v2_5_dec_ring_get_wptr,
691 .set_wptr = jpeg_v2_5_dec_ring_set_wptr,
692 .emit_frame_size =
693 SOC15_FLUSH_GPU_TLB_NUM_WREG * 6 +
694 SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 8 +
695 8 + /* jpeg_v2_5_dec_ring_emit_vm_flush */
696 18 + 18 + /* jpeg_v2_5_dec_ring_emit_fence x2 vm fence */
697 8 + 16,
698 .emit_ib_size = 22, /* jpeg_v2_5_dec_ring_emit_ib */
699 .emit_ib = jpeg_v2_0_dec_ring_emit_ib,
700 .emit_fence = jpeg_v2_0_dec_ring_emit_fence,
701 .emit_vm_flush = jpeg_v2_0_dec_ring_emit_vm_flush,
702 .test_ring = amdgpu_jpeg_dec_ring_test_ring,
703 .test_ib = amdgpu_jpeg_dec_ring_test_ib,
704 .insert_nop = jpeg_v2_0_dec_ring_nop,
705 .insert_start = jpeg_v2_6_dec_ring_insert_start,
706 .insert_end = jpeg_v2_6_dec_ring_insert_end,
707 .pad_ib = amdgpu_ring_generic_pad_ib,
708 .begin_use = amdgpu_jpeg_ring_begin_use,
709 .end_use = amdgpu_jpeg_ring_end_use,
710 .emit_wreg = jpeg_v2_0_dec_ring_emit_wreg,
711 .emit_reg_wait = jpeg_v2_0_dec_ring_emit_reg_wait,
712 .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
713};
714
715static void jpeg_v2_5_set_dec_ring_funcs(struct amdgpu_device *adev)
716{
717 int i;
718
719 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
720 if (adev->jpeg.harvest_config & (1 << i))
721 continue;
722 if (adev->asic_type == CHIP_ARCTURUS)
723 adev->jpeg.inst[i].ring_dec->funcs = &jpeg_v2_5_dec_ring_vm_funcs;
724 else /* CHIP_ALDEBARAN */
725 adev->jpeg.inst[i].ring_dec->funcs = &jpeg_v2_6_dec_ring_vm_funcs;
726 adev->jpeg.inst[i].ring_dec->me = i;
727 DRM_INFO("JPEG(%d) JPEG decode is enabled in VM mode\n", i);
728 }
729}
730
731static const struct amdgpu_irq_src_funcs jpeg_v2_5_irq_funcs = {
732 .set = jpeg_v2_5_set_interrupt_state,
733 .process = jpeg_v2_5_process_interrupt,
734};
735
736static const struct amdgpu_irq_src_funcs jpeg_v2_6_ras_irq_funcs = {
737 .set = jpeg_v2_6_set_ras_interrupt_state,
738 .process = amdgpu_jpeg_process_poison_irq,
739};
740
741static void jpeg_v2_5_set_irq_funcs(struct amdgpu_device *adev)
742{
743 int i;
744
745 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
746 if (adev->jpeg.harvest_config & (1 << i))
747 continue;
748
749 adev->jpeg.inst[i].irq.num_types = 1;
750 adev->jpeg.inst[i].irq.funcs = &jpeg_v2_5_irq_funcs;
751
752 adev->jpeg.inst[i].ras_poison_irq.num_types = 1;
753 adev->jpeg.inst[i].ras_poison_irq.funcs = &jpeg_v2_6_ras_irq_funcs;
754 }
755}
756
757const struct amdgpu_ip_block_version jpeg_v2_5_ip_block = {
758 .type = AMD_IP_BLOCK_TYPE_JPEG,
759 .major = 2,
760 .minor = 5,
761 .rev = 0,
762 .funcs = &jpeg_v2_5_ip_funcs,
763};
764
765const struct amdgpu_ip_block_version jpeg_v2_6_ip_block = {
766 .type = AMD_IP_BLOCK_TYPE_JPEG,
767 .major = 2,
768 .minor = 6,
769 .rev = 0,
770 .funcs = &jpeg_v2_6_ip_funcs,
771};
772
773static uint32_t jpeg_v2_6_query_poison_by_instance(struct amdgpu_device *adev,
774 uint32_t instance, uint32_t sub_block)
775{
776 uint32_t poison_stat = 0, reg_value = 0;
777
778 switch (sub_block) {
779 case AMDGPU_JPEG_V2_6_JPEG0:
780 reg_value = RREG32_SOC15(JPEG, instance, mmUVD_RAS_JPEG0_STATUS);
781 poison_stat = REG_GET_FIELD(reg_value, UVD_RAS_JPEG0_STATUS, POISONED_PF);
782 break;
783 case AMDGPU_JPEG_V2_6_JPEG1:
784 reg_value = RREG32_SOC15(JPEG, instance, mmUVD_RAS_JPEG1_STATUS);
785 poison_stat = REG_GET_FIELD(reg_value, UVD_RAS_JPEG1_STATUS, POISONED_PF);
786 break;
787 default:
788 break;
789 }
790
791 if (poison_stat)
792 dev_info(adev->dev, "Poison detected in JPEG%d sub_block%d\n",
793 instance, sub_block);
794
795 return poison_stat;
796}
797
798static bool jpeg_v2_6_query_ras_poison_status(struct amdgpu_device *adev)
799{
800 uint32_t inst = 0, sub = 0, poison_stat = 0;
801
802 for (inst = 0; inst < adev->jpeg.num_jpeg_inst; inst++)
803 for (sub = 0; sub < AMDGPU_JPEG_V2_6_MAX_SUB_BLOCK; sub++)
804 poison_stat +=
805 jpeg_v2_6_query_poison_by_instance(adev, inst, sub);
806
807 return !!poison_stat;
808}
809
810const struct amdgpu_ras_block_hw_ops jpeg_v2_6_ras_hw_ops = {
811 .query_poison_status = jpeg_v2_6_query_ras_poison_status,
812};
813
814static struct amdgpu_jpeg_ras jpeg_v2_6_ras = {
815 .ras_block = {
816 .hw_ops = &jpeg_v2_6_ras_hw_ops,
817 .ras_late_init = amdgpu_jpeg_ras_late_init,
818 },
819};
820
821static void jpeg_v2_5_set_ras_funcs(struct amdgpu_device *adev)
822{
823 switch (amdgpu_ip_version(adev, JPEG_HWIP, 0)) {
824 case IP_VERSION(2, 6, 0):
825 adev->jpeg.ras = &jpeg_v2_6_ras;
826 break;
827 default:
828 break;
829 }
830}
1/*
2 * Copyright 2019 Advanced Micro Devices, Inc.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
21 *
22 */
23
24#include "amdgpu.h"
25#include "amdgpu_jpeg.h"
26#include "soc15.h"
27#include "soc15d.h"
28#include "jpeg_v2_0.h"
29#include "jpeg_v2_5.h"
30
31#include "vcn/vcn_2_5_offset.h"
32#include "vcn/vcn_2_5_sh_mask.h"
33#include "ivsrcid/vcn/irqsrcs_vcn_2_0.h"
34
35#define mmUVD_JPEG_PITCH_INTERNAL_OFFSET 0x401f
36
37#define JPEG25_MAX_HW_INSTANCES_ARCTURUS 2
38
39static void jpeg_v2_5_set_dec_ring_funcs(struct amdgpu_device *adev);
40static void jpeg_v2_5_set_irq_funcs(struct amdgpu_device *adev);
41static int jpeg_v2_5_set_powergating_state(void *handle,
42 enum amd_powergating_state state);
43static void jpeg_v2_5_set_ras_funcs(struct amdgpu_device *adev);
44
45static int amdgpu_ih_clientid_jpeg[] = {
46 SOC15_IH_CLIENTID_VCN,
47 SOC15_IH_CLIENTID_VCN1
48};
49
50/**
51 * jpeg_v2_5_early_init - set function pointers
52 *
53 * @ip_block: Pointer to the amdgpu_ip_block for this hw instance.
54 *
55 * Set ring and irq function pointers
56 */
57static int jpeg_v2_5_early_init(struct amdgpu_ip_block *ip_block)
58{
59 struct amdgpu_device *adev = ip_block->adev;
60 u32 harvest;
61 int i;
62
63 adev->jpeg.num_jpeg_rings = 1;
64 adev->jpeg.num_jpeg_inst = JPEG25_MAX_HW_INSTANCES_ARCTURUS;
65 for (i = 0; i < adev->jpeg.num_jpeg_inst; i++) {
66 harvest = RREG32_SOC15(JPEG, i, mmCC_UVD_HARVESTING);
67 if (harvest & CC_UVD_HARVESTING__UVD_DISABLE_MASK)
68 adev->jpeg.harvest_config |= 1 << i;
69 }
70 if (adev->jpeg.harvest_config == (AMDGPU_JPEG_HARVEST_JPEG0 |
71 AMDGPU_JPEG_HARVEST_JPEG1))
72 return -ENOENT;
73
74 jpeg_v2_5_set_dec_ring_funcs(adev);
75 jpeg_v2_5_set_irq_funcs(adev);
76 jpeg_v2_5_set_ras_funcs(adev);
77
78 return 0;
79}
80
81/**
82 * jpeg_v2_5_sw_init - sw init for JPEG block
83 *
84 * @ip_block: Pointer to the amdgpu_ip_block for this hw instance.
85 *
86 * Load firmware and sw initialization
87 */
88static int jpeg_v2_5_sw_init(struct amdgpu_ip_block *ip_block)
89{
90 struct amdgpu_ring *ring;
91 int i, r;
92 struct amdgpu_device *adev = ip_block->adev;
93
94 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
95 if (adev->jpeg.harvest_config & (1 << i))
96 continue;
97
98 /* JPEG TRAP */
99 r = amdgpu_irq_add_id(adev, amdgpu_ih_clientid_jpeg[i],
100 VCN_2_0__SRCID__JPEG_DECODE, &adev->jpeg.inst[i].irq);
101 if (r)
102 return r;
103
104 /* JPEG DJPEG POISON EVENT */
105 r = amdgpu_irq_add_id(adev, amdgpu_ih_clientid_jpeg[i],
106 VCN_2_6__SRCID_DJPEG0_POISON, &adev->jpeg.inst[i].ras_poison_irq);
107 if (r)
108 return r;
109
110 /* JPEG EJPEG POISON EVENT */
111 r = amdgpu_irq_add_id(adev, amdgpu_ih_clientid_jpeg[i],
112 VCN_2_6__SRCID_EJPEG0_POISON, &adev->jpeg.inst[i].ras_poison_irq);
113 if (r)
114 return r;
115 }
116
117 r = amdgpu_jpeg_sw_init(adev);
118 if (r)
119 return r;
120
121 r = amdgpu_jpeg_resume(adev);
122 if (r)
123 return r;
124
125 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
126 if (adev->jpeg.harvest_config & (1 << i))
127 continue;
128
129 ring = adev->jpeg.inst[i].ring_dec;
130 ring->use_doorbell = true;
131 if (amdgpu_ip_version(adev, UVD_HWIP, 0) == IP_VERSION(2, 5, 0))
132 ring->vm_hub = AMDGPU_MMHUB1(0);
133 else
134 ring->vm_hub = AMDGPU_MMHUB0(0);
135 ring->doorbell_index = (adev->doorbell_index.vcn.vcn_ring0_1 << 1) + 1 + 8 * i;
136 sprintf(ring->name, "jpeg_dec_%d", i);
137 r = amdgpu_ring_init(adev, ring, 512, &adev->jpeg.inst[i].irq,
138 0, AMDGPU_RING_PRIO_DEFAULT, NULL);
139 if (r)
140 return r;
141
142 adev->jpeg.internal.jpeg_pitch[0] = mmUVD_JPEG_PITCH_INTERNAL_OFFSET;
143 adev->jpeg.inst[i].external.jpeg_pitch[0] = SOC15_REG_OFFSET(JPEG, i, mmUVD_JPEG_PITCH);
144 }
145
146 r = amdgpu_jpeg_ras_sw_init(adev);
147 if (r)
148 return r;
149
150 return 0;
151}
152
153/**
154 * jpeg_v2_5_sw_fini - sw fini for JPEG block
155 *
156 * @ip_block: Pointer to the amdgpu_ip_block for this hw instance.
157 *
158 * JPEG suspend and free up sw allocation
159 */
160static int jpeg_v2_5_sw_fini(struct amdgpu_ip_block *ip_block)
161{
162 int r;
163 struct amdgpu_device *adev = ip_block->adev;
164
165 r = amdgpu_jpeg_suspend(adev);
166 if (r)
167 return r;
168
169 r = amdgpu_jpeg_sw_fini(adev);
170
171 return r;
172}
173
174/**
175 * jpeg_v2_5_hw_init - start and test JPEG block
176 *
177 * @ip_block: Pointer to the amdgpu_ip_block for this hw instance.
178 *
179 */
180static int jpeg_v2_5_hw_init(struct amdgpu_ip_block *ip_block)
181{
182 struct amdgpu_device *adev = ip_block->adev;
183 struct amdgpu_ring *ring;
184 int i, r;
185
186 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
187 if (adev->jpeg.harvest_config & (1 << i))
188 continue;
189
190 ring = adev->jpeg.inst[i].ring_dec;
191 adev->nbio.funcs->vcn_doorbell_range(adev, ring->use_doorbell,
192 (adev->doorbell_index.vcn.vcn_ring0_1 << 1) + 8 * i, i);
193
194 r = amdgpu_ring_test_helper(ring);
195 if (r)
196 return r;
197 }
198
199 return 0;
200}
201
202/**
203 * jpeg_v2_5_hw_fini - stop the hardware block
204 *
205 * @ip_block: Pointer to the amdgpu_ip_block for this hw instance.
206 *
207 * Stop the JPEG block, mark ring as not ready any more
208 */
209static int jpeg_v2_5_hw_fini(struct amdgpu_ip_block *ip_block)
210{
211 struct amdgpu_device *adev = ip_block->adev;
212 int i;
213
214 cancel_delayed_work_sync(&adev->jpeg.idle_work);
215
216 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
217 if (adev->jpeg.harvest_config & (1 << i))
218 continue;
219
220 if (adev->jpeg.cur_state != AMD_PG_STATE_GATE &&
221 RREG32_SOC15(JPEG, i, mmUVD_JRBC_STATUS))
222 jpeg_v2_5_set_powergating_state(adev, AMD_PG_STATE_GATE);
223
224 if (amdgpu_ras_is_supported(adev, AMDGPU_RAS_BLOCK__JPEG))
225 amdgpu_irq_put(adev, &adev->jpeg.inst[i].ras_poison_irq, 0);
226 }
227
228 return 0;
229}
230
231/**
232 * jpeg_v2_5_suspend - suspend JPEG block
233 *
234 * @ip_block: Pointer to the amdgpu_ip_block for this hw instance.
235 *
236 * HW fini and suspend JPEG block
237 */
238static int jpeg_v2_5_suspend(struct amdgpu_ip_block *ip_block)
239{
240 int r;
241
242 r = jpeg_v2_5_hw_fini(ip_block);
243 if (r)
244 return r;
245
246 r = amdgpu_jpeg_suspend(ip_block->adev);
247
248 return r;
249}
250
251/**
252 * jpeg_v2_5_resume - resume JPEG block
253 *
254 * @ip_block: Pointer to the amdgpu_ip_block for this hw instance.
255 *
256 * Resume firmware and hw init JPEG block
257 */
258static int jpeg_v2_5_resume(struct amdgpu_ip_block *ip_block)
259{
260 int r;
261
262 r = amdgpu_jpeg_resume(ip_block->adev);
263 if (r)
264 return r;
265
266 r = jpeg_v2_5_hw_init(ip_block);
267
268 return r;
269}
270
271static void jpeg_v2_5_disable_clock_gating(struct amdgpu_device *adev, int inst)
272{
273 uint32_t data;
274
275 data = RREG32_SOC15(JPEG, inst, mmJPEG_CGC_CTRL);
276 if (adev->cg_flags & AMD_CG_SUPPORT_JPEG_MGCG)
277 data |= 1 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
278 else
279 data &= ~JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
280
281 data |= 1 << JPEG_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
282 data |= 4 << JPEG_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
283 WREG32_SOC15(JPEG, inst, mmJPEG_CGC_CTRL, data);
284
285 data = RREG32_SOC15(JPEG, inst, mmJPEG_CGC_GATE);
286 data &= ~(JPEG_CGC_GATE__JPEG_DEC_MASK
287 | JPEG_CGC_GATE__JPEG2_DEC_MASK
288 | JPEG_CGC_GATE__JMCIF_MASK
289 | JPEG_CGC_GATE__JRBBM_MASK);
290 WREG32_SOC15(JPEG, inst, mmJPEG_CGC_GATE, data);
291
292 data = RREG32_SOC15(JPEG, inst, mmJPEG_CGC_CTRL);
293 data &= ~(JPEG_CGC_CTRL__JPEG_DEC_MODE_MASK
294 | JPEG_CGC_CTRL__JPEG2_DEC_MODE_MASK
295 | JPEG_CGC_CTRL__JMCIF_MODE_MASK
296 | JPEG_CGC_CTRL__JRBBM_MODE_MASK);
297 WREG32_SOC15(JPEG, inst, mmJPEG_CGC_CTRL, data);
298}
299
300static void jpeg_v2_5_enable_clock_gating(struct amdgpu_device *adev, int inst)
301{
302 uint32_t data;
303
304 data = RREG32_SOC15(JPEG, inst, mmJPEG_CGC_GATE);
305 data |= (JPEG_CGC_GATE__JPEG_DEC_MASK
306 |JPEG_CGC_GATE__JPEG2_DEC_MASK
307 |JPEG_CGC_GATE__JPEG_ENC_MASK
308 |JPEG_CGC_GATE__JMCIF_MASK
309 |JPEG_CGC_GATE__JRBBM_MASK);
310 WREG32_SOC15(JPEG, inst, mmJPEG_CGC_GATE, data);
311}
312
313/**
314 * jpeg_v2_5_start - start JPEG block
315 *
316 * @adev: amdgpu_device pointer
317 *
318 * Setup and start the JPEG block
319 */
320static int jpeg_v2_5_start(struct amdgpu_device *adev)
321{
322 struct amdgpu_ring *ring;
323 int i;
324
325 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
326 if (adev->jpeg.harvest_config & (1 << i))
327 continue;
328
329 ring = adev->jpeg.inst[i].ring_dec;
330 /* disable anti hang mechanism */
331 WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmUVD_JPEG_POWER_STATUS), 0,
332 ~UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_MASK);
333
334 /* JPEG disable CGC */
335 jpeg_v2_5_disable_clock_gating(adev, i);
336
337 /* MJPEG global tiling registers */
338 WREG32_SOC15(JPEG, i, mmJPEG_DEC_GFX8_ADDR_CONFIG,
339 adev->gfx.config.gb_addr_config);
340 WREG32_SOC15(JPEG, i, mmJPEG_DEC_GFX10_ADDR_CONFIG,
341 adev->gfx.config.gb_addr_config);
342
343 /* enable JMI channel */
344 WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmUVD_JMI_CNTL), 0,
345 ~UVD_JMI_CNTL__SOFT_RESET_MASK);
346
347 /* enable System Interrupt for JRBC */
348 WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmJPEG_SYS_INT_EN),
349 JPEG_SYS_INT_EN__DJRBC_MASK,
350 ~JPEG_SYS_INT_EN__DJRBC_MASK);
351
352 WREG32_SOC15(JPEG, i, mmUVD_LMI_JRBC_RB_VMID, 0);
353 WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_CNTL, (0x00000001L | 0x00000002L));
354 WREG32_SOC15(JPEG, i, mmUVD_LMI_JRBC_RB_64BIT_BAR_LOW,
355 lower_32_bits(ring->gpu_addr));
356 WREG32_SOC15(JPEG, i, mmUVD_LMI_JRBC_RB_64BIT_BAR_HIGH,
357 upper_32_bits(ring->gpu_addr));
358 WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_RPTR, 0);
359 WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_WPTR, 0);
360 WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_CNTL, 0x00000002L);
361 WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_SIZE, ring->ring_size / 4);
362 ring->wptr = RREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_WPTR);
363 }
364
365 return 0;
366}
367
368/**
369 * jpeg_v2_5_stop - stop JPEG block
370 *
371 * @adev: amdgpu_device pointer
372 *
373 * stop the JPEG block
374 */
375static int jpeg_v2_5_stop(struct amdgpu_device *adev)
376{
377 int i;
378
379 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
380 if (adev->jpeg.harvest_config & (1 << i))
381 continue;
382
383 /* reset JMI */
384 WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmUVD_JMI_CNTL),
385 UVD_JMI_CNTL__SOFT_RESET_MASK,
386 ~UVD_JMI_CNTL__SOFT_RESET_MASK);
387
388 jpeg_v2_5_enable_clock_gating(adev, i);
389
390 /* enable anti hang mechanism */
391 WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmUVD_JPEG_POWER_STATUS),
392 UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_MASK,
393 ~UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_MASK);
394 }
395
396 return 0;
397}
398
399/**
400 * jpeg_v2_5_dec_ring_get_rptr - get read pointer
401 *
402 * @ring: amdgpu_ring pointer
403 *
404 * Returns the current hardware read pointer
405 */
406static uint64_t jpeg_v2_5_dec_ring_get_rptr(struct amdgpu_ring *ring)
407{
408 struct amdgpu_device *adev = ring->adev;
409
410 return RREG32_SOC15(JPEG, ring->me, mmUVD_JRBC_RB_RPTR);
411}
412
413/**
414 * jpeg_v2_5_dec_ring_get_wptr - get write pointer
415 *
416 * @ring: amdgpu_ring pointer
417 *
418 * Returns the current hardware write pointer
419 */
420static uint64_t jpeg_v2_5_dec_ring_get_wptr(struct amdgpu_ring *ring)
421{
422 struct amdgpu_device *adev = ring->adev;
423
424 if (ring->use_doorbell)
425 return *ring->wptr_cpu_addr;
426 else
427 return RREG32_SOC15(JPEG, ring->me, mmUVD_JRBC_RB_WPTR);
428}
429
430/**
431 * jpeg_v2_5_dec_ring_set_wptr - set write pointer
432 *
433 * @ring: amdgpu_ring pointer
434 *
435 * Commits the write pointer to the hardware
436 */
437static void jpeg_v2_5_dec_ring_set_wptr(struct amdgpu_ring *ring)
438{
439 struct amdgpu_device *adev = ring->adev;
440
441 if (ring->use_doorbell) {
442 *ring->wptr_cpu_addr = lower_32_bits(ring->wptr);
443 WDOORBELL32(ring->doorbell_index, lower_32_bits(ring->wptr));
444 } else {
445 WREG32_SOC15(JPEG, ring->me, mmUVD_JRBC_RB_WPTR, lower_32_bits(ring->wptr));
446 }
447}
448
449/**
450 * jpeg_v2_6_dec_ring_insert_start - insert a start command
451 *
452 * @ring: amdgpu_ring pointer
453 *
454 * Write a start command to the ring.
455 */
456static void jpeg_v2_6_dec_ring_insert_start(struct amdgpu_ring *ring)
457{
458 amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
459 0, 0, PACKETJ_TYPE0));
460 amdgpu_ring_write(ring, 0x6aa04); /* PCTL0_MMHUB_DEEPSLEEP_IB */
461
462 amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
463 0, 0, PACKETJ_TYPE0));
464 amdgpu_ring_write(ring, 0x80000000 | (1 << (ring->me * 2 + 14)));
465}
466
467/**
468 * jpeg_v2_6_dec_ring_insert_end - insert a end command
469 *
470 * @ring: amdgpu_ring pointer
471 *
472 * Write a end command to the ring.
473 */
474static void jpeg_v2_6_dec_ring_insert_end(struct amdgpu_ring *ring)
475{
476 amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
477 0, 0, PACKETJ_TYPE0));
478 amdgpu_ring_write(ring, 0x6aa04); /* PCTL0_MMHUB_DEEPSLEEP_IB */
479
480 amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
481 0, 0, PACKETJ_TYPE0));
482 amdgpu_ring_write(ring, (1 << (ring->me * 2 + 14)));
483}
484
485static bool jpeg_v2_5_is_idle(void *handle)
486{
487 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
488 int i, ret = 1;
489
490 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
491 if (adev->jpeg.harvest_config & (1 << i))
492 continue;
493
494 ret &= (((RREG32_SOC15(JPEG, i, mmUVD_JRBC_STATUS) &
495 UVD_JRBC_STATUS__RB_JOB_DONE_MASK) ==
496 UVD_JRBC_STATUS__RB_JOB_DONE_MASK));
497 }
498
499 return ret;
500}
501
502static int jpeg_v2_5_wait_for_idle(struct amdgpu_ip_block *ip_block)
503{
504 struct amdgpu_device *adev = ip_block->adev;
505 int i, ret;
506
507 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
508 if (adev->jpeg.harvest_config & (1 << i))
509 continue;
510
511 ret = SOC15_WAIT_ON_RREG(JPEG, i, mmUVD_JRBC_STATUS,
512 UVD_JRBC_STATUS__RB_JOB_DONE_MASK,
513 UVD_JRBC_STATUS__RB_JOB_DONE_MASK);
514 if (ret)
515 return ret;
516 }
517
518 return 0;
519}
520
521static int jpeg_v2_5_set_clockgating_state(void *handle,
522 enum amd_clockgating_state state)
523{
524 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
525 bool enable = (state == AMD_CG_STATE_GATE);
526 int i;
527
528 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
529 if (adev->jpeg.harvest_config & (1 << i))
530 continue;
531
532 if (enable) {
533 if (!jpeg_v2_5_is_idle(handle))
534 return -EBUSY;
535 jpeg_v2_5_enable_clock_gating(adev, i);
536 } else {
537 jpeg_v2_5_disable_clock_gating(adev, i);
538 }
539 }
540
541 return 0;
542}
543
544static int jpeg_v2_5_set_powergating_state(void *handle,
545 enum amd_powergating_state state)
546{
547 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
548 int ret;
549
550 if (state == adev->jpeg.cur_state)
551 return 0;
552
553 if (state == AMD_PG_STATE_GATE)
554 ret = jpeg_v2_5_stop(adev);
555 else
556 ret = jpeg_v2_5_start(adev);
557
558 if (!ret)
559 adev->jpeg.cur_state = state;
560
561 return ret;
562}
563
564static int jpeg_v2_5_set_interrupt_state(struct amdgpu_device *adev,
565 struct amdgpu_irq_src *source,
566 unsigned type,
567 enum amdgpu_interrupt_state state)
568{
569 return 0;
570}
571
572static int jpeg_v2_6_set_ras_interrupt_state(struct amdgpu_device *adev,
573 struct amdgpu_irq_src *source,
574 unsigned int type,
575 enum amdgpu_interrupt_state state)
576{
577 return 0;
578}
579
580static int jpeg_v2_5_process_interrupt(struct amdgpu_device *adev,
581 struct amdgpu_irq_src *source,
582 struct amdgpu_iv_entry *entry)
583{
584 uint32_t ip_instance;
585
586 switch (entry->client_id) {
587 case SOC15_IH_CLIENTID_VCN:
588 ip_instance = 0;
589 break;
590 case SOC15_IH_CLIENTID_VCN1:
591 ip_instance = 1;
592 break;
593 default:
594 DRM_ERROR("Unhandled client id: %d\n", entry->client_id);
595 return 0;
596 }
597
598 DRM_DEBUG("IH: JPEG TRAP\n");
599
600 switch (entry->src_id) {
601 case VCN_2_0__SRCID__JPEG_DECODE:
602 amdgpu_fence_process(adev->jpeg.inst[ip_instance].ring_dec);
603 break;
604 default:
605 DRM_ERROR("Unhandled interrupt: %d %d\n",
606 entry->src_id, entry->src_data[0]);
607 break;
608 }
609
610 return 0;
611}
612
613static const struct amd_ip_funcs jpeg_v2_5_ip_funcs = {
614 .name = "jpeg_v2_5",
615 .early_init = jpeg_v2_5_early_init,
616 .sw_init = jpeg_v2_5_sw_init,
617 .sw_fini = jpeg_v2_5_sw_fini,
618 .hw_init = jpeg_v2_5_hw_init,
619 .hw_fini = jpeg_v2_5_hw_fini,
620 .suspend = jpeg_v2_5_suspend,
621 .resume = jpeg_v2_5_resume,
622 .is_idle = jpeg_v2_5_is_idle,
623 .wait_for_idle = jpeg_v2_5_wait_for_idle,
624 .set_clockgating_state = jpeg_v2_5_set_clockgating_state,
625 .set_powergating_state = jpeg_v2_5_set_powergating_state,
626};
627
628static const struct amd_ip_funcs jpeg_v2_6_ip_funcs = {
629 .name = "jpeg_v2_6",
630 .early_init = jpeg_v2_5_early_init,
631 .sw_init = jpeg_v2_5_sw_init,
632 .sw_fini = jpeg_v2_5_sw_fini,
633 .hw_init = jpeg_v2_5_hw_init,
634 .hw_fini = jpeg_v2_5_hw_fini,
635 .suspend = jpeg_v2_5_suspend,
636 .resume = jpeg_v2_5_resume,
637 .is_idle = jpeg_v2_5_is_idle,
638 .wait_for_idle = jpeg_v2_5_wait_for_idle,
639 .set_clockgating_state = jpeg_v2_5_set_clockgating_state,
640 .set_powergating_state = jpeg_v2_5_set_powergating_state,
641};
642
643static const struct amdgpu_ring_funcs jpeg_v2_5_dec_ring_vm_funcs = {
644 .type = AMDGPU_RING_TYPE_VCN_JPEG,
645 .align_mask = 0xf,
646 .get_rptr = jpeg_v2_5_dec_ring_get_rptr,
647 .get_wptr = jpeg_v2_5_dec_ring_get_wptr,
648 .set_wptr = jpeg_v2_5_dec_ring_set_wptr,
649 .parse_cs = jpeg_v2_dec_ring_parse_cs,
650 .emit_frame_size =
651 SOC15_FLUSH_GPU_TLB_NUM_WREG * 6 +
652 SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 8 +
653 8 + /* jpeg_v2_5_dec_ring_emit_vm_flush */
654 18 + 18 + /* jpeg_v2_5_dec_ring_emit_fence x2 vm fence */
655 8 + 16,
656 .emit_ib_size = 22, /* jpeg_v2_5_dec_ring_emit_ib */
657 .emit_ib = jpeg_v2_0_dec_ring_emit_ib,
658 .emit_fence = jpeg_v2_0_dec_ring_emit_fence,
659 .emit_vm_flush = jpeg_v2_0_dec_ring_emit_vm_flush,
660 .test_ring = amdgpu_jpeg_dec_ring_test_ring,
661 .test_ib = amdgpu_jpeg_dec_ring_test_ib,
662 .insert_nop = jpeg_v2_0_dec_ring_nop,
663 .insert_start = jpeg_v2_0_dec_ring_insert_start,
664 .insert_end = jpeg_v2_0_dec_ring_insert_end,
665 .pad_ib = amdgpu_ring_generic_pad_ib,
666 .begin_use = amdgpu_jpeg_ring_begin_use,
667 .end_use = amdgpu_jpeg_ring_end_use,
668 .emit_wreg = jpeg_v2_0_dec_ring_emit_wreg,
669 .emit_reg_wait = jpeg_v2_0_dec_ring_emit_reg_wait,
670 .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
671};
672
673static const struct amdgpu_ring_funcs jpeg_v2_6_dec_ring_vm_funcs = {
674 .type = AMDGPU_RING_TYPE_VCN_JPEG,
675 .align_mask = 0xf,
676 .get_rptr = jpeg_v2_5_dec_ring_get_rptr,
677 .get_wptr = jpeg_v2_5_dec_ring_get_wptr,
678 .set_wptr = jpeg_v2_5_dec_ring_set_wptr,
679 .parse_cs = jpeg_v2_dec_ring_parse_cs,
680 .emit_frame_size =
681 SOC15_FLUSH_GPU_TLB_NUM_WREG * 6 +
682 SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 8 +
683 8 + /* jpeg_v2_5_dec_ring_emit_vm_flush */
684 18 + 18 + /* jpeg_v2_5_dec_ring_emit_fence x2 vm fence */
685 8 + 16,
686 .emit_ib_size = 22, /* jpeg_v2_5_dec_ring_emit_ib */
687 .emit_ib = jpeg_v2_0_dec_ring_emit_ib,
688 .emit_fence = jpeg_v2_0_dec_ring_emit_fence,
689 .emit_vm_flush = jpeg_v2_0_dec_ring_emit_vm_flush,
690 .test_ring = amdgpu_jpeg_dec_ring_test_ring,
691 .test_ib = amdgpu_jpeg_dec_ring_test_ib,
692 .insert_nop = jpeg_v2_0_dec_ring_nop,
693 .insert_start = jpeg_v2_6_dec_ring_insert_start,
694 .insert_end = jpeg_v2_6_dec_ring_insert_end,
695 .pad_ib = amdgpu_ring_generic_pad_ib,
696 .begin_use = amdgpu_jpeg_ring_begin_use,
697 .end_use = amdgpu_jpeg_ring_end_use,
698 .emit_wreg = jpeg_v2_0_dec_ring_emit_wreg,
699 .emit_reg_wait = jpeg_v2_0_dec_ring_emit_reg_wait,
700 .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
701};
702
703static void jpeg_v2_5_set_dec_ring_funcs(struct amdgpu_device *adev)
704{
705 int i;
706
707 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
708 if (adev->jpeg.harvest_config & (1 << i))
709 continue;
710 if (adev->asic_type == CHIP_ARCTURUS)
711 adev->jpeg.inst[i].ring_dec->funcs = &jpeg_v2_5_dec_ring_vm_funcs;
712 else /* CHIP_ALDEBARAN */
713 adev->jpeg.inst[i].ring_dec->funcs = &jpeg_v2_6_dec_ring_vm_funcs;
714 adev->jpeg.inst[i].ring_dec->me = i;
715 }
716}
717
718static const struct amdgpu_irq_src_funcs jpeg_v2_5_irq_funcs = {
719 .set = jpeg_v2_5_set_interrupt_state,
720 .process = jpeg_v2_5_process_interrupt,
721};
722
723static const struct amdgpu_irq_src_funcs jpeg_v2_6_ras_irq_funcs = {
724 .set = jpeg_v2_6_set_ras_interrupt_state,
725 .process = amdgpu_jpeg_process_poison_irq,
726};
727
728static void jpeg_v2_5_set_irq_funcs(struct amdgpu_device *adev)
729{
730 int i;
731
732 for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
733 if (adev->jpeg.harvest_config & (1 << i))
734 continue;
735
736 adev->jpeg.inst[i].irq.num_types = 1;
737 adev->jpeg.inst[i].irq.funcs = &jpeg_v2_5_irq_funcs;
738
739 adev->jpeg.inst[i].ras_poison_irq.num_types = 1;
740 adev->jpeg.inst[i].ras_poison_irq.funcs = &jpeg_v2_6_ras_irq_funcs;
741 }
742}
743
744const struct amdgpu_ip_block_version jpeg_v2_5_ip_block = {
745 .type = AMD_IP_BLOCK_TYPE_JPEG,
746 .major = 2,
747 .minor = 5,
748 .rev = 0,
749 .funcs = &jpeg_v2_5_ip_funcs,
750};
751
752const struct amdgpu_ip_block_version jpeg_v2_6_ip_block = {
753 .type = AMD_IP_BLOCK_TYPE_JPEG,
754 .major = 2,
755 .minor = 6,
756 .rev = 0,
757 .funcs = &jpeg_v2_6_ip_funcs,
758};
759
760static uint32_t jpeg_v2_6_query_poison_by_instance(struct amdgpu_device *adev,
761 uint32_t instance, uint32_t sub_block)
762{
763 uint32_t poison_stat = 0, reg_value = 0;
764
765 switch (sub_block) {
766 case AMDGPU_JPEG_V2_6_JPEG0:
767 reg_value = RREG32_SOC15(JPEG, instance, mmUVD_RAS_JPEG0_STATUS);
768 poison_stat = REG_GET_FIELD(reg_value, UVD_RAS_JPEG0_STATUS, POISONED_PF);
769 break;
770 case AMDGPU_JPEG_V2_6_JPEG1:
771 reg_value = RREG32_SOC15(JPEG, instance, mmUVD_RAS_JPEG1_STATUS);
772 poison_stat = REG_GET_FIELD(reg_value, UVD_RAS_JPEG1_STATUS, POISONED_PF);
773 break;
774 default:
775 break;
776 }
777
778 if (poison_stat)
779 dev_info(adev->dev, "Poison detected in JPEG%d sub_block%d\n",
780 instance, sub_block);
781
782 return poison_stat;
783}
784
785static bool jpeg_v2_6_query_ras_poison_status(struct amdgpu_device *adev)
786{
787 uint32_t inst = 0, sub = 0, poison_stat = 0;
788
789 for (inst = 0; inst < adev->jpeg.num_jpeg_inst; inst++)
790 for (sub = 0; sub < AMDGPU_JPEG_V2_6_MAX_SUB_BLOCK; sub++)
791 poison_stat +=
792 jpeg_v2_6_query_poison_by_instance(adev, inst, sub);
793
794 return !!poison_stat;
795}
796
797const struct amdgpu_ras_block_hw_ops jpeg_v2_6_ras_hw_ops = {
798 .query_poison_status = jpeg_v2_6_query_ras_poison_status,
799};
800
801static struct amdgpu_jpeg_ras jpeg_v2_6_ras = {
802 .ras_block = {
803 .hw_ops = &jpeg_v2_6_ras_hw_ops,
804 .ras_late_init = amdgpu_jpeg_ras_late_init,
805 },
806};
807
808static void jpeg_v2_5_set_ras_funcs(struct amdgpu_device *adev)
809{
810 switch (amdgpu_ip_version(adev, JPEG_HWIP, 0)) {
811 case IP_VERSION(2, 6, 0):
812 adev->jpeg.ras = &jpeg_v2_6_ras;
813 break;
814 default:
815 break;
816 }
817}