/*
 * Copyright 2019 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 */

#include "amdgpu.h"
#include "amdgpu_jpeg.h"
#include "soc15.h"
#include "soc15d.h"
#include "jpeg_v2_0.h"
#include "jpeg_v2_5.h"

#include "vcn/vcn_2_5_offset.h"
#include "vcn/vcn_2_5_sh_mask.h"
#include "ivsrcid/vcn/irqsrcs_vcn_2_0.h"

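/*
 * Offset of UVD_JPEG_PITCH in the engine's internal register space; the
 * MMIO ("external") offset of the same register is computed per instance
 * with SOC15_REG_OFFSET() in jpeg_v2_5_sw_init().
 */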
#define mmUVD_JPEG_PITCH_INTERNAL_OFFSET	0x401f

#define JPEG25_MAX_HW_INSTANCES_ARCTURUS	2

static void jpeg_v2_5_set_dec_ring_funcs(struct amdgpu_device *adev);
static void jpeg_v2_5_set_irq_funcs(struct amdgpu_device *adev);
static int jpeg_v2_5_set_powergating_state(void *handle,
				enum amd_powergating_state state);
static void jpeg_v2_5_set_ras_funcs(struct amdgpu_device *adev);

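/*
 * Interrupts for the two JPEG instances arrive through separate IH client
 * IDs; this table maps instance index i to the client ID used when
 * registering and dispatching its interrupt sources.
 */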
static int amdgpu_ih_clientid_jpeg[] = {
	SOC15_IH_CLIENTID_VCN,
	SOC15_IH_CLIENTID_VCN1
};

/**
 * jpeg_v2_5_early_init - set function pointers
 *
 * @handle: amdgpu_device pointer
 *
 * Set ring and irq function pointers
 */
static int jpeg_v2_5_early_init(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
	u32 harvest;
	int i;

	adev->jpeg.num_jpeg_rings = 1;
	adev->jpeg.num_jpeg_inst = JPEG25_MAX_HW_INSTANCES_ARCTURUS;
	for (i = 0; i < adev->jpeg.num_jpeg_inst; i++) {
		harvest = RREG32_SOC15(JPEG, i, mmCC_UVD_HARVESTING);
		if (harvest & CC_UVD_HARVESTING__UVD_DISABLE_MASK)
			adev->jpeg.harvest_config |= 1 << i;
	}
	if (adev->jpeg.harvest_config == (AMDGPU_JPEG_HARVEST_JPEG0 |
					  AMDGPU_JPEG_HARVEST_JPEG1))
		return -ENOENT;

	jpeg_v2_5_set_dec_ring_funcs(adev);
	jpeg_v2_5_set_irq_funcs(adev);
	jpeg_v2_5_set_ras_funcs(adev);

	return 0;
}

/**
 * jpeg_v2_5_sw_init - sw init for JPEG block
 *
 * @handle: amdgpu_device pointer
 *
 * Load firmware and sw initialization
 */
static int jpeg_v2_5_sw_init(void *handle)
{
	struct amdgpu_ring *ring;
	int i, r;
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

	for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
		if (adev->jpeg.harvest_config & (1 << i))
			continue;

		/* JPEG TRAP */
		r = amdgpu_irq_add_id(adev, amdgpu_ih_clientid_jpeg[i],
				VCN_2_0__SRCID__JPEG_DECODE, &adev->jpeg.inst[i].irq);
		if (r)
			return r;

		/* JPEG DJPEG POISON EVENT */
		r = amdgpu_irq_add_id(adev, amdgpu_ih_clientid_jpeg[i],
			VCN_2_6__SRCID_DJPEG0_POISON, &adev->jpeg.inst[i].ras_poison_irq);
		if (r)
			return r;

		/* JPEG EJPEG POISON EVENT */
		r = amdgpu_irq_add_id(adev, amdgpu_ih_clientid_jpeg[i],
			VCN_2_6__SRCID_EJPEG0_POISON, &adev->jpeg.inst[i].ras_poison_irq);
		if (r)
			return r;
	}

	r = amdgpu_jpeg_sw_init(adev);
	if (r)
		return r;

	r = amdgpu_jpeg_resume(adev);
	if (r)
		return r;

	for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
		if (adev->jpeg.harvest_config & (1 << i))
			continue;

		ring = adev->jpeg.inst[i].ring_dec;
		ring->use_doorbell = true;
		if (adev->ip_versions[UVD_HWIP][0] == IP_VERSION(2, 5, 0))
			ring->vm_hub = AMDGPU_MMHUB1(0);
		else
			ring->vm_hub = AMDGPU_MMHUB0(0);
		ring->doorbell_index = (adev->doorbell_index.vcn.vcn_ring0_1 << 1) + 1 + 8 * i;
		snprintf(ring->name, sizeof(ring->name), "jpeg_dec_%d", i);
		r = amdgpu_ring_init(adev, ring, 512, &adev->jpeg.inst[i].irq,
				     0, AMDGPU_RING_PRIO_DEFAULT, NULL);
		if (r)
			return r;

		adev->jpeg.internal.jpeg_pitch[0] = mmUVD_JPEG_PITCH_INTERNAL_OFFSET;
		adev->jpeg.inst[i].external.jpeg_pitch[0] = SOC15_REG_OFFSET(JPEG, i, mmUVD_JPEG_PITCH);
	}

	r = amdgpu_jpeg_ras_sw_init(adev);
	if (r)
		return r;

	return 0;
}

/**
 * jpeg_v2_5_sw_fini - sw fini for JPEG block
 *
 * @handle: amdgpu_device pointer
 *
 * JPEG suspend and free up sw allocation
 */
static int jpeg_v2_5_sw_fini(void *handle)
{
	int r;
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

	r = amdgpu_jpeg_suspend(adev);
	if (r)
		return r;

	r = amdgpu_jpeg_sw_fini(adev);

	return r;
}

/**
 * jpeg_v2_5_hw_init - start and test JPEG block
 *
 * @handle: amdgpu_device pointer
 *
 * Set up the doorbell range and test the decode rings
 */
static int jpeg_v2_5_hw_init(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
	struct amdgpu_ring *ring;
	int i, r;

	for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
		if (adev->jpeg.harvest_config & (1 << i))
			continue;

		ring = adev->jpeg.inst[i].ring_dec;
		adev->nbio.funcs->vcn_doorbell_range(adev, ring->use_doorbell,
			(adev->doorbell_index.vcn.vcn_ring0_1 << 1) + 8 * i, i);

		r = amdgpu_ring_test_helper(ring);
		if (r)
			return r;
	}

	DRM_INFO("JPEG decode initialized successfully.\n");

	return 0;
}

/**
 * jpeg_v2_5_hw_fini - stop the hardware block
 *
 * @handle: amdgpu_device pointer
 *
 * Stop the JPEG block, mark the ring as not ready any more
 */
static int jpeg_v2_5_hw_fini(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
	int i;

	cancel_delayed_work_sync(&adev->vcn.idle_work);

	for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
		if (adev->jpeg.harvest_config & (1 << i))
			continue;

		if (adev->jpeg.cur_state != AMD_PG_STATE_GATE &&
		    RREG32_SOC15(JPEG, i, mmUVD_JRBC_STATUS))
			jpeg_v2_5_set_powergating_state(adev, AMD_PG_STATE_GATE);

		if (amdgpu_ras_is_supported(adev, AMDGPU_RAS_BLOCK__JPEG))
			amdgpu_irq_put(adev, &adev->jpeg.inst[i].ras_poison_irq, 0);
	}

	return 0;
}

/**
 * jpeg_v2_5_suspend - suspend JPEG block
 *
 * @handle: amdgpu_device pointer
 *
 * HW fini and suspend JPEG block
 */
static int jpeg_v2_5_suspend(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
	int r;

	r = jpeg_v2_5_hw_fini(adev);
	if (r)
		return r;

	r = amdgpu_jpeg_suspend(adev);

	return r;
}

/**
 * jpeg_v2_5_resume - resume JPEG block
 *
 * @handle: amdgpu_device pointer
 *
 * Resume firmware and hw init JPEG block
 */
static int jpeg_v2_5_resume(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
	int r;

	r = amdgpu_jpeg_resume(adev);
	if (r)
		return r;

	r = jpeg_v2_5_hw_init(adev);

	return r;
}

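/*
 * With clock gating disabled, the JPEG decoder, JMCIF and JRBBM clocks run
 * ungated so the engine can be programmed and started; dynamic clock mode
 * is only selected when MGCG support is flagged for the ASIC.
 */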
static void jpeg_v2_5_disable_clock_gating(struct amdgpu_device *adev, int inst)
{
	uint32_t data;

	data = RREG32_SOC15(JPEG, inst, mmJPEG_CGC_CTRL);
	if (adev->cg_flags & AMD_CG_SUPPORT_JPEG_MGCG)
		data |= 1 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
	else
		data &= ~(1 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT);

	data |= 1 << JPEG_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
	data |= 4 << JPEG_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
	WREG32_SOC15(JPEG, inst, mmJPEG_CGC_CTRL, data);

	data = RREG32_SOC15(JPEG, inst, mmJPEG_CGC_GATE);
	data &= ~(JPEG_CGC_GATE__JPEG_DEC_MASK
		| JPEG_CGC_GATE__JPEG2_DEC_MASK
		| JPEG_CGC_GATE__JMCIF_MASK
		| JPEG_CGC_GATE__JRBBM_MASK);
	WREG32_SOC15(JPEG, inst, mmJPEG_CGC_GATE, data);

	data = RREG32_SOC15(JPEG, inst, mmJPEG_CGC_CTRL);
	data &= ~(JPEG_CGC_CTRL__JPEG_DEC_MODE_MASK
		| JPEG_CGC_CTRL__JPEG2_DEC_MODE_MASK
		| JPEG_CGC_CTRL__JMCIF_MODE_MASK
		| JPEG_CGC_CTRL__JRBBM_MODE_MASK);
	WREG32_SOC15(JPEG, inst, mmJPEG_CGC_CTRL, data);
}

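/*
 * Re-arms coarse clock gating for the engine clients once the block goes
 * idle. Note that the encoder clock (JPEG_ENC) is gated here even though
 * the disable path never ungates it; presumably only the decoder is
 * exercised on these parts.
 */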
static void jpeg_v2_5_enable_clock_gating(struct amdgpu_device *adev, int inst)
{
	uint32_t data;

	data = RREG32_SOC15(JPEG, inst, mmJPEG_CGC_GATE);
	data |= (JPEG_CGC_GATE__JPEG_DEC_MASK
		| JPEG_CGC_GATE__JPEG2_DEC_MASK
		| JPEG_CGC_GATE__JPEG_ENC_MASK
		| JPEG_CGC_GATE__JMCIF_MASK
		| JPEG_CGC_GATE__JRBBM_MASK);
	WREG32_SOC15(JPEG, inst, mmJPEG_CGC_GATE, data);
}

/**
 * jpeg_v2_5_start - start JPEG block
 *
 * @adev: amdgpu_device pointer
 *
 * Setup and start the JPEG block
 */
static int jpeg_v2_5_start(struct amdgpu_device *adev)
{
	struct amdgpu_ring *ring;
	int i;

	for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
		if (adev->jpeg.harvest_config & (1 << i))
			continue;

		ring = adev->jpeg.inst[i].ring_dec;
		/* disable anti hang mechanism */
		WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmUVD_JPEG_POWER_STATUS), 0,
			~UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_MASK);

		/* JPEG disable CGC */
		jpeg_v2_5_disable_clock_gating(adev, i);

		/* MJPEG global tiling registers */
		WREG32_SOC15(JPEG, i, mmJPEG_DEC_GFX8_ADDR_CONFIG,
			adev->gfx.config.gb_addr_config);
		WREG32_SOC15(JPEG, i, mmJPEG_DEC_GFX10_ADDR_CONFIG,
			adev->gfx.config.gb_addr_config);

		/* enable JMI channel */
		WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmUVD_JMI_CNTL), 0,
			~UVD_JMI_CNTL__SOFT_RESET_MASK);

		/* enable System Interrupt for JRBC */
		WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmJPEG_SYS_INT_EN),
			JPEG_SYS_INT_EN__DJRBC_MASK,
			~JPEG_SYS_INT_EN__DJRBC_MASK);

		WREG32_SOC15(JPEG, i, mmUVD_LMI_JRBC_RB_VMID, 0);
		/* 0x1 | 0x2: hold fetch off and allow rptr writes while the
		 * ring is reprogrammed (presumably RB_NO_FETCH and
		 * RB_RPTR_WR_EN, which the v2.0 code spells out by name) */
		WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_CNTL, (0x00000001L | 0x00000002L));
		WREG32_SOC15(JPEG, i, mmUVD_LMI_JRBC_RB_64BIT_BAR_LOW,
			lower_32_bits(ring->gpu_addr));
		WREG32_SOC15(JPEG, i, mmUVD_LMI_JRBC_RB_64BIT_BAR_HIGH,
			upper_32_bits(ring->gpu_addr));
		WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_RPTR, 0);
		WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_WPTR, 0);
		/* clear the no-fetch bit so the engine starts consuming the ring */
		WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_CNTL, 0x00000002L);
		WREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_SIZE, ring->ring_size / 4);
		ring->wptr = RREG32_SOC15(JPEG, i, mmUVD_JRBC_RB_WPTR);
	}

	return 0;
}

/**
 * jpeg_v2_5_stop - stop JPEG block
 *
 * @adev: amdgpu_device pointer
 *
 * stop the JPEG block
 */
static int jpeg_v2_5_stop(struct amdgpu_device *adev)
{
	int i;

	for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
		if (adev->jpeg.harvest_config & (1 << i))
			continue;

		/* reset JMI */
		WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmUVD_JMI_CNTL),
			UVD_JMI_CNTL__SOFT_RESET_MASK,
			~UVD_JMI_CNTL__SOFT_RESET_MASK);

		jpeg_v2_5_enable_clock_gating(adev, i);

		/* enable anti hang mechanism */
		WREG32_P(SOC15_REG_OFFSET(JPEG, i, mmUVD_JPEG_POWER_STATUS),
			UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_MASK,
			~UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_MASK);
	}

	return 0;
}

/**
 * jpeg_v2_5_dec_ring_get_rptr - get read pointer
 *
 * @ring: amdgpu_ring pointer
 *
 * Returns the current hardware read pointer
 */
static uint64_t jpeg_v2_5_dec_ring_get_rptr(struct amdgpu_ring *ring)
{
	struct amdgpu_device *adev = ring->adev;

	return RREG32_SOC15(JPEG, ring->me, mmUVD_JRBC_RB_RPTR);
}

/**
 * jpeg_v2_5_dec_ring_get_wptr - get write pointer
 *
 * @ring: amdgpu_ring pointer
 *
 * Returns the current hardware write pointer
 */
static uint64_t jpeg_v2_5_dec_ring_get_wptr(struct amdgpu_ring *ring)
{
	struct amdgpu_device *adev = ring->adev;

	if (ring->use_doorbell)
		return *ring->wptr_cpu_addr;
	else
		return RREG32_SOC15(JPEG, ring->me, mmUVD_JRBC_RB_WPTR);
}

/**
 * jpeg_v2_5_dec_ring_set_wptr - set write pointer
 *
 * @ring: amdgpu_ring pointer
 *
 * Commits the write pointer to the hardware
 */
static void jpeg_v2_5_dec_ring_set_wptr(struct amdgpu_ring *ring)
{
	struct amdgpu_device *adev = ring->adev;

	if (ring->use_doorbell) {
		*ring->wptr_cpu_addr = lower_32_bits(ring->wptr);
		WDOORBELL32(ring->doorbell_index, lower_32_bits(ring->wptr));
	} else {
		WREG32_SOC15(JPEG, ring->me, mmUVD_JRBC_RB_WPTR, lower_32_bits(ring->wptr));
	}
}

/**
 * jpeg_v2_6_dec_ring_insert_start - insert a start command
 *
 * @ring: amdgpu_ring pointer
 *
 * Write a start command to the ring.
 */
static void jpeg_v2_6_dec_ring_insert_start(struct amdgpu_ring *ring)
{
	amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
		0, 0, PACKETJ_TYPE0));
	amdgpu_ring_write(ring, 0x6aa04); /* PCTL0_MMHUB_DEEPSLEEP_IB */

	amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
		0, 0, PACKETJ_TYPE0));
	/* start marker: bit 31 plus a bit selected by the instance (ring->me) */
	amdgpu_ring_write(ring, 0x80000000 | (1 << (ring->me * 2 + 14)));
}

/**
 * jpeg_v2_6_dec_ring_insert_end - insert an end command
 *
 * @ring: amdgpu_ring pointer
 *
 * Write an end command to the ring.
 */
static void jpeg_v2_6_dec_ring_insert_end(struct amdgpu_ring *ring)
{
	amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
		0, 0, PACKETJ_TYPE0));
	amdgpu_ring_write(ring, 0x6aa04); /* PCTL0_MMHUB_DEEPSLEEP_IB */

	amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
		0, 0, PACKETJ_TYPE0));
	/* end marker: the same instance bit without bit 31 */
	amdgpu_ring_write(ring, (1 << (ring->me * 2 + 14)));
}

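/*
 * The block counts as idle only when every unharvested instance reports
 * RB_JOB_DONE in UVD_JRBC_STATUS.
 */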
static bool jpeg_v2_5_is_idle(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
	int i, ret = 1;

	for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
		if (adev->jpeg.harvest_config & (1 << i))
			continue;

		ret &= (((RREG32_SOC15(JPEG, i, mmUVD_JRBC_STATUS) &
			UVD_JRBC_STATUS__RB_JOB_DONE_MASK) ==
			UVD_JRBC_STATUS__RB_JOB_DONE_MASK));
	}

	return ret;
}

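/*
 * Same condition as jpeg_v2_5_is_idle(), but polled per instance through
 * the SOC15 register-wait helper so a stuck engine surfaces as an error.
 */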
static int jpeg_v2_5_wait_for_idle(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
	int i, ret;

	for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
		if (adev->jpeg.harvest_config & (1 << i))
			continue;

		ret = SOC15_WAIT_ON_RREG(JPEG, i, mmUVD_JRBC_STATUS,
			UVD_JRBC_STATUS__RB_JOB_DONE_MASK,
			UVD_JRBC_STATUS__RB_JOB_DONE_MASK);
		if (ret)
			return ret;
	}

	return 0;
}

static int jpeg_v2_5_set_clockgating_state(void *handle,
					   enum amd_clockgating_state state)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
	bool enable = (state == AMD_CG_STATE_GATE);
	int i;

	for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
		if (adev->jpeg.harvest_config & (1 << i))
			continue;

		if (enable) {
			if (!jpeg_v2_5_is_idle(handle))
				return -EBUSY;
			jpeg_v2_5_enable_clock_gating(adev, i);
		} else {
			jpeg_v2_5_disable_clock_gating(adev, i);
		}
	}

	return 0;
}

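/*
 * Power gating doubles as start/stop control: gating stops the engines and
 * re-enables clock gating, while ungating reprograms and restarts them.
 * adev->jpeg.cur_state caches the last state that was applied successfully.
 */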
static int jpeg_v2_5_set_powergating_state(void *handle,
					   enum amd_powergating_state state)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
	int ret;

	if (state == adev->jpeg.cur_state)
		return 0;

	if (state == AMD_PG_STATE_GATE)
		ret = jpeg_v2_5_stop(adev);
	else
		ret = jpeg_v2_5_start(adev);

	if (!ret)
		adev->jpeg.cur_state = state;

	return ret;
}

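/*
 * Interrupt delivery is enabled from jpeg_v2_5_start() via JPEG_SYS_INT_EN,
 * so these state callbacks are no-ops kept only to satisfy the
 * amdgpu_irq_src interface.
 */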
static int jpeg_v2_5_set_interrupt_state(struct amdgpu_device *adev,
					 struct amdgpu_irq_src *source,
					 unsigned type,
					 enum amdgpu_interrupt_state state)
{
	return 0;
}

static int jpeg_v2_6_set_ras_interrupt_state(struct amdgpu_device *adev,
					     struct amdgpu_irq_src *source,
					     unsigned int type,
					     enum amdgpu_interrupt_state state)
{
	return 0;
}

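/*
 * IH entries carry no instance number for JPEG, so the owning instance is
 * recovered from the client ID (VCN vs. VCN1) before the fence is processed.
 */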
static int jpeg_v2_5_process_interrupt(struct amdgpu_device *adev,
				       struct amdgpu_irq_src *source,
				       struct amdgpu_iv_entry *entry)
{
	uint32_t ip_instance;

	switch (entry->client_id) {
	case SOC15_IH_CLIENTID_VCN:
		ip_instance = 0;
		break;
	case SOC15_IH_CLIENTID_VCN1:
		ip_instance = 1;
		break;
	default:
		DRM_ERROR("Unhandled client id: %d\n", entry->client_id);
		return 0;
	}

	DRM_DEBUG("IH: JPEG TRAP\n");

	switch (entry->src_id) {
	case VCN_2_0__SRCID__JPEG_DECODE:
		amdgpu_fence_process(adev->jpeg.inst[ip_instance].ring_dec);
		break;
	default:
		DRM_ERROR("Unhandled interrupt: %d %d\n",
			  entry->src_id, entry->src_data[0]);
		break;
	}

	return 0;
}

static const struct amd_ip_funcs jpeg_v2_5_ip_funcs = {
	.name = "jpeg_v2_5",
	.early_init = jpeg_v2_5_early_init,
	.late_init = NULL,
	.sw_init = jpeg_v2_5_sw_init,
	.sw_fini = jpeg_v2_5_sw_fini,
	.hw_init = jpeg_v2_5_hw_init,
	.hw_fini = jpeg_v2_5_hw_fini,
	.suspend = jpeg_v2_5_suspend,
	.resume = jpeg_v2_5_resume,
	.is_idle = jpeg_v2_5_is_idle,
	.wait_for_idle = jpeg_v2_5_wait_for_idle,
	.check_soft_reset = NULL,
	.pre_soft_reset = NULL,
	.soft_reset = NULL,
	.post_soft_reset = NULL,
	.set_clockgating_state = jpeg_v2_5_set_clockgating_state,
	.set_powergating_state = jpeg_v2_5_set_powergating_state,
};

static const struct amd_ip_funcs jpeg_v2_6_ip_funcs = {
	.name = "jpeg_v2_6",
	.early_init = jpeg_v2_5_early_init,
	.late_init = NULL,
	.sw_init = jpeg_v2_5_sw_init,
	.sw_fini = jpeg_v2_5_sw_fini,
	.hw_init = jpeg_v2_5_hw_init,
	.hw_fini = jpeg_v2_5_hw_fini,
	.suspend = jpeg_v2_5_suspend,
	.resume = jpeg_v2_5_resume,
	.is_idle = jpeg_v2_5_is_idle,
	.wait_for_idle = jpeg_v2_5_wait_for_idle,
	.check_soft_reset = NULL,
	.pre_soft_reset = NULL,
	.soft_reset = NULL,
	.post_soft_reset = NULL,
	.set_clockgating_state = jpeg_v2_5_set_clockgating_state,
	.set_powergating_state = jpeg_v2_5_set_powergating_state,
};

static const struct amdgpu_ring_funcs jpeg_v2_5_dec_ring_vm_funcs = {
	.type = AMDGPU_RING_TYPE_VCN_JPEG,
	.align_mask = 0xf,
	.get_rptr = jpeg_v2_5_dec_ring_get_rptr,
	.get_wptr = jpeg_v2_5_dec_ring_get_wptr,
	.set_wptr = jpeg_v2_5_dec_ring_set_wptr,
	.emit_frame_size =
		SOC15_FLUSH_GPU_TLB_NUM_WREG * 6 +
		SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 8 +
		8 + /* jpeg_v2_5_dec_ring_emit_vm_flush */
		18 + 18 + /* jpeg_v2_5_dec_ring_emit_fence x2 vm fence */
		8 + 16,
	.emit_ib_size = 22, /* jpeg_v2_5_dec_ring_emit_ib */
	.emit_ib = jpeg_v2_0_dec_ring_emit_ib,
	.emit_fence = jpeg_v2_0_dec_ring_emit_fence,
	.emit_vm_flush = jpeg_v2_0_dec_ring_emit_vm_flush,
	.test_ring = amdgpu_jpeg_dec_ring_test_ring,
	.test_ib = amdgpu_jpeg_dec_ring_test_ib,
	.insert_nop = jpeg_v2_0_dec_ring_nop,
	.insert_start = jpeg_v2_0_dec_ring_insert_start,
	.insert_end = jpeg_v2_0_dec_ring_insert_end,
	.pad_ib = amdgpu_ring_generic_pad_ib,
	.begin_use = amdgpu_jpeg_ring_begin_use,
	.end_use = amdgpu_jpeg_ring_end_use,
	.emit_wreg = jpeg_v2_0_dec_ring_emit_wreg,
	.emit_reg_wait = jpeg_v2_0_dec_ring_emit_reg_wait,
	.emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
};

static const struct amdgpu_ring_funcs jpeg_v2_6_dec_ring_vm_funcs = {
	.type = AMDGPU_RING_TYPE_VCN_JPEG,
	.align_mask = 0xf,
	.get_rptr = jpeg_v2_5_dec_ring_get_rptr,
	.get_wptr = jpeg_v2_5_dec_ring_get_wptr,
	.set_wptr = jpeg_v2_5_dec_ring_set_wptr,
	.emit_frame_size =
		SOC15_FLUSH_GPU_TLB_NUM_WREG * 6 +
		SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 8 +
		8 + /* jpeg_v2_5_dec_ring_emit_vm_flush */
		18 + 18 + /* jpeg_v2_5_dec_ring_emit_fence x2 vm fence */
		8 + 16,
	.emit_ib_size = 22, /* jpeg_v2_5_dec_ring_emit_ib */
	.emit_ib = jpeg_v2_0_dec_ring_emit_ib,
	.emit_fence = jpeg_v2_0_dec_ring_emit_fence,
	.emit_vm_flush = jpeg_v2_0_dec_ring_emit_vm_flush,
	.test_ring = amdgpu_jpeg_dec_ring_test_ring,
	.test_ib = amdgpu_jpeg_dec_ring_test_ib,
	.insert_nop = jpeg_v2_0_dec_ring_nop,
	.insert_start = jpeg_v2_6_dec_ring_insert_start,
	.insert_end = jpeg_v2_6_dec_ring_insert_end,
	.pad_ib = amdgpu_ring_generic_pad_ib,
	.begin_use = amdgpu_jpeg_ring_begin_use,
	.end_use = amdgpu_jpeg_ring_end_use,
	.emit_wreg = jpeg_v2_0_dec_ring_emit_wreg,
	.emit_reg_wait = jpeg_v2_0_dec_ring_emit_reg_wait,
	.emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
};

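/*
 * Arcturus keeps the plain v2.0-style start/end packets; Aldebaran (JPEG
 * 2.6) needs the per-instance variants above, so the ring function table
 * is chosen by ASIC type.
 */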
static void jpeg_v2_5_set_dec_ring_funcs(struct amdgpu_device *adev)
{
	int i;

	for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
		if (adev->jpeg.harvest_config & (1 << i))
			continue;
		if (adev->asic_type == CHIP_ARCTURUS)
			adev->jpeg.inst[i].ring_dec->funcs = &jpeg_v2_5_dec_ring_vm_funcs;
		else /* CHIP_ALDEBARAN */
			adev->jpeg.inst[i].ring_dec->funcs = &jpeg_v2_6_dec_ring_vm_funcs;
		adev->jpeg.inst[i].ring_dec->me = i;
		DRM_INFO("JPEG(%d) JPEG decode is enabled in VM mode\n", i);
	}
}

static const struct amdgpu_irq_src_funcs jpeg_v2_5_irq_funcs = {
	.set = jpeg_v2_5_set_interrupt_state,
	.process = jpeg_v2_5_process_interrupt,
};

static const struct amdgpu_irq_src_funcs jpeg_v2_6_ras_irq_funcs = {
	.set = jpeg_v2_6_set_ras_interrupt_state,
	.process = amdgpu_jpeg_process_poison_irq,
};

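/*
 * Each instance gets one decode interrupt source plus one RAS poison
 * source; the poison source reuses the common amdgpu_jpeg poison handler.
 */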
static void jpeg_v2_5_set_irq_funcs(struct amdgpu_device *adev)
{
	int i;

	for (i = 0; i < adev->jpeg.num_jpeg_inst; ++i) {
		if (adev->jpeg.harvest_config & (1 << i))
			continue;

		adev->jpeg.inst[i].irq.num_types = 1;
		adev->jpeg.inst[i].irq.funcs = &jpeg_v2_5_irq_funcs;

		adev->jpeg.inst[i].ras_poison_irq.num_types = 1;
		adev->jpeg.inst[i].ras_poison_irq.funcs = &jpeg_v2_6_ras_irq_funcs;
	}
}

const struct amdgpu_ip_block_version jpeg_v2_5_ip_block =
{
	.type = AMD_IP_BLOCK_TYPE_JPEG,
	.major = 2,
	.minor = 5,
	.rev = 0,
	.funcs = &jpeg_v2_5_ip_funcs,
};

const struct amdgpu_ip_block_version jpeg_v2_6_ip_block =
{
	.type = AMD_IP_BLOCK_TYPE_JPEG,
	.major = 2,
	.minor = 6,
	.rev = 0,
	.funcs = &jpeg_v2_6_ip_funcs,
};

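/*
 * RAS poison status is tracked per instance and per JPEG core through the
 * UVD_RAS_JPEG{0,1}_STATUS registers; a nonzero POISONED_PF field reports
 * consumed poison for that core.
 */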
static uint32_t jpeg_v2_6_query_poison_by_instance(struct amdgpu_device *adev,
		uint32_t instance, uint32_t sub_block)
{
	uint32_t poison_stat = 0, reg_value = 0;

	switch (sub_block) {
	case AMDGPU_JPEG_V2_6_JPEG0:
		reg_value = RREG32_SOC15(JPEG, instance, mmUVD_RAS_JPEG0_STATUS);
		poison_stat = REG_GET_FIELD(reg_value, UVD_RAS_JPEG0_STATUS, POISONED_PF);
		break;
	case AMDGPU_JPEG_V2_6_JPEG1:
		reg_value = RREG32_SOC15(JPEG, instance, mmUVD_RAS_JPEG1_STATUS);
		poison_stat = REG_GET_FIELD(reg_value, UVD_RAS_JPEG1_STATUS, POISONED_PF);
		break;
	default:
		break;
	}

	if (poison_stat)
		dev_info(adev->dev, "Poison detected in JPEG%d sub_block%d\n",
			instance, sub_block);

	return poison_stat;
}

static bool jpeg_v2_6_query_ras_poison_status(struct amdgpu_device *adev)
{
	uint32_t inst = 0, sub = 0, poison_stat = 0;

	for (inst = 0; inst < adev->jpeg.num_jpeg_inst; inst++)
		for (sub = 0; sub < AMDGPU_JPEG_V2_6_MAX_SUB_BLOCK; sub++)
			poison_stat +=
				jpeg_v2_6_query_poison_by_instance(adev, inst, sub);

	return !!poison_stat;
}

const struct amdgpu_ras_block_hw_ops jpeg_v2_6_ras_hw_ops = {
	.query_poison_status = jpeg_v2_6_query_ras_poison_status,
};

static struct amdgpu_jpeg_ras jpeg_v2_6_ras = {
	.ras_block = {
		.hw_ops = &jpeg_v2_6_ras_hw_ops,
		.ras_late_init = amdgpu_jpeg_ras_late_init,
	},
};

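/*
 * Only JPEG 2.6.0 (Aldebaran) has RAS wired up; other IP revisions leave
 * adev->jpeg.ras unset so the common JPEG code skips RAS setup.
 */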
static void jpeg_v2_5_set_ras_funcs(struct amdgpu_device *adev)
{
	switch (adev->ip_versions[JPEG_HWIP][0]) {
	case IP_VERSION(2, 6, 0):
		adev->jpeg.ras = &jpeg_v2_6_ras;
		break;
	default:
		break;
	}
}