]> git.proxmox.com Git - mirror_ubuntu-hirsute-kernel.git/blob - drivers/gpu/drm/amd/amdgpu/jpeg_v2_0.c
Merge tag 'kbuild-v5.6-2' of git://git.kernel.org/pub/scm/linux/kernel/git/masahiroy...
[mirror_ubuntu-hirsute-kernel.git] / drivers / gpu / drm / amd / amdgpu / jpeg_v2_0.c
1 /*
2 * Copyright 2019 Advanced Micro Devices, Inc.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
21 *
22 */
23
24 #include "amdgpu.h"
25 #include "amdgpu_jpeg.h"
26 #include "amdgpu_pm.h"
27 #include "soc15.h"
28 #include "soc15d.h"
29
30 #include "vcn/vcn_2_0_0_offset.h"
31 #include "vcn/vcn_2_0_0_sh_mask.h"
32 #include "ivsrcid/vcn/irqsrcs_vcn_2_0.h"
33
34 #define mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET 0x1bfff
35 #define mmUVD_JPEG_GPCOM_CMD_INTERNAL_OFFSET 0x4029
36 #define mmUVD_JPEG_GPCOM_DATA0_INTERNAL_OFFSET 0x402a
37 #define mmUVD_JPEG_GPCOM_DATA1_INTERNAL_OFFSET 0x402b
38 #define mmUVD_LMI_JRBC_RB_MEM_WR_64BIT_BAR_LOW_INTERNAL_OFFSET 0x40ea
39 #define mmUVD_LMI_JRBC_RB_MEM_WR_64BIT_BAR_HIGH_INTERNAL_OFFSET 0x40eb
40 #define mmUVD_LMI_JRBC_IB_VMID_INTERNAL_OFFSET 0x40cf
41 #define mmUVD_LMI_JPEG_VMID_INTERNAL_OFFSET 0x40d1
42 #define mmUVD_LMI_JRBC_IB_64BIT_BAR_LOW_INTERNAL_OFFSET 0x40e8
43 #define mmUVD_LMI_JRBC_IB_64BIT_BAR_HIGH_INTERNAL_OFFSET 0x40e9
44 #define mmUVD_JRBC_IB_SIZE_INTERNAL_OFFSET 0x4082
45 #define mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_LOW_INTERNAL_OFFSET 0x40ec
46 #define mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_HIGH_INTERNAL_OFFSET 0x40ed
47 #define mmUVD_JRBC_RB_COND_RD_TIMER_INTERNAL_OFFSET 0x4085
48 #define mmUVD_JRBC_RB_REF_DATA_INTERNAL_OFFSET 0x4084
49 #define mmUVD_JRBC_STATUS_INTERNAL_OFFSET 0x4089
50 #define mmUVD_JPEG_PITCH_INTERNAL_OFFSET 0x401f
51
52 #define JRBC_DEC_EXTERNAL_REG_WRITE_ADDR 0x18000
53
54 static void jpeg_v2_0_set_dec_ring_funcs(struct amdgpu_device *adev);
55 static void jpeg_v2_0_set_irq_funcs(struct amdgpu_device *adev);
56 static int jpeg_v2_0_set_powergating_state(void *handle,
57 enum amd_powergating_state state);
58
59 /**
60 * jpeg_v2_0_early_init - set function pointers
61 *
62 * @handle: amdgpu_device pointer
63 *
64 * Set ring and irq function pointers
65 */
66 static int jpeg_v2_0_early_init(void *handle)
67 {
68 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
69
70 adev->jpeg.num_jpeg_inst = 1;
71
72 jpeg_v2_0_set_dec_ring_funcs(adev);
73 jpeg_v2_0_set_irq_funcs(adev);
74
75 return 0;
76 }
77
78 /**
79 * jpeg_v2_0_sw_init - sw init for JPEG block
80 *
81 * @handle: amdgpu_device pointer
82 *
83 * Load firmware and sw initialization
84 */
85 static int jpeg_v2_0_sw_init(void *handle)
86 {
87 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
88 struct amdgpu_ring *ring;
89 int r;
90
91 /* JPEG TRAP */
92 r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_VCN,
93 VCN_2_0__SRCID__JPEG_DECODE, &adev->jpeg.inst->irq);
94 if (r)
95 return r;
96
97 r = amdgpu_jpeg_sw_init(adev);
98 if (r)
99 return r;
100
101 r = amdgpu_jpeg_resume(adev);
102 if (r)
103 return r;
104
105 ring = &adev->jpeg.inst->ring_dec;
106 ring->use_doorbell = true;
107 ring->doorbell_index = (adev->doorbell_index.vcn.vcn_ring0_1 << 1) + 1;
108 sprintf(ring->name, "jpeg_dec");
109 r = amdgpu_ring_init(adev, ring, 512, &adev->jpeg.inst->irq, 0);
110 if (r)
111 return r;
112
113 adev->jpeg.internal.jpeg_pitch = mmUVD_JPEG_PITCH_INTERNAL_OFFSET;
114 adev->jpeg.inst->external.jpeg_pitch = SOC15_REG_OFFSET(JPEG, 0, mmUVD_JPEG_PITCH);
115
116 return 0;
117 }
118
119 /**
120 * jpeg_v2_0_sw_fini - sw fini for JPEG block
121 *
122 * @handle: amdgpu_device pointer
123 *
124 * JPEG suspend and free up sw allocation
125 */
126 static int jpeg_v2_0_sw_fini(void *handle)
127 {
128 int r;
129 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
130
131 r = amdgpu_jpeg_suspend(adev);
132 if (r)
133 return r;
134
135 r = amdgpu_jpeg_sw_fini(adev);
136
137 return r;
138 }
139
140 /**
141 * jpeg_v2_0_hw_init - start and test JPEG block
142 *
143 * @handle: amdgpu_device pointer
144 *
145 */
146 static int jpeg_v2_0_hw_init(void *handle)
147 {
148 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
149 struct amdgpu_ring *ring = &adev->jpeg.inst->ring_dec;
150 int r;
151
152 adev->nbio.funcs->vcn_doorbell_range(adev, ring->use_doorbell,
153 (adev->doorbell_index.vcn.vcn_ring0_1 << 1), 0);
154
155 r = amdgpu_ring_test_helper(ring);
156 if (!r)
157 DRM_INFO("JPEG decode initialized successfully.\n");
158
159 return r;
160 }
161
162 /**
163 * jpeg_v2_0_hw_fini - stop the hardware block
164 *
165 * @handle: amdgpu_device pointer
166 *
167 * Stop the JPEG block, mark ring as not ready any more
168 */
169 static int jpeg_v2_0_hw_fini(void *handle)
170 {
171 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
172 struct amdgpu_ring *ring = &adev->jpeg.inst->ring_dec;
173
174 if (adev->jpeg.cur_state != AMD_PG_STATE_GATE &&
175 RREG32_SOC15(JPEG, 0, mmUVD_JRBC_STATUS))
176 jpeg_v2_0_set_powergating_state(adev, AMD_PG_STATE_GATE);
177
178 ring->sched.ready = false;
179
180 return 0;
181 }
182
183 /**
184 * jpeg_v2_0_suspend - suspend JPEG block
185 *
186 * @handle: amdgpu_device pointer
187 *
188 * HW fini and suspend JPEG block
189 */
190 static int jpeg_v2_0_suspend(void *handle)
191 {
192 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
193 int r;
194
195 r = jpeg_v2_0_hw_fini(adev);
196 if (r)
197 return r;
198
199 r = amdgpu_jpeg_suspend(adev);
200
201 return r;
202 }
203
204 /**
205 * jpeg_v2_0_resume - resume JPEG block
206 *
207 * @handle: amdgpu_device pointer
208 *
209 * Resume firmware and hw init JPEG block
210 */
211 static int jpeg_v2_0_resume(void *handle)
212 {
213 int r;
214 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
215
216 r = amdgpu_jpeg_resume(adev);
217 if (r)
218 return r;
219
220 r = jpeg_v2_0_hw_init(adev);
221
222 return r;
223 }
224
225 static int jpeg_v2_0_disable_power_gating(struct amdgpu_device *adev)
226 {
227 uint32_t data;
228 int r = 0;
229
230 if (adev->pg_flags & AMD_PG_SUPPORT_JPEG) {
231 data = 1 << UVD_PGFSM_CONFIG__UVDJ_PWR_CONFIG__SHIFT;
232 WREG32(SOC15_REG_OFFSET(JPEG, 0, mmUVD_PGFSM_CONFIG), data);
233
234 SOC15_WAIT_ON_RREG(JPEG, 0,
235 mmUVD_PGFSM_STATUS, UVD_PGFSM_STATUS_UVDJ_PWR_ON,
236 UVD_PGFSM_STATUS__UVDJ_PWR_STATUS_MASK, r);
237
238 if (r) {
239 DRM_ERROR("amdgpu: JPEG disable power gating failed\n");
240 return r;
241 }
242 }
243
244 /* Removing the anti hang mechanism to indicate the UVDJ tile is ON */
245 data = RREG32(SOC15_REG_OFFSET(JPEG, 0, mmUVD_JPEG_POWER_STATUS)) & ~0x1;
246 WREG32(SOC15_REG_OFFSET(JPEG, 0, mmUVD_JPEG_POWER_STATUS), data);
247
248 return 0;
249 }
250
251 static int jpeg_v2_0_enable_power_gating(struct amdgpu_device* adev)
252 {
253 if (adev->pg_flags & AMD_PG_SUPPORT_JPEG) {
254 uint32_t data;
255 int r = 0;
256
257 data = RREG32(SOC15_REG_OFFSET(JPEG, 0, mmUVD_JPEG_POWER_STATUS));
258 data &= ~UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_MASK;
259 data |= 0x1; //UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_TILES_OFF;
260 WREG32(SOC15_REG_OFFSET(JPEG, 0, mmUVD_JPEG_POWER_STATUS), data);
261
262 data = 2 << UVD_PGFSM_CONFIG__UVDJ_PWR_CONFIG__SHIFT;
263 WREG32(SOC15_REG_OFFSET(JPEG, 0, mmUVD_PGFSM_CONFIG), data);
264
265 SOC15_WAIT_ON_RREG(JPEG, 0, mmUVD_PGFSM_STATUS,
266 (2 << UVD_PGFSM_STATUS__UVDJ_PWR_STATUS__SHIFT),
267 UVD_PGFSM_STATUS__UVDJ_PWR_STATUS_MASK, r);
268
269 if (r) {
270 DRM_ERROR("amdgpu: JPEG enable power gating failed\n");
271 return r;
272 }
273 }
274
275 return 0;
276 }
277
278 static void jpeg_v2_0_disable_clock_gating(struct amdgpu_device* adev)
279 {
280 uint32_t data;
281
282 data = RREG32_SOC15(JPEG, 0, mmJPEG_CGC_CTRL);
283 if (adev->cg_flags & AMD_CG_SUPPORT_JPEG_MGCG)
284 data |= 1 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
285 else
286 data &= ~JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
287
288 data |= 1 << JPEG_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
289 data |= 4 << JPEG_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
290 WREG32_SOC15(JPEG, 0, mmJPEG_CGC_CTRL, data);
291
292 data = RREG32_SOC15(JPEG, 0, mmJPEG_CGC_GATE);
293 data &= ~(JPEG_CGC_GATE__JPEG_DEC_MASK
294 | JPEG_CGC_GATE__JPEG2_DEC_MASK
295 | JPEG_CGC_GATE__JPEG_ENC_MASK
296 | JPEG_CGC_GATE__JMCIF_MASK
297 | JPEG_CGC_GATE__JRBBM_MASK);
298 WREG32_SOC15(JPEG, 0, mmJPEG_CGC_GATE, data);
299 }
300
301 static void jpeg_v2_0_enable_clock_gating(struct amdgpu_device* adev)
302 {
303 uint32_t data;
304
305 data = RREG32_SOC15(JPEG, 0, mmJPEG_CGC_CTRL);
306 if (adev->cg_flags & AMD_CG_SUPPORT_JPEG_MGCG)
307 data |= 1 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
308 else
309 data |= 0 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
310
311 data |= 1 << JPEG_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
312 data |= 4 << JPEG_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
313 WREG32_SOC15(JPEG, 0, mmJPEG_CGC_CTRL, data);
314
315 data = RREG32_SOC15(JPEG, 0, mmJPEG_CGC_GATE);
316 data |= (JPEG_CGC_GATE__JPEG_DEC_MASK
317 |JPEG_CGC_GATE__JPEG2_DEC_MASK
318 |JPEG_CGC_GATE__JPEG_ENC_MASK
319 |JPEG_CGC_GATE__JMCIF_MASK
320 |JPEG_CGC_GATE__JRBBM_MASK);
321 WREG32_SOC15(JPEG, 0, mmJPEG_CGC_GATE, data);
322 }
323
324 /**
325 * jpeg_v2_0_start - start JPEG block
326 *
327 * @adev: amdgpu_device pointer
328 *
329 * Setup and start the JPEG block
330 */
331 static int jpeg_v2_0_start(struct amdgpu_device *adev)
332 {
333 struct amdgpu_ring *ring = &adev->jpeg.inst->ring_dec;
334 int r;
335
336 if (adev->pm.dpm_enabled)
337 amdgpu_dpm_enable_jpeg(adev, true);
338
339 /* disable power gating */
340 r = jpeg_v2_0_disable_power_gating(adev);
341 if (r)
342 return r;
343
344 /* JPEG disable CGC */
345 jpeg_v2_0_disable_clock_gating(adev);
346
347 WREG32_SOC15(JPEG, 0, mmJPEG_DEC_GFX10_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
348
349 /* enable JMI channel */
350 WREG32_P(SOC15_REG_OFFSET(JPEG, 0, mmUVD_JMI_CNTL), 0,
351 ~UVD_JMI_CNTL__SOFT_RESET_MASK);
352
353 /* enable System Interrupt for JRBC */
354 WREG32_P(SOC15_REG_OFFSET(JPEG, 0, mmJPEG_SYS_INT_EN),
355 JPEG_SYS_INT_EN__DJRBC_MASK,
356 ~JPEG_SYS_INT_EN__DJRBC_MASK);
357
358 WREG32_SOC15(JPEG, 0, mmUVD_LMI_JRBC_RB_VMID, 0);
359 WREG32_SOC15(JPEG, 0, mmUVD_JRBC_RB_CNTL, (0x00000001L | 0x00000002L));
360 WREG32_SOC15(JPEG, 0, mmUVD_LMI_JRBC_RB_64BIT_BAR_LOW,
361 lower_32_bits(ring->gpu_addr));
362 WREG32_SOC15(JPEG, 0, mmUVD_LMI_JRBC_RB_64BIT_BAR_HIGH,
363 upper_32_bits(ring->gpu_addr));
364 WREG32_SOC15(JPEG, 0, mmUVD_JRBC_RB_RPTR, 0);
365 WREG32_SOC15(JPEG, 0, mmUVD_JRBC_RB_WPTR, 0);
366 WREG32_SOC15(JPEG, 0, mmUVD_JRBC_RB_CNTL, 0x00000002L);
367 WREG32_SOC15(JPEG, 0, mmUVD_JRBC_RB_SIZE, ring->ring_size / 4);
368 ring->wptr = RREG32_SOC15(JPEG, 0, mmUVD_JRBC_RB_WPTR);
369
370 return 0;
371 }
372
373 /**
374 * jpeg_v2_0_stop - stop JPEG block
375 *
376 * @adev: amdgpu_device pointer
377 *
378 * stop the JPEG block
379 */
380 static int jpeg_v2_0_stop(struct amdgpu_device *adev)
381 {
382 int r;
383
384 /* reset JMI */
385 WREG32_P(SOC15_REG_OFFSET(JPEG, 0, mmUVD_JMI_CNTL),
386 UVD_JMI_CNTL__SOFT_RESET_MASK,
387 ~UVD_JMI_CNTL__SOFT_RESET_MASK);
388
389 /* enable JPEG CGC */
390 jpeg_v2_0_enable_clock_gating(adev);
391
392 /* enable power gating */
393 r = jpeg_v2_0_enable_power_gating(adev);
394 if (r)
395 return r;
396
397 if (adev->pm.dpm_enabled)
398 amdgpu_dpm_enable_jpeg(adev, false);
399
400 return 0;
401 }
402
403 /**
404 * jpeg_v2_0_dec_ring_get_rptr - get read pointer
405 *
406 * @ring: amdgpu_ring pointer
407 *
408 * Returns the current hardware read pointer
409 */
410 static uint64_t jpeg_v2_0_dec_ring_get_rptr(struct amdgpu_ring *ring)
411 {
412 struct amdgpu_device *adev = ring->adev;
413
414 return RREG32_SOC15(JPEG, 0, mmUVD_JRBC_RB_RPTR);
415 }
416
417 /**
418 * jpeg_v2_0_dec_ring_get_wptr - get write pointer
419 *
420 * @ring: amdgpu_ring pointer
421 *
422 * Returns the current hardware write pointer
423 */
424 static uint64_t jpeg_v2_0_dec_ring_get_wptr(struct amdgpu_ring *ring)
425 {
426 struct amdgpu_device *adev = ring->adev;
427
428 if (ring->use_doorbell)
429 return adev->wb.wb[ring->wptr_offs];
430 else
431 return RREG32_SOC15(JPEG, 0, mmUVD_JRBC_RB_WPTR);
432 }
433
434 /**
435 * jpeg_v2_0_dec_ring_set_wptr - set write pointer
436 *
437 * @ring: amdgpu_ring pointer
438 *
439 * Commits the write pointer to the hardware
440 */
441 static void jpeg_v2_0_dec_ring_set_wptr(struct amdgpu_ring *ring)
442 {
443 struct amdgpu_device *adev = ring->adev;
444
445 if (ring->use_doorbell) {
446 adev->wb.wb[ring->wptr_offs] = lower_32_bits(ring->wptr);
447 WDOORBELL32(ring->doorbell_index, lower_32_bits(ring->wptr));
448 } else {
449 WREG32_SOC15(JPEG, 0, mmUVD_JRBC_RB_WPTR, lower_32_bits(ring->wptr));
450 }
451 }
452
453 /**
454 * jpeg_v2_0_dec_ring_insert_start - insert a start command
455 *
456 * @ring: amdgpu_ring pointer
457 *
458 * Write a start command to the ring.
459 */
460 void jpeg_v2_0_dec_ring_insert_start(struct amdgpu_ring *ring)
461 {
462 amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
463 0, 0, PACKETJ_TYPE0));
464 amdgpu_ring_write(ring, 0x68e04);
465
466 amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
467 0, 0, PACKETJ_TYPE0));
468 amdgpu_ring_write(ring, 0x80010000);
469 }
470
471 /**
472 * jpeg_v2_0_dec_ring_insert_end - insert a end command
473 *
474 * @ring: amdgpu_ring pointer
475 *
476 * Write a end command to the ring.
477 */
478 void jpeg_v2_0_dec_ring_insert_end(struct amdgpu_ring *ring)
479 {
480 amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
481 0, 0, PACKETJ_TYPE0));
482 amdgpu_ring_write(ring, 0x68e04);
483
484 amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
485 0, 0, PACKETJ_TYPE0));
486 amdgpu_ring_write(ring, 0x00010000);
487 }
488
489 /**
490 * jpeg_v2_0_dec_ring_emit_fence - emit an fence & trap command
491 *
492 * @ring: amdgpu_ring pointer
493 * @fence: fence to emit
494 *
495 * Write a fence and a trap command to the ring.
496 */
497 void jpeg_v2_0_dec_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq,
498 unsigned flags)
499 {
500 WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
501
502 amdgpu_ring_write(ring, PACKETJ(mmUVD_JPEG_GPCOM_DATA0_INTERNAL_OFFSET,
503 0, 0, PACKETJ_TYPE0));
504 amdgpu_ring_write(ring, seq);
505
506 amdgpu_ring_write(ring, PACKETJ(mmUVD_JPEG_GPCOM_DATA1_INTERNAL_OFFSET,
507 0, 0, PACKETJ_TYPE0));
508 amdgpu_ring_write(ring, seq);
509
510 amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_RB_MEM_WR_64BIT_BAR_LOW_INTERNAL_OFFSET,
511 0, 0, PACKETJ_TYPE0));
512 amdgpu_ring_write(ring, lower_32_bits(addr));
513
514 amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_RB_MEM_WR_64BIT_BAR_HIGH_INTERNAL_OFFSET,
515 0, 0, PACKETJ_TYPE0));
516 amdgpu_ring_write(ring, upper_32_bits(addr));
517
518 amdgpu_ring_write(ring, PACKETJ(mmUVD_JPEG_GPCOM_CMD_INTERNAL_OFFSET,
519 0, 0, PACKETJ_TYPE0));
520 amdgpu_ring_write(ring, 0x8);
521
522 amdgpu_ring_write(ring, PACKETJ(mmUVD_JPEG_GPCOM_CMD_INTERNAL_OFFSET,
523 0, PACKETJ_CONDITION_CHECK0, PACKETJ_TYPE4));
524 amdgpu_ring_write(ring, 0);
525
526 amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
527 0, 0, PACKETJ_TYPE0));
528 amdgpu_ring_write(ring, 0x3fbc);
529
530 amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
531 0, 0, PACKETJ_TYPE0));
532 amdgpu_ring_write(ring, 0x1);
533
534 amdgpu_ring_write(ring, PACKETJ(0, 0, 0, PACKETJ_TYPE7));
535 amdgpu_ring_write(ring, 0);
536 }
537
538 /**
539 * jpeg_v2_0_dec_ring_emit_ib - execute indirect buffer
540 *
541 * @ring: amdgpu_ring pointer
542 * @ib: indirect buffer to execute
543 *
544 * Write ring commands to execute the indirect buffer.
545 */
546 void jpeg_v2_0_dec_ring_emit_ib(struct amdgpu_ring *ring,
547 struct amdgpu_job *job,
548 struct amdgpu_ib *ib,
549 uint32_t flags)
550 {
551 unsigned vmid = AMDGPU_JOB_GET_VMID(job);
552
553 amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_IB_VMID_INTERNAL_OFFSET,
554 0, 0, PACKETJ_TYPE0));
555 amdgpu_ring_write(ring, (vmid | (vmid << 4)));
556
557 amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JPEG_VMID_INTERNAL_OFFSET,
558 0, 0, PACKETJ_TYPE0));
559 amdgpu_ring_write(ring, (vmid | (vmid << 4)));
560
561 amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_IB_64BIT_BAR_LOW_INTERNAL_OFFSET,
562 0, 0, PACKETJ_TYPE0));
563 amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
564
565 amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_IB_64BIT_BAR_HIGH_INTERNAL_OFFSET,
566 0, 0, PACKETJ_TYPE0));
567 amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
568
569 amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_IB_SIZE_INTERNAL_OFFSET,
570 0, 0, PACKETJ_TYPE0));
571 amdgpu_ring_write(ring, ib->length_dw);
572
573 amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_LOW_INTERNAL_OFFSET,
574 0, 0, PACKETJ_TYPE0));
575 amdgpu_ring_write(ring, lower_32_bits(ring->gpu_addr));
576
577 amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_HIGH_INTERNAL_OFFSET,
578 0, 0, PACKETJ_TYPE0));
579 amdgpu_ring_write(ring, upper_32_bits(ring->gpu_addr));
580
581 amdgpu_ring_write(ring, PACKETJ(0, 0, PACKETJ_CONDITION_CHECK0, PACKETJ_TYPE2));
582 amdgpu_ring_write(ring, 0);
583
584 amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_RB_COND_RD_TIMER_INTERNAL_OFFSET,
585 0, 0, PACKETJ_TYPE0));
586 amdgpu_ring_write(ring, 0x01400200);
587
588 amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_RB_REF_DATA_INTERNAL_OFFSET,
589 0, 0, PACKETJ_TYPE0));
590 amdgpu_ring_write(ring, 0x2);
591
592 amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_STATUS_INTERNAL_OFFSET,
593 0, PACKETJ_CONDITION_CHECK3, PACKETJ_TYPE3));
594 amdgpu_ring_write(ring, 0x2);
595 }
596
597 void jpeg_v2_0_dec_ring_emit_reg_wait(struct amdgpu_ring *ring, uint32_t reg,
598 uint32_t val, uint32_t mask)
599 {
600 uint32_t reg_offset = (reg << 2);
601
602 amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_RB_COND_RD_TIMER_INTERNAL_OFFSET,
603 0, 0, PACKETJ_TYPE0));
604 amdgpu_ring_write(ring, 0x01400200);
605
606 amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_RB_REF_DATA_INTERNAL_OFFSET,
607 0, 0, PACKETJ_TYPE0));
608 amdgpu_ring_write(ring, val);
609
610 amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
611 0, 0, PACKETJ_TYPE0));
612 if (reg_offset >= 0x10000 && reg_offset <= 0x105ff) {
613 amdgpu_ring_write(ring, 0);
614 amdgpu_ring_write(ring,
615 PACKETJ((reg_offset >> 2), 0, 0, PACKETJ_TYPE3));
616 } else {
617 amdgpu_ring_write(ring, reg_offset);
618 amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
619 0, 0, PACKETJ_TYPE3));
620 }
621 amdgpu_ring_write(ring, mask);
622 }
623
624 void jpeg_v2_0_dec_ring_emit_vm_flush(struct amdgpu_ring *ring,
625 unsigned vmid, uint64_t pd_addr)
626 {
627 struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
628 uint32_t data0, data1, mask;
629
630 pd_addr = amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
631
632 /* wait for register write */
633 data0 = hub->ctx0_ptb_addr_lo32 + vmid * 2;
634 data1 = lower_32_bits(pd_addr);
635 mask = 0xffffffff;
636 jpeg_v2_0_dec_ring_emit_reg_wait(ring, data0, data1, mask);
637 }
638
639 void jpeg_v2_0_dec_ring_emit_wreg(struct amdgpu_ring *ring, uint32_t reg, uint32_t val)
640 {
641 uint32_t reg_offset = (reg << 2);
642
643 amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
644 0, 0, PACKETJ_TYPE0));
645 if (reg_offset >= 0x10000 && reg_offset <= 0x105ff) {
646 amdgpu_ring_write(ring, 0);
647 amdgpu_ring_write(ring,
648 PACKETJ((reg_offset >> 2), 0, 0, PACKETJ_TYPE0));
649 } else {
650 amdgpu_ring_write(ring, reg_offset);
651 amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
652 0, 0, PACKETJ_TYPE0));
653 }
654 amdgpu_ring_write(ring, val);
655 }
656
657 void jpeg_v2_0_dec_ring_nop(struct amdgpu_ring *ring, uint32_t count)
658 {
659 int i;
660
661 WARN_ON(ring->wptr % 2 || count % 2);
662
663 for (i = 0; i < count / 2; i++) {
664 amdgpu_ring_write(ring, PACKETJ(0, 0, 0, PACKETJ_TYPE6));
665 amdgpu_ring_write(ring, 0);
666 }
667 }
668
669 static bool jpeg_v2_0_is_idle(void *handle)
670 {
671 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
672
673 return ((RREG32_SOC15(JPEG, 0, mmUVD_JRBC_STATUS) &
674 UVD_JRBC_STATUS__RB_JOB_DONE_MASK) ==
675 UVD_JRBC_STATUS__RB_JOB_DONE_MASK);
676 }
677
678 static int jpeg_v2_0_wait_for_idle(void *handle)
679 {
680 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
681 int ret = 0;
682
683 SOC15_WAIT_ON_RREG(JPEG, 0, mmUVD_JRBC_STATUS, UVD_JRBC_STATUS__RB_JOB_DONE_MASK,
684 UVD_JRBC_STATUS__RB_JOB_DONE_MASK, ret);
685
686 return ret;
687 }
688
689 static int jpeg_v2_0_set_clockgating_state(void *handle,
690 enum amd_clockgating_state state)
691 {
692 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
693 bool enable = (state == AMD_CG_STATE_GATE);
694
695 if (enable) {
696 if (jpeg_v2_0_is_idle(handle))
697 return -EBUSY;
698 jpeg_v2_0_enable_clock_gating(adev);
699 } else {
700 jpeg_v2_0_disable_clock_gating(adev);
701 }
702
703 return 0;
704 }
705
706 static int jpeg_v2_0_set_powergating_state(void *handle,
707 enum amd_powergating_state state)
708 {
709 struct amdgpu_device *adev = (struct amdgpu_device *)handle;
710 int ret;
711
712 if (state == adev->jpeg.cur_state)
713 return 0;
714
715 if (state == AMD_PG_STATE_GATE)
716 ret = jpeg_v2_0_stop(adev);
717 else
718 ret = jpeg_v2_0_start(adev);
719
720 if (!ret)
721 adev->jpeg.cur_state = state;
722
723 return ret;
724 }
725
726 static int jpeg_v2_0_set_interrupt_state(struct amdgpu_device *adev,
727 struct amdgpu_irq_src *source,
728 unsigned type,
729 enum amdgpu_interrupt_state state)
730 {
731 return 0;
732 }
733
734 static int jpeg_v2_0_process_interrupt(struct amdgpu_device *adev,
735 struct amdgpu_irq_src *source,
736 struct amdgpu_iv_entry *entry)
737 {
738 DRM_DEBUG("IH: JPEG TRAP\n");
739
740 switch (entry->src_id) {
741 case VCN_2_0__SRCID__JPEG_DECODE:
742 amdgpu_fence_process(&adev->jpeg.inst->ring_dec);
743 break;
744 default:
745 DRM_ERROR("Unhandled interrupt: %d %d\n",
746 entry->src_id, entry->src_data[0]);
747 break;
748 }
749
750 return 0;
751 }
752
753 static const struct amd_ip_funcs jpeg_v2_0_ip_funcs = {
754 .name = "jpeg_v2_0",
755 .early_init = jpeg_v2_0_early_init,
756 .late_init = NULL,
757 .sw_init = jpeg_v2_0_sw_init,
758 .sw_fini = jpeg_v2_0_sw_fini,
759 .hw_init = jpeg_v2_0_hw_init,
760 .hw_fini = jpeg_v2_0_hw_fini,
761 .suspend = jpeg_v2_0_suspend,
762 .resume = jpeg_v2_0_resume,
763 .is_idle = jpeg_v2_0_is_idle,
764 .wait_for_idle = jpeg_v2_0_wait_for_idle,
765 .check_soft_reset = NULL,
766 .pre_soft_reset = NULL,
767 .soft_reset = NULL,
768 .post_soft_reset = NULL,
769 .set_clockgating_state = jpeg_v2_0_set_clockgating_state,
770 .set_powergating_state = jpeg_v2_0_set_powergating_state,
771 };
772
773 static const struct amdgpu_ring_funcs jpeg_v2_0_dec_ring_vm_funcs = {
774 .type = AMDGPU_RING_TYPE_VCN_JPEG,
775 .align_mask = 0xf,
776 .vmhub = AMDGPU_MMHUB_0,
777 .get_rptr = jpeg_v2_0_dec_ring_get_rptr,
778 .get_wptr = jpeg_v2_0_dec_ring_get_wptr,
779 .set_wptr = jpeg_v2_0_dec_ring_set_wptr,
780 .emit_frame_size =
781 SOC15_FLUSH_GPU_TLB_NUM_WREG * 6 +
782 SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 8 +
783 8 + /* jpeg_v2_0_dec_ring_emit_vm_flush */
784 18 + 18 + /* jpeg_v2_0_dec_ring_emit_fence x2 vm fence */
785 8 + 16,
786 .emit_ib_size = 22, /* jpeg_v2_0_dec_ring_emit_ib */
787 .emit_ib = jpeg_v2_0_dec_ring_emit_ib,
788 .emit_fence = jpeg_v2_0_dec_ring_emit_fence,
789 .emit_vm_flush = jpeg_v2_0_dec_ring_emit_vm_flush,
790 .test_ring = amdgpu_jpeg_dec_ring_test_ring,
791 .test_ib = amdgpu_jpeg_dec_ring_test_ib,
792 .insert_nop = jpeg_v2_0_dec_ring_nop,
793 .insert_start = jpeg_v2_0_dec_ring_insert_start,
794 .insert_end = jpeg_v2_0_dec_ring_insert_end,
795 .pad_ib = amdgpu_ring_generic_pad_ib,
796 .begin_use = amdgpu_jpeg_ring_begin_use,
797 .end_use = amdgpu_jpeg_ring_end_use,
798 .emit_wreg = jpeg_v2_0_dec_ring_emit_wreg,
799 .emit_reg_wait = jpeg_v2_0_dec_ring_emit_reg_wait,
800 .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
801 };
802
803 static void jpeg_v2_0_set_dec_ring_funcs(struct amdgpu_device *adev)
804 {
805 adev->jpeg.inst->ring_dec.funcs = &jpeg_v2_0_dec_ring_vm_funcs;
806 DRM_INFO("JPEG decode is enabled in VM mode\n");
807 }
808
809 static const struct amdgpu_irq_src_funcs jpeg_v2_0_irq_funcs = {
810 .set = jpeg_v2_0_set_interrupt_state,
811 .process = jpeg_v2_0_process_interrupt,
812 };
813
814 static void jpeg_v2_0_set_irq_funcs(struct amdgpu_device *adev)
815 {
816 adev->jpeg.inst->irq.num_types = 1;
817 adev->jpeg.inst->irq.funcs = &jpeg_v2_0_irq_funcs;
818 }
819
820 const struct amdgpu_ip_block_version jpeg_v2_0_ip_block =
821 {
822 .type = AMD_IP_BLOCK_TYPE_JPEG,
823 .major = 2,
824 .minor = 0,
825 .rev = 0,
826 .funcs = &jpeg_v2_0_ip_funcs,
827 };