OSDN Git Service

smb3: Add defines for new information level, FileIdInformation
[tomoyo/tomoyo-test1.git] / drivers / gpu / drm / amd / amdgpu / jpeg_v2_0.c
1 /*
2  * Copyright 2019 Advanced Micro Devices, Inc.
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice shall be included in
12  * all copies or substantial portions of the Software.
13  *
14  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20  * OTHER DEALINGS IN THE SOFTWARE.
21  *
22  */
23
24 #include "amdgpu.h"
25 #include "amdgpu_jpeg.h"
26 #include "amdgpu_pm.h"
27 #include "soc15.h"
28 #include "soc15d.h"
29
30 #include "vcn/vcn_2_0_0_offset.h"
31 #include "vcn/vcn_2_0_0_sh_mask.h"
32 #include "ivsrcid/vcn/irqsrcs_vcn_2_0.h"
33
34 #define mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET                         0x1bfff
35 #define mmUVD_JPEG_GPCOM_CMD_INTERNAL_OFFSET                            0x4029
36 #define mmUVD_JPEG_GPCOM_DATA0_INTERNAL_OFFSET                          0x402a
37 #define mmUVD_JPEG_GPCOM_DATA1_INTERNAL_OFFSET                          0x402b
38 #define mmUVD_LMI_JRBC_RB_MEM_WR_64BIT_BAR_LOW_INTERNAL_OFFSET          0x40ea
39 #define mmUVD_LMI_JRBC_RB_MEM_WR_64BIT_BAR_HIGH_INTERNAL_OFFSET         0x40eb
40 #define mmUVD_LMI_JRBC_IB_VMID_INTERNAL_OFFSET                          0x40cf
41 #define mmUVD_LMI_JPEG_VMID_INTERNAL_OFFSET                             0x40d1
42 #define mmUVD_LMI_JRBC_IB_64BIT_BAR_LOW_INTERNAL_OFFSET                 0x40e8
43 #define mmUVD_LMI_JRBC_IB_64BIT_BAR_HIGH_INTERNAL_OFFSET                0x40e9
44 #define mmUVD_JRBC_IB_SIZE_INTERNAL_OFFSET                              0x4082
45 #define mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_LOW_INTERNAL_OFFSET          0x40ec
46 #define mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_HIGH_INTERNAL_OFFSET         0x40ed
47 #define mmUVD_JRBC_RB_COND_RD_TIMER_INTERNAL_OFFSET                     0x4085
48 #define mmUVD_JRBC_RB_REF_DATA_INTERNAL_OFFSET                          0x4084
49 #define mmUVD_JRBC_STATUS_INTERNAL_OFFSET                               0x4089
50 #define mmUVD_JPEG_PITCH_INTERNAL_OFFSET                                0x401f
51
52 #define JRBC_DEC_EXTERNAL_REG_WRITE_ADDR                                0x18000
53
54 static void jpeg_v2_0_set_dec_ring_funcs(struct amdgpu_device *adev);
55 static void jpeg_v2_0_set_irq_funcs(struct amdgpu_device *adev);
56 static int jpeg_v2_0_set_powergating_state(void *handle,
57                                 enum amd_powergating_state state);
58
59 /**
60  * jpeg_v2_0_early_init - set function pointers
61  *
62  * @handle: amdgpu_device pointer
63  *
64  * Set ring and irq function pointers
65  */
66 static int jpeg_v2_0_early_init(void *handle)
67 {
68         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
69
70         adev->jpeg.num_jpeg_inst = 1;
71
72         jpeg_v2_0_set_dec_ring_funcs(adev);
73         jpeg_v2_0_set_irq_funcs(adev);
74
75         return 0;
76 }
77
78 /**
79  * jpeg_v2_0_sw_init - sw init for JPEG block
80  *
81  * @handle: amdgpu_device pointer
82  *
83  * Load firmware and sw initialization
84  */
85 static int jpeg_v2_0_sw_init(void *handle)
86 {
87         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
88         struct amdgpu_ring *ring;
89         int r;
90
91         /* JPEG TRAP */
92         r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_VCN,
93                 VCN_2_0__SRCID__JPEG_DECODE, &adev->jpeg.inst->irq);
94         if (r)
95                 return r;
96
97         r = amdgpu_jpeg_sw_init(adev);
98         if (r)
99                 return r;
100
101         r = amdgpu_jpeg_resume(adev);
102         if (r)
103                 return r;
104
105         ring = &adev->jpeg.inst->ring_dec;
106         ring->use_doorbell = true;
107         ring->doorbell_index = (adev->doorbell_index.vcn.vcn_ring0_1 << 1) + 1;
108         sprintf(ring->name, "jpeg_dec");
109         r = amdgpu_ring_init(adev, ring, 512, &adev->jpeg.inst->irq, 0);
110         if (r)
111                 return r;
112
113         adev->jpeg.internal.jpeg_pitch = mmUVD_JPEG_PITCH_INTERNAL_OFFSET;
114         adev->jpeg.inst->external.jpeg_pitch = SOC15_REG_OFFSET(JPEG, 0, mmUVD_JPEG_PITCH);
115
116         return 0;
117 }
118
119 /**
120  * jpeg_v2_0_sw_fini - sw fini for JPEG block
121  *
122  * @handle: amdgpu_device pointer
123  *
124  * JPEG suspend and free up sw allocation
125  */
126 static int jpeg_v2_0_sw_fini(void *handle)
127 {
128         int r;
129         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
130
131         r = amdgpu_jpeg_suspend(adev);
132         if (r)
133                 return r;
134
135         r = amdgpu_jpeg_sw_fini(adev);
136
137         return r;
138 }
139
140 /**
141  * jpeg_v2_0_hw_init - start and test JPEG block
142  *
143  * @handle: amdgpu_device pointer
144  *
145  */
146 static int jpeg_v2_0_hw_init(void *handle)
147 {
148         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
149         struct amdgpu_ring *ring = &adev->jpeg.inst->ring_dec;
150         int r;
151
152         adev->nbio.funcs->vcn_doorbell_range(adev, ring->use_doorbell,
153                 (adev->doorbell_index.vcn.vcn_ring0_1 << 1), 0);
154
155         r = amdgpu_ring_test_helper(ring);
156         if (!r)
157                 DRM_INFO("JPEG decode initialized successfully.\n");
158
159         return r;
160 }
161
162 /**
163  * jpeg_v2_0_hw_fini - stop the hardware block
164  *
165  * @handle: amdgpu_device pointer
166  *
167  * Stop the JPEG block, mark ring as not ready any more
168  */
169 static int jpeg_v2_0_hw_fini(void *handle)
170 {
171         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
172         struct amdgpu_ring *ring = &adev->jpeg.inst->ring_dec;
173
174         if (adev->jpeg.cur_state != AMD_PG_STATE_GATE &&
175               RREG32_SOC15(JPEG, 0, mmUVD_JRBC_STATUS))
176                 jpeg_v2_0_set_powergating_state(adev, AMD_PG_STATE_GATE);
177
178         ring->sched.ready = false;
179
180         return 0;
181 }
182
183 /**
184  * jpeg_v2_0_suspend - suspend JPEG block
185  *
186  * @handle: amdgpu_device pointer
187  *
188  * HW fini and suspend JPEG block
189  */
190 static int jpeg_v2_0_suspend(void *handle)
191 {
192         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
193         int r;
194
195         r = jpeg_v2_0_hw_fini(adev);
196         if (r)
197                 return r;
198
199         r = amdgpu_jpeg_suspend(adev);
200
201         return r;
202 }
203
204 /**
205  * jpeg_v2_0_resume - resume JPEG block
206  *
207  * @handle: amdgpu_device pointer
208  *
209  * Resume firmware and hw init JPEG block
210  */
211 static int jpeg_v2_0_resume(void *handle)
212 {
213         int r;
214         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
215
216         r = amdgpu_jpeg_resume(adev);
217         if (r)
218                 return r;
219
220         r = jpeg_v2_0_hw_init(adev);
221
222         return r;
223 }
224
225 static int jpeg_v2_0_disable_power_gating(struct amdgpu_device *adev)
226 {
227         uint32_t data;
228         int r = 0;
229
230         if (adev->pg_flags & AMD_PG_SUPPORT_JPEG) {
231                 data = 1 << UVD_PGFSM_CONFIG__UVDJ_PWR_CONFIG__SHIFT;
232                 WREG32(SOC15_REG_OFFSET(JPEG, 0, mmUVD_PGFSM_CONFIG), data);
233
234                 SOC15_WAIT_ON_RREG(JPEG, 0,
235                         mmUVD_PGFSM_STATUS, UVD_PGFSM_STATUS_UVDJ_PWR_ON,
236                         UVD_PGFSM_STATUS__UVDJ_PWR_STATUS_MASK, r);
237
238                 if (r) {
239                         DRM_ERROR("amdgpu: JPEG disable power gating failed\n");
240                         return r;
241                 }
242         }
243
244         /* Removing the anti hang mechanism to indicate the UVDJ tile is ON */
245         data = RREG32(SOC15_REG_OFFSET(JPEG, 0, mmUVD_JPEG_POWER_STATUS)) & ~0x1;
246         WREG32(SOC15_REG_OFFSET(JPEG, 0, mmUVD_JPEG_POWER_STATUS), data);
247
248         return 0;
249 }
250
251 static int jpeg_v2_0_enable_power_gating(struct amdgpu_device* adev)
252 {
253         if (adev->pg_flags & AMD_PG_SUPPORT_JPEG) {
254                 uint32_t data;
255                 int r = 0;
256
257                 data = RREG32(SOC15_REG_OFFSET(JPEG, 0, mmUVD_JPEG_POWER_STATUS));
258                 data &= ~UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_MASK;
259                 data |=  0x1; //UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_TILES_OFF;
260                 WREG32(SOC15_REG_OFFSET(JPEG, 0, mmUVD_JPEG_POWER_STATUS), data);
261
262                 data = 2 << UVD_PGFSM_CONFIG__UVDJ_PWR_CONFIG__SHIFT;
263                 WREG32(SOC15_REG_OFFSET(JPEG, 0, mmUVD_PGFSM_CONFIG), data);
264
265                 SOC15_WAIT_ON_RREG(JPEG, 0, mmUVD_PGFSM_STATUS,
266                         (2 << UVD_PGFSM_STATUS__UVDJ_PWR_STATUS__SHIFT),
267                         UVD_PGFSM_STATUS__UVDJ_PWR_STATUS_MASK, r);
268
269                 if (r) {
270                         DRM_ERROR("amdgpu: JPEG enable power gating failed\n");
271                         return r;
272                 }
273         }
274
275         return 0;
276 }
277
278 static void jpeg_v2_0_disable_clock_gating(struct amdgpu_device* adev)
279 {
280         uint32_t data;
281
282         data = RREG32_SOC15(JPEG, 0, mmJPEG_CGC_CTRL);
283         if (adev->cg_flags & AMD_CG_SUPPORT_JPEG_MGCG)
284                 data |= 1 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
285         else
286                 data &= ~JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
287
288         data |= 1 << JPEG_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
289         data |= 4 << JPEG_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
290         WREG32_SOC15(JPEG, 0, mmJPEG_CGC_CTRL, data);
291
292         data = RREG32_SOC15(JPEG, 0, mmJPEG_CGC_GATE);
293         data &= ~(JPEG_CGC_GATE__JPEG_DEC_MASK
294                 | JPEG_CGC_GATE__JPEG2_DEC_MASK
295                 | JPEG_CGC_GATE__JPEG_ENC_MASK
296                 | JPEG_CGC_GATE__JMCIF_MASK
297                 | JPEG_CGC_GATE__JRBBM_MASK);
298         WREG32_SOC15(JPEG, 0, mmJPEG_CGC_GATE, data);
299 }
300
301 static void jpeg_v2_0_enable_clock_gating(struct amdgpu_device* adev)
302 {
303         uint32_t data;
304
305         data = RREG32_SOC15(JPEG, 0, mmJPEG_CGC_CTRL);
306         if (adev->cg_flags & AMD_CG_SUPPORT_JPEG_MGCG)
307                 data |= 1 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
308         else
309                 data |= 0 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
310
311         data |= 1 << JPEG_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
312         data |= 4 << JPEG_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
313         WREG32_SOC15(JPEG, 0, mmJPEG_CGC_CTRL, data);
314
315         data = RREG32_SOC15(JPEG, 0, mmJPEG_CGC_GATE);
316         data |= (JPEG_CGC_GATE__JPEG_DEC_MASK
317                 |JPEG_CGC_GATE__JPEG2_DEC_MASK
318                 |JPEG_CGC_GATE__JPEG_ENC_MASK
319                 |JPEG_CGC_GATE__JMCIF_MASK
320                 |JPEG_CGC_GATE__JRBBM_MASK);
321         WREG32_SOC15(JPEG, 0, mmJPEG_CGC_GATE, data);
322 }
323
324 /**
325  * jpeg_v2_0_start - start JPEG block
326  *
327  * @adev: amdgpu_device pointer
328  *
329  * Setup and start the JPEG block
330  */
331 static int jpeg_v2_0_start(struct amdgpu_device *adev)
332 {
333         struct amdgpu_ring *ring = &adev->jpeg.inst->ring_dec;
334         int r;
335
336         if (adev->pm.dpm_enabled)
337                 amdgpu_dpm_enable_jpeg(adev, true);
338
339         /* disable power gating */
340         r = jpeg_v2_0_disable_power_gating(adev);
341         if (r)
342                 return r;
343
344         /* JPEG disable CGC */
345         jpeg_v2_0_disable_clock_gating(adev);
346
347         WREG32_SOC15(JPEG, 0, mmJPEG_DEC_GFX10_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
348
349         /* enable JMI channel */
350         WREG32_P(SOC15_REG_OFFSET(JPEG, 0, mmUVD_JMI_CNTL), 0,
351                 ~UVD_JMI_CNTL__SOFT_RESET_MASK);
352
353         /* enable System Interrupt for JRBC */
354         WREG32_P(SOC15_REG_OFFSET(JPEG, 0, mmJPEG_SYS_INT_EN),
355                 JPEG_SYS_INT_EN__DJRBC_MASK,
356                 ~JPEG_SYS_INT_EN__DJRBC_MASK);
357
358         WREG32_SOC15(JPEG, 0, mmUVD_LMI_JRBC_RB_VMID, 0);
359         WREG32_SOC15(JPEG, 0, mmUVD_JRBC_RB_CNTL, (0x00000001L | 0x00000002L));
360         WREG32_SOC15(JPEG, 0, mmUVD_LMI_JRBC_RB_64BIT_BAR_LOW,
361                 lower_32_bits(ring->gpu_addr));
362         WREG32_SOC15(JPEG, 0, mmUVD_LMI_JRBC_RB_64BIT_BAR_HIGH,
363                 upper_32_bits(ring->gpu_addr));
364         WREG32_SOC15(JPEG, 0, mmUVD_JRBC_RB_RPTR, 0);
365         WREG32_SOC15(JPEG, 0, mmUVD_JRBC_RB_WPTR, 0);
366         WREG32_SOC15(JPEG, 0, mmUVD_JRBC_RB_CNTL, 0x00000002L);
367         WREG32_SOC15(JPEG, 0, mmUVD_JRBC_RB_SIZE, ring->ring_size / 4);
368         ring->wptr = RREG32_SOC15(JPEG, 0, mmUVD_JRBC_RB_WPTR);
369
370         return 0;
371 }
372
373 /**
374  * jpeg_v2_0_stop - stop JPEG block
375  *
376  * @adev: amdgpu_device pointer
377  *
378  * stop the JPEG block
379  */
380 static int jpeg_v2_0_stop(struct amdgpu_device *adev)
381 {
382         int r;
383
384         /* reset JMI */
385         WREG32_P(SOC15_REG_OFFSET(JPEG, 0, mmUVD_JMI_CNTL),
386                 UVD_JMI_CNTL__SOFT_RESET_MASK,
387                 ~UVD_JMI_CNTL__SOFT_RESET_MASK);
388
389         /* enable JPEG CGC */
390         jpeg_v2_0_enable_clock_gating(adev);
391
392         /* enable power gating */
393         r = jpeg_v2_0_enable_power_gating(adev);
394         if (r)
395                 return r;
396
397         if (adev->pm.dpm_enabled)
398                 amdgpu_dpm_enable_jpeg(adev, false);
399
400         return 0;
401 }
402
403 /**
404  * jpeg_v2_0_dec_ring_get_rptr - get read pointer
405  *
406  * @ring: amdgpu_ring pointer
407  *
408  * Returns the current hardware read pointer
409  */
410 static uint64_t jpeg_v2_0_dec_ring_get_rptr(struct amdgpu_ring *ring)
411 {
412         struct amdgpu_device *adev = ring->adev;
413
414         return RREG32_SOC15(JPEG, 0, mmUVD_JRBC_RB_RPTR);
415 }
416
417 /**
418  * jpeg_v2_0_dec_ring_get_wptr - get write pointer
419  *
420  * @ring: amdgpu_ring pointer
421  *
422  * Returns the current hardware write pointer
423  */
424 static uint64_t jpeg_v2_0_dec_ring_get_wptr(struct amdgpu_ring *ring)
425 {
426         struct amdgpu_device *adev = ring->adev;
427
428         if (ring->use_doorbell)
429                 return adev->wb.wb[ring->wptr_offs];
430         else
431                 return RREG32_SOC15(JPEG, 0, mmUVD_JRBC_RB_WPTR);
432 }
433
434 /**
435  * jpeg_v2_0_dec_ring_set_wptr - set write pointer
436  *
437  * @ring: amdgpu_ring pointer
438  *
439  * Commits the write pointer to the hardware
440  */
441 static void jpeg_v2_0_dec_ring_set_wptr(struct amdgpu_ring *ring)
442 {
443         struct amdgpu_device *adev = ring->adev;
444
445         if (ring->use_doorbell) {
446                 adev->wb.wb[ring->wptr_offs] = lower_32_bits(ring->wptr);
447                 WDOORBELL32(ring->doorbell_index, lower_32_bits(ring->wptr));
448         } else {
449                 WREG32_SOC15(JPEG, 0, mmUVD_JRBC_RB_WPTR, lower_32_bits(ring->wptr));
450         }
451 }
452
453 /**
454  * jpeg_v2_0_dec_ring_insert_start - insert a start command
455  *
456  * @ring: amdgpu_ring pointer
457  *
458  * Write a start command to the ring.
459  */
460 void jpeg_v2_0_dec_ring_insert_start(struct amdgpu_ring *ring)
461 {
462         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
463                 0, 0, PACKETJ_TYPE0));
464         amdgpu_ring_write(ring, 0x68e04);
465
466         amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
467                 0, 0, PACKETJ_TYPE0));
468         amdgpu_ring_write(ring, 0x80010000);
469 }
470
471 /**
472  * jpeg_v2_0_dec_ring_insert_end - insert a end command
473  *
474  * @ring: amdgpu_ring pointer
475  *
476  * Write a end command to the ring.
477  */
478 void jpeg_v2_0_dec_ring_insert_end(struct amdgpu_ring *ring)
479 {
480         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
481                 0, 0, PACKETJ_TYPE0));
482         amdgpu_ring_write(ring, 0x68e04);
483
484         amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
485                 0, 0, PACKETJ_TYPE0));
486         amdgpu_ring_write(ring, 0x00010000);
487 }
488
489 /**
490  * jpeg_v2_0_dec_ring_emit_fence - emit an fence & trap command
491  *
492  * @ring: amdgpu_ring pointer
493  * @fence: fence to emit
494  *
495  * Write a fence and a trap command to the ring.
496  */
497 void jpeg_v2_0_dec_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq,
498                                 unsigned flags)
499 {
500         WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
501
502         amdgpu_ring_write(ring, PACKETJ(mmUVD_JPEG_GPCOM_DATA0_INTERNAL_OFFSET,
503                 0, 0, PACKETJ_TYPE0));
504         amdgpu_ring_write(ring, seq);
505
506         amdgpu_ring_write(ring, PACKETJ(mmUVD_JPEG_GPCOM_DATA1_INTERNAL_OFFSET,
507                 0, 0, PACKETJ_TYPE0));
508         amdgpu_ring_write(ring, seq);
509
510         amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_RB_MEM_WR_64BIT_BAR_LOW_INTERNAL_OFFSET,
511                 0, 0, PACKETJ_TYPE0));
512         amdgpu_ring_write(ring, lower_32_bits(addr));
513
514         amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_RB_MEM_WR_64BIT_BAR_HIGH_INTERNAL_OFFSET,
515                 0, 0, PACKETJ_TYPE0));
516         amdgpu_ring_write(ring, upper_32_bits(addr));
517
518         amdgpu_ring_write(ring, PACKETJ(mmUVD_JPEG_GPCOM_CMD_INTERNAL_OFFSET,
519                 0, 0, PACKETJ_TYPE0));
520         amdgpu_ring_write(ring, 0x8);
521
522         amdgpu_ring_write(ring, PACKETJ(mmUVD_JPEG_GPCOM_CMD_INTERNAL_OFFSET,
523                 0, PACKETJ_CONDITION_CHECK0, PACKETJ_TYPE4));
524         amdgpu_ring_write(ring, 0);
525
526         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
527                 0, 0, PACKETJ_TYPE0));
528         amdgpu_ring_write(ring, 0x3fbc);
529
530         amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
531                 0, 0, PACKETJ_TYPE0));
532         amdgpu_ring_write(ring, 0x1);
533
534         amdgpu_ring_write(ring, PACKETJ(0, 0, 0, PACKETJ_TYPE7));
535         amdgpu_ring_write(ring, 0);
536 }
537
538 /**
539  * jpeg_v2_0_dec_ring_emit_ib - execute indirect buffer
540  *
541  * @ring: amdgpu_ring pointer
542  * @ib: indirect buffer to execute
543  *
544  * Write ring commands to execute the indirect buffer.
545  */
546 void jpeg_v2_0_dec_ring_emit_ib(struct amdgpu_ring *ring,
547                                 struct amdgpu_job *job,
548                                 struct amdgpu_ib *ib,
549                                 uint32_t flags)
550 {
551         unsigned vmid = AMDGPU_JOB_GET_VMID(job);
552
553         amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_IB_VMID_INTERNAL_OFFSET,
554                 0, 0, PACKETJ_TYPE0));
555         amdgpu_ring_write(ring, (vmid | (vmid << 4)));
556
557         amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JPEG_VMID_INTERNAL_OFFSET,
558                 0, 0, PACKETJ_TYPE0));
559         amdgpu_ring_write(ring, (vmid | (vmid << 4)));
560
561         amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_IB_64BIT_BAR_LOW_INTERNAL_OFFSET,
562                 0, 0, PACKETJ_TYPE0));
563         amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
564
565         amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_IB_64BIT_BAR_HIGH_INTERNAL_OFFSET,
566                 0, 0, PACKETJ_TYPE0));
567         amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
568
569         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_IB_SIZE_INTERNAL_OFFSET,
570                 0, 0, PACKETJ_TYPE0));
571         amdgpu_ring_write(ring, ib->length_dw);
572
573         amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_LOW_INTERNAL_OFFSET,
574                 0, 0, PACKETJ_TYPE0));
575         amdgpu_ring_write(ring, lower_32_bits(ring->gpu_addr));
576
577         amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_HIGH_INTERNAL_OFFSET,
578                 0, 0, PACKETJ_TYPE0));
579         amdgpu_ring_write(ring, upper_32_bits(ring->gpu_addr));
580
581         amdgpu_ring_write(ring, PACKETJ(0, 0, PACKETJ_CONDITION_CHECK0, PACKETJ_TYPE2));
582         amdgpu_ring_write(ring, 0);
583
584         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_RB_COND_RD_TIMER_INTERNAL_OFFSET,
585                 0, 0, PACKETJ_TYPE0));
586         amdgpu_ring_write(ring, 0x01400200);
587
588         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_RB_REF_DATA_INTERNAL_OFFSET,
589                 0, 0, PACKETJ_TYPE0));
590         amdgpu_ring_write(ring, 0x2);
591
592         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_STATUS_INTERNAL_OFFSET,
593                 0, PACKETJ_CONDITION_CHECK3, PACKETJ_TYPE3));
594         amdgpu_ring_write(ring, 0x2);
595 }
596
597 void jpeg_v2_0_dec_ring_emit_reg_wait(struct amdgpu_ring *ring, uint32_t reg,
598                                 uint32_t val, uint32_t mask)
599 {
600         uint32_t reg_offset = (reg << 2);
601
602         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_RB_COND_RD_TIMER_INTERNAL_OFFSET,
603                 0, 0, PACKETJ_TYPE0));
604         amdgpu_ring_write(ring, 0x01400200);
605
606         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_RB_REF_DATA_INTERNAL_OFFSET,
607                 0, 0, PACKETJ_TYPE0));
608         amdgpu_ring_write(ring, val);
609
610         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
611                 0, 0, PACKETJ_TYPE0));
612         if (reg_offset >= 0x10000 && reg_offset <= 0x105ff) {
613                 amdgpu_ring_write(ring, 0);
614                 amdgpu_ring_write(ring,
615                         PACKETJ((reg_offset >> 2), 0, 0, PACKETJ_TYPE3));
616         } else {
617                 amdgpu_ring_write(ring, reg_offset);
618                 amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
619                         0, 0, PACKETJ_TYPE3));
620         }
621         amdgpu_ring_write(ring, mask);
622 }
623
624 void jpeg_v2_0_dec_ring_emit_vm_flush(struct amdgpu_ring *ring,
625                                 unsigned vmid, uint64_t pd_addr)
626 {
627         struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
628         uint32_t data0, data1, mask;
629
630         pd_addr = amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
631
632         /* wait for register write */
633         data0 = hub->ctx0_ptb_addr_lo32 + vmid * 2;
634         data1 = lower_32_bits(pd_addr);
635         mask = 0xffffffff;
636         jpeg_v2_0_dec_ring_emit_reg_wait(ring, data0, data1, mask);
637 }
638
639 void jpeg_v2_0_dec_ring_emit_wreg(struct amdgpu_ring *ring, uint32_t reg, uint32_t val)
640 {
641         uint32_t reg_offset = (reg << 2);
642
643         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
644                 0, 0, PACKETJ_TYPE0));
645         if (reg_offset >= 0x10000 && reg_offset <= 0x105ff) {
646                 amdgpu_ring_write(ring, 0);
647                 amdgpu_ring_write(ring,
648                         PACKETJ((reg_offset >> 2), 0, 0, PACKETJ_TYPE0));
649         } else {
650                 amdgpu_ring_write(ring, reg_offset);
651                 amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
652                         0, 0, PACKETJ_TYPE0));
653         }
654         amdgpu_ring_write(ring, val);
655 }
656
657 void jpeg_v2_0_dec_ring_nop(struct amdgpu_ring *ring, uint32_t count)
658 {
659         int i;
660
661         WARN_ON(ring->wptr % 2 || count % 2);
662
663         for (i = 0; i < count / 2; i++) {
664                 amdgpu_ring_write(ring, PACKETJ(0, 0, 0, PACKETJ_TYPE6));
665                 amdgpu_ring_write(ring, 0);
666         }
667 }
668
669 static bool jpeg_v2_0_is_idle(void *handle)
670 {
671         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
672
673         return ((RREG32_SOC15(JPEG, 0, mmUVD_JRBC_STATUS) &
674                 UVD_JRBC_STATUS__RB_JOB_DONE_MASK) ==
675                 UVD_JRBC_STATUS__RB_JOB_DONE_MASK);
676 }
677
678 static int jpeg_v2_0_wait_for_idle(void *handle)
679 {
680         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
681         int ret = 0;
682
683         SOC15_WAIT_ON_RREG(JPEG, 0, mmUVD_JRBC_STATUS, UVD_JRBC_STATUS__RB_JOB_DONE_MASK,
684                 UVD_JRBC_STATUS__RB_JOB_DONE_MASK, ret);
685
686         return ret;
687 }
688
689 static int jpeg_v2_0_set_clockgating_state(void *handle,
690                                           enum amd_clockgating_state state)
691 {
692         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
693         bool enable = (state == AMD_CG_STATE_GATE) ? true : false;
694
695         if (enable) {
696                 if (jpeg_v2_0_is_idle(handle))
697                         return -EBUSY;
698                 jpeg_v2_0_enable_clock_gating(adev);
699         } else {
700                 jpeg_v2_0_disable_clock_gating(adev);
701         }
702
703         return 0;
704 }
705
706 static int jpeg_v2_0_set_powergating_state(void *handle,
707                                         enum amd_powergating_state state)
708 {
709         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
710         int ret;
711
712         if (state == adev->jpeg.cur_state)
713                 return 0;
714
715         if (state == AMD_PG_STATE_GATE)
716                 ret = jpeg_v2_0_stop(adev);
717         else
718                 ret = jpeg_v2_0_start(adev);
719
720         if (!ret)
721                 adev->jpeg.cur_state = state;
722
723         return ret;
724 }
725
726 static int jpeg_v2_0_set_interrupt_state(struct amdgpu_device *adev,
727                                         struct amdgpu_irq_src *source,
728                                         unsigned type,
729                                         enum amdgpu_interrupt_state state)
730 {
731         return 0;
732 }
733
734 static int jpeg_v2_0_process_interrupt(struct amdgpu_device *adev,
735                                       struct amdgpu_irq_src *source,
736                                       struct amdgpu_iv_entry *entry)
737 {
738         DRM_DEBUG("IH: JPEG TRAP\n");
739
740         switch (entry->src_id) {
741         case VCN_2_0__SRCID__JPEG_DECODE:
742                 amdgpu_fence_process(&adev->jpeg.inst->ring_dec);
743                 break;
744         default:
745                 DRM_ERROR("Unhandled interrupt: %d %d\n",
746                           entry->src_id, entry->src_data[0]);
747                 break;
748         }
749
750         return 0;
751 }
752
753 static const struct amd_ip_funcs jpeg_v2_0_ip_funcs = {
754         .name = "jpeg_v2_0",
755         .early_init = jpeg_v2_0_early_init,
756         .late_init = NULL,
757         .sw_init = jpeg_v2_0_sw_init,
758         .sw_fini = jpeg_v2_0_sw_fini,
759         .hw_init = jpeg_v2_0_hw_init,
760         .hw_fini = jpeg_v2_0_hw_fini,
761         .suspend = jpeg_v2_0_suspend,
762         .resume = jpeg_v2_0_resume,
763         .is_idle = jpeg_v2_0_is_idle,
764         .wait_for_idle = jpeg_v2_0_wait_for_idle,
765         .check_soft_reset = NULL,
766         .pre_soft_reset = NULL,
767         .soft_reset = NULL,
768         .post_soft_reset = NULL,
769         .set_clockgating_state = jpeg_v2_0_set_clockgating_state,
770         .set_powergating_state = jpeg_v2_0_set_powergating_state,
771 };
772
773 static const struct amdgpu_ring_funcs jpeg_v2_0_dec_ring_vm_funcs = {
774         .type = AMDGPU_RING_TYPE_VCN_JPEG,
775         .align_mask = 0xf,
776         .vmhub = AMDGPU_MMHUB_0,
777         .get_rptr = jpeg_v2_0_dec_ring_get_rptr,
778         .get_wptr = jpeg_v2_0_dec_ring_get_wptr,
779         .set_wptr = jpeg_v2_0_dec_ring_set_wptr,
780         .emit_frame_size =
781                 SOC15_FLUSH_GPU_TLB_NUM_WREG * 6 +
782                 SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 8 +
783                 8 + /* jpeg_v2_0_dec_ring_emit_vm_flush */
784                 18 + 18 + /* jpeg_v2_0_dec_ring_emit_fence x2 vm fence */
785                 8 + 16,
786         .emit_ib_size = 22, /* jpeg_v2_0_dec_ring_emit_ib */
787         .emit_ib = jpeg_v2_0_dec_ring_emit_ib,
788         .emit_fence = jpeg_v2_0_dec_ring_emit_fence,
789         .emit_vm_flush = jpeg_v2_0_dec_ring_emit_vm_flush,
790         .test_ring = amdgpu_jpeg_dec_ring_test_ring,
791         .test_ib = amdgpu_jpeg_dec_ring_test_ib,
792         .insert_nop = jpeg_v2_0_dec_ring_nop,
793         .insert_start = jpeg_v2_0_dec_ring_insert_start,
794         .insert_end = jpeg_v2_0_dec_ring_insert_end,
795         .pad_ib = amdgpu_ring_generic_pad_ib,
796         .begin_use = amdgpu_jpeg_ring_begin_use,
797         .end_use = amdgpu_jpeg_ring_end_use,
798         .emit_wreg = jpeg_v2_0_dec_ring_emit_wreg,
799         .emit_reg_wait = jpeg_v2_0_dec_ring_emit_reg_wait,
800         .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
801 };
802
803 static void jpeg_v2_0_set_dec_ring_funcs(struct amdgpu_device *adev)
804 {
805         adev->jpeg.inst->ring_dec.funcs = &jpeg_v2_0_dec_ring_vm_funcs;
806         DRM_INFO("JPEG decode is enabled in VM mode\n");
807 }
808
809 static const struct amdgpu_irq_src_funcs jpeg_v2_0_irq_funcs = {
810         .set = jpeg_v2_0_set_interrupt_state,
811         .process = jpeg_v2_0_process_interrupt,
812 };
813
814 static void jpeg_v2_0_set_irq_funcs(struct amdgpu_device *adev)
815 {
816         adev->jpeg.inst->irq.num_types = 1;
817         adev->jpeg.inst->irq.funcs = &jpeg_v2_0_irq_funcs;
818 }
819
820 const struct amdgpu_ip_block_version jpeg_v2_0_ip_block =
821 {
822                 .type = AMD_IP_BLOCK_TYPE_JPEG,
823                 .major = 2,
824                 .minor = 0,
825                 .rev = 0,
826                 .funcs = &jpeg_v2_0_ip_funcs,
827 };