]> asedeno.scripts.mit.edu Git - linux.git/blob - drivers/gpu/drm/amd/amdgpu/vcn_v2_0.c
36ad0c0e8efbcb714fd0acc3ed3e261bbf0ab51b
[linux.git] / drivers / gpu / drm / amd / amdgpu / vcn_v2_0.c
1 /*
2  * Copyright 2018 Advanced Micro Devices, Inc.
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice shall be included in
12  * all copies or substantial portions of the Software.
13  *
14  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20  * OTHER DEALINGS IN THE SOFTWARE.
21  *
22  */
23
24 #include <linux/firmware.h>
25
26 #include "amdgpu.h"
27 #include "amdgpu_vcn.h"
28 #include "soc15.h"
29 #include "soc15d.h"
30 #include "amdgpu_pm.h"
31 #include "amdgpu_psp.h"
32
33 #include "vcn/vcn_2_0_0_offset.h"
34 #include "vcn/vcn_2_0_0_sh_mask.h"
35 #include "ivsrcid/vcn/irqsrcs_vcn_2_0.h"
36
37 #define mmUVD_CONTEXT_ID_INTERNAL_OFFSET                        0x1fd
38 #define mmUVD_GPCOM_VCPU_CMD_INTERNAL_OFFSET                    0x503
39 #define mmUVD_GPCOM_VCPU_DATA0_INTERNAL_OFFSET                  0x504
40 #define mmUVD_GPCOM_VCPU_DATA1_INTERNAL_OFFSET                  0x505
41 #define mmUVD_NO_OP_INTERNAL_OFFSET                             0x53f
42 #define mmUVD_GP_SCRATCH8_INTERNAL_OFFSET                       0x54a
43 #define mmUVD_SCRATCH9_INTERNAL_OFFSET                          0xc01d
44
45 #define mmUVD_LMI_RBC_IB_VMID_INTERNAL_OFFSET                   0x1e1
46 #define mmUVD_LMI_RBC_IB_64BIT_BAR_HIGH_INTERNAL_OFFSET         0x5a6
47 #define mmUVD_LMI_RBC_IB_64BIT_BAR_LOW_INTERNAL_OFFSET          0x5a7
48 #define mmUVD_RBC_IB_SIZE_INTERNAL_OFFSET                       0x1e2
49
50 #define mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET                         0x1bfff
51 #define mmUVD_JPEG_GPCOM_CMD_INTERNAL_OFFSET                            0x4029
52 #define mmUVD_JPEG_GPCOM_DATA0_INTERNAL_OFFSET                          0x402a
53 #define mmUVD_JPEG_GPCOM_DATA1_INTERNAL_OFFSET                          0x402b
54 #define mmUVD_LMI_JRBC_RB_MEM_WR_64BIT_BAR_LOW_INTERNAL_OFFSET          0x40ea
55 #define mmUVD_LMI_JRBC_RB_MEM_WR_64BIT_BAR_HIGH_INTERNAL_OFFSET         0x40eb
56 #define mmUVD_LMI_JRBC_IB_VMID_INTERNAL_OFFSET                          0x40cf
57 #define mmUVD_LMI_JPEG_VMID_INTERNAL_OFFSET                             0x40d1
58 #define mmUVD_LMI_JRBC_IB_64BIT_BAR_LOW_INTERNAL_OFFSET                 0x40e8
59 #define mmUVD_LMI_JRBC_IB_64BIT_BAR_HIGH_INTERNAL_OFFSET                0x40e9
60 #define mmUVD_JRBC_IB_SIZE_INTERNAL_OFFSET                              0x4082
61 #define mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_LOW_INTERNAL_OFFSET          0x40ec
62 #define mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_HIGH_INTERNAL_OFFSET         0x40ed
63 #define mmUVD_JRBC_RB_COND_RD_TIMER_INTERNAL_OFFSET                     0x4085
64 #define mmUVD_JRBC_RB_REF_DATA_INTERNAL_OFFSET                          0x4084
65 #define mmUVD_JRBC_STATUS_INTERNAL_OFFSET                               0x4089
66 #define mmUVD_JPEG_PITCH_INTERNAL_OFFSET                                0x401f
67
68 #define JRBC_DEC_EXTERNAL_REG_WRITE_ADDR                                0x18000
69
70 #define mmUVD_RBC_XX_IB_REG_CHECK                                       0x026b
71 #define mmUVD_RBC_XX_IB_REG_CHECK_BASE_IDX                              1
72 #define mmUVD_REG_XX_MASK                                               0x026c
73 #define mmUVD_REG_XX_MASK_BASE_IDX                                      1
74
75 static void vcn_v2_0_set_dec_ring_funcs(struct amdgpu_device *adev);
76 static void vcn_v2_0_set_enc_ring_funcs(struct amdgpu_device *adev);
77 static void vcn_v2_0_set_jpeg_ring_funcs(struct amdgpu_device *adev);
78 static void vcn_v2_0_set_irq_funcs(struct amdgpu_device *adev);
79 static int vcn_v2_0_set_powergating_state(void *handle,
80                                 enum amd_powergating_state state);
81 static int vcn_v2_0_pause_dpg_mode(struct amdgpu_device *adev,
82                                 struct dpg_pause_state *new_state);
83
84 /**
85  * vcn_v2_0_early_init - set function pointers
86  *
87  * @handle: amdgpu_device pointer
88  *
89  * Set ring and irq function pointers
90  */
91 static int vcn_v2_0_early_init(void *handle)
92 {
93         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
94
95         adev->vcn.num_vcn_inst = 1;
96         adev->vcn.num_enc_rings = 2;
97
98         vcn_v2_0_set_dec_ring_funcs(adev);
99         vcn_v2_0_set_enc_ring_funcs(adev);
100         vcn_v2_0_set_jpeg_ring_funcs(adev);
101         vcn_v2_0_set_irq_funcs(adev);
102
103         return 0;
104 }
105
106 /**
107  * vcn_v2_0_sw_init - sw init for VCN block
108  *
109  * @handle: amdgpu_device pointer
110  *
111  * Load firmware and sw initialization
112  */
113 static int vcn_v2_0_sw_init(void *handle)
114 {
115         struct amdgpu_ring *ring;
116         int i, r;
117         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
118
119         /* VCN DEC TRAP */
120         r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_VCN,
121                               VCN_2_0__SRCID__UVD_SYSTEM_MESSAGE_INTERRUPT,
122                               &adev->vcn.inst->irq);
123         if (r)
124                 return r;
125
126         /* VCN ENC TRAP */
127         for (i = 0; i < adev->vcn.num_enc_rings; ++i) {
128                 r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_VCN,
129                                       i + VCN_2_0__SRCID__UVD_ENC_GENERAL_PURPOSE,
130                                       &adev->vcn.inst->irq);
131                 if (r)
132                         return r;
133         }
134
135         /* VCN JPEG TRAP */
136         r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_VCN,
137                               VCN_2_0__SRCID__JPEG_DECODE, &adev->vcn.inst->irq);
138         if (r)
139                 return r;
140
141         r = amdgpu_vcn_sw_init(adev);
142         if (r)
143                 return r;
144
145         if (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) {
146                 const struct common_firmware_header *hdr;
147                 hdr = (const struct common_firmware_header *)adev->vcn.fw->data;
148                 adev->firmware.ucode[AMDGPU_UCODE_ID_VCN].ucode_id = AMDGPU_UCODE_ID_VCN;
149                 adev->firmware.ucode[AMDGPU_UCODE_ID_VCN].fw = adev->vcn.fw;
150                 adev->firmware.fw_size +=
151                         ALIGN(le32_to_cpu(hdr->ucode_size_bytes), PAGE_SIZE);
152                 DRM_INFO("PSP loading VCN firmware\n");
153         }
154
155         r = amdgpu_vcn_resume(adev);
156         if (r)
157                 return r;
158
159         ring = &adev->vcn.inst->ring_dec;
160
161         ring->use_doorbell = true;
162         ring->doorbell_index = adev->doorbell_index.vcn.vcn_ring0_1 << 1;
163
164         sprintf(ring->name, "vcn_dec");
165         r = amdgpu_ring_init(adev, ring, 512, &adev->vcn.inst->irq, 0);
166         if (r)
167                 return r;
168
169         adev->vcn.internal.context_id = mmUVD_CONTEXT_ID_INTERNAL_OFFSET;
170         adev->vcn.internal.ib_vmid = mmUVD_LMI_RBC_IB_VMID_INTERNAL_OFFSET;
171         adev->vcn.internal.ib_bar_low = mmUVD_LMI_RBC_IB_64BIT_BAR_LOW_INTERNAL_OFFSET;
172         adev->vcn.internal.ib_bar_high = mmUVD_LMI_RBC_IB_64BIT_BAR_HIGH_INTERNAL_OFFSET;
173         adev->vcn.internal.ib_size = mmUVD_RBC_IB_SIZE_INTERNAL_OFFSET;
174         adev->vcn.internal.gp_scratch8 = mmUVD_GP_SCRATCH8_INTERNAL_OFFSET;
175
176         adev->vcn.internal.scratch9 = mmUVD_SCRATCH9_INTERNAL_OFFSET;
177         adev->vcn.inst->external.scratch9 = SOC15_REG_OFFSET(UVD, 0, mmUVD_SCRATCH9);
178         adev->vcn.internal.data0 = mmUVD_GPCOM_VCPU_DATA0_INTERNAL_OFFSET;
179         adev->vcn.inst->external.data0 = SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0);
180         adev->vcn.internal.data1 = mmUVD_GPCOM_VCPU_DATA1_INTERNAL_OFFSET;
181         adev->vcn.inst->external.data1 = SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1);
182         adev->vcn.internal.cmd = mmUVD_GPCOM_VCPU_CMD_INTERNAL_OFFSET;
183         adev->vcn.inst->external.cmd = SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD);
184         adev->vcn.internal.nop = mmUVD_NO_OP_INTERNAL_OFFSET;
185         adev->vcn.inst->external.nop = SOC15_REG_OFFSET(UVD, 0, mmUVD_NO_OP);
186
187         for (i = 0; i < adev->vcn.num_enc_rings; ++i) {
188                 ring = &adev->vcn.inst->ring_enc[i];
189                 ring->use_doorbell = true;
190                 ring->doorbell_index = (adev->doorbell_index.vcn.vcn_ring0_1 << 1) + 2 + i;
191                 sprintf(ring->name, "vcn_enc%d", i);
192                 r = amdgpu_ring_init(adev, ring, 512, &adev->vcn.inst->irq, 0);
193                 if (r)
194                         return r;
195         }
196
197         ring = &adev->vcn.inst->ring_jpeg;
198         ring->use_doorbell = true;
199         ring->doorbell_index = (adev->doorbell_index.vcn.vcn_ring0_1 << 1) + 1;
200         sprintf(ring->name, "vcn_jpeg");
201         r = amdgpu_ring_init(adev, ring, 512, &adev->vcn.inst->irq, 0);
202         if (r)
203                 return r;
204
205         adev->vcn.pause_dpg_mode = vcn_v2_0_pause_dpg_mode;
206
207         adev->vcn.internal.jpeg_pitch = mmUVD_JPEG_PITCH_INTERNAL_OFFSET;
208         adev->vcn.inst->external.jpeg_pitch = SOC15_REG_OFFSET(UVD, 0, mmUVD_JPEG_PITCH);
209
210         return 0;
211 }
212
213 /**
214  * vcn_v2_0_sw_fini - sw fini for VCN block
215  *
216  * @handle: amdgpu_device pointer
217  *
218  * VCN suspend and free up sw allocation
219  */
220 static int vcn_v2_0_sw_fini(void *handle)
221 {
222         int r;
223         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
224
225         r = amdgpu_vcn_suspend(adev);
226         if (r)
227                 return r;
228
229         r = amdgpu_vcn_sw_fini(adev);
230
231         return r;
232 }
233
234 /**
235  * vcn_v2_0_hw_init - start and test VCN block
236  *
237  * @handle: amdgpu_device pointer
238  *
239  * Initialize the hardware, boot up the VCPU and do some testing
240  */
241 static int vcn_v2_0_hw_init(void *handle)
242 {
243         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
244         struct amdgpu_ring *ring = &adev->vcn.inst->ring_dec;
245         int i, r;
246
247         adev->nbio_funcs->vcn_doorbell_range(adev, ring->use_doorbell,
248                                              ring->doorbell_index, 0);
249
250         ring->sched.ready = true;
251         r = amdgpu_ring_test_ring(ring);
252         if (r) {
253                 ring->sched.ready = false;
254                 goto done;
255         }
256
257         for (i = 0; i < adev->vcn.num_enc_rings; ++i) {
258                 ring = &adev->vcn.inst->ring_enc[i];
259                 ring->sched.ready = true;
260                 r = amdgpu_ring_test_ring(ring);
261                 if (r) {
262                         ring->sched.ready = false;
263                         goto done;
264                 }
265         }
266
267         ring = &adev->vcn.inst->ring_jpeg;
268         ring->sched.ready = true;
269         r = amdgpu_ring_test_ring(ring);
270         if (r) {
271                 ring->sched.ready = false;
272                 goto done;
273         }
274
275 done:
276         if (!r)
277                 DRM_INFO("VCN decode and encode initialized successfully(under %s).\n",
278                         (adev->pg_flags & AMD_PG_SUPPORT_VCN_DPG)?"DPG Mode":"SPG Mode");
279
280         return r;
281 }
282
283 /**
284  * vcn_v2_0_hw_fini - stop the hardware block
285  *
286  * @handle: amdgpu_device pointer
287  *
288  * Stop the VCN block, mark ring as not ready any more
289  */
290 static int vcn_v2_0_hw_fini(void *handle)
291 {
292         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
293         struct amdgpu_ring *ring = &adev->vcn.inst->ring_dec;
294         int i;
295
296         if ((adev->pg_flags & AMD_PG_SUPPORT_VCN_DPG) ||
297             (adev->vcn.cur_state != AMD_PG_STATE_GATE &&
298               RREG32_SOC15(VCN, 0, mmUVD_STATUS)))
299                 vcn_v2_0_set_powergating_state(adev, AMD_PG_STATE_GATE);
300
301         ring->sched.ready = false;
302
303         for (i = 0; i < adev->vcn.num_enc_rings; ++i) {
304                 ring = &adev->vcn.inst->ring_enc[i];
305                 ring->sched.ready = false;
306         }
307
308         ring = &adev->vcn.inst->ring_jpeg;
309         ring->sched.ready = false;
310
311         return 0;
312 }
313
314 /**
315  * vcn_v2_0_suspend - suspend VCN block
316  *
317  * @handle: amdgpu_device pointer
318  *
319  * HW fini and suspend VCN block
320  */
321 static int vcn_v2_0_suspend(void *handle)
322 {
323         int r;
324         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
325
326         r = vcn_v2_0_hw_fini(adev);
327         if (r)
328                 return r;
329
330         r = amdgpu_vcn_suspend(adev);
331
332         return r;
333 }
334
335 /**
336  * vcn_v2_0_resume - resume VCN block
337  *
338  * @handle: amdgpu_device pointer
339  *
340  * Resume firmware and hw init VCN block
341  */
342 static int vcn_v2_0_resume(void *handle)
343 {
344         int r;
345         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
346
347         r = amdgpu_vcn_resume(adev);
348         if (r)
349                 return r;
350
351         r = vcn_v2_0_hw_init(adev);
352
353         return r;
354 }
355
356 /**
357  * vcn_v2_0_mc_resume - memory controller programming
358  *
359  * @adev: amdgpu_device pointer
360  *
361  * Let the VCN memory controller know it's offsets
362  */
363 static void vcn_v2_0_mc_resume(struct amdgpu_device *adev)
364 {
365         uint32_t size = AMDGPU_GPU_PAGE_ALIGN(adev->vcn.fw->size + 4);
366         uint32_t offset;
367
368         /* cache window 0: fw */
369         if (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) {
370                 WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
371                         (adev->firmware.ucode[AMDGPU_UCODE_ID_VCN].tmr_mc_addr_lo));
372                 WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
373                         (adev->firmware.ucode[AMDGPU_UCODE_ID_VCN].tmr_mc_addr_hi));
374                 WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET0, 0);
375                 offset = 0;
376         } else {
377                 WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
378                         lower_32_bits(adev->vcn.inst->gpu_addr));
379                 WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
380                         upper_32_bits(adev->vcn.inst->gpu_addr));
381                 offset = size;
382                 WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET0,
383                         AMDGPU_UVD_FIRMWARE_OFFSET >> 3);
384         }
385
386         WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_SIZE0, size);
387
388         /* cache window 1: stack */
389         WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_LOW,
390                 lower_32_bits(adev->vcn.inst->gpu_addr + offset));
391         WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_HIGH,
392                 upper_32_bits(adev->vcn.inst->gpu_addr + offset));
393         WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET1, 0);
394         WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_SIZE1, AMDGPU_VCN_STACK_SIZE);
395
396         /* cache window 2: context */
397         WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_LOW,
398                 lower_32_bits(adev->vcn.inst->gpu_addr + offset + AMDGPU_VCN_STACK_SIZE));
399         WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_HIGH,
400                 upper_32_bits(adev->vcn.inst->gpu_addr + offset + AMDGPU_VCN_STACK_SIZE));
401         WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET2, 0);
402         WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_SIZE2, AMDGPU_VCN_CONTEXT_SIZE);
403
404         WREG32_SOC15(UVD, 0, mmUVD_GFX10_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
405         WREG32_SOC15(UVD, 0, mmJPEG_DEC_GFX10_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
406 }
407
408 static void vcn_v2_0_mc_resume_dpg_mode(struct amdgpu_device *adev, bool indirect)
409 {
410         uint32_t size = AMDGPU_GPU_PAGE_ALIGN(adev->vcn.fw->size + 4);
411         uint32_t offset;
412
413         /* cache window 0: fw */
414         if (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) {
415                 if (!indirect) {
416                         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
417                                 UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW),
418                                 (adev->firmware.ucode[AMDGPU_UCODE_ID_VCN].tmr_mc_addr_lo), 0, indirect);
419                         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
420                                 UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH),
421                                 (adev->firmware.ucode[AMDGPU_UCODE_ID_VCN].tmr_mc_addr_hi), 0, indirect);
422                         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
423                                 UVD, 0, mmUVD_VCPU_CACHE_OFFSET0), 0, 0, indirect);
424                 } else {
425                         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
426                                 UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW), 0, 0, indirect);
427                         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
428                                 UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH), 0, 0, indirect);
429                         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
430                                 UVD, 0, mmUVD_VCPU_CACHE_OFFSET0), 0, 0, indirect);
431                 }
432                 offset = 0;
433         } else {
434                 WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
435                         UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW),
436                         lower_32_bits(adev->vcn.inst->gpu_addr), 0, indirect);
437                 WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
438                         UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH),
439                         upper_32_bits(adev->vcn.inst->gpu_addr), 0, indirect);
440                 offset = size;
441                 WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
442                         UVD, 0, mmUVD_VCPU_CACHE_OFFSET0),
443                         AMDGPU_UVD_FIRMWARE_OFFSET >> 3, 0, indirect);
444         }
445
446         if (!indirect)
447                 WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
448                         UVD, 0, mmUVD_VCPU_CACHE_SIZE0), size, 0, indirect);
449         else
450                 WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
451                         UVD, 0, mmUVD_VCPU_CACHE_SIZE0), 0, 0, indirect);
452
453         /* cache window 1: stack */
454         if (!indirect) {
455                 WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
456                         UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_LOW),
457                         lower_32_bits(adev->vcn.inst->gpu_addr + offset), 0, indirect);
458                 WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
459                         UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_HIGH),
460                         upper_32_bits(adev->vcn.inst->gpu_addr + offset), 0, indirect);
461                 WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
462                         UVD, 0, mmUVD_VCPU_CACHE_OFFSET1), 0, 0, indirect);
463         } else {
464                 WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
465                         UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_LOW), 0, 0, indirect);
466                 WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
467                         UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_HIGH), 0, 0, indirect);
468                 WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
469                         UVD, 0, mmUVD_VCPU_CACHE_OFFSET1), 0, 0, indirect);
470         }
471         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
472                 UVD, 0, mmUVD_VCPU_CACHE_SIZE1), AMDGPU_VCN_STACK_SIZE, 0, indirect);
473
474         /* cache window 2: context */
475         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
476                 UVD, 0, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_LOW),
477                 lower_32_bits(adev->vcn.inst->gpu_addr + offset + AMDGPU_VCN_STACK_SIZE), 0, indirect);
478         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
479                 UVD, 0, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_HIGH),
480                 upper_32_bits(adev->vcn.inst->gpu_addr + offset + AMDGPU_VCN_STACK_SIZE), 0, indirect);
481         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
482                 UVD, 0, mmUVD_VCPU_CACHE_OFFSET2), 0, 0, indirect);
483         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
484                 UVD, 0, mmUVD_VCPU_CACHE_SIZE2), AMDGPU_VCN_CONTEXT_SIZE, 0, indirect);
485
486         /* non-cache window */
487         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
488                 UVD, 0, mmUVD_LMI_VCPU_NC0_64BIT_BAR_LOW), 0, 0, indirect);
489         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
490                 UVD, 0, mmUVD_LMI_VCPU_NC0_64BIT_BAR_HIGH), 0, 0, indirect);
491         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
492                 UVD, 0, mmUVD_VCPU_NONCACHE_OFFSET0), 0, 0, indirect);
493         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
494                 UVD, 0, mmUVD_VCPU_NONCACHE_SIZE0), 0, 0, indirect);
495
496         /* VCN global tiling registers */
497         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
498                 UVD, 0, mmUVD_GFX10_ADDR_CONFIG), adev->gfx.config.gb_addr_config, 0, indirect);
499 }
500
501 /**
502  * vcn_v2_0_disable_clock_gating - disable VCN clock gating
503  *
504  * @adev: amdgpu_device pointer
505  * @sw: enable SW clock gating
506  *
507  * Disable clock gating for VCN block
508  */
509 static void vcn_v2_0_disable_clock_gating(struct amdgpu_device *adev)
510 {
511         uint32_t data;
512
513         /* UVD disable CGC */
514         data = RREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL);
515         if (adev->cg_flags & AMD_CG_SUPPORT_VCN_MGCG)
516                 data |= 1 << UVD_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
517         else
518                 data &= ~UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK;
519         data |= 1 << UVD_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
520         data |= 4 << UVD_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
521         WREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL, data);
522
523         data = RREG32_SOC15(VCN, 0, mmUVD_CGC_GATE);
524         data &= ~(UVD_CGC_GATE__SYS_MASK
525                 | UVD_CGC_GATE__UDEC_MASK
526                 | UVD_CGC_GATE__MPEG2_MASK
527                 | UVD_CGC_GATE__REGS_MASK
528                 | UVD_CGC_GATE__RBC_MASK
529                 | UVD_CGC_GATE__LMI_MC_MASK
530                 | UVD_CGC_GATE__LMI_UMC_MASK
531                 | UVD_CGC_GATE__IDCT_MASK
532                 | UVD_CGC_GATE__MPRD_MASK
533                 | UVD_CGC_GATE__MPC_MASK
534                 | UVD_CGC_GATE__LBSI_MASK
535                 | UVD_CGC_GATE__LRBBM_MASK
536                 | UVD_CGC_GATE__UDEC_RE_MASK
537                 | UVD_CGC_GATE__UDEC_CM_MASK
538                 | UVD_CGC_GATE__UDEC_IT_MASK
539                 | UVD_CGC_GATE__UDEC_DB_MASK
540                 | UVD_CGC_GATE__UDEC_MP_MASK
541                 | UVD_CGC_GATE__WCB_MASK
542                 | UVD_CGC_GATE__VCPU_MASK
543                 | UVD_CGC_GATE__SCPU_MASK);
544         WREG32_SOC15(VCN, 0, mmUVD_CGC_GATE, data);
545
546         data = RREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL);
547         data &= ~(UVD_CGC_CTRL__UDEC_RE_MODE_MASK
548                 | UVD_CGC_CTRL__UDEC_CM_MODE_MASK
549                 | UVD_CGC_CTRL__UDEC_IT_MODE_MASK
550                 | UVD_CGC_CTRL__UDEC_DB_MODE_MASK
551                 | UVD_CGC_CTRL__UDEC_MP_MODE_MASK
552                 | UVD_CGC_CTRL__SYS_MODE_MASK
553                 | UVD_CGC_CTRL__UDEC_MODE_MASK
554                 | UVD_CGC_CTRL__MPEG2_MODE_MASK
555                 | UVD_CGC_CTRL__REGS_MODE_MASK
556                 | UVD_CGC_CTRL__RBC_MODE_MASK
557                 | UVD_CGC_CTRL__LMI_MC_MODE_MASK
558                 | UVD_CGC_CTRL__LMI_UMC_MODE_MASK
559                 | UVD_CGC_CTRL__IDCT_MODE_MASK
560                 | UVD_CGC_CTRL__MPRD_MODE_MASK
561                 | UVD_CGC_CTRL__MPC_MODE_MASK
562                 | UVD_CGC_CTRL__LBSI_MODE_MASK
563                 | UVD_CGC_CTRL__LRBBM_MODE_MASK
564                 | UVD_CGC_CTRL__WCB_MODE_MASK
565                 | UVD_CGC_CTRL__VCPU_MODE_MASK
566                 | UVD_CGC_CTRL__SCPU_MODE_MASK);
567         WREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL, data);
568
569         /* turn on */
570         data = RREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_GATE);
571         data |= (UVD_SUVD_CGC_GATE__SRE_MASK
572                 | UVD_SUVD_CGC_GATE__SIT_MASK
573                 | UVD_SUVD_CGC_GATE__SMP_MASK
574                 | UVD_SUVD_CGC_GATE__SCM_MASK
575                 | UVD_SUVD_CGC_GATE__SDB_MASK
576                 | UVD_SUVD_CGC_GATE__SRE_H264_MASK
577                 | UVD_SUVD_CGC_GATE__SRE_HEVC_MASK
578                 | UVD_SUVD_CGC_GATE__SIT_H264_MASK
579                 | UVD_SUVD_CGC_GATE__SIT_HEVC_MASK
580                 | UVD_SUVD_CGC_GATE__SCM_H264_MASK
581                 | UVD_SUVD_CGC_GATE__SCM_HEVC_MASK
582                 | UVD_SUVD_CGC_GATE__SDB_H264_MASK
583                 | UVD_SUVD_CGC_GATE__SDB_HEVC_MASK
584                 | UVD_SUVD_CGC_GATE__SCLR_MASK
585                 | UVD_SUVD_CGC_GATE__UVD_SC_MASK
586                 | UVD_SUVD_CGC_GATE__ENT_MASK
587                 | UVD_SUVD_CGC_GATE__SIT_HEVC_DEC_MASK
588                 | UVD_SUVD_CGC_GATE__SIT_HEVC_ENC_MASK
589                 | UVD_SUVD_CGC_GATE__SITE_MASK
590                 | UVD_SUVD_CGC_GATE__SRE_VP9_MASK
591                 | UVD_SUVD_CGC_GATE__SCM_VP9_MASK
592                 | UVD_SUVD_CGC_GATE__SIT_VP9_DEC_MASK
593                 | UVD_SUVD_CGC_GATE__SDB_VP9_MASK
594                 | UVD_SUVD_CGC_GATE__IME_HEVC_MASK);
595         WREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_GATE, data);
596
597         data = RREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_CTRL);
598         data &= ~(UVD_SUVD_CGC_CTRL__SRE_MODE_MASK
599                 | UVD_SUVD_CGC_CTRL__SIT_MODE_MASK
600                 | UVD_SUVD_CGC_CTRL__SMP_MODE_MASK
601                 | UVD_SUVD_CGC_CTRL__SCM_MODE_MASK
602                 | UVD_SUVD_CGC_CTRL__SDB_MODE_MASK
603                 | UVD_SUVD_CGC_CTRL__SCLR_MODE_MASK
604                 | UVD_SUVD_CGC_CTRL__UVD_SC_MODE_MASK
605                 | UVD_SUVD_CGC_CTRL__ENT_MODE_MASK
606                 | UVD_SUVD_CGC_CTRL__IME_MODE_MASK
607                 | UVD_SUVD_CGC_CTRL__SITE_MODE_MASK);
608         WREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_CTRL, data);
609 }
610
611 static void vcn_v2_0_clock_gating_dpg_mode(struct amdgpu_device *adev,
612                 uint8_t sram_sel, uint8_t indirect)
613 {
614         uint32_t reg_data = 0;
615
616         /* enable sw clock gating control */
617         if (adev->cg_flags & AMD_CG_SUPPORT_VCN_MGCG)
618                 reg_data = 1 << UVD_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
619         else
620                 reg_data = 0 << UVD_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
621         reg_data |= 1 << UVD_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
622         reg_data |= 4 << UVD_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
623         reg_data &= ~(UVD_CGC_CTRL__UDEC_RE_MODE_MASK |
624                  UVD_CGC_CTRL__UDEC_CM_MODE_MASK |
625                  UVD_CGC_CTRL__UDEC_IT_MODE_MASK |
626                  UVD_CGC_CTRL__UDEC_DB_MODE_MASK |
627                  UVD_CGC_CTRL__UDEC_MP_MODE_MASK |
628                  UVD_CGC_CTRL__SYS_MODE_MASK |
629                  UVD_CGC_CTRL__UDEC_MODE_MASK |
630                  UVD_CGC_CTRL__MPEG2_MODE_MASK |
631                  UVD_CGC_CTRL__REGS_MODE_MASK |
632                  UVD_CGC_CTRL__RBC_MODE_MASK |
633                  UVD_CGC_CTRL__LMI_MC_MODE_MASK |
634                  UVD_CGC_CTRL__LMI_UMC_MODE_MASK |
635                  UVD_CGC_CTRL__IDCT_MODE_MASK |
636                  UVD_CGC_CTRL__MPRD_MODE_MASK |
637                  UVD_CGC_CTRL__MPC_MODE_MASK |
638                  UVD_CGC_CTRL__LBSI_MODE_MASK |
639                  UVD_CGC_CTRL__LRBBM_MODE_MASK |
640                  UVD_CGC_CTRL__WCB_MODE_MASK |
641                  UVD_CGC_CTRL__VCPU_MODE_MASK |
642                  UVD_CGC_CTRL__SCPU_MODE_MASK);
643         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
644                 UVD, 0, mmUVD_CGC_CTRL), reg_data, sram_sel, indirect);
645
646         /* turn off clock gating */
647         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
648                 UVD, 0, mmUVD_CGC_GATE), 0, sram_sel, indirect);
649
650         /* turn on SUVD clock gating */
651         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
652                 UVD, 0, mmUVD_SUVD_CGC_GATE), 1, sram_sel, indirect);
653
654         /* turn on sw mode in UVD_SUVD_CGC_CTRL */
655         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
656                 UVD, 0, mmUVD_SUVD_CGC_CTRL), 0, sram_sel, indirect);
657 }
658
659 /**
660  * jpeg_v2_0_start - start JPEG block
661  *
662  * @adev: amdgpu_device pointer
663  *
664  * Setup and start the JPEG block
665  */
666 static int jpeg_v2_0_start(struct amdgpu_device *adev)
667 {
668         struct amdgpu_ring *ring = &adev->vcn.inst->ring_jpeg;
669         uint32_t tmp;
670         int r = 0;
671
672         /* disable power gating */
673         tmp = 1 << UVD_PGFSM_CONFIG__UVDJ_PWR_CONFIG__SHIFT;
674         WREG32(SOC15_REG_OFFSET(UVD, 0, mmUVD_PGFSM_CONFIG), tmp);
675
676         SOC15_WAIT_ON_RREG(VCN, 0,
677                 mmUVD_PGFSM_STATUS, UVD_PGFSM_STATUS_UVDJ_PWR_ON,
678                 UVD_PGFSM_STATUS__UVDJ_PWR_STATUS_MASK, r);
679
680         if (r) {
681                 DRM_ERROR("amdgpu: JPEG disable power gating failed\n");
682                 return r;
683         }
684
685         /* Removing the anti hang mechanism to indicate the UVDJ tile is ON */
686         tmp = RREG32(SOC15_REG_OFFSET(UVD, 0, mmUVD_JPEG_POWER_STATUS)) & ~0x1;
687         WREG32(SOC15_REG_OFFSET(UVD, 0, mmUVD_JPEG_POWER_STATUS), tmp);
688
689         /* JPEG disable CGC */
690         tmp = RREG32_SOC15(VCN, 0, mmJPEG_CGC_CTRL);
691         tmp |= 1 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
692         tmp |= 1 << JPEG_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
693         tmp |= 4 << JPEG_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
694         WREG32_SOC15(VCN, 0, mmJPEG_CGC_CTRL, tmp);
695
696         tmp = RREG32_SOC15(VCN, 0, mmJPEG_CGC_GATE);
697         tmp &= ~(JPEG_CGC_GATE__JPEG_DEC_MASK
698                 | JPEG_CGC_GATE__JPEG2_DEC_MASK
699                 | JPEG_CGC_GATE__JPEG_ENC_MASK
700                 | JPEG_CGC_GATE__JMCIF_MASK
701                 | JPEG_CGC_GATE__JRBBM_MASK);
702         WREG32_SOC15(VCN, 0, mmJPEG_CGC_GATE, tmp);
703
704         /* enable JMI channel */
705         WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_JMI_CNTL), 0,
706                 ~UVD_JMI_CNTL__SOFT_RESET_MASK);
707
708         /* enable System Interrupt for JRBC */
709         WREG32_P(SOC15_REG_OFFSET(VCN, 0, mmJPEG_SYS_INT_EN),
710                 JPEG_SYS_INT_EN__DJRBC_MASK,
711                 ~JPEG_SYS_INT_EN__DJRBC_MASK);
712
713         WREG32_SOC15(UVD, 0, mmUVD_LMI_JRBC_RB_VMID, 0);
714         WREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_CNTL, (0x00000001L | 0x00000002L));
715         WREG32_SOC15(UVD, 0, mmUVD_LMI_JRBC_RB_64BIT_BAR_LOW,
716                 lower_32_bits(ring->gpu_addr));
717         WREG32_SOC15(UVD, 0, mmUVD_LMI_JRBC_RB_64BIT_BAR_HIGH,
718                 upper_32_bits(ring->gpu_addr));
719         WREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_RPTR, 0);
720         WREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_WPTR, 0);
721         WREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_CNTL, 0x00000002L);
722         WREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_SIZE, ring->ring_size / 4);
723         ring->wptr = RREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_WPTR);
724
725         return 0;
726 }
727
728 /**
729  * jpeg_v2_0_stop - stop JPEG block
730  *
731  * @adev: amdgpu_device pointer
732  *
733  * stop the JPEG block
734  */
735 static int jpeg_v2_0_stop(struct amdgpu_device *adev)
736 {
737         uint32_t tmp;
738         int r = 0;
739
740         /* reset JMI */
741         WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_JMI_CNTL),
742                 UVD_JMI_CNTL__SOFT_RESET_MASK,
743                 ~UVD_JMI_CNTL__SOFT_RESET_MASK);
744
745         /* enable JPEG CGC */
746         tmp = RREG32_SOC15(VCN, 0, mmJPEG_CGC_CTRL);
747         tmp |= 1 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
748         tmp |= 1 << JPEG_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
749         tmp |= 4 << JPEG_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
750         WREG32_SOC15(VCN, 0, mmJPEG_CGC_CTRL, tmp);
751
752
753         tmp = RREG32_SOC15(VCN, 0, mmJPEG_CGC_GATE);
754         tmp |= (JPEG_CGC_GATE__JPEG_DEC_MASK
755                 |JPEG_CGC_GATE__JPEG2_DEC_MASK
756                 |JPEG_CGC_GATE__JPEG_ENC_MASK
757                 |JPEG_CGC_GATE__JMCIF_MASK
758                 |JPEG_CGC_GATE__JRBBM_MASK);
759         WREG32_SOC15(VCN, 0, mmJPEG_CGC_GATE, tmp);
760
761         /* enable power gating */
762         tmp = RREG32(SOC15_REG_OFFSET(UVD, 0, mmUVD_JPEG_POWER_STATUS));
763         tmp &= ~UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_MASK;
764         tmp |=  0x1; //UVD_JPEG_POWER_STATUS__JPEG_POWER_STATUS_TILES_OFF;
765         WREG32(SOC15_REG_OFFSET(UVD, 0, mmUVD_JPEG_POWER_STATUS), tmp);
766
767         tmp = 2 << UVD_PGFSM_CONFIG__UVDJ_PWR_CONFIG__SHIFT;
768         WREG32(SOC15_REG_OFFSET(UVD, 0, mmUVD_PGFSM_CONFIG), tmp);
769
770         SOC15_WAIT_ON_RREG(VCN, 0, mmUVD_PGFSM_STATUS,
771                 (2 << UVD_PGFSM_STATUS__UVDJ_PWR_STATUS__SHIFT),
772                 UVD_PGFSM_STATUS__UVDJ_PWR_STATUS_MASK, r);
773
774         if (r) {
775                 DRM_ERROR("amdgpu: JPEG enable power gating failed\n");
776                 return r;
777         }
778
779         return r;
780 }
781
782 /**
783  * vcn_v2_0_enable_clock_gating - enable VCN clock gating
784  *
785  * @adev: amdgpu_device pointer
786  * @sw: enable SW clock gating
787  *
788  * Enable clock gating for VCN block
789  */
790 static void vcn_v2_0_enable_clock_gating(struct amdgpu_device *adev)
791 {
792         uint32_t data = 0;
793
794         /* enable UVD CGC */
795         data = RREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL);
796         if (adev->cg_flags & AMD_CG_SUPPORT_VCN_MGCG)
797                 data |= 1 << UVD_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
798         else
799                 data |= 0 << UVD_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
800         data |= 1 << UVD_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
801         data |= 4 << UVD_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
802         WREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL, data);
803
804         data = RREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL);
805         data |= (UVD_CGC_CTRL__UDEC_RE_MODE_MASK
806                 | UVD_CGC_CTRL__UDEC_CM_MODE_MASK
807                 | UVD_CGC_CTRL__UDEC_IT_MODE_MASK
808                 | UVD_CGC_CTRL__UDEC_DB_MODE_MASK
809                 | UVD_CGC_CTRL__UDEC_MP_MODE_MASK
810                 | UVD_CGC_CTRL__SYS_MODE_MASK
811                 | UVD_CGC_CTRL__UDEC_MODE_MASK
812                 | UVD_CGC_CTRL__MPEG2_MODE_MASK
813                 | UVD_CGC_CTRL__REGS_MODE_MASK
814                 | UVD_CGC_CTRL__RBC_MODE_MASK
815                 | UVD_CGC_CTRL__LMI_MC_MODE_MASK
816                 | UVD_CGC_CTRL__LMI_UMC_MODE_MASK
817                 | UVD_CGC_CTRL__IDCT_MODE_MASK
818                 | UVD_CGC_CTRL__MPRD_MODE_MASK
819                 | UVD_CGC_CTRL__MPC_MODE_MASK
820                 | UVD_CGC_CTRL__LBSI_MODE_MASK
821                 | UVD_CGC_CTRL__LRBBM_MODE_MASK
822                 | UVD_CGC_CTRL__WCB_MODE_MASK
823                 | UVD_CGC_CTRL__VCPU_MODE_MASK
824                 | UVD_CGC_CTRL__SCPU_MODE_MASK);
825         WREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL, data);
826
827         data = RREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_CTRL);
828         data |= (UVD_SUVD_CGC_CTRL__SRE_MODE_MASK
829                 | UVD_SUVD_CGC_CTRL__SIT_MODE_MASK
830                 | UVD_SUVD_CGC_CTRL__SMP_MODE_MASK
831                 | UVD_SUVD_CGC_CTRL__SCM_MODE_MASK
832                 | UVD_SUVD_CGC_CTRL__SDB_MODE_MASK
833                 | UVD_SUVD_CGC_CTRL__SCLR_MODE_MASK
834                 | UVD_SUVD_CGC_CTRL__UVD_SC_MODE_MASK
835                 | UVD_SUVD_CGC_CTRL__ENT_MODE_MASK
836                 | UVD_SUVD_CGC_CTRL__IME_MODE_MASK
837                 | UVD_SUVD_CGC_CTRL__SITE_MODE_MASK);
838         WREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_CTRL, data);
839 }
840
841 static void vcn_v2_0_disable_static_power_gating(struct amdgpu_device *adev)
842 {
843         uint32_t data = 0;
844         int ret;
845
846         if (adev->pg_flags & AMD_PG_SUPPORT_VCN) {
847                 data = (1 << UVD_PGFSM_CONFIG__UVDM_PWR_CONFIG__SHIFT
848                         | 1 << UVD_PGFSM_CONFIG__UVDU_PWR_CONFIG__SHIFT
849                         | 2 << UVD_PGFSM_CONFIG__UVDF_PWR_CONFIG__SHIFT
850                         | 2 << UVD_PGFSM_CONFIG__UVDC_PWR_CONFIG__SHIFT
851                         | 2 << UVD_PGFSM_CONFIG__UVDB_PWR_CONFIG__SHIFT
852                         | 2 << UVD_PGFSM_CONFIG__UVDIL_PWR_CONFIG__SHIFT
853                         | 2 << UVD_PGFSM_CONFIG__UVDIR_PWR_CONFIG__SHIFT
854                         | 2 << UVD_PGFSM_CONFIG__UVDTD_PWR_CONFIG__SHIFT
855                         | 2 << UVD_PGFSM_CONFIG__UVDTE_PWR_CONFIG__SHIFT
856                         | 2 << UVD_PGFSM_CONFIG__UVDE_PWR_CONFIG__SHIFT);
857
858                 WREG32_SOC15(VCN, 0, mmUVD_PGFSM_CONFIG, data);
859                 SOC15_WAIT_ON_RREG(VCN, 0, mmUVD_PGFSM_STATUS,
860                         UVD_PGFSM_STATUS__UVDM_UVDU_PWR_ON_2_0, 0xFFFFF, ret);
861         } else {
862                 data = (1 << UVD_PGFSM_CONFIG__UVDM_PWR_CONFIG__SHIFT
863                         | 1 << UVD_PGFSM_CONFIG__UVDU_PWR_CONFIG__SHIFT
864                         | 1 << UVD_PGFSM_CONFIG__UVDF_PWR_CONFIG__SHIFT
865                         | 1 << UVD_PGFSM_CONFIG__UVDC_PWR_CONFIG__SHIFT
866                         | 1 << UVD_PGFSM_CONFIG__UVDB_PWR_CONFIG__SHIFT
867                         | 1 << UVD_PGFSM_CONFIG__UVDIL_PWR_CONFIG__SHIFT
868                         | 1 << UVD_PGFSM_CONFIG__UVDIR_PWR_CONFIG__SHIFT
869                         | 1 << UVD_PGFSM_CONFIG__UVDTD_PWR_CONFIG__SHIFT
870                         | 1 << UVD_PGFSM_CONFIG__UVDTE_PWR_CONFIG__SHIFT
871                         | 1 << UVD_PGFSM_CONFIG__UVDE_PWR_CONFIG__SHIFT);
872                 WREG32_SOC15(VCN, 0, mmUVD_PGFSM_CONFIG, data);
873                 SOC15_WAIT_ON_RREG(VCN, 0, mmUVD_PGFSM_STATUS, 0,  0xFFFFF, ret);
874         }
875
876         /* polling UVD_PGFSM_STATUS to confirm UVDM_PWR_STATUS,
877          * UVDU_PWR_STATUS are 0 (power on) */
878
879         data = RREG32_SOC15(VCN, 0, mmUVD_POWER_STATUS);
880         data &= ~0x103;
881         if (adev->pg_flags & AMD_PG_SUPPORT_VCN)
882                 data |= UVD_PGFSM_CONFIG__UVDM_UVDU_PWR_ON |
883                         UVD_POWER_STATUS__UVD_PG_EN_MASK;
884
885         WREG32_SOC15(VCN, 0, mmUVD_POWER_STATUS, data);
886 }
887
888 static void vcn_v2_0_enable_static_power_gating(struct amdgpu_device *adev)
889 {
890         uint32_t data = 0;
891         int ret;
892
893         if (adev->pg_flags & AMD_PG_SUPPORT_VCN) {
894                 /* Before power off, this indicator has to be turned on */
895                 data = RREG32_SOC15(VCN, 0, mmUVD_POWER_STATUS);
896                 data &= ~UVD_POWER_STATUS__UVD_POWER_STATUS_MASK;
897                 data |= UVD_POWER_STATUS__UVD_POWER_STATUS_TILES_OFF;
898                 WREG32_SOC15(VCN, 0, mmUVD_POWER_STATUS, data);
899
900
901                 data = (2 << UVD_PGFSM_CONFIG__UVDM_PWR_CONFIG__SHIFT
902                         | 2 << UVD_PGFSM_CONFIG__UVDU_PWR_CONFIG__SHIFT
903                         | 2 << UVD_PGFSM_CONFIG__UVDF_PWR_CONFIG__SHIFT
904                         | 2 << UVD_PGFSM_CONFIG__UVDC_PWR_CONFIG__SHIFT
905                         | 2 << UVD_PGFSM_CONFIG__UVDB_PWR_CONFIG__SHIFT
906                         | 2 << UVD_PGFSM_CONFIG__UVDIL_PWR_CONFIG__SHIFT
907                         | 2 << UVD_PGFSM_CONFIG__UVDIR_PWR_CONFIG__SHIFT
908                         | 2 << UVD_PGFSM_CONFIG__UVDTD_PWR_CONFIG__SHIFT
909                         | 2 << UVD_PGFSM_CONFIG__UVDTE_PWR_CONFIG__SHIFT
910                         | 2 << UVD_PGFSM_CONFIG__UVDE_PWR_CONFIG__SHIFT);
911
912                 WREG32_SOC15(VCN, 0, mmUVD_PGFSM_CONFIG, data);
913
914                 data = (2 << UVD_PGFSM_STATUS__UVDM_PWR_STATUS__SHIFT
915                         | 2 << UVD_PGFSM_STATUS__UVDU_PWR_STATUS__SHIFT
916                         | 2 << UVD_PGFSM_STATUS__UVDF_PWR_STATUS__SHIFT
917                         | 2 << UVD_PGFSM_STATUS__UVDC_PWR_STATUS__SHIFT
918                         | 2 << UVD_PGFSM_STATUS__UVDB_PWR_STATUS__SHIFT
919                         | 2 << UVD_PGFSM_STATUS__UVDIL_PWR_STATUS__SHIFT
920                         | 2 << UVD_PGFSM_STATUS__UVDIR_PWR_STATUS__SHIFT
921                         | 2 << UVD_PGFSM_STATUS__UVDTD_PWR_STATUS__SHIFT
922                         | 2 << UVD_PGFSM_STATUS__UVDTE_PWR_STATUS__SHIFT
923                         | 2 << UVD_PGFSM_STATUS__UVDE_PWR_STATUS__SHIFT);
924                 SOC15_WAIT_ON_RREG(VCN, 0, mmUVD_PGFSM_STATUS, data, 0xFFFFF, ret);
925         }
926 }
927
928 static int vcn_v2_0_start_dpg_mode(struct amdgpu_device *adev, bool indirect)
929 {
930         struct amdgpu_ring *ring = &adev->vcn.inst->ring_dec;
931         uint32_t rb_bufsz, tmp;
932
933         vcn_v2_0_enable_static_power_gating(adev);
934
935         /* enable dynamic power gating mode */
936         tmp = RREG32_SOC15(UVD, 0, mmUVD_POWER_STATUS);
937         tmp |= UVD_POWER_STATUS__UVD_PG_MODE_MASK;
938         tmp |= UVD_POWER_STATUS__UVD_PG_EN_MASK;
939         WREG32_SOC15(UVD, 0, mmUVD_POWER_STATUS, tmp);
940
941         if (indirect)
942                 adev->vcn.dpg_sram_curr_addr = (uint32_t*)adev->vcn.dpg_sram_cpu_addr;
943
944         /* enable clock gating */
945         vcn_v2_0_clock_gating_dpg_mode(adev, 0, indirect);
946
947         /* enable VCPU clock */
948         tmp = (0xFF << UVD_VCPU_CNTL__PRB_TIMEOUT_VAL__SHIFT);
949         tmp |= UVD_VCPU_CNTL__CLK_EN_MASK;
950         tmp |= UVD_VCPU_CNTL__MIF_WR_LOW_THRESHOLD_BP_MASK;
951         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
952                 UVD, 0, mmUVD_VCPU_CNTL), tmp, 0, indirect);
953
954         /* disable master interupt */
955         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
956                 UVD, 0, mmUVD_MASTINT_EN), 0, 0, indirect);
957
958         /* setup mmUVD_LMI_CTRL */
959         tmp = (UVD_LMI_CTRL__WRITE_CLEAN_TIMER_EN_MASK |
960                 UVD_LMI_CTRL__REQ_MODE_MASK |
961                 UVD_LMI_CTRL__CRC_RESET_MASK |
962                 UVD_LMI_CTRL__MASK_MC_URGENT_MASK |
963                 UVD_LMI_CTRL__DATA_COHERENCY_EN_MASK |
964                 UVD_LMI_CTRL__VCPU_DATA_COHERENCY_EN_MASK |
965                 (8 << UVD_LMI_CTRL__WRITE_CLEAN_TIMER__SHIFT) |
966                 0x00100000L);
967         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
968                 UVD, 0, mmUVD_LMI_CTRL), tmp, 0, indirect);
969
970         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
971                 UVD, 0, mmUVD_MPC_CNTL),
972                 0x2 << UVD_MPC_CNTL__REPLACEMENT_MODE__SHIFT, 0, indirect);
973
974         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
975                 UVD, 0, mmUVD_MPC_SET_MUXA0),
976                 ((0x1 << UVD_MPC_SET_MUXA0__VARA_1__SHIFT) |
977                  (0x2 << UVD_MPC_SET_MUXA0__VARA_2__SHIFT) |
978                  (0x3 << UVD_MPC_SET_MUXA0__VARA_3__SHIFT) |
979                  (0x4 << UVD_MPC_SET_MUXA0__VARA_4__SHIFT)), 0, indirect);
980
981         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
982                 UVD, 0, mmUVD_MPC_SET_MUXB0),
983                 ((0x1 << UVD_MPC_SET_MUXB0__VARB_1__SHIFT) |
984                  (0x2 << UVD_MPC_SET_MUXB0__VARB_2__SHIFT) |
985                  (0x3 << UVD_MPC_SET_MUXB0__VARB_3__SHIFT) |
986                  (0x4 << UVD_MPC_SET_MUXB0__VARB_4__SHIFT)), 0, indirect);
987
988         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
989                 UVD, 0, mmUVD_MPC_SET_MUX),
990                 ((0x0 << UVD_MPC_SET_MUX__SET_0__SHIFT) |
991                  (0x1 << UVD_MPC_SET_MUX__SET_1__SHIFT) |
992                  (0x2 << UVD_MPC_SET_MUX__SET_2__SHIFT)), 0, indirect);
993
994         vcn_v2_0_mc_resume_dpg_mode(adev, indirect);
995
996         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
997                 UVD, 0, mmUVD_REG_XX_MASK), 0x10, 0, indirect);
998         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
999                 UVD, 0, mmUVD_RBC_XX_IB_REG_CHECK), 0x3, 0, indirect);
1000
1001         /* release VCPU reset to boot */
1002         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
1003                 UVD, 0, mmUVD_SOFT_RESET), 0, 0, indirect);
1004
1005         /* enable LMI MC and UMC channels */
1006         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
1007                 UVD, 0, mmUVD_LMI_CTRL2),
1008                 0x1F << UVD_LMI_CTRL2__RE_OFLD_MIF_WR_REQ_NUM__SHIFT, 0, indirect);
1009
1010         /* enable master interrupt */
1011         WREG32_SOC15_DPG_MODE_2_0(SOC15_DPG_MODE_OFFSET_2_0(
1012                 UVD, 0, mmUVD_MASTINT_EN),
1013                 UVD_MASTINT_EN__VCPU_EN_MASK, 0, indirect);
1014
1015         if (indirect)
1016                 psp_update_vcn_sram(adev, 0, adev->vcn.dpg_sram_gpu_addr,
1017                                     (uint32_t)((uintptr_t)adev->vcn.dpg_sram_curr_addr -
1018                                                (uintptr_t)adev->vcn.dpg_sram_cpu_addr));
1019
1020         /* force RBC into idle state */
1021         rb_bufsz = order_base_2(ring->ring_size);
1022         tmp = REG_SET_FIELD(0, UVD_RBC_RB_CNTL, RB_BUFSZ, rb_bufsz);
1023         tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_BLKSZ, 1);
1024         tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_FETCH, 1);
1025         tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_UPDATE, 1);
1026         tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_RPTR_WR_EN, 1);
1027         WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_CNTL, tmp);
1028
1029         /* set the write pointer delay */
1030         WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR_CNTL, 0);
1031
1032         /* set the wb address */
1033         WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR_ADDR,
1034                 (upper_32_bits(ring->gpu_addr) >> 2));
1035
1036         /* programm the RB_BASE for ring buffer */
1037         WREG32_SOC15(UVD, 0, mmUVD_LMI_RBC_RB_64BIT_BAR_LOW,
1038                 lower_32_bits(ring->gpu_addr));
1039         WREG32_SOC15(UVD, 0, mmUVD_LMI_RBC_RB_64BIT_BAR_HIGH,
1040                 upper_32_bits(ring->gpu_addr));
1041
1042         /* Initialize the ring buffer's read and write pointers */
1043         WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR, 0);
1044
1045         WREG32_SOC15(UVD, 0, mmUVD_SCRATCH2, 0);
1046
1047         ring->wptr = RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR);
1048         WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR,
1049                 lower_32_bits(ring->wptr));
1050
1051         return 0;
1052 }
1053
1054 static int vcn_v2_0_start(struct amdgpu_device *adev)
1055 {
1056         struct amdgpu_ring *ring = &adev->vcn.inst->ring_dec;
1057         uint32_t rb_bufsz, tmp;
1058         uint32_t lmi_swap_cntl;
1059         int i, j, r;
1060
1061         if (adev->pm.dpm_enabled)
1062                 amdgpu_dpm_enable_uvd(adev, true);
1063
1064         if (adev->pg_flags & AMD_PG_SUPPORT_VCN_DPG) {
1065                 r = vcn_v2_0_start_dpg_mode(adev, adev->vcn.indirect_sram);
1066                 if (r)
1067                         return r;
1068                 goto jpeg;
1069         }
1070
1071         vcn_v2_0_disable_static_power_gating(adev);
1072
1073         /* set uvd status busy */
1074         tmp = RREG32_SOC15(UVD, 0, mmUVD_STATUS) | UVD_STATUS__UVD_BUSY;
1075         WREG32_SOC15(UVD, 0, mmUVD_STATUS, tmp);
1076
1077         /*SW clock gating */
1078         vcn_v2_0_disable_clock_gating(adev);
1079
1080         /* enable VCPU clock */
1081         WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_VCPU_CNTL),
1082                 UVD_VCPU_CNTL__CLK_EN_MASK, ~UVD_VCPU_CNTL__CLK_EN_MASK);
1083
1084         /* disable master interrupt */
1085         WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_MASTINT_EN), 0,
1086                 ~UVD_MASTINT_EN__VCPU_EN_MASK);
1087
1088         /* setup mmUVD_LMI_CTRL */
1089         tmp = RREG32_SOC15(UVD, 0, mmUVD_LMI_CTRL);
1090         WREG32_SOC15(UVD, 0, mmUVD_LMI_CTRL, tmp |
1091                 UVD_LMI_CTRL__WRITE_CLEAN_TIMER_EN_MASK |
1092                 UVD_LMI_CTRL__MASK_MC_URGENT_MASK |
1093                 UVD_LMI_CTRL__DATA_COHERENCY_EN_MASK |
1094                 UVD_LMI_CTRL__VCPU_DATA_COHERENCY_EN_MASK);
1095
1096         /* setup mmUVD_MPC_CNTL */
1097         tmp = RREG32_SOC15(UVD, 0, mmUVD_MPC_CNTL);
1098         tmp &= ~UVD_MPC_CNTL__REPLACEMENT_MODE_MASK;
1099         tmp |= 0x2 << UVD_MPC_CNTL__REPLACEMENT_MODE__SHIFT;
1100         WREG32_SOC15(VCN, 0, mmUVD_MPC_CNTL, tmp);
1101
1102         /* setup UVD_MPC_SET_MUXA0 */
1103         WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUXA0,
1104                 ((0x1 << UVD_MPC_SET_MUXA0__VARA_1__SHIFT) |
1105                 (0x2 << UVD_MPC_SET_MUXA0__VARA_2__SHIFT) |
1106                 (0x3 << UVD_MPC_SET_MUXA0__VARA_3__SHIFT) |
1107                 (0x4 << UVD_MPC_SET_MUXA0__VARA_4__SHIFT)));
1108
1109         /* setup UVD_MPC_SET_MUXB0 */
1110         WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUXB0,
1111                 ((0x1 << UVD_MPC_SET_MUXB0__VARB_1__SHIFT) |
1112                 (0x2 << UVD_MPC_SET_MUXB0__VARB_2__SHIFT) |
1113                 (0x3 << UVD_MPC_SET_MUXB0__VARB_3__SHIFT) |
1114                 (0x4 << UVD_MPC_SET_MUXB0__VARB_4__SHIFT)));
1115
1116         /* setup mmUVD_MPC_SET_MUX */
1117         WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUX,
1118                 ((0x0 << UVD_MPC_SET_MUX__SET_0__SHIFT) |
1119                 (0x1 << UVD_MPC_SET_MUX__SET_1__SHIFT) |
1120                 (0x2 << UVD_MPC_SET_MUX__SET_2__SHIFT)));
1121
1122         vcn_v2_0_mc_resume(adev);
1123
1124         /* release VCPU reset to boot */
1125         WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET), 0,
1126                 ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
1127
1128         /* enable LMI MC and UMC channels */
1129         WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2), 0,
1130                 ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
1131
1132         tmp = RREG32_SOC15(VCN, 0, mmUVD_SOFT_RESET);
1133         tmp &= ~UVD_SOFT_RESET__LMI_SOFT_RESET_MASK;
1134         tmp &= ~UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK;
1135         WREG32_SOC15(VCN, 0, mmUVD_SOFT_RESET, tmp);
1136
1137         /* disable byte swapping */
1138         lmi_swap_cntl = 0;
1139 #ifdef __BIG_ENDIAN
1140         /* swap (8 in 32) RB and IB */
1141         lmi_swap_cntl = 0xa;
1142 #endif
1143         WREG32_SOC15(UVD, 0, mmUVD_LMI_SWAP_CNTL, lmi_swap_cntl);
1144
1145         for (i = 0; i < 10; ++i) {
1146                 uint32_t status;
1147
1148                 for (j = 0; j < 100; ++j) {
1149                         status = RREG32_SOC15(UVD, 0, mmUVD_STATUS);
1150                         if (status & 2)
1151                                 break;
1152                         mdelay(10);
1153                 }
1154                 r = 0;
1155                 if (status & 2)
1156                         break;
1157
1158                 DRM_ERROR("VCN decode not responding, trying to reset the VCPU!!!\n");
1159                 WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET),
1160                         UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK,
1161                         ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
1162                 mdelay(10);
1163                 WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET), 0,
1164                         ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
1165                 mdelay(10);
1166                 r = -1;
1167         }
1168
1169         if (r) {
1170                 DRM_ERROR("VCN decode not responding, giving up!!!\n");
1171                 return r;
1172         }
1173
1174         /* enable master interrupt */
1175         WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_MASTINT_EN),
1176                 UVD_MASTINT_EN__VCPU_EN_MASK,
1177                 ~UVD_MASTINT_EN__VCPU_EN_MASK);
1178
1179         /* clear the busy bit of VCN_STATUS */
1180         WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_STATUS), 0,
1181                 ~(2 << UVD_STATUS__VCPU_REPORT__SHIFT));
1182
1183         WREG32_SOC15(UVD, 0, mmUVD_LMI_RBC_RB_VMID, 0);
1184
1185         /* force RBC into idle state */
1186         rb_bufsz = order_base_2(ring->ring_size);
1187         tmp = REG_SET_FIELD(0, UVD_RBC_RB_CNTL, RB_BUFSZ, rb_bufsz);
1188         tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_BLKSZ, 1);
1189         tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_FETCH, 1);
1190         tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_UPDATE, 1);
1191         tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_RPTR_WR_EN, 1);
1192         WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_CNTL, tmp);
1193
1194         /* programm the RB_BASE for ring buffer */
1195         WREG32_SOC15(UVD, 0, mmUVD_LMI_RBC_RB_64BIT_BAR_LOW,
1196                 lower_32_bits(ring->gpu_addr));
1197         WREG32_SOC15(UVD, 0, mmUVD_LMI_RBC_RB_64BIT_BAR_HIGH,
1198                 upper_32_bits(ring->gpu_addr));
1199
1200         /* Initialize the ring buffer's read and write pointers */
1201         WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR, 0);
1202
1203         ring->wptr = RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR);
1204         WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR,
1205                         lower_32_bits(ring->wptr));
1206
1207         ring = &adev->vcn.inst->ring_enc[0];
1208         WREG32_SOC15(UVD, 0, mmUVD_RB_RPTR, lower_32_bits(ring->wptr));
1209         WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR, lower_32_bits(ring->wptr));
1210         WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_LO, ring->gpu_addr);
1211         WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_HI, upper_32_bits(ring->gpu_addr));
1212         WREG32_SOC15(UVD, 0, mmUVD_RB_SIZE, ring->ring_size / 4);
1213
1214         ring = &adev->vcn.inst->ring_enc[1];
1215         WREG32_SOC15(UVD, 0, mmUVD_RB_RPTR2, lower_32_bits(ring->wptr));
1216         WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR2, lower_32_bits(ring->wptr));
1217         WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_LO2, ring->gpu_addr);
1218         WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_HI2, upper_32_bits(ring->gpu_addr));
1219         WREG32_SOC15(UVD, 0, mmUVD_RB_SIZE2, ring->ring_size / 4);
1220
1221 jpeg:
1222         r = jpeg_v2_0_start(adev);
1223
1224         return r;
1225 }
1226
1227 static int vcn_v2_0_stop_dpg_mode(struct amdgpu_device *adev)
1228 {
1229         int ret_code = 0;
1230         uint32_t tmp;
1231
1232         /* Wait for power status to be 1 */
1233         SOC15_WAIT_ON_RREG(UVD, 0, mmUVD_POWER_STATUS, 1,
1234                 UVD_POWER_STATUS__UVD_POWER_STATUS_MASK, ret_code);
1235
1236         /* wait for read ptr to be equal to write ptr */
1237         tmp = RREG32_SOC15(UVD, 0, mmUVD_RB_WPTR);
1238         SOC15_WAIT_ON_RREG(UVD, 0, mmUVD_RB_RPTR, tmp, 0xFFFFFFFF, ret_code);
1239
1240         tmp = RREG32_SOC15(UVD, 0, mmUVD_RB_WPTR2);
1241         SOC15_WAIT_ON_RREG(UVD, 0, mmUVD_RB_RPTR2, tmp, 0xFFFFFFFF, ret_code);
1242
1243         tmp = RREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_WPTR);
1244         SOC15_WAIT_ON_RREG(UVD, 0, mmUVD_JRBC_RB_RPTR, tmp, 0xFFFFFFFF, ret_code);
1245
1246         tmp = RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR) & 0x7FFFFFFF;
1247         SOC15_WAIT_ON_RREG(UVD, 0, mmUVD_RBC_RB_RPTR, tmp, 0xFFFFFFFF, ret_code);
1248
1249         SOC15_WAIT_ON_RREG(UVD, 0, mmUVD_POWER_STATUS, 1,
1250                 UVD_POWER_STATUS__UVD_POWER_STATUS_MASK, ret_code);
1251
1252         /* disable dynamic power gating mode */
1253         WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_POWER_STATUS), 0,
1254                         ~UVD_POWER_STATUS__UVD_PG_MODE_MASK);
1255
1256         return 0;
1257 }
1258
1259 static int vcn_v2_0_stop(struct amdgpu_device *adev)
1260 {
1261         uint32_t tmp;
1262         int r;
1263
1264         r = jpeg_v2_0_stop(adev);
1265         if (r)
1266                 return r;
1267
1268         if (adev->pg_flags & AMD_PG_SUPPORT_VCN_DPG) {
1269                 r = vcn_v2_0_stop_dpg_mode(adev);
1270                 if (r)
1271                         return r;
1272                 goto power_off;
1273         }
1274
1275         /* wait for uvd idle */
1276         SOC15_WAIT_ON_RREG(VCN, 0, mmUVD_STATUS, UVD_STATUS__IDLE, 0x7, r);
1277         if (r)
1278                 return r;
1279
1280         tmp = UVD_LMI_STATUS__VCPU_LMI_WRITE_CLEAN_MASK |
1281                 UVD_LMI_STATUS__READ_CLEAN_MASK |
1282                 UVD_LMI_STATUS__WRITE_CLEAN_MASK |
1283                 UVD_LMI_STATUS__WRITE_CLEAN_RAW_MASK;
1284         SOC15_WAIT_ON_RREG(VCN, 0, mmUVD_LMI_STATUS, tmp, tmp, r);
1285         if (r)
1286                 return r;
1287
1288         /* stall UMC channel */
1289         tmp = RREG32_SOC15(VCN, 0, mmUVD_LMI_CTRL2);
1290         tmp |= UVD_LMI_CTRL2__STALL_ARB_UMC_MASK;
1291         WREG32_SOC15(VCN, 0, mmUVD_LMI_CTRL2, tmp);
1292
1293         tmp = UVD_LMI_STATUS__UMC_READ_CLEAN_RAW_MASK|
1294                 UVD_LMI_STATUS__UMC_WRITE_CLEAN_RAW_MASK;
1295         SOC15_WAIT_ON_RREG(VCN, 0, mmUVD_LMI_STATUS, tmp, tmp, r);
1296         if (r)
1297                 return r;
1298
1299         /* disable VCPU clock */
1300         WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_VCPU_CNTL), 0,
1301                 ~(UVD_VCPU_CNTL__CLK_EN_MASK));
1302
1303         /* reset LMI UMC */
1304         WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET),
1305                 UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK,
1306                 ~UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK);
1307
1308         /* reset LMI */
1309         WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET),
1310                 UVD_SOFT_RESET__LMI_SOFT_RESET_MASK,
1311                 ~UVD_SOFT_RESET__LMI_SOFT_RESET_MASK);
1312
1313         /* reset VCPU */
1314         WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET),
1315                 UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK,
1316                 ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
1317
1318         /* clear status */
1319         WREG32_SOC15(VCN, 0, mmUVD_STATUS, 0);
1320
1321         vcn_v2_0_enable_clock_gating(adev);
1322         vcn_v2_0_enable_static_power_gating(adev);
1323
1324 power_off:
1325         if (adev->pm.dpm_enabled)
1326                 amdgpu_dpm_enable_uvd(adev, false);
1327
1328         return 0;
1329 }
1330
1331 static int vcn_v2_0_pause_dpg_mode(struct amdgpu_device *adev,
1332                                 struct dpg_pause_state *new_state)
1333 {
1334         struct amdgpu_ring *ring;
1335         uint32_t reg_data = 0;
1336         int ret_code;
1337
1338         /* pause/unpause if state is changed */
1339         if (adev->vcn.pause_state.fw_based != new_state->fw_based) {
1340                 DRM_DEBUG("dpg pause state changed %d -> %d",
1341                         adev->vcn.pause_state.fw_based, new_state->fw_based);
1342                 reg_data = RREG32_SOC15(UVD, 0, mmUVD_DPG_PAUSE) &
1343                         (~UVD_DPG_PAUSE__NJ_PAUSE_DPG_ACK_MASK);
1344
1345                 if (new_state->fw_based == VCN_DPG_STATE__PAUSE) {
1346                         ret_code = 0;
1347                         SOC15_WAIT_ON_RREG(UVD, 0, mmUVD_POWER_STATUS, 0x1,
1348                                 UVD_POWER_STATUS__UVD_POWER_STATUS_MASK, ret_code);
1349
1350                         if (!ret_code) {
1351                                 /* pause DPG */
1352                                 reg_data |= UVD_DPG_PAUSE__NJ_PAUSE_DPG_REQ_MASK;
1353                                 WREG32_SOC15(UVD, 0, mmUVD_DPG_PAUSE, reg_data);
1354
1355                                 /* wait for ACK */
1356                                 SOC15_WAIT_ON_RREG(UVD, 0, mmUVD_DPG_PAUSE,
1357                                            UVD_DPG_PAUSE__NJ_PAUSE_DPG_ACK_MASK,
1358                                            UVD_DPG_PAUSE__NJ_PAUSE_DPG_ACK_MASK, ret_code);
1359
1360                                 /* Restore */
1361                                 ring = &adev->vcn.inst->ring_enc[0];
1362                                 WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_LO, ring->gpu_addr);
1363                                 WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_HI, upper_32_bits(ring->gpu_addr));
1364                                 WREG32_SOC15(UVD, 0, mmUVD_RB_SIZE, ring->ring_size / 4);
1365                                 WREG32_SOC15(UVD, 0, mmUVD_RB_RPTR, lower_32_bits(ring->wptr));
1366                                 WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR, lower_32_bits(ring->wptr));
1367
1368                                 ring = &adev->vcn.inst->ring_enc[1];
1369                                 WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_LO2, ring->gpu_addr);
1370                                 WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_HI2, upper_32_bits(ring->gpu_addr));
1371                                 WREG32_SOC15(UVD, 0, mmUVD_RB_SIZE2, ring->ring_size / 4);
1372                                 WREG32_SOC15(UVD, 0, mmUVD_RB_RPTR2, lower_32_bits(ring->wptr));
1373                                 WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR2, lower_32_bits(ring->wptr));
1374
1375                                 WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR,
1376                                            RREG32_SOC15(UVD, 0, mmUVD_SCRATCH2) & 0x7FFFFFFF);
1377
1378                                 SOC15_WAIT_ON_RREG(UVD, 0, mmUVD_POWER_STATUS,
1379                                            UVD_PGFSM_CONFIG__UVDM_UVDU_PWR_ON,
1380                                            UVD_POWER_STATUS__UVD_POWER_STATUS_MASK, ret_code);
1381                         }
1382                 } else {
1383                         /* unpause dpg, no need to wait */
1384                         reg_data &= ~UVD_DPG_PAUSE__NJ_PAUSE_DPG_REQ_MASK;
1385                         WREG32_SOC15(UVD, 0, mmUVD_DPG_PAUSE, reg_data);
1386                 }
1387                 adev->vcn.pause_state.fw_based = new_state->fw_based;
1388         }
1389
1390         return 0;
1391 }
1392
1393 static bool vcn_v2_0_is_idle(void *handle)
1394 {
1395         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1396
1397         return (RREG32_SOC15(VCN, 0, mmUVD_STATUS) == UVD_STATUS__IDLE);
1398 }
1399
1400 static int vcn_v2_0_wait_for_idle(void *handle)
1401 {
1402         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1403         int ret = 0;
1404
1405         SOC15_WAIT_ON_RREG(VCN, 0, mmUVD_STATUS, UVD_STATUS__IDLE,
1406                 UVD_STATUS__IDLE, ret);
1407
1408         return ret;
1409 }
1410
1411 static int vcn_v2_0_set_clockgating_state(void *handle,
1412                                           enum amd_clockgating_state state)
1413 {
1414         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1415         bool enable = (state == AMD_CG_STATE_GATE) ? true : false;
1416
1417         if (enable) {
1418                 /* wait for STATUS to clear */
1419                 if (vcn_v2_0_is_idle(handle))
1420                         return -EBUSY;
1421                 vcn_v2_0_enable_clock_gating(adev);
1422         } else {
1423                 /* disable HW gating and enable Sw gating */
1424                 vcn_v2_0_disable_clock_gating(adev);
1425         }
1426         return 0;
1427 }
1428
1429 /**
1430  * vcn_v2_0_dec_ring_get_rptr - get read pointer
1431  *
1432  * @ring: amdgpu_ring pointer
1433  *
1434  * Returns the current hardware read pointer
1435  */
1436 static uint64_t vcn_v2_0_dec_ring_get_rptr(struct amdgpu_ring *ring)
1437 {
1438         struct amdgpu_device *adev = ring->adev;
1439
1440         return RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR);
1441 }
1442
1443 /**
1444  * vcn_v2_0_dec_ring_get_wptr - get write pointer
1445  *
1446  * @ring: amdgpu_ring pointer
1447  *
1448  * Returns the current hardware write pointer
1449  */
1450 static uint64_t vcn_v2_0_dec_ring_get_wptr(struct amdgpu_ring *ring)
1451 {
1452         struct amdgpu_device *adev = ring->adev;
1453
1454         if (ring->use_doorbell)
1455                 return adev->wb.wb[ring->wptr_offs];
1456         else
1457                 return RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR);
1458 }
1459
1460 /**
1461  * vcn_v2_0_dec_ring_set_wptr - set write pointer
1462  *
1463  * @ring: amdgpu_ring pointer
1464  *
1465  * Commits the write pointer to the hardware
1466  */
1467 static void vcn_v2_0_dec_ring_set_wptr(struct amdgpu_ring *ring)
1468 {
1469         struct amdgpu_device *adev = ring->adev;
1470
1471         if (adev->pg_flags & AMD_PG_SUPPORT_VCN_DPG)
1472                 WREG32_SOC15(UVD, 0, mmUVD_SCRATCH2,
1473                         lower_32_bits(ring->wptr) | 0x80000000);
1474
1475         if (ring->use_doorbell) {
1476                 adev->wb.wb[ring->wptr_offs] = lower_32_bits(ring->wptr);
1477                 WDOORBELL32(ring->doorbell_index, lower_32_bits(ring->wptr));
1478         } else {
1479                 WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR, lower_32_bits(ring->wptr));
1480         }
1481 }
1482
1483 /**
1484  * vcn_v2_0_dec_ring_insert_start - insert a start command
1485  *
1486  * @ring: amdgpu_ring pointer
1487  *
1488  * Write a start command to the ring.
1489  */
1490 void vcn_v2_0_dec_ring_insert_start(struct amdgpu_ring *ring)
1491 {
1492         struct amdgpu_device *adev = ring->adev;
1493
1494         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.data0, 0));
1495         amdgpu_ring_write(ring, 0);
1496         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.cmd, 0));
1497         amdgpu_ring_write(ring, VCN_DEC_KMD_CMD | (VCN_DEC_CMD_PACKET_START << 1));
1498 }
1499
1500 /**
1501  * vcn_v2_0_dec_ring_insert_end - insert a end command
1502  *
1503  * @ring: amdgpu_ring pointer
1504  *
1505  * Write a end command to the ring.
1506  */
1507 void vcn_v2_0_dec_ring_insert_end(struct amdgpu_ring *ring)
1508 {
1509         struct amdgpu_device *adev = ring->adev;
1510
1511         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.cmd, 0));
1512         amdgpu_ring_write(ring, VCN_DEC_KMD_CMD | (VCN_DEC_CMD_PACKET_END << 1));
1513 }
1514
1515 /**
1516  * vcn_v2_0_dec_ring_insert_nop - insert a nop command
1517  *
1518  * @ring: amdgpu_ring pointer
1519  *
1520  * Write a nop command to the ring.
1521  */
1522 void vcn_v2_0_dec_ring_insert_nop(struct amdgpu_ring *ring, uint32_t count)
1523 {
1524         struct amdgpu_device *adev = ring->adev;
1525         int i;
1526
1527         WARN_ON(ring->wptr % 2 || count % 2);
1528
1529         for (i = 0; i < count / 2; i++) {
1530                 amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.nop, 0));
1531                 amdgpu_ring_write(ring, 0);
1532         }
1533 }
1534
1535 /**
1536  * vcn_v2_0_dec_ring_emit_fence - emit an fence & trap command
1537  *
1538  * @ring: amdgpu_ring pointer
1539  * @fence: fence to emit
1540  *
1541  * Write a fence and a trap command to the ring.
1542  */
1543 void vcn_v2_0_dec_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq,
1544                                 unsigned flags)
1545 {
1546         struct amdgpu_device *adev = ring->adev;
1547
1548         WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
1549         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.context_id, 0));
1550         amdgpu_ring_write(ring, seq);
1551
1552         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.data0, 0));
1553         amdgpu_ring_write(ring, addr & 0xffffffff);
1554
1555         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.data1, 0));
1556         amdgpu_ring_write(ring, upper_32_bits(addr) & 0xff);
1557
1558         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.cmd, 0));
1559         amdgpu_ring_write(ring, VCN_DEC_KMD_CMD | (VCN_DEC_CMD_FENCE << 1));
1560
1561         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.data0, 0));
1562         amdgpu_ring_write(ring, 0);
1563
1564         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.data1, 0));
1565         amdgpu_ring_write(ring, 0);
1566
1567         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.cmd, 0));
1568
1569         amdgpu_ring_write(ring, VCN_DEC_KMD_CMD | (VCN_DEC_CMD_TRAP << 1));
1570 }
1571
1572 /**
1573  * vcn_v2_0_dec_ring_emit_ib - execute indirect buffer
1574  *
1575  * @ring: amdgpu_ring pointer
1576  * @ib: indirect buffer to execute
1577  *
1578  * Write ring commands to execute the indirect buffer
1579  */
1580 void vcn_v2_0_dec_ring_emit_ib(struct amdgpu_ring *ring,
1581                                struct amdgpu_job *job,
1582                                struct amdgpu_ib *ib,
1583                                uint32_t flags)
1584 {
1585         struct amdgpu_device *adev = ring->adev;
1586         unsigned vmid = AMDGPU_JOB_GET_VMID(job);
1587
1588         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.ib_vmid, 0));
1589         amdgpu_ring_write(ring, vmid);
1590
1591         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.ib_bar_low, 0));
1592         amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
1593         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.ib_bar_high, 0));
1594         amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
1595         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.ib_size, 0));
1596         amdgpu_ring_write(ring, ib->length_dw);
1597 }
1598
1599 void vcn_v2_0_dec_ring_emit_reg_wait(struct amdgpu_ring *ring, uint32_t reg,
1600                                 uint32_t val, uint32_t mask)
1601 {
1602         struct amdgpu_device *adev = ring->adev;
1603
1604         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.data0, 0));
1605         amdgpu_ring_write(ring, reg << 2);
1606
1607         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.data1, 0));
1608         amdgpu_ring_write(ring, val);
1609
1610         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.gp_scratch8, 0));
1611         amdgpu_ring_write(ring, mask);
1612
1613         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.cmd, 0));
1614
1615         amdgpu_ring_write(ring, VCN_DEC_KMD_CMD | (VCN_DEC_CMD_REG_READ_COND_WAIT << 1));
1616 }
1617
1618 void vcn_v2_0_dec_ring_emit_vm_flush(struct amdgpu_ring *ring,
1619                                 unsigned vmid, uint64_t pd_addr)
1620 {
1621         struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
1622         uint32_t data0, data1, mask;
1623
1624         pd_addr = amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
1625
1626         /* wait for register write */
1627         data0 = hub->ctx0_ptb_addr_lo32 + vmid * 2;
1628         data1 = lower_32_bits(pd_addr);
1629         mask = 0xffffffff;
1630         vcn_v2_0_dec_ring_emit_reg_wait(ring, data0, data1, mask);
1631 }
1632
1633 void vcn_v2_0_dec_ring_emit_wreg(struct amdgpu_ring *ring,
1634                                 uint32_t reg, uint32_t val)
1635 {
1636         struct amdgpu_device *adev = ring->adev;
1637
1638         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.data0, 0));
1639         amdgpu_ring_write(ring, reg << 2);
1640
1641         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.data1, 0));
1642         amdgpu_ring_write(ring, val);
1643
1644         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.cmd, 0));
1645
1646         amdgpu_ring_write(ring, VCN_DEC_KMD_CMD | (VCN_DEC_CMD_WRITE_REG << 1));
1647 }
1648
1649 /**
1650  * vcn_v2_0_enc_ring_get_rptr - get enc read pointer
1651  *
1652  * @ring: amdgpu_ring pointer
1653  *
1654  * Returns the current hardware enc read pointer
1655  */
1656 static uint64_t vcn_v2_0_enc_ring_get_rptr(struct amdgpu_ring *ring)
1657 {
1658         struct amdgpu_device *adev = ring->adev;
1659
1660         if (ring == &adev->vcn.inst->ring_enc[0])
1661                 return RREG32_SOC15(UVD, 0, mmUVD_RB_RPTR);
1662         else
1663                 return RREG32_SOC15(UVD, 0, mmUVD_RB_RPTR2);
1664 }
1665
1666  /**
1667  * vcn_v2_0_enc_ring_get_wptr - get enc write pointer
1668  *
1669  * @ring: amdgpu_ring pointer
1670  *
1671  * Returns the current hardware enc write pointer
1672  */
1673 static uint64_t vcn_v2_0_enc_ring_get_wptr(struct amdgpu_ring *ring)
1674 {
1675         struct amdgpu_device *adev = ring->adev;
1676
1677         if (ring == &adev->vcn.inst->ring_enc[0]) {
1678                 if (ring->use_doorbell)
1679                         return adev->wb.wb[ring->wptr_offs];
1680                 else
1681                         return RREG32_SOC15(UVD, 0, mmUVD_RB_WPTR);
1682         } else {
1683                 if (ring->use_doorbell)
1684                         return adev->wb.wb[ring->wptr_offs];
1685                 else
1686                         return RREG32_SOC15(UVD, 0, mmUVD_RB_WPTR2);
1687         }
1688 }
1689
1690  /**
1691  * vcn_v2_0_enc_ring_set_wptr - set enc write pointer
1692  *
1693  * @ring: amdgpu_ring pointer
1694  *
1695  * Commits the enc write pointer to the hardware
1696  */
1697 static void vcn_v2_0_enc_ring_set_wptr(struct amdgpu_ring *ring)
1698 {
1699         struct amdgpu_device *adev = ring->adev;
1700
1701         if (ring == &adev->vcn.inst->ring_enc[0]) {
1702                 if (ring->use_doorbell) {
1703                         adev->wb.wb[ring->wptr_offs] = lower_32_bits(ring->wptr);
1704                         WDOORBELL32(ring->doorbell_index, lower_32_bits(ring->wptr));
1705                 } else {
1706                         WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR, lower_32_bits(ring->wptr));
1707                 }
1708         } else {
1709                 if (ring->use_doorbell) {
1710                         adev->wb.wb[ring->wptr_offs] = lower_32_bits(ring->wptr);
1711                         WDOORBELL32(ring->doorbell_index, lower_32_bits(ring->wptr));
1712                 } else {
1713                         WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR2, lower_32_bits(ring->wptr));
1714                 }
1715         }
1716 }
1717
1718 /**
1719  * vcn_v2_0_enc_ring_emit_fence - emit an enc fence & trap command
1720  *
1721  * @ring: amdgpu_ring pointer
1722  * @fence: fence to emit
1723  *
1724  * Write enc a fence and a trap command to the ring.
1725  */
1726 void vcn_v2_0_enc_ring_emit_fence(struct amdgpu_ring *ring, u64 addr,
1727                                 u64 seq, unsigned flags)
1728 {
1729         WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
1730
1731         amdgpu_ring_write(ring, VCN_ENC_CMD_FENCE);
1732         amdgpu_ring_write(ring, addr);
1733         amdgpu_ring_write(ring, upper_32_bits(addr));
1734         amdgpu_ring_write(ring, seq);
1735         amdgpu_ring_write(ring, VCN_ENC_CMD_TRAP);
1736 }
1737
1738 void vcn_v2_0_enc_ring_insert_end(struct amdgpu_ring *ring)
1739 {
1740         amdgpu_ring_write(ring, VCN_ENC_CMD_END);
1741 }
1742
1743 /**
1744  * vcn_v2_0_enc_ring_emit_ib - enc execute indirect buffer
1745  *
1746  * @ring: amdgpu_ring pointer
1747  * @ib: indirect buffer to execute
1748  *
1749  * Write enc ring commands to execute the indirect buffer
1750  */
1751 void vcn_v2_0_enc_ring_emit_ib(struct amdgpu_ring *ring,
1752                                struct amdgpu_job *job,
1753                                struct amdgpu_ib *ib,
1754                                uint32_t flags)
1755 {
1756         unsigned vmid = AMDGPU_JOB_GET_VMID(job);
1757
1758         amdgpu_ring_write(ring, VCN_ENC_CMD_IB);
1759         amdgpu_ring_write(ring, vmid);
1760         amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
1761         amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
1762         amdgpu_ring_write(ring, ib->length_dw);
1763 }
1764
1765 void vcn_v2_0_enc_ring_emit_reg_wait(struct amdgpu_ring *ring, uint32_t reg,
1766                                 uint32_t val, uint32_t mask)
1767 {
1768         amdgpu_ring_write(ring, VCN_ENC_CMD_REG_WAIT);
1769         amdgpu_ring_write(ring, reg << 2);
1770         amdgpu_ring_write(ring, mask);
1771         amdgpu_ring_write(ring, val);
1772 }
1773
1774 void vcn_v2_0_enc_ring_emit_vm_flush(struct amdgpu_ring *ring,
1775                                 unsigned int vmid, uint64_t pd_addr)
1776 {
1777         struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
1778
1779         pd_addr = amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
1780
1781         /* wait for reg writes */
1782         vcn_v2_0_enc_ring_emit_reg_wait(ring, hub->ctx0_ptb_addr_lo32 + vmid * 2,
1783                                         lower_32_bits(pd_addr), 0xffffffff);
1784 }
1785
1786 void vcn_v2_0_enc_ring_emit_wreg(struct amdgpu_ring *ring, uint32_t reg, uint32_t val)
1787 {
1788         amdgpu_ring_write(ring, VCN_ENC_CMD_REG_WRITE);
1789         amdgpu_ring_write(ring, reg << 2);
1790         amdgpu_ring_write(ring, val);
1791 }
1792
1793 /**
1794  * vcn_v2_0_jpeg_ring_get_rptr - get read pointer
1795  *
1796  * @ring: amdgpu_ring pointer
1797  *
1798  * Returns the current hardware read pointer
1799  */
1800 static uint64_t vcn_v2_0_jpeg_ring_get_rptr(struct amdgpu_ring *ring)
1801 {
1802         struct amdgpu_device *adev = ring->adev;
1803
1804         return RREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_RPTR);
1805 }
1806
1807 /**
1808  * vcn_v2_0_jpeg_ring_get_wptr - get write pointer
1809  *
1810  * @ring: amdgpu_ring pointer
1811  *
1812  * Returns the current hardware write pointer
1813  */
1814 static uint64_t vcn_v2_0_jpeg_ring_get_wptr(struct amdgpu_ring *ring)
1815 {
1816         struct amdgpu_device *adev = ring->adev;
1817
1818         if (ring->use_doorbell)
1819                 return adev->wb.wb[ring->wptr_offs];
1820         else
1821                 return RREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_WPTR);
1822 }
1823
1824 /**
1825  * vcn_v2_0_jpeg_ring_set_wptr - set write pointer
1826  *
1827  * @ring: amdgpu_ring pointer
1828  *
1829  * Commits the write pointer to the hardware
1830  */
1831 static void vcn_v2_0_jpeg_ring_set_wptr(struct amdgpu_ring *ring)
1832 {
1833         struct amdgpu_device *adev = ring->adev;
1834
1835         if (ring->use_doorbell) {
1836                 adev->wb.wb[ring->wptr_offs] = lower_32_bits(ring->wptr);
1837                 WDOORBELL32(ring->doorbell_index, lower_32_bits(ring->wptr));
1838         } else {
1839                 WREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_WPTR, lower_32_bits(ring->wptr));
1840         }
1841 }
1842
1843 /**
1844  * vcn_v2_0_jpeg_ring_insert_start - insert a start command
1845  *
1846  * @ring: amdgpu_ring pointer
1847  *
1848  * Write a start command to the ring.
1849  */
1850 void vcn_v2_0_jpeg_ring_insert_start(struct amdgpu_ring *ring)
1851 {
1852         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
1853                 0, 0, PACKETJ_TYPE0));
1854         amdgpu_ring_write(ring, 0x68e04);
1855
1856         amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
1857                 0, 0, PACKETJ_TYPE0));
1858         amdgpu_ring_write(ring, 0x80010000);
1859 }
1860
1861 /**
1862  * vcn_v2_0_jpeg_ring_insert_end - insert a end command
1863  *
1864  * @ring: amdgpu_ring pointer
1865  *
1866  * Write a end command to the ring.
1867  */
1868 void vcn_v2_0_jpeg_ring_insert_end(struct amdgpu_ring *ring)
1869 {
1870         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
1871                 0, 0, PACKETJ_TYPE0));
1872         amdgpu_ring_write(ring, 0x68e04);
1873
1874         amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
1875                 0, 0, PACKETJ_TYPE0));
1876         amdgpu_ring_write(ring, 0x00010000);
1877 }
1878
1879 /**
1880  * vcn_v2_0_jpeg_ring_emit_fence - emit an fence & trap command
1881  *
1882  * @ring: amdgpu_ring pointer
1883  * @fence: fence to emit
1884  *
1885  * Write a fence and a trap command to the ring.
1886  */
1887 void vcn_v2_0_jpeg_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq,
1888                                 unsigned flags)
1889 {
1890         WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
1891
1892         amdgpu_ring_write(ring, PACKETJ(mmUVD_JPEG_GPCOM_DATA0_INTERNAL_OFFSET,
1893                 0, 0, PACKETJ_TYPE0));
1894         amdgpu_ring_write(ring, seq);
1895
1896         amdgpu_ring_write(ring, PACKETJ(mmUVD_JPEG_GPCOM_DATA1_INTERNAL_OFFSET,
1897                 0, 0, PACKETJ_TYPE0));
1898         amdgpu_ring_write(ring, seq);
1899
1900         amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_RB_MEM_WR_64BIT_BAR_LOW_INTERNAL_OFFSET,
1901                 0, 0, PACKETJ_TYPE0));
1902         amdgpu_ring_write(ring, lower_32_bits(addr));
1903
1904         amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_RB_MEM_WR_64BIT_BAR_HIGH_INTERNAL_OFFSET,
1905                 0, 0, PACKETJ_TYPE0));
1906         amdgpu_ring_write(ring, upper_32_bits(addr));
1907
1908         amdgpu_ring_write(ring, PACKETJ(mmUVD_JPEG_GPCOM_CMD_INTERNAL_OFFSET,
1909                 0, 0, PACKETJ_TYPE0));
1910         amdgpu_ring_write(ring, 0x8);
1911
1912         amdgpu_ring_write(ring, PACKETJ(mmUVD_JPEG_GPCOM_CMD_INTERNAL_OFFSET,
1913                 0, PACKETJ_CONDITION_CHECK0, PACKETJ_TYPE4));
1914         amdgpu_ring_write(ring, 0);
1915
1916         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
1917                 0, 0, PACKETJ_TYPE0));
1918         amdgpu_ring_write(ring, 0x3fbc);
1919
1920         amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
1921                 0, 0, PACKETJ_TYPE0));
1922         amdgpu_ring_write(ring, 0x1);
1923
1924         amdgpu_ring_write(ring, PACKETJ(0, 0, 0, PACKETJ_TYPE7));
1925         amdgpu_ring_write(ring, 0);
1926 }
1927
1928 /**
1929  * vcn_v2_0_jpeg_ring_emit_ib - execute indirect buffer
1930  *
1931  * @ring: amdgpu_ring pointer
1932  * @ib: indirect buffer to execute
1933  *
1934  * Write ring commands to execute the indirect buffer.
1935  */
1936 void vcn_v2_0_jpeg_ring_emit_ib(struct amdgpu_ring *ring,
1937                                 struct amdgpu_job *job,
1938                                 struct amdgpu_ib *ib,
1939                                 uint32_t flags)
1940 {
1941         unsigned vmid = AMDGPU_JOB_GET_VMID(job);
1942
1943         amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_IB_VMID_INTERNAL_OFFSET,
1944                 0, 0, PACKETJ_TYPE0));
1945         amdgpu_ring_write(ring, (vmid | (vmid << 4)));
1946
1947         amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JPEG_VMID_INTERNAL_OFFSET,
1948                 0, 0, PACKETJ_TYPE0));
1949         amdgpu_ring_write(ring, (vmid | (vmid << 4)));
1950
1951         amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_IB_64BIT_BAR_LOW_INTERNAL_OFFSET,
1952                 0, 0, PACKETJ_TYPE0));
1953         amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
1954
1955         amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_IB_64BIT_BAR_HIGH_INTERNAL_OFFSET,
1956                 0, 0, PACKETJ_TYPE0));
1957         amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
1958
1959         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_IB_SIZE_INTERNAL_OFFSET,
1960                 0, 0, PACKETJ_TYPE0));
1961         amdgpu_ring_write(ring, ib->length_dw);
1962
1963         amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_LOW_INTERNAL_OFFSET,
1964                 0, 0, PACKETJ_TYPE0));
1965         amdgpu_ring_write(ring, lower_32_bits(ring->gpu_addr));
1966
1967         amdgpu_ring_write(ring, PACKETJ(mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_HIGH_INTERNAL_OFFSET,
1968                 0, 0, PACKETJ_TYPE0));
1969         amdgpu_ring_write(ring, upper_32_bits(ring->gpu_addr));
1970
1971         amdgpu_ring_write(ring, PACKETJ(0, 0, PACKETJ_CONDITION_CHECK0, PACKETJ_TYPE2));
1972         amdgpu_ring_write(ring, 0);
1973
1974         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_RB_COND_RD_TIMER_INTERNAL_OFFSET,
1975                 0, 0, PACKETJ_TYPE0));
1976         amdgpu_ring_write(ring, 0x01400200);
1977
1978         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_RB_REF_DATA_INTERNAL_OFFSET,
1979                 0, 0, PACKETJ_TYPE0));
1980         amdgpu_ring_write(ring, 0x2);
1981
1982         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_STATUS_INTERNAL_OFFSET,
1983                 0, PACKETJ_CONDITION_CHECK3, PACKETJ_TYPE3));
1984         amdgpu_ring_write(ring, 0x2);
1985 }
1986
1987 void vcn_v2_0_jpeg_ring_emit_reg_wait(struct amdgpu_ring *ring, uint32_t reg,
1988                                 uint32_t val, uint32_t mask)
1989 {
1990         uint32_t reg_offset = (reg << 2);
1991
1992         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_RB_COND_RD_TIMER_INTERNAL_OFFSET,
1993                 0, 0, PACKETJ_TYPE0));
1994         amdgpu_ring_write(ring, 0x01400200);
1995
1996         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_RB_REF_DATA_INTERNAL_OFFSET,
1997                 0, 0, PACKETJ_TYPE0));
1998         amdgpu_ring_write(ring, val);
1999
2000         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
2001                 0, 0, PACKETJ_TYPE0));
2002         if (reg_offset >= 0x10000 && reg_offset <= 0x105ff) {
2003                 amdgpu_ring_write(ring, 0);
2004                 amdgpu_ring_write(ring,
2005                         PACKETJ((reg_offset >> 2), 0, 0, PACKETJ_TYPE3));
2006         } else {
2007                 amdgpu_ring_write(ring, reg_offset);
2008                 amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
2009                         0, 0, PACKETJ_TYPE3));
2010         }
2011         amdgpu_ring_write(ring, mask);
2012 }
2013
2014 void vcn_v2_0_jpeg_ring_emit_vm_flush(struct amdgpu_ring *ring,
2015                                 unsigned vmid, uint64_t pd_addr)
2016 {
2017         struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
2018         uint32_t data0, data1, mask;
2019
2020         pd_addr = amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
2021
2022         /* wait for register write */
2023         data0 = hub->ctx0_ptb_addr_lo32 + vmid * 2;
2024         data1 = lower_32_bits(pd_addr);
2025         mask = 0xffffffff;
2026         vcn_v2_0_jpeg_ring_emit_reg_wait(ring, data0, data1, mask);
2027 }
2028
2029 void vcn_v2_0_jpeg_ring_emit_wreg(struct amdgpu_ring *ring, uint32_t reg, uint32_t val)
2030 {
2031         uint32_t reg_offset = (reg << 2);
2032
2033         amdgpu_ring_write(ring, PACKETJ(mmUVD_JRBC_EXTERNAL_REG_INTERNAL_OFFSET,
2034                 0, 0, PACKETJ_TYPE0));
2035         if (reg_offset >= 0x10000 && reg_offset <= 0x105ff) {
2036                 amdgpu_ring_write(ring, 0);
2037                 amdgpu_ring_write(ring,
2038                         PACKETJ((reg_offset >> 2), 0, 0, PACKETJ_TYPE0));
2039         } else {
2040                 amdgpu_ring_write(ring, reg_offset);
2041                 amdgpu_ring_write(ring, PACKETJ(JRBC_DEC_EXTERNAL_REG_WRITE_ADDR,
2042                         0, 0, PACKETJ_TYPE0));
2043         }
2044         amdgpu_ring_write(ring, val);
2045 }
2046
2047 void vcn_v2_0_jpeg_ring_nop(struct amdgpu_ring *ring, uint32_t count)
2048 {
2049         int i;
2050
2051         WARN_ON(ring->wptr % 2 || count % 2);
2052
2053         for (i = 0; i < count / 2; i++) {
2054                 amdgpu_ring_write(ring, PACKETJ(0, 0, 0, PACKETJ_TYPE6));
2055                 amdgpu_ring_write(ring, 0);
2056         }
2057 }
2058
2059 static int vcn_v2_0_set_interrupt_state(struct amdgpu_device *adev,
2060                                         struct amdgpu_irq_src *source,
2061                                         unsigned type,
2062                                         enum amdgpu_interrupt_state state)
2063 {
2064         return 0;
2065 }
2066
2067 static int vcn_v2_0_process_interrupt(struct amdgpu_device *adev,
2068                                       struct amdgpu_irq_src *source,
2069                                       struct amdgpu_iv_entry *entry)
2070 {
2071         DRM_DEBUG("IH: VCN TRAP\n");
2072
2073         switch (entry->src_id) {
2074         case VCN_2_0__SRCID__UVD_SYSTEM_MESSAGE_INTERRUPT:
2075                 amdgpu_fence_process(&adev->vcn.inst->ring_dec);
2076                 break;
2077         case VCN_2_0__SRCID__UVD_ENC_GENERAL_PURPOSE:
2078                 amdgpu_fence_process(&adev->vcn.inst->ring_enc[0]);
2079                 break;
2080         case VCN_2_0__SRCID__UVD_ENC_LOW_LATENCY:
2081                 amdgpu_fence_process(&adev->vcn.inst->ring_enc[1]);
2082                 break;
2083         case VCN_2_0__SRCID__JPEG_DECODE:
2084                 amdgpu_fence_process(&adev->vcn.inst->ring_jpeg);
2085                 break;
2086         default:
2087                 DRM_ERROR("Unhandled interrupt: %d %d\n",
2088                           entry->src_id, entry->src_data[0]);
2089                 break;
2090         }
2091
2092         return 0;
2093 }
2094
2095 static int vcn_v2_0_dec_ring_test_ring(struct amdgpu_ring *ring)
2096 {
2097         struct amdgpu_device *adev = ring->adev;
2098         uint32_t tmp = 0;
2099         unsigned i;
2100         int r;
2101
2102         WREG32(adev->vcn.inst[ring->me].external.scratch9, 0xCAFEDEAD);
2103         r = amdgpu_ring_alloc(ring, 4);
2104         if (r)
2105                 return r;
2106         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.cmd, 0));
2107         amdgpu_ring_write(ring, VCN_DEC_KMD_CMD | (VCN_DEC_CMD_PACKET_START << 1));
2108         amdgpu_ring_write(ring, PACKET0(adev->vcn.internal.scratch9, 0));
2109         amdgpu_ring_write(ring, 0xDEADBEEF);
2110         amdgpu_ring_commit(ring);
2111         for (i = 0; i < adev->usec_timeout; i++) {
2112                 tmp = RREG32(adev->vcn.inst[ring->me].external.scratch9);
2113                 if (tmp == 0xDEADBEEF)
2114                         break;
2115                 udelay(1);
2116         }
2117
2118         if (i >= adev->usec_timeout)
2119                 r = -ETIMEDOUT;
2120
2121         return r;
2122 }
2123
2124
2125 static int vcn_v2_0_set_powergating_state(void *handle,
2126                                           enum amd_powergating_state state)
2127 {
2128         /* This doesn't actually powergate the VCN block.
2129          * That's done in the dpm code via the SMC.  This
2130          * just re-inits the block as necessary.  The actual
2131          * gating still happens in the dpm code.  We should
2132          * revisit this when there is a cleaner line between
2133          * the smc and the hw blocks
2134          */
2135         int ret;
2136         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
2137
2138         if (state == adev->vcn.cur_state)
2139                 return 0;
2140
2141         if (state == AMD_PG_STATE_GATE)
2142                 ret = vcn_v2_0_stop(adev);
2143         else
2144                 ret = vcn_v2_0_start(adev);
2145
2146         if (!ret)
2147                 adev->vcn.cur_state = state;
2148         return ret;
2149 }
2150
2151 static const struct amd_ip_funcs vcn_v2_0_ip_funcs = {
2152         .name = "vcn_v2_0",
2153         .early_init = vcn_v2_0_early_init,
2154         .late_init = NULL,
2155         .sw_init = vcn_v2_0_sw_init,
2156         .sw_fini = vcn_v2_0_sw_fini,
2157         .hw_init = vcn_v2_0_hw_init,
2158         .hw_fini = vcn_v2_0_hw_fini,
2159         .suspend = vcn_v2_0_suspend,
2160         .resume = vcn_v2_0_resume,
2161         .is_idle = vcn_v2_0_is_idle,
2162         .wait_for_idle = vcn_v2_0_wait_for_idle,
2163         .check_soft_reset = NULL,
2164         .pre_soft_reset = NULL,
2165         .soft_reset = NULL,
2166         .post_soft_reset = NULL,
2167         .set_clockgating_state = vcn_v2_0_set_clockgating_state,
2168         .set_powergating_state = vcn_v2_0_set_powergating_state,
2169 };
2170
2171 static const struct amdgpu_ring_funcs vcn_v2_0_dec_ring_vm_funcs = {
2172         .type = AMDGPU_RING_TYPE_VCN_DEC,
2173         .align_mask = 0xf,
2174         .vmhub = AMDGPU_MMHUB_0,
2175         .get_rptr = vcn_v2_0_dec_ring_get_rptr,
2176         .get_wptr = vcn_v2_0_dec_ring_get_wptr,
2177         .set_wptr = vcn_v2_0_dec_ring_set_wptr,
2178         .emit_frame_size =
2179                 SOC15_FLUSH_GPU_TLB_NUM_WREG * 6 +
2180                 SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 8 +
2181                 8 + /* vcn_v2_0_dec_ring_emit_vm_flush */
2182                 14 + 14 + /* vcn_v2_0_dec_ring_emit_fence x2 vm fence */
2183                 6,
2184         .emit_ib_size = 8, /* vcn_v2_0_dec_ring_emit_ib */
2185         .emit_ib = vcn_v2_0_dec_ring_emit_ib,
2186         .emit_fence = vcn_v2_0_dec_ring_emit_fence,
2187         .emit_vm_flush = vcn_v2_0_dec_ring_emit_vm_flush,
2188         .test_ring = vcn_v2_0_dec_ring_test_ring,
2189         .test_ib = amdgpu_vcn_dec_ring_test_ib,
2190         .insert_nop = vcn_v2_0_dec_ring_insert_nop,
2191         .insert_start = vcn_v2_0_dec_ring_insert_start,
2192         .insert_end = vcn_v2_0_dec_ring_insert_end,
2193         .pad_ib = amdgpu_ring_generic_pad_ib,
2194         .begin_use = amdgpu_vcn_ring_begin_use,
2195         .end_use = amdgpu_vcn_ring_end_use,
2196         .emit_wreg = vcn_v2_0_dec_ring_emit_wreg,
2197         .emit_reg_wait = vcn_v2_0_dec_ring_emit_reg_wait,
2198         .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
2199 };
2200
2201 static const struct amdgpu_ring_funcs vcn_v2_0_enc_ring_vm_funcs = {
2202         .type = AMDGPU_RING_TYPE_VCN_ENC,
2203         .align_mask = 0x3f,
2204         .nop = VCN_ENC_CMD_NO_OP,
2205         .vmhub = AMDGPU_MMHUB_0,
2206         .get_rptr = vcn_v2_0_enc_ring_get_rptr,
2207         .get_wptr = vcn_v2_0_enc_ring_get_wptr,
2208         .set_wptr = vcn_v2_0_enc_ring_set_wptr,
2209         .emit_frame_size =
2210                 SOC15_FLUSH_GPU_TLB_NUM_WREG * 3 +
2211                 SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 4 +
2212                 4 + /* vcn_v2_0_enc_ring_emit_vm_flush */
2213                 5 + 5 + /* vcn_v2_0_enc_ring_emit_fence x2 vm fence */
2214                 1, /* vcn_v2_0_enc_ring_insert_end */
2215         .emit_ib_size = 5, /* vcn_v2_0_enc_ring_emit_ib */
2216         .emit_ib = vcn_v2_0_enc_ring_emit_ib,
2217         .emit_fence = vcn_v2_0_enc_ring_emit_fence,
2218         .emit_vm_flush = vcn_v2_0_enc_ring_emit_vm_flush,
2219         .test_ring = amdgpu_vcn_enc_ring_test_ring,
2220         .test_ib = amdgpu_vcn_enc_ring_test_ib,
2221         .insert_nop = amdgpu_ring_insert_nop,
2222         .insert_end = vcn_v2_0_enc_ring_insert_end,
2223         .pad_ib = amdgpu_ring_generic_pad_ib,
2224         .begin_use = amdgpu_vcn_ring_begin_use,
2225         .end_use = amdgpu_vcn_ring_end_use,
2226         .emit_wreg = vcn_v2_0_enc_ring_emit_wreg,
2227         .emit_reg_wait = vcn_v2_0_enc_ring_emit_reg_wait,
2228         .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
2229 };
2230
2231 static const struct amdgpu_ring_funcs vcn_v2_0_jpeg_ring_vm_funcs = {
2232         .type = AMDGPU_RING_TYPE_VCN_JPEG,
2233         .align_mask = 0xf,
2234         .vmhub = AMDGPU_MMHUB_0,
2235         .get_rptr = vcn_v2_0_jpeg_ring_get_rptr,
2236         .get_wptr = vcn_v2_0_jpeg_ring_get_wptr,
2237         .set_wptr = vcn_v2_0_jpeg_ring_set_wptr,
2238         .emit_frame_size =
2239                 SOC15_FLUSH_GPU_TLB_NUM_WREG * 6 +
2240                 SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 8 +
2241                 8 + /* vcn_v2_0_jpeg_ring_emit_vm_flush */
2242                 18 + 18 + /* vcn_v2_0_jpeg_ring_emit_fence x2 vm fence */
2243                 8 + 16,
2244         .emit_ib_size = 22, /* vcn_v2_0_jpeg_ring_emit_ib */
2245         .emit_ib = vcn_v2_0_jpeg_ring_emit_ib,
2246         .emit_fence = vcn_v2_0_jpeg_ring_emit_fence,
2247         .emit_vm_flush = vcn_v2_0_jpeg_ring_emit_vm_flush,
2248         .test_ring = amdgpu_vcn_jpeg_ring_test_ring,
2249         .test_ib = amdgpu_vcn_jpeg_ring_test_ib,
2250         .insert_nop = vcn_v2_0_jpeg_ring_nop,
2251         .insert_start = vcn_v2_0_jpeg_ring_insert_start,
2252         .insert_end = vcn_v2_0_jpeg_ring_insert_end,
2253         .pad_ib = amdgpu_ring_generic_pad_ib,
2254         .begin_use = amdgpu_vcn_ring_begin_use,
2255         .end_use = amdgpu_vcn_ring_end_use,
2256         .emit_wreg = vcn_v2_0_jpeg_ring_emit_wreg,
2257         .emit_reg_wait = vcn_v2_0_jpeg_ring_emit_reg_wait,
2258         .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
2259 };
2260
2261 static void vcn_v2_0_set_dec_ring_funcs(struct amdgpu_device *adev)
2262 {
2263         adev->vcn.inst->ring_dec.funcs = &vcn_v2_0_dec_ring_vm_funcs;
2264         DRM_INFO("VCN decode is enabled in VM mode\n");
2265 }
2266
2267 static void vcn_v2_0_set_enc_ring_funcs(struct amdgpu_device *adev)
2268 {
2269         int i;
2270
2271         for (i = 0; i < adev->vcn.num_enc_rings; ++i)
2272                 adev->vcn.inst->ring_enc[i].funcs = &vcn_v2_0_enc_ring_vm_funcs;
2273
2274         DRM_INFO("VCN encode is enabled in VM mode\n");
2275 }
2276
2277 static void vcn_v2_0_set_jpeg_ring_funcs(struct amdgpu_device *adev)
2278 {
2279         adev->vcn.inst->ring_jpeg.funcs = &vcn_v2_0_jpeg_ring_vm_funcs;
2280         DRM_INFO("VCN jpeg decode is enabled in VM mode\n");
2281 }
2282
2283 static const struct amdgpu_irq_src_funcs vcn_v2_0_irq_funcs = {
2284         .set = vcn_v2_0_set_interrupt_state,
2285         .process = vcn_v2_0_process_interrupt,
2286 };
2287
2288 static void vcn_v2_0_set_irq_funcs(struct amdgpu_device *adev)
2289 {
2290         adev->vcn.inst->irq.num_types = adev->vcn.num_enc_rings + 2;
2291         adev->vcn.inst->irq.funcs = &vcn_v2_0_irq_funcs;
2292 }
2293
2294 const struct amdgpu_ip_block_version vcn_v2_0_ip_block =
2295 {
2296                 .type = AMD_IP_BLOCK_TYPE_VCN,
2297                 .major = 2,
2298                 .minor = 0,
2299                 .rev = 0,
2300                 .funcs = &vcn_v2_0_ip_funcs,
2301 };