/*
 * Copyright 2013 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 * Authors: Christian König <christian.koenig@amd.com>
 */

#include <linux/firmware.h>

#include "amdgpu.h"
#include "amdgpu_uvd.h"
#include "cikd.h"

#include "uvd/uvd_4_2_d.h"
#include "uvd/uvd_4_2_sh_mask.h"

#include "oss/oss_2_0_d.h"
#include "oss/oss_2_0_sh_mask.h"

#include "bif/bif_4_1_d.h"

#include "smu/smu_7_0_1_d.h"
#include "smu/smu_7_0_1_sh_mask.h"

static void uvd_v4_2_mc_resume(struct amdgpu_device *adev);
static void uvd_v4_2_set_ring_funcs(struct amdgpu_device *adev);
static void uvd_v4_2_set_irq_funcs(struct amdgpu_device *adev);
static int uvd_v4_2_start(struct amdgpu_device *adev);
static void uvd_v4_2_stop(struct amdgpu_device *adev);
static int uvd_v4_2_set_clockgating_state(void *handle,
				enum amd_clockgating_state state);
static void uvd_v4_2_set_dcm(struct amdgpu_device *adev,
			     bool sw_mode);
/**
 * uvd_v4_2_ring_get_rptr - get read pointer
 *
 * @ring: amdgpu_ring pointer
 *
 * Returns the current hardware read pointer
 */
static uint64_t uvd_v4_2_ring_get_rptr(struct amdgpu_ring *ring)
{
	struct amdgpu_device *adev = ring->adev;

	return RREG32(mmUVD_RBC_RB_RPTR);
}

/**
 * uvd_v4_2_ring_get_wptr - get write pointer
 *
 * @ring: amdgpu_ring pointer
 *
 * Returns the current hardware write pointer
 */
static uint64_t uvd_v4_2_ring_get_wptr(struct amdgpu_ring *ring)
{
	struct amdgpu_device *adev = ring->adev;

	return RREG32(mmUVD_RBC_RB_WPTR);
}

/**
 * uvd_v4_2_ring_set_wptr - set write pointer
 *
 * @ring: amdgpu_ring pointer
 *
 * Commits the write pointer to the hardware
 */
static void uvd_v4_2_ring_set_wptr(struct amdgpu_ring *ring)
{
	struct amdgpu_device *adev = ring->adev;

	WREG32(mmUVD_RBC_RB_WPTR, lower_32_bits(ring->wptr));
}
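
/*
 * Note: UVD 4.2 keeps both ring pointers entirely in MMIO registers and
 * only supports 32-bit pointers (support_64bit_ptrs = false in the ring
 * funcs below), which is why set_wptr writes just the lower 32 bits of
 * ring->wptr.
 */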

static int uvd_v4_2_early_init(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
	adev->uvd.num_uvd_inst = 1;

	uvd_v4_2_set_ring_funcs(adev);
	uvd_v4_2_set_irq_funcs(adev);

	return 0;
}

static int uvd_v4_2_sw_init(void *handle)
{
	struct amdgpu_ring *ring;
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
	int r;

	/* UVD TRAP */
	r = amdgpu_irq_add_id(adev, AMDGPU_IRQ_CLIENTID_LEGACY, 124, &adev->uvd.inst->irq);
	if (r)
		return r;

	r = amdgpu_uvd_sw_init(adev);
	if (r)
		return r;

	ring = &adev->uvd.inst->ring;
	sprintf(ring->name, "uvd");
	r = amdgpu_ring_init(adev, ring, 512, &adev->uvd.inst->irq, 0,
			     AMDGPU_RING_PRIO_DEFAULT, NULL);
	if (r)
		return r;

	r = amdgpu_uvd_resume(adev);
	if (r)
		return r;

	r = amdgpu_uvd_entity_init(adev);

	return r;
}

static int uvd_v4_2_sw_fini(void *handle)
{
	int r;
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

	r = amdgpu_uvd_suspend(adev);
	if (r)
		return r;

	return amdgpu_uvd_sw_fini(adev);
}

static void uvd_v4_2_enable_mgcg(struct amdgpu_device *adev,
				 bool enable);
/**
 * uvd_v4_2_hw_init - start and test UVD block
 *
 * @handle: handle used to pass amdgpu_device pointer
 *
 * Initialize the hardware, boot up the VCPU and do some testing
 */
static int uvd_v4_2_hw_init(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
	struct amdgpu_ring *ring = &adev->uvd.inst->ring;
	uint32_t tmp;
	int r;

	uvd_v4_2_enable_mgcg(adev, true);
	amdgpu_asic_set_uvd_clocks(adev, 10000, 10000);

	r = amdgpu_ring_test_helper(ring);
	if (r)
		goto done;

	r = amdgpu_ring_alloc(ring, 10);
	if (r) {
		DRM_ERROR("amdgpu: ring failed to lock UVD ring (%d).\n", r);
		goto done;
	}

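	/*
	 * PACKET0(reg, n) emits a type-0 packet that writes n+1 DWORDs to
	 * consecutive registers starting at reg; each header/data pair below
	 * programs one semaphore timeout register with 0xFFFFF.
	 */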
	tmp = PACKET0(mmUVD_SEMA_WAIT_FAULT_TIMEOUT_CNTL, 0);
	amdgpu_ring_write(ring, tmp);
	amdgpu_ring_write(ring, 0xFFFFF);

	tmp = PACKET0(mmUVD_SEMA_WAIT_INCOMPLETE_TIMEOUT_CNTL, 0);
	amdgpu_ring_write(ring, tmp);
	amdgpu_ring_write(ring, 0xFFFFF);

	tmp = PACKET0(mmUVD_SEMA_SIGNAL_INCOMPLETE_TIMEOUT_CNTL, 0);
	amdgpu_ring_write(ring, tmp);
	amdgpu_ring_write(ring, 0xFFFFF);

	/* Clear timeout status bits */
	amdgpu_ring_write(ring, PACKET0(mmUVD_SEMA_TIMEOUT_STATUS, 0));
	amdgpu_ring_write(ring, 0x8);

	amdgpu_ring_write(ring, PACKET0(mmUVD_SEMA_CNTL, 0));
	amdgpu_ring_write(ring, 3);

	amdgpu_ring_commit(ring);

done:
	if (!r)
		DRM_INFO("UVD initialized successfully.\n");

	return r;
}

/**
 * uvd_v4_2_hw_fini - stop the hardware block
 *
 * @handle: handle used to pass amdgpu_device pointer
 *
 * Stop the UVD block, mark ring as not ready any more
 */
static int uvd_v4_2_hw_fini(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

	cancel_delayed_work_sync(&adev->uvd.idle_work);

	if (RREG32(mmUVD_STATUS) != 0)
		uvd_v4_2_stop(adev);

	return 0;
}

static int uvd_v4_2_suspend(void *handle)
{
	int r;
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

	/*
	 * Proper cleanups before halting the HW engine:
	 *   - cancel the delayed idle work
	 *   - enable powergating
	 *   - enable clockgating
	 *   - disable dpm
	 *
	 * TODO: to align with the VCN implementation, move the
	 * jobs for clockgating/powergating/dpm setting to
	 * ->set_powergating_state().
	 */
	cancel_delayed_work_sync(&adev->uvd.idle_work);

	if (adev->pm.dpm_enabled) {
		amdgpu_dpm_enable_uvd(adev, false);
	} else {
		amdgpu_asic_set_uvd_clocks(adev, 0, 0);
		/* shutdown the UVD block */
		amdgpu_device_ip_set_powergating_state(adev, AMD_IP_BLOCK_TYPE_UVD,
						       AMD_PG_STATE_GATE);
		amdgpu_device_ip_set_clockgating_state(adev, AMD_IP_BLOCK_TYPE_UVD,
						       AMD_CG_STATE_GATE);
	}

	r = uvd_v4_2_hw_fini(adev);
	if (r)
		return r;

	return amdgpu_uvd_suspend(adev);
}

static int uvd_v4_2_resume(void *handle)
{
	int r;
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

	r = amdgpu_uvd_resume(adev);
	if (r)
		return r;

	return uvd_v4_2_hw_init(adev);
}

/**
 * uvd_v4_2_start - start UVD block
 *
 * @adev: amdgpu_device pointer
 *
 * Setup and start the UVD block
 */
static int uvd_v4_2_start(struct amdgpu_device *adev)
{
	struct amdgpu_ring *ring = &adev->uvd.inst->ring;
	uint32_t rb_bufsz;
	int i, j, r;
	u32 tmp;
	/* disable byte swapping */
	u32 lmi_swap_cntl = 0;
	u32 mp_swap_cntl = 0;

	/* set uvd busy */
	WREG32_P(mmUVD_STATUS, 1<<2, ~(1<<2));

	uvd_v4_2_set_dcm(adev, true);
	WREG32(mmUVD_CGC_GATE, 0);

	/* take UVD block out of reset */
	WREG32_P(mmSRBM_SOFT_RESET, 0, ~SRBM_SOFT_RESET__SOFT_RESET_UVD_MASK);
	mdelay(5);

	/* enable VCPU clock */
	WREG32(mmUVD_VCPU_CNTL,  1 << 9);

	/* disable interrupt */
	WREG32_P(mmUVD_MASTINT_EN, 0, ~(1 << 1));

#ifdef __BIG_ENDIAN
	/* swap (8 in 32) RB and IB */
	lmi_swap_cntl = 0xa;
	mp_swap_cntl = 0;
#endif
	WREG32(mmUVD_LMI_SWAP_CNTL, lmi_swap_cntl);
	WREG32(mmUVD_MP_SWAP_CNTL, mp_swap_cntl);
	/* initialize UVD memory controller */
	WREG32(mmUVD_LMI_CTRL, 0x203108);

	tmp = RREG32(mmUVD_MPC_CNTL);
	WREG32(mmUVD_MPC_CNTL, tmp | 0x10);

	WREG32(mmUVD_MPC_SET_MUXA0, 0x40c2040);
	WREG32(mmUVD_MPC_SET_MUXA1, 0x0);
	WREG32(mmUVD_MPC_SET_MUXB0, 0x40c2040);
	WREG32(mmUVD_MPC_SET_MUXB1, 0x0);
	WREG32(mmUVD_MPC_SET_ALU, 0);
	WREG32(mmUVD_MPC_SET_MUX, 0x88);

	uvd_v4_2_mc_resume(adev);

	tmp = RREG32_UVD_CTX(ixUVD_LMI_CACHE_CTRL);
	WREG32_UVD_CTX(ixUVD_LMI_CACHE_CTRL, tmp & (~0x10));

	/* enable UMC */
	WREG32_P(mmUVD_LMI_CTRL2, 0, ~(1 << 8));

	WREG32_P(mmUVD_SOFT_RESET, 0, ~UVD_SOFT_RESET__LMI_SOFT_RESET_MASK);

	WREG32_P(mmUVD_SOFT_RESET, 0, ~UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK);

	WREG32_P(mmUVD_SOFT_RESET, 0, ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);

	mdelay(10);

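	/*
	 * Poll UVD_STATUS for the VCPU-running bit (bit 1); between failed
	 * attempts, pulse the VCPU soft reset and try again, up to 10 times.
	 */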
	for (i = 0; i < 10; ++i) {
		uint32_t status;
		for (j = 0; j < 100; ++j) {
			status = RREG32(mmUVD_STATUS);
			if (status & 2)
				break;
			mdelay(10);
		}
		r = 0;
		if (status & 2)
			break;

		DRM_ERROR("UVD not responding, trying to reset the VCPU!!!\n");
		WREG32_P(mmUVD_SOFT_RESET, UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK,
				~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
		mdelay(10);
		WREG32_P(mmUVD_SOFT_RESET, 0, ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
		mdelay(10);
		r = -1;
	}

	if (r) {
		DRM_ERROR("UVD not responding, giving up!!!\n");
		return r;
	}

	/* enable interrupt */
	WREG32_P(mmUVD_MASTINT_EN, 3<<1, ~(3 << 1));

	WREG32_P(mmUVD_STATUS, 0, ~(1<<2));

	/* force RBC into idle state */
	WREG32(mmUVD_RBC_RB_CNTL, 0x11010101);

	/* Set the write pointer delay */
	WREG32(mmUVD_RBC_RB_WPTR_CNTL, 0);

	/* program the 4GB memory segment for rptr and ring buffer */
	WREG32(mmUVD_LMI_EXT40_ADDR, upper_32_bits(ring->gpu_addr) |
				   (0x7 << 16) | (0x1 << 31));

	/* Initialize the ring buffer's read and write pointers */
	WREG32(mmUVD_RBC_RB_RPTR, 0x0);

	ring->wptr = RREG32(mmUVD_RBC_RB_RPTR);
	WREG32(mmUVD_RBC_RB_WPTR, lower_32_bits(ring->wptr));

	/* set the ring address */
	WREG32(mmUVD_RBC_RB_BASE, ring->gpu_addr);

	/* Set ring buffer size */
	rb_bufsz = order_base_2(ring->ring_size);
	rb_bufsz = (0x1 << 8) | rb_bufsz;
	WREG32_P(mmUVD_RBC_RB_CNTL, rb_bufsz, ~0x11f1f);

	return 0;
}

/**
 * uvd_v4_2_stop - stop UVD block
 *
 * @adev: amdgpu_device pointer
 *
 * stop the UVD block
 */
static void uvd_v4_2_stop(struct amdgpu_device *adev)
{
	uint32_t i, j;
	uint32_t status;

	WREG32(mmUVD_RBC_RB_CNTL, 0x11010101);

	for (i = 0; i < 10; ++i) {
		for (j = 0; j < 100; ++j) {
			status = RREG32(mmUVD_STATUS);
			if (status & 2)
				break;
			mdelay(1);
		}
		if (status & 2)
			break;
	}

	for (i = 0; i < 10; ++i) {
		for (j = 0; j < 100; ++j) {
			status = RREG32(mmUVD_LMI_STATUS);
			if (status & 0xf)
				break;
			mdelay(1);
		}
		if (status & 0xf)
			break;
	}

	/* Stall UMC and register bus before resetting VCPU */
	WREG32_P(mmUVD_LMI_CTRL2, 1 << 8, ~(1 << 8));

	for (i = 0; i < 10; ++i) {
		for (j = 0; j < 100; ++j) {
			status = RREG32(mmUVD_LMI_STATUS);
			if (status & 0x240)
				break;
			mdelay(1);
		}
		if (status & 0x240)
			break;
	}

	WREG32_P(0x3D49, 0, ~(1 << 2));

	WREG32_P(mmUVD_VCPU_CNTL, 0, ~(1 << 9));

	/* put LMI, VCPU, RBC etc... into reset */
	WREG32(mmUVD_SOFT_RESET, UVD_SOFT_RESET__LMI_SOFT_RESET_MASK |
		UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK |
		UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK);

	WREG32(mmUVD_STATUS, 0);

	uvd_v4_2_set_dcm(adev, false);
}

/**
 * uvd_v4_2_ring_emit_fence - emit a fence & trap command
 *
 * @ring: amdgpu_ring pointer
 * @addr: address
 * @seq: sequence number
 * @flags: fence related flags
 *
 * Write a fence and a trap command to the ring.
 */
static void uvd_v4_2_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq,
				     unsigned flags)
{
	WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);

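	/*
	 * Write the sequence number to UVD_CONTEXT_ID and the fence address
	 * to GPCOM_VCPU_DATA0/1, then issue a VCPU command.  Following the
	 * pattern of the older radeon UVD code, command 0 appears to trigger
	 * the fence write and command 2 the trap interrupt.
	 */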
	amdgpu_ring_write(ring, PACKET0(mmUVD_CONTEXT_ID, 0));
	amdgpu_ring_write(ring, seq);
	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
	amdgpu_ring_write(ring, addr & 0xffffffff);
	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
	amdgpu_ring_write(ring, upper_32_bits(addr) & 0xff);
	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
	amdgpu_ring_write(ring, 0);

	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
	amdgpu_ring_write(ring, 0);
	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
	amdgpu_ring_write(ring, 0);
	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
	amdgpu_ring_write(ring, 2);
}

/**
 * uvd_v4_2_ring_test_ring - register write test
 *
 * @ring: amdgpu_ring pointer
 *
 * Test if we can successfully write to the context register
 */
static int uvd_v4_2_ring_test_ring(struct amdgpu_ring *ring)
{
	struct amdgpu_device *adev = ring->adev;
	uint32_t tmp = 0;
	unsigned i;
	int r;

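	/*
	 * Seed UVD_CONTEXT_ID with a sentinel, then have the ring overwrite
	 * it; reading back 0xDEADBEEF proves the VCPU fetched and executed
	 * the packet.
	 */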
	WREG32(mmUVD_CONTEXT_ID, 0xCAFEDEAD);
	r = amdgpu_ring_alloc(ring, 3);
	if (r)
		return r;

	amdgpu_ring_write(ring, PACKET0(mmUVD_CONTEXT_ID, 0));
	amdgpu_ring_write(ring, 0xDEADBEEF);
	amdgpu_ring_commit(ring);
	for (i = 0; i < adev->usec_timeout; i++) {
		tmp = RREG32(mmUVD_CONTEXT_ID);
		if (tmp == 0xDEADBEEF)
			break;
		udelay(1);
	}

	if (i >= adev->usec_timeout)
		r = -ETIMEDOUT;

	return r;
}

/**
 * uvd_v4_2_ring_emit_ib - execute indirect buffer
 *
 * @ring: amdgpu_ring pointer
 * @job: job associated with the indirect buffer
 * @ib: indirect buffer to execute
 * @flags: flags associated with the indirect buffer
 *
 * Write ring commands to execute the indirect buffer
 */
static void uvd_v4_2_ring_emit_ib(struct amdgpu_ring *ring,
				  struct amdgpu_job *job,
				  struct amdgpu_ib *ib,
				  uint32_t flags)
{
	amdgpu_ring_write(ring, PACKET0(mmUVD_RBC_IB_BASE, 0));
	amdgpu_ring_write(ring, ib->gpu_addr);
	amdgpu_ring_write(ring, PACKET0(mmUVD_RBC_IB_SIZE, 0));
	amdgpu_ring_write(ring, ib->length_dw);
}

static void uvd_v4_2_ring_insert_nop(struct amdgpu_ring *ring, uint32_t count)
{
	int i;

	WARN_ON(ring->wptr % 2 || count % 2);

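	/*
	 * Each UVD NOP is a two-DWORD packet (PACKET0 header + payload),
	 * hence the count / 2 below and the even-alignment WARN_ON above.
	 */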
	for (i = 0; i < count / 2; i++) {
		amdgpu_ring_write(ring, PACKET0(mmUVD_NO_OP, 0));
		amdgpu_ring_write(ring, 0);
	}
}

/**
 * uvd_v4_2_mc_resume - memory controller programming
 *
 * @adev: amdgpu_device pointer
 *
 * Let the UVD memory controller know its offsets
 */
static void uvd_v4_2_mc_resume(struct amdgpu_device *adev)
{
	uint64_t addr;
	uint32_t size;

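	/*
	 * The VCPU cache windows are programmed in 8-byte units (hence the
	 * >> 3): the firmware image comes first, followed by the decoder
	 * heap, then the stack/session area sized by max_handles.
	 */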
	/* program the VCPU memory controller bits 0-27 */
	addr = (adev->uvd.inst->gpu_addr + AMDGPU_UVD_FIRMWARE_OFFSET) >> 3;
	size = AMDGPU_UVD_FIRMWARE_SIZE(adev) >> 3;
	WREG32(mmUVD_VCPU_CACHE_OFFSET0, addr);
	WREG32(mmUVD_VCPU_CACHE_SIZE0, size);

	addr += size;
	size = AMDGPU_UVD_HEAP_SIZE >> 3;
	WREG32(mmUVD_VCPU_CACHE_OFFSET1, addr);
	WREG32(mmUVD_VCPU_CACHE_SIZE1, size);

	addr += size;
	size = (AMDGPU_UVD_STACK_SIZE +
	       (AMDGPU_UVD_SESSION_SIZE * adev->uvd.max_handles)) >> 3;
	WREG32(mmUVD_VCPU_CACHE_OFFSET2, addr);
	WREG32(mmUVD_VCPU_CACHE_SIZE2, size);

	/* bits 28-31 */
	addr = (adev->uvd.inst->gpu_addr >> 28) & 0xF;
	WREG32(mmUVD_LMI_ADDR_EXT, (addr << 12) | (addr << 0));

	/* bits 32-39 */
	addr = (adev->uvd.inst->gpu_addr >> 32) & 0xFF;
	WREG32(mmUVD_LMI_EXT40_ADDR, addr | (0x9 << 16) | (0x1 << 31));

	WREG32(mmUVD_UDEC_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
	WREG32(mmUVD_UDEC_DB_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
	WREG32(mmUVD_UDEC_DBW_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
}

static void uvd_v4_2_enable_mgcg(struct amdgpu_device *adev,
				 bool enable)
{
	u32 orig, data;

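	/*
	 * Medium-grain clock gating: when supported and enabled, turn on the
	 * memory soft-gating bits in UVD_CGC_MEM_CTRL and select dynamic
	 * clock mode; otherwise clear both so the clocks stay forced on.
	 */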
	if (enable && (adev->cg_flags & AMD_CG_SUPPORT_UVD_MGCG)) {
		data = RREG32_UVD_CTX(ixUVD_CGC_MEM_CTRL);
		data |= 0xfff;
		WREG32_UVD_CTX(ixUVD_CGC_MEM_CTRL, data);

		orig = data = RREG32(mmUVD_CGC_CTRL);
		data |= UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK;
		if (orig != data)
			WREG32(mmUVD_CGC_CTRL, data);
	} else {
		data = RREG32_UVD_CTX(ixUVD_CGC_MEM_CTRL);
		data &= ~0xfff;
		WREG32_UVD_CTX(ixUVD_CGC_MEM_CTRL, data);

		orig = data = RREG32(mmUVD_CGC_CTRL);
		data &= ~UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK;
		if (orig != data)
			WREG32(mmUVD_CGC_CTRL, data);
	}
}

static void uvd_v4_2_set_dcm(struct amdgpu_device *adev,
			     bool sw_mode)
{
	u32 tmp, tmp2;

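	/*
	 * DCM = dynamic clock mode.  sw_mode clears the per-block bits in
	 * CGC_CTRL (0x7ffff800) and enables the software ramp controls in
	 * CGC_CTRL2; hardware mode sets the block bits and leaves CGC_CTRL2
	 * cleared.
	 */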
	WREG32_FIELD(UVD_CGC_GATE, REGS, 0);

	tmp = RREG32(mmUVD_CGC_CTRL);
	tmp &= ~(UVD_CGC_CTRL__CLK_OFF_DELAY_MASK | UVD_CGC_CTRL__CLK_GATE_DLY_TIMER_MASK);
	tmp |= UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK |
		(1 << UVD_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT) |
		(4 << UVD_CGC_CTRL__CLK_OFF_DELAY__SHIFT);

	if (sw_mode) {
		tmp &= ~0x7ffff800;
		tmp2 = UVD_CGC_CTRL2__DYN_OCLK_RAMP_EN_MASK |
			UVD_CGC_CTRL2__DYN_RCLK_RAMP_EN_MASK |
			(7 << UVD_CGC_CTRL2__GATER_DIV_ID__SHIFT);
	} else {
		tmp |= 0x7ffff800;
		tmp2 = 0;
	}

	WREG32(mmUVD_CGC_CTRL, tmp);
	WREG32_UVD_CTX(ixUVD_CGC_CTRL2, tmp2);
}

static bool uvd_v4_2_is_idle(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

	return !(RREG32(mmSRBM_STATUS) & SRBM_STATUS__UVD_BUSY_MASK);
}

static int uvd_v4_2_wait_for_idle(void *handle)
{
	unsigned i;
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

	for (i = 0; i < adev->usec_timeout; i++) {
		if (!(RREG32(mmSRBM_STATUS) & SRBM_STATUS__UVD_BUSY_MASK))
			return 0;
	}
	return -ETIMEDOUT;
}

static int uvd_v4_2_soft_reset(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

	uvd_v4_2_stop(adev);

	WREG32_P(mmSRBM_SOFT_RESET, SRBM_SOFT_RESET__SOFT_RESET_UVD_MASK,
			~SRBM_SOFT_RESET__SOFT_RESET_UVD_MASK);
	mdelay(5);

	return uvd_v4_2_start(adev);
}

static int uvd_v4_2_set_interrupt_state(struct amdgpu_device *adev,
					struct amdgpu_irq_src *source,
					unsigned type,
					enum amdgpu_interrupt_state state)
{
	// TODO
	return 0;
}

static int uvd_v4_2_process_interrupt(struct amdgpu_device *adev,
				      struct amdgpu_irq_src *source,
				      struct amdgpu_iv_entry *entry)
{
	DRM_DEBUG("IH: UVD TRAP\n");
	amdgpu_fence_process(&adev->uvd.inst->ring);
	return 0;
}

static int uvd_v4_2_set_clockgating_state(void *handle,
					  enum amd_clockgating_state state)
{
	return 0;
}

static int uvd_v4_2_set_powergating_state(void *handle,
					  enum amd_powergating_state state)
{
	/* This doesn't actually powergate the UVD block.
	 * That's done in the dpm code via the SMC.  This
	 * just re-inits the block as necessary.  The actual
	 * gating still happens in the dpm code.  We should
	 * revisit this when there is a cleaner line between
	 * the smc and the hw blocks
	 */
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

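	/*
	 * When DPM is not managing UVD power, drive the PGFSM directly:
	 * check the SMU-reported island state in CURRENT_PG_STATUS and
	 * request an explicit power down (gate) or power up (ungate),
	 * giving the state machine time to settle before continuing.
	 */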
	if (state == AMD_PG_STATE_GATE) {
		uvd_v4_2_stop(adev);
		if (adev->pg_flags & AMD_PG_SUPPORT_UVD && !adev->pm.dpm_enabled) {
			if (!(RREG32_SMC(ixCURRENT_PG_STATUS) &
				CURRENT_PG_STATUS__UVD_PG_STATUS_MASK)) {
				WREG32(mmUVD_PGFSM_CONFIG, (UVD_PGFSM_CONFIG__UVD_PGFSM_FSM_ADDR_MASK   |
							UVD_PGFSM_CONFIG__UVD_PGFSM_POWER_DOWN_MASK |
							UVD_PGFSM_CONFIG__UVD_PGFSM_P1_SELECT_MASK));
				mdelay(20);
			}
		}
		return 0;
	} else {
		if (adev->pg_flags & AMD_PG_SUPPORT_UVD && !adev->pm.dpm_enabled) {
			if (RREG32_SMC(ixCURRENT_PG_STATUS) &
				CURRENT_PG_STATUS__UVD_PG_STATUS_MASK) {
				WREG32(mmUVD_PGFSM_CONFIG, (UVD_PGFSM_CONFIG__UVD_PGFSM_FSM_ADDR_MASK   |
						UVD_PGFSM_CONFIG__UVD_PGFSM_POWER_UP_MASK |
						UVD_PGFSM_CONFIG__UVD_PGFSM_P1_SELECT_MASK));
				mdelay(30);
			}
		}
		return uvd_v4_2_start(adev);
	}
}

static const struct amd_ip_funcs uvd_v4_2_ip_funcs = {
	.name = "uvd_v4_2",
	.early_init = uvd_v4_2_early_init,
	.late_init = NULL,
	.sw_init = uvd_v4_2_sw_init,
	.sw_fini = uvd_v4_2_sw_fini,
	.hw_init = uvd_v4_2_hw_init,
	.hw_fini = uvd_v4_2_hw_fini,
	.suspend = uvd_v4_2_suspend,
	.resume = uvd_v4_2_resume,
	.is_idle = uvd_v4_2_is_idle,
	.wait_for_idle = uvd_v4_2_wait_for_idle,
	.soft_reset = uvd_v4_2_soft_reset,
	.set_clockgating_state = uvd_v4_2_set_clockgating_state,
	.set_powergating_state = uvd_v4_2_set_powergating_state,
};

static const struct amdgpu_ring_funcs uvd_v4_2_ring_funcs = {
	.type = AMDGPU_RING_TYPE_UVD,
	.align_mask = 0xf,
	.support_64bit_ptrs = false,
	.no_user_fence = true,
	.get_rptr = uvd_v4_2_ring_get_rptr,
	.get_wptr = uvd_v4_2_ring_get_wptr,
	.set_wptr = uvd_v4_2_ring_set_wptr,
	.parse_cs = amdgpu_uvd_ring_parse_cs,
	.emit_frame_size =
		14, /* uvd_v4_2_ring_emit_fence  x1 no user fence */
	.emit_ib_size = 4, /* uvd_v4_2_ring_emit_ib */
	.emit_ib = uvd_v4_2_ring_emit_ib,
	.emit_fence = uvd_v4_2_ring_emit_fence,
	.test_ring = uvd_v4_2_ring_test_ring,
	.test_ib = amdgpu_uvd_ring_test_ib,
	.insert_nop = uvd_v4_2_ring_insert_nop,
	.pad_ib = amdgpu_ring_generic_pad_ib,
	.begin_use = amdgpu_uvd_ring_begin_use,
	.end_use = amdgpu_uvd_ring_end_use,
};

static void uvd_v4_2_set_ring_funcs(struct amdgpu_device *adev)
{
	adev->uvd.inst->ring.funcs = &uvd_v4_2_ring_funcs;
}

static const struct amdgpu_irq_src_funcs uvd_v4_2_irq_funcs = {
	.set = uvd_v4_2_set_interrupt_state,
	.process = uvd_v4_2_process_interrupt,
};

static void uvd_v4_2_set_irq_funcs(struct amdgpu_device *adev)
{
	adev->uvd.inst->irq.num_types = 1;
	adev->uvd.inst->irq.funcs = &uvd_v4_2_irq_funcs;
}

const struct amdgpu_ip_block_version uvd_v4_2_ip_block =
{
		.type = AMD_IP_BLOCK_TYPE_UVD,
		.major = 4,
		.minor = 2,
		.rev = 0,
		.funcs = &uvd_v4_2_ip_funcs,
};