xref: /openbmc/linux/drivers/gpu/drm/amd/amdgpu/navi10_ih.c (revision a89aa749ece9c6fee7932163472d2ee0efd6ddd3)
1 /*
2  * Copyright 2019 Advanced Micro Devices, Inc.
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice shall be included in
12  * all copies or substantial portions of the Software.
13  *
14  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20  * OTHER DEALINGS IN THE SOFTWARE.
21  *
22  */
23 
24 #include <linux/pci.h>
25 
26 #include "amdgpu.h"
27 #include "amdgpu_ih.h"
28 
29 #include "oss/osssys_5_0_0_offset.h"
30 #include "oss/osssys_5_0_0_sh_mask.h"
31 
32 #include "soc15_common.h"
33 #include "navi10_ih.h"
34 
35 #define MAX_REARM_RETRY 10
36 
37 static void navi10_ih_set_interrupt_funcs(struct amdgpu_device *adev);
38 
39 /**
40  * navi10_ih_enable_interrupts - Enable the interrupt ring buffer
41  *
42  * @adev: amdgpu_device pointer
43  *
44  * Enable the interrupt ring buffer (NAVI10).
45  */
46 static void navi10_ih_enable_interrupts(struct amdgpu_device *adev)
47 {
48 	u32 ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL);
49 
50 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, RB_ENABLE, 1);
51 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, ENABLE_INTR, 1);
52 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL, ih_rb_cntl);
53 	adev->irq.ih.enabled = true;
54 }
55 
56 /**
57  * navi10_ih_disable_interrupts - Disable the interrupt ring buffer
58  *
59  * @adev: amdgpu_device pointer
60  *
61  * Disable the interrupt ring buffer (NAVI10).
62  */
63 static void navi10_ih_disable_interrupts(struct amdgpu_device *adev)
64 {
65 	u32 ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL);
66 
67 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, RB_ENABLE, 0);
68 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, ENABLE_INTR, 0);
69 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL, ih_rb_cntl);
70 	/* set rptr, wptr to 0 */
71 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_RPTR, 0);
72 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_WPTR, 0);
73 	adev->irq.ih.enabled = false;
74 	adev->irq.ih.rptr = 0;
75 }
76 
77 static uint32_t navi10_ih_rb_cntl(struct amdgpu_ih_ring *ih, uint32_t ih_rb_cntl)
78 {
79 	int rb_bufsz = order_base_2(ih->ring_size / 4);
80 
81 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL,
82 				   MC_SPACE, ih->use_bus_addr ? 1 : 4);
83 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL,
84 				   WPTR_OVERFLOW_CLEAR, 1);
85 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL,
86 				   WPTR_OVERFLOW_ENABLE, 1);
87 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, RB_SIZE, rb_bufsz);
88 	/* Ring Buffer write pointer writeback. If enabled, IH_RB_WPTR register
89 	 * value is written to memory
90 	 */
91 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL,
92 				   WPTR_WRITEBACK_ENABLE, 1);
93 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, MC_SNOOP, 1);
94 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, MC_RO, 0);
95 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, MC_VMID, 0);
96 
97 	return ih_rb_cntl;
98 }
99 
100 /**
101  * navi10_ih_irq_init - init and enable the interrupt ring
102  *
103  * @adev: amdgpu_device pointer
104  *
105  * Allocate a ring buffer for the interrupt controller,
106  * enable the RLC, disable interrupts, enable the IH
107  * ring buffer and enable it (NAVI).
108  * Called at device load and reume.
109  * Returns 0 for success, errors for failure.
110  */
111 static int navi10_ih_irq_init(struct amdgpu_device *adev)
112 {
113 	struct amdgpu_ih_ring *ih = &adev->irq.ih;
114 	u32 ih_rb_cntl, ih_doorbell_rtpr, ih_chicken;
115 	u32 tmp;
116 
117 	/* disable irqs */
118 	navi10_ih_disable_interrupts(adev);
119 
120 	adev->nbio.funcs->ih_control(adev);
121 
122 	/* Ring Buffer base. [39:8] of 40-bit address of the beginning of the ring buffer*/
123 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_BASE, ih->gpu_addr >> 8);
124 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_BASE_HI, (ih->gpu_addr >> 40) & 0xff);
125 
126 	ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL);
127 	ih_rb_cntl = navi10_ih_rb_cntl(ih, ih_rb_cntl);
128 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, RPTR_REARM,
129 				   !!adev->irq.msi_enabled);
130 
131 	if (unlikely(adev->firmware.load_type == AMDGPU_FW_LOAD_DIRECT)) {
132 		if (ih->use_bus_addr) {
133 			ih_chicken = RREG32_SOC15(OSSSYS, 0, mmIH_CHICKEN);
134 			ih_chicken = REG_SET_FIELD(ih_chicken,
135 					IH_CHICKEN, MC_SPACE_GPA_ENABLE, 1);
136 			WREG32_SOC15(OSSSYS, 0, mmIH_CHICKEN, ih_chicken);
137 		}
138 	}
139 
140 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL, ih_rb_cntl);
141 
142 	/* set the writeback address whether it's enabled or not */
143 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_WPTR_ADDR_LO,
144 		     lower_32_bits(ih->wptr_addr));
145 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_WPTR_ADDR_HI,
146 		     upper_32_bits(ih->wptr_addr) & 0xFFFF);
147 
148 	/* set rptr, wptr to 0 */
149 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_RPTR, 0);
150 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_WPTR, 0);
151 
152 	ih_doorbell_rtpr = RREG32_SOC15(OSSSYS, 0, mmIH_DOORBELL_RPTR);
153 	if (ih->use_doorbell) {
154 		ih_doorbell_rtpr = REG_SET_FIELD(ih_doorbell_rtpr,
155 						 IH_DOORBELL_RPTR, OFFSET,
156 						 ih->doorbell_index);
157 		ih_doorbell_rtpr = REG_SET_FIELD(ih_doorbell_rtpr,
158 						 IH_DOORBELL_RPTR, ENABLE, 1);
159 	} else {
160 		ih_doorbell_rtpr = REG_SET_FIELD(ih_doorbell_rtpr,
161 						 IH_DOORBELL_RPTR, ENABLE, 0);
162 	}
163 	WREG32_SOC15(OSSSYS, 0, mmIH_DOORBELL_RPTR, ih_doorbell_rtpr);
164 
165 	adev->nbio.funcs->ih_doorbell_range(adev, ih->use_doorbell,
166 					    ih->doorbell_index);
167 
168 	tmp = RREG32_SOC15(OSSSYS, 0, mmIH_STORM_CLIENT_LIST_CNTL);
169 	tmp = REG_SET_FIELD(tmp, IH_STORM_CLIENT_LIST_CNTL,
170 			    CLIENT18_IS_STORM_CLIENT, 1);
171 	WREG32_SOC15(OSSSYS, 0, mmIH_STORM_CLIENT_LIST_CNTL, tmp);
172 
173 	tmp = RREG32_SOC15(OSSSYS, 0, mmIH_INT_FLOOD_CNTL);
174 	tmp = REG_SET_FIELD(tmp, IH_INT_FLOOD_CNTL, FLOOD_CNTL_ENABLE, 1);
175 	WREG32_SOC15(OSSSYS, 0, mmIH_INT_FLOOD_CNTL, tmp);
176 
177 	pci_set_master(adev->pdev);
178 
179 	/* enable interrupts */
180 	navi10_ih_enable_interrupts(adev);
181 
182 	return 0;
183 }
184 
185 /**
186  * navi10_ih_irq_disable - disable interrupts
187  *
188  * @adev: amdgpu_device pointer
189  *
190  * Disable interrupts on the hw (NAVI10).
191  */
192 static void navi10_ih_irq_disable(struct amdgpu_device *adev)
193 {
194 	navi10_ih_disable_interrupts(adev);
195 
196 	/* Wait and acknowledge irq */
197 	mdelay(1);
198 }
199 
200 /**
201  * navi10_ih_get_wptr - get the IH ring buffer wptr
202  *
203  * @adev: amdgpu_device pointer
204  *
205  * Get the IH ring buffer wptr from either the register
206  * or the writeback memory buffer (NAVI10).  Also check for
207  * ring buffer overflow and deal with it.
208  * Returns the value of the wptr.
209  */
210 static u32 navi10_ih_get_wptr(struct amdgpu_device *adev,
211 			      struct amdgpu_ih_ring *ih)
212 {
213 	u32 wptr, reg, tmp;
214 
215 	wptr = le32_to_cpu(*ih->wptr_cpu);
216 
217 	if (!REG_GET_FIELD(wptr, IH_RB_WPTR, RB_OVERFLOW))
218 		goto out;
219 
220 	reg = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_WPTR);
221 	wptr = RREG32_NO_KIQ(reg);
222 	if (!REG_GET_FIELD(wptr, IH_RB_WPTR, RB_OVERFLOW))
223 		goto out;
224 	wptr = REG_SET_FIELD(wptr, IH_RB_WPTR, RB_OVERFLOW, 0);
225 
226 	/* When a ring buffer overflow happen start parsing interrupt
227 	 * from the last not overwritten vector (wptr + 32). Hopefully
228 	 * this should allow us to catch up.
229 	 */
230 	tmp = (wptr + 32) & ih->ptr_mask;
231 	dev_warn(adev->dev, "IH ring buffer overflow "
232 		 "(0x%08X, 0x%08X, 0x%08X)\n",
233 		 wptr, ih->rptr, tmp);
234 	ih->rptr = tmp;
235 
236 	reg = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_CNTL);
237 	tmp = RREG32_NO_KIQ(reg);
238 	tmp = REG_SET_FIELD(tmp, IH_RB_CNTL, WPTR_OVERFLOW_CLEAR, 1);
239 	WREG32_NO_KIQ(reg, tmp);
240 out:
241 	return (wptr & ih->ptr_mask);
242 }
243 
244 /**
245  * navi10_ih_decode_iv - decode an interrupt vector
246  *
247  * @adev: amdgpu_device pointer
248  *
249  * Decodes the interrupt vector at the current rptr
250  * position and also advance the position.
251  */
252 static void navi10_ih_decode_iv(struct amdgpu_device *adev,
253 				struct amdgpu_ih_ring *ih,
254 				struct amdgpu_iv_entry *entry)
255 {
256 	/* wptr/rptr are in bytes! */
257 	u32 ring_index = ih->rptr >> 2;
258 	uint32_t dw[8];
259 
260 	dw[0] = le32_to_cpu(ih->ring[ring_index + 0]);
261 	dw[1] = le32_to_cpu(ih->ring[ring_index + 1]);
262 	dw[2] = le32_to_cpu(ih->ring[ring_index + 2]);
263 	dw[3] = le32_to_cpu(ih->ring[ring_index + 3]);
264 	dw[4] = le32_to_cpu(ih->ring[ring_index + 4]);
265 	dw[5] = le32_to_cpu(ih->ring[ring_index + 5]);
266 	dw[6] = le32_to_cpu(ih->ring[ring_index + 6]);
267 	dw[7] = le32_to_cpu(ih->ring[ring_index + 7]);
268 
269 	entry->client_id = dw[0] & 0xff;
270 	entry->src_id = (dw[0] >> 8) & 0xff;
271 	entry->ring_id = (dw[0] >> 16) & 0xff;
272 	entry->vmid = (dw[0] >> 24) & 0xf;
273 	entry->vmid_src = (dw[0] >> 31);
274 	entry->timestamp = dw[1] | ((u64)(dw[2] & 0xffff) << 32);
275 	entry->timestamp_src = dw[2] >> 31;
276 	entry->pasid = dw[3] & 0xffff;
277 	entry->pasid_src = dw[3] >> 31;
278 	entry->src_data[0] = dw[4];
279 	entry->src_data[1] = dw[5];
280 	entry->src_data[2] = dw[6];
281 	entry->src_data[3] = dw[7];
282 
283 	/* wptr/rptr are in bytes! */
284 	ih->rptr += 32;
285 }
286 
287 /**
288  * navi10_ih_irq_rearm - rearm IRQ if lost
289  *
290  * @adev: amdgpu_device pointer
291  *
292  */
293 static void navi10_ih_irq_rearm(struct amdgpu_device *adev,
294 			       struct amdgpu_ih_ring *ih)
295 {
296 	uint32_t reg_rptr = 0;
297 	uint32_t v = 0;
298 	uint32_t i = 0;
299 
300 	if (ih == &adev->irq.ih)
301 		reg_rptr = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_RPTR);
302 	else if (ih == &adev->irq.ih1)
303 		reg_rptr = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_RPTR_RING1);
304 	else if (ih == &adev->irq.ih2)
305 		reg_rptr = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_RPTR_RING2);
306 	else
307 		return;
308 
309 	/* Rearm IRQ / re-write doorbell if doorbell write is lost */
310 	for (i = 0; i < MAX_REARM_RETRY; i++) {
311 		v = RREG32_NO_KIQ(reg_rptr);
312 		if ((v < ih->ring_size) && (v != ih->rptr))
313 			WDOORBELL32(ih->doorbell_index, ih->rptr);
314 		else
315 			break;
316 	}
317 }
318 
319 /**
320  * navi10_ih_set_rptr - set the IH ring buffer rptr
321  *
322  * @adev: amdgpu_device pointer
323  *
324  * Set the IH ring buffer rptr.
325  */
326 static void navi10_ih_set_rptr(struct amdgpu_device *adev,
327 			       struct amdgpu_ih_ring *ih)
328 {
329 	if (ih->use_doorbell) {
330 		/* XXX check if swapping is necessary on BE */
331 		*ih->rptr_cpu = ih->rptr;
332 		WDOORBELL32(ih->doorbell_index, ih->rptr);
333 
334 		if (amdgpu_sriov_vf(adev))
335 			navi10_ih_irq_rearm(adev, ih);
336 	} else
337 		WREG32_SOC15(OSSSYS, 0, mmIH_RB_RPTR, ih->rptr);
338 }
339 
340 static int navi10_ih_early_init(void *handle)
341 {
342 	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
343 
344 	navi10_ih_set_interrupt_funcs(adev);
345 	return 0;
346 }
347 
348 static int navi10_ih_sw_init(void *handle)
349 {
350 	int r;
351 	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
352 	bool use_bus_addr;
353 
354 	/* use gpu virtual address for ih ring
355 	 * until ih_checken is programmed to allow
356 	 * use bus address for ih ring by psp bl */
357 	use_bus_addr =
358 		(adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) ? false : true;
359 	r = amdgpu_ih_ring_init(adev, &adev->irq.ih, 256 * 1024, use_bus_addr);
360 	if (r)
361 		return r;
362 
363 	adev->irq.ih.use_doorbell = true;
364 	adev->irq.ih.doorbell_index = adev->doorbell_index.ih << 1;
365 
366 	r = amdgpu_irq_init(adev);
367 
368 	return r;
369 }
370 
371 static int navi10_ih_sw_fini(void *handle)
372 {
373 	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
374 
375 	amdgpu_irq_fini(adev);
376 	amdgpu_ih_ring_fini(adev, &adev->irq.ih);
377 
378 	return 0;
379 }
380 
381 static int navi10_ih_hw_init(void *handle)
382 {
383 	int r;
384 	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
385 
386 	r = navi10_ih_irq_init(adev);
387 	if (r)
388 		return r;
389 
390 	return 0;
391 }
392 
393 static int navi10_ih_hw_fini(void *handle)
394 {
395 	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
396 
397 	navi10_ih_irq_disable(adev);
398 
399 	return 0;
400 }
401 
402 static int navi10_ih_suspend(void *handle)
403 {
404 	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
405 
406 	return navi10_ih_hw_fini(adev);
407 }
408 
409 static int navi10_ih_resume(void *handle)
410 {
411 	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
412 
413 	return navi10_ih_hw_init(adev);
414 }
415 
416 static bool navi10_ih_is_idle(void *handle)
417 {
418 	/* todo */
419 	return true;
420 }
421 
422 static int navi10_ih_wait_for_idle(void *handle)
423 {
424 	/* todo */
425 	return -ETIMEDOUT;
426 }
427 
428 static int navi10_ih_soft_reset(void *handle)
429 {
430 	/* todo */
431 	return 0;
432 }
433 
434 static void navi10_ih_update_clockgating_state(struct amdgpu_device *adev,
435 					       bool enable)
436 {
437 	uint32_t data, def, field_val;
438 
439 	if (adev->cg_flags & AMD_CG_SUPPORT_IH_CG) {
440 		def = data = RREG32_SOC15(OSSSYS, 0, mmIH_CLK_CTRL);
441 		field_val = enable ? 0 : 1;
442 		data = REG_SET_FIELD(data, IH_CLK_CTRL,
443 				     DBUS_MUX_CLK_SOFT_OVERRIDE, field_val);
444 		data = REG_SET_FIELD(data, IH_CLK_CTRL,
445 				     OSSSYS_SHARE_CLK_SOFT_OVERRIDE, field_val);
446 		data = REG_SET_FIELD(data, IH_CLK_CTRL,
447 				     LIMIT_SMN_CLK_SOFT_OVERRIDE, field_val);
448 		data = REG_SET_FIELD(data, IH_CLK_CTRL,
449 				     DYN_CLK_SOFT_OVERRIDE, field_val);
450 		data = REG_SET_FIELD(data, IH_CLK_CTRL,
451 				     REG_CLK_SOFT_OVERRIDE, field_val);
452 		if (def != data)
453 			WREG32_SOC15(OSSSYS, 0, mmIH_CLK_CTRL, data);
454 	}
455 
456 	return;
457 }
458 
459 static int navi10_ih_set_clockgating_state(void *handle,
460 					   enum amd_clockgating_state state)
461 {
462 	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
463 
464 	navi10_ih_update_clockgating_state(adev,
465 				state == AMD_CG_STATE_GATE);
466 	return 0;
467 }
468 
469 static int navi10_ih_set_powergating_state(void *handle,
470 					   enum amd_powergating_state state)
471 {
472 	return 0;
473 }
474 
475 static void navi10_ih_get_clockgating_state(void *handle, u32 *flags)
476 {
477 	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
478 
479 	if (!RREG32_SOC15(OSSSYS, 0, mmIH_CLK_CTRL))
480 		*flags |= AMD_CG_SUPPORT_IH_CG;
481 
482 	return;
483 }
484 
485 static const struct amd_ip_funcs navi10_ih_ip_funcs = {
486 	.name = "navi10_ih",
487 	.early_init = navi10_ih_early_init,
488 	.late_init = NULL,
489 	.sw_init = navi10_ih_sw_init,
490 	.sw_fini = navi10_ih_sw_fini,
491 	.hw_init = navi10_ih_hw_init,
492 	.hw_fini = navi10_ih_hw_fini,
493 	.suspend = navi10_ih_suspend,
494 	.resume = navi10_ih_resume,
495 	.is_idle = navi10_ih_is_idle,
496 	.wait_for_idle = navi10_ih_wait_for_idle,
497 	.soft_reset = navi10_ih_soft_reset,
498 	.set_clockgating_state = navi10_ih_set_clockgating_state,
499 	.set_powergating_state = navi10_ih_set_powergating_state,
500 	.get_clockgating_state = navi10_ih_get_clockgating_state,
501 };
502 
503 static const struct amdgpu_ih_funcs navi10_ih_funcs = {
504 	.get_wptr = navi10_ih_get_wptr,
505 	.decode_iv = navi10_ih_decode_iv,
506 	.set_rptr = navi10_ih_set_rptr
507 };
508 
509 static void navi10_ih_set_interrupt_funcs(struct amdgpu_device *adev)
510 {
511 	if (adev->irq.ih_funcs == NULL)
512 		adev->irq.ih_funcs = &navi10_ih_funcs;
513 }
514 
515 const struct amdgpu_ip_block_version navi10_ih_ip_block =
516 {
517 	.type = AMD_IP_BLOCK_TYPE_IH,
518 	.major = 5,
519 	.minor = 0,
520 	.rev = 0,
521 	.funcs = &navi10_ih_ip_funcs,
522 };
523