xref: /openbmc/linux/drivers/gpu/drm/i915/gt/intel_gt_pm.c (revision c3d8cb19)
1 // SPDX-License-Identifier: MIT
2 /*
3  * Copyright © 2019 Intel Corporation
4  */
5 
6 #include <linux/string_helpers.h>
7 #include <linux/suspend.h>
8 
9 #include "i915_drv.h"
10 #include "i915_irq.h"
11 #include "i915_params.h"
12 #include "intel_context.h"
13 #include "intel_engine_pm.h"
14 #include "intel_gt.h"
15 #include "intel_gt_clock_utils.h"
16 #include "intel_gt_pm.h"
17 #include "intel_gt_print.h"
18 #include "intel_gt_requests.h"
19 #include "intel_llc.h"
20 #include "intel_pm.h"
21 #include "intel_rc6.h"
22 #include "intel_rps.h"
23 #include "intel_wakeref.h"
24 #include "intel_pcode.h"
25 #include "pxp/intel_pxp_pm.h"
26 
27 #define I915_GT_SUSPEND_IDLE_TIMEOUT (HZ / 2)
28 
29 static void mtl_media_busy(struct intel_gt *gt)
30 {
31 	/* Wa_14017073508: mtl */
32 	if (IS_MTL_GRAPHICS_STEP(gt->i915, P, STEP_A0, STEP_B0) &&
33 	    gt->type == GT_MEDIA)
34 		snb_pcode_write_p(gt->uncore, PCODE_MBOX_GT_STATE,
35 				  PCODE_MBOX_GT_STATE_MEDIA_BUSY,
36 				  PCODE_MBOX_GT_STATE_DOMAIN_MEDIA, 0);
37 }
38 
39 static void mtl_media_idle(struct intel_gt *gt)
40 {
41 	/* Wa_14017073508: mtl */
42 	if (IS_MTL_GRAPHICS_STEP(gt->i915, P, STEP_A0, STEP_B0) &&
43 	    gt->type == GT_MEDIA)
44 		snb_pcode_write_p(gt->uncore, PCODE_MBOX_GT_STATE,
45 				  PCODE_MBOX_GT_STATE_MEDIA_NOT_BUSY,
46 				  PCODE_MBOX_GT_STATE_DOMAIN_MEDIA, 0);
47 }
48 
49 static void user_forcewake(struct intel_gt *gt, bool suspend)
50 {
51 	int count = atomic_read(&gt->user_wakeref);
52 
53 	/* Inside suspend/resume so single threaded, no races to worry about. */
54 	if (likely(!count))
55 		return;
56 
57 	intel_gt_pm_get(gt);
58 	if (suspend) {
59 		GEM_BUG_ON(count > atomic_read(&gt->wakeref.count));
60 		atomic_sub(count, &gt->wakeref.count);
61 	} else {
62 		atomic_add(count, &gt->wakeref.count);
63 	}
64 	intel_gt_pm_put(gt);
65 }
66 
67 static void runtime_begin(struct intel_gt *gt)
68 {
69 	local_irq_disable();
70 	write_seqcount_begin(&gt->stats.lock);
71 	gt->stats.start = ktime_get();
72 	gt->stats.active = true;
73 	write_seqcount_end(&gt->stats.lock);
74 	local_irq_enable();
75 }
76 
77 static void runtime_end(struct intel_gt *gt)
78 {
79 	local_irq_disable();
80 	write_seqcount_begin(&gt->stats.lock);
81 	gt->stats.active = false;
82 	gt->stats.total =
83 		ktime_add(gt->stats.total,
84 			  ktime_sub(ktime_get(), gt->stats.start));
85 	write_seqcount_end(&gt->stats.lock);
86 	local_irq_enable();
87 }
88 
89 static int __gt_unpark(struct intel_wakeref *wf)
90 {
91 	struct intel_gt *gt = container_of(wf, typeof(*gt), wakeref);
92 	struct drm_i915_private *i915 = gt->i915;
93 
94 	GT_TRACE(gt, "\n");
95 
96 	/* Wa_14017073508: mtl */
97 	mtl_media_busy(gt);
98 
99 	/*
100 	 * It seems that the DMC likes to transition between the DC states a lot
101 	 * when there are no connected displays (no active power domains) during
102 	 * command submission.
103 	 *
104 	 * This activity has negative impact on the performance of the chip with
105 	 * huge latencies observed in the interrupt handler and elsewhere.
106 	 *
107 	 * Work around it by grabbing a GT IRQ power domain whilst there is any
108 	 * GT activity, preventing any DC state transitions.
109 	 */
110 	gt->awake = intel_display_power_get(i915, POWER_DOMAIN_GT_IRQ);
111 	GEM_BUG_ON(!gt->awake);
112 
113 	intel_rc6_unpark(&gt->rc6);
114 	intel_rps_unpark(&gt->rps);
115 	i915_pmu_gt_unparked(i915);
116 	intel_guc_busyness_unpark(gt);
117 
118 	intel_gt_unpark_requests(gt);
119 	runtime_begin(gt);
120 
121 	return 0;
122 }
123 
124 static int __gt_park(struct intel_wakeref *wf)
125 {
126 	struct intel_gt *gt = container_of(wf, typeof(*gt), wakeref);
127 	intel_wakeref_t wakeref = fetch_and_zero(&gt->awake);
128 	struct drm_i915_private *i915 = gt->i915;
129 
130 	GT_TRACE(gt, "\n");
131 
132 	runtime_end(gt);
133 	intel_gt_park_requests(gt);
134 
135 	intel_guc_busyness_park(gt);
136 	i915_vma_parked(gt);
137 	i915_pmu_gt_parked(i915);
138 	intel_rps_park(&gt->rps);
139 	intel_rc6_park(&gt->rc6);
140 
141 	/* Everything switched off, flush any residual interrupt just in case */
142 	intel_synchronize_irq(i915);
143 
144 	/* Defer dropping the display power well for 100ms, it's slow! */
145 	GEM_BUG_ON(!wakeref);
146 	intel_display_power_put_async(i915, POWER_DOMAIN_GT_IRQ, wakeref);
147 
148 	/* Wa_14017073508: mtl */
149 	mtl_media_idle(gt);
150 
151 	return 0;
152 }
153 
154 static const struct intel_wakeref_ops wf_ops = {
155 	.get = __gt_unpark,
156 	.put = __gt_park,
157 };
158 
159 void intel_gt_pm_init_early(struct intel_gt *gt)
160 {
161 	/*
162 	 * We access the runtime_pm structure via gt->i915 here rather than
163 	 * gt->uncore as we do elsewhere in the file because gt->uncore is not
164 	 * yet initialized for all tiles at this point in the driver startup.
165 	 * runtime_pm is per-device rather than per-tile, so this is still the
166 	 * correct structure.
167 	 */
168 	intel_wakeref_init(&gt->wakeref, &gt->i915->runtime_pm, &wf_ops);
169 	seqcount_mutex_init(&gt->stats.lock, &gt->wakeref.mutex);
170 }
171 
172 void intel_gt_pm_init(struct intel_gt *gt)
173 {
174 	/*
175 	 * Enabling power-management should be "self-healing". If we cannot
176 	 * enable a feature, simply leave it disabled with a notice to the
177 	 * user.
178 	 */
179 	intel_rc6_init(&gt->rc6);
180 	intel_rps_init(&gt->rps);
181 }
182 
183 static bool reset_engines(struct intel_gt *gt)
184 {
185 	if (INTEL_INFO(gt->i915)->gpu_reset_clobbers_display)
186 		return false;
187 
188 	return __intel_gt_reset(gt, ALL_ENGINES) == 0;
189 }
190 
191 static void gt_sanitize(struct intel_gt *gt, bool force)
192 {
193 	struct intel_engine_cs *engine;
194 	enum intel_engine_id id;
195 	intel_wakeref_t wakeref;
196 
197 	GT_TRACE(gt, "force:%s", str_yes_no(force));
198 
199 	/* Use a raw wakeref to avoid calling intel_display_power_get early */
200 	wakeref = intel_runtime_pm_get(gt->uncore->rpm);
201 	intel_uncore_forcewake_get(gt->uncore, FORCEWAKE_ALL);
202 
203 	intel_gt_check_clock_frequency(gt);
204 
205 	/*
206 	 * As we have just resumed the machine and woken the device up from
207 	 * deep PCI sleep (presumably D3_cold), assume the HW has been reset
208 	 * back to defaults, recovering from whatever wedged state we left it
209 	 * in and so worth trying to use the device once more.
210 	 */
211 	if (intel_gt_is_wedged(gt))
212 		intel_gt_unset_wedged(gt);
213 
214 	/* For GuC mode, ensure submission is disabled before stopping ring */
215 	intel_uc_reset_prepare(&gt->uc);
216 
217 	for_each_engine(engine, gt, id) {
218 		if (engine->reset.prepare)
219 			engine->reset.prepare(engine);
220 
221 		if (engine->sanitize)
222 			engine->sanitize(engine);
223 	}
224 
225 	if (reset_engines(gt) || force) {
226 		for_each_engine(engine, gt, id)
227 			__intel_engine_reset(engine, false);
228 	}
229 
230 	intel_uc_reset(&gt->uc, false);
231 
232 	for_each_engine(engine, gt, id)
233 		if (engine->reset.finish)
234 			engine->reset.finish(engine);
235 
236 	intel_rps_sanitize(&gt->rps);
237 
238 	intel_uncore_forcewake_put(gt->uncore, FORCEWAKE_ALL);
239 	intel_runtime_pm_put(gt->uncore->rpm, wakeref);
240 }
241 
242 void intel_gt_pm_fini(struct intel_gt *gt)
243 {
244 	intel_rc6_fini(&gt->rc6);
245 }
246 
247 int intel_gt_resume(struct intel_gt *gt)
248 {
249 	struct intel_engine_cs *engine;
250 	enum intel_engine_id id;
251 	int err;
252 
253 	err = intel_gt_has_unrecoverable_error(gt);
254 	if (err)
255 		return err;
256 
257 	GT_TRACE(gt, "\n");
258 
259 	/*
260 	 * After resume, we may need to poke into the pinned kernel
261 	 * contexts to paper over any damage caused by the sudden suspend.
262 	 * Only the kernel contexts should remain pinned over suspend,
263 	 * allowing us to fixup the user contexts on their first pin.
264 	 */
265 	gt_sanitize(gt, true);
266 
267 	intel_gt_pm_get(gt);
268 
269 	intel_uncore_forcewake_get(gt->uncore, FORCEWAKE_ALL);
270 	intel_rc6_sanitize(&gt->rc6);
271 	if (intel_gt_is_wedged(gt)) {
272 		err = -EIO;
273 		goto out_fw;
274 	}
275 
276 	/* Only when the HW is re-initialised, can we replay the requests */
277 	err = intel_gt_init_hw(gt);
278 	if (err) {
279 		gt_probe_error(gt, "Failed to initialize GPU, declaring it wedged!\n");
280 		goto err_wedged;
281 	}
282 
283 	intel_uc_reset_finish(&gt->uc);
284 
285 	intel_rps_enable(&gt->rps);
286 	intel_llc_enable(&gt->llc);
287 
288 	for_each_engine(engine, gt, id) {
289 		intel_engine_pm_get(engine);
290 
291 		engine->serial++; /* kernel context lost */
292 		err = intel_engine_resume(engine);
293 
294 		intel_engine_pm_put(engine);
295 		if (err) {
296 			gt_err(gt, "Failed to restart %s (%d)\n",
297 			       engine->name, err);
298 			goto err_wedged;
299 		}
300 	}
301 
302 	intel_rc6_enable(&gt->rc6);
303 
304 	intel_uc_resume(&gt->uc);
305 
306 	user_forcewake(gt, false);
307 
308 out_fw:
309 	intel_uncore_forcewake_put(gt->uncore, FORCEWAKE_ALL);
310 	intel_gt_pm_put(gt);
311 	return err;
312 
313 err_wedged:
314 	intel_gt_set_wedged(gt);
315 	goto out_fw;
316 }
317 
318 static void wait_for_suspend(struct intel_gt *gt)
319 {
320 	if (!intel_gt_pm_is_awake(gt))
321 		return;
322 
323 	if (intel_gt_wait_for_idle(gt, I915_GT_SUSPEND_IDLE_TIMEOUT) == -ETIME) {
324 		/*
325 		 * Forcibly cancel outstanding work and leave
326 		 * the gpu quiet.
327 		 */
328 		intel_gt_set_wedged(gt);
329 		intel_gt_retire_requests(gt);
330 	}
331 
332 	intel_gt_pm_wait_for_idle(gt);
333 }
334 
335 void intel_gt_suspend_prepare(struct intel_gt *gt)
336 {
337 	user_forcewake(gt, true);
338 	wait_for_suspend(gt);
339 }
340 
341 static suspend_state_t pm_suspend_target(void)
342 {
343 #if IS_ENABLED(CONFIG_SUSPEND) && IS_ENABLED(CONFIG_PM_SLEEP)
344 	return pm_suspend_target_state;
345 #else
346 	return PM_SUSPEND_TO_IDLE;
347 #endif
348 }
349 
350 void intel_gt_suspend_late(struct intel_gt *gt)
351 {
352 	intel_wakeref_t wakeref;
353 
354 	/* We expect to be idle already; but also want to be independent */
355 	wait_for_suspend(gt);
356 
357 	if (is_mock_gt(gt))
358 		return;
359 
360 	GEM_BUG_ON(gt->awake);
361 
362 	intel_uc_suspend(&gt->uc);
363 
364 	/*
365 	 * On disabling the device, we want to turn off HW access to memory
366 	 * that we no longer own.
367 	 *
368 	 * However, not all suspend-states disable the device. S0 (s2idle)
369 	 * is effectively runtime-suspend, the device is left powered on
370 	 * but needs to be put into a low power state. We need to keep
371 	 * powermanagement enabled, but we also retain system state and so
372 	 * it remains safe to keep on using our allocated memory.
373 	 */
374 	if (pm_suspend_target() == PM_SUSPEND_TO_IDLE)
375 		return;
376 
377 	with_intel_runtime_pm(gt->uncore->rpm, wakeref) {
378 		intel_rps_disable(&gt->rps);
379 		intel_rc6_disable(&gt->rc6);
380 		intel_llc_disable(&gt->llc);
381 	}
382 
383 	gt_sanitize(gt, false);
384 
385 	GT_TRACE(gt, "\n");
386 }
387 
388 void intel_gt_runtime_suspend(struct intel_gt *gt)
389 {
390 	intel_uc_runtime_suspend(&gt->uc);
391 
392 	GT_TRACE(gt, "\n");
393 }
394 
395 int intel_gt_runtime_resume(struct intel_gt *gt)
396 {
397 	int ret;
398 
399 	GT_TRACE(gt, "\n");
400 	intel_gt_init_swizzling(gt);
401 	intel_ggtt_restore_fences(gt->ggtt);
402 
403 	ret = intel_uc_runtime_resume(&gt->uc);
404 	if (ret)
405 		return ret;
406 
407 	return 0;
408 }
409 
410 static ktime_t __intel_gt_get_awake_time(const struct intel_gt *gt)
411 {
412 	ktime_t total = gt->stats.total;
413 
414 	if (gt->stats.active)
415 		total = ktime_add(total,
416 				  ktime_sub(ktime_get(), gt->stats.start));
417 
418 	return total;
419 }
420 
421 ktime_t intel_gt_get_awake_time(const struct intel_gt *gt)
422 {
423 	unsigned int seq;
424 	ktime_t total;
425 
426 	do {
427 		seq = read_seqcount_begin(&gt->stats.lock);
428 		total = __intel_gt_get_awake_time(gt);
429 	} while (read_seqcount_retry(&gt->stats.lock, seq));
430 
431 	return total;
432 }
433 
434 #if IS_ENABLED(CONFIG_DRM_I915_SELFTEST)
435 #include "selftest_gt_pm.c"
436 #endif
437