xref: /openbmc/linux/drivers/gpu/drm/i915/display/intel_vblank.c (revision 248ed9e227e6cf59acb1aaf3aa30d530a0232c1a)
1 // SPDX-License-Identifier: MIT
2 /*
3  * Copyright © 2022-2023 Intel Corporation
4  */
5 
6 #include "i915_drv.h"
7 #include "i915_reg.h"
8 #include "intel_de.h"
9 #include "intel_display_types.h"
10 #include "intel_vblank.h"
11 #include "intel_vrr.h"
12 
13 /*
14  * This timing diagram depicts the video signal in and
15  * around the vertical blanking period.
16  *
17  * Assumptions about the fictitious mode used in this example:
18  *  vblank_start >= 3
19  *  vsync_start = vblank_start + 1
20  *  vsync_end = vblank_start + 2
21  *  vtotal = vblank_start + 3
22  *
23  *           start of vblank:
24  *           latch double buffered registers
25  *           increment frame counter (ctg+)
26  *           generate start of vblank interrupt (gen4+)
27  *           |
28  *           |          frame start:
29  *           |          generate frame start interrupt (aka. vblank interrupt) (gmch)
30  *           |          may be shifted forward 1-3 extra lines via TRANSCONF
31  *           |          |
32  *           |          |  start of vsync:
33  *           |          |  generate vsync interrupt
34  *           |          |  |
35  * ___xxxx___    ___xxxx___    ___xxxx___    ___xxxx___    ___xxxx___    ___xxxx
36  *       .   \hs/   .      \hs/          \hs/          \hs/   .      \hs/
37  * ----va---> <-----------------vb--------------------> <--------va-------------
38  *       |          |       <----vs----->                     |
39  * -vbs-----> <---vbs+1---> <---vbs+2---> <-----0-----> <-----1-----> <-----2--- (scanline counter gen2)
40  * -vbs-2---> <---vbs-1---> <---vbs-----> <---vbs+1---> <---vbs+2---> <-----0--- (scanline counter gen3+)
41  * -vbs-2---> <---vbs-2---> <---vbs-1---> <---vbs-----> <---vbs+1---> <---vbs+2- (scanline counter hsw+ hdmi)
42  *       |          |                                         |
43  *       last visible pixel                                   first visible pixel
44  *                  |                                         increment frame counter (gen3/4)
45  *                  pixel counter = vblank_start * htotal     pixel counter = 0 (gen3/4)
46  *
47  * x  = horizontal active
48  * _  = horizontal blanking
49  * hs = horizontal sync
50  * va = vertical active
51  * vb = vertical blanking
52  * vs = vertical sync
53  * vbs = vblank_start (number)
54  *
55  * Summary:
56  * - most events happen at the start of horizontal sync
57  * - frame start happens at the start of horizontal blank, 1-4 lines
58  *   (depending on TRANSCONF settings) after the start of vblank
59  * - gen3/4 pixel and frame counter are synchronized with the start
60  *   of horizontal active on the first line of vertical active
61  */
62 
63 /*
64  * Called from drm generic code, passed a 'crtc', which we use as a pipe index.
65  */
66 u32 i915_get_vblank_counter(struct drm_crtc *crtc)
67 {
68 	struct drm_i915_private *dev_priv = to_i915(crtc->dev);
69 	struct drm_vblank_crtc *vblank = &dev_priv->drm.vblank[drm_crtc_index(crtc)];
70 	const struct drm_display_mode *mode = &vblank->hwmode;
71 	enum pipe pipe = to_intel_crtc(crtc)->pipe;
72 	u32 pixel, vbl_start, hsync_start, htotal;
73 	u64 frame;
74 
75 	/*
76 	 * On i965gm TV output the frame counter only works up to
77 	 * the point when we enable the TV encoder. After that the
78 	 * frame counter ceases to work and reads zero. We need a
79 	 * vblank wait before enabling the TV encoder and so we
80 	 * have to enable vblank interrupts while the frame counter
81 	 * is still in a working state. However the core vblank code
82 	 * does not like us returning non-zero frame counter values
83 	 * when we've told it that we don't have a working frame
84 	 * counter. Thus we must stop non-zero values leaking out.
85 	 */
86 	if (!vblank->max_vblank_count)
87 		return 0;
88 
89 	htotal = mode->crtc_htotal;
90 	hsync_start = mode->crtc_hsync_start;
91 	vbl_start = mode->crtc_vblank_start;
92 	if (mode->flags & DRM_MODE_FLAG_INTERLACE)
93 		vbl_start = DIV_ROUND_UP(vbl_start, 2);
94 
95 	/* Convert to pixel count */
96 	vbl_start *= htotal;
97 
98 	/* Start of vblank event occurs at start of hsync */
99 	vbl_start -= htotal - hsync_start;
100 
101 	/*
102 	 * High & low register fields aren't synchronized, so make sure
103 	 * we get a low value that's stable across two reads of the high
104 	 * register.
105 	 */
106 	frame = intel_de_read64_2x32(dev_priv, PIPEFRAMEPIXEL(pipe), PIPEFRAME(pipe));
107 
108 	pixel = frame & PIPE_PIXEL_MASK;
109 	frame = (frame >> PIPE_FRAME_LOW_SHIFT) & 0xffffff;
110 
111 	/*
112 	 * The frame counter increments at beginning of active.
113 	 * Cook up a vblank counter by also checking the pixel
114 	 * counter against vblank start.
115 	 */
116 	return (frame + (pixel >= vbl_start)) & 0xffffff;
117 }
118 
119 u32 g4x_get_vblank_counter(struct drm_crtc *crtc)
120 {
121 	struct drm_i915_private *dev_priv = to_i915(crtc->dev);
122 	struct drm_vblank_crtc *vblank = &dev_priv->drm.vblank[drm_crtc_index(crtc)];
123 	enum pipe pipe = to_intel_crtc(crtc)->pipe;
124 
125 	if (!vblank->max_vblank_count)
126 		return 0;
127 
128 	return intel_de_read(dev_priv, PIPE_FRMCOUNT_G4X(pipe));
129 }
130 
131 static u32 intel_crtc_scanlines_since_frame_timestamp(struct intel_crtc *crtc)
132 {
133 	struct drm_i915_private *dev_priv = to_i915(crtc->base.dev);
134 	struct drm_vblank_crtc *vblank =
135 		&crtc->base.dev->vblank[drm_crtc_index(&crtc->base)];
136 	const struct drm_display_mode *mode = &vblank->hwmode;
137 	u32 htotal = mode->crtc_htotal;
138 	u32 clock = mode->crtc_clock;
139 	u32 scan_prev_time, scan_curr_time, scan_post_time;
140 
141 	/*
142 	 * To avoid the race condition where we might cross into the
143 	 * next vblank just between the PIPE_FRMTMSTMP and TIMESTAMP_CTR
144 	 * reads. We make sure we read PIPE_FRMTMSTMP and TIMESTAMP_CTR
145 	 * during the same frame.
146 	 */
147 	do {
148 		/*
149 		 * This field provides read back of the display
150 		 * pipe frame time stamp. The time stamp value
151 		 * is sampled at every start of vertical blank.
152 		 */
153 		scan_prev_time = intel_de_read_fw(dev_priv,
154 						  PIPE_FRMTMSTMP(crtc->pipe));
155 
156 		/*
157 		 * The TIMESTAMP_CTR register has the current
158 		 * time stamp value.
159 		 */
160 		scan_curr_time = intel_de_read_fw(dev_priv, IVB_TIMESTAMP_CTR);
161 
162 		scan_post_time = intel_de_read_fw(dev_priv,
163 						  PIPE_FRMTMSTMP(crtc->pipe));
164 	} while (scan_post_time != scan_prev_time);
165 
166 	return div_u64(mul_u32_u32(scan_curr_time - scan_prev_time,
167 				   clock), 1000 * htotal);
168 }
169 
170 /*
171  * On certain encoders on certain platforms, pipe
172  * scanline register will not work to get the scanline,
173  * since the timings are driven from the PORT or issues
174  * with scanline register updates.
175  * This function will use Framestamp and current
176  * timestamp registers to calculate the scanline.
177  */
178 static u32 __intel_get_crtc_scanline_from_timestamp(struct intel_crtc *crtc)
179 {
180 	struct drm_vblank_crtc *vblank =
181 		&crtc->base.dev->vblank[drm_crtc_index(&crtc->base)];
182 	const struct drm_display_mode *mode = &vblank->hwmode;
183 	u32 vblank_start = mode->crtc_vblank_start;
184 	u32 vtotal = mode->crtc_vtotal;
185 	u32 scanline;
186 
187 	scanline = intel_crtc_scanlines_since_frame_timestamp(crtc);
188 	scanline = min(scanline, vtotal - 1);
189 	scanline = (scanline + vblank_start) % vtotal;
190 
191 	return scanline;
192 }
193 
194 /*
195  * intel_de_read_fw(), only for fast reads of display block, no need for
196  * forcewake etc.
197  */
198 static int __intel_get_crtc_scanline(struct intel_crtc *crtc)
199 {
200 	struct drm_device *dev = crtc->base.dev;
201 	struct drm_i915_private *dev_priv = to_i915(dev);
202 	const struct drm_display_mode *mode;
203 	struct drm_vblank_crtc *vblank;
204 	enum pipe pipe = crtc->pipe;
205 	int position, vtotal;
206 
207 	if (!crtc->active)
208 		return 0;
209 
210 	vblank = &crtc->base.dev->vblank[drm_crtc_index(&crtc->base)];
211 	mode = &vblank->hwmode;
212 
213 	if (crtc->mode_flags & I915_MODE_FLAG_GET_SCANLINE_FROM_TIMESTAMP)
214 		return __intel_get_crtc_scanline_from_timestamp(crtc);
215 
216 	vtotal = mode->crtc_vtotal;
217 	if (mode->flags & DRM_MODE_FLAG_INTERLACE)
218 		vtotal /= 2;
219 
220 	position = intel_de_read_fw(dev_priv, PIPEDSL(pipe)) & PIPEDSL_LINE_MASK;
221 
222 	/*
223 	 * On HSW, the DSL reg (0x70000) appears to return 0 if we
224 	 * read it just before the start of vblank.  So try it again
225 	 * so we don't accidentally end up spanning a vblank frame
226 	 * increment, causing the pipe_update_end() code to squak at us.
227 	 *
228 	 * The nature of this problem means we can't simply check the ISR
229 	 * bit and return the vblank start value; nor can we use the scanline
230 	 * debug register in the transcoder as it appears to have the same
231 	 * problem.  We may need to extend this to include other platforms,
232 	 * but so far testing only shows the problem on HSW.
233 	 */
234 	if (HAS_DDI(dev_priv) && !position) {
235 		int i, temp;
236 
237 		for (i = 0; i < 100; i++) {
238 			udelay(1);
239 			temp = intel_de_read_fw(dev_priv, PIPEDSL(pipe)) & PIPEDSL_LINE_MASK;
240 			if (temp != position) {
241 				position = temp;
242 				break;
243 			}
244 		}
245 	}
246 
247 	/*
248 	 * See update_scanline_offset() for the details on the
249 	 * scanline_offset adjustment.
250 	 */
251 	return (position + crtc->scanline_offset) % vtotal;
252 }
253 
254 static bool i915_get_crtc_scanoutpos(struct drm_crtc *_crtc,
255 				     bool in_vblank_irq,
256 				     int *vpos, int *hpos,
257 				     ktime_t *stime, ktime_t *etime,
258 				     const struct drm_display_mode *mode)
259 {
260 	struct drm_device *dev = _crtc->dev;
261 	struct drm_i915_private *dev_priv = to_i915(dev);
262 	struct intel_crtc *crtc = to_intel_crtc(_crtc);
263 	enum pipe pipe = crtc->pipe;
264 	int position;
265 	int vbl_start, vbl_end, hsync_start, htotal, vtotal;
266 	unsigned long irqflags;
267 	bool use_scanline_counter = DISPLAY_VER(dev_priv) >= 5 ||
268 		IS_G4X(dev_priv) || DISPLAY_VER(dev_priv) == 2 ||
269 		crtc->mode_flags & I915_MODE_FLAG_USE_SCANLINE_COUNTER;
270 
271 	if (drm_WARN_ON(&dev_priv->drm, !mode->crtc_clock)) {
272 		drm_dbg(&dev_priv->drm,
273 			"trying to get scanoutpos for disabled pipe %c\n",
274 			pipe_name(pipe));
275 		return false;
276 	}
277 
278 	htotal = mode->crtc_htotal;
279 	hsync_start = mode->crtc_hsync_start;
280 	vtotal = mode->crtc_vtotal;
281 	vbl_start = mode->crtc_vblank_start;
282 	vbl_end = mode->crtc_vblank_end;
283 
284 	if (mode->flags & DRM_MODE_FLAG_INTERLACE) {
285 		vbl_start = DIV_ROUND_UP(vbl_start, 2);
286 		vbl_end /= 2;
287 		vtotal /= 2;
288 	}
289 
290 	/*
291 	 * Lock uncore.lock, as we will do multiple timing critical raw
292 	 * register reads, potentially with preemption disabled, so the
293 	 * following code must not block on uncore.lock.
294 	 */
295 	spin_lock_irqsave(&dev_priv->uncore.lock, irqflags);
296 
297 	/* preempt_disable_rt() should go right here in PREEMPT_RT patchset. */
298 
299 	/* Get optional system timestamp before query. */
300 	if (stime)
301 		*stime = ktime_get();
302 
303 	if (crtc->mode_flags & I915_MODE_FLAG_VRR) {
304 		int scanlines = intel_crtc_scanlines_since_frame_timestamp(crtc);
305 
306 		position = __intel_get_crtc_scanline(crtc);
307 
308 		/*
309 		 * Already exiting vblank? If so, shift our position
310 		 * so it looks like we're already apporaching the full
311 		 * vblank end. This should make the generated timestamp
312 		 * more or less match when the active portion will start.
313 		 */
314 		if (position >= vbl_start && scanlines < position)
315 			position = min(crtc->vmax_vblank_start + scanlines, vtotal - 1);
316 	} else if (use_scanline_counter) {
317 		/* No obvious pixelcount register. Only query vertical
318 		 * scanout position from Display scan line register.
319 		 */
320 		position = __intel_get_crtc_scanline(crtc);
321 	} else {
322 		/*
323 		 * Have access to pixelcount since start of frame.
324 		 * We can split this into vertical and horizontal
325 		 * scanout position.
326 		 */
327 		position = (intel_de_read_fw(dev_priv, PIPEFRAMEPIXEL(pipe)) & PIPE_PIXEL_MASK) >> PIPE_PIXEL_SHIFT;
328 
329 		/* convert to pixel counts */
330 		vbl_start *= htotal;
331 		vbl_end *= htotal;
332 		vtotal *= htotal;
333 
334 		/*
335 		 * In interlaced modes, the pixel counter counts all pixels,
336 		 * so one field will have htotal more pixels. In order to avoid
337 		 * the reported position from jumping backwards when the pixel
338 		 * counter is beyond the length of the shorter field, just
339 		 * clamp the position the length of the shorter field. This
340 		 * matches how the scanline counter based position works since
341 		 * the scanline counter doesn't count the two half lines.
342 		 */
343 		if (position >= vtotal)
344 			position = vtotal - 1;
345 
346 		/*
347 		 * Start of vblank interrupt is triggered at start of hsync,
348 		 * just prior to the first active line of vblank. However we
349 		 * consider lines to start at the leading edge of horizontal
350 		 * active. So, should we get here before we've crossed into
351 		 * the horizontal active of the first line in vblank, we would
352 		 * not set the DRM_SCANOUTPOS_INVBL flag. In order to fix that,
353 		 * always add htotal-hsync_start to the current pixel position.
354 		 */
355 		position = (position + htotal - hsync_start) % vtotal;
356 	}
357 
358 	/* Get optional system timestamp after query. */
359 	if (etime)
360 		*etime = ktime_get();
361 
362 	/* preempt_enable_rt() should go right here in PREEMPT_RT patchset. */
363 
364 	spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags);
365 
366 	/*
367 	 * While in vblank, position will be negative
368 	 * counting up towards 0 at vbl_end. And outside
369 	 * vblank, position will be positive counting
370 	 * up since vbl_end.
371 	 */
372 	if (position >= vbl_start)
373 		position -= vbl_end;
374 	else
375 		position += vtotal - vbl_end;
376 
377 	if (use_scanline_counter) {
378 		*vpos = position;
379 		*hpos = 0;
380 	} else {
381 		*vpos = position / htotal;
382 		*hpos = position - (*vpos * htotal);
383 	}
384 
385 	return true;
386 }
387 
388 bool intel_crtc_get_vblank_timestamp(struct drm_crtc *crtc, int *max_error,
389 				     ktime_t *vblank_time, bool in_vblank_irq)
390 {
391 	return drm_crtc_vblank_helper_get_vblank_timestamp_internal(
392 		crtc, max_error, vblank_time, in_vblank_irq,
393 		i915_get_crtc_scanoutpos);
394 }
395 
396 int intel_get_crtc_scanline(struct intel_crtc *crtc)
397 {
398 	struct drm_i915_private *dev_priv = to_i915(crtc->base.dev);
399 	unsigned long irqflags;
400 	int position;
401 
402 	spin_lock_irqsave(&dev_priv->uncore.lock, irqflags);
403 	position = __intel_get_crtc_scanline(crtc);
404 	spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags);
405 
406 	return position;
407 }
408 
409 static bool pipe_scanline_is_moving(struct drm_i915_private *dev_priv,
410 				    enum pipe pipe)
411 {
412 	i915_reg_t reg = PIPEDSL(pipe);
413 	u32 line1, line2;
414 
415 	line1 = intel_de_read(dev_priv, reg) & PIPEDSL_LINE_MASK;
416 	msleep(5);
417 	line2 = intel_de_read(dev_priv, reg) & PIPEDSL_LINE_MASK;
418 
419 	return line1 != line2;
420 }
421 
422 static void wait_for_pipe_scanline_moving(struct intel_crtc *crtc, bool state)
423 {
424 	struct drm_i915_private *dev_priv = to_i915(crtc->base.dev);
425 	enum pipe pipe = crtc->pipe;
426 
427 	/* Wait for the display line to settle/start moving */
428 	if (wait_for(pipe_scanline_is_moving(dev_priv, pipe) == state, 100))
429 		drm_err(&dev_priv->drm,
430 			"pipe %c scanline %s wait timed out\n",
431 			pipe_name(pipe), str_on_off(state));
432 }
433 
434 void intel_wait_for_pipe_scanline_stopped(struct intel_crtc *crtc)
435 {
436 	wait_for_pipe_scanline_moving(crtc, false);
437 }
438 
439 void intel_wait_for_pipe_scanline_moving(struct intel_crtc *crtc)
440 {
441 	wait_for_pipe_scanline_moving(crtc, true);
442 }
443 
444 static int intel_crtc_scanline_offset(const struct intel_crtc_state *crtc_state)
445 {
446 	struct drm_i915_private *i915 = to_i915(crtc_state->uapi.crtc->dev);
447 	const struct drm_display_mode *adjusted_mode = &crtc_state->hw.adjusted_mode;
448 
449 	/*
450 	 * The scanline counter increments at the leading edge of hsync.
451 	 *
452 	 * On most platforms it starts counting from vtotal-1 on the
453 	 * first active line. That means the scanline counter value is
454 	 * always one less than what we would expect. Ie. just after
455 	 * start of vblank, which also occurs at start of hsync (on the
456 	 * last active line), the scanline counter will read vblank_start-1.
457 	 *
458 	 * On gen2 the scanline counter starts counting from 1 instead
459 	 * of vtotal-1, so we have to subtract one (or rather add vtotal-1
460 	 * to keep the value positive), instead of adding one.
461 	 *
462 	 * On HSW+ the behaviour of the scanline counter depends on the output
463 	 * type. For DP ports it behaves like most other platforms, but on HDMI
464 	 * there's an extra 1 line difference. So we need to add two instead of
465 	 * one to the value.
466 	 *
467 	 * On VLV/CHV DSI the scanline counter would appear to increment
468 	 * approx. 1/3 of a scanline before start of vblank. Unfortunately
469 	 * that means we can't tell whether we're in vblank or not while
470 	 * we're on that particular line. We must still set scanline_offset
471 	 * to 1 so that the vblank timestamps come out correct when we query
472 	 * the scanline counter from within the vblank interrupt handler.
473 	 * However if queried just before the start of vblank we'll get an
474 	 * answer that's slightly in the future.
475 	 */
476 	if (DISPLAY_VER(i915) == 2) {
477 		int vtotal;
478 
479 		vtotal = adjusted_mode->crtc_vtotal;
480 		if (adjusted_mode->flags & DRM_MODE_FLAG_INTERLACE)
481 			vtotal /= 2;
482 
483 		return vtotal - 1;
484 	} else if (HAS_DDI(i915) && intel_crtc_has_type(crtc_state, INTEL_OUTPUT_HDMI)) {
485 		return 2;
486 	} else {
487 		return 1;
488 	}
489 }
490 
491 void intel_crtc_update_active_timings(const struct intel_crtc_state *crtc_state)
492 {
493 	struct intel_crtc *crtc = to_intel_crtc(crtc_state->uapi.crtc);
494 	struct drm_i915_private *i915 = to_i915(crtc->base.dev);
495 	struct drm_display_mode adjusted_mode;
496 	int vmax_vblank_start = 0;
497 	unsigned long irqflags;
498 
499 	drm_mode_init(&adjusted_mode, &crtc_state->hw.adjusted_mode);
500 
501 	if (crtc_state->vrr.enable) {
502 		adjusted_mode.crtc_vtotal = crtc_state->vrr.vmax;
503 		adjusted_mode.crtc_vblank_end = crtc_state->vrr.vmax;
504 		adjusted_mode.crtc_vblank_start = intel_vrr_vmin_vblank_start(crtc_state);
505 		vmax_vblank_start = intel_vrr_vmax_vblank_start(crtc_state);
506 	}
507 
508 	/*
509 	 * Belts and suspenders locking to guarantee everyone sees 100%
510 	 * consistent state during fastset seamless refresh rate changes.
511 	 *
512 	 * vblank_time_lock takes care of all drm_vblank.c stuff, and
513 	 * uncore.lock takes care of __intel_get_crtc_scanline() which
514 	 * may get called elsewhere as well.
515 	 *
516 	 * TODO maybe just protect everything (including
517 	 * __intel_get_crtc_scanline()) with vblank_time_lock?
518 	 * Need to audit everything to make sure it's safe.
519 	 */
520 	spin_lock_irqsave(&i915->drm.vblank_time_lock, irqflags);
521 	spin_lock(&i915->uncore.lock);
522 
523 	drm_calc_timestamping_constants(&crtc->base, &adjusted_mode);
524 
525 	crtc->vmax_vblank_start = vmax_vblank_start;
526 
527 	crtc->mode_flags = crtc_state->mode_flags;
528 
529 	crtc->scanline_offset = intel_crtc_scanline_offset(crtc_state);
530 
531 	spin_unlock(&i915->uncore.lock);
532 	spin_unlock_irqrestore(&i915->drm.vblank_time_lock, irqflags);
533 }
534