xref: /openbmc/linux/drivers/gpu/drm/i915/gt/intel_llc.c (revision e1cab970)
124f90d66SChris Wilson // SPDX-License-Identifier: MIT
20dc3c562SAndi Shyti /*
30dc3c562SAndi Shyti  * Copyright © 2019 Intel Corporation
40dc3c562SAndi Shyti  */
50dc3c562SAndi Shyti 
6aa5e9f98SLucas De Marchi #include <asm/tsc.h>
70dc3c562SAndi Shyti #include <linux/cpufreq.h>
80dc3c562SAndi Shyti 
90dc3c562SAndi Shyti #include "i915_drv.h"
10ce2fce25SMatt Roper #include "i915_reg.h"
110dc3c562SAndi Shyti #include "intel_gt.h"
120dc3c562SAndi Shyti #include "intel_llc.h"
13e30e6c7bSMatt Roper #include "intel_mchbar_regs.h"
144dd4375bSJani Nikula #include "intel_pcode.h"
15*e1cab970SRodrigo Vivi #include "intel_rps.h"
160dc3c562SAndi Shyti 
170dc3c562SAndi Shyti struct ia_constants {
180dc3c562SAndi Shyti 	unsigned int min_gpu_freq;
190dc3c562SAndi Shyti 	unsigned int max_gpu_freq;
200dc3c562SAndi Shyti 
210dc3c562SAndi Shyti 	unsigned int min_ring_freq;
220dc3c562SAndi Shyti 	unsigned int max_ia_freq;
230dc3c562SAndi Shyti };
240dc3c562SAndi Shyti 
llc_to_gt(struct intel_llc * llc)250dc3c562SAndi Shyti static struct intel_gt *llc_to_gt(struct intel_llc *llc)
260dc3c562SAndi Shyti {
270dc3c562SAndi Shyti 	return container_of(llc, struct intel_gt, llc);
280dc3c562SAndi Shyti }
290dc3c562SAndi Shyti 
cpu_max_MHz(void)300dc3c562SAndi Shyti static unsigned int cpu_max_MHz(void)
310dc3c562SAndi Shyti {
320dc3c562SAndi Shyti 	struct cpufreq_policy *policy;
330dc3c562SAndi Shyti 	unsigned int max_khz;
340dc3c562SAndi Shyti 
350dc3c562SAndi Shyti 	policy = cpufreq_cpu_get(0);
360dc3c562SAndi Shyti 	if (policy) {
370dc3c562SAndi Shyti 		max_khz = policy->cpuinfo.max_freq;
380dc3c562SAndi Shyti 		cpufreq_cpu_put(policy);
390dc3c562SAndi Shyti 	} else {
400dc3c562SAndi Shyti 		/*
410dc3c562SAndi Shyti 		 * Default to measured freq if none found, PCU will ensure we
420dc3c562SAndi Shyti 		 * don't go over
430dc3c562SAndi Shyti 		 */
440dc3c562SAndi Shyti 		max_khz = tsc_khz;
450dc3c562SAndi Shyti 	}
460dc3c562SAndi Shyti 
470dc3c562SAndi Shyti 	return max_khz / 1000;
480dc3c562SAndi Shyti }
490dc3c562SAndi Shyti 
get_ia_constants(struct intel_llc * llc,struct ia_constants * consts)500dc3c562SAndi Shyti static bool get_ia_constants(struct intel_llc *llc,
510dc3c562SAndi Shyti 			     struct ia_constants *consts)
520dc3c562SAndi Shyti {
530dc3c562SAndi Shyti 	struct drm_i915_private *i915 = llc_to_gt(llc)->i915;
543e7abf81SAndi Shyti 	struct intel_rps *rps = &llc_to_gt(llc)->rps;
550dc3c562SAndi Shyti 
56c014e076SChris Wilson 	if (!HAS_LLC(i915) || IS_DGFX(i915))
57c014e076SChris Wilson 		return false;
58c014e076SChris Wilson 
590dc3c562SAndi Shyti 	consts->max_ia_freq = cpu_max_MHz();
600dc3c562SAndi Shyti 
610dc3c562SAndi Shyti 	consts->min_ring_freq =
620dc3c562SAndi Shyti 		intel_uncore_read(llc_to_gt(llc)->uncore, DCLK) & 0xf;
630dc3c562SAndi Shyti 	/* convert DDR frequency from units of 266.6MHz to bandwidth */
640dc3c562SAndi Shyti 	consts->min_ring_freq = mult_frac(consts->min_ring_freq, 8, 3);
650dc3c562SAndi Shyti 
66*e1cab970SRodrigo Vivi 	consts->min_gpu_freq = intel_rps_get_min_raw_freq(rps);
67*e1cab970SRodrigo Vivi 	consts->max_gpu_freq = intel_rps_get_max_raw_freq(rps);
680dc3c562SAndi Shyti 
690dc3c562SAndi Shyti 	return true;
700dc3c562SAndi Shyti }
710dc3c562SAndi Shyti 
calc_ia_freq(struct intel_llc * llc,unsigned int gpu_freq,const struct ia_constants * consts,unsigned int * out_ia_freq,unsigned int * out_ring_freq)720dc3c562SAndi Shyti static void calc_ia_freq(struct intel_llc *llc,
730dc3c562SAndi Shyti 			 unsigned int gpu_freq,
740dc3c562SAndi Shyti 			 const struct ia_constants *consts,
750dc3c562SAndi Shyti 			 unsigned int *out_ia_freq,
760dc3c562SAndi Shyti 			 unsigned int *out_ring_freq)
770dc3c562SAndi Shyti {
780dc3c562SAndi Shyti 	struct drm_i915_private *i915 = llc_to_gt(llc)->i915;
790dc3c562SAndi Shyti 	const int diff = consts->max_gpu_freq - gpu_freq;
800dc3c562SAndi Shyti 	unsigned int ia_freq = 0, ring_freq = 0;
810dc3c562SAndi Shyti 
82c816723bSLucas De Marchi 	if (GRAPHICS_VER(i915) >= 9) {
830dc3c562SAndi Shyti 		/*
840dc3c562SAndi Shyti 		 * ring_freq = 2 * GT. ring_freq is in 100MHz units
850dc3c562SAndi Shyti 		 * No floor required for ring frequency on SKL.
860dc3c562SAndi Shyti 		 */
870dc3c562SAndi Shyti 		ring_freq = gpu_freq;
88c816723bSLucas De Marchi 	} else if (GRAPHICS_VER(i915) >= 8) {
890dc3c562SAndi Shyti 		/* max(2 * GT, DDR). NB: GT is 50MHz units */
900dc3c562SAndi Shyti 		ring_freq = max(consts->min_ring_freq, gpu_freq);
910dc3c562SAndi Shyti 	} else if (IS_HASWELL(i915)) {
920dc3c562SAndi Shyti 		ring_freq = mult_frac(gpu_freq, 5, 4);
930dc3c562SAndi Shyti 		ring_freq = max(consts->min_ring_freq, ring_freq);
940dc3c562SAndi Shyti 		/* leave ia_freq as the default, chosen by cpufreq */
950dc3c562SAndi Shyti 	} else {
960dc3c562SAndi Shyti 		const int min_freq = 15;
970dc3c562SAndi Shyti 		const int scale = 180;
980dc3c562SAndi Shyti 
990dc3c562SAndi Shyti 		/*
1000dc3c562SAndi Shyti 		 * On older processors, there is no separate ring
1010dc3c562SAndi Shyti 		 * clock domain, so in order to boost the bandwidth
1020dc3c562SAndi Shyti 		 * of the ring, we need to upclock the CPU (ia_freq).
1030dc3c562SAndi Shyti 		 *
1040dc3c562SAndi Shyti 		 * For GPU frequencies less than 750MHz,
1050dc3c562SAndi Shyti 		 * just use the lowest ring freq.
1060dc3c562SAndi Shyti 		 */
1070dc3c562SAndi Shyti 		if (gpu_freq < min_freq)
1080dc3c562SAndi Shyti 			ia_freq = 800;
1090dc3c562SAndi Shyti 		else
1100dc3c562SAndi Shyti 			ia_freq = consts->max_ia_freq - diff * scale / 2;
1110dc3c562SAndi Shyti 		ia_freq = DIV_ROUND_CLOSEST(ia_freq, 100);
1120dc3c562SAndi Shyti 	}
1130dc3c562SAndi Shyti 
1140dc3c562SAndi Shyti 	*out_ia_freq = ia_freq;
1150dc3c562SAndi Shyti 	*out_ring_freq = ring_freq;
1160dc3c562SAndi Shyti }
1170dc3c562SAndi Shyti 
gen6_update_ring_freq(struct intel_llc * llc)1180dc3c562SAndi Shyti static void gen6_update_ring_freq(struct intel_llc *llc)
1190dc3c562SAndi Shyti {
1200dc3c562SAndi Shyti 	struct ia_constants consts;
1210dc3c562SAndi Shyti 	unsigned int gpu_freq;
1220dc3c562SAndi Shyti 
1230dc3c562SAndi Shyti 	if (!get_ia_constants(llc, &consts))
1240dc3c562SAndi Shyti 		return;
1250dc3c562SAndi Shyti 
1260dc3c562SAndi Shyti 	/*
127*e1cab970SRodrigo Vivi 	 * Although this is unlikely on any platform during initialization,
128*e1cab970SRodrigo Vivi 	 * let's ensure we don't get accidentally into infinite loop
129*e1cab970SRodrigo Vivi 	 */
130*e1cab970SRodrigo Vivi 	if (consts.max_gpu_freq <= consts.min_gpu_freq)
131*e1cab970SRodrigo Vivi 		return;
132*e1cab970SRodrigo Vivi 	/*
1330dc3c562SAndi Shyti 	 * For each potential GPU frequency, load a ring frequency we'd like
1340dc3c562SAndi Shyti 	 * to use for memory access.  We do this by specifying the IA frequency
1350dc3c562SAndi Shyti 	 * the PCU should use as a reference to determine the ring frequency.
1360dc3c562SAndi Shyti 	 */
1370dc3c562SAndi Shyti 	for (gpu_freq = consts.max_gpu_freq;
1380dc3c562SAndi Shyti 	     gpu_freq >= consts.min_gpu_freq;
1390dc3c562SAndi Shyti 	     gpu_freq--) {
1400dc3c562SAndi Shyti 		unsigned int ia_freq, ring_freq;
1410dc3c562SAndi Shyti 
1420dc3c562SAndi Shyti 		calc_ia_freq(llc, gpu_freq, &consts, &ia_freq, &ring_freq);
143ee421bb4SAshutosh Dixit 		snb_pcode_write(llc_to_gt(llc)->uncore, GEN6_PCODE_WRITE_MIN_FREQ_TABLE,
1440dc3c562SAndi Shyti 				ia_freq << GEN6_PCODE_FREQ_IA_RATIO_SHIFT |
1450dc3c562SAndi Shyti 				ring_freq << GEN6_PCODE_FREQ_RING_RATIO_SHIFT |
1460dc3c562SAndi Shyti 				gpu_freq);
1470dc3c562SAndi Shyti 	}
1480dc3c562SAndi Shyti }
1490dc3c562SAndi Shyti 
intel_llc_enable(struct intel_llc * llc)1500dc3c562SAndi Shyti void intel_llc_enable(struct intel_llc *llc)
1510dc3c562SAndi Shyti {
1520dc3c562SAndi Shyti 	gen6_update_ring_freq(llc);
1530dc3c562SAndi Shyti }
1540dc3c562SAndi Shyti 
intel_llc_disable(struct intel_llc * llc)1550dc3c562SAndi Shyti void intel_llc_disable(struct intel_llc *llc)
1560dc3c562SAndi Shyti {
1570dc3c562SAndi Shyti 	/* Currently there is no HW configuration to be done to disable. */
1580dc3c562SAndi Shyti }
1590dc3c562SAndi Shyti 
1600dc3c562SAndi Shyti #if IS_ENABLED(CONFIG_DRM_I915_SELFTEST)
1610dc3c562SAndi Shyti #include "selftest_llc.c"
1620dc3c562SAndi Shyti #endif
163