xref: /openbsd-src/sys/dev/pci/drm/i915/gt/intel_llc.c (revision 1bb76ff151c0aba8e3312a604e4cd2e5195cf4b7)
15ca02815Sjsg // SPDX-License-Identifier: MIT
2c349dbc7Sjsg /*
3c349dbc7Sjsg  * Copyright © 2019 Intel Corporation
4c349dbc7Sjsg  */
5c349dbc7Sjsg 
6*1bb76ff1Sjsg #include <asm/tsc.h>
7c349dbc7Sjsg #include <linux/cpufreq.h>
8c349dbc7Sjsg 
9c349dbc7Sjsg #include "i915_drv.h"
10*1bb76ff1Sjsg #include "i915_reg.h"
11c349dbc7Sjsg #include "intel_gt.h"
12c349dbc7Sjsg #include "intel_llc.h"
13*1bb76ff1Sjsg #include "intel_mchbar_regs.h"
14*1bb76ff1Sjsg #include "intel_pcode.h"
15*1bb76ff1Sjsg #include "intel_rps.h"
16c349dbc7Sjsg 
17c349dbc7Sjsg struct ia_constants {
18c349dbc7Sjsg 	unsigned int min_gpu_freq;
19c349dbc7Sjsg 	unsigned int max_gpu_freq;
20c349dbc7Sjsg 
21c349dbc7Sjsg 	unsigned int min_ring_freq;
22c349dbc7Sjsg 	unsigned int max_ia_freq;
23c349dbc7Sjsg };
24c349dbc7Sjsg 
llc_to_gt(struct intel_llc * llc)25c349dbc7Sjsg static struct intel_gt *llc_to_gt(struct intel_llc *llc)
26c349dbc7Sjsg {
27c349dbc7Sjsg 	return container_of(llc, struct intel_gt, llc);
28c349dbc7Sjsg }
29c349dbc7Sjsg 
cpu_max_MHz(void)30c349dbc7Sjsg static unsigned int cpu_max_MHz(void)
31c349dbc7Sjsg {
32c349dbc7Sjsg 	struct cpufreq_policy *policy;
33c349dbc7Sjsg 	unsigned int max_khz;
34c349dbc7Sjsg 
35c349dbc7Sjsg #ifdef notyet
36c349dbc7Sjsg 	policy = cpufreq_cpu_get(0);
37c349dbc7Sjsg 	if (policy) {
38c349dbc7Sjsg 		max_khz = policy->cpuinfo.max_freq;
39c349dbc7Sjsg 		cpufreq_cpu_put(policy);
40c349dbc7Sjsg 	} else {
41c349dbc7Sjsg 		/*
42c349dbc7Sjsg 		 * Default to measured freq if none found, PCU will ensure we
43c349dbc7Sjsg 		 * don't go over
44c349dbc7Sjsg 		 */
45c349dbc7Sjsg 		max_khz = tsc_khz;
46c349dbc7Sjsg 	}
47c349dbc7Sjsg #else
48c349dbc7Sjsg 	/* XXX we ideally want the max not cpuspeed... */
49c349dbc7Sjsg 	max_khz = cpuspeed;
50c349dbc7Sjsg #endif
51c349dbc7Sjsg 
52c349dbc7Sjsg 	return max_khz / 1000;
53c349dbc7Sjsg }
54c349dbc7Sjsg 
get_ia_constants(struct intel_llc * llc,struct ia_constants * consts)55c349dbc7Sjsg static bool get_ia_constants(struct intel_llc *llc,
56c349dbc7Sjsg 			     struct ia_constants *consts)
57c349dbc7Sjsg {
58c349dbc7Sjsg 	struct drm_i915_private *i915 = llc_to_gt(llc)->i915;
59c349dbc7Sjsg 	struct intel_rps *rps = &llc_to_gt(llc)->rps;
60c349dbc7Sjsg 
61c349dbc7Sjsg 	if (!HAS_LLC(i915) || IS_DGFX(i915))
62c349dbc7Sjsg 		return false;
63c349dbc7Sjsg 
64c349dbc7Sjsg 	consts->max_ia_freq = cpu_max_MHz();
65c349dbc7Sjsg 
66c349dbc7Sjsg 	consts->min_ring_freq =
67c349dbc7Sjsg 		intel_uncore_read(llc_to_gt(llc)->uncore, DCLK) & 0xf;
68c349dbc7Sjsg 	/* convert DDR frequency from units of 266.6MHz to bandwidth */
69c349dbc7Sjsg 	consts->min_ring_freq = mult_frac(consts->min_ring_freq, 8, 3);
70c349dbc7Sjsg 
71*1bb76ff1Sjsg 	consts->min_gpu_freq = intel_rps_get_min_raw_freq(rps);
72*1bb76ff1Sjsg 	consts->max_gpu_freq = intel_rps_get_max_raw_freq(rps);
73c349dbc7Sjsg 
74c349dbc7Sjsg 	return true;
75c349dbc7Sjsg }
76c349dbc7Sjsg 
calc_ia_freq(struct intel_llc * llc,unsigned int gpu_freq,const struct ia_constants * consts,unsigned int * out_ia_freq,unsigned int * out_ring_freq)77c349dbc7Sjsg static void calc_ia_freq(struct intel_llc *llc,
78c349dbc7Sjsg 			 unsigned int gpu_freq,
79c349dbc7Sjsg 			 const struct ia_constants *consts,
80c349dbc7Sjsg 			 unsigned int *out_ia_freq,
81c349dbc7Sjsg 			 unsigned int *out_ring_freq)
82c349dbc7Sjsg {
83c349dbc7Sjsg 	struct drm_i915_private *i915 = llc_to_gt(llc)->i915;
84c349dbc7Sjsg 	const int diff = consts->max_gpu_freq - gpu_freq;
85c349dbc7Sjsg 	unsigned int ia_freq = 0, ring_freq = 0;
86c349dbc7Sjsg 
875ca02815Sjsg 	if (GRAPHICS_VER(i915) >= 9) {
88c349dbc7Sjsg 		/*
89c349dbc7Sjsg 		 * ring_freq = 2 * GT. ring_freq is in 100MHz units
90c349dbc7Sjsg 		 * No floor required for ring frequency on SKL.
91c349dbc7Sjsg 		 */
92c349dbc7Sjsg 		ring_freq = gpu_freq;
935ca02815Sjsg 	} else if (GRAPHICS_VER(i915) >= 8) {
94c349dbc7Sjsg 		/* max(2 * GT, DDR). NB: GT is 50MHz units */
95c349dbc7Sjsg 		ring_freq = max(consts->min_ring_freq, gpu_freq);
96c349dbc7Sjsg 	} else if (IS_HASWELL(i915)) {
97c349dbc7Sjsg 		ring_freq = mult_frac(gpu_freq, 5, 4);
98c349dbc7Sjsg 		ring_freq = max(consts->min_ring_freq, ring_freq);
99c349dbc7Sjsg 		/* leave ia_freq as the default, chosen by cpufreq */
100c349dbc7Sjsg 	} else {
101c349dbc7Sjsg 		const int min_freq = 15;
102c349dbc7Sjsg 		const int scale = 180;
103c349dbc7Sjsg 
104c349dbc7Sjsg 		/*
105c349dbc7Sjsg 		 * On older processors, there is no separate ring
106c349dbc7Sjsg 		 * clock domain, so in order to boost the bandwidth
107c349dbc7Sjsg 		 * of the ring, we need to upclock the CPU (ia_freq).
108c349dbc7Sjsg 		 *
109c349dbc7Sjsg 		 * For GPU frequencies less than 750MHz,
110c349dbc7Sjsg 		 * just use the lowest ring freq.
111c349dbc7Sjsg 		 */
112c349dbc7Sjsg 		if (gpu_freq < min_freq)
113c349dbc7Sjsg 			ia_freq = 800;
114c349dbc7Sjsg 		else
115c349dbc7Sjsg 			ia_freq = consts->max_ia_freq - diff * scale / 2;
116c349dbc7Sjsg 		ia_freq = DIV_ROUND_CLOSEST(ia_freq, 100);
117c349dbc7Sjsg 	}
118c349dbc7Sjsg 
119c349dbc7Sjsg 	*out_ia_freq = ia_freq;
120c349dbc7Sjsg 	*out_ring_freq = ring_freq;
121c349dbc7Sjsg }
122c349dbc7Sjsg 
gen6_update_ring_freq(struct intel_llc * llc)123c349dbc7Sjsg static void gen6_update_ring_freq(struct intel_llc *llc)
124c349dbc7Sjsg {
125c349dbc7Sjsg 	struct ia_constants consts;
126c349dbc7Sjsg 	unsigned int gpu_freq;
127c349dbc7Sjsg 
128c349dbc7Sjsg 	if (!get_ia_constants(llc, &consts))
129c349dbc7Sjsg 		return;
130c349dbc7Sjsg 
131c349dbc7Sjsg 	/*
132*1bb76ff1Sjsg 	 * Although this is unlikely on any platform during initialization,
133*1bb76ff1Sjsg 	 * let's ensure we don't get accidentally into infinite loop
134*1bb76ff1Sjsg 	 */
135*1bb76ff1Sjsg 	if (consts.max_gpu_freq <= consts.min_gpu_freq)
136*1bb76ff1Sjsg 		return;
137*1bb76ff1Sjsg 	/*
138c349dbc7Sjsg 	 * For each potential GPU frequency, load a ring frequency we'd like
139c349dbc7Sjsg 	 * to use for memory access.  We do this by specifying the IA frequency
140c349dbc7Sjsg 	 * the PCU should use as a reference to determine the ring frequency.
141c349dbc7Sjsg 	 */
142c349dbc7Sjsg 	for (gpu_freq = consts.max_gpu_freq;
143c349dbc7Sjsg 	     gpu_freq >= consts.min_gpu_freq;
144c349dbc7Sjsg 	     gpu_freq--) {
145c349dbc7Sjsg 		unsigned int ia_freq, ring_freq;
146c349dbc7Sjsg 
147c349dbc7Sjsg 		calc_ia_freq(llc, gpu_freq, &consts, &ia_freq, &ring_freq);
148*1bb76ff1Sjsg 		snb_pcode_write(llc_to_gt(llc)->uncore, GEN6_PCODE_WRITE_MIN_FREQ_TABLE,
149c349dbc7Sjsg 				ia_freq << GEN6_PCODE_FREQ_IA_RATIO_SHIFT |
150c349dbc7Sjsg 				ring_freq << GEN6_PCODE_FREQ_RING_RATIO_SHIFT |
151c349dbc7Sjsg 				gpu_freq);
152c349dbc7Sjsg 	}
153c349dbc7Sjsg }
154c349dbc7Sjsg 
intel_llc_enable(struct intel_llc * llc)155c349dbc7Sjsg void intel_llc_enable(struct intel_llc *llc)
156c349dbc7Sjsg {
157c349dbc7Sjsg 	gen6_update_ring_freq(llc);
158c349dbc7Sjsg }
159c349dbc7Sjsg 
intel_llc_disable(struct intel_llc * llc)160c349dbc7Sjsg void intel_llc_disable(struct intel_llc *llc)
161c349dbc7Sjsg {
162c349dbc7Sjsg 	/* Currently there is no HW configuration to be done to disable. */
163c349dbc7Sjsg }
164c349dbc7Sjsg 
165c349dbc7Sjsg #if IS_ENABLED(CONFIG_DRM_I915_SELFTEST)
166c349dbc7Sjsg #include "selftest_llc.c"
167c349dbc7Sjsg #endif
168