xref: /openbsd-src/sys/dev/pci/drm/i915/display/intel_bw.c (revision f005ef32267c16bdb134f0e9fa4477dbe07c263a)
1c349dbc7Sjsg // SPDX-License-Identifier: MIT
2c349dbc7Sjsg /*
3c349dbc7Sjsg  * Copyright © 2019 Intel Corporation
4c349dbc7Sjsg  */
5c349dbc7Sjsg 
6c349dbc7Sjsg #include <drm/drm_atomic_state_helper.h>
7c349dbc7Sjsg 
81bb76ff1Sjsg #include "i915_drv.h"
91bb76ff1Sjsg #include "i915_reg.h"
101bb76ff1Sjsg #include "i915_utils.h"
11ad8b1aafSjsg #include "intel_atomic.h"
12c349dbc7Sjsg #include "intel_bw.h"
13ad8b1aafSjsg #include "intel_cdclk.h"
141bb76ff1Sjsg #include "intel_display_core.h"
15c349dbc7Sjsg #include "intel_display_types.h"
161bb76ff1Sjsg #include "skl_watermark.h"
171bb76ff1Sjsg #include "intel_mchbar_regs.h"
181bb76ff1Sjsg #include "intel_pcode.h"
19c349dbc7Sjsg 
20c349dbc7Sjsg /* Parameters for Qclk Geyserville (QGV) */
21c349dbc7Sjsg struct intel_qgv_point {
22c349dbc7Sjsg 	u16 dclk, t_rp, t_rdpre, t_rc, t_ras, t_rcd;
23c349dbc7Sjsg };
24c349dbc7Sjsg 
255ca02815Sjsg struct intel_psf_gv_point {
265ca02815Sjsg 	u8 clk; /* clock in multiples of 16.6666 MHz */
27c349dbc7Sjsg };
28c349dbc7Sjsg 
295ca02815Sjsg struct intel_qgv_info {
305ca02815Sjsg 	struct intel_qgv_point points[I915_NUM_QGV_POINTS];
315ca02815Sjsg 	struct intel_psf_gv_point psf_points[I915_NUM_PSF_GV_POINTS];
325ca02815Sjsg 	u8 num_points;
335ca02815Sjsg 	u8 num_psf_points;
345ca02815Sjsg 	u8 t_bl;
351bb76ff1Sjsg 	u8 max_numchannels;
361bb76ff1Sjsg 	u8 channel_width;
371bb76ff1Sjsg 	u8 deinterleave;
385ca02815Sjsg };
395ca02815Sjsg 
dg1_mchbar_read_qgv_point_info(struct drm_i915_private * dev_priv,struct intel_qgv_point * sp,int point)405ca02815Sjsg static int dg1_mchbar_read_qgv_point_info(struct drm_i915_private *dev_priv,
415ca02815Sjsg 					  struct intel_qgv_point *sp,
425ca02815Sjsg 					  int point)
43c349dbc7Sjsg {
445ca02815Sjsg 	u32 dclk_ratio, dclk_reference;
455ca02815Sjsg 	u32 val;
46c349dbc7Sjsg 
475ca02815Sjsg 	val = intel_uncore_read(&dev_priv->uncore, SA_PERF_STATUS_0_0_0_MCHBAR_PC);
485ca02815Sjsg 	dclk_ratio = REG_FIELD_GET(DG1_QCLK_RATIO_MASK, val);
495ca02815Sjsg 	if (val & DG1_QCLK_REFERENCE)
505ca02815Sjsg 		dclk_reference = 6; /* 6 * 16.666 MHz = 100 MHz */
515ca02815Sjsg 	else
525ca02815Sjsg 		dclk_reference = 8; /* 8 * 16.666 MHz = 133 MHz */
531bb76ff1Sjsg 	sp->dclk = DIV_ROUND_UP((16667 * dclk_ratio * dclk_reference) + 500, 1000);
54c349dbc7Sjsg 
555ca02815Sjsg 	val = intel_uncore_read(&dev_priv->uncore, SKL_MC_BIOS_DATA_0_0_0_MCHBAR_PCU);
565ca02815Sjsg 	if (val & DG1_GEAR_TYPE)
575ca02815Sjsg 		sp->dclk *= 2;
58c349dbc7Sjsg 
595ca02815Sjsg 	if (sp->dclk == 0)
605ca02815Sjsg 		return -EINVAL;
61c349dbc7Sjsg 
625ca02815Sjsg 	val = intel_uncore_read(&dev_priv->uncore, MCHBAR_CH0_CR_TC_PRE_0_0_0_MCHBAR);
635ca02815Sjsg 	sp->t_rp = REG_FIELD_GET(DG1_DRAM_T_RP_MASK, val);
645ca02815Sjsg 	sp->t_rdpre = REG_FIELD_GET(DG1_DRAM_T_RDPRE_MASK, val);
655ca02815Sjsg 
665ca02815Sjsg 	val = intel_uncore_read(&dev_priv->uncore, MCHBAR_CH0_CR_TC_PRE_0_0_0_MCHBAR_HIGH);
675ca02815Sjsg 	sp->t_rcd = REG_FIELD_GET(DG1_DRAM_T_RCD_MASK, val);
685ca02815Sjsg 	sp->t_ras = REG_FIELD_GET(DG1_DRAM_T_RAS_MASK, val);
695ca02815Sjsg 
705ca02815Sjsg 	sp->t_rc = sp->t_rp + sp->t_ras;
71c349dbc7Sjsg 
72c349dbc7Sjsg 	return 0;
73c349dbc7Sjsg }
74c349dbc7Sjsg 
icl_pcode_read_qgv_point_info(struct drm_i915_private * dev_priv,struct intel_qgv_point * sp,int point)75c349dbc7Sjsg static int icl_pcode_read_qgv_point_info(struct drm_i915_private *dev_priv,
76c349dbc7Sjsg 					 struct intel_qgv_point *sp,
77c349dbc7Sjsg 					 int point)
78c349dbc7Sjsg {
79c349dbc7Sjsg 	u32 val = 0, val2 = 0;
801bb76ff1Sjsg 	u16 dclk;
81c349dbc7Sjsg 	int ret;
82c349dbc7Sjsg 
831bb76ff1Sjsg 	ret = snb_pcode_read(&dev_priv->uncore, ICL_PCODE_MEM_SUBSYSYSTEM_INFO |
84c349dbc7Sjsg 			     ICL_PCODE_MEM_SS_READ_QGV_POINT_INFO(point),
85c349dbc7Sjsg 			     &val, &val2);
86c349dbc7Sjsg 	if (ret)
87c349dbc7Sjsg 		return ret;
88c349dbc7Sjsg 
891bb76ff1Sjsg 	dclk = val & 0xffff;
901bb76ff1Sjsg 	sp->dclk = DIV_ROUND_UP((16667 * dclk) + (DISPLAY_VER(dev_priv) > 11 ? 500 : 0), 1000);
91c349dbc7Sjsg 	sp->t_rp = (val & 0xff0000) >> 16;
92c349dbc7Sjsg 	sp->t_rcd = (val & 0xff000000) >> 24;
93c349dbc7Sjsg 
94c349dbc7Sjsg 	sp->t_rdpre = val2 & 0xff;
95c349dbc7Sjsg 	sp->t_ras = (val2 & 0xff00) >> 8;
96c349dbc7Sjsg 
97c349dbc7Sjsg 	sp->t_rc = sp->t_rp + sp->t_ras;
98c349dbc7Sjsg 
99c349dbc7Sjsg 	return 0;
100c349dbc7Sjsg }
101c349dbc7Sjsg 
adls_pcode_read_psf_gv_point_info(struct drm_i915_private * dev_priv,struct intel_psf_gv_point * points)1025ca02815Sjsg static int adls_pcode_read_psf_gv_point_info(struct drm_i915_private *dev_priv,
1035ca02815Sjsg 					    struct intel_psf_gv_point *points)
1045ca02815Sjsg {
1055ca02815Sjsg 	u32 val = 0;
1065ca02815Sjsg 	int ret;
1075ca02815Sjsg 	int i;
1085ca02815Sjsg 
1091bb76ff1Sjsg 	ret = snb_pcode_read(&dev_priv->uncore, ICL_PCODE_MEM_SUBSYSYSTEM_INFO |
1101bb76ff1Sjsg 			     ADL_PCODE_MEM_SS_READ_PSF_GV_INFO, &val, NULL);
1115ca02815Sjsg 	if (ret)
1125ca02815Sjsg 		return ret;
1135ca02815Sjsg 
1145ca02815Sjsg 	for (i = 0; i < I915_NUM_PSF_GV_POINTS; i++) {
1155ca02815Sjsg 		points[i].clk = val & 0xff;
1165ca02815Sjsg 		val >>= 8;
1175ca02815Sjsg 	}
1185ca02815Sjsg 
1195ca02815Sjsg 	return 0;
1205ca02815Sjsg }
1215ca02815Sjsg 
icl_qgv_points_mask(struct drm_i915_private * i915)122*f005ef32Sjsg static u16 icl_qgv_points_mask(struct drm_i915_private *i915)
123*f005ef32Sjsg {
124*f005ef32Sjsg 	unsigned int num_psf_gv_points = i915->display.bw.max[0].num_psf_gv_points;
125*f005ef32Sjsg 	unsigned int num_qgv_points = i915->display.bw.max[0].num_qgv_points;
126*f005ef32Sjsg 	u16 qgv_points = 0, psf_points = 0;
127*f005ef32Sjsg 
128*f005ef32Sjsg 	/*
129*f005ef32Sjsg 	 * We can _not_ use the whole ADLS_QGV_PT_MASK here, as PCode rejects
130*f005ef32Sjsg 	 * it with failure if we try masking any unadvertised points.
131*f005ef32Sjsg 	 * So need to operate only with those returned from PCode.
132*f005ef32Sjsg 	 */
133*f005ef32Sjsg 	if (num_qgv_points > 0)
134*f005ef32Sjsg 		qgv_points = GENMASK(num_qgv_points - 1, 0);
135*f005ef32Sjsg 
136*f005ef32Sjsg 	if (num_psf_gv_points > 0)
137*f005ef32Sjsg 		psf_points = GENMASK(num_psf_gv_points - 1, 0);
138*f005ef32Sjsg 
139*f005ef32Sjsg 	return ICL_PCODE_REQ_QGV_PT(qgv_points) | ADLS_PCODE_REQ_PSF_PT(psf_points);
140*f005ef32Sjsg }
141*f005ef32Sjsg 
is_sagv_enabled(struct drm_i915_private * i915,u16 points_mask)142*f005ef32Sjsg static bool is_sagv_enabled(struct drm_i915_private *i915, u16 points_mask)
143*f005ef32Sjsg {
144*f005ef32Sjsg 	return !is_power_of_2(~points_mask & icl_qgv_points_mask(i915) &
145*f005ef32Sjsg 			      ICL_PCODE_REQ_QGV_PT_MASK);
146*f005ef32Sjsg }
147*f005ef32Sjsg 
icl_pcode_restrict_qgv_points(struct drm_i915_private * dev_priv,u32 points_mask)148ad8b1aafSjsg int icl_pcode_restrict_qgv_points(struct drm_i915_private *dev_priv,
149ad8b1aafSjsg 				  u32 points_mask)
150ad8b1aafSjsg {
151ad8b1aafSjsg 	int ret;
152ad8b1aafSjsg 
153*f005ef32Sjsg 	if (DISPLAY_VER(dev_priv) >= 14)
154*f005ef32Sjsg 		return 0;
155*f005ef32Sjsg 
156ad8b1aafSjsg 	/* bspec says to keep retrying for at least 1 ms */
1571bb76ff1Sjsg 	ret = skl_pcode_request(&dev_priv->uncore, ICL_PCODE_SAGV_DE_MEM_SS_CONFIG,
158ad8b1aafSjsg 				points_mask,
1591bb76ff1Sjsg 				ICL_PCODE_REP_QGV_MASK | ADLS_PCODE_REP_PSF_MASK,
1601bb76ff1Sjsg 				ICL_PCODE_REP_QGV_SAFE | ADLS_PCODE_REP_PSF_SAFE,
161ad8b1aafSjsg 				1);
162ad8b1aafSjsg 
163ad8b1aafSjsg 	if (ret < 0) {
1645ca02815Sjsg 		drm_err(&dev_priv->drm, "Failed to disable qgv points (%d) points: 0x%x\n", ret, points_mask);
165ad8b1aafSjsg 		return ret;
166ad8b1aafSjsg 	}
167ad8b1aafSjsg 
168*f005ef32Sjsg 	dev_priv->display.sagv.status = is_sagv_enabled(dev_priv, points_mask) ?
169*f005ef32Sjsg 		I915_SAGV_ENABLED : I915_SAGV_DISABLED;
170*f005ef32Sjsg 
171ad8b1aafSjsg 	return 0;
172ad8b1aafSjsg }
173ad8b1aafSjsg 
mtl_read_qgv_point_info(struct drm_i915_private * dev_priv,struct intel_qgv_point * sp,int point)1741bb76ff1Sjsg static int mtl_read_qgv_point_info(struct drm_i915_private *dev_priv,
1751bb76ff1Sjsg 				   struct intel_qgv_point *sp, int point)
1761bb76ff1Sjsg {
1771bb76ff1Sjsg 	u32 val, val2;
1781bb76ff1Sjsg 	u16 dclk;
1791bb76ff1Sjsg 
1801bb76ff1Sjsg 	val = intel_uncore_read(&dev_priv->uncore,
1811bb76ff1Sjsg 				MTL_MEM_SS_INFO_QGV_POINT_LOW(point));
1821bb76ff1Sjsg 	val2 = intel_uncore_read(&dev_priv->uncore,
1831bb76ff1Sjsg 				 MTL_MEM_SS_INFO_QGV_POINT_HIGH(point));
1841bb76ff1Sjsg 	dclk = REG_FIELD_GET(MTL_DCLK_MASK, val);
185*f005ef32Sjsg 	sp->dclk = DIV_ROUND_CLOSEST(16667 * dclk, 1000);
1861bb76ff1Sjsg 	sp->t_rp = REG_FIELD_GET(MTL_TRP_MASK, val);
1871bb76ff1Sjsg 	sp->t_rcd = REG_FIELD_GET(MTL_TRCD_MASK, val);
1881bb76ff1Sjsg 
1891bb76ff1Sjsg 	sp->t_rdpre = REG_FIELD_GET(MTL_TRDPRE_MASK, val2);
1901bb76ff1Sjsg 	sp->t_ras = REG_FIELD_GET(MTL_TRAS_MASK, val2);
1911bb76ff1Sjsg 
1921bb76ff1Sjsg 	sp->t_rc = sp->t_rp + sp->t_ras;
1931bb76ff1Sjsg 
1941bb76ff1Sjsg 	return 0;
1951bb76ff1Sjsg }
1961bb76ff1Sjsg 
1971bb76ff1Sjsg static int
intel_read_qgv_point_info(struct drm_i915_private * dev_priv,struct intel_qgv_point * sp,int point)1981bb76ff1Sjsg intel_read_qgv_point_info(struct drm_i915_private *dev_priv,
1991bb76ff1Sjsg 			  struct intel_qgv_point *sp,
2001bb76ff1Sjsg 			  int point)
2011bb76ff1Sjsg {
2021bb76ff1Sjsg 	if (DISPLAY_VER(dev_priv) >= 14)
2031bb76ff1Sjsg 		return mtl_read_qgv_point_info(dev_priv, sp, point);
2041bb76ff1Sjsg 	else if (IS_DG1(dev_priv))
2051bb76ff1Sjsg 		return dg1_mchbar_read_qgv_point_info(dev_priv, sp, point);
2061bb76ff1Sjsg 	else
2071bb76ff1Sjsg 		return icl_pcode_read_qgv_point_info(dev_priv, sp, point);
2081bb76ff1Sjsg }
2091bb76ff1Sjsg 
icl_get_qgv_points(struct drm_i915_private * dev_priv,struct intel_qgv_info * qi,bool is_y_tile)210c349dbc7Sjsg static int icl_get_qgv_points(struct drm_i915_private *dev_priv,
2111bb76ff1Sjsg 			      struct intel_qgv_info *qi,
2121bb76ff1Sjsg 			      bool is_y_tile)
213c349dbc7Sjsg {
2145ca02815Sjsg 	const struct dram_info *dram_info = &dev_priv->dram_info;
215c349dbc7Sjsg 	int i, ret;
216c349dbc7Sjsg 
2175ca02815Sjsg 	qi->num_points = dram_info->num_qgv_points;
2185ca02815Sjsg 	qi->num_psf_points = dram_info->num_psf_gv_points;
2195ca02815Sjsg 
2201bb76ff1Sjsg 	if (DISPLAY_VER(dev_priv) >= 14) {
2215ca02815Sjsg 		switch (dram_info->type) {
2225ca02815Sjsg 		case INTEL_DRAM_DDR4:
2235ca02815Sjsg 			qi->t_bl = 4;
2241bb76ff1Sjsg 			qi->max_numchannels = 2;
2251bb76ff1Sjsg 			qi->channel_width = 64;
2261bb76ff1Sjsg 			qi->deinterleave = 2;
2275ca02815Sjsg 			break;
2285ca02815Sjsg 		case INTEL_DRAM_DDR5:
2295ca02815Sjsg 			qi->t_bl = 8;
2301bb76ff1Sjsg 			qi->max_numchannels = 4;
2311bb76ff1Sjsg 			qi->channel_width = 32;
2321bb76ff1Sjsg 			qi->deinterleave = 2;
2331bb76ff1Sjsg 			break;
2341bb76ff1Sjsg 		case INTEL_DRAM_LPDDR4:
2351bb76ff1Sjsg 		case INTEL_DRAM_LPDDR5:
2361bb76ff1Sjsg 			qi->t_bl = 16;
2371bb76ff1Sjsg 			qi->max_numchannels = 8;
2381bb76ff1Sjsg 			qi->channel_width = 16;
2391bb76ff1Sjsg 			qi->deinterleave = 4;
2401bb76ff1Sjsg 			break;
2411bb76ff1Sjsg 		default:
2421bb76ff1Sjsg 			MISSING_CASE(dram_info->type);
2431bb76ff1Sjsg 			return -EINVAL;
2441bb76ff1Sjsg 		}
2451bb76ff1Sjsg 	} else if (DISPLAY_VER(dev_priv) >= 12) {
2461bb76ff1Sjsg 		switch (dram_info->type) {
2471bb76ff1Sjsg 		case INTEL_DRAM_DDR4:
2481bb76ff1Sjsg 			qi->t_bl = is_y_tile ? 8 : 4;
2491bb76ff1Sjsg 			qi->max_numchannels = 2;
2501bb76ff1Sjsg 			qi->channel_width = 64;
2511bb76ff1Sjsg 			qi->deinterleave = is_y_tile ? 1 : 2;
2521bb76ff1Sjsg 			break;
2531bb76ff1Sjsg 		case INTEL_DRAM_DDR5:
2541bb76ff1Sjsg 			qi->t_bl = is_y_tile ? 16 : 8;
2551bb76ff1Sjsg 			qi->max_numchannels = 4;
2561bb76ff1Sjsg 			qi->channel_width = 32;
2571bb76ff1Sjsg 			qi->deinterleave = is_y_tile ? 1 : 2;
2581bb76ff1Sjsg 			break;
2591bb76ff1Sjsg 		case INTEL_DRAM_LPDDR4:
2601bb76ff1Sjsg 			if (IS_ROCKETLAKE(dev_priv)) {
2611bb76ff1Sjsg 				qi->t_bl = 8;
2621bb76ff1Sjsg 				qi->max_numchannels = 4;
2631bb76ff1Sjsg 				qi->channel_width = 32;
2641bb76ff1Sjsg 				qi->deinterleave = 2;
2651bb76ff1Sjsg 				break;
2661bb76ff1Sjsg 			}
2671bb76ff1Sjsg 			fallthrough;
2681bb76ff1Sjsg 		case INTEL_DRAM_LPDDR5:
2691bb76ff1Sjsg 			qi->t_bl = 16;
2701bb76ff1Sjsg 			qi->max_numchannels = 8;
2711bb76ff1Sjsg 			qi->channel_width = 16;
2721bb76ff1Sjsg 			qi->deinterleave = is_y_tile ? 2 : 4;
2735ca02815Sjsg 			break;
2745ca02815Sjsg 		default:
2755ca02815Sjsg 			qi->t_bl = 16;
2761bb76ff1Sjsg 			qi->max_numchannels = 1;
2775ca02815Sjsg 			break;
2785ca02815Sjsg 		}
2791bb76ff1Sjsg 	} else if (DISPLAY_VER(dev_priv) == 11) {
2805ca02815Sjsg 		qi->t_bl = dev_priv->dram_info.type == INTEL_DRAM_DDR4 ? 4 : 8;
2811bb76ff1Sjsg 		qi->max_numchannels = 1;
2821bb76ff1Sjsg 	}
283c349dbc7Sjsg 
284c349dbc7Sjsg 	if (drm_WARN_ON(&dev_priv->drm,
285c349dbc7Sjsg 			qi->num_points > ARRAY_SIZE(qi->points)))
286c349dbc7Sjsg 		qi->num_points = ARRAY_SIZE(qi->points);
287c349dbc7Sjsg 
288c349dbc7Sjsg 	for (i = 0; i < qi->num_points; i++) {
289c349dbc7Sjsg 		struct intel_qgv_point *sp = &qi->points[i];
290c349dbc7Sjsg 
2911bb76ff1Sjsg 		ret = intel_read_qgv_point_info(dev_priv, sp, i);
292c349dbc7Sjsg 		if (ret)
293c349dbc7Sjsg 			return ret;
294c349dbc7Sjsg 
295c349dbc7Sjsg 		drm_dbg_kms(&dev_priv->drm,
296c349dbc7Sjsg 			    "QGV %d: DCLK=%d tRP=%d tRDPRE=%d tRAS=%d tRCD=%d tRC=%d\n",
297c349dbc7Sjsg 			    i, sp->dclk, sp->t_rp, sp->t_rdpre, sp->t_ras,
298c349dbc7Sjsg 			    sp->t_rcd, sp->t_rc);
299c349dbc7Sjsg 	}
300c349dbc7Sjsg 
3015ca02815Sjsg 	if (qi->num_psf_points > 0) {
3025ca02815Sjsg 		ret = adls_pcode_read_psf_gv_point_info(dev_priv, qi->psf_points);
3035ca02815Sjsg 		if (ret) {
3045ca02815Sjsg 			drm_err(&dev_priv->drm, "Failed to read PSF point data; PSF points will not be considered in bandwidth calculations.\n");
3055ca02815Sjsg 			qi->num_psf_points = 0;
3065ca02815Sjsg 		}
3075ca02815Sjsg 
3085ca02815Sjsg 		for (i = 0; i < qi->num_psf_points; i++)
3095ca02815Sjsg 			drm_dbg_kms(&dev_priv->drm,
3105ca02815Sjsg 				    "PSF GV %d: CLK=%d \n",
3115ca02815Sjsg 				    i, qi->psf_points[i].clk);
3125ca02815Sjsg 	}
3135ca02815Sjsg 
314c349dbc7Sjsg 	return 0;
315c349dbc7Sjsg }
316c349dbc7Sjsg 
adl_calc_psf_bw(int clk)3175ca02815Sjsg static int adl_calc_psf_bw(int clk)
3185ca02815Sjsg {
3195ca02815Sjsg 	/*
3205ca02815Sjsg 	 * clk is multiples of 16.666MHz (100/6)
3215ca02815Sjsg 	 * According to BSpec PSF GV bandwidth is
3225ca02815Sjsg 	 * calculated as BW = 64 * clk * 16.666Mhz
3235ca02815Sjsg 	 */
3245ca02815Sjsg 	return DIV_ROUND_CLOSEST(64 * clk * 100, 6);
3255ca02815Sjsg }
3265ca02815Sjsg 
icl_sagv_max_dclk(const struct intel_qgv_info * qi)327c349dbc7Sjsg static int icl_sagv_max_dclk(const struct intel_qgv_info *qi)
328c349dbc7Sjsg {
329c349dbc7Sjsg 	u16 dclk = 0;
330c349dbc7Sjsg 	int i;
331c349dbc7Sjsg 
332c349dbc7Sjsg 	for (i = 0; i < qi->num_points; i++)
333c349dbc7Sjsg 		dclk = max(dclk, qi->points[i].dclk);
334c349dbc7Sjsg 
335c349dbc7Sjsg 	return dclk;
336c349dbc7Sjsg }
337c349dbc7Sjsg 
338c349dbc7Sjsg struct intel_sa_info {
339c349dbc7Sjsg 	u16 displayrtids;
3405ca02815Sjsg 	u8 deburst, deprogbwlimit, derating;
341c349dbc7Sjsg };
342c349dbc7Sjsg 
343c349dbc7Sjsg static const struct intel_sa_info icl_sa_info = {
344c349dbc7Sjsg 	.deburst = 8,
345c349dbc7Sjsg 	.deprogbwlimit = 25, /* GB/s */
346c349dbc7Sjsg 	.displayrtids = 128,
3475ca02815Sjsg 	.derating = 10,
348c349dbc7Sjsg };
349c349dbc7Sjsg 
350c349dbc7Sjsg static const struct intel_sa_info tgl_sa_info = {
351c349dbc7Sjsg 	.deburst = 16,
352c349dbc7Sjsg 	.deprogbwlimit = 34, /* GB/s */
353c349dbc7Sjsg 	.displayrtids = 256,
3545ca02815Sjsg 	.derating = 10,
355c349dbc7Sjsg };
356c349dbc7Sjsg 
357ad8b1aafSjsg static const struct intel_sa_info rkl_sa_info = {
3581bb76ff1Sjsg 	.deburst = 8,
359ad8b1aafSjsg 	.deprogbwlimit = 20, /* GB/s */
360ad8b1aafSjsg 	.displayrtids = 128,
3615ca02815Sjsg 	.derating = 10,
3625ca02815Sjsg };
3635ca02815Sjsg 
3645ca02815Sjsg static const struct intel_sa_info adls_sa_info = {
3655ca02815Sjsg 	.deburst = 16,
3665ca02815Sjsg 	.deprogbwlimit = 38, /* GB/s */
3675ca02815Sjsg 	.displayrtids = 256,
3685ca02815Sjsg 	.derating = 10,
3695ca02815Sjsg };
3705ca02815Sjsg 
3715ca02815Sjsg static const struct intel_sa_info adlp_sa_info = {
3725ca02815Sjsg 	.deburst = 16,
3735ca02815Sjsg 	.deprogbwlimit = 38, /* GB/s */
3745ca02815Sjsg 	.displayrtids = 256,
3755ca02815Sjsg 	.derating = 20,
376ad8b1aafSjsg };
377ad8b1aafSjsg 
3781bb76ff1Sjsg static const struct intel_sa_info mtl_sa_info = {
3791bb76ff1Sjsg 	.deburst = 32,
3801bb76ff1Sjsg 	.deprogbwlimit = 38, /* GB/s */
3811bb76ff1Sjsg 	.displayrtids = 256,
382*f005ef32Sjsg 	.derating = 10,
3831bb76ff1Sjsg };
3841bb76ff1Sjsg 
icl_get_bw_info(struct drm_i915_private * dev_priv,const struct intel_sa_info * sa)385c349dbc7Sjsg static int icl_get_bw_info(struct drm_i915_private *dev_priv, const struct intel_sa_info *sa)
386c349dbc7Sjsg {
387c349dbc7Sjsg 	struct intel_qgv_info qi = {};
388c349dbc7Sjsg 	bool is_y_tile = true; /* assume y tile may be used */
3895ca02815Sjsg 	int num_channels = max_t(u8, 1, dev_priv->dram_info.num_channels);
3901bb76ff1Sjsg 	int ipqdepth, ipqdepthpch = 16;
391c349dbc7Sjsg 	int dclk_max;
392c349dbc7Sjsg 	int maxdebw;
3931bb76ff1Sjsg 	int num_groups = ARRAY_SIZE(dev_priv->display.bw.max);
394c349dbc7Sjsg 	int i, ret;
395c349dbc7Sjsg 
3961bb76ff1Sjsg 	ret = icl_get_qgv_points(dev_priv, &qi, is_y_tile);
397c349dbc7Sjsg 	if (ret) {
398c349dbc7Sjsg 		drm_dbg_kms(&dev_priv->drm,
399c349dbc7Sjsg 			    "Failed to get memory subsystem information, ignoring bandwidth limits");
400c349dbc7Sjsg 		return ret;
401c349dbc7Sjsg 	}
402c349dbc7Sjsg 
403c349dbc7Sjsg 	dclk_max = icl_sagv_max_dclk(&qi);
4041bb76ff1Sjsg 	maxdebw = min(sa->deprogbwlimit * 1000, dclk_max * 16 * 6 / 10);
405c349dbc7Sjsg 	ipqdepth = min(ipqdepthpch, sa->displayrtids / num_channels);
4061bb76ff1Sjsg 	qi.deinterleave = DIV_ROUND_UP(num_channels, is_y_tile ? 4 : 2);
407c349dbc7Sjsg 
4081bb76ff1Sjsg 	for (i = 0; i < num_groups; i++) {
4091bb76ff1Sjsg 		struct intel_bw_info *bi = &dev_priv->display.bw.max[i];
410c349dbc7Sjsg 		int clpchgroup;
411c349dbc7Sjsg 		int j;
412c349dbc7Sjsg 
4131bb76ff1Sjsg 		clpchgroup = (sa->deburst * qi.deinterleave / num_channels) << i;
414c349dbc7Sjsg 		bi->num_planes = (ipqdepth - clpchgroup) / clpchgroup + 1;
415c349dbc7Sjsg 
416c349dbc7Sjsg 		bi->num_qgv_points = qi.num_points;
4175ca02815Sjsg 		bi->num_psf_gv_points = qi.num_psf_points;
418c349dbc7Sjsg 
419c349dbc7Sjsg 		for (j = 0; j < qi.num_points; j++) {
420c349dbc7Sjsg 			const struct intel_qgv_point *sp = &qi.points[j];
421c349dbc7Sjsg 			int ct, bw;
422c349dbc7Sjsg 
423c349dbc7Sjsg 			/*
424c349dbc7Sjsg 			 * Max row cycle time
425c349dbc7Sjsg 			 *
426c349dbc7Sjsg 			 * FIXME what is the logic behind the
427c349dbc7Sjsg 			 * assumed burst length?
428c349dbc7Sjsg 			 */
429c349dbc7Sjsg 			ct = max_t(int, sp->t_rc, sp->t_rp + sp->t_rcd +
430c349dbc7Sjsg 				   (clpchgroup - 1) * qi.t_bl + sp->t_rdpre);
4311bb76ff1Sjsg 			bw = DIV_ROUND_UP(sp->dclk * clpchgroup * 32 * num_channels, ct);
4321bb76ff1Sjsg 
4331bb76ff1Sjsg 			bi->deratedbw[j] = min(maxdebw,
4341bb76ff1Sjsg 					       bw * (100 - sa->derating) / 100);
4351bb76ff1Sjsg 
4361bb76ff1Sjsg 			drm_dbg_kms(&dev_priv->drm,
4371bb76ff1Sjsg 				    "BW%d / QGV %d: num_planes=%d deratedbw=%u\n",
4381bb76ff1Sjsg 				    i, j, bi->num_planes, bi->deratedbw[j]);
4391bb76ff1Sjsg 		}
4401bb76ff1Sjsg 	}
4411bb76ff1Sjsg 	/*
4421bb76ff1Sjsg 	 * In case if SAGV is disabled in BIOS, we always get 1
4431bb76ff1Sjsg 	 * SAGV point, but we can't send PCode commands to restrict it
4441bb76ff1Sjsg 	 * as it will fail and pointless anyway.
4451bb76ff1Sjsg 	 */
4461bb76ff1Sjsg 	if (qi.num_points == 1)
4471bb76ff1Sjsg 		dev_priv->display.sagv.status = I915_SAGV_NOT_CONTROLLED;
4481bb76ff1Sjsg 	else
4491bb76ff1Sjsg 		dev_priv->display.sagv.status = I915_SAGV_ENABLED;
4501bb76ff1Sjsg 
4511bb76ff1Sjsg 	return 0;
4521bb76ff1Sjsg }
4531bb76ff1Sjsg 
tgl_get_bw_info(struct drm_i915_private * dev_priv,const struct intel_sa_info * sa)4541bb76ff1Sjsg static int tgl_get_bw_info(struct drm_i915_private *dev_priv, const struct intel_sa_info *sa)
4551bb76ff1Sjsg {
4561bb76ff1Sjsg 	struct intel_qgv_info qi = {};
4571bb76ff1Sjsg 	const struct dram_info *dram_info = &dev_priv->dram_info;
4581bb76ff1Sjsg 	bool is_y_tile = true; /* assume y tile may be used */
4591bb76ff1Sjsg 	int num_channels = max_t(u8, 1, dev_priv->dram_info.num_channels);
4601bb76ff1Sjsg 	int ipqdepth, ipqdepthpch = 16;
4611bb76ff1Sjsg 	int dclk_max;
4621bb76ff1Sjsg 	int maxdebw, peakbw;
4631bb76ff1Sjsg 	int clperchgroup;
4641bb76ff1Sjsg 	int num_groups = ARRAY_SIZE(dev_priv->display.bw.max);
4651bb76ff1Sjsg 	int i, ret;
4661bb76ff1Sjsg 
4671bb76ff1Sjsg 	ret = icl_get_qgv_points(dev_priv, &qi, is_y_tile);
4681bb76ff1Sjsg 	if (ret) {
4691bb76ff1Sjsg 		drm_dbg_kms(&dev_priv->drm,
4701bb76ff1Sjsg 			    "Failed to get memory subsystem information, ignoring bandwidth limits");
4711bb76ff1Sjsg 		return ret;
4721bb76ff1Sjsg 	}
4731bb76ff1Sjsg 
474*f005ef32Sjsg 	if (DISPLAY_VER(dev_priv) < 14 &&
475*f005ef32Sjsg 	    (dram_info->type == INTEL_DRAM_LPDDR4 || dram_info->type == INTEL_DRAM_LPDDR5))
4761bb76ff1Sjsg 		num_channels *= 2;
4771bb76ff1Sjsg 
4781bb76ff1Sjsg 	qi.deinterleave = qi.deinterleave ? : DIV_ROUND_UP(num_channels, is_y_tile ? 4 : 2);
4791bb76ff1Sjsg 
4801bb76ff1Sjsg 	if (num_channels < qi.max_numchannels && DISPLAY_VER(dev_priv) >= 12)
4811bb76ff1Sjsg 		qi.deinterleave = max(DIV_ROUND_UP(qi.deinterleave, 2), 1);
4821bb76ff1Sjsg 
4831bb76ff1Sjsg 	if (DISPLAY_VER(dev_priv) > 11 && num_channels > qi.max_numchannels)
4841bb76ff1Sjsg 		drm_warn(&dev_priv->drm, "Number of channels exceeds max number of channels.");
4851bb76ff1Sjsg 	if (qi.max_numchannels != 0)
4861bb76ff1Sjsg 		num_channels = min_t(u8, num_channels, qi.max_numchannels);
4871bb76ff1Sjsg 
4881bb76ff1Sjsg 	dclk_max = icl_sagv_max_dclk(&qi);
4891bb76ff1Sjsg 
4901bb76ff1Sjsg 	peakbw = num_channels * DIV_ROUND_UP(qi.channel_width, 8) * dclk_max;
4911bb76ff1Sjsg 	maxdebw = min(sa->deprogbwlimit * 1000, peakbw * 6 / 10); /* 60% */
4921bb76ff1Sjsg 
4931bb76ff1Sjsg 	ipqdepth = min(ipqdepthpch, sa->displayrtids / num_channels);
4941bb76ff1Sjsg 	/*
4951bb76ff1Sjsg 	 * clperchgroup = 4kpagespermempage * clperchperblock,
4961bb76ff1Sjsg 	 * clperchperblock = 8 / num_channels * interleave
4971bb76ff1Sjsg 	 */
4981bb76ff1Sjsg 	clperchgroup = 4 * DIV_ROUND_UP(8, num_channels) * qi.deinterleave;
4991bb76ff1Sjsg 
5001bb76ff1Sjsg 	for (i = 0; i < num_groups; i++) {
5011bb76ff1Sjsg 		struct intel_bw_info *bi = &dev_priv->display.bw.max[i];
5021bb76ff1Sjsg 		struct intel_bw_info *bi_next;
5031bb76ff1Sjsg 		int clpchgroup;
5041bb76ff1Sjsg 		int j;
5051bb76ff1Sjsg 
5061bb76ff1Sjsg 		clpchgroup = (sa->deburst * qi.deinterleave / num_channels) << i;
5071bb76ff1Sjsg 
5081bb76ff1Sjsg 		if (i < num_groups - 1) {
5091bb76ff1Sjsg 			bi_next = &dev_priv->display.bw.max[i + 1];
5101bb76ff1Sjsg 
5111bb76ff1Sjsg 			if (clpchgroup < clperchgroup)
5121bb76ff1Sjsg 				bi_next->num_planes = (ipqdepth - clpchgroup) /
5131bb76ff1Sjsg 						       clpchgroup + 1;
5141bb76ff1Sjsg 			else
5151bb76ff1Sjsg 				bi_next->num_planes = 0;
5161bb76ff1Sjsg 		}
5171bb76ff1Sjsg 
5181bb76ff1Sjsg 		bi->num_qgv_points = qi.num_points;
5191bb76ff1Sjsg 		bi->num_psf_gv_points = qi.num_psf_points;
5201bb76ff1Sjsg 
5211bb76ff1Sjsg 		for (j = 0; j < qi.num_points; j++) {
5221bb76ff1Sjsg 			const struct intel_qgv_point *sp = &qi.points[j];
5231bb76ff1Sjsg 			int ct, bw;
5241bb76ff1Sjsg 
5251bb76ff1Sjsg 			/*
5261bb76ff1Sjsg 			 * Max row cycle time
5271bb76ff1Sjsg 			 *
5281bb76ff1Sjsg 			 * FIXME what is the logic behind the
5291bb76ff1Sjsg 			 * assumed burst length?
5301bb76ff1Sjsg 			 */
5311bb76ff1Sjsg 			ct = max_t(int, sp->t_rc, sp->t_rp + sp->t_rcd +
5321bb76ff1Sjsg 				   (clpchgroup - 1) * qi.t_bl + sp->t_rdpre);
5331bb76ff1Sjsg 			bw = DIV_ROUND_UP(sp->dclk * clpchgroup * 32 * num_channels, ct);
534c349dbc7Sjsg 
535c349dbc7Sjsg 			bi->deratedbw[j] = min(maxdebw,
5365ca02815Sjsg 					       bw * (100 - sa->derating) / 100);
537*f005ef32Sjsg 			bi->peakbw[j] = DIV_ROUND_CLOSEST(sp->dclk *
538*f005ef32Sjsg 							  num_channels *
539*f005ef32Sjsg 							  qi.channel_width, 8);
540c349dbc7Sjsg 
541c349dbc7Sjsg 			drm_dbg_kms(&dev_priv->drm,
542*f005ef32Sjsg 				    "BW%d / QGV %d: num_planes=%d deratedbw=%u peakbw: %u\n",
543*f005ef32Sjsg 				    i, j, bi->num_planes, bi->deratedbw[j],
544*f005ef32Sjsg 				    bi->peakbw[j]);
545c349dbc7Sjsg 		}
546c349dbc7Sjsg 
5475ca02815Sjsg 		for (j = 0; j < qi.num_psf_points; j++) {
5485ca02815Sjsg 			const struct intel_psf_gv_point *sp = &qi.psf_points[j];
5495ca02815Sjsg 
5505ca02815Sjsg 			bi->psf_bw[j] = adl_calc_psf_bw(sp->clk);
5515ca02815Sjsg 
5525ca02815Sjsg 			drm_dbg_kms(&dev_priv->drm,
5535ca02815Sjsg 				    "BW%d / PSF GV %d: num_planes=%d bw=%u\n",
5545ca02815Sjsg 				    i, j, bi->num_planes, bi->psf_bw[j]);
5555ca02815Sjsg 		}
556c349dbc7Sjsg 	}
557c349dbc7Sjsg 
558ad8b1aafSjsg 	/*
559ad8b1aafSjsg 	 * In case if SAGV is disabled in BIOS, we always get 1
560ad8b1aafSjsg 	 * SAGV point, but we can't send PCode commands to restrict it
561ad8b1aafSjsg 	 * as it will fail and pointless anyway.
562ad8b1aafSjsg 	 */
563ad8b1aafSjsg 	if (qi.num_points == 1)
5641bb76ff1Sjsg 		dev_priv->display.sagv.status = I915_SAGV_NOT_CONTROLLED;
565ad8b1aafSjsg 	else
5661bb76ff1Sjsg 		dev_priv->display.sagv.status = I915_SAGV_ENABLED;
567ad8b1aafSjsg 
568c349dbc7Sjsg 	return 0;
569c349dbc7Sjsg }
570c349dbc7Sjsg 
dg2_get_bw_info(struct drm_i915_private * i915)5715ca02815Sjsg static void dg2_get_bw_info(struct drm_i915_private *i915)
5725ca02815Sjsg {
5731bb76ff1Sjsg 	unsigned int deratedbw = IS_DG2_G11(i915) ? 38000 : 50000;
5741bb76ff1Sjsg 	int num_groups = ARRAY_SIZE(i915->display.bw.max);
5751bb76ff1Sjsg 	int i;
5765ca02815Sjsg 
5775ca02815Sjsg 	/*
5785ca02815Sjsg 	 * DG2 doesn't have SAGV or QGV points, just a constant max bandwidth
5791bb76ff1Sjsg 	 * that doesn't depend on the number of planes enabled. So fill all the
5801bb76ff1Sjsg 	 * plane group with constant bw information for uniformity with other
5811bb76ff1Sjsg 	 * platforms. DG2-G10 platforms have a constant 50 GB/s bandwidth,
5821bb76ff1Sjsg 	 * whereas DG2-G11 platforms have 38 GB/s.
5835ca02815Sjsg 	 */
5841bb76ff1Sjsg 	for (i = 0; i < num_groups; i++) {
5851bb76ff1Sjsg 		struct intel_bw_info *bi = &i915->display.bw.max[i];
5865ca02815Sjsg 
5871bb76ff1Sjsg 		bi->num_planes = 1;
5881bb76ff1Sjsg 		/* Need only one dummy QGV point per group */
5891bb76ff1Sjsg 		bi->num_qgv_points = 1;
5901bb76ff1Sjsg 		bi->deratedbw[0] = deratedbw;
5911bb76ff1Sjsg 	}
5921bb76ff1Sjsg 
5931bb76ff1Sjsg 	i915->display.sagv.status = I915_SAGV_NOT_CONTROLLED;
5945ca02815Sjsg }
5955ca02815Sjsg 
icl_max_bw_index(struct drm_i915_private * dev_priv,int num_planes,int qgv_point)596*f005ef32Sjsg static unsigned int icl_max_bw_index(struct drm_i915_private *dev_priv,
597c349dbc7Sjsg 				     int num_planes, int qgv_point)
598c349dbc7Sjsg {
599c349dbc7Sjsg 	int i;
600c349dbc7Sjsg 
601ad8b1aafSjsg 	/*
602ad8b1aafSjsg 	 * Let's return max bw for 0 planes
603ad8b1aafSjsg 	 */
604ad8b1aafSjsg 	num_planes = max(1, num_planes);
605ad8b1aafSjsg 
6061bb76ff1Sjsg 	for (i = 0; i < ARRAY_SIZE(dev_priv->display.bw.max); i++) {
607c349dbc7Sjsg 		const struct intel_bw_info *bi =
6081bb76ff1Sjsg 			&dev_priv->display.bw.max[i];
609c349dbc7Sjsg 
610c349dbc7Sjsg 		/*
611c349dbc7Sjsg 		 * Pcode will not expose all QGV points when
612c349dbc7Sjsg 		 * SAGV is forced to off/min/med/max.
613c349dbc7Sjsg 		 */
614c349dbc7Sjsg 		if (qgv_point >= bi->num_qgv_points)
615c349dbc7Sjsg 			return UINT_MAX;
616c349dbc7Sjsg 
617c349dbc7Sjsg 		if (num_planes >= bi->num_planes)
618*f005ef32Sjsg 			return i;
619c349dbc7Sjsg 	}
620c349dbc7Sjsg 
621*f005ef32Sjsg 	return UINT_MAX;
622c349dbc7Sjsg }
623c349dbc7Sjsg 
tgl_max_bw_index(struct drm_i915_private * dev_priv,int num_planes,int qgv_point)624*f005ef32Sjsg static unsigned int tgl_max_bw_index(struct drm_i915_private *dev_priv,
6251bb76ff1Sjsg 				     int num_planes, int qgv_point)
6261bb76ff1Sjsg {
6271bb76ff1Sjsg 	int i;
6281bb76ff1Sjsg 
6291bb76ff1Sjsg 	/*
6301bb76ff1Sjsg 	 * Let's return max bw for 0 planes
6311bb76ff1Sjsg 	 */
6321bb76ff1Sjsg 	num_planes = max(1, num_planes);
6331bb76ff1Sjsg 
6341bb76ff1Sjsg 	for (i = ARRAY_SIZE(dev_priv->display.bw.max) - 1; i >= 0; i--) {
6351bb76ff1Sjsg 		const struct intel_bw_info *bi =
6361bb76ff1Sjsg 			&dev_priv->display.bw.max[i];
6371bb76ff1Sjsg 
6381bb76ff1Sjsg 		/*
6391bb76ff1Sjsg 		 * Pcode will not expose all QGV points when
6401bb76ff1Sjsg 		 * SAGV is forced to off/min/med/max.
6411bb76ff1Sjsg 		 */
6421bb76ff1Sjsg 		if (qgv_point >= bi->num_qgv_points)
6431bb76ff1Sjsg 			return UINT_MAX;
6441bb76ff1Sjsg 
6451bb76ff1Sjsg 		if (num_planes <= bi->num_planes)
646*f005ef32Sjsg 			return i;
6471bb76ff1Sjsg 	}
6481bb76ff1Sjsg 
649*f005ef32Sjsg 	return 0;
6501bb76ff1Sjsg }
6511bb76ff1Sjsg 
adl_psf_bw(struct drm_i915_private * dev_priv,int psf_gv_point)6525ca02815Sjsg static unsigned int adl_psf_bw(struct drm_i915_private *dev_priv,
6535ca02815Sjsg 			       int psf_gv_point)
6545ca02815Sjsg {
6555ca02815Sjsg 	const struct intel_bw_info *bi =
6561bb76ff1Sjsg 			&dev_priv->display.bw.max[0];
6575ca02815Sjsg 
6585ca02815Sjsg 	return bi->psf_bw[psf_gv_point];
6595ca02815Sjsg }
6605ca02815Sjsg 
intel_bw_init_hw(struct drm_i915_private * dev_priv)661c349dbc7Sjsg void intel_bw_init_hw(struct drm_i915_private *dev_priv)
662c349dbc7Sjsg {
663c349dbc7Sjsg 	if (!HAS_DISPLAY(dev_priv))
664c349dbc7Sjsg 		return;
665c349dbc7Sjsg 
6661bb76ff1Sjsg 	if (DISPLAY_VER(dev_priv) >= 14)
6671bb76ff1Sjsg 		tgl_get_bw_info(dev_priv, &mtl_sa_info);
6681bb76ff1Sjsg 	else if (IS_DG2(dev_priv))
6695ca02815Sjsg 		dg2_get_bw_info(dev_priv);
6705ca02815Sjsg 	else if (IS_ALDERLAKE_P(dev_priv))
6711bb76ff1Sjsg 		tgl_get_bw_info(dev_priv, &adlp_sa_info);
6725ca02815Sjsg 	else if (IS_ALDERLAKE_S(dev_priv))
6731bb76ff1Sjsg 		tgl_get_bw_info(dev_priv, &adls_sa_info);
6745ca02815Sjsg 	else if (IS_ROCKETLAKE(dev_priv))
6751bb76ff1Sjsg 		tgl_get_bw_info(dev_priv, &rkl_sa_info);
6765ca02815Sjsg 	else if (DISPLAY_VER(dev_priv) == 12)
6771bb76ff1Sjsg 		tgl_get_bw_info(dev_priv, &tgl_sa_info);
6785ca02815Sjsg 	else if (DISPLAY_VER(dev_priv) == 11)
679c349dbc7Sjsg 		icl_get_bw_info(dev_priv, &icl_sa_info);
680c349dbc7Sjsg }
681c349dbc7Sjsg 
intel_bw_crtc_num_active_planes(const struct intel_crtc_state * crtc_state)682c349dbc7Sjsg static unsigned int intel_bw_crtc_num_active_planes(const struct intel_crtc_state *crtc_state)
683c349dbc7Sjsg {
684c349dbc7Sjsg 	/*
685c349dbc7Sjsg 	 * We assume cursors are small enough
686c349dbc7Sjsg 	 * to not not cause bandwidth problems.
687c349dbc7Sjsg 	 */
688c349dbc7Sjsg 	return hweight8(crtc_state->active_planes & ~BIT(PLANE_CURSOR));
689c349dbc7Sjsg }
690c349dbc7Sjsg 
intel_bw_crtc_data_rate(const struct intel_crtc_state * crtc_state)691c349dbc7Sjsg static unsigned int intel_bw_crtc_data_rate(const struct intel_crtc_state *crtc_state)
692c349dbc7Sjsg {
693c349dbc7Sjsg 	struct intel_crtc *crtc = to_intel_crtc(crtc_state->uapi.crtc);
6941bb76ff1Sjsg 	struct drm_i915_private *i915 = to_i915(crtc->base.dev);
695c349dbc7Sjsg 	unsigned int data_rate = 0;
696c349dbc7Sjsg 	enum plane_id plane_id;
697c349dbc7Sjsg 
698c349dbc7Sjsg 	for_each_plane_id_on_crtc(crtc, plane_id) {
699c349dbc7Sjsg 		/*
700c349dbc7Sjsg 		 * We assume cursors are small enough
701c349dbc7Sjsg 		 * to not not cause bandwidth problems.
702c349dbc7Sjsg 		 */
703c349dbc7Sjsg 		if (plane_id == PLANE_CURSOR)
704c349dbc7Sjsg 			continue;
705c349dbc7Sjsg 
706c349dbc7Sjsg 		data_rate += crtc_state->data_rate[plane_id];
7071bb76ff1Sjsg 
7081bb76ff1Sjsg 		if (DISPLAY_VER(i915) < 11)
7091bb76ff1Sjsg 			data_rate += crtc_state->data_rate_y[plane_id];
710c349dbc7Sjsg 	}
711c349dbc7Sjsg 
712c349dbc7Sjsg 	return data_rate;
713c349dbc7Sjsg }
714c349dbc7Sjsg 
7151bb76ff1Sjsg /* "Maximum Pipe Read Bandwidth" */
intel_bw_crtc_min_cdclk(const struct intel_crtc_state * crtc_state)7161bb76ff1Sjsg static int intel_bw_crtc_min_cdclk(const struct intel_crtc_state *crtc_state)
7171bb76ff1Sjsg {
7181bb76ff1Sjsg 	struct intel_crtc *crtc = to_intel_crtc(crtc_state->uapi.crtc);
7191bb76ff1Sjsg 	struct drm_i915_private *i915 = to_i915(crtc->base.dev);
7201bb76ff1Sjsg 
7211bb76ff1Sjsg 	if (DISPLAY_VER(i915) < 12)
7221bb76ff1Sjsg 		return 0;
7231bb76ff1Sjsg 
7241bb76ff1Sjsg 	return DIV_ROUND_UP_ULL(mul_u32_u32(intel_bw_crtc_data_rate(crtc_state), 10), 512);
7251bb76ff1Sjsg }
7261bb76ff1Sjsg 
intel_bw_crtc_update(struct intel_bw_state * bw_state,const struct intel_crtc_state * crtc_state)727c349dbc7Sjsg void intel_bw_crtc_update(struct intel_bw_state *bw_state,
728c349dbc7Sjsg 			  const struct intel_crtc_state *crtc_state)
729c349dbc7Sjsg {
730c349dbc7Sjsg 	struct intel_crtc *crtc = to_intel_crtc(crtc_state->uapi.crtc);
731ad8b1aafSjsg 	struct drm_i915_private *i915 = to_i915(crtc->base.dev);
732c349dbc7Sjsg 
733c349dbc7Sjsg 	bw_state->data_rate[crtc->pipe] =
734c349dbc7Sjsg 		intel_bw_crtc_data_rate(crtc_state);
735c349dbc7Sjsg 	bw_state->num_active_planes[crtc->pipe] =
736c349dbc7Sjsg 		intel_bw_crtc_num_active_planes(crtc_state);
737c349dbc7Sjsg 
738ad8b1aafSjsg 	drm_dbg_kms(&i915->drm, "pipe %c data rate %u num active planes %u\n",
739c349dbc7Sjsg 		    pipe_name(crtc->pipe),
740c349dbc7Sjsg 		    bw_state->data_rate[crtc->pipe],
741c349dbc7Sjsg 		    bw_state->num_active_planes[crtc->pipe]);
742c349dbc7Sjsg }
743c349dbc7Sjsg 
intel_bw_num_active_planes(struct drm_i915_private * dev_priv,const struct intel_bw_state * bw_state)744c349dbc7Sjsg static unsigned int intel_bw_num_active_planes(struct drm_i915_private *dev_priv,
745c349dbc7Sjsg 					       const struct intel_bw_state *bw_state)
746c349dbc7Sjsg {
747c349dbc7Sjsg 	unsigned int num_active_planes = 0;
748c349dbc7Sjsg 	enum pipe pipe;
749c349dbc7Sjsg 
750c349dbc7Sjsg 	for_each_pipe(dev_priv, pipe)
751c349dbc7Sjsg 		num_active_planes += bw_state->num_active_planes[pipe];
752c349dbc7Sjsg 
753c349dbc7Sjsg 	return num_active_planes;
754c349dbc7Sjsg }
755c349dbc7Sjsg 
intel_bw_data_rate(struct drm_i915_private * dev_priv,const struct intel_bw_state * bw_state)756c349dbc7Sjsg static unsigned int intel_bw_data_rate(struct drm_i915_private *dev_priv,
757c349dbc7Sjsg 				       const struct intel_bw_state *bw_state)
758c349dbc7Sjsg {
759c349dbc7Sjsg 	unsigned int data_rate = 0;
760c349dbc7Sjsg 	enum pipe pipe;
761c349dbc7Sjsg 
762c349dbc7Sjsg 	for_each_pipe(dev_priv, pipe)
763c349dbc7Sjsg 		data_rate += bw_state->data_rate[pipe];
764c349dbc7Sjsg 
7651bb76ff1Sjsg 	if (DISPLAY_VER(dev_priv) >= 13 && i915_vtd_active(dev_priv))
7661bb76ff1Sjsg 		data_rate = DIV_ROUND_UP(data_rate * 105, 100);
7675ca02815Sjsg 
768c349dbc7Sjsg 	return data_rate;
769c349dbc7Sjsg }
770c349dbc7Sjsg 
771ad8b1aafSjsg struct intel_bw_state *
intel_atomic_get_old_bw_state(struct intel_atomic_state * state)772ad8b1aafSjsg intel_atomic_get_old_bw_state(struct intel_atomic_state *state)
773ad8b1aafSjsg {
774ad8b1aafSjsg 	struct drm_i915_private *dev_priv = to_i915(state->base.dev);
775ad8b1aafSjsg 	struct intel_global_state *bw_state;
776ad8b1aafSjsg 
7771bb76ff1Sjsg 	bw_state = intel_atomic_get_old_global_obj_state(state, &dev_priv->display.bw.obj);
778ad8b1aafSjsg 
779ad8b1aafSjsg 	return to_intel_bw_state(bw_state);
780ad8b1aafSjsg }
781ad8b1aafSjsg 
782ad8b1aafSjsg struct intel_bw_state *
intel_atomic_get_new_bw_state(struct intel_atomic_state * state)783ad8b1aafSjsg intel_atomic_get_new_bw_state(struct intel_atomic_state *state)
784ad8b1aafSjsg {
785ad8b1aafSjsg 	struct drm_i915_private *dev_priv = to_i915(state->base.dev);
786ad8b1aafSjsg 	struct intel_global_state *bw_state;
787ad8b1aafSjsg 
7881bb76ff1Sjsg 	bw_state = intel_atomic_get_new_global_obj_state(state, &dev_priv->display.bw.obj);
789ad8b1aafSjsg 
790ad8b1aafSjsg 	return to_intel_bw_state(bw_state);
791ad8b1aafSjsg }
792ad8b1aafSjsg 
793ad8b1aafSjsg struct intel_bw_state *
intel_atomic_get_bw_state(struct intel_atomic_state * state)794c349dbc7Sjsg intel_atomic_get_bw_state(struct intel_atomic_state *state)
795c349dbc7Sjsg {
796c349dbc7Sjsg 	struct drm_i915_private *dev_priv = to_i915(state->base.dev);
797c349dbc7Sjsg 	struct intel_global_state *bw_state;
798c349dbc7Sjsg 
7991bb76ff1Sjsg 	bw_state = intel_atomic_get_global_obj_state(state, &dev_priv->display.bw.obj);
800c349dbc7Sjsg 	if (IS_ERR(bw_state))
801c349dbc7Sjsg 		return ERR_CAST(bw_state);
802c349dbc7Sjsg 
803c349dbc7Sjsg 	return to_intel_bw_state(bw_state);
804c349dbc7Sjsg }
805c349dbc7Sjsg 
mtl_find_qgv_points(struct drm_i915_private * i915,unsigned int data_rate,unsigned int num_active_planes,struct intel_bw_state * new_bw_state)806*f005ef32Sjsg static int mtl_find_qgv_points(struct drm_i915_private *i915,
807*f005ef32Sjsg 			       unsigned int data_rate,
808*f005ef32Sjsg 			       unsigned int num_active_planes,
809*f005ef32Sjsg 			       struct intel_bw_state *new_bw_state)
810*f005ef32Sjsg {
811*f005ef32Sjsg 	unsigned int best_rate = UINT_MAX;
812*f005ef32Sjsg 	unsigned int num_qgv_points = i915->display.bw.max[0].num_qgv_points;
813*f005ef32Sjsg 	unsigned int qgv_peak_bw  = 0;
814*f005ef32Sjsg 	int i;
815*f005ef32Sjsg 	int ret;
816*f005ef32Sjsg 
817*f005ef32Sjsg 	ret = intel_atomic_lock_global_state(&new_bw_state->base);
818*f005ef32Sjsg 	if (ret)
819*f005ef32Sjsg 		return ret;
820*f005ef32Sjsg 
821*f005ef32Sjsg 	/*
822*f005ef32Sjsg 	 * If SAGV cannot be enabled, disable the pcode SAGV by passing all 1's
823*f005ef32Sjsg 	 * for qgv peak bw in PM Demand request. So assign UINT_MAX if SAGV is
824*f005ef32Sjsg 	 * not enabled. PM Demand code will clamp the value for the register
825*f005ef32Sjsg 	 */
826*f005ef32Sjsg 	if (!intel_can_enable_sagv(i915, new_bw_state)) {
827*f005ef32Sjsg 		new_bw_state->qgv_point_peakbw = U16_MAX;
828*f005ef32Sjsg 		drm_dbg_kms(&i915->drm, "No SAGV, use UINT_MAX as peak bw.");
829*f005ef32Sjsg 		return 0;
830*f005ef32Sjsg 	}
831*f005ef32Sjsg 
832*f005ef32Sjsg 	/*
833*f005ef32Sjsg 	 * Find the best QGV point by comparing the data_rate with max data rate
834*f005ef32Sjsg 	 * offered per plane group
835*f005ef32Sjsg 	 */
836*f005ef32Sjsg 	for (i = 0; i < num_qgv_points; i++) {
837*f005ef32Sjsg 		unsigned int bw_index =
838*f005ef32Sjsg 			tgl_max_bw_index(i915, num_active_planes, i);
839*f005ef32Sjsg 		unsigned int max_data_rate;
840*f005ef32Sjsg 
841*f005ef32Sjsg 		if (bw_index >= ARRAY_SIZE(i915->display.bw.max))
842*f005ef32Sjsg 			continue;
843*f005ef32Sjsg 
844*f005ef32Sjsg 		max_data_rate = i915->display.bw.max[bw_index].deratedbw[i];
845*f005ef32Sjsg 
846*f005ef32Sjsg 		if (max_data_rate < data_rate)
847*f005ef32Sjsg 			continue;
848*f005ef32Sjsg 
849*f005ef32Sjsg 		if (max_data_rate - data_rate < best_rate) {
850*f005ef32Sjsg 			best_rate = max_data_rate - data_rate;
851*f005ef32Sjsg 			qgv_peak_bw = i915->display.bw.max[bw_index].peakbw[i];
852*f005ef32Sjsg 		}
853*f005ef32Sjsg 
854*f005ef32Sjsg 		drm_dbg_kms(&i915->drm, "QGV point %d: max bw %d required %d qgv_peak_bw: %d\n",
855*f005ef32Sjsg 			    i, max_data_rate, data_rate, qgv_peak_bw);
856*f005ef32Sjsg 	}
857*f005ef32Sjsg 
858*f005ef32Sjsg 	drm_dbg_kms(&i915->drm, "Matching peaks QGV bw: %d for required data rate: %d\n",
859*f005ef32Sjsg 		    qgv_peak_bw, data_rate);
860*f005ef32Sjsg 
861*f005ef32Sjsg 	/*
862*f005ef32Sjsg 	 * The display configuration cannot be supported if no QGV point
863*f005ef32Sjsg 	 * satisfying the required data rate is found
864*f005ef32Sjsg 	 */
865*f005ef32Sjsg 	if (qgv_peak_bw == 0) {
866*f005ef32Sjsg 		drm_dbg_kms(&i915->drm, "No QGV points for bw %d for display configuration(%d active planes).\n",
867*f005ef32Sjsg 			    data_rate, num_active_planes);
868*f005ef32Sjsg 		return -EINVAL;
869*f005ef32Sjsg 	}
870*f005ef32Sjsg 
871*f005ef32Sjsg 	/* MTL PM DEMAND expects QGV BW parameter in multiples of 100 mbps */
872*f005ef32Sjsg 	new_bw_state->qgv_point_peakbw = DIV_ROUND_CLOSEST(qgv_peak_bw, 100);
873*f005ef32Sjsg 
874*f005ef32Sjsg 	return 0;
875*f005ef32Sjsg }
876*f005ef32Sjsg 
icl_find_qgv_points(struct drm_i915_private * i915,unsigned int data_rate,unsigned int num_active_planes,const struct intel_bw_state * old_bw_state,struct intel_bw_state * new_bw_state)877*f005ef32Sjsg static int icl_find_qgv_points(struct drm_i915_private *i915,
878*f005ef32Sjsg 			       unsigned int data_rate,
879*f005ef32Sjsg 			       unsigned int num_active_planes,
880*f005ef32Sjsg 			       const struct intel_bw_state *old_bw_state,
881*f005ef32Sjsg 			       struct intel_bw_state *new_bw_state)
882*f005ef32Sjsg {
883*f005ef32Sjsg 	unsigned int max_bw_point = 0;
884*f005ef32Sjsg 	unsigned int max_bw = 0;
885*f005ef32Sjsg 	unsigned int num_psf_gv_points = i915->display.bw.max[0].num_psf_gv_points;
886*f005ef32Sjsg 	unsigned int num_qgv_points = i915->display.bw.max[0].num_qgv_points;
887*f005ef32Sjsg 	u16 psf_points = 0;
888*f005ef32Sjsg 	u16 qgv_points = 0;
889*f005ef32Sjsg 	int i;
890*f005ef32Sjsg 	int ret;
891*f005ef32Sjsg 
892*f005ef32Sjsg 	ret = intel_atomic_lock_global_state(&new_bw_state->base);
893*f005ef32Sjsg 	if (ret)
894*f005ef32Sjsg 		return ret;
895*f005ef32Sjsg 
896*f005ef32Sjsg 	for (i = 0; i < num_qgv_points; i++) {
897*f005ef32Sjsg 		unsigned int idx;
898*f005ef32Sjsg 		unsigned int max_data_rate;
899*f005ef32Sjsg 
900*f005ef32Sjsg 		if (DISPLAY_VER(i915) > 11)
901*f005ef32Sjsg 			idx = tgl_max_bw_index(i915, num_active_planes, i);
902*f005ef32Sjsg 		else
903*f005ef32Sjsg 			idx = icl_max_bw_index(i915, num_active_planes, i);
904*f005ef32Sjsg 
905*f005ef32Sjsg 		if (idx >= ARRAY_SIZE(i915->display.bw.max))
906*f005ef32Sjsg 			continue;
907*f005ef32Sjsg 
908*f005ef32Sjsg 		max_data_rate = i915->display.bw.max[idx].deratedbw[i];
909*f005ef32Sjsg 
910*f005ef32Sjsg 		/*
911*f005ef32Sjsg 		 * We need to know which qgv point gives us
912*f005ef32Sjsg 		 * maximum bandwidth in order to disable SAGV
913*f005ef32Sjsg 		 * if we find that we exceed SAGV block time
914*f005ef32Sjsg 		 * with watermarks. By that moment we already
915*f005ef32Sjsg 		 * have those, as it is calculated earlier in
916*f005ef32Sjsg 		 * intel_atomic_check,
917*f005ef32Sjsg 		 */
918*f005ef32Sjsg 		if (max_data_rate > max_bw) {
919*f005ef32Sjsg 			max_bw_point = i;
920*f005ef32Sjsg 			max_bw = max_data_rate;
921*f005ef32Sjsg 		}
922*f005ef32Sjsg 		if (max_data_rate >= data_rate)
923*f005ef32Sjsg 			qgv_points |= BIT(i);
924*f005ef32Sjsg 
925*f005ef32Sjsg 		drm_dbg_kms(&i915->drm, "QGV point %d: max bw %d required %d\n",
926*f005ef32Sjsg 			    i, max_data_rate, data_rate);
927*f005ef32Sjsg 	}
928*f005ef32Sjsg 
929*f005ef32Sjsg 	for (i = 0; i < num_psf_gv_points; i++) {
930*f005ef32Sjsg 		unsigned int max_data_rate = adl_psf_bw(i915, i);
931*f005ef32Sjsg 
932*f005ef32Sjsg 		if (max_data_rate >= data_rate)
933*f005ef32Sjsg 			psf_points |= BIT(i);
934*f005ef32Sjsg 
935*f005ef32Sjsg 		drm_dbg_kms(&i915->drm, "PSF GV point %d: max bw %d"
936*f005ef32Sjsg 			    " required %d\n",
937*f005ef32Sjsg 			    i, max_data_rate, data_rate);
938*f005ef32Sjsg 	}
939*f005ef32Sjsg 
940*f005ef32Sjsg 	/*
941*f005ef32Sjsg 	 * BSpec states that we always should have at least one allowed point
942*f005ef32Sjsg 	 * left, so if we couldn't - simply reject the configuration for obvious
943*f005ef32Sjsg 	 * reasons.
944*f005ef32Sjsg 	 */
945*f005ef32Sjsg 	if (qgv_points == 0) {
946*f005ef32Sjsg 		drm_dbg_kms(&i915->drm, "No QGV points provide sufficient memory"
947*f005ef32Sjsg 			    " bandwidth %d for display configuration(%d active planes).\n",
948*f005ef32Sjsg 			    data_rate, num_active_planes);
949*f005ef32Sjsg 		return -EINVAL;
950*f005ef32Sjsg 	}
951*f005ef32Sjsg 
952*f005ef32Sjsg 	if (num_psf_gv_points > 0 && psf_points == 0) {
953*f005ef32Sjsg 		drm_dbg_kms(&i915->drm, "No PSF GV points provide sufficient memory"
954*f005ef32Sjsg 			    " bandwidth %d for display configuration(%d active planes).\n",
955*f005ef32Sjsg 			    data_rate, num_active_planes);
956*f005ef32Sjsg 		return -EINVAL;
957*f005ef32Sjsg 	}
958*f005ef32Sjsg 
959*f005ef32Sjsg 	/*
960*f005ef32Sjsg 	 * Leave only single point with highest bandwidth, if
961*f005ef32Sjsg 	 * we can't enable SAGV due to the increased memory latency it may
962*f005ef32Sjsg 	 * cause.
963*f005ef32Sjsg 	 */
964*f005ef32Sjsg 	if (!intel_can_enable_sagv(i915, new_bw_state)) {
965*f005ef32Sjsg 		qgv_points = BIT(max_bw_point);
966*f005ef32Sjsg 		drm_dbg_kms(&i915->drm, "No SAGV, using single QGV point %d\n",
967*f005ef32Sjsg 			    max_bw_point);
968*f005ef32Sjsg 	}
969*f005ef32Sjsg 
970*f005ef32Sjsg 	/*
971*f005ef32Sjsg 	 * We store the ones which need to be masked as that is what PCode
972*f005ef32Sjsg 	 * actually accepts as a parameter.
973*f005ef32Sjsg 	 */
974*f005ef32Sjsg 	new_bw_state->qgv_points_mask =
975*f005ef32Sjsg 		~(ICL_PCODE_REQ_QGV_PT(qgv_points) |
976*f005ef32Sjsg 		  ADLS_PCODE_REQ_PSF_PT(psf_points)) &
977*f005ef32Sjsg 		icl_qgv_points_mask(i915);
978*f005ef32Sjsg 
979*f005ef32Sjsg 	/*
980*f005ef32Sjsg 	 * If the actual mask had changed we need to make sure that
981*f005ef32Sjsg 	 * the commits are serialized(in case this is a nomodeset, nonblocking)
982*f005ef32Sjsg 	 */
983*f005ef32Sjsg 	if (new_bw_state->qgv_points_mask != old_bw_state->qgv_points_mask) {
984*f005ef32Sjsg 		ret = intel_atomic_serialize_global_state(&new_bw_state->base);
985*f005ef32Sjsg 		if (ret)
986*f005ef32Sjsg 			return ret;
987*f005ef32Sjsg 	}
988*f005ef32Sjsg 
989*f005ef32Sjsg 	return 0;
990*f005ef32Sjsg }
991*f005ef32Sjsg 
intel_bw_check_qgv_points(struct drm_i915_private * i915,const struct intel_bw_state * old_bw_state,struct intel_bw_state * new_bw_state)992*f005ef32Sjsg static int intel_bw_check_qgv_points(struct drm_i915_private *i915,
993*f005ef32Sjsg 				     const struct intel_bw_state *old_bw_state,
994*f005ef32Sjsg 				     struct intel_bw_state *new_bw_state)
995*f005ef32Sjsg {
996*f005ef32Sjsg 	unsigned int data_rate = intel_bw_data_rate(i915, new_bw_state);
997*f005ef32Sjsg 	unsigned int num_active_planes =
998*f005ef32Sjsg 			intel_bw_num_active_planes(i915, new_bw_state);
999*f005ef32Sjsg 
1000*f005ef32Sjsg 	data_rate = DIV_ROUND_UP(data_rate, 1000);
1001*f005ef32Sjsg 
1002*f005ef32Sjsg 	if (DISPLAY_VER(i915) >= 14)
1003*f005ef32Sjsg 		return mtl_find_qgv_points(i915, data_rate, num_active_planes,
1004*f005ef32Sjsg 					   new_bw_state);
1005*f005ef32Sjsg 	else
1006*f005ef32Sjsg 		return icl_find_qgv_points(i915, data_rate, num_active_planes,
1007*f005ef32Sjsg 					   old_bw_state, new_bw_state);
1008*f005ef32Sjsg }
1009*f005ef32Sjsg 
intel_bw_state_changed(struct drm_i915_private * i915,const struct intel_bw_state * old_bw_state,const struct intel_bw_state * new_bw_state)10101bb76ff1Sjsg static bool intel_bw_state_changed(struct drm_i915_private *i915,
10111bb76ff1Sjsg 				   const struct intel_bw_state *old_bw_state,
10121bb76ff1Sjsg 				   const struct intel_bw_state *new_bw_state)
1013ad8b1aafSjsg {
1014ad8b1aafSjsg 	enum pipe pipe;
1015ad8b1aafSjsg 
10161bb76ff1Sjsg 	for_each_pipe(i915, pipe) {
10171bb76ff1Sjsg 		const struct intel_dbuf_bw *old_crtc_bw =
10181bb76ff1Sjsg 			&old_bw_state->dbuf_bw[pipe];
10191bb76ff1Sjsg 		const struct intel_dbuf_bw *new_crtc_bw =
10201bb76ff1Sjsg 			&new_bw_state->dbuf_bw[pipe];
10211bb76ff1Sjsg 		enum dbuf_slice slice;
10221bb76ff1Sjsg 
10231bb76ff1Sjsg 		for_each_dbuf_slice(i915, slice) {
10241bb76ff1Sjsg 			if (old_crtc_bw->max_bw[slice] != new_crtc_bw->max_bw[slice] ||
10251bb76ff1Sjsg 			    old_crtc_bw->active_planes[slice] != new_crtc_bw->active_planes[slice])
10261bb76ff1Sjsg 				return true;
10271bb76ff1Sjsg 		}
10281bb76ff1Sjsg 
10291bb76ff1Sjsg 		if (old_bw_state->min_cdclk[pipe] != new_bw_state->min_cdclk[pipe])
10301bb76ff1Sjsg 			return true;
10311bb76ff1Sjsg 	}
10321bb76ff1Sjsg 
10331bb76ff1Sjsg 	return false;
10341bb76ff1Sjsg }
10351bb76ff1Sjsg 
skl_plane_calc_dbuf_bw(struct intel_bw_state * bw_state,struct intel_crtc * crtc,enum plane_id plane_id,const struct skl_ddb_entry * ddb,unsigned int data_rate)10361bb76ff1Sjsg static void skl_plane_calc_dbuf_bw(struct intel_bw_state *bw_state,
10371bb76ff1Sjsg 				   struct intel_crtc *crtc,
10381bb76ff1Sjsg 				   enum plane_id plane_id,
10391bb76ff1Sjsg 				   const struct skl_ddb_entry *ddb,
10401bb76ff1Sjsg 				   unsigned int data_rate)
10411bb76ff1Sjsg {
10421bb76ff1Sjsg 	struct drm_i915_private *i915 = to_i915(crtc->base.dev);
10431bb76ff1Sjsg 	struct intel_dbuf_bw *crtc_bw = &bw_state->dbuf_bw[crtc->pipe];
10441bb76ff1Sjsg 	unsigned int dbuf_mask = skl_ddb_dbuf_slice_mask(i915, ddb);
10451bb76ff1Sjsg 	enum dbuf_slice slice;
10461bb76ff1Sjsg 
10471bb76ff1Sjsg 	/*
10481bb76ff1Sjsg 	 * The arbiter can only really guarantee an
10491bb76ff1Sjsg 	 * equal share of the total bw to each plane.
10501bb76ff1Sjsg 	 */
10511bb76ff1Sjsg 	for_each_dbuf_slice_in_mask(i915, slice, dbuf_mask) {
10521bb76ff1Sjsg 		crtc_bw->max_bw[slice] = max(crtc_bw->max_bw[slice], data_rate);
10531bb76ff1Sjsg 		crtc_bw->active_planes[slice] |= BIT(plane_id);
10541bb76ff1Sjsg 	}
10551bb76ff1Sjsg }
10561bb76ff1Sjsg 
skl_crtc_calc_dbuf_bw(struct intel_bw_state * bw_state,const struct intel_crtc_state * crtc_state)10571bb76ff1Sjsg static void skl_crtc_calc_dbuf_bw(struct intel_bw_state *bw_state,
10581bb76ff1Sjsg 				  const struct intel_crtc_state *crtc_state)
10591bb76ff1Sjsg {
10601bb76ff1Sjsg 	struct intel_crtc *crtc = to_intel_crtc(crtc_state->uapi.crtc);
10611bb76ff1Sjsg 	struct drm_i915_private *i915 = to_i915(crtc->base.dev);
10621bb76ff1Sjsg 	struct intel_dbuf_bw *crtc_bw = &bw_state->dbuf_bw[crtc->pipe];
1063ad8b1aafSjsg 	enum plane_id plane_id;
1064ad8b1aafSjsg 
10651bb76ff1Sjsg 	memset(crtc_bw, 0, sizeof(*crtc_bw));
1066ad8b1aafSjsg 
1067ad8b1aafSjsg 	if (!crtc_state->hw.active)
10681bb76ff1Sjsg 		return;
1069ad8b1aafSjsg 
1070ad8b1aafSjsg 	for_each_plane_id_on_crtc(crtc, plane_id) {
10711bb76ff1Sjsg 		/*
10721bb76ff1Sjsg 		 * We assume cursors are small enough
10731bb76ff1Sjsg 		 * to not cause bandwidth problems.
10741bb76ff1Sjsg 		 */
10751bb76ff1Sjsg 		if (plane_id == PLANE_CURSOR)
10761bb76ff1Sjsg 			continue;
10771bb76ff1Sjsg 
10781bb76ff1Sjsg 		skl_plane_calc_dbuf_bw(bw_state, crtc, plane_id,
10791bb76ff1Sjsg 				       &crtc_state->wm.skl.plane_ddb[plane_id],
10801bb76ff1Sjsg 				       crtc_state->data_rate[plane_id]);
10811bb76ff1Sjsg 
10821bb76ff1Sjsg 		if (DISPLAY_VER(i915) < 11)
10831bb76ff1Sjsg 			skl_plane_calc_dbuf_bw(bw_state, crtc, plane_id,
10841bb76ff1Sjsg 					       &crtc_state->wm.skl.plane_ddb_y[plane_id],
10851bb76ff1Sjsg 					       crtc_state->data_rate[plane_id]);
10861bb76ff1Sjsg 	}
10871bb76ff1Sjsg }
10881bb76ff1Sjsg 
10891bb76ff1Sjsg /* "Maximum Data Buffer Bandwidth" */
10901bb76ff1Sjsg static int
intel_bw_dbuf_min_cdclk(struct drm_i915_private * i915,const struct intel_bw_state * bw_state)10911bb76ff1Sjsg intel_bw_dbuf_min_cdclk(struct drm_i915_private *i915,
10921bb76ff1Sjsg 			const struct intel_bw_state *bw_state)
10931bb76ff1Sjsg {
10941bb76ff1Sjsg 	unsigned int total_max_bw = 0;
10955ca02815Sjsg 	enum dbuf_slice slice;
1096ad8b1aafSjsg 
10971bb76ff1Sjsg 	for_each_dbuf_slice(i915, slice) {
10981bb76ff1Sjsg 		int num_active_planes = 0;
10991bb76ff1Sjsg 		unsigned int max_bw = 0;
11001bb76ff1Sjsg 		enum pipe pipe;
1101ad8b1aafSjsg 
1102ad8b1aafSjsg 		/*
11031bb76ff1Sjsg 		 * The arbiter can only really guarantee an
11041bb76ff1Sjsg 		 * equal share of the total bw to each plane.
1105ad8b1aafSjsg 		 */
11061bb76ff1Sjsg 		for_each_pipe(i915, pipe) {
11071bb76ff1Sjsg 			const struct intel_dbuf_bw *crtc_bw = &bw_state->dbuf_bw[pipe];
11081bb76ff1Sjsg 
11091bb76ff1Sjsg 			max_bw = max(crtc_bw->max_bw[slice], max_bw);
11101bb76ff1Sjsg 			num_active_planes += hweight8(crtc_bw->active_planes[slice]);
1111ad8b1aafSjsg 		}
11121bb76ff1Sjsg 		max_bw *= num_active_planes;
11131bb76ff1Sjsg 
11141bb76ff1Sjsg 		total_max_bw = max(total_max_bw, max_bw);
1115ad8b1aafSjsg 	}
1116ad8b1aafSjsg 
11171bb76ff1Sjsg 	return DIV_ROUND_UP(total_max_bw, 64);
1118ad8b1aafSjsg }
1119ad8b1aafSjsg 
intel_bw_min_cdclk(struct drm_i915_private * i915,const struct intel_bw_state * bw_state)11201bb76ff1Sjsg int intel_bw_min_cdclk(struct drm_i915_private *i915,
11211bb76ff1Sjsg 		       const struct intel_bw_state *bw_state)
11221bb76ff1Sjsg {
11231bb76ff1Sjsg 	enum pipe pipe;
11241bb76ff1Sjsg 	int min_cdclk;
1125ad8b1aafSjsg 
11261bb76ff1Sjsg 	min_cdclk = intel_bw_dbuf_min_cdclk(i915, bw_state);
1127ad8b1aafSjsg 
11281bb76ff1Sjsg 	for_each_pipe(i915, pipe)
11291bb76ff1Sjsg 		min_cdclk = max(bw_state->min_cdclk[pipe], min_cdclk);
11301bb76ff1Sjsg 
11311bb76ff1Sjsg 	return min_cdclk;
1132ad8b1aafSjsg }
1133ad8b1aafSjsg 
intel_bw_calc_min_cdclk(struct intel_atomic_state * state,bool * need_cdclk_calc)11341bb76ff1Sjsg int intel_bw_calc_min_cdclk(struct intel_atomic_state *state,
11351bb76ff1Sjsg 			    bool *need_cdclk_calc)
1136ad8b1aafSjsg {
1137ad8b1aafSjsg 	struct drm_i915_private *dev_priv = to_i915(state->base.dev);
1138ad8b1aafSjsg 	struct intel_bw_state *new_bw_state = NULL;
11391bb76ff1Sjsg 	const struct intel_bw_state *old_bw_state = NULL;
11401bb76ff1Sjsg 	const struct intel_cdclk_state *cdclk_state;
1141ad8b1aafSjsg 	const struct intel_crtc_state *crtc_state;
11421bb76ff1Sjsg 	int old_min_cdclk, new_min_cdclk;
1143ad8b1aafSjsg 	struct intel_crtc *crtc;
1144ad8b1aafSjsg 	int i;
1145ad8b1aafSjsg 
11461bb76ff1Sjsg 	if (DISPLAY_VER(dev_priv) < 9)
11471bb76ff1Sjsg 		return 0;
11481bb76ff1Sjsg 
1149ad8b1aafSjsg 	for_each_new_intel_crtc_in_state(state, crtc, crtc_state, i) {
1150ad8b1aafSjsg 		new_bw_state = intel_atomic_get_bw_state(state);
1151ad8b1aafSjsg 		if (IS_ERR(new_bw_state))
1152ad8b1aafSjsg 			return PTR_ERR(new_bw_state);
1153ad8b1aafSjsg 
1154ad8b1aafSjsg 		old_bw_state = intel_atomic_get_old_bw_state(state);
11551bb76ff1Sjsg 
11561bb76ff1Sjsg 		skl_crtc_calc_dbuf_bw(new_bw_state, crtc_state);
11571bb76ff1Sjsg 
11581bb76ff1Sjsg 		new_bw_state->min_cdclk[crtc->pipe] =
11591bb76ff1Sjsg 			intel_bw_crtc_min_cdclk(crtc_state);
1160ad8b1aafSjsg 	}
1161ad8b1aafSjsg 
1162ad8b1aafSjsg 	if (!old_bw_state)
1163ad8b1aafSjsg 		return 0;
1164ad8b1aafSjsg 
11651bb76ff1Sjsg 	if (intel_bw_state_changed(dev_priv, old_bw_state, new_bw_state)) {
1166ad8b1aafSjsg 		int ret = intel_atomic_lock_global_state(&new_bw_state->base);
1167ad8b1aafSjsg 		if (ret)
1168ad8b1aafSjsg 			return ret;
1169ad8b1aafSjsg 	}
1170ad8b1aafSjsg 
11711bb76ff1Sjsg 	old_min_cdclk = intel_bw_min_cdclk(dev_priv, old_bw_state);
11721bb76ff1Sjsg 	new_min_cdclk = intel_bw_min_cdclk(dev_priv, new_bw_state);
11731bb76ff1Sjsg 
11741bb76ff1Sjsg 	/*
11751bb76ff1Sjsg 	 * No need to check against the cdclk state if
11761bb76ff1Sjsg 	 * the min cdclk doesn't increase.
11771bb76ff1Sjsg 	 *
11781bb76ff1Sjsg 	 * Ie. we only ever increase the cdclk due to bandwidth
11791bb76ff1Sjsg 	 * requirements. This can reduce back and forth
11801bb76ff1Sjsg 	 * display blinking due to constant cdclk changes.
11811bb76ff1Sjsg 	 */
11821bb76ff1Sjsg 	if (new_min_cdclk <= old_min_cdclk)
11831bb76ff1Sjsg 		return 0;
11841bb76ff1Sjsg 
11851bb76ff1Sjsg 	cdclk_state = intel_atomic_get_cdclk_state(state);
11861bb76ff1Sjsg 	if (IS_ERR(cdclk_state))
11871bb76ff1Sjsg 		return PTR_ERR(cdclk_state);
11881bb76ff1Sjsg 
11891bb76ff1Sjsg 	/*
11901bb76ff1Sjsg 	 * No need to recalculate the cdclk state if
11911bb76ff1Sjsg 	 * the min cdclk doesn't increase.
11921bb76ff1Sjsg 	 *
11931bb76ff1Sjsg 	 * Ie. we only ever increase the cdclk due to bandwidth
11941bb76ff1Sjsg 	 * requirements. This can reduce back and forth
11951bb76ff1Sjsg 	 * display blinking due to constant cdclk changes.
11961bb76ff1Sjsg 	 */
11971bb76ff1Sjsg 	if (new_min_cdclk <= cdclk_state->bw_min_cdclk)
11981bb76ff1Sjsg 		return 0;
11991bb76ff1Sjsg 
12001bb76ff1Sjsg 	drm_dbg_kms(&dev_priv->drm,
12011bb76ff1Sjsg 		    "new bandwidth min cdclk (%d kHz) > old min cdclk (%d kHz)\n",
12021bb76ff1Sjsg 		    new_min_cdclk, cdclk_state->bw_min_cdclk);
12031bb76ff1Sjsg 	*need_cdclk_calc = true;
12041bb76ff1Sjsg 
1205ad8b1aafSjsg 	return 0;
1206ad8b1aafSjsg }
1207ad8b1aafSjsg 
intel_bw_check_data_rate(struct intel_atomic_state * state,bool * changed)12081bb76ff1Sjsg static int intel_bw_check_data_rate(struct intel_atomic_state *state, bool *changed)
12091bb76ff1Sjsg {
12101bb76ff1Sjsg 	struct drm_i915_private *i915 = to_i915(state->base.dev);
12111bb76ff1Sjsg 	const struct intel_crtc_state *new_crtc_state, *old_crtc_state;
12121bb76ff1Sjsg 	struct intel_crtc *crtc;
12131bb76ff1Sjsg 	int i;
12145ca02815Sjsg 
1215c349dbc7Sjsg 	for_each_oldnew_intel_crtc_in_state(state, crtc, old_crtc_state,
1216c349dbc7Sjsg 					    new_crtc_state, i) {
1217c349dbc7Sjsg 		unsigned int old_data_rate =
1218c349dbc7Sjsg 			intel_bw_crtc_data_rate(old_crtc_state);
1219c349dbc7Sjsg 		unsigned int new_data_rate =
1220c349dbc7Sjsg 			intel_bw_crtc_data_rate(new_crtc_state);
1221c349dbc7Sjsg 		unsigned int old_active_planes =
1222c349dbc7Sjsg 			intel_bw_crtc_num_active_planes(old_crtc_state);
1223c349dbc7Sjsg 		unsigned int new_active_planes =
1224c349dbc7Sjsg 			intel_bw_crtc_num_active_planes(new_crtc_state);
12251bb76ff1Sjsg 		struct intel_bw_state *new_bw_state;
1226c349dbc7Sjsg 
1227c349dbc7Sjsg 		/*
1228c349dbc7Sjsg 		 * Avoid locking the bw state when
1229c349dbc7Sjsg 		 * nothing significant has changed.
1230c349dbc7Sjsg 		 */
1231c349dbc7Sjsg 		if (old_data_rate == new_data_rate &&
1232c349dbc7Sjsg 		    old_active_planes == new_active_planes)
1233c349dbc7Sjsg 			continue;
1234c349dbc7Sjsg 
1235ad8b1aafSjsg 		new_bw_state = intel_atomic_get_bw_state(state);
1236ad8b1aafSjsg 		if (IS_ERR(new_bw_state))
1237ad8b1aafSjsg 			return PTR_ERR(new_bw_state);
1238c349dbc7Sjsg 
1239ad8b1aafSjsg 		new_bw_state->data_rate[crtc->pipe] = new_data_rate;
1240ad8b1aafSjsg 		new_bw_state->num_active_planes[crtc->pipe] = new_active_planes;
1241c349dbc7Sjsg 
12421bb76ff1Sjsg 		*changed = true;
1243679bd941Sjsg 
12441bb76ff1Sjsg 		drm_dbg_kms(&i915->drm,
12451bb76ff1Sjsg 			    "[CRTC:%d:%s] data rate %u num active planes %u\n",
12461bb76ff1Sjsg 			    crtc->base.base.id, crtc->base.name,
1247ad8b1aafSjsg 			    new_bw_state->data_rate[crtc->pipe],
1248ad8b1aafSjsg 			    new_bw_state->num_active_planes[crtc->pipe]);
1249c349dbc7Sjsg 	}
1250c349dbc7Sjsg 
12511bb76ff1Sjsg 	return 0;
12521bb76ff1Sjsg }
12531bb76ff1Sjsg 
intel_bw_atomic_check(struct intel_atomic_state * state)12541bb76ff1Sjsg int intel_bw_atomic_check(struct intel_atomic_state *state)
12551bb76ff1Sjsg {
12561bb76ff1Sjsg 	bool changed = false;
1257*f005ef32Sjsg 	struct drm_i915_private *i915 = to_i915(state->base.dev);
1258*f005ef32Sjsg 	struct intel_bw_state *new_bw_state;
1259*f005ef32Sjsg 	const struct intel_bw_state *old_bw_state;
1260*f005ef32Sjsg 	int ret;
12611bb76ff1Sjsg 
12621bb76ff1Sjsg 	/* FIXME earlier gens need some checks too */
1263*f005ef32Sjsg 	if (DISPLAY_VER(i915) < 11)
12641bb76ff1Sjsg 		return 0;
12651bb76ff1Sjsg 
12661bb76ff1Sjsg 	ret = intel_bw_check_data_rate(state, &changed);
12671bb76ff1Sjsg 	if (ret)
12681bb76ff1Sjsg 		return ret;
12691bb76ff1Sjsg 
1270679bd941Sjsg 	old_bw_state = intel_atomic_get_old_bw_state(state);
1271679bd941Sjsg 	new_bw_state = intel_atomic_get_new_bw_state(state);
1272679bd941Sjsg 
1273679bd941Sjsg 	if (new_bw_state &&
1274*f005ef32Sjsg 	    intel_can_enable_sagv(i915, old_bw_state) !=
1275*f005ef32Sjsg 	    intel_can_enable_sagv(i915, new_bw_state))
1276679bd941Sjsg 		changed = true;
1277679bd941Sjsg 
1278679bd941Sjsg 	/*
1279679bd941Sjsg 	 * If none of our inputs (data rates, number of active
1280679bd941Sjsg 	 * planes, SAGV yes/no) changed then nothing to do here.
1281679bd941Sjsg 	 */
1282679bd941Sjsg 	if (!changed)
1283c349dbc7Sjsg 		return 0;
1284c349dbc7Sjsg 
1285*f005ef32Sjsg 	ret = intel_bw_check_qgv_points(i915, old_bw_state, new_bw_state);
1286c349dbc7Sjsg 	if (ret)
1287c349dbc7Sjsg 		return ret;
1288c349dbc7Sjsg 
1289c349dbc7Sjsg 	return 0;
1290c349dbc7Sjsg }
1291c349dbc7Sjsg 
1292c349dbc7Sjsg static struct intel_global_state *
intel_bw_duplicate_state(struct intel_global_obj * obj)1293c349dbc7Sjsg intel_bw_duplicate_state(struct intel_global_obj *obj)
1294c349dbc7Sjsg {
1295c349dbc7Sjsg 	struct intel_bw_state *state;
1296c349dbc7Sjsg 
1297c349dbc7Sjsg 	state = kmemdup(obj->state, sizeof(*state), GFP_KERNEL);
1298c349dbc7Sjsg 	if (!state)
1299c349dbc7Sjsg 		return NULL;
1300c349dbc7Sjsg 
1301c349dbc7Sjsg 	return &state->base;
1302c349dbc7Sjsg }
1303c349dbc7Sjsg 
intel_bw_destroy_state(struct intel_global_obj * obj,struct intel_global_state * state)1304c349dbc7Sjsg static void intel_bw_destroy_state(struct intel_global_obj *obj,
1305c349dbc7Sjsg 				   struct intel_global_state *state)
1306c349dbc7Sjsg {
1307c349dbc7Sjsg 	kfree(state);
1308c349dbc7Sjsg }
1309c349dbc7Sjsg 
1310c349dbc7Sjsg static const struct intel_global_state_funcs intel_bw_funcs = {
1311c349dbc7Sjsg 	.atomic_duplicate_state = intel_bw_duplicate_state,
1312c349dbc7Sjsg 	.atomic_destroy_state = intel_bw_destroy_state,
1313c349dbc7Sjsg };
1314c349dbc7Sjsg 
intel_bw_init(struct drm_i915_private * dev_priv)1315c349dbc7Sjsg int intel_bw_init(struct drm_i915_private *dev_priv)
1316c349dbc7Sjsg {
1317c349dbc7Sjsg 	struct intel_bw_state *state;
1318c349dbc7Sjsg 
1319c349dbc7Sjsg 	state = kzalloc(sizeof(*state), GFP_KERNEL);
1320c349dbc7Sjsg 	if (!state)
1321c349dbc7Sjsg 		return -ENOMEM;
1322c349dbc7Sjsg 
13231bb76ff1Sjsg 	intel_atomic_global_obj_init(dev_priv, &dev_priv->display.bw.obj,
1324c349dbc7Sjsg 				     &state->base, &intel_bw_funcs);
1325c349dbc7Sjsg 
1326c349dbc7Sjsg 	return 0;
1327c349dbc7Sjsg }
1328