1c349dbc7Sjsg // SPDX-License-Identifier: MIT
2c349dbc7Sjsg /*
3c349dbc7Sjsg * Copyright © 2019 Intel Corporation
4c349dbc7Sjsg */
5c349dbc7Sjsg
6c349dbc7Sjsg #include <drm/drm_atomic_state_helper.h>
7c349dbc7Sjsg
81bb76ff1Sjsg #include "i915_drv.h"
91bb76ff1Sjsg #include "i915_reg.h"
101bb76ff1Sjsg #include "i915_utils.h"
11ad8b1aafSjsg #include "intel_atomic.h"
12c349dbc7Sjsg #include "intel_bw.h"
13ad8b1aafSjsg #include "intel_cdclk.h"
141bb76ff1Sjsg #include "intel_display_core.h"
15c349dbc7Sjsg #include "intel_display_types.h"
161bb76ff1Sjsg #include "skl_watermark.h"
171bb76ff1Sjsg #include "intel_mchbar_regs.h"
181bb76ff1Sjsg #include "intel_pcode.h"
19c349dbc7Sjsg
20c349dbc7Sjsg /* Parameters for Qclk Geyserville (QGV) */
21c349dbc7Sjsg struct intel_qgv_point {
22c349dbc7Sjsg u16 dclk, t_rp, t_rdpre, t_rc, t_ras, t_rcd;
23c349dbc7Sjsg };
24c349dbc7Sjsg
255ca02815Sjsg struct intel_psf_gv_point {
265ca02815Sjsg u8 clk; /* clock in multiples of 16.6666 MHz */
27c349dbc7Sjsg };
28c349dbc7Sjsg
295ca02815Sjsg struct intel_qgv_info {
305ca02815Sjsg struct intel_qgv_point points[I915_NUM_QGV_POINTS];
315ca02815Sjsg struct intel_psf_gv_point psf_points[I915_NUM_PSF_GV_POINTS];
325ca02815Sjsg u8 num_points;
335ca02815Sjsg u8 num_psf_points;
345ca02815Sjsg u8 t_bl;
351bb76ff1Sjsg u8 max_numchannels;
361bb76ff1Sjsg u8 channel_width;
371bb76ff1Sjsg u8 deinterleave;
385ca02815Sjsg };
395ca02815Sjsg
dg1_mchbar_read_qgv_point_info(struct drm_i915_private * dev_priv,struct intel_qgv_point * sp,int point)405ca02815Sjsg static int dg1_mchbar_read_qgv_point_info(struct drm_i915_private *dev_priv,
415ca02815Sjsg struct intel_qgv_point *sp,
425ca02815Sjsg int point)
43c349dbc7Sjsg {
445ca02815Sjsg u32 dclk_ratio, dclk_reference;
455ca02815Sjsg u32 val;
46c349dbc7Sjsg
475ca02815Sjsg val = intel_uncore_read(&dev_priv->uncore, SA_PERF_STATUS_0_0_0_MCHBAR_PC);
485ca02815Sjsg dclk_ratio = REG_FIELD_GET(DG1_QCLK_RATIO_MASK, val);
495ca02815Sjsg if (val & DG1_QCLK_REFERENCE)
505ca02815Sjsg dclk_reference = 6; /* 6 * 16.666 MHz = 100 MHz */
515ca02815Sjsg else
525ca02815Sjsg dclk_reference = 8; /* 8 * 16.666 MHz = 133 MHz */
531bb76ff1Sjsg sp->dclk = DIV_ROUND_UP((16667 * dclk_ratio * dclk_reference) + 500, 1000);
54c349dbc7Sjsg
555ca02815Sjsg val = intel_uncore_read(&dev_priv->uncore, SKL_MC_BIOS_DATA_0_0_0_MCHBAR_PCU);
565ca02815Sjsg if (val & DG1_GEAR_TYPE)
575ca02815Sjsg sp->dclk *= 2;
58c349dbc7Sjsg
595ca02815Sjsg if (sp->dclk == 0)
605ca02815Sjsg return -EINVAL;
61c349dbc7Sjsg
625ca02815Sjsg val = intel_uncore_read(&dev_priv->uncore, MCHBAR_CH0_CR_TC_PRE_0_0_0_MCHBAR);
635ca02815Sjsg sp->t_rp = REG_FIELD_GET(DG1_DRAM_T_RP_MASK, val);
645ca02815Sjsg sp->t_rdpre = REG_FIELD_GET(DG1_DRAM_T_RDPRE_MASK, val);
655ca02815Sjsg
665ca02815Sjsg val = intel_uncore_read(&dev_priv->uncore, MCHBAR_CH0_CR_TC_PRE_0_0_0_MCHBAR_HIGH);
675ca02815Sjsg sp->t_rcd = REG_FIELD_GET(DG1_DRAM_T_RCD_MASK, val);
685ca02815Sjsg sp->t_ras = REG_FIELD_GET(DG1_DRAM_T_RAS_MASK, val);
695ca02815Sjsg
705ca02815Sjsg sp->t_rc = sp->t_rp + sp->t_ras;
71c349dbc7Sjsg
72c349dbc7Sjsg return 0;
73c349dbc7Sjsg }
74c349dbc7Sjsg
icl_pcode_read_qgv_point_info(struct drm_i915_private * dev_priv,struct intel_qgv_point * sp,int point)75c349dbc7Sjsg static int icl_pcode_read_qgv_point_info(struct drm_i915_private *dev_priv,
76c349dbc7Sjsg struct intel_qgv_point *sp,
77c349dbc7Sjsg int point)
78c349dbc7Sjsg {
79c349dbc7Sjsg u32 val = 0, val2 = 0;
801bb76ff1Sjsg u16 dclk;
81c349dbc7Sjsg int ret;
82c349dbc7Sjsg
831bb76ff1Sjsg ret = snb_pcode_read(&dev_priv->uncore, ICL_PCODE_MEM_SUBSYSYSTEM_INFO |
84c349dbc7Sjsg ICL_PCODE_MEM_SS_READ_QGV_POINT_INFO(point),
85c349dbc7Sjsg &val, &val2);
86c349dbc7Sjsg if (ret)
87c349dbc7Sjsg return ret;
88c349dbc7Sjsg
891bb76ff1Sjsg dclk = val & 0xffff;
901bb76ff1Sjsg sp->dclk = DIV_ROUND_UP((16667 * dclk) + (DISPLAY_VER(dev_priv) > 11 ? 500 : 0), 1000);
91c349dbc7Sjsg sp->t_rp = (val & 0xff0000) >> 16;
92c349dbc7Sjsg sp->t_rcd = (val & 0xff000000) >> 24;
93c349dbc7Sjsg
94c349dbc7Sjsg sp->t_rdpre = val2 & 0xff;
95c349dbc7Sjsg sp->t_ras = (val2 & 0xff00) >> 8;
96c349dbc7Sjsg
97c349dbc7Sjsg sp->t_rc = sp->t_rp + sp->t_ras;
98c349dbc7Sjsg
99c349dbc7Sjsg return 0;
100c349dbc7Sjsg }
101c349dbc7Sjsg
adls_pcode_read_psf_gv_point_info(struct drm_i915_private * dev_priv,struct intel_psf_gv_point * points)1025ca02815Sjsg static int adls_pcode_read_psf_gv_point_info(struct drm_i915_private *dev_priv,
1035ca02815Sjsg struct intel_psf_gv_point *points)
1045ca02815Sjsg {
1055ca02815Sjsg u32 val = 0;
1065ca02815Sjsg int ret;
1075ca02815Sjsg int i;
1085ca02815Sjsg
1091bb76ff1Sjsg ret = snb_pcode_read(&dev_priv->uncore, ICL_PCODE_MEM_SUBSYSYSTEM_INFO |
1101bb76ff1Sjsg ADL_PCODE_MEM_SS_READ_PSF_GV_INFO, &val, NULL);
1115ca02815Sjsg if (ret)
1125ca02815Sjsg return ret;
1135ca02815Sjsg
1145ca02815Sjsg for (i = 0; i < I915_NUM_PSF_GV_POINTS; i++) {
1155ca02815Sjsg points[i].clk = val & 0xff;
1165ca02815Sjsg val >>= 8;
1175ca02815Sjsg }
1185ca02815Sjsg
1195ca02815Sjsg return 0;
1205ca02815Sjsg }
1215ca02815Sjsg
icl_qgv_points_mask(struct drm_i915_private * i915)122*f005ef32Sjsg static u16 icl_qgv_points_mask(struct drm_i915_private *i915)
123*f005ef32Sjsg {
124*f005ef32Sjsg unsigned int num_psf_gv_points = i915->display.bw.max[0].num_psf_gv_points;
125*f005ef32Sjsg unsigned int num_qgv_points = i915->display.bw.max[0].num_qgv_points;
126*f005ef32Sjsg u16 qgv_points = 0, psf_points = 0;
127*f005ef32Sjsg
128*f005ef32Sjsg /*
129*f005ef32Sjsg * We can _not_ use the whole ADLS_QGV_PT_MASK here, as PCode rejects
130*f005ef32Sjsg * it with failure if we try masking any unadvertised points.
131*f005ef32Sjsg * So need to operate only with those returned from PCode.
132*f005ef32Sjsg */
133*f005ef32Sjsg if (num_qgv_points > 0)
134*f005ef32Sjsg qgv_points = GENMASK(num_qgv_points - 1, 0);
135*f005ef32Sjsg
136*f005ef32Sjsg if (num_psf_gv_points > 0)
137*f005ef32Sjsg psf_points = GENMASK(num_psf_gv_points - 1, 0);
138*f005ef32Sjsg
139*f005ef32Sjsg return ICL_PCODE_REQ_QGV_PT(qgv_points) | ADLS_PCODE_REQ_PSF_PT(psf_points);
140*f005ef32Sjsg }
141*f005ef32Sjsg
is_sagv_enabled(struct drm_i915_private * i915,u16 points_mask)142*f005ef32Sjsg static bool is_sagv_enabled(struct drm_i915_private *i915, u16 points_mask)
143*f005ef32Sjsg {
144*f005ef32Sjsg return !is_power_of_2(~points_mask & icl_qgv_points_mask(i915) &
145*f005ef32Sjsg ICL_PCODE_REQ_QGV_PT_MASK);
146*f005ef32Sjsg }
147*f005ef32Sjsg
icl_pcode_restrict_qgv_points(struct drm_i915_private * dev_priv,u32 points_mask)148ad8b1aafSjsg int icl_pcode_restrict_qgv_points(struct drm_i915_private *dev_priv,
149ad8b1aafSjsg u32 points_mask)
150ad8b1aafSjsg {
151ad8b1aafSjsg int ret;
152ad8b1aafSjsg
153*f005ef32Sjsg if (DISPLAY_VER(dev_priv) >= 14)
154*f005ef32Sjsg return 0;
155*f005ef32Sjsg
156ad8b1aafSjsg /* bspec says to keep retrying for at least 1 ms */
1571bb76ff1Sjsg ret = skl_pcode_request(&dev_priv->uncore, ICL_PCODE_SAGV_DE_MEM_SS_CONFIG,
158ad8b1aafSjsg points_mask,
1591bb76ff1Sjsg ICL_PCODE_REP_QGV_MASK | ADLS_PCODE_REP_PSF_MASK,
1601bb76ff1Sjsg ICL_PCODE_REP_QGV_SAFE | ADLS_PCODE_REP_PSF_SAFE,
161ad8b1aafSjsg 1);
162ad8b1aafSjsg
163ad8b1aafSjsg if (ret < 0) {
1645ca02815Sjsg drm_err(&dev_priv->drm, "Failed to disable qgv points (%d) points: 0x%x\n", ret, points_mask);
165ad8b1aafSjsg return ret;
166ad8b1aafSjsg }
167ad8b1aafSjsg
168*f005ef32Sjsg dev_priv->display.sagv.status = is_sagv_enabled(dev_priv, points_mask) ?
169*f005ef32Sjsg I915_SAGV_ENABLED : I915_SAGV_DISABLED;
170*f005ef32Sjsg
171ad8b1aafSjsg return 0;
172ad8b1aafSjsg }
173ad8b1aafSjsg
mtl_read_qgv_point_info(struct drm_i915_private * dev_priv,struct intel_qgv_point * sp,int point)1741bb76ff1Sjsg static int mtl_read_qgv_point_info(struct drm_i915_private *dev_priv,
1751bb76ff1Sjsg struct intel_qgv_point *sp, int point)
1761bb76ff1Sjsg {
1771bb76ff1Sjsg u32 val, val2;
1781bb76ff1Sjsg u16 dclk;
1791bb76ff1Sjsg
1801bb76ff1Sjsg val = intel_uncore_read(&dev_priv->uncore,
1811bb76ff1Sjsg MTL_MEM_SS_INFO_QGV_POINT_LOW(point));
1821bb76ff1Sjsg val2 = intel_uncore_read(&dev_priv->uncore,
1831bb76ff1Sjsg MTL_MEM_SS_INFO_QGV_POINT_HIGH(point));
1841bb76ff1Sjsg dclk = REG_FIELD_GET(MTL_DCLK_MASK, val);
185*f005ef32Sjsg sp->dclk = DIV_ROUND_CLOSEST(16667 * dclk, 1000);
1861bb76ff1Sjsg sp->t_rp = REG_FIELD_GET(MTL_TRP_MASK, val);
1871bb76ff1Sjsg sp->t_rcd = REG_FIELD_GET(MTL_TRCD_MASK, val);
1881bb76ff1Sjsg
1891bb76ff1Sjsg sp->t_rdpre = REG_FIELD_GET(MTL_TRDPRE_MASK, val2);
1901bb76ff1Sjsg sp->t_ras = REG_FIELD_GET(MTL_TRAS_MASK, val2);
1911bb76ff1Sjsg
1921bb76ff1Sjsg sp->t_rc = sp->t_rp + sp->t_ras;
1931bb76ff1Sjsg
1941bb76ff1Sjsg return 0;
1951bb76ff1Sjsg }
1961bb76ff1Sjsg
1971bb76ff1Sjsg static int
intel_read_qgv_point_info(struct drm_i915_private * dev_priv,struct intel_qgv_point * sp,int point)1981bb76ff1Sjsg intel_read_qgv_point_info(struct drm_i915_private *dev_priv,
1991bb76ff1Sjsg struct intel_qgv_point *sp,
2001bb76ff1Sjsg int point)
2011bb76ff1Sjsg {
2021bb76ff1Sjsg if (DISPLAY_VER(dev_priv) >= 14)
2031bb76ff1Sjsg return mtl_read_qgv_point_info(dev_priv, sp, point);
2041bb76ff1Sjsg else if (IS_DG1(dev_priv))
2051bb76ff1Sjsg return dg1_mchbar_read_qgv_point_info(dev_priv, sp, point);
2061bb76ff1Sjsg else
2071bb76ff1Sjsg return icl_pcode_read_qgv_point_info(dev_priv, sp, point);
2081bb76ff1Sjsg }
2091bb76ff1Sjsg
icl_get_qgv_points(struct drm_i915_private * dev_priv,struct intel_qgv_info * qi,bool is_y_tile)210c349dbc7Sjsg static int icl_get_qgv_points(struct drm_i915_private *dev_priv,
2111bb76ff1Sjsg struct intel_qgv_info *qi,
2121bb76ff1Sjsg bool is_y_tile)
213c349dbc7Sjsg {
2145ca02815Sjsg const struct dram_info *dram_info = &dev_priv->dram_info;
215c349dbc7Sjsg int i, ret;
216c349dbc7Sjsg
2175ca02815Sjsg qi->num_points = dram_info->num_qgv_points;
2185ca02815Sjsg qi->num_psf_points = dram_info->num_psf_gv_points;
2195ca02815Sjsg
2201bb76ff1Sjsg if (DISPLAY_VER(dev_priv) >= 14) {
2215ca02815Sjsg switch (dram_info->type) {
2225ca02815Sjsg case INTEL_DRAM_DDR4:
2235ca02815Sjsg qi->t_bl = 4;
2241bb76ff1Sjsg qi->max_numchannels = 2;
2251bb76ff1Sjsg qi->channel_width = 64;
2261bb76ff1Sjsg qi->deinterleave = 2;
2275ca02815Sjsg break;
2285ca02815Sjsg case INTEL_DRAM_DDR5:
2295ca02815Sjsg qi->t_bl = 8;
2301bb76ff1Sjsg qi->max_numchannels = 4;
2311bb76ff1Sjsg qi->channel_width = 32;
2321bb76ff1Sjsg qi->deinterleave = 2;
2331bb76ff1Sjsg break;
2341bb76ff1Sjsg case INTEL_DRAM_LPDDR4:
2351bb76ff1Sjsg case INTEL_DRAM_LPDDR5:
2361bb76ff1Sjsg qi->t_bl = 16;
2371bb76ff1Sjsg qi->max_numchannels = 8;
2381bb76ff1Sjsg qi->channel_width = 16;
2391bb76ff1Sjsg qi->deinterleave = 4;
2401bb76ff1Sjsg break;
2411bb76ff1Sjsg default:
2421bb76ff1Sjsg MISSING_CASE(dram_info->type);
2431bb76ff1Sjsg return -EINVAL;
2441bb76ff1Sjsg }
2451bb76ff1Sjsg } else if (DISPLAY_VER(dev_priv) >= 12) {
2461bb76ff1Sjsg switch (dram_info->type) {
2471bb76ff1Sjsg case INTEL_DRAM_DDR4:
2481bb76ff1Sjsg qi->t_bl = is_y_tile ? 8 : 4;
2491bb76ff1Sjsg qi->max_numchannels = 2;
2501bb76ff1Sjsg qi->channel_width = 64;
2511bb76ff1Sjsg qi->deinterleave = is_y_tile ? 1 : 2;
2521bb76ff1Sjsg break;
2531bb76ff1Sjsg case INTEL_DRAM_DDR5:
2541bb76ff1Sjsg qi->t_bl = is_y_tile ? 16 : 8;
2551bb76ff1Sjsg qi->max_numchannels = 4;
2561bb76ff1Sjsg qi->channel_width = 32;
2571bb76ff1Sjsg qi->deinterleave = is_y_tile ? 1 : 2;
2581bb76ff1Sjsg break;
2591bb76ff1Sjsg case INTEL_DRAM_LPDDR4:
2601bb76ff1Sjsg if (IS_ROCKETLAKE(dev_priv)) {
2611bb76ff1Sjsg qi->t_bl = 8;
2621bb76ff1Sjsg qi->max_numchannels = 4;
2631bb76ff1Sjsg qi->channel_width = 32;
2641bb76ff1Sjsg qi->deinterleave = 2;
2651bb76ff1Sjsg break;
2661bb76ff1Sjsg }
2671bb76ff1Sjsg fallthrough;
2681bb76ff1Sjsg case INTEL_DRAM_LPDDR5:
2691bb76ff1Sjsg qi->t_bl = 16;
2701bb76ff1Sjsg qi->max_numchannels = 8;
2711bb76ff1Sjsg qi->channel_width = 16;
2721bb76ff1Sjsg qi->deinterleave = is_y_tile ? 2 : 4;
2735ca02815Sjsg break;
2745ca02815Sjsg default:
2755ca02815Sjsg qi->t_bl = 16;
2761bb76ff1Sjsg qi->max_numchannels = 1;
2775ca02815Sjsg break;
2785ca02815Sjsg }
2791bb76ff1Sjsg } else if (DISPLAY_VER(dev_priv) == 11) {
2805ca02815Sjsg qi->t_bl = dev_priv->dram_info.type == INTEL_DRAM_DDR4 ? 4 : 8;
2811bb76ff1Sjsg qi->max_numchannels = 1;
2821bb76ff1Sjsg }
283c349dbc7Sjsg
284c349dbc7Sjsg if (drm_WARN_ON(&dev_priv->drm,
285c349dbc7Sjsg qi->num_points > ARRAY_SIZE(qi->points)))
286c349dbc7Sjsg qi->num_points = ARRAY_SIZE(qi->points);
287c349dbc7Sjsg
288c349dbc7Sjsg for (i = 0; i < qi->num_points; i++) {
289c349dbc7Sjsg struct intel_qgv_point *sp = &qi->points[i];
290c349dbc7Sjsg
2911bb76ff1Sjsg ret = intel_read_qgv_point_info(dev_priv, sp, i);
292c349dbc7Sjsg if (ret)
293c349dbc7Sjsg return ret;
294c349dbc7Sjsg
295c349dbc7Sjsg drm_dbg_kms(&dev_priv->drm,
296c349dbc7Sjsg "QGV %d: DCLK=%d tRP=%d tRDPRE=%d tRAS=%d tRCD=%d tRC=%d\n",
297c349dbc7Sjsg i, sp->dclk, sp->t_rp, sp->t_rdpre, sp->t_ras,
298c349dbc7Sjsg sp->t_rcd, sp->t_rc);
299c349dbc7Sjsg }
300c349dbc7Sjsg
3015ca02815Sjsg if (qi->num_psf_points > 0) {
3025ca02815Sjsg ret = adls_pcode_read_psf_gv_point_info(dev_priv, qi->psf_points);
3035ca02815Sjsg if (ret) {
3045ca02815Sjsg drm_err(&dev_priv->drm, "Failed to read PSF point data; PSF points will not be considered in bandwidth calculations.\n");
3055ca02815Sjsg qi->num_psf_points = 0;
3065ca02815Sjsg }
3075ca02815Sjsg
3085ca02815Sjsg for (i = 0; i < qi->num_psf_points; i++)
3095ca02815Sjsg drm_dbg_kms(&dev_priv->drm,
3105ca02815Sjsg "PSF GV %d: CLK=%d \n",
3115ca02815Sjsg i, qi->psf_points[i].clk);
3125ca02815Sjsg }
3135ca02815Sjsg
314c349dbc7Sjsg return 0;
315c349dbc7Sjsg }
316c349dbc7Sjsg
adl_calc_psf_bw(int clk)3175ca02815Sjsg static int adl_calc_psf_bw(int clk)
3185ca02815Sjsg {
3195ca02815Sjsg /*
3205ca02815Sjsg * clk is multiples of 16.666MHz (100/6)
3215ca02815Sjsg * According to BSpec PSF GV bandwidth is
3225ca02815Sjsg * calculated as BW = 64 * clk * 16.666Mhz
3235ca02815Sjsg */
3245ca02815Sjsg return DIV_ROUND_CLOSEST(64 * clk * 100, 6);
3255ca02815Sjsg }
3265ca02815Sjsg
icl_sagv_max_dclk(const struct intel_qgv_info * qi)327c349dbc7Sjsg static int icl_sagv_max_dclk(const struct intel_qgv_info *qi)
328c349dbc7Sjsg {
329c349dbc7Sjsg u16 dclk = 0;
330c349dbc7Sjsg int i;
331c349dbc7Sjsg
332c349dbc7Sjsg for (i = 0; i < qi->num_points; i++)
333c349dbc7Sjsg dclk = max(dclk, qi->points[i].dclk);
334c349dbc7Sjsg
335c349dbc7Sjsg return dclk;
336c349dbc7Sjsg }
337c349dbc7Sjsg
338c349dbc7Sjsg struct intel_sa_info {
339c349dbc7Sjsg u16 displayrtids;
3405ca02815Sjsg u8 deburst, deprogbwlimit, derating;
341c349dbc7Sjsg };
342c349dbc7Sjsg
343c349dbc7Sjsg static const struct intel_sa_info icl_sa_info = {
344c349dbc7Sjsg .deburst = 8,
345c349dbc7Sjsg .deprogbwlimit = 25, /* GB/s */
346c349dbc7Sjsg .displayrtids = 128,
3475ca02815Sjsg .derating = 10,
348c349dbc7Sjsg };
349c349dbc7Sjsg
350c349dbc7Sjsg static const struct intel_sa_info tgl_sa_info = {
351c349dbc7Sjsg .deburst = 16,
352c349dbc7Sjsg .deprogbwlimit = 34, /* GB/s */
353c349dbc7Sjsg .displayrtids = 256,
3545ca02815Sjsg .derating = 10,
355c349dbc7Sjsg };
356c349dbc7Sjsg
357ad8b1aafSjsg static const struct intel_sa_info rkl_sa_info = {
3581bb76ff1Sjsg .deburst = 8,
359ad8b1aafSjsg .deprogbwlimit = 20, /* GB/s */
360ad8b1aafSjsg .displayrtids = 128,
3615ca02815Sjsg .derating = 10,
3625ca02815Sjsg };
3635ca02815Sjsg
3645ca02815Sjsg static const struct intel_sa_info adls_sa_info = {
3655ca02815Sjsg .deburst = 16,
3665ca02815Sjsg .deprogbwlimit = 38, /* GB/s */
3675ca02815Sjsg .displayrtids = 256,
3685ca02815Sjsg .derating = 10,
3695ca02815Sjsg };
3705ca02815Sjsg
3715ca02815Sjsg static const struct intel_sa_info adlp_sa_info = {
3725ca02815Sjsg .deburst = 16,
3735ca02815Sjsg .deprogbwlimit = 38, /* GB/s */
3745ca02815Sjsg .displayrtids = 256,
3755ca02815Sjsg .derating = 20,
376ad8b1aafSjsg };
377ad8b1aafSjsg
3781bb76ff1Sjsg static const struct intel_sa_info mtl_sa_info = {
3791bb76ff1Sjsg .deburst = 32,
3801bb76ff1Sjsg .deprogbwlimit = 38, /* GB/s */
3811bb76ff1Sjsg .displayrtids = 256,
382*f005ef32Sjsg .derating = 10,
3831bb76ff1Sjsg };
3841bb76ff1Sjsg
icl_get_bw_info(struct drm_i915_private * dev_priv,const struct intel_sa_info * sa)385c349dbc7Sjsg static int icl_get_bw_info(struct drm_i915_private *dev_priv, const struct intel_sa_info *sa)
386c349dbc7Sjsg {
387c349dbc7Sjsg struct intel_qgv_info qi = {};
388c349dbc7Sjsg bool is_y_tile = true; /* assume y tile may be used */
3895ca02815Sjsg int num_channels = max_t(u8, 1, dev_priv->dram_info.num_channels);
3901bb76ff1Sjsg int ipqdepth, ipqdepthpch = 16;
391c349dbc7Sjsg int dclk_max;
392c349dbc7Sjsg int maxdebw;
3931bb76ff1Sjsg int num_groups = ARRAY_SIZE(dev_priv->display.bw.max);
394c349dbc7Sjsg int i, ret;
395c349dbc7Sjsg
3961bb76ff1Sjsg ret = icl_get_qgv_points(dev_priv, &qi, is_y_tile);
397c349dbc7Sjsg if (ret) {
398c349dbc7Sjsg drm_dbg_kms(&dev_priv->drm,
399c349dbc7Sjsg "Failed to get memory subsystem information, ignoring bandwidth limits");
400c349dbc7Sjsg return ret;
401c349dbc7Sjsg }
402c349dbc7Sjsg
403c349dbc7Sjsg dclk_max = icl_sagv_max_dclk(&qi);
4041bb76ff1Sjsg maxdebw = min(sa->deprogbwlimit * 1000, dclk_max * 16 * 6 / 10);
405c349dbc7Sjsg ipqdepth = min(ipqdepthpch, sa->displayrtids / num_channels);
4061bb76ff1Sjsg qi.deinterleave = DIV_ROUND_UP(num_channels, is_y_tile ? 4 : 2);
407c349dbc7Sjsg
4081bb76ff1Sjsg for (i = 0; i < num_groups; i++) {
4091bb76ff1Sjsg struct intel_bw_info *bi = &dev_priv->display.bw.max[i];
410c349dbc7Sjsg int clpchgroup;
411c349dbc7Sjsg int j;
412c349dbc7Sjsg
4131bb76ff1Sjsg clpchgroup = (sa->deburst * qi.deinterleave / num_channels) << i;
414c349dbc7Sjsg bi->num_planes = (ipqdepth - clpchgroup) / clpchgroup + 1;
415c349dbc7Sjsg
416c349dbc7Sjsg bi->num_qgv_points = qi.num_points;
4175ca02815Sjsg bi->num_psf_gv_points = qi.num_psf_points;
418c349dbc7Sjsg
419c349dbc7Sjsg for (j = 0; j < qi.num_points; j++) {
420c349dbc7Sjsg const struct intel_qgv_point *sp = &qi.points[j];
421c349dbc7Sjsg int ct, bw;
422c349dbc7Sjsg
423c349dbc7Sjsg /*
424c349dbc7Sjsg * Max row cycle time
425c349dbc7Sjsg *
426c349dbc7Sjsg * FIXME what is the logic behind the
427c349dbc7Sjsg * assumed burst length?
428c349dbc7Sjsg */
429c349dbc7Sjsg ct = max_t(int, sp->t_rc, sp->t_rp + sp->t_rcd +
430c349dbc7Sjsg (clpchgroup - 1) * qi.t_bl + sp->t_rdpre);
4311bb76ff1Sjsg bw = DIV_ROUND_UP(sp->dclk * clpchgroup * 32 * num_channels, ct);
4321bb76ff1Sjsg
4331bb76ff1Sjsg bi->deratedbw[j] = min(maxdebw,
4341bb76ff1Sjsg bw * (100 - sa->derating) / 100);
4351bb76ff1Sjsg
4361bb76ff1Sjsg drm_dbg_kms(&dev_priv->drm,
4371bb76ff1Sjsg "BW%d / QGV %d: num_planes=%d deratedbw=%u\n",
4381bb76ff1Sjsg i, j, bi->num_planes, bi->deratedbw[j]);
4391bb76ff1Sjsg }
4401bb76ff1Sjsg }
4411bb76ff1Sjsg /*
4421bb76ff1Sjsg * In case if SAGV is disabled in BIOS, we always get 1
4431bb76ff1Sjsg * SAGV point, but we can't send PCode commands to restrict it
4441bb76ff1Sjsg * as it will fail and pointless anyway.
4451bb76ff1Sjsg */
4461bb76ff1Sjsg if (qi.num_points == 1)
4471bb76ff1Sjsg dev_priv->display.sagv.status = I915_SAGV_NOT_CONTROLLED;
4481bb76ff1Sjsg else
4491bb76ff1Sjsg dev_priv->display.sagv.status = I915_SAGV_ENABLED;
4501bb76ff1Sjsg
4511bb76ff1Sjsg return 0;
4521bb76ff1Sjsg }
4531bb76ff1Sjsg
tgl_get_bw_info(struct drm_i915_private * dev_priv,const struct intel_sa_info * sa)4541bb76ff1Sjsg static int tgl_get_bw_info(struct drm_i915_private *dev_priv, const struct intel_sa_info *sa)
4551bb76ff1Sjsg {
4561bb76ff1Sjsg struct intel_qgv_info qi = {};
4571bb76ff1Sjsg const struct dram_info *dram_info = &dev_priv->dram_info;
4581bb76ff1Sjsg bool is_y_tile = true; /* assume y tile may be used */
4591bb76ff1Sjsg int num_channels = max_t(u8, 1, dev_priv->dram_info.num_channels);
4601bb76ff1Sjsg int ipqdepth, ipqdepthpch = 16;
4611bb76ff1Sjsg int dclk_max;
4621bb76ff1Sjsg int maxdebw, peakbw;
4631bb76ff1Sjsg int clperchgroup;
4641bb76ff1Sjsg int num_groups = ARRAY_SIZE(dev_priv->display.bw.max);
4651bb76ff1Sjsg int i, ret;
4661bb76ff1Sjsg
4671bb76ff1Sjsg ret = icl_get_qgv_points(dev_priv, &qi, is_y_tile);
4681bb76ff1Sjsg if (ret) {
4691bb76ff1Sjsg drm_dbg_kms(&dev_priv->drm,
4701bb76ff1Sjsg "Failed to get memory subsystem information, ignoring bandwidth limits");
4711bb76ff1Sjsg return ret;
4721bb76ff1Sjsg }
4731bb76ff1Sjsg
474*f005ef32Sjsg if (DISPLAY_VER(dev_priv) < 14 &&
475*f005ef32Sjsg (dram_info->type == INTEL_DRAM_LPDDR4 || dram_info->type == INTEL_DRAM_LPDDR5))
4761bb76ff1Sjsg num_channels *= 2;
4771bb76ff1Sjsg
4781bb76ff1Sjsg qi.deinterleave = qi.deinterleave ? : DIV_ROUND_UP(num_channels, is_y_tile ? 4 : 2);
4791bb76ff1Sjsg
4801bb76ff1Sjsg if (num_channels < qi.max_numchannels && DISPLAY_VER(dev_priv) >= 12)
4811bb76ff1Sjsg qi.deinterleave = max(DIV_ROUND_UP(qi.deinterleave, 2), 1);
4821bb76ff1Sjsg
4831bb76ff1Sjsg if (DISPLAY_VER(dev_priv) > 11 && num_channels > qi.max_numchannels)
4841bb76ff1Sjsg drm_warn(&dev_priv->drm, "Number of channels exceeds max number of channels.");
4851bb76ff1Sjsg if (qi.max_numchannels != 0)
4861bb76ff1Sjsg num_channels = min_t(u8, num_channels, qi.max_numchannels);
4871bb76ff1Sjsg
4881bb76ff1Sjsg dclk_max = icl_sagv_max_dclk(&qi);
4891bb76ff1Sjsg
4901bb76ff1Sjsg peakbw = num_channels * DIV_ROUND_UP(qi.channel_width, 8) * dclk_max;
4911bb76ff1Sjsg maxdebw = min(sa->deprogbwlimit * 1000, peakbw * 6 / 10); /* 60% */
4921bb76ff1Sjsg
4931bb76ff1Sjsg ipqdepth = min(ipqdepthpch, sa->displayrtids / num_channels);
4941bb76ff1Sjsg /*
4951bb76ff1Sjsg * clperchgroup = 4kpagespermempage * clperchperblock,
4961bb76ff1Sjsg * clperchperblock = 8 / num_channels * interleave
4971bb76ff1Sjsg */
4981bb76ff1Sjsg clperchgroup = 4 * DIV_ROUND_UP(8, num_channels) * qi.deinterleave;
4991bb76ff1Sjsg
5001bb76ff1Sjsg for (i = 0; i < num_groups; i++) {
5011bb76ff1Sjsg struct intel_bw_info *bi = &dev_priv->display.bw.max[i];
5021bb76ff1Sjsg struct intel_bw_info *bi_next;
5031bb76ff1Sjsg int clpchgroup;
5041bb76ff1Sjsg int j;
5051bb76ff1Sjsg
5061bb76ff1Sjsg clpchgroup = (sa->deburst * qi.deinterleave / num_channels) << i;
5071bb76ff1Sjsg
5081bb76ff1Sjsg if (i < num_groups - 1) {
5091bb76ff1Sjsg bi_next = &dev_priv->display.bw.max[i + 1];
5101bb76ff1Sjsg
5111bb76ff1Sjsg if (clpchgroup < clperchgroup)
5121bb76ff1Sjsg bi_next->num_planes = (ipqdepth - clpchgroup) /
5131bb76ff1Sjsg clpchgroup + 1;
5141bb76ff1Sjsg else
5151bb76ff1Sjsg bi_next->num_planes = 0;
5161bb76ff1Sjsg }
5171bb76ff1Sjsg
5181bb76ff1Sjsg bi->num_qgv_points = qi.num_points;
5191bb76ff1Sjsg bi->num_psf_gv_points = qi.num_psf_points;
5201bb76ff1Sjsg
5211bb76ff1Sjsg for (j = 0; j < qi.num_points; j++) {
5221bb76ff1Sjsg const struct intel_qgv_point *sp = &qi.points[j];
5231bb76ff1Sjsg int ct, bw;
5241bb76ff1Sjsg
5251bb76ff1Sjsg /*
5261bb76ff1Sjsg * Max row cycle time
5271bb76ff1Sjsg *
5281bb76ff1Sjsg * FIXME what is the logic behind the
5291bb76ff1Sjsg * assumed burst length?
5301bb76ff1Sjsg */
5311bb76ff1Sjsg ct = max_t(int, sp->t_rc, sp->t_rp + sp->t_rcd +
5321bb76ff1Sjsg (clpchgroup - 1) * qi.t_bl + sp->t_rdpre);
5331bb76ff1Sjsg bw = DIV_ROUND_UP(sp->dclk * clpchgroup * 32 * num_channels, ct);
534c349dbc7Sjsg
535c349dbc7Sjsg bi->deratedbw[j] = min(maxdebw,
5365ca02815Sjsg bw * (100 - sa->derating) / 100);
537*f005ef32Sjsg bi->peakbw[j] = DIV_ROUND_CLOSEST(sp->dclk *
538*f005ef32Sjsg num_channels *
539*f005ef32Sjsg qi.channel_width, 8);
540c349dbc7Sjsg
541c349dbc7Sjsg drm_dbg_kms(&dev_priv->drm,
542*f005ef32Sjsg "BW%d / QGV %d: num_planes=%d deratedbw=%u peakbw: %u\n",
543*f005ef32Sjsg i, j, bi->num_planes, bi->deratedbw[j],
544*f005ef32Sjsg bi->peakbw[j]);
545c349dbc7Sjsg }
546c349dbc7Sjsg
5475ca02815Sjsg for (j = 0; j < qi.num_psf_points; j++) {
5485ca02815Sjsg const struct intel_psf_gv_point *sp = &qi.psf_points[j];
5495ca02815Sjsg
5505ca02815Sjsg bi->psf_bw[j] = adl_calc_psf_bw(sp->clk);
5515ca02815Sjsg
5525ca02815Sjsg drm_dbg_kms(&dev_priv->drm,
5535ca02815Sjsg "BW%d / PSF GV %d: num_planes=%d bw=%u\n",
5545ca02815Sjsg i, j, bi->num_planes, bi->psf_bw[j]);
5555ca02815Sjsg }
556c349dbc7Sjsg }
557c349dbc7Sjsg
558ad8b1aafSjsg /*
559ad8b1aafSjsg * In case if SAGV is disabled in BIOS, we always get 1
560ad8b1aafSjsg * SAGV point, but we can't send PCode commands to restrict it
561ad8b1aafSjsg * as it will fail and pointless anyway.
562ad8b1aafSjsg */
563ad8b1aafSjsg if (qi.num_points == 1)
5641bb76ff1Sjsg dev_priv->display.sagv.status = I915_SAGV_NOT_CONTROLLED;
565ad8b1aafSjsg else
5661bb76ff1Sjsg dev_priv->display.sagv.status = I915_SAGV_ENABLED;
567ad8b1aafSjsg
568c349dbc7Sjsg return 0;
569c349dbc7Sjsg }
570c349dbc7Sjsg
dg2_get_bw_info(struct drm_i915_private * i915)5715ca02815Sjsg static void dg2_get_bw_info(struct drm_i915_private *i915)
5725ca02815Sjsg {
5731bb76ff1Sjsg unsigned int deratedbw = IS_DG2_G11(i915) ? 38000 : 50000;
5741bb76ff1Sjsg int num_groups = ARRAY_SIZE(i915->display.bw.max);
5751bb76ff1Sjsg int i;
5765ca02815Sjsg
5775ca02815Sjsg /*
5785ca02815Sjsg * DG2 doesn't have SAGV or QGV points, just a constant max bandwidth
5791bb76ff1Sjsg * that doesn't depend on the number of planes enabled. So fill all the
5801bb76ff1Sjsg * plane group with constant bw information for uniformity with other
5811bb76ff1Sjsg * platforms. DG2-G10 platforms have a constant 50 GB/s bandwidth,
5821bb76ff1Sjsg * whereas DG2-G11 platforms have 38 GB/s.
5835ca02815Sjsg */
5841bb76ff1Sjsg for (i = 0; i < num_groups; i++) {
5851bb76ff1Sjsg struct intel_bw_info *bi = &i915->display.bw.max[i];
5865ca02815Sjsg
5871bb76ff1Sjsg bi->num_planes = 1;
5881bb76ff1Sjsg /* Need only one dummy QGV point per group */
5891bb76ff1Sjsg bi->num_qgv_points = 1;
5901bb76ff1Sjsg bi->deratedbw[0] = deratedbw;
5911bb76ff1Sjsg }
5921bb76ff1Sjsg
5931bb76ff1Sjsg i915->display.sagv.status = I915_SAGV_NOT_CONTROLLED;
5945ca02815Sjsg }
5955ca02815Sjsg
icl_max_bw_index(struct drm_i915_private * dev_priv,int num_planes,int qgv_point)596*f005ef32Sjsg static unsigned int icl_max_bw_index(struct drm_i915_private *dev_priv,
597c349dbc7Sjsg int num_planes, int qgv_point)
598c349dbc7Sjsg {
599c349dbc7Sjsg int i;
600c349dbc7Sjsg
601ad8b1aafSjsg /*
602ad8b1aafSjsg * Let's return max bw for 0 planes
603ad8b1aafSjsg */
604ad8b1aafSjsg num_planes = max(1, num_planes);
605ad8b1aafSjsg
6061bb76ff1Sjsg for (i = 0; i < ARRAY_SIZE(dev_priv->display.bw.max); i++) {
607c349dbc7Sjsg const struct intel_bw_info *bi =
6081bb76ff1Sjsg &dev_priv->display.bw.max[i];
609c349dbc7Sjsg
610c349dbc7Sjsg /*
611c349dbc7Sjsg * Pcode will not expose all QGV points when
612c349dbc7Sjsg * SAGV is forced to off/min/med/max.
613c349dbc7Sjsg */
614c349dbc7Sjsg if (qgv_point >= bi->num_qgv_points)
615c349dbc7Sjsg return UINT_MAX;
616c349dbc7Sjsg
617c349dbc7Sjsg if (num_planes >= bi->num_planes)
618*f005ef32Sjsg return i;
619c349dbc7Sjsg }
620c349dbc7Sjsg
621*f005ef32Sjsg return UINT_MAX;
622c349dbc7Sjsg }
623c349dbc7Sjsg
tgl_max_bw_index(struct drm_i915_private * dev_priv,int num_planes,int qgv_point)624*f005ef32Sjsg static unsigned int tgl_max_bw_index(struct drm_i915_private *dev_priv,
6251bb76ff1Sjsg int num_planes, int qgv_point)
6261bb76ff1Sjsg {
6271bb76ff1Sjsg int i;
6281bb76ff1Sjsg
6291bb76ff1Sjsg /*
6301bb76ff1Sjsg * Let's return max bw for 0 planes
6311bb76ff1Sjsg */
6321bb76ff1Sjsg num_planes = max(1, num_planes);
6331bb76ff1Sjsg
6341bb76ff1Sjsg for (i = ARRAY_SIZE(dev_priv->display.bw.max) - 1; i >= 0; i--) {
6351bb76ff1Sjsg const struct intel_bw_info *bi =
6361bb76ff1Sjsg &dev_priv->display.bw.max[i];
6371bb76ff1Sjsg
6381bb76ff1Sjsg /*
6391bb76ff1Sjsg * Pcode will not expose all QGV points when
6401bb76ff1Sjsg * SAGV is forced to off/min/med/max.
6411bb76ff1Sjsg */
6421bb76ff1Sjsg if (qgv_point >= bi->num_qgv_points)
6431bb76ff1Sjsg return UINT_MAX;
6441bb76ff1Sjsg
6451bb76ff1Sjsg if (num_planes <= bi->num_planes)
646*f005ef32Sjsg return i;
6471bb76ff1Sjsg }
6481bb76ff1Sjsg
649*f005ef32Sjsg return 0;
6501bb76ff1Sjsg }
6511bb76ff1Sjsg
adl_psf_bw(struct drm_i915_private * dev_priv,int psf_gv_point)6525ca02815Sjsg static unsigned int adl_psf_bw(struct drm_i915_private *dev_priv,
6535ca02815Sjsg int psf_gv_point)
6545ca02815Sjsg {
6555ca02815Sjsg const struct intel_bw_info *bi =
6561bb76ff1Sjsg &dev_priv->display.bw.max[0];
6575ca02815Sjsg
6585ca02815Sjsg return bi->psf_bw[psf_gv_point];
6595ca02815Sjsg }
6605ca02815Sjsg
intel_bw_init_hw(struct drm_i915_private * dev_priv)661c349dbc7Sjsg void intel_bw_init_hw(struct drm_i915_private *dev_priv)
662c349dbc7Sjsg {
663c349dbc7Sjsg if (!HAS_DISPLAY(dev_priv))
664c349dbc7Sjsg return;
665c349dbc7Sjsg
6661bb76ff1Sjsg if (DISPLAY_VER(dev_priv) >= 14)
6671bb76ff1Sjsg tgl_get_bw_info(dev_priv, &mtl_sa_info);
6681bb76ff1Sjsg else if (IS_DG2(dev_priv))
6695ca02815Sjsg dg2_get_bw_info(dev_priv);
6705ca02815Sjsg else if (IS_ALDERLAKE_P(dev_priv))
6711bb76ff1Sjsg tgl_get_bw_info(dev_priv, &adlp_sa_info);
6725ca02815Sjsg else if (IS_ALDERLAKE_S(dev_priv))
6731bb76ff1Sjsg tgl_get_bw_info(dev_priv, &adls_sa_info);
6745ca02815Sjsg else if (IS_ROCKETLAKE(dev_priv))
6751bb76ff1Sjsg tgl_get_bw_info(dev_priv, &rkl_sa_info);
6765ca02815Sjsg else if (DISPLAY_VER(dev_priv) == 12)
6771bb76ff1Sjsg tgl_get_bw_info(dev_priv, &tgl_sa_info);
6785ca02815Sjsg else if (DISPLAY_VER(dev_priv) == 11)
679c349dbc7Sjsg icl_get_bw_info(dev_priv, &icl_sa_info);
680c349dbc7Sjsg }
681c349dbc7Sjsg
intel_bw_crtc_num_active_planes(const struct intel_crtc_state * crtc_state)682c349dbc7Sjsg static unsigned int intel_bw_crtc_num_active_planes(const struct intel_crtc_state *crtc_state)
683c349dbc7Sjsg {
684c349dbc7Sjsg /*
685c349dbc7Sjsg * We assume cursors are small enough
686c349dbc7Sjsg * to not not cause bandwidth problems.
687c349dbc7Sjsg */
688c349dbc7Sjsg return hweight8(crtc_state->active_planes & ~BIT(PLANE_CURSOR));
689c349dbc7Sjsg }
690c349dbc7Sjsg
intel_bw_crtc_data_rate(const struct intel_crtc_state * crtc_state)691c349dbc7Sjsg static unsigned int intel_bw_crtc_data_rate(const struct intel_crtc_state *crtc_state)
692c349dbc7Sjsg {
693c349dbc7Sjsg struct intel_crtc *crtc = to_intel_crtc(crtc_state->uapi.crtc);
6941bb76ff1Sjsg struct drm_i915_private *i915 = to_i915(crtc->base.dev);
695c349dbc7Sjsg unsigned int data_rate = 0;
696c349dbc7Sjsg enum plane_id plane_id;
697c349dbc7Sjsg
698c349dbc7Sjsg for_each_plane_id_on_crtc(crtc, plane_id) {
699c349dbc7Sjsg /*
700c349dbc7Sjsg * We assume cursors are small enough
701c349dbc7Sjsg * to not not cause bandwidth problems.
702c349dbc7Sjsg */
703c349dbc7Sjsg if (plane_id == PLANE_CURSOR)
704c349dbc7Sjsg continue;
705c349dbc7Sjsg
706c349dbc7Sjsg data_rate += crtc_state->data_rate[plane_id];
7071bb76ff1Sjsg
7081bb76ff1Sjsg if (DISPLAY_VER(i915) < 11)
7091bb76ff1Sjsg data_rate += crtc_state->data_rate_y[plane_id];
710c349dbc7Sjsg }
711c349dbc7Sjsg
712c349dbc7Sjsg return data_rate;
713c349dbc7Sjsg }
714c349dbc7Sjsg
7151bb76ff1Sjsg /* "Maximum Pipe Read Bandwidth" */
intel_bw_crtc_min_cdclk(const struct intel_crtc_state * crtc_state)7161bb76ff1Sjsg static int intel_bw_crtc_min_cdclk(const struct intel_crtc_state *crtc_state)
7171bb76ff1Sjsg {
7181bb76ff1Sjsg struct intel_crtc *crtc = to_intel_crtc(crtc_state->uapi.crtc);
7191bb76ff1Sjsg struct drm_i915_private *i915 = to_i915(crtc->base.dev);
7201bb76ff1Sjsg
7211bb76ff1Sjsg if (DISPLAY_VER(i915) < 12)
7221bb76ff1Sjsg return 0;
7231bb76ff1Sjsg
7241bb76ff1Sjsg return DIV_ROUND_UP_ULL(mul_u32_u32(intel_bw_crtc_data_rate(crtc_state), 10), 512);
7251bb76ff1Sjsg }
7261bb76ff1Sjsg
intel_bw_crtc_update(struct intel_bw_state * bw_state,const struct intel_crtc_state * crtc_state)727c349dbc7Sjsg void intel_bw_crtc_update(struct intel_bw_state *bw_state,
728c349dbc7Sjsg const struct intel_crtc_state *crtc_state)
729c349dbc7Sjsg {
730c349dbc7Sjsg struct intel_crtc *crtc = to_intel_crtc(crtc_state->uapi.crtc);
731ad8b1aafSjsg struct drm_i915_private *i915 = to_i915(crtc->base.dev);
732c349dbc7Sjsg
733c349dbc7Sjsg bw_state->data_rate[crtc->pipe] =
734c349dbc7Sjsg intel_bw_crtc_data_rate(crtc_state);
735c349dbc7Sjsg bw_state->num_active_planes[crtc->pipe] =
736c349dbc7Sjsg intel_bw_crtc_num_active_planes(crtc_state);
737c349dbc7Sjsg
738ad8b1aafSjsg drm_dbg_kms(&i915->drm, "pipe %c data rate %u num active planes %u\n",
739c349dbc7Sjsg pipe_name(crtc->pipe),
740c349dbc7Sjsg bw_state->data_rate[crtc->pipe],
741c349dbc7Sjsg bw_state->num_active_planes[crtc->pipe]);
742c349dbc7Sjsg }
743c349dbc7Sjsg
intel_bw_num_active_planes(struct drm_i915_private * dev_priv,const struct intel_bw_state * bw_state)744c349dbc7Sjsg static unsigned int intel_bw_num_active_planes(struct drm_i915_private *dev_priv,
745c349dbc7Sjsg const struct intel_bw_state *bw_state)
746c349dbc7Sjsg {
747c349dbc7Sjsg unsigned int num_active_planes = 0;
748c349dbc7Sjsg enum pipe pipe;
749c349dbc7Sjsg
750c349dbc7Sjsg for_each_pipe(dev_priv, pipe)
751c349dbc7Sjsg num_active_planes += bw_state->num_active_planes[pipe];
752c349dbc7Sjsg
753c349dbc7Sjsg return num_active_planes;
754c349dbc7Sjsg }
755c349dbc7Sjsg
intel_bw_data_rate(struct drm_i915_private * dev_priv,const struct intel_bw_state * bw_state)756c349dbc7Sjsg static unsigned int intel_bw_data_rate(struct drm_i915_private *dev_priv,
757c349dbc7Sjsg const struct intel_bw_state *bw_state)
758c349dbc7Sjsg {
759c349dbc7Sjsg unsigned int data_rate = 0;
760c349dbc7Sjsg enum pipe pipe;
761c349dbc7Sjsg
762c349dbc7Sjsg for_each_pipe(dev_priv, pipe)
763c349dbc7Sjsg data_rate += bw_state->data_rate[pipe];
764c349dbc7Sjsg
7651bb76ff1Sjsg if (DISPLAY_VER(dev_priv) >= 13 && i915_vtd_active(dev_priv))
7661bb76ff1Sjsg data_rate = DIV_ROUND_UP(data_rate * 105, 100);
7675ca02815Sjsg
768c349dbc7Sjsg return data_rate;
769c349dbc7Sjsg }
770c349dbc7Sjsg
771ad8b1aafSjsg struct intel_bw_state *
intel_atomic_get_old_bw_state(struct intel_atomic_state * state)772ad8b1aafSjsg intel_atomic_get_old_bw_state(struct intel_atomic_state *state)
773ad8b1aafSjsg {
774ad8b1aafSjsg struct drm_i915_private *dev_priv = to_i915(state->base.dev);
775ad8b1aafSjsg struct intel_global_state *bw_state;
776ad8b1aafSjsg
7771bb76ff1Sjsg bw_state = intel_atomic_get_old_global_obj_state(state, &dev_priv->display.bw.obj);
778ad8b1aafSjsg
779ad8b1aafSjsg return to_intel_bw_state(bw_state);
780ad8b1aafSjsg }
781ad8b1aafSjsg
782ad8b1aafSjsg struct intel_bw_state *
intel_atomic_get_new_bw_state(struct intel_atomic_state * state)783ad8b1aafSjsg intel_atomic_get_new_bw_state(struct intel_atomic_state *state)
784ad8b1aafSjsg {
785ad8b1aafSjsg struct drm_i915_private *dev_priv = to_i915(state->base.dev);
786ad8b1aafSjsg struct intel_global_state *bw_state;
787ad8b1aafSjsg
7881bb76ff1Sjsg bw_state = intel_atomic_get_new_global_obj_state(state, &dev_priv->display.bw.obj);
789ad8b1aafSjsg
790ad8b1aafSjsg return to_intel_bw_state(bw_state);
791ad8b1aafSjsg }
792ad8b1aafSjsg
793ad8b1aafSjsg struct intel_bw_state *
intel_atomic_get_bw_state(struct intel_atomic_state * state)794c349dbc7Sjsg intel_atomic_get_bw_state(struct intel_atomic_state *state)
795c349dbc7Sjsg {
796c349dbc7Sjsg struct drm_i915_private *dev_priv = to_i915(state->base.dev);
797c349dbc7Sjsg struct intel_global_state *bw_state;
798c349dbc7Sjsg
7991bb76ff1Sjsg bw_state = intel_atomic_get_global_obj_state(state, &dev_priv->display.bw.obj);
800c349dbc7Sjsg if (IS_ERR(bw_state))
801c349dbc7Sjsg return ERR_CAST(bw_state);
802c349dbc7Sjsg
803c349dbc7Sjsg return to_intel_bw_state(bw_state);
804c349dbc7Sjsg }
805c349dbc7Sjsg
mtl_find_qgv_points(struct drm_i915_private * i915,unsigned int data_rate,unsigned int num_active_planes,struct intel_bw_state * new_bw_state)806*f005ef32Sjsg static int mtl_find_qgv_points(struct drm_i915_private *i915,
807*f005ef32Sjsg unsigned int data_rate,
808*f005ef32Sjsg unsigned int num_active_planes,
809*f005ef32Sjsg struct intel_bw_state *new_bw_state)
810*f005ef32Sjsg {
811*f005ef32Sjsg unsigned int best_rate = UINT_MAX;
812*f005ef32Sjsg unsigned int num_qgv_points = i915->display.bw.max[0].num_qgv_points;
813*f005ef32Sjsg unsigned int qgv_peak_bw = 0;
814*f005ef32Sjsg int i;
815*f005ef32Sjsg int ret;
816*f005ef32Sjsg
817*f005ef32Sjsg ret = intel_atomic_lock_global_state(&new_bw_state->base);
818*f005ef32Sjsg if (ret)
819*f005ef32Sjsg return ret;
820*f005ef32Sjsg
821*f005ef32Sjsg /*
822*f005ef32Sjsg * If SAGV cannot be enabled, disable the pcode SAGV by passing all 1's
823*f005ef32Sjsg * for qgv peak bw in PM Demand request. So assign UINT_MAX if SAGV is
824*f005ef32Sjsg * not enabled. PM Demand code will clamp the value for the register
825*f005ef32Sjsg */
826*f005ef32Sjsg if (!intel_can_enable_sagv(i915, new_bw_state)) {
827*f005ef32Sjsg new_bw_state->qgv_point_peakbw = U16_MAX;
828*f005ef32Sjsg drm_dbg_kms(&i915->drm, "No SAGV, use UINT_MAX as peak bw.");
829*f005ef32Sjsg return 0;
830*f005ef32Sjsg }
831*f005ef32Sjsg
832*f005ef32Sjsg /*
833*f005ef32Sjsg * Find the best QGV point by comparing the data_rate with max data rate
834*f005ef32Sjsg * offered per plane group
835*f005ef32Sjsg */
836*f005ef32Sjsg for (i = 0; i < num_qgv_points; i++) {
837*f005ef32Sjsg unsigned int bw_index =
838*f005ef32Sjsg tgl_max_bw_index(i915, num_active_planes, i);
839*f005ef32Sjsg unsigned int max_data_rate;
840*f005ef32Sjsg
841*f005ef32Sjsg if (bw_index >= ARRAY_SIZE(i915->display.bw.max))
842*f005ef32Sjsg continue;
843*f005ef32Sjsg
844*f005ef32Sjsg max_data_rate = i915->display.bw.max[bw_index].deratedbw[i];
845*f005ef32Sjsg
846*f005ef32Sjsg if (max_data_rate < data_rate)
847*f005ef32Sjsg continue;
848*f005ef32Sjsg
849*f005ef32Sjsg if (max_data_rate - data_rate < best_rate) {
850*f005ef32Sjsg best_rate = max_data_rate - data_rate;
851*f005ef32Sjsg qgv_peak_bw = i915->display.bw.max[bw_index].peakbw[i];
852*f005ef32Sjsg }
853*f005ef32Sjsg
854*f005ef32Sjsg drm_dbg_kms(&i915->drm, "QGV point %d: max bw %d required %d qgv_peak_bw: %d\n",
855*f005ef32Sjsg i, max_data_rate, data_rate, qgv_peak_bw);
856*f005ef32Sjsg }
857*f005ef32Sjsg
858*f005ef32Sjsg drm_dbg_kms(&i915->drm, "Matching peaks QGV bw: %d for required data rate: %d\n",
859*f005ef32Sjsg qgv_peak_bw, data_rate);
860*f005ef32Sjsg
861*f005ef32Sjsg /*
862*f005ef32Sjsg * The display configuration cannot be supported if no QGV point
863*f005ef32Sjsg * satisfying the required data rate is found
864*f005ef32Sjsg */
865*f005ef32Sjsg if (qgv_peak_bw == 0) {
866*f005ef32Sjsg drm_dbg_kms(&i915->drm, "No QGV points for bw %d for display configuration(%d active planes).\n",
867*f005ef32Sjsg data_rate, num_active_planes);
868*f005ef32Sjsg return -EINVAL;
869*f005ef32Sjsg }
870*f005ef32Sjsg
871*f005ef32Sjsg /* MTL PM DEMAND expects QGV BW parameter in multiples of 100 mbps */
872*f005ef32Sjsg new_bw_state->qgv_point_peakbw = DIV_ROUND_CLOSEST(qgv_peak_bw, 100);
873*f005ef32Sjsg
874*f005ef32Sjsg return 0;
875*f005ef32Sjsg }
876*f005ef32Sjsg
icl_find_qgv_points(struct drm_i915_private * i915,unsigned int data_rate,unsigned int num_active_planes,const struct intel_bw_state * old_bw_state,struct intel_bw_state * new_bw_state)877*f005ef32Sjsg static int icl_find_qgv_points(struct drm_i915_private *i915,
878*f005ef32Sjsg unsigned int data_rate,
879*f005ef32Sjsg unsigned int num_active_planes,
880*f005ef32Sjsg const struct intel_bw_state *old_bw_state,
881*f005ef32Sjsg struct intel_bw_state *new_bw_state)
882*f005ef32Sjsg {
883*f005ef32Sjsg unsigned int max_bw_point = 0;
884*f005ef32Sjsg unsigned int max_bw = 0;
885*f005ef32Sjsg unsigned int num_psf_gv_points = i915->display.bw.max[0].num_psf_gv_points;
886*f005ef32Sjsg unsigned int num_qgv_points = i915->display.bw.max[0].num_qgv_points;
887*f005ef32Sjsg u16 psf_points = 0;
888*f005ef32Sjsg u16 qgv_points = 0;
889*f005ef32Sjsg int i;
890*f005ef32Sjsg int ret;
891*f005ef32Sjsg
892*f005ef32Sjsg ret = intel_atomic_lock_global_state(&new_bw_state->base);
893*f005ef32Sjsg if (ret)
894*f005ef32Sjsg return ret;
895*f005ef32Sjsg
896*f005ef32Sjsg for (i = 0; i < num_qgv_points; i++) {
897*f005ef32Sjsg unsigned int idx;
898*f005ef32Sjsg unsigned int max_data_rate;
899*f005ef32Sjsg
900*f005ef32Sjsg if (DISPLAY_VER(i915) > 11)
901*f005ef32Sjsg idx = tgl_max_bw_index(i915, num_active_planes, i);
902*f005ef32Sjsg else
903*f005ef32Sjsg idx = icl_max_bw_index(i915, num_active_planes, i);
904*f005ef32Sjsg
905*f005ef32Sjsg if (idx >= ARRAY_SIZE(i915->display.bw.max))
906*f005ef32Sjsg continue;
907*f005ef32Sjsg
908*f005ef32Sjsg max_data_rate = i915->display.bw.max[idx].deratedbw[i];
909*f005ef32Sjsg
910*f005ef32Sjsg /*
911*f005ef32Sjsg * We need to know which qgv point gives us
912*f005ef32Sjsg * maximum bandwidth in order to disable SAGV
913*f005ef32Sjsg * if we find that we exceed SAGV block time
914*f005ef32Sjsg * with watermarks. By that moment we already
915*f005ef32Sjsg * have those, as it is calculated earlier in
916*f005ef32Sjsg * intel_atomic_check,
917*f005ef32Sjsg */
918*f005ef32Sjsg if (max_data_rate > max_bw) {
919*f005ef32Sjsg max_bw_point = i;
920*f005ef32Sjsg max_bw = max_data_rate;
921*f005ef32Sjsg }
922*f005ef32Sjsg if (max_data_rate >= data_rate)
923*f005ef32Sjsg qgv_points |= BIT(i);
924*f005ef32Sjsg
925*f005ef32Sjsg drm_dbg_kms(&i915->drm, "QGV point %d: max bw %d required %d\n",
926*f005ef32Sjsg i, max_data_rate, data_rate);
927*f005ef32Sjsg }
928*f005ef32Sjsg
929*f005ef32Sjsg for (i = 0; i < num_psf_gv_points; i++) {
930*f005ef32Sjsg unsigned int max_data_rate = adl_psf_bw(i915, i);
931*f005ef32Sjsg
932*f005ef32Sjsg if (max_data_rate >= data_rate)
933*f005ef32Sjsg psf_points |= BIT(i);
934*f005ef32Sjsg
935*f005ef32Sjsg drm_dbg_kms(&i915->drm, "PSF GV point %d: max bw %d"
936*f005ef32Sjsg " required %d\n",
937*f005ef32Sjsg i, max_data_rate, data_rate);
938*f005ef32Sjsg }
939*f005ef32Sjsg
940*f005ef32Sjsg /*
941*f005ef32Sjsg * BSpec states that we always should have at least one allowed point
942*f005ef32Sjsg * left, so if we couldn't - simply reject the configuration for obvious
943*f005ef32Sjsg * reasons.
944*f005ef32Sjsg */
945*f005ef32Sjsg if (qgv_points == 0) {
946*f005ef32Sjsg drm_dbg_kms(&i915->drm, "No QGV points provide sufficient memory"
947*f005ef32Sjsg " bandwidth %d for display configuration(%d active planes).\n",
948*f005ef32Sjsg data_rate, num_active_planes);
949*f005ef32Sjsg return -EINVAL;
950*f005ef32Sjsg }
951*f005ef32Sjsg
952*f005ef32Sjsg if (num_psf_gv_points > 0 && psf_points == 0) {
953*f005ef32Sjsg drm_dbg_kms(&i915->drm, "No PSF GV points provide sufficient memory"
954*f005ef32Sjsg " bandwidth %d for display configuration(%d active planes).\n",
955*f005ef32Sjsg data_rate, num_active_planes);
956*f005ef32Sjsg return -EINVAL;
957*f005ef32Sjsg }
958*f005ef32Sjsg
959*f005ef32Sjsg /*
960*f005ef32Sjsg * Leave only single point with highest bandwidth, if
961*f005ef32Sjsg * we can't enable SAGV due to the increased memory latency it may
962*f005ef32Sjsg * cause.
963*f005ef32Sjsg */
964*f005ef32Sjsg if (!intel_can_enable_sagv(i915, new_bw_state)) {
965*f005ef32Sjsg qgv_points = BIT(max_bw_point);
966*f005ef32Sjsg drm_dbg_kms(&i915->drm, "No SAGV, using single QGV point %d\n",
967*f005ef32Sjsg max_bw_point);
968*f005ef32Sjsg }
969*f005ef32Sjsg
970*f005ef32Sjsg /*
971*f005ef32Sjsg * We store the ones which need to be masked as that is what PCode
972*f005ef32Sjsg * actually accepts as a parameter.
973*f005ef32Sjsg */
974*f005ef32Sjsg new_bw_state->qgv_points_mask =
975*f005ef32Sjsg ~(ICL_PCODE_REQ_QGV_PT(qgv_points) |
976*f005ef32Sjsg ADLS_PCODE_REQ_PSF_PT(psf_points)) &
977*f005ef32Sjsg icl_qgv_points_mask(i915);
978*f005ef32Sjsg
979*f005ef32Sjsg /*
980*f005ef32Sjsg * If the actual mask had changed we need to make sure that
981*f005ef32Sjsg * the commits are serialized(in case this is a nomodeset, nonblocking)
982*f005ef32Sjsg */
983*f005ef32Sjsg if (new_bw_state->qgv_points_mask != old_bw_state->qgv_points_mask) {
984*f005ef32Sjsg ret = intel_atomic_serialize_global_state(&new_bw_state->base);
985*f005ef32Sjsg if (ret)
986*f005ef32Sjsg return ret;
987*f005ef32Sjsg }
988*f005ef32Sjsg
989*f005ef32Sjsg return 0;
990*f005ef32Sjsg }
991*f005ef32Sjsg
intel_bw_check_qgv_points(struct drm_i915_private * i915,const struct intel_bw_state * old_bw_state,struct intel_bw_state * new_bw_state)992*f005ef32Sjsg static int intel_bw_check_qgv_points(struct drm_i915_private *i915,
993*f005ef32Sjsg const struct intel_bw_state *old_bw_state,
994*f005ef32Sjsg struct intel_bw_state *new_bw_state)
995*f005ef32Sjsg {
996*f005ef32Sjsg unsigned int data_rate = intel_bw_data_rate(i915, new_bw_state);
997*f005ef32Sjsg unsigned int num_active_planes =
998*f005ef32Sjsg intel_bw_num_active_planes(i915, new_bw_state);
999*f005ef32Sjsg
1000*f005ef32Sjsg data_rate = DIV_ROUND_UP(data_rate, 1000);
1001*f005ef32Sjsg
1002*f005ef32Sjsg if (DISPLAY_VER(i915) >= 14)
1003*f005ef32Sjsg return mtl_find_qgv_points(i915, data_rate, num_active_planes,
1004*f005ef32Sjsg new_bw_state);
1005*f005ef32Sjsg else
1006*f005ef32Sjsg return icl_find_qgv_points(i915, data_rate, num_active_planes,
1007*f005ef32Sjsg old_bw_state, new_bw_state);
1008*f005ef32Sjsg }
1009*f005ef32Sjsg
intel_bw_state_changed(struct drm_i915_private * i915,const struct intel_bw_state * old_bw_state,const struct intel_bw_state * new_bw_state)10101bb76ff1Sjsg static bool intel_bw_state_changed(struct drm_i915_private *i915,
10111bb76ff1Sjsg const struct intel_bw_state *old_bw_state,
10121bb76ff1Sjsg const struct intel_bw_state *new_bw_state)
1013ad8b1aafSjsg {
1014ad8b1aafSjsg enum pipe pipe;
1015ad8b1aafSjsg
10161bb76ff1Sjsg for_each_pipe(i915, pipe) {
10171bb76ff1Sjsg const struct intel_dbuf_bw *old_crtc_bw =
10181bb76ff1Sjsg &old_bw_state->dbuf_bw[pipe];
10191bb76ff1Sjsg const struct intel_dbuf_bw *new_crtc_bw =
10201bb76ff1Sjsg &new_bw_state->dbuf_bw[pipe];
10211bb76ff1Sjsg enum dbuf_slice slice;
10221bb76ff1Sjsg
10231bb76ff1Sjsg for_each_dbuf_slice(i915, slice) {
10241bb76ff1Sjsg if (old_crtc_bw->max_bw[slice] != new_crtc_bw->max_bw[slice] ||
10251bb76ff1Sjsg old_crtc_bw->active_planes[slice] != new_crtc_bw->active_planes[slice])
10261bb76ff1Sjsg return true;
10271bb76ff1Sjsg }
10281bb76ff1Sjsg
10291bb76ff1Sjsg if (old_bw_state->min_cdclk[pipe] != new_bw_state->min_cdclk[pipe])
10301bb76ff1Sjsg return true;
10311bb76ff1Sjsg }
10321bb76ff1Sjsg
10331bb76ff1Sjsg return false;
10341bb76ff1Sjsg }
10351bb76ff1Sjsg
skl_plane_calc_dbuf_bw(struct intel_bw_state * bw_state,struct intel_crtc * crtc,enum plane_id plane_id,const struct skl_ddb_entry * ddb,unsigned int data_rate)10361bb76ff1Sjsg static void skl_plane_calc_dbuf_bw(struct intel_bw_state *bw_state,
10371bb76ff1Sjsg struct intel_crtc *crtc,
10381bb76ff1Sjsg enum plane_id plane_id,
10391bb76ff1Sjsg const struct skl_ddb_entry *ddb,
10401bb76ff1Sjsg unsigned int data_rate)
10411bb76ff1Sjsg {
10421bb76ff1Sjsg struct drm_i915_private *i915 = to_i915(crtc->base.dev);
10431bb76ff1Sjsg struct intel_dbuf_bw *crtc_bw = &bw_state->dbuf_bw[crtc->pipe];
10441bb76ff1Sjsg unsigned int dbuf_mask = skl_ddb_dbuf_slice_mask(i915, ddb);
10451bb76ff1Sjsg enum dbuf_slice slice;
10461bb76ff1Sjsg
10471bb76ff1Sjsg /*
10481bb76ff1Sjsg * The arbiter can only really guarantee an
10491bb76ff1Sjsg * equal share of the total bw to each plane.
10501bb76ff1Sjsg */
10511bb76ff1Sjsg for_each_dbuf_slice_in_mask(i915, slice, dbuf_mask) {
10521bb76ff1Sjsg crtc_bw->max_bw[slice] = max(crtc_bw->max_bw[slice], data_rate);
10531bb76ff1Sjsg crtc_bw->active_planes[slice] |= BIT(plane_id);
10541bb76ff1Sjsg }
10551bb76ff1Sjsg }
10561bb76ff1Sjsg
skl_crtc_calc_dbuf_bw(struct intel_bw_state * bw_state,const struct intel_crtc_state * crtc_state)10571bb76ff1Sjsg static void skl_crtc_calc_dbuf_bw(struct intel_bw_state *bw_state,
10581bb76ff1Sjsg const struct intel_crtc_state *crtc_state)
10591bb76ff1Sjsg {
10601bb76ff1Sjsg struct intel_crtc *crtc = to_intel_crtc(crtc_state->uapi.crtc);
10611bb76ff1Sjsg struct drm_i915_private *i915 = to_i915(crtc->base.dev);
10621bb76ff1Sjsg struct intel_dbuf_bw *crtc_bw = &bw_state->dbuf_bw[crtc->pipe];
1063ad8b1aafSjsg enum plane_id plane_id;
1064ad8b1aafSjsg
10651bb76ff1Sjsg memset(crtc_bw, 0, sizeof(*crtc_bw));
1066ad8b1aafSjsg
1067ad8b1aafSjsg if (!crtc_state->hw.active)
10681bb76ff1Sjsg return;
1069ad8b1aafSjsg
1070ad8b1aafSjsg for_each_plane_id_on_crtc(crtc, plane_id) {
10711bb76ff1Sjsg /*
10721bb76ff1Sjsg * We assume cursors are small enough
10731bb76ff1Sjsg * to not cause bandwidth problems.
10741bb76ff1Sjsg */
10751bb76ff1Sjsg if (plane_id == PLANE_CURSOR)
10761bb76ff1Sjsg continue;
10771bb76ff1Sjsg
10781bb76ff1Sjsg skl_plane_calc_dbuf_bw(bw_state, crtc, plane_id,
10791bb76ff1Sjsg &crtc_state->wm.skl.plane_ddb[plane_id],
10801bb76ff1Sjsg crtc_state->data_rate[plane_id]);
10811bb76ff1Sjsg
10821bb76ff1Sjsg if (DISPLAY_VER(i915) < 11)
10831bb76ff1Sjsg skl_plane_calc_dbuf_bw(bw_state, crtc, plane_id,
10841bb76ff1Sjsg &crtc_state->wm.skl.plane_ddb_y[plane_id],
10851bb76ff1Sjsg crtc_state->data_rate[plane_id]);
10861bb76ff1Sjsg }
10871bb76ff1Sjsg }
10881bb76ff1Sjsg
10891bb76ff1Sjsg /* "Maximum Data Buffer Bandwidth" */
10901bb76ff1Sjsg static int
intel_bw_dbuf_min_cdclk(struct drm_i915_private * i915,const struct intel_bw_state * bw_state)10911bb76ff1Sjsg intel_bw_dbuf_min_cdclk(struct drm_i915_private *i915,
10921bb76ff1Sjsg const struct intel_bw_state *bw_state)
10931bb76ff1Sjsg {
10941bb76ff1Sjsg unsigned int total_max_bw = 0;
10955ca02815Sjsg enum dbuf_slice slice;
1096ad8b1aafSjsg
10971bb76ff1Sjsg for_each_dbuf_slice(i915, slice) {
10981bb76ff1Sjsg int num_active_planes = 0;
10991bb76ff1Sjsg unsigned int max_bw = 0;
11001bb76ff1Sjsg enum pipe pipe;
1101ad8b1aafSjsg
1102ad8b1aafSjsg /*
11031bb76ff1Sjsg * The arbiter can only really guarantee an
11041bb76ff1Sjsg * equal share of the total bw to each plane.
1105ad8b1aafSjsg */
11061bb76ff1Sjsg for_each_pipe(i915, pipe) {
11071bb76ff1Sjsg const struct intel_dbuf_bw *crtc_bw = &bw_state->dbuf_bw[pipe];
11081bb76ff1Sjsg
11091bb76ff1Sjsg max_bw = max(crtc_bw->max_bw[slice], max_bw);
11101bb76ff1Sjsg num_active_planes += hweight8(crtc_bw->active_planes[slice]);
1111ad8b1aafSjsg }
11121bb76ff1Sjsg max_bw *= num_active_planes;
11131bb76ff1Sjsg
11141bb76ff1Sjsg total_max_bw = max(total_max_bw, max_bw);
1115ad8b1aafSjsg }
1116ad8b1aafSjsg
11171bb76ff1Sjsg return DIV_ROUND_UP(total_max_bw, 64);
1118ad8b1aafSjsg }
1119ad8b1aafSjsg
intel_bw_min_cdclk(struct drm_i915_private * i915,const struct intel_bw_state * bw_state)11201bb76ff1Sjsg int intel_bw_min_cdclk(struct drm_i915_private *i915,
11211bb76ff1Sjsg const struct intel_bw_state *bw_state)
11221bb76ff1Sjsg {
11231bb76ff1Sjsg enum pipe pipe;
11241bb76ff1Sjsg int min_cdclk;
1125ad8b1aafSjsg
11261bb76ff1Sjsg min_cdclk = intel_bw_dbuf_min_cdclk(i915, bw_state);
1127ad8b1aafSjsg
11281bb76ff1Sjsg for_each_pipe(i915, pipe)
11291bb76ff1Sjsg min_cdclk = max(bw_state->min_cdclk[pipe], min_cdclk);
11301bb76ff1Sjsg
11311bb76ff1Sjsg return min_cdclk;
1132ad8b1aafSjsg }
1133ad8b1aafSjsg
intel_bw_calc_min_cdclk(struct intel_atomic_state * state,bool * need_cdclk_calc)11341bb76ff1Sjsg int intel_bw_calc_min_cdclk(struct intel_atomic_state *state,
11351bb76ff1Sjsg bool *need_cdclk_calc)
1136ad8b1aafSjsg {
1137ad8b1aafSjsg struct drm_i915_private *dev_priv = to_i915(state->base.dev);
1138ad8b1aafSjsg struct intel_bw_state *new_bw_state = NULL;
11391bb76ff1Sjsg const struct intel_bw_state *old_bw_state = NULL;
11401bb76ff1Sjsg const struct intel_cdclk_state *cdclk_state;
1141ad8b1aafSjsg const struct intel_crtc_state *crtc_state;
11421bb76ff1Sjsg int old_min_cdclk, new_min_cdclk;
1143ad8b1aafSjsg struct intel_crtc *crtc;
1144ad8b1aafSjsg int i;
1145ad8b1aafSjsg
11461bb76ff1Sjsg if (DISPLAY_VER(dev_priv) < 9)
11471bb76ff1Sjsg return 0;
11481bb76ff1Sjsg
1149ad8b1aafSjsg for_each_new_intel_crtc_in_state(state, crtc, crtc_state, i) {
1150ad8b1aafSjsg new_bw_state = intel_atomic_get_bw_state(state);
1151ad8b1aafSjsg if (IS_ERR(new_bw_state))
1152ad8b1aafSjsg return PTR_ERR(new_bw_state);
1153ad8b1aafSjsg
1154ad8b1aafSjsg old_bw_state = intel_atomic_get_old_bw_state(state);
11551bb76ff1Sjsg
11561bb76ff1Sjsg skl_crtc_calc_dbuf_bw(new_bw_state, crtc_state);
11571bb76ff1Sjsg
11581bb76ff1Sjsg new_bw_state->min_cdclk[crtc->pipe] =
11591bb76ff1Sjsg intel_bw_crtc_min_cdclk(crtc_state);
1160ad8b1aafSjsg }
1161ad8b1aafSjsg
1162ad8b1aafSjsg if (!old_bw_state)
1163ad8b1aafSjsg return 0;
1164ad8b1aafSjsg
11651bb76ff1Sjsg if (intel_bw_state_changed(dev_priv, old_bw_state, new_bw_state)) {
1166ad8b1aafSjsg int ret = intel_atomic_lock_global_state(&new_bw_state->base);
1167ad8b1aafSjsg if (ret)
1168ad8b1aafSjsg return ret;
1169ad8b1aafSjsg }
1170ad8b1aafSjsg
11711bb76ff1Sjsg old_min_cdclk = intel_bw_min_cdclk(dev_priv, old_bw_state);
11721bb76ff1Sjsg new_min_cdclk = intel_bw_min_cdclk(dev_priv, new_bw_state);
11731bb76ff1Sjsg
11741bb76ff1Sjsg /*
11751bb76ff1Sjsg * No need to check against the cdclk state if
11761bb76ff1Sjsg * the min cdclk doesn't increase.
11771bb76ff1Sjsg *
11781bb76ff1Sjsg * Ie. we only ever increase the cdclk due to bandwidth
11791bb76ff1Sjsg * requirements. This can reduce back and forth
11801bb76ff1Sjsg * display blinking due to constant cdclk changes.
11811bb76ff1Sjsg */
11821bb76ff1Sjsg if (new_min_cdclk <= old_min_cdclk)
11831bb76ff1Sjsg return 0;
11841bb76ff1Sjsg
11851bb76ff1Sjsg cdclk_state = intel_atomic_get_cdclk_state(state);
11861bb76ff1Sjsg if (IS_ERR(cdclk_state))
11871bb76ff1Sjsg return PTR_ERR(cdclk_state);
11881bb76ff1Sjsg
11891bb76ff1Sjsg /*
11901bb76ff1Sjsg * No need to recalculate the cdclk state if
11911bb76ff1Sjsg * the min cdclk doesn't increase.
11921bb76ff1Sjsg *
11931bb76ff1Sjsg * Ie. we only ever increase the cdclk due to bandwidth
11941bb76ff1Sjsg * requirements. This can reduce back and forth
11951bb76ff1Sjsg * display blinking due to constant cdclk changes.
11961bb76ff1Sjsg */
11971bb76ff1Sjsg if (new_min_cdclk <= cdclk_state->bw_min_cdclk)
11981bb76ff1Sjsg return 0;
11991bb76ff1Sjsg
12001bb76ff1Sjsg drm_dbg_kms(&dev_priv->drm,
12011bb76ff1Sjsg "new bandwidth min cdclk (%d kHz) > old min cdclk (%d kHz)\n",
12021bb76ff1Sjsg new_min_cdclk, cdclk_state->bw_min_cdclk);
12031bb76ff1Sjsg *need_cdclk_calc = true;
12041bb76ff1Sjsg
1205ad8b1aafSjsg return 0;
1206ad8b1aafSjsg }
1207ad8b1aafSjsg
intel_bw_check_data_rate(struct intel_atomic_state * state,bool * changed)12081bb76ff1Sjsg static int intel_bw_check_data_rate(struct intel_atomic_state *state, bool *changed)
12091bb76ff1Sjsg {
12101bb76ff1Sjsg struct drm_i915_private *i915 = to_i915(state->base.dev);
12111bb76ff1Sjsg const struct intel_crtc_state *new_crtc_state, *old_crtc_state;
12121bb76ff1Sjsg struct intel_crtc *crtc;
12131bb76ff1Sjsg int i;
12145ca02815Sjsg
1215c349dbc7Sjsg for_each_oldnew_intel_crtc_in_state(state, crtc, old_crtc_state,
1216c349dbc7Sjsg new_crtc_state, i) {
1217c349dbc7Sjsg unsigned int old_data_rate =
1218c349dbc7Sjsg intel_bw_crtc_data_rate(old_crtc_state);
1219c349dbc7Sjsg unsigned int new_data_rate =
1220c349dbc7Sjsg intel_bw_crtc_data_rate(new_crtc_state);
1221c349dbc7Sjsg unsigned int old_active_planes =
1222c349dbc7Sjsg intel_bw_crtc_num_active_planes(old_crtc_state);
1223c349dbc7Sjsg unsigned int new_active_planes =
1224c349dbc7Sjsg intel_bw_crtc_num_active_planes(new_crtc_state);
12251bb76ff1Sjsg struct intel_bw_state *new_bw_state;
1226c349dbc7Sjsg
1227c349dbc7Sjsg /*
1228c349dbc7Sjsg * Avoid locking the bw state when
1229c349dbc7Sjsg * nothing significant has changed.
1230c349dbc7Sjsg */
1231c349dbc7Sjsg if (old_data_rate == new_data_rate &&
1232c349dbc7Sjsg old_active_planes == new_active_planes)
1233c349dbc7Sjsg continue;
1234c349dbc7Sjsg
1235ad8b1aafSjsg new_bw_state = intel_atomic_get_bw_state(state);
1236ad8b1aafSjsg if (IS_ERR(new_bw_state))
1237ad8b1aafSjsg return PTR_ERR(new_bw_state);
1238c349dbc7Sjsg
1239ad8b1aafSjsg new_bw_state->data_rate[crtc->pipe] = new_data_rate;
1240ad8b1aafSjsg new_bw_state->num_active_planes[crtc->pipe] = new_active_planes;
1241c349dbc7Sjsg
12421bb76ff1Sjsg *changed = true;
1243679bd941Sjsg
12441bb76ff1Sjsg drm_dbg_kms(&i915->drm,
12451bb76ff1Sjsg "[CRTC:%d:%s] data rate %u num active planes %u\n",
12461bb76ff1Sjsg crtc->base.base.id, crtc->base.name,
1247ad8b1aafSjsg new_bw_state->data_rate[crtc->pipe],
1248ad8b1aafSjsg new_bw_state->num_active_planes[crtc->pipe]);
1249c349dbc7Sjsg }
1250c349dbc7Sjsg
12511bb76ff1Sjsg return 0;
12521bb76ff1Sjsg }
12531bb76ff1Sjsg
intel_bw_atomic_check(struct intel_atomic_state * state)12541bb76ff1Sjsg int intel_bw_atomic_check(struct intel_atomic_state *state)
12551bb76ff1Sjsg {
12561bb76ff1Sjsg bool changed = false;
1257*f005ef32Sjsg struct drm_i915_private *i915 = to_i915(state->base.dev);
1258*f005ef32Sjsg struct intel_bw_state *new_bw_state;
1259*f005ef32Sjsg const struct intel_bw_state *old_bw_state;
1260*f005ef32Sjsg int ret;
12611bb76ff1Sjsg
12621bb76ff1Sjsg /* FIXME earlier gens need some checks too */
1263*f005ef32Sjsg if (DISPLAY_VER(i915) < 11)
12641bb76ff1Sjsg return 0;
12651bb76ff1Sjsg
12661bb76ff1Sjsg ret = intel_bw_check_data_rate(state, &changed);
12671bb76ff1Sjsg if (ret)
12681bb76ff1Sjsg return ret;
12691bb76ff1Sjsg
1270679bd941Sjsg old_bw_state = intel_atomic_get_old_bw_state(state);
1271679bd941Sjsg new_bw_state = intel_atomic_get_new_bw_state(state);
1272679bd941Sjsg
1273679bd941Sjsg if (new_bw_state &&
1274*f005ef32Sjsg intel_can_enable_sagv(i915, old_bw_state) !=
1275*f005ef32Sjsg intel_can_enable_sagv(i915, new_bw_state))
1276679bd941Sjsg changed = true;
1277679bd941Sjsg
1278679bd941Sjsg /*
1279679bd941Sjsg * If none of our inputs (data rates, number of active
1280679bd941Sjsg * planes, SAGV yes/no) changed then nothing to do here.
1281679bd941Sjsg */
1282679bd941Sjsg if (!changed)
1283c349dbc7Sjsg return 0;
1284c349dbc7Sjsg
1285*f005ef32Sjsg ret = intel_bw_check_qgv_points(i915, old_bw_state, new_bw_state);
1286c349dbc7Sjsg if (ret)
1287c349dbc7Sjsg return ret;
1288c349dbc7Sjsg
1289c349dbc7Sjsg return 0;
1290c349dbc7Sjsg }
1291c349dbc7Sjsg
1292c349dbc7Sjsg static struct intel_global_state *
intel_bw_duplicate_state(struct intel_global_obj * obj)1293c349dbc7Sjsg intel_bw_duplicate_state(struct intel_global_obj *obj)
1294c349dbc7Sjsg {
1295c349dbc7Sjsg struct intel_bw_state *state;
1296c349dbc7Sjsg
1297c349dbc7Sjsg state = kmemdup(obj->state, sizeof(*state), GFP_KERNEL);
1298c349dbc7Sjsg if (!state)
1299c349dbc7Sjsg return NULL;
1300c349dbc7Sjsg
1301c349dbc7Sjsg return &state->base;
1302c349dbc7Sjsg }
1303c349dbc7Sjsg
intel_bw_destroy_state(struct intel_global_obj * obj,struct intel_global_state * state)1304c349dbc7Sjsg static void intel_bw_destroy_state(struct intel_global_obj *obj,
1305c349dbc7Sjsg struct intel_global_state *state)
1306c349dbc7Sjsg {
1307c349dbc7Sjsg kfree(state);
1308c349dbc7Sjsg }
1309c349dbc7Sjsg
1310c349dbc7Sjsg static const struct intel_global_state_funcs intel_bw_funcs = {
1311c349dbc7Sjsg .atomic_duplicate_state = intel_bw_duplicate_state,
1312c349dbc7Sjsg .atomic_destroy_state = intel_bw_destroy_state,
1313c349dbc7Sjsg };
1314c349dbc7Sjsg
intel_bw_init(struct drm_i915_private * dev_priv)1315c349dbc7Sjsg int intel_bw_init(struct drm_i915_private *dev_priv)
1316c349dbc7Sjsg {
1317c349dbc7Sjsg struct intel_bw_state *state;
1318c349dbc7Sjsg
1319c349dbc7Sjsg state = kzalloc(sizeof(*state), GFP_KERNEL);
1320c349dbc7Sjsg if (!state)
1321c349dbc7Sjsg return -ENOMEM;
1322c349dbc7Sjsg
13231bb76ff1Sjsg intel_atomic_global_obj_init(dev_priv, &dev_priv->display.bw.obj,
1324c349dbc7Sjsg &state->base, &intel_bw_funcs);
1325c349dbc7Sjsg
1326c349dbc7Sjsg return 0;
1327c349dbc7Sjsg }
1328