1*f005ef32Sjsg // SPDX-License-Identifier: MIT
2*f005ef32Sjsg /*
3*f005ef32Sjsg * Copyright © 2017-2019 Intel Corporation
4*f005ef32Sjsg */
5*f005ef32Sjsg
6*f005ef32Sjsg #include "intel_wopcm.h"
7*f005ef32Sjsg #include "i915_drv.h"
8*f005ef32Sjsg
9*f005ef32Sjsg /**
10*f005ef32Sjsg * DOC: WOPCM Layout
11*f005ef32Sjsg *
12*f005ef32Sjsg * The layout of the WOPCM will be fixed after writing to GuC WOPCM size and
13*f005ef32Sjsg * offset registers whose values are calculated and determined by HuC/GuC
14*f005ef32Sjsg * firmware size and set of hardware requirements/restrictions as shown below:
15*f005ef32Sjsg *
16*f005ef32Sjsg * ::
17*f005ef32Sjsg *
18*f005ef32Sjsg * +=========> +====================+ <== WOPCM Top
19*f005ef32Sjsg * ^ | HW contexts RSVD |
20*f005ef32Sjsg * | +===> +====================+ <== GuC WOPCM Top
21*f005ef32Sjsg * | ^ | |
22*f005ef32Sjsg * | | | |
23*f005ef32Sjsg * | | | |
24*f005ef32Sjsg * | GuC | |
25*f005ef32Sjsg * | WOPCM | |
26*f005ef32Sjsg * | Size +--------------------+
27*f005ef32Sjsg * WOPCM | | GuC FW RSVD |
28*f005ef32Sjsg * | | +--------------------+
29*f005ef32Sjsg * | | | GuC Stack RSVD |
30*f005ef32Sjsg * | | +------------------- +
31*f005ef32Sjsg * | v | GuC WOPCM RSVD |
32*f005ef32Sjsg * | +===> +====================+ <== GuC WOPCM base
33*f005ef32Sjsg * | | WOPCM RSVD |
34*f005ef32Sjsg * | +------------------- + <== HuC Firmware Top
35*f005ef32Sjsg * v | HuC FW |
36*f005ef32Sjsg * +=========> +====================+ <== WOPCM Base
37*f005ef32Sjsg *
38*f005ef32Sjsg * GuC accessible WOPCM starts at GuC WOPCM base and ends at GuC WOPCM top.
39*f005ef32Sjsg * The top part of the WOPCM is reserved for hardware contexts (e.g. RC6
40*f005ef32Sjsg * context).
41*f005ef32Sjsg */
42*f005ef32Sjsg
43*f005ef32Sjsg /* Default WOPCM size is 2MB from Gen11, 1MB on previous platforms */
44*f005ef32Sjsg #define GEN11_WOPCM_SIZE SZ_2M
45*f005ef32Sjsg #define GEN9_WOPCM_SIZE SZ_1M
46*f005ef32Sjsg #define MAX_WOPCM_SIZE SZ_8M
47*f005ef32Sjsg /* 16KB WOPCM (RSVD WOPCM) is reserved from HuC firmware top. */
48*f005ef32Sjsg #define WOPCM_RESERVED_SIZE SZ_16K
49*f005ef32Sjsg
50*f005ef32Sjsg /* 16KB reserved at the beginning of GuC WOPCM. */
51*f005ef32Sjsg #define GUC_WOPCM_RESERVED SZ_16K
52*f005ef32Sjsg /* 8KB from GUC_WOPCM_RESERVED is reserved for GuC stack. */
53*f005ef32Sjsg #define GUC_WOPCM_STACK_RESERVED SZ_8K
54*f005ef32Sjsg
55*f005ef32Sjsg /* GuC WOPCM Offset value needs to be aligned to 16KB. */
56*f005ef32Sjsg #define GUC_WOPCM_OFFSET_ALIGNMENT (1UL << GUC_WOPCM_OFFSET_SHIFT)
57*f005ef32Sjsg
58*f005ef32Sjsg /* 24KB at the end of WOPCM is reserved for RC6 CTX on BXT. */
59*f005ef32Sjsg #define BXT_WOPCM_RC6_CTX_RESERVED (SZ_16K + SZ_8K)
60*f005ef32Sjsg /* 36KB WOPCM reserved at the end of WOPCM on ICL. */
61*f005ef32Sjsg #define ICL_WOPCM_HW_CTX_RESERVED (SZ_32K + SZ_4K)
62*f005ef32Sjsg
63*f005ef32Sjsg /* 128KB from GUC_WOPCM_RESERVED is reserved for FW on Gen9. */
64*f005ef32Sjsg #define GEN9_GUC_FW_RESERVED SZ_128K
65*f005ef32Sjsg #define GEN9_GUC_WOPCM_OFFSET (GUC_WOPCM_RESERVED + GEN9_GUC_FW_RESERVED)
66*f005ef32Sjsg
wopcm_to_gt(struct intel_wopcm * wopcm)67*f005ef32Sjsg static inline struct intel_gt *wopcm_to_gt(struct intel_wopcm *wopcm)
68*f005ef32Sjsg {
69*f005ef32Sjsg return container_of(wopcm, struct intel_gt, wopcm);
70*f005ef32Sjsg }
71*f005ef32Sjsg
72*f005ef32Sjsg /**
73*f005ef32Sjsg * intel_wopcm_init_early() - Early initialization of the WOPCM.
74*f005ef32Sjsg * @wopcm: pointer to intel_wopcm.
75*f005ef32Sjsg *
76*f005ef32Sjsg * Setup the size of WOPCM which will be used by later on WOPCM partitioning.
77*f005ef32Sjsg */
intel_wopcm_init_early(struct intel_wopcm * wopcm)78*f005ef32Sjsg void intel_wopcm_init_early(struct intel_wopcm *wopcm)
79*f005ef32Sjsg {
80*f005ef32Sjsg struct intel_gt *gt = wopcm_to_gt(wopcm);
81*f005ef32Sjsg struct drm_i915_private *i915 = gt->i915;
82*f005ef32Sjsg
83*f005ef32Sjsg if (!HAS_GT_UC(i915))
84*f005ef32Sjsg return;
85*f005ef32Sjsg
86*f005ef32Sjsg if (GRAPHICS_VER(i915) >= 11)
87*f005ef32Sjsg wopcm->size = GEN11_WOPCM_SIZE;
88*f005ef32Sjsg else
89*f005ef32Sjsg wopcm->size = GEN9_WOPCM_SIZE;
90*f005ef32Sjsg
91*f005ef32Sjsg drm_dbg(&i915->drm, "WOPCM: %uK\n", wopcm->size / 1024);
92*f005ef32Sjsg }
93*f005ef32Sjsg
context_reserved_size(struct drm_i915_private * i915)94*f005ef32Sjsg static u32 context_reserved_size(struct drm_i915_private *i915)
95*f005ef32Sjsg {
96*f005ef32Sjsg if (IS_GEN9_LP(i915))
97*f005ef32Sjsg return BXT_WOPCM_RC6_CTX_RESERVED;
98*f005ef32Sjsg else if (GRAPHICS_VER(i915) >= 11)
99*f005ef32Sjsg return ICL_WOPCM_HW_CTX_RESERVED;
100*f005ef32Sjsg else
101*f005ef32Sjsg return 0;
102*f005ef32Sjsg }
103*f005ef32Sjsg
gen9_check_dword_gap(struct drm_i915_private * i915,u32 guc_wopcm_base,u32 guc_wopcm_size)104*f005ef32Sjsg static bool gen9_check_dword_gap(struct drm_i915_private *i915,
105*f005ef32Sjsg u32 guc_wopcm_base, u32 guc_wopcm_size)
106*f005ef32Sjsg {
107*f005ef32Sjsg u32 offset;
108*f005ef32Sjsg
109*f005ef32Sjsg /*
110*f005ef32Sjsg * GuC WOPCM size shall be at least a dword larger than the offset from
111*f005ef32Sjsg * WOPCM base (GuC WOPCM offset from WOPCM base + GEN9_GUC_WOPCM_OFFSET)
112*f005ef32Sjsg * due to hardware limitation on Gen9.
113*f005ef32Sjsg */
114*f005ef32Sjsg offset = guc_wopcm_base + GEN9_GUC_WOPCM_OFFSET;
115*f005ef32Sjsg if (offset > guc_wopcm_size ||
116*f005ef32Sjsg (guc_wopcm_size - offset) < sizeof(u32)) {
117*f005ef32Sjsg drm_err(&i915->drm,
118*f005ef32Sjsg "WOPCM: invalid GuC region size: %uK < %uK\n",
119*f005ef32Sjsg guc_wopcm_size / SZ_1K,
120*f005ef32Sjsg (u32)(offset + sizeof(u32)) / SZ_1K);
121*f005ef32Sjsg return false;
122*f005ef32Sjsg }
123*f005ef32Sjsg
124*f005ef32Sjsg return true;
125*f005ef32Sjsg }
126*f005ef32Sjsg
gen9_check_huc_fw_fits(struct drm_i915_private * i915,u32 guc_wopcm_size,u32 huc_fw_size)127*f005ef32Sjsg static bool gen9_check_huc_fw_fits(struct drm_i915_private *i915,
128*f005ef32Sjsg u32 guc_wopcm_size, u32 huc_fw_size)
129*f005ef32Sjsg {
130*f005ef32Sjsg /*
131*f005ef32Sjsg * On Gen9, hardware requires the total available GuC WOPCM
132*f005ef32Sjsg * size to be larger than or equal to HuC firmware size. Otherwise,
133*f005ef32Sjsg * firmware uploading would fail.
134*f005ef32Sjsg */
135*f005ef32Sjsg if (huc_fw_size > guc_wopcm_size - GUC_WOPCM_RESERVED) {
136*f005ef32Sjsg drm_err(&i915->drm, "WOPCM: no space for %s: %uK < %uK\n",
137*f005ef32Sjsg intel_uc_fw_type_repr(INTEL_UC_FW_TYPE_HUC),
138*f005ef32Sjsg (guc_wopcm_size - GUC_WOPCM_RESERVED) / SZ_1K,
139*f005ef32Sjsg huc_fw_size / 1024);
140*f005ef32Sjsg return false;
141*f005ef32Sjsg }
142*f005ef32Sjsg
143*f005ef32Sjsg return true;
144*f005ef32Sjsg }
145*f005ef32Sjsg
check_hw_restrictions(struct drm_i915_private * i915,u32 guc_wopcm_base,u32 guc_wopcm_size,u32 huc_fw_size)146*f005ef32Sjsg static bool check_hw_restrictions(struct drm_i915_private *i915,
147*f005ef32Sjsg u32 guc_wopcm_base, u32 guc_wopcm_size,
148*f005ef32Sjsg u32 huc_fw_size)
149*f005ef32Sjsg {
150*f005ef32Sjsg if (GRAPHICS_VER(i915) == 9 && !gen9_check_dword_gap(i915, guc_wopcm_base,
151*f005ef32Sjsg guc_wopcm_size))
152*f005ef32Sjsg return false;
153*f005ef32Sjsg
154*f005ef32Sjsg if (GRAPHICS_VER(i915) == 9 &&
155*f005ef32Sjsg !gen9_check_huc_fw_fits(i915, guc_wopcm_size, huc_fw_size))
156*f005ef32Sjsg return false;
157*f005ef32Sjsg
158*f005ef32Sjsg return true;
159*f005ef32Sjsg }
160*f005ef32Sjsg
__check_layout(struct intel_gt * gt,u32 wopcm_size,u32 guc_wopcm_base,u32 guc_wopcm_size,u32 guc_fw_size,u32 huc_fw_size)161*f005ef32Sjsg static bool __check_layout(struct intel_gt *gt, u32 wopcm_size,
162*f005ef32Sjsg u32 guc_wopcm_base, u32 guc_wopcm_size,
163*f005ef32Sjsg u32 guc_fw_size, u32 huc_fw_size)
164*f005ef32Sjsg {
165*f005ef32Sjsg struct drm_i915_private *i915 = gt->i915;
166*f005ef32Sjsg const u32 ctx_rsvd = context_reserved_size(i915);
167*f005ef32Sjsg u32 size;
168*f005ef32Sjsg
169*f005ef32Sjsg size = wopcm_size - ctx_rsvd;
170*f005ef32Sjsg if (unlikely(range_overflows(guc_wopcm_base, guc_wopcm_size, size))) {
171*f005ef32Sjsg drm_err(&i915->drm,
172*f005ef32Sjsg "WOPCM: invalid GuC region layout: %uK + %uK > %uK\n",
173*f005ef32Sjsg guc_wopcm_base / SZ_1K, guc_wopcm_size / SZ_1K,
174*f005ef32Sjsg size / SZ_1K);
175*f005ef32Sjsg return false;
176*f005ef32Sjsg }
177*f005ef32Sjsg
178*f005ef32Sjsg size = guc_fw_size + GUC_WOPCM_RESERVED + GUC_WOPCM_STACK_RESERVED;
179*f005ef32Sjsg if (unlikely(guc_wopcm_size < size)) {
180*f005ef32Sjsg drm_err(&i915->drm, "WOPCM: no space for %s: %uK < %uK\n",
181*f005ef32Sjsg intel_uc_fw_type_repr(INTEL_UC_FW_TYPE_GUC),
182*f005ef32Sjsg guc_wopcm_size / SZ_1K, size / SZ_1K);
183*f005ef32Sjsg return false;
184*f005ef32Sjsg }
185*f005ef32Sjsg
186*f005ef32Sjsg if (intel_uc_supports_huc(>->uc)) {
187*f005ef32Sjsg size = huc_fw_size + WOPCM_RESERVED_SIZE;
188*f005ef32Sjsg if (unlikely(guc_wopcm_base < size)) {
189*f005ef32Sjsg drm_err(&i915->drm, "WOPCM: no space for %s: %uK < %uK\n",
190*f005ef32Sjsg intel_uc_fw_type_repr(INTEL_UC_FW_TYPE_HUC),
191*f005ef32Sjsg guc_wopcm_base / SZ_1K, size / SZ_1K);
192*f005ef32Sjsg return false;
193*f005ef32Sjsg }
194*f005ef32Sjsg }
195*f005ef32Sjsg
196*f005ef32Sjsg return check_hw_restrictions(i915, guc_wopcm_base, guc_wopcm_size,
197*f005ef32Sjsg huc_fw_size);
198*f005ef32Sjsg }
199*f005ef32Sjsg
__wopcm_regs_locked(struct intel_uncore * uncore,u32 * guc_wopcm_base,u32 * guc_wopcm_size)200*f005ef32Sjsg static bool __wopcm_regs_locked(struct intel_uncore *uncore,
201*f005ef32Sjsg u32 *guc_wopcm_base, u32 *guc_wopcm_size)
202*f005ef32Sjsg {
203*f005ef32Sjsg u32 reg_base = intel_uncore_read(uncore, DMA_GUC_WOPCM_OFFSET);
204*f005ef32Sjsg u32 reg_size = intel_uncore_read(uncore, GUC_WOPCM_SIZE);
205*f005ef32Sjsg
206*f005ef32Sjsg if (!(reg_size & GUC_WOPCM_SIZE_LOCKED) ||
207*f005ef32Sjsg !(reg_base & GUC_WOPCM_OFFSET_VALID))
208*f005ef32Sjsg return false;
209*f005ef32Sjsg
210*f005ef32Sjsg *guc_wopcm_base = reg_base & GUC_WOPCM_OFFSET_MASK;
211*f005ef32Sjsg *guc_wopcm_size = reg_size & GUC_WOPCM_SIZE_MASK;
212*f005ef32Sjsg return true;
213*f005ef32Sjsg }
214*f005ef32Sjsg
__wopcm_regs_writable(struct intel_uncore * uncore)215*f005ef32Sjsg static bool __wopcm_regs_writable(struct intel_uncore *uncore)
216*f005ef32Sjsg {
217*f005ef32Sjsg if (!HAS_GUC_DEPRIVILEGE(uncore->i915))
218*f005ef32Sjsg return true;
219*f005ef32Sjsg
220*f005ef32Sjsg return intel_uncore_read(uncore, GUC_SHIM_CONTROL2) & GUC_IS_PRIVILEGED;
221*f005ef32Sjsg }
222*f005ef32Sjsg
223*f005ef32Sjsg /**
224*f005ef32Sjsg * intel_wopcm_init() - Initialize the WOPCM structure.
225*f005ef32Sjsg * @wopcm: pointer to intel_wopcm.
226*f005ef32Sjsg *
227*f005ef32Sjsg * This function will partition WOPCM space based on GuC and HuC firmware sizes
228*f005ef32Sjsg * and will allocate max remaining for use by GuC. This function will also
229*f005ef32Sjsg * enforce platform dependent hardware restrictions on GuC WOPCM offset and
230*f005ef32Sjsg * size. It will fail the WOPCM init if any of these checks fail, so that the
231*f005ef32Sjsg * following WOPCM registers setup and GuC firmware uploading would be aborted.
232*f005ef32Sjsg */
intel_wopcm_init(struct intel_wopcm * wopcm)233*f005ef32Sjsg void intel_wopcm_init(struct intel_wopcm *wopcm)
234*f005ef32Sjsg {
235*f005ef32Sjsg struct intel_gt *gt = wopcm_to_gt(wopcm);
236*f005ef32Sjsg struct drm_i915_private *i915 = gt->i915;
237*f005ef32Sjsg u32 guc_fw_size = intel_uc_fw_get_upload_size(>->uc.guc.fw);
238*f005ef32Sjsg u32 huc_fw_size = intel_uc_fw_get_upload_size(>->uc.huc.fw);
239*f005ef32Sjsg u32 ctx_rsvd = context_reserved_size(i915);
240*f005ef32Sjsg u32 wopcm_size = wopcm->size;
241*f005ef32Sjsg u32 guc_wopcm_base;
242*f005ef32Sjsg u32 guc_wopcm_size;
243*f005ef32Sjsg
244*f005ef32Sjsg if (!guc_fw_size)
245*f005ef32Sjsg return;
246*f005ef32Sjsg
247*f005ef32Sjsg GEM_BUG_ON(!wopcm_size);
248*f005ef32Sjsg GEM_BUG_ON(wopcm->guc.base);
249*f005ef32Sjsg GEM_BUG_ON(wopcm->guc.size);
250*f005ef32Sjsg GEM_BUG_ON(guc_fw_size >= wopcm_size);
251*f005ef32Sjsg GEM_BUG_ON(huc_fw_size >= wopcm_size);
252*f005ef32Sjsg GEM_BUG_ON(ctx_rsvd + WOPCM_RESERVED_SIZE >= wopcm_size);
253*f005ef32Sjsg
254*f005ef32Sjsg if (i915_inject_probe_failure(i915))
255*f005ef32Sjsg return;
256*f005ef32Sjsg
257*f005ef32Sjsg if (__wopcm_regs_locked(gt->uncore, &guc_wopcm_base, &guc_wopcm_size)) {
258*f005ef32Sjsg drm_dbg(&i915->drm, "GuC WOPCM is already locked [%uK, %uK)\n",
259*f005ef32Sjsg guc_wopcm_base / SZ_1K, guc_wopcm_size / SZ_1K);
260*f005ef32Sjsg /*
261*f005ef32Sjsg * Note that to keep things simple (i.e. avoid different
262*f005ef32Sjsg * defines per platform) our WOPCM math doesn't always use the
263*f005ef32Sjsg * actual WOPCM size, but a value that is less or equal to it.
264*f005ef32Sjsg * This is perfectly fine when i915 programs the registers, but
265*f005ef32Sjsg * on platforms with GuC deprivilege the registers are not
266*f005ef32Sjsg * writable from i915 and are instead pre-programmed by the
267*f005ef32Sjsg * bios/IFWI, so there might be a mismatch of sizes.
268*f005ef32Sjsg * Instead of handling the size difference, we trust that the
269*f005ef32Sjsg * programmed values make sense and disable the relevant check
270*f005ef32Sjsg * by using the maximum possible WOPCM size in the verification
271*f005ef32Sjsg * math. In the extremely unlikely case that the registers
272*f005ef32Sjsg * were pre-programmed with an invalid value, we will still
273*f005ef32Sjsg * gracefully fail later during the GuC/HuC dma.
274*f005ef32Sjsg */
275*f005ef32Sjsg if (!__wopcm_regs_writable(gt->uncore))
276*f005ef32Sjsg wopcm_size = MAX_WOPCM_SIZE;
277*f005ef32Sjsg
278*f005ef32Sjsg goto check;
279*f005ef32Sjsg }
280*f005ef32Sjsg
281*f005ef32Sjsg /*
282*f005ef32Sjsg * On platforms with a media GT, the WOPCM is partitioned between the
283*f005ef32Sjsg * two GTs, so we would have to take that into account when doing the
284*f005ef32Sjsg * math below. There is also a new section reserved for the GSC context
285*f005ef32Sjsg * that would have to be factored in. However, all platforms with a
286*f005ef32Sjsg * media GT also have GuC depriv enabled, so the WOPCM regs are
287*f005ef32Sjsg * pre-locked and therefore we don't have to do the math ourselves.
288*f005ef32Sjsg */
289*f005ef32Sjsg if (unlikely(i915->media_gt)) {
290*f005ef32Sjsg drm_err(&i915->drm, "Unlocked WOPCM regs with media GT\n");
291*f005ef32Sjsg return;
292*f005ef32Sjsg }
293*f005ef32Sjsg
294*f005ef32Sjsg /*
295*f005ef32Sjsg * Aligned value of guc_wopcm_base will determine available WOPCM space
296*f005ef32Sjsg * for HuC firmware and mandatory reserved area.
297*f005ef32Sjsg */
298*f005ef32Sjsg guc_wopcm_base = huc_fw_size + WOPCM_RESERVED_SIZE;
299*f005ef32Sjsg guc_wopcm_base = ALIGN(guc_wopcm_base, GUC_WOPCM_OFFSET_ALIGNMENT);
300*f005ef32Sjsg
301*f005ef32Sjsg /*
302*f005ef32Sjsg * Need to clamp guc_wopcm_base now to make sure the following math is
303*f005ef32Sjsg * correct. Formal check of whole WOPCM layout will be done below.
304*f005ef32Sjsg */
305*f005ef32Sjsg guc_wopcm_base = min(guc_wopcm_base, wopcm_size - ctx_rsvd);
306*f005ef32Sjsg
307*f005ef32Sjsg /* Aligned remainings of usable WOPCM space can be assigned to GuC. */
308*f005ef32Sjsg guc_wopcm_size = wopcm_size - ctx_rsvd - guc_wopcm_base;
309*f005ef32Sjsg guc_wopcm_size &= GUC_WOPCM_SIZE_MASK;
310*f005ef32Sjsg
311*f005ef32Sjsg drm_dbg(&i915->drm, "Calculated GuC WOPCM [%uK, %uK)\n",
312*f005ef32Sjsg guc_wopcm_base / SZ_1K, guc_wopcm_size / SZ_1K);
313*f005ef32Sjsg
314*f005ef32Sjsg check:
315*f005ef32Sjsg if (__check_layout(gt, wopcm_size, guc_wopcm_base, guc_wopcm_size,
316*f005ef32Sjsg guc_fw_size, huc_fw_size)) {
317*f005ef32Sjsg wopcm->guc.base = guc_wopcm_base;
318*f005ef32Sjsg wopcm->guc.size = guc_wopcm_size;
319*f005ef32Sjsg GEM_BUG_ON(!wopcm->guc.base);
320*f005ef32Sjsg GEM_BUG_ON(!wopcm->guc.size);
321*f005ef32Sjsg }
322*f005ef32Sjsg }
323