1de97bdebSjsg // SPDX-License-Identifier: MIT
2de97bdebSjsg /*
3de97bdebSjsg * Copyright © 2021 Intel Corporation
4de97bdebSjsg */
5de97bdebSjsg
61bb76ff1Sjsg #include "gem/i915_gem_domain.h"
71bb76ff1Sjsg #include "gem/i915_gem_internal.h"
8*f005ef32Sjsg #include "gem/i915_gem_lmem.h"
91bb76ff1Sjsg #include "gt/gen8_ppgtt.h"
101bb76ff1Sjsg
11de97bdebSjsg #include "i915_drv.h"
12*f005ef32Sjsg #include "i915_reg.h"
13*f005ef32Sjsg #include "intel_de.h"
14de97bdebSjsg #include "intel_display_types.h"
15de97bdebSjsg #include "intel_dpt.h"
16de97bdebSjsg #include "intel_fb.h"
17de97bdebSjsg
18de97bdebSjsg struct i915_dpt {
19de97bdebSjsg struct i915_address_space vm;
20de97bdebSjsg
21de97bdebSjsg struct drm_i915_gem_object *obj;
22de97bdebSjsg struct i915_vma *vma;
23de97bdebSjsg void __iomem *iomem;
24de97bdebSjsg };
25de97bdebSjsg
26de97bdebSjsg #define i915_is_dpt(vm) ((vm)->is_dpt)
27de97bdebSjsg
28de97bdebSjsg static inline struct i915_dpt *
i915_vm_to_dpt(struct i915_address_space * vm)29de97bdebSjsg i915_vm_to_dpt(struct i915_address_space *vm)
30de97bdebSjsg {
31de97bdebSjsg BUILD_BUG_ON(offsetof(struct i915_dpt, vm));
32de97bdebSjsg GEM_BUG_ON(!i915_is_dpt(vm));
33de97bdebSjsg return container_of(vm, struct i915_dpt, vm);
34de97bdebSjsg }
35de97bdebSjsg
36de97bdebSjsg #define dpt_total_entries(dpt) ((dpt)->vm.total >> PAGE_SHIFT)
37de97bdebSjsg
gen8_set_pte(void __iomem * addr,gen8_pte_t pte)38de97bdebSjsg static void gen8_set_pte(void __iomem *addr, gen8_pte_t pte)
39de97bdebSjsg {
40de97bdebSjsg writeq(pte, addr);
41de97bdebSjsg }
42de97bdebSjsg
dpt_insert_page(struct i915_address_space * vm,dma_addr_t addr,u64 offset,unsigned int pat_index,u32 flags)43de97bdebSjsg static void dpt_insert_page(struct i915_address_space *vm,
44de97bdebSjsg dma_addr_t addr,
45de97bdebSjsg u64 offset,
46*f005ef32Sjsg unsigned int pat_index,
47de97bdebSjsg u32 flags)
48de97bdebSjsg {
49de97bdebSjsg struct i915_dpt *dpt = i915_vm_to_dpt(vm);
50de97bdebSjsg gen8_pte_t __iomem *base = dpt->iomem;
51de97bdebSjsg
52de97bdebSjsg gen8_set_pte(base + offset / I915_GTT_PAGE_SIZE,
53*f005ef32Sjsg vm->pte_encode(addr, pat_index, flags));
54de97bdebSjsg }
55de97bdebSjsg
dpt_insert_entries(struct i915_address_space * vm,struct i915_vma_resource * vma_res,unsigned int pat_index,u32 flags)56de97bdebSjsg static void dpt_insert_entries(struct i915_address_space *vm,
571bb76ff1Sjsg struct i915_vma_resource *vma_res,
58*f005ef32Sjsg unsigned int pat_index,
59de97bdebSjsg u32 flags)
60de97bdebSjsg {
61de97bdebSjsg struct i915_dpt *dpt = i915_vm_to_dpt(vm);
62de97bdebSjsg gen8_pte_t __iomem *base = dpt->iomem;
63*f005ef32Sjsg const gen8_pte_t pte_encode = vm->pte_encode(0, pat_index, flags);
64de97bdebSjsg struct sgt_iter sgt_iter;
65de97bdebSjsg dma_addr_t addr;
66de97bdebSjsg int i;
67de97bdebSjsg
68de97bdebSjsg /*
69de97bdebSjsg * Note that we ignore PTE_READ_ONLY here. The caller must be careful
70de97bdebSjsg * not to allow the user to override access to a read only page.
71de97bdebSjsg */
72de97bdebSjsg
731bb76ff1Sjsg i = vma_res->start / I915_GTT_PAGE_SIZE;
741bb76ff1Sjsg for_each_sgt_daddr(addr, sgt_iter, vma_res->bi.pages)
75de97bdebSjsg gen8_set_pte(&base[i++], pte_encode | addr);
76de97bdebSjsg }
77de97bdebSjsg
dpt_clear_range(struct i915_address_space * vm,u64 start,u64 length)78de97bdebSjsg static void dpt_clear_range(struct i915_address_space *vm,
79de97bdebSjsg u64 start, u64 length)
80de97bdebSjsg {
81de97bdebSjsg }
82de97bdebSjsg
dpt_bind_vma(struct i915_address_space * vm,struct i915_vm_pt_stash * stash,struct i915_vma_resource * vma_res,unsigned int pat_index,u32 flags)83de97bdebSjsg static void dpt_bind_vma(struct i915_address_space *vm,
84de97bdebSjsg struct i915_vm_pt_stash *stash,
851bb76ff1Sjsg struct i915_vma_resource *vma_res,
86*f005ef32Sjsg unsigned int pat_index,
87de97bdebSjsg u32 flags)
88de97bdebSjsg {
89de97bdebSjsg u32 pte_flags;
90de97bdebSjsg
911bb76ff1Sjsg if (vma_res->bound_flags)
921bb76ff1Sjsg return;
931bb76ff1Sjsg
94de97bdebSjsg /* Applicable to VLV (gen8+ do not support RO in the GGTT) */
95de97bdebSjsg pte_flags = 0;
961bb76ff1Sjsg if (vm->has_read_only && vma_res->bi.readonly)
97de97bdebSjsg pte_flags |= PTE_READ_ONLY;
981bb76ff1Sjsg if (vma_res->bi.lmem)
99de97bdebSjsg pte_flags |= PTE_LM;
100de97bdebSjsg
101*f005ef32Sjsg vm->insert_entries(vm, vma_res, pat_index, pte_flags);
102de97bdebSjsg
1031bb76ff1Sjsg vma_res->page_sizes_gtt = I915_GTT_PAGE_SIZE;
104de97bdebSjsg
105de97bdebSjsg /*
106de97bdebSjsg * Without aliasing PPGTT there's no difference between
107de97bdebSjsg * GLOBAL/LOCAL_BIND, it's all the same ptes. Hence unconditionally
108de97bdebSjsg * upgrade to both bound if we bind either to avoid double-binding.
109de97bdebSjsg */
1101bb76ff1Sjsg vma_res->bound_flags = I915_VMA_GLOBAL_BIND | I915_VMA_LOCAL_BIND;
111de97bdebSjsg }
112de97bdebSjsg
dpt_unbind_vma(struct i915_address_space * vm,struct i915_vma_resource * vma_res)1131bb76ff1Sjsg static void dpt_unbind_vma(struct i915_address_space *vm,
1141bb76ff1Sjsg struct i915_vma_resource *vma_res)
115de97bdebSjsg {
1161bb76ff1Sjsg vm->clear_range(vm, vma_res->start, vma_res->vma_size);
117de97bdebSjsg }
118de97bdebSjsg
dpt_cleanup(struct i915_address_space * vm)119de97bdebSjsg static void dpt_cleanup(struct i915_address_space *vm)
120de97bdebSjsg {
121de97bdebSjsg struct i915_dpt *dpt = i915_vm_to_dpt(vm);
122de97bdebSjsg
123de97bdebSjsg i915_gem_object_put(dpt->obj);
124de97bdebSjsg }
125de97bdebSjsg
intel_dpt_pin(struct i915_address_space * vm)126de97bdebSjsg struct i915_vma *intel_dpt_pin(struct i915_address_space *vm)
127de97bdebSjsg {
128de97bdebSjsg struct drm_i915_private *i915 = vm->i915;
129de97bdebSjsg struct i915_dpt *dpt = i915_vm_to_dpt(vm);
130de97bdebSjsg intel_wakeref_t wakeref;
131de97bdebSjsg struct i915_vma *vma;
132de97bdebSjsg void __iomem *iomem;
1331bb76ff1Sjsg struct i915_gem_ww_ctx ww;
1341bb76ff1Sjsg u64 pin_flags = 0;
1351bb76ff1Sjsg int err;
1361bb76ff1Sjsg
1371bb76ff1Sjsg if (i915_gem_object_is_stolen(dpt->obj))
1381bb76ff1Sjsg pin_flags |= PIN_MAPPABLE;
139de97bdebSjsg
140de97bdebSjsg wakeref = intel_runtime_pm_get(&i915->runtime_pm);
141de97bdebSjsg atomic_inc(&i915->gpu_error.pending_fb_pin);
142de97bdebSjsg
1431bb76ff1Sjsg for_i915_gem_ww(&ww, err, true) {
1441bb76ff1Sjsg err = i915_gem_object_lock(dpt->obj, &ww);
1451bb76ff1Sjsg if (err)
1461bb76ff1Sjsg continue;
1471bb76ff1Sjsg
1481bb76ff1Sjsg vma = i915_gem_object_ggtt_pin_ww(dpt->obj, &ww, NULL, 0, 4096,
1491bb76ff1Sjsg pin_flags);
1501bb76ff1Sjsg if (IS_ERR(vma)) {
1511bb76ff1Sjsg err = PTR_ERR(vma);
1521bb76ff1Sjsg continue;
1531bb76ff1Sjsg }
154de97bdebSjsg
155de97bdebSjsg iomem = i915_vma_pin_iomap(vma);
156de97bdebSjsg i915_vma_unpin(vma);
1571bb76ff1Sjsg
158de97bdebSjsg if (IS_ERR(iomem)) {
1591bb76ff1Sjsg err = PTR_ERR(iomem);
1601bb76ff1Sjsg continue;
161de97bdebSjsg }
162de97bdebSjsg
163de97bdebSjsg dpt->vma = vma;
164de97bdebSjsg dpt->iomem = iomem;
165de97bdebSjsg
166de97bdebSjsg i915_vma_get(vma);
1671bb76ff1Sjsg }
168de97bdebSjsg
16980ab6b62Sjsg dpt->obj->mm.dirty = true;
17080ab6b62Sjsg
171de97bdebSjsg atomic_dec(&i915->gpu_error.pending_fb_pin);
172de97bdebSjsg intel_runtime_pm_put(&i915->runtime_pm, wakeref);
173de97bdebSjsg
1741bb76ff1Sjsg return err ? ERR_PTR(err) : vma;
175de97bdebSjsg }
176de97bdebSjsg
intel_dpt_unpin(struct i915_address_space * vm)177de97bdebSjsg void intel_dpt_unpin(struct i915_address_space *vm)
178de97bdebSjsg {
179de97bdebSjsg struct i915_dpt *dpt = i915_vm_to_dpt(vm);
180de97bdebSjsg
181de97bdebSjsg i915_vma_unpin_iomap(dpt->vma);
182de97bdebSjsg i915_vma_put(dpt->vma);
183de97bdebSjsg }
184de97bdebSjsg
1851bb76ff1Sjsg /**
1861bb76ff1Sjsg * intel_dpt_resume - restore the memory mapping for all DPT FBs during system resume
1871bb76ff1Sjsg * @i915: device instance
1881bb76ff1Sjsg *
1891bb76ff1Sjsg * Restore the memory mapping during system resume for all framebuffers which
1901bb76ff1Sjsg * are mapped to HW via a GGTT->DPT page table. The content of these page
1911bb76ff1Sjsg * tables are not stored in the hibernation image during S4 and S3RST->S4
1921bb76ff1Sjsg * transitions, so here we reprogram the PTE entries in those tables.
1931bb76ff1Sjsg *
1941bb76ff1Sjsg * This function must be called after the mappings in GGTT have been restored calling
1951bb76ff1Sjsg * i915_ggtt_resume().
1961bb76ff1Sjsg */
intel_dpt_resume(struct drm_i915_private * i915)1971bb76ff1Sjsg void intel_dpt_resume(struct drm_i915_private *i915)
1981bb76ff1Sjsg {
1991bb76ff1Sjsg struct drm_framebuffer *drm_fb;
2001bb76ff1Sjsg
2011bb76ff1Sjsg if (!HAS_DISPLAY(i915))
2021bb76ff1Sjsg return;
2031bb76ff1Sjsg
2041bb76ff1Sjsg mutex_lock(&i915->drm.mode_config.fb_lock);
2051bb76ff1Sjsg drm_for_each_fb(drm_fb, &i915->drm) {
2061bb76ff1Sjsg struct intel_framebuffer *fb = to_intel_framebuffer(drm_fb);
2071bb76ff1Sjsg
2081bb76ff1Sjsg if (fb->dpt_vm)
2091bb76ff1Sjsg i915_ggtt_resume_vm(fb->dpt_vm);
2101bb76ff1Sjsg }
2111bb76ff1Sjsg mutex_unlock(&i915->drm.mode_config.fb_lock);
2121bb76ff1Sjsg }
2131bb76ff1Sjsg
2141bb76ff1Sjsg /**
2151bb76ff1Sjsg * intel_dpt_suspend - suspend the memory mapping for all DPT FBs during system suspend
2161bb76ff1Sjsg * @i915: device instance
2171bb76ff1Sjsg *
2181bb76ff1Sjsg * Suspend the memory mapping during system suspend for all framebuffers which
2191bb76ff1Sjsg * are mapped to HW via a GGTT->DPT page table.
2201bb76ff1Sjsg *
2211bb76ff1Sjsg * This function must be called before the mappings in GGTT are suspended calling
2221bb76ff1Sjsg * i915_ggtt_suspend().
2231bb76ff1Sjsg */
intel_dpt_suspend(struct drm_i915_private * i915)2241bb76ff1Sjsg void intel_dpt_suspend(struct drm_i915_private *i915)
2251bb76ff1Sjsg {
2261bb76ff1Sjsg struct drm_framebuffer *drm_fb;
2271bb76ff1Sjsg
2281bb76ff1Sjsg if (!HAS_DISPLAY(i915))
2291bb76ff1Sjsg return;
2301bb76ff1Sjsg
2311bb76ff1Sjsg mutex_lock(&i915->drm.mode_config.fb_lock);
2321bb76ff1Sjsg
2331bb76ff1Sjsg drm_for_each_fb(drm_fb, &i915->drm) {
2341bb76ff1Sjsg struct intel_framebuffer *fb = to_intel_framebuffer(drm_fb);
2351bb76ff1Sjsg
2361bb76ff1Sjsg if (fb->dpt_vm)
2371bb76ff1Sjsg i915_ggtt_suspend_vm(fb->dpt_vm);
2381bb76ff1Sjsg }
2391bb76ff1Sjsg
2401bb76ff1Sjsg mutex_unlock(&i915->drm.mode_config.fb_lock);
2411bb76ff1Sjsg }
2421bb76ff1Sjsg
243de97bdebSjsg struct i915_address_space *
intel_dpt_create(struct intel_framebuffer * fb)244de97bdebSjsg intel_dpt_create(struct intel_framebuffer *fb)
245de97bdebSjsg {
246de97bdebSjsg struct drm_gem_object *obj = &intel_fb_obj(&fb->base)->base;
247de97bdebSjsg struct drm_i915_private *i915 = to_i915(obj->dev);
248de97bdebSjsg struct drm_i915_gem_object *dpt_obj;
249de97bdebSjsg struct i915_address_space *vm;
250de97bdebSjsg struct i915_dpt *dpt;
251de97bdebSjsg size_t size;
252de97bdebSjsg int ret;
253de97bdebSjsg
254de97bdebSjsg if (intel_fb_needs_pot_stride_remap(fb))
255de97bdebSjsg size = intel_remapped_info_size(&fb->remapped_view.gtt.remapped);
256de97bdebSjsg else
257de97bdebSjsg size = DIV_ROUND_UP_ULL(obj->size, I915_GTT_PAGE_SIZE);
258de97bdebSjsg
259de97bdebSjsg size = round_up(size * sizeof(gen8_pte_t), I915_GTT_PAGE_SIZE);
260de97bdebSjsg
2611bb76ff1Sjsg dpt_obj = i915_gem_object_create_lmem(i915, size, I915_BO_ALLOC_CONTIGUOUS);
2621bb76ff1Sjsg if (IS_ERR(dpt_obj) && i915_ggtt_has_aperture(to_gt(i915)->ggtt))
263de97bdebSjsg dpt_obj = i915_gem_object_create_stolen(i915, size);
2641bb76ff1Sjsg if (IS_ERR(dpt_obj) && !HAS_LMEM(i915)) {
2651bb76ff1Sjsg drm_dbg_kms(&i915->drm, "Allocating dpt from smem\n");
26680ab6b62Sjsg dpt_obj = i915_gem_object_create_shmem(i915, size);
2671bb76ff1Sjsg }
268de97bdebSjsg if (IS_ERR(dpt_obj))
269de97bdebSjsg return ERR_CAST(dpt_obj);
270de97bdebSjsg
2711bb76ff1Sjsg ret = i915_gem_object_lock_interruptible(dpt_obj, NULL);
2721bb76ff1Sjsg if (!ret) {
273de97bdebSjsg ret = i915_gem_object_set_cache_level(dpt_obj, I915_CACHE_NONE);
2741bb76ff1Sjsg i915_gem_object_unlock(dpt_obj);
2751bb76ff1Sjsg }
276de97bdebSjsg if (ret) {
277de97bdebSjsg i915_gem_object_put(dpt_obj);
278de97bdebSjsg return ERR_PTR(ret);
279de97bdebSjsg }
280de97bdebSjsg
281de97bdebSjsg dpt = kzalloc(sizeof(*dpt), GFP_KERNEL);
282de97bdebSjsg if (!dpt) {
283de97bdebSjsg i915_gem_object_put(dpt_obj);
284de97bdebSjsg return ERR_PTR(-ENOMEM);
285de97bdebSjsg }
286de97bdebSjsg
287de97bdebSjsg vm = &dpt->vm;
288de97bdebSjsg
2891bb76ff1Sjsg vm->gt = to_gt(i915);
290de97bdebSjsg vm->i915 = i915;
291de97bdebSjsg vm->dma = i915->drm.dev;
292de97bdebSjsg vm->total = (size / sizeof(gen8_pte_t)) * I915_GTT_PAGE_SIZE;
293de97bdebSjsg vm->is_dpt = true;
294de97bdebSjsg
295de97bdebSjsg i915_address_space_init(vm, VM_CLASS_DPT);
296de97bdebSjsg
297de97bdebSjsg vm->insert_page = dpt_insert_page;
298de97bdebSjsg vm->clear_range = dpt_clear_range;
299de97bdebSjsg vm->insert_entries = dpt_insert_entries;
300de97bdebSjsg vm->cleanup = dpt_cleanup;
301de97bdebSjsg
302de97bdebSjsg vm->vma_ops.bind_vma = dpt_bind_vma;
303de97bdebSjsg vm->vma_ops.unbind_vma = dpt_unbind_vma;
304de97bdebSjsg
305*f005ef32Sjsg vm->pte_encode = vm->gt->ggtt->vm.pte_encode;
306de97bdebSjsg
307de97bdebSjsg dpt->obj = dpt_obj;
308af76a5a8Sjsg dpt->obj->is_dpt = true;
309de97bdebSjsg
310de97bdebSjsg return &dpt->vm;
311de97bdebSjsg }
312de97bdebSjsg
intel_dpt_destroy(struct i915_address_space * vm)313de97bdebSjsg void intel_dpt_destroy(struct i915_address_space *vm)
314de97bdebSjsg {
315de97bdebSjsg struct i915_dpt *dpt = i915_vm_to_dpt(vm);
316de97bdebSjsg
317af76a5a8Sjsg dpt->obj->is_dpt = false;
3181bb76ff1Sjsg i915_vm_put(&dpt->vm);
319de97bdebSjsg }
320*f005ef32Sjsg
intel_dpt_configure(struct intel_crtc * crtc)321*f005ef32Sjsg void intel_dpt_configure(struct intel_crtc *crtc)
322*f005ef32Sjsg {
323*f005ef32Sjsg struct drm_i915_private *i915 = to_i915(crtc->base.dev);
324*f005ef32Sjsg
325*f005ef32Sjsg if (DISPLAY_VER(i915) == 14) {
326*f005ef32Sjsg enum pipe pipe = crtc->pipe;
327*f005ef32Sjsg enum plane_id plane_id;
328*f005ef32Sjsg
329*f005ef32Sjsg for_each_plane_id_on_crtc(crtc, plane_id) {
330*f005ef32Sjsg if (plane_id == PLANE_CURSOR)
331*f005ef32Sjsg continue;
332*f005ef32Sjsg
333*f005ef32Sjsg intel_de_rmw(i915, PLANE_CHICKEN(pipe, plane_id),
334*f005ef32Sjsg PLANE_CHICKEN_DISABLE_DPT,
335*f005ef32Sjsg i915->params.enable_dpt ? 0 : PLANE_CHICKEN_DISABLE_DPT);
336*f005ef32Sjsg }
337*f005ef32Sjsg } else if (DISPLAY_VER(i915) == 13) {
338*f005ef32Sjsg intel_de_rmw(i915, CHICKEN_MISC_2,
339*f005ef32Sjsg CHICKEN_MISC_DISABLE_DPT,
340*f005ef32Sjsg i915->params.enable_dpt ? 0 : CHICKEN_MISC_DISABLE_DPT);
341*f005ef32Sjsg }
342*f005ef32Sjsg }
343