xref: /openbsd-src/sys/dev/pci/drm/amd/amdgpu/gfxhub_v1_0.c (revision 8cf5070fd19e3309d53d732ce99f08f6b3df5e68)
1fb4d8502Sjsg /*
2fb4d8502Sjsg  * Copyright 2016 Advanced Micro Devices, Inc.
3fb4d8502Sjsg  *
4fb4d8502Sjsg  * Permission is hereby granted, free of charge, to any person obtaining a
5fb4d8502Sjsg  * copy of this software and associated documentation files (the "Software"),
6fb4d8502Sjsg  * to deal in the Software without restriction, including without limitation
7fb4d8502Sjsg  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8fb4d8502Sjsg  * and/or sell copies of the Software, and to permit persons to whom the
9fb4d8502Sjsg  * Software is furnished to do so, subject to the following conditions:
10fb4d8502Sjsg  *
11fb4d8502Sjsg  * The above copyright notice and this permission notice shall be included in
12fb4d8502Sjsg  * all copies or substantial portions of the Software.
13fb4d8502Sjsg  *
14fb4d8502Sjsg  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15fb4d8502Sjsg  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16fb4d8502Sjsg  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17fb4d8502Sjsg  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18fb4d8502Sjsg  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19fb4d8502Sjsg  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20fb4d8502Sjsg  * OTHER DEALINGS IN THE SOFTWARE.
21fb4d8502Sjsg  *
22fb4d8502Sjsg  */
23fb4d8502Sjsg #include "amdgpu.h"
24fb4d8502Sjsg #include "gfxhub_v1_0.h"
255ca02815Sjsg #include "gfxhub_v1_1.h"
26fb4d8502Sjsg 
27fb4d8502Sjsg #include "gc/gc_9_0_offset.h"
28fb4d8502Sjsg #include "gc/gc_9_0_sh_mask.h"
29fb4d8502Sjsg #include "gc/gc_9_0_default.h"
30fb4d8502Sjsg #include "vega10_enum.h"
31fb4d8502Sjsg 
32fb4d8502Sjsg #include "soc15_common.h"
33fb4d8502Sjsg 
gfxhub_v1_0_get_mc_fb_offset(struct amdgpu_device * adev)345ca02815Sjsg static u64 gfxhub_v1_0_get_mc_fb_offset(struct amdgpu_device *adev)
35fb4d8502Sjsg {
36fb4d8502Sjsg 	return (u64)RREG32_SOC15(GC, 0, mmMC_VM_FB_OFFSET) << 24;
37fb4d8502Sjsg }
38fb4d8502Sjsg 
gfxhub_v1_0_setup_vm_pt_regs(struct amdgpu_device * adev,uint32_t vmid,uint64_t page_table_base)395ca02815Sjsg static void gfxhub_v1_0_setup_vm_pt_regs(struct amdgpu_device *adev,
405ca02815Sjsg 					 uint32_t vmid,
41c349dbc7Sjsg 					 uint64_t page_table_base)
42fb4d8502Sjsg {
43f005ef32Sjsg 	struct amdgpu_vmhub *hub = &adev->vmhub[AMDGPU_GFXHUB(0)];
44fb4d8502Sjsg 
45c349dbc7Sjsg 	WREG32_SOC15_OFFSET(GC, 0, mmVM_CONTEXT0_PAGE_TABLE_BASE_ADDR_LO32,
46ad8b1aafSjsg 			    hub->ctx_addr_distance * vmid,
47ad8b1aafSjsg 			    lower_32_bits(page_table_base));
48fb4d8502Sjsg 
49c349dbc7Sjsg 	WREG32_SOC15_OFFSET(GC, 0, mmVM_CONTEXT0_PAGE_TABLE_BASE_ADDR_HI32,
50ad8b1aafSjsg 			    hub->ctx_addr_distance * vmid,
51ad8b1aafSjsg 			    upper_32_bits(page_table_base));
52fb4d8502Sjsg }
53fb4d8502Sjsg 
gfxhub_v1_0_init_gart_aperture_regs(struct amdgpu_device * adev)54fb4d8502Sjsg static void gfxhub_v1_0_init_gart_aperture_regs(struct amdgpu_device *adev)
55fb4d8502Sjsg {
565ca02815Sjsg 	uint64_t pt_base;
575ca02815Sjsg 
585ca02815Sjsg 	if (adev->gmc.pdb0_bo)
595ca02815Sjsg 		pt_base = amdgpu_gmc_pd_addr(adev->gmc.pdb0_bo);
605ca02815Sjsg 	else
615ca02815Sjsg 		pt_base = amdgpu_gmc_pd_addr(adev->gart.bo);
62c349dbc7Sjsg 
63c349dbc7Sjsg 	gfxhub_v1_0_setup_vm_pt_regs(adev, 0, pt_base);
64fb4d8502Sjsg 
655ca02815Sjsg 	/* If use GART for FB translation, vmid0 page table covers both
665ca02815Sjsg 	 * vram and system memory (gart)
675ca02815Sjsg 	 */
685ca02815Sjsg 	if (adev->gmc.pdb0_bo) {
695ca02815Sjsg 		WREG32_SOC15(GC, 0, mmVM_CONTEXT0_PAGE_TABLE_START_ADDR_LO32,
705ca02815Sjsg 				(u32)(adev->gmc.fb_start >> 12));
715ca02815Sjsg 		WREG32_SOC15(GC, 0, mmVM_CONTEXT0_PAGE_TABLE_START_ADDR_HI32,
725ca02815Sjsg 				(u32)(adev->gmc.fb_start >> 44));
735ca02815Sjsg 
745ca02815Sjsg 		WREG32_SOC15(GC, 0, mmVM_CONTEXT0_PAGE_TABLE_END_ADDR_LO32,
755ca02815Sjsg 				(u32)(adev->gmc.gart_end >> 12));
765ca02815Sjsg 		WREG32_SOC15(GC, 0, mmVM_CONTEXT0_PAGE_TABLE_END_ADDR_HI32,
775ca02815Sjsg 				(u32)(adev->gmc.gart_end >> 44));
785ca02815Sjsg 	} else {
79fb4d8502Sjsg 		WREG32_SOC15(GC, 0, mmVM_CONTEXT0_PAGE_TABLE_START_ADDR_LO32,
80fb4d8502Sjsg 				(u32)(adev->gmc.gart_start >> 12));
81fb4d8502Sjsg 		WREG32_SOC15(GC, 0, mmVM_CONTEXT0_PAGE_TABLE_START_ADDR_HI32,
82fb4d8502Sjsg 				(u32)(adev->gmc.gart_start >> 44));
83fb4d8502Sjsg 
84fb4d8502Sjsg 		WREG32_SOC15(GC, 0, mmVM_CONTEXT0_PAGE_TABLE_END_ADDR_LO32,
85fb4d8502Sjsg 				(u32)(adev->gmc.gart_end >> 12));
86fb4d8502Sjsg 		WREG32_SOC15(GC, 0, mmVM_CONTEXT0_PAGE_TABLE_END_ADDR_HI32,
87fb4d8502Sjsg 				(u32)(adev->gmc.gart_end >> 44));
88fb4d8502Sjsg 	}
895ca02815Sjsg }
90fb4d8502Sjsg 
gfxhub_v1_0_init_system_aperture_regs(struct amdgpu_device * adev)91fb4d8502Sjsg static void gfxhub_v1_0_init_system_aperture_regs(struct amdgpu_device *adev)
92fb4d8502Sjsg {
93fb4d8502Sjsg 	uint64_t value;
94fb4d8502Sjsg 
95c349dbc7Sjsg 	/* Program the AGP BAR */
96c349dbc7Sjsg 	WREG32_SOC15_RLC(GC, 0, mmMC_VM_AGP_BASE, 0);
97c349dbc7Sjsg 	WREG32_SOC15_RLC(GC, 0, mmMC_VM_AGP_BOT, adev->gmc.agp_start >> 24);
98c349dbc7Sjsg 	WREG32_SOC15_RLC(GC, 0, mmMC_VM_AGP_TOP, adev->gmc.agp_end >> 24);
99fb4d8502Sjsg 
100c349dbc7Sjsg 	if (!amdgpu_sriov_vf(adev) || adev->asic_type <= CHIP_VEGA10) {
101fb4d8502Sjsg 		/* Program the system aperture low logical page number. */
102c349dbc7Sjsg 		WREG32_SOC15_RLC(GC, 0, mmMC_VM_SYSTEM_APERTURE_LOW_ADDR,
103c349dbc7Sjsg 			min(adev->gmc.fb_start, adev->gmc.agp_start) >> 18);
104c349dbc7Sjsg 
105*8cf5070fSjsg 		if (adev->apu_flags & (AMD_APU_IS_RAVEN2 |
106*8cf5070fSjsg 				       AMD_APU_IS_RENOIR |
107*8cf5070fSjsg 				       AMD_APU_IS_GREEN_SARDINE))
108c349dbc7Sjsg 		       /*
109c349dbc7Sjsg 			* Raven2 has a HW issue that it is unable to use the
110c349dbc7Sjsg 			* vram which is out of MC_VM_SYSTEM_APERTURE_HIGH_ADDR.
111c349dbc7Sjsg 			* So here is the workaround that increase system
112c349dbc7Sjsg 			* aperture high address (add 1) to get rid of the VM
113c349dbc7Sjsg 			* fault and hardware hang.
114c349dbc7Sjsg 			*/
115c349dbc7Sjsg 			WREG32_SOC15_RLC(GC, 0,
116c349dbc7Sjsg 					 mmMC_VM_SYSTEM_APERTURE_HIGH_ADDR,
117c349dbc7Sjsg 					 max((adev->gmc.fb_end >> 18) + 0x1,
118c349dbc7Sjsg 					     adev->gmc.agp_end >> 18));
119c349dbc7Sjsg 		else
120c349dbc7Sjsg 			WREG32_SOC15_RLC(
121c349dbc7Sjsg 				GC, 0, mmMC_VM_SYSTEM_APERTURE_HIGH_ADDR,
122c349dbc7Sjsg 				max(adev->gmc.fb_end, adev->gmc.agp_end) >> 18);
123fb4d8502Sjsg 
124fb4d8502Sjsg 		/* Set default page address. */
125f005ef32Sjsg 		value = amdgpu_gmc_vram_mc2pa(adev, adev->mem_scratch.gpu_addr);
126fb4d8502Sjsg 		WREG32_SOC15(GC, 0, mmMC_VM_SYSTEM_APERTURE_DEFAULT_ADDR_LSB,
127fb4d8502Sjsg 			     (u32)(value >> 12));
128fb4d8502Sjsg 		WREG32_SOC15(GC, 0, mmMC_VM_SYSTEM_APERTURE_DEFAULT_ADDR_MSB,
129fb4d8502Sjsg 			     (u32)(value >> 44));
130fb4d8502Sjsg 
131fb4d8502Sjsg 		/* Program "protection fault". */
132fb4d8502Sjsg 		WREG32_SOC15(GC, 0, mmVM_L2_PROTECTION_FAULT_DEFAULT_ADDR_LO32,
133fb4d8502Sjsg 			     (u32)(adev->dummy_page_addr >> 12));
134fb4d8502Sjsg 		WREG32_SOC15(GC, 0, mmVM_L2_PROTECTION_FAULT_DEFAULT_ADDR_HI32,
135fb4d8502Sjsg 			     (u32)((u64)adev->dummy_page_addr >> 44));
136fb4d8502Sjsg 
137fb4d8502Sjsg 		WREG32_FIELD15(GC, 0, VM_L2_PROTECTION_FAULT_CNTL2,
138fb4d8502Sjsg 			       ACTIVE_PAGE_MIGRATION_PTE_READ_RETRY, 1);
139fb4d8502Sjsg 	}
1405ca02815Sjsg 
1415ca02815Sjsg 	/* In the case squeezing vram into GART aperture, we don't use
1425ca02815Sjsg 	 * FB aperture and AGP aperture. Disable them.
1435ca02815Sjsg 	 */
1445ca02815Sjsg 	if (adev->gmc.pdb0_bo) {
1455ca02815Sjsg 		WREG32_SOC15(GC, 0, mmMC_VM_FB_LOCATION_TOP, 0);
1465ca02815Sjsg 		WREG32_SOC15(GC, 0, mmMC_VM_FB_LOCATION_BASE, 0x00FFFFFF);
1475ca02815Sjsg 		WREG32_SOC15(GC, 0, mmMC_VM_AGP_TOP, 0);
1485ca02815Sjsg 		WREG32_SOC15(GC, 0, mmMC_VM_AGP_BOT, 0xFFFFFF);
1495ca02815Sjsg 		WREG32_SOC15(GC, 0, mmMC_VM_SYSTEM_APERTURE_LOW_ADDR, 0x3FFFFFFF);
1505ca02815Sjsg 		WREG32_SOC15(GC, 0, mmMC_VM_SYSTEM_APERTURE_HIGH_ADDR, 0);
1515ca02815Sjsg 	}
152c349dbc7Sjsg }
153fb4d8502Sjsg 
gfxhub_v1_0_init_tlb_regs(struct amdgpu_device * adev)154fb4d8502Sjsg static void gfxhub_v1_0_init_tlb_regs(struct amdgpu_device *adev)
155fb4d8502Sjsg {
156fb4d8502Sjsg 	uint32_t tmp;
157fb4d8502Sjsg 
158fb4d8502Sjsg 	/* Setup TLB control */
159fb4d8502Sjsg 	tmp = RREG32_SOC15(GC, 0, mmMC_VM_MX_L1_TLB_CNTL);
160fb4d8502Sjsg 
161fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, MC_VM_MX_L1_TLB_CNTL, ENABLE_L1_TLB, 1);
162fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, MC_VM_MX_L1_TLB_CNTL, SYSTEM_ACCESS_MODE, 3);
163fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, MC_VM_MX_L1_TLB_CNTL,
164fb4d8502Sjsg 			    ENABLE_ADVANCED_DRIVER_MODEL, 1);
165fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, MC_VM_MX_L1_TLB_CNTL,
166fb4d8502Sjsg 			    SYSTEM_APERTURE_UNMAPPED_ACCESS, 0);
167fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, MC_VM_MX_L1_TLB_CNTL,
168fb4d8502Sjsg 			    MTYPE, MTYPE_UC);/* XXX for emulation. */
169fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, MC_VM_MX_L1_TLB_CNTL, ATC_EN, 1);
170fb4d8502Sjsg 
171c349dbc7Sjsg 	WREG32_SOC15_RLC(GC, 0, mmMC_VM_MX_L1_TLB_CNTL, tmp);
172fb4d8502Sjsg }
173fb4d8502Sjsg 
gfxhub_v1_0_init_cache_regs(struct amdgpu_device * adev)174fb4d8502Sjsg static void gfxhub_v1_0_init_cache_regs(struct amdgpu_device *adev)
175fb4d8502Sjsg {
176fb4d8502Sjsg 	uint32_t tmp;
177fb4d8502Sjsg 
178fb4d8502Sjsg 	/* Setup L2 cache */
179fb4d8502Sjsg 	tmp = RREG32_SOC15(GC, 0, mmVM_L2_CNTL);
180fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, VM_L2_CNTL, ENABLE_L2_CACHE, 1);
181fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, VM_L2_CNTL, ENABLE_L2_FRAGMENT_PROCESSING, 1);
182fb4d8502Sjsg 	/* XXX for emulation, Refer to closed source code.*/
183fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, VM_L2_CNTL, L2_PDE0_CACHE_TAG_GENERATION_MODE,
184fb4d8502Sjsg 			    0);
185c349dbc7Sjsg 	tmp = REG_SET_FIELD(tmp, VM_L2_CNTL, PDE_FAULT_CLASSIFICATION, 0);
186fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, VM_L2_CNTL, CONTEXT1_IDENTITY_ACCESS_MODE, 1);
187fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, VM_L2_CNTL, IDENTITY_MODE_FRAGMENT_SIZE, 0);
188c349dbc7Sjsg 	WREG32_SOC15_RLC(GC, 0, mmVM_L2_CNTL, tmp);
189fb4d8502Sjsg 
190fb4d8502Sjsg 	tmp = RREG32_SOC15(GC, 0, mmVM_L2_CNTL2);
191fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, VM_L2_CNTL2, INVALIDATE_ALL_L1_TLBS, 1);
192fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, VM_L2_CNTL2, INVALIDATE_L2_CACHE, 1);
193c349dbc7Sjsg 	WREG32_SOC15_RLC(GC, 0, mmVM_L2_CNTL2, tmp);
194fb4d8502Sjsg 
195fb4d8502Sjsg 	tmp = mmVM_L2_CNTL3_DEFAULT;
196fb4d8502Sjsg 	if (adev->gmc.translate_further) {
197fb4d8502Sjsg 		tmp = REG_SET_FIELD(tmp, VM_L2_CNTL3, BANK_SELECT, 12);
198fb4d8502Sjsg 		tmp = REG_SET_FIELD(tmp, VM_L2_CNTL3,
199fb4d8502Sjsg 				    L2_CACHE_BIGK_FRAGMENT_SIZE, 9);
200fb4d8502Sjsg 	} else {
201fb4d8502Sjsg 		tmp = REG_SET_FIELD(tmp, VM_L2_CNTL3, BANK_SELECT, 9);
202fb4d8502Sjsg 		tmp = REG_SET_FIELD(tmp, VM_L2_CNTL3,
203fb4d8502Sjsg 				    L2_CACHE_BIGK_FRAGMENT_SIZE, 6);
204fb4d8502Sjsg 	}
205c349dbc7Sjsg 	WREG32_SOC15_RLC(GC, 0, mmVM_L2_CNTL3, tmp);
206fb4d8502Sjsg 
207fb4d8502Sjsg 	tmp = mmVM_L2_CNTL4_DEFAULT;
2085ca02815Sjsg 	if (adev->gmc.xgmi.connected_to_cpu) {
2095ca02815Sjsg 		tmp = REG_SET_FIELD(tmp, VM_L2_CNTL4, VMC_TAP_PDE_REQUEST_PHYSICAL, 1);
2105ca02815Sjsg 		tmp = REG_SET_FIELD(tmp, VM_L2_CNTL4, VMC_TAP_PTE_REQUEST_PHYSICAL, 1);
2115ca02815Sjsg 	} else {
212fb4d8502Sjsg 		tmp = REG_SET_FIELD(tmp, VM_L2_CNTL4, VMC_TAP_PDE_REQUEST_PHYSICAL, 0);
213fb4d8502Sjsg 		tmp = REG_SET_FIELD(tmp, VM_L2_CNTL4, VMC_TAP_PTE_REQUEST_PHYSICAL, 0);
2145ca02815Sjsg 	}
215c349dbc7Sjsg 	WREG32_SOC15_RLC(GC, 0, mmVM_L2_CNTL4, tmp);
216fb4d8502Sjsg }
217fb4d8502Sjsg 
gfxhub_v1_0_enable_system_domain(struct amdgpu_device * adev)218fb4d8502Sjsg static void gfxhub_v1_0_enable_system_domain(struct amdgpu_device *adev)
219fb4d8502Sjsg {
220fb4d8502Sjsg 	uint32_t tmp;
221fb4d8502Sjsg 
222fb4d8502Sjsg 	tmp = RREG32_SOC15(GC, 0, mmVM_CONTEXT0_CNTL);
223fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, VM_CONTEXT0_CNTL, ENABLE_CONTEXT, 1);
2245ca02815Sjsg 	tmp = REG_SET_FIELD(tmp, VM_CONTEXT0_CNTL, PAGE_TABLE_DEPTH,
2255ca02815Sjsg 			adev->gmc.vmid0_page_table_depth);
2265ca02815Sjsg 	tmp = REG_SET_FIELD(tmp, VM_CONTEXT0_CNTL, PAGE_TABLE_BLOCK_SIZE,
2275ca02815Sjsg 			adev->gmc.vmid0_page_table_block_size);
228c349dbc7Sjsg 	tmp = REG_SET_FIELD(tmp, VM_CONTEXT0_CNTL,
229c349dbc7Sjsg 			    RETRY_PERMISSION_OR_INVALID_PAGE_FAULT, 0);
230fb4d8502Sjsg 	WREG32_SOC15(GC, 0, mmVM_CONTEXT0_CNTL, tmp);
231fb4d8502Sjsg }
232fb4d8502Sjsg 
gfxhub_v1_0_disable_identity_aperture(struct amdgpu_device * adev)233fb4d8502Sjsg static void gfxhub_v1_0_disable_identity_aperture(struct amdgpu_device *adev)
234fb4d8502Sjsg {
235fb4d8502Sjsg 	WREG32_SOC15(GC, 0, mmVM_L2_CONTEXT1_IDENTITY_APERTURE_LOW_ADDR_LO32,
236fb4d8502Sjsg 		     0XFFFFFFFF);
237fb4d8502Sjsg 	WREG32_SOC15(GC, 0, mmVM_L2_CONTEXT1_IDENTITY_APERTURE_LOW_ADDR_HI32,
238fb4d8502Sjsg 		     0x0000000F);
239fb4d8502Sjsg 
240fb4d8502Sjsg 	WREG32_SOC15(GC, 0, mmVM_L2_CONTEXT1_IDENTITY_APERTURE_HIGH_ADDR_LO32,
241fb4d8502Sjsg 		     0);
242fb4d8502Sjsg 	WREG32_SOC15(GC, 0, mmVM_L2_CONTEXT1_IDENTITY_APERTURE_HIGH_ADDR_HI32,
243fb4d8502Sjsg 		     0);
244fb4d8502Sjsg 
245fb4d8502Sjsg 	WREG32_SOC15(GC, 0, mmVM_L2_CONTEXT_IDENTITY_PHYSICAL_OFFSET_LO32, 0);
246fb4d8502Sjsg 	WREG32_SOC15(GC, 0, mmVM_L2_CONTEXT_IDENTITY_PHYSICAL_OFFSET_HI32, 0);
247fb4d8502Sjsg 
248fb4d8502Sjsg }
249fb4d8502Sjsg 
gfxhub_v1_0_setup_vmid_config(struct amdgpu_device * adev)250fb4d8502Sjsg static void gfxhub_v1_0_setup_vmid_config(struct amdgpu_device *adev)
251fb4d8502Sjsg {
252f005ef32Sjsg 	struct amdgpu_vmhub *hub = &adev->vmhub[AMDGPU_GFXHUB(0)];
253f005ef32Sjsg 	unsigned int num_level, block_size;
254fb4d8502Sjsg 	uint32_t tmp;
255fb4d8502Sjsg 	int i;
256fb4d8502Sjsg 
257fb4d8502Sjsg 	num_level = adev->vm_manager.num_level;
258fb4d8502Sjsg 	block_size = adev->vm_manager.block_size;
259fb4d8502Sjsg 	if (adev->gmc.translate_further)
260fb4d8502Sjsg 		num_level -= 1;
261fb4d8502Sjsg 	else
262fb4d8502Sjsg 		block_size -= 9;
263fb4d8502Sjsg 
264fb4d8502Sjsg 	for (i = 0; i <= 14; i++) {
265fb4d8502Sjsg 		tmp = RREG32_SOC15_OFFSET(GC, 0, mmVM_CONTEXT1_CNTL, i);
266fb4d8502Sjsg 		tmp = REG_SET_FIELD(tmp, VM_CONTEXT1_CNTL, ENABLE_CONTEXT, 1);
267fb4d8502Sjsg 		tmp = REG_SET_FIELD(tmp, VM_CONTEXT1_CNTL, PAGE_TABLE_DEPTH,
268fb4d8502Sjsg 				    num_level);
269fb4d8502Sjsg 		tmp = REG_SET_FIELD(tmp, VM_CONTEXT1_CNTL,
270fb4d8502Sjsg 				    RANGE_PROTECTION_FAULT_ENABLE_DEFAULT, 1);
271fb4d8502Sjsg 		tmp = REG_SET_FIELD(tmp, VM_CONTEXT1_CNTL,
272fb4d8502Sjsg 				    DUMMY_PAGE_PROTECTION_FAULT_ENABLE_DEFAULT,
273fb4d8502Sjsg 				    1);
274fb4d8502Sjsg 		tmp = REG_SET_FIELD(tmp, VM_CONTEXT1_CNTL,
275fb4d8502Sjsg 				    PDE0_PROTECTION_FAULT_ENABLE_DEFAULT, 1);
276fb4d8502Sjsg 		tmp = REG_SET_FIELD(tmp, VM_CONTEXT1_CNTL,
277fb4d8502Sjsg 				    VALID_PROTECTION_FAULT_ENABLE_DEFAULT, 1);
278fb4d8502Sjsg 		tmp = REG_SET_FIELD(tmp, VM_CONTEXT1_CNTL,
279fb4d8502Sjsg 				    READ_PROTECTION_FAULT_ENABLE_DEFAULT, 1);
280fb4d8502Sjsg 		tmp = REG_SET_FIELD(tmp, VM_CONTEXT1_CNTL,
281fb4d8502Sjsg 				    WRITE_PROTECTION_FAULT_ENABLE_DEFAULT, 1);
282fb4d8502Sjsg 		tmp = REG_SET_FIELD(tmp, VM_CONTEXT1_CNTL,
283fb4d8502Sjsg 				    EXECUTE_PROTECTION_FAULT_ENABLE_DEFAULT, 1);
284fb4d8502Sjsg 		tmp = REG_SET_FIELD(tmp, VM_CONTEXT1_CNTL,
285fb4d8502Sjsg 				    PAGE_TABLE_BLOCK_SIZE,
286fb4d8502Sjsg 				    block_size);
2875ca02815Sjsg 		/* Send no-retry XNACK on fault to suppress VM fault storm.
2885ca02815Sjsg 		 * On Aldebaran, XNACK can be enabled in the SQ per-process.
2895ca02815Sjsg 		 * Retry faults need to be enabled for that to work.
2905ca02815Sjsg 		 */
291fb4d8502Sjsg 		tmp = REG_SET_FIELD(tmp, VM_CONTEXT1_CNTL,
292c349dbc7Sjsg 				    RETRY_PERMISSION_OR_INVALID_PAGE_FAULT,
2935ca02815Sjsg 				    !adev->gmc.noretry ||
2945ca02815Sjsg 				    adev->asic_type == CHIP_ALDEBARAN);
295ad8b1aafSjsg 		WREG32_SOC15_OFFSET(GC, 0, mmVM_CONTEXT1_CNTL,
296ad8b1aafSjsg 				    i * hub->ctx_distance, tmp);
297ad8b1aafSjsg 		WREG32_SOC15_OFFSET(GC, 0, mmVM_CONTEXT1_PAGE_TABLE_START_ADDR_LO32,
298ad8b1aafSjsg 				    i * hub->ctx_addr_distance, 0);
299ad8b1aafSjsg 		WREG32_SOC15_OFFSET(GC, 0, mmVM_CONTEXT1_PAGE_TABLE_START_ADDR_HI32,
300ad8b1aafSjsg 				    i * hub->ctx_addr_distance, 0);
301ad8b1aafSjsg 		WREG32_SOC15_OFFSET(GC, 0, mmVM_CONTEXT1_PAGE_TABLE_END_ADDR_LO32,
302ad8b1aafSjsg 				    i * hub->ctx_addr_distance,
303fb4d8502Sjsg 				    lower_32_bits(adev->vm_manager.max_pfn - 1));
304ad8b1aafSjsg 		WREG32_SOC15_OFFSET(GC, 0, mmVM_CONTEXT1_PAGE_TABLE_END_ADDR_HI32,
305ad8b1aafSjsg 				    i * hub->ctx_addr_distance,
306fb4d8502Sjsg 				    upper_32_bits(adev->vm_manager.max_pfn - 1));
307fb4d8502Sjsg 	}
308fb4d8502Sjsg }
309fb4d8502Sjsg 
gfxhub_v1_0_program_invalidation(struct amdgpu_device * adev)310fb4d8502Sjsg static void gfxhub_v1_0_program_invalidation(struct amdgpu_device *adev)
311fb4d8502Sjsg {
312f005ef32Sjsg 	struct amdgpu_vmhub *hub = &adev->vmhub[AMDGPU_GFXHUB(0)];
313f005ef32Sjsg 	unsigned int i;
314fb4d8502Sjsg 
315fb4d8502Sjsg 	for (i = 0 ; i < 18; ++i) {
316fb4d8502Sjsg 		WREG32_SOC15_OFFSET(GC, 0, mmVM_INVALIDATE_ENG0_ADDR_RANGE_LO32,
317ad8b1aafSjsg 				    i * hub->eng_addr_distance, 0xffffffff);
318fb4d8502Sjsg 		WREG32_SOC15_OFFSET(GC, 0, mmVM_INVALIDATE_ENG0_ADDR_RANGE_HI32,
319ad8b1aafSjsg 				    i * hub->eng_addr_distance, 0x1f);
320fb4d8502Sjsg 	}
321fb4d8502Sjsg }
322fb4d8502Sjsg 
gfxhub_v1_0_gart_enable(struct amdgpu_device * adev)3235ca02815Sjsg static int gfxhub_v1_0_gart_enable(struct amdgpu_device *adev)
324fb4d8502Sjsg {
325fb4d8502Sjsg 	/* GART Enable. */
326fb4d8502Sjsg 	gfxhub_v1_0_init_gart_aperture_regs(adev);
327fb4d8502Sjsg 	gfxhub_v1_0_init_system_aperture_regs(adev);
328fb4d8502Sjsg 	gfxhub_v1_0_init_tlb_regs(adev);
329c349dbc7Sjsg 	if (!amdgpu_sriov_vf(adev))
330fb4d8502Sjsg 		gfxhub_v1_0_init_cache_regs(adev);
331fb4d8502Sjsg 
332fb4d8502Sjsg 	gfxhub_v1_0_enable_system_domain(adev);
333c349dbc7Sjsg 	if (!amdgpu_sriov_vf(adev))
334fb4d8502Sjsg 		gfxhub_v1_0_disable_identity_aperture(adev);
335fb4d8502Sjsg 	gfxhub_v1_0_setup_vmid_config(adev);
336fb4d8502Sjsg 	gfxhub_v1_0_program_invalidation(adev);
337fb4d8502Sjsg 
338fb4d8502Sjsg 	return 0;
339fb4d8502Sjsg }
340fb4d8502Sjsg 
gfxhub_v1_0_gart_disable(struct amdgpu_device * adev)3415ca02815Sjsg static void gfxhub_v1_0_gart_disable(struct amdgpu_device *adev)
342fb4d8502Sjsg {
343f005ef32Sjsg 	struct amdgpu_vmhub *hub = &adev->vmhub[AMDGPU_GFXHUB(0)];
344fb4d8502Sjsg 	u32 tmp;
345fb4d8502Sjsg 	u32 i;
346fb4d8502Sjsg 
347fb4d8502Sjsg 	/* Disable all tables */
348fb4d8502Sjsg 	for (i = 0; i < 16; i++)
349ad8b1aafSjsg 		WREG32_SOC15_OFFSET(GC, 0, mmVM_CONTEXT0_CNTL,
350ad8b1aafSjsg 				    i * hub->ctx_distance, 0);
351fb4d8502Sjsg 
3521bb76ff1Sjsg 	if (amdgpu_sriov_vf(adev))
3531bb76ff1Sjsg 		/* Avoid write to GMC registers */
3541bb76ff1Sjsg 		return;
3551bb76ff1Sjsg 
356fb4d8502Sjsg 	/* Setup TLB control */
357fb4d8502Sjsg 	tmp = RREG32_SOC15(GC, 0, mmMC_VM_MX_L1_TLB_CNTL);
358fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, MC_VM_MX_L1_TLB_CNTL, ENABLE_L1_TLB, 0);
359fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp,
360fb4d8502Sjsg 				MC_VM_MX_L1_TLB_CNTL,
361fb4d8502Sjsg 				ENABLE_ADVANCED_DRIVER_MODEL,
362fb4d8502Sjsg 				0);
363c349dbc7Sjsg 	WREG32_SOC15_RLC(GC, 0, mmMC_VM_MX_L1_TLB_CNTL, tmp);
364fb4d8502Sjsg 
365fb4d8502Sjsg 	/* Setup L2 cache */
366fb4d8502Sjsg 	WREG32_FIELD15(GC, 0, VM_L2_CNTL, ENABLE_L2_CACHE, 0);
367fb4d8502Sjsg 	WREG32_SOC15(GC, 0, mmVM_L2_CNTL3, 0);
368fb4d8502Sjsg }
369fb4d8502Sjsg 
370fb4d8502Sjsg /**
371fb4d8502Sjsg  * gfxhub_v1_0_set_fault_enable_default - update GART/VM fault handling
372fb4d8502Sjsg  *
373fb4d8502Sjsg  * @adev: amdgpu_device pointer
374fb4d8502Sjsg  * @value: true redirects VM faults to the default page
375fb4d8502Sjsg  */
gfxhub_v1_0_set_fault_enable_default(struct amdgpu_device * adev,bool value)3765ca02815Sjsg static void gfxhub_v1_0_set_fault_enable_default(struct amdgpu_device *adev,
377fb4d8502Sjsg 						 bool value)
378fb4d8502Sjsg {
379fb4d8502Sjsg 	u32 tmp;
380f005ef32Sjsg 
381fb4d8502Sjsg 	tmp = RREG32_SOC15(GC, 0, mmVM_L2_PROTECTION_FAULT_CNTL);
382fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, VM_L2_PROTECTION_FAULT_CNTL,
383fb4d8502Sjsg 			RANGE_PROTECTION_FAULT_ENABLE_DEFAULT, value);
384fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, VM_L2_PROTECTION_FAULT_CNTL,
385fb4d8502Sjsg 			PDE0_PROTECTION_FAULT_ENABLE_DEFAULT, value);
386fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, VM_L2_PROTECTION_FAULT_CNTL,
387fb4d8502Sjsg 			PDE1_PROTECTION_FAULT_ENABLE_DEFAULT, value);
388fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, VM_L2_PROTECTION_FAULT_CNTL,
389fb4d8502Sjsg 			PDE2_PROTECTION_FAULT_ENABLE_DEFAULT, value);
390fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp,
391fb4d8502Sjsg 			VM_L2_PROTECTION_FAULT_CNTL,
392fb4d8502Sjsg 			TRANSLATE_FURTHER_PROTECTION_FAULT_ENABLE_DEFAULT,
393fb4d8502Sjsg 			value);
394fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, VM_L2_PROTECTION_FAULT_CNTL,
395fb4d8502Sjsg 			NACK_PROTECTION_FAULT_ENABLE_DEFAULT, value);
396fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, VM_L2_PROTECTION_FAULT_CNTL,
397fb4d8502Sjsg 			DUMMY_PAGE_PROTECTION_FAULT_ENABLE_DEFAULT, value);
398fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, VM_L2_PROTECTION_FAULT_CNTL,
399fb4d8502Sjsg 			VALID_PROTECTION_FAULT_ENABLE_DEFAULT, value);
400fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, VM_L2_PROTECTION_FAULT_CNTL,
401fb4d8502Sjsg 			READ_PROTECTION_FAULT_ENABLE_DEFAULT, value);
402fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, VM_L2_PROTECTION_FAULT_CNTL,
403fb4d8502Sjsg 			WRITE_PROTECTION_FAULT_ENABLE_DEFAULT, value);
404fb4d8502Sjsg 	tmp = REG_SET_FIELD(tmp, VM_L2_PROTECTION_FAULT_CNTL,
405fb4d8502Sjsg 			EXECUTE_PROTECTION_FAULT_ENABLE_DEFAULT, value);
406fb4d8502Sjsg 	if (!value) {
407fb4d8502Sjsg 		tmp = REG_SET_FIELD(tmp, VM_L2_PROTECTION_FAULT_CNTL,
408fb4d8502Sjsg 				CRASH_ON_NO_RETRY_FAULT, 1);
409fb4d8502Sjsg 		tmp = REG_SET_FIELD(tmp, VM_L2_PROTECTION_FAULT_CNTL,
410fb4d8502Sjsg 				CRASH_ON_RETRY_FAULT, 1);
411fb4d8502Sjsg 	}
412fb4d8502Sjsg 	WREG32_SOC15(GC, 0, mmVM_L2_PROTECTION_FAULT_CNTL, tmp);
413fb4d8502Sjsg }
414fb4d8502Sjsg 
gfxhub_v1_0_init(struct amdgpu_device * adev)4155ca02815Sjsg static void gfxhub_v1_0_init(struct amdgpu_device *adev)
416fb4d8502Sjsg {
417f005ef32Sjsg 	struct amdgpu_vmhub *hub = &adev->vmhub[AMDGPU_GFXHUB(0)];
418fb4d8502Sjsg 
419fb4d8502Sjsg 	hub->ctx0_ptb_addr_lo32 =
420fb4d8502Sjsg 		SOC15_REG_OFFSET(GC, 0,
421fb4d8502Sjsg 				 mmVM_CONTEXT0_PAGE_TABLE_BASE_ADDR_LO32);
422fb4d8502Sjsg 	hub->ctx0_ptb_addr_hi32 =
423fb4d8502Sjsg 		SOC15_REG_OFFSET(GC, 0,
424fb4d8502Sjsg 				 mmVM_CONTEXT0_PAGE_TABLE_BASE_ADDR_HI32);
425c349dbc7Sjsg 	hub->vm_inv_eng0_sem =
426c349dbc7Sjsg 		SOC15_REG_OFFSET(GC, 0, mmVM_INVALIDATE_ENG0_SEM);
427fb4d8502Sjsg 	hub->vm_inv_eng0_req =
428fb4d8502Sjsg 		SOC15_REG_OFFSET(GC, 0, mmVM_INVALIDATE_ENG0_REQ);
429fb4d8502Sjsg 	hub->vm_inv_eng0_ack =
430fb4d8502Sjsg 		SOC15_REG_OFFSET(GC, 0, mmVM_INVALIDATE_ENG0_ACK);
431fb4d8502Sjsg 	hub->vm_context0_cntl =
432fb4d8502Sjsg 		SOC15_REG_OFFSET(GC, 0, mmVM_CONTEXT0_CNTL);
433fb4d8502Sjsg 	hub->vm_l2_pro_fault_status =
434fb4d8502Sjsg 		SOC15_REG_OFFSET(GC, 0, mmVM_L2_PROTECTION_FAULT_STATUS);
435fb4d8502Sjsg 	hub->vm_l2_pro_fault_cntl =
436fb4d8502Sjsg 		SOC15_REG_OFFSET(GC, 0, mmVM_L2_PROTECTION_FAULT_CNTL);
437ad8b1aafSjsg 
438ad8b1aafSjsg 	hub->ctx_distance = mmVM_CONTEXT1_CNTL - mmVM_CONTEXT0_CNTL;
439ad8b1aafSjsg 	hub->ctx_addr_distance = mmVM_CONTEXT1_PAGE_TABLE_BASE_ADDR_LO32 -
440ad8b1aafSjsg 		mmVM_CONTEXT0_PAGE_TABLE_BASE_ADDR_LO32;
441ad8b1aafSjsg 	hub->eng_distance = mmVM_INVALIDATE_ENG1_REQ - mmVM_INVALIDATE_ENG0_REQ;
442ad8b1aafSjsg 	hub->eng_addr_distance = mmVM_INVALIDATE_ENG1_ADDR_RANGE_LO32 -
443ad8b1aafSjsg 		mmVM_INVALIDATE_ENG0_ADDR_RANGE_LO32;
444fb4d8502Sjsg }
445ad8b1aafSjsg 
446ad8b1aafSjsg 
447ad8b1aafSjsg const struct amdgpu_gfxhub_funcs gfxhub_v1_0_funcs = {
448ad8b1aafSjsg 	.get_mc_fb_offset = gfxhub_v1_0_get_mc_fb_offset,
449ad8b1aafSjsg 	.setup_vm_pt_regs = gfxhub_v1_0_setup_vm_pt_regs,
450ad8b1aafSjsg 	.gart_enable = gfxhub_v1_0_gart_enable,
451ad8b1aafSjsg 	.gart_disable = gfxhub_v1_0_gart_disable,
452ad8b1aafSjsg 	.set_fault_enable_default = gfxhub_v1_0_set_fault_enable_default,
453ad8b1aafSjsg 	.init = gfxhub_v1_0_init,
4545ca02815Sjsg 	.get_xgmi_info = gfxhub_v1_1_get_xgmi_info,
455ad8b1aafSjsg };
456