1 /* 2 * Copyright 2025 Advanced Micro Devices, Inc. 3 * 4 * Permission is hereby granted, free of charge, to any person obtaining a 5 * copy of this software and associated documentation files (the "Software"), 6 * to deal in the Software without restriction, including without limitation 7 * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8 * and/or sell copies of the Software, and to permit persons to whom the 9 * Software is furnished to do so, subject to the following conditions: 10 * 11 * The above copyright notice and this permission notice shall be included in 12 * all copies or substantial portions of the Software. 13 * 14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR 18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 20 * OTHER DEALINGS IN THE SOFTWARE. 21 * 22 */ 23 #include "amdgpu.h" 24 #include "amdgpu_xcp.h" 25 #include "gfxhub_v12_1.h" 26 27 #include "gc/gc_12_1_0_offset.h" 28 #include "gc/gc_12_1_0_sh_mask.h" 29 #include "soc_v1_0_enum.h" 30 31 #include "soc15_common.h" 32 33 #define regGCVM_L2_CNTL3_DEFAULT 0x80120007 34 #define regGCVM_L2_CNTL4_DEFAULT 0x000000c1 35 #define regGCVM_L2_CNTL5_DEFAULT 0x00003fe0 36 #define regGRBM_GFX_INDEX_DEFAULT 0xe0000000 37 38 39 static u64 gfxhub_v12_1_get_fb_location(struct amdgpu_device *adev) 40 { 41 u64 base; 42 43 base = RREG32_SOC15(GC, GET_INST(GC, 0), 44 regGCMC_VM_FB_LOCATION_BASE_LO32); 45 base &= GCMC_VM_FB_LOCATION_BASE_LO32__FB_BASE_LO32_MASK; 46 base <<= 24; 47 48 base |= ((u64)(GCMC_VM_FB_LOCATION_BASE_HI32__FB_BASE_HI1_MASK & 49 RREG32_SOC15(GC, GET_INST(GC, 0), 50 regGCMC_VM_FB_LOCATION_BASE_HI32)) << 56); 51 return base; 52 } 53 54 static u64 gfxhub_v12_1_get_mc_fb_offset(struct amdgpu_device *adev) 55 { 56 return (u64)(RREG32_SOC15(GC, GET_INST(GC, 0), 57 regGCMC_VM_FB_OFFSET) << 24); 58 } 59 60 static void gfxhub_v12_1_xcc_setup_vm_pt_regs(struct amdgpu_device *adev, 61 uint32_t vmid, 62 uint64_t page_table_base, 63 uint32_t xcc_mask) 64 { 65 struct amdgpu_vmhub *hub; 66 int i; 67 68 for_each_inst(i, xcc_mask) { 69 hub = &adev->vmhub[AMDGPU_GFXHUB(i)]; 70 WREG32_SOC15_OFFSET(GC, GET_INST(GC, i), 71 regGCVM_CONTEXT0_PAGE_TABLE_BASE_ADDR_LO32, 72 hub->ctx_addr_distance * vmid, 73 lower_32_bits(page_table_base)); 74 75 WREG32_SOC15_OFFSET(GC, GET_INST(GC, i), 76 regGCVM_CONTEXT0_PAGE_TABLE_BASE_ADDR_HI32, 77 hub->ctx_addr_distance * vmid, 78 upper_32_bits(page_table_base)); 79 } 80 } 81 82 static void gfxhub_v12_1_setup_vm_pt_regs(struct amdgpu_device *adev, 83 uint32_t vmid, 84 uint64_t page_table_base) 85 { 86 uint32_t xcc_mask; 87 88 xcc_mask = GENMASK(NUM_XCC(adev->gfx.xcc_mask) - 1, 0); 89 gfxhub_v12_1_xcc_setup_vm_pt_regs(adev, vmid, page_table_base, xcc_mask); 90 } 91 92 static void gfxhub_v12_1_xcc_init_gart_aperture_regs(struct amdgpu_device *adev, 93 uint32_t xcc_mask) 94 { 95 uint64_t pt_base; 96 int i; 97 98 if (adev->gmc.pdb0_bo) 99 pt_base = amdgpu_gmc_pd_addr(adev->gmc.pdb0_bo); 100 else 101 pt_base = amdgpu_gmc_pd_addr(adev->gart.bo); 102 103 gfxhub_v12_1_xcc_setup_vm_pt_regs(adev, 0, pt_base, xcc_mask); 104 105 /* If use GART for FB translation, vmid0 page table covers both 106 * vram and system memory (gart) 107 */ 108 for_each_inst(i, xcc_mask) { 109 if (adev->gmc.pdb0_bo) { 110 WREG32_SOC15(GC, GET_INST(GC, i), 111 regGCVM_CONTEXT0_PAGE_TABLE_START_ADDR_LO32, 112 (u32)(adev->gmc.fb_start >> 12)); 113 WREG32_SOC15(GC, GET_INST(GC, i), 114 regGCVM_CONTEXT0_PAGE_TABLE_START_ADDR_HI32, 115 (u32)(adev->gmc.fb_start >> 44)); 116 117 WREG32_SOC15(GC, GET_INST(GC, i), 118 regGCVM_CONTEXT0_PAGE_TABLE_END_ADDR_LO32, 119 (u32)(adev->gmc.gart_end >> 12)); 120 WREG32_SOC15(GC, GET_INST(GC, i), 121 regGCVM_CONTEXT0_PAGE_TABLE_END_ADDR_HI32, 122 (u32)(adev->gmc.gart_end >> 44)); 123 } else { 124 WREG32_SOC15(GC, GET_INST(GC, i), 125 regGCVM_CONTEXT0_PAGE_TABLE_START_ADDR_LO32, 126 (u32)(adev->gmc.gart_start >> 12)); 127 WREG32_SOC15(GC, GET_INST(GC, i), 128 regGCVM_CONTEXT0_PAGE_TABLE_START_ADDR_HI32, 129 (u32)(adev->gmc.gart_start >> 44)); 130 131 WREG32_SOC15(GC, GET_INST(GC, i), 132 regGCVM_CONTEXT0_PAGE_TABLE_END_ADDR_LO32, 133 (u32)(adev->gmc.gart_end >> 12)); 134 WREG32_SOC15(GC, GET_INST(GC, i), 135 regGCVM_CONTEXT0_PAGE_TABLE_END_ADDR_HI32, 136 (u32)(adev->gmc.gart_end >> 44)); 137 } 138 } 139 } 140 141 static void gfxhub_v12_1_xcc_init_system_aperture_regs(struct amdgpu_device *adev, 142 uint32_t xcc_mask) 143 { 144 uint64_t value; 145 uint32_t tmp; 146 int i; 147 148 for_each_inst(i, xcc_mask) { 149 /* Program the AGP BAR */ 150 WREG32_SOC15_RLC(GC, GET_INST(GC, i), 151 regGCMC_VM_AGP_BASE_LO32, 0); 152 WREG32_SOC15_RLC(GC, GET_INST(GC, i), 153 regGCMC_VM_AGP_BASE_HI32, 0); 154 WREG32_SOC15_RLC(GC, GET_INST(GC, i), 155 regGCMC_VM_AGP_BOT_LO32, 156 lower_32_bits(adev->gmc.agp_start >> 24)); 157 WREG32_SOC15_RLC(GC, GET_INST(GC, i), 158 regGCMC_VM_AGP_BOT_HI32, 159 upper_32_bits(adev->gmc.agp_start >> 24)); 160 WREG32_SOC15_RLC(GC, GET_INST(GC, i), 161 regGCMC_VM_AGP_TOP_LO32, 162 lower_32_bits(adev->gmc.agp_end >> 24)); 163 WREG32_SOC15_RLC(GC, GET_INST(GC, i), 164 regGCMC_VM_AGP_TOP_HI32, 165 upper_32_bits(adev->gmc.agp_end >> 24)); 166 167 if (!amdgpu_sriov_vf(adev)) { 168 /* Program the system aperture low logical page number. */ 169 WREG32_SOC15(GC, GET_INST(GC, i), 170 regGCMC_VM_SYSTEM_APERTURE_LOW_ADDR_LO32, 171 lower_32_bits(min(adev->gmc.fb_start, adev->gmc.agp_start) >> 18)); 172 WREG32_SOC15(GC, GET_INST(GC, i), 173 regGCMC_VM_SYSTEM_APERTURE_LOW_ADDR_HI32, 174 upper_32_bits(min(adev->gmc.fb_start, adev->gmc.agp_start) >> 18)); 175 WREG32_SOC15(GC, GET_INST(GC, i), 176 regGCMC_VM_SYSTEM_APERTURE_HIGH_ADDR_LO32, 177 lower_32_bits(max(adev->gmc.fb_end, adev->gmc.agp_end) >> 18)); 178 WREG32_SOC15(GC, GET_INST(GC, i), 179 regGCMC_VM_SYSTEM_APERTURE_HIGH_ADDR_HI32, 180 upper_32_bits(max(adev->gmc.fb_end, adev->gmc.agp_end) >> 18)); 181 182 /* Set default page address. */ 183 value = amdgpu_gmc_vram_mc2pa(adev, adev->mem_scratch.gpu_addr); 184 WREG32_SOC15(GC, GET_INST(GC, i), 185 regGCMC_VM_SYSTEM_APERTURE_DEFAULT_ADDR_LSB, 186 (u32)(value >> 12)); 187 WREG32_SOC15(GC, GET_INST(GC, i), 188 regGCMC_VM_SYSTEM_APERTURE_DEFAULT_ADDR_MSB, 189 (u32)(value >> 44)); 190 191 /* Program "protection fault". */ 192 WREG32_SOC15(GC, GET_INST(GC, i), 193 regGCVM_L2_PROTECTION_FAULT_DEFAULT_ADDR_LO32, 194 (u32)(adev->dummy_page_addr >> 12)); 195 WREG32_SOC15(GC, GET_INST(GC, i), 196 regGCVM_L2_PROTECTION_FAULT_DEFAULT_ADDR_HI32, 197 (u32)((u64)adev->dummy_page_addr >> 44)); 198 199 tmp = RREG32_SOC15(GC, GET_INST(GC, i), 200 regGCVM_L2_PROTECTION_FAULT_CNTL2); 201 tmp = REG_SET_FIELD(tmp, GCVM_L2_PROTECTION_FAULT_CNTL2, 202 ACTIVE_PAGE_MIGRATION_PTE_READ_RETRY, 1); 203 WREG32_SOC15(GC, GET_INST(GC, i), 204 regGCVM_L2_PROTECTION_FAULT_CNTL2, tmp); 205 } 206 207 /* In the case squeezing vram into GART aperture, we don't use 208 * FB aperture and AGP aperture. Disable them. 209 */ 210 if (adev->gmc.pdb0_bo) { 211 WREG32_SOC15(GC, GET_INST(GC, i), 212 regGCMC_VM_FB_LOCATION_TOP_LO32, 0); 213 WREG32_SOC15(GC, GET_INST(GC, i), 214 regGCMC_VM_FB_LOCATION_TOP_HI32, 0); 215 WREG32_SOC15(GC, GET_INST(GC, i), 216 regGCMC_VM_FB_LOCATION_BASE_LO32, 217 0xFFFFFFFF); 218 WREG32_SOC15(GC, GET_INST(GC, i), 219 regGCMC_VM_FB_LOCATION_BASE_HI32, 1); 220 WREG32_SOC15(GC, GET_INST(GC, i), 221 regGCMC_VM_AGP_TOP_LO32, 0); 222 WREG32_SOC15(GC, GET_INST(GC, i), 223 regGCMC_VM_AGP_TOP_HI32, 0); 224 WREG32_SOC15(GC, GET_INST(GC, i), 225 regGCMC_VM_AGP_BOT_LO32, 0xFFFFFFFF); 226 WREG32_SOC15(GC, GET_INST(GC, i), 227 regGCMC_VM_AGP_BOT_HI32, 1); 228 WREG32_SOC15(GC, GET_INST(GC, i), 229 regGCMC_VM_SYSTEM_APERTURE_LOW_ADDR_LO32, 230 0xFFFFFFFF); 231 WREG32_SOC15(GC, GET_INST(GC, i), 232 regGCMC_VM_SYSTEM_APERTURE_LOW_ADDR_HI32, 233 0x7F); 234 WREG32_SOC15(GC, GET_INST(GC, i), 235 regGCMC_VM_SYSTEM_APERTURE_HIGH_ADDR_LO32, 0); 236 WREG32_SOC15(GC, GET_INST(GC, i), 237 regGCMC_VM_SYSTEM_APERTURE_HIGH_ADDR_HI32, 0); 238 } 239 } 240 } 241 242 static void gfxhub_v12_1_xcc_init_tlb_regs(struct amdgpu_device *adev, 243 uint32_t xcc_mask) 244 { 245 uint32_t tmp; 246 int i; 247 248 for_each_inst(i, xcc_mask) { 249 /* Setup TLB control */ 250 tmp = RREG32_SOC15(GC, GET_INST(GC, i), 251 regGCMC_VM_MX_L1_TLB_CNTL); 252 253 tmp = REG_SET_FIELD(tmp, 254 GCMC_VM_MX_L1_TLB_CNTL, 255 ENABLE_L1_TLB, 1); 256 tmp = REG_SET_FIELD(tmp, 257 GCMC_VM_MX_L1_TLB_CNTL, 258 SYSTEM_ACCESS_MODE, 3); 259 tmp = REG_SET_FIELD(tmp, 260 GCMC_VM_MX_L1_TLB_CNTL, 261 ENABLE_ADVANCED_DRIVER_MODEL, 1); 262 tmp = REG_SET_FIELD(tmp, 263 GCMC_VM_MX_L1_TLB_CNTL, 264 SYSTEM_APERTURE_UNMAPPED_ACCESS, 0); 265 tmp = REG_SET_FIELD(tmp, 266 GCMC_VM_MX_L1_TLB_CNTL, 267 ECO_BITS, 0); 268 tmp = REG_SET_FIELD(tmp, 269 GCMC_VM_MX_L1_TLB_CNTL, 270 MTYPE, MTYPE_UC); 271 272 WREG32_SOC15_RLC(GC, GET_INST(GC, i), 273 regGCMC_VM_MX_L1_TLB_CNTL, tmp); 274 } 275 } 276 277 static void gfxhub_v12_1_xcc_init_cache_regs(struct amdgpu_device *adev, 278 uint32_t xcc_mask) 279 { 280 uint32_t tmp; 281 int i; 282 283 for_each_inst(i, xcc_mask) { 284 /* Setup L2 cache */ 285 tmp = RREG32_SOC15(GC, GET_INST(GC, i), regGCVM_L2_CNTL); 286 tmp = REG_SET_FIELD(tmp, GCVM_L2_CNTL, 287 ENABLE_L2_CACHE, 1); 288 /*TODO: set ENABLE_L2_FRAGMENT_PROCESSING to 1? */ 289 tmp = REG_SET_FIELD(tmp, GCVM_L2_CNTL, 290 ENABLE_L2_FRAGMENT_PROCESSING, 0); 291 tmp = REG_SET_FIELD(tmp, GCVM_L2_CNTL, 292 ENABLE_DEFAULT_PAGE_OUT_TO_SYSTEM_MEMORY, 1); 293 tmp = REG_SET_FIELD(tmp, GCVM_L2_CNTL, 294 L2_PDE0_CACHE_TAG_GENERATION_MODE, 0); 295 tmp = REG_SET_FIELD(tmp, GCVM_L2_CNTL, 296 PDE_FAULT_CLASSIFICATION, 0); 297 tmp = REG_SET_FIELD(tmp, GCVM_L2_CNTL, 298 CONTEXT1_IDENTITY_ACCESS_MODE, 1); 299 tmp = REG_SET_FIELD(tmp, GCVM_L2_CNTL, 300 IDENTITY_MODE_FRAGMENT_SIZE, 0); 301 WREG32_SOC15_RLC(GC, GET_INST(GC, i), 302 regGCVM_L2_CNTL, tmp); 303 304 tmp = RREG32_SOC15(GC, GET_INST(GC, i), regGCVM_L2_CNTL2); 305 tmp = REG_SET_FIELD(tmp, GCVM_L2_CNTL2, 306 INVALIDATE_ALL_L1_TLBS, 1); 307 tmp = REG_SET_FIELD(tmp, GCVM_L2_CNTL2, 308 INVALIDATE_L2_CACHE, 1); 309 WREG32_SOC15_RLC(GC, GET_INST(GC, i), 310 regGCVM_L2_CNTL2, tmp); 311 312 tmp = regGCVM_L2_CNTL3_DEFAULT; 313 if (adev->gmc.translate_further) { 314 tmp = REG_SET_FIELD(tmp, GCVM_L2_CNTL3, BANK_SELECT, 12); 315 tmp = REG_SET_FIELD(tmp, GCVM_L2_CNTL3, 316 L2_CACHE_BIGK_FRAGMENT_SIZE, 9); 317 } else { 318 tmp = REG_SET_FIELD(tmp, GCVM_L2_CNTL3, BANK_SELECT, 9); 319 tmp = REG_SET_FIELD(tmp, GCVM_L2_CNTL3, 320 L2_CACHE_BIGK_FRAGMENT_SIZE, 6); 321 } 322 WREG32_SOC15_RLC(GC, GET_INST(GC, i), regGCVM_L2_CNTL3, tmp); 323 324 tmp = regGCVM_L2_CNTL4_DEFAULT; 325 tmp = REG_SET_FIELD(tmp, GCVM_L2_CNTL4, 326 VMC_TAP_PDE_REQUEST_PHYSICAL, 1); 327 tmp = REG_SET_FIELD(tmp, GCVM_L2_CNTL4, 328 VMC_TAP_PTE_REQUEST_PHYSICAL, 1); 329 WREG32_SOC15_RLC(GC, GET_INST(GC, i), regGCVM_L2_CNTL4, tmp); 330 331 tmp = regGCVM_L2_CNTL5_DEFAULT; 332 tmp = REG_SET_FIELD(tmp, GCVM_L2_CNTL5, 333 L2_CACHE_SMALLK_FRAGMENT_SIZE, 0); 334 WREG32_SOC15_RLC(GC, GET_INST(GC, i), regGCVM_L2_CNTL5, tmp); 335 } 336 } 337 338 static void gfxhub_v12_1_xcc_enable_system_domain(struct amdgpu_device *adev, 339 uint32_t xcc_mask) 340 { 341 uint32_t tmp; 342 int i; 343 344 for_each_inst(i, xcc_mask) { 345 tmp = RREG32_SOC15(GC, GET_INST(GC, i), 346 regGCVM_CONTEXT0_CNTL); 347 tmp = REG_SET_FIELD(tmp, GCVM_CONTEXT0_CNTL, 348 ENABLE_CONTEXT, 1); 349 tmp = REG_SET_FIELD(tmp, GCVM_CONTEXT0_CNTL, 350 PAGE_TABLE_DEPTH, 351 adev->gmc.vmid0_page_table_depth); 352 tmp = REG_SET_FIELD(tmp, GCVM_CONTEXT0_CNTL, 353 PAGE_TABLE_BLOCK_SIZE, 354 adev->gmc.vmid0_page_table_block_size); 355 tmp = REG_SET_FIELD(tmp, GCVM_CONTEXT0_CNTL, 356 RETRY_PERMISSION_OR_INVALID_PAGE_FAULT, 0); 357 WREG32_SOC15(GC, GET_INST(GC, i), 358 regGCVM_CONTEXT0_CNTL, tmp); 359 } 360 } 361 362 static void gfxhub_v12_1_xcc_disable_identity_aperture(struct amdgpu_device *adev, 363 uint32_t xcc_mask) 364 { 365 int i; 366 367 for_each_inst(i, xcc_mask) { 368 WREG32_SOC15(GC, GET_INST(GC, i), 369 regGCVM_L2_CONTEXT1_IDENTITY_APERTURE_LOW_ADDR_LO32, 370 0XFFFFFFFF); 371 WREG32_SOC15(GC, GET_INST(GC, i), 372 regGCVM_L2_CONTEXT1_IDENTITY_APERTURE_LOW_ADDR_HI32, 373 0x00001FFF); 374 375 WREG32_SOC15(GC, GET_INST(GC, i), 376 regGCVM_L2_CONTEXT1_IDENTITY_APERTURE_HIGH_ADDR_LO32, 377 0); 378 WREG32_SOC15(GC, GET_INST(GC, i), 379 regGCVM_L2_CONTEXT1_IDENTITY_APERTURE_HIGH_ADDR_HI32, 380 0); 381 382 WREG32_SOC15(GC, GET_INST(GC, i), 383 regGCVM_L2_CONTEXT_IDENTITY_PHYSICAL_OFFSET_LO32, 384 0); 385 WREG32_SOC15(GC, GET_INST(GC, i), 386 regGCVM_L2_CONTEXT_IDENTITY_PHYSICAL_OFFSET_HI32, 387 0); 388 } 389 } 390 391 static void gfxhub_v12_1_xcc_setup_vmid_config(struct amdgpu_device *adev, 392 uint32_t xcc_mask) 393 { 394 struct amdgpu_vmhub *hub; 395 unsigned int num_level, block_size; 396 uint32_t tmp; 397 int i, j; 398 399 num_level = adev->vm_manager.num_level; 400 block_size = adev->vm_manager.block_size; 401 block_size -= 9; 402 403 for_each_inst(j, xcc_mask) { 404 hub = &adev->vmhub[AMDGPU_GFXHUB(j)]; 405 for (i = 0; i <= 14; i++) { 406 tmp = RREG32_SOC15_OFFSET(GC, GET_INST(GC, j), 407 regGCVM_CONTEXT1_CNTL, 408 i * hub->ctx_distance); 409 tmp = REG_SET_FIELD(tmp, GCVM_CONTEXT1_CNTL, 410 ENABLE_CONTEXT, 1); 411 tmp = REG_SET_FIELD(tmp, GCVM_CONTEXT1_CNTL, 412 PAGE_TABLE_DEPTH, num_level); 413 tmp = REG_SET_FIELD(tmp, GCVM_CONTEXT1_CNTL, 414 RANGE_PROTECTION_FAULT_ENABLE_DEFAULT, 1); 415 tmp = REG_SET_FIELD(tmp, GCVM_CONTEXT1_CNTL, 416 DUMMY_PAGE_PROTECTION_FAULT_ENABLE_DEFAULT, 1); 417 tmp = REG_SET_FIELD(tmp, GCVM_CONTEXT1_CNTL, 418 PDE0_PROTECTION_FAULT_ENABLE_DEFAULT, 1); 419 tmp = REG_SET_FIELD(tmp, GCVM_CONTEXT1_CNTL, 420 VALID_PROTECTION_FAULT_ENABLE_DEFAULT, 1); 421 tmp = REG_SET_FIELD(tmp, GCVM_CONTEXT1_CNTL, 422 READ_PROTECTION_FAULT_ENABLE_DEFAULT, 1); 423 tmp = REG_SET_FIELD(tmp, GCVM_CONTEXT1_CNTL, 424 WRITE_PROTECTION_FAULT_ENABLE_DEFAULT, 1); 425 tmp = REG_SET_FIELD(tmp, GCVM_CONTEXT1_CNTL, 426 EXECUTE_PROTECTION_FAULT_ENABLE_DEFAULT, 1); 427 tmp = REG_SET_FIELD(tmp, GCVM_CONTEXT1_CNTL, 428 PAGE_TABLE_BLOCK_SIZE, block_size); 429 /* Send no-retry XNACK on fault to suppress VM fault storm */ 430 tmp = REG_SET_FIELD(tmp, GCVM_CONTEXT1_CNTL, 431 RETRY_PERMISSION_OR_INVALID_PAGE_FAULT, 432 !amdgpu_noretry); 433 WREG32_SOC15_OFFSET(GC, GET_INST(GC, j), regGCVM_CONTEXT1_CNTL, 434 i * hub->ctx_distance, tmp); 435 WREG32_SOC15_OFFSET(GC, GET_INST(GC, j), 436 regGCVM_CONTEXT1_PAGE_TABLE_START_ADDR_LO32, 437 i * hub->ctx_addr_distance, 0); 438 WREG32_SOC15_OFFSET(GC, GET_INST(GC, j), 439 regGCVM_CONTEXT1_PAGE_TABLE_START_ADDR_HI32, 440 i * hub->ctx_addr_distance, 0); 441 WREG32_SOC15_OFFSET(GC, GET_INST(GC, j), 442 regGCVM_CONTEXT1_PAGE_TABLE_END_ADDR_LO32, 443 i * hub->ctx_addr_distance, 444 lower_32_bits(adev->vm_manager.max_pfn - 1)); 445 WREG32_SOC15_OFFSET(GC, GET_INST(GC, j), 446 regGCVM_CONTEXT1_PAGE_TABLE_END_ADDR_HI32, 447 i * hub->ctx_addr_distance, 448 upper_32_bits(adev->vm_manager.max_pfn - 1)); 449 } 450 451 hub->vm_cntx_cntl = tmp; 452 } 453 } 454 455 static void gfxhub_v12_1_xcc_program_invalidation(struct amdgpu_device *adev, 456 uint32_t xcc_mask) 457 { 458 struct amdgpu_vmhub *hub; 459 unsigned int i, j; 460 461 for_each_inst(j, xcc_mask) { 462 hub = &adev->vmhub[AMDGPU_GFXHUB(j)]; 463 464 for (i = 0 ; i < 18; ++i) { 465 WREG32_SOC15_OFFSET(GC, GET_INST(GC, j), 466 regGCVM_INVALIDATE_ENG0_ADDR_RANGE_LO32, 467 i * hub->eng_addr_distance, 0xFFFFFFFF); 468 WREG32_SOC15_OFFSET(GC, GET_INST(GC, j), 469 regGCVM_INVALIDATE_ENG0_ADDR_RANGE_HI32, 470 i * hub->eng_addr_distance, 0x3FFF); 471 } 472 } 473 } 474 475 static int gfxhub_v12_1_xcc_gart_enable(struct amdgpu_device *adev, 476 uint32_t xcc_mask) 477 { 478 uint32_t i; 479 480 if (amdgpu_sriov_vf(adev)) { 481 /* GCMC_VM_FB_LOCATION_BASE/TOP are VF copy registers 482 * VBIO post does not program them at boot up phase 483 * Need driver to program them from guest side */ 484 for_each_inst(i, xcc_mask) { 485 WREG32_SOC15(GC, GET_INST(GC, i), 486 regGCMC_VM_FB_LOCATION_BASE_LO32, 487 lower_32_bits(adev->gmc.vram_start >> 24)); 488 WREG32_SOC15(GC, GET_INST(GC, i), 489 regGCMC_VM_FB_LOCATION_BASE_HI32, 490 upper_32_bits(adev->gmc.vram_start >> 24)); 491 WREG32_SOC15(GC, GET_INST(GC, i), 492 regGCMC_VM_FB_LOCATION_TOP_LO32, 493 lower_32_bits(adev->gmc.vram_end >> 24)); 494 WREG32_SOC15(GC, GET_INST(GC, i), 495 regGCMC_VM_FB_LOCATION_TOP_HI32, 496 upper_32_bits(adev->gmc.vram_end >> 24)); 497 } 498 } 499 /* GART Enable. */ 500 gfxhub_v12_1_xcc_init_gart_aperture_regs(adev, xcc_mask); 501 gfxhub_v12_1_xcc_init_system_aperture_regs(adev, xcc_mask); 502 gfxhub_v12_1_xcc_init_tlb_regs(adev, xcc_mask); 503 if (!amdgpu_sriov_vf(adev)) 504 gfxhub_v12_1_xcc_init_cache_regs(adev, xcc_mask); 505 506 gfxhub_v12_1_xcc_enable_system_domain(adev, xcc_mask); 507 if (!amdgpu_sriov_vf(adev)) 508 gfxhub_v12_1_xcc_disable_identity_aperture(adev, xcc_mask); 509 gfxhub_v12_1_xcc_setup_vmid_config(adev, xcc_mask); 510 gfxhub_v12_1_xcc_program_invalidation(adev, xcc_mask); 511 512 return 0; 513 } 514 515 static int gfxhub_v12_1_gart_enable(struct amdgpu_device *adev) 516 { 517 uint32_t xcc_mask; 518 519 xcc_mask = GENMASK(NUM_XCC(adev->gfx.xcc_mask) - 1, 0); 520 return gfxhub_v12_1_xcc_gart_enable(adev, xcc_mask); 521 } 522 523 static void gfxhub_v12_1_xcc_gart_disable(struct amdgpu_device *adev, 524 uint32_t xcc_mask) 525 { 526 struct amdgpu_vmhub *hub; 527 u32 tmp; 528 u32 i, j; 529 530 for_each_inst(j, xcc_mask) { 531 hub = &adev->vmhub[AMDGPU_GFXHUB(j)]; 532 /* Disable all tables */ 533 for (i = 0; i < 16; i++) 534 WREG32_SOC15_OFFSET(GC, GET_INST(GC, j), 535 regGCVM_CONTEXT0_CNTL, 536 i * hub->ctx_distance, 0); 537 538 /* Setup TLB control */ 539 tmp = RREG32_SOC15(GC, GET_INST(GC, j), 540 regGCMC_VM_MX_L1_TLB_CNTL); 541 tmp = REG_SET_FIELD(tmp, GCMC_VM_MX_L1_TLB_CNTL, 542 ENABLE_L1_TLB, 0); 543 tmp = REG_SET_FIELD(tmp, GCMC_VM_MX_L1_TLB_CNTL, 544 ENABLE_ADVANCED_DRIVER_MODEL, 0); 545 WREG32_SOC15_RLC(GC, GET_INST(GC, j), 546 regGCMC_VM_MX_L1_TLB_CNTL, tmp); 547 548 /* Setup L2 cache */ 549 if (!amdgpu_sriov_vf(adev)) { 550 tmp = RREG32_SOC15(GC, GET_INST(GC, j), regGCVM_L2_CNTL); 551 tmp = REG_SET_FIELD(tmp, GCVM_L2_CNTL, ENABLE_L2_CACHE, 0); 552 WREG32_SOC15(GC, GET_INST(GC, j), regGCVM_L2_CNTL, tmp); 553 WREG32_SOC15(GC, GET_INST(GC, j), regGCVM_L2_CNTL3, 0); 554 } 555 } 556 } 557 558 static void gfxhub_v12_1_gart_disable(struct amdgpu_device *adev) 559 { 560 uint32_t xcc_mask; 561 562 xcc_mask = GENMASK(NUM_XCC(adev->gfx.xcc_mask) - 1, 0); 563 gfxhub_v12_1_xcc_gart_disable(adev, xcc_mask); 564 } 565 566 static void gfxhub_v12_1_xcc_set_fault_enable_default(struct amdgpu_device *adev, 567 bool value, uint32_t xcc_mask) 568 { 569 u32 tmp; 570 int i; 571 572 for_each_inst(i, xcc_mask) { 573 tmp = RREG32_SOC15(GC, GET_INST(GC, i), 574 regGCVM_L2_PROTECTION_FAULT_CNTL_LO32); 575 tmp = REG_SET_FIELD(tmp, 576 GCVM_L2_PROTECTION_FAULT_CNTL_LO32, 577 RANGE_PROTECTION_FAULT_ENABLE_DEFAULT, value); 578 tmp = REG_SET_FIELD(tmp, 579 GCVM_L2_PROTECTION_FAULT_CNTL_LO32, 580 PDE0_PROTECTION_FAULT_ENABLE_DEFAULT, value); 581 tmp = REG_SET_FIELD(tmp, 582 GCVM_L2_PROTECTION_FAULT_CNTL_LO32, 583 PDE1_PROTECTION_FAULT_ENABLE_DEFAULT, value); 584 tmp = REG_SET_FIELD(tmp, 585 GCVM_L2_PROTECTION_FAULT_CNTL_LO32, 586 PDE2_PROTECTION_FAULT_ENABLE_DEFAULT, value); 587 tmp = REG_SET_FIELD(tmp, 588 GCVM_L2_PROTECTION_FAULT_CNTL_LO32, 589 PDE3_PROTECTION_FAULT_ENABLE_DEFAULT, value); 590 tmp = REG_SET_FIELD(tmp, 591 GCVM_L2_PROTECTION_FAULT_CNTL_LO32, 592 TRANSLATE_FURTHER_PROTECTION_FAULT_ENABLE_DEFAULT, 593 value); 594 tmp = REG_SET_FIELD(tmp, 595 GCVM_L2_PROTECTION_FAULT_CNTL_LO32, 596 NACK_PROTECTION_FAULT_ENABLE_DEFAULT, value); 597 tmp = REG_SET_FIELD(tmp, 598 GCVM_L2_PROTECTION_FAULT_CNTL_LO32, 599 DUMMY_PAGE_PROTECTION_FAULT_ENABLE_DEFAULT, value); 600 tmp = REG_SET_FIELD(tmp, 601 GCVM_L2_PROTECTION_FAULT_CNTL_LO32, 602 VALID_PROTECTION_FAULT_ENABLE_DEFAULT, value); 603 tmp = REG_SET_FIELD(tmp, 604 GCVM_L2_PROTECTION_FAULT_CNTL_LO32, 605 READ_PROTECTION_FAULT_ENABLE_DEFAULT, value); 606 tmp = REG_SET_FIELD(tmp, 607 GCVM_L2_PROTECTION_FAULT_CNTL_LO32, 608 WRITE_PROTECTION_FAULT_ENABLE_DEFAULT, value); 609 tmp = REG_SET_FIELD(tmp, 610 GCVM_L2_PROTECTION_FAULT_CNTL_LO32, 611 EXECUTE_PROTECTION_FAULT_ENABLE_DEFAULT, value); 612 tmp = REG_SET_FIELD(tmp, 613 GCVM_L2_PROTECTION_FAULT_CNTL_LO32, 614 CLIENT_ID_NO_RETRY_FAULT_INTERRUPT, value ? 0xFFFF:0); 615 tmp = REG_SET_FIELD(tmp, 616 GCVM_L2_PROTECTION_FAULT_CNTL_LO32, 617 OTHER_CLIENT_ID_NO_RETRY_FAULT_INTERRUPT, value); 618 if (!value) 619 tmp = REG_SET_FIELD(tmp, 620 GCVM_L2_PROTECTION_FAULT_CNTL_LO32, 621 CRASH_ON_NO_RETRY_FAULT, 1); 622 WREG32_SOC15(GC, GET_INST(GC, i), 623 regGCVM_L2_PROTECTION_FAULT_CNTL_LO32, tmp); 624 625 tmp = RREG32_SOC15(GC, GET_INST(GC, i), 626 regGCVM_L2_PROTECTION_FAULT_CNTL_HI32); 627 if (!value) 628 tmp = REG_SET_FIELD(tmp, 629 GCVM_L2_PROTECTION_FAULT_CNTL_HI32, 630 CRASH_ON_RETRY_FAULT, 1); 631 WREG32_SOC15(GC, GET_INST(GC, i), 632 regGCVM_L2_PROTECTION_FAULT_CNTL_HI32, tmp); 633 } 634 } 635 636 /** 637 * gfxhub_v12_1_set_fault_enable_default - update GART/VM fault handling 638 * 639 * @adev: amdgpu_device pointer 640 * @value: true redirects VM faults to the default page 641 */ 642 static void gfxhub_v12_1_set_fault_enable_default(struct amdgpu_device *adev, 643 bool value) 644 { 645 uint32_t xcc_mask; 646 647 xcc_mask = GENMASK(NUM_XCC(adev->gfx.xcc_mask) - 1, 0); 648 gfxhub_v12_1_xcc_set_fault_enable_default(adev, value, xcc_mask); 649 } 650 651 static uint32_t gfxhub_v12_1_get_invalidate_req(unsigned int vmid, 652 uint32_t flush_type) 653 { 654 u32 req = 0; 655 656 /* invalidate using legacy mode on vmid*/ 657 req = REG_SET_FIELD(req, GCVM_INVALIDATE_ENG0_REQ, 658 PER_VMID_INVALIDATE_REQ, 1 << vmid); 659 req = REG_SET_FIELD(req, GCVM_INVALIDATE_ENG0_REQ, 660 FLUSH_TYPE, flush_type); 661 req = REG_SET_FIELD(req, GCVM_INVALIDATE_ENG0_REQ, 662 INVALIDATE_L2_PTES, 1); 663 req = REG_SET_FIELD(req, GCVM_INVALIDATE_ENG0_REQ, 664 INVALIDATE_L2_PDE0, 1); 665 req = REG_SET_FIELD(req, GCVM_INVALIDATE_ENG0_REQ, 666 INVALIDATE_L2_PDE1, 1); 667 req = REG_SET_FIELD(req, GCVM_INVALIDATE_ENG0_REQ, 668 INVALIDATE_L2_PDE2, 1); 669 req = REG_SET_FIELD(req, GCVM_INVALIDATE_ENG0_REQ, 670 INVALIDATE_L1_PTES, 1); 671 req = REG_SET_FIELD(req, GCVM_INVALIDATE_ENG0_REQ, 672 CLEAR_PROTECTION_FAULT_STATUS_ADDR, 0); 673 674 return req; 675 } 676 677 static const char *gfxhub_v12_1_client_ids[] = { 678 "CB", 679 "DB", 680 "GE1", 681 "GE2", 682 "CPF", 683 "CPC", 684 "CPG", 685 "RLC", 686 "TCP", 687 "SQC (inst)", 688 "SQC (data)", 689 "SQG/PC/SC", 690 "Reserved", 691 "SDMA0", 692 "SDMA1", 693 "GCR", 694 "Reserved", 695 "Reserved", 696 "WGS", 697 "DSM", 698 "PA" 699 }; 700 701 /*TODO: l2 protection fault status is increased to 64bits. 702 * some critical fields like FED are moved to STATUS_HI32 */ 703 static void gfxhub_v12_1_print_l2_protection_fault_status(struct amdgpu_device *adev, 704 uint32_t status) 705 { 706 u32 cid = REG_GET_FIELD(status, 707 GCVM_L2_PROTECTION_FAULT_STATUS_LO32, 708 CID); 709 710 dev_err(adev->dev, 711 "GCVM_L2_PROTECTION_FAULT_STATUS_LO32:0x%08X\n", 712 status); 713 dev_err(adev->dev, "\t Faulty UTCL2 client ID: %s (0x%x)\n", 714 cid >= ARRAY_SIZE(gfxhub_v12_1_client_ids) ? 715 "unknown" : gfxhub_v12_1_client_ids[cid], cid); 716 dev_err(adev->dev, "\t MORE_FAULTS: 0x%lx\n", 717 REG_GET_FIELD(status, 718 GCVM_L2_PROTECTION_FAULT_STATUS_LO32, MORE_FAULTS)); 719 dev_err(adev->dev, "\t WALKER_ERROR: 0x%lx\n", 720 REG_GET_FIELD(status, 721 GCVM_L2_PROTECTION_FAULT_STATUS_LO32, WALKER_ERROR)); 722 dev_err(adev->dev, "\t PERMISSION_FAULTS: 0x%lx\n", 723 REG_GET_FIELD(status, 724 GCVM_L2_PROTECTION_FAULT_STATUS_LO32, PERMISSION_FAULTS)); 725 dev_err(adev->dev, "\t MAPPING_ERROR: 0x%lx\n", 726 REG_GET_FIELD(status, 727 GCVM_L2_PROTECTION_FAULT_STATUS_LO32, MAPPING_ERROR)); 728 dev_err(adev->dev, "\t RW: 0x%lx\n", 729 REG_GET_FIELD(status, 730 GCVM_L2_PROTECTION_FAULT_STATUS_LO32, RW)); 731 } 732 733 static const struct amdgpu_vmhub_funcs gfxhub_v12_1_vmhub_funcs = { 734 .print_l2_protection_fault_status = gfxhub_v12_1_print_l2_protection_fault_status, 735 .get_invalidate_req = gfxhub_v12_1_get_invalidate_req, 736 }; 737 738 static void gfxhub_v12_1_xcc_init(struct amdgpu_device *adev, uint32_t xcc_mask) 739 { 740 struct amdgpu_vmhub *hub; 741 int i; 742 743 for_each_inst(i, xcc_mask) { 744 hub = &adev->vmhub[AMDGPU_GFXHUB(i)]; 745 746 hub->ctx0_ptb_addr_lo32 = 747 SOC15_REG_OFFSET(GC, GET_INST(GC, i), 748 regGCVM_CONTEXT0_PAGE_TABLE_BASE_ADDR_LO32); 749 hub->ctx0_ptb_addr_hi32 = 750 SOC15_REG_OFFSET(GC, GET_INST(GC, i), 751 regGCVM_CONTEXT0_PAGE_TABLE_BASE_ADDR_HI32); 752 hub->vm_inv_eng0_sem = 753 SOC15_REG_OFFSET(GC, GET_INST(GC, i), 754 regGCVM_INVALIDATE_ENG0_SEM); 755 hub->vm_inv_eng0_req = 756 SOC15_REG_OFFSET(GC, GET_INST(GC, i), 757 regGCVM_INVALIDATE_ENG0_REQ); 758 hub->vm_inv_eng0_ack = 759 SOC15_REG_OFFSET(GC, GET_INST(GC, i), 760 regGCVM_INVALIDATE_ENG0_ACK); 761 hub->vm_context0_cntl = 762 SOC15_REG_OFFSET(GC, GET_INST(GC, i), 763 regGCVM_CONTEXT0_CNTL); 764 /* TODO: add a new member to accomandate additional fault status/cntl reg */ 765 hub->vm_l2_pro_fault_status = 766 SOC15_REG_OFFSET(GC, GET_INST(GC, i), 767 regGCVM_L2_PROTECTION_FAULT_STATUS_LO32); 768 hub->vm_l2_pro_fault_cntl = 769 SOC15_REG_OFFSET(GC, GET_INST(GC, i), 770 regGCVM_L2_PROTECTION_FAULT_CNTL_LO32); 771 hub->ctx_distance = 772 regGCVM_CONTEXT1_CNTL - 773 regGCVM_CONTEXT0_CNTL; 774 hub->ctx_addr_distance = 775 regGCVM_CONTEXT1_PAGE_TABLE_BASE_ADDR_LO32 - 776 regGCVM_CONTEXT0_PAGE_TABLE_BASE_ADDR_LO32; 777 hub->eng_distance = 778 regGCVM_INVALIDATE_ENG1_REQ - 779 regGCVM_INVALIDATE_ENG0_REQ; 780 hub->eng_addr_distance = 781 regGCVM_INVALIDATE_ENG1_ADDR_RANGE_LO32 - 782 regGCVM_INVALIDATE_ENG0_ADDR_RANGE_LO32; 783 784 hub->vm_cntx_cntl_vm_fault = 785 GCVM_CONTEXT1_CNTL__RANGE_PROTECTION_FAULT_ENABLE_INTERRUPT_MASK | 786 GCVM_CONTEXT1_CNTL__DUMMY_PAGE_PROTECTION_FAULT_ENABLE_INTERRUPT_MASK | 787 GCVM_CONTEXT1_CNTL__PDE0_PROTECTION_FAULT_ENABLE_INTERRUPT_MASK | 788 GCVM_CONTEXT1_CNTL__VALID_PROTECTION_FAULT_ENABLE_INTERRUPT_MASK | 789 GCVM_CONTEXT1_CNTL__READ_PROTECTION_FAULT_ENABLE_INTERRUPT_MASK | 790 GCVM_CONTEXT1_CNTL__WRITE_PROTECTION_FAULT_ENABLE_INTERRUPT_MASK | 791 GCVM_CONTEXT1_CNTL__EXECUTE_PROTECTION_FAULT_ENABLE_INTERRUPT_MASK; 792 793 hub->vmhub_funcs = &gfxhub_v12_1_vmhub_funcs; 794 } 795 } 796 797 static void gfxhub_v12_1_init(struct amdgpu_device *adev) 798 { 799 uint32_t xcc_mask; 800 801 xcc_mask = GENMASK(NUM_XCC(adev->gfx.xcc_mask) - 1, 0); 802 gfxhub_v12_1_xcc_init(adev, xcc_mask); 803 } 804 805 static int gfxhub_v12_1_get_xgmi_info(struct amdgpu_device *adev) 806 { 807 u32 max_num_physical_nodes; 808 u32 max_physical_node_id; 809 u32 xgmi_lfb_cntl; 810 u32 max_region; 811 u64 seg_size; 812 813 xgmi_lfb_cntl = RREG32_SOC15(GC, GET_INST(GC, 0), 814 regGCMC_VM_XGMI_LFB_CNTL); 815 seg_size = REG_GET_FIELD(RREG32_SOC15(GC, GET_INST(GC, 0), 816 regGCMC_VM_XGMI_LFB_SIZE), 817 GCMC_VM_XGMI_LFB_SIZE, PF_LFB_SIZE) << 24; 818 max_region = REG_GET_FIELD(xgmi_lfb_cntl, 819 GCMC_VM_XGMI_LFB_CNTL, 820 PF_MAX_REGION); 821 822 max_num_physical_nodes = 8; 823 max_physical_node_id = 7; 824 825 /* PF_MAX_REGION=0 means xgmi is disabled */ 826 if (max_region || adev->gmc.xgmi.connected_to_cpu) { 827 adev->gmc.xgmi.num_physical_nodes = max_region + 1; 828 829 if (adev->gmc.xgmi.num_physical_nodes > max_num_physical_nodes) 830 return -EINVAL; 831 832 adev->gmc.xgmi.physical_node_id = 833 REG_GET_FIELD(xgmi_lfb_cntl, 834 GCMC_VM_XGMI_LFB_CNTL, 835 PF_LFB_REGION); 836 837 if (adev->gmc.xgmi.physical_node_id > max_physical_node_id) 838 return -EINVAL; 839 840 adev->gmc.xgmi.node_segment_size = seg_size; 841 } 842 843 return 0; 844 } 845 846 const struct amdgpu_gfxhub_funcs gfxhub_v12_1_funcs = { 847 .get_fb_location = gfxhub_v12_1_get_fb_location, 848 .get_mc_fb_offset = gfxhub_v12_1_get_mc_fb_offset, 849 .setup_vm_pt_regs = gfxhub_v12_1_setup_vm_pt_regs, 850 .gart_enable = gfxhub_v12_1_gart_enable, 851 .gart_disable = gfxhub_v12_1_gart_disable, 852 .set_fault_enable_default = gfxhub_v12_1_set_fault_enable_default, 853 .init = gfxhub_v12_1_init, 854 .get_xgmi_info = gfxhub_v12_1_get_xgmi_info, 855 }; 856 857 static int gfxhub_v12_1_xcp_resume(void *handle, uint32_t inst_mask) 858 { 859 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 860 bool value; 861 862 if (amdgpu_vm_fault_stop == AMDGPU_VM_FAULT_STOP_ALWAYS) 863 value = false; 864 else 865 value = true; 866 867 gfxhub_v12_1_xcc_set_fault_enable_default(adev, value, inst_mask); 868 869 if (!amdgpu_sriov_vf(adev)) 870 return gfxhub_v12_1_xcc_gart_enable(adev, inst_mask); 871 872 return 0; 873 } 874 875 static int gfxhub_v12_1_xcp_suspend(void *handle, uint32_t inst_mask) 876 { 877 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 878 879 if (!amdgpu_sriov_vf(adev)) 880 gfxhub_v12_1_xcc_gart_disable(adev, inst_mask); 881 882 return 0; 883 } 884 885 struct amdgpu_xcp_ip_funcs gfxhub_v12_1_xcp_funcs = { 886 .suspend = &gfxhub_v12_1_xcp_suspend, 887 .resume = &gfxhub_v12_1_xcp_resume 888 }; 889