1 /* 2 * Copyright 2008 Advanced Micro Devices, Inc. 3 * Copyright 2008 Red Hat Inc. 4 * Copyright 2009 Jerome Glisse. 5 * 6 * Permission is hereby granted, free of charge, to any person obtaining a 7 * copy of this software and associated documentation files (the "Software"), 8 * to deal in the Software without restriction, including without limitation 9 * the rights to use, copy, modify, merge, publish, distribute, sublicense, 10 * and/or sell copies of the Software, and to permit persons to whom the 11 * Software is furnished to do so, subject to the following conditions: 12 * 13 * The above copyright notice and this permission notice shall be included in 14 * all copies or substantial portions of the Software. 15 * 16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 19 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR 20 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 21 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 22 * OTHER DEALINGS IN THE SOFTWARE. 23 * 24 * Authors: Dave Airlie 25 * Alex Deucher 26 * Jerome Glisse 27 */ 28 #include <linux/seq_file.h> 29 #include <linux/slab.h> 30 #include <drm/drmP.h> 31 #include "radeon.h" 32 #include "radeon_asic.h" 33 #include "rs400d.h" 34 35 /* This files gather functions specifics to : rs400,rs480 */ 36 static int rs400_debugfs_pcie_gart_info_init(struct radeon_device *rdev); 37 38 void rs400_gart_adjust_size(struct radeon_device *rdev) 39 { 40 /* Check gart size */ 41 switch (rdev->mc.gtt_size/(1024*1024)) { 42 case 32: 43 case 64: 44 case 128: 45 case 256: 46 case 512: 47 case 1024: 48 case 2048: 49 break; 50 default: 51 DRM_ERROR("Unable to use IGP GART size %uM\n", 52 (unsigned)(rdev->mc.gtt_size >> 20)); 53 DRM_ERROR("Valid GART size for IGP are 32M,64M,128M,256M,512M,1G,2G\n"); 54 DRM_ERROR("Forcing to 32M GART size\n"); 55 rdev->mc.gtt_size = 32 * 1024 * 1024; 56 return; 57 } 58 if (rdev->family == CHIP_RS400 || rdev->family == CHIP_RS480) { 59 /* FIXME: RS400 & RS480 seems to have issue with GART size 60 * if 4G of system memory (needs more testing) */ 61 rdev->mc.gtt_size = 32 * 1024 * 1024; 62 DRM_ERROR("Forcing to 32M GART size (because of ASIC bug ?)\n"); 63 } 64 } 65 66 void rs400_gart_tlb_flush(struct radeon_device *rdev) 67 { 68 uint32_t tmp; 69 unsigned int timeout = rdev->usec_timeout; 70 71 WREG32_MC(RS480_GART_CACHE_CNTRL, RS480_GART_CACHE_INVALIDATE); 72 do { 73 tmp = RREG32_MC(RS480_GART_CACHE_CNTRL); 74 if ((tmp & RS480_GART_CACHE_INVALIDATE) == 0) 75 break; 76 DRM_UDELAY(1); 77 timeout--; 78 } while (timeout > 0); 79 WREG32_MC(RS480_GART_CACHE_CNTRL, 0); 80 } 81 82 int rs400_gart_init(struct radeon_device *rdev) 83 { 84 int r; 85 86 if (rdev->gart.table.ram.ptr) { 87 WARN(1, "RS400 GART already initialized.\n"); 88 return 0; 89 } 90 /* Check gart size */ 91 switch(rdev->mc.gtt_size / (1024 * 1024)) { 92 case 32: 93 case 64: 94 case 128: 95 case 256: 96 case 512: 97 case 1024: 98 case 2048: 99 break; 100 default: 101 return -EINVAL; 102 } 103 /* Initialize common gart structure */ 104 r = radeon_gart_init(rdev); 105 if (r) 106 return r; 107 if (rs400_debugfs_pcie_gart_info_init(rdev)) 108 DRM_ERROR("Failed to register debugfs file for RS400 GART !\n"); 109 rdev->gart.table_size = rdev->gart.num_gpu_pages * 4; 110 return radeon_gart_table_ram_alloc(rdev); 111 } 112 113 int rs400_gart_enable(struct radeon_device *rdev) 114 { 115 uint32_t size_reg; 116 uint32_t tmp; 117 118 radeon_gart_restore(rdev); 119 tmp = RREG32_MC(RS690_AIC_CTRL_SCRATCH); 120 tmp |= RS690_DIS_OUT_OF_PCI_GART_ACCESS; 121 WREG32_MC(RS690_AIC_CTRL_SCRATCH, tmp); 122 /* Check gart size */ 123 switch(rdev->mc.gtt_size / (1024 * 1024)) { 124 case 32: 125 size_reg = RS480_VA_SIZE_32MB; 126 break; 127 case 64: 128 size_reg = RS480_VA_SIZE_64MB; 129 break; 130 case 128: 131 size_reg = RS480_VA_SIZE_128MB; 132 break; 133 case 256: 134 size_reg = RS480_VA_SIZE_256MB; 135 break; 136 case 512: 137 size_reg = RS480_VA_SIZE_512MB; 138 break; 139 case 1024: 140 size_reg = RS480_VA_SIZE_1GB; 141 break; 142 case 2048: 143 size_reg = RS480_VA_SIZE_2GB; 144 break; 145 default: 146 return -EINVAL; 147 } 148 /* It should be fine to program it to max value */ 149 if (rdev->family == CHIP_RS690 || (rdev->family == CHIP_RS740)) { 150 WREG32_MC(RS690_MCCFG_AGP_BASE, 0xFFFFFFFF); 151 WREG32_MC(RS690_MCCFG_AGP_BASE_2, 0); 152 } else { 153 WREG32(RADEON_AGP_BASE, 0xFFFFFFFF); 154 WREG32(RS480_AGP_BASE_2, 0); 155 } 156 tmp = REG_SET(RS690_MC_AGP_TOP, rdev->mc.gtt_end >> 16); 157 tmp |= REG_SET(RS690_MC_AGP_START, rdev->mc.gtt_start >> 16); 158 if ((rdev->family == CHIP_RS690) || (rdev->family == CHIP_RS740)) { 159 WREG32_MC(RS690_MCCFG_AGP_LOCATION, tmp); 160 tmp = RREG32(RADEON_BUS_CNTL) & ~RS600_BUS_MASTER_DIS; 161 WREG32(RADEON_BUS_CNTL, tmp); 162 } else { 163 WREG32(RADEON_MC_AGP_LOCATION, tmp); 164 tmp = RREG32(RADEON_BUS_CNTL) & ~RADEON_BUS_MASTER_DIS; 165 WREG32(RADEON_BUS_CNTL, tmp); 166 } 167 /* Table should be in 32bits address space so ignore bits above. */ 168 tmp = (u32)rdev->gart.table_addr & 0xfffff000; 169 tmp |= (upper_32_bits(rdev->gart.table_addr) & 0xff) << 4; 170 171 WREG32_MC(RS480_GART_BASE, tmp); 172 /* TODO: more tweaking here */ 173 WREG32_MC(RS480_GART_FEATURE_ID, 174 (RS480_TLB_ENABLE | 175 RS480_GTW_LAC_EN | RS480_1LEVEL_GART)); 176 /* Disable snooping */ 177 WREG32_MC(RS480_AGP_MODE_CNTL, 178 (1 << RS480_REQ_TYPE_SNOOP_SHIFT) | RS480_REQ_TYPE_SNOOP_DIS); 179 /* Disable AGP mode */ 180 /* FIXME: according to doc we should set HIDE_MMCFG_BAR=0, 181 * AGPMODE30=0 & AGP30ENHANCED=0 in NB_CNTL */ 182 if ((rdev->family == CHIP_RS690) || (rdev->family == CHIP_RS740)) { 183 WREG32_MC(RS480_MC_MISC_CNTL, 184 (RS480_GART_INDEX_REG_EN | RS690_BLOCK_GFX_D3_EN)); 185 } else { 186 WREG32_MC(RS480_MC_MISC_CNTL, RS480_GART_INDEX_REG_EN); 187 } 188 /* Enable gart */ 189 WREG32_MC(RS480_AGP_ADDRESS_SPACE_SIZE, (RS480_GART_EN | size_reg)); 190 rs400_gart_tlb_flush(rdev); 191 rdev->gart.ready = true; 192 return 0; 193 } 194 195 void rs400_gart_disable(struct radeon_device *rdev) 196 { 197 uint32_t tmp; 198 199 tmp = RREG32_MC(RS690_AIC_CTRL_SCRATCH); 200 tmp |= RS690_DIS_OUT_OF_PCI_GART_ACCESS; 201 WREG32_MC(RS690_AIC_CTRL_SCRATCH, tmp); 202 WREG32_MC(RS480_AGP_ADDRESS_SPACE_SIZE, 0); 203 } 204 205 void rs400_gart_fini(struct radeon_device *rdev) 206 { 207 radeon_gart_fini(rdev); 208 rs400_gart_disable(rdev); 209 radeon_gart_table_ram_free(rdev); 210 } 211 212 int rs400_gart_set_page(struct radeon_device *rdev, int i, uint64_t addr) 213 { 214 uint32_t entry; 215 216 if (i < 0 || i > rdev->gart.num_gpu_pages) { 217 return -EINVAL; 218 } 219 220 entry = (lower_32_bits(addr) & PAGE_MASK) | 221 ((upper_32_bits(addr) & 0xff) << 4) | 222 0xc; 223 entry = cpu_to_le32(entry); 224 rdev->gart.table.ram.ptr[i] = entry; 225 return 0; 226 } 227 228 int rs400_mc_wait_for_idle(struct radeon_device *rdev) 229 { 230 unsigned i; 231 uint32_t tmp; 232 233 for (i = 0; i < rdev->usec_timeout; i++) { 234 /* read MC_STATUS */ 235 tmp = RREG32(0x0150); 236 if (tmp & (1 << 2)) { 237 return 0; 238 } 239 DRM_UDELAY(1); 240 } 241 return -1; 242 } 243 244 void rs400_gpu_init(struct radeon_device *rdev) 245 { 246 /* FIXME: is this correct ? */ 247 r420_pipes_init(rdev); 248 if (rs400_mc_wait_for_idle(rdev)) { 249 printk(KERN_WARNING "rs400: Failed to wait MC idle while " 250 "programming pipes. Bad things might happen. %08x\n", RREG32(0x150)); 251 } 252 } 253 254 void rs400_mc_init(struct radeon_device *rdev) 255 { 256 u64 base; 257 258 rs400_gart_adjust_size(rdev); 259 rdev->mc.igp_sideport_enabled = radeon_combios_sideport_present(rdev); 260 /* DDR for all card after R300 & IGP */ 261 rdev->mc.vram_is_ddr = true; 262 rdev->mc.vram_width = 128; 263 r100_vram_init_sizes(rdev); 264 base = (RREG32(RADEON_NB_TOM) & 0xffff) << 16; 265 radeon_vram_location(rdev, &rdev->mc, base); 266 radeon_gtt_location(rdev, &rdev->mc); 267 radeon_update_bandwidth_info(rdev); 268 } 269 270 uint32_t rs400_mc_rreg(struct radeon_device *rdev, uint32_t reg) 271 { 272 uint32_t r; 273 274 WREG32(RS480_NB_MC_INDEX, reg & 0xff); 275 r = RREG32(RS480_NB_MC_DATA); 276 WREG32(RS480_NB_MC_INDEX, 0xff); 277 return r; 278 } 279 280 void rs400_mc_wreg(struct radeon_device *rdev, uint32_t reg, uint32_t v) 281 { 282 WREG32(RS480_NB_MC_INDEX, ((reg) & 0xff) | RS480_NB_MC_IND_WR_EN); 283 WREG32(RS480_NB_MC_DATA, (v)); 284 WREG32(RS480_NB_MC_INDEX, 0xff); 285 } 286 287 #if defined(CONFIG_DEBUG_FS) 288 static int rs400_debugfs_gart_info(struct seq_file *m, void *data) 289 { 290 struct drm_info_node *node = (struct drm_info_node *) m->private; 291 struct drm_device *dev = node->minor->dev; 292 struct radeon_device *rdev = dev->dev_private; 293 uint32_t tmp; 294 295 tmp = RREG32(RADEON_HOST_PATH_CNTL); 296 seq_printf(m, "HOST_PATH_CNTL 0x%08x\n", tmp); 297 tmp = RREG32(RADEON_BUS_CNTL); 298 seq_printf(m, "BUS_CNTL 0x%08x\n", tmp); 299 tmp = RREG32_MC(RS690_AIC_CTRL_SCRATCH); 300 seq_printf(m, "AIC_CTRL_SCRATCH 0x%08x\n", tmp); 301 if (rdev->family == CHIP_RS690 || (rdev->family == CHIP_RS740)) { 302 tmp = RREG32_MC(RS690_MCCFG_AGP_BASE); 303 seq_printf(m, "MCCFG_AGP_BASE 0x%08x\n", tmp); 304 tmp = RREG32_MC(RS690_MCCFG_AGP_BASE_2); 305 seq_printf(m, "MCCFG_AGP_BASE_2 0x%08x\n", tmp); 306 tmp = RREG32_MC(RS690_MCCFG_AGP_LOCATION); 307 seq_printf(m, "MCCFG_AGP_LOCATION 0x%08x\n", tmp); 308 tmp = RREG32_MC(0x100); 309 seq_printf(m, "MCCFG_FB_LOCATION 0x%08x\n", tmp); 310 tmp = RREG32(0x134); 311 seq_printf(m, "HDP_FB_LOCATION 0x%08x\n", tmp); 312 } else { 313 tmp = RREG32(RADEON_AGP_BASE); 314 seq_printf(m, "AGP_BASE 0x%08x\n", tmp); 315 tmp = RREG32(RS480_AGP_BASE_2); 316 seq_printf(m, "AGP_BASE_2 0x%08x\n", tmp); 317 tmp = RREG32(RADEON_MC_AGP_LOCATION); 318 seq_printf(m, "MC_AGP_LOCATION 0x%08x\n", tmp); 319 } 320 tmp = RREG32_MC(RS480_GART_BASE); 321 seq_printf(m, "GART_BASE 0x%08x\n", tmp); 322 tmp = RREG32_MC(RS480_GART_FEATURE_ID); 323 seq_printf(m, "GART_FEATURE_ID 0x%08x\n", tmp); 324 tmp = RREG32_MC(RS480_AGP_MODE_CNTL); 325 seq_printf(m, "AGP_MODE_CONTROL 0x%08x\n", tmp); 326 tmp = RREG32_MC(RS480_MC_MISC_CNTL); 327 seq_printf(m, "MC_MISC_CNTL 0x%08x\n", tmp); 328 tmp = RREG32_MC(0x5F); 329 seq_printf(m, "MC_MISC_UMA_CNTL 0x%08x\n", tmp); 330 tmp = RREG32_MC(RS480_AGP_ADDRESS_SPACE_SIZE); 331 seq_printf(m, "AGP_ADDRESS_SPACE_SIZE 0x%08x\n", tmp); 332 tmp = RREG32_MC(RS480_GART_CACHE_CNTRL); 333 seq_printf(m, "GART_CACHE_CNTRL 0x%08x\n", tmp); 334 tmp = RREG32_MC(0x3B); 335 seq_printf(m, "MC_GART_ERROR_ADDRESS 0x%08x\n", tmp); 336 tmp = RREG32_MC(0x3C); 337 seq_printf(m, "MC_GART_ERROR_ADDRESS_HI 0x%08x\n", tmp); 338 tmp = RREG32_MC(0x30); 339 seq_printf(m, "GART_ERROR_0 0x%08x\n", tmp); 340 tmp = RREG32_MC(0x31); 341 seq_printf(m, "GART_ERROR_1 0x%08x\n", tmp); 342 tmp = RREG32_MC(0x32); 343 seq_printf(m, "GART_ERROR_2 0x%08x\n", tmp); 344 tmp = RREG32_MC(0x33); 345 seq_printf(m, "GART_ERROR_3 0x%08x\n", tmp); 346 tmp = RREG32_MC(0x34); 347 seq_printf(m, "GART_ERROR_4 0x%08x\n", tmp); 348 tmp = RREG32_MC(0x35); 349 seq_printf(m, "GART_ERROR_5 0x%08x\n", tmp); 350 tmp = RREG32_MC(0x36); 351 seq_printf(m, "GART_ERROR_6 0x%08x\n", tmp); 352 tmp = RREG32_MC(0x37); 353 seq_printf(m, "GART_ERROR_7 0x%08x\n", tmp); 354 return 0; 355 } 356 357 static struct drm_info_list rs400_gart_info_list[] = { 358 {"rs400_gart_info", rs400_debugfs_gart_info, 0, NULL}, 359 }; 360 #endif 361 362 static int rs400_debugfs_pcie_gart_info_init(struct radeon_device *rdev) 363 { 364 #if defined(CONFIG_DEBUG_FS) 365 return radeon_debugfs_add_files(rdev, rs400_gart_info_list, 1); 366 #else 367 return 0; 368 #endif 369 } 370 371 void rs400_mc_program(struct radeon_device *rdev) 372 { 373 struct r100_mc_save save; 374 375 /* Stops all mc clients */ 376 r100_mc_stop(rdev, &save); 377 378 /* Wait for mc idle */ 379 if (rs400_mc_wait_for_idle(rdev)) 380 dev_warn(rdev->dev, "rs400: Wait MC idle timeout before updating MC.\n"); 381 WREG32(R_000148_MC_FB_LOCATION, 382 S_000148_MC_FB_START(rdev->mc.vram_start >> 16) | 383 S_000148_MC_FB_TOP(rdev->mc.vram_end >> 16)); 384 385 r100_mc_resume(rdev, &save); 386 } 387 388 static int rs400_startup(struct radeon_device *rdev) 389 { 390 int r; 391 392 r100_set_common_regs(rdev); 393 394 rs400_mc_program(rdev); 395 /* Resume clock */ 396 r300_clock_startup(rdev); 397 /* Initialize GPU configuration (# pipes, ...) */ 398 rs400_gpu_init(rdev); 399 r100_enable_bm(rdev); 400 /* Initialize GART (initialize after TTM so we can allocate 401 * memory through TTM but finalize after TTM) */ 402 r = rs400_gart_enable(rdev); 403 if (r) 404 return r; 405 /* Enable IRQ */ 406 r100_irq_set(rdev); 407 rdev->config.r300.hdp_cntl = RREG32(RADEON_HOST_PATH_CNTL); 408 /* 1M ring buffer */ 409 r = r100_cp_init(rdev, 1024 * 1024); 410 if (r) { 411 dev_err(rdev->dev, "failled initializing CP (%d).\n", r); 412 return r; 413 } 414 r = r100_wb_init(rdev); 415 if (r) 416 dev_err(rdev->dev, "failled initializing WB (%d).\n", r); 417 r = r100_ib_init(rdev); 418 if (r) { 419 dev_err(rdev->dev, "failled initializing IB (%d).\n", r); 420 return r; 421 } 422 return 0; 423 } 424 425 int rs400_resume(struct radeon_device *rdev) 426 { 427 /* Make sur GART are not working */ 428 rs400_gart_disable(rdev); 429 /* Resume clock before doing reset */ 430 r300_clock_startup(rdev); 431 /* setup MC before calling post tables */ 432 rs400_mc_program(rdev); 433 /* Reset gpu before posting otherwise ATOM will enter infinite loop */ 434 if (radeon_asic_reset(rdev)) { 435 dev_warn(rdev->dev, "GPU reset failed ! (0xE40=0x%08X, 0x7C0=0x%08X)\n", 436 RREG32(R_000E40_RBBM_STATUS), 437 RREG32(R_0007C0_CP_STAT)); 438 } 439 /* post */ 440 radeon_combios_asic_init(rdev->ddev); 441 /* Resume clock after posting */ 442 r300_clock_startup(rdev); 443 /* Initialize surface registers */ 444 radeon_surface_init(rdev); 445 return rs400_startup(rdev); 446 } 447 448 int rs400_suspend(struct radeon_device *rdev) 449 { 450 r100_cp_disable(rdev); 451 r100_wb_disable(rdev); 452 r100_irq_disable(rdev); 453 rs400_gart_disable(rdev); 454 return 0; 455 } 456 457 void rs400_fini(struct radeon_device *rdev) 458 { 459 r100_cp_fini(rdev); 460 r100_wb_fini(rdev); 461 r100_ib_fini(rdev); 462 radeon_gem_fini(rdev); 463 rs400_gart_fini(rdev); 464 radeon_irq_kms_fini(rdev); 465 radeon_fence_driver_fini(rdev); 466 radeon_bo_fini(rdev); 467 radeon_atombios_fini(rdev); 468 kfree(rdev->bios); 469 rdev->bios = NULL; 470 } 471 472 int rs400_init(struct radeon_device *rdev) 473 { 474 int r; 475 476 /* Disable VGA */ 477 r100_vga_render_disable(rdev); 478 /* Initialize scratch registers */ 479 radeon_scratch_init(rdev); 480 /* Initialize surface registers */ 481 radeon_surface_init(rdev); 482 /* TODO: disable VGA need to use VGA request */ 483 /* BIOS*/ 484 if (!radeon_get_bios(rdev)) { 485 if (ASIC_IS_AVIVO(rdev)) 486 return -EINVAL; 487 } 488 if (rdev->is_atom_bios) { 489 dev_err(rdev->dev, "Expecting combios for RS400/RS480 GPU\n"); 490 return -EINVAL; 491 } else { 492 r = radeon_combios_init(rdev); 493 if (r) 494 return r; 495 } 496 /* Reset gpu before posting otherwise ATOM will enter infinite loop */ 497 if (radeon_asic_reset(rdev)) { 498 dev_warn(rdev->dev, 499 "GPU reset failed ! (0xE40=0x%08X, 0x7C0=0x%08X)\n", 500 RREG32(R_000E40_RBBM_STATUS), 501 RREG32(R_0007C0_CP_STAT)); 502 } 503 /* check if cards are posted or not */ 504 if (radeon_boot_test_post_card(rdev) == false) 505 return -EINVAL; 506 507 /* Initialize clocks */ 508 radeon_get_clock_info(rdev->ddev); 509 /* initialize memory controller */ 510 rs400_mc_init(rdev); 511 /* Fence driver */ 512 r = radeon_fence_driver_init(rdev); 513 if (r) 514 return r; 515 r = radeon_irq_kms_init(rdev); 516 if (r) 517 return r; 518 /* Memory manager */ 519 r = radeon_bo_init(rdev); 520 if (r) 521 return r; 522 r = rs400_gart_init(rdev); 523 if (r) 524 return r; 525 r300_set_reg_safe(rdev); 526 rdev->accel_working = true; 527 r = rs400_startup(rdev); 528 if (r) { 529 /* Somethings want wront with the accel init stop accel */ 530 dev_err(rdev->dev, "Disabling GPU acceleration\n"); 531 r100_cp_fini(rdev); 532 r100_wb_fini(rdev); 533 r100_ib_fini(rdev); 534 rs400_gart_fini(rdev); 535 radeon_irq_kms_fini(rdev); 536 rdev->accel_working = false; 537 } 538 return 0; 539 } 540