1 /* 2 ** 3 ** PCI Lower Bus Adapter (LBA) manager 4 ** 5 ** (c) Copyright 1999,2000 Grant Grundler 6 ** (c) Copyright 1999,2000 Hewlett-Packard Company 7 ** 8 ** This program is free software; you can redistribute it and/or modify 9 ** it under the terms of the GNU General Public License as published by 10 ** the Free Software Foundation; either version 2 of the License, or 11 ** (at your option) any later version. 12 ** 13 ** 14 ** This module primarily provides access to PCI bus (config/IOport 15 ** spaces) on platforms with an SBA/LBA chipset. A/B/C/J/L/N-class 16 ** with 4 digit model numbers - eg C3000 (and A400...sigh). 17 ** 18 ** LBA driver isn't as simple as the Dino driver because: 19 ** (a) this chip has substantial bug fixes between revisions 20 ** (Only one Dino bug has a software workaround :^( ) 21 ** (b) has more options which we don't (yet) support (DMA hints, OLARD) 22 ** (c) IRQ support lives in the I/O SAPIC driver (not with PCI driver) 23 ** (d) play nicely with both PAT and "Legacy" PA-RISC firmware (PDC). 24 ** (dino only deals with "Legacy" PDC) 25 ** 26 ** LBA driver passes the I/O SAPIC HPA to the I/O SAPIC driver. 27 ** (I/O SAPIC is integratd in the LBA chip). 28 ** 29 ** FIXME: Add support to SBA and LBA drivers for DMA hint sets 30 ** FIXME: Add support for PCI card hot-plug (OLARD). 31 */ 32 33 #include <linux/delay.h> 34 #include <linux/types.h> 35 #include <linux/kernel.h> 36 #include <linux/spinlock.h> 37 #include <linux/init.h> /* for __init */ 38 #include <linux/pci.h> 39 #include <linux/ioport.h> 40 #include <linux/slab.h> 41 42 #include <asm/byteorder.h> 43 #include <asm/pdc.h> 44 #include <asm/pdcpat.h> 45 #include <asm/page.h> 46 47 #include <asm/ropes.h> 48 #include <asm/hardware.h> /* for register_parisc_driver() stuff */ 49 #include <asm/parisc-device.h> 50 #include <asm/io.h> /* read/write stuff */ 51 52 #undef DEBUG_LBA /* general stuff */ 53 #undef DEBUG_LBA_PORT /* debug I/O Port access */ 54 #undef DEBUG_LBA_CFG /* debug Config Space Access (ie PCI Bus walk) */ 55 #undef DEBUG_LBA_PAT /* debug PCI Resource Mgt code - PDC PAT only */ 56 57 #undef FBB_SUPPORT /* Fast Back-Back xfers - NOT READY YET */ 58 59 60 #ifdef DEBUG_LBA 61 #define DBG(x...) printk(x) 62 #else 63 #define DBG(x...) 64 #endif 65 66 #ifdef DEBUG_LBA_PORT 67 #define DBG_PORT(x...) printk(x) 68 #else 69 #define DBG_PORT(x...) 70 #endif 71 72 #ifdef DEBUG_LBA_CFG 73 #define DBG_CFG(x...) printk(x) 74 #else 75 #define DBG_CFG(x...) 76 #endif 77 78 #ifdef DEBUG_LBA_PAT 79 #define DBG_PAT(x...) printk(x) 80 #else 81 #define DBG_PAT(x...) 82 #endif 83 84 85 /* 86 ** Config accessor functions only pass in the 8-bit bus number and not 87 ** the 8-bit "PCI Segment" number. Each LBA will be assigned a PCI bus 88 ** number based on what firmware wrote into the scratch register. 89 ** 90 ** The "secondary" bus number is set to this before calling 91 ** pci_register_ops(). If any PPB's are present, the scan will 92 ** discover them and update the "secondary" and "subordinate" 93 ** fields in the pci_bus structure. 94 ** 95 ** Changes in the configuration *may* result in a different 96 ** bus number for each LBA depending on what firmware does. 97 */ 98 99 #define MODULE_NAME "LBA" 100 101 /* non-postable I/O port space, densely packed */ 102 #define LBA_PORT_BASE (PCI_F_EXTEND | 0xfee00000UL) 103 static void __iomem *astro_iop_base __read_mostly; 104 105 static u32 lba_t32; 106 107 /* lba flags */ 108 #define LBA_FLAG_SKIP_PROBE 0x10 109 110 #define LBA_SKIP_PROBE(d) ((d)->flags & LBA_FLAG_SKIP_PROBE) 111 112 113 /* Looks nice and keeps the compiler happy */ 114 #define LBA_DEV(d) ((struct lba_device *) (d)) 115 116 117 /* 118 ** Only allow 8 subsidiary busses per LBA 119 ** Problem is the PCI bus numbering is globally shared. 120 */ 121 #define LBA_MAX_NUM_BUSES 8 122 123 /************************************ 124 * LBA register read and write support 125 * 126 * BE WARNED: register writes are posted. 127 * (ie follow writes which must reach HW with a read) 128 */ 129 #define READ_U8(addr) __raw_readb(addr) 130 #define READ_U16(addr) __raw_readw(addr) 131 #define READ_U32(addr) __raw_readl(addr) 132 #define WRITE_U8(value, addr) __raw_writeb(value, addr) 133 #define WRITE_U16(value, addr) __raw_writew(value, addr) 134 #define WRITE_U32(value, addr) __raw_writel(value, addr) 135 136 #define READ_REG8(addr) readb(addr) 137 #define READ_REG16(addr) readw(addr) 138 #define READ_REG32(addr) readl(addr) 139 #define READ_REG64(addr) readq(addr) 140 #define WRITE_REG8(value, addr) writeb(value, addr) 141 #define WRITE_REG16(value, addr) writew(value, addr) 142 #define WRITE_REG32(value, addr) writel(value, addr) 143 144 145 #define LBA_CFG_TOK(bus,dfn) ((u32) ((bus)<<16 | (dfn)<<8)) 146 #define LBA_CFG_BUS(tok) ((u8) ((tok)>>16)) 147 #define LBA_CFG_DEV(tok) ((u8) ((tok)>>11) & 0x1f) 148 #define LBA_CFG_FUNC(tok) ((u8) ((tok)>>8 ) & 0x7) 149 150 151 /* 152 ** Extract LBA (Rope) number from HPA 153 ** REVISIT: 16 ropes for Stretch/Ike? 154 */ 155 #define ROPES_PER_IOC 8 156 #define LBA_NUM(x) ((((unsigned long) x) >> 13) & (ROPES_PER_IOC-1)) 157 158 159 static void 160 lba_dump_res(struct resource *r, int d) 161 { 162 int i; 163 164 if (NULL == r) 165 return; 166 167 printk(KERN_DEBUG "(%p)", r->parent); 168 for (i = d; i ; --i) printk(" "); 169 printk(KERN_DEBUG "%p [%lx,%lx]/%lx\n", r, 170 (long)r->start, (long)r->end, r->flags); 171 lba_dump_res(r->child, d+2); 172 lba_dump_res(r->sibling, d); 173 } 174 175 176 /* 177 ** LBA rev 2.0, 2.1, 2.2, and 3.0 bus walks require a complex 178 ** workaround for cfg cycles: 179 ** -- preserve LBA state 180 ** -- prevent any DMA from occurring 181 ** -- turn on smart mode 182 ** -- probe with config writes before doing config reads 183 ** -- check ERROR_STATUS 184 ** -- clear ERROR_STATUS 185 ** -- restore LBA state 186 ** 187 ** The workaround is only used for device discovery. 188 */ 189 190 static int lba_device_present(u8 bus, u8 dfn, struct lba_device *d) 191 { 192 u8 first_bus = d->hba.hba_bus->busn_res.start; 193 u8 last_sub_bus = d->hba.hba_bus->busn_res.end; 194 195 if ((bus < first_bus) || 196 (bus > last_sub_bus) || 197 ((bus - first_bus) >= LBA_MAX_NUM_BUSES)) { 198 return 0; 199 } 200 201 return 1; 202 } 203 204 205 206 #define LBA_CFG_SETUP(d, tok) { \ 207 /* Save contents of error config register. */ \ 208 error_config = READ_REG32(d->hba.base_addr + LBA_ERROR_CONFIG); \ 209 \ 210 /* Save contents of status control register. */ \ 211 status_control = READ_REG32(d->hba.base_addr + LBA_STAT_CTL); \ 212 \ 213 /* For LBA rev 2.0, 2.1, 2.2, and 3.0, we must disable DMA \ 214 ** arbitration for full bus walks. \ 215 */ \ 216 /* Save contents of arb mask register. */ \ 217 arb_mask = READ_REG32(d->hba.base_addr + LBA_ARB_MASK); \ 218 \ 219 /* \ 220 * Turn off all device arbitration bits (i.e. everything \ 221 * except arbitration enable bit). \ 222 */ \ 223 WRITE_REG32(0x1, d->hba.base_addr + LBA_ARB_MASK); \ 224 \ 225 /* \ 226 * Set the smart mode bit so that master aborts don't cause \ 227 * LBA to go into PCI fatal mode (required). \ 228 */ \ 229 WRITE_REG32(error_config | LBA_SMART_MODE, d->hba.base_addr + LBA_ERROR_CONFIG); \ 230 } 231 232 233 #define LBA_CFG_PROBE(d, tok) { \ 234 /* \ 235 * Setup Vendor ID write and read back the address register \ 236 * to make sure that LBA is the bus master. \ 237 */ \ 238 WRITE_REG32(tok | PCI_VENDOR_ID, (d)->hba.base_addr + LBA_PCI_CFG_ADDR);\ 239 /* \ 240 * Read address register to ensure that LBA is the bus master, \ 241 * which implies that DMA traffic has stopped when DMA arb is off. \ 242 */ \ 243 lba_t32 = READ_REG32((d)->hba.base_addr + LBA_PCI_CFG_ADDR); \ 244 /* \ 245 * Generate a cfg write cycle (will have no affect on \ 246 * Vendor ID register since read-only). \ 247 */ \ 248 WRITE_REG32(~0, (d)->hba.base_addr + LBA_PCI_CFG_DATA); \ 249 /* \ 250 * Make sure write has completed before proceeding further, \ 251 * i.e. before setting clear enable. \ 252 */ \ 253 lba_t32 = READ_REG32((d)->hba.base_addr + LBA_PCI_CFG_ADDR); \ 254 } 255 256 257 /* 258 * HPREVISIT: 259 * -- Can't tell if config cycle got the error. 260 * 261 * OV bit is broken until rev 4.0, so can't use OV bit and 262 * LBA_ERROR_LOG_ADDR to tell if error belongs to config cycle. 263 * 264 * As of rev 4.0, no longer need the error check. 265 * 266 * -- Even if we could tell, we still want to return -1 267 * for **ANY** error (not just master abort). 268 * 269 * -- Only clear non-fatal errors (we don't want to bring 270 * LBA out of pci-fatal mode). 271 * 272 * Actually, there is still a race in which 273 * we could be clearing a fatal error. We will 274 * live with this during our initial bus walk 275 * until rev 4.0 (no driver activity during 276 * initial bus walk). The initial bus walk 277 * has race conditions concerning the use of 278 * smart mode as well. 279 */ 280 281 #define LBA_MASTER_ABORT_ERROR 0xc 282 #define LBA_FATAL_ERROR 0x10 283 284 #define LBA_CFG_MASTER_ABORT_CHECK(d, base, tok, error) { \ 285 u32 error_status = 0; \ 286 /* \ 287 * Set clear enable (CE) bit. Unset by HW when new \ 288 * errors are logged -- LBA HW ERS section 14.3.3). \ 289 */ \ 290 WRITE_REG32(status_control | CLEAR_ERRLOG_ENABLE, base + LBA_STAT_CTL); \ 291 error_status = READ_REG32(base + LBA_ERROR_STATUS); \ 292 if ((error_status & 0x1f) != 0) { \ 293 /* \ 294 * Fail the config read request. \ 295 */ \ 296 error = 1; \ 297 if ((error_status & LBA_FATAL_ERROR) == 0) { \ 298 /* \ 299 * Clear error status (if fatal bit not set) by setting \ 300 * clear error log bit (CL). \ 301 */ \ 302 WRITE_REG32(status_control | CLEAR_ERRLOG, base + LBA_STAT_CTL); \ 303 } \ 304 } \ 305 } 306 307 #define LBA_CFG_TR4_ADDR_SETUP(d, addr) \ 308 WRITE_REG32(((addr) & ~3), (d)->hba.base_addr + LBA_PCI_CFG_ADDR); 309 310 #define LBA_CFG_ADDR_SETUP(d, addr) { \ 311 WRITE_REG32(((addr) & ~3), (d)->hba.base_addr + LBA_PCI_CFG_ADDR); \ 312 /* \ 313 * Read address register to ensure that LBA is the bus master, \ 314 * which implies that DMA traffic has stopped when DMA arb is off. \ 315 */ \ 316 lba_t32 = READ_REG32((d)->hba.base_addr + LBA_PCI_CFG_ADDR); \ 317 } 318 319 320 #define LBA_CFG_RESTORE(d, base) { \ 321 /* \ 322 * Restore status control register (turn off clear enable). \ 323 */ \ 324 WRITE_REG32(status_control, base + LBA_STAT_CTL); \ 325 /* \ 326 * Restore error config register (turn off smart mode). \ 327 */ \ 328 WRITE_REG32(error_config, base + LBA_ERROR_CONFIG); \ 329 /* \ 330 * Restore arb mask register (reenables DMA arbitration). \ 331 */ \ 332 WRITE_REG32(arb_mask, base + LBA_ARB_MASK); \ 333 } 334 335 336 337 static unsigned int 338 lba_rd_cfg(struct lba_device *d, u32 tok, u8 reg, u32 size) 339 { 340 u32 data = ~0U; 341 int error = 0; 342 u32 arb_mask = 0; /* used by LBA_CFG_SETUP/RESTORE */ 343 u32 error_config = 0; /* used by LBA_CFG_SETUP/RESTORE */ 344 u32 status_control = 0; /* used by LBA_CFG_SETUP/RESTORE */ 345 346 LBA_CFG_SETUP(d, tok); 347 LBA_CFG_PROBE(d, tok); 348 LBA_CFG_MASTER_ABORT_CHECK(d, d->hba.base_addr, tok, error); 349 if (!error) { 350 void __iomem *data_reg = d->hba.base_addr + LBA_PCI_CFG_DATA; 351 352 LBA_CFG_ADDR_SETUP(d, tok | reg); 353 switch (size) { 354 case 1: data = (u32) READ_REG8(data_reg + (reg & 3)); break; 355 case 2: data = (u32) READ_REG16(data_reg+ (reg & 2)); break; 356 case 4: data = READ_REG32(data_reg); break; 357 } 358 } 359 LBA_CFG_RESTORE(d, d->hba.base_addr); 360 return(data); 361 } 362 363 364 static int elroy_cfg_read(struct pci_bus *bus, unsigned int devfn, int pos, int size, u32 *data) 365 { 366 struct lba_device *d = LBA_DEV(parisc_walk_tree(bus->bridge)); 367 u32 local_bus = (bus->parent == NULL) ? 0 : bus->busn_res.start; 368 u32 tok = LBA_CFG_TOK(local_bus, devfn); 369 void __iomem *data_reg = d->hba.base_addr + LBA_PCI_CFG_DATA; 370 371 if ((pos > 255) || (devfn > 255)) 372 return -EINVAL; 373 374 /* FIXME: B2K/C3600 workaround is always use old method... */ 375 /* if (!LBA_SKIP_PROBE(d)) */ { 376 /* original - Generate config cycle on broken elroy 377 with risk we will miss PCI bus errors. */ 378 *data = lba_rd_cfg(d, tok, pos, size); 379 DBG_CFG("%s(%x+%2x) -> 0x%x (a)\n", __func__, tok, pos, *data); 380 return 0; 381 } 382 383 if (LBA_SKIP_PROBE(d) && !lba_device_present(bus->busn_res.start, devfn, d)) { 384 DBG_CFG("%s(%x+%2x) -> -1 (b)\n", __func__, tok, pos); 385 /* either don't want to look or know device isn't present. */ 386 *data = ~0U; 387 return(0); 388 } 389 390 /* Basic Algorithm 391 ** Should only get here on fully working LBA rev. 392 ** This is how simple the code should have been. 393 */ 394 LBA_CFG_ADDR_SETUP(d, tok | pos); 395 switch(size) { 396 case 1: *data = READ_REG8 (data_reg + (pos & 3)); break; 397 case 2: *data = READ_REG16(data_reg + (pos & 2)); break; 398 case 4: *data = READ_REG32(data_reg); break; 399 } 400 DBG_CFG("%s(%x+%2x) -> 0x%x (c)\n", __func__, tok, pos, *data); 401 return 0; 402 } 403 404 405 static void 406 lba_wr_cfg(struct lba_device *d, u32 tok, u8 reg, u32 data, u32 size) 407 { 408 int error = 0; 409 u32 arb_mask = 0; 410 u32 error_config = 0; 411 u32 status_control = 0; 412 void __iomem *data_reg = d->hba.base_addr + LBA_PCI_CFG_DATA; 413 414 LBA_CFG_SETUP(d, tok); 415 LBA_CFG_ADDR_SETUP(d, tok | reg); 416 switch (size) { 417 case 1: WRITE_REG8 (data, data_reg + (reg & 3)); break; 418 case 2: WRITE_REG16(data, data_reg + (reg & 2)); break; 419 case 4: WRITE_REG32(data, data_reg); break; 420 } 421 LBA_CFG_MASTER_ABORT_CHECK(d, d->hba.base_addr, tok, error); 422 LBA_CFG_RESTORE(d, d->hba.base_addr); 423 } 424 425 426 /* 427 * LBA 4.0 config write code implements non-postable semantics 428 * by doing a read of CONFIG ADDR after the write. 429 */ 430 431 static int elroy_cfg_write(struct pci_bus *bus, unsigned int devfn, int pos, int size, u32 data) 432 { 433 struct lba_device *d = LBA_DEV(parisc_walk_tree(bus->bridge)); 434 u32 local_bus = (bus->parent == NULL) ? 0 : bus->busn_res.start; 435 u32 tok = LBA_CFG_TOK(local_bus,devfn); 436 437 if ((pos > 255) || (devfn > 255)) 438 return -EINVAL; 439 440 if (!LBA_SKIP_PROBE(d)) { 441 /* Original Workaround */ 442 lba_wr_cfg(d, tok, pos, (u32) data, size); 443 DBG_CFG("%s(%x+%2x) = 0x%x (a)\n", __func__, tok, pos,data); 444 return 0; 445 } 446 447 if (LBA_SKIP_PROBE(d) && (!lba_device_present(bus->busn_res.start, devfn, d))) { 448 DBG_CFG("%s(%x+%2x) = 0x%x (b)\n", __func__, tok, pos,data); 449 return 1; /* New Workaround */ 450 } 451 452 DBG_CFG("%s(%x+%2x) = 0x%x (c)\n", __func__, tok, pos, data); 453 454 /* Basic Algorithm */ 455 LBA_CFG_ADDR_SETUP(d, tok | pos); 456 switch(size) { 457 case 1: WRITE_REG8 (data, d->hba.base_addr + LBA_PCI_CFG_DATA + (pos & 3)); 458 break; 459 case 2: WRITE_REG16(data, d->hba.base_addr + LBA_PCI_CFG_DATA + (pos & 2)); 460 break; 461 case 4: WRITE_REG32(data, d->hba.base_addr + LBA_PCI_CFG_DATA); 462 break; 463 } 464 /* flush posted write */ 465 lba_t32 = READ_REG32(d->hba.base_addr + LBA_PCI_CFG_ADDR); 466 return 0; 467 } 468 469 470 static struct pci_ops elroy_cfg_ops = { 471 .read = elroy_cfg_read, 472 .write = elroy_cfg_write, 473 }; 474 475 /* 476 * The mercury_cfg_ops are slightly misnamed; they're also used for Elroy 477 * TR4.0 as no additional bugs were found in this areea between Elroy and 478 * Mercury 479 */ 480 481 static int mercury_cfg_read(struct pci_bus *bus, unsigned int devfn, int pos, int size, u32 *data) 482 { 483 struct lba_device *d = LBA_DEV(parisc_walk_tree(bus->bridge)); 484 u32 local_bus = (bus->parent == NULL) ? 0 : bus->busn_res.start; 485 u32 tok = LBA_CFG_TOK(local_bus, devfn); 486 void __iomem *data_reg = d->hba.base_addr + LBA_PCI_CFG_DATA; 487 488 if ((pos > 255) || (devfn > 255)) 489 return -EINVAL; 490 491 LBA_CFG_TR4_ADDR_SETUP(d, tok | pos); 492 switch(size) { 493 case 1: 494 *data = READ_REG8(data_reg + (pos & 3)); 495 break; 496 case 2: 497 *data = READ_REG16(data_reg + (pos & 2)); 498 break; 499 case 4: 500 *data = READ_REG32(data_reg); break; 501 break; 502 } 503 504 DBG_CFG("mercury_cfg_read(%x+%2x) -> 0x%x\n", tok, pos, *data); 505 return 0; 506 } 507 508 /* 509 * LBA 4.0 config write code implements non-postable semantics 510 * by doing a read of CONFIG ADDR after the write. 511 */ 512 513 static int mercury_cfg_write(struct pci_bus *bus, unsigned int devfn, int pos, int size, u32 data) 514 { 515 struct lba_device *d = LBA_DEV(parisc_walk_tree(bus->bridge)); 516 void __iomem *data_reg = d->hba.base_addr + LBA_PCI_CFG_DATA; 517 u32 local_bus = (bus->parent == NULL) ? 0 : bus->busn_res.start; 518 u32 tok = LBA_CFG_TOK(local_bus,devfn); 519 520 if ((pos > 255) || (devfn > 255)) 521 return -EINVAL; 522 523 DBG_CFG("%s(%x+%2x) <- 0x%x (c)\n", __func__, tok, pos, data); 524 525 LBA_CFG_TR4_ADDR_SETUP(d, tok | pos); 526 switch(size) { 527 case 1: 528 WRITE_REG8 (data, data_reg + (pos & 3)); 529 break; 530 case 2: 531 WRITE_REG16(data, data_reg + (pos & 2)); 532 break; 533 case 4: 534 WRITE_REG32(data, data_reg); 535 break; 536 } 537 538 /* flush posted write */ 539 lba_t32 = READ_U32(d->hba.base_addr + LBA_PCI_CFG_ADDR); 540 return 0; 541 } 542 543 static struct pci_ops mercury_cfg_ops = { 544 .read = mercury_cfg_read, 545 .write = mercury_cfg_write, 546 }; 547 548 549 static void 550 lba_bios_init(void) 551 { 552 DBG(MODULE_NAME ": lba_bios_init\n"); 553 } 554 555 556 #ifdef CONFIG_64BIT 557 558 /* 559 * truncate_pat_collision: Deal with overlaps or outright collisions 560 * between PAT PDC reported ranges. 561 * 562 * Broken PA8800 firmware will report lmmio range that 563 * overlaps with CPU HPA. Just truncate the lmmio range. 564 * 565 * BEWARE: conflicts with this lmmio range may be an 566 * elmmio range which is pointing down another rope. 567 * 568 * FIXME: only deals with one collision per range...theoretically we 569 * could have several. Supporting more than one collision will get messy. 570 */ 571 static unsigned long 572 truncate_pat_collision(struct resource *root, struct resource *new) 573 { 574 unsigned long start = new->start; 575 unsigned long end = new->end; 576 struct resource *tmp = root->child; 577 578 if (end <= start || start < root->start || !tmp) 579 return 0; 580 581 /* find first overlap */ 582 while (tmp && tmp->end < start) 583 tmp = tmp->sibling; 584 585 /* no entries overlap */ 586 if (!tmp) return 0; 587 588 /* found one that starts behind the new one 589 ** Don't need to do anything. 590 */ 591 if (tmp->start >= end) return 0; 592 593 if (tmp->start <= start) { 594 /* "front" of new one overlaps */ 595 new->start = tmp->end + 1; 596 597 if (tmp->end >= end) { 598 /* AACCKK! totally overlaps! drop this range. */ 599 return 1; 600 } 601 } 602 603 if (tmp->end < end ) { 604 /* "end" of new one overlaps */ 605 new->end = tmp->start - 1; 606 } 607 608 printk(KERN_WARNING "LBA: Truncating lmmio_space [%lx/%lx] " 609 "to [%lx,%lx]\n", 610 start, end, 611 (long)new->start, (long)new->end ); 612 613 return 0; /* truncation successful */ 614 } 615 616 /* 617 * extend_lmmio_len: extend lmmio range to maximum length 618 * 619 * This is needed at least on C8000 systems to get the ATI FireGL card 620 * working. On other systems we will currently not extend the lmmio space. 621 */ 622 static unsigned long 623 extend_lmmio_len(unsigned long start, unsigned long end, unsigned long lba_len) 624 { 625 struct resource *tmp; 626 627 /* exit if not a C8000 */ 628 if (boot_cpu_data.cpu_type < mako) 629 return end; 630 631 pr_debug("LMMIO mismatch: PAT length = 0x%lx, MASK register = 0x%lx\n", 632 end - start, lba_len); 633 634 lba_len = min(lba_len+1, 256UL*1024*1024); /* limit to 256 MB */ 635 636 pr_debug("LBA: lmmio_space [0x%lx-0x%lx] - original\n", start, end); 637 638 639 end += lba_len; 640 if (end < start) /* fix overflow */ 641 end = -1ULL; 642 643 pr_debug("LBA: lmmio_space [0x%lx-0x%lx] - current\n", start, end); 644 645 /* first overlap */ 646 for (tmp = iomem_resource.child; tmp; tmp = tmp->sibling) { 647 pr_debug("LBA: testing %pR\n", tmp); 648 if (tmp->start == start) 649 continue; /* ignore ourself */ 650 if (tmp->end < start) 651 continue; 652 if (tmp->start > end) 653 continue; 654 if (end >= tmp->start) 655 end = tmp->start - 1; 656 } 657 658 pr_info("LBA: lmmio_space [0x%lx-0x%lx] - new\n", start, end); 659 660 /* return new end */ 661 return end; 662 } 663 664 #else 665 #define truncate_pat_collision(r,n) (0) 666 #endif 667 668 /* 669 ** The algorithm is generic code. 670 ** But it needs to access local data structures to get the IRQ base. 671 ** Could make this a "pci_fixup_irq(bus, region)" but not sure 672 ** it's worth it. 673 ** 674 ** Called by do_pci_scan_bus() immediately after each PCI bus is walked. 675 ** Resources aren't allocated until recursive buswalk below HBA is completed. 676 */ 677 static void 678 lba_fixup_bus(struct pci_bus *bus) 679 { 680 struct pci_dev *dev; 681 #ifdef FBB_SUPPORT 682 u16 status; 683 #endif 684 struct lba_device *ldev = LBA_DEV(parisc_walk_tree(bus->bridge)); 685 686 DBG("lba_fixup_bus(0x%p) bus %d platform_data 0x%p\n", 687 bus, (int)bus->busn_res.start, bus->bridge->platform_data); 688 689 /* 690 ** Properly Setup MMIO resources for this bus. 691 ** pci_alloc_primary_bus() mangles this. 692 */ 693 if (bus->parent) { 694 int i; 695 /* PCI-PCI Bridge */ 696 pci_read_bridge_bases(bus); 697 for (i = PCI_BRIDGE_RESOURCES; i < PCI_NUM_RESOURCES; i++) 698 pci_claim_bridge_resource(bus->self, i); 699 } else { 700 /* Host-PCI Bridge */ 701 int err; 702 703 DBG("lba_fixup_bus() %s [%lx/%lx]/%lx\n", 704 ldev->hba.io_space.name, 705 ldev->hba.io_space.start, ldev->hba.io_space.end, 706 ldev->hba.io_space.flags); 707 DBG("lba_fixup_bus() %s [%lx/%lx]/%lx\n", 708 ldev->hba.lmmio_space.name, 709 ldev->hba.lmmio_space.start, ldev->hba.lmmio_space.end, 710 ldev->hba.lmmio_space.flags); 711 712 err = request_resource(&ioport_resource, &(ldev->hba.io_space)); 713 if (err < 0) { 714 lba_dump_res(&ioport_resource, 2); 715 BUG(); 716 } 717 718 if (ldev->hba.elmmio_space.flags) { 719 err = request_resource(&iomem_resource, 720 &(ldev->hba.elmmio_space)); 721 if (err < 0) { 722 723 printk("FAILED: lba_fixup_bus() request for " 724 "elmmio_space [%lx/%lx]\n", 725 (long)ldev->hba.elmmio_space.start, 726 (long)ldev->hba.elmmio_space.end); 727 728 /* lba_dump_res(&iomem_resource, 2); */ 729 /* BUG(); */ 730 } 731 } 732 733 if (ldev->hba.lmmio_space.flags) { 734 err = request_resource(&iomem_resource, &(ldev->hba.lmmio_space)); 735 if (err < 0) { 736 printk(KERN_ERR "FAILED: lba_fixup_bus() request for " 737 "lmmio_space [%lx/%lx]\n", 738 (long)ldev->hba.lmmio_space.start, 739 (long)ldev->hba.lmmio_space.end); 740 } 741 } 742 743 #ifdef CONFIG_64BIT 744 /* GMMIO is distributed range. Every LBA/Rope gets part it. */ 745 if (ldev->hba.gmmio_space.flags) { 746 err = request_resource(&iomem_resource, &(ldev->hba.gmmio_space)); 747 if (err < 0) { 748 printk("FAILED: lba_fixup_bus() request for " 749 "gmmio_space [%lx/%lx]\n", 750 (long)ldev->hba.gmmio_space.start, 751 (long)ldev->hba.gmmio_space.end); 752 lba_dump_res(&iomem_resource, 2); 753 BUG(); 754 } 755 } 756 #endif 757 758 } 759 760 list_for_each_entry(dev, &bus->devices, bus_list) { 761 int i; 762 763 DBG("lba_fixup_bus() %s\n", pci_name(dev)); 764 765 /* Virtualize Device/Bridge Resources. */ 766 for (i = 0; i < PCI_BRIDGE_RESOURCES; i++) { 767 struct resource *res = &dev->resource[i]; 768 769 /* If resource not allocated - skip it */ 770 if (!res->start) 771 continue; 772 773 /* 774 ** FIXME: this will result in whinging for devices 775 ** that share expansion ROMs (think quad tulip), but 776 ** isn't harmful. 777 */ 778 pci_claim_resource(dev, i); 779 } 780 781 #ifdef FBB_SUPPORT 782 /* 783 ** If one device does not support FBB transfers, 784 ** No one on the bus can be allowed to use them. 785 */ 786 (void) pci_read_config_word(dev, PCI_STATUS, &status); 787 bus->bridge_ctl &= ~(status & PCI_STATUS_FAST_BACK); 788 #endif 789 790 /* 791 ** P2PB's have no IRQs. ignore them. 792 */ 793 if ((dev->class >> 8) == PCI_CLASS_BRIDGE_PCI) { 794 pcibios_init_bridge(dev); 795 continue; 796 } 797 798 /* Adjust INTERRUPT_LINE for this dev */ 799 iosapic_fixup_irq(ldev->iosapic_obj, dev); 800 } 801 802 #ifdef FBB_SUPPORT 803 /* FIXME/REVISIT - finish figuring out to set FBB on both 804 ** pci_setup_bridge() clobbers PCI_BRIDGE_CONTROL. 805 ** Can't fixup here anyway....garr... 806 */ 807 if (fbb_enable) { 808 if (bus->parent) { 809 u8 control; 810 /* enable on PPB */ 811 (void) pci_read_config_byte(bus->self, PCI_BRIDGE_CONTROL, &control); 812 (void) pci_write_config_byte(bus->self, PCI_BRIDGE_CONTROL, control | PCI_STATUS_FAST_BACK); 813 814 } else { 815 /* enable on LBA */ 816 } 817 fbb_enable = PCI_COMMAND_FAST_BACK; 818 } 819 820 /* Lastly enable FBB/PERR/SERR on all devices too */ 821 list_for_each_entry(dev, &bus->devices, bus_list) { 822 (void) pci_read_config_word(dev, PCI_COMMAND, &status); 823 status |= PCI_COMMAND_PARITY | PCI_COMMAND_SERR | fbb_enable; 824 (void) pci_write_config_word(dev, PCI_COMMAND, status); 825 } 826 #endif 827 } 828 829 830 static struct pci_bios_ops lba_bios_ops = { 831 .init = lba_bios_init, 832 .fixup_bus = lba_fixup_bus, 833 }; 834 835 836 837 838 /******************************************************* 839 ** 840 ** LBA Sprockets "I/O Port" Space Accessor Functions 841 ** 842 ** This set of accessor functions is intended for use with 843 ** "legacy firmware" (ie Sprockets on Allegro/Forte boxes). 844 ** 845 ** Many PCI devices don't require use of I/O port space (eg Tulip, 846 ** NCR720) since they export the same registers to both MMIO and 847 ** I/O port space. In general I/O port space is slower than 848 ** MMIO since drivers are designed so PIO writes can be posted. 849 ** 850 ********************************************************/ 851 852 #define LBA_PORT_IN(size, mask) \ 853 static u##size lba_astro_in##size (struct pci_hba_data *d, u16 addr) \ 854 { \ 855 u##size t; \ 856 t = READ_REG##size(astro_iop_base + addr); \ 857 DBG_PORT(" 0x%x\n", t); \ 858 return (t); \ 859 } 860 861 LBA_PORT_IN( 8, 3) 862 LBA_PORT_IN(16, 2) 863 LBA_PORT_IN(32, 0) 864 865 866 867 /* 868 ** BUG X4107: Ordering broken - DMA RD return can bypass PIO WR 869 ** 870 ** Fixed in Elroy 2.2. The READ_U32(..., LBA_FUNC_ID) below is 871 ** guarantee non-postable completion semantics - not avoid X4107. 872 ** The READ_U32 only guarantees the write data gets to elroy but 873 ** out to the PCI bus. We can't read stuff from I/O port space 874 ** since we don't know what has side-effects. Attempting to read 875 ** from configuration space would be suicidal given the number of 876 ** bugs in that elroy functionality. 877 ** 878 ** Description: 879 ** DMA read results can improperly pass PIO writes (X4107). The 880 ** result of this bug is that if a processor modifies a location in 881 ** memory after having issued PIO writes, the PIO writes are not 882 ** guaranteed to be completed before a PCI device is allowed to see 883 ** the modified data in a DMA read. 884 ** 885 ** Note that IKE bug X3719 in TR1 IKEs will result in the same 886 ** symptom. 887 ** 888 ** Workaround: 889 ** The workaround for this bug is to always follow a PIO write with 890 ** a PIO read to the same bus before starting DMA on that PCI bus. 891 ** 892 */ 893 #define LBA_PORT_OUT(size, mask) \ 894 static void lba_astro_out##size (struct pci_hba_data *d, u16 addr, u##size val) \ 895 { \ 896 DBG_PORT("%s(0x%p, 0x%x, 0x%x)\n", __func__, d, addr, val); \ 897 WRITE_REG##size(val, astro_iop_base + addr); \ 898 if (LBA_DEV(d)->hw_rev < 3) \ 899 lba_t32 = READ_U32(d->base_addr + LBA_FUNC_ID); \ 900 } 901 902 LBA_PORT_OUT( 8, 3) 903 LBA_PORT_OUT(16, 2) 904 LBA_PORT_OUT(32, 0) 905 906 907 static struct pci_port_ops lba_astro_port_ops = { 908 .inb = lba_astro_in8, 909 .inw = lba_astro_in16, 910 .inl = lba_astro_in32, 911 .outb = lba_astro_out8, 912 .outw = lba_astro_out16, 913 .outl = lba_astro_out32 914 }; 915 916 917 #ifdef CONFIG_64BIT 918 #define PIOP_TO_GMMIO(lba, addr) \ 919 ((lba)->iop_base + (((addr)&0xFFFC)<<10) + ((addr)&3)) 920 921 /******************************************************* 922 ** 923 ** LBA PAT "I/O Port" Space Accessor Functions 924 ** 925 ** This set of accessor functions is intended for use with 926 ** "PAT PDC" firmware (ie Prelude/Rhapsody/Piranha boxes). 927 ** 928 ** This uses the PIOP space located in the first 64MB of GMMIO. 929 ** Each rope gets a full 64*KB* (ie 4 bytes per page) this way. 930 ** bits 1:0 stay the same. bits 15:2 become 25:12. 931 ** Then add the base and we can generate an I/O Port cycle. 932 ********************************************************/ 933 #undef LBA_PORT_IN 934 #define LBA_PORT_IN(size, mask) \ 935 static u##size lba_pat_in##size (struct pci_hba_data *l, u16 addr) \ 936 { \ 937 u##size t; \ 938 DBG_PORT("%s(0x%p, 0x%x) ->", __func__, l, addr); \ 939 t = READ_REG##size(PIOP_TO_GMMIO(LBA_DEV(l), addr)); \ 940 DBG_PORT(" 0x%x\n", t); \ 941 return (t); \ 942 } 943 944 LBA_PORT_IN( 8, 3) 945 LBA_PORT_IN(16, 2) 946 LBA_PORT_IN(32, 0) 947 948 949 #undef LBA_PORT_OUT 950 #define LBA_PORT_OUT(size, mask) \ 951 static void lba_pat_out##size (struct pci_hba_data *l, u16 addr, u##size val) \ 952 { \ 953 void __iomem *where = PIOP_TO_GMMIO(LBA_DEV(l), addr); \ 954 DBG_PORT("%s(0x%p, 0x%x, 0x%x)\n", __func__, l, addr, val); \ 955 WRITE_REG##size(val, where); \ 956 /* flush the I/O down to the elroy at least */ \ 957 lba_t32 = READ_U32(l->base_addr + LBA_FUNC_ID); \ 958 } 959 960 LBA_PORT_OUT( 8, 3) 961 LBA_PORT_OUT(16, 2) 962 LBA_PORT_OUT(32, 0) 963 964 965 static struct pci_port_ops lba_pat_port_ops = { 966 .inb = lba_pat_in8, 967 .inw = lba_pat_in16, 968 .inl = lba_pat_in32, 969 .outb = lba_pat_out8, 970 .outw = lba_pat_out16, 971 .outl = lba_pat_out32 972 }; 973 974 975 976 /* 977 ** make range information from PDC available to PCI subsystem. 978 ** We make the PDC call here in order to get the PCI bus range 979 ** numbers. The rest will get forwarded in pcibios_fixup_bus(). 980 ** We don't have a struct pci_bus assigned to us yet. 981 */ 982 static void 983 lba_pat_resources(struct parisc_device *pa_dev, struct lba_device *lba_dev) 984 { 985 unsigned long bytecnt; 986 long io_count; 987 long status; /* PDC return status */ 988 long pa_count; 989 pdc_pat_cell_mod_maddr_block_t *pa_pdc_cell; /* PA_VIEW */ 990 pdc_pat_cell_mod_maddr_block_t *io_pdc_cell; /* IO_VIEW */ 991 int i; 992 993 pa_pdc_cell = kzalloc(sizeof(pdc_pat_cell_mod_maddr_block_t), GFP_KERNEL); 994 if (!pa_pdc_cell) 995 return; 996 997 io_pdc_cell = kzalloc(sizeof(pdc_pat_cell_mod_maddr_block_t), GFP_KERNEL); 998 if (!io_pdc_cell) { 999 kfree(pa_pdc_cell); 1000 return; 1001 } 1002 1003 /* return cell module (IO view) */ 1004 status = pdc_pat_cell_module(&bytecnt, pa_dev->pcell_loc, pa_dev->mod_index, 1005 PA_VIEW, pa_pdc_cell); 1006 pa_count = pa_pdc_cell->mod[1]; 1007 1008 status |= pdc_pat_cell_module(&bytecnt, pa_dev->pcell_loc, pa_dev->mod_index, 1009 IO_VIEW, io_pdc_cell); 1010 io_count = io_pdc_cell->mod[1]; 1011 1012 /* We've already done this once for device discovery...*/ 1013 if (status != PDC_OK) { 1014 panic("pdc_pat_cell_module() call failed for LBA!\n"); 1015 } 1016 1017 if (PAT_GET_ENTITY(pa_pdc_cell->mod_info) != PAT_ENTITY_LBA) { 1018 panic("pdc_pat_cell_module() entity returned != PAT_ENTITY_LBA!\n"); 1019 } 1020 1021 /* 1022 ** Inspect the resources PAT tells us about 1023 */ 1024 for (i = 0; i < pa_count; i++) { 1025 struct { 1026 unsigned long type; 1027 unsigned long start; 1028 unsigned long end; /* aka finish */ 1029 } *p, *io; 1030 struct resource *r; 1031 1032 p = (void *) &(pa_pdc_cell->mod[2+i*3]); 1033 io = (void *) &(io_pdc_cell->mod[2+i*3]); 1034 1035 /* Convert the PAT range data to PCI "struct resource" */ 1036 switch(p->type & 0xff) { 1037 case PAT_PBNUM: 1038 lba_dev->hba.bus_num.start = p->start; 1039 lba_dev->hba.bus_num.end = p->end; 1040 lba_dev->hba.bus_num.flags = IORESOURCE_BUS; 1041 break; 1042 1043 case PAT_LMMIO: 1044 /* used to fix up pre-initialized MEM BARs */ 1045 if (!lba_dev->hba.lmmio_space.flags) { 1046 unsigned long lba_len; 1047 1048 lba_len = ~READ_REG32(lba_dev->hba.base_addr 1049 + LBA_LMMIO_MASK); 1050 if ((p->end - p->start) != lba_len) 1051 p->end = extend_lmmio_len(p->start, 1052 p->end, lba_len); 1053 1054 sprintf(lba_dev->hba.lmmio_name, 1055 "PCI%02x LMMIO", 1056 (int)lba_dev->hba.bus_num.start); 1057 lba_dev->hba.lmmio_space_offset = p->start - 1058 io->start; 1059 r = &lba_dev->hba.lmmio_space; 1060 r->name = lba_dev->hba.lmmio_name; 1061 } else if (!lba_dev->hba.elmmio_space.flags) { 1062 sprintf(lba_dev->hba.elmmio_name, 1063 "PCI%02x ELMMIO", 1064 (int)lba_dev->hba.bus_num.start); 1065 r = &lba_dev->hba.elmmio_space; 1066 r->name = lba_dev->hba.elmmio_name; 1067 } else { 1068 printk(KERN_WARNING MODULE_NAME 1069 " only supports 2 LMMIO resources!\n"); 1070 break; 1071 } 1072 1073 r->start = p->start; 1074 r->end = p->end; 1075 r->flags = IORESOURCE_MEM; 1076 r->parent = r->sibling = r->child = NULL; 1077 break; 1078 1079 case PAT_GMMIO: 1080 /* MMIO space > 4GB phys addr; for 64-bit BAR */ 1081 sprintf(lba_dev->hba.gmmio_name, "PCI%02x GMMIO", 1082 (int)lba_dev->hba.bus_num.start); 1083 r = &lba_dev->hba.gmmio_space; 1084 r->name = lba_dev->hba.gmmio_name; 1085 r->start = p->start; 1086 r->end = p->end; 1087 r->flags = IORESOURCE_MEM; 1088 r->parent = r->sibling = r->child = NULL; 1089 break; 1090 1091 case PAT_NPIOP: 1092 printk(KERN_WARNING MODULE_NAME 1093 " range[%d] : ignoring NPIOP (0x%lx)\n", 1094 i, p->start); 1095 break; 1096 1097 case PAT_PIOP: 1098 /* 1099 ** Postable I/O port space is per PCI host adapter. 1100 ** base of 64MB PIOP region 1101 */ 1102 lba_dev->iop_base = ioremap_nocache(p->start, 64 * 1024 * 1024); 1103 1104 sprintf(lba_dev->hba.io_name, "PCI%02x Ports", 1105 (int)lba_dev->hba.bus_num.start); 1106 r = &lba_dev->hba.io_space; 1107 r->name = lba_dev->hba.io_name; 1108 r->start = HBA_PORT_BASE(lba_dev->hba.hba_num); 1109 r->end = r->start + HBA_PORT_SPACE_SIZE - 1; 1110 r->flags = IORESOURCE_IO; 1111 r->parent = r->sibling = r->child = NULL; 1112 break; 1113 1114 default: 1115 printk(KERN_WARNING MODULE_NAME 1116 " range[%d] : unknown pat range type (0x%lx)\n", 1117 i, p->type & 0xff); 1118 break; 1119 } 1120 } 1121 1122 kfree(pa_pdc_cell); 1123 kfree(io_pdc_cell); 1124 } 1125 #else 1126 /* keep compiler from complaining about missing declarations */ 1127 #define lba_pat_port_ops lba_astro_port_ops 1128 #define lba_pat_resources(pa_dev, lba_dev) 1129 #endif /* CONFIG_64BIT */ 1130 1131 1132 extern void sba_distributed_lmmio(struct parisc_device *, struct resource *); 1133 extern void sba_directed_lmmio(struct parisc_device *, struct resource *); 1134 1135 1136 static void 1137 lba_legacy_resources(struct parisc_device *pa_dev, struct lba_device *lba_dev) 1138 { 1139 struct resource *r; 1140 int lba_num; 1141 1142 lba_dev->hba.lmmio_space_offset = PCI_F_EXTEND; 1143 1144 /* 1145 ** With "legacy" firmware, the lowest byte of FW_SCRATCH 1146 ** represents bus->secondary and the second byte represents 1147 ** bus->subsidiary (i.e. highest PPB programmed by firmware). 1148 ** PCI bus walk *should* end up with the same result. 1149 ** FIXME: But we don't have sanity checks in PCI or LBA. 1150 */ 1151 lba_num = READ_REG32(lba_dev->hba.base_addr + LBA_FW_SCRATCH); 1152 r = &(lba_dev->hba.bus_num); 1153 r->name = "LBA PCI Busses"; 1154 r->start = lba_num & 0xff; 1155 r->end = (lba_num>>8) & 0xff; 1156 r->flags = IORESOURCE_BUS; 1157 1158 /* Set up local PCI Bus resources - we don't need them for 1159 ** Legacy boxes but it's nice to see in /proc/iomem. 1160 */ 1161 r = &(lba_dev->hba.lmmio_space); 1162 sprintf(lba_dev->hba.lmmio_name, "PCI%02x LMMIO", 1163 (int)lba_dev->hba.bus_num.start); 1164 r->name = lba_dev->hba.lmmio_name; 1165 1166 #if 1 1167 /* We want the CPU -> IO routing of addresses. 1168 * The SBA BASE/MASK registers control CPU -> IO routing. 1169 * Ask SBA what is routed to this rope/LBA. 1170 */ 1171 sba_distributed_lmmio(pa_dev, r); 1172 #else 1173 /* 1174 * The LBA BASE/MASK registers control IO -> System routing. 1175 * 1176 * The following code works but doesn't get us what we want. 1177 * Well, only because firmware (v5.0) on C3000 doesn't program 1178 * the LBA BASE/MASE registers to be the exact inverse of 1179 * the corresponding SBA registers. Other Astro/Pluto 1180 * based platform firmware may do it right. 1181 * 1182 * Should someone want to mess with MSI, they may need to 1183 * reprogram LBA BASE/MASK registers. Thus preserve the code 1184 * below until MSI is known to work on C3000/A500/N4000/RP3440. 1185 * 1186 * Using the code below, /proc/iomem shows: 1187 * ... 1188 * f0000000-f0ffffff : PCI00 LMMIO 1189 * f05d0000-f05d0000 : lcd_data 1190 * f05d0008-f05d0008 : lcd_cmd 1191 * f1000000-f1ffffff : PCI01 LMMIO 1192 * f4000000-f4ffffff : PCI02 LMMIO 1193 * f4000000-f4001fff : sym53c8xx 1194 * f4002000-f4003fff : sym53c8xx 1195 * f4004000-f40043ff : sym53c8xx 1196 * f4005000-f40053ff : sym53c8xx 1197 * f4007000-f4007fff : ohci_hcd 1198 * f4008000-f40083ff : tulip 1199 * f6000000-f6ffffff : PCI03 LMMIO 1200 * f8000000-fbffffff : PCI00 ELMMIO 1201 * fa100000-fa4fffff : stifb mmio 1202 * fb000000-fb1fffff : stifb fb 1203 * 1204 * But everything listed under PCI02 actually lives under PCI00. 1205 * This is clearly wrong. 1206 * 1207 * Asking SBA how things are routed tells the correct story: 1208 * LMMIO_BASE/MASK/ROUTE f4000001 fc000000 00000000 1209 * DIR0_BASE/MASK/ROUTE fa000001 fe000000 00000006 1210 * DIR1_BASE/MASK/ROUTE f9000001 ff000000 00000004 1211 * DIR2_BASE/MASK/ROUTE f0000000 fc000000 00000000 1212 * DIR3_BASE/MASK/ROUTE f0000000 fc000000 00000000 1213 * 1214 * Which looks like this in /proc/iomem: 1215 * f4000000-f47fffff : PCI00 LMMIO 1216 * f4000000-f4001fff : sym53c8xx 1217 * ...[deteled core devices - same as above]... 1218 * f4008000-f40083ff : tulip 1219 * f4800000-f4ffffff : PCI01 LMMIO 1220 * f6000000-f67fffff : PCI02 LMMIO 1221 * f7000000-f77fffff : PCI03 LMMIO 1222 * f9000000-f9ffffff : PCI02 ELMMIO 1223 * fa000000-fbffffff : PCI03 ELMMIO 1224 * fa100000-fa4fffff : stifb mmio 1225 * fb000000-fb1fffff : stifb fb 1226 * 1227 * ie all Built-in core are under now correctly under PCI00. 1228 * The "PCI02 ELMMIO" directed range is for: 1229 * +-[02]---03.0 3Dfx Interactive, Inc. Voodoo 2 1230 * 1231 * All is well now. 1232 */ 1233 r->start = READ_REG32(lba_dev->hba.base_addr + LBA_LMMIO_BASE); 1234 if (r->start & 1) { 1235 unsigned long rsize; 1236 1237 r->flags = IORESOURCE_MEM; 1238 /* mmio_mask also clears Enable bit */ 1239 r->start &= mmio_mask; 1240 r->start = PCI_HOST_ADDR(HBA_DATA(lba_dev), r->start); 1241 rsize = ~ READ_REG32(lba_dev->hba.base_addr + LBA_LMMIO_MASK); 1242 1243 /* 1244 ** Each rope only gets part of the distributed range. 1245 ** Adjust "window" for this rope. 1246 */ 1247 rsize /= ROPES_PER_IOC; 1248 r->start += (rsize + 1) * LBA_NUM(pa_dev->hpa.start); 1249 r->end = r->start + rsize; 1250 } else { 1251 r->end = r->start = 0; /* Not enabled. */ 1252 } 1253 #endif 1254 1255 /* 1256 ** "Directed" ranges are used when the "distributed range" isn't 1257 ** sufficient for all devices below a given LBA. Typically devices 1258 ** like graphics cards or X25 may need a directed range when the 1259 ** bus has multiple slots (ie multiple devices) or the device 1260 ** needs more than the typical 4 or 8MB a distributed range offers. 1261 ** 1262 ** The main reason for ignoring it now frigging complications. 1263 ** Directed ranges may overlap (and have precedence) over 1264 ** distributed ranges. Or a distributed range assigned to a unused 1265 ** rope may be used by a directed range on a different rope. 1266 ** Support for graphics devices may require fixing this 1267 ** since they may be assigned a directed range which overlaps 1268 ** an existing (but unused portion of) distributed range. 1269 */ 1270 r = &(lba_dev->hba.elmmio_space); 1271 sprintf(lba_dev->hba.elmmio_name, "PCI%02x ELMMIO", 1272 (int)lba_dev->hba.bus_num.start); 1273 r->name = lba_dev->hba.elmmio_name; 1274 1275 #if 1 1276 /* See comment which precedes call to sba_directed_lmmio() */ 1277 sba_directed_lmmio(pa_dev, r); 1278 #else 1279 r->start = READ_REG32(lba_dev->hba.base_addr + LBA_ELMMIO_BASE); 1280 1281 if (r->start & 1) { 1282 unsigned long rsize; 1283 r->flags = IORESOURCE_MEM; 1284 /* mmio_mask also clears Enable bit */ 1285 r->start &= mmio_mask; 1286 r->start = PCI_HOST_ADDR(HBA_DATA(lba_dev), r->start); 1287 rsize = READ_REG32(lba_dev->hba.base_addr + LBA_ELMMIO_MASK); 1288 r->end = r->start + ~rsize; 1289 } 1290 #endif 1291 1292 r = &(lba_dev->hba.io_space); 1293 sprintf(lba_dev->hba.io_name, "PCI%02x Ports", 1294 (int)lba_dev->hba.bus_num.start); 1295 r->name = lba_dev->hba.io_name; 1296 r->flags = IORESOURCE_IO; 1297 r->start = READ_REG32(lba_dev->hba.base_addr + LBA_IOS_BASE) & ~1L; 1298 r->end = r->start + (READ_REG32(lba_dev->hba.base_addr + LBA_IOS_MASK) ^ (HBA_PORT_SPACE_SIZE - 1)); 1299 1300 /* Virtualize the I/O Port space ranges */ 1301 lba_num = HBA_PORT_BASE(lba_dev->hba.hba_num); 1302 r->start |= lba_num; 1303 r->end |= lba_num; 1304 } 1305 1306 1307 /************************************************************************** 1308 ** 1309 ** LBA initialization code (HW and SW) 1310 ** 1311 ** o identify LBA chip itself 1312 ** o initialize LBA chip modes (HardFail) 1313 ** o FIXME: initialize DMA hints for reasonable defaults 1314 ** o enable configuration functions 1315 ** o call pci_register_ops() to discover devs (fixup/fixup_bus get invoked) 1316 ** 1317 **************************************************************************/ 1318 1319 static int __init 1320 lba_hw_init(struct lba_device *d) 1321 { 1322 u32 stat; 1323 u32 bus_reset; /* PDC_PAT_BUG */ 1324 1325 #if 0 1326 printk(KERN_DEBUG "LBA %lx STAT_CTL %Lx ERROR_CFG %Lx STATUS %Lx DMA_CTL %Lx\n", 1327 d->hba.base_addr, 1328 READ_REG64(d->hba.base_addr + LBA_STAT_CTL), 1329 READ_REG64(d->hba.base_addr + LBA_ERROR_CONFIG), 1330 READ_REG64(d->hba.base_addr + LBA_ERROR_STATUS), 1331 READ_REG64(d->hba.base_addr + LBA_DMA_CTL) ); 1332 printk(KERN_DEBUG " ARB mask %Lx pri %Lx mode %Lx mtlt %Lx\n", 1333 READ_REG64(d->hba.base_addr + LBA_ARB_MASK), 1334 READ_REG64(d->hba.base_addr + LBA_ARB_PRI), 1335 READ_REG64(d->hba.base_addr + LBA_ARB_MODE), 1336 READ_REG64(d->hba.base_addr + LBA_ARB_MTLT) ); 1337 printk(KERN_DEBUG " HINT cfg 0x%Lx\n", 1338 READ_REG64(d->hba.base_addr + LBA_HINT_CFG)); 1339 printk(KERN_DEBUG " HINT reg "); 1340 { int i; 1341 for (i=LBA_HINT_BASE; i< (14*8 + LBA_HINT_BASE); i+=8) 1342 printk(" %Lx", READ_REG64(d->hba.base_addr + i)); 1343 } 1344 printk("\n"); 1345 #endif /* DEBUG_LBA_PAT */ 1346 1347 #ifdef CONFIG_64BIT 1348 /* 1349 * FIXME add support for PDC_PAT_IO "Get slot status" - OLAR support 1350 * Only N-Class and up can really make use of Get slot status. 1351 * maybe L-class too but I've never played with it there. 1352 */ 1353 #endif 1354 1355 /* PDC_PAT_BUG: exhibited in rev 40.48 on L2000 */ 1356 bus_reset = READ_REG32(d->hba.base_addr + LBA_STAT_CTL + 4) & 1; 1357 if (bus_reset) { 1358 printk(KERN_DEBUG "NOTICE: PCI bus reset still asserted! (clearing)\n"); 1359 } 1360 1361 stat = READ_REG32(d->hba.base_addr + LBA_ERROR_CONFIG); 1362 if (stat & LBA_SMART_MODE) { 1363 printk(KERN_DEBUG "NOTICE: LBA in SMART mode! (cleared)\n"); 1364 stat &= ~LBA_SMART_MODE; 1365 WRITE_REG32(stat, d->hba.base_addr + LBA_ERROR_CONFIG); 1366 } 1367 1368 /* Set HF mode as the default (vs. -1 mode). */ 1369 stat = READ_REG32(d->hba.base_addr + LBA_STAT_CTL); 1370 WRITE_REG32(stat | HF_ENABLE, d->hba.base_addr + LBA_STAT_CTL); 1371 1372 /* 1373 ** Writing a zero to STAT_CTL.rf (bit 0) will clear reset signal 1374 ** if it's not already set. If we just cleared the PCI Bus Reset 1375 ** signal, wait a bit for the PCI devices to recover and setup. 1376 */ 1377 if (bus_reset) 1378 mdelay(pci_post_reset_delay); 1379 1380 if (0 == READ_REG32(d->hba.base_addr + LBA_ARB_MASK)) { 1381 /* 1382 ** PDC_PAT_BUG: PDC rev 40.48 on L2000. 1383 ** B2000/C3600/J6000 also have this problem? 1384 ** 1385 ** Elroys with hot pluggable slots don't get configured 1386 ** correctly if the slot is empty. ARB_MASK is set to 0 1387 ** and we can't master transactions on the bus if it's 1388 ** not at least one. 0x3 enables elroy and first slot. 1389 */ 1390 printk(KERN_DEBUG "NOTICE: Enabling PCI Arbitration\n"); 1391 WRITE_REG32(0x3, d->hba.base_addr + LBA_ARB_MASK); 1392 } 1393 1394 /* 1395 ** FIXME: Hint registers are programmed with default hint 1396 ** values by firmware. Hints should be sane even if we 1397 ** can't reprogram them the way drivers want. 1398 */ 1399 return 0; 1400 } 1401 1402 /* 1403 * Unfortunately, when firmware numbers busses, it doesn't take into account 1404 * Cardbus bridges. So we have to renumber the busses to suit ourselves. 1405 * Elroy/Mercury don't actually know what bus number they're attached to; 1406 * we use bus 0 to indicate the directly attached bus and any other bus 1407 * number will be taken care of by the PCI-PCI bridge. 1408 */ 1409 static unsigned int lba_next_bus = 0; 1410 1411 /* 1412 * Determine if lba should claim this chip (return 0) or not (return 1). 1413 * If so, initialize the chip and tell other partners in crime they 1414 * have work to do. 1415 */ 1416 static int __init 1417 lba_driver_probe(struct parisc_device *dev) 1418 { 1419 struct lba_device *lba_dev; 1420 LIST_HEAD(resources); 1421 struct pci_bus *lba_bus; 1422 struct pci_ops *cfg_ops; 1423 u32 func_class; 1424 void *tmp_obj; 1425 char *version; 1426 void __iomem *addr = ioremap_nocache(dev->hpa.start, 4096); 1427 int max; 1428 1429 /* Read HW Rev First */ 1430 func_class = READ_REG32(addr + LBA_FCLASS); 1431 1432 if (IS_ELROY(dev)) { 1433 func_class &= 0xf; 1434 switch (func_class) { 1435 case 0: version = "TR1.0"; break; 1436 case 1: version = "TR2.0"; break; 1437 case 2: version = "TR2.1"; break; 1438 case 3: version = "TR2.2"; break; 1439 case 4: version = "TR3.0"; break; 1440 case 5: version = "TR4.0"; break; 1441 default: version = "TR4+"; 1442 } 1443 1444 printk(KERN_INFO "Elroy version %s (0x%x) found at 0x%lx\n", 1445 version, func_class & 0xf, (long)dev->hpa.start); 1446 1447 if (func_class < 2) { 1448 printk(KERN_WARNING "Can't support LBA older than " 1449 "TR2.1 - continuing under adversity.\n"); 1450 } 1451 1452 #if 0 1453 /* Elroy TR4.0 should work with simple algorithm. 1454 But it doesn't. Still missing something. *sigh* 1455 */ 1456 if (func_class > 4) { 1457 cfg_ops = &mercury_cfg_ops; 1458 } else 1459 #endif 1460 { 1461 cfg_ops = &elroy_cfg_ops; 1462 } 1463 1464 } else if (IS_MERCURY(dev) || IS_QUICKSILVER(dev)) { 1465 int major, minor; 1466 1467 func_class &= 0xff; 1468 major = func_class >> 4, minor = func_class & 0xf; 1469 1470 /* We could use one printk for both Elroy and Mercury, 1471 * but for the mask for func_class. 1472 */ 1473 printk(KERN_INFO "%s version TR%d.%d (0x%x) found at 0x%lx\n", 1474 IS_MERCURY(dev) ? "Mercury" : "Quicksilver", major, 1475 minor, func_class, (long)dev->hpa.start); 1476 1477 cfg_ops = &mercury_cfg_ops; 1478 } else { 1479 printk(KERN_ERR "Unknown LBA found at 0x%lx\n", 1480 (long)dev->hpa.start); 1481 return -ENODEV; 1482 } 1483 1484 /* Tell I/O SAPIC driver we have a IRQ handler/region. */ 1485 tmp_obj = iosapic_register(dev->hpa.start + LBA_IOSAPIC_BASE); 1486 1487 /* NOTE: PCI devices (e.g. 103c:1005 graphics card) which don't 1488 ** have an IRT entry will get NULL back from iosapic code. 1489 */ 1490 1491 lba_dev = kzalloc(sizeof(struct lba_device), GFP_KERNEL); 1492 if (!lba_dev) { 1493 printk(KERN_ERR "lba_init_chip - couldn't alloc lba_device\n"); 1494 return(1); 1495 } 1496 1497 1498 /* ---------- First : initialize data we already have --------- */ 1499 1500 lba_dev->hw_rev = func_class; 1501 lba_dev->hba.base_addr = addr; 1502 lba_dev->hba.dev = dev; 1503 lba_dev->iosapic_obj = tmp_obj; /* save interrupt handle */ 1504 lba_dev->hba.iommu = sba_get_iommu(dev); /* get iommu data */ 1505 parisc_set_drvdata(dev, lba_dev); 1506 1507 /* ------------ Second : initialize common stuff ---------- */ 1508 pci_bios = &lba_bios_ops; 1509 pcibios_register_hba(HBA_DATA(lba_dev)); 1510 spin_lock_init(&lba_dev->lba_lock); 1511 1512 if (lba_hw_init(lba_dev)) 1513 return(1); 1514 1515 /* ---------- Third : setup I/O Port and MMIO resources --------- */ 1516 1517 if (is_pdc_pat()) { 1518 /* PDC PAT firmware uses PIOP region of GMMIO space. */ 1519 pci_port = &lba_pat_port_ops; 1520 /* Go ask PDC PAT what resources this LBA has */ 1521 lba_pat_resources(dev, lba_dev); 1522 } else { 1523 if (!astro_iop_base) { 1524 /* Sprockets PDC uses NPIOP region */ 1525 astro_iop_base = ioremap_nocache(LBA_PORT_BASE, 64 * 1024); 1526 pci_port = &lba_astro_port_ops; 1527 } 1528 1529 /* Poke the chip a bit for /proc output */ 1530 lba_legacy_resources(dev, lba_dev); 1531 } 1532 1533 if (lba_dev->hba.bus_num.start < lba_next_bus) 1534 lba_dev->hba.bus_num.start = lba_next_bus; 1535 1536 /* Overlaps with elmmio can (and should) fail here. 1537 * We will prune (or ignore) the distributed range. 1538 * 1539 * FIXME: SBA code should register all elmmio ranges first. 1540 * that would take care of elmmio ranges routed 1541 * to a different rope (already discovered) from 1542 * getting registered *after* LBA code has already 1543 * registered it's distributed lmmio range. 1544 */ 1545 if (truncate_pat_collision(&iomem_resource, 1546 &(lba_dev->hba.lmmio_space))) { 1547 printk(KERN_WARNING "LBA: lmmio_space [%lx/%lx] duplicate!\n", 1548 (long)lba_dev->hba.lmmio_space.start, 1549 (long)lba_dev->hba.lmmio_space.end); 1550 lba_dev->hba.lmmio_space.flags = 0; 1551 } 1552 1553 pci_add_resource_offset(&resources, &lba_dev->hba.io_space, 1554 HBA_PORT_BASE(lba_dev->hba.hba_num)); 1555 if (lba_dev->hba.elmmio_space.flags) 1556 pci_add_resource_offset(&resources, &lba_dev->hba.elmmio_space, 1557 lba_dev->hba.lmmio_space_offset); 1558 if (lba_dev->hba.lmmio_space.flags) 1559 pci_add_resource_offset(&resources, &lba_dev->hba.lmmio_space, 1560 lba_dev->hba.lmmio_space_offset); 1561 if (lba_dev->hba.gmmio_space.flags) { 1562 /* Not registering GMMIO space - according to docs it's not 1563 * even used on HP-UX. */ 1564 /* pci_add_resource(&resources, &lba_dev->hba.gmmio_space); */ 1565 } 1566 1567 pci_add_resource(&resources, &lba_dev->hba.bus_num); 1568 1569 dev->dev.platform_data = lba_dev; 1570 lba_bus = lba_dev->hba.hba_bus = 1571 pci_create_root_bus(&dev->dev, lba_dev->hba.bus_num.start, 1572 cfg_ops, NULL, &resources); 1573 if (!lba_bus) { 1574 pci_free_resource_list(&resources); 1575 return 0; 1576 } 1577 1578 max = pci_scan_child_bus(lba_bus); 1579 1580 /* This is in lieu of calling pci_assign_unassigned_resources() */ 1581 if (is_pdc_pat()) { 1582 /* assign resources to un-initialized devices */ 1583 1584 DBG_PAT("LBA pci_bus_size_bridges()\n"); 1585 pci_bus_size_bridges(lba_bus); 1586 1587 DBG_PAT("LBA pci_bus_assign_resources()\n"); 1588 pci_bus_assign_resources(lba_bus); 1589 1590 #ifdef DEBUG_LBA_PAT 1591 DBG_PAT("\nLBA PIOP resource tree\n"); 1592 lba_dump_res(&lba_dev->hba.io_space, 2); 1593 DBG_PAT("\nLBA LMMIO resource tree\n"); 1594 lba_dump_res(&lba_dev->hba.lmmio_space, 2); 1595 #endif 1596 } 1597 1598 /* 1599 ** Once PCI register ops has walked the bus, access to config 1600 ** space is restricted. Avoids master aborts on config cycles. 1601 ** Early LBA revs go fatal on *any* master abort. 1602 */ 1603 if (cfg_ops == &elroy_cfg_ops) { 1604 lba_dev->flags |= LBA_FLAG_SKIP_PROBE; 1605 } 1606 1607 lba_next_bus = max + 1; 1608 pci_bus_add_devices(lba_bus); 1609 1610 /* Whew! Finally done! Tell services we got this one covered. */ 1611 return 0; 1612 } 1613 1614 static struct parisc_device_id lba_tbl[] = { 1615 { HPHW_BRIDGE, HVERSION_REV_ANY_ID, ELROY_HVERS, 0xa }, 1616 { HPHW_BRIDGE, HVERSION_REV_ANY_ID, MERCURY_HVERS, 0xa }, 1617 { HPHW_BRIDGE, HVERSION_REV_ANY_ID, QUICKSILVER_HVERS, 0xa }, 1618 { 0, } 1619 }; 1620 1621 static struct parisc_driver lba_driver = { 1622 .name = MODULE_NAME, 1623 .id_table = lba_tbl, 1624 .probe = lba_driver_probe, 1625 }; 1626 1627 /* 1628 ** One time initialization to let the world know the LBA was found. 1629 ** Must be called exactly once before pci_init(). 1630 */ 1631 void __init lba_init(void) 1632 { 1633 register_parisc_driver(&lba_driver); 1634 } 1635 1636 /* 1637 ** Initialize the IBASE/IMASK registers for LBA (Elroy). 1638 ** Only called from sba_iommu.c in order to route ranges (MMIO vs DMA). 1639 ** sba_iommu is responsible for locking (none needed at init time). 1640 */ 1641 void lba_set_iregs(struct parisc_device *lba, u32 ibase, u32 imask) 1642 { 1643 void __iomem * base_addr = ioremap_nocache(lba->hpa.start, 4096); 1644 1645 imask <<= 2; /* adjust for hints - 2 more bits */ 1646 1647 /* Make sure we aren't trying to set bits that aren't writeable. */ 1648 WARN_ON((ibase & 0x001fffff) != 0); 1649 WARN_ON((imask & 0x001fffff) != 0); 1650 1651 DBG("%s() ibase 0x%x imask 0x%x\n", __func__, ibase, imask); 1652 WRITE_REG32( imask, base_addr + LBA_IMASK); 1653 WRITE_REG32( ibase, base_addr + LBA_IBASE); 1654 iounmap(base_addr); 1655 } 1656 1657