1 // SPDX-License-Identifier: GPL-2.0 2 /* 3 * PCI detection and setup code 4 */ 5 6 #include <linux/array_size.h> 7 #include <linux/kernel.h> 8 #include <linux/delay.h> 9 #include <linux/init.h> 10 #include <linux/pci.h> 11 #include <linux/msi.h> 12 #include <linux/of_pci.h> 13 #include <linux/of_platform.h> 14 #include <linux/platform_device.h> 15 #include <linux/pci_hotplug.h> 16 #include <linux/slab.h> 17 #include <linux/module.h> 18 #include <linux/cpumask.h> 19 #include <linux/aer.h> 20 #include <linux/acpi.h> 21 #include <linux/hypervisor.h> 22 #include <linux/irqdomain.h> 23 #include <linux/pm_runtime.h> 24 #include <linux/bitfield.h> 25 #include "pci.h" 26 27 #define CARDBUS_LATENCY_TIMER 176 /* secondary latency timer */ 28 #define CARDBUS_RESERVE_BUSNR 3 29 30 static struct resource busn_resource = { 31 .name = "PCI busn", 32 .start = 0, 33 .end = 255, 34 .flags = IORESOURCE_BUS, 35 }; 36 37 /* Ugh. Need to stop exporting this to modules. */ 38 LIST_HEAD(pci_root_buses); 39 EXPORT_SYMBOL(pci_root_buses); 40 41 static LIST_HEAD(pci_domain_busn_res_list); 42 43 struct pci_domain_busn_res { 44 struct list_head list; 45 struct resource res; 46 int domain_nr; 47 }; 48 49 static struct resource *get_pci_domain_busn_res(int domain_nr) 50 { 51 struct pci_domain_busn_res *r; 52 53 list_for_each_entry(r, &pci_domain_busn_res_list, list) 54 if (r->domain_nr == domain_nr) 55 return &r->res; 56 57 r = kzalloc(sizeof(*r), GFP_KERNEL); 58 if (!r) 59 return NULL; 60 61 r->domain_nr = domain_nr; 62 r->res.start = 0; 63 r->res.end = 0xff; 64 r->res.flags = IORESOURCE_BUS | IORESOURCE_PCI_FIXED; 65 66 list_add_tail(&r->list, &pci_domain_busn_res_list); 67 68 return &r->res; 69 } 70 71 /* 72 * Some device drivers need know if PCI is initiated. 73 * Basically, we think PCI is not initiated when there 74 * is no device to be found on the pci_bus_type. 75 */ 76 int no_pci_devices(void) 77 { 78 struct device *dev; 79 int no_devices; 80 81 dev = bus_find_next_device(&pci_bus_type, NULL); 82 no_devices = (dev == NULL); 83 put_device(dev); 84 return no_devices; 85 } 86 EXPORT_SYMBOL(no_pci_devices); 87 88 /* 89 * PCI Bus Class 90 */ 91 static void release_pcibus_dev(struct device *dev) 92 { 93 struct pci_bus *pci_bus = to_pci_bus(dev); 94 95 put_device(pci_bus->bridge); 96 pci_bus_remove_resources(pci_bus); 97 pci_release_bus_of_node(pci_bus); 98 kfree(pci_bus); 99 } 100 101 static const struct class pcibus_class = { 102 .name = "pci_bus", 103 .dev_release = &release_pcibus_dev, 104 .dev_groups = pcibus_groups, 105 }; 106 107 static int __init pcibus_class_init(void) 108 { 109 return class_register(&pcibus_class); 110 } 111 postcore_initcall(pcibus_class_init); 112 113 static u64 pci_size(u64 base, u64 maxbase, u64 mask) 114 { 115 u64 size = mask & maxbase; /* Find the significant bits */ 116 if (!size) 117 return 0; 118 119 /* 120 * Get the lowest of them to find the decode size, and from that 121 * the extent. 122 */ 123 size = size & ~(size-1); 124 125 /* 126 * base == maxbase can be valid only if the BAR has already been 127 * programmed with all 1s. 128 */ 129 if (base == maxbase && ((base | (size - 1)) & mask) != mask) 130 return 0; 131 132 return size; 133 } 134 135 static inline unsigned long decode_bar(struct pci_dev *dev, u32 bar) 136 { 137 u32 mem_type; 138 unsigned long flags; 139 140 if ((bar & PCI_BASE_ADDRESS_SPACE) == PCI_BASE_ADDRESS_SPACE_IO) { 141 flags = bar & ~PCI_BASE_ADDRESS_IO_MASK; 142 flags |= IORESOURCE_IO; 143 return flags; 144 } 145 146 flags = bar & ~PCI_BASE_ADDRESS_MEM_MASK; 147 flags |= IORESOURCE_MEM; 148 if (flags & PCI_BASE_ADDRESS_MEM_PREFETCH) 149 flags |= IORESOURCE_PREFETCH; 150 151 mem_type = bar & PCI_BASE_ADDRESS_MEM_TYPE_MASK; 152 switch (mem_type) { 153 case PCI_BASE_ADDRESS_MEM_TYPE_32: 154 break; 155 case PCI_BASE_ADDRESS_MEM_TYPE_1M: 156 /* 1M mem BAR treated as 32-bit BAR */ 157 break; 158 case PCI_BASE_ADDRESS_MEM_TYPE_64: 159 flags |= IORESOURCE_MEM_64; 160 break; 161 default: 162 /* mem unknown type treated as 32-bit BAR */ 163 break; 164 } 165 return flags; 166 } 167 168 #define PCI_COMMAND_DECODE_ENABLE (PCI_COMMAND_MEMORY | PCI_COMMAND_IO) 169 170 /** 171 * __pci_size_bars - Read the raw BAR mask for a range of PCI BARs 172 * @dev: the PCI device 173 * @count: number of BARs to size 174 * @pos: starting config space position 175 * @sizes: array to store mask values 176 * @rom: indicate whether to use ROM mask, which avoids enabling ROM BARs 177 * 178 * Provided @sizes array must be sufficiently sized to store results for 179 * @count u32 BARs. Caller is responsible for disabling decode to specified 180 * BAR range around calling this function. This function is intended to avoid 181 * disabling decode around sizing each BAR individually, which can result in 182 * non-trivial overhead in virtualized environments with very large PCI BARs. 183 */ 184 static void __pci_size_bars(struct pci_dev *dev, int count, 185 unsigned int pos, u32 *sizes, bool rom) 186 { 187 u32 orig, mask = rom ? PCI_ROM_ADDRESS_MASK : ~0; 188 int i; 189 190 for (i = 0; i < count; i++, pos += 4, sizes++) { 191 pci_read_config_dword(dev, pos, &orig); 192 pci_write_config_dword(dev, pos, mask); 193 pci_read_config_dword(dev, pos, sizes); 194 pci_write_config_dword(dev, pos, orig); 195 } 196 } 197 198 void __pci_size_stdbars(struct pci_dev *dev, int count, 199 unsigned int pos, u32 *sizes) 200 { 201 __pci_size_bars(dev, count, pos, sizes, false); 202 } 203 204 static void __pci_size_rom(struct pci_dev *dev, unsigned int pos, u32 *sizes) 205 { 206 __pci_size_bars(dev, 1, pos, sizes, true); 207 } 208 209 /** 210 * __pci_read_base - Read a PCI BAR 211 * @dev: the PCI device 212 * @type: type of the BAR 213 * @res: resource buffer to be filled in 214 * @pos: BAR position in the config space 215 * @sizes: array of one or more pre-read BAR masks 216 * 217 * Returns 1 if the BAR is 64-bit, or 0 if 32-bit. 218 */ 219 int __pci_read_base(struct pci_dev *dev, enum pci_bar_type type, 220 struct resource *res, unsigned int pos, u32 *sizes) 221 { 222 u32 l = 0, sz; 223 u64 l64, sz64, mask64; 224 struct pci_bus_region region, inverted_region; 225 const char *res_name = pci_resource_name(dev, res - dev->resource); 226 227 res->name = pci_name(dev); 228 229 pci_read_config_dword(dev, pos, &l); 230 sz = sizes[0]; 231 232 /* 233 * All bits set in sz means the device isn't working properly. 234 * If the BAR isn't implemented, all bits must be 0. If it's a 235 * memory BAR or a ROM, bit 0 must be clear; if it's an io BAR, bit 236 * 1 must be clear. 237 */ 238 if (PCI_POSSIBLE_ERROR(sz)) 239 sz = 0; 240 241 /* 242 * I don't know how l can have all bits set. Copied from old code. 243 * Maybe it fixes a bug on some ancient platform. 244 */ 245 if (PCI_POSSIBLE_ERROR(l)) 246 l = 0; 247 248 if (type == pci_bar_unknown) { 249 res->flags = decode_bar(dev, l); 250 res->flags |= IORESOURCE_SIZEALIGN; 251 if (res->flags & IORESOURCE_IO) { 252 l64 = l & PCI_BASE_ADDRESS_IO_MASK; 253 sz64 = sz & PCI_BASE_ADDRESS_IO_MASK; 254 mask64 = PCI_BASE_ADDRESS_IO_MASK & (u32)IO_SPACE_LIMIT; 255 } else { 256 l64 = l & PCI_BASE_ADDRESS_MEM_MASK; 257 sz64 = sz & PCI_BASE_ADDRESS_MEM_MASK; 258 mask64 = (u32)PCI_BASE_ADDRESS_MEM_MASK; 259 } 260 } else { 261 if (l & PCI_ROM_ADDRESS_ENABLE) 262 res->flags |= IORESOURCE_ROM_ENABLE; 263 l64 = l & PCI_ROM_ADDRESS_MASK; 264 sz64 = sz & PCI_ROM_ADDRESS_MASK; 265 mask64 = PCI_ROM_ADDRESS_MASK; 266 } 267 268 if (res->flags & IORESOURCE_MEM_64) { 269 pci_read_config_dword(dev, pos + 4, &l); 270 sz = sizes[1]; 271 272 l64 |= ((u64)l << 32); 273 sz64 |= ((u64)sz << 32); 274 mask64 |= ((u64)~0 << 32); 275 } 276 277 if (!sz64) 278 goto fail; 279 280 sz64 = pci_size(l64, sz64, mask64); 281 if (!sz64) { 282 pci_info(dev, FW_BUG "%s: invalid; can't size\n", res_name); 283 goto fail; 284 } 285 286 if (res->flags & IORESOURCE_MEM_64) { 287 if ((sizeof(pci_bus_addr_t) < 8 || sizeof(resource_size_t) < 8) 288 && sz64 > 0x100000000ULL) { 289 res->flags |= IORESOURCE_UNSET | IORESOURCE_DISABLED; 290 res->start = 0; 291 res->end = 0; 292 pci_err(dev, "%s: can't handle BAR larger than 4GB (size %#010llx)\n", 293 res_name, (unsigned long long)sz64); 294 goto out; 295 } 296 297 if ((sizeof(pci_bus_addr_t) < 8) && l) { 298 /* Above 32-bit boundary; try to reallocate */ 299 res->flags |= IORESOURCE_UNSET; 300 res->start = 0; 301 res->end = sz64 - 1; 302 pci_info(dev, "%s: can't handle BAR above 4GB (bus address %#010llx)\n", 303 res_name, (unsigned long long)l64); 304 goto out; 305 } 306 } 307 308 region.start = l64; 309 region.end = l64 + sz64 - 1; 310 311 pcibios_bus_to_resource(dev->bus, res, ®ion); 312 pcibios_resource_to_bus(dev->bus, &inverted_region, res); 313 314 /* 315 * If "A" is a BAR value (a bus address), "bus_to_resource(A)" is 316 * the corresponding resource address (the physical address used by 317 * the CPU. Converting that resource address back to a bus address 318 * should yield the original BAR value: 319 * 320 * resource_to_bus(bus_to_resource(A)) == A 321 * 322 * If it doesn't, CPU accesses to "bus_to_resource(A)" will not 323 * be claimed by the device. 324 */ 325 if (inverted_region.start != region.start) { 326 res->flags |= IORESOURCE_UNSET; 327 res->start = 0; 328 res->end = region.end - region.start; 329 pci_info(dev, "%s: initial BAR value %#010llx invalid\n", 330 res_name, (unsigned long long)region.start); 331 } 332 333 goto out; 334 335 336 fail: 337 res->flags = 0; 338 out: 339 if (res->flags) 340 pci_info(dev, "%s %pR\n", res_name, res); 341 342 return (res->flags & IORESOURCE_MEM_64) ? 1 : 0; 343 } 344 345 static __always_inline void pci_read_bases(struct pci_dev *dev, 346 unsigned int howmany, int rom) 347 { 348 u32 rombar, stdbars[PCI_STD_NUM_BARS]; 349 unsigned int pos, reg; 350 u16 orig_cmd; 351 352 BUILD_BUG_ON(statically_true(howmany > PCI_STD_NUM_BARS)); 353 354 if (dev->non_compliant_bars) 355 return; 356 357 /* Per PCIe r4.0, sec 9.3.4.1.11, the VF BARs are all RO Zero */ 358 if (dev->is_virtfn) 359 return; 360 361 /* No printks while decoding is disabled! */ 362 if (!dev->mmio_always_on) { 363 pci_read_config_word(dev, PCI_COMMAND, &orig_cmd); 364 if (orig_cmd & PCI_COMMAND_DECODE_ENABLE) { 365 pci_write_config_word(dev, PCI_COMMAND, 366 orig_cmd & ~PCI_COMMAND_DECODE_ENABLE); 367 } 368 } 369 370 __pci_size_stdbars(dev, howmany, PCI_BASE_ADDRESS_0, stdbars); 371 if (rom) 372 __pci_size_rom(dev, rom, &rombar); 373 374 if (!dev->mmio_always_on && 375 (orig_cmd & PCI_COMMAND_DECODE_ENABLE)) 376 pci_write_config_word(dev, PCI_COMMAND, orig_cmd); 377 378 for (pos = 0; pos < howmany; pos++) { 379 struct resource *res = &dev->resource[pos]; 380 reg = PCI_BASE_ADDRESS_0 + (pos << 2); 381 pos += __pci_read_base(dev, pci_bar_unknown, 382 res, reg, &stdbars[pos]); 383 } 384 385 if (rom) { 386 struct resource *res = &dev->resource[PCI_ROM_RESOURCE]; 387 dev->rom_base_reg = rom; 388 res->flags = IORESOURCE_MEM | IORESOURCE_PREFETCH | 389 IORESOURCE_READONLY | IORESOURCE_SIZEALIGN; 390 __pci_read_base(dev, pci_bar_mem32, res, rom, &rombar); 391 } 392 } 393 394 static void pci_read_bridge_io(struct pci_dev *dev, struct resource *res, 395 bool log) 396 { 397 u8 io_base_lo, io_limit_lo; 398 unsigned long io_mask, io_granularity, base, limit; 399 struct pci_bus_region region; 400 401 io_mask = PCI_IO_RANGE_MASK; 402 io_granularity = 0x1000; 403 if (dev->io_window_1k) { 404 /* Support 1K I/O space granularity */ 405 io_mask = PCI_IO_1K_RANGE_MASK; 406 io_granularity = 0x400; 407 } 408 409 pci_read_config_byte(dev, PCI_IO_BASE, &io_base_lo); 410 pci_read_config_byte(dev, PCI_IO_LIMIT, &io_limit_lo); 411 base = (io_base_lo & io_mask) << 8; 412 limit = (io_limit_lo & io_mask) << 8; 413 414 if ((io_base_lo & PCI_IO_RANGE_TYPE_MASK) == PCI_IO_RANGE_TYPE_32) { 415 u16 io_base_hi, io_limit_hi; 416 417 pci_read_config_word(dev, PCI_IO_BASE_UPPER16, &io_base_hi); 418 pci_read_config_word(dev, PCI_IO_LIMIT_UPPER16, &io_limit_hi); 419 base |= ((unsigned long) io_base_hi << 16); 420 limit |= ((unsigned long) io_limit_hi << 16); 421 } 422 423 res->flags = (io_base_lo & PCI_IO_RANGE_TYPE_MASK) | IORESOURCE_IO; 424 425 if (base <= limit) { 426 region.start = base; 427 region.end = limit + io_granularity - 1; 428 pcibios_bus_to_resource(dev->bus, res, ®ion); 429 if (log) 430 pci_info(dev, " bridge window %pR\n", res); 431 } else { 432 resource_set_range(res, 0, 0); 433 res->flags |= IORESOURCE_UNSET | IORESOURCE_DISABLED; 434 } 435 } 436 437 static void pci_read_bridge_mmio(struct pci_dev *dev, struct resource *res, 438 bool log) 439 { 440 u16 mem_base_lo, mem_limit_lo; 441 unsigned long base, limit; 442 struct pci_bus_region region; 443 444 pci_read_config_word(dev, PCI_MEMORY_BASE, &mem_base_lo); 445 pci_read_config_word(dev, PCI_MEMORY_LIMIT, &mem_limit_lo); 446 base = ((unsigned long) mem_base_lo & PCI_MEMORY_RANGE_MASK) << 16; 447 limit = ((unsigned long) mem_limit_lo & PCI_MEMORY_RANGE_MASK) << 16; 448 449 res->flags = (mem_base_lo & PCI_MEMORY_RANGE_TYPE_MASK) | IORESOURCE_MEM; 450 451 if (base <= limit) { 452 region.start = base; 453 region.end = limit + 0xfffff; 454 pcibios_bus_to_resource(dev->bus, res, ®ion); 455 if (log) 456 pci_info(dev, " bridge window %pR\n", res); 457 } else { 458 resource_set_range(res, 0, 0); 459 res->flags |= IORESOURCE_UNSET | IORESOURCE_DISABLED; 460 } 461 } 462 463 static void pci_read_bridge_mmio_pref(struct pci_dev *dev, struct resource *res, 464 bool log) 465 { 466 u16 mem_base_lo, mem_limit_lo; 467 u64 base64, limit64; 468 pci_bus_addr_t base, limit; 469 struct pci_bus_region region; 470 471 pci_read_config_word(dev, PCI_PREF_MEMORY_BASE, &mem_base_lo); 472 pci_read_config_word(dev, PCI_PREF_MEMORY_LIMIT, &mem_limit_lo); 473 base64 = (mem_base_lo & PCI_PREF_RANGE_MASK) << 16; 474 limit64 = (mem_limit_lo & PCI_PREF_RANGE_MASK) << 16; 475 476 if ((mem_base_lo & PCI_PREF_RANGE_TYPE_MASK) == PCI_PREF_RANGE_TYPE_64) { 477 u32 mem_base_hi, mem_limit_hi; 478 479 pci_read_config_dword(dev, PCI_PREF_BASE_UPPER32, &mem_base_hi); 480 pci_read_config_dword(dev, PCI_PREF_LIMIT_UPPER32, &mem_limit_hi); 481 482 /* 483 * Some bridges set the base > limit by default, and some 484 * (broken) BIOSes do not initialize them. If we find 485 * this, just assume they are not being used. 486 */ 487 if (mem_base_hi <= mem_limit_hi) { 488 base64 |= (u64) mem_base_hi << 32; 489 limit64 |= (u64) mem_limit_hi << 32; 490 } 491 } 492 493 base = (pci_bus_addr_t) base64; 494 limit = (pci_bus_addr_t) limit64; 495 496 if (base != base64) { 497 pci_err(dev, "can't handle bridge window above 4GB (bus address %#010llx)\n", 498 (unsigned long long) base64); 499 return; 500 } 501 502 res->flags = (mem_base_lo & PCI_PREF_RANGE_TYPE_MASK) | IORESOURCE_MEM | 503 IORESOURCE_PREFETCH; 504 if (res->flags & PCI_PREF_RANGE_TYPE_64) 505 res->flags |= IORESOURCE_MEM_64; 506 507 if (base <= limit) { 508 region.start = base; 509 region.end = limit + 0xfffff; 510 pcibios_bus_to_resource(dev->bus, res, ®ion); 511 if (log) 512 pci_info(dev, " bridge window %pR\n", res); 513 } else { 514 resource_set_range(res, 0, 0); 515 res->flags |= IORESOURCE_UNSET | IORESOURCE_DISABLED; 516 } 517 } 518 519 static void pci_read_bridge_windows(struct pci_dev *bridge) 520 { 521 u32 buses; 522 u16 io; 523 u32 pmem, tmp; 524 struct resource res; 525 526 pci_read_config_dword(bridge, PCI_PRIMARY_BUS, &buses); 527 res.flags = IORESOURCE_BUS; 528 res.start = (buses >> 8) & 0xff; 529 res.end = (buses >> 16) & 0xff; 530 pci_info(bridge, "PCI bridge to %pR%s\n", &res, 531 bridge->transparent ? " (subtractive decode)" : ""); 532 533 pci_read_config_word(bridge, PCI_IO_BASE, &io); 534 if (!io) { 535 pci_write_config_word(bridge, PCI_IO_BASE, 0xe0f0); 536 pci_read_config_word(bridge, PCI_IO_BASE, &io); 537 pci_write_config_word(bridge, PCI_IO_BASE, 0x0); 538 } 539 if (io) { 540 bridge->io_window = 1; 541 pci_read_bridge_io(bridge, &res, true); 542 } 543 544 pci_read_bridge_mmio(bridge, &res, true); 545 546 /* 547 * DECchip 21050 pass 2 errata: the bridge may miss an address 548 * disconnect boundary by one PCI data phase. Workaround: do not 549 * use prefetching on this device. 550 */ 551 if (bridge->vendor == PCI_VENDOR_ID_DEC && bridge->device == 0x0001) 552 return; 553 554 pci_read_config_dword(bridge, PCI_PREF_MEMORY_BASE, &pmem); 555 if (!pmem) { 556 pci_write_config_dword(bridge, PCI_PREF_MEMORY_BASE, 557 0xffe0fff0); 558 pci_read_config_dword(bridge, PCI_PREF_MEMORY_BASE, &pmem); 559 pci_write_config_dword(bridge, PCI_PREF_MEMORY_BASE, 0x0); 560 } 561 if (!pmem) 562 return; 563 564 bridge->pref_window = 1; 565 566 if ((pmem & PCI_PREF_RANGE_TYPE_MASK) == PCI_PREF_RANGE_TYPE_64) { 567 568 /* 569 * Bridge claims to have a 64-bit prefetchable memory 570 * window; verify that the upper bits are actually 571 * writable. 572 */ 573 pci_read_config_dword(bridge, PCI_PREF_BASE_UPPER32, &pmem); 574 pci_write_config_dword(bridge, PCI_PREF_BASE_UPPER32, 575 0xffffffff); 576 pci_read_config_dword(bridge, PCI_PREF_BASE_UPPER32, &tmp); 577 pci_write_config_dword(bridge, PCI_PREF_BASE_UPPER32, pmem); 578 if (tmp) 579 bridge->pref_64_window = 1; 580 } 581 582 pci_read_bridge_mmio_pref(bridge, &res, true); 583 } 584 585 void pci_read_bridge_bases(struct pci_bus *child) 586 { 587 struct pci_dev *dev = child->self; 588 struct resource *res; 589 int i; 590 591 if (pci_is_root_bus(child)) /* It's a host bus, nothing to read */ 592 return; 593 594 pci_info(dev, "PCI bridge to %pR%s\n", 595 &child->busn_res, 596 dev->transparent ? " (subtractive decode)" : ""); 597 598 pci_bus_remove_resources(child); 599 for (i = 0; i < PCI_BRIDGE_RESOURCE_NUM; i++) 600 child->resource[i] = &dev->resource[PCI_BRIDGE_RESOURCES+i]; 601 602 pci_read_bridge_io(child->self, 603 child->resource[PCI_BUS_BRIDGE_IO_WINDOW], false); 604 pci_read_bridge_mmio(child->self, 605 child->resource[PCI_BUS_BRIDGE_MEM_WINDOW], false); 606 pci_read_bridge_mmio_pref(child->self, 607 child->resource[PCI_BUS_BRIDGE_PREF_MEM_WINDOW], 608 false); 609 610 if (!dev->transparent) 611 return; 612 613 pci_bus_for_each_resource(child->parent, res) { 614 if (!res || !res->flags) 615 continue; 616 617 pci_bus_add_resource(child, res); 618 pci_info(dev, " bridge window %pR (subtractive decode)\n", res); 619 } 620 } 621 622 static struct pci_bus *pci_alloc_bus(struct pci_bus *parent) 623 { 624 struct pci_bus *b; 625 626 b = kzalloc(sizeof(*b), GFP_KERNEL); 627 if (!b) 628 return NULL; 629 630 INIT_LIST_HEAD(&b->node); 631 INIT_LIST_HEAD(&b->children); 632 INIT_LIST_HEAD(&b->devices); 633 INIT_LIST_HEAD(&b->slots); 634 INIT_LIST_HEAD(&b->resources); 635 b->max_bus_speed = PCI_SPEED_UNKNOWN; 636 b->cur_bus_speed = PCI_SPEED_UNKNOWN; 637 #ifdef CONFIG_PCI_DOMAINS_GENERIC 638 if (parent) 639 b->domain_nr = parent->domain_nr; 640 #endif 641 return b; 642 } 643 644 static void pci_release_host_bridge_dev(struct device *dev) 645 { 646 struct pci_host_bridge *bridge = to_pci_host_bridge(dev); 647 648 if (bridge->release_fn) 649 bridge->release_fn(bridge); 650 651 pci_free_resource_list(&bridge->windows); 652 pci_free_resource_list(&bridge->dma_ranges); 653 kfree(bridge); 654 } 655 656 static void pci_init_host_bridge(struct pci_host_bridge *bridge) 657 { 658 INIT_LIST_HEAD(&bridge->windows); 659 INIT_LIST_HEAD(&bridge->dma_ranges); 660 661 /* 662 * We assume we can manage these PCIe features. Some systems may 663 * reserve these for use by the platform itself, e.g., an ACPI BIOS 664 * may implement its own AER handling and use _OSC to prevent the 665 * OS from interfering. 666 */ 667 bridge->native_aer = 1; 668 bridge->native_pcie_hotplug = 1; 669 bridge->native_shpc_hotplug = 1; 670 bridge->native_pme = 1; 671 bridge->native_ltr = 1; 672 bridge->native_dpc = 1; 673 bridge->domain_nr = PCI_DOMAIN_NR_NOT_SET; 674 bridge->native_cxl_error = 1; 675 676 device_initialize(&bridge->dev); 677 } 678 679 struct pci_host_bridge *pci_alloc_host_bridge(size_t priv) 680 { 681 struct pci_host_bridge *bridge; 682 683 bridge = kzalloc(sizeof(*bridge) + priv, GFP_KERNEL); 684 if (!bridge) 685 return NULL; 686 687 pci_init_host_bridge(bridge); 688 bridge->dev.release = pci_release_host_bridge_dev; 689 690 return bridge; 691 } 692 EXPORT_SYMBOL(pci_alloc_host_bridge); 693 694 static void devm_pci_alloc_host_bridge_release(void *data) 695 { 696 pci_free_host_bridge(data); 697 } 698 699 struct pci_host_bridge *devm_pci_alloc_host_bridge(struct device *dev, 700 size_t priv) 701 { 702 int ret; 703 struct pci_host_bridge *bridge; 704 705 bridge = pci_alloc_host_bridge(priv); 706 if (!bridge) 707 return NULL; 708 709 bridge->dev.parent = dev; 710 711 ret = devm_add_action_or_reset(dev, devm_pci_alloc_host_bridge_release, 712 bridge); 713 if (ret) 714 return NULL; 715 716 ret = devm_of_pci_bridge_init(dev, bridge); 717 if (ret) 718 return NULL; 719 720 return bridge; 721 } 722 EXPORT_SYMBOL(devm_pci_alloc_host_bridge); 723 724 void pci_free_host_bridge(struct pci_host_bridge *bridge) 725 { 726 put_device(&bridge->dev); 727 } 728 EXPORT_SYMBOL(pci_free_host_bridge); 729 730 /* Indexed by PCI_X_SSTATUS_FREQ (secondary bus mode and frequency) */ 731 static const unsigned char pcix_bus_speed[] = { 732 PCI_SPEED_UNKNOWN, /* 0 */ 733 PCI_SPEED_66MHz_PCIX, /* 1 */ 734 PCI_SPEED_100MHz_PCIX, /* 2 */ 735 PCI_SPEED_133MHz_PCIX, /* 3 */ 736 PCI_SPEED_UNKNOWN, /* 4 */ 737 PCI_SPEED_66MHz_PCIX_ECC, /* 5 */ 738 PCI_SPEED_100MHz_PCIX_ECC, /* 6 */ 739 PCI_SPEED_133MHz_PCIX_ECC, /* 7 */ 740 PCI_SPEED_UNKNOWN, /* 8 */ 741 PCI_SPEED_66MHz_PCIX_266, /* 9 */ 742 PCI_SPEED_100MHz_PCIX_266, /* A */ 743 PCI_SPEED_133MHz_PCIX_266, /* B */ 744 PCI_SPEED_UNKNOWN, /* C */ 745 PCI_SPEED_66MHz_PCIX_533, /* D */ 746 PCI_SPEED_100MHz_PCIX_533, /* E */ 747 PCI_SPEED_133MHz_PCIX_533 /* F */ 748 }; 749 750 /* Indexed by PCI_EXP_LNKCAP_SLS, PCI_EXP_LNKSTA_CLS */ 751 const unsigned char pcie_link_speed[] = { 752 PCI_SPEED_UNKNOWN, /* 0 */ 753 PCIE_SPEED_2_5GT, /* 1 */ 754 PCIE_SPEED_5_0GT, /* 2 */ 755 PCIE_SPEED_8_0GT, /* 3 */ 756 PCIE_SPEED_16_0GT, /* 4 */ 757 PCIE_SPEED_32_0GT, /* 5 */ 758 PCIE_SPEED_64_0GT, /* 6 */ 759 PCI_SPEED_UNKNOWN, /* 7 */ 760 PCI_SPEED_UNKNOWN, /* 8 */ 761 PCI_SPEED_UNKNOWN, /* 9 */ 762 PCI_SPEED_UNKNOWN, /* A */ 763 PCI_SPEED_UNKNOWN, /* B */ 764 PCI_SPEED_UNKNOWN, /* C */ 765 PCI_SPEED_UNKNOWN, /* D */ 766 PCI_SPEED_UNKNOWN, /* E */ 767 PCI_SPEED_UNKNOWN /* F */ 768 }; 769 EXPORT_SYMBOL_GPL(pcie_link_speed); 770 771 const char *pci_speed_string(enum pci_bus_speed speed) 772 { 773 /* Indexed by the pci_bus_speed enum */ 774 static const char *speed_strings[] = { 775 "33 MHz PCI", /* 0x00 */ 776 "66 MHz PCI", /* 0x01 */ 777 "66 MHz PCI-X", /* 0x02 */ 778 "100 MHz PCI-X", /* 0x03 */ 779 "133 MHz PCI-X", /* 0x04 */ 780 NULL, /* 0x05 */ 781 NULL, /* 0x06 */ 782 NULL, /* 0x07 */ 783 NULL, /* 0x08 */ 784 "66 MHz PCI-X 266", /* 0x09 */ 785 "100 MHz PCI-X 266", /* 0x0a */ 786 "133 MHz PCI-X 266", /* 0x0b */ 787 "Unknown AGP", /* 0x0c */ 788 "1x AGP", /* 0x0d */ 789 "2x AGP", /* 0x0e */ 790 "4x AGP", /* 0x0f */ 791 "8x AGP", /* 0x10 */ 792 "66 MHz PCI-X 533", /* 0x11 */ 793 "100 MHz PCI-X 533", /* 0x12 */ 794 "133 MHz PCI-X 533", /* 0x13 */ 795 "2.5 GT/s PCIe", /* 0x14 */ 796 "5.0 GT/s PCIe", /* 0x15 */ 797 "8.0 GT/s PCIe", /* 0x16 */ 798 "16.0 GT/s PCIe", /* 0x17 */ 799 "32.0 GT/s PCIe", /* 0x18 */ 800 "64.0 GT/s PCIe", /* 0x19 */ 801 }; 802 803 if (speed < ARRAY_SIZE(speed_strings)) 804 return speed_strings[speed]; 805 return "Unknown"; 806 } 807 EXPORT_SYMBOL_GPL(pci_speed_string); 808 809 void pcie_update_link_speed(struct pci_bus *bus) 810 { 811 struct pci_dev *bridge = bus->self; 812 u16 linksta, linksta2; 813 814 pcie_capability_read_word(bridge, PCI_EXP_LNKSTA, &linksta); 815 pcie_capability_read_word(bridge, PCI_EXP_LNKSTA2, &linksta2); 816 __pcie_update_link_speed(bus, linksta, linksta2); 817 } 818 EXPORT_SYMBOL_GPL(pcie_update_link_speed); 819 820 static unsigned char agp_speeds[] = { 821 AGP_UNKNOWN, 822 AGP_1X, 823 AGP_2X, 824 AGP_4X, 825 AGP_8X 826 }; 827 828 static enum pci_bus_speed agp_speed(int agp3, int agpstat) 829 { 830 int index = 0; 831 832 if (agpstat & 4) 833 index = 3; 834 else if (agpstat & 2) 835 index = 2; 836 else if (agpstat & 1) 837 index = 1; 838 else 839 goto out; 840 841 if (agp3) { 842 index += 2; 843 if (index == 5) 844 index = 0; 845 } 846 847 out: 848 return agp_speeds[index]; 849 } 850 851 static void pci_set_bus_speed(struct pci_bus *bus) 852 { 853 struct pci_dev *bridge = bus->self; 854 int pos; 855 856 pos = pci_find_capability(bridge, PCI_CAP_ID_AGP); 857 if (!pos) 858 pos = pci_find_capability(bridge, PCI_CAP_ID_AGP3); 859 if (pos) { 860 u32 agpstat, agpcmd; 861 862 pci_read_config_dword(bridge, pos + PCI_AGP_STATUS, &agpstat); 863 bus->max_bus_speed = agp_speed(agpstat & 8, agpstat & 7); 864 865 pci_read_config_dword(bridge, pos + PCI_AGP_COMMAND, &agpcmd); 866 bus->cur_bus_speed = agp_speed(agpstat & 8, agpcmd & 7); 867 } 868 869 pos = pci_find_capability(bridge, PCI_CAP_ID_PCIX); 870 if (pos) { 871 u16 status; 872 enum pci_bus_speed max; 873 874 pci_read_config_word(bridge, pos + PCI_X_BRIDGE_SSTATUS, 875 &status); 876 877 if (status & PCI_X_SSTATUS_533MHZ) { 878 max = PCI_SPEED_133MHz_PCIX_533; 879 } else if (status & PCI_X_SSTATUS_266MHZ) { 880 max = PCI_SPEED_133MHz_PCIX_266; 881 } else if (status & PCI_X_SSTATUS_133MHZ) { 882 if ((status & PCI_X_SSTATUS_VERS) == PCI_X_SSTATUS_V2) 883 max = PCI_SPEED_133MHz_PCIX_ECC; 884 else 885 max = PCI_SPEED_133MHz_PCIX; 886 } else { 887 max = PCI_SPEED_66MHz_PCIX; 888 } 889 890 bus->max_bus_speed = max; 891 bus->cur_bus_speed = 892 pcix_bus_speed[FIELD_GET(PCI_X_SSTATUS_FREQ, status)]; 893 894 return; 895 } 896 897 if (pci_is_pcie(bridge)) { 898 u32 linkcap; 899 900 pcie_capability_read_dword(bridge, PCI_EXP_LNKCAP, &linkcap); 901 bus->max_bus_speed = pcie_link_speed[linkcap & PCI_EXP_LNKCAP_SLS]; 902 903 pcie_update_link_speed(bus); 904 } 905 } 906 907 static struct irq_domain *pci_host_bridge_msi_domain(struct pci_bus *bus) 908 { 909 struct irq_domain *d; 910 911 /* If the host bridge driver sets a MSI domain of the bridge, use it */ 912 d = dev_get_msi_domain(bus->bridge); 913 914 /* 915 * Any firmware interface that can resolve the msi_domain 916 * should be called from here. 917 */ 918 if (!d) 919 d = pci_host_bridge_of_msi_domain(bus); 920 if (!d) 921 d = pci_host_bridge_acpi_msi_domain(bus); 922 923 /* 924 * If no IRQ domain was found via the OF tree, try looking it up 925 * directly through the fwnode_handle. 926 */ 927 if (!d) { 928 struct fwnode_handle *fwnode = pci_root_bus_fwnode(bus); 929 930 if (fwnode) 931 d = irq_find_matching_fwnode(fwnode, 932 DOMAIN_BUS_PCI_MSI); 933 } 934 935 return d; 936 } 937 938 static void pci_set_bus_msi_domain(struct pci_bus *bus) 939 { 940 struct irq_domain *d; 941 struct pci_bus *b; 942 943 /* 944 * The bus can be a root bus, a subordinate bus, or a virtual bus 945 * created by an SR-IOV device. Walk up to the first bridge device 946 * found or derive the domain from the host bridge. 947 */ 948 for (b = bus, d = NULL; !d && !pci_is_root_bus(b); b = b->parent) { 949 if (b->self) 950 d = dev_get_msi_domain(&b->self->dev); 951 } 952 953 if (!d) 954 d = pci_host_bridge_msi_domain(b); 955 956 dev_set_msi_domain(&bus->dev, d); 957 } 958 959 static bool pci_preserve_config(struct pci_host_bridge *host_bridge) 960 { 961 if (pci_acpi_preserve_config(host_bridge)) 962 return true; 963 964 if (host_bridge->dev.parent && host_bridge->dev.parent->of_node) 965 return of_pci_preserve_config(host_bridge->dev.parent->of_node); 966 967 return false; 968 } 969 970 static int pci_register_host_bridge(struct pci_host_bridge *bridge) 971 { 972 struct device *parent = bridge->dev.parent; 973 struct resource_entry *window, *next, *n; 974 struct pci_bus *bus, *b; 975 resource_size_t offset, next_offset; 976 LIST_HEAD(resources); 977 struct resource *res, *next_res; 978 bool bus_registered = false; 979 char addr[64], *fmt; 980 const char *name; 981 int err; 982 983 bus = pci_alloc_bus(NULL); 984 if (!bus) 985 return -ENOMEM; 986 987 bridge->bus = bus; 988 989 bus->sysdata = bridge->sysdata; 990 bus->ops = bridge->ops; 991 bus->number = bus->busn_res.start = bridge->busnr; 992 #ifdef CONFIG_PCI_DOMAINS_GENERIC 993 if (bridge->domain_nr == PCI_DOMAIN_NR_NOT_SET) 994 bus->domain_nr = pci_bus_find_domain_nr(bus, parent); 995 else 996 bus->domain_nr = bridge->domain_nr; 997 if (bus->domain_nr < 0) { 998 err = bus->domain_nr; 999 goto free; 1000 } 1001 #endif 1002 1003 b = pci_find_bus(pci_domain_nr(bus), bridge->busnr); 1004 if (b) { 1005 /* Ignore it if we already got here via a different bridge */ 1006 dev_dbg(&b->dev, "bus already known\n"); 1007 err = -EEXIST; 1008 goto free; 1009 } 1010 1011 dev_set_name(&bridge->dev, "pci%04x:%02x", pci_domain_nr(bus), 1012 bridge->busnr); 1013 1014 err = pcibios_root_bridge_prepare(bridge); 1015 if (err) 1016 goto free; 1017 1018 /* Temporarily move resources off the list */ 1019 list_splice_init(&bridge->windows, &resources); 1020 err = device_add(&bridge->dev); 1021 if (err) 1022 goto free; 1023 1024 bus->bridge = get_device(&bridge->dev); 1025 device_enable_async_suspend(bus->bridge); 1026 pci_set_bus_of_node(bus); 1027 pci_set_bus_msi_domain(bus); 1028 if (bridge->msi_domain && !dev_get_msi_domain(&bus->dev) && 1029 !pci_host_of_has_msi_map(parent)) 1030 bus->bus_flags |= PCI_BUS_FLAGS_NO_MSI; 1031 1032 if (!parent) 1033 set_dev_node(bus->bridge, pcibus_to_node(bus)); 1034 1035 bus->dev.class = &pcibus_class; 1036 bus->dev.parent = bus->bridge; 1037 1038 dev_set_name(&bus->dev, "%04x:%02x", pci_domain_nr(bus), bus->number); 1039 name = dev_name(&bus->dev); 1040 1041 err = device_register(&bus->dev); 1042 bus_registered = true; 1043 if (err) 1044 goto unregister; 1045 1046 pcibios_add_bus(bus); 1047 1048 if (bus->ops->add_bus) { 1049 err = bus->ops->add_bus(bus); 1050 if (WARN_ON(err < 0)) 1051 dev_err(&bus->dev, "failed to add bus: %d\n", err); 1052 } 1053 1054 /* Create legacy_io and legacy_mem files for this bus */ 1055 pci_create_legacy_files(bus); 1056 1057 if (parent) 1058 dev_info(parent, "PCI host bridge to bus %s\n", name); 1059 else 1060 pr_info("PCI host bridge to bus %s\n", name); 1061 1062 if (nr_node_ids > 1 && pcibus_to_node(bus) == NUMA_NO_NODE) 1063 dev_warn(&bus->dev, "Unknown NUMA node; performance will be reduced\n"); 1064 1065 /* Check if the boot configuration by FW needs to be preserved */ 1066 bridge->preserve_config = pci_preserve_config(bridge); 1067 1068 /* Coalesce contiguous windows */ 1069 resource_list_for_each_entry_safe(window, n, &resources) { 1070 if (list_is_last(&window->node, &resources)) 1071 break; 1072 1073 next = list_next_entry(window, node); 1074 offset = window->offset; 1075 res = window->res; 1076 next_offset = next->offset; 1077 next_res = next->res; 1078 1079 if (res->flags != next_res->flags || offset != next_offset) 1080 continue; 1081 1082 if (res->end + 1 == next_res->start) { 1083 next_res->start = res->start; 1084 res->flags = res->start = res->end = 0; 1085 } 1086 } 1087 1088 /* Add initial resources to the bus */ 1089 resource_list_for_each_entry_safe(window, n, &resources) { 1090 offset = window->offset; 1091 res = window->res; 1092 if (!res->flags && !res->start && !res->end) { 1093 release_resource(res); 1094 resource_list_destroy_entry(window); 1095 continue; 1096 } 1097 1098 list_move_tail(&window->node, &bridge->windows); 1099 1100 if (res->flags & IORESOURCE_BUS) 1101 pci_bus_insert_busn_res(bus, bus->number, res->end); 1102 else 1103 pci_bus_add_resource(bus, res); 1104 1105 if (offset) { 1106 if (resource_type(res) == IORESOURCE_IO) 1107 fmt = " (bus address [%#06llx-%#06llx])"; 1108 else 1109 fmt = " (bus address [%#010llx-%#010llx])"; 1110 1111 snprintf(addr, sizeof(addr), fmt, 1112 (unsigned long long)(res->start - offset), 1113 (unsigned long long)(res->end - offset)); 1114 } else 1115 addr[0] = '\0'; 1116 1117 dev_info(&bus->dev, "root bus resource %pR%s\n", res, addr); 1118 } 1119 1120 of_pci_make_host_bridge_node(bridge); 1121 1122 down_write(&pci_bus_sem); 1123 list_add_tail(&bus->node, &pci_root_buses); 1124 up_write(&pci_bus_sem); 1125 1126 return 0; 1127 1128 unregister: 1129 put_device(&bridge->dev); 1130 device_del(&bridge->dev); 1131 free: 1132 #ifdef CONFIG_PCI_DOMAINS_GENERIC 1133 pci_bus_release_domain_nr(parent, bus->domain_nr); 1134 #endif 1135 if (bus_registered) 1136 put_device(&bus->dev); 1137 else 1138 kfree(bus); 1139 1140 return err; 1141 } 1142 1143 static bool pci_bridge_child_ext_cfg_accessible(struct pci_dev *bridge) 1144 { 1145 int pos; 1146 u32 status; 1147 1148 /* 1149 * If extended config space isn't accessible on a bridge's primary 1150 * bus, we certainly can't access it on the secondary bus. 1151 */ 1152 if (bridge->bus->bus_flags & PCI_BUS_FLAGS_NO_EXTCFG) 1153 return false; 1154 1155 /* 1156 * PCIe Root Ports and switch ports are PCIe on both sides, so if 1157 * extended config space is accessible on the primary, it's also 1158 * accessible on the secondary. 1159 */ 1160 if (pci_is_pcie(bridge) && 1161 (pci_pcie_type(bridge) == PCI_EXP_TYPE_ROOT_PORT || 1162 pci_pcie_type(bridge) == PCI_EXP_TYPE_UPSTREAM || 1163 pci_pcie_type(bridge) == PCI_EXP_TYPE_DOWNSTREAM)) 1164 return true; 1165 1166 /* 1167 * For the other bridge types: 1168 * - PCI-to-PCI bridges 1169 * - PCIe-to-PCI/PCI-X forward bridges 1170 * - PCI/PCI-X-to-PCIe reverse bridges 1171 * extended config space on the secondary side is only accessible 1172 * if the bridge supports PCI-X Mode 2. 1173 */ 1174 pos = pci_find_capability(bridge, PCI_CAP_ID_PCIX); 1175 if (!pos) 1176 return false; 1177 1178 pci_read_config_dword(bridge, pos + PCI_X_STATUS, &status); 1179 return status & (PCI_X_STATUS_266MHZ | PCI_X_STATUS_533MHZ); 1180 } 1181 1182 static struct pci_bus *pci_alloc_child_bus(struct pci_bus *parent, 1183 struct pci_dev *bridge, int busnr) 1184 { 1185 struct pci_bus *child; 1186 struct pci_host_bridge *host; 1187 int i; 1188 int ret; 1189 1190 /* Allocate a new bus and inherit stuff from the parent */ 1191 child = pci_alloc_bus(parent); 1192 if (!child) 1193 return NULL; 1194 1195 child->parent = parent; 1196 child->sysdata = parent->sysdata; 1197 child->bus_flags = parent->bus_flags; 1198 1199 host = pci_find_host_bridge(parent); 1200 if (host->child_ops) 1201 child->ops = host->child_ops; 1202 else 1203 child->ops = parent->ops; 1204 1205 /* 1206 * Initialize some portions of the bus device, but don't register 1207 * it now as the parent is not properly set up yet. 1208 */ 1209 child->dev.class = &pcibus_class; 1210 dev_set_name(&child->dev, "%04x:%02x", pci_domain_nr(child), busnr); 1211 1212 /* Set up the primary, secondary and subordinate bus numbers */ 1213 child->number = child->busn_res.start = busnr; 1214 child->primary = parent->busn_res.start; 1215 child->busn_res.end = 0xff; 1216 1217 if (!bridge) { 1218 child->dev.parent = parent->bridge; 1219 goto add_dev; 1220 } 1221 1222 child->self = bridge; 1223 child->bridge = get_device(&bridge->dev); 1224 child->dev.parent = child->bridge; 1225 pci_set_bus_of_node(child); 1226 pci_set_bus_speed(child); 1227 1228 /* 1229 * Check whether extended config space is accessible on the child 1230 * bus. Note that we currently assume it is always accessible on 1231 * the root bus. 1232 */ 1233 if (!pci_bridge_child_ext_cfg_accessible(bridge)) { 1234 child->bus_flags |= PCI_BUS_FLAGS_NO_EXTCFG; 1235 pci_info(child, "extended config space not accessible\n"); 1236 } 1237 1238 /* Set up default resource pointers and names */ 1239 for (i = 0; i < PCI_BRIDGE_RESOURCE_NUM; i++) { 1240 child->resource[i] = &bridge->resource[PCI_BRIDGE_RESOURCES+i]; 1241 child->resource[i]->name = child->name; 1242 } 1243 bridge->subordinate = child; 1244 1245 add_dev: 1246 pci_set_bus_msi_domain(child); 1247 ret = device_register(&child->dev); 1248 if (WARN_ON(ret < 0)) { 1249 put_device(&child->dev); 1250 return NULL; 1251 } 1252 1253 pcibios_add_bus(child); 1254 1255 if (child->ops->add_bus) { 1256 ret = child->ops->add_bus(child); 1257 if (WARN_ON(ret < 0)) 1258 dev_err(&child->dev, "failed to add bus: %d\n", ret); 1259 } 1260 1261 /* Create legacy_io and legacy_mem files for this bus */ 1262 pci_create_legacy_files(child); 1263 1264 return child; 1265 } 1266 1267 struct pci_bus *pci_add_new_bus(struct pci_bus *parent, struct pci_dev *dev, 1268 int busnr) 1269 { 1270 struct pci_bus *child; 1271 1272 child = pci_alloc_child_bus(parent, dev, busnr); 1273 if (child) { 1274 down_write(&pci_bus_sem); 1275 list_add_tail(&child->node, &parent->children); 1276 up_write(&pci_bus_sem); 1277 } 1278 return child; 1279 } 1280 EXPORT_SYMBOL(pci_add_new_bus); 1281 1282 static void pci_enable_rrs_sv(struct pci_dev *pdev) 1283 { 1284 u16 root_cap = 0; 1285 1286 /* Enable Configuration RRS Software Visibility if supported */ 1287 pcie_capability_read_word(pdev, PCI_EXP_RTCAP, &root_cap); 1288 if (root_cap & PCI_EXP_RTCAP_RRS_SV) { 1289 pcie_capability_set_word(pdev, PCI_EXP_RTCTL, 1290 PCI_EXP_RTCTL_RRS_SVE); 1291 pdev->config_rrs_sv = 1; 1292 } 1293 } 1294 1295 static unsigned int pci_scan_child_bus_extend(struct pci_bus *bus, 1296 unsigned int available_buses); 1297 /** 1298 * pci_ea_fixed_busnrs() - Read fixed Secondary and Subordinate bus 1299 * numbers from EA capability. 1300 * @dev: Bridge 1301 * @sec: updated with secondary bus number from EA 1302 * @sub: updated with subordinate bus number from EA 1303 * 1304 * If @dev is a bridge with EA capability that specifies valid secondary 1305 * and subordinate bus numbers, return true with the bus numbers in @sec 1306 * and @sub. Otherwise return false. 1307 */ 1308 static bool pci_ea_fixed_busnrs(struct pci_dev *dev, u8 *sec, u8 *sub) 1309 { 1310 int ea, offset; 1311 u32 dw; 1312 u8 ea_sec, ea_sub; 1313 1314 if (dev->hdr_type != PCI_HEADER_TYPE_BRIDGE) 1315 return false; 1316 1317 /* find PCI EA capability in list */ 1318 ea = pci_find_capability(dev, PCI_CAP_ID_EA); 1319 if (!ea) 1320 return false; 1321 1322 offset = ea + PCI_EA_FIRST_ENT; 1323 pci_read_config_dword(dev, offset, &dw); 1324 ea_sec = FIELD_GET(PCI_EA_SEC_BUS_MASK, dw); 1325 ea_sub = FIELD_GET(PCI_EA_SUB_BUS_MASK, dw); 1326 if (ea_sec == 0 || ea_sub < ea_sec) 1327 return false; 1328 1329 *sec = ea_sec; 1330 *sub = ea_sub; 1331 return true; 1332 } 1333 1334 /* 1335 * pci_scan_bridge_extend() - Scan buses behind a bridge 1336 * @bus: Parent bus the bridge is on 1337 * @dev: Bridge itself 1338 * @max: Starting subordinate number of buses behind this bridge 1339 * @available_buses: Total number of buses available for this bridge and 1340 * the devices below. After the minimal bus space has 1341 * been allocated the remaining buses will be 1342 * distributed equally between hotplug-capable bridges. 1343 * @pass: Either %0 (scan already configured bridges) or %1 (scan bridges 1344 * that need to be reconfigured. 1345 * 1346 * If it's a bridge, configure it and scan the bus behind it. 1347 * For CardBus bridges, we don't scan behind as the devices will 1348 * be handled by the bridge driver itself. 1349 * 1350 * We need to process bridges in two passes -- first we scan those 1351 * already configured by the BIOS and after we are done with all of 1352 * them, we proceed to assigning numbers to the remaining buses in 1353 * order to avoid overlaps between old and new bus numbers. 1354 * 1355 * Return: New subordinate number covering all buses behind this bridge. 1356 */ 1357 static int pci_scan_bridge_extend(struct pci_bus *bus, struct pci_dev *dev, 1358 int max, unsigned int available_buses, 1359 int pass) 1360 { 1361 struct pci_bus *child; 1362 int is_cardbus = (dev->hdr_type == PCI_HEADER_TYPE_CARDBUS); 1363 u32 buses, i, j = 0; 1364 u16 bctl; 1365 u8 primary, secondary, subordinate; 1366 int broken = 0; 1367 bool fixed_buses; 1368 u8 fixed_sec, fixed_sub; 1369 int next_busnr; 1370 1371 /* 1372 * Make sure the bridge is powered on to be able to access config 1373 * space of devices below it. 1374 */ 1375 pm_runtime_get_sync(&dev->dev); 1376 1377 pci_read_config_dword(dev, PCI_PRIMARY_BUS, &buses); 1378 primary = buses & 0xFF; 1379 secondary = (buses >> 8) & 0xFF; 1380 subordinate = (buses >> 16) & 0xFF; 1381 1382 pci_dbg(dev, "scanning [bus %02x-%02x] behind bridge, pass %d\n", 1383 secondary, subordinate, pass); 1384 1385 if (!primary && (primary != bus->number) && secondary && subordinate) { 1386 pci_warn(dev, "Primary bus is hard wired to 0\n"); 1387 primary = bus->number; 1388 } 1389 1390 /* Check if setup is sensible at all */ 1391 if (!pass && 1392 (primary != bus->number || secondary <= bus->number || 1393 secondary > subordinate)) { 1394 pci_info(dev, "bridge configuration invalid ([bus %02x-%02x]), reconfiguring\n", 1395 secondary, subordinate); 1396 broken = 1; 1397 } 1398 1399 /* 1400 * Disable Master-Abort Mode during probing to avoid reporting of 1401 * bus errors in some architectures. 1402 */ 1403 pci_read_config_word(dev, PCI_BRIDGE_CONTROL, &bctl); 1404 pci_write_config_word(dev, PCI_BRIDGE_CONTROL, 1405 bctl & ~PCI_BRIDGE_CTL_MASTER_ABORT); 1406 1407 if ((secondary || subordinate) && !pcibios_assign_all_busses() && 1408 !is_cardbus && !broken) { 1409 unsigned int cmax, buses; 1410 1411 /* 1412 * Bus already configured by firmware, process it in the 1413 * first pass and just note the configuration. 1414 */ 1415 if (pass) 1416 goto out; 1417 1418 /* 1419 * The bus might already exist for two reasons: Either we 1420 * are rescanning the bus or the bus is reachable through 1421 * more than one bridge. The second case can happen with 1422 * the i450NX chipset. 1423 */ 1424 child = pci_find_bus(pci_domain_nr(bus), secondary); 1425 if (!child) { 1426 child = pci_add_new_bus(bus, dev, secondary); 1427 if (!child) 1428 goto out; 1429 child->primary = primary; 1430 pci_bus_insert_busn_res(child, secondary, subordinate); 1431 child->bridge_ctl = bctl; 1432 } 1433 1434 buses = subordinate - secondary; 1435 cmax = pci_scan_child_bus_extend(child, buses); 1436 if (cmax > subordinate) 1437 pci_warn(dev, "bridge has subordinate %02x but max busn %02x\n", 1438 subordinate, cmax); 1439 1440 /* Subordinate should equal child->busn_res.end */ 1441 if (subordinate > max) 1442 max = subordinate; 1443 } else { 1444 1445 /* 1446 * We need to assign a number to this bus which we always 1447 * do in the second pass. 1448 */ 1449 if (!pass) { 1450 if (pcibios_assign_all_busses() || broken || is_cardbus) 1451 1452 /* 1453 * Temporarily disable forwarding of the 1454 * configuration cycles on all bridges in 1455 * this bus segment to avoid possible 1456 * conflicts in the second pass between two 1457 * bridges programmed with overlapping bus 1458 * ranges. 1459 */ 1460 pci_write_config_dword(dev, PCI_PRIMARY_BUS, 1461 buses & ~0xffffff); 1462 goto out; 1463 } 1464 1465 /* Clear errors */ 1466 pci_write_config_word(dev, PCI_STATUS, 0xffff); 1467 1468 /* Read bus numbers from EA Capability (if present) */ 1469 fixed_buses = pci_ea_fixed_busnrs(dev, &fixed_sec, &fixed_sub); 1470 if (fixed_buses) 1471 next_busnr = fixed_sec; 1472 else 1473 next_busnr = max + 1; 1474 1475 /* 1476 * Prevent assigning a bus number that already exists. 1477 * This can happen when a bridge is hot-plugged, so in this 1478 * case we only re-scan this bus. 1479 */ 1480 child = pci_find_bus(pci_domain_nr(bus), next_busnr); 1481 if (!child) { 1482 child = pci_add_new_bus(bus, dev, next_busnr); 1483 if (!child) 1484 goto out; 1485 pci_bus_insert_busn_res(child, next_busnr, 1486 bus->busn_res.end); 1487 } 1488 max++; 1489 if (available_buses) 1490 available_buses--; 1491 1492 buses = (buses & 0xff000000) 1493 | ((unsigned int)(child->primary) << 0) 1494 | ((unsigned int)(child->busn_res.start) << 8) 1495 | ((unsigned int)(child->busn_res.end) << 16); 1496 1497 /* 1498 * yenta.c forces a secondary latency timer of 176. 1499 * Copy that behaviour here. 1500 */ 1501 if (is_cardbus) { 1502 buses &= ~0xff000000; 1503 buses |= CARDBUS_LATENCY_TIMER << 24; 1504 } 1505 1506 /* We need to blast all three values with a single write */ 1507 pci_write_config_dword(dev, PCI_PRIMARY_BUS, buses); 1508 1509 if (!is_cardbus) { 1510 child->bridge_ctl = bctl; 1511 max = pci_scan_child_bus_extend(child, available_buses); 1512 } else { 1513 1514 /* 1515 * For CardBus bridges, we leave 4 bus numbers as 1516 * cards with a PCI-to-PCI bridge can be inserted 1517 * later. 1518 */ 1519 for (i = 0; i < CARDBUS_RESERVE_BUSNR; i++) { 1520 struct pci_bus *parent = bus; 1521 if (pci_find_bus(pci_domain_nr(bus), 1522 max+i+1)) 1523 break; 1524 while (parent->parent) { 1525 if ((!pcibios_assign_all_busses()) && 1526 (parent->busn_res.end > max) && 1527 (parent->busn_res.end <= max+i)) { 1528 j = 1; 1529 } 1530 parent = parent->parent; 1531 } 1532 if (j) { 1533 1534 /* 1535 * Often, there are two CardBus 1536 * bridges -- try to leave one 1537 * valid bus number for each one. 1538 */ 1539 i /= 2; 1540 break; 1541 } 1542 } 1543 max += i; 1544 } 1545 1546 /* 1547 * Set subordinate bus number to its real value. 1548 * If fixed subordinate bus number exists from EA 1549 * capability then use it. 1550 */ 1551 if (fixed_buses) 1552 max = fixed_sub; 1553 pci_bus_update_busn_res_end(child, max); 1554 pci_write_config_byte(dev, PCI_SUBORDINATE_BUS, max); 1555 } 1556 1557 sprintf(child->name, 1558 (is_cardbus ? "PCI CardBus %04x:%02x" : "PCI Bus %04x:%02x"), 1559 pci_domain_nr(bus), child->number); 1560 1561 /* Check that all devices are accessible */ 1562 while (bus->parent) { 1563 if ((child->busn_res.end > bus->busn_res.end) || 1564 (child->number > bus->busn_res.end) || 1565 (child->number < bus->number) || 1566 (child->busn_res.end < bus->number)) { 1567 dev_info(&dev->dev, "devices behind bridge are unusable because %pR cannot be assigned for them\n", 1568 &child->busn_res); 1569 break; 1570 } 1571 bus = bus->parent; 1572 } 1573 1574 out: 1575 /* Clear errors in the Secondary Status Register */ 1576 pci_write_config_word(dev, PCI_SEC_STATUS, 0xffff); 1577 1578 pci_write_config_word(dev, PCI_BRIDGE_CONTROL, bctl); 1579 1580 pm_runtime_put(&dev->dev); 1581 1582 return max; 1583 } 1584 1585 /* 1586 * pci_scan_bridge() - Scan buses behind a bridge 1587 * @bus: Parent bus the bridge is on 1588 * @dev: Bridge itself 1589 * @max: Starting subordinate number of buses behind this bridge 1590 * @pass: Either %0 (scan already configured bridges) or %1 (scan bridges 1591 * that need to be reconfigured. 1592 * 1593 * If it's a bridge, configure it and scan the bus behind it. 1594 * For CardBus bridges, we don't scan behind as the devices will 1595 * be handled by the bridge driver itself. 1596 * 1597 * We need to process bridges in two passes -- first we scan those 1598 * already configured by the BIOS and after we are done with all of 1599 * them, we proceed to assigning numbers to the remaining buses in 1600 * order to avoid overlaps between old and new bus numbers. 1601 * 1602 * Return: New subordinate number covering all buses behind this bridge. 1603 */ 1604 int pci_scan_bridge(struct pci_bus *bus, struct pci_dev *dev, int max, int pass) 1605 { 1606 return pci_scan_bridge_extend(bus, dev, max, 0, pass); 1607 } 1608 EXPORT_SYMBOL(pci_scan_bridge); 1609 1610 /* 1611 * Read interrupt line and base address registers. 1612 * The architecture-dependent code can tweak these, of course. 1613 */ 1614 static void pci_read_irq(struct pci_dev *dev) 1615 { 1616 unsigned char irq; 1617 1618 /* VFs are not allowed to use INTx, so skip the config reads */ 1619 if (dev->is_virtfn) { 1620 dev->pin = 0; 1621 dev->irq = 0; 1622 return; 1623 } 1624 1625 pci_read_config_byte(dev, PCI_INTERRUPT_PIN, &irq); 1626 dev->pin = irq; 1627 if (irq) 1628 pci_read_config_byte(dev, PCI_INTERRUPT_LINE, &irq); 1629 dev->irq = irq; 1630 } 1631 1632 void set_pcie_port_type(struct pci_dev *pdev) 1633 { 1634 int pos; 1635 u16 reg16; 1636 u32 reg32; 1637 int type; 1638 struct pci_dev *parent; 1639 1640 pos = pci_find_capability(pdev, PCI_CAP_ID_EXP); 1641 if (!pos) 1642 return; 1643 1644 pdev->pcie_cap = pos; 1645 pci_read_config_word(pdev, pos + PCI_EXP_FLAGS, ®16); 1646 pdev->pcie_flags_reg = reg16; 1647 1648 type = pci_pcie_type(pdev); 1649 if (type == PCI_EXP_TYPE_ROOT_PORT) 1650 pci_enable_rrs_sv(pdev); 1651 1652 pci_read_config_dword(pdev, pos + PCI_EXP_DEVCAP, &pdev->devcap); 1653 pdev->pcie_mpss = FIELD_GET(PCI_EXP_DEVCAP_PAYLOAD, pdev->devcap); 1654 1655 pcie_capability_read_dword(pdev, PCI_EXP_LNKCAP, ®32); 1656 if (reg32 & PCI_EXP_LNKCAP_DLLLARC) 1657 pdev->link_active_reporting = 1; 1658 1659 #ifdef CONFIG_PCIEASPM 1660 if (reg32 & PCI_EXP_LNKCAP_ASPM_L0S) 1661 pdev->aspm_l0s_support = 1; 1662 if (reg32 & PCI_EXP_LNKCAP_ASPM_L1) 1663 pdev->aspm_l1_support = 1; 1664 #endif 1665 1666 parent = pci_upstream_bridge(pdev); 1667 if (!parent) 1668 return; 1669 1670 /* 1671 * Some systems do not identify their upstream/downstream ports 1672 * correctly so detect impossible configurations here and correct 1673 * the port type accordingly. 1674 */ 1675 if (type == PCI_EXP_TYPE_DOWNSTREAM) { 1676 /* 1677 * If pdev claims to be downstream port but the parent 1678 * device is also downstream port assume pdev is actually 1679 * upstream port. 1680 */ 1681 if (pcie_downstream_port(parent)) { 1682 pci_info(pdev, "claims to be downstream port but is acting as upstream port, correcting type\n"); 1683 pdev->pcie_flags_reg &= ~PCI_EXP_FLAGS_TYPE; 1684 pdev->pcie_flags_reg |= PCI_EXP_TYPE_UPSTREAM; 1685 } 1686 } else if (type == PCI_EXP_TYPE_UPSTREAM) { 1687 /* 1688 * If pdev claims to be upstream port but the parent 1689 * device is also upstream port assume pdev is actually 1690 * downstream port. 1691 */ 1692 if (pci_pcie_type(parent) == PCI_EXP_TYPE_UPSTREAM) { 1693 pci_info(pdev, "claims to be upstream port but is acting as downstream port, correcting type\n"); 1694 pdev->pcie_flags_reg &= ~PCI_EXP_FLAGS_TYPE; 1695 pdev->pcie_flags_reg |= PCI_EXP_TYPE_DOWNSTREAM; 1696 } 1697 } 1698 } 1699 1700 void set_pcie_hotplug_bridge(struct pci_dev *pdev) 1701 { 1702 u32 reg32; 1703 1704 pcie_capability_read_dword(pdev, PCI_EXP_SLTCAP, ®32); 1705 if (reg32 & PCI_EXP_SLTCAP_HPC) 1706 pdev->is_hotplug_bridge = pdev->is_pciehp = 1; 1707 } 1708 1709 static void set_pcie_thunderbolt(struct pci_dev *dev) 1710 { 1711 u16 vsec; 1712 1713 /* Is the device part of a Thunderbolt controller? */ 1714 vsec = pci_find_vsec_capability(dev, PCI_VENDOR_ID_INTEL, PCI_VSEC_ID_INTEL_TBT); 1715 if (vsec) 1716 dev->is_thunderbolt = 1; 1717 } 1718 1719 static void set_pcie_untrusted(struct pci_dev *dev) 1720 { 1721 struct pci_dev *parent = pci_upstream_bridge(dev); 1722 1723 if (!parent) 1724 return; 1725 /* 1726 * If the upstream bridge is untrusted we treat this device as 1727 * untrusted as well. 1728 */ 1729 if (parent->untrusted) { 1730 dev->untrusted = true; 1731 return; 1732 } 1733 1734 if (arch_pci_dev_is_removable(dev)) { 1735 pci_dbg(dev, "marking as untrusted\n"); 1736 dev->untrusted = true; 1737 } 1738 } 1739 1740 static void pci_set_removable(struct pci_dev *dev) 1741 { 1742 struct pci_dev *parent = pci_upstream_bridge(dev); 1743 1744 if (!parent) 1745 return; 1746 /* 1747 * We (only) consider everything tunneled below an external_facing 1748 * device to be removable by the user. We're mainly concerned with 1749 * consumer platforms with user accessible thunderbolt ports that are 1750 * vulnerable to DMA attacks, and we expect those ports to be marked by 1751 * the firmware as external_facing. Devices in traditional hotplug 1752 * slots can technically be removed, but the expectation is that unless 1753 * the port is marked with external_facing, such devices are less 1754 * accessible to user / may not be removed by end user, and thus not 1755 * exposed as "removable" to userspace. 1756 */ 1757 if (dev_is_removable(&parent->dev)) { 1758 dev_set_removable(&dev->dev, DEVICE_REMOVABLE); 1759 return; 1760 } 1761 1762 if (arch_pci_dev_is_removable(dev)) { 1763 pci_dbg(dev, "marking as removable\n"); 1764 dev_set_removable(&dev->dev, DEVICE_REMOVABLE); 1765 } 1766 } 1767 1768 /** 1769 * pci_ext_cfg_is_aliased - Is ext config space just an alias of std config? 1770 * @dev: PCI device 1771 * 1772 * PCI Express to PCI/PCI-X Bridge Specification, rev 1.0, 4.1.4 says that 1773 * when forwarding a type1 configuration request the bridge must check that 1774 * the extended register address field is zero. The bridge is not permitted 1775 * to forward the transactions and must handle it as an Unsupported Request. 1776 * Some bridges do not follow this rule and simply drop the extended register 1777 * bits, resulting in the standard config space being aliased, every 256 1778 * bytes across the entire configuration space. Test for this condition by 1779 * comparing the first dword of each potential alias to the vendor/device ID. 1780 * Known offenders: 1781 * ASM1083/1085 PCIe-to-PCI Reversible Bridge (1b21:1080, rev 01 & 03) 1782 * AMD/ATI SBx00 PCI to PCI Bridge (1002:4384, rev 40) 1783 */ 1784 static bool pci_ext_cfg_is_aliased(struct pci_dev *dev) 1785 { 1786 #ifdef CONFIG_PCI_QUIRKS 1787 int pos, ret; 1788 u32 header, tmp; 1789 1790 pci_read_config_dword(dev, PCI_VENDOR_ID, &header); 1791 1792 for (pos = PCI_CFG_SPACE_SIZE; 1793 pos < PCI_CFG_SPACE_EXP_SIZE; pos += PCI_CFG_SPACE_SIZE) { 1794 ret = pci_read_config_dword(dev, pos, &tmp); 1795 if ((ret != PCIBIOS_SUCCESSFUL) || (header != tmp)) 1796 return false; 1797 } 1798 1799 return true; 1800 #else 1801 return false; 1802 #endif 1803 } 1804 1805 /** 1806 * pci_cfg_space_size_ext - Get the configuration space size of the PCI device 1807 * @dev: PCI device 1808 * 1809 * Regular PCI devices have 256 bytes, but PCI-X 2 and PCI Express devices 1810 * have 4096 bytes. Even if the device is capable, that doesn't mean we can 1811 * access it. Maybe we don't have a way to generate extended config space 1812 * accesses, or the device is behind a reverse Express bridge. So we try 1813 * reading the dword at 0x100 which must either be 0 or a valid extended 1814 * capability header. 1815 */ 1816 static int pci_cfg_space_size_ext(struct pci_dev *dev) 1817 { 1818 u32 status; 1819 int pos = PCI_CFG_SPACE_SIZE; 1820 1821 if (pci_read_config_dword(dev, pos, &status) != PCIBIOS_SUCCESSFUL) 1822 return PCI_CFG_SPACE_SIZE; 1823 if (PCI_POSSIBLE_ERROR(status) || pci_ext_cfg_is_aliased(dev)) 1824 return PCI_CFG_SPACE_SIZE; 1825 1826 return PCI_CFG_SPACE_EXP_SIZE; 1827 } 1828 1829 int pci_cfg_space_size(struct pci_dev *dev) 1830 { 1831 int pos; 1832 u32 status; 1833 u16 class; 1834 1835 #ifdef CONFIG_PCI_IOV 1836 /* 1837 * Per the SR-IOV specification (rev 1.1, sec 3.5), VFs are required to 1838 * implement a PCIe capability and therefore must implement extended 1839 * config space. We can skip the NO_EXTCFG test below and the 1840 * reachability/aliasing test in pci_cfg_space_size_ext() by virtue of 1841 * the fact that the SR-IOV capability on the PF resides in extended 1842 * config space and must be accessible and non-aliased to have enabled 1843 * support for this VF. This is a micro performance optimization for 1844 * systems supporting many VFs. 1845 */ 1846 if (dev->is_virtfn) 1847 return PCI_CFG_SPACE_EXP_SIZE; 1848 #endif 1849 1850 if (dev->bus->bus_flags & PCI_BUS_FLAGS_NO_EXTCFG) 1851 return PCI_CFG_SPACE_SIZE; 1852 1853 class = dev->class >> 8; 1854 if (class == PCI_CLASS_BRIDGE_HOST) 1855 return pci_cfg_space_size_ext(dev); 1856 1857 if (pci_is_pcie(dev)) 1858 return pci_cfg_space_size_ext(dev); 1859 1860 pos = pci_find_capability(dev, PCI_CAP_ID_PCIX); 1861 if (!pos) 1862 return PCI_CFG_SPACE_SIZE; 1863 1864 pci_read_config_dword(dev, pos + PCI_X_STATUS, &status); 1865 if (status & (PCI_X_STATUS_266MHZ | PCI_X_STATUS_533MHZ)) 1866 return pci_cfg_space_size_ext(dev); 1867 1868 return PCI_CFG_SPACE_SIZE; 1869 } 1870 1871 static u32 pci_class(struct pci_dev *dev) 1872 { 1873 u32 class; 1874 1875 #ifdef CONFIG_PCI_IOV 1876 if (dev->is_virtfn) 1877 return dev->physfn->sriov->class; 1878 #endif 1879 pci_read_config_dword(dev, PCI_CLASS_REVISION, &class); 1880 return class; 1881 } 1882 1883 static void pci_subsystem_ids(struct pci_dev *dev, u16 *vendor, u16 *device) 1884 { 1885 #ifdef CONFIG_PCI_IOV 1886 if (dev->is_virtfn) { 1887 *vendor = dev->physfn->sriov->subsystem_vendor; 1888 *device = dev->physfn->sriov->subsystem_device; 1889 return; 1890 } 1891 #endif 1892 pci_read_config_word(dev, PCI_SUBSYSTEM_VENDOR_ID, vendor); 1893 pci_read_config_word(dev, PCI_SUBSYSTEM_ID, device); 1894 } 1895 1896 static u8 pci_hdr_type(struct pci_dev *dev) 1897 { 1898 u8 hdr_type; 1899 1900 #ifdef CONFIG_PCI_IOV 1901 if (dev->is_virtfn) 1902 return dev->physfn->sriov->hdr_type; 1903 #endif 1904 pci_read_config_byte(dev, PCI_HEADER_TYPE, &hdr_type); 1905 return hdr_type; 1906 } 1907 1908 #define LEGACY_IO_RESOURCE (IORESOURCE_IO | IORESOURCE_PCI_FIXED) 1909 1910 /** 1911 * pci_intx_mask_broken - Test PCI_COMMAND_INTX_DISABLE writability 1912 * @dev: PCI device 1913 * 1914 * Test whether PCI_COMMAND_INTX_DISABLE is writable for @dev. Check this 1915 * at enumeration-time to avoid modifying PCI_COMMAND at run-time. 1916 */ 1917 static int pci_intx_mask_broken(struct pci_dev *dev) 1918 { 1919 u16 orig, toggle, new; 1920 1921 pci_read_config_word(dev, PCI_COMMAND, &orig); 1922 toggle = orig ^ PCI_COMMAND_INTX_DISABLE; 1923 pci_write_config_word(dev, PCI_COMMAND, toggle); 1924 pci_read_config_word(dev, PCI_COMMAND, &new); 1925 1926 pci_write_config_word(dev, PCI_COMMAND, orig); 1927 1928 /* 1929 * PCI_COMMAND_INTX_DISABLE was reserved and read-only prior to PCI 1930 * r2.3, so strictly speaking, a device is not *broken* if it's not 1931 * writable. But we'll live with the misnomer for now. 1932 */ 1933 if (new != toggle) 1934 return 1; 1935 return 0; 1936 } 1937 1938 static void early_dump_pci_device(struct pci_dev *pdev) 1939 { 1940 u32 value[PCI_CFG_SPACE_SIZE / sizeof(u32)]; 1941 int i; 1942 1943 pci_info(pdev, "config space:\n"); 1944 1945 for (i = 0; i < ARRAY_SIZE(value); i++) 1946 pci_read_config_dword(pdev, i * sizeof(u32), &value[i]); 1947 1948 print_hex_dump(KERN_INFO, "", DUMP_PREFIX_OFFSET, 16, 1, 1949 value, ARRAY_SIZE(value) * sizeof(u32), false); 1950 } 1951 1952 static const char *pci_type_str(struct pci_dev *dev) 1953 { 1954 static const char * const str[] = { 1955 "PCIe Endpoint", 1956 "PCIe Legacy Endpoint", 1957 "PCIe unknown", 1958 "PCIe unknown", 1959 "PCIe Root Port", 1960 "PCIe Switch Upstream Port", 1961 "PCIe Switch Downstream Port", 1962 "PCIe to PCI/PCI-X bridge", 1963 "PCI/PCI-X to PCIe bridge", 1964 "PCIe Root Complex Integrated Endpoint", 1965 "PCIe Root Complex Event Collector", 1966 }; 1967 int type; 1968 1969 if (pci_is_pcie(dev)) { 1970 type = pci_pcie_type(dev); 1971 if (type < ARRAY_SIZE(str)) 1972 return str[type]; 1973 1974 return "PCIe unknown"; 1975 } 1976 1977 switch (dev->hdr_type) { 1978 case PCI_HEADER_TYPE_NORMAL: 1979 return "conventional PCI endpoint"; 1980 case PCI_HEADER_TYPE_BRIDGE: 1981 return "conventional PCI bridge"; 1982 case PCI_HEADER_TYPE_CARDBUS: 1983 return "CardBus bridge"; 1984 default: 1985 return "conventional PCI"; 1986 } 1987 } 1988 1989 /** 1990 * pci_setup_device - Fill in class and map information of a device 1991 * @dev: the device structure to fill 1992 * 1993 * Initialize the device structure with information about the device's 1994 * vendor,class,memory and IO-space addresses, IRQ lines etc. 1995 * Called at initialisation of the PCI subsystem and by CardBus services. 1996 * Returns 0 on success and negative if unknown type of device (not normal, 1997 * bridge or CardBus). 1998 */ 1999 int pci_setup_device(struct pci_dev *dev) 2000 { 2001 u32 class; 2002 u16 cmd; 2003 u8 hdr_type; 2004 int err, pos = 0; 2005 struct pci_bus_region region; 2006 struct resource *res; 2007 2008 hdr_type = pci_hdr_type(dev); 2009 2010 dev->sysdata = dev->bus->sysdata; 2011 dev->dev.parent = dev->bus->bridge; 2012 dev->dev.bus = &pci_bus_type; 2013 dev->hdr_type = FIELD_GET(PCI_HEADER_TYPE_MASK, hdr_type); 2014 dev->multifunction = FIELD_GET(PCI_HEADER_TYPE_MFD, hdr_type); 2015 dev->error_state = pci_channel_io_normal; 2016 set_pcie_port_type(dev); 2017 2018 err = pci_set_of_node(dev); 2019 if (err) 2020 return err; 2021 pci_set_acpi_fwnode(dev); 2022 2023 pci_dev_assign_slot(dev); 2024 2025 /* 2026 * Assume 32-bit PCI; let 64-bit PCI cards (which are far rarer) 2027 * set this higher, assuming the system even supports it. 2028 */ 2029 dev->dma_mask = 0xffffffff; 2030 2031 dev_set_name(&dev->dev, "%04x:%02x:%02x.%d", pci_domain_nr(dev->bus), 2032 dev->bus->number, PCI_SLOT(dev->devfn), 2033 PCI_FUNC(dev->devfn)); 2034 2035 class = pci_class(dev); 2036 2037 dev->revision = class & 0xff; 2038 dev->class = class >> 8; /* upper 3 bytes */ 2039 2040 if (pci_early_dump) 2041 early_dump_pci_device(dev); 2042 2043 /* Need to have dev->class ready */ 2044 dev->cfg_size = pci_cfg_space_size(dev); 2045 2046 /* Need to have dev->cfg_size ready */ 2047 set_pcie_thunderbolt(dev); 2048 2049 set_pcie_untrusted(dev); 2050 2051 if (pci_is_pcie(dev)) 2052 dev->supported_speeds = pcie_get_supported_speeds(dev); 2053 2054 /* "Unknown power state" */ 2055 dev->current_state = PCI_UNKNOWN; 2056 2057 /* Early fixups, before probing the BARs */ 2058 pci_fixup_device(pci_fixup_early, dev); 2059 2060 pci_set_removable(dev); 2061 2062 pci_info(dev, "[%04x:%04x] type %02x class %#08x %s\n", 2063 dev->vendor, dev->device, dev->hdr_type, dev->class, 2064 pci_type_str(dev)); 2065 2066 /* Device class may be changed after fixup */ 2067 class = dev->class >> 8; 2068 2069 if (dev->non_compliant_bars && !dev->mmio_always_on) { 2070 pci_read_config_word(dev, PCI_COMMAND, &cmd); 2071 if (cmd & (PCI_COMMAND_IO | PCI_COMMAND_MEMORY)) { 2072 pci_info(dev, "device has non-compliant BARs; disabling IO/MEM decoding\n"); 2073 cmd &= ~PCI_COMMAND_IO; 2074 cmd &= ~PCI_COMMAND_MEMORY; 2075 pci_write_config_word(dev, PCI_COMMAND, cmd); 2076 } 2077 } 2078 2079 dev->broken_intx_masking = pci_intx_mask_broken(dev); 2080 2081 switch (dev->hdr_type) { /* header type */ 2082 case PCI_HEADER_TYPE_NORMAL: /* standard header */ 2083 if (class == PCI_CLASS_BRIDGE_PCI) 2084 goto bad; 2085 pci_read_irq(dev); 2086 pci_read_bases(dev, PCI_STD_NUM_BARS, PCI_ROM_ADDRESS); 2087 2088 pci_subsystem_ids(dev, &dev->subsystem_vendor, &dev->subsystem_device); 2089 2090 /* 2091 * Do the ugly legacy mode stuff here rather than broken chip 2092 * quirk code. Legacy mode ATA controllers have fixed 2093 * addresses. These are not always echoed in BAR0-3, and 2094 * BAR0-3 in a few cases contain junk! 2095 */ 2096 if (class == PCI_CLASS_STORAGE_IDE) { 2097 u8 progif; 2098 pci_read_config_byte(dev, PCI_CLASS_PROG, &progif); 2099 if ((progif & 1) == 0) { 2100 region.start = 0x1F0; 2101 region.end = 0x1F7; 2102 res = &dev->resource[0]; 2103 res->flags = LEGACY_IO_RESOURCE; 2104 pcibios_bus_to_resource(dev->bus, res, ®ion); 2105 pci_info(dev, "BAR 0 %pR: legacy IDE quirk\n", 2106 res); 2107 region.start = 0x3F6; 2108 region.end = 0x3F6; 2109 res = &dev->resource[1]; 2110 res->flags = LEGACY_IO_RESOURCE; 2111 pcibios_bus_to_resource(dev->bus, res, ®ion); 2112 pci_info(dev, "BAR 1 %pR: legacy IDE quirk\n", 2113 res); 2114 } 2115 if ((progif & 4) == 0) { 2116 region.start = 0x170; 2117 region.end = 0x177; 2118 res = &dev->resource[2]; 2119 res->flags = LEGACY_IO_RESOURCE; 2120 pcibios_bus_to_resource(dev->bus, res, ®ion); 2121 pci_info(dev, "BAR 2 %pR: legacy IDE quirk\n", 2122 res); 2123 region.start = 0x376; 2124 region.end = 0x376; 2125 res = &dev->resource[3]; 2126 res->flags = LEGACY_IO_RESOURCE; 2127 pcibios_bus_to_resource(dev->bus, res, ®ion); 2128 pci_info(dev, "BAR 3 %pR: legacy IDE quirk\n", 2129 res); 2130 } 2131 } 2132 break; 2133 2134 case PCI_HEADER_TYPE_BRIDGE: /* bridge header */ 2135 /* 2136 * The PCI-to-PCI bridge spec requires that subtractive 2137 * decoding (i.e. transparent) bridge must have programming 2138 * interface code of 0x01. 2139 */ 2140 pci_read_irq(dev); 2141 dev->transparent = ((dev->class & 0xff) == 1); 2142 pci_read_bases(dev, 2, PCI_ROM_ADDRESS1); 2143 pci_read_bridge_windows(dev); 2144 set_pcie_hotplug_bridge(dev); 2145 pos = pci_find_capability(dev, PCI_CAP_ID_SSVID); 2146 if (pos) { 2147 pci_read_config_word(dev, pos + PCI_SSVID_VENDOR_ID, &dev->subsystem_vendor); 2148 pci_read_config_word(dev, pos + PCI_SSVID_DEVICE_ID, &dev->subsystem_device); 2149 } 2150 break; 2151 2152 case PCI_HEADER_TYPE_CARDBUS: /* CardBus bridge header */ 2153 if (class != PCI_CLASS_BRIDGE_CARDBUS) 2154 goto bad; 2155 pci_read_irq(dev); 2156 pci_read_bases(dev, 1, 0); 2157 pci_read_config_word(dev, PCI_CB_SUBSYSTEM_VENDOR_ID, &dev->subsystem_vendor); 2158 pci_read_config_word(dev, PCI_CB_SUBSYSTEM_ID, &dev->subsystem_device); 2159 break; 2160 2161 default: /* unknown header */ 2162 pci_err(dev, "unknown header type %02x, ignoring device\n", 2163 dev->hdr_type); 2164 pci_release_of_node(dev); 2165 return -EIO; 2166 2167 bad: 2168 pci_err(dev, "ignoring class %#08x (doesn't match header type %02x)\n", 2169 dev->class, dev->hdr_type); 2170 dev->class = PCI_CLASS_NOT_DEFINED << 8; 2171 } 2172 2173 /* We found a fine healthy device, go go go... */ 2174 return 0; 2175 } 2176 2177 static void pci_configure_mps(struct pci_dev *dev) 2178 { 2179 struct pci_dev *bridge = pci_upstream_bridge(dev); 2180 int mps, mpss, p_mps, rc; 2181 2182 if (!pci_is_pcie(dev)) 2183 return; 2184 2185 /* MPS and MRRS fields are of type 'RsvdP' for VFs, short-circuit out */ 2186 if (dev->is_virtfn) 2187 return; 2188 2189 /* 2190 * For Root Complex Integrated Endpoints, program the maximum 2191 * supported value unless limited by the PCIE_BUS_PEER2PEER case. 2192 */ 2193 if (pci_pcie_type(dev) == PCI_EXP_TYPE_RC_END) { 2194 if (pcie_bus_config == PCIE_BUS_PEER2PEER) 2195 mps = 128; 2196 else 2197 mps = 128 << dev->pcie_mpss; 2198 rc = pcie_set_mps(dev, mps); 2199 if (rc) { 2200 pci_warn(dev, "can't set Max Payload Size to %d; if necessary, use \"pci=pcie_bus_safe\" and report a bug\n", 2201 mps); 2202 } 2203 return; 2204 } 2205 2206 if (!bridge || !pci_is_pcie(bridge)) 2207 return; 2208 2209 mps = pcie_get_mps(dev); 2210 p_mps = pcie_get_mps(bridge); 2211 2212 if (mps == p_mps) 2213 return; 2214 2215 if (pcie_bus_config == PCIE_BUS_TUNE_OFF) { 2216 pci_warn(dev, "Max Payload Size %d, but upstream %s set to %d; if necessary, use \"pci=pcie_bus_safe\" and report a bug\n", 2217 mps, pci_name(bridge), p_mps); 2218 return; 2219 } 2220 2221 /* 2222 * Fancier MPS configuration is done later by 2223 * pcie_bus_configure_settings() 2224 */ 2225 if (pcie_bus_config != PCIE_BUS_DEFAULT) 2226 return; 2227 2228 mpss = 128 << dev->pcie_mpss; 2229 if (mpss < p_mps && pci_pcie_type(bridge) == PCI_EXP_TYPE_ROOT_PORT) { 2230 pcie_set_mps(bridge, mpss); 2231 pci_info(dev, "Upstream bridge's Max Payload Size set to %d (was %d, max %d)\n", 2232 mpss, p_mps, 128 << bridge->pcie_mpss); 2233 p_mps = pcie_get_mps(bridge); 2234 } 2235 2236 rc = pcie_set_mps(dev, p_mps); 2237 if (rc) { 2238 pci_warn(dev, "can't set Max Payload Size to %d; if necessary, use \"pci=pcie_bus_safe\" and report a bug\n", 2239 p_mps); 2240 return; 2241 } 2242 2243 pci_info(dev, "Max Payload Size set to %d (was %d, max %d)\n", 2244 p_mps, mps, mpss); 2245 } 2246 2247 int pci_configure_extended_tags(struct pci_dev *dev, void *ign) 2248 { 2249 struct pci_host_bridge *host; 2250 u32 cap; 2251 u16 ctl; 2252 int ret; 2253 2254 if (!pci_is_pcie(dev)) 2255 return 0; 2256 2257 ret = pcie_capability_read_dword(dev, PCI_EXP_DEVCAP, &cap); 2258 if (ret) 2259 return 0; 2260 2261 if (!(cap & PCI_EXP_DEVCAP_EXT_TAG)) 2262 return 0; 2263 2264 ret = pcie_capability_read_word(dev, PCI_EXP_DEVCTL, &ctl); 2265 if (ret) 2266 return 0; 2267 2268 host = pci_find_host_bridge(dev->bus); 2269 if (!host) 2270 return 0; 2271 2272 /* 2273 * If some device in the hierarchy doesn't handle Extended Tags 2274 * correctly, make sure they're disabled. 2275 */ 2276 if (host->no_ext_tags) { 2277 if (ctl & PCI_EXP_DEVCTL_EXT_TAG) { 2278 pci_info(dev, "disabling Extended Tags\n"); 2279 pcie_capability_clear_word(dev, PCI_EXP_DEVCTL, 2280 PCI_EXP_DEVCTL_EXT_TAG); 2281 } 2282 return 0; 2283 } 2284 2285 if (!(ctl & PCI_EXP_DEVCTL_EXT_TAG)) { 2286 pci_info(dev, "enabling Extended Tags\n"); 2287 pcie_capability_set_word(dev, PCI_EXP_DEVCTL, 2288 PCI_EXP_DEVCTL_EXT_TAG); 2289 } 2290 return 0; 2291 } 2292 2293 /** 2294 * pcie_relaxed_ordering_enabled - Probe for PCIe relaxed ordering enable 2295 * @dev: PCI device to query 2296 * 2297 * Returns true if the device has enabled relaxed ordering attribute. 2298 */ 2299 bool pcie_relaxed_ordering_enabled(struct pci_dev *dev) 2300 { 2301 u16 v; 2302 2303 pcie_capability_read_word(dev, PCI_EXP_DEVCTL, &v); 2304 2305 return !!(v & PCI_EXP_DEVCTL_RELAX_EN); 2306 } 2307 EXPORT_SYMBOL(pcie_relaxed_ordering_enabled); 2308 2309 static void pci_configure_relaxed_ordering(struct pci_dev *dev) 2310 { 2311 struct pci_dev *root; 2312 2313 /* PCI_EXP_DEVCTL_RELAX_EN is RsvdP in VFs */ 2314 if (dev->is_virtfn) 2315 return; 2316 2317 if (!pcie_relaxed_ordering_enabled(dev)) 2318 return; 2319 2320 /* 2321 * For now, we only deal with Relaxed Ordering issues with Root 2322 * Ports. Peer-to-Peer DMA is another can of worms. 2323 */ 2324 root = pcie_find_root_port(dev); 2325 if (!root) 2326 return; 2327 2328 if (root->dev_flags & PCI_DEV_FLAGS_NO_RELAXED_ORDERING) { 2329 pcie_capability_clear_word(dev, PCI_EXP_DEVCTL, 2330 PCI_EXP_DEVCTL_RELAX_EN); 2331 pci_info(dev, "Relaxed Ordering disabled because the Root Port didn't support it\n"); 2332 } 2333 } 2334 2335 static void pci_configure_eetlp_prefix(struct pci_dev *dev) 2336 { 2337 struct pci_dev *bridge; 2338 unsigned int eetlp_max; 2339 int pcie_type; 2340 u32 cap; 2341 2342 if (!pci_is_pcie(dev)) 2343 return; 2344 2345 pcie_capability_read_dword(dev, PCI_EXP_DEVCAP2, &cap); 2346 if (!(cap & PCI_EXP_DEVCAP2_EE_PREFIX)) 2347 return; 2348 2349 pcie_type = pci_pcie_type(dev); 2350 2351 eetlp_max = FIELD_GET(PCI_EXP_DEVCAP2_EE_PREFIX_MAX, cap); 2352 /* 00b means 4 */ 2353 eetlp_max = eetlp_max ?: 4; 2354 2355 if (pcie_type == PCI_EXP_TYPE_ROOT_PORT || 2356 pcie_type == PCI_EXP_TYPE_RC_END) 2357 dev->eetlp_prefix_max = eetlp_max; 2358 else { 2359 bridge = pci_upstream_bridge(dev); 2360 if (bridge && bridge->eetlp_prefix_max) 2361 dev->eetlp_prefix_max = eetlp_max; 2362 } 2363 } 2364 2365 static void pci_configure_serr(struct pci_dev *dev) 2366 { 2367 u16 control; 2368 2369 if (dev->hdr_type == PCI_HEADER_TYPE_BRIDGE) { 2370 2371 /* 2372 * A bridge will not forward ERR_ messages coming from an 2373 * endpoint unless SERR# forwarding is enabled. 2374 */ 2375 pci_read_config_word(dev, PCI_BRIDGE_CONTROL, &control); 2376 if (!(control & PCI_BRIDGE_CTL_SERR)) { 2377 control |= PCI_BRIDGE_CTL_SERR; 2378 pci_write_config_word(dev, PCI_BRIDGE_CONTROL, control); 2379 } 2380 } 2381 } 2382 2383 static void pci_configure_device(struct pci_dev *dev) 2384 { 2385 pci_configure_mps(dev); 2386 pci_configure_extended_tags(dev, NULL); 2387 pci_configure_relaxed_ordering(dev); 2388 pci_configure_ltr(dev); 2389 pci_configure_aspm_l1ss(dev); 2390 pci_configure_eetlp_prefix(dev); 2391 pci_configure_serr(dev); 2392 2393 pci_acpi_program_hp_params(dev); 2394 } 2395 2396 static void pci_release_capabilities(struct pci_dev *dev) 2397 { 2398 pci_aer_exit(dev); 2399 pci_rcec_exit(dev); 2400 pci_iov_release(dev); 2401 pci_free_cap_save_buffers(dev); 2402 } 2403 2404 /** 2405 * pci_release_dev - Free a PCI device structure when all users of it are 2406 * finished 2407 * @dev: device that's been disconnected 2408 * 2409 * Will be called only by the device core when all users of this PCI device are 2410 * done. 2411 */ 2412 static void pci_release_dev(struct device *dev) 2413 { 2414 struct pci_dev *pci_dev; 2415 2416 pci_dev = to_pci_dev(dev); 2417 pci_release_capabilities(pci_dev); 2418 pci_release_of_node(pci_dev); 2419 pcibios_release_device(pci_dev); 2420 pci_bus_put(pci_dev->bus); 2421 kfree(pci_dev->driver_override); 2422 bitmap_free(pci_dev->dma_alias_mask); 2423 dev_dbg(dev, "device released\n"); 2424 kfree(pci_dev); 2425 } 2426 2427 static const struct device_type pci_dev_type = { 2428 .groups = pci_dev_attr_groups, 2429 }; 2430 2431 struct pci_dev *pci_alloc_dev(struct pci_bus *bus) 2432 { 2433 struct pci_dev *dev; 2434 2435 dev = kzalloc(sizeof(struct pci_dev), GFP_KERNEL); 2436 if (!dev) 2437 return NULL; 2438 2439 INIT_LIST_HEAD(&dev->bus_list); 2440 dev->dev.type = &pci_dev_type; 2441 dev->bus = pci_bus_get(bus); 2442 dev->driver_exclusive_resource = (struct resource) { 2443 .name = "PCI Exclusive", 2444 .start = 0, 2445 .end = -1, 2446 }; 2447 2448 spin_lock_init(&dev->pcie_cap_lock); 2449 #ifdef CONFIG_PCI_MSI 2450 raw_spin_lock_init(&dev->msi_lock); 2451 #endif 2452 return dev; 2453 } 2454 EXPORT_SYMBOL(pci_alloc_dev); 2455 2456 static bool pci_bus_wait_rrs(struct pci_bus *bus, int devfn, u32 *l, 2457 int timeout) 2458 { 2459 int delay = 1; 2460 2461 if (!pci_bus_rrs_vendor_id(*l)) 2462 return true; /* not a Configuration RRS completion */ 2463 2464 if (!timeout) 2465 return false; /* RRS, but caller doesn't want to wait */ 2466 2467 /* 2468 * We got the reserved Vendor ID that indicates a completion with 2469 * Configuration Request Retry Status (RRS). Retry until we get a 2470 * valid Vendor ID or we time out. 2471 */ 2472 while (pci_bus_rrs_vendor_id(*l)) { 2473 if (delay > timeout) { 2474 pr_warn("pci %04x:%02x:%02x.%d: not ready after %dms; giving up\n", 2475 pci_domain_nr(bus), bus->number, 2476 PCI_SLOT(devfn), PCI_FUNC(devfn), delay - 1); 2477 2478 return false; 2479 } 2480 if (delay >= 1000) 2481 pr_info("pci %04x:%02x:%02x.%d: not ready after %dms; waiting\n", 2482 pci_domain_nr(bus), bus->number, 2483 PCI_SLOT(devfn), PCI_FUNC(devfn), delay - 1); 2484 2485 msleep(delay); 2486 delay *= 2; 2487 2488 if (pci_bus_read_config_dword(bus, devfn, PCI_VENDOR_ID, l)) 2489 return false; 2490 } 2491 2492 if (delay >= 1000) 2493 pr_info("pci %04x:%02x:%02x.%d: ready after %dms\n", 2494 pci_domain_nr(bus), bus->number, 2495 PCI_SLOT(devfn), PCI_FUNC(devfn), delay - 1); 2496 2497 return true; 2498 } 2499 2500 bool pci_bus_generic_read_dev_vendor_id(struct pci_bus *bus, int devfn, u32 *l, 2501 int timeout) 2502 { 2503 if (pci_bus_read_config_dword(bus, devfn, PCI_VENDOR_ID, l)) 2504 return false; 2505 2506 /* Some broken boards return 0 or ~0 (PCI_ERROR_RESPONSE) if a slot is empty: */ 2507 if (PCI_POSSIBLE_ERROR(*l) || *l == 0x00000000 || 2508 *l == 0x0000ffff || *l == 0xffff0000) 2509 return false; 2510 2511 if (pci_bus_rrs_vendor_id(*l)) 2512 return pci_bus_wait_rrs(bus, devfn, l, timeout); 2513 2514 return true; 2515 } 2516 2517 bool pci_bus_read_dev_vendor_id(struct pci_bus *bus, int devfn, u32 *l, 2518 int timeout) 2519 { 2520 #ifdef CONFIG_PCI_QUIRKS 2521 struct pci_dev *bridge = bus->self; 2522 2523 /* 2524 * Certain IDT switches have an issue where they improperly trigger 2525 * ACS Source Validation errors on completions for config reads. 2526 */ 2527 if (bridge && bridge->vendor == PCI_VENDOR_ID_IDT && 2528 bridge->device == 0x80b5) 2529 return pci_idt_bus_quirk(bus, devfn, l, timeout); 2530 #endif 2531 2532 return pci_bus_generic_read_dev_vendor_id(bus, devfn, l, timeout); 2533 } 2534 EXPORT_SYMBOL(pci_bus_read_dev_vendor_id); 2535 2536 #if IS_ENABLED(CONFIG_PCI_PWRCTRL) 2537 static struct platform_device *pci_pwrctrl_create_device(struct pci_bus *bus, int devfn) 2538 { 2539 struct pci_host_bridge *host = pci_find_host_bridge(bus); 2540 struct platform_device *pdev; 2541 struct device_node *np; 2542 2543 np = of_pci_find_child_device(dev_of_node(&bus->dev), devfn); 2544 if (!np) 2545 return NULL; 2546 2547 pdev = of_find_device_by_node(np); 2548 if (pdev) { 2549 put_device(&pdev->dev); 2550 goto err_put_of_node; 2551 } 2552 2553 /* 2554 * First check whether the pwrctrl device really needs to be created or 2555 * not. This is decided based on at least one of the power supplies 2556 * being defined in the devicetree node of the device. 2557 */ 2558 if (!of_pci_supply_present(np)) { 2559 pr_debug("PCI/pwrctrl: Skipping OF node: %s\n", np->name); 2560 goto err_put_of_node; 2561 } 2562 2563 /* Now create the pwrctrl device */ 2564 pdev = of_platform_device_create(np, NULL, &host->dev); 2565 if (!pdev) { 2566 pr_err("PCI/pwrctrl: Failed to create pwrctrl device for node: %s\n", np->name); 2567 goto err_put_of_node; 2568 } 2569 2570 of_node_put(np); 2571 2572 return pdev; 2573 2574 err_put_of_node: 2575 of_node_put(np); 2576 2577 return NULL; 2578 } 2579 #else 2580 static struct platform_device *pci_pwrctrl_create_device(struct pci_bus *bus, int devfn) 2581 { 2582 return NULL; 2583 } 2584 #endif 2585 2586 /* 2587 * Read the config data for a PCI device, sanity-check it, 2588 * and fill in the dev structure. 2589 */ 2590 static struct pci_dev *pci_scan_device(struct pci_bus *bus, int devfn) 2591 { 2592 struct pci_dev *dev; 2593 u32 l; 2594 2595 /* 2596 * Create pwrctrl device (if required) for the PCI device to handle the 2597 * power state. If the pwrctrl device is created, then skip scanning 2598 * further as the pwrctrl core will rescan the bus after powering on 2599 * the device. 2600 */ 2601 if (pci_pwrctrl_create_device(bus, devfn)) 2602 return NULL; 2603 2604 if (!pci_bus_read_dev_vendor_id(bus, devfn, &l, 60*1000)) 2605 return NULL; 2606 2607 dev = pci_alloc_dev(bus); 2608 if (!dev) 2609 return NULL; 2610 2611 dev->devfn = devfn; 2612 dev->vendor = l & 0xffff; 2613 dev->device = (l >> 16) & 0xffff; 2614 2615 if (pci_setup_device(dev)) { 2616 pci_bus_put(dev->bus); 2617 kfree(dev); 2618 return NULL; 2619 } 2620 2621 return dev; 2622 } 2623 2624 void pcie_report_downtraining(struct pci_dev *dev) 2625 { 2626 if (!pci_is_pcie(dev)) 2627 return; 2628 2629 /* Look from the device up to avoid downstream ports with no devices */ 2630 if ((pci_pcie_type(dev) != PCI_EXP_TYPE_ENDPOINT) && 2631 (pci_pcie_type(dev) != PCI_EXP_TYPE_LEG_END) && 2632 (pci_pcie_type(dev) != PCI_EXP_TYPE_UPSTREAM)) 2633 return; 2634 2635 /* Multi-function PCIe devices share the same link/status */ 2636 if (PCI_FUNC(dev->devfn) != 0 || dev->is_virtfn) 2637 return; 2638 2639 /* Print link status only if the device is constrained by the fabric */ 2640 __pcie_print_link_status(dev, false); 2641 } 2642 2643 static void pci_imm_ready_init(struct pci_dev *dev) 2644 { 2645 u16 status; 2646 2647 pci_read_config_word(dev, PCI_STATUS, &status); 2648 if (status & PCI_STATUS_IMM_READY) 2649 dev->imm_ready = 1; 2650 } 2651 2652 static void pci_init_capabilities(struct pci_dev *dev) 2653 { 2654 pci_ea_init(dev); /* Enhanced Allocation */ 2655 pci_msi_init(dev); /* Disable MSI */ 2656 pci_msix_init(dev); /* Disable MSI-X */ 2657 2658 /* Buffers for saving PCIe and PCI-X capabilities */ 2659 pci_allocate_cap_save_buffers(dev); 2660 2661 pci_imm_ready_init(dev); /* Immediate Readiness */ 2662 pci_pm_init(dev); /* Power Management */ 2663 pci_vpd_init(dev); /* Vital Product Data */ 2664 pci_configure_ari(dev); /* Alternative Routing-ID Forwarding */ 2665 pci_iov_init(dev); /* Single Root I/O Virtualization */ 2666 pci_ats_init(dev); /* Address Translation Services */ 2667 pci_pri_init(dev); /* Page Request Interface */ 2668 pci_pasid_init(dev); /* Process Address Space ID */ 2669 pci_acs_init(dev); /* Access Control Services */ 2670 pci_ptm_init(dev); /* Precision Time Measurement */ 2671 pci_aer_init(dev); /* Advanced Error Reporting */ 2672 pci_dpc_init(dev); /* Downstream Port Containment */ 2673 pci_rcec_init(dev); /* Root Complex Event Collector */ 2674 pci_doe_init(dev); /* Data Object Exchange */ 2675 pci_tph_init(dev); /* TLP Processing Hints */ 2676 pci_rebar_init(dev); /* Resizable BAR */ 2677 2678 pcie_report_downtraining(dev); 2679 pci_init_reset_methods(dev); 2680 } 2681 2682 /* 2683 * This is the equivalent of pci_host_bridge_msi_domain() that acts on 2684 * devices. Firmware interfaces that can select the MSI domain on a 2685 * per-device basis should be called from here. 2686 */ 2687 static struct irq_domain *pci_dev_msi_domain(struct pci_dev *dev) 2688 { 2689 struct irq_domain *d; 2690 2691 /* 2692 * If a domain has been set through the pcibios_device_add() 2693 * callback, then this is the one (platform code knows best). 2694 */ 2695 d = dev_get_msi_domain(&dev->dev); 2696 if (d) 2697 return d; 2698 2699 /* 2700 * Let's see if we have a firmware interface able to provide 2701 * the domain. 2702 */ 2703 d = pci_msi_get_device_domain(dev); 2704 if (d) 2705 return d; 2706 2707 return NULL; 2708 } 2709 2710 static void pci_set_msi_domain(struct pci_dev *dev) 2711 { 2712 struct irq_domain *d; 2713 2714 /* 2715 * If the platform or firmware interfaces cannot supply a 2716 * device-specific MSI domain, then inherit the default domain 2717 * from the host bridge itself. 2718 */ 2719 d = pci_dev_msi_domain(dev); 2720 if (!d) 2721 d = dev_get_msi_domain(&dev->bus->dev); 2722 2723 dev_set_msi_domain(&dev->dev, d); 2724 } 2725 2726 void pci_device_add(struct pci_dev *dev, struct pci_bus *bus) 2727 { 2728 int ret; 2729 2730 pci_configure_device(dev); 2731 2732 device_initialize(&dev->dev); 2733 dev->dev.release = pci_release_dev; 2734 2735 set_dev_node(&dev->dev, pcibus_to_node(bus)); 2736 dev->dev.dma_mask = &dev->dma_mask; 2737 dev->dev.dma_parms = &dev->dma_parms; 2738 dev->dev.coherent_dma_mask = 0xffffffffull; 2739 2740 dma_set_max_seg_size(&dev->dev, 65536); 2741 dma_set_seg_boundary(&dev->dev, 0xffffffff); 2742 2743 pcie_failed_link_retrain(dev); 2744 2745 /* Fix up broken headers */ 2746 pci_fixup_device(pci_fixup_header, dev); 2747 2748 pci_reassigndev_resource_alignment(dev); 2749 2750 dev->state_saved = false; 2751 2752 pci_init_capabilities(dev); 2753 2754 /* 2755 * Add the device to our list of discovered devices 2756 * and the bus list for fixup functions, etc. 2757 */ 2758 down_write(&pci_bus_sem); 2759 list_add_tail(&dev->bus_list, &bus->devices); 2760 up_write(&pci_bus_sem); 2761 2762 ret = pcibios_device_add(dev); 2763 WARN_ON(ret < 0); 2764 2765 /* Set up MSI IRQ domain */ 2766 pci_set_msi_domain(dev); 2767 2768 /* Notifier could use PCI capabilities */ 2769 ret = device_add(&dev->dev); 2770 WARN_ON(ret < 0); 2771 2772 pci_npem_create(dev); 2773 2774 pci_doe_sysfs_init(dev); 2775 } 2776 2777 struct pci_dev *pci_scan_single_device(struct pci_bus *bus, int devfn) 2778 { 2779 struct pci_dev *dev; 2780 2781 dev = pci_get_slot(bus, devfn); 2782 if (dev) { 2783 pci_dev_put(dev); 2784 return dev; 2785 } 2786 2787 dev = pci_scan_device(bus, devfn); 2788 if (!dev) 2789 return NULL; 2790 2791 pci_device_add(dev, bus); 2792 2793 return dev; 2794 } 2795 EXPORT_SYMBOL(pci_scan_single_device); 2796 2797 static int next_ari_fn(struct pci_bus *bus, struct pci_dev *dev, int fn) 2798 { 2799 int pos; 2800 u16 cap = 0; 2801 unsigned int next_fn; 2802 2803 if (!dev) 2804 return -ENODEV; 2805 2806 pos = pci_find_ext_capability(dev, PCI_EXT_CAP_ID_ARI); 2807 if (!pos) 2808 return -ENODEV; 2809 2810 pci_read_config_word(dev, pos + PCI_ARI_CAP, &cap); 2811 next_fn = PCI_ARI_CAP_NFN(cap); 2812 if (next_fn <= fn) 2813 return -ENODEV; /* protect against malformed list */ 2814 2815 return next_fn; 2816 } 2817 2818 static int next_fn(struct pci_bus *bus, struct pci_dev *dev, int fn) 2819 { 2820 if (pci_ari_enabled(bus)) 2821 return next_ari_fn(bus, dev, fn); 2822 2823 if (fn >= 7) 2824 return -ENODEV; 2825 /* only multifunction devices may have more functions */ 2826 if (dev && !dev->multifunction) 2827 return -ENODEV; 2828 2829 return fn + 1; 2830 } 2831 2832 static int only_one_child(struct pci_bus *bus) 2833 { 2834 struct pci_dev *bridge = bus->self; 2835 2836 /* 2837 * Systems with unusual topologies set PCI_SCAN_ALL_PCIE_DEVS so 2838 * we scan for all possible devices, not just Device 0. 2839 */ 2840 if (pci_has_flag(PCI_SCAN_ALL_PCIE_DEVS)) 2841 return 0; 2842 2843 /* 2844 * A PCIe Downstream Port normally leads to a Link with only Device 2845 * 0 on it (PCIe spec r3.1, sec 7.3.1). As an optimization, scan 2846 * only for Device 0 in that situation. 2847 */ 2848 if (bridge && pci_is_pcie(bridge) && pcie_downstream_port(bridge)) 2849 return 1; 2850 2851 return 0; 2852 } 2853 2854 /** 2855 * pci_scan_slot - Scan a PCI slot on a bus for devices 2856 * @bus: PCI bus to scan 2857 * @devfn: slot number to scan (must have zero function) 2858 * 2859 * Scan a PCI slot on the specified PCI bus for devices, adding 2860 * discovered devices to the @bus->devices list. New devices 2861 * will not have is_added set. 2862 * 2863 * Returns the number of new devices found. 2864 */ 2865 int pci_scan_slot(struct pci_bus *bus, int devfn) 2866 { 2867 struct pci_dev *dev; 2868 int fn = 0, nr = 0; 2869 2870 if (only_one_child(bus) && (devfn > 0)) 2871 return 0; /* Already scanned the entire slot */ 2872 2873 do { 2874 dev = pci_scan_single_device(bus, devfn + fn); 2875 if (dev) { 2876 if (!pci_dev_is_added(dev)) 2877 nr++; 2878 if (fn > 0) 2879 dev->multifunction = 1; 2880 } else if (fn == 0) { 2881 /* 2882 * Function 0 is required unless we are running on 2883 * a hypervisor that passes through individual PCI 2884 * functions. 2885 */ 2886 if (!hypervisor_isolated_pci_functions()) 2887 break; 2888 } 2889 fn = next_fn(bus, dev, fn); 2890 } while (fn >= 0); 2891 2892 /* Only one slot has PCIe device */ 2893 if (bus->self && nr) 2894 pcie_aspm_init_link_state(bus->self); 2895 2896 return nr; 2897 } 2898 EXPORT_SYMBOL(pci_scan_slot); 2899 2900 static int pcie_find_smpss(struct pci_dev *dev, void *data) 2901 { 2902 u8 *smpss = data; 2903 2904 if (!pci_is_pcie(dev)) 2905 return 0; 2906 2907 /* 2908 * We don't have a way to change MPS settings on devices that have 2909 * drivers attached. A hot-added device might support only the minimum 2910 * MPS setting (MPS=128). Therefore, if the fabric contains a bridge 2911 * where devices may be hot-added, we limit the fabric MPS to 128 so 2912 * hot-added devices will work correctly. 2913 * 2914 * However, if we hot-add a device to a slot directly below a Root 2915 * Port, it's impossible for there to be other existing devices below 2916 * the port. We don't limit the MPS in this case because we can 2917 * reconfigure MPS on both the Root Port and the hot-added device, 2918 * and there are no other devices involved. 2919 * 2920 * Note that this PCIE_BUS_SAFE path assumes no peer-to-peer DMA. 2921 */ 2922 if (dev->is_hotplug_bridge && 2923 pci_pcie_type(dev) != PCI_EXP_TYPE_ROOT_PORT) 2924 *smpss = 0; 2925 2926 if (*smpss > dev->pcie_mpss) 2927 *smpss = dev->pcie_mpss; 2928 2929 return 0; 2930 } 2931 2932 static void pcie_write_mps(struct pci_dev *dev, int mps) 2933 { 2934 int rc; 2935 2936 if (pcie_bus_config == PCIE_BUS_PERFORMANCE) { 2937 mps = 128 << dev->pcie_mpss; 2938 2939 if (pci_pcie_type(dev) != PCI_EXP_TYPE_ROOT_PORT && 2940 dev->bus->self) 2941 2942 /* 2943 * For "Performance", the assumption is made that 2944 * downstream communication will never be larger than 2945 * the MRRS. So, the MPS only needs to be configured 2946 * for the upstream communication. This being the case, 2947 * walk from the top down and set the MPS of the child 2948 * to that of the parent bus. 2949 * 2950 * Configure the device MPS with the smaller of the 2951 * device MPSS or the bridge MPS (which is assumed to be 2952 * properly configured at this point to the largest 2953 * allowable MPS based on its parent bus). 2954 */ 2955 mps = min(mps, pcie_get_mps(dev->bus->self)); 2956 } 2957 2958 rc = pcie_set_mps(dev, mps); 2959 if (rc) 2960 pci_err(dev, "Failed attempting to set the MPS\n"); 2961 } 2962 2963 static void pcie_write_mrrs(struct pci_dev *dev) 2964 { 2965 int rc, mrrs; 2966 2967 /* 2968 * In the "safe" case, do not configure the MRRS. There appear to be 2969 * issues with setting MRRS to 0 on a number of devices. 2970 */ 2971 if (pcie_bus_config != PCIE_BUS_PERFORMANCE) 2972 return; 2973 2974 /* 2975 * For max performance, the MRRS must be set to the largest supported 2976 * value. However, it cannot be configured larger than the MPS the 2977 * device or the bus can support. This should already be properly 2978 * configured by a prior call to pcie_write_mps(). 2979 */ 2980 mrrs = pcie_get_mps(dev); 2981 2982 /* 2983 * MRRS is a R/W register. Invalid values can be written, but a 2984 * subsequent read will verify if the value is acceptable or not. 2985 * If the MRRS value provided is not acceptable (e.g., too large), 2986 * shrink the value until it is acceptable to the HW. 2987 */ 2988 while (mrrs != pcie_get_readrq(dev) && mrrs >= 128) { 2989 rc = pcie_set_readrq(dev, mrrs); 2990 if (!rc) 2991 break; 2992 2993 pci_warn(dev, "Failed attempting to set the MRRS\n"); 2994 mrrs /= 2; 2995 } 2996 2997 if (mrrs < 128) 2998 pci_err(dev, "MRRS was unable to be configured with a safe value. If problems are experienced, try running with pci=pcie_bus_safe\n"); 2999 } 3000 3001 static int pcie_bus_configure_set(struct pci_dev *dev, void *data) 3002 { 3003 int mps, orig_mps; 3004 3005 if (!pci_is_pcie(dev)) 3006 return 0; 3007 3008 if (pcie_bus_config == PCIE_BUS_TUNE_OFF || 3009 pcie_bus_config == PCIE_BUS_DEFAULT) 3010 return 0; 3011 3012 mps = 128 << *(u8 *)data; 3013 orig_mps = pcie_get_mps(dev); 3014 3015 pcie_write_mps(dev, mps); 3016 pcie_write_mrrs(dev); 3017 3018 pci_info(dev, "Max Payload Size set to %4d/%4d (was %4d), Max Read Rq %4d\n", 3019 pcie_get_mps(dev), 128 << dev->pcie_mpss, 3020 orig_mps, pcie_get_readrq(dev)); 3021 3022 return 0; 3023 } 3024 3025 /* 3026 * pcie_bus_configure_settings() requires that pci_walk_bus work in a top-down, 3027 * parents then children fashion. If this changes, then this code will not 3028 * work as designed. 3029 */ 3030 void pcie_bus_configure_settings(struct pci_bus *bus) 3031 { 3032 u8 smpss = 0; 3033 3034 if (!bus->self) 3035 return; 3036 3037 if (!pci_is_pcie(bus->self)) 3038 return; 3039 3040 /* 3041 * FIXME - Peer to peer DMA is possible, though the endpoint would need 3042 * to be aware of the MPS of the destination. To work around this, 3043 * simply force the MPS of the entire system to the smallest possible. 3044 */ 3045 if (pcie_bus_config == PCIE_BUS_PEER2PEER) 3046 smpss = 0; 3047 3048 if (pcie_bus_config == PCIE_BUS_SAFE) { 3049 smpss = bus->self->pcie_mpss; 3050 3051 pcie_find_smpss(bus->self, &smpss); 3052 pci_walk_bus(bus, pcie_find_smpss, &smpss); 3053 } 3054 3055 pcie_bus_configure_set(bus->self, &smpss); 3056 pci_walk_bus(bus, pcie_bus_configure_set, &smpss); 3057 } 3058 EXPORT_SYMBOL_GPL(pcie_bus_configure_settings); 3059 3060 /* 3061 * Called after each bus is probed, but before its children are examined. This 3062 * is marked as __weak because multiple architectures define it. 3063 */ 3064 void __weak pcibios_fixup_bus(struct pci_bus *bus) 3065 { 3066 /* nothing to do, expected to be removed in the future */ 3067 } 3068 3069 /** 3070 * pci_scan_child_bus_extend() - Scan devices below a bus 3071 * @bus: Bus to scan for devices 3072 * @available_buses: Total number of buses available (%0 does not try to 3073 * extend beyond the minimal) 3074 * 3075 * Scans devices below @bus including subordinate buses. Returns new 3076 * subordinate number including all the found devices. Passing 3077 * @available_buses causes the remaining bus space to be distributed 3078 * equally between hotplug-capable bridges to allow future extension of the 3079 * hierarchy. 3080 */ 3081 static unsigned int pci_scan_child_bus_extend(struct pci_bus *bus, 3082 unsigned int available_buses) 3083 { 3084 unsigned int used_buses, normal_bridges = 0, hotplug_bridges = 0; 3085 unsigned int start = bus->busn_res.start; 3086 unsigned int devnr, cmax, max = start; 3087 struct pci_dev *dev; 3088 3089 dev_dbg(&bus->dev, "scanning bus\n"); 3090 3091 /* Go find them, Rover! */ 3092 for (devnr = 0; devnr < PCI_MAX_NR_DEVS; devnr++) 3093 pci_scan_slot(bus, PCI_DEVFN(devnr, 0)); 3094 3095 /* Reserve buses for SR-IOV capability */ 3096 used_buses = pci_iov_bus_range(bus); 3097 max += used_buses; 3098 3099 /* 3100 * After performing arch-dependent fixup of the bus, look behind 3101 * all PCI-to-PCI bridges on this bus. 3102 */ 3103 if (!bus->is_added) { 3104 dev_dbg(&bus->dev, "fixups for bus\n"); 3105 pcibios_fixup_bus(bus); 3106 bus->is_added = 1; 3107 } 3108 3109 /* 3110 * Calculate how many hotplug bridges and normal bridges there 3111 * are on this bus. We will distribute the additional available 3112 * buses between hotplug bridges. 3113 */ 3114 for_each_pci_bridge(dev, bus) { 3115 if (dev->is_hotplug_bridge) 3116 hotplug_bridges++; 3117 else 3118 normal_bridges++; 3119 } 3120 3121 /* 3122 * Scan bridges that are already configured. We don't touch them 3123 * unless they are misconfigured (which will be done in the second 3124 * scan below). 3125 */ 3126 for_each_pci_bridge(dev, bus) { 3127 cmax = max; 3128 max = pci_scan_bridge_extend(bus, dev, max, 0, 0); 3129 3130 /* 3131 * Reserve one bus for each bridge now to avoid extending 3132 * hotplug bridges too much during the second scan below. 3133 */ 3134 used_buses++; 3135 if (max - cmax > 1) 3136 used_buses += max - cmax - 1; 3137 } 3138 3139 /* Scan bridges that need to be reconfigured */ 3140 for_each_pci_bridge(dev, bus) { 3141 unsigned int buses = 0; 3142 3143 if (!hotplug_bridges && normal_bridges == 1) { 3144 /* 3145 * There is only one bridge on the bus (upstream 3146 * port) so it gets all available buses which it 3147 * can then distribute to the possible hotplug 3148 * bridges below. 3149 */ 3150 buses = available_buses; 3151 } else if (dev->is_hotplug_bridge) { 3152 /* 3153 * Distribute the extra buses between hotplug 3154 * bridges if any. 3155 */ 3156 buses = available_buses / hotplug_bridges; 3157 buses = min(buses, available_buses - used_buses + 1); 3158 } 3159 3160 cmax = max; 3161 max = pci_scan_bridge_extend(bus, dev, cmax, buses, 1); 3162 /* One bus is already accounted so don't add it again */ 3163 if (max - cmax > 1) 3164 used_buses += max - cmax - 1; 3165 } 3166 3167 /* 3168 * Make sure a hotplug bridge has at least the minimum requested 3169 * number of buses but allow it to grow up to the maximum available 3170 * bus number if there is room. 3171 */ 3172 if (bus->self && bus->self->is_hotplug_bridge) { 3173 used_buses = max_t(unsigned int, available_buses, 3174 pci_hotplug_bus_size - 1); 3175 if (max - start < used_buses) { 3176 max = start + used_buses; 3177 3178 /* Do not allocate more buses than we have room left */ 3179 if (max > bus->busn_res.end) 3180 max = bus->busn_res.end; 3181 3182 dev_dbg(&bus->dev, "%pR extended by %#02x\n", 3183 &bus->busn_res, max - start); 3184 } 3185 } 3186 3187 /* 3188 * We've scanned the bus and so we know all about what's on 3189 * the other side of any bridges that may be on this bus plus 3190 * any devices. 3191 * 3192 * Return how far we've got finding sub-buses. 3193 */ 3194 dev_dbg(&bus->dev, "bus scan returning with max=%02x\n", max); 3195 return max; 3196 } 3197 3198 /** 3199 * pci_scan_child_bus() - Scan devices below a bus 3200 * @bus: Bus to scan for devices 3201 * 3202 * Scans devices below @bus including subordinate buses. Returns new 3203 * subordinate number including all the found devices. 3204 */ 3205 unsigned int pci_scan_child_bus(struct pci_bus *bus) 3206 { 3207 return pci_scan_child_bus_extend(bus, 0); 3208 } 3209 EXPORT_SYMBOL_GPL(pci_scan_child_bus); 3210 3211 /** 3212 * pcibios_root_bridge_prepare - Platform-specific host bridge setup 3213 * @bridge: Host bridge to set up 3214 * 3215 * Default empty implementation. Replace with an architecture-specific setup 3216 * routine, if necessary. 3217 */ 3218 int __weak pcibios_root_bridge_prepare(struct pci_host_bridge *bridge) 3219 { 3220 return 0; 3221 } 3222 3223 void __weak pcibios_add_bus(struct pci_bus *bus) 3224 { 3225 } 3226 3227 void __weak pcibios_remove_bus(struct pci_bus *bus) 3228 { 3229 } 3230 3231 struct pci_bus *pci_create_root_bus(struct device *parent, int bus, 3232 struct pci_ops *ops, void *sysdata, struct list_head *resources) 3233 { 3234 int error; 3235 struct pci_host_bridge *bridge; 3236 3237 bridge = pci_alloc_host_bridge(0); 3238 if (!bridge) 3239 return NULL; 3240 3241 bridge->dev.parent = parent; 3242 3243 list_splice_init(resources, &bridge->windows); 3244 bridge->sysdata = sysdata; 3245 bridge->busnr = bus; 3246 bridge->ops = ops; 3247 3248 error = pci_register_host_bridge(bridge); 3249 if (error < 0) 3250 goto err_out; 3251 3252 return bridge->bus; 3253 3254 err_out: 3255 put_device(&bridge->dev); 3256 return NULL; 3257 } 3258 EXPORT_SYMBOL_GPL(pci_create_root_bus); 3259 3260 int pci_host_probe(struct pci_host_bridge *bridge) 3261 { 3262 struct pci_bus *bus, *child; 3263 int ret; 3264 3265 pci_lock_rescan_remove(); 3266 ret = pci_scan_root_bus_bridge(bridge); 3267 pci_unlock_rescan_remove(); 3268 if (ret < 0) { 3269 dev_err(bridge->dev.parent, "Scanning root bridge failed"); 3270 return ret; 3271 } 3272 3273 bus = bridge->bus; 3274 3275 /* If we must preserve the resource configuration, claim now */ 3276 if (bridge->preserve_config) 3277 pci_bus_claim_resources(bus); 3278 3279 /* 3280 * Assign whatever was left unassigned. If we didn't claim above, 3281 * this will reassign everything. 3282 */ 3283 pci_assign_unassigned_root_bus_resources(bus); 3284 3285 list_for_each_entry(child, &bus->children, node) 3286 pcie_bus_configure_settings(child); 3287 3288 pci_lock_rescan_remove(); 3289 pci_bus_add_devices(bus); 3290 pci_unlock_rescan_remove(); 3291 3292 /* 3293 * Ensure pm_runtime_enable() is called for the controller drivers 3294 * before calling pci_host_probe(). The PM framework expects that 3295 * if the parent device supports runtime PM, it will be enabled 3296 * before child runtime PM is enabled. 3297 */ 3298 pm_runtime_set_active(&bridge->dev); 3299 pm_runtime_no_callbacks(&bridge->dev); 3300 devm_pm_runtime_enable(&bridge->dev); 3301 3302 return 0; 3303 } 3304 EXPORT_SYMBOL_GPL(pci_host_probe); 3305 3306 int pci_bus_insert_busn_res(struct pci_bus *b, int bus, int bus_max) 3307 { 3308 struct resource *res = &b->busn_res; 3309 struct resource *parent_res, *conflict; 3310 3311 res->start = bus; 3312 res->end = bus_max; 3313 res->flags = IORESOURCE_BUS; 3314 3315 if (!pci_is_root_bus(b)) 3316 parent_res = &b->parent->busn_res; 3317 else { 3318 parent_res = get_pci_domain_busn_res(pci_domain_nr(b)); 3319 res->flags |= IORESOURCE_PCI_FIXED; 3320 } 3321 3322 conflict = request_resource_conflict(parent_res, res); 3323 3324 if (conflict) 3325 dev_info(&b->dev, 3326 "busn_res: can not insert %pR under %s%pR (conflicts with %s %pR)\n", 3327 res, pci_is_root_bus(b) ? "domain " : "", 3328 parent_res, conflict->name, conflict); 3329 3330 return conflict == NULL; 3331 } 3332 3333 int pci_bus_update_busn_res_end(struct pci_bus *b, int bus_max) 3334 { 3335 struct resource *res = &b->busn_res; 3336 struct resource old_res = *res; 3337 resource_size_t size; 3338 int ret; 3339 3340 if (res->start > bus_max) 3341 return -EINVAL; 3342 3343 size = bus_max - res->start + 1; 3344 ret = adjust_resource(res, res->start, size); 3345 dev_info(&b->dev, "busn_res: %pR end %s updated to %02x\n", 3346 &old_res, ret ? "can not be" : "is", bus_max); 3347 3348 if (!ret && !res->parent) 3349 pci_bus_insert_busn_res(b, res->start, res->end); 3350 3351 return ret; 3352 } 3353 3354 void pci_bus_release_busn_res(struct pci_bus *b) 3355 { 3356 struct resource *res = &b->busn_res; 3357 int ret; 3358 3359 if (!res->flags || !res->parent) 3360 return; 3361 3362 ret = release_resource(res); 3363 dev_info(&b->dev, "busn_res: %pR %s released\n", 3364 res, ret ? "can not be" : "is"); 3365 } 3366 3367 int pci_scan_root_bus_bridge(struct pci_host_bridge *bridge) 3368 { 3369 struct resource_entry *window; 3370 bool found = false; 3371 struct pci_bus *b; 3372 int max, bus, ret; 3373 3374 if (!bridge) 3375 return -EINVAL; 3376 3377 resource_list_for_each_entry(window, &bridge->windows) 3378 if (window->res->flags & IORESOURCE_BUS) { 3379 bridge->busnr = window->res->start; 3380 found = true; 3381 break; 3382 } 3383 3384 ret = pci_register_host_bridge(bridge); 3385 if (ret < 0) 3386 return ret; 3387 3388 b = bridge->bus; 3389 bus = bridge->busnr; 3390 3391 if (!found) { 3392 dev_info(&b->dev, 3393 "No busn resource found for root bus, will use [bus %02x-ff]\n", 3394 bus); 3395 pci_bus_insert_busn_res(b, bus, 255); 3396 } 3397 3398 max = pci_scan_child_bus(b); 3399 3400 if (!found) 3401 pci_bus_update_busn_res_end(b, max); 3402 3403 return 0; 3404 } 3405 EXPORT_SYMBOL(pci_scan_root_bus_bridge); 3406 3407 struct pci_bus *pci_scan_root_bus(struct device *parent, int bus, 3408 struct pci_ops *ops, void *sysdata, struct list_head *resources) 3409 { 3410 struct resource_entry *window; 3411 bool found = false; 3412 struct pci_bus *b; 3413 int max; 3414 3415 resource_list_for_each_entry(window, resources) 3416 if (window->res->flags & IORESOURCE_BUS) { 3417 found = true; 3418 break; 3419 } 3420 3421 b = pci_create_root_bus(parent, bus, ops, sysdata, resources); 3422 if (!b) 3423 return NULL; 3424 3425 if (!found) { 3426 dev_info(&b->dev, 3427 "No busn resource found for root bus, will use [bus %02x-ff]\n", 3428 bus); 3429 pci_bus_insert_busn_res(b, bus, 255); 3430 } 3431 3432 max = pci_scan_child_bus(b); 3433 3434 if (!found) 3435 pci_bus_update_busn_res_end(b, max); 3436 3437 return b; 3438 } 3439 EXPORT_SYMBOL(pci_scan_root_bus); 3440 3441 struct pci_bus *pci_scan_bus(int bus, struct pci_ops *ops, 3442 void *sysdata) 3443 { 3444 LIST_HEAD(resources); 3445 struct pci_bus *b; 3446 3447 pci_add_resource(&resources, &ioport_resource); 3448 pci_add_resource(&resources, &iomem_resource); 3449 pci_add_resource(&resources, &busn_resource); 3450 b = pci_create_root_bus(NULL, bus, ops, sysdata, &resources); 3451 if (b) { 3452 pci_scan_child_bus(b); 3453 } else { 3454 pci_free_resource_list(&resources); 3455 } 3456 return b; 3457 } 3458 EXPORT_SYMBOL(pci_scan_bus); 3459 3460 /** 3461 * pci_rescan_bus_bridge_resize - Scan a PCI bus for devices 3462 * @bridge: PCI bridge for the bus to scan 3463 * 3464 * Scan a PCI bus and child buses for new devices, add them, 3465 * and enable them, resizing bridge mmio/io resource if necessary 3466 * and possible. The caller must ensure the child devices are already 3467 * removed for resizing to occur. 3468 * 3469 * Returns the max number of subordinate bus discovered. 3470 */ 3471 unsigned int pci_rescan_bus_bridge_resize(struct pci_dev *bridge) 3472 { 3473 unsigned int max; 3474 struct pci_bus *bus = bridge->subordinate; 3475 3476 max = pci_scan_child_bus(bus); 3477 3478 pci_assign_unassigned_bridge_resources(bridge); 3479 3480 pci_bus_add_devices(bus); 3481 3482 return max; 3483 } 3484 3485 /** 3486 * pci_rescan_bus - Scan a PCI bus for devices 3487 * @bus: PCI bus to scan 3488 * 3489 * Scan a PCI bus and child buses for new devices, add them, 3490 * and enable them. 3491 * 3492 * Returns the max number of subordinate bus discovered. 3493 */ 3494 unsigned int pci_rescan_bus(struct pci_bus *bus) 3495 { 3496 unsigned int max; 3497 3498 max = pci_scan_child_bus(bus); 3499 pci_assign_unassigned_bus_resources(bus); 3500 pci_bus_add_devices(bus); 3501 3502 return max; 3503 } 3504 EXPORT_SYMBOL_GPL(pci_rescan_bus); 3505 3506 /* 3507 * pci_rescan_bus(), pci_rescan_bus_bridge_resize() and PCI device removal 3508 * routines should always be executed under this mutex. 3509 */ 3510 DEFINE_MUTEX(pci_rescan_remove_lock); 3511 3512 void pci_lock_rescan_remove(void) 3513 { 3514 mutex_lock(&pci_rescan_remove_lock); 3515 } 3516 EXPORT_SYMBOL_GPL(pci_lock_rescan_remove); 3517 3518 void pci_unlock_rescan_remove(void) 3519 { 3520 mutex_unlock(&pci_rescan_remove_lock); 3521 } 3522 EXPORT_SYMBOL_GPL(pci_unlock_rescan_remove); 3523 3524 static int __init pci_sort_bf_cmp(const struct device *d_a, 3525 const struct device *d_b) 3526 { 3527 const struct pci_dev *a = to_pci_dev(d_a); 3528 const struct pci_dev *b = to_pci_dev(d_b); 3529 3530 if (pci_domain_nr(a->bus) < pci_domain_nr(b->bus)) return -1; 3531 else if (pci_domain_nr(a->bus) > pci_domain_nr(b->bus)) return 1; 3532 3533 if (a->bus->number < b->bus->number) return -1; 3534 else if (a->bus->number > b->bus->number) return 1; 3535 3536 if (a->devfn < b->devfn) return -1; 3537 else if (a->devfn > b->devfn) return 1; 3538 3539 return 0; 3540 } 3541 3542 void __init pci_sort_breadthfirst(void) 3543 { 3544 bus_sort_breadthfirst(&pci_bus_type, &pci_sort_bf_cmp); 3545 } 3546 3547 int pci_hp_add_bridge(struct pci_dev *dev) 3548 { 3549 struct pci_bus *parent = dev->bus; 3550 int busnr, start = parent->busn_res.start; 3551 unsigned int available_buses = 0; 3552 int end = parent->busn_res.end; 3553 3554 for (busnr = start; busnr <= end; busnr++) { 3555 if (!pci_find_bus(pci_domain_nr(parent), busnr)) 3556 break; 3557 } 3558 if (busnr-- > end) { 3559 pci_err(dev, "No bus number available for hot-added bridge\n"); 3560 return -1; 3561 } 3562 3563 /* Scan bridges that are already configured */ 3564 busnr = pci_scan_bridge(parent, dev, busnr, 0); 3565 3566 /* 3567 * Distribute the available bus numbers between hotplug-capable 3568 * bridges to make extending the chain later possible. 3569 */ 3570 available_buses = end - busnr; 3571 3572 /* Scan bridges that need to be reconfigured */ 3573 pci_scan_bridge_extend(parent, dev, busnr, available_buses, 1); 3574 3575 if (!dev->subordinate) 3576 return -1; 3577 3578 return 0; 3579 } 3580 EXPORT_SYMBOL_GPL(pci_hp_add_bridge); 3581