xref: /linux/drivers/pci/probe.c (revision a2cce7a9f1b8cc3d4edce106fb971529f1d4d9ce)
1 /*
2  * probe.c - PCI detection and setup code
3  */
4 
5 #include <linux/kernel.h>
6 #include <linux/delay.h>
7 #include <linux/init.h>
8 #include <linux/pci.h>
9 #include <linux/of_pci.h>
10 #include <linux/pci_hotplug.h>
11 #include <linux/slab.h>
12 #include <linux/module.h>
13 #include <linux/cpumask.h>
14 #include <linux/pci-aspm.h>
15 #include <asm-generic/pci-bridge.h>
16 #include "pci.h"
17 
18 #define CARDBUS_LATENCY_TIMER	176	/* secondary latency timer */
19 #define CARDBUS_RESERVE_BUSNR	3
20 
21 static struct resource busn_resource = {
22 	.name	= "PCI busn",
23 	.start	= 0,
24 	.end	= 255,
25 	.flags	= IORESOURCE_BUS,
26 };
27 
28 /* Ugh.  Need to stop exporting this to modules. */
29 LIST_HEAD(pci_root_buses);
30 EXPORT_SYMBOL(pci_root_buses);
31 
32 static LIST_HEAD(pci_domain_busn_res_list);
33 
34 struct pci_domain_busn_res {
35 	struct list_head list;
36 	struct resource res;
37 	int domain_nr;
38 };
39 
40 static struct resource *get_pci_domain_busn_res(int domain_nr)
41 {
42 	struct pci_domain_busn_res *r;
43 
44 	list_for_each_entry(r, &pci_domain_busn_res_list, list)
45 		if (r->domain_nr == domain_nr)
46 			return &r->res;
47 
48 	r = kzalloc(sizeof(*r), GFP_KERNEL);
49 	if (!r)
50 		return NULL;
51 
52 	r->domain_nr = domain_nr;
53 	r->res.start = 0;
54 	r->res.end = 0xff;
55 	r->res.flags = IORESOURCE_BUS | IORESOURCE_PCI_FIXED;
56 
57 	list_add_tail(&r->list, &pci_domain_busn_res_list);
58 
59 	return &r->res;
60 }
61 
62 static int find_anything(struct device *dev, void *data)
63 {
64 	return 1;
65 }
66 
67 /*
68  * Some device drivers need know if pci is initiated.
69  * Basically, we think pci is not initiated when there
70  * is no device to be found on the pci_bus_type.
71  */
72 int no_pci_devices(void)
73 {
74 	struct device *dev;
75 	int no_devices;
76 
77 	dev = bus_find_device(&pci_bus_type, NULL, NULL, find_anything);
78 	no_devices = (dev == NULL);
79 	put_device(dev);
80 	return no_devices;
81 }
82 EXPORT_SYMBOL(no_pci_devices);
83 
84 /*
85  * PCI Bus Class
86  */
87 static void release_pcibus_dev(struct device *dev)
88 {
89 	struct pci_bus *pci_bus = to_pci_bus(dev);
90 
91 	put_device(pci_bus->bridge);
92 	pci_bus_remove_resources(pci_bus);
93 	pci_release_bus_of_node(pci_bus);
94 	kfree(pci_bus);
95 }
96 
97 static struct class pcibus_class = {
98 	.name		= "pci_bus",
99 	.dev_release	= &release_pcibus_dev,
100 	.dev_groups	= pcibus_groups,
101 };
102 
103 static int __init pcibus_class_init(void)
104 {
105 	return class_register(&pcibus_class);
106 }
107 postcore_initcall(pcibus_class_init);
108 
109 static u64 pci_size(u64 base, u64 maxbase, u64 mask)
110 {
111 	u64 size = mask & maxbase;	/* Find the significant bits */
112 	if (!size)
113 		return 0;
114 
115 	/* Get the lowest of them to find the decode size, and
116 	   from that the extent.  */
117 	size = (size & ~(size-1)) - 1;
118 
119 	/* base == maxbase can be valid only if the BAR has
120 	   already been programmed with all 1s.  */
121 	if (base == maxbase && ((base | size) & mask) != mask)
122 		return 0;
123 
124 	return size;
125 }
126 
127 static inline unsigned long decode_bar(struct pci_dev *dev, u32 bar)
128 {
129 	u32 mem_type;
130 	unsigned long flags;
131 
132 	if ((bar & PCI_BASE_ADDRESS_SPACE) == PCI_BASE_ADDRESS_SPACE_IO) {
133 		flags = bar & ~PCI_BASE_ADDRESS_IO_MASK;
134 		flags |= IORESOURCE_IO;
135 		return flags;
136 	}
137 
138 	flags = bar & ~PCI_BASE_ADDRESS_MEM_MASK;
139 	flags |= IORESOURCE_MEM;
140 	if (flags & PCI_BASE_ADDRESS_MEM_PREFETCH)
141 		flags |= IORESOURCE_PREFETCH;
142 
143 	mem_type = bar & PCI_BASE_ADDRESS_MEM_TYPE_MASK;
144 	switch (mem_type) {
145 	case PCI_BASE_ADDRESS_MEM_TYPE_32:
146 		break;
147 	case PCI_BASE_ADDRESS_MEM_TYPE_1M:
148 		/* 1M mem BAR treated as 32-bit BAR */
149 		break;
150 	case PCI_BASE_ADDRESS_MEM_TYPE_64:
151 		flags |= IORESOURCE_MEM_64;
152 		break;
153 	default:
154 		/* mem unknown type treated as 32-bit BAR */
155 		break;
156 	}
157 	return flags;
158 }
159 
160 #define PCI_COMMAND_DECODE_ENABLE	(PCI_COMMAND_MEMORY | PCI_COMMAND_IO)
161 
162 /**
163  * pci_read_base - read a PCI BAR
164  * @dev: the PCI device
165  * @type: type of the BAR
166  * @res: resource buffer to be filled in
167  * @pos: BAR position in the config space
168  *
169  * Returns 1 if the BAR is 64-bit, or 0 if 32-bit.
170  */
171 int __pci_read_base(struct pci_dev *dev, enum pci_bar_type type,
172 		    struct resource *res, unsigned int pos)
173 {
174 	u32 l, sz, mask;
175 	u64 l64, sz64, mask64;
176 	u16 orig_cmd;
177 	struct pci_bus_region region, inverted_region;
178 
179 	mask = type ? PCI_ROM_ADDRESS_MASK : ~0;
180 
181 	/* No printks while decoding is disabled! */
182 	if (!dev->mmio_always_on) {
183 		pci_read_config_word(dev, PCI_COMMAND, &orig_cmd);
184 		if (orig_cmd & PCI_COMMAND_DECODE_ENABLE) {
185 			pci_write_config_word(dev, PCI_COMMAND,
186 				orig_cmd & ~PCI_COMMAND_DECODE_ENABLE);
187 		}
188 	}
189 
190 	res->name = pci_name(dev);
191 
192 	pci_read_config_dword(dev, pos, &l);
193 	pci_write_config_dword(dev, pos, l | mask);
194 	pci_read_config_dword(dev, pos, &sz);
195 	pci_write_config_dword(dev, pos, l);
196 
197 	/*
198 	 * All bits set in sz means the device isn't working properly.
199 	 * If the BAR isn't implemented, all bits must be 0.  If it's a
200 	 * memory BAR or a ROM, bit 0 must be clear; if it's an io BAR, bit
201 	 * 1 must be clear.
202 	 */
203 	if (sz == 0xffffffff)
204 		sz = 0;
205 
206 	/*
207 	 * I don't know how l can have all bits set.  Copied from old code.
208 	 * Maybe it fixes a bug on some ancient platform.
209 	 */
210 	if (l == 0xffffffff)
211 		l = 0;
212 
213 	if (type == pci_bar_unknown) {
214 		res->flags = decode_bar(dev, l);
215 		res->flags |= IORESOURCE_SIZEALIGN;
216 		if (res->flags & IORESOURCE_IO) {
217 			l64 = l & PCI_BASE_ADDRESS_IO_MASK;
218 			sz64 = sz & PCI_BASE_ADDRESS_IO_MASK;
219 			mask64 = PCI_BASE_ADDRESS_IO_MASK & (u32)IO_SPACE_LIMIT;
220 		} else {
221 			l64 = l & PCI_BASE_ADDRESS_MEM_MASK;
222 			sz64 = sz & PCI_BASE_ADDRESS_MEM_MASK;
223 			mask64 = (u32)PCI_BASE_ADDRESS_MEM_MASK;
224 		}
225 	} else {
226 		res->flags |= (l & IORESOURCE_ROM_ENABLE);
227 		l64 = l & PCI_ROM_ADDRESS_MASK;
228 		sz64 = sz & PCI_ROM_ADDRESS_MASK;
229 		mask64 = (u32)PCI_ROM_ADDRESS_MASK;
230 	}
231 
232 	if (res->flags & IORESOURCE_MEM_64) {
233 		pci_read_config_dword(dev, pos + 4, &l);
234 		pci_write_config_dword(dev, pos + 4, ~0);
235 		pci_read_config_dword(dev, pos + 4, &sz);
236 		pci_write_config_dword(dev, pos + 4, l);
237 
238 		l64 |= ((u64)l << 32);
239 		sz64 |= ((u64)sz << 32);
240 		mask64 |= ((u64)~0 << 32);
241 	}
242 
243 	if (!dev->mmio_always_on && (orig_cmd & PCI_COMMAND_DECODE_ENABLE))
244 		pci_write_config_word(dev, PCI_COMMAND, orig_cmd);
245 
246 	if (!sz64)
247 		goto fail;
248 
249 	sz64 = pci_size(l64, sz64, mask64);
250 	if (!sz64) {
251 		dev_info(&dev->dev, FW_BUG "reg 0x%x: invalid BAR (can't size)\n",
252 			 pos);
253 		goto fail;
254 	}
255 
256 	if (res->flags & IORESOURCE_MEM_64) {
257 		if ((sizeof(pci_bus_addr_t) < 8 || sizeof(resource_size_t) < 8)
258 		    && sz64 > 0x100000000ULL) {
259 			res->flags |= IORESOURCE_UNSET | IORESOURCE_DISABLED;
260 			res->start = 0;
261 			res->end = 0;
262 			dev_err(&dev->dev, "reg 0x%x: can't handle BAR larger than 4GB (size %#010llx)\n",
263 				pos, (unsigned long long)sz64);
264 			goto out;
265 		}
266 
267 		if ((sizeof(pci_bus_addr_t) < 8) && l) {
268 			/* Above 32-bit boundary; try to reallocate */
269 			res->flags |= IORESOURCE_UNSET;
270 			res->start = 0;
271 			res->end = sz64;
272 			dev_info(&dev->dev, "reg 0x%x: can't handle BAR above 4GB (bus address %#010llx)\n",
273 				 pos, (unsigned long long)l64);
274 			goto out;
275 		}
276 	}
277 
278 	region.start = l64;
279 	region.end = l64 + sz64;
280 
281 	pcibios_bus_to_resource(dev->bus, res, &region);
282 	pcibios_resource_to_bus(dev->bus, &inverted_region, res);
283 
284 	/*
285 	 * If "A" is a BAR value (a bus address), "bus_to_resource(A)" is
286 	 * the corresponding resource address (the physical address used by
287 	 * the CPU.  Converting that resource address back to a bus address
288 	 * should yield the original BAR value:
289 	 *
290 	 *     resource_to_bus(bus_to_resource(A)) == A
291 	 *
292 	 * If it doesn't, CPU accesses to "bus_to_resource(A)" will not
293 	 * be claimed by the device.
294 	 */
295 	if (inverted_region.start != region.start) {
296 		res->flags |= IORESOURCE_UNSET;
297 		res->start = 0;
298 		res->end = region.end - region.start;
299 		dev_info(&dev->dev, "reg 0x%x: initial BAR value %#010llx invalid\n",
300 			 pos, (unsigned long long)region.start);
301 	}
302 
303 	goto out;
304 
305 
306 fail:
307 	res->flags = 0;
308 out:
309 	if (res->flags)
310 		dev_printk(KERN_DEBUG, &dev->dev, "reg 0x%x: %pR\n", pos, res);
311 
312 	return (res->flags & IORESOURCE_MEM_64) ? 1 : 0;
313 }
314 
315 static void pci_read_bases(struct pci_dev *dev, unsigned int howmany, int rom)
316 {
317 	unsigned int pos, reg;
318 
319 	for (pos = 0; pos < howmany; pos++) {
320 		struct resource *res = &dev->resource[pos];
321 		reg = PCI_BASE_ADDRESS_0 + (pos << 2);
322 		pos += __pci_read_base(dev, pci_bar_unknown, res, reg);
323 	}
324 
325 	if (rom) {
326 		struct resource *res = &dev->resource[PCI_ROM_RESOURCE];
327 		dev->rom_base_reg = rom;
328 		res->flags = IORESOURCE_MEM | IORESOURCE_PREFETCH |
329 				IORESOURCE_READONLY | IORESOURCE_SIZEALIGN;
330 		__pci_read_base(dev, pci_bar_mem32, res, rom);
331 	}
332 }
333 
334 static void pci_read_bridge_io(struct pci_bus *child)
335 {
336 	struct pci_dev *dev = child->self;
337 	u8 io_base_lo, io_limit_lo;
338 	unsigned long io_mask, io_granularity, base, limit;
339 	struct pci_bus_region region;
340 	struct resource *res;
341 
342 	io_mask = PCI_IO_RANGE_MASK;
343 	io_granularity = 0x1000;
344 	if (dev->io_window_1k) {
345 		/* Support 1K I/O space granularity */
346 		io_mask = PCI_IO_1K_RANGE_MASK;
347 		io_granularity = 0x400;
348 	}
349 
350 	res = child->resource[0];
351 	pci_read_config_byte(dev, PCI_IO_BASE, &io_base_lo);
352 	pci_read_config_byte(dev, PCI_IO_LIMIT, &io_limit_lo);
353 	base = (io_base_lo & io_mask) << 8;
354 	limit = (io_limit_lo & io_mask) << 8;
355 
356 	if ((io_base_lo & PCI_IO_RANGE_TYPE_MASK) == PCI_IO_RANGE_TYPE_32) {
357 		u16 io_base_hi, io_limit_hi;
358 
359 		pci_read_config_word(dev, PCI_IO_BASE_UPPER16, &io_base_hi);
360 		pci_read_config_word(dev, PCI_IO_LIMIT_UPPER16, &io_limit_hi);
361 		base |= ((unsigned long) io_base_hi << 16);
362 		limit |= ((unsigned long) io_limit_hi << 16);
363 	}
364 
365 	if (base <= limit) {
366 		res->flags = (io_base_lo & PCI_IO_RANGE_TYPE_MASK) | IORESOURCE_IO;
367 		region.start = base;
368 		region.end = limit + io_granularity - 1;
369 		pcibios_bus_to_resource(dev->bus, res, &region);
370 		dev_printk(KERN_DEBUG, &dev->dev, "  bridge window %pR\n", res);
371 	}
372 }
373 
374 static void pci_read_bridge_mmio(struct pci_bus *child)
375 {
376 	struct pci_dev *dev = child->self;
377 	u16 mem_base_lo, mem_limit_lo;
378 	unsigned long base, limit;
379 	struct pci_bus_region region;
380 	struct resource *res;
381 
382 	res = child->resource[1];
383 	pci_read_config_word(dev, PCI_MEMORY_BASE, &mem_base_lo);
384 	pci_read_config_word(dev, PCI_MEMORY_LIMIT, &mem_limit_lo);
385 	base = ((unsigned long) mem_base_lo & PCI_MEMORY_RANGE_MASK) << 16;
386 	limit = ((unsigned long) mem_limit_lo & PCI_MEMORY_RANGE_MASK) << 16;
387 	if (base <= limit) {
388 		res->flags = (mem_base_lo & PCI_MEMORY_RANGE_TYPE_MASK) | IORESOURCE_MEM;
389 		region.start = base;
390 		region.end = limit + 0xfffff;
391 		pcibios_bus_to_resource(dev->bus, res, &region);
392 		dev_printk(KERN_DEBUG, &dev->dev, "  bridge window %pR\n", res);
393 	}
394 }
395 
396 static void pci_read_bridge_mmio_pref(struct pci_bus *child)
397 {
398 	struct pci_dev *dev = child->self;
399 	u16 mem_base_lo, mem_limit_lo;
400 	u64 base64, limit64;
401 	pci_bus_addr_t base, limit;
402 	struct pci_bus_region region;
403 	struct resource *res;
404 
405 	res = child->resource[2];
406 	pci_read_config_word(dev, PCI_PREF_MEMORY_BASE, &mem_base_lo);
407 	pci_read_config_word(dev, PCI_PREF_MEMORY_LIMIT, &mem_limit_lo);
408 	base64 = (mem_base_lo & PCI_PREF_RANGE_MASK) << 16;
409 	limit64 = (mem_limit_lo & PCI_PREF_RANGE_MASK) << 16;
410 
411 	if ((mem_base_lo & PCI_PREF_RANGE_TYPE_MASK) == PCI_PREF_RANGE_TYPE_64) {
412 		u32 mem_base_hi, mem_limit_hi;
413 
414 		pci_read_config_dword(dev, PCI_PREF_BASE_UPPER32, &mem_base_hi);
415 		pci_read_config_dword(dev, PCI_PREF_LIMIT_UPPER32, &mem_limit_hi);
416 
417 		/*
418 		 * Some bridges set the base > limit by default, and some
419 		 * (broken) BIOSes do not initialize them.  If we find
420 		 * this, just assume they are not being used.
421 		 */
422 		if (mem_base_hi <= mem_limit_hi) {
423 			base64 |= (u64) mem_base_hi << 32;
424 			limit64 |= (u64) mem_limit_hi << 32;
425 		}
426 	}
427 
428 	base = (pci_bus_addr_t) base64;
429 	limit = (pci_bus_addr_t) limit64;
430 
431 	if (base != base64) {
432 		dev_err(&dev->dev, "can't handle bridge window above 4GB (bus address %#010llx)\n",
433 			(unsigned long long) base64);
434 		return;
435 	}
436 
437 	if (base <= limit) {
438 		res->flags = (mem_base_lo & PCI_PREF_RANGE_TYPE_MASK) |
439 					 IORESOURCE_MEM | IORESOURCE_PREFETCH;
440 		if (res->flags & PCI_PREF_RANGE_TYPE_64)
441 			res->flags |= IORESOURCE_MEM_64;
442 		region.start = base;
443 		region.end = limit + 0xfffff;
444 		pcibios_bus_to_resource(dev->bus, res, &region);
445 		dev_printk(KERN_DEBUG, &dev->dev, "  bridge window %pR\n", res);
446 	}
447 }
448 
449 void pci_read_bridge_bases(struct pci_bus *child)
450 {
451 	struct pci_dev *dev = child->self;
452 	struct resource *res;
453 	int i;
454 
455 	if (pci_is_root_bus(child))	/* It's a host bus, nothing to read */
456 		return;
457 
458 	dev_info(&dev->dev, "PCI bridge to %pR%s\n",
459 		 &child->busn_res,
460 		 dev->transparent ? " (subtractive decode)" : "");
461 
462 	pci_bus_remove_resources(child);
463 	for (i = 0; i < PCI_BRIDGE_RESOURCE_NUM; i++)
464 		child->resource[i] = &dev->resource[PCI_BRIDGE_RESOURCES+i];
465 
466 	pci_read_bridge_io(child);
467 	pci_read_bridge_mmio(child);
468 	pci_read_bridge_mmio_pref(child);
469 
470 	if (dev->transparent) {
471 		pci_bus_for_each_resource(child->parent, res, i) {
472 			if (res && res->flags) {
473 				pci_bus_add_resource(child, res,
474 						     PCI_SUBTRACTIVE_DECODE);
475 				dev_printk(KERN_DEBUG, &dev->dev,
476 					   "  bridge window %pR (subtractive decode)\n",
477 					   res);
478 			}
479 		}
480 	}
481 }
482 
483 static struct pci_bus *pci_alloc_bus(struct pci_bus *parent)
484 {
485 	struct pci_bus *b;
486 
487 	b = kzalloc(sizeof(*b), GFP_KERNEL);
488 	if (!b)
489 		return NULL;
490 
491 	INIT_LIST_HEAD(&b->node);
492 	INIT_LIST_HEAD(&b->children);
493 	INIT_LIST_HEAD(&b->devices);
494 	INIT_LIST_HEAD(&b->slots);
495 	INIT_LIST_HEAD(&b->resources);
496 	b->max_bus_speed = PCI_SPEED_UNKNOWN;
497 	b->cur_bus_speed = PCI_SPEED_UNKNOWN;
498 #ifdef CONFIG_PCI_DOMAINS_GENERIC
499 	if (parent)
500 		b->domain_nr = parent->domain_nr;
501 #endif
502 	return b;
503 }
504 
505 static void pci_release_host_bridge_dev(struct device *dev)
506 {
507 	struct pci_host_bridge *bridge = to_pci_host_bridge(dev);
508 
509 	if (bridge->release_fn)
510 		bridge->release_fn(bridge);
511 
512 	pci_free_resource_list(&bridge->windows);
513 
514 	kfree(bridge);
515 }
516 
517 static struct pci_host_bridge *pci_alloc_host_bridge(struct pci_bus *b)
518 {
519 	struct pci_host_bridge *bridge;
520 
521 	bridge = kzalloc(sizeof(*bridge), GFP_KERNEL);
522 	if (!bridge)
523 		return NULL;
524 
525 	INIT_LIST_HEAD(&bridge->windows);
526 	bridge->bus = b;
527 	return bridge;
528 }
529 
530 static const unsigned char pcix_bus_speed[] = {
531 	PCI_SPEED_UNKNOWN,		/* 0 */
532 	PCI_SPEED_66MHz_PCIX,		/* 1 */
533 	PCI_SPEED_100MHz_PCIX,		/* 2 */
534 	PCI_SPEED_133MHz_PCIX,		/* 3 */
535 	PCI_SPEED_UNKNOWN,		/* 4 */
536 	PCI_SPEED_66MHz_PCIX_ECC,	/* 5 */
537 	PCI_SPEED_100MHz_PCIX_ECC,	/* 6 */
538 	PCI_SPEED_133MHz_PCIX_ECC,	/* 7 */
539 	PCI_SPEED_UNKNOWN,		/* 8 */
540 	PCI_SPEED_66MHz_PCIX_266,	/* 9 */
541 	PCI_SPEED_100MHz_PCIX_266,	/* A */
542 	PCI_SPEED_133MHz_PCIX_266,	/* B */
543 	PCI_SPEED_UNKNOWN,		/* C */
544 	PCI_SPEED_66MHz_PCIX_533,	/* D */
545 	PCI_SPEED_100MHz_PCIX_533,	/* E */
546 	PCI_SPEED_133MHz_PCIX_533	/* F */
547 };
548 
549 const unsigned char pcie_link_speed[] = {
550 	PCI_SPEED_UNKNOWN,		/* 0 */
551 	PCIE_SPEED_2_5GT,		/* 1 */
552 	PCIE_SPEED_5_0GT,		/* 2 */
553 	PCIE_SPEED_8_0GT,		/* 3 */
554 	PCI_SPEED_UNKNOWN,		/* 4 */
555 	PCI_SPEED_UNKNOWN,		/* 5 */
556 	PCI_SPEED_UNKNOWN,		/* 6 */
557 	PCI_SPEED_UNKNOWN,		/* 7 */
558 	PCI_SPEED_UNKNOWN,		/* 8 */
559 	PCI_SPEED_UNKNOWN,		/* 9 */
560 	PCI_SPEED_UNKNOWN,		/* A */
561 	PCI_SPEED_UNKNOWN,		/* B */
562 	PCI_SPEED_UNKNOWN,		/* C */
563 	PCI_SPEED_UNKNOWN,		/* D */
564 	PCI_SPEED_UNKNOWN,		/* E */
565 	PCI_SPEED_UNKNOWN		/* F */
566 };
567 
568 void pcie_update_link_speed(struct pci_bus *bus, u16 linksta)
569 {
570 	bus->cur_bus_speed = pcie_link_speed[linksta & PCI_EXP_LNKSTA_CLS];
571 }
572 EXPORT_SYMBOL_GPL(pcie_update_link_speed);
573 
574 static unsigned char agp_speeds[] = {
575 	AGP_UNKNOWN,
576 	AGP_1X,
577 	AGP_2X,
578 	AGP_4X,
579 	AGP_8X
580 };
581 
582 static enum pci_bus_speed agp_speed(int agp3, int agpstat)
583 {
584 	int index = 0;
585 
586 	if (agpstat & 4)
587 		index = 3;
588 	else if (agpstat & 2)
589 		index = 2;
590 	else if (agpstat & 1)
591 		index = 1;
592 	else
593 		goto out;
594 
595 	if (agp3) {
596 		index += 2;
597 		if (index == 5)
598 			index = 0;
599 	}
600 
601  out:
602 	return agp_speeds[index];
603 }
604 
605 static void pci_set_bus_speed(struct pci_bus *bus)
606 {
607 	struct pci_dev *bridge = bus->self;
608 	int pos;
609 
610 	pos = pci_find_capability(bridge, PCI_CAP_ID_AGP);
611 	if (!pos)
612 		pos = pci_find_capability(bridge, PCI_CAP_ID_AGP3);
613 	if (pos) {
614 		u32 agpstat, agpcmd;
615 
616 		pci_read_config_dword(bridge, pos + PCI_AGP_STATUS, &agpstat);
617 		bus->max_bus_speed = agp_speed(agpstat & 8, agpstat & 7);
618 
619 		pci_read_config_dword(bridge, pos + PCI_AGP_COMMAND, &agpcmd);
620 		bus->cur_bus_speed = agp_speed(agpstat & 8, agpcmd & 7);
621 	}
622 
623 	pos = pci_find_capability(bridge, PCI_CAP_ID_PCIX);
624 	if (pos) {
625 		u16 status;
626 		enum pci_bus_speed max;
627 
628 		pci_read_config_word(bridge, pos + PCI_X_BRIDGE_SSTATUS,
629 				     &status);
630 
631 		if (status & PCI_X_SSTATUS_533MHZ) {
632 			max = PCI_SPEED_133MHz_PCIX_533;
633 		} else if (status & PCI_X_SSTATUS_266MHZ) {
634 			max = PCI_SPEED_133MHz_PCIX_266;
635 		} else if (status & PCI_X_SSTATUS_133MHZ) {
636 			if ((status & PCI_X_SSTATUS_VERS) == PCI_X_SSTATUS_V2)
637 				max = PCI_SPEED_133MHz_PCIX_ECC;
638 			else
639 				max = PCI_SPEED_133MHz_PCIX;
640 		} else {
641 			max = PCI_SPEED_66MHz_PCIX;
642 		}
643 
644 		bus->max_bus_speed = max;
645 		bus->cur_bus_speed = pcix_bus_speed[
646 			(status & PCI_X_SSTATUS_FREQ) >> 6];
647 
648 		return;
649 	}
650 
651 	if (pci_is_pcie(bridge)) {
652 		u32 linkcap;
653 		u16 linksta;
654 
655 		pcie_capability_read_dword(bridge, PCI_EXP_LNKCAP, &linkcap);
656 		bus->max_bus_speed = pcie_link_speed[linkcap & PCI_EXP_LNKCAP_SLS];
657 
658 		pcie_capability_read_word(bridge, PCI_EXP_LNKSTA, &linksta);
659 		pcie_update_link_speed(bus, linksta);
660 	}
661 }
662 
663 static struct irq_domain *pci_host_bridge_msi_domain(struct pci_bus *bus)
664 {
665 	struct irq_domain *d;
666 
667 	/*
668 	 * Any firmware interface that can resolve the msi_domain
669 	 * should be called from here.
670 	 */
671 	d = pci_host_bridge_of_msi_domain(bus);
672 
673 	return d;
674 }
675 
676 static void pci_set_bus_msi_domain(struct pci_bus *bus)
677 {
678 	struct irq_domain *d;
679 	struct pci_bus *b;
680 
681 	/*
682 	 * The bus can be a root bus, a subordinate bus, or a virtual bus
683 	 * created by an SR-IOV device.  Walk up to the first bridge device
684 	 * found or derive the domain from the host bridge.
685 	 */
686 	for (b = bus, d = NULL; !d && !pci_is_root_bus(b); b = b->parent) {
687 		if (b->self)
688 			d = dev_get_msi_domain(&b->self->dev);
689 	}
690 
691 	if (!d)
692 		d = pci_host_bridge_msi_domain(b);
693 
694 	dev_set_msi_domain(&bus->dev, d);
695 }
696 
697 static struct pci_bus *pci_alloc_child_bus(struct pci_bus *parent,
698 					   struct pci_dev *bridge, int busnr)
699 {
700 	struct pci_bus *child;
701 	int i;
702 	int ret;
703 
704 	/*
705 	 * Allocate a new bus, and inherit stuff from the parent..
706 	 */
707 	child = pci_alloc_bus(parent);
708 	if (!child)
709 		return NULL;
710 
711 	child->parent = parent;
712 	child->ops = parent->ops;
713 	child->msi = parent->msi;
714 	child->sysdata = parent->sysdata;
715 	child->bus_flags = parent->bus_flags;
716 
717 	/* initialize some portions of the bus device, but don't register it
718 	 * now as the parent is not properly set up yet.
719 	 */
720 	child->dev.class = &pcibus_class;
721 	dev_set_name(&child->dev, "%04x:%02x", pci_domain_nr(child), busnr);
722 
723 	/*
724 	 * Set up the primary, secondary and subordinate
725 	 * bus numbers.
726 	 */
727 	child->number = child->busn_res.start = busnr;
728 	child->primary = parent->busn_res.start;
729 	child->busn_res.end = 0xff;
730 
731 	if (!bridge) {
732 		child->dev.parent = parent->bridge;
733 		goto add_dev;
734 	}
735 
736 	child->self = bridge;
737 	child->bridge = get_device(&bridge->dev);
738 	child->dev.parent = child->bridge;
739 	pci_set_bus_of_node(child);
740 	pci_set_bus_speed(child);
741 
742 	/* Set up default resource pointers and names.. */
743 	for (i = 0; i < PCI_BRIDGE_RESOURCE_NUM; i++) {
744 		child->resource[i] = &bridge->resource[PCI_BRIDGE_RESOURCES+i];
745 		child->resource[i]->name = child->name;
746 	}
747 	bridge->subordinate = child;
748 
749 add_dev:
750 	pci_set_bus_msi_domain(child);
751 	ret = device_register(&child->dev);
752 	WARN_ON(ret < 0);
753 
754 	pcibios_add_bus(child);
755 
756 	/* Create legacy_io and legacy_mem files for this bus */
757 	pci_create_legacy_files(child);
758 
759 	return child;
760 }
761 
762 struct pci_bus *pci_add_new_bus(struct pci_bus *parent, struct pci_dev *dev,
763 				int busnr)
764 {
765 	struct pci_bus *child;
766 
767 	child = pci_alloc_child_bus(parent, dev, busnr);
768 	if (child) {
769 		down_write(&pci_bus_sem);
770 		list_add_tail(&child->node, &parent->children);
771 		up_write(&pci_bus_sem);
772 	}
773 	return child;
774 }
775 EXPORT_SYMBOL(pci_add_new_bus);
776 
777 static void pci_enable_crs(struct pci_dev *pdev)
778 {
779 	u16 root_cap = 0;
780 
781 	/* Enable CRS Software Visibility if supported */
782 	pcie_capability_read_word(pdev, PCI_EXP_RTCAP, &root_cap);
783 	if (root_cap & PCI_EXP_RTCAP_CRSVIS)
784 		pcie_capability_set_word(pdev, PCI_EXP_RTCTL,
785 					 PCI_EXP_RTCTL_CRSSVE);
786 }
787 
788 /*
789  * If it's a bridge, configure it and scan the bus behind it.
790  * For CardBus bridges, we don't scan behind as the devices will
791  * be handled by the bridge driver itself.
792  *
793  * We need to process bridges in two passes -- first we scan those
794  * already configured by the BIOS and after we are done with all of
795  * them, we proceed to assigning numbers to the remaining buses in
796  * order to avoid overlaps between old and new bus numbers.
797  */
798 int pci_scan_bridge(struct pci_bus *bus, struct pci_dev *dev, int max, int pass)
799 {
800 	struct pci_bus *child;
801 	int is_cardbus = (dev->hdr_type == PCI_HEADER_TYPE_CARDBUS);
802 	u32 buses, i, j = 0;
803 	u16 bctl;
804 	u8 primary, secondary, subordinate;
805 	int broken = 0;
806 
807 	pci_read_config_dword(dev, PCI_PRIMARY_BUS, &buses);
808 	primary = buses & 0xFF;
809 	secondary = (buses >> 8) & 0xFF;
810 	subordinate = (buses >> 16) & 0xFF;
811 
812 	dev_dbg(&dev->dev, "scanning [bus %02x-%02x] behind bridge, pass %d\n",
813 		secondary, subordinate, pass);
814 
815 	if (!primary && (primary != bus->number) && secondary && subordinate) {
816 		dev_warn(&dev->dev, "Primary bus is hard wired to 0\n");
817 		primary = bus->number;
818 	}
819 
820 	/* Check if setup is sensible at all */
821 	if (!pass &&
822 	    (primary != bus->number || secondary <= bus->number ||
823 	     secondary > subordinate)) {
824 		dev_info(&dev->dev, "bridge configuration invalid ([bus %02x-%02x]), reconfiguring\n",
825 			 secondary, subordinate);
826 		broken = 1;
827 	}
828 
829 	/* Disable MasterAbortMode during probing to avoid reporting
830 	   of bus errors (in some architectures) */
831 	pci_read_config_word(dev, PCI_BRIDGE_CONTROL, &bctl);
832 	pci_write_config_word(dev, PCI_BRIDGE_CONTROL,
833 			      bctl & ~PCI_BRIDGE_CTL_MASTER_ABORT);
834 
835 	pci_enable_crs(dev);
836 
837 	if ((secondary || subordinate) && !pcibios_assign_all_busses() &&
838 	    !is_cardbus && !broken) {
839 		unsigned int cmax;
840 		/*
841 		 * Bus already configured by firmware, process it in the first
842 		 * pass and just note the configuration.
843 		 */
844 		if (pass)
845 			goto out;
846 
847 		/*
848 		 * The bus might already exist for two reasons: Either we are
849 		 * rescanning the bus or the bus is reachable through more than
850 		 * one bridge. The second case can happen with the i450NX
851 		 * chipset.
852 		 */
853 		child = pci_find_bus(pci_domain_nr(bus), secondary);
854 		if (!child) {
855 			child = pci_add_new_bus(bus, dev, secondary);
856 			if (!child)
857 				goto out;
858 			child->primary = primary;
859 			pci_bus_insert_busn_res(child, secondary, subordinate);
860 			child->bridge_ctl = bctl;
861 		}
862 
863 		cmax = pci_scan_child_bus(child);
864 		if (cmax > subordinate)
865 			dev_warn(&dev->dev, "bridge has subordinate %02x but max busn %02x\n",
866 				 subordinate, cmax);
867 		/* subordinate should equal child->busn_res.end */
868 		if (subordinate > max)
869 			max = subordinate;
870 	} else {
871 		/*
872 		 * We need to assign a number to this bus which we always
873 		 * do in the second pass.
874 		 */
875 		if (!pass) {
876 			if (pcibios_assign_all_busses() || broken || is_cardbus)
877 				/* Temporarily disable forwarding of the
878 				   configuration cycles on all bridges in
879 				   this bus segment to avoid possible
880 				   conflicts in the second pass between two
881 				   bridges programmed with overlapping
882 				   bus ranges. */
883 				pci_write_config_dword(dev, PCI_PRIMARY_BUS,
884 						       buses & ~0xffffff);
885 			goto out;
886 		}
887 
888 		/* Clear errors */
889 		pci_write_config_word(dev, PCI_STATUS, 0xffff);
890 
891 		/* Prevent assigning a bus number that already exists.
892 		 * This can happen when a bridge is hot-plugged, so in
893 		 * this case we only re-scan this bus. */
894 		child = pci_find_bus(pci_domain_nr(bus), max+1);
895 		if (!child) {
896 			child = pci_add_new_bus(bus, dev, max+1);
897 			if (!child)
898 				goto out;
899 			pci_bus_insert_busn_res(child, max+1, 0xff);
900 		}
901 		max++;
902 		buses = (buses & 0xff000000)
903 		      | ((unsigned int)(child->primary)     <<  0)
904 		      | ((unsigned int)(child->busn_res.start)   <<  8)
905 		      | ((unsigned int)(child->busn_res.end) << 16);
906 
907 		/*
908 		 * yenta.c forces a secondary latency timer of 176.
909 		 * Copy that behaviour here.
910 		 */
911 		if (is_cardbus) {
912 			buses &= ~0xff000000;
913 			buses |= CARDBUS_LATENCY_TIMER << 24;
914 		}
915 
916 		/*
917 		 * We need to blast all three values with a single write.
918 		 */
919 		pci_write_config_dword(dev, PCI_PRIMARY_BUS, buses);
920 
921 		if (!is_cardbus) {
922 			child->bridge_ctl = bctl;
923 			max = pci_scan_child_bus(child);
924 		} else {
925 			/*
926 			 * For CardBus bridges, we leave 4 bus numbers
927 			 * as cards with a PCI-to-PCI bridge can be
928 			 * inserted later.
929 			 */
930 			for (i = 0; i < CARDBUS_RESERVE_BUSNR; i++) {
931 				struct pci_bus *parent = bus;
932 				if (pci_find_bus(pci_domain_nr(bus),
933 							max+i+1))
934 					break;
935 				while (parent->parent) {
936 					if ((!pcibios_assign_all_busses()) &&
937 					    (parent->busn_res.end > max) &&
938 					    (parent->busn_res.end <= max+i)) {
939 						j = 1;
940 					}
941 					parent = parent->parent;
942 				}
943 				if (j) {
944 					/*
945 					 * Often, there are two cardbus bridges
946 					 * -- try to leave one valid bus number
947 					 * for each one.
948 					 */
949 					i /= 2;
950 					break;
951 				}
952 			}
953 			max += i;
954 		}
955 		/*
956 		 * Set the subordinate bus number to its real value.
957 		 */
958 		pci_bus_update_busn_res_end(child, max);
959 		pci_write_config_byte(dev, PCI_SUBORDINATE_BUS, max);
960 	}
961 
962 	sprintf(child->name,
963 		(is_cardbus ? "PCI CardBus %04x:%02x" : "PCI Bus %04x:%02x"),
964 		pci_domain_nr(bus), child->number);
965 
966 	/* Has only triggered on CardBus, fixup is in yenta_socket */
967 	while (bus->parent) {
968 		if ((child->busn_res.end > bus->busn_res.end) ||
969 		    (child->number > bus->busn_res.end) ||
970 		    (child->number < bus->number) ||
971 		    (child->busn_res.end < bus->number)) {
972 			dev_info(&child->dev, "%pR %s hidden behind%s bridge %s %pR\n",
973 				&child->busn_res,
974 				(bus->number > child->busn_res.end &&
975 				 bus->busn_res.end < child->number) ?
976 					"wholly" : "partially",
977 				bus->self->transparent ? " transparent" : "",
978 				dev_name(&bus->dev),
979 				&bus->busn_res);
980 		}
981 		bus = bus->parent;
982 	}
983 
984 out:
985 	pci_write_config_word(dev, PCI_BRIDGE_CONTROL, bctl);
986 
987 	return max;
988 }
989 EXPORT_SYMBOL(pci_scan_bridge);
990 
991 /*
992  * Read interrupt line and base address registers.
993  * The architecture-dependent code can tweak these, of course.
994  */
995 static void pci_read_irq(struct pci_dev *dev)
996 {
997 	unsigned char irq;
998 
999 	pci_read_config_byte(dev, PCI_INTERRUPT_PIN, &irq);
1000 	dev->pin = irq;
1001 	if (irq)
1002 		pci_read_config_byte(dev, PCI_INTERRUPT_LINE, &irq);
1003 	dev->irq = irq;
1004 }
1005 
1006 void set_pcie_port_type(struct pci_dev *pdev)
1007 {
1008 	int pos;
1009 	u16 reg16;
1010 	int type;
1011 	struct pci_dev *parent;
1012 
1013 	pos = pci_find_capability(pdev, PCI_CAP_ID_EXP);
1014 	if (!pos)
1015 		return;
1016 	pdev->pcie_cap = pos;
1017 	pci_read_config_word(pdev, pos + PCI_EXP_FLAGS, &reg16);
1018 	pdev->pcie_flags_reg = reg16;
1019 	pci_read_config_word(pdev, pos + PCI_EXP_DEVCAP, &reg16);
1020 	pdev->pcie_mpss = reg16 & PCI_EXP_DEVCAP_PAYLOAD;
1021 
1022 	/*
1023 	 * A Root Port is always the upstream end of a Link.  No PCIe
1024 	 * component has two Links.  Two Links are connected by a Switch
1025 	 * that has a Port on each Link and internal logic to connect the
1026 	 * two Ports.
1027 	 */
1028 	type = pci_pcie_type(pdev);
1029 	if (type == PCI_EXP_TYPE_ROOT_PORT)
1030 		pdev->has_secondary_link = 1;
1031 	else if (type == PCI_EXP_TYPE_UPSTREAM ||
1032 		 type == PCI_EXP_TYPE_DOWNSTREAM) {
1033 		parent = pci_upstream_bridge(pdev);
1034 
1035 		/*
1036 		 * Usually there's an upstream device (Root Port or Switch
1037 		 * Downstream Port), but we can't assume one exists.
1038 		 */
1039 		if (parent && !parent->has_secondary_link)
1040 			pdev->has_secondary_link = 1;
1041 	}
1042 }
1043 
1044 void set_pcie_hotplug_bridge(struct pci_dev *pdev)
1045 {
1046 	u32 reg32;
1047 
1048 	pcie_capability_read_dword(pdev, PCI_EXP_SLTCAP, &reg32);
1049 	if (reg32 & PCI_EXP_SLTCAP_HPC)
1050 		pdev->is_hotplug_bridge = 1;
1051 }
1052 
1053 /**
1054  * pci_ext_cfg_is_aliased - is ext config space just an alias of std config?
1055  * @dev: PCI device
1056  *
1057  * PCI Express to PCI/PCI-X Bridge Specification, rev 1.0, 4.1.4 says that
1058  * when forwarding a type1 configuration request the bridge must check that
1059  * the extended register address field is zero.  The bridge is not permitted
1060  * to forward the transactions and must handle it as an Unsupported Request.
1061  * Some bridges do not follow this rule and simply drop the extended register
1062  * bits, resulting in the standard config space being aliased, every 256
1063  * bytes across the entire configuration space.  Test for this condition by
1064  * comparing the first dword of each potential alias to the vendor/device ID.
1065  * Known offenders:
1066  *   ASM1083/1085 PCIe-to-PCI Reversible Bridge (1b21:1080, rev 01 & 03)
1067  *   AMD/ATI SBx00 PCI to PCI Bridge (1002:4384, rev 40)
1068  */
1069 static bool pci_ext_cfg_is_aliased(struct pci_dev *dev)
1070 {
1071 #ifdef CONFIG_PCI_QUIRKS
1072 	int pos;
1073 	u32 header, tmp;
1074 
1075 	pci_read_config_dword(dev, PCI_VENDOR_ID, &header);
1076 
1077 	for (pos = PCI_CFG_SPACE_SIZE;
1078 	     pos < PCI_CFG_SPACE_EXP_SIZE; pos += PCI_CFG_SPACE_SIZE) {
1079 		if (pci_read_config_dword(dev, pos, &tmp) != PCIBIOS_SUCCESSFUL
1080 		    || header != tmp)
1081 			return false;
1082 	}
1083 
1084 	return true;
1085 #else
1086 	return false;
1087 #endif
1088 }
1089 
1090 /**
1091  * pci_cfg_space_size - get the configuration space size of the PCI device.
1092  * @dev: PCI device
1093  *
1094  * Regular PCI devices have 256 bytes, but PCI-X 2 and PCI Express devices
1095  * have 4096 bytes.  Even if the device is capable, that doesn't mean we can
1096  * access it.  Maybe we don't have a way to generate extended config space
1097  * accesses, or the device is behind a reverse Express bridge.  So we try
1098  * reading the dword at 0x100 which must either be 0 or a valid extended
1099  * capability header.
1100  */
1101 static int pci_cfg_space_size_ext(struct pci_dev *dev)
1102 {
1103 	u32 status;
1104 	int pos = PCI_CFG_SPACE_SIZE;
1105 
1106 	if (pci_read_config_dword(dev, pos, &status) != PCIBIOS_SUCCESSFUL)
1107 		goto fail;
1108 	if (status == 0xffffffff || pci_ext_cfg_is_aliased(dev))
1109 		goto fail;
1110 
1111 	return PCI_CFG_SPACE_EXP_SIZE;
1112 
1113  fail:
1114 	return PCI_CFG_SPACE_SIZE;
1115 }
1116 
1117 int pci_cfg_space_size(struct pci_dev *dev)
1118 {
1119 	int pos;
1120 	u32 status;
1121 	u16 class;
1122 
1123 	class = dev->class >> 8;
1124 	if (class == PCI_CLASS_BRIDGE_HOST)
1125 		return pci_cfg_space_size_ext(dev);
1126 
1127 	if (!pci_is_pcie(dev)) {
1128 		pos = pci_find_capability(dev, PCI_CAP_ID_PCIX);
1129 		if (!pos)
1130 			goto fail;
1131 
1132 		pci_read_config_dword(dev, pos + PCI_X_STATUS, &status);
1133 		if (!(status & (PCI_X_STATUS_266MHZ | PCI_X_STATUS_533MHZ)))
1134 			goto fail;
1135 	}
1136 
1137 	return pci_cfg_space_size_ext(dev);
1138 
1139  fail:
1140 	return PCI_CFG_SPACE_SIZE;
1141 }
1142 
1143 #define LEGACY_IO_RESOURCE	(IORESOURCE_IO | IORESOURCE_PCI_FIXED)
1144 
1145 void pci_msi_setup_pci_dev(struct pci_dev *dev)
1146 {
1147 	/*
1148 	 * Disable the MSI hardware to avoid screaming interrupts
1149 	 * during boot.  This is the power on reset default so
1150 	 * usually this should be a noop.
1151 	 */
1152 	dev->msi_cap = pci_find_capability(dev, PCI_CAP_ID_MSI);
1153 	if (dev->msi_cap)
1154 		pci_msi_set_enable(dev, 0);
1155 
1156 	dev->msix_cap = pci_find_capability(dev, PCI_CAP_ID_MSIX);
1157 	if (dev->msix_cap)
1158 		pci_msix_clear_and_set_ctrl(dev, PCI_MSIX_FLAGS_ENABLE, 0);
1159 }
1160 
1161 /**
1162  * pci_setup_device - fill in class and map information of a device
1163  * @dev: the device structure to fill
1164  *
1165  * Initialize the device structure with information about the device's
1166  * vendor,class,memory and IO-space addresses,IRQ lines etc.
1167  * Called at initialisation of the PCI subsystem and by CardBus services.
1168  * Returns 0 on success and negative if unknown type of device (not normal,
1169  * bridge or CardBus).
1170  */
1171 int pci_setup_device(struct pci_dev *dev)
1172 {
1173 	u32 class;
1174 	u8 hdr_type;
1175 	int pos = 0;
1176 	struct pci_bus_region region;
1177 	struct resource *res;
1178 
1179 	if (pci_read_config_byte(dev, PCI_HEADER_TYPE, &hdr_type))
1180 		return -EIO;
1181 
1182 	dev->sysdata = dev->bus->sysdata;
1183 	dev->dev.parent = dev->bus->bridge;
1184 	dev->dev.bus = &pci_bus_type;
1185 	dev->hdr_type = hdr_type & 0x7f;
1186 	dev->multifunction = !!(hdr_type & 0x80);
1187 	dev->error_state = pci_channel_io_normal;
1188 	set_pcie_port_type(dev);
1189 
1190 	pci_dev_assign_slot(dev);
1191 	/* Assume 32-bit PCI; let 64-bit PCI cards (which are far rarer)
1192 	   set this higher, assuming the system even supports it.  */
1193 	dev->dma_mask = 0xffffffff;
1194 
1195 	dev_set_name(&dev->dev, "%04x:%02x:%02x.%d", pci_domain_nr(dev->bus),
1196 		     dev->bus->number, PCI_SLOT(dev->devfn),
1197 		     PCI_FUNC(dev->devfn));
1198 
1199 	pci_read_config_dword(dev, PCI_CLASS_REVISION, &class);
1200 	dev->revision = class & 0xff;
1201 	dev->class = class >> 8;		    /* upper 3 bytes */
1202 
1203 	dev_printk(KERN_DEBUG, &dev->dev, "[%04x:%04x] type %02x class %#08x\n",
1204 		   dev->vendor, dev->device, dev->hdr_type, dev->class);
1205 
1206 	/* need to have dev->class ready */
1207 	dev->cfg_size = pci_cfg_space_size(dev);
1208 
1209 	/* "Unknown power state" */
1210 	dev->current_state = PCI_UNKNOWN;
1211 
1212 	pci_msi_setup_pci_dev(dev);
1213 
1214 	/* Early fixups, before probing the BARs */
1215 	pci_fixup_device(pci_fixup_early, dev);
1216 	/* device class may be changed after fixup */
1217 	class = dev->class >> 8;
1218 
1219 	switch (dev->hdr_type) {		    /* header type */
1220 	case PCI_HEADER_TYPE_NORMAL:		    /* standard header */
1221 		if (class == PCI_CLASS_BRIDGE_PCI)
1222 			goto bad;
1223 		pci_read_irq(dev);
1224 		pci_read_bases(dev, 6, PCI_ROM_ADDRESS);
1225 		pci_read_config_word(dev, PCI_SUBSYSTEM_VENDOR_ID, &dev->subsystem_vendor);
1226 		pci_read_config_word(dev, PCI_SUBSYSTEM_ID, &dev->subsystem_device);
1227 
1228 		/*
1229 		 * Do the ugly legacy mode stuff here rather than broken chip
1230 		 * quirk code. Legacy mode ATA controllers have fixed
1231 		 * addresses. These are not always echoed in BAR0-3, and
1232 		 * BAR0-3 in a few cases contain junk!
1233 		 */
1234 		if (class == PCI_CLASS_STORAGE_IDE) {
1235 			u8 progif;
1236 			pci_read_config_byte(dev, PCI_CLASS_PROG, &progif);
1237 			if ((progif & 1) == 0) {
1238 				region.start = 0x1F0;
1239 				region.end = 0x1F7;
1240 				res = &dev->resource[0];
1241 				res->flags = LEGACY_IO_RESOURCE;
1242 				pcibios_bus_to_resource(dev->bus, res, &region);
1243 				dev_info(&dev->dev, "legacy IDE quirk: reg 0x10: %pR\n",
1244 					 res);
1245 				region.start = 0x3F6;
1246 				region.end = 0x3F6;
1247 				res = &dev->resource[1];
1248 				res->flags = LEGACY_IO_RESOURCE;
1249 				pcibios_bus_to_resource(dev->bus, res, &region);
1250 				dev_info(&dev->dev, "legacy IDE quirk: reg 0x14: %pR\n",
1251 					 res);
1252 			}
1253 			if ((progif & 4) == 0) {
1254 				region.start = 0x170;
1255 				region.end = 0x177;
1256 				res = &dev->resource[2];
1257 				res->flags = LEGACY_IO_RESOURCE;
1258 				pcibios_bus_to_resource(dev->bus, res, &region);
1259 				dev_info(&dev->dev, "legacy IDE quirk: reg 0x18: %pR\n",
1260 					 res);
1261 				region.start = 0x376;
1262 				region.end = 0x376;
1263 				res = &dev->resource[3];
1264 				res->flags = LEGACY_IO_RESOURCE;
1265 				pcibios_bus_to_resource(dev->bus, res, &region);
1266 				dev_info(&dev->dev, "legacy IDE quirk: reg 0x1c: %pR\n",
1267 					 res);
1268 			}
1269 		}
1270 		break;
1271 
1272 	case PCI_HEADER_TYPE_BRIDGE:		    /* bridge header */
1273 		if (class != PCI_CLASS_BRIDGE_PCI)
1274 			goto bad;
1275 		/* The PCI-to-PCI bridge spec requires that subtractive
1276 		   decoding (i.e. transparent) bridge must have programming
1277 		   interface code of 0x01. */
1278 		pci_read_irq(dev);
1279 		dev->transparent = ((dev->class & 0xff) == 1);
1280 		pci_read_bases(dev, 2, PCI_ROM_ADDRESS1);
1281 		set_pcie_hotplug_bridge(dev);
1282 		pos = pci_find_capability(dev, PCI_CAP_ID_SSVID);
1283 		if (pos) {
1284 			pci_read_config_word(dev, pos + PCI_SSVID_VENDOR_ID, &dev->subsystem_vendor);
1285 			pci_read_config_word(dev, pos + PCI_SSVID_DEVICE_ID, &dev->subsystem_device);
1286 		}
1287 		break;
1288 
1289 	case PCI_HEADER_TYPE_CARDBUS:		    /* CardBus bridge header */
1290 		if (class != PCI_CLASS_BRIDGE_CARDBUS)
1291 			goto bad;
1292 		pci_read_irq(dev);
1293 		pci_read_bases(dev, 1, 0);
1294 		pci_read_config_word(dev, PCI_CB_SUBSYSTEM_VENDOR_ID, &dev->subsystem_vendor);
1295 		pci_read_config_word(dev, PCI_CB_SUBSYSTEM_ID, &dev->subsystem_device);
1296 		break;
1297 
1298 	default:				    /* unknown header */
1299 		dev_err(&dev->dev, "unknown header type %02x, ignoring device\n",
1300 			dev->hdr_type);
1301 		return -EIO;
1302 
1303 	bad:
1304 		dev_err(&dev->dev, "ignoring class %#08x (doesn't match header type %02x)\n",
1305 			dev->class, dev->hdr_type);
1306 		dev->class = PCI_CLASS_NOT_DEFINED << 8;
1307 	}
1308 
1309 	/* We found a fine healthy device, go go go... */
1310 	return 0;
1311 }
1312 
1313 static void pci_configure_mps(struct pci_dev *dev)
1314 {
1315 	struct pci_dev *bridge = pci_upstream_bridge(dev);
1316 	int mps, p_mps, rc;
1317 
1318 	if (!pci_is_pcie(dev) || !bridge || !pci_is_pcie(bridge))
1319 		return;
1320 
1321 	mps = pcie_get_mps(dev);
1322 	p_mps = pcie_get_mps(bridge);
1323 
1324 	if (mps == p_mps)
1325 		return;
1326 
1327 	if (pcie_bus_config == PCIE_BUS_TUNE_OFF) {
1328 		dev_warn(&dev->dev, "Max Payload Size %d, but upstream %s set to %d; if necessary, use \"pci=pcie_bus_safe\" and report a bug\n",
1329 			 mps, pci_name(bridge), p_mps);
1330 		return;
1331 	}
1332 
1333 	/*
1334 	 * Fancier MPS configuration is done later by
1335 	 * pcie_bus_configure_settings()
1336 	 */
1337 	if (pcie_bus_config != PCIE_BUS_DEFAULT)
1338 		return;
1339 
1340 	rc = pcie_set_mps(dev, p_mps);
1341 	if (rc) {
1342 		dev_warn(&dev->dev, "can't set Max Payload Size to %d; if necessary, use \"pci=pcie_bus_safe\" and report a bug\n",
1343 			 p_mps);
1344 		return;
1345 	}
1346 
1347 	dev_info(&dev->dev, "Max Payload Size set to %d (was %d, max %d)\n",
1348 		 p_mps, mps, 128 << dev->pcie_mpss);
1349 }
1350 
1351 static struct hpp_type0 pci_default_type0 = {
1352 	.revision = 1,
1353 	.cache_line_size = 8,
1354 	.latency_timer = 0x40,
1355 	.enable_serr = 0,
1356 	.enable_perr = 0,
1357 };
1358 
1359 static void program_hpp_type0(struct pci_dev *dev, struct hpp_type0 *hpp)
1360 {
1361 	u16 pci_cmd, pci_bctl;
1362 
1363 	if (!hpp)
1364 		hpp = &pci_default_type0;
1365 
1366 	if (hpp->revision > 1) {
1367 		dev_warn(&dev->dev,
1368 			 "PCI settings rev %d not supported; using defaults\n",
1369 			 hpp->revision);
1370 		hpp = &pci_default_type0;
1371 	}
1372 
1373 	pci_write_config_byte(dev, PCI_CACHE_LINE_SIZE, hpp->cache_line_size);
1374 	pci_write_config_byte(dev, PCI_LATENCY_TIMER, hpp->latency_timer);
1375 	pci_read_config_word(dev, PCI_COMMAND, &pci_cmd);
1376 	if (hpp->enable_serr)
1377 		pci_cmd |= PCI_COMMAND_SERR;
1378 	if (hpp->enable_perr)
1379 		pci_cmd |= PCI_COMMAND_PARITY;
1380 	pci_write_config_word(dev, PCI_COMMAND, pci_cmd);
1381 
1382 	/* Program bridge control value */
1383 	if ((dev->class >> 8) == PCI_CLASS_BRIDGE_PCI) {
1384 		pci_write_config_byte(dev, PCI_SEC_LATENCY_TIMER,
1385 				      hpp->latency_timer);
1386 		pci_read_config_word(dev, PCI_BRIDGE_CONTROL, &pci_bctl);
1387 		if (hpp->enable_serr)
1388 			pci_bctl |= PCI_BRIDGE_CTL_SERR;
1389 		if (hpp->enable_perr)
1390 			pci_bctl |= PCI_BRIDGE_CTL_PARITY;
1391 		pci_write_config_word(dev, PCI_BRIDGE_CONTROL, pci_bctl);
1392 	}
1393 }
1394 
1395 static void program_hpp_type1(struct pci_dev *dev, struct hpp_type1 *hpp)
1396 {
1397 	if (hpp)
1398 		dev_warn(&dev->dev, "PCI-X settings not supported\n");
1399 }
1400 
1401 static void program_hpp_type2(struct pci_dev *dev, struct hpp_type2 *hpp)
1402 {
1403 	int pos;
1404 	u32 reg32;
1405 
1406 	if (!hpp)
1407 		return;
1408 
1409 	if (hpp->revision > 1) {
1410 		dev_warn(&dev->dev, "PCIe settings rev %d not supported\n",
1411 			 hpp->revision);
1412 		return;
1413 	}
1414 
1415 	/*
1416 	 * Don't allow _HPX to change MPS or MRRS settings.  We manage
1417 	 * those to make sure they're consistent with the rest of the
1418 	 * platform.
1419 	 */
1420 	hpp->pci_exp_devctl_and |= PCI_EXP_DEVCTL_PAYLOAD |
1421 				    PCI_EXP_DEVCTL_READRQ;
1422 	hpp->pci_exp_devctl_or &= ~(PCI_EXP_DEVCTL_PAYLOAD |
1423 				    PCI_EXP_DEVCTL_READRQ);
1424 
1425 	/* Initialize Device Control Register */
1426 	pcie_capability_clear_and_set_word(dev, PCI_EXP_DEVCTL,
1427 			~hpp->pci_exp_devctl_and, hpp->pci_exp_devctl_or);
1428 
1429 	/* Initialize Link Control Register */
1430 	if (pcie_cap_has_lnkctl(dev))
1431 		pcie_capability_clear_and_set_word(dev, PCI_EXP_LNKCTL,
1432 			~hpp->pci_exp_lnkctl_and, hpp->pci_exp_lnkctl_or);
1433 
1434 	/* Find Advanced Error Reporting Enhanced Capability */
1435 	pos = pci_find_ext_capability(dev, PCI_EXT_CAP_ID_ERR);
1436 	if (!pos)
1437 		return;
1438 
1439 	/* Initialize Uncorrectable Error Mask Register */
1440 	pci_read_config_dword(dev, pos + PCI_ERR_UNCOR_MASK, &reg32);
1441 	reg32 = (reg32 & hpp->unc_err_mask_and) | hpp->unc_err_mask_or;
1442 	pci_write_config_dword(dev, pos + PCI_ERR_UNCOR_MASK, reg32);
1443 
1444 	/* Initialize Uncorrectable Error Severity Register */
1445 	pci_read_config_dword(dev, pos + PCI_ERR_UNCOR_SEVER, &reg32);
1446 	reg32 = (reg32 & hpp->unc_err_sever_and) | hpp->unc_err_sever_or;
1447 	pci_write_config_dword(dev, pos + PCI_ERR_UNCOR_SEVER, reg32);
1448 
1449 	/* Initialize Correctable Error Mask Register */
1450 	pci_read_config_dword(dev, pos + PCI_ERR_COR_MASK, &reg32);
1451 	reg32 = (reg32 & hpp->cor_err_mask_and) | hpp->cor_err_mask_or;
1452 	pci_write_config_dword(dev, pos + PCI_ERR_COR_MASK, reg32);
1453 
1454 	/* Initialize Advanced Error Capabilities and Control Register */
1455 	pci_read_config_dword(dev, pos + PCI_ERR_CAP, &reg32);
1456 	reg32 = (reg32 & hpp->adv_err_cap_and) | hpp->adv_err_cap_or;
1457 	pci_write_config_dword(dev, pos + PCI_ERR_CAP, reg32);
1458 
1459 	/*
1460 	 * FIXME: The following two registers are not supported yet.
1461 	 *
1462 	 *   o Secondary Uncorrectable Error Severity Register
1463 	 *   o Secondary Uncorrectable Error Mask Register
1464 	 */
1465 }
1466 
1467 static void pci_configure_device(struct pci_dev *dev)
1468 {
1469 	struct hotplug_params hpp;
1470 	int ret;
1471 
1472 	pci_configure_mps(dev);
1473 
1474 	memset(&hpp, 0, sizeof(hpp));
1475 	ret = pci_get_hp_params(dev, &hpp);
1476 	if (ret)
1477 		return;
1478 
1479 	program_hpp_type2(dev, hpp.t2);
1480 	program_hpp_type1(dev, hpp.t1);
1481 	program_hpp_type0(dev, hpp.t0);
1482 }
1483 
1484 static void pci_release_capabilities(struct pci_dev *dev)
1485 {
1486 	pci_vpd_release(dev);
1487 	pci_iov_release(dev);
1488 	pci_free_cap_save_buffers(dev);
1489 }
1490 
1491 /**
1492  * pci_release_dev - free a pci device structure when all users of it are finished.
1493  * @dev: device that's been disconnected
1494  *
1495  * Will be called only by the device core when all users of this pci device are
1496  * done.
1497  */
1498 static void pci_release_dev(struct device *dev)
1499 {
1500 	struct pci_dev *pci_dev;
1501 
1502 	pci_dev = to_pci_dev(dev);
1503 	pci_release_capabilities(pci_dev);
1504 	pci_release_of_node(pci_dev);
1505 	pcibios_release_device(pci_dev);
1506 	pci_bus_put(pci_dev->bus);
1507 	kfree(pci_dev->driver_override);
1508 	kfree(pci_dev);
1509 }
1510 
1511 struct pci_dev *pci_alloc_dev(struct pci_bus *bus)
1512 {
1513 	struct pci_dev *dev;
1514 
1515 	dev = kzalloc(sizeof(struct pci_dev), GFP_KERNEL);
1516 	if (!dev)
1517 		return NULL;
1518 
1519 	INIT_LIST_HEAD(&dev->bus_list);
1520 	dev->dev.type = &pci_dev_type;
1521 	dev->bus = pci_bus_get(bus);
1522 
1523 	return dev;
1524 }
1525 EXPORT_SYMBOL(pci_alloc_dev);
1526 
1527 bool pci_bus_read_dev_vendor_id(struct pci_bus *bus, int devfn, u32 *l,
1528 				int crs_timeout)
1529 {
1530 	int delay = 1;
1531 
1532 	if (pci_bus_read_config_dword(bus, devfn, PCI_VENDOR_ID, l))
1533 		return false;
1534 
1535 	/* some broken boards return 0 or ~0 if a slot is empty: */
1536 	if (*l == 0xffffffff || *l == 0x00000000 ||
1537 	    *l == 0x0000ffff || *l == 0xffff0000)
1538 		return false;
1539 
1540 	/*
1541 	 * Configuration Request Retry Status.  Some root ports return the
1542 	 * actual device ID instead of the synthetic ID (0xFFFF) required
1543 	 * by the PCIe spec.  Ignore the device ID and only check for
1544 	 * (vendor id == 1).
1545 	 */
1546 	while ((*l & 0xffff) == 0x0001) {
1547 		if (!crs_timeout)
1548 			return false;
1549 
1550 		msleep(delay);
1551 		delay *= 2;
1552 		if (pci_bus_read_config_dword(bus, devfn, PCI_VENDOR_ID, l))
1553 			return false;
1554 		/* Card hasn't responded in 60 seconds?  Must be stuck. */
1555 		if (delay > crs_timeout) {
1556 			printk(KERN_WARNING "pci %04x:%02x:%02x.%d: not responding\n",
1557 			       pci_domain_nr(bus), bus->number, PCI_SLOT(devfn),
1558 			       PCI_FUNC(devfn));
1559 			return false;
1560 		}
1561 	}
1562 
1563 	return true;
1564 }
1565 EXPORT_SYMBOL(pci_bus_read_dev_vendor_id);
1566 
1567 /*
1568  * Read the config data for a PCI device, sanity-check it
1569  * and fill in the dev structure...
1570  */
1571 static struct pci_dev *pci_scan_device(struct pci_bus *bus, int devfn)
1572 {
1573 	struct pci_dev *dev;
1574 	u32 l;
1575 
1576 	if (!pci_bus_read_dev_vendor_id(bus, devfn, &l, 60*1000))
1577 		return NULL;
1578 
1579 	dev = pci_alloc_dev(bus);
1580 	if (!dev)
1581 		return NULL;
1582 
1583 	dev->devfn = devfn;
1584 	dev->vendor = l & 0xffff;
1585 	dev->device = (l >> 16) & 0xffff;
1586 
1587 	pci_set_of_node(dev);
1588 
1589 	if (pci_setup_device(dev)) {
1590 		pci_bus_put(dev->bus);
1591 		kfree(dev);
1592 		return NULL;
1593 	}
1594 
1595 	return dev;
1596 }
1597 
1598 static void pci_init_capabilities(struct pci_dev *dev)
1599 {
1600 	/* MSI/MSI-X list */
1601 	pci_msi_init_pci_dev(dev);
1602 
1603 	/* Buffers for saving PCIe and PCI-X capabilities */
1604 	pci_allocate_cap_save_buffers(dev);
1605 
1606 	/* Power Management */
1607 	pci_pm_init(dev);
1608 
1609 	/* Vital Product Data */
1610 	pci_vpd_pci22_init(dev);
1611 
1612 	/* Alternative Routing-ID Forwarding */
1613 	pci_configure_ari(dev);
1614 
1615 	/* Single Root I/O Virtualization */
1616 	pci_iov_init(dev);
1617 
1618 	/* Address Translation Services */
1619 	pci_ats_init(dev);
1620 
1621 	/* Enable ACS P2P upstream forwarding */
1622 	pci_enable_acs(dev);
1623 }
1624 
1625 static void pci_set_msi_domain(struct pci_dev *dev)
1626 {
1627 	/*
1628 	 * If no domain has been set through the pcibios_add_device
1629 	 * callback, inherit the default from the bus device.
1630 	 */
1631 	if (!dev_get_msi_domain(&dev->dev))
1632 		dev_set_msi_domain(&dev->dev,
1633 				   dev_get_msi_domain(&dev->bus->dev));
1634 }
1635 
1636 void pci_device_add(struct pci_dev *dev, struct pci_bus *bus)
1637 {
1638 	int ret;
1639 
1640 	pci_configure_device(dev);
1641 
1642 	device_initialize(&dev->dev);
1643 	dev->dev.release = pci_release_dev;
1644 
1645 	set_dev_node(&dev->dev, pcibus_to_node(bus));
1646 	dev->dev.dma_mask = &dev->dma_mask;
1647 	dev->dev.dma_parms = &dev->dma_parms;
1648 	dev->dev.coherent_dma_mask = 0xffffffffull;
1649 	of_pci_dma_configure(dev);
1650 
1651 	pci_set_dma_max_seg_size(dev, 65536);
1652 	pci_set_dma_seg_boundary(dev, 0xffffffff);
1653 
1654 	/* Fix up broken headers */
1655 	pci_fixup_device(pci_fixup_header, dev);
1656 
1657 	/* moved out from quirk header fixup code */
1658 	pci_reassigndev_resource_alignment(dev);
1659 
1660 	/* Clear the state_saved flag. */
1661 	dev->state_saved = false;
1662 
1663 	/* Initialize various capabilities */
1664 	pci_init_capabilities(dev);
1665 
1666 	/*
1667 	 * Add the device to our list of discovered devices
1668 	 * and the bus list for fixup functions, etc.
1669 	 */
1670 	down_write(&pci_bus_sem);
1671 	list_add_tail(&dev->bus_list, &bus->devices);
1672 	up_write(&pci_bus_sem);
1673 
1674 	ret = pcibios_add_device(dev);
1675 	WARN_ON(ret < 0);
1676 
1677 	/* Setup MSI irq domain */
1678 	pci_set_msi_domain(dev);
1679 
1680 	/* Notifier could use PCI capabilities */
1681 	dev->match_driver = false;
1682 	ret = device_add(&dev->dev);
1683 	WARN_ON(ret < 0);
1684 }
1685 
1686 struct pci_dev *pci_scan_single_device(struct pci_bus *bus, int devfn)
1687 {
1688 	struct pci_dev *dev;
1689 
1690 	dev = pci_get_slot(bus, devfn);
1691 	if (dev) {
1692 		pci_dev_put(dev);
1693 		return dev;
1694 	}
1695 
1696 	dev = pci_scan_device(bus, devfn);
1697 	if (!dev)
1698 		return NULL;
1699 
1700 	pci_device_add(dev, bus);
1701 
1702 	return dev;
1703 }
1704 EXPORT_SYMBOL(pci_scan_single_device);
1705 
1706 static unsigned next_fn(struct pci_bus *bus, struct pci_dev *dev, unsigned fn)
1707 {
1708 	int pos;
1709 	u16 cap = 0;
1710 	unsigned next_fn;
1711 
1712 	if (pci_ari_enabled(bus)) {
1713 		if (!dev)
1714 			return 0;
1715 		pos = pci_find_ext_capability(dev, PCI_EXT_CAP_ID_ARI);
1716 		if (!pos)
1717 			return 0;
1718 
1719 		pci_read_config_word(dev, pos + PCI_ARI_CAP, &cap);
1720 		next_fn = PCI_ARI_CAP_NFN(cap);
1721 		if (next_fn <= fn)
1722 			return 0;	/* protect against malformed list */
1723 
1724 		return next_fn;
1725 	}
1726 
1727 	/* dev may be NULL for non-contiguous multifunction devices */
1728 	if (!dev || dev->multifunction)
1729 		return (fn + 1) % 8;
1730 
1731 	return 0;
1732 }
1733 
1734 static int only_one_child(struct pci_bus *bus)
1735 {
1736 	struct pci_dev *parent = bus->self;
1737 
1738 	if (!parent || !pci_is_pcie(parent))
1739 		return 0;
1740 	if (pci_pcie_type(parent) == PCI_EXP_TYPE_ROOT_PORT)
1741 		return 1;
1742 	if (parent->has_secondary_link &&
1743 	    !pci_has_flag(PCI_SCAN_ALL_PCIE_DEVS))
1744 		return 1;
1745 	return 0;
1746 }
1747 
1748 /**
1749  * pci_scan_slot - scan a PCI slot on a bus for devices.
1750  * @bus: PCI bus to scan
1751  * @devfn: slot number to scan (must have zero function.)
1752  *
1753  * Scan a PCI slot on the specified PCI bus for devices, adding
1754  * discovered devices to the @bus->devices list.  New devices
1755  * will not have is_added set.
1756  *
1757  * Returns the number of new devices found.
1758  */
1759 int pci_scan_slot(struct pci_bus *bus, int devfn)
1760 {
1761 	unsigned fn, nr = 0;
1762 	struct pci_dev *dev;
1763 
1764 	if (only_one_child(bus) && (devfn > 0))
1765 		return 0; /* Already scanned the entire slot */
1766 
1767 	dev = pci_scan_single_device(bus, devfn);
1768 	if (!dev)
1769 		return 0;
1770 	if (!dev->is_added)
1771 		nr++;
1772 
1773 	for (fn = next_fn(bus, dev, 0); fn > 0; fn = next_fn(bus, dev, fn)) {
1774 		dev = pci_scan_single_device(bus, devfn + fn);
1775 		if (dev) {
1776 			if (!dev->is_added)
1777 				nr++;
1778 			dev->multifunction = 1;
1779 		}
1780 	}
1781 
1782 	/* only one slot has pcie device */
1783 	if (bus->self && nr)
1784 		pcie_aspm_init_link_state(bus->self);
1785 
1786 	return nr;
1787 }
1788 EXPORT_SYMBOL(pci_scan_slot);
1789 
1790 static int pcie_find_smpss(struct pci_dev *dev, void *data)
1791 {
1792 	u8 *smpss = data;
1793 
1794 	if (!pci_is_pcie(dev))
1795 		return 0;
1796 
1797 	/*
1798 	 * We don't have a way to change MPS settings on devices that have
1799 	 * drivers attached.  A hot-added device might support only the minimum
1800 	 * MPS setting (MPS=128).  Therefore, if the fabric contains a bridge
1801 	 * where devices may be hot-added, we limit the fabric MPS to 128 so
1802 	 * hot-added devices will work correctly.
1803 	 *
1804 	 * However, if we hot-add a device to a slot directly below a Root
1805 	 * Port, it's impossible for there to be other existing devices below
1806 	 * the port.  We don't limit the MPS in this case because we can
1807 	 * reconfigure MPS on both the Root Port and the hot-added device,
1808 	 * and there are no other devices involved.
1809 	 *
1810 	 * Note that this PCIE_BUS_SAFE path assumes no peer-to-peer DMA.
1811 	 */
1812 	if (dev->is_hotplug_bridge &&
1813 	    pci_pcie_type(dev) != PCI_EXP_TYPE_ROOT_PORT)
1814 		*smpss = 0;
1815 
1816 	if (*smpss > dev->pcie_mpss)
1817 		*smpss = dev->pcie_mpss;
1818 
1819 	return 0;
1820 }
1821 
1822 static void pcie_write_mps(struct pci_dev *dev, int mps)
1823 {
1824 	int rc;
1825 
1826 	if (pcie_bus_config == PCIE_BUS_PERFORMANCE) {
1827 		mps = 128 << dev->pcie_mpss;
1828 
1829 		if (pci_pcie_type(dev) != PCI_EXP_TYPE_ROOT_PORT &&
1830 		    dev->bus->self)
1831 			/* For "Performance", the assumption is made that
1832 			 * downstream communication will never be larger than
1833 			 * the MRRS.  So, the MPS only needs to be configured
1834 			 * for the upstream communication.  This being the case,
1835 			 * walk from the top down and set the MPS of the child
1836 			 * to that of the parent bus.
1837 			 *
1838 			 * Configure the device MPS with the smaller of the
1839 			 * device MPSS or the bridge MPS (which is assumed to be
1840 			 * properly configured at this point to the largest
1841 			 * allowable MPS based on its parent bus).
1842 			 */
1843 			mps = min(mps, pcie_get_mps(dev->bus->self));
1844 	}
1845 
1846 	rc = pcie_set_mps(dev, mps);
1847 	if (rc)
1848 		dev_err(&dev->dev, "Failed attempting to set the MPS\n");
1849 }
1850 
1851 static void pcie_write_mrrs(struct pci_dev *dev)
1852 {
1853 	int rc, mrrs;
1854 
1855 	/* In the "safe" case, do not configure the MRRS.  There appear to be
1856 	 * issues with setting MRRS to 0 on a number of devices.
1857 	 */
1858 	if (pcie_bus_config != PCIE_BUS_PERFORMANCE)
1859 		return;
1860 
1861 	/* For Max performance, the MRRS must be set to the largest supported
1862 	 * value.  However, it cannot be configured larger than the MPS the
1863 	 * device or the bus can support.  This should already be properly
1864 	 * configured by a prior call to pcie_write_mps.
1865 	 */
1866 	mrrs = pcie_get_mps(dev);
1867 
1868 	/* MRRS is a R/W register.  Invalid values can be written, but a
1869 	 * subsequent read will verify if the value is acceptable or not.
1870 	 * If the MRRS value provided is not acceptable (e.g., too large),
1871 	 * shrink the value until it is acceptable to the HW.
1872 	 */
1873 	while (mrrs != pcie_get_readrq(dev) && mrrs >= 128) {
1874 		rc = pcie_set_readrq(dev, mrrs);
1875 		if (!rc)
1876 			break;
1877 
1878 		dev_warn(&dev->dev, "Failed attempting to set the MRRS\n");
1879 		mrrs /= 2;
1880 	}
1881 
1882 	if (mrrs < 128)
1883 		dev_err(&dev->dev, "MRRS was unable to be configured with a safe value.  If problems are experienced, try running with pci=pcie_bus_safe\n");
1884 }
1885 
1886 static int pcie_bus_configure_set(struct pci_dev *dev, void *data)
1887 {
1888 	int mps, orig_mps;
1889 
1890 	if (!pci_is_pcie(dev))
1891 		return 0;
1892 
1893 	if (pcie_bus_config == PCIE_BUS_TUNE_OFF ||
1894 	    pcie_bus_config == PCIE_BUS_DEFAULT)
1895 		return 0;
1896 
1897 	mps = 128 << *(u8 *)data;
1898 	orig_mps = pcie_get_mps(dev);
1899 
1900 	pcie_write_mps(dev, mps);
1901 	pcie_write_mrrs(dev);
1902 
1903 	dev_info(&dev->dev, "Max Payload Size set to %4d/%4d (was %4d), Max Read Rq %4d\n",
1904 		 pcie_get_mps(dev), 128 << dev->pcie_mpss,
1905 		 orig_mps, pcie_get_readrq(dev));
1906 
1907 	return 0;
1908 }
1909 
1910 /* pcie_bus_configure_settings requires that pci_walk_bus work in a top-down,
1911  * parents then children fashion.  If this changes, then this code will not
1912  * work as designed.
1913  */
1914 void pcie_bus_configure_settings(struct pci_bus *bus)
1915 {
1916 	u8 smpss = 0;
1917 
1918 	if (!bus->self)
1919 		return;
1920 
1921 	if (!pci_is_pcie(bus->self))
1922 		return;
1923 
1924 	/* FIXME - Peer to peer DMA is possible, though the endpoint would need
1925 	 * to be aware of the MPS of the destination.  To work around this,
1926 	 * simply force the MPS of the entire system to the smallest possible.
1927 	 */
1928 	if (pcie_bus_config == PCIE_BUS_PEER2PEER)
1929 		smpss = 0;
1930 
1931 	if (pcie_bus_config == PCIE_BUS_SAFE) {
1932 		smpss = bus->self->pcie_mpss;
1933 
1934 		pcie_find_smpss(bus->self, &smpss);
1935 		pci_walk_bus(bus, pcie_find_smpss, &smpss);
1936 	}
1937 
1938 	pcie_bus_configure_set(bus->self, &smpss);
1939 	pci_walk_bus(bus, pcie_bus_configure_set, &smpss);
1940 }
1941 EXPORT_SYMBOL_GPL(pcie_bus_configure_settings);
1942 
1943 unsigned int pci_scan_child_bus(struct pci_bus *bus)
1944 {
1945 	unsigned int devfn, pass, max = bus->busn_res.start;
1946 	struct pci_dev *dev;
1947 
1948 	dev_dbg(&bus->dev, "scanning bus\n");
1949 
1950 	/* Go find them, Rover! */
1951 	for (devfn = 0; devfn < 0x100; devfn += 8)
1952 		pci_scan_slot(bus, devfn);
1953 
1954 	/* Reserve buses for SR-IOV capability. */
1955 	max += pci_iov_bus_range(bus);
1956 
1957 	/*
1958 	 * After performing arch-dependent fixup of the bus, look behind
1959 	 * all PCI-to-PCI bridges on this bus.
1960 	 */
1961 	if (!bus->is_added) {
1962 		dev_dbg(&bus->dev, "fixups for bus\n");
1963 		pcibios_fixup_bus(bus);
1964 		bus->is_added = 1;
1965 	}
1966 
1967 	for (pass = 0; pass < 2; pass++)
1968 		list_for_each_entry(dev, &bus->devices, bus_list) {
1969 			if (pci_is_bridge(dev))
1970 				max = pci_scan_bridge(bus, dev, max, pass);
1971 		}
1972 
1973 	/*
1974 	 * We've scanned the bus and so we know all about what's on
1975 	 * the other side of any bridges that may be on this bus plus
1976 	 * any devices.
1977 	 *
1978 	 * Return how far we've got finding sub-buses.
1979 	 */
1980 	dev_dbg(&bus->dev, "bus scan returning with max=%02x\n", max);
1981 	return max;
1982 }
1983 EXPORT_SYMBOL_GPL(pci_scan_child_bus);
1984 
1985 /**
1986  * pcibios_root_bridge_prepare - Platform-specific host bridge setup.
1987  * @bridge: Host bridge to set up.
1988  *
1989  * Default empty implementation.  Replace with an architecture-specific setup
1990  * routine, if necessary.
1991  */
1992 int __weak pcibios_root_bridge_prepare(struct pci_host_bridge *bridge)
1993 {
1994 	return 0;
1995 }
1996 
1997 void __weak pcibios_add_bus(struct pci_bus *bus)
1998 {
1999 }
2000 
2001 void __weak pcibios_remove_bus(struct pci_bus *bus)
2002 {
2003 }
2004 
2005 struct pci_bus *pci_create_root_bus(struct device *parent, int bus,
2006 		struct pci_ops *ops, void *sysdata, struct list_head *resources)
2007 {
2008 	int error;
2009 	struct pci_host_bridge *bridge;
2010 	struct pci_bus *b, *b2;
2011 	struct resource_entry *window, *n;
2012 	struct resource *res;
2013 	resource_size_t offset;
2014 	char bus_addr[64];
2015 	char *fmt;
2016 
2017 	b = pci_alloc_bus(NULL);
2018 	if (!b)
2019 		return NULL;
2020 
2021 	b->sysdata = sysdata;
2022 	b->ops = ops;
2023 	b->number = b->busn_res.start = bus;
2024 	pci_bus_assign_domain_nr(b, parent);
2025 	b2 = pci_find_bus(pci_domain_nr(b), bus);
2026 	if (b2) {
2027 		/* If we already got to this bus through a different bridge, ignore it */
2028 		dev_dbg(&b2->dev, "bus already known\n");
2029 		goto err_out;
2030 	}
2031 
2032 	bridge = pci_alloc_host_bridge(b);
2033 	if (!bridge)
2034 		goto err_out;
2035 
2036 	bridge->dev.parent = parent;
2037 	bridge->dev.release = pci_release_host_bridge_dev;
2038 	dev_set_name(&bridge->dev, "pci%04x:%02x", pci_domain_nr(b), bus);
2039 	error = pcibios_root_bridge_prepare(bridge);
2040 	if (error) {
2041 		kfree(bridge);
2042 		goto err_out;
2043 	}
2044 
2045 	error = device_register(&bridge->dev);
2046 	if (error) {
2047 		put_device(&bridge->dev);
2048 		goto err_out;
2049 	}
2050 	b->bridge = get_device(&bridge->dev);
2051 	device_enable_async_suspend(b->bridge);
2052 	pci_set_bus_of_node(b);
2053 	pci_set_bus_msi_domain(b);
2054 
2055 	if (!parent)
2056 		set_dev_node(b->bridge, pcibus_to_node(b));
2057 
2058 	b->dev.class = &pcibus_class;
2059 	b->dev.parent = b->bridge;
2060 	dev_set_name(&b->dev, "%04x:%02x", pci_domain_nr(b), bus);
2061 	error = device_register(&b->dev);
2062 	if (error)
2063 		goto class_dev_reg_err;
2064 
2065 	pcibios_add_bus(b);
2066 
2067 	/* Create legacy_io and legacy_mem files for this bus */
2068 	pci_create_legacy_files(b);
2069 
2070 	if (parent)
2071 		dev_info(parent, "PCI host bridge to bus %s\n", dev_name(&b->dev));
2072 	else
2073 		printk(KERN_INFO "PCI host bridge to bus %s\n", dev_name(&b->dev));
2074 
2075 	/* Add initial resources to the bus */
2076 	resource_list_for_each_entry_safe(window, n, resources) {
2077 		list_move_tail(&window->node, &bridge->windows);
2078 		res = window->res;
2079 		offset = window->offset;
2080 		if (res->flags & IORESOURCE_BUS)
2081 			pci_bus_insert_busn_res(b, bus, res->end);
2082 		else
2083 			pci_bus_add_resource(b, res, 0);
2084 		if (offset) {
2085 			if (resource_type(res) == IORESOURCE_IO)
2086 				fmt = " (bus address [%#06llx-%#06llx])";
2087 			else
2088 				fmt = " (bus address [%#010llx-%#010llx])";
2089 			snprintf(bus_addr, sizeof(bus_addr), fmt,
2090 				 (unsigned long long) (res->start - offset),
2091 				 (unsigned long long) (res->end - offset));
2092 		} else
2093 			bus_addr[0] = '\0';
2094 		dev_info(&b->dev, "root bus resource %pR%s\n", res, bus_addr);
2095 	}
2096 
2097 	down_write(&pci_bus_sem);
2098 	list_add_tail(&b->node, &pci_root_buses);
2099 	up_write(&pci_bus_sem);
2100 
2101 	return b;
2102 
2103 class_dev_reg_err:
2104 	put_device(&bridge->dev);
2105 	device_unregister(&bridge->dev);
2106 err_out:
2107 	kfree(b);
2108 	return NULL;
2109 }
2110 EXPORT_SYMBOL_GPL(pci_create_root_bus);
2111 
2112 int pci_bus_insert_busn_res(struct pci_bus *b, int bus, int bus_max)
2113 {
2114 	struct resource *res = &b->busn_res;
2115 	struct resource *parent_res, *conflict;
2116 
2117 	res->start = bus;
2118 	res->end = bus_max;
2119 	res->flags = IORESOURCE_BUS;
2120 
2121 	if (!pci_is_root_bus(b))
2122 		parent_res = &b->parent->busn_res;
2123 	else {
2124 		parent_res = get_pci_domain_busn_res(pci_domain_nr(b));
2125 		res->flags |= IORESOURCE_PCI_FIXED;
2126 	}
2127 
2128 	conflict = request_resource_conflict(parent_res, res);
2129 
2130 	if (conflict)
2131 		dev_printk(KERN_DEBUG, &b->dev,
2132 			   "busn_res: can not insert %pR under %s%pR (conflicts with %s %pR)\n",
2133 			    res, pci_is_root_bus(b) ? "domain " : "",
2134 			    parent_res, conflict->name, conflict);
2135 
2136 	return conflict == NULL;
2137 }
2138 
2139 int pci_bus_update_busn_res_end(struct pci_bus *b, int bus_max)
2140 {
2141 	struct resource *res = &b->busn_res;
2142 	struct resource old_res = *res;
2143 	resource_size_t size;
2144 	int ret;
2145 
2146 	if (res->start > bus_max)
2147 		return -EINVAL;
2148 
2149 	size = bus_max - res->start + 1;
2150 	ret = adjust_resource(res, res->start, size);
2151 	dev_printk(KERN_DEBUG, &b->dev,
2152 			"busn_res: %pR end %s updated to %02x\n",
2153 			&old_res, ret ? "can not be" : "is", bus_max);
2154 
2155 	if (!ret && !res->parent)
2156 		pci_bus_insert_busn_res(b, res->start, res->end);
2157 
2158 	return ret;
2159 }
2160 
2161 void pci_bus_release_busn_res(struct pci_bus *b)
2162 {
2163 	struct resource *res = &b->busn_res;
2164 	int ret;
2165 
2166 	if (!res->flags || !res->parent)
2167 		return;
2168 
2169 	ret = release_resource(res);
2170 	dev_printk(KERN_DEBUG, &b->dev,
2171 			"busn_res: %pR %s released\n",
2172 			res, ret ? "can not be" : "is");
2173 }
2174 
2175 struct pci_bus *pci_scan_root_bus_msi(struct device *parent, int bus,
2176 		struct pci_ops *ops, void *sysdata,
2177 		struct list_head *resources, struct msi_controller *msi)
2178 {
2179 	struct resource_entry *window;
2180 	bool found = false;
2181 	struct pci_bus *b;
2182 	int max;
2183 
2184 	resource_list_for_each_entry(window, resources)
2185 		if (window->res->flags & IORESOURCE_BUS) {
2186 			found = true;
2187 			break;
2188 		}
2189 
2190 	b = pci_create_root_bus(parent, bus, ops, sysdata, resources);
2191 	if (!b)
2192 		return NULL;
2193 
2194 	b->msi = msi;
2195 
2196 	if (!found) {
2197 		dev_info(&b->dev,
2198 		 "No busn resource found for root bus, will use [bus %02x-ff]\n",
2199 			bus);
2200 		pci_bus_insert_busn_res(b, bus, 255);
2201 	}
2202 
2203 	max = pci_scan_child_bus(b);
2204 
2205 	if (!found)
2206 		pci_bus_update_busn_res_end(b, max);
2207 
2208 	return b;
2209 }
2210 
2211 struct pci_bus *pci_scan_root_bus(struct device *parent, int bus,
2212 		struct pci_ops *ops, void *sysdata, struct list_head *resources)
2213 {
2214 	return pci_scan_root_bus_msi(parent, bus, ops, sysdata, resources,
2215 				     NULL);
2216 }
2217 EXPORT_SYMBOL(pci_scan_root_bus);
2218 
2219 struct pci_bus *pci_scan_bus(int bus, struct pci_ops *ops,
2220 					void *sysdata)
2221 {
2222 	LIST_HEAD(resources);
2223 	struct pci_bus *b;
2224 
2225 	pci_add_resource(&resources, &ioport_resource);
2226 	pci_add_resource(&resources, &iomem_resource);
2227 	pci_add_resource(&resources, &busn_resource);
2228 	b = pci_create_root_bus(NULL, bus, ops, sysdata, &resources);
2229 	if (b) {
2230 		pci_scan_child_bus(b);
2231 	} else {
2232 		pci_free_resource_list(&resources);
2233 	}
2234 	return b;
2235 }
2236 EXPORT_SYMBOL(pci_scan_bus);
2237 
2238 /**
2239  * pci_rescan_bus_bridge_resize - scan a PCI bus for devices.
2240  * @bridge: PCI bridge for the bus to scan
2241  *
2242  * Scan a PCI bus and child buses for new devices, add them,
2243  * and enable them, resizing bridge mmio/io resource if necessary
2244  * and possible.  The caller must ensure the child devices are already
2245  * removed for resizing to occur.
2246  *
2247  * Returns the max number of subordinate bus discovered.
2248  */
2249 unsigned int pci_rescan_bus_bridge_resize(struct pci_dev *bridge)
2250 {
2251 	unsigned int max;
2252 	struct pci_bus *bus = bridge->subordinate;
2253 
2254 	max = pci_scan_child_bus(bus);
2255 
2256 	pci_assign_unassigned_bridge_resources(bridge);
2257 
2258 	pci_bus_add_devices(bus);
2259 
2260 	return max;
2261 }
2262 
2263 /**
2264  * pci_rescan_bus - scan a PCI bus for devices.
2265  * @bus: PCI bus to scan
2266  *
2267  * Scan a PCI bus and child buses for new devices, adds them,
2268  * and enables them.
2269  *
2270  * Returns the max number of subordinate bus discovered.
2271  */
2272 unsigned int pci_rescan_bus(struct pci_bus *bus)
2273 {
2274 	unsigned int max;
2275 
2276 	max = pci_scan_child_bus(bus);
2277 	pci_assign_unassigned_bus_resources(bus);
2278 	pci_bus_add_devices(bus);
2279 
2280 	return max;
2281 }
2282 EXPORT_SYMBOL_GPL(pci_rescan_bus);
2283 
2284 /*
2285  * pci_rescan_bus(), pci_rescan_bus_bridge_resize() and PCI device removal
2286  * routines should always be executed under this mutex.
2287  */
2288 static DEFINE_MUTEX(pci_rescan_remove_lock);
2289 
2290 void pci_lock_rescan_remove(void)
2291 {
2292 	mutex_lock(&pci_rescan_remove_lock);
2293 }
2294 EXPORT_SYMBOL_GPL(pci_lock_rescan_remove);
2295 
2296 void pci_unlock_rescan_remove(void)
2297 {
2298 	mutex_unlock(&pci_rescan_remove_lock);
2299 }
2300 EXPORT_SYMBOL_GPL(pci_unlock_rescan_remove);
2301 
2302 static int __init pci_sort_bf_cmp(const struct device *d_a,
2303 				  const struct device *d_b)
2304 {
2305 	const struct pci_dev *a = to_pci_dev(d_a);
2306 	const struct pci_dev *b = to_pci_dev(d_b);
2307 
2308 	if      (pci_domain_nr(a->bus) < pci_domain_nr(b->bus)) return -1;
2309 	else if (pci_domain_nr(a->bus) > pci_domain_nr(b->bus)) return  1;
2310 
2311 	if      (a->bus->number < b->bus->number) return -1;
2312 	else if (a->bus->number > b->bus->number) return  1;
2313 
2314 	if      (a->devfn < b->devfn) return -1;
2315 	else if (a->devfn > b->devfn) return  1;
2316 
2317 	return 0;
2318 }
2319 
2320 void __init pci_sort_breadthfirst(void)
2321 {
2322 	bus_sort_breadthfirst(&pci_bus_type, &pci_sort_bf_cmp);
2323 }
2324