xref: /freebsd/sys/dev/pci/pci_pci.c (revision 357378bbdedf24ce2b90e9bd831af4a9db3ec70a)
1 /*-
2  * SPDX-License-Identifier: BSD-3-Clause
3  *
4  * Copyright (c) 1994,1995 Stefan Esser, Wolfgang StanglMeier
5  * Copyright (c) 2000 Michael Smith <msmith@freebsd.org>
6  * Copyright (c) 2000 BSDi
7  * All rights reserved.
8  *
9  * Redistribution and use in source and binary forms, with or without
10  * modification, are permitted provided that the following conditions
11  * are met:
12  * 1. Redistributions of source code must retain the above copyright
13  *    notice, this list of conditions and the following disclaimer.
14  * 2. Redistributions in binary form must reproduce the above copyright
15  *    notice, this list of conditions and the following disclaimer in the
16  *    documentation and/or other materials provided with the distribution.
17  * 3. The name of the author may not be used to endorse or promote products
18  *    derived from this software without specific prior written permission.
19  *
20  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
21  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
22  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
23  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
24  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
25  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
26  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
28  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
29  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
30  * SUCH DAMAGE.
31  */
32 
33 #include <sys/cdefs.h>
34 /*
35  * PCI:PCI bridge support.
36  */
37 
38 #include "opt_pci.h"
39 
40 #include <sys/param.h>
41 #include <sys/bus.h>
42 #include <sys/kernel.h>
43 #include <sys/lock.h>
44 #include <sys/malloc.h>
45 #include <sys/module.h>
46 #include <sys/mutex.h>
47 #include <sys/pciio.h>
48 #include <sys/rman.h>
49 #include <sys/sysctl.h>
50 #include <sys/systm.h>
51 #include <sys/taskqueue.h>
52 
53 #include <dev/pci/pcivar.h>
54 #include <dev/pci/pcireg.h>
55 #include <dev/pci/pci_private.h>
56 #include <dev/pci/pcib_private.h>
57 
58 #include "pcib_if.h"
59 
60 static int		pcib_probe(device_t dev);
61 static int		pcib_resume(device_t dev);
62 
63 static bus_child_present_t	pcib_child_present;
64 static bus_alloc_resource_t	pcib_alloc_resource;
65 static bus_adjust_resource_t	pcib_adjust_resource;
66 static bus_release_resource_t	pcib_release_resource;
67 static bus_activate_resource_t	pcib_activate_resource;
68 static bus_deactivate_resource_t pcib_deactivate_resource;
69 static bus_map_resource_t	pcib_map_resource;
70 static bus_unmap_resource_t	pcib_unmap_resource;
71 static int		pcib_reset_child(device_t dev, device_t child, int flags);
72 
73 static int		pcib_power_for_sleep(device_t pcib, device_t dev,
74 			    int *pstate);
75 static int		pcib_ari_get_id(device_t pcib, device_t dev,
76     enum pci_id_type type, uintptr_t *id);
77 static uint32_t		pcib_read_config(device_t dev, u_int b, u_int s,
78     u_int f, u_int reg, int width);
79 static void		pcib_write_config(device_t dev, u_int b, u_int s,
80     u_int f, u_int reg, uint32_t val, int width);
81 static int		pcib_ari_maxslots(device_t dev);
82 static int		pcib_ari_maxfuncs(device_t dev);
83 static int		pcib_try_enable_ari(device_t pcib, device_t dev);
84 static int		pcib_ari_enabled(device_t pcib);
85 static void		pcib_ari_decode_rid(device_t pcib, uint16_t rid,
86 			    int *bus, int *slot, int *func);
87 #ifdef PCI_HP
88 static void		pcib_pcie_ab_timeout(void *arg, int pending);
89 static void		pcib_pcie_cc_timeout(void *arg, int pending);
90 static void		pcib_pcie_dll_timeout(void *arg, int pending);
91 #endif
92 static int		pcib_request_feature_default(device_t pcib, device_t dev,
93 			    enum pci_feature feature);
94 
95 static device_method_t pcib_methods[] = {
96     /* Device interface */
97     DEVMETHOD(device_probe,		pcib_probe),
98     DEVMETHOD(device_attach,		pcib_attach),
99     DEVMETHOD(device_detach,		pcib_detach),
100     DEVMETHOD(device_shutdown,		bus_generic_shutdown),
101     DEVMETHOD(device_suspend,		bus_generic_suspend),
102     DEVMETHOD(device_resume,		pcib_resume),
103 
104     /* Bus interface */
105     DEVMETHOD(bus_child_present,	pcib_child_present),
106     DEVMETHOD(bus_read_ivar,		pcib_read_ivar),
107     DEVMETHOD(bus_write_ivar,		pcib_write_ivar),
108     DEVMETHOD(bus_alloc_resource,	pcib_alloc_resource),
109     DEVMETHOD(bus_adjust_resource,	pcib_adjust_resource),
110     DEVMETHOD(bus_release_resource,	pcib_release_resource),
111     DEVMETHOD(bus_activate_resource,	pcib_activate_resource),
112     DEVMETHOD(bus_deactivate_resource,	pcib_deactivate_resource),
113     DEVMETHOD(bus_map_resource,		pcib_map_resource),
114     DEVMETHOD(bus_unmap_resource,	pcib_unmap_resource),
115     DEVMETHOD(bus_setup_intr,		bus_generic_setup_intr),
116     DEVMETHOD(bus_teardown_intr,	bus_generic_teardown_intr),
117     DEVMETHOD(bus_reset_child,		pcib_reset_child),
118 
119     /* pcib interface */
120     DEVMETHOD(pcib_maxslots,		pcib_ari_maxslots),
121     DEVMETHOD(pcib_maxfuncs,		pcib_ari_maxfuncs),
122     DEVMETHOD(pcib_read_config,		pcib_read_config),
123     DEVMETHOD(pcib_write_config,	pcib_write_config),
124     DEVMETHOD(pcib_route_interrupt,	pcib_route_interrupt),
125     DEVMETHOD(pcib_alloc_msi,		pcib_alloc_msi),
126     DEVMETHOD(pcib_release_msi,		pcib_release_msi),
127     DEVMETHOD(pcib_alloc_msix,		pcib_alloc_msix),
128     DEVMETHOD(pcib_release_msix,	pcib_release_msix),
129     DEVMETHOD(pcib_map_msi,		pcib_map_msi),
130     DEVMETHOD(pcib_power_for_sleep,	pcib_power_for_sleep),
131     DEVMETHOD(pcib_get_id,		pcib_ari_get_id),
132     DEVMETHOD(pcib_try_enable_ari,	pcib_try_enable_ari),
133     DEVMETHOD(pcib_ari_enabled,		pcib_ari_enabled),
134     DEVMETHOD(pcib_decode_rid,		pcib_ari_decode_rid),
135     DEVMETHOD(pcib_request_feature,	pcib_request_feature_default),
136 
137     DEVMETHOD_END
138 };
139 
140 DEFINE_CLASS_0(pcib, pcib_driver, pcib_methods, sizeof(struct pcib_softc));
141 EARLY_DRIVER_MODULE(pcib, pci, pcib_driver, NULL, NULL, BUS_PASS_BUS);
142 
143 SYSCTL_DECL(_hw_pci);
144 
145 static int pci_clear_pcib;
146 SYSCTL_INT(_hw_pci, OID_AUTO, clear_pcib, CTLFLAG_RDTUN, &pci_clear_pcib, 0,
147     "Clear firmware-assigned resources for PCI-PCI bridge I/O windows.");
148 
149 /*
150  * Get the corresponding window if this resource from a child device was
151  * sub-allocated from one of our window resource managers.
152  */
153 static struct pcib_window *
154 pcib_get_resource_window(struct pcib_softc *sc, struct resource *r)
155 {
156 	switch (rman_get_type(r)) {
157 	case SYS_RES_IOPORT:
158 		if (rman_is_region_manager(r, &sc->io.rman))
159 			return (&sc->io);
160 		break;
161 	case SYS_RES_MEMORY:
162 		/* Prefetchable resources may live in either memory rman. */
163 		if (rman_get_flags(r) & RF_PREFETCHABLE &&
164 		    rman_is_region_manager(r, &sc->pmem.rman))
165 			return (&sc->pmem);
166 		if (rman_is_region_manager(r, &sc->mem.rman))
167 			return (&sc->mem);
168 		break;
169 	}
170 	return (NULL);
171 }
172 
173 /*
174  * Is a resource from a child device sub-allocated from one of our
175  * resource managers?
176  */
177 static int
178 pcib_is_resource_managed(struct pcib_softc *sc, struct resource *r)
179 {
180 
181 	if (rman_get_type(r) == PCI_RES_BUS)
182 		return (rman_is_region_manager(r, &sc->bus.rman));
183 	return (pcib_get_resource_window(sc, r) != NULL);
184 }
185 
186 static int
187 pcib_is_window_open(struct pcib_window *pw)
188 {
189 
190 	return (pw->valid && pw->base < pw->limit);
191 }
192 
193 /*
194  * XXX: If RF_ACTIVE did not also imply allocating a bus space tag and
195  * handle for the resource, we could pass RF_ACTIVE up to the PCI bus
196  * when allocating the resource windows and rely on the PCI bus driver
197  * to do this for us.
198  */
199 static void
200 pcib_activate_window(struct pcib_softc *sc, int type)
201 {
202 
203 	PCI_ENABLE_IO(device_get_parent(sc->dev), sc->dev, type);
204 }
205 
206 static void
207 pcib_write_windows(struct pcib_softc *sc, int mask)
208 {
209 	device_t dev;
210 	uint32_t val;
211 
212 	dev = sc->dev;
213 	if (sc->io.valid && mask & WIN_IO) {
214 		val = pci_read_config(dev, PCIR_IOBASEL_1, 1);
215 		if ((val & PCIM_BRIO_MASK) == PCIM_BRIO_32) {
216 			pci_write_config(dev, PCIR_IOBASEH_1,
217 			    sc->io.base >> 16, 2);
218 			pci_write_config(dev, PCIR_IOLIMITH_1,
219 			    sc->io.limit >> 16, 2);
220 		}
221 		pci_write_config(dev, PCIR_IOBASEL_1, sc->io.base >> 8, 1);
222 		pci_write_config(dev, PCIR_IOLIMITL_1, sc->io.limit >> 8, 1);
223 	}
224 
225 	if (mask & WIN_MEM) {
226 		pci_write_config(dev, PCIR_MEMBASE_1, sc->mem.base >> 16, 2);
227 		pci_write_config(dev, PCIR_MEMLIMIT_1, sc->mem.limit >> 16, 2);
228 	}
229 
230 	if (sc->pmem.valid && mask & WIN_PMEM) {
231 		val = pci_read_config(dev, PCIR_PMBASEL_1, 2);
232 		if ((val & PCIM_BRPM_MASK) == PCIM_BRPM_64) {
233 			pci_write_config(dev, PCIR_PMBASEH_1,
234 			    sc->pmem.base >> 32, 4);
235 			pci_write_config(dev, PCIR_PMLIMITH_1,
236 			    sc->pmem.limit >> 32, 4);
237 		}
238 		pci_write_config(dev, PCIR_PMBASEL_1, sc->pmem.base >> 16, 2);
239 		pci_write_config(dev, PCIR_PMLIMITL_1, sc->pmem.limit >> 16, 2);
240 	}
241 }
242 
243 /*
244  * This is used to reject I/O port allocations that conflict with an
245  * ISA alias range.
246  */
247 static int
248 pcib_is_isa_range(struct pcib_softc *sc, rman_res_t start, rman_res_t end,
249     rman_res_t count)
250 {
251 	rman_res_t next_alias;
252 
253 	if (!(sc->bridgectl & PCIB_BCR_ISA_ENABLE))
254 		return (0);
255 
256 	/* Only check fixed ranges for overlap. */
257 	if (start + count - 1 != end)
258 		return (0);
259 
260 	/* ISA aliases are only in the lower 64KB of I/O space. */
261 	if (start >= 65536)
262 		return (0);
263 
264 	/* Check for overlap with 0x000 - 0x0ff as a special case. */
265 	if (start < 0x100)
266 		goto alias;
267 
268 	/*
269 	 * If the start address is an alias, the range is an alias.
270 	 * Otherwise, compute the start of the next alias range and
271 	 * check if it is before the end of the candidate range.
272 	 */
273 	if ((start & 0x300) != 0)
274 		goto alias;
275 	next_alias = (start & ~0x3fful) | 0x100;
276 	if (next_alias <= end)
277 		goto alias;
278 	return (0);
279 
280 alias:
281 	if (bootverbose)
282 		device_printf(sc->dev,
283 		    "I/O range %#jx-%#jx overlaps with an ISA alias\n", start,
284 		    end);
285 	return (1);
286 }
287 
288 static void
289 pcib_add_window_resources(struct pcib_window *w, struct resource **res,
290     int count)
291 {
292 	struct resource **newarray;
293 	int error, i;
294 
295 	newarray = malloc(sizeof(struct resource *) * (w->count + count),
296 	    M_DEVBUF, M_WAITOK);
297 	if (w->res != NULL)
298 		bcopy(w->res, newarray, sizeof(struct resource *) * w->count);
299 	bcopy(res, newarray + w->count, sizeof(struct resource *) * count);
300 	free(w->res, M_DEVBUF);
301 	w->res = newarray;
302 	w->count += count;
303 
304 	for (i = 0; i < count; i++) {
305 		error = rman_manage_region(&w->rman, rman_get_start(res[i]),
306 		    rman_get_end(res[i]));
307 		if (error)
308 			panic("Failed to add resource to rman");
309 	}
310 }
311 
312 typedef void (nonisa_callback)(rman_res_t start, rman_res_t end, void *arg);
313 
314 static void
315 pcib_walk_nonisa_ranges(rman_res_t start, rman_res_t end, nonisa_callback *cb,
316     void *arg)
317 {
318 	rman_res_t next_end;
319 
320 	/*
321 	 * If start is within an ISA alias range, move up to the start
322 	 * of the next non-alias range.  As a special case, addresses
323 	 * in the range 0x000 - 0x0ff should also be skipped since
324 	 * those are used for various system I/O devices in ISA
325 	 * systems.
326 	 */
327 	if (start <= 65535) {
328 		if (start < 0x100 || (start & 0x300) != 0) {
329 			start &= ~0x3ff;
330 			start += 0x400;
331 		}
332 	}
333 
334 	/* ISA aliases are only in the lower 64KB of I/O space. */
335 	while (start <= MIN(end, 65535)) {
336 		next_end = MIN(start | 0xff, end);
337 		cb(start, next_end, arg);
338 		start += 0x400;
339 	}
340 
341 	if (start <= end)
342 		cb(start, end, arg);
343 }
344 
345 static void
346 count_ranges(rman_res_t start, rman_res_t end, void *arg)
347 {
348 	int *countp;
349 
350 	countp = arg;
351 	(*countp)++;
352 }
353 
354 struct alloc_state {
355 	struct resource **res;
356 	struct pcib_softc *sc;
357 	int count, error;
358 };
359 
360 static void
361 alloc_ranges(rman_res_t start, rman_res_t end, void *arg)
362 {
363 	struct alloc_state *as;
364 	struct pcib_window *w;
365 	int rid;
366 
367 	as = arg;
368 	if (as->error != 0)
369 		return;
370 
371 	w = &as->sc->io;
372 	rid = w->reg;
373 	if (bootverbose)
374 		device_printf(as->sc->dev,
375 		    "allocating non-ISA range %#jx-%#jx\n", start, end);
376 	as->res[as->count] = bus_alloc_resource(as->sc->dev, SYS_RES_IOPORT,
377 	    &rid, start, end, end - start + 1, RF_ACTIVE | RF_UNMAPPED);
378 	if (as->res[as->count] == NULL)
379 		as->error = ENXIO;
380 	else
381 		as->count++;
382 }
383 
384 static int
385 pcib_alloc_nonisa_ranges(struct pcib_softc *sc, rman_res_t start, rman_res_t end)
386 {
387 	struct alloc_state as;
388 	int i, new_count;
389 
390 	/* First, see how many ranges we need. */
391 	new_count = 0;
392 	pcib_walk_nonisa_ranges(start, end, count_ranges, &new_count);
393 
394 	/* Second, allocate the ranges. */
395 	as.res = malloc(sizeof(struct resource *) * new_count, M_DEVBUF,
396 	    M_WAITOK);
397 	as.sc = sc;
398 	as.count = 0;
399 	as.error = 0;
400 	pcib_walk_nonisa_ranges(start, end, alloc_ranges, &as);
401 	if (as.error != 0) {
402 		for (i = 0; i < as.count; i++)
403 			bus_release_resource(sc->dev, SYS_RES_IOPORT,
404 			    sc->io.reg, as.res[i]);
405 		free(as.res, M_DEVBUF);
406 		return (as.error);
407 	}
408 	KASSERT(as.count == new_count, ("%s: count mismatch", __func__));
409 
410 	/* Third, add the ranges to the window. */
411 	pcib_add_window_resources(&sc->io, as.res, as.count);
412 	free(as.res, M_DEVBUF);
413 	return (0);
414 }
415 
416 static void
417 pcib_alloc_window(struct pcib_softc *sc, struct pcib_window *w, int type,
418     int flags, pci_addr_t max_address)
419 {
420 	struct resource *res;
421 	char buf[64];
422 	int error, rid;
423 
424 	if (max_address != (rman_res_t)max_address)
425 		max_address = ~0;
426 	w->rman.rm_start = 0;
427 	w->rman.rm_end = max_address;
428 	w->rman.rm_type = RMAN_ARRAY;
429 	snprintf(buf, sizeof(buf), "%s %s window",
430 	    device_get_nameunit(sc->dev), w->name);
431 	w->rman.rm_descr = strdup(buf, M_DEVBUF);
432 	error = rman_init(&w->rman);
433 	if (error)
434 		panic("Failed to initialize %s %s rman",
435 		    device_get_nameunit(sc->dev), w->name);
436 
437 	if (!pcib_is_window_open(w))
438 		return;
439 
440 	if (w->base > max_address || w->limit > max_address) {
441 		device_printf(sc->dev,
442 		    "initial %s window has too many bits, ignoring\n", w->name);
443 		return;
444 	}
445 	if (type == SYS_RES_IOPORT && sc->bridgectl & PCIB_BCR_ISA_ENABLE)
446 		(void)pcib_alloc_nonisa_ranges(sc, w->base, w->limit);
447 	else {
448 		rid = w->reg;
449 		res = bus_alloc_resource(sc->dev, type, &rid, w->base, w->limit,
450 		    w->limit - w->base + 1, flags | RF_ACTIVE | RF_UNMAPPED);
451 		if (res != NULL)
452 			pcib_add_window_resources(w, &res, 1);
453 	}
454 	if (w->res == NULL) {
455 		device_printf(sc->dev,
456 		    "failed to allocate initial %s window: %#jx-%#jx\n",
457 		    w->name, (uintmax_t)w->base, (uintmax_t)w->limit);
458 		w->base = max_address;
459 		w->limit = 0;
460 		pcib_write_windows(sc, w->mask);
461 		return;
462 	}
463 	pcib_activate_window(sc, type);
464 }
465 
466 /*
467  * Initialize I/O windows.
468  */
469 static void
470 pcib_probe_windows(struct pcib_softc *sc)
471 {
472 	pci_addr_t max;
473 	device_t dev;
474 	uint32_t val;
475 
476 	dev = sc->dev;
477 
478 	if (pci_clear_pcib) {
479 		pcib_bridge_init(dev);
480 	}
481 
482 	/* Determine if the I/O port window is implemented. */
483 	val = pci_read_config(dev, PCIR_IOBASEL_1, 1);
484 	if (val == 0) {
485 		/*
486 		 * If 'val' is zero, then only 16-bits of I/O space
487 		 * are supported.
488 		 */
489 		pci_write_config(dev, PCIR_IOBASEL_1, 0xff, 1);
490 		if (pci_read_config(dev, PCIR_IOBASEL_1, 1) != 0) {
491 			sc->io.valid = 1;
492 			pci_write_config(dev, PCIR_IOBASEL_1, 0, 1);
493 		}
494 	} else
495 		sc->io.valid = 1;
496 
497 	/* Read the existing I/O port window. */
498 	if (sc->io.valid) {
499 		sc->io.reg = PCIR_IOBASEL_1;
500 		sc->io.step = 12;
501 		sc->io.mask = WIN_IO;
502 		sc->io.name = "I/O port";
503 		if ((val & PCIM_BRIO_MASK) == PCIM_BRIO_32) {
504 			sc->io.base = PCI_PPBIOBASE(
505 			    pci_read_config(dev, PCIR_IOBASEH_1, 2), val);
506 			sc->io.limit = PCI_PPBIOLIMIT(
507 			    pci_read_config(dev, PCIR_IOLIMITH_1, 2),
508 			    pci_read_config(dev, PCIR_IOLIMITL_1, 1));
509 			max = 0xffffffff;
510 		} else {
511 			sc->io.base = PCI_PPBIOBASE(0, val);
512 			sc->io.limit = PCI_PPBIOLIMIT(0,
513 			    pci_read_config(dev, PCIR_IOLIMITL_1, 1));
514 			max = 0xffff;
515 		}
516 		pcib_alloc_window(sc, &sc->io, SYS_RES_IOPORT, 0, max);
517 	}
518 
519 	/* Read the existing memory window. */
520 	sc->mem.valid = 1;
521 	sc->mem.reg = PCIR_MEMBASE_1;
522 	sc->mem.step = 20;
523 	sc->mem.mask = WIN_MEM;
524 	sc->mem.name = "memory";
525 	sc->mem.base = PCI_PPBMEMBASE(0,
526 	    pci_read_config(dev, PCIR_MEMBASE_1, 2));
527 	sc->mem.limit = PCI_PPBMEMLIMIT(0,
528 	    pci_read_config(dev, PCIR_MEMLIMIT_1, 2));
529 	pcib_alloc_window(sc, &sc->mem, SYS_RES_MEMORY, 0, 0xffffffff);
530 
531 	/* Determine if the prefetchable memory window is implemented. */
532 	val = pci_read_config(dev, PCIR_PMBASEL_1, 2);
533 	if (val == 0) {
534 		/*
535 		 * If 'val' is zero, then only 32-bits of memory space
536 		 * are supported.
537 		 */
538 		pci_write_config(dev, PCIR_PMBASEL_1, 0xffff, 2);
539 		if (pci_read_config(dev, PCIR_PMBASEL_1, 2) != 0) {
540 			sc->pmem.valid = 1;
541 			pci_write_config(dev, PCIR_PMBASEL_1, 0, 2);
542 		}
543 	} else
544 		sc->pmem.valid = 1;
545 
546 	/* Read the existing prefetchable memory window. */
547 	if (sc->pmem.valid) {
548 		sc->pmem.reg = PCIR_PMBASEL_1;
549 		sc->pmem.step = 20;
550 		sc->pmem.mask = WIN_PMEM;
551 		sc->pmem.name = "prefetch";
552 		if ((val & PCIM_BRPM_MASK) == PCIM_BRPM_64) {
553 			sc->pmem.base = PCI_PPBMEMBASE(
554 			    pci_read_config(dev, PCIR_PMBASEH_1, 4), val);
555 			sc->pmem.limit = PCI_PPBMEMLIMIT(
556 			    pci_read_config(dev, PCIR_PMLIMITH_1, 4),
557 			    pci_read_config(dev, PCIR_PMLIMITL_1, 2));
558 			max = 0xffffffffffffffff;
559 		} else {
560 			sc->pmem.base = PCI_PPBMEMBASE(0, val);
561 			sc->pmem.limit = PCI_PPBMEMLIMIT(0,
562 			    pci_read_config(dev, PCIR_PMLIMITL_1, 2));
563 			max = 0xffffffff;
564 		}
565 		pcib_alloc_window(sc, &sc->pmem, SYS_RES_MEMORY,
566 		    RF_PREFETCHABLE, max);
567 	}
568 }
569 
570 static void
571 pcib_release_window(struct pcib_softc *sc, struct pcib_window *w, int type)
572 {
573 	device_t dev;
574 	int error, i;
575 
576 	if (!w->valid)
577 		return;
578 
579 	dev = sc->dev;
580 	error = rman_fini(&w->rman);
581 	if (error) {
582 		device_printf(dev, "failed to release %s rman\n", w->name);
583 		return;
584 	}
585 	free(__DECONST(char *, w->rman.rm_descr), M_DEVBUF);
586 
587 	for (i = 0; i < w->count; i++) {
588 		error = bus_free_resource(dev, type, w->res[i]);
589 		if (error)
590 			device_printf(dev,
591 			    "failed to release %s resource: %d\n", w->name,
592 			    error);
593 	}
594 	free(w->res, M_DEVBUF);
595 }
596 
597 static void
598 pcib_free_windows(struct pcib_softc *sc)
599 {
600 
601 	pcib_release_window(sc, &sc->pmem, SYS_RES_MEMORY);
602 	pcib_release_window(sc, &sc->mem, SYS_RES_MEMORY);
603 	pcib_release_window(sc, &sc->io, SYS_RES_IOPORT);
604 }
605 
606 /*
607  * Allocate a suitable secondary bus for this bridge if needed and
608  * initialize the resource manager for the secondary bus range.  Note
609  * that the minimum count is a desired value and this may allocate a
610  * smaller range.
611  */
612 void
613 pcib_setup_secbus(device_t dev, struct pcib_secbus *bus, int min_count)
614 {
615 	char buf[64];
616 	int error, rid, sec_reg;
617 
618 	switch (pci_read_config(dev, PCIR_HDRTYPE, 1) & PCIM_HDRTYPE) {
619 	case PCIM_HDRTYPE_BRIDGE:
620 		sec_reg = PCIR_SECBUS_1;
621 		bus->sub_reg = PCIR_SUBBUS_1;
622 		break;
623 	case PCIM_HDRTYPE_CARDBUS:
624 		sec_reg = PCIR_SECBUS_2;
625 		bus->sub_reg = PCIR_SUBBUS_2;
626 		break;
627 	default:
628 		panic("not a PCI bridge");
629 	}
630 	bus->sec = pci_read_config(dev, sec_reg, 1);
631 	bus->sub = pci_read_config(dev, bus->sub_reg, 1);
632 	bus->dev = dev;
633 	bus->rman.rm_start = 0;
634 	bus->rman.rm_end = PCI_BUSMAX;
635 	bus->rman.rm_type = RMAN_ARRAY;
636 	snprintf(buf, sizeof(buf), "%s bus numbers", device_get_nameunit(dev));
637 	bus->rman.rm_descr = strdup(buf, M_DEVBUF);
638 	error = rman_init(&bus->rman);
639 	if (error)
640 		panic("Failed to initialize %s bus number rman",
641 		    device_get_nameunit(dev));
642 
643 	/*
644 	 * Allocate a bus range.  This will return an existing bus range
645 	 * if one exists, or a new bus range if one does not.
646 	 */
647 	rid = 0;
648 	bus->res = bus_alloc_resource_anywhere(dev, PCI_RES_BUS, &rid,
649 	    min_count, RF_ACTIVE);
650 	if (bus->res == NULL) {
651 		/*
652 		 * Fall back to just allocating a range of a single bus
653 		 * number.
654 		 */
655 		bus->res = bus_alloc_resource_anywhere(dev, PCI_RES_BUS, &rid,
656 		    1, RF_ACTIVE);
657 	} else if (rman_get_size(bus->res) < min_count)
658 		/*
659 		 * Attempt to grow the existing range to satisfy the
660 		 * minimum desired count.
661 		 */
662 		(void)bus_adjust_resource(dev, PCI_RES_BUS, bus->res,
663 		    rman_get_start(bus->res), rman_get_start(bus->res) +
664 		    min_count - 1);
665 
666 	/*
667 	 * Add the initial resource to the rman.
668 	 */
669 	if (bus->res != NULL) {
670 		error = rman_manage_region(&bus->rman, rman_get_start(bus->res),
671 		    rman_get_end(bus->res));
672 		if (error)
673 			panic("Failed to add resource to rman");
674 		bus->sec = rman_get_start(bus->res);
675 		bus->sub = rman_get_end(bus->res);
676 	}
677 }
678 
679 void
680 pcib_free_secbus(device_t dev, struct pcib_secbus *bus)
681 {
682 	int error;
683 
684 	error = rman_fini(&bus->rman);
685 	if (error) {
686 		device_printf(dev, "failed to release bus number rman\n");
687 		return;
688 	}
689 	free(__DECONST(char *, bus->rman.rm_descr), M_DEVBUF);
690 
691 	error = bus_free_resource(dev, PCI_RES_BUS, bus->res);
692 	if (error)
693 		device_printf(dev,
694 		    "failed to release bus numbers resource: %d\n", error);
695 }
696 
697 static struct resource *
698 pcib_suballoc_bus(struct pcib_secbus *bus, device_t child, int *rid,
699     rman_res_t start, rman_res_t end, rman_res_t count, u_int flags)
700 {
701 	struct resource *res;
702 
703 	res = rman_reserve_resource(&bus->rman, start, end, count, flags,
704 	    child);
705 	if (res == NULL)
706 		return (NULL);
707 
708 	if (bootverbose)
709 		device_printf(bus->dev,
710 		    "allocated bus range (%ju-%ju) for rid %d of %s\n",
711 		    rman_get_start(res), rman_get_end(res), *rid,
712 		    pcib_child_name(child));
713 	rman_set_rid(res, *rid);
714 	rman_set_type(res, PCI_RES_BUS);
715 	return (res);
716 }
717 
718 /*
719  * Attempt to grow the secondary bus range.  This is much simpler than
720  * for I/O windows as the range can only be grown by increasing
721  * subbus.
722  */
723 static int
724 pcib_grow_subbus(struct pcib_secbus *bus, rman_res_t new_end)
725 {
726 	rman_res_t old_end;
727 	int error;
728 
729 	old_end = rman_get_end(bus->res);
730 	KASSERT(new_end > old_end, ("attempt to shrink subbus"));
731 	error = bus_adjust_resource(bus->dev, PCI_RES_BUS, bus->res,
732 	    rman_get_start(bus->res), new_end);
733 	if (error)
734 		return (error);
735 	if (bootverbose)
736 		device_printf(bus->dev, "grew bus range to %ju-%ju\n",
737 		    rman_get_start(bus->res), rman_get_end(bus->res));
738 	error = rman_manage_region(&bus->rman, old_end + 1,
739 	    rman_get_end(bus->res));
740 	if (error)
741 		panic("Failed to add resource to rman");
742 	bus->sub = rman_get_end(bus->res);
743 	pci_write_config(bus->dev, bus->sub_reg, bus->sub, 1);
744 	return (0);
745 }
746 
747 struct resource *
748 pcib_alloc_subbus(struct pcib_secbus *bus, device_t child, int *rid,
749     rman_res_t start, rman_res_t end, rman_res_t count, u_int flags)
750 {
751 	struct resource *res;
752 	rman_res_t start_free, end_free, new_end;
753 
754 	/*
755 	 * First, see if the request can be satisified by the existing
756 	 * bus range.
757 	 */
758 	res = pcib_suballoc_bus(bus, child, rid, start, end, count, flags);
759 	if (res != NULL)
760 		return (res);
761 
762 	/*
763 	 * Figure out a range to grow the bus range.  First, find the
764 	 * first bus number after the last allocated bus in the rman and
765 	 * enforce that as a minimum starting point for the range.
766 	 */
767 	if (rman_last_free_region(&bus->rman, &start_free, &end_free) != 0 ||
768 	    end_free != bus->sub)
769 		start_free = bus->sub + 1;
770 	if (start_free < start)
771 		start_free = start;
772 	new_end = start_free + count - 1;
773 
774 	/*
775 	 * See if this new range would satisfy the request if it
776 	 * succeeds.
777 	 */
778 	if (new_end > end)
779 		return (NULL);
780 
781 	/* Finally, attempt to grow the existing resource. */
782 	if (bootverbose) {
783 		device_printf(bus->dev,
784 		    "attempting to grow bus range for %ju buses\n", count);
785 		printf("\tback candidate range: %ju-%ju\n", start_free,
786 		    new_end);
787 	}
788 	if (pcib_grow_subbus(bus, new_end) == 0)
789 		return (pcib_suballoc_bus(bus, child, rid, start, end, count,
790 		    flags));
791 	return (NULL);
792 }
793 
794 #ifdef PCI_HP
795 /*
796  * PCI-express HotPlug support.
797  */
798 static int pci_enable_pcie_hp = 1;
799 SYSCTL_INT(_hw_pci, OID_AUTO, enable_pcie_hp, CTLFLAG_RDTUN,
800     &pci_enable_pcie_hp, 0,
801     "Enable support for native PCI-express HotPlug.");
802 
803 TASKQUEUE_DEFINE_THREAD(pci_hp);
804 
805 static void
806 pcib_probe_hotplug(struct pcib_softc *sc)
807 {
808 	device_t dev;
809 	uint32_t link_cap;
810 	uint16_t link_sta, slot_sta;
811 
812 	if (!pci_enable_pcie_hp)
813 		return;
814 
815 	dev = sc->dev;
816 	if (pci_find_cap(dev, PCIY_EXPRESS, NULL) != 0)
817 		return;
818 
819 	if (!(pcie_read_config(dev, PCIER_FLAGS, 2) & PCIEM_FLAGS_SLOT))
820 		return;
821 
822 	sc->pcie_slot_cap = pcie_read_config(dev, PCIER_SLOT_CAP, 4);
823 
824 	if ((sc->pcie_slot_cap & PCIEM_SLOT_CAP_HPC) == 0)
825 		return;
826 	link_cap = pcie_read_config(dev, PCIER_LINK_CAP, 4);
827 	if ((link_cap & PCIEM_LINK_CAP_DL_ACTIVE) == 0)
828 		return;
829 
830 	/*
831 	 * Some devices report that they have an MRL when they actually
832 	 * do not.  Since they always report that the MRL is open, child
833 	 * devices would be ignored.  Try to detect these devices and
834 	 * ignore their claim of HotPlug support.
835 	 *
836 	 * If there is an open MRL but the Data Link Layer is active,
837 	 * the MRL is not real.
838 	 */
839 	if ((sc->pcie_slot_cap & PCIEM_SLOT_CAP_MRLSP) != 0) {
840 		link_sta = pcie_read_config(dev, PCIER_LINK_STA, 2);
841 		slot_sta = pcie_read_config(dev, PCIER_SLOT_STA, 2);
842 		if ((slot_sta & PCIEM_SLOT_STA_MRLSS) != 0 &&
843 		    (link_sta & PCIEM_LINK_STA_DL_ACTIVE) != 0) {
844 			return;
845 		}
846 	}
847 
848 	/*
849 	 * Now that we're sure we want to do hot plug, ask the
850 	 * firmware, if any, if that's OK.
851 	 */
852 	if (pcib_request_feature(dev, PCI_FEATURE_HP) != 0) {
853 		if (bootverbose)
854 			device_printf(dev, "Unable to activate hot plug feature.\n");
855 		return;
856 	}
857 
858 	sc->flags |= PCIB_HOTPLUG;
859 }
860 
861 /*
862  * Send a HotPlug command to the slot control register.  If this slot
863  * uses command completion interrupts and a previous command is still
864  * in progress, then the command is dropped.  Once the previous
865  * command completes or times out, pcib_pcie_hotplug_update() will be
866  * invoked to post a new command based on the slot's state at that
867  * time.
868  */
869 static void
870 pcib_pcie_hotplug_command(struct pcib_softc *sc, uint16_t val, uint16_t mask)
871 {
872 	device_t dev;
873 	uint16_t ctl, new;
874 
875 	dev = sc->dev;
876 
877 	if (sc->flags & PCIB_HOTPLUG_CMD_PENDING)
878 		return;
879 
880 	ctl = pcie_read_config(dev, PCIER_SLOT_CTL, 2);
881 	new = (ctl & ~mask) | val;
882 	if (new == ctl)
883 		return;
884 	if (bootverbose)
885 		device_printf(dev, "HotPlug command: %04x -> %04x\n", ctl, new);
886 	pcie_write_config(dev, PCIER_SLOT_CTL, new, 2);
887 	if (!(sc->pcie_slot_cap & PCIEM_SLOT_CAP_NCCS) &&
888 	    (ctl & new) & PCIEM_SLOT_CTL_CCIE) {
889 		sc->flags |= PCIB_HOTPLUG_CMD_PENDING;
890 		if (!cold)
891 			taskqueue_enqueue_timeout(taskqueue_pci_hp,
892 			    &sc->pcie_cc_task, hz);
893 	}
894 }
895 
896 static void
897 pcib_pcie_hotplug_command_completed(struct pcib_softc *sc)
898 {
899 	device_t dev;
900 
901 	dev = sc->dev;
902 
903 	if (bootverbose)
904 		device_printf(dev, "Command Completed\n");
905 	if (!(sc->flags & PCIB_HOTPLUG_CMD_PENDING))
906 		return;
907 	taskqueue_cancel_timeout(taskqueue_pci_hp, &sc->pcie_cc_task, NULL);
908 	sc->flags &= ~PCIB_HOTPLUG_CMD_PENDING;
909 	wakeup(sc);
910 }
911 
912 /*
913  * Returns true if a card is fully inserted from the user's
914  * perspective.  It may not yet be ready for access, but the driver
915  * can now start enabling access if necessary.
916  */
917 static bool
918 pcib_hotplug_inserted(struct pcib_softc *sc)
919 {
920 
921 	/* Pretend the card isn't present if a detach is forced. */
922 	if (sc->flags & PCIB_DETACHING)
923 		return (false);
924 
925 	/* Card must be present in the slot. */
926 	if ((sc->pcie_slot_sta & PCIEM_SLOT_STA_PDS) == 0)
927 		return (false);
928 
929 	/* A power fault implicitly turns off power to the slot. */
930 	if (sc->pcie_slot_sta & PCIEM_SLOT_STA_PFD)
931 		return (false);
932 
933 	/* If the MRL is disengaged, the slot is powered off. */
934 	if (sc->pcie_slot_cap & PCIEM_SLOT_CAP_MRLSP &&
935 	    (sc->pcie_slot_sta & PCIEM_SLOT_STA_MRLSS) != 0)
936 		return (false);
937 
938 	return (true);
939 }
940 
941 /*
942  * Returns -1 if the card is fully inserted, powered, and ready for
943  * access.  Otherwise, returns 0.
944  */
945 static int
946 pcib_hotplug_present(struct pcib_softc *sc)
947 {
948 
949 	/* Card must be inserted. */
950 	if (!pcib_hotplug_inserted(sc))
951 		return (0);
952 
953 	/* Require the Data Link Layer to be active. */
954 	if (!(sc->pcie_link_sta & PCIEM_LINK_STA_DL_ACTIVE))
955 		return (0);
956 
957 	return (-1);
958 }
959 
960 static int pci_enable_pcie_ei = 0;
961 SYSCTL_INT(_hw_pci, OID_AUTO, enable_pcie_ei, CTLFLAG_RWTUN,
962     &pci_enable_pcie_ei, 0,
963     "Enable support for PCI-express Electromechanical Interlock.");
964 
965 static void
966 pcib_pcie_hotplug_update(struct pcib_softc *sc, uint16_t val, uint16_t mask,
967     bool schedule_task)
968 {
969 	bool card_inserted, ei_engaged;
970 
971 	/* Clear DETACHING if Presence Detect has cleared. */
972 	if ((sc->pcie_slot_sta & (PCIEM_SLOT_STA_PDC | PCIEM_SLOT_STA_PDS)) ==
973 	    PCIEM_SLOT_STA_PDC)
974 		sc->flags &= ~PCIB_DETACHING;
975 
976 	card_inserted = pcib_hotplug_inserted(sc);
977 
978 	/* Turn the power indicator on if a card is inserted. */
979 	if (sc->pcie_slot_cap & PCIEM_SLOT_CAP_PIP) {
980 		mask |= PCIEM_SLOT_CTL_PIC;
981 		if (card_inserted)
982 			val |= PCIEM_SLOT_CTL_PI_ON;
983 		else if (sc->flags & PCIB_DETACH_PENDING)
984 			val |= PCIEM_SLOT_CTL_PI_BLINK;
985 		else
986 			val |= PCIEM_SLOT_CTL_PI_OFF;
987 	}
988 
989 	/* Turn the power on via the Power Controller if a card is inserted. */
990 	if (sc->pcie_slot_cap & PCIEM_SLOT_CAP_PCP) {
991 		mask |= PCIEM_SLOT_CTL_PCC;
992 		if (card_inserted)
993 			val |= PCIEM_SLOT_CTL_PC_ON;
994 		else
995 			val |= PCIEM_SLOT_CTL_PC_OFF;
996 	}
997 
998 	/*
999 	 * If a card is inserted, enable the Electromechanical
1000 	 * Interlock.  If a card is not inserted (or we are in the
1001 	 * process of detaching), disable the Electromechanical
1002 	 * Interlock.
1003 	 */
1004 	if ((sc->pcie_slot_cap & PCIEM_SLOT_CAP_EIP) &&
1005 	    pci_enable_pcie_ei) {
1006 		mask |= PCIEM_SLOT_CTL_EIC;
1007 		ei_engaged = (sc->pcie_slot_sta & PCIEM_SLOT_STA_EIS) != 0;
1008 		if (card_inserted != ei_engaged)
1009 			val |= PCIEM_SLOT_CTL_EIC;
1010 	}
1011 
1012 	/*
1013 	 * Start a timer to see if the Data Link Layer times out.
1014 	 * Note that we only start the timer if Presence Detect or MRL Sensor
1015 	 * changed on this interrupt.  Stop any scheduled timer if
1016 	 * the Data Link Layer is active.
1017 	 */
1018 	if (card_inserted &&
1019 	    !(sc->pcie_link_sta & PCIEM_LINK_STA_DL_ACTIVE) &&
1020 	    sc->pcie_slot_sta &
1021 	    (PCIEM_SLOT_STA_MRLSC | PCIEM_SLOT_STA_PDC)) {
1022 		if (cold)
1023 			device_printf(sc->dev,
1024 			    "Data Link Layer inactive\n");
1025 		else
1026 			taskqueue_enqueue_timeout(taskqueue_pci_hp,
1027 			    &sc->pcie_dll_task, hz);
1028 	} else if (sc->pcie_link_sta & PCIEM_LINK_STA_DL_ACTIVE)
1029 		taskqueue_cancel_timeout(taskqueue_pci_hp, &sc->pcie_dll_task,
1030 		    NULL);
1031 
1032 	pcib_pcie_hotplug_command(sc, val, mask);
1033 
1034 	/*
1035 	 * During attach the child "pci" device is added synchronously;
1036 	 * otherwise, the task is scheduled to manage the child
1037 	 * device.
1038 	 */
1039 	if (schedule_task &&
1040 	    (pcib_hotplug_present(sc) != 0) != (sc->child != NULL))
1041 		taskqueue_enqueue(taskqueue_pci_hp, &sc->pcie_hp_task);
1042 }
1043 
1044 static void
1045 pcib_pcie_intr_hotplug(void *arg)
1046 {
1047 	struct pcib_softc *sc;
1048 	device_t dev;
1049 	uint16_t old_slot_sta;
1050 
1051 	sc = arg;
1052 	dev = sc->dev;
1053 	PCIB_HP_LOCK(sc);
1054 	old_slot_sta = sc->pcie_slot_sta;
1055 	sc->pcie_slot_sta = pcie_read_config(dev, PCIER_SLOT_STA, 2);
1056 
1057 	/* Clear the events just reported. */
1058 	pcie_write_config(dev, PCIER_SLOT_STA, sc->pcie_slot_sta, 2);
1059 
1060 	if (bootverbose)
1061 		device_printf(dev, "HotPlug interrupt: %#x\n",
1062 		    sc->pcie_slot_sta);
1063 
1064 	if (sc->pcie_slot_sta & PCIEM_SLOT_STA_ABP) {
1065 		if (sc->flags & PCIB_DETACH_PENDING) {
1066 			device_printf(dev,
1067 			    "Attention Button Pressed: Detach Cancelled\n");
1068 			sc->flags &= ~PCIB_DETACH_PENDING;
1069 			taskqueue_cancel_timeout(taskqueue_pci_hp,
1070 			    &sc->pcie_ab_task, NULL);
1071 		} else if (old_slot_sta & PCIEM_SLOT_STA_PDS) {
1072 			/* Only initiate detach sequence if device present. */
1073 			device_printf(dev,
1074 		    "Attention Button Pressed: Detaching in 5 seconds\n");
1075 			sc->flags |= PCIB_DETACH_PENDING;
1076 			taskqueue_enqueue_timeout(taskqueue_pci_hp,
1077 			    &sc->pcie_ab_task, 5 * hz);
1078 		}
1079 	}
1080 	if (sc->pcie_slot_sta & PCIEM_SLOT_STA_PFD)
1081 		device_printf(dev, "Power Fault Detected\n");
1082 	if (sc->pcie_slot_sta & PCIEM_SLOT_STA_MRLSC)
1083 		device_printf(dev, "MRL Sensor Changed to %s\n",
1084 		    sc->pcie_slot_sta & PCIEM_SLOT_STA_MRLSS ? "open" :
1085 		    "closed");
1086 	if (bootverbose && sc->pcie_slot_sta & PCIEM_SLOT_STA_PDC)
1087 		device_printf(dev, "Presence Detect Changed to %s\n",
1088 		    sc->pcie_slot_sta & PCIEM_SLOT_STA_PDS ? "card present" :
1089 		    "empty");
1090 	if (sc->pcie_slot_sta & PCIEM_SLOT_STA_CC)
1091 		pcib_pcie_hotplug_command_completed(sc);
1092 	if (sc->pcie_slot_sta & PCIEM_SLOT_STA_DLLSC) {
1093 		sc->pcie_link_sta = pcie_read_config(dev, PCIER_LINK_STA, 2);
1094 		if (bootverbose)
1095 			device_printf(dev,
1096 			    "Data Link Layer State Changed to %s\n",
1097 			    sc->pcie_link_sta & PCIEM_LINK_STA_DL_ACTIVE ?
1098 			    "active" : "inactive");
1099 	}
1100 
1101 	pcib_pcie_hotplug_update(sc, 0, 0, true);
1102 	PCIB_HP_UNLOCK(sc);
1103 }
1104 
1105 static void
1106 pcib_pcie_hotplug_task(void *context, int pending)
1107 {
1108 	struct pcib_softc *sc;
1109 	device_t dev;
1110 
1111 	sc = context;
1112 	PCIB_HP_LOCK(sc);
1113 	dev = sc->dev;
1114 	if (pcib_hotplug_present(sc) != 0) {
1115 		if (sc->child == NULL) {
1116 			sc->child = device_add_child(dev, "pci", DEVICE_UNIT_ANY);
1117 			bus_generic_attach(dev);
1118 		}
1119 	} else {
1120 		if (sc->child != NULL) {
1121 			if (device_delete_child(dev, sc->child) == 0)
1122 				sc->child = NULL;
1123 		}
1124 	}
1125 	PCIB_HP_UNLOCK(sc);
1126 }
1127 
1128 static void
1129 pcib_pcie_ab_timeout(void *arg, int pending)
1130 {
1131 	struct pcib_softc *sc = arg;
1132 
1133 	PCIB_HP_LOCK(sc);
1134 	if (sc->flags & PCIB_DETACH_PENDING) {
1135 		sc->flags |= PCIB_DETACHING;
1136 		sc->flags &= ~PCIB_DETACH_PENDING;
1137 		pcib_pcie_hotplug_update(sc, 0, 0, true);
1138 	}
1139 	PCIB_HP_UNLOCK(sc);
1140 }
1141 
1142 static void
1143 pcib_pcie_cc_timeout(void *arg, int pending)
1144 {
1145 	struct pcib_softc *sc = arg;
1146 	device_t dev = sc->dev;
1147 	uint16_t sta;
1148 
1149 	PCIB_HP_LOCK(sc);
1150 	sta = pcie_read_config(dev, PCIER_SLOT_STA, 2);
1151 	if (!(sta & PCIEM_SLOT_STA_CC)) {
1152 		device_printf(dev, "HotPlug Command Timed Out\n");
1153 		sc->flags &= ~PCIB_HOTPLUG_CMD_PENDING;
1154 	} else {
1155 		device_printf(dev,
1156 	    "Missed HotPlug interrupt waiting for Command Completion\n");
1157 		pcib_pcie_intr_hotplug(sc);
1158 	}
1159 	PCIB_HP_UNLOCK(sc);
1160 }
1161 
1162 static void
1163 pcib_pcie_dll_timeout(void *arg, int pending)
1164 {
1165 	struct pcib_softc *sc = arg;
1166 	device_t dev = sc->dev;
1167 	uint16_t sta;
1168 
1169 	PCIB_HP_LOCK(sc);
1170 	sta = pcie_read_config(dev, PCIER_LINK_STA, 2);
1171 	if (!(sta & PCIEM_LINK_STA_DL_ACTIVE)) {
1172 		device_printf(dev,
1173 		    "Timed out waiting for Data Link Layer Active\n");
1174 		sc->flags |= PCIB_DETACHING;
1175 		pcib_pcie_hotplug_update(sc, 0, 0, true);
1176 	} else if (sta != sc->pcie_link_sta) {
1177 		device_printf(dev,
1178 		    "Missed HotPlug interrupt waiting for DLL Active\n");
1179 		pcib_pcie_intr_hotplug(sc);
1180 	}
1181 	PCIB_HP_UNLOCK(sc);
1182 }
1183 
1184 static int
1185 pcib_alloc_pcie_irq(struct pcib_softc *sc)
1186 {
1187 	device_t dev;
1188 	int count, error, mem_rid, rid;
1189 
1190 	rid = -1;
1191 	dev = sc->dev;
1192 
1193 	/*
1194 	 * For simplicity, only use MSI-X if there is a single message.
1195 	 * To support a device with multiple messages we would have to
1196 	 * use remap intr if the MSI number is not 0.
1197 	 */
1198 	count = pci_msix_count(dev);
1199 	if (count == 1) {
1200 		mem_rid = pci_msix_table_bar(dev);
1201 		sc->pcie_mem = bus_alloc_resource_any(dev, SYS_RES_MEMORY,
1202 		    &mem_rid, RF_ACTIVE);
1203 		if (sc->pcie_mem == NULL) {
1204 			device_printf(dev,
1205 			    "Failed to allocate BAR for MSI-X table\n");
1206 		} else {
1207 			error = pci_alloc_msix(dev, &count);
1208 			if (error == 0)
1209 				rid = 1;
1210 		}
1211 	}
1212 
1213 	if (rid < 0 && pci_msi_count(dev) > 0) {
1214 		count = 1;
1215 		error = pci_alloc_msi(dev, &count);
1216 		if (error == 0)
1217 			rid = 1;
1218 	}
1219 
1220 	if (rid < 0)
1221 		rid = 0;
1222 
1223 	sc->pcie_irq = bus_alloc_resource_any(dev, SYS_RES_IRQ, &rid,
1224 	    RF_ACTIVE | RF_SHAREABLE);
1225 	if (sc->pcie_irq == NULL) {
1226 		device_printf(dev,
1227 		    "Failed to allocate interrupt for PCI-e events\n");
1228 		if (rid > 0)
1229 			pci_release_msi(dev);
1230 		return (ENXIO);
1231 	}
1232 
1233 	error = bus_setup_intr(dev, sc->pcie_irq, INTR_TYPE_MISC|INTR_MPSAFE,
1234 	    NULL, pcib_pcie_intr_hotplug, sc, &sc->pcie_ihand);
1235 	if (error) {
1236 		device_printf(dev, "Failed to setup PCI-e interrupt handler\n");
1237 		bus_release_resource(dev, SYS_RES_IRQ, rid, sc->pcie_irq);
1238 		if (rid > 0)
1239 			pci_release_msi(dev);
1240 		return (error);
1241 	}
1242 	return (0);
1243 }
1244 
1245 static int
1246 pcib_release_pcie_irq(struct pcib_softc *sc)
1247 {
1248 	device_t dev;
1249 	int error;
1250 
1251 	dev = sc->dev;
1252 	error = bus_teardown_intr(dev, sc->pcie_irq, sc->pcie_ihand);
1253 	if (error)
1254 		return (error);
1255 	error = bus_free_resource(dev, SYS_RES_IRQ, sc->pcie_irq);
1256 	if (error)
1257 		return (error);
1258 	error = pci_release_msi(dev);
1259 	if (error)
1260 		return (error);
1261 	if (sc->pcie_mem != NULL)
1262 		error = bus_free_resource(dev, SYS_RES_MEMORY, sc->pcie_mem);
1263 	return (error);
1264 }
1265 
1266 static void
1267 pcib_setup_hotplug(struct pcib_softc *sc)
1268 {
1269 	device_t dev;
1270 	uint16_t mask, val;
1271 
1272 	dev = sc->dev;
1273 	TASK_INIT(&sc->pcie_hp_task, 0, pcib_pcie_hotplug_task, sc);
1274 	TIMEOUT_TASK_INIT(taskqueue_pci_hp, &sc->pcie_ab_task, 0,
1275 	    pcib_pcie_ab_timeout, sc);
1276 	TIMEOUT_TASK_INIT(taskqueue_pci_hp, &sc->pcie_cc_task, 0,
1277 	    pcib_pcie_cc_timeout, sc);
1278 	TIMEOUT_TASK_INIT(taskqueue_pci_hp, &sc->pcie_dll_task, 0,
1279 	    pcib_pcie_dll_timeout, sc);
1280 	sc->pcie_hp_lock = bus_topo_mtx();
1281 
1282 	/* Allocate IRQ. */
1283 	if (pcib_alloc_pcie_irq(sc) != 0)
1284 		return;
1285 
1286 	sc->pcie_link_sta = pcie_read_config(dev, PCIER_LINK_STA, 2);
1287 	sc->pcie_slot_sta = pcie_read_config(dev, PCIER_SLOT_STA, 2);
1288 
1289 	/* Clear any events previously pending. */
1290 	pcie_write_config(dev, PCIER_SLOT_STA, sc->pcie_slot_sta, 2);
1291 
1292 	/* Enable HotPlug events. */
1293 	mask = PCIEM_SLOT_CTL_DLLSCE | PCIEM_SLOT_CTL_HPIE |
1294 	    PCIEM_SLOT_CTL_CCIE | PCIEM_SLOT_CTL_PDCE | PCIEM_SLOT_CTL_MRLSCE |
1295 	    PCIEM_SLOT_CTL_PFDE | PCIEM_SLOT_CTL_ABPE;
1296 	val = PCIEM_SLOT_CTL_DLLSCE | PCIEM_SLOT_CTL_HPIE | PCIEM_SLOT_CTL_PDCE;
1297 	if (sc->pcie_slot_cap & PCIEM_SLOT_CAP_APB)
1298 		val |= PCIEM_SLOT_CTL_ABPE;
1299 	if (sc->pcie_slot_cap & PCIEM_SLOT_CAP_PCP)
1300 		val |= PCIEM_SLOT_CTL_PFDE;
1301 	if (sc->pcie_slot_cap & PCIEM_SLOT_CAP_MRLSP)
1302 		val |= PCIEM_SLOT_CTL_MRLSCE;
1303 	if (!(sc->pcie_slot_cap & PCIEM_SLOT_CAP_NCCS))
1304 		val |= PCIEM_SLOT_CTL_CCIE;
1305 
1306 	/* Turn the attention indicator off. */
1307 	if (sc->pcie_slot_cap & PCIEM_SLOT_CAP_AIP) {
1308 		mask |= PCIEM_SLOT_CTL_AIC;
1309 		val |= PCIEM_SLOT_CTL_AI_OFF;
1310 	}
1311 
1312 	pcib_pcie_hotplug_update(sc, val, mask, false);
1313 }
1314 
1315 static int
1316 pcib_detach_hotplug(struct pcib_softc *sc)
1317 {
1318 	uint16_t mask, val;
1319 	int error;
1320 
1321 	/* Disable the card in the slot and force it to detach. */
1322 	if (sc->flags & PCIB_DETACH_PENDING) {
1323 		sc->flags &= ~PCIB_DETACH_PENDING;
1324 		taskqueue_cancel_timeout(taskqueue_pci_hp, &sc->pcie_ab_task,
1325 		    NULL);
1326 	}
1327 	sc->flags |= PCIB_DETACHING;
1328 
1329 	if (sc->flags & PCIB_HOTPLUG_CMD_PENDING) {
1330 		taskqueue_cancel_timeout(taskqueue_pci_hp, &sc->pcie_cc_task,
1331 		    NULL);
1332 		tsleep(sc, 0, "hpcmd", hz);
1333 		sc->flags &= ~PCIB_HOTPLUG_CMD_PENDING;
1334 	}
1335 
1336 	/* Disable HotPlug events. */
1337 	mask = PCIEM_SLOT_CTL_DLLSCE | PCIEM_SLOT_CTL_HPIE |
1338 	    PCIEM_SLOT_CTL_CCIE | PCIEM_SLOT_CTL_PDCE | PCIEM_SLOT_CTL_MRLSCE |
1339 	    PCIEM_SLOT_CTL_PFDE | PCIEM_SLOT_CTL_ABPE;
1340 	val = 0;
1341 
1342 	/* Turn the attention indicator off. */
1343 	if (sc->pcie_slot_cap & PCIEM_SLOT_CAP_AIP) {
1344 		mask |= PCIEM_SLOT_CTL_AIC;
1345 		val |= PCIEM_SLOT_CTL_AI_OFF;
1346 	}
1347 
1348 	pcib_pcie_hotplug_update(sc, val, mask, false);
1349 
1350 	error = pcib_release_pcie_irq(sc);
1351 	if (error)
1352 		return (error);
1353 	taskqueue_drain(taskqueue_pci_hp, &sc->pcie_hp_task);
1354 	taskqueue_drain_timeout(taskqueue_pci_hp, &sc->pcie_ab_task);
1355 	taskqueue_drain_timeout(taskqueue_pci_hp, &sc->pcie_cc_task);
1356 	taskqueue_drain_timeout(taskqueue_pci_hp, &sc->pcie_dll_task);
1357 	return (0);
1358 }
1359 #endif
1360 
1361 /*
1362  * Restore previous bridge configuration.
1363  */
1364 static void
1365 pcib_cfg_restore(struct pcib_softc *sc)
1366 {
1367 	pcib_write_windows(sc, WIN_IO | WIN_MEM | WIN_PMEM);
1368 }
1369 
1370 /*
1371  * Generic device interface
1372  */
1373 static int
1374 pcib_probe(device_t dev)
1375 {
1376     if ((pci_get_class(dev) == PCIC_BRIDGE) &&
1377 	(pci_get_subclass(dev) == PCIS_BRIDGE_PCI)) {
1378 	device_set_desc(dev, "PCI-PCI bridge");
1379 	return(-10000);
1380     }
1381     return(ENXIO);
1382 }
1383 
1384 void
1385 pcib_attach_common(device_t dev)
1386 {
1387     struct pcib_softc	*sc;
1388     struct sysctl_ctx_list *sctx;
1389     struct sysctl_oid	*soid;
1390     int comma;
1391 
1392     sc = device_get_softc(dev);
1393     sc->dev = dev;
1394 
1395     /*
1396      * Get current bridge configuration.
1397      */
1398     sc->domain = pci_get_domain(dev);
1399     sc->bridgectl = pci_read_config(dev, PCIR_BRIDGECTL_1, 2);
1400 
1401     /*
1402      * The primary bus register should always be the bus of the
1403      * parent.
1404      */
1405     sc->pribus = pci_get_bus(dev);
1406     pci_write_config(dev, PCIR_PRIBUS_1, sc->pribus, 1);
1407 
1408     /*
1409      * Setup sysctl reporting nodes
1410      */
1411     sctx = device_get_sysctl_ctx(dev);
1412     soid = device_get_sysctl_tree(dev);
1413     SYSCTL_ADD_UINT(sctx, SYSCTL_CHILDREN(soid), OID_AUTO, "domain",
1414       CTLFLAG_RD, &sc->domain, 0, "Domain number");
1415     SYSCTL_ADD_UINT(sctx, SYSCTL_CHILDREN(soid), OID_AUTO, "pribus",
1416       CTLFLAG_RD, &sc->pribus, 0, "Primary bus number");
1417     SYSCTL_ADD_UINT(sctx, SYSCTL_CHILDREN(soid), OID_AUTO, "secbus",
1418       CTLFLAG_RD, &sc->bus.sec, 0, "Secondary bus number");
1419     SYSCTL_ADD_UINT(sctx, SYSCTL_CHILDREN(soid), OID_AUTO, "subbus",
1420       CTLFLAG_RD, &sc->bus.sub, 0, "Subordinate bus number");
1421 
1422     /*
1423      * Quirk handling.
1424      */
1425     switch (pci_get_devid(dev)) {
1426     /*
1427      * The i82380FB mobile docking controller is a PCI-PCI bridge,
1428      * and it is a subtractive bridge.  However, the ProgIf is wrong
1429      * so the normal setting of PCIB_SUBTRACTIVE bit doesn't
1430      * happen.  There are also Toshiba and Cavium ThunderX bridges
1431      * that behave this way.
1432      */
1433     case 0xa002177d:		/* Cavium ThunderX */
1434     case 0x124b8086:		/* Intel 82380FB Mobile */
1435     case 0x060513d7:		/* Toshiba ???? */
1436 	sc->flags |= PCIB_SUBTRACTIVE;
1437 	break;
1438     }
1439 
1440     if (pci_msi_device_blacklisted(dev))
1441 	sc->flags |= PCIB_DISABLE_MSI;
1442 
1443     if (pci_msix_device_blacklisted(dev))
1444 	sc->flags |= PCIB_DISABLE_MSIX;
1445 
1446     /*
1447      * Intel 815, 845 and other chipsets say they are PCI-PCI bridges,
1448      * but have a ProgIF of 0x80.  The 82801 family (AA, AB, BAM/CAM,
1449      * BA/CA/DB and E) PCI bridges are HUB-PCI bridges, in Intelese.
1450      * This means they act as if they were subtractively decoding
1451      * bridges and pass all transactions.  Mark them and real ProgIf 1
1452      * parts as subtractive.
1453      */
1454     if ((pci_get_devid(dev) & 0xff00ffff) == 0x24008086 ||
1455       pci_read_config(dev, PCIR_PROGIF, 1) == PCIP_BRIDGE_PCI_SUBTRACTIVE)
1456 	sc->flags |= PCIB_SUBTRACTIVE;
1457 
1458 #ifdef PCI_HP
1459     pcib_probe_hotplug(sc);
1460 #endif
1461     pcib_setup_secbus(dev, &sc->bus, 1);
1462     pcib_probe_windows(sc);
1463 #ifdef PCI_HP
1464     if (sc->flags & PCIB_HOTPLUG)
1465 	    pcib_setup_hotplug(sc);
1466 #endif
1467     if (bootverbose) {
1468 	device_printf(dev, "  domain            %d\n", sc->domain);
1469 	device_printf(dev, "  secondary bus     %d\n", sc->bus.sec);
1470 	device_printf(dev, "  subordinate bus   %d\n", sc->bus.sub);
1471 	if (pcib_is_window_open(&sc->io))
1472 	    device_printf(dev, "  I/O decode        0x%jx-0x%jx\n",
1473 	      (uintmax_t)sc->io.base, (uintmax_t)sc->io.limit);
1474 	if (pcib_is_window_open(&sc->mem))
1475 	    device_printf(dev, "  memory decode     0x%jx-0x%jx\n",
1476 	      (uintmax_t)sc->mem.base, (uintmax_t)sc->mem.limit);
1477 	if (pcib_is_window_open(&sc->pmem))
1478 	    device_printf(dev, "  prefetched decode 0x%jx-0x%jx\n",
1479 	      (uintmax_t)sc->pmem.base, (uintmax_t)sc->pmem.limit);
1480 	if (sc->bridgectl & (PCIB_BCR_ISA_ENABLE | PCIB_BCR_VGA_ENABLE) ||
1481 	    sc->flags & PCIB_SUBTRACTIVE) {
1482 		device_printf(dev, "  special decode    ");
1483 		comma = 0;
1484 		if (sc->bridgectl & PCIB_BCR_ISA_ENABLE) {
1485 			printf("ISA");
1486 			comma = 1;
1487 		}
1488 		if (sc->bridgectl & PCIB_BCR_VGA_ENABLE) {
1489 			printf("%sVGA", comma ? ", " : "");
1490 			comma = 1;
1491 		}
1492 		if (sc->flags & PCIB_SUBTRACTIVE)
1493 			printf("%ssubtractive", comma ? ", " : "");
1494 		printf("\n");
1495 	}
1496     }
1497 
1498     /*
1499      * Always enable busmastering on bridges so that transactions
1500      * initiated on the secondary bus are passed through to the
1501      * primary bus.
1502      */
1503     pci_enable_busmaster(dev);
1504 }
1505 
1506 #ifdef PCI_HP
1507 static int
1508 pcib_present(struct pcib_softc *sc)
1509 {
1510 
1511 	if (sc->flags & PCIB_HOTPLUG)
1512 		return (pcib_hotplug_present(sc) != 0);
1513 	return (1);
1514 }
1515 #endif
1516 
1517 int
1518 pcib_attach_child(device_t dev)
1519 {
1520 	struct pcib_softc *sc;
1521 
1522 	sc = device_get_softc(dev);
1523 	if (sc->bus.sec == 0) {
1524 		/* no secondary bus; we should have fixed this */
1525 		return(0);
1526 	}
1527 
1528 #ifdef PCI_HP
1529 	if (!pcib_present(sc)) {
1530 		/* An empty HotPlug slot, so don't add a PCI bus yet. */
1531 		return (0);
1532 	}
1533 #endif
1534 
1535 	sc->child = device_add_child(dev, "pci", DEVICE_UNIT_ANY);
1536 	return (bus_generic_attach(dev));
1537 }
1538 
1539 int
1540 pcib_attach(device_t dev)
1541 {
1542 
1543     pcib_attach_common(dev);
1544     return (pcib_attach_child(dev));
1545 }
1546 
1547 int
1548 pcib_detach(device_t dev)
1549 {
1550 	struct pcib_softc *sc;
1551 	int error;
1552 
1553 	sc = device_get_softc(dev);
1554 	error = bus_generic_detach(dev);
1555 	if (error)
1556 		return (error);
1557 #ifdef PCI_HP
1558 	if (sc->flags & PCIB_HOTPLUG) {
1559 		error = pcib_detach_hotplug(sc);
1560 		if (error)
1561 			return (error);
1562 	}
1563 #endif
1564 	error = device_delete_children(dev);
1565 	if (error)
1566 		return (error);
1567 	pcib_free_windows(sc);
1568 	pcib_free_secbus(dev, &sc->bus);
1569 	return (0);
1570 }
1571 
1572 int
1573 pcib_resume(device_t dev)
1574 {
1575 
1576 	pcib_cfg_restore(device_get_softc(dev));
1577 
1578 	/*
1579 	 * Restore the Command register only after restoring the windows.
1580 	 * The bridge should not be claiming random windows.
1581 	 */
1582 	pci_write_config(dev, PCIR_COMMAND, pci_get_cmdreg(dev), 2);
1583 	return (bus_generic_resume(dev));
1584 }
1585 
1586 void
1587 pcib_bridge_init(device_t dev)
1588 {
1589 	pci_write_config(dev, PCIR_IOBASEL_1, 0xff, 1);
1590 	pci_write_config(dev, PCIR_IOBASEH_1, 0xffff, 2);
1591 	pci_write_config(dev, PCIR_IOLIMITL_1, 0, 1);
1592 	pci_write_config(dev, PCIR_IOLIMITH_1, 0, 2);
1593 	pci_write_config(dev, PCIR_MEMBASE_1, 0xffff, 2);
1594 	pci_write_config(dev, PCIR_MEMLIMIT_1, 0, 2);
1595 	pci_write_config(dev, PCIR_PMBASEL_1, 0xffff, 2);
1596 	pci_write_config(dev, PCIR_PMBASEH_1, 0xffffffff, 4);
1597 	pci_write_config(dev, PCIR_PMLIMITL_1, 0, 2);
1598 	pci_write_config(dev, PCIR_PMLIMITH_1, 0, 4);
1599 }
1600 
1601 int
1602 pcib_child_present(device_t dev, device_t child)
1603 {
1604 #ifdef PCI_HP
1605 	struct pcib_softc *sc = device_get_softc(dev);
1606 	int retval;
1607 
1608 	retval = bus_child_present(dev);
1609 	if (retval != 0 && sc->flags & PCIB_HOTPLUG)
1610 		retval = pcib_hotplug_present(sc);
1611 	return (retval);
1612 #else
1613 	return (bus_child_present(dev));
1614 #endif
1615 }
1616 
1617 int
1618 pcib_read_ivar(device_t dev, device_t child, int which, uintptr_t *result)
1619 {
1620     struct pcib_softc	*sc = device_get_softc(dev);
1621 
1622     switch (which) {
1623     case PCIB_IVAR_DOMAIN:
1624 	*result = sc->domain;
1625 	return(0);
1626     case PCIB_IVAR_BUS:
1627 	*result = sc->bus.sec;
1628 	return(0);
1629     }
1630     return(ENOENT);
1631 }
1632 
1633 int
1634 pcib_write_ivar(device_t dev, device_t child, int which, uintptr_t value)
1635 {
1636 
1637     switch (which) {
1638     case PCIB_IVAR_DOMAIN:
1639 	return(EINVAL);
1640     case PCIB_IVAR_BUS:
1641 	return(EINVAL);
1642     }
1643     return(ENOENT);
1644 }
1645 
1646 /*
1647  * Attempt to allocate a resource from the existing resources assigned
1648  * to a window.
1649  */
1650 static struct resource *
1651 pcib_suballoc_resource(struct pcib_softc *sc, struct pcib_window *w,
1652     device_t child, int type, int *rid, rman_res_t start, rman_res_t end,
1653     rman_res_t count, u_int flags)
1654 {
1655 	struct resource *res;
1656 
1657 	if (!pcib_is_window_open(w))
1658 		return (NULL);
1659 
1660 	res = rman_reserve_resource(&w->rman, start, end, count,
1661 	    flags & ~RF_ACTIVE, child);
1662 	if (res == NULL)
1663 		return (NULL);
1664 
1665 	if (bootverbose)
1666 		device_printf(sc->dev,
1667 		    "allocated %s range (%#jx-%#jx) for rid %x of %s\n",
1668 		    w->name, rman_get_start(res), rman_get_end(res), *rid,
1669 		    pcib_child_name(child));
1670 	rman_set_rid(res, *rid);
1671 	rman_set_type(res, type);
1672 
1673 	if (flags & RF_ACTIVE) {
1674 		if (bus_activate_resource(child, type, *rid, res) != 0) {
1675 			rman_release_resource(res);
1676 			return (NULL);
1677 		}
1678 	}
1679 
1680 	return (res);
1681 }
1682 
1683 /* Allocate a fresh resource range for an unconfigured window. */
1684 static int
1685 pcib_alloc_new_window(struct pcib_softc *sc, struct pcib_window *w, int type,
1686     rman_res_t start, rman_res_t end, rman_res_t count, u_int flags)
1687 {
1688 	struct resource *res;
1689 	rman_res_t base, limit, wmask;
1690 	int rid;
1691 
1692 	/*
1693 	 * If this is an I/O window on a bridge with ISA enable set
1694 	 * and the start address is below 64k, then try to allocate an
1695 	 * initial window of 0x1000 bytes long starting at address
1696 	 * 0xf000 and walking down.  Note that if the original request
1697 	 * was larger than the non-aliased range size of 0x100 our
1698 	 * caller would have raised the start address up to 64k
1699 	 * already.
1700 	 */
1701 	if (type == SYS_RES_IOPORT && sc->bridgectl & PCIB_BCR_ISA_ENABLE &&
1702 	    start < 65536) {
1703 		for (base = 0xf000; (long)base >= 0; base -= 0x1000) {
1704 			limit = base + 0xfff;
1705 
1706 			/*
1707 			 * Skip ranges that wouldn't work for the
1708 			 * original request.  Note that the actual
1709 			 * window that overlaps are the non-alias
1710 			 * ranges within [base, limit], so this isn't
1711 			 * quite a simple comparison.
1712 			 */
1713 			if (start + count > limit - 0x400)
1714 				continue;
1715 			if (base == 0) {
1716 				/*
1717 				 * The first open region for the window at
1718 				 * 0 is 0x400-0x4ff.
1719 				 */
1720 				if (end - count + 1 < 0x400)
1721 					continue;
1722 			} else {
1723 				if (end - count + 1 < base)
1724 					continue;
1725 			}
1726 
1727 			if (pcib_alloc_nonisa_ranges(sc, base, limit) == 0) {
1728 				w->base = base;
1729 				w->limit = limit;
1730 				return (0);
1731 			}
1732 		}
1733 		return (ENOSPC);
1734 	}
1735 
1736 	wmask = ((rman_res_t)1 << w->step) - 1;
1737 	if (RF_ALIGNMENT(flags) < w->step) {
1738 		flags &= ~RF_ALIGNMENT_MASK;
1739 		flags |= RF_ALIGNMENT_LOG2(w->step);
1740 	}
1741 	start &= ~wmask;
1742 	end |= wmask;
1743 	count = roundup2(count, (rman_res_t)1 << w->step);
1744 	rid = w->reg;
1745 	res = bus_alloc_resource(sc->dev, type, &rid, start, end, count,
1746 	    flags | RF_ACTIVE | RF_UNMAPPED);
1747 	if (res == NULL)
1748 		return (ENOSPC);
1749 	pcib_add_window_resources(w, &res, 1);
1750 	pcib_activate_window(sc, type);
1751 	w->base = rman_get_start(res);
1752 	w->limit = rman_get_end(res);
1753 	return (0);
1754 }
1755 
1756 /* Try to expand an existing window to the requested base and limit. */
1757 static int
1758 pcib_expand_window(struct pcib_softc *sc, struct pcib_window *w, int type,
1759     rman_res_t base, rman_res_t limit)
1760 {
1761 	struct resource *res;
1762 	int error, i, force_64k_base;
1763 
1764 	KASSERT(base <= w->base && limit >= w->limit,
1765 	    ("attempting to shrink window"));
1766 
1767 	/*
1768 	 * XXX: pcib_grow_window() doesn't try to do this anyway and
1769 	 * the error handling for all the edge cases would be tedious.
1770 	 */
1771 	KASSERT(limit == w->limit || base == w->base,
1772 	    ("attempting to grow both ends of a window"));
1773 
1774 	/*
1775 	 * Yet more special handling for requests to expand an I/O
1776 	 * window behind an ISA-enabled bridge.  Since I/O windows
1777 	 * have to grow in 0x1000 increments and the end of the 0xffff
1778 	 * range is an alias, growing a window below 64k will always
1779 	 * result in allocating new resources and never adjusting an
1780 	 * existing resource.
1781 	 */
1782 	if (type == SYS_RES_IOPORT && sc->bridgectl & PCIB_BCR_ISA_ENABLE &&
1783 	    (limit <= 65535 || (base <= 65535 && base != w->base))) {
1784 		KASSERT(limit == w->limit || limit <= 65535,
1785 		    ("attempting to grow both ends across 64k ISA alias"));
1786 
1787 		if (base != w->base)
1788 			error = pcib_alloc_nonisa_ranges(sc, base, w->base - 1);
1789 		else
1790 			error = pcib_alloc_nonisa_ranges(sc, w->limit + 1,
1791 			    limit);
1792 		if (error == 0) {
1793 			w->base = base;
1794 			w->limit = limit;
1795 		}
1796 		return (error);
1797 	}
1798 
1799 	/*
1800 	 * Find the existing resource to adjust.  Usually there is only one,
1801 	 * but for an ISA-enabled bridge we might be growing the I/O window
1802 	 * above 64k and need to find the existing resource that maps all
1803 	 * of the area above 64k.
1804 	 */
1805 	for (i = 0; i < w->count; i++) {
1806 		if (rman_get_end(w->res[i]) == w->limit)
1807 			break;
1808 	}
1809 	KASSERT(i != w->count, ("did not find existing resource"));
1810 	res = w->res[i];
1811 
1812 	/*
1813 	 * Usually the resource we found should match the window's
1814 	 * existing range.  The one exception is the ISA-enabled case
1815 	 * mentioned above in which case the resource should start at
1816 	 * 64k.
1817 	 */
1818 	if (type == SYS_RES_IOPORT && sc->bridgectl & PCIB_BCR_ISA_ENABLE &&
1819 	    w->base <= 65535) {
1820 		KASSERT(rman_get_start(res) == 65536,
1821 		    ("existing resource mismatch"));
1822 		force_64k_base = 1;
1823 	} else {
1824 		KASSERT(w->base == rman_get_start(res),
1825 		    ("existing resource mismatch"));
1826 		force_64k_base = 0;
1827 	}
1828 
1829 	error = bus_adjust_resource(sc->dev, type, res, force_64k_base ?
1830 	    rman_get_start(res) : base, limit);
1831 	if (error)
1832 		return (error);
1833 
1834 	/* Add the newly allocated region to the resource manager. */
1835 	if (w->base != base) {
1836 		error = rman_manage_region(&w->rman, base, w->base - 1);
1837 		w->base = base;
1838 	} else {
1839 		error = rman_manage_region(&w->rman, w->limit + 1, limit);
1840 		w->limit = limit;
1841 	}
1842 	if (error) {
1843 		if (bootverbose)
1844 			device_printf(sc->dev,
1845 			    "failed to expand %s resource manager\n", w->name);
1846 		(void)bus_adjust_resource(sc->dev, type, res, force_64k_base ?
1847 		    rman_get_start(res) : w->base, w->limit);
1848 	}
1849 	return (error);
1850 }
1851 
1852 /*
1853  * Attempt to grow a window to make room for a given resource request.
1854  */
1855 static int
1856 pcib_grow_window(struct pcib_softc *sc, struct pcib_window *w, int type,
1857     rman_res_t start, rman_res_t end, rman_res_t count, u_int flags)
1858 {
1859 	rman_res_t align, start_free, end_free, front, back, wmask;
1860 	int error;
1861 
1862 	/*
1863 	 * Clamp the desired resource range to the maximum address
1864 	 * this window supports.  Reject impossible requests.
1865 	 *
1866 	 * For I/O port requests behind a bridge with the ISA enable
1867 	 * bit set, force large allocations to start above 64k.
1868 	 */
1869 	if (!w->valid)
1870 		return (EINVAL);
1871 	if (sc->bridgectl & PCIB_BCR_ISA_ENABLE && count > 0x100 &&
1872 	    start < 65536)
1873 		start = 65536;
1874 	if (end > w->rman.rm_end)
1875 		end = w->rman.rm_end;
1876 	if (start + count - 1 > end || start + count < start)
1877 		return (EINVAL);
1878 	wmask = ((rman_res_t)1 << w->step) - 1;
1879 
1880 	/*
1881 	 * If there is no resource at all, just try to allocate enough
1882 	 * aligned space for this resource.
1883 	 */
1884 	if (w->res == NULL) {
1885 		error = pcib_alloc_new_window(sc, w, type, start, end, count,
1886 		    flags);
1887 		if (error) {
1888 			if (bootverbose)
1889 				device_printf(sc->dev,
1890 		    "failed to allocate initial %s window (%#jx-%#jx,%#jx)\n",
1891 				    w->name, start, end, count);
1892 			return (error);
1893 		}
1894 		if (bootverbose)
1895 			device_printf(sc->dev,
1896 			    "allocated initial %s window of %#jx-%#jx\n",
1897 			    w->name, (uintmax_t)w->base, (uintmax_t)w->limit);
1898 		goto updatewin;
1899 	}
1900 
1901 	/*
1902 	 * See if growing the window would help.  Compute the minimum
1903 	 * amount of address space needed on both the front and back
1904 	 * ends of the existing window to satisfy the allocation.
1905 	 *
1906 	 * For each end, build a candidate region adjusting for the
1907 	 * required alignment, etc.  If there is a free region at the
1908 	 * edge of the window, grow from the inner edge of the free
1909 	 * region.  Otherwise grow from the window boundary.
1910 	 *
1911 	 * Growing an I/O window below 64k for a bridge with the ISA
1912 	 * enable bit doesn't require any special magic as the step
1913 	 * size of an I/O window (1k) always includes multiple
1914 	 * non-alias ranges when it is grown in either direction.
1915 	 *
1916 	 * XXX: Special case: if w->res is completely empty and the
1917 	 * request size is larger than w->res, we should find the
1918 	 * optimal aligned buffer containing w->res and allocate that.
1919 	 */
1920 	if (bootverbose)
1921 		device_printf(sc->dev,
1922 		    "attempting to grow %s window for (%#jx-%#jx,%#jx)\n",
1923 		    w->name, start, end, count);
1924 	align = (rman_res_t)1 << RF_ALIGNMENT(flags);
1925 	if (start < w->base) {
1926 		if (rman_first_free_region(&w->rman, &start_free, &end_free) !=
1927 		    0 || start_free != w->base)
1928 			end_free = w->base;
1929 		if (end_free > end)
1930 			end_free = end + 1;
1931 
1932 		/* Move end_free down until it is properly aligned. */
1933 		end_free &= ~(align - 1);
1934 		end_free--;
1935 		front = end_free - (count - 1);
1936 
1937 		/*
1938 		 * The resource would now be allocated at (front,
1939 		 * end_free).  Ensure that fits in the (start, end)
1940 		 * bounds.  end_free is checked above.  If 'front' is
1941 		 * ok, ensure it is properly aligned for this window.
1942 		 * Also check for underflow.
1943 		 */
1944 		if (front >= start && front <= end_free) {
1945 			if (bootverbose)
1946 				printf("\tfront candidate range: %#jx-%#jx\n",
1947 				    front, end_free);
1948 			front &= ~wmask;
1949 			front = w->base - front;
1950 		} else
1951 			front = 0;
1952 	} else
1953 		front = 0;
1954 	if (end > w->limit) {
1955 		if (rman_last_free_region(&w->rman, &start_free, &end_free) !=
1956 		    0 || end_free != w->limit)
1957 			start_free = w->limit + 1;
1958 		if (start_free < start)
1959 			start_free = start;
1960 
1961 		/* Move start_free up until it is properly aligned. */
1962 		start_free = roundup2(start_free, align);
1963 		back = start_free + count - 1;
1964 
1965 		/*
1966 		 * The resource would now be allocated at (start_free,
1967 		 * back).  Ensure that fits in the (start, end)
1968 		 * bounds.  start_free is checked above.  If 'back' is
1969 		 * ok, ensure it is properly aligned for this window.
1970 		 * Also check for overflow.
1971 		 */
1972 		if (back <= end && start_free <= back) {
1973 			if (bootverbose)
1974 				printf("\tback candidate range: %#jx-%#jx\n",
1975 				    start_free, back);
1976 			back |= wmask;
1977 			back -= w->limit;
1978 		} else
1979 			back = 0;
1980 	} else
1981 		back = 0;
1982 
1983 	/*
1984 	 * Try to allocate the smallest needed region first.
1985 	 * If that fails, fall back to the other region.
1986 	 */
1987 	error = ENOSPC;
1988 	while (front != 0 || back != 0) {
1989 		if (front != 0 && (front <= back || back == 0)) {
1990 			error = pcib_expand_window(sc, w, type, w->base - front,
1991 			    w->limit);
1992 			if (error == 0)
1993 				break;
1994 			front = 0;
1995 		} else {
1996 			error = pcib_expand_window(sc, w, type, w->base,
1997 			    w->limit + back);
1998 			if (error == 0)
1999 				break;
2000 			back = 0;
2001 		}
2002 	}
2003 
2004 	if (error)
2005 		return (error);
2006 	if (bootverbose)
2007 		device_printf(sc->dev, "grew %s window to %#jx-%#jx\n",
2008 		    w->name, (uintmax_t)w->base, (uintmax_t)w->limit);
2009 
2010 updatewin:
2011 	/* Write the new window. */
2012 	KASSERT((w->base & wmask) == 0, ("start address is not aligned"));
2013 	KASSERT((w->limit & wmask) == wmask, ("end address is not aligned"));
2014 	pcib_write_windows(sc, w->mask);
2015 	return (0);
2016 }
2017 
2018 /*
2019  * We have to trap resource allocation requests and ensure that the bridge
2020  * is set up to, or capable of handling them.
2021  */
2022 static struct resource *
2023 pcib_alloc_resource(device_t dev, device_t child, int type, int *rid,
2024     rman_res_t start, rman_res_t end, rman_res_t count, u_int flags)
2025 {
2026 	struct pcib_softc *sc;
2027 	struct resource *r;
2028 
2029 	sc = device_get_softc(dev);
2030 
2031 	/*
2032 	 * VGA resources are decoded iff the VGA enable bit is set in
2033 	 * the bridge control register.  VGA resources do not fall into
2034 	 * the resource windows and are passed up to the parent.
2035 	 */
2036 	if ((type == SYS_RES_IOPORT && pci_is_vga_ioport_range(start, end)) ||
2037 	    (type == SYS_RES_MEMORY && pci_is_vga_memory_range(start, end))) {
2038 		if (sc->bridgectl & PCIB_BCR_VGA_ENABLE)
2039 			return (bus_generic_alloc_resource(dev, child, type,
2040 			    rid, start, end, count, flags));
2041 		else
2042 			return (NULL);
2043 	}
2044 
2045 	switch (type) {
2046 	case PCI_RES_BUS:
2047 		return (pcib_alloc_subbus(&sc->bus, child, rid, start, end,
2048 		    count, flags));
2049 	case SYS_RES_IOPORT:
2050 		if (pcib_is_isa_range(sc, start, end, count))
2051 			return (NULL);
2052 		r = pcib_suballoc_resource(sc, &sc->io, child, type, rid, start,
2053 		    end, count, flags);
2054 		if (r != NULL || (sc->flags & PCIB_SUBTRACTIVE) != 0)
2055 			break;
2056 		if (pcib_grow_window(sc, &sc->io, type, start, end, count,
2057 		    flags) == 0)
2058 			r = pcib_suballoc_resource(sc, &sc->io, child, type,
2059 			    rid, start, end, count, flags);
2060 		break;
2061 	case SYS_RES_MEMORY:
2062 		/*
2063 		 * For prefetchable resources, prefer the prefetchable
2064 		 * memory window, but fall back to the regular memory
2065 		 * window if that fails.  Try both windows before
2066 		 * attempting to grow a window in case the firmware
2067 		 * has used a range in the regular memory window to
2068 		 * map a prefetchable BAR.
2069 		 */
2070 		if (flags & RF_PREFETCHABLE) {
2071 			r = pcib_suballoc_resource(sc, &sc->pmem, child, type,
2072 			    rid, start, end, count, flags);
2073 			if (r != NULL)
2074 				break;
2075 		}
2076 		r = pcib_suballoc_resource(sc, &sc->mem, child, type, rid,
2077 		    start, end, count, flags);
2078 		if (r != NULL || (sc->flags & PCIB_SUBTRACTIVE) != 0)
2079 			break;
2080 		if (flags & RF_PREFETCHABLE) {
2081 			if (pcib_grow_window(sc, &sc->pmem, type, start, end,
2082 			    count, flags) == 0) {
2083 				r = pcib_suballoc_resource(sc, &sc->pmem, child,
2084 				    type, rid, start, end, count, flags);
2085 				if (r != NULL)
2086 					break;
2087 			}
2088 		}
2089 		if (pcib_grow_window(sc, &sc->mem, type, start, end, count,
2090 		    flags & ~RF_PREFETCHABLE) == 0)
2091 			r = pcib_suballoc_resource(sc, &sc->mem, child, type,
2092 			    rid, start, end, count, flags);
2093 		break;
2094 	default:
2095 		return (bus_generic_alloc_resource(dev, child, type, rid,
2096 		    start, end, count, flags));
2097 	}
2098 
2099 	/*
2100 	 * If attempts to suballocate from the window fail but this is a
2101 	 * subtractive bridge, pass the request up the tree.
2102 	 */
2103 	if (sc->flags & PCIB_SUBTRACTIVE && r == NULL)
2104 		return (bus_generic_alloc_resource(dev, child, type, rid,
2105 		    start, end, count, flags));
2106 	return (r);
2107 }
2108 
2109 static int
2110 pcib_adjust_resource(device_t bus, device_t child, struct resource *r,
2111     rman_res_t start, rman_res_t end)
2112 {
2113 	struct pcib_softc *sc;
2114 	struct pcib_window *w;
2115 	rman_res_t wmask;
2116 	int error, type;
2117 
2118 	sc = device_get_softc(bus);
2119 	type = rman_get_type(r);
2120 
2121 	/*
2122 	 * If the resource wasn't sub-allocated from one of our region
2123 	 * managers then just pass the request up.
2124 	 */
2125 	if (!pcib_is_resource_managed(sc, r))
2126 		return (bus_generic_adjust_resource(bus, child, r, start, end));
2127 
2128 	if (type == PCI_RES_BUS) {
2129 		/*
2130 		 * If our bus range isn't big enough to grow the sub-allocation
2131 		 * then we need to grow our bus range. Any request that would
2132 		 * require us to decrease the start of our own bus range is
2133 		 * invalid, we can only extend the end; ignore such requests
2134 		 * and let rman_adjust_resource fail below.
2135 		 */
2136 		if (start >= sc->bus.sec && end > sc->bus.sub) {
2137 			error = pcib_grow_subbus(&sc->bus, end);
2138 			if (error != 0)
2139 				return (error);
2140 		}
2141 	} else {
2142 		/*
2143 		 * Resource is managed and not a secondary bus number, must
2144 		 * be from one of our windows.
2145 		 */
2146 		w = pcib_get_resource_window(sc, r);
2147 		KASSERT(w != NULL,
2148 		    ("%s: no window for resource (%#jx-%#jx) type %d",
2149 		    __func__, rman_get_start(r), rman_get_end(r), type));
2150 
2151 		/*
2152 		 * If our window isn't big enough to grow the sub-allocation
2153 		 * then we need to expand the window.
2154 		 */
2155 		if (start < w->base || end > w->limit) {
2156 			wmask = ((rman_res_t)1 << w->step) - 1;
2157 			error = pcib_expand_window(sc, w, type,
2158 			    MIN(start & ~wmask, w->base),
2159 			    MAX(end | wmask, w->limit));
2160 			if (error != 0)
2161 				return (error);
2162 			if (bootverbose)
2163 				device_printf(sc->dev,
2164 				    "grew %s window to %#jx-%#jx\n",
2165 				    w->name, (uintmax_t)w->base,
2166 				    (uintmax_t)w->limit);
2167 			pcib_write_windows(sc, w->mask);
2168 		}
2169 	}
2170 
2171 	return (rman_adjust_resource(r, start, end));
2172 }
2173 
2174 static int
2175 pcib_release_resource(device_t dev, device_t child, struct resource *r)
2176 {
2177 	struct pcib_softc *sc;
2178 	int error;
2179 
2180 	sc = device_get_softc(dev);
2181 	if (pcib_is_resource_managed(sc, r)) {
2182 		if (rman_get_flags(r) & RF_ACTIVE) {
2183 			error = bus_deactivate_resource(child, r);
2184 			if (error)
2185 				return (error);
2186 		}
2187 		return (rman_release_resource(r));
2188 	}
2189 	return (bus_generic_release_resource(dev, child, r));
2190 }
2191 
2192 static int
2193 pcib_activate_resource(device_t dev, device_t child, struct resource *r)
2194 {
2195 	struct pcib_softc *sc = device_get_softc(dev);
2196 	struct resource_map map;
2197 	int error, type;
2198 
2199 	if (!pcib_is_resource_managed(sc, r))
2200 		return (bus_generic_activate_resource(dev, child, r));
2201 
2202 	error = rman_activate_resource(r);
2203 	if (error != 0)
2204 		return (error);
2205 
2206 	type = rman_get_type(r);
2207 	if ((rman_get_flags(r) & RF_UNMAPPED) == 0 &&
2208 	    (type == SYS_RES_MEMORY || type == SYS_RES_IOPORT)) {
2209 		error = BUS_MAP_RESOURCE(dev, child, r, NULL, &map);
2210 		if (error != 0) {
2211 			rman_deactivate_resource(r);
2212 			return (error);
2213 		}
2214 
2215 		rman_set_mapping(r, &map);
2216 	}
2217 	return (0);
2218 }
2219 
2220 static int
2221 pcib_deactivate_resource(device_t dev, device_t child, struct resource *r)
2222 {
2223 	struct pcib_softc *sc = device_get_softc(dev);
2224 	struct resource_map map;
2225 	int error, type;
2226 
2227 	if (!pcib_is_resource_managed(sc, r))
2228 		return (bus_generic_deactivate_resource(dev, child, r));
2229 
2230 	error = rman_deactivate_resource(r);
2231 	if (error != 0)
2232 		return (error);
2233 
2234 	type = rman_get_type(r);
2235 	if ((rman_get_flags(r) & RF_UNMAPPED) == 0 &&
2236 	    (type == SYS_RES_MEMORY || type == SYS_RES_IOPORT)) {
2237 		rman_get_mapping(r, &map);
2238 		BUS_UNMAP_RESOURCE(dev, child, r, &map);
2239 	}
2240 	return (0);
2241 }
2242 
2243 static struct resource *
2244 pcib_find_parent_resource(struct pcib_window *w, struct resource *r)
2245 {
2246 	for (int i = 0; i < w->count; i++) {
2247 		if (rman_get_start(w->res[i]) <= rman_get_start(r) &&
2248 		    rman_get_end(w->res[i]) >= rman_get_end(r))
2249 			return (w->res[i]);
2250 	}
2251 	return (NULL);
2252 }
2253 
2254 static int
2255 pcib_map_resource(device_t dev, device_t child, struct resource *r,
2256     struct resource_map_request *argsp, struct resource_map *map)
2257 {
2258 	struct pcib_softc *sc = device_get_softc(dev);
2259 	struct resource_map_request args;
2260 	struct pcib_window *w;
2261 	struct resource *pres;
2262 	rman_res_t length, start;
2263 	int error;
2264 
2265 	w = pcib_get_resource_window(sc, r);
2266 	if (w == NULL)
2267 		return (bus_generic_map_resource(dev, child, r, argsp, map));
2268 
2269 	/* Resources must be active to be mapped. */
2270 	if (!(rman_get_flags(r) & RF_ACTIVE))
2271 		return (ENXIO);
2272 
2273 	resource_init_map_request(&args);
2274 	error = resource_validate_map_request(r, argsp, &args, &start, &length);
2275 	if (error)
2276 		return (error);
2277 
2278 	pres = pcib_find_parent_resource(w, r);
2279 	if (pres == NULL)
2280 		return (ENOENT);
2281 
2282 	args.offset = start - rman_get_start(pres);
2283 	args.length = length;
2284 	return (bus_map_resource(dev, pres, &args, map));
2285 }
2286 
2287 static int
2288 pcib_unmap_resource(device_t dev, device_t child, struct resource *r,
2289     struct resource_map *map)
2290 {
2291 	struct pcib_softc *sc = device_get_softc(dev);
2292 	struct pcib_window *w;
2293 	struct resource *pres;
2294 
2295 	w = pcib_get_resource_window(sc, r);
2296 	if (w == NULL)
2297 		return (bus_generic_unmap_resource(dev, child, r, map));
2298 
2299 	pres = pcib_find_parent_resource(w, r);
2300 	if (pres == NULL)
2301 		return (ENOENT);
2302 	return (bus_unmap_resource(dev, pres, map));
2303 }
2304 
2305 /*
2306  * If ARI is enabled on this downstream port, translate the function number
2307  * to the non-ARI slot/function.  The downstream port will convert it back in
2308  * hardware.  If ARI is not enabled slot and func are not modified.
2309  */
2310 static __inline void
2311 pcib_xlate_ari(device_t pcib, int bus, int *slot, int *func)
2312 {
2313 	struct pcib_softc *sc;
2314 	int ari_func;
2315 
2316 	sc = device_get_softc(pcib);
2317 	ari_func = *func;
2318 
2319 	if (sc->flags & PCIB_ENABLE_ARI) {
2320 		KASSERT(*slot == 0,
2321 		    ("Non-zero slot number with ARI enabled!"));
2322 		*slot = PCIE_ARI_SLOT(ari_func);
2323 		*func = PCIE_ARI_FUNC(ari_func);
2324 	}
2325 }
2326 
2327 static void
2328 pcib_enable_ari(struct pcib_softc *sc, uint32_t pcie_pos)
2329 {
2330 	uint32_t ctl2;
2331 
2332 	ctl2 = pci_read_config(sc->dev, pcie_pos + PCIER_DEVICE_CTL2, 4);
2333 	ctl2 |= PCIEM_CTL2_ARI;
2334 	pci_write_config(sc->dev, pcie_pos + PCIER_DEVICE_CTL2, ctl2, 4);
2335 
2336 	sc->flags |= PCIB_ENABLE_ARI;
2337 }
2338 
2339 /*
2340  * PCIB interface.
2341  */
2342 int
2343 pcib_maxslots(device_t dev)
2344 {
2345 #if !defined(__amd64__) && !defined(__i386__)
2346 	uint32_t pcie_pos;
2347 	uint16_t val;
2348 
2349 	/*
2350 	 * If this is a PCIe rootport or downstream switch port, there's only
2351 	 * one slot permitted.
2352 	 */
2353 	if (pci_find_cap(dev, PCIY_EXPRESS, &pcie_pos) == 0) {
2354 		val = pci_read_config(dev, pcie_pos + PCIER_FLAGS, 2);
2355 		val &= PCIEM_FLAGS_TYPE;
2356 		if (val == PCIEM_TYPE_ROOT_PORT ||
2357 		    val == PCIEM_TYPE_DOWNSTREAM_PORT)
2358 			return (0);
2359 	}
2360 #endif
2361 	return (PCI_SLOTMAX);
2362 }
2363 
2364 static int
2365 pcib_ari_maxslots(device_t dev)
2366 {
2367 	struct pcib_softc *sc;
2368 
2369 	sc = device_get_softc(dev);
2370 
2371 	if (sc->flags & PCIB_ENABLE_ARI)
2372 		return (PCIE_ARI_SLOTMAX);
2373 	else
2374 		return (pcib_maxslots(dev));
2375 }
2376 
2377 static int
2378 pcib_ari_maxfuncs(device_t dev)
2379 {
2380 	struct pcib_softc *sc;
2381 
2382 	sc = device_get_softc(dev);
2383 
2384 	if (sc->flags & PCIB_ENABLE_ARI)
2385 		return (PCIE_ARI_FUNCMAX);
2386 	else
2387 		return (PCI_FUNCMAX);
2388 }
2389 
2390 static void
2391 pcib_ari_decode_rid(device_t pcib, uint16_t rid, int *bus, int *slot,
2392     int *func)
2393 {
2394 	struct pcib_softc *sc;
2395 
2396 	sc = device_get_softc(pcib);
2397 
2398 	*bus = PCI_RID2BUS(rid);
2399 	if (sc->flags & PCIB_ENABLE_ARI) {
2400 		*slot = PCIE_ARI_RID2SLOT(rid);
2401 		*func = PCIE_ARI_RID2FUNC(rid);
2402 	} else {
2403 		*slot = PCI_RID2SLOT(rid);
2404 		*func = PCI_RID2FUNC(rid);
2405 	}
2406 }
2407 
2408 /*
2409  * Since we are a child of a PCI bus, its parent must support the pcib interface.
2410  */
2411 static uint32_t
2412 pcib_read_config(device_t dev, u_int b, u_int s, u_int f, u_int reg, int width)
2413 {
2414 #ifdef PCI_HP
2415 	struct pcib_softc *sc;
2416 
2417 	sc = device_get_softc(dev);
2418 	if (!pcib_present(sc)) {
2419 		switch (width) {
2420 		case 2:
2421 			return (0xffff);
2422 		case 1:
2423 			return (0xff);
2424 		default:
2425 			return (0xffffffff);
2426 		}
2427 	}
2428 #endif
2429 	pcib_xlate_ari(dev, b, &s, &f);
2430 	return(PCIB_READ_CONFIG(device_get_parent(device_get_parent(dev)), b, s,
2431 	    f, reg, width));
2432 }
2433 
2434 static void
2435 pcib_write_config(device_t dev, u_int b, u_int s, u_int f, u_int reg, uint32_t val, int width)
2436 {
2437 #ifdef PCI_HP
2438 	struct pcib_softc *sc;
2439 
2440 	sc = device_get_softc(dev);
2441 	if (!pcib_present(sc))
2442 		return;
2443 #endif
2444 	pcib_xlate_ari(dev, b, &s, &f);
2445 	PCIB_WRITE_CONFIG(device_get_parent(device_get_parent(dev)), b, s, f,
2446 	    reg, val, width);
2447 }
2448 
2449 /*
2450  * Route an interrupt across a PCI bridge.
2451  */
2452 int
2453 pcib_route_interrupt(device_t pcib, device_t dev, int pin)
2454 {
2455     device_t	bus;
2456     int		parent_intpin;
2457     int		intnum;
2458 
2459     /*
2460      *
2461      * The PCI standard defines a swizzle of the child-side device/intpin to
2462      * the parent-side intpin as follows.
2463      *
2464      * device = device on child bus
2465      * child_intpin = intpin on child bus slot (0-3)
2466      * parent_intpin = intpin on parent bus slot (0-3)
2467      *
2468      * parent_intpin = (device + child_intpin) % 4
2469      */
2470     parent_intpin = (pci_get_slot(dev) + (pin - 1)) % 4;
2471 
2472     /*
2473      * Our parent is a PCI bus.  Its parent must export the pcib interface
2474      * which includes the ability to route interrupts.
2475      */
2476     bus = device_get_parent(pcib);
2477     intnum = PCIB_ROUTE_INTERRUPT(device_get_parent(bus), pcib, parent_intpin + 1);
2478     if (PCI_INTERRUPT_VALID(intnum) && bootverbose) {
2479 	device_printf(pcib, "slot %d INT%c is routed to irq %d\n",
2480 	    pci_get_slot(dev), 'A' + pin - 1, intnum);
2481     }
2482     return(intnum);
2483 }
2484 
2485 /* Pass request to alloc MSI/MSI-X messages up to the parent bridge. */
2486 int
2487 pcib_alloc_msi(device_t pcib, device_t dev, int count, int maxcount, int *irqs)
2488 {
2489 	struct pcib_softc *sc = device_get_softc(pcib);
2490 	device_t bus;
2491 
2492 	if (sc->flags & PCIB_DISABLE_MSI)
2493 		return (ENXIO);
2494 	bus = device_get_parent(pcib);
2495 	return (PCIB_ALLOC_MSI(device_get_parent(bus), dev, count, maxcount,
2496 	    irqs));
2497 }
2498 
2499 /* Pass request to release MSI/MSI-X messages up to the parent bridge. */
2500 int
2501 pcib_release_msi(device_t pcib, device_t dev, int count, int *irqs)
2502 {
2503 	device_t bus;
2504 
2505 	bus = device_get_parent(pcib);
2506 	return (PCIB_RELEASE_MSI(device_get_parent(bus), dev, count, irqs));
2507 }
2508 
2509 /* Pass request to alloc an MSI-X message up to the parent bridge. */
2510 int
2511 pcib_alloc_msix(device_t pcib, device_t dev, int *irq)
2512 {
2513 	struct pcib_softc *sc = device_get_softc(pcib);
2514 	device_t bus;
2515 
2516 	if (sc->flags & PCIB_DISABLE_MSIX)
2517 		return (ENXIO);
2518 	bus = device_get_parent(pcib);
2519 	return (PCIB_ALLOC_MSIX(device_get_parent(bus), dev, irq));
2520 }
2521 
2522 /* Pass request to release an MSI-X message up to the parent bridge. */
2523 int
2524 pcib_release_msix(device_t pcib, device_t dev, int irq)
2525 {
2526 	device_t bus;
2527 
2528 	bus = device_get_parent(pcib);
2529 	return (PCIB_RELEASE_MSIX(device_get_parent(bus), dev, irq));
2530 }
2531 
2532 /* Pass request to map MSI/MSI-X message up to parent bridge. */
2533 int
2534 pcib_map_msi(device_t pcib, device_t dev, int irq, uint64_t *addr,
2535     uint32_t *data)
2536 {
2537 	device_t bus;
2538 	int error;
2539 
2540 	bus = device_get_parent(pcib);
2541 	error = PCIB_MAP_MSI(device_get_parent(bus), dev, irq, addr, data);
2542 	if (error)
2543 		return (error);
2544 
2545 	pci_ht_map_msi(pcib, *addr);
2546 	return (0);
2547 }
2548 
2549 /* Pass request for device power state up to parent bridge. */
2550 int
2551 pcib_power_for_sleep(device_t pcib, device_t dev, int *pstate)
2552 {
2553 	device_t bus;
2554 
2555 	bus = device_get_parent(pcib);
2556 	return (PCIB_POWER_FOR_SLEEP(bus, dev, pstate));
2557 }
2558 
2559 static int
2560 pcib_ari_enabled(device_t pcib)
2561 {
2562 	struct pcib_softc *sc;
2563 
2564 	sc = device_get_softc(pcib);
2565 
2566 	return ((sc->flags & PCIB_ENABLE_ARI) != 0);
2567 }
2568 
2569 static int
2570 pcib_ari_get_id(device_t pcib, device_t dev, enum pci_id_type type,
2571     uintptr_t *id)
2572 {
2573 	struct pcib_softc *sc;
2574 	device_t bus_dev;
2575 	uint8_t bus, slot, func;
2576 
2577 	if (type != PCI_ID_RID) {
2578 		bus_dev = device_get_parent(pcib);
2579 		return (PCIB_GET_ID(device_get_parent(bus_dev), dev, type, id));
2580 	}
2581 
2582 	sc = device_get_softc(pcib);
2583 
2584 	if (sc->flags & PCIB_ENABLE_ARI) {
2585 		bus = pci_get_bus(dev);
2586 		func = pci_get_function(dev);
2587 
2588 		*id = (PCI_ARI_RID(bus, func));
2589 	} else {
2590 		bus = pci_get_bus(dev);
2591 		slot = pci_get_slot(dev);
2592 		func = pci_get_function(dev);
2593 
2594 		*id = (PCI_RID(bus, slot, func));
2595 	}
2596 
2597 	return (0);
2598 }
2599 
2600 /*
2601  * Check that the downstream port (pcib) and the endpoint device (dev) both
2602  * support ARI.  If so, enable it and return 0, otherwise return an error.
2603  */
2604 static int
2605 pcib_try_enable_ari(device_t pcib, device_t dev)
2606 {
2607 	struct pcib_softc *sc;
2608 	int error;
2609 	uint32_t cap2;
2610 	int ari_cap_off;
2611 	uint32_t ari_ver;
2612 	uint32_t pcie_pos;
2613 
2614 	sc = device_get_softc(pcib);
2615 
2616 	/*
2617 	 * ARI is controlled in a register in the PCIe capability structure.
2618 	 * If the downstream port does not have the PCIe capability structure
2619 	 * then it does not support ARI.
2620 	 */
2621 	error = pci_find_cap(pcib, PCIY_EXPRESS, &pcie_pos);
2622 	if (error != 0)
2623 		return (ENODEV);
2624 
2625 	/* Check that the PCIe port advertises ARI support. */
2626 	cap2 = pci_read_config(pcib, pcie_pos + PCIER_DEVICE_CAP2, 4);
2627 	if (!(cap2 & PCIEM_CAP2_ARI))
2628 		return (ENODEV);
2629 
2630 	/*
2631 	 * Check that the endpoint device advertises ARI support via the ARI
2632 	 * extended capability structure.
2633 	 */
2634 	error = pci_find_extcap(dev, PCIZ_ARI, &ari_cap_off);
2635 	if (error != 0)
2636 		return (ENODEV);
2637 
2638 	/*
2639 	 * Finally, check that the endpoint device supports the same version
2640 	 * of ARI that we do.
2641 	 */
2642 	ari_ver = pci_read_config(dev, ari_cap_off, 4);
2643 	if (PCI_EXTCAP_VER(ari_ver) != PCIB_SUPPORTED_ARI_VER) {
2644 		if (bootverbose)
2645 			device_printf(pcib,
2646 			    "Unsupported version of ARI (%d) detected\n",
2647 			    PCI_EXTCAP_VER(ari_ver));
2648 
2649 		return (ENXIO);
2650 	}
2651 
2652 	pcib_enable_ari(sc, pcie_pos);
2653 
2654 	return (0);
2655 }
2656 
2657 int
2658 pcib_request_feature_allow(device_t pcib, device_t dev,
2659     enum pci_feature feature)
2660 {
2661 	/*
2662 	 * No host firmware we have to negotiate with, so we allow
2663 	 * every valid feature requested.
2664 	 */
2665 	switch (feature) {
2666 	case PCI_FEATURE_AER:
2667 	case PCI_FEATURE_HP:
2668 		break;
2669 	default:
2670 		return (EINVAL);
2671 	}
2672 
2673 	return (0);
2674 }
2675 
2676 int
2677 pcib_request_feature(device_t dev, enum pci_feature feature)
2678 {
2679 
2680 	/*
2681 	 * Invoke PCIB_REQUEST_FEATURE of this bridge first in case
2682 	 * the firmware overrides the method of PCI-PCI bridges.
2683 	 */
2684 	return (PCIB_REQUEST_FEATURE(dev, dev, feature));
2685 }
2686 
2687 /*
2688  * Pass the request to use this PCI feature up the tree. Either there's a
2689  * firmware like ACPI that's using this feature that will approve (or deny) the
2690  * request to take it over, or the platform has no such firmware, in which case
2691  * the request will be approved. If the request is approved, the OS is expected
2692  * to make use of the feature or render it harmless.
2693  */
2694 static int
2695 pcib_request_feature_default(device_t pcib, device_t dev,
2696     enum pci_feature feature)
2697 {
2698 	device_t bus;
2699 
2700 	/*
2701 	 * Our parent is necessarily a pci bus. Its parent will either be
2702 	 * another pci bridge (which passes it up) or a host bridge that can
2703 	 * approve or reject the request.
2704 	 */
2705 	bus = device_get_parent(pcib);
2706 	return (PCIB_REQUEST_FEATURE(device_get_parent(bus), dev, feature));
2707 }
2708 
2709 static int
2710 pcib_reset_child(device_t dev, device_t child, int flags)
2711 {
2712 	struct pci_devinfo *pdinfo;
2713 	int error;
2714 
2715 	error = 0;
2716 	if (dev == NULL || device_get_parent(child) != dev)
2717 		goto out;
2718 	error = ENXIO;
2719 	if (device_get_devclass(child) != devclass_find("pci"))
2720 		goto out;
2721 	pdinfo = device_get_ivars(dev);
2722 	if (pdinfo->cfg.pcie.pcie_location != 0 &&
2723 	    (pdinfo->cfg.pcie.pcie_type == PCIEM_TYPE_DOWNSTREAM_PORT ||
2724 	    pdinfo->cfg.pcie.pcie_type == PCIEM_TYPE_ROOT_PORT)) {
2725 		error = bus_helper_reset_prepare(child, flags);
2726 		if (error == 0) {
2727 			error = pcie_link_reset(dev,
2728 			    pdinfo->cfg.pcie.pcie_location);
2729 			/* XXXKIB call _post even if error != 0 ? */
2730 			bus_helper_reset_post(child, flags);
2731 		}
2732 	}
2733 out:
2734 	return (error);
2735 }
2736