xref: /freebsd/sys/dev/cxgb/cxgb_main.c (revision 7e00348e7605b9906601438008341ffc37c00e2c)
1 /**************************************************************************
2 
3 Copyright (c) 2007-2009, Chelsio Inc.
4 All rights reserved.
5 
6 Redistribution and use in source and binary forms, with or without
7 modification, are permitted provided that the following conditions are met:
8 
9  1. Redistributions of source code must retain the above copyright notice,
10     this list of conditions and the following disclaimer.
11 
12  2. Neither the name of the Chelsio Corporation nor the names of its
13     contributors may be used to endorse or promote products derived from
14     this software without specific prior written permission.
15 
16 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
17 AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18 IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19 ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
20 LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
21 CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
22 SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
23 INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
24 CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
25 ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
26 POSSIBILITY OF SUCH DAMAGE.
27 
28 ***************************************************************************/
29 
30 #include <sys/cdefs.h>
31 __FBSDID("$FreeBSD$");
32 
33 #include "opt_inet.h"
34 
35 #include <sys/param.h>
36 #include <sys/systm.h>
37 #include <sys/kernel.h>
38 #include <sys/bus.h>
39 #include <sys/module.h>
40 #include <sys/pciio.h>
41 #include <sys/conf.h>
42 #include <machine/bus.h>
43 #include <machine/resource.h>
44 #include <sys/bus_dma.h>
45 #include <sys/ktr.h>
46 #include <sys/rman.h>
47 #include <sys/ioccom.h>
48 #include <sys/mbuf.h>
49 #include <sys/linker.h>
50 #include <sys/firmware.h>
51 #include <sys/socket.h>
52 #include <sys/sockio.h>
53 #include <sys/smp.h>
54 #include <sys/sysctl.h>
55 #include <sys/syslog.h>
56 #include <sys/queue.h>
57 #include <sys/taskqueue.h>
58 #include <sys/proc.h>
59 
60 #include <net/bpf.h>
61 #include <net/ethernet.h>
62 #include <net/if.h>
63 #include <net/if_var.h>
64 #include <net/if_arp.h>
65 #include <net/if_dl.h>
66 #include <net/if_media.h>
67 #include <net/if_types.h>
68 #include <net/if_vlan_var.h>
69 
70 #include <netinet/in_systm.h>
71 #include <netinet/in.h>
72 #include <netinet/if_ether.h>
73 #include <netinet/ip.h>
74 #include <netinet/ip.h>
75 #include <netinet/tcp.h>
76 #include <netinet/udp.h>
77 
78 #include <dev/pci/pcireg.h>
79 #include <dev/pci/pcivar.h>
80 #include <dev/pci/pci_private.h>
81 
82 #include <cxgb_include.h>
83 
84 #ifdef PRIV_SUPPORTED
85 #include <sys/priv.h>
86 #endif
87 
88 static int cxgb_setup_interrupts(adapter_t *);
89 static void cxgb_teardown_interrupts(adapter_t *);
90 static void cxgb_init(void *);
91 static int cxgb_init_locked(struct port_info *);
92 static int cxgb_uninit_locked(struct port_info *);
93 static int cxgb_uninit_synchronized(struct port_info *);
94 static int cxgb_ioctl(struct ifnet *, unsigned long, caddr_t);
95 static int cxgb_media_change(struct ifnet *);
96 static int cxgb_ifm_type(int);
97 static void cxgb_build_medialist(struct port_info *);
98 static void cxgb_media_status(struct ifnet *, struct ifmediareq *);
99 static uint64_t cxgb_get_counter(struct ifnet *, ift_counter);
100 static int setup_sge_qsets(adapter_t *);
101 static void cxgb_async_intr(void *);
102 static void cxgb_tick_handler(void *, int);
103 static void cxgb_tick(void *);
104 static void link_check_callout(void *);
105 static void check_link_status(void *, int);
106 static void setup_rss(adapter_t *sc);
107 static int alloc_filters(struct adapter *);
108 static int setup_hw_filters(struct adapter *);
109 static int set_filter(struct adapter *, int, const struct filter_info *);
110 static inline void mk_set_tcb_field(struct cpl_set_tcb_field *, unsigned int,
111     unsigned int, u64, u64);
112 static inline void set_tcb_field_ulp(struct cpl_set_tcb_field *, unsigned int,
113     unsigned int, u64, u64);
114 #ifdef TCP_OFFLOAD
115 static int cpl_not_handled(struct sge_qset *, struct rsp_desc *, struct mbuf *);
116 #endif
117 
118 /* Attachment glue for the PCI controller end of the device.  Each port of
119  * the device is attached separately, as defined later.
120  */
121 static int cxgb_controller_probe(device_t);
122 static int cxgb_controller_attach(device_t);
123 static int cxgb_controller_detach(device_t);
124 static void cxgb_free(struct adapter *);
125 static __inline void reg_block_dump(struct adapter *ap, uint8_t *buf, unsigned int start,
126     unsigned int end);
127 static void cxgb_get_regs(adapter_t *sc, struct ch_ifconf_regs *regs, uint8_t *buf);
128 static int cxgb_get_regs_len(void);
129 static void touch_bars(device_t dev);
130 static void cxgb_update_mac_settings(struct port_info *p);
131 #ifdef TCP_OFFLOAD
132 static int toe_capability(struct port_info *, int);
133 #endif
134 
135 static device_method_t cxgb_controller_methods[] = {
136 	DEVMETHOD(device_probe,		cxgb_controller_probe),
137 	DEVMETHOD(device_attach,	cxgb_controller_attach),
138 	DEVMETHOD(device_detach,	cxgb_controller_detach),
139 
140 	DEVMETHOD_END
141 };
142 
143 static driver_t cxgb_controller_driver = {
144 	"cxgbc",
145 	cxgb_controller_methods,
146 	sizeof(struct adapter)
147 };
148 
149 static int cxgbc_mod_event(module_t, int, void *);
150 static devclass_t	cxgb_controller_devclass;
151 DRIVER_MODULE(cxgbc, pci, cxgb_controller_driver, cxgb_controller_devclass,
152     cxgbc_mod_event, 0);
153 MODULE_VERSION(cxgbc, 1);
154 MODULE_DEPEND(cxgbc, firmware, 1, 1, 1);
155 
156 /*
157  * Attachment glue for the ports.  Attachment is done directly to the
158  * controller device.
159  */
160 static int cxgb_port_probe(device_t);
161 static int cxgb_port_attach(device_t);
162 static int cxgb_port_detach(device_t);
163 
164 static device_method_t cxgb_port_methods[] = {
165 	DEVMETHOD(device_probe,		cxgb_port_probe),
166 	DEVMETHOD(device_attach,	cxgb_port_attach),
167 	DEVMETHOD(device_detach,	cxgb_port_detach),
168 	{ 0, 0 }
169 };
170 
171 static driver_t cxgb_port_driver = {
172 	"cxgb",
173 	cxgb_port_methods,
174 	0
175 };
176 
177 static d_ioctl_t cxgb_extension_ioctl;
178 static d_open_t cxgb_extension_open;
179 static d_close_t cxgb_extension_close;
180 
181 static struct cdevsw cxgb_cdevsw = {
182        .d_version =    D_VERSION,
183        .d_flags =      0,
184        .d_open =       cxgb_extension_open,
185        .d_close =      cxgb_extension_close,
186        .d_ioctl =      cxgb_extension_ioctl,
187        .d_name =       "cxgb",
188 };
189 
190 static devclass_t	cxgb_port_devclass;
191 DRIVER_MODULE(cxgb, cxgbc, cxgb_port_driver, cxgb_port_devclass, 0, 0);
192 MODULE_VERSION(cxgb, 1);
193 
194 static struct mtx t3_list_lock;
195 static SLIST_HEAD(, adapter) t3_list;
196 #ifdef TCP_OFFLOAD
197 static struct mtx t3_uld_list_lock;
198 static SLIST_HEAD(, uld_info) t3_uld_list;
199 #endif
200 
201 /*
202  * The driver uses the best interrupt scheme available on a platform in the
203  * order MSI-X, MSI, legacy pin interrupts.  This parameter determines which
204  * of these schemes the driver may consider as follows:
205  *
206  * msi = 2: choose from among all three options
207  * msi = 1 : only consider MSI and pin interrupts
208  * msi = 0: force pin interrupts
209  */
210 static int msi_allowed = 2;
211 
212 SYSCTL_NODE(_hw, OID_AUTO, cxgb, CTLFLAG_RD, 0, "CXGB driver parameters");
213 SYSCTL_INT(_hw_cxgb, OID_AUTO, msi_allowed, CTLFLAG_RDTUN, &msi_allowed, 0,
214     "MSI-X, MSI, INTx selector");
215 
216 /*
217  * The driver uses an auto-queue algorithm by default.
218  * To disable it and force a single queue-set per port, use multiq = 0
219  */
220 static int multiq = 1;
221 SYSCTL_INT(_hw_cxgb, OID_AUTO, multiq, CTLFLAG_RDTUN, &multiq, 0,
222     "use min(ncpus/ports, 8) queue-sets per port");
223 
224 /*
225  * By default the driver will not update the firmware unless
226  * it was compiled against a newer version
227  *
228  */
229 static int force_fw_update = 0;
230 SYSCTL_INT(_hw_cxgb, OID_AUTO, force_fw_update, CTLFLAG_RDTUN, &force_fw_update, 0,
231     "update firmware even if up to date");
232 
233 int cxgb_use_16k_clusters = -1;
234 SYSCTL_INT(_hw_cxgb, OID_AUTO, use_16k_clusters, CTLFLAG_RDTUN,
235     &cxgb_use_16k_clusters, 0, "use 16kB clusters for the jumbo queue ");
236 
237 static int nfilters = -1;
238 SYSCTL_INT(_hw_cxgb, OID_AUTO, nfilters, CTLFLAG_RDTUN,
239     &nfilters, 0, "max number of entries in the filter table");
240 
241 enum {
242 	MAX_TXQ_ENTRIES      = 16384,
243 	MAX_CTRL_TXQ_ENTRIES = 1024,
244 	MAX_RSPQ_ENTRIES     = 16384,
245 	MAX_RX_BUFFERS       = 16384,
246 	MAX_RX_JUMBO_BUFFERS = 16384,
247 	MIN_TXQ_ENTRIES      = 4,
248 	MIN_CTRL_TXQ_ENTRIES = 4,
249 	MIN_RSPQ_ENTRIES     = 32,
250 	MIN_FL_ENTRIES       = 32,
251 	MIN_FL_JUMBO_ENTRIES = 32
252 };
253 
254 struct filter_info {
255 	u32 sip;
256 	u32 sip_mask;
257 	u32 dip;
258 	u16 sport;
259 	u16 dport;
260 	u32 vlan:12;
261 	u32 vlan_prio:3;
262 	u32 mac_hit:1;
263 	u32 mac_idx:4;
264 	u32 mac_vld:1;
265 	u32 pkt_type:2;
266 	u32 report_filter_id:1;
267 	u32 pass:1;
268 	u32 rss:1;
269 	u32 qset:3;
270 	u32 locked:1;
271 	u32 valid:1;
272 };
273 
274 enum { FILTER_NO_VLAN_PRI = 7 };
275 
276 #define EEPROM_MAGIC 0x38E2F10C
277 
278 #define PORT_MASK ((1 << MAX_NPORTS) - 1)
279 
280 /* Table for probing the cards.  The desc field isn't actually used */
281 struct cxgb_ident {
282 	uint16_t	vendor;
283 	uint16_t	device;
284 	int		index;
285 	char		*desc;
286 } cxgb_identifiers[] = {
287 	{PCI_VENDOR_ID_CHELSIO, 0x0020, 0, "PE9000"},
288 	{PCI_VENDOR_ID_CHELSIO, 0x0021, 1, "T302E"},
289 	{PCI_VENDOR_ID_CHELSIO, 0x0022, 2, "T310E"},
290 	{PCI_VENDOR_ID_CHELSIO, 0x0023, 3, "T320X"},
291 	{PCI_VENDOR_ID_CHELSIO, 0x0024, 1, "T302X"},
292 	{PCI_VENDOR_ID_CHELSIO, 0x0025, 3, "T320E"},
293 	{PCI_VENDOR_ID_CHELSIO, 0x0026, 2, "T310X"},
294 	{PCI_VENDOR_ID_CHELSIO, 0x0030, 2, "T3B10"},
295 	{PCI_VENDOR_ID_CHELSIO, 0x0031, 3, "T3B20"},
296 	{PCI_VENDOR_ID_CHELSIO, 0x0032, 1, "T3B02"},
297 	{PCI_VENDOR_ID_CHELSIO, 0x0033, 4, "T3B04"},
298 	{PCI_VENDOR_ID_CHELSIO, 0x0035, 6, "T3C10"},
299 	{PCI_VENDOR_ID_CHELSIO, 0x0036, 3, "S320E-CR"},
300 	{PCI_VENDOR_ID_CHELSIO, 0x0037, 7, "N320E-G2"},
301 	{0, 0, 0, NULL}
302 };
303 
304 static int set_eeprom(struct port_info *pi, const uint8_t *data, int len, int offset);
305 
306 
307 static __inline char
308 t3rev2char(struct adapter *adapter)
309 {
310 	char rev = 'z';
311 
312 	switch(adapter->params.rev) {
313 	case T3_REV_A:
314 		rev = 'a';
315 		break;
316 	case T3_REV_B:
317 	case T3_REV_B2:
318 		rev = 'b';
319 		break;
320 	case T3_REV_C:
321 		rev = 'c';
322 		break;
323 	}
324 	return rev;
325 }
326 
327 static struct cxgb_ident *
328 cxgb_get_ident(device_t dev)
329 {
330 	struct cxgb_ident *id;
331 
332 	for (id = cxgb_identifiers; id->desc != NULL; id++) {
333 		if ((id->vendor == pci_get_vendor(dev)) &&
334 		    (id->device == pci_get_device(dev))) {
335 			return (id);
336 		}
337 	}
338 	return (NULL);
339 }
340 
341 static const struct adapter_info *
342 cxgb_get_adapter_info(device_t dev)
343 {
344 	struct cxgb_ident *id;
345 	const struct adapter_info *ai;
346 
347 	id = cxgb_get_ident(dev);
348 	if (id == NULL)
349 		return (NULL);
350 
351 	ai = t3_get_adapter_info(id->index);
352 
353 	return (ai);
354 }
355 
356 static int
357 cxgb_controller_probe(device_t dev)
358 {
359 	const struct adapter_info *ai;
360 	char *ports, buf[80];
361 	int nports;
362 
363 	ai = cxgb_get_adapter_info(dev);
364 	if (ai == NULL)
365 		return (ENXIO);
366 
367 	nports = ai->nports0 + ai->nports1;
368 	if (nports == 1)
369 		ports = "port";
370 	else
371 		ports = "ports";
372 
373 	snprintf(buf, sizeof(buf), "%s, %d %s", ai->desc, nports, ports);
374 	device_set_desc_copy(dev, buf);
375 	return (BUS_PROBE_DEFAULT);
376 }
377 
378 #define FW_FNAME "cxgb_t3fw"
379 #define TPEEPROM_NAME "cxgb_t3%c_tp_eeprom"
380 #define TPSRAM_NAME "cxgb_t3%c_protocol_sram"
381 
382 static int
383 upgrade_fw(adapter_t *sc)
384 {
385 	const struct firmware *fw;
386 	int status;
387 	u32 vers;
388 
389 	if ((fw = firmware_get(FW_FNAME)) == NULL)  {
390 		device_printf(sc->dev, "Could not find firmware image %s\n", FW_FNAME);
391 		return (ENOENT);
392 	} else
393 		device_printf(sc->dev, "installing firmware on card\n");
394 	status = t3_load_fw(sc, (const uint8_t *)fw->data, fw->datasize);
395 
396 	if (status != 0) {
397 		device_printf(sc->dev, "failed to install firmware: %d\n",
398 		    status);
399 	} else {
400 		t3_get_fw_version(sc, &vers);
401 		snprintf(&sc->fw_version[0], sizeof(sc->fw_version), "%d.%d.%d",
402 		    G_FW_VERSION_MAJOR(vers), G_FW_VERSION_MINOR(vers),
403 		    G_FW_VERSION_MICRO(vers));
404 	}
405 
406 	firmware_put(fw, FIRMWARE_UNLOAD);
407 
408 	return (status);
409 }
410 
411 /*
412  * The cxgb_controller_attach function is responsible for the initial
413  * bringup of the device.  Its responsibilities include:
414  *
415  *  1. Determine if the device supports MSI or MSI-X.
416  *  2. Allocate bus resources so that we can access the Base Address Register
417  *  3. Create and initialize mutexes for the controller and its control
418  *     logic such as SGE and MDIO.
419  *  4. Call hardware specific setup routine for the adapter as a whole.
420  *  5. Allocate the BAR for doing MSI-X.
421  *  6. Setup the line interrupt iff MSI-X is not supported.
422  *  7. Create the driver's taskq.
423  *  8. Start one task queue service thread.
424  *  9. Check if the firmware and SRAM are up-to-date.  They will be
425  *     auto-updated later (before FULL_INIT_DONE), if required.
426  * 10. Create a child device for each MAC (port)
427  * 11. Initialize T3 private state.
428  * 12. Trigger the LED
429  * 13. Setup offload iff supported.
430  * 14. Reset/restart the tick callout.
431  * 15. Attach sysctls
432  *
433  * NOTE: Any modification or deviation from this list MUST be reflected in
434  * the above comment.  Failure to do so will result in problems on various
435  * error conditions including link flapping.
436  */
437 static int
438 cxgb_controller_attach(device_t dev)
439 {
440 	device_t child;
441 	const struct adapter_info *ai;
442 	struct adapter *sc;
443 	int i, error = 0;
444 	uint32_t vers;
445 	int port_qsets = 1;
446 	int msi_needed, reg;
447 	char buf[80];
448 
449 	sc = device_get_softc(dev);
450 	sc->dev = dev;
451 	sc->msi_count = 0;
452 	ai = cxgb_get_adapter_info(dev);
453 
454 	snprintf(sc->lockbuf, ADAPTER_LOCK_NAME_LEN, "cxgb controller lock %d",
455 	    device_get_unit(dev));
456 	ADAPTER_LOCK_INIT(sc, sc->lockbuf);
457 
458 	snprintf(sc->reglockbuf, ADAPTER_LOCK_NAME_LEN, "SGE reg lock %d",
459 	    device_get_unit(dev));
460 	snprintf(sc->mdiolockbuf, ADAPTER_LOCK_NAME_LEN, "cxgb mdio lock %d",
461 	    device_get_unit(dev));
462 	snprintf(sc->elmerlockbuf, ADAPTER_LOCK_NAME_LEN, "cxgb elmer lock %d",
463 	    device_get_unit(dev));
464 
465 	MTX_INIT(&sc->sge.reg_lock, sc->reglockbuf, NULL, MTX_SPIN);
466 	MTX_INIT(&sc->mdio_lock, sc->mdiolockbuf, NULL, MTX_DEF);
467 	MTX_INIT(&sc->elmer_lock, sc->elmerlockbuf, NULL, MTX_DEF);
468 
469 	mtx_lock(&t3_list_lock);
470 	SLIST_INSERT_HEAD(&t3_list, sc, link);
471 	mtx_unlock(&t3_list_lock);
472 
473 	/* find the PCIe link width and set max read request to 4KB*/
474 	if (pci_find_cap(dev, PCIY_EXPRESS, &reg) == 0) {
475 		uint16_t lnk;
476 
477 		lnk = pci_read_config(dev, reg + PCIER_LINK_STA, 2);
478 		sc->link_width = (lnk & PCIEM_LINK_STA_WIDTH) >> 4;
479 		if (sc->link_width < 8 &&
480 		    (ai->caps & SUPPORTED_10000baseT_Full)) {
481 			device_printf(sc->dev,
482 			    "PCIe x%d Link, expect reduced performance\n",
483 			    sc->link_width);
484 		}
485 
486 		pci_set_max_read_req(dev, 4096);
487 	}
488 
489 	touch_bars(dev);
490 	pci_enable_busmaster(dev);
491 	/*
492 	 * Allocate the registers and make them available to the driver.
493 	 * The registers that we care about for NIC mode are in BAR 0
494 	 */
495 	sc->regs_rid = PCIR_BAR(0);
496 	if ((sc->regs_res = bus_alloc_resource_any(dev, SYS_RES_MEMORY,
497 	    &sc->regs_rid, RF_ACTIVE)) == NULL) {
498 		device_printf(dev, "Cannot allocate BAR region 0\n");
499 		error = ENXIO;
500 		goto out;
501 	}
502 
503 	sc->bt = rman_get_bustag(sc->regs_res);
504 	sc->bh = rman_get_bushandle(sc->regs_res);
505 	sc->mmio_len = rman_get_size(sc->regs_res);
506 
507 	for (i = 0; i < MAX_NPORTS; i++)
508 		sc->port[i].adapter = sc;
509 
510 	if (t3_prep_adapter(sc, ai, 1) < 0) {
511 		printf("prep adapter failed\n");
512 		error = ENODEV;
513 		goto out;
514 	}
515 
516 	sc->udbs_rid = PCIR_BAR(2);
517 	sc->udbs_res = NULL;
518 	if (is_offload(sc) &&
519 	    ((sc->udbs_res = bus_alloc_resource_any(dev, SYS_RES_MEMORY,
520 		   &sc->udbs_rid, RF_ACTIVE)) == NULL)) {
521 		device_printf(dev, "Cannot allocate BAR region 1\n");
522 		error = ENXIO;
523 		goto out;
524 	}
525 
526         /* Allocate the BAR for doing MSI-X.  If it succeeds, try to allocate
527 	 * enough messages for the queue sets.  If that fails, try falling
528 	 * back to MSI.  If that fails, then try falling back to the legacy
529 	 * interrupt pin model.
530 	 */
531 	sc->msix_regs_rid = 0x20;
532 	if ((msi_allowed >= 2) &&
533 	    (sc->msix_regs_res = bus_alloc_resource_any(dev, SYS_RES_MEMORY,
534 	    &sc->msix_regs_rid, RF_ACTIVE)) != NULL) {
535 
536 		if (multiq)
537 			port_qsets = min(SGE_QSETS/sc->params.nports, mp_ncpus);
538 		msi_needed = sc->msi_count = sc->params.nports * port_qsets + 1;
539 
540 		if (pci_msix_count(dev) == 0 ||
541 		    (error = pci_alloc_msix(dev, &sc->msi_count)) != 0 ||
542 		    sc->msi_count != msi_needed) {
543 			device_printf(dev, "alloc msix failed - "
544 				      "msi_count=%d, msi_needed=%d, err=%d; "
545 				      "will try MSI\n", sc->msi_count,
546 				      msi_needed, error);
547 			sc->msi_count = 0;
548 			port_qsets = 1;
549 			pci_release_msi(dev);
550 			bus_release_resource(dev, SYS_RES_MEMORY,
551 			    sc->msix_regs_rid, sc->msix_regs_res);
552 			sc->msix_regs_res = NULL;
553 		} else {
554 			sc->flags |= USING_MSIX;
555 			sc->cxgb_intr = cxgb_async_intr;
556 			device_printf(dev,
557 				      "using MSI-X interrupts (%u vectors)\n",
558 				      sc->msi_count);
559 		}
560 	}
561 
562 	if ((msi_allowed >= 1) && (sc->msi_count == 0)) {
563 		sc->msi_count = 1;
564 		if ((error = pci_alloc_msi(dev, &sc->msi_count)) != 0) {
565 			device_printf(dev, "alloc msi failed - "
566 				      "err=%d; will try INTx\n", error);
567 			sc->msi_count = 0;
568 			port_qsets = 1;
569 			pci_release_msi(dev);
570 		} else {
571 			sc->flags |= USING_MSI;
572 			sc->cxgb_intr = t3_intr_msi;
573 			device_printf(dev, "using MSI interrupts\n");
574 		}
575 	}
576 	if (sc->msi_count == 0) {
577 		device_printf(dev, "using line interrupts\n");
578 		sc->cxgb_intr = t3b_intr;
579 	}
580 
581 	/* Create a private taskqueue thread for handling driver events */
582 	sc->tq = taskqueue_create("cxgb_taskq", M_NOWAIT,
583 	    taskqueue_thread_enqueue, &sc->tq);
584 	if (sc->tq == NULL) {
585 		device_printf(dev, "failed to allocate controller task queue\n");
586 		goto out;
587 	}
588 
589 	taskqueue_start_threads(&sc->tq, 1, PI_NET, "%s taskq",
590 	    device_get_nameunit(dev));
591 	TASK_INIT(&sc->tick_task, 0, cxgb_tick_handler, sc);
592 
593 
594 	/* Create a periodic callout for checking adapter status */
595 	callout_init(&sc->cxgb_tick_ch, TRUE);
596 
597 	if (t3_check_fw_version(sc) < 0 || force_fw_update) {
598 		/*
599 		 * Warn user that a firmware update will be attempted in init.
600 		 */
601 		device_printf(dev, "firmware needs to be updated to version %d.%d.%d\n",
602 		    FW_VERSION_MAJOR, FW_VERSION_MINOR, FW_VERSION_MICRO);
603 		sc->flags &= ~FW_UPTODATE;
604 	} else {
605 		sc->flags |= FW_UPTODATE;
606 	}
607 
608 	if (t3_check_tpsram_version(sc) < 0) {
609 		/*
610 		 * Warn user that a firmware update will be attempted in init.
611 		 */
612 		device_printf(dev, "SRAM needs to be updated to version %c-%d.%d.%d\n",
613 		    t3rev2char(sc), TP_VERSION_MAJOR, TP_VERSION_MINOR, TP_VERSION_MICRO);
614 		sc->flags &= ~TPS_UPTODATE;
615 	} else {
616 		sc->flags |= TPS_UPTODATE;
617 	}
618 
619 	/*
620 	 * Create a child device for each MAC.  The ethernet attachment
621 	 * will be done in these children.
622 	 */
623 	for (i = 0; i < (sc)->params.nports; i++) {
624 		struct port_info *pi;
625 
626 		if ((child = device_add_child(dev, "cxgb", -1)) == NULL) {
627 			device_printf(dev, "failed to add child port\n");
628 			error = EINVAL;
629 			goto out;
630 		}
631 		pi = &sc->port[i];
632 		pi->adapter = sc;
633 		pi->nqsets = port_qsets;
634 		pi->first_qset = i*port_qsets;
635 		pi->port_id = i;
636 		pi->tx_chan = i >= ai->nports0;
637 		pi->txpkt_intf = pi->tx_chan ? 2 * (i - ai->nports0) + 1 : 2 * i;
638 		sc->rxpkt_map[pi->txpkt_intf] = i;
639 		sc->port[i].tx_chan = i >= ai->nports0;
640 		sc->portdev[i] = child;
641 		device_set_softc(child, pi);
642 	}
643 	if ((error = bus_generic_attach(dev)) != 0)
644 		goto out;
645 
646 	/* initialize sge private state */
647 	t3_sge_init_adapter(sc);
648 
649 	t3_led_ready(sc);
650 
651 	error = t3_get_fw_version(sc, &vers);
652 	if (error)
653 		goto out;
654 
655 	snprintf(&sc->fw_version[0], sizeof(sc->fw_version), "%d.%d.%d",
656 	    G_FW_VERSION_MAJOR(vers), G_FW_VERSION_MINOR(vers),
657 	    G_FW_VERSION_MICRO(vers));
658 
659 	snprintf(buf, sizeof(buf), "%s %sNIC\t E/C: %s S/N: %s",
660 		 ai->desc, is_offload(sc) ? "R" : "",
661 		 sc->params.vpd.ec, sc->params.vpd.sn);
662 	device_set_desc_copy(dev, buf);
663 
664 	snprintf(&sc->port_types[0], sizeof(sc->port_types), "%x%x%x%x",
665 		 sc->params.vpd.port_type[0], sc->params.vpd.port_type[1],
666 		 sc->params.vpd.port_type[2], sc->params.vpd.port_type[3]);
667 
668 	device_printf(sc->dev, "Firmware Version %s\n", &sc->fw_version[0]);
669 	callout_reset(&sc->cxgb_tick_ch, hz, cxgb_tick, sc);
670 	t3_add_attach_sysctls(sc);
671 
672 #ifdef TCP_OFFLOAD
673 	for (i = 0; i < NUM_CPL_HANDLERS; i++)
674 		sc->cpl_handler[i] = cpl_not_handled;
675 #endif
676 
677 	t3_intr_clear(sc);
678 	error = cxgb_setup_interrupts(sc);
679 out:
680 	if (error)
681 		cxgb_free(sc);
682 
683 	return (error);
684 }
685 
686 /*
687  * The cxgb_controller_detach routine is called with the device is
688  * unloaded from the system.
689  */
690 
691 static int
692 cxgb_controller_detach(device_t dev)
693 {
694 	struct adapter *sc;
695 
696 	sc = device_get_softc(dev);
697 
698 	cxgb_free(sc);
699 
700 	return (0);
701 }
702 
703 /*
704  * The cxgb_free() is called by the cxgb_controller_detach() routine
705  * to tear down the structures that were built up in
706  * cxgb_controller_attach(), and should be the final piece of work
707  * done when fully unloading the driver.
708  *
709  *
710  *  1. Shutting down the threads started by the cxgb_controller_attach()
711  *     routine.
712  *  2. Stopping the lower level device and all callouts (cxgb_down_locked()).
713  *  3. Detaching all of the port devices created during the
714  *     cxgb_controller_attach() routine.
715  *  4. Removing the device children created via cxgb_controller_attach().
716  *  5. Releasing PCI resources associated with the device.
717  *  6. Turning off the offload support, iff it was turned on.
718  *  7. Destroying the mutexes created in cxgb_controller_attach().
719  *
720  */
721 static void
722 cxgb_free(struct adapter *sc)
723 {
724 	int i, nqsets = 0;
725 
726 	ADAPTER_LOCK(sc);
727 	sc->flags |= CXGB_SHUTDOWN;
728 	ADAPTER_UNLOCK(sc);
729 
730 	/*
731 	 * Make sure all child devices are gone.
732 	 */
733 	bus_generic_detach(sc->dev);
734 	for (i = 0; i < (sc)->params.nports; i++) {
735 		if (sc->portdev[i] &&
736 		    device_delete_child(sc->dev, sc->portdev[i]) != 0)
737 			device_printf(sc->dev, "failed to delete child port\n");
738 		nqsets += sc->port[i].nqsets;
739 	}
740 
741 	/*
742 	 * At this point, it is as if cxgb_port_detach has run on all ports, and
743 	 * cxgb_down has run on the adapter.  All interrupts have been silenced,
744 	 * all open devices have been closed.
745 	 */
746 	KASSERT(sc->open_device_map == 0, ("%s: device(s) still open (%x)",
747 					   __func__, sc->open_device_map));
748 	for (i = 0; i < sc->params.nports; i++) {
749 		KASSERT(sc->port[i].ifp == NULL, ("%s: port %i undead!",
750 						  __func__, i));
751 	}
752 
753 	/*
754 	 * Finish off the adapter's callouts.
755 	 */
756 	callout_drain(&sc->cxgb_tick_ch);
757 	callout_drain(&sc->sge_timer_ch);
758 
759 	/*
760 	 * Release resources grabbed under FULL_INIT_DONE by cxgb_up.  The
761 	 * sysctls are cleaned up by the kernel linker.
762 	 */
763 	if (sc->flags & FULL_INIT_DONE) {
764  		t3_free_sge_resources(sc, nqsets);
765  		sc->flags &= ~FULL_INIT_DONE;
766  	}
767 
768 	/*
769 	 * Release all interrupt resources.
770 	 */
771 	cxgb_teardown_interrupts(sc);
772 	if (sc->flags & (USING_MSI | USING_MSIX)) {
773 		device_printf(sc->dev, "releasing msi message(s)\n");
774 		pci_release_msi(sc->dev);
775 	} else {
776 		device_printf(sc->dev, "no msi message to release\n");
777 	}
778 
779 	if (sc->msix_regs_res != NULL) {
780 		bus_release_resource(sc->dev, SYS_RES_MEMORY, sc->msix_regs_rid,
781 		    sc->msix_regs_res);
782 	}
783 
784 	/*
785 	 * Free the adapter's taskqueue.
786 	 */
787 	if (sc->tq != NULL) {
788 		taskqueue_free(sc->tq);
789 		sc->tq = NULL;
790 	}
791 
792 	free(sc->filters, M_DEVBUF);
793 	t3_sge_free(sc);
794 
795 	if (sc->udbs_res != NULL)
796 		bus_release_resource(sc->dev, SYS_RES_MEMORY, sc->udbs_rid,
797 		    sc->udbs_res);
798 
799 	if (sc->regs_res != NULL)
800 		bus_release_resource(sc->dev, SYS_RES_MEMORY, sc->regs_rid,
801 		    sc->regs_res);
802 
803 	MTX_DESTROY(&sc->mdio_lock);
804 	MTX_DESTROY(&sc->sge.reg_lock);
805 	MTX_DESTROY(&sc->elmer_lock);
806 	mtx_lock(&t3_list_lock);
807 	SLIST_REMOVE(&t3_list, sc, adapter, link);
808 	mtx_unlock(&t3_list_lock);
809 	ADAPTER_LOCK_DEINIT(sc);
810 }
811 
812 /**
813  *	setup_sge_qsets - configure SGE Tx/Rx/response queues
814  *	@sc: the controller softc
815  *
816  *	Determines how many sets of SGE queues to use and initializes them.
817  *	We support multiple queue sets per port if we have MSI-X, otherwise
818  *	just one queue set per port.
819  */
820 static int
821 setup_sge_qsets(adapter_t *sc)
822 {
823 	int i, j, err, irq_idx = 0, qset_idx = 0;
824 	u_int ntxq = SGE_TXQ_PER_SET;
825 
826 	if ((err = t3_sge_alloc(sc)) != 0) {
827 		device_printf(sc->dev, "t3_sge_alloc returned %d\n", err);
828 		return (err);
829 	}
830 
831 	if (sc->params.rev > 0 && !(sc->flags & USING_MSI))
832 		irq_idx = -1;
833 
834 	for (i = 0; i < (sc)->params.nports; i++) {
835 		struct port_info *pi = &sc->port[i];
836 
837 		for (j = 0; j < pi->nqsets; j++, qset_idx++) {
838 			err = t3_sge_alloc_qset(sc, qset_idx, (sc)->params.nports,
839 			    (sc->flags & USING_MSIX) ? qset_idx + 1 : irq_idx,
840 			    &sc->params.sge.qset[qset_idx], ntxq, pi);
841 			if (err) {
842 				t3_free_sge_resources(sc, qset_idx);
843 				device_printf(sc->dev,
844 				    "t3_sge_alloc_qset failed with %d\n", err);
845 				return (err);
846 			}
847 		}
848 	}
849 
850 	return (0);
851 }
852 
853 static void
854 cxgb_teardown_interrupts(adapter_t *sc)
855 {
856 	int i;
857 
858 	for (i = 0; i < SGE_QSETS; i++) {
859 		if (sc->msix_intr_tag[i] == NULL) {
860 
861 			/* Should have been setup fully or not at all */
862 			KASSERT(sc->msix_irq_res[i] == NULL &&
863 				sc->msix_irq_rid[i] == 0,
864 				("%s: half-done interrupt (%d).", __func__, i));
865 
866 			continue;
867 		}
868 
869 		bus_teardown_intr(sc->dev, sc->msix_irq_res[i],
870 				  sc->msix_intr_tag[i]);
871 		bus_release_resource(sc->dev, SYS_RES_IRQ, sc->msix_irq_rid[i],
872 				     sc->msix_irq_res[i]);
873 
874 		sc->msix_irq_res[i] = sc->msix_intr_tag[i] = NULL;
875 		sc->msix_irq_rid[i] = 0;
876 	}
877 
878 	if (sc->intr_tag) {
879 		KASSERT(sc->irq_res != NULL,
880 			("%s: half-done interrupt.", __func__));
881 
882 		bus_teardown_intr(sc->dev, sc->irq_res, sc->intr_tag);
883 		bus_release_resource(sc->dev, SYS_RES_IRQ, sc->irq_rid,
884 				     sc->irq_res);
885 
886 		sc->irq_res = sc->intr_tag = NULL;
887 		sc->irq_rid = 0;
888 	}
889 }
890 
891 static int
892 cxgb_setup_interrupts(adapter_t *sc)
893 {
894 	struct resource *res;
895 	void *tag;
896 	int i, rid, err, intr_flag = sc->flags & (USING_MSI | USING_MSIX);
897 
898 	sc->irq_rid = intr_flag ? 1 : 0;
899 	sc->irq_res = bus_alloc_resource_any(sc->dev, SYS_RES_IRQ, &sc->irq_rid,
900 					     RF_SHAREABLE | RF_ACTIVE);
901 	if (sc->irq_res == NULL) {
902 		device_printf(sc->dev, "Cannot allocate interrupt (%x, %u)\n",
903 			      intr_flag, sc->irq_rid);
904 		err = EINVAL;
905 		sc->irq_rid = 0;
906 	} else {
907 		err = bus_setup_intr(sc->dev, sc->irq_res,
908 		    INTR_MPSAFE | INTR_TYPE_NET, NULL,
909 		    sc->cxgb_intr, sc, &sc->intr_tag);
910 
911 		if (err) {
912 			device_printf(sc->dev,
913 				      "Cannot set up interrupt (%x, %u, %d)\n",
914 				      intr_flag, sc->irq_rid, err);
915 			bus_release_resource(sc->dev, SYS_RES_IRQ, sc->irq_rid,
916 					     sc->irq_res);
917 			sc->irq_res = sc->intr_tag = NULL;
918 			sc->irq_rid = 0;
919 		}
920 	}
921 
922 	/* That's all for INTx or MSI */
923 	if (!(intr_flag & USING_MSIX) || err)
924 		return (err);
925 
926 	bus_describe_intr(sc->dev, sc->irq_res, sc->intr_tag, "err");
927 	for (i = 0; i < sc->msi_count - 1; i++) {
928 		rid = i + 2;
929 		res = bus_alloc_resource_any(sc->dev, SYS_RES_IRQ, &rid,
930 					     RF_SHAREABLE | RF_ACTIVE);
931 		if (res == NULL) {
932 			device_printf(sc->dev, "Cannot allocate interrupt "
933 				      "for message %d\n", rid);
934 			err = EINVAL;
935 			break;
936 		}
937 
938 		err = bus_setup_intr(sc->dev, res, INTR_MPSAFE | INTR_TYPE_NET,
939 				     NULL, t3_intr_msix, &sc->sge.qs[i], &tag);
940 		if (err) {
941 			device_printf(sc->dev, "Cannot set up interrupt "
942 				      "for message %d (%d)\n", rid, err);
943 			bus_release_resource(sc->dev, SYS_RES_IRQ, rid, res);
944 			break;
945 		}
946 
947 		sc->msix_irq_rid[i] = rid;
948 		sc->msix_irq_res[i] = res;
949 		sc->msix_intr_tag[i] = tag;
950 		bus_describe_intr(sc->dev, res, tag, "qs%d", i);
951 	}
952 
953 	if (err)
954 		cxgb_teardown_interrupts(sc);
955 
956 	return (err);
957 }
958 
959 
960 static int
961 cxgb_port_probe(device_t dev)
962 {
963 	struct port_info *p;
964 	char buf[80];
965 	const char *desc;
966 
967 	p = device_get_softc(dev);
968 	desc = p->phy.desc;
969 	snprintf(buf, sizeof(buf), "Port %d %s", p->port_id, desc);
970 	device_set_desc_copy(dev, buf);
971 	return (0);
972 }
973 
974 
975 static int
976 cxgb_makedev(struct port_info *pi)
977 {
978 
979 	pi->port_cdev = make_dev(&cxgb_cdevsw, pi->ifp->if_dunit,
980 	    UID_ROOT, GID_WHEEL, 0600, "%s", if_name(pi->ifp));
981 
982 	if (pi->port_cdev == NULL)
983 		return (ENOMEM);
984 
985 	pi->port_cdev->si_drv1 = (void *)pi;
986 
987 	return (0);
988 }
989 
990 #define CXGB_CAP (IFCAP_VLAN_HWTAGGING | IFCAP_VLAN_MTU | IFCAP_HWCSUM | \
991     IFCAP_VLAN_HWCSUM | IFCAP_TSO | IFCAP_JUMBO_MTU | IFCAP_LRO | \
992     IFCAP_VLAN_HWTSO | IFCAP_LINKSTATE | IFCAP_HWCSUM_IPV6)
993 #define CXGB_CAP_ENABLE CXGB_CAP
994 
995 static int
996 cxgb_port_attach(device_t dev)
997 {
998 	struct port_info *p;
999 	struct ifnet *ifp;
1000 	int err;
1001 	struct adapter *sc;
1002 
1003 	p = device_get_softc(dev);
1004 	sc = p->adapter;
1005 	snprintf(p->lockbuf, PORT_NAME_LEN, "cxgb port lock %d:%d",
1006 	    device_get_unit(device_get_parent(dev)), p->port_id);
1007 	PORT_LOCK_INIT(p, p->lockbuf);
1008 
1009 	callout_init(&p->link_check_ch, CALLOUT_MPSAFE);
1010 	TASK_INIT(&p->link_check_task, 0, check_link_status, p);
1011 
1012 	/* Allocate an ifnet object and set it up */
1013 	ifp = p->ifp = if_alloc(IFT_ETHER);
1014 	if (ifp == NULL) {
1015 		device_printf(dev, "Cannot allocate ifnet\n");
1016 		return (ENOMEM);
1017 	}
1018 
1019 	if_initname(ifp, device_get_name(dev), device_get_unit(dev));
1020 	ifp->if_init = cxgb_init;
1021 	ifp->if_softc = p;
1022 	ifp->if_flags = IFF_BROADCAST | IFF_SIMPLEX | IFF_MULTICAST;
1023 	ifp->if_ioctl = cxgb_ioctl;
1024 	ifp->if_transmit = cxgb_transmit;
1025 	ifp->if_qflush = cxgb_qflush;
1026 	ifp->if_get_counter = cxgb_get_counter;
1027 
1028 	ifp->if_capabilities = CXGB_CAP;
1029 #ifdef TCP_OFFLOAD
1030 	if (is_offload(sc))
1031 		ifp->if_capabilities |= IFCAP_TOE4;
1032 #endif
1033 	ifp->if_capenable = CXGB_CAP_ENABLE;
1034 	ifp->if_hwassist = CSUM_TCP | CSUM_UDP | CSUM_IP | CSUM_TSO |
1035 	    CSUM_UDP_IPV6 | CSUM_TCP_IPV6;
1036 
1037 	/*
1038 	 * Disable TSO on 4-port - it isn't supported by the firmware.
1039 	 */
1040 	if (sc->params.nports > 2) {
1041 		ifp->if_capabilities &= ~(IFCAP_TSO | IFCAP_VLAN_HWTSO);
1042 		ifp->if_capenable &= ~(IFCAP_TSO | IFCAP_VLAN_HWTSO);
1043 		ifp->if_hwassist &= ~CSUM_TSO;
1044 	}
1045 
1046 	ether_ifattach(ifp, p->hw_addr);
1047 
1048 #ifdef DEFAULT_JUMBO
1049 	if (sc->params.nports <= 2)
1050 		ifp->if_mtu = ETHERMTU_JUMBO;
1051 #endif
1052 	if ((err = cxgb_makedev(p)) != 0) {
1053 		printf("makedev failed %d\n", err);
1054 		return (err);
1055 	}
1056 
1057 	/* Create a list of media supported by this port */
1058 	ifmedia_init(&p->media, IFM_IMASK, cxgb_media_change,
1059 	    cxgb_media_status);
1060 	cxgb_build_medialist(p);
1061 
1062 	t3_sge_init_port(p);
1063 
1064 	return (err);
1065 }
1066 
1067 /*
1068  * cxgb_port_detach() is called via the device_detach methods when
1069  * cxgb_free() calls the bus_generic_detach.  It is responsible for
1070  * removing the device from the view of the kernel, i.e. from all
1071  * interfaces lists etc.  This routine is only called when the driver is
1072  * being unloaded, not when the link goes down.
1073  */
1074 static int
1075 cxgb_port_detach(device_t dev)
1076 {
1077 	struct port_info *p;
1078 	struct adapter *sc;
1079 	int i;
1080 
1081 	p = device_get_softc(dev);
1082 	sc = p->adapter;
1083 
1084 	/* Tell cxgb_ioctl and if_init that the port is going away */
1085 	ADAPTER_LOCK(sc);
1086 	SET_DOOMED(p);
1087 	wakeup(&sc->flags);
1088 	while (IS_BUSY(sc))
1089 		mtx_sleep(&sc->flags, &sc->lock, 0, "cxgbdtch", 0);
1090 	SET_BUSY(sc);
1091 	ADAPTER_UNLOCK(sc);
1092 
1093 	if (p->port_cdev != NULL)
1094 		destroy_dev(p->port_cdev);
1095 
1096 	cxgb_uninit_synchronized(p);
1097 	ether_ifdetach(p->ifp);
1098 
1099 	for (i = p->first_qset; i < p->first_qset + p->nqsets; i++) {
1100 		struct sge_qset *qs = &sc->sge.qs[i];
1101 		struct sge_txq *txq = &qs->txq[TXQ_ETH];
1102 
1103 		callout_drain(&txq->txq_watchdog);
1104 		callout_drain(&txq->txq_timer);
1105 	}
1106 
1107 	PORT_LOCK_DEINIT(p);
1108 	if_free(p->ifp);
1109 	p->ifp = NULL;
1110 
1111 	ADAPTER_LOCK(sc);
1112 	CLR_BUSY(sc);
1113 	wakeup_one(&sc->flags);
1114 	ADAPTER_UNLOCK(sc);
1115 	return (0);
1116 }
1117 
1118 void
1119 t3_fatal_err(struct adapter *sc)
1120 {
1121 	u_int fw_status[4];
1122 
1123 	if (sc->flags & FULL_INIT_DONE) {
1124 		t3_sge_stop(sc);
1125 		t3_write_reg(sc, A_XGM_TX_CTRL, 0);
1126 		t3_write_reg(sc, A_XGM_RX_CTRL, 0);
1127 		t3_write_reg(sc, XGM_REG(A_XGM_TX_CTRL, 1), 0);
1128 		t3_write_reg(sc, XGM_REG(A_XGM_RX_CTRL, 1), 0);
1129 		t3_intr_disable(sc);
1130 	}
1131 	device_printf(sc->dev,"encountered fatal error, operation suspended\n");
1132 	if (!t3_cim_ctl_blk_read(sc, 0xa0, 4, fw_status))
1133 		device_printf(sc->dev, "FW_ status: 0x%x, 0x%x, 0x%x, 0x%x\n",
1134 		    fw_status[0], fw_status[1], fw_status[2], fw_status[3]);
1135 }
1136 
1137 int
1138 t3_os_find_pci_capability(adapter_t *sc, int cap)
1139 {
1140 	device_t dev;
1141 	struct pci_devinfo *dinfo;
1142 	pcicfgregs *cfg;
1143 	uint32_t status;
1144 	uint8_t ptr;
1145 
1146 	dev = sc->dev;
1147 	dinfo = device_get_ivars(dev);
1148 	cfg = &dinfo->cfg;
1149 
1150 	status = pci_read_config(dev, PCIR_STATUS, 2);
1151 	if (!(status & PCIM_STATUS_CAPPRESENT))
1152 		return (0);
1153 
1154 	switch (cfg->hdrtype & PCIM_HDRTYPE) {
1155 	case 0:
1156 	case 1:
1157 		ptr = PCIR_CAP_PTR;
1158 		break;
1159 	case 2:
1160 		ptr = PCIR_CAP_PTR_2;
1161 		break;
1162 	default:
1163 		return (0);
1164 		break;
1165 	}
1166 	ptr = pci_read_config(dev, ptr, 1);
1167 
1168 	while (ptr != 0) {
1169 		if (pci_read_config(dev, ptr + PCICAP_ID, 1) == cap)
1170 			return (ptr);
1171 		ptr = pci_read_config(dev, ptr + PCICAP_NEXTPTR, 1);
1172 	}
1173 
1174 	return (0);
1175 }
1176 
1177 int
1178 t3_os_pci_save_state(struct adapter *sc)
1179 {
1180 	device_t dev;
1181 	struct pci_devinfo *dinfo;
1182 
1183 	dev = sc->dev;
1184 	dinfo = device_get_ivars(dev);
1185 
1186 	pci_cfg_save(dev, dinfo, 0);
1187 	return (0);
1188 }
1189 
1190 int
1191 t3_os_pci_restore_state(struct adapter *sc)
1192 {
1193 	device_t dev;
1194 	struct pci_devinfo *dinfo;
1195 
1196 	dev = sc->dev;
1197 	dinfo = device_get_ivars(dev);
1198 
1199 	pci_cfg_restore(dev, dinfo);
1200 	return (0);
1201 }
1202 
1203 /**
1204  *	t3_os_link_changed - handle link status changes
1205  *	@sc: the adapter associated with the link change
1206  *	@port_id: the port index whose link status has changed
1207  *	@link_status: the new status of the link
1208  *	@speed: the new speed setting
1209  *	@duplex: the new duplex setting
1210  *	@fc: the new flow-control setting
1211  *
1212  *	This is the OS-dependent handler for link status changes.  The OS
1213  *	neutral handler takes care of most of the processing for these events,
1214  *	then calls this handler for any OS-specific processing.
1215  */
1216 void
1217 t3_os_link_changed(adapter_t *adapter, int port_id, int link_status, int speed,
1218      int duplex, int fc, int mac_was_reset)
1219 {
1220 	struct port_info *pi = &adapter->port[port_id];
1221 	struct ifnet *ifp = pi->ifp;
1222 
1223 	/* no race with detach, so ifp should always be good */
1224 	KASSERT(ifp, ("%s: if detached.", __func__));
1225 
1226 	/* Reapply mac settings if they were lost due to a reset */
1227 	if (mac_was_reset) {
1228 		PORT_LOCK(pi);
1229 		cxgb_update_mac_settings(pi);
1230 		PORT_UNLOCK(pi);
1231 	}
1232 
1233 	if (link_status) {
1234 		ifp->if_baudrate = IF_Mbps(speed);
1235 		if_link_state_change(ifp, LINK_STATE_UP);
1236 	} else
1237 		if_link_state_change(ifp, LINK_STATE_DOWN);
1238 }
1239 
1240 /**
1241  *	t3_os_phymod_changed - handle PHY module changes
1242  *	@phy: the PHY reporting the module change
1243  *	@mod_type: new module type
1244  *
1245  *	This is the OS-dependent handler for PHY module changes.  It is
1246  *	invoked when a PHY module is removed or inserted for any OS-specific
1247  *	processing.
1248  */
1249 void t3_os_phymod_changed(struct adapter *adap, int port_id)
1250 {
1251 	static const char *mod_str[] = {
1252 		NULL, "SR", "LR", "LRM", "TWINAX", "TWINAX-L", "unknown"
1253 	};
1254 	struct port_info *pi = &adap->port[port_id];
1255 	int mod = pi->phy.modtype;
1256 
1257 	if (mod != pi->media.ifm_cur->ifm_data)
1258 		cxgb_build_medialist(pi);
1259 
1260 	if (mod == phy_modtype_none)
1261 		if_printf(pi->ifp, "PHY module unplugged\n");
1262 	else {
1263 		KASSERT(mod < ARRAY_SIZE(mod_str),
1264 			("invalid PHY module type %d", mod));
1265 		if_printf(pi->ifp, "%s PHY module inserted\n", mod_str[mod]);
1266 	}
1267 }
1268 
1269 void
1270 t3_os_set_hw_addr(adapter_t *adapter, int port_idx, u8 hw_addr[])
1271 {
1272 
1273 	/*
1274 	 * The ifnet might not be allocated before this gets called,
1275 	 * as this is called early on in attach by t3_prep_adapter
1276 	 * save the address off in the port structure
1277 	 */
1278 	if (cxgb_debug)
1279 		printf("set_hw_addr on idx %d addr %6D\n", port_idx, hw_addr, ":");
1280 	bcopy(hw_addr, adapter->port[port_idx].hw_addr, ETHER_ADDR_LEN);
1281 }
1282 
1283 /*
1284  * Programs the XGMAC based on the settings in the ifnet.  These settings
1285  * include MTU, MAC address, mcast addresses, etc.
1286  */
1287 static void
1288 cxgb_update_mac_settings(struct port_info *p)
1289 {
1290 	struct ifnet *ifp = p->ifp;
1291 	struct t3_rx_mode rm;
1292 	struct cmac *mac = &p->mac;
1293 	int mtu, hwtagging;
1294 
1295 	PORT_LOCK_ASSERT_OWNED(p);
1296 
1297 	bcopy(IF_LLADDR(ifp), p->hw_addr, ETHER_ADDR_LEN);
1298 
1299 	mtu = ifp->if_mtu;
1300 	if (ifp->if_capenable & IFCAP_VLAN_MTU)
1301 		mtu += ETHER_VLAN_ENCAP_LEN;
1302 
1303 	hwtagging = (ifp->if_capenable & IFCAP_VLAN_HWTAGGING) != 0;
1304 
1305 	t3_mac_set_mtu(mac, mtu);
1306 	t3_set_vlan_accel(p->adapter, 1 << p->tx_chan, hwtagging);
1307 	t3_mac_set_address(mac, 0, p->hw_addr);
1308 	t3_init_rx_mode(&rm, p);
1309 	t3_mac_set_rx_mode(mac, &rm);
1310 }
1311 
1312 
1313 static int
1314 await_mgmt_replies(struct adapter *adap, unsigned long init_cnt,
1315 			      unsigned long n)
1316 {
1317 	int attempts = 5;
1318 
1319 	while (adap->sge.qs[0].rspq.offload_pkts < init_cnt + n) {
1320 		if (!--attempts)
1321 			return (ETIMEDOUT);
1322 		t3_os_sleep(10);
1323 	}
1324 	return 0;
1325 }
1326 
1327 static int
1328 init_tp_parity(struct adapter *adap)
1329 {
1330 	int i;
1331 	struct mbuf *m;
1332 	struct cpl_set_tcb_field *greq;
1333 	unsigned long cnt = adap->sge.qs[0].rspq.offload_pkts;
1334 
1335 	t3_tp_set_offload_mode(adap, 1);
1336 
1337 	for (i = 0; i < 16; i++) {
1338 		struct cpl_smt_write_req *req;
1339 
1340 		m = m_gethdr(M_WAITOK, MT_DATA);
1341 		req = mtod(m, struct cpl_smt_write_req *);
1342 		m->m_len = m->m_pkthdr.len = sizeof(*req);
1343 		memset(req, 0, sizeof(*req));
1344 		req->wr.wrh_hi = htonl(V_WR_OP(FW_WROPCODE_FORWARD));
1345 		OPCODE_TID(req) = htonl(MK_OPCODE_TID(CPL_SMT_WRITE_REQ, i));
1346 		req->iff = i;
1347 		t3_mgmt_tx(adap, m);
1348 	}
1349 
1350 	for (i = 0; i < 2048; i++) {
1351 		struct cpl_l2t_write_req *req;
1352 
1353 		m = m_gethdr(M_WAITOK, MT_DATA);
1354 		req = mtod(m, struct cpl_l2t_write_req *);
1355 		m->m_len = m->m_pkthdr.len = sizeof(*req);
1356 		memset(req, 0, sizeof(*req));
1357 		req->wr.wrh_hi = htonl(V_WR_OP(FW_WROPCODE_FORWARD));
1358 		OPCODE_TID(req) = htonl(MK_OPCODE_TID(CPL_L2T_WRITE_REQ, i));
1359 		req->params = htonl(V_L2T_W_IDX(i));
1360 		t3_mgmt_tx(adap, m);
1361 	}
1362 
1363 	for (i = 0; i < 2048; i++) {
1364 		struct cpl_rte_write_req *req;
1365 
1366 		m = m_gethdr(M_WAITOK, MT_DATA);
1367 		req = mtod(m, struct cpl_rte_write_req *);
1368 		m->m_len = m->m_pkthdr.len = sizeof(*req);
1369 		memset(req, 0, sizeof(*req));
1370 		req->wr.wrh_hi = htonl(V_WR_OP(FW_WROPCODE_FORWARD));
1371 		OPCODE_TID(req) = htonl(MK_OPCODE_TID(CPL_RTE_WRITE_REQ, i));
1372 		req->l2t_idx = htonl(V_L2T_W_IDX(i));
1373 		t3_mgmt_tx(adap, m);
1374 	}
1375 
1376 	m = m_gethdr(M_WAITOK, MT_DATA);
1377 	greq = mtod(m, struct cpl_set_tcb_field *);
1378 	m->m_len = m->m_pkthdr.len = sizeof(*greq);
1379 	memset(greq, 0, sizeof(*greq));
1380 	greq->wr.wrh_hi = htonl(V_WR_OP(FW_WROPCODE_FORWARD));
1381 	OPCODE_TID(greq) = htonl(MK_OPCODE_TID(CPL_SET_TCB_FIELD, 0));
1382 	greq->mask = htobe64(1);
1383 	t3_mgmt_tx(adap, m);
1384 
1385 	i = await_mgmt_replies(adap, cnt, 16 + 2048 + 2048 + 1);
1386 	t3_tp_set_offload_mode(adap, 0);
1387 	return (i);
1388 }
1389 
1390 /**
1391  *	setup_rss - configure Receive Side Steering (per-queue connection demux)
1392  *	@adap: the adapter
1393  *
1394  *	Sets up RSS to distribute packets to multiple receive queues.  We
1395  *	configure the RSS CPU lookup table to distribute to the number of HW
1396  *	receive queues, and the response queue lookup table to narrow that
1397  *	down to the response queues actually configured for each port.
1398  *	We always configure the RSS mapping for two ports since the mapping
1399  *	table has plenty of entries.
1400  */
1401 static void
1402 setup_rss(adapter_t *adap)
1403 {
1404 	int i;
1405 	u_int nq[2];
1406 	uint8_t cpus[SGE_QSETS + 1];
1407 	uint16_t rspq_map[RSS_TABLE_SIZE];
1408 
1409 	for (i = 0; i < SGE_QSETS; ++i)
1410 		cpus[i] = i;
1411 	cpus[SGE_QSETS] = 0xff;
1412 
1413 	nq[0] = nq[1] = 0;
1414 	for_each_port(adap, i) {
1415 		const struct port_info *pi = adap2pinfo(adap, i);
1416 
1417 		nq[pi->tx_chan] += pi->nqsets;
1418 	}
1419 	for (i = 0; i < RSS_TABLE_SIZE / 2; ++i) {
1420 		rspq_map[i] = nq[0] ? i % nq[0] : 0;
1421 		rspq_map[i + RSS_TABLE_SIZE / 2] = nq[1] ? i % nq[1] + nq[0] : 0;
1422 	}
1423 
1424 	/* Calculate the reverse RSS map table */
1425 	for (i = 0; i < SGE_QSETS; ++i)
1426 		adap->rrss_map[i] = 0xff;
1427 	for (i = 0; i < RSS_TABLE_SIZE; ++i)
1428 		if (adap->rrss_map[rspq_map[i]] == 0xff)
1429 			adap->rrss_map[rspq_map[i]] = i;
1430 
1431 	t3_config_rss(adap, F_RQFEEDBACKENABLE | F_TNLLKPEN | F_TNLMAPEN |
1432 		      F_TNLPRTEN | F_TNL2TUPEN | F_TNL4TUPEN | F_OFDMAPEN |
1433 	              F_RRCPLMAPEN | V_RRCPLCPUSIZE(6) | F_HASHTOEPLITZ,
1434 	              cpus, rspq_map);
1435 
1436 }
1437 static void
1438 send_pktsched_cmd(struct adapter *adap, int sched, int qidx, int lo,
1439 			      int hi, int port)
1440 {
1441 	struct mbuf *m;
1442 	struct mngt_pktsched_wr *req;
1443 
1444 	m = m_gethdr(M_NOWAIT, MT_DATA);
1445 	if (m) {
1446 		req = mtod(m, struct mngt_pktsched_wr *);
1447 		req->wr.wrh_hi = htonl(V_WR_OP(FW_WROPCODE_MNGT));
1448 		req->mngt_opcode = FW_MNGTOPCODE_PKTSCHED_SET;
1449 		req->sched = sched;
1450 		req->idx = qidx;
1451 		req->min = lo;
1452 		req->max = hi;
1453 		req->binding = port;
1454 		m->m_len = m->m_pkthdr.len = sizeof(*req);
1455 		t3_mgmt_tx(adap, m);
1456 	}
1457 }
1458 
1459 static void
1460 bind_qsets(adapter_t *sc)
1461 {
1462 	int i, j;
1463 
1464 	for (i = 0; i < (sc)->params.nports; ++i) {
1465 		const struct port_info *pi = adap2pinfo(sc, i);
1466 
1467 		for (j = 0; j < pi->nqsets; ++j) {
1468 			send_pktsched_cmd(sc, 1, pi->first_qset + j, -1,
1469 					  -1, pi->tx_chan);
1470 
1471 		}
1472 	}
1473 }
1474 
1475 static void
1476 update_tpeeprom(struct adapter *adap)
1477 {
1478 	const struct firmware *tpeeprom;
1479 
1480 	uint32_t version;
1481 	unsigned int major, minor;
1482 	int ret, len;
1483 	char rev, name[32];
1484 
1485 	t3_seeprom_read(adap, TP_SRAM_OFFSET, &version);
1486 
1487 	major = G_TP_VERSION_MAJOR(version);
1488 	minor = G_TP_VERSION_MINOR(version);
1489 	if (major == TP_VERSION_MAJOR  && minor == TP_VERSION_MINOR)
1490 		return;
1491 
1492 	rev = t3rev2char(adap);
1493 	snprintf(name, sizeof(name), TPEEPROM_NAME, rev);
1494 
1495 	tpeeprom = firmware_get(name);
1496 	if (tpeeprom == NULL) {
1497 		device_printf(adap->dev,
1498 			      "could not load TP EEPROM: unable to load %s\n",
1499 			      name);
1500 		return;
1501 	}
1502 
1503 	len = tpeeprom->datasize - 4;
1504 
1505 	ret = t3_check_tpsram(adap, tpeeprom->data, tpeeprom->datasize);
1506 	if (ret)
1507 		goto release_tpeeprom;
1508 
1509 	if (len != TP_SRAM_LEN) {
1510 		device_printf(adap->dev,
1511 			      "%s length is wrong len=%d expected=%d\n", name,
1512 			      len, TP_SRAM_LEN);
1513 		return;
1514 	}
1515 
1516 	ret = set_eeprom(&adap->port[0], tpeeprom->data, tpeeprom->datasize,
1517 	    TP_SRAM_OFFSET);
1518 
1519 	if (!ret) {
1520 		device_printf(adap->dev,
1521 			"Protocol SRAM image updated in EEPROM to %d.%d.%d\n",
1522 			 TP_VERSION_MAJOR, TP_VERSION_MINOR, TP_VERSION_MICRO);
1523 	} else
1524 		device_printf(adap->dev,
1525 			      "Protocol SRAM image update in EEPROM failed\n");
1526 
1527 release_tpeeprom:
1528 	firmware_put(tpeeprom, FIRMWARE_UNLOAD);
1529 
1530 	return;
1531 }
1532 
1533 static int
1534 update_tpsram(struct adapter *adap)
1535 {
1536 	const struct firmware *tpsram;
1537 	int ret;
1538 	char rev, name[32];
1539 
1540 	rev = t3rev2char(adap);
1541 	snprintf(name, sizeof(name), TPSRAM_NAME, rev);
1542 
1543 	update_tpeeprom(adap);
1544 
1545 	tpsram = firmware_get(name);
1546 	if (tpsram == NULL){
1547 		device_printf(adap->dev, "could not load TP SRAM\n");
1548 		return (EINVAL);
1549 	} else
1550 		device_printf(adap->dev, "updating TP SRAM\n");
1551 
1552 	ret = t3_check_tpsram(adap, tpsram->data, tpsram->datasize);
1553 	if (ret)
1554 		goto release_tpsram;
1555 
1556 	ret = t3_set_proto_sram(adap, tpsram->data);
1557 	if (ret)
1558 		device_printf(adap->dev, "loading protocol SRAM failed\n");
1559 
1560 release_tpsram:
1561 	firmware_put(tpsram, FIRMWARE_UNLOAD);
1562 
1563 	return ret;
1564 }
1565 
1566 /**
1567  *	cxgb_up - enable the adapter
1568  *	@adap: adapter being enabled
1569  *
1570  *	Called when the first port is enabled, this function performs the
1571  *	actions necessary to make an adapter operational, such as completing
1572  *	the initialization of HW modules, and enabling interrupts.
1573  */
1574 static int
1575 cxgb_up(struct adapter *sc)
1576 {
1577 	int err = 0;
1578 	unsigned int mxf = t3_mc5_size(&sc->mc5) - MC5_MIN_TIDS;
1579 
1580 	KASSERT(sc->open_device_map == 0, ("%s: device(s) already open (%x)",
1581 					   __func__, sc->open_device_map));
1582 
1583 	if ((sc->flags & FULL_INIT_DONE) == 0) {
1584 
1585 		ADAPTER_LOCK_ASSERT_NOTOWNED(sc);
1586 
1587 		if ((sc->flags & FW_UPTODATE) == 0)
1588 			if ((err = upgrade_fw(sc)))
1589 				goto out;
1590 
1591 		if ((sc->flags & TPS_UPTODATE) == 0)
1592 			if ((err = update_tpsram(sc)))
1593 				goto out;
1594 
1595 		if (is_offload(sc) && nfilters != 0) {
1596 			sc->params.mc5.nservers = 0;
1597 
1598 			if (nfilters < 0)
1599 				sc->params.mc5.nfilters = mxf;
1600 			else
1601 				sc->params.mc5.nfilters = min(nfilters, mxf);
1602 		}
1603 
1604 		err = t3_init_hw(sc, 0);
1605 		if (err)
1606 			goto out;
1607 
1608 		t3_set_reg_field(sc, A_TP_PARA_REG5, 0, F_RXDDPOFFINIT);
1609 		t3_write_reg(sc, A_ULPRX_TDDP_PSZ, V_HPZ0(PAGE_SHIFT - 12));
1610 
1611 		err = setup_sge_qsets(sc);
1612 		if (err)
1613 			goto out;
1614 
1615 		alloc_filters(sc);
1616 		setup_rss(sc);
1617 
1618 		t3_add_configured_sysctls(sc);
1619 		sc->flags |= FULL_INIT_DONE;
1620 	}
1621 
1622 	t3_intr_clear(sc);
1623 	t3_sge_start(sc);
1624 	t3_intr_enable(sc);
1625 
1626 	if (sc->params.rev >= T3_REV_C && !(sc->flags & TP_PARITY_INIT) &&
1627 	    is_offload(sc) && init_tp_parity(sc) == 0)
1628 		sc->flags |= TP_PARITY_INIT;
1629 
1630 	if (sc->flags & TP_PARITY_INIT) {
1631 		t3_write_reg(sc, A_TP_INT_CAUSE, F_CMCACHEPERR | F_ARPLUTPERR);
1632 		t3_write_reg(sc, A_TP_INT_ENABLE, 0x7fbfffff);
1633 	}
1634 
1635 	if (!(sc->flags & QUEUES_BOUND)) {
1636 		bind_qsets(sc);
1637 		setup_hw_filters(sc);
1638 		sc->flags |= QUEUES_BOUND;
1639 	}
1640 
1641 	t3_sge_reset_adapter(sc);
1642 out:
1643 	return (err);
1644 }
1645 
1646 /*
1647  * Called when the last open device is closed.  Does NOT undo all of cxgb_up's
1648  * work.  Specifically, the resources grabbed under FULL_INIT_DONE are released
1649  * during controller_detach, not here.
1650  */
1651 static void
1652 cxgb_down(struct adapter *sc)
1653 {
1654 	t3_sge_stop(sc);
1655 	t3_intr_disable(sc);
1656 }
1657 
1658 /*
1659  * if_init for cxgb ports.
1660  */
1661 static void
1662 cxgb_init(void *arg)
1663 {
1664 	struct port_info *p = arg;
1665 	struct adapter *sc = p->adapter;
1666 
1667 	ADAPTER_LOCK(sc);
1668 	cxgb_init_locked(p); /* releases adapter lock */
1669 	ADAPTER_LOCK_ASSERT_NOTOWNED(sc);
1670 }
1671 
1672 static int
1673 cxgb_init_locked(struct port_info *p)
1674 {
1675 	struct adapter *sc = p->adapter;
1676 	struct ifnet *ifp = p->ifp;
1677 	struct cmac *mac = &p->mac;
1678 	int i, rc = 0, may_sleep = 0, gave_up_lock = 0;
1679 
1680 	ADAPTER_LOCK_ASSERT_OWNED(sc);
1681 
1682 	while (!IS_DOOMED(p) && IS_BUSY(sc)) {
1683 		gave_up_lock = 1;
1684 		if (mtx_sleep(&sc->flags, &sc->lock, PCATCH, "cxgbinit", 0)) {
1685 			rc = EINTR;
1686 			goto done;
1687 		}
1688 	}
1689 	if (IS_DOOMED(p)) {
1690 		rc = ENXIO;
1691 		goto done;
1692 	}
1693 	KASSERT(!IS_BUSY(sc), ("%s: controller busy.", __func__));
1694 
1695 	/*
1696 	 * The code that runs during one-time adapter initialization can sleep
1697 	 * so it's important not to hold any locks across it.
1698 	 */
1699 	may_sleep = sc->flags & FULL_INIT_DONE ? 0 : 1;
1700 
1701 	if (may_sleep) {
1702 		SET_BUSY(sc);
1703 		gave_up_lock = 1;
1704 		ADAPTER_UNLOCK(sc);
1705 	}
1706 
1707 	if (sc->open_device_map == 0 && ((rc = cxgb_up(sc)) != 0))
1708 			goto done;
1709 
1710 	PORT_LOCK(p);
1711 	if (isset(&sc->open_device_map, p->port_id) &&
1712 	    (ifp->if_drv_flags & IFF_DRV_RUNNING)) {
1713 		PORT_UNLOCK(p);
1714 		goto done;
1715 	}
1716 	t3_port_intr_enable(sc, p->port_id);
1717 	if (!mac->multiport)
1718 		t3_mac_init(mac);
1719 	cxgb_update_mac_settings(p);
1720 	t3_link_start(&p->phy, mac, &p->link_config);
1721 	t3_mac_enable(mac, MAC_DIRECTION_RX | MAC_DIRECTION_TX);
1722 	ifp->if_drv_flags |= IFF_DRV_RUNNING;
1723 	ifp->if_drv_flags &= ~IFF_DRV_OACTIVE;
1724 	PORT_UNLOCK(p);
1725 
1726 	for (i = p->first_qset; i < p->first_qset + p->nqsets; i++) {
1727 		struct sge_qset *qs = &sc->sge.qs[i];
1728 		struct sge_txq *txq = &qs->txq[TXQ_ETH];
1729 
1730 		callout_reset_on(&txq->txq_watchdog, hz, cxgb_tx_watchdog, qs,
1731 				 txq->txq_watchdog.c_cpu);
1732 	}
1733 
1734 	/* all ok */
1735 	setbit(&sc->open_device_map, p->port_id);
1736 	callout_reset(&p->link_check_ch,
1737 	    p->phy.caps & SUPPORTED_LINK_IRQ ?  hz * 3 : hz / 4,
1738 	    link_check_callout, p);
1739 
1740 done:
1741 	if (may_sleep) {
1742 		ADAPTER_LOCK(sc);
1743 		KASSERT(IS_BUSY(sc), ("%s: controller not busy.", __func__));
1744 		CLR_BUSY(sc);
1745 	}
1746 	if (gave_up_lock)
1747 		wakeup_one(&sc->flags);
1748 	ADAPTER_UNLOCK(sc);
1749 	return (rc);
1750 }
1751 
1752 static int
1753 cxgb_uninit_locked(struct port_info *p)
1754 {
1755 	struct adapter *sc = p->adapter;
1756 	int rc;
1757 
1758 	ADAPTER_LOCK_ASSERT_OWNED(sc);
1759 
1760 	while (!IS_DOOMED(p) && IS_BUSY(sc)) {
1761 		if (mtx_sleep(&sc->flags, &sc->lock, PCATCH, "cxgbunin", 0)) {
1762 			rc = EINTR;
1763 			goto done;
1764 		}
1765 	}
1766 	if (IS_DOOMED(p)) {
1767 		rc = ENXIO;
1768 		goto done;
1769 	}
1770 	KASSERT(!IS_BUSY(sc), ("%s: controller busy.", __func__));
1771 	SET_BUSY(sc);
1772 	ADAPTER_UNLOCK(sc);
1773 
1774 	rc = cxgb_uninit_synchronized(p);
1775 
1776 	ADAPTER_LOCK(sc);
1777 	KASSERT(IS_BUSY(sc), ("%s: controller not busy.", __func__));
1778 	CLR_BUSY(sc);
1779 	wakeup_one(&sc->flags);
1780 done:
1781 	ADAPTER_UNLOCK(sc);
1782 	return (rc);
1783 }
1784 
1785 /*
1786  * Called on "ifconfig down", and from port_detach
1787  */
1788 static int
1789 cxgb_uninit_synchronized(struct port_info *pi)
1790 {
1791 	struct adapter *sc = pi->adapter;
1792 	struct ifnet *ifp = pi->ifp;
1793 
1794 	/*
1795 	 * taskqueue_drain may cause a deadlock if the adapter lock is held.
1796 	 */
1797 	ADAPTER_LOCK_ASSERT_NOTOWNED(sc);
1798 
1799 	/*
1800 	 * Clear this port's bit from the open device map, and then drain all
1801 	 * the tasks that can access/manipulate this port's port_info or ifp.
1802 	 * We disable this port's interrupts here and so the slow/ext
1803 	 * interrupt tasks won't be enqueued.  The tick task will continue to
1804 	 * be enqueued every second but the runs after this drain will not see
1805 	 * this port in the open device map.
1806 	 *
1807 	 * A well behaved task must take open_device_map into account and ignore
1808 	 * ports that are not open.
1809 	 */
1810 	clrbit(&sc->open_device_map, pi->port_id);
1811 	t3_port_intr_disable(sc, pi->port_id);
1812 	taskqueue_drain(sc->tq, &sc->slow_intr_task);
1813 	taskqueue_drain(sc->tq, &sc->tick_task);
1814 
1815 	callout_drain(&pi->link_check_ch);
1816 	taskqueue_drain(sc->tq, &pi->link_check_task);
1817 
1818 	PORT_LOCK(pi);
1819 	ifp->if_drv_flags &= ~(IFF_DRV_RUNNING | IFF_DRV_OACTIVE);
1820 
1821 	/* disable pause frames */
1822 	t3_set_reg_field(sc, A_XGM_TX_CFG + pi->mac.offset, F_TXPAUSEEN, 0);
1823 
1824 	/* Reset RX FIFO HWM */
1825 	t3_set_reg_field(sc, A_XGM_RXFIFO_CFG +  pi->mac.offset,
1826 			 V_RXFIFOPAUSEHWM(M_RXFIFOPAUSEHWM), 0);
1827 
1828 	DELAY(100 * 1000);
1829 
1830 	/* Wait for TXFIFO empty */
1831 	t3_wait_op_done(sc, A_XGM_TXFIFO_CFG + pi->mac.offset,
1832 			F_TXFIFO_EMPTY, 1, 20, 5);
1833 
1834 	DELAY(100 * 1000);
1835 	t3_mac_disable(&pi->mac, MAC_DIRECTION_RX);
1836 
1837 	pi->phy.ops->power_down(&pi->phy, 1);
1838 
1839 	PORT_UNLOCK(pi);
1840 
1841 	pi->link_config.link_ok = 0;
1842 	t3_os_link_changed(sc, pi->port_id, 0, 0, 0, 0, 0);
1843 
1844 	if (sc->open_device_map == 0)
1845 		cxgb_down(pi->adapter);
1846 
1847 	return (0);
1848 }
1849 
1850 /*
1851  * Mark lro enabled or disabled in all qsets for this port
1852  */
1853 static int
1854 cxgb_set_lro(struct port_info *p, int enabled)
1855 {
1856 	int i;
1857 	struct adapter *adp = p->adapter;
1858 	struct sge_qset *q;
1859 
1860 	for (i = 0; i < p->nqsets; i++) {
1861 		q = &adp->sge.qs[p->first_qset + i];
1862 		q->lro.enabled = (enabled != 0);
1863 	}
1864 	return (0);
1865 }
1866 
1867 static int
1868 cxgb_ioctl(struct ifnet *ifp, unsigned long command, caddr_t data)
1869 {
1870 	struct port_info *p = ifp->if_softc;
1871 	struct adapter *sc = p->adapter;
1872 	struct ifreq *ifr = (struct ifreq *)data;
1873 	int flags, error = 0, mtu;
1874 	uint32_t mask;
1875 
1876 	switch (command) {
1877 	case SIOCSIFMTU:
1878 		ADAPTER_LOCK(sc);
1879 		error = IS_DOOMED(p) ? ENXIO : (IS_BUSY(sc) ? EBUSY : 0);
1880 		if (error) {
1881 fail:
1882 			ADAPTER_UNLOCK(sc);
1883 			return (error);
1884 		}
1885 
1886 		mtu = ifr->ifr_mtu;
1887 		if ((mtu < ETHERMIN) || (mtu > ETHERMTU_JUMBO)) {
1888 			error = EINVAL;
1889 		} else {
1890 			ifp->if_mtu = mtu;
1891 			PORT_LOCK(p);
1892 			cxgb_update_mac_settings(p);
1893 			PORT_UNLOCK(p);
1894 		}
1895 		ADAPTER_UNLOCK(sc);
1896 		break;
1897 	case SIOCSIFFLAGS:
1898 		ADAPTER_LOCK(sc);
1899 		if (IS_DOOMED(p)) {
1900 			error = ENXIO;
1901 			goto fail;
1902 		}
1903 		if (ifp->if_flags & IFF_UP) {
1904 			if (ifp->if_drv_flags & IFF_DRV_RUNNING) {
1905 				flags = p->if_flags;
1906 				if (((ifp->if_flags ^ flags) & IFF_PROMISC) ||
1907 				    ((ifp->if_flags ^ flags) & IFF_ALLMULTI)) {
1908 					if (IS_BUSY(sc)) {
1909 						error = EBUSY;
1910 						goto fail;
1911 					}
1912 					PORT_LOCK(p);
1913 					cxgb_update_mac_settings(p);
1914 					PORT_UNLOCK(p);
1915 				}
1916 				ADAPTER_UNLOCK(sc);
1917 			} else
1918 				error = cxgb_init_locked(p);
1919 			p->if_flags = ifp->if_flags;
1920 		} else if (ifp->if_drv_flags & IFF_DRV_RUNNING)
1921 			error = cxgb_uninit_locked(p);
1922 		else
1923 			ADAPTER_UNLOCK(sc);
1924 
1925 		ADAPTER_LOCK_ASSERT_NOTOWNED(sc);
1926 		break;
1927 	case SIOCADDMULTI:
1928 	case SIOCDELMULTI:
1929 		ADAPTER_LOCK(sc);
1930 		error = IS_DOOMED(p) ? ENXIO : (IS_BUSY(sc) ? EBUSY : 0);
1931 		if (error)
1932 			goto fail;
1933 
1934 		if (ifp->if_drv_flags & IFF_DRV_RUNNING) {
1935 			PORT_LOCK(p);
1936 			cxgb_update_mac_settings(p);
1937 			PORT_UNLOCK(p);
1938 		}
1939 		ADAPTER_UNLOCK(sc);
1940 
1941 		break;
1942 	case SIOCSIFCAP:
1943 		ADAPTER_LOCK(sc);
1944 		error = IS_DOOMED(p) ? ENXIO : (IS_BUSY(sc) ? EBUSY : 0);
1945 		if (error)
1946 			goto fail;
1947 
1948 		mask = ifr->ifr_reqcap ^ ifp->if_capenable;
1949 		if (mask & IFCAP_TXCSUM) {
1950 			ifp->if_capenable ^= IFCAP_TXCSUM;
1951 			ifp->if_hwassist ^= (CSUM_TCP | CSUM_UDP | CSUM_IP);
1952 
1953 			if (IFCAP_TSO4 & ifp->if_capenable &&
1954 			    !(IFCAP_TXCSUM & ifp->if_capenable)) {
1955 				ifp->if_capenable &= ~IFCAP_TSO4;
1956 				if_printf(ifp,
1957 				    "tso4 disabled due to -txcsum.\n");
1958 			}
1959 		}
1960 		if (mask & IFCAP_TXCSUM_IPV6) {
1961 			ifp->if_capenable ^= IFCAP_TXCSUM_IPV6;
1962 			ifp->if_hwassist ^= (CSUM_UDP_IPV6 | CSUM_TCP_IPV6);
1963 
1964 			if (IFCAP_TSO6 & ifp->if_capenable &&
1965 			    !(IFCAP_TXCSUM_IPV6 & ifp->if_capenable)) {
1966 				ifp->if_capenable &= ~IFCAP_TSO6;
1967 				if_printf(ifp,
1968 				    "tso6 disabled due to -txcsum6.\n");
1969 			}
1970 		}
1971 		if (mask & IFCAP_RXCSUM)
1972 			ifp->if_capenable ^= IFCAP_RXCSUM;
1973 		if (mask & IFCAP_RXCSUM_IPV6)
1974 			ifp->if_capenable ^= IFCAP_RXCSUM_IPV6;
1975 
1976 		/*
1977 		 * Note that we leave CSUM_TSO alone (it is always set).  The
1978 		 * kernel takes both IFCAP_TSOx and CSUM_TSO into account before
1979 		 * sending a TSO request our way, so it's sufficient to toggle
1980 		 * IFCAP_TSOx only.
1981 		 */
1982 		if (mask & IFCAP_TSO4) {
1983 			if (!(IFCAP_TSO4 & ifp->if_capenable) &&
1984 			    !(IFCAP_TXCSUM & ifp->if_capenable)) {
1985 				if_printf(ifp, "enable txcsum first.\n");
1986 				error = EAGAIN;
1987 				goto fail;
1988 			}
1989 			ifp->if_capenable ^= IFCAP_TSO4;
1990 		}
1991 		if (mask & IFCAP_TSO6) {
1992 			if (!(IFCAP_TSO6 & ifp->if_capenable) &&
1993 			    !(IFCAP_TXCSUM_IPV6 & ifp->if_capenable)) {
1994 				if_printf(ifp, "enable txcsum6 first.\n");
1995 				error = EAGAIN;
1996 				goto fail;
1997 			}
1998 			ifp->if_capenable ^= IFCAP_TSO6;
1999 		}
2000 		if (mask & IFCAP_LRO) {
2001 			ifp->if_capenable ^= IFCAP_LRO;
2002 
2003 			/* Safe to do this even if cxgb_up not called yet */
2004 			cxgb_set_lro(p, ifp->if_capenable & IFCAP_LRO);
2005 		}
2006 #ifdef TCP_OFFLOAD
2007 		if (mask & IFCAP_TOE4) {
2008 			int enable = (ifp->if_capenable ^ mask) & IFCAP_TOE4;
2009 
2010 			error = toe_capability(p, enable);
2011 			if (error == 0)
2012 				ifp->if_capenable ^= mask;
2013 		}
2014 #endif
2015 		if (mask & IFCAP_VLAN_HWTAGGING) {
2016 			ifp->if_capenable ^= IFCAP_VLAN_HWTAGGING;
2017 			if (ifp->if_drv_flags & IFF_DRV_RUNNING) {
2018 				PORT_LOCK(p);
2019 				cxgb_update_mac_settings(p);
2020 				PORT_UNLOCK(p);
2021 			}
2022 		}
2023 		if (mask & IFCAP_VLAN_MTU) {
2024 			ifp->if_capenable ^= IFCAP_VLAN_MTU;
2025 			if (ifp->if_drv_flags & IFF_DRV_RUNNING) {
2026 				PORT_LOCK(p);
2027 				cxgb_update_mac_settings(p);
2028 				PORT_UNLOCK(p);
2029 			}
2030 		}
2031 		if (mask & IFCAP_VLAN_HWTSO)
2032 			ifp->if_capenable ^= IFCAP_VLAN_HWTSO;
2033 		if (mask & IFCAP_VLAN_HWCSUM)
2034 			ifp->if_capenable ^= IFCAP_VLAN_HWCSUM;
2035 
2036 #ifdef VLAN_CAPABILITIES
2037 		VLAN_CAPABILITIES(ifp);
2038 #endif
2039 		ADAPTER_UNLOCK(sc);
2040 		break;
2041 	case SIOCSIFMEDIA:
2042 	case SIOCGIFMEDIA:
2043 		error = ifmedia_ioctl(ifp, ifr, &p->media, command);
2044 		break;
2045 	default:
2046 		error = ether_ioctl(ifp, command, data);
2047 	}
2048 
2049 	return (error);
2050 }
2051 
2052 static int
2053 cxgb_media_change(struct ifnet *ifp)
2054 {
2055 	return (EOPNOTSUPP);
2056 }
2057 
2058 /*
2059  * Translates phy->modtype to the correct Ethernet media subtype.
2060  */
2061 static int
2062 cxgb_ifm_type(int mod)
2063 {
2064 	switch (mod) {
2065 	case phy_modtype_sr:
2066 		return (IFM_10G_SR);
2067 	case phy_modtype_lr:
2068 		return (IFM_10G_LR);
2069 	case phy_modtype_lrm:
2070 		return (IFM_10G_LRM);
2071 	case phy_modtype_twinax:
2072 		return (IFM_10G_TWINAX);
2073 	case phy_modtype_twinax_long:
2074 		return (IFM_10G_TWINAX_LONG);
2075 	case phy_modtype_none:
2076 		return (IFM_NONE);
2077 	case phy_modtype_unknown:
2078 		return (IFM_UNKNOWN);
2079 	}
2080 
2081 	KASSERT(0, ("%s: modtype %d unknown", __func__, mod));
2082 	return (IFM_UNKNOWN);
2083 }
2084 
2085 /*
2086  * Rebuilds the ifmedia list for this port, and sets the current media.
2087  */
2088 static void
2089 cxgb_build_medialist(struct port_info *p)
2090 {
2091 	struct cphy *phy = &p->phy;
2092 	struct ifmedia *media = &p->media;
2093 	int mod = phy->modtype;
2094 	int m = IFM_ETHER | IFM_FDX;
2095 
2096 	PORT_LOCK(p);
2097 
2098 	ifmedia_removeall(media);
2099 	if (phy->caps & SUPPORTED_TP && phy->caps & SUPPORTED_Autoneg) {
2100 		/* Copper (RJ45) */
2101 
2102 		if (phy->caps & SUPPORTED_10000baseT_Full)
2103 			ifmedia_add(media, m | IFM_10G_T, mod, NULL);
2104 
2105 		if (phy->caps & SUPPORTED_1000baseT_Full)
2106 			ifmedia_add(media, m | IFM_1000_T, mod, NULL);
2107 
2108 		if (phy->caps & SUPPORTED_100baseT_Full)
2109 			ifmedia_add(media, m | IFM_100_TX, mod, NULL);
2110 
2111 		if (phy->caps & SUPPORTED_10baseT_Full)
2112 			ifmedia_add(media, m | IFM_10_T, mod, NULL);
2113 
2114 		ifmedia_add(media, IFM_ETHER | IFM_AUTO, mod, NULL);
2115 		ifmedia_set(media, IFM_ETHER | IFM_AUTO);
2116 
2117 	} else if (phy->caps & SUPPORTED_TP) {
2118 		/* Copper (CX4) */
2119 
2120 		KASSERT(phy->caps & SUPPORTED_10000baseT_Full,
2121 			("%s: unexpected cap 0x%x", __func__, phy->caps));
2122 
2123 		ifmedia_add(media, m | IFM_10G_CX4, mod, NULL);
2124 		ifmedia_set(media, m | IFM_10G_CX4);
2125 
2126 	} else if (phy->caps & SUPPORTED_FIBRE &&
2127 		   phy->caps & SUPPORTED_10000baseT_Full) {
2128 		/* 10G optical (but includes SFP+ twinax) */
2129 
2130 		m |= cxgb_ifm_type(mod);
2131 		if (IFM_SUBTYPE(m) == IFM_NONE)
2132 			m &= ~IFM_FDX;
2133 
2134 		ifmedia_add(media, m, mod, NULL);
2135 		ifmedia_set(media, m);
2136 
2137 	} else if (phy->caps & SUPPORTED_FIBRE &&
2138 		   phy->caps & SUPPORTED_1000baseT_Full) {
2139 		/* 1G optical */
2140 
2141 		/* XXX: Lie and claim to be SX, could actually be any 1G-X */
2142 		ifmedia_add(media, m | IFM_1000_SX, mod, NULL);
2143 		ifmedia_set(media, m | IFM_1000_SX);
2144 
2145 	} else {
2146 		KASSERT(0, ("%s: don't know how to handle 0x%x.", __func__,
2147 			    phy->caps));
2148 	}
2149 
2150 	PORT_UNLOCK(p);
2151 }
2152 
2153 static void
2154 cxgb_media_status(struct ifnet *ifp, struct ifmediareq *ifmr)
2155 {
2156 	struct port_info *p = ifp->if_softc;
2157 	struct ifmedia_entry *cur = p->media.ifm_cur;
2158 	int speed = p->link_config.speed;
2159 
2160 	if (cur->ifm_data != p->phy.modtype) {
2161 		cxgb_build_medialist(p);
2162 		cur = p->media.ifm_cur;
2163 	}
2164 
2165 	ifmr->ifm_status = IFM_AVALID;
2166 	if (!p->link_config.link_ok)
2167 		return;
2168 
2169 	ifmr->ifm_status |= IFM_ACTIVE;
2170 
2171 	/*
2172 	 * active and current will differ iff current media is autoselect.  That
2173 	 * can happen only for copper RJ45.
2174 	 */
2175 	if (IFM_SUBTYPE(cur->ifm_media) != IFM_AUTO)
2176 		return;
2177 	KASSERT(p->phy.caps & SUPPORTED_TP && p->phy.caps & SUPPORTED_Autoneg,
2178 		("%s: unexpected PHY caps 0x%x", __func__, p->phy.caps));
2179 
2180 	ifmr->ifm_active = IFM_ETHER | IFM_FDX;
2181 	if (speed == SPEED_10000)
2182 		ifmr->ifm_active |= IFM_10G_T;
2183 	else if (speed == SPEED_1000)
2184 		ifmr->ifm_active |= IFM_1000_T;
2185 	else if (speed == SPEED_100)
2186 		ifmr->ifm_active |= IFM_100_TX;
2187 	else if (speed == SPEED_10)
2188 		ifmr->ifm_active |= IFM_10_T;
2189 	else
2190 		KASSERT(0, ("%s: link up but speed unknown (%u)", __func__,
2191 			    speed));
2192 }
2193 
2194 static uint64_t
2195 cxgb_get_counter(struct ifnet *ifp, ift_counter c)
2196 {
2197 	struct port_info *pi = ifp->if_softc;
2198 	struct adapter *sc = pi->adapter;
2199 	struct cmac *mac = &pi->mac;
2200 	struct mac_stats *mstats = &mac->stats;
2201 
2202 	cxgb_refresh_stats(pi);
2203 
2204 	switch (c) {
2205 	case IFCOUNTER_IPACKETS:
2206 		return (mstats->rx_frames);
2207 
2208 	case IFCOUNTER_IERRORS:
2209 		return (mstats->rx_jabber + mstats->rx_data_errs +
2210 		    mstats->rx_sequence_errs + mstats->rx_runt +
2211 		    mstats->rx_too_long + mstats->rx_mac_internal_errs +
2212 		    mstats->rx_short + mstats->rx_fcs_errs);
2213 
2214 	case IFCOUNTER_OPACKETS:
2215 		return (mstats->tx_frames);
2216 
2217 	case IFCOUNTER_OERRORS:
2218 		return (mstats->tx_excess_collisions + mstats->tx_underrun +
2219 		    mstats->tx_len_errs + mstats->tx_mac_internal_errs +
2220 		    mstats->tx_excess_deferral + mstats->tx_fcs_errs);
2221 
2222 	case IFCOUNTER_COLLISIONS:
2223 		return (mstats->tx_total_collisions);
2224 
2225 	case IFCOUNTER_IBYTES:
2226 		return (mstats->rx_octets);
2227 
2228 	case IFCOUNTER_OBYTES:
2229 		return (mstats->tx_octets);
2230 
2231 	case IFCOUNTER_IMCASTS:
2232 		return (mstats->rx_mcast_frames);
2233 
2234 	case IFCOUNTER_OMCASTS:
2235 		return (mstats->tx_mcast_frames);
2236 
2237 	case IFCOUNTER_IQDROPS:
2238 		return (mstats->rx_cong_drops);
2239 
2240 	case IFCOUNTER_OQDROPS: {
2241 		int i;
2242 		uint64_t drops;
2243 
2244 		drops = 0;
2245 		if (sc->flags & FULL_INIT_DONE) {
2246 			for (i = pi->first_qset; i < pi->first_qset + pi->nqsets; i++)
2247 				drops += sc->sge.qs[i].txq[TXQ_ETH].txq_mr->br_drops;
2248 		}
2249 
2250 		return (drops);
2251 
2252 	}
2253 
2254 	default:
2255 		return (if_get_counter_default(ifp, c));
2256 	}
2257 }
2258 
2259 static void
2260 cxgb_async_intr(void *data)
2261 {
2262 	adapter_t *sc = data;
2263 
2264 	t3_write_reg(sc, A_PL_INT_ENABLE0, 0);
2265 	(void) t3_read_reg(sc, A_PL_INT_ENABLE0);
2266 	taskqueue_enqueue(sc->tq, &sc->slow_intr_task);
2267 }
2268 
2269 static void
2270 link_check_callout(void *arg)
2271 {
2272 	struct port_info *pi = arg;
2273 	struct adapter *sc = pi->adapter;
2274 
2275 	if (!isset(&sc->open_device_map, pi->port_id))
2276 		return;
2277 
2278 	taskqueue_enqueue(sc->tq, &pi->link_check_task);
2279 }
2280 
2281 static void
2282 check_link_status(void *arg, int pending)
2283 {
2284 	struct port_info *pi = arg;
2285 	struct adapter *sc = pi->adapter;
2286 
2287 	if (!isset(&sc->open_device_map, pi->port_id))
2288 		return;
2289 
2290 	t3_link_changed(sc, pi->port_id);
2291 
2292 	if (pi->link_fault || !(pi->phy.caps & SUPPORTED_LINK_IRQ))
2293 		callout_reset(&pi->link_check_ch, hz, link_check_callout, pi);
2294 }
2295 
2296 void
2297 t3_os_link_intr(struct port_info *pi)
2298 {
2299 	/*
2300 	 * Schedule a link check in the near future.  If the link is flapping
2301 	 * rapidly we'll keep resetting the callout and delaying the check until
2302 	 * things stabilize a bit.
2303 	 */
2304 	callout_reset(&pi->link_check_ch, hz / 4, link_check_callout, pi);
2305 }
2306 
2307 static void
2308 check_t3b2_mac(struct adapter *sc)
2309 {
2310 	int i;
2311 
2312 	if (sc->flags & CXGB_SHUTDOWN)
2313 		return;
2314 
2315 	for_each_port(sc, i) {
2316 		struct port_info *p = &sc->port[i];
2317 		int status;
2318 #ifdef INVARIANTS
2319 		struct ifnet *ifp = p->ifp;
2320 #endif
2321 
2322 		if (!isset(&sc->open_device_map, p->port_id) || p->link_fault ||
2323 		    !p->link_config.link_ok)
2324 			continue;
2325 
2326 		KASSERT(ifp->if_drv_flags & IFF_DRV_RUNNING,
2327 			("%s: state mismatch (drv_flags %x, device_map %x)",
2328 			 __func__, ifp->if_drv_flags, sc->open_device_map));
2329 
2330 		PORT_LOCK(p);
2331 		status = t3b2_mac_watchdog_task(&p->mac);
2332 		if (status == 1)
2333 			p->mac.stats.num_toggled++;
2334 		else if (status == 2) {
2335 			struct cmac *mac = &p->mac;
2336 
2337 			cxgb_update_mac_settings(p);
2338 			t3_link_start(&p->phy, mac, &p->link_config);
2339 			t3_mac_enable(mac, MAC_DIRECTION_RX | MAC_DIRECTION_TX);
2340 			t3_port_intr_enable(sc, p->port_id);
2341 			p->mac.stats.num_resets++;
2342 		}
2343 		PORT_UNLOCK(p);
2344 	}
2345 }
2346 
2347 static void
2348 cxgb_tick(void *arg)
2349 {
2350 	adapter_t *sc = (adapter_t *)arg;
2351 
2352 	if (sc->flags & CXGB_SHUTDOWN)
2353 		return;
2354 
2355 	taskqueue_enqueue(sc->tq, &sc->tick_task);
2356 	callout_reset(&sc->cxgb_tick_ch, hz, cxgb_tick, sc);
2357 }
2358 
2359 void
2360 cxgb_refresh_stats(struct port_info *pi)
2361 {
2362 	struct timeval tv;
2363 	const struct timeval interval = {0, 250000};    /* 250ms */
2364 
2365 	getmicrotime(&tv);
2366 	timevalsub(&tv, &interval);
2367 	if (timevalcmp(&tv, &pi->last_refreshed, <))
2368 		return;
2369 
2370 	PORT_LOCK(pi);
2371 	t3_mac_update_stats(&pi->mac);
2372 	PORT_UNLOCK(pi);
2373 	getmicrotime(&pi->last_refreshed);
2374 }
2375 
2376 static void
2377 cxgb_tick_handler(void *arg, int count)
2378 {
2379 	adapter_t *sc = (adapter_t *)arg;
2380 	const struct adapter_params *p = &sc->params;
2381 	int i;
2382 	uint32_t cause, reset;
2383 
2384 	if (sc->flags & CXGB_SHUTDOWN || !(sc->flags & FULL_INIT_DONE))
2385 		return;
2386 
2387 	if (p->rev == T3_REV_B2 && p->nports < 4 && sc->open_device_map)
2388 		check_t3b2_mac(sc);
2389 
2390 	cause = t3_read_reg(sc, A_SG_INT_CAUSE) & (F_RSPQSTARVE | F_FLEMPTY);
2391 	if (cause) {
2392 		struct sge_qset *qs = &sc->sge.qs[0];
2393 		uint32_t mask, v;
2394 
2395 		v = t3_read_reg(sc, A_SG_RSPQ_FL_STATUS) & ~0xff00;
2396 
2397 		mask = 1;
2398 		for (i = 0; i < SGE_QSETS; i++) {
2399 			if (v & mask)
2400 				qs[i].rspq.starved++;
2401 			mask <<= 1;
2402 		}
2403 
2404 		mask <<= SGE_QSETS; /* skip RSPQXDISABLED */
2405 
2406 		for (i = 0; i < SGE_QSETS * 2; i++) {
2407 			if (v & mask) {
2408 				qs[i / 2].fl[i % 2].empty++;
2409 			}
2410 			mask <<= 1;
2411 		}
2412 
2413 		/* clear */
2414 		t3_write_reg(sc, A_SG_RSPQ_FL_STATUS, v);
2415 		t3_write_reg(sc, A_SG_INT_CAUSE, cause);
2416 	}
2417 
2418 	for (i = 0; i < sc->params.nports; i++) {
2419 		struct port_info *pi = &sc->port[i];
2420 		struct cmac *mac = &pi->mac;
2421 
2422 		if (!isset(&sc->open_device_map, pi->port_id))
2423 			continue;
2424 
2425 		cxgb_refresh_stats(pi);
2426 
2427 		if (mac->multiport)
2428 			continue;
2429 
2430 		/* Count rx fifo overflows, once per second */
2431 		cause = t3_read_reg(sc, A_XGM_INT_CAUSE + mac->offset);
2432 		reset = 0;
2433 		if (cause & F_RXFIFO_OVERFLOW) {
2434 			mac->stats.rx_fifo_ovfl++;
2435 			reset |= F_RXFIFO_OVERFLOW;
2436 		}
2437 		t3_write_reg(sc, A_XGM_INT_CAUSE + mac->offset, reset);
2438 	}
2439 }
2440 
2441 static void
2442 touch_bars(device_t dev)
2443 {
2444 	/*
2445 	 * Don't enable yet
2446 	 */
2447 #if !defined(__LP64__) && 0
2448 	u32 v;
2449 
2450 	pci_read_config_dword(pdev, PCI_BASE_ADDRESS_1, &v);
2451 	pci_write_config_dword(pdev, PCI_BASE_ADDRESS_1, v);
2452 	pci_read_config_dword(pdev, PCI_BASE_ADDRESS_3, &v);
2453 	pci_write_config_dword(pdev, PCI_BASE_ADDRESS_3, v);
2454 	pci_read_config_dword(pdev, PCI_BASE_ADDRESS_5, &v);
2455 	pci_write_config_dword(pdev, PCI_BASE_ADDRESS_5, v);
2456 #endif
2457 }
2458 
2459 static int
2460 set_eeprom(struct port_info *pi, const uint8_t *data, int len, int offset)
2461 {
2462 	uint8_t *buf;
2463 	int err = 0;
2464 	u32 aligned_offset, aligned_len, *p;
2465 	struct adapter *adapter = pi->adapter;
2466 
2467 
2468 	aligned_offset = offset & ~3;
2469 	aligned_len = (len + (offset & 3) + 3) & ~3;
2470 
2471 	if (aligned_offset != offset || aligned_len != len) {
2472 		buf = malloc(aligned_len, M_DEVBUF, M_WAITOK|M_ZERO);
2473 		if (!buf)
2474 			return (ENOMEM);
2475 		err = t3_seeprom_read(adapter, aligned_offset, (u32 *)buf);
2476 		if (!err && aligned_len > 4)
2477 			err = t3_seeprom_read(adapter,
2478 					      aligned_offset + aligned_len - 4,
2479 					      (u32 *)&buf[aligned_len - 4]);
2480 		if (err)
2481 			goto out;
2482 		memcpy(buf + (offset & 3), data, len);
2483 	} else
2484 		buf = (uint8_t *)(uintptr_t)data;
2485 
2486 	err = t3_seeprom_wp(adapter, 0);
2487 	if (err)
2488 		goto out;
2489 
2490 	for (p = (u32 *)buf; !err && aligned_len; aligned_len -= 4, p++) {
2491 		err = t3_seeprom_write(adapter, aligned_offset, *p);
2492 		aligned_offset += 4;
2493 	}
2494 
2495 	if (!err)
2496 		err = t3_seeprom_wp(adapter, 1);
2497 out:
2498 	if (buf != data)
2499 		free(buf, M_DEVBUF);
2500 	return err;
2501 }
2502 
2503 
2504 static int
2505 in_range(int val, int lo, int hi)
2506 {
2507 	return val < 0 || (val <= hi && val >= lo);
2508 }
2509 
2510 static int
2511 cxgb_extension_open(struct cdev *dev, int flags, int fmp, struct thread *td)
2512 {
2513        return (0);
2514 }
2515 
2516 static int
2517 cxgb_extension_close(struct cdev *dev, int flags, int fmt, struct thread *td)
2518 {
2519        return (0);
2520 }
2521 
2522 static int
2523 cxgb_extension_ioctl(struct cdev *dev, unsigned long cmd, caddr_t data,
2524     int fflag, struct thread *td)
2525 {
2526 	int mmd, error = 0;
2527 	struct port_info *pi = dev->si_drv1;
2528 	adapter_t *sc = pi->adapter;
2529 
2530 #ifdef PRIV_SUPPORTED
2531 	if (priv_check(td, PRIV_DRIVER)) {
2532 		if (cxgb_debug)
2533 			printf("user does not have access to privileged ioctls\n");
2534 		return (EPERM);
2535 	}
2536 #else
2537 	if (suser(td)) {
2538 		if (cxgb_debug)
2539 			printf("user does not have access to privileged ioctls\n");
2540 		return (EPERM);
2541 	}
2542 #endif
2543 
2544 	switch (cmd) {
2545 	case CHELSIO_GET_MIIREG: {
2546 		uint32_t val;
2547 		struct cphy *phy = &pi->phy;
2548 		struct ch_mii_data *mid = (struct ch_mii_data *)data;
2549 
2550 		if (!phy->mdio_read)
2551 			return (EOPNOTSUPP);
2552 		if (is_10G(sc)) {
2553 			mmd = mid->phy_id >> 8;
2554 			if (!mmd)
2555 				mmd = MDIO_DEV_PCS;
2556 			else if (mmd > MDIO_DEV_VEND2)
2557 				return (EINVAL);
2558 
2559 			error = phy->mdio_read(sc, mid->phy_id & 0x1f, mmd,
2560 					     mid->reg_num, &val);
2561 		} else
2562 		        error = phy->mdio_read(sc, mid->phy_id & 0x1f, 0,
2563 					     mid->reg_num & 0x1f, &val);
2564 		if (error == 0)
2565 			mid->val_out = val;
2566 		break;
2567 	}
2568 	case CHELSIO_SET_MIIREG: {
2569 		struct cphy *phy = &pi->phy;
2570 		struct ch_mii_data *mid = (struct ch_mii_data *)data;
2571 
2572 		if (!phy->mdio_write)
2573 			return (EOPNOTSUPP);
2574 		if (is_10G(sc)) {
2575 			mmd = mid->phy_id >> 8;
2576 			if (!mmd)
2577 				mmd = MDIO_DEV_PCS;
2578 			else if (mmd > MDIO_DEV_VEND2)
2579 				return (EINVAL);
2580 
2581 			error = phy->mdio_write(sc, mid->phy_id & 0x1f,
2582 					      mmd, mid->reg_num, mid->val_in);
2583 		} else
2584 			error = phy->mdio_write(sc, mid->phy_id & 0x1f, 0,
2585 					      mid->reg_num & 0x1f,
2586 					      mid->val_in);
2587 		break;
2588 	}
2589 	case CHELSIO_SETREG: {
2590 		struct ch_reg *edata = (struct ch_reg *)data;
2591 		if ((edata->addr & 0x3) != 0 || edata->addr >= sc->mmio_len)
2592 			return (EFAULT);
2593 		t3_write_reg(sc, edata->addr, edata->val);
2594 		break;
2595 	}
2596 	case CHELSIO_GETREG: {
2597 		struct ch_reg *edata = (struct ch_reg *)data;
2598 		if ((edata->addr & 0x3) != 0 || edata->addr >= sc->mmio_len)
2599 			return (EFAULT);
2600 		edata->val = t3_read_reg(sc, edata->addr);
2601 		break;
2602 	}
2603 	case CHELSIO_GET_SGE_CONTEXT: {
2604 		struct ch_cntxt *ecntxt = (struct ch_cntxt *)data;
2605 		mtx_lock_spin(&sc->sge.reg_lock);
2606 		switch (ecntxt->cntxt_type) {
2607 		case CNTXT_TYPE_EGRESS:
2608 			error = -t3_sge_read_ecntxt(sc, ecntxt->cntxt_id,
2609 			    ecntxt->data);
2610 			break;
2611 		case CNTXT_TYPE_FL:
2612 			error = -t3_sge_read_fl(sc, ecntxt->cntxt_id,
2613 			    ecntxt->data);
2614 			break;
2615 		case CNTXT_TYPE_RSP:
2616 			error = -t3_sge_read_rspq(sc, ecntxt->cntxt_id,
2617 			    ecntxt->data);
2618 			break;
2619 		case CNTXT_TYPE_CQ:
2620 			error = -t3_sge_read_cq(sc, ecntxt->cntxt_id,
2621 			    ecntxt->data);
2622 			break;
2623 		default:
2624 			error = EINVAL;
2625 			break;
2626 		}
2627 		mtx_unlock_spin(&sc->sge.reg_lock);
2628 		break;
2629 	}
2630 	case CHELSIO_GET_SGE_DESC: {
2631 		struct ch_desc *edesc = (struct ch_desc *)data;
2632 		int ret;
2633 		if (edesc->queue_num >= SGE_QSETS * 6)
2634 			return (EINVAL);
2635 		ret = t3_get_desc(&sc->sge.qs[edesc->queue_num / 6],
2636 		    edesc->queue_num % 6, edesc->idx, edesc->data);
2637 		if (ret < 0)
2638 			return (EINVAL);
2639 		edesc->size = ret;
2640 		break;
2641 	}
2642 	case CHELSIO_GET_QSET_PARAMS: {
2643 		struct qset_params *q;
2644 		struct ch_qset_params *t = (struct ch_qset_params *)data;
2645 		int q1 = pi->first_qset;
2646 		int nqsets = pi->nqsets;
2647 		int i;
2648 
2649 		if (t->qset_idx >= nqsets)
2650 			return EINVAL;
2651 
2652 		i = q1 + t->qset_idx;
2653 		q = &sc->params.sge.qset[i];
2654 		t->rspq_size   = q->rspq_size;
2655 		t->txq_size[0] = q->txq_size[0];
2656 		t->txq_size[1] = q->txq_size[1];
2657 		t->txq_size[2] = q->txq_size[2];
2658 		t->fl_size[0]  = q->fl_size;
2659 		t->fl_size[1]  = q->jumbo_size;
2660 		t->polling     = q->polling;
2661 		t->lro         = q->lro;
2662 		t->intr_lat    = q->coalesce_usecs;
2663 		t->cong_thres  = q->cong_thres;
2664 		t->qnum        = i;
2665 
2666 		if ((sc->flags & FULL_INIT_DONE) == 0)
2667 			t->vector = 0;
2668 		else if (sc->flags & USING_MSIX)
2669 			t->vector = rman_get_start(sc->msix_irq_res[i]);
2670 		else
2671 			t->vector = rman_get_start(sc->irq_res);
2672 
2673 		break;
2674 	}
2675 	case CHELSIO_GET_QSET_NUM: {
2676 		struct ch_reg *edata = (struct ch_reg *)data;
2677 		edata->val = pi->nqsets;
2678 		break;
2679 	}
2680 	case CHELSIO_LOAD_FW: {
2681 		uint8_t *fw_data;
2682 		uint32_t vers;
2683 		struct ch_mem_range *t = (struct ch_mem_range *)data;
2684 
2685 		/*
2686 		 * You're allowed to load a firmware only before FULL_INIT_DONE
2687 		 *
2688 		 * FW_UPTODATE is also set so the rest of the initialization
2689 		 * will not overwrite what was loaded here.  This gives you the
2690 		 * flexibility to load any firmware (and maybe shoot yourself in
2691 		 * the foot).
2692 		 */
2693 
2694 		ADAPTER_LOCK(sc);
2695 		if (sc->open_device_map || sc->flags & FULL_INIT_DONE) {
2696 			ADAPTER_UNLOCK(sc);
2697 			return (EBUSY);
2698 		}
2699 
2700 		fw_data = malloc(t->len, M_DEVBUF, M_NOWAIT);
2701 		if (!fw_data)
2702 			error = ENOMEM;
2703 		else
2704 			error = copyin(t->buf, fw_data, t->len);
2705 
2706 		if (!error)
2707 			error = -t3_load_fw(sc, fw_data, t->len);
2708 
2709 		if (t3_get_fw_version(sc, &vers) == 0) {
2710 			snprintf(&sc->fw_version[0], sizeof(sc->fw_version),
2711 			    "%d.%d.%d", G_FW_VERSION_MAJOR(vers),
2712 			    G_FW_VERSION_MINOR(vers), G_FW_VERSION_MICRO(vers));
2713 		}
2714 
2715 		if (!error)
2716 			sc->flags |= FW_UPTODATE;
2717 
2718 		free(fw_data, M_DEVBUF);
2719 		ADAPTER_UNLOCK(sc);
2720 		break;
2721 	}
2722 	case CHELSIO_LOAD_BOOT: {
2723 		uint8_t *boot_data;
2724 		struct ch_mem_range *t = (struct ch_mem_range *)data;
2725 
2726 		boot_data = malloc(t->len, M_DEVBUF, M_NOWAIT);
2727 		if (!boot_data)
2728 			return ENOMEM;
2729 
2730 		error = copyin(t->buf, boot_data, t->len);
2731 		if (!error)
2732 			error = -t3_load_boot(sc, boot_data, t->len);
2733 
2734 		free(boot_data, M_DEVBUF);
2735 		break;
2736 	}
2737 	case CHELSIO_GET_PM: {
2738 		struct ch_pm *m = (struct ch_pm *)data;
2739 		struct tp_params *p = &sc->params.tp;
2740 
2741 		if (!is_offload(sc))
2742 			return (EOPNOTSUPP);
2743 
2744 		m->tx_pg_sz = p->tx_pg_size;
2745 		m->tx_num_pg = p->tx_num_pgs;
2746 		m->rx_pg_sz  = p->rx_pg_size;
2747 		m->rx_num_pg = p->rx_num_pgs;
2748 		m->pm_total  = p->pmtx_size + p->chan_rx_size * p->nchan;
2749 
2750 		break;
2751 	}
2752 	case CHELSIO_SET_PM: {
2753 		struct ch_pm *m = (struct ch_pm *)data;
2754 		struct tp_params *p = &sc->params.tp;
2755 
2756 		if (!is_offload(sc))
2757 			return (EOPNOTSUPP);
2758 		if (sc->flags & FULL_INIT_DONE)
2759 			return (EBUSY);
2760 
2761 		if (!m->rx_pg_sz || (m->rx_pg_sz & (m->rx_pg_sz - 1)) ||
2762 		    !m->tx_pg_sz || (m->tx_pg_sz & (m->tx_pg_sz - 1)))
2763 			return (EINVAL);	/* not power of 2 */
2764 		if (!(m->rx_pg_sz & 0x14000))
2765 			return (EINVAL);	/* not 16KB or 64KB */
2766 		if (!(m->tx_pg_sz & 0x1554000))
2767 			return (EINVAL);
2768 		if (m->tx_num_pg == -1)
2769 			m->tx_num_pg = p->tx_num_pgs;
2770 		if (m->rx_num_pg == -1)
2771 			m->rx_num_pg = p->rx_num_pgs;
2772 		if (m->tx_num_pg % 24 || m->rx_num_pg % 24)
2773 			return (EINVAL);
2774 		if (m->rx_num_pg * m->rx_pg_sz > p->chan_rx_size ||
2775 		    m->tx_num_pg * m->tx_pg_sz > p->chan_tx_size)
2776 			return (EINVAL);
2777 
2778 		p->rx_pg_size = m->rx_pg_sz;
2779 		p->tx_pg_size = m->tx_pg_sz;
2780 		p->rx_num_pgs = m->rx_num_pg;
2781 		p->tx_num_pgs = m->tx_num_pg;
2782 		break;
2783 	}
2784 	case CHELSIO_SETMTUTAB: {
2785 		struct ch_mtus *m = (struct ch_mtus *)data;
2786 		int i;
2787 
2788 		if (!is_offload(sc))
2789 			return (EOPNOTSUPP);
2790 		if (offload_running(sc))
2791 			return (EBUSY);
2792 		if (m->nmtus != NMTUS)
2793 			return (EINVAL);
2794 		if (m->mtus[0] < 81)         /* accommodate SACK */
2795 			return (EINVAL);
2796 
2797 		/*
2798 		 * MTUs must be in ascending order
2799 		 */
2800 		for (i = 1; i < NMTUS; ++i)
2801 			if (m->mtus[i] < m->mtus[i - 1])
2802 				return (EINVAL);
2803 
2804 		memcpy(sc->params.mtus, m->mtus, sizeof(sc->params.mtus));
2805 		break;
2806 	}
2807 	case CHELSIO_GETMTUTAB: {
2808 		struct ch_mtus *m = (struct ch_mtus *)data;
2809 
2810 		if (!is_offload(sc))
2811 			return (EOPNOTSUPP);
2812 
2813 		memcpy(m->mtus, sc->params.mtus, sizeof(m->mtus));
2814 		m->nmtus = NMTUS;
2815 		break;
2816 	}
2817 	case CHELSIO_GET_MEM: {
2818 		struct ch_mem_range *t = (struct ch_mem_range *)data;
2819 		struct mc7 *mem;
2820 		uint8_t *useraddr;
2821 		u64 buf[32];
2822 
2823 		/*
2824 		 * Use these to avoid modifying len/addr in the return
2825 		 * struct
2826 		 */
2827 		uint32_t len = t->len, addr = t->addr;
2828 
2829 		if (!is_offload(sc))
2830 			return (EOPNOTSUPP);
2831 		if (!(sc->flags & FULL_INIT_DONE))
2832 			return (EIO);         /* need the memory controllers */
2833 		if ((addr & 0x7) || (len & 0x7))
2834 			return (EINVAL);
2835 		if (t->mem_id == MEM_CM)
2836 			mem = &sc->cm;
2837 		else if (t->mem_id == MEM_PMRX)
2838 			mem = &sc->pmrx;
2839 		else if (t->mem_id == MEM_PMTX)
2840 			mem = &sc->pmtx;
2841 		else
2842 			return (EINVAL);
2843 
2844 		/*
2845 		 * Version scheme:
2846 		 * bits 0..9: chip version
2847 		 * bits 10..15: chip revision
2848 		 */
2849 		t->version = 3 | (sc->params.rev << 10);
2850 
2851 		/*
2852 		 * Read 256 bytes at a time as len can be large and we don't
2853 		 * want to use huge intermediate buffers.
2854 		 */
2855 		useraddr = (uint8_t *)t->buf;
2856 		while (len) {
2857 			unsigned int chunk = min(len, sizeof(buf));
2858 
2859 			error = t3_mc7_bd_read(mem, addr / 8, chunk / 8, buf);
2860 			if (error)
2861 				return (-error);
2862 			if (copyout(buf, useraddr, chunk))
2863 				return (EFAULT);
2864 			useraddr += chunk;
2865 			addr += chunk;
2866 			len -= chunk;
2867 		}
2868 		break;
2869 	}
2870 	case CHELSIO_READ_TCAM_WORD: {
2871 		struct ch_tcam_word *t = (struct ch_tcam_word *)data;
2872 
2873 		if (!is_offload(sc))
2874 			return (EOPNOTSUPP);
2875 		if (!(sc->flags & FULL_INIT_DONE))
2876 			return (EIO);         /* need MC5 */
2877 		return -t3_read_mc5_range(&sc->mc5, t->addr, 1, t->buf);
2878 		break;
2879 	}
2880 	case CHELSIO_SET_TRACE_FILTER: {
2881 		struct ch_trace *t = (struct ch_trace *)data;
2882 		const struct trace_params *tp;
2883 
2884 		tp = (const struct trace_params *)&t->sip;
2885 		if (t->config_tx)
2886 			t3_config_trace_filter(sc, tp, 0, t->invert_match,
2887 					       t->trace_tx);
2888 		if (t->config_rx)
2889 			t3_config_trace_filter(sc, tp, 1, t->invert_match,
2890 					       t->trace_rx);
2891 		break;
2892 	}
2893 	case CHELSIO_SET_PKTSCHED: {
2894 		struct ch_pktsched_params *p = (struct ch_pktsched_params *)data;
2895 		if (sc->open_device_map == 0)
2896 			return (EAGAIN);
2897 		send_pktsched_cmd(sc, p->sched, p->idx, p->min, p->max,
2898 		    p->binding);
2899 		break;
2900 	}
2901 	case CHELSIO_IFCONF_GETREGS: {
2902 		struct ch_ifconf_regs *regs = (struct ch_ifconf_regs *)data;
2903 		int reglen = cxgb_get_regs_len();
2904 		uint8_t *buf = malloc(reglen, M_DEVBUF, M_NOWAIT);
2905 		if (buf == NULL) {
2906 			return (ENOMEM);
2907 		}
2908 		if (regs->len > reglen)
2909 			regs->len = reglen;
2910 		else if (regs->len < reglen)
2911 			error = ENOBUFS;
2912 
2913 		if (!error) {
2914 			cxgb_get_regs(sc, regs, buf);
2915 			error = copyout(buf, regs->data, reglen);
2916 		}
2917 		free(buf, M_DEVBUF);
2918 
2919 		break;
2920 	}
2921 	case CHELSIO_SET_HW_SCHED: {
2922 		struct ch_hw_sched *t = (struct ch_hw_sched *)data;
2923 		unsigned int ticks_per_usec = core_ticks_per_usec(sc);
2924 
2925 		if ((sc->flags & FULL_INIT_DONE) == 0)
2926 			return (EAGAIN);       /* need TP to be initialized */
2927 		if (t->sched >= NTX_SCHED || !in_range(t->mode, 0, 1) ||
2928 		    !in_range(t->channel, 0, 1) ||
2929 		    !in_range(t->kbps, 0, 10000000) ||
2930 		    !in_range(t->class_ipg, 0, 10000 * 65535 / ticks_per_usec) ||
2931 		    !in_range(t->flow_ipg, 0,
2932 			      dack_ticks_to_usec(sc, 0x7ff)))
2933 			return (EINVAL);
2934 
2935 		if (t->kbps >= 0) {
2936 			error = t3_config_sched(sc, t->kbps, t->sched);
2937 			if (error < 0)
2938 				return (-error);
2939 		}
2940 		if (t->class_ipg >= 0)
2941 			t3_set_sched_ipg(sc, t->sched, t->class_ipg);
2942 		if (t->flow_ipg >= 0) {
2943 			t->flow_ipg *= 1000;     /* us -> ns */
2944 			t3_set_pace_tbl(sc, &t->flow_ipg, t->sched, 1);
2945 		}
2946 		if (t->mode >= 0) {
2947 			int bit = 1 << (S_TX_MOD_TIMER_MODE + t->sched);
2948 
2949 			t3_set_reg_field(sc, A_TP_TX_MOD_QUEUE_REQ_MAP,
2950 					 bit, t->mode ? bit : 0);
2951 		}
2952 		if (t->channel >= 0)
2953 			t3_set_reg_field(sc, A_TP_TX_MOD_QUEUE_REQ_MAP,
2954 					 1 << t->sched, t->channel << t->sched);
2955 		break;
2956 	}
2957 	case CHELSIO_GET_EEPROM: {
2958 		int i;
2959 		struct ch_eeprom *e = (struct ch_eeprom *)data;
2960 		uint8_t *buf = malloc(EEPROMSIZE, M_DEVBUF, M_NOWAIT);
2961 
2962 		if (buf == NULL) {
2963 			return (ENOMEM);
2964 		}
2965 		e->magic = EEPROM_MAGIC;
2966 		for (i = e->offset & ~3; !error && i < e->offset + e->len; i += 4)
2967 			error = -t3_seeprom_read(sc, i, (uint32_t *)&buf[i]);
2968 
2969 		if (!error)
2970 			error = copyout(buf + e->offset, e->data, e->len);
2971 
2972 		free(buf, M_DEVBUF);
2973 		break;
2974 	}
2975 	case CHELSIO_CLEAR_STATS: {
2976 		if (!(sc->flags & FULL_INIT_DONE))
2977 			return EAGAIN;
2978 
2979 		PORT_LOCK(pi);
2980 		t3_mac_update_stats(&pi->mac);
2981 		memset(&pi->mac.stats, 0, sizeof(pi->mac.stats));
2982 		PORT_UNLOCK(pi);
2983 		break;
2984 	}
2985 	case CHELSIO_GET_UP_LA: {
2986 		struct ch_up_la *la = (struct ch_up_la *)data;
2987 		uint8_t *buf = malloc(LA_BUFSIZE, M_DEVBUF, M_NOWAIT);
2988 		if (buf == NULL) {
2989 			return (ENOMEM);
2990 		}
2991 		if (la->bufsize < LA_BUFSIZE)
2992 			error = ENOBUFS;
2993 
2994 		if (!error)
2995 			error = -t3_get_up_la(sc, &la->stopped, &la->idx,
2996 					      &la->bufsize, buf);
2997 		if (!error)
2998 			error = copyout(buf, la->data, la->bufsize);
2999 
3000 		free(buf, M_DEVBUF);
3001 		break;
3002 	}
3003 	case CHELSIO_GET_UP_IOQS: {
3004 		struct ch_up_ioqs *ioqs = (struct ch_up_ioqs *)data;
3005 		uint8_t *buf = malloc(IOQS_BUFSIZE, M_DEVBUF, M_NOWAIT);
3006 		uint32_t *v;
3007 
3008 		if (buf == NULL) {
3009 			return (ENOMEM);
3010 		}
3011 		if (ioqs->bufsize < IOQS_BUFSIZE)
3012 			error = ENOBUFS;
3013 
3014 		if (!error)
3015 			error = -t3_get_up_ioqs(sc, &ioqs->bufsize, buf);
3016 
3017 		if (!error) {
3018 			v = (uint32_t *)buf;
3019 
3020 			ioqs->ioq_rx_enable = *v++;
3021 			ioqs->ioq_tx_enable = *v++;
3022 			ioqs->ioq_rx_status = *v++;
3023 			ioqs->ioq_tx_status = *v++;
3024 
3025 			error = copyout(v, ioqs->data, ioqs->bufsize);
3026 		}
3027 
3028 		free(buf, M_DEVBUF);
3029 		break;
3030 	}
3031 	case CHELSIO_SET_FILTER: {
3032 		struct ch_filter *f = (struct ch_filter *)data;
3033 		struct filter_info *p;
3034 		unsigned int nfilters = sc->params.mc5.nfilters;
3035 
3036 		if (!is_offload(sc))
3037 			return (EOPNOTSUPP);	/* No TCAM */
3038 		if (!(sc->flags & FULL_INIT_DONE))
3039 			return (EAGAIN);	/* mc5 not setup yet */
3040 		if (nfilters == 0)
3041 			return (EBUSY);		/* TOE will use TCAM */
3042 
3043 		/* sanity checks */
3044 		if (f->filter_id >= nfilters ||
3045 		    (f->val.dip && f->mask.dip != 0xffffffff) ||
3046 		    (f->val.sport && f->mask.sport != 0xffff) ||
3047 		    (f->val.dport && f->mask.dport != 0xffff) ||
3048 		    (f->val.vlan && f->mask.vlan != 0xfff) ||
3049 		    (f->val.vlan_prio &&
3050 			f->mask.vlan_prio != FILTER_NO_VLAN_PRI) ||
3051 		    (f->mac_addr_idx != 0xffff && f->mac_addr_idx > 15) ||
3052 		    f->qset >= SGE_QSETS ||
3053 		    sc->rrss_map[f->qset] >= RSS_TABLE_SIZE)
3054 			return (EINVAL);
3055 
3056 		/* Was allocated with M_WAITOK */
3057 		KASSERT(sc->filters, ("filter table NULL\n"));
3058 
3059 		p = &sc->filters[f->filter_id];
3060 		if (p->locked)
3061 			return (EPERM);
3062 
3063 		bzero(p, sizeof(*p));
3064 		p->sip = f->val.sip;
3065 		p->sip_mask = f->mask.sip;
3066 		p->dip = f->val.dip;
3067 		p->sport = f->val.sport;
3068 		p->dport = f->val.dport;
3069 		p->vlan = f->mask.vlan ? f->val.vlan : 0xfff;
3070 		p->vlan_prio = f->mask.vlan_prio ? (f->val.vlan_prio & 6) :
3071 		    FILTER_NO_VLAN_PRI;
3072 		p->mac_hit = f->mac_hit;
3073 		p->mac_vld = f->mac_addr_idx != 0xffff;
3074 		p->mac_idx = f->mac_addr_idx;
3075 		p->pkt_type = f->proto;
3076 		p->report_filter_id = f->want_filter_id;
3077 		p->pass = f->pass;
3078 		p->rss = f->rss;
3079 		p->qset = f->qset;
3080 
3081 		error = set_filter(sc, f->filter_id, p);
3082 		if (error == 0)
3083 			p->valid = 1;
3084 		break;
3085 	}
3086 	case CHELSIO_DEL_FILTER: {
3087 		struct ch_filter *f = (struct ch_filter *)data;
3088 		struct filter_info *p;
3089 		unsigned int nfilters = sc->params.mc5.nfilters;
3090 
3091 		if (!is_offload(sc))
3092 			return (EOPNOTSUPP);
3093 		if (!(sc->flags & FULL_INIT_DONE))
3094 			return (EAGAIN);
3095 		if (nfilters == 0 || sc->filters == NULL)
3096 			return (EINVAL);
3097 		if (f->filter_id >= nfilters)
3098 		       return (EINVAL);
3099 
3100 		p = &sc->filters[f->filter_id];
3101 		if (p->locked)
3102 			return (EPERM);
3103 		if (!p->valid)
3104 			return (EFAULT); /* Read "Bad address" as "Bad index" */
3105 
3106 		bzero(p, sizeof(*p));
3107 		p->sip = p->sip_mask = 0xffffffff;
3108 		p->vlan = 0xfff;
3109 		p->vlan_prio = FILTER_NO_VLAN_PRI;
3110 		p->pkt_type = 1;
3111 		error = set_filter(sc, f->filter_id, p);
3112 		break;
3113 	}
3114 	case CHELSIO_GET_FILTER: {
3115 		struct ch_filter *f = (struct ch_filter *)data;
3116 		struct filter_info *p;
3117 		unsigned int i, nfilters = sc->params.mc5.nfilters;
3118 
3119 		if (!is_offload(sc))
3120 			return (EOPNOTSUPP);
3121 		if (!(sc->flags & FULL_INIT_DONE))
3122 			return (EAGAIN);
3123 		if (nfilters == 0 || sc->filters == NULL)
3124 			return (EINVAL);
3125 
3126 		i = f->filter_id == 0xffffffff ? 0 : f->filter_id + 1;
3127 		for (; i < nfilters; i++) {
3128 			p = &sc->filters[i];
3129 			if (!p->valid)
3130 				continue;
3131 
3132 			bzero(f, sizeof(*f));
3133 
3134 			f->filter_id = i;
3135 			f->val.sip = p->sip;
3136 			f->mask.sip = p->sip_mask;
3137 			f->val.dip = p->dip;
3138 			f->mask.dip = p->dip ? 0xffffffff : 0;
3139 			f->val.sport = p->sport;
3140 			f->mask.sport = p->sport ? 0xffff : 0;
3141 			f->val.dport = p->dport;
3142 			f->mask.dport = p->dport ? 0xffff : 0;
3143 			f->val.vlan = p->vlan == 0xfff ? 0 : p->vlan;
3144 			f->mask.vlan = p->vlan == 0xfff ? 0 : 0xfff;
3145 			f->val.vlan_prio = p->vlan_prio == FILTER_NO_VLAN_PRI ?
3146 			    0 : p->vlan_prio;
3147 			f->mask.vlan_prio = p->vlan_prio == FILTER_NO_VLAN_PRI ?
3148 			    0 : FILTER_NO_VLAN_PRI;
3149 			f->mac_hit = p->mac_hit;
3150 			f->mac_addr_idx = p->mac_vld ? p->mac_idx : 0xffff;
3151 			f->proto = p->pkt_type;
3152 			f->want_filter_id = p->report_filter_id;
3153 			f->pass = p->pass;
3154 			f->rss = p->rss;
3155 			f->qset = p->qset;
3156 
3157 			break;
3158 		}
3159 
3160 		if (i == nfilters)
3161 			f->filter_id = 0xffffffff;
3162 		break;
3163 	}
3164 	default:
3165 		return (EOPNOTSUPP);
3166 		break;
3167 	}
3168 
3169 	return (error);
3170 }
3171 
3172 static __inline void
3173 reg_block_dump(struct adapter *ap, uint8_t *buf, unsigned int start,
3174     unsigned int end)
3175 {
3176 	uint32_t *p = (uint32_t *)(buf + start);
3177 
3178 	for ( ; start <= end; start += sizeof(uint32_t))
3179 		*p++ = t3_read_reg(ap, start);
3180 }
3181 
3182 #define T3_REGMAP_SIZE (3 * 1024)
3183 static int
3184 cxgb_get_regs_len(void)
3185 {
3186 	return T3_REGMAP_SIZE;
3187 }
3188 
3189 static void
3190 cxgb_get_regs(adapter_t *sc, struct ch_ifconf_regs *regs, uint8_t *buf)
3191 {
3192 
3193 	/*
3194 	 * Version scheme:
3195 	 * bits 0..9: chip version
3196 	 * bits 10..15: chip revision
3197 	 * bit 31: set for PCIe cards
3198 	 */
3199 	regs->version = 3 | (sc->params.rev << 10) | (is_pcie(sc) << 31);
3200 
3201 	/*
3202 	 * We skip the MAC statistics registers because they are clear-on-read.
3203 	 * Also reading multi-register stats would need to synchronize with the
3204 	 * periodic mac stats accumulation.  Hard to justify the complexity.
3205 	 */
3206 	memset(buf, 0, cxgb_get_regs_len());
3207 	reg_block_dump(sc, buf, 0, A_SG_RSPQ_CREDIT_RETURN);
3208 	reg_block_dump(sc, buf, A_SG_HI_DRB_HI_THRSH, A_ULPRX_PBL_ULIMIT);
3209 	reg_block_dump(sc, buf, A_ULPTX_CONFIG, A_MPS_INT_CAUSE);
3210 	reg_block_dump(sc, buf, A_CPL_SWITCH_CNTRL, A_CPL_MAP_TBL_DATA);
3211 	reg_block_dump(sc, buf, A_SMB_GLOBAL_TIME_CFG, A_XGM_SERDES_STAT3);
3212 	reg_block_dump(sc, buf, A_XGM_SERDES_STATUS0,
3213 		       XGM_REG(A_XGM_SERDES_STAT3, 1));
3214 	reg_block_dump(sc, buf, XGM_REG(A_XGM_SERDES_STATUS0, 1),
3215 		       XGM_REG(A_XGM_RX_SPI4_SOP_EOP_CNT, 1));
3216 }
3217 
3218 static int
3219 alloc_filters(struct adapter *sc)
3220 {
3221 	struct filter_info *p;
3222 	unsigned int nfilters = sc->params.mc5.nfilters;
3223 
3224 	if (nfilters == 0)
3225 		return (0);
3226 
3227 	p = malloc(sizeof(*p) * nfilters, M_DEVBUF, M_WAITOK | M_ZERO);
3228 	sc->filters = p;
3229 
3230 	p = &sc->filters[nfilters - 1];
3231 	p->vlan = 0xfff;
3232 	p->vlan_prio = FILTER_NO_VLAN_PRI;
3233 	p->pass = p->rss = p->valid = p->locked = 1;
3234 
3235 	return (0);
3236 }
3237 
3238 static int
3239 setup_hw_filters(struct adapter *sc)
3240 {
3241 	int i, rc;
3242 	unsigned int nfilters = sc->params.mc5.nfilters;
3243 
3244 	if (!sc->filters)
3245 		return (0);
3246 
3247 	t3_enable_filters(sc);
3248 
3249 	for (i = rc = 0; i < nfilters && !rc; i++) {
3250 		if (sc->filters[i].locked)
3251 			rc = set_filter(sc, i, &sc->filters[i]);
3252 	}
3253 
3254 	return (rc);
3255 }
3256 
3257 static int
3258 set_filter(struct adapter *sc, int id, const struct filter_info *f)
3259 {
3260 	int len;
3261 	struct mbuf *m;
3262 	struct ulp_txpkt *txpkt;
3263 	struct work_request_hdr *wr;
3264 	struct cpl_pass_open_req *oreq;
3265 	struct cpl_set_tcb_field *sreq;
3266 
3267 	len = sizeof(*wr) + sizeof(*oreq) + 2 * sizeof(*sreq);
3268 	KASSERT(len <= MHLEN, ("filter request too big for an mbuf"));
3269 
3270 	id += t3_mc5_size(&sc->mc5) - sc->params.mc5.nroutes -
3271 	      sc->params.mc5.nfilters;
3272 
3273 	m = m_gethdr(M_WAITOK, MT_DATA);
3274 	m->m_len = m->m_pkthdr.len = len;
3275 	bzero(mtod(m, char *), len);
3276 
3277 	wr = mtod(m, struct work_request_hdr *);
3278 	wr->wrh_hi = htonl(V_WR_OP(FW_WROPCODE_BYPASS) | F_WR_ATOMIC);
3279 
3280 	oreq = (struct cpl_pass_open_req *)(wr + 1);
3281 	txpkt = (struct ulp_txpkt *)oreq;
3282 	txpkt->cmd_dest = htonl(V_ULPTX_CMD(ULP_TXPKT));
3283 	txpkt->len = htonl(V_ULPTX_NFLITS(sizeof(*oreq) / 8));
3284 	OPCODE_TID(oreq) = htonl(MK_OPCODE_TID(CPL_PASS_OPEN_REQ, id));
3285 	oreq->local_port = htons(f->dport);
3286 	oreq->peer_port = htons(f->sport);
3287 	oreq->local_ip = htonl(f->dip);
3288 	oreq->peer_ip = htonl(f->sip);
3289 	oreq->peer_netmask = htonl(f->sip_mask);
3290 	oreq->opt0h = 0;
3291 	oreq->opt0l = htonl(F_NO_OFFLOAD);
3292 	oreq->opt1 = htonl(V_MAC_MATCH_VALID(f->mac_vld) |
3293 			 V_CONN_POLICY(CPL_CONN_POLICY_FILTER) |
3294 			 V_VLAN_PRI(f->vlan_prio >> 1) |
3295 			 V_VLAN_PRI_VALID(f->vlan_prio != FILTER_NO_VLAN_PRI) |
3296 			 V_PKT_TYPE(f->pkt_type) | V_OPT1_VLAN(f->vlan) |
3297 			 V_MAC_MATCH(f->mac_idx | (f->mac_hit << 4)));
3298 
3299 	sreq = (struct cpl_set_tcb_field *)(oreq + 1);
3300 	set_tcb_field_ulp(sreq, id, 1, 0x1800808000ULL,
3301 			  (f->report_filter_id << 15) | (1 << 23) |
3302 			  ((u64)f->pass << 35) | ((u64)!f->rss << 36));
3303 	set_tcb_field_ulp(sreq + 1, id, 0, 0xffffffff, (2 << 19) | 1);
3304 	t3_mgmt_tx(sc, m);
3305 
3306 	if (f->pass && !f->rss) {
3307 		len = sizeof(*sreq);
3308 		m = m_gethdr(M_WAITOK, MT_DATA);
3309 		m->m_len = m->m_pkthdr.len = len;
3310 		bzero(mtod(m, char *), len);
3311 		sreq = mtod(m, struct cpl_set_tcb_field *);
3312 		sreq->wr.wrh_hi = htonl(V_WR_OP(FW_WROPCODE_FORWARD));
3313 		mk_set_tcb_field(sreq, id, 25, 0x3f80000,
3314 				 (u64)sc->rrss_map[f->qset] << 19);
3315 		t3_mgmt_tx(sc, m);
3316 	}
3317 	return 0;
3318 }
3319 
3320 static inline void
3321 mk_set_tcb_field(struct cpl_set_tcb_field *req, unsigned int tid,
3322     unsigned int word, u64 mask, u64 val)
3323 {
3324 	OPCODE_TID(req) = htonl(MK_OPCODE_TID(CPL_SET_TCB_FIELD, tid));
3325 	req->reply = V_NO_REPLY(1);
3326 	req->cpu_idx = 0;
3327 	req->word = htons(word);
3328 	req->mask = htobe64(mask);
3329 	req->val = htobe64(val);
3330 }
3331 
3332 static inline void
3333 set_tcb_field_ulp(struct cpl_set_tcb_field *req, unsigned int tid,
3334     unsigned int word, u64 mask, u64 val)
3335 {
3336 	struct ulp_txpkt *txpkt = (struct ulp_txpkt *)req;
3337 
3338 	txpkt->cmd_dest = htonl(V_ULPTX_CMD(ULP_TXPKT));
3339 	txpkt->len = htonl(V_ULPTX_NFLITS(sizeof(*req) / 8));
3340 	mk_set_tcb_field(req, tid, word, mask, val);
3341 }
3342 
3343 void
3344 t3_iterate(void (*func)(struct adapter *, void *), void *arg)
3345 {
3346 	struct adapter *sc;
3347 
3348 	mtx_lock(&t3_list_lock);
3349 	SLIST_FOREACH(sc, &t3_list, link) {
3350 		/*
3351 		 * func should not make any assumptions about what state sc is
3352 		 * in - the only guarantee is that sc->sc_lock is a valid lock.
3353 		 */
3354 		func(sc, arg);
3355 	}
3356 	mtx_unlock(&t3_list_lock);
3357 }
3358 
3359 #ifdef TCP_OFFLOAD
3360 static int
3361 toe_capability(struct port_info *pi, int enable)
3362 {
3363 	int rc;
3364 	struct adapter *sc = pi->adapter;
3365 
3366 	ADAPTER_LOCK_ASSERT_OWNED(sc);
3367 
3368 	if (!is_offload(sc))
3369 		return (ENODEV);
3370 
3371 	if (enable) {
3372 		if (!(sc->flags & FULL_INIT_DONE)) {
3373 			log(LOG_WARNING,
3374 			    "You must enable a cxgb interface first\n");
3375 			return (EAGAIN);
3376 		}
3377 
3378 		if (isset(&sc->offload_map, pi->port_id))
3379 			return (0);
3380 
3381 		if (!(sc->flags & TOM_INIT_DONE)) {
3382 			rc = t3_activate_uld(sc, ULD_TOM);
3383 			if (rc == EAGAIN) {
3384 				log(LOG_WARNING,
3385 				    "You must kldload t3_tom.ko before trying "
3386 				    "to enable TOE on a cxgb interface.\n");
3387 			}
3388 			if (rc != 0)
3389 				return (rc);
3390 			KASSERT(sc->tom_softc != NULL,
3391 			    ("%s: TOM activated but softc NULL", __func__));
3392 			KASSERT(sc->flags & TOM_INIT_DONE,
3393 			    ("%s: TOM activated but flag not set", __func__));
3394 		}
3395 
3396 		setbit(&sc->offload_map, pi->port_id);
3397 
3398 		/*
3399 		 * XXX: Temporary code to allow iWARP to be enabled when TOE is
3400 		 * enabled on any port.  Need to figure out how to enable,
3401 		 * disable, load, and unload iWARP cleanly.
3402 		 */
3403 		if (!isset(&sc->offload_map, MAX_NPORTS) &&
3404 		    t3_activate_uld(sc, ULD_IWARP) == 0)
3405 			setbit(&sc->offload_map, MAX_NPORTS);
3406 	} else {
3407 		if (!isset(&sc->offload_map, pi->port_id))
3408 			return (0);
3409 
3410 		KASSERT(sc->flags & TOM_INIT_DONE,
3411 		    ("%s: TOM never initialized?", __func__));
3412 		clrbit(&sc->offload_map, pi->port_id);
3413 	}
3414 
3415 	return (0);
3416 }
3417 
3418 /*
3419  * Add an upper layer driver to the global list.
3420  */
3421 int
3422 t3_register_uld(struct uld_info *ui)
3423 {
3424 	int rc = 0;
3425 	struct uld_info *u;
3426 
3427 	mtx_lock(&t3_uld_list_lock);
3428 	SLIST_FOREACH(u, &t3_uld_list, link) {
3429 	    if (u->uld_id == ui->uld_id) {
3430 		    rc = EEXIST;
3431 		    goto done;
3432 	    }
3433 	}
3434 
3435 	SLIST_INSERT_HEAD(&t3_uld_list, ui, link);
3436 	ui->refcount = 0;
3437 done:
3438 	mtx_unlock(&t3_uld_list_lock);
3439 	return (rc);
3440 }
3441 
3442 int
3443 t3_unregister_uld(struct uld_info *ui)
3444 {
3445 	int rc = EINVAL;
3446 	struct uld_info *u;
3447 
3448 	mtx_lock(&t3_uld_list_lock);
3449 
3450 	SLIST_FOREACH(u, &t3_uld_list, link) {
3451 	    if (u == ui) {
3452 		    if (ui->refcount > 0) {
3453 			    rc = EBUSY;
3454 			    goto done;
3455 		    }
3456 
3457 		    SLIST_REMOVE(&t3_uld_list, ui, uld_info, link);
3458 		    rc = 0;
3459 		    goto done;
3460 	    }
3461 	}
3462 done:
3463 	mtx_unlock(&t3_uld_list_lock);
3464 	return (rc);
3465 }
3466 
3467 int
3468 t3_activate_uld(struct adapter *sc, int id)
3469 {
3470 	int rc = EAGAIN;
3471 	struct uld_info *ui;
3472 
3473 	mtx_lock(&t3_uld_list_lock);
3474 
3475 	SLIST_FOREACH(ui, &t3_uld_list, link) {
3476 		if (ui->uld_id == id) {
3477 			rc = ui->activate(sc);
3478 			if (rc == 0)
3479 				ui->refcount++;
3480 			goto done;
3481 		}
3482 	}
3483 done:
3484 	mtx_unlock(&t3_uld_list_lock);
3485 
3486 	return (rc);
3487 }
3488 
3489 int
3490 t3_deactivate_uld(struct adapter *sc, int id)
3491 {
3492 	int rc = EINVAL;
3493 	struct uld_info *ui;
3494 
3495 	mtx_lock(&t3_uld_list_lock);
3496 
3497 	SLIST_FOREACH(ui, &t3_uld_list, link) {
3498 		if (ui->uld_id == id) {
3499 			rc = ui->deactivate(sc);
3500 			if (rc == 0)
3501 				ui->refcount--;
3502 			goto done;
3503 		}
3504 	}
3505 done:
3506 	mtx_unlock(&t3_uld_list_lock);
3507 
3508 	return (rc);
3509 }
3510 
3511 static int
3512 cpl_not_handled(struct sge_qset *qs __unused, struct rsp_desc *r __unused,
3513     struct mbuf *m)
3514 {
3515 	m_freem(m);
3516 	return (EDOOFUS);
3517 }
3518 
3519 int
3520 t3_register_cpl_handler(struct adapter *sc, int opcode, cpl_handler_t h)
3521 {
3522 	uintptr_t *loc, new;
3523 
3524 	if (opcode >= NUM_CPL_HANDLERS)
3525 		return (EINVAL);
3526 
3527 	new = h ? (uintptr_t)h : (uintptr_t)cpl_not_handled;
3528 	loc = (uintptr_t *) &sc->cpl_handler[opcode];
3529 	atomic_store_rel_ptr(loc, new);
3530 
3531 	return (0);
3532 }
3533 #endif
3534 
3535 static int
3536 cxgbc_mod_event(module_t mod, int cmd, void *arg)
3537 {
3538 	int rc = 0;
3539 
3540 	switch (cmd) {
3541 	case MOD_LOAD:
3542 		mtx_init(&t3_list_lock, "T3 adapters", 0, MTX_DEF);
3543 		SLIST_INIT(&t3_list);
3544 #ifdef TCP_OFFLOAD
3545 		mtx_init(&t3_uld_list_lock, "T3 ULDs", 0, MTX_DEF);
3546 		SLIST_INIT(&t3_uld_list);
3547 #endif
3548 		break;
3549 
3550 	case MOD_UNLOAD:
3551 #ifdef TCP_OFFLOAD
3552 		mtx_lock(&t3_uld_list_lock);
3553 		if (!SLIST_EMPTY(&t3_uld_list)) {
3554 			rc = EBUSY;
3555 			mtx_unlock(&t3_uld_list_lock);
3556 			break;
3557 		}
3558 		mtx_unlock(&t3_uld_list_lock);
3559 		mtx_destroy(&t3_uld_list_lock);
3560 #endif
3561 		mtx_lock(&t3_list_lock);
3562 		if (!SLIST_EMPTY(&t3_list)) {
3563 			rc = EBUSY;
3564 			mtx_unlock(&t3_list_lock);
3565 			break;
3566 		}
3567 		mtx_unlock(&t3_list_lock);
3568 		mtx_destroy(&t3_list_lock);
3569 		break;
3570 	}
3571 
3572 	return (rc);
3573 }
3574