xref: /freebsd/sys/dev/cxgb/cxgb_main.c (revision dd21556857e8d40f66bf5ad54754d9d52669ebf7)
1 /**************************************************************************
2 SPDX-License-Identifier: BSD-2-Clause
3 
4 Copyright (c) 2007-2009, Chelsio Inc.
5 All rights reserved.
6 
7 Redistribution and use in source and binary forms, with or without
8 modification, are permitted provided that the following conditions are met:
9 
10  1. Redistributions of source code must retain the above copyright notice,
11     this list of conditions and the following disclaimer.
12 
13  2. Neither the name of the Chelsio Corporation nor the names of its
14     contributors may be used to endorse or promote products derived from
15     this software without specific prior written permission.
16 
17 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
18 AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
21 LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
22 CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
23 SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
24 INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
25 CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
26 ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
27 POSSIBILITY OF SUCH DAMAGE.
28 
29 ***************************************************************************/
30 
31 #include <sys/cdefs.h>
32 #include "opt_inet.h"
33 
34 #include <sys/param.h>
35 #include <sys/systm.h>
36 #include <sys/kernel.h>
37 #include <sys/bus.h>
38 #include <sys/module.h>
39 #include <sys/pciio.h>
40 #include <sys/conf.h>
41 #include <machine/bus.h>
42 #include <machine/resource.h>
43 #include <sys/ktr.h>
44 #include <sys/rman.h>
45 #include <sys/ioccom.h>
46 #include <sys/mbuf.h>
47 #include <sys/linker.h>
48 #include <sys/firmware.h>
49 #include <sys/socket.h>
50 #include <sys/sockio.h>
51 #include <sys/smp.h>
52 #include <sys/sysctl.h>
53 #include <sys/syslog.h>
54 #include <sys/queue.h>
55 #include <sys/taskqueue.h>
56 #include <sys/proc.h>
57 
58 #include <net/bpf.h>
59 #include <net/debugnet.h>
60 #include <net/ethernet.h>
61 #include <net/if.h>
62 #include <net/if_var.h>
63 #include <net/if_arp.h>
64 #include <net/if_dl.h>
65 #include <net/if_media.h>
66 #include <net/if_types.h>
67 #include <net/if_vlan_var.h>
68 
69 #include <netinet/in_systm.h>
70 #include <netinet/in.h>
71 #include <netinet/if_ether.h>
72 #include <netinet/ip.h>
73 #include <netinet/ip.h>
74 #include <netinet/tcp.h>
75 #include <netinet/udp.h>
76 
77 #include <dev/pci/pcireg.h>
78 #include <dev/pci/pcivar.h>
79 #include <dev/pci/pci_private.h>
80 
81 #include <cxgb_include.h>
82 
83 #ifdef PRIV_SUPPORTED
84 #include <sys/priv.h>
85 #endif
86 
87 static int cxgb_setup_interrupts(adapter_t *);
88 static void cxgb_teardown_interrupts(adapter_t *);
89 static void cxgb_init(void *);
90 static int cxgb_init_locked(struct port_info *);
91 static int cxgb_uninit_locked(struct port_info *);
92 static int cxgb_uninit_synchronized(struct port_info *);
93 static int cxgb_ioctl(if_t, unsigned long, caddr_t);
94 static int cxgb_media_change(if_t);
95 static int cxgb_ifm_type(int);
96 static void cxgb_build_medialist(struct port_info *);
97 static void cxgb_media_status(if_t, struct ifmediareq *);
98 static uint64_t cxgb_get_counter(if_t, ift_counter);
99 static int setup_sge_qsets(adapter_t *);
100 static void cxgb_async_intr(void *);
101 static void cxgb_tick_handler(void *, int);
102 static void cxgb_tick(void *);
103 static void link_check_callout(void *);
104 static void check_link_status(void *, int);
105 static void setup_rss(adapter_t *sc);
106 static int alloc_filters(struct adapter *);
107 static int setup_hw_filters(struct adapter *);
108 static int set_filter(struct adapter *, int, const struct filter_info *);
109 static inline void mk_set_tcb_field(struct cpl_set_tcb_field *, unsigned int,
110     unsigned int, u64, u64);
111 static inline void set_tcb_field_ulp(struct cpl_set_tcb_field *, unsigned int,
112     unsigned int, u64, u64);
113 #ifdef TCP_OFFLOAD
114 static int cpl_not_handled(struct sge_qset *, struct rsp_desc *, struct mbuf *);
115 #endif
116 
117 /* Attachment glue for the PCI controller end of the device.  Each port of
118  * the device is attached separately, as defined later.
119  */
120 static int cxgb_controller_probe(device_t);
121 static int cxgb_controller_attach(device_t);
122 static int cxgb_controller_detach(device_t);
123 static void cxgb_free(struct adapter *);
124 static __inline void reg_block_dump(struct adapter *ap, uint8_t *buf, unsigned int start,
125     unsigned int end);
126 static void cxgb_get_regs(adapter_t *sc, struct ch_ifconf_regs *regs, uint8_t *buf);
127 static int cxgb_get_regs_len(void);
128 static void touch_bars(device_t dev);
129 static void cxgb_update_mac_settings(struct port_info *p);
130 #ifdef TCP_OFFLOAD
131 static int toe_capability(struct port_info *, int);
132 #endif
133 
134 /* Table for probing the cards.  The desc field isn't actually used */
135 struct cxgb_ident {
136 	uint16_t	vendor;
137 	uint16_t	device;
138 	int		index;
139 	char		*desc;
140 } cxgb_identifiers[] = {
141 	{PCI_VENDOR_ID_CHELSIO, 0x0020, 0, "PE9000"},
142 	{PCI_VENDOR_ID_CHELSIO, 0x0021, 1, "T302E"},
143 	{PCI_VENDOR_ID_CHELSIO, 0x0022, 2, "T310E"},
144 	{PCI_VENDOR_ID_CHELSIO, 0x0023, 3, "T320X"},
145 	{PCI_VENDOR_ID_CHELSIO, 0x0024, 1, "T302X"},
146 	{PCI_VENDOR_ID_CHELSIO, 0x0025, 3, "T320E"},
147 	{PCI_VENDOR_ID_CHELSIO, 0x0026, 2, "T310X"},
148 	{PCI_VENDOR_ID_CHELSIO, 0x0030, 2, "T3B10"},
149 	{PCI_VENDOR_ID_CHELSIO, 0x0031, 3, "T3B20"},
150 	{PCI_VENDOR_ID_CHELSIO, 0x0032, 1, "T3B02"},
151 	{PCI_VENDOR_ID_CHELSIO, 0x0033, 4, "T3B04"},
152 	{PCI_VENDOR_ID_CHELSIO, 0x0035, 6, "T3C10"},
153 	{PCI_VENDOR_ID_CHELSIO, 0x0036, 3, "S320E-CR"},
154 	{PCI_VENDOR_ID_CHELSIO, 0x0037, 7, "N320E-G2"},
155 	{0, 0, 0, NULL}
156 };
157 
158 static device_method_t cxgb_controller_methods[] = {
159 	DEVMETHOD(device_probe,		cxgb_controller_probe),
160 	DEVMETHOD(device_attach,	cxgb_controller_attach),
161 	DEVMETHOD(device_detach,	cxgb_controller_detach),
162 
163 	DEVMETHOD_END
164 };
165 
166 static driver_t cxgb_controller_driver = {
167 	"cxgbc",
168 	cxgb_controller_methods,
169 	sizeof(struct adapter)
170 };
171 
172 static int cxgbc_mod_event(module_t, int, void *);
173 
174 DRIVER_MODULE(cxgbc, pci, cxgb_controller_driver, cxgbc_mod_event, NULL);
175 MODULE_PNP_INFO("U16:vendor;U16:device", pci, cxgbc, cxgb_identifiers,
176     nitems(cxgb_identifiers) - 1);
177 MODULE_VERSION(cxgbc, 1);
178 MODULE_DEPEND(cxgbc, firmware, 1, 1, 1);
179 
180 /*
181  * Attachment glue for the ports.  Attachment is done directly to the
182  * controller device.
183  */
184 static int cxgb_port_probe(device_t);
185 static int cxgb_port_attach(device_t);
186 static int cxgb_port_detach(device_t);
187 
188 static device_method_t cxgb_port_methods[] = {
189 	DEVMETHOD(device_probe,		cxgb_port_probe),
190 	DEVMETHOD(device_attach,	cxgb_port_attach),
191 	DEVMETHOD(device_detach,	cxgb_port_detach),
192 	{ 0, 0 }
193 };
194 
195 static driver_t cxgb_port_driver = {
196 	"cxgb",
197 	cxgb_port_methods,
198 	0
199 };
200 
201 static d_ioctl_t cxgb_extension_ioctl;
202 static d_open_t cxgb_extension_open;
203 static d_close_t cxgb_extension_close;
204 
205 static struct cdevsw cxgb_cdevsw = {
206        .d_version =    D_VERSION,
207        .d_flags =      0,
208        .d_open =       cxgb_extension_open,
209        .d_close =      cxgb_extension_close,
210        .d_ioctl =      cxgb_extension_ioctl,
211        .d_name =       "cxgb",
212 };
213 
214 DRIVER_MODULE(cxgb, cxgbc, cxgb_port_driver, 0, 0);
215 MODULE_VERSION(cxgb, 1);
216 
217 DEBUGNET_DEFINE(cxgb);
218 
219 static struct mtx t3_list_lock;
220 static SLIST_HEAD(, adapter) t3_list;
221 #ifdef TCP_OFFLOAD
222 static struct mtx t3_uld_list_lock;
223 static SLIST_HEAD(, uld_info) t3_uld_list;
224 #endif
225 
226 /*
227  * The driver uses the best interrupt scheme available on a platform in the
228  * order MSI-X, MSI, legacy pin interrupts.  This parameter determines which
229  * of these schemes the driver may consider as follows:
230  *
231  * msi = 2: choose from among all three options
232  * msi = 1 : only consider MSI and pin interrupts
233  * msi = 0: force pin interrupts
234  */
235 static int msi_allowed = 2;
236 
237 SYSCTL_NODE(_hw, OID_AUTO, cxgb, CTLFLAG_RD | CTLFLAG_MPSAFE, 0,
238     "CXGB driver parameters");
239 SYSCTL_INT(_hw_cxgb, OID_AUTO, msi_allowed, CTLFLAG_RDTUN, &msi_allowed, 0,
240     "MSI-X, MSI, INTx selector");
241 
242 /*
243  * The driver uses an auto-queue algorithm by default.
244  * To disable it and force a single queue-set per port, use multiq = 0
245  */
246 static int multiq = 1;
247 SYSCTL_INT(_hw_cxgb, OID_AUTO, multiq, CTLFLAG_RDTUN, &multiq, 0,
248     "use min(ncpus/ports, 8) queue-sets per port");
249 
250 /*
251  * By default the driver will not update the firmware unless
252  * it was compiled against a newer version
253  *
254  */
255 static int force_fw_update = 0;
256 SYSCTL_INT(_hw_cxgb, OID_AUTO, force_fw_update, CTLFLAG_RDTUN, &force_fw_update, 0,
257     "update firmware even if up to date");
258 
259 int cxgb_use_16k_clusters = -1;
260 SYSCTL_INT(_hw_cxgb, OID_AUTO, use_16k_clusters, CTLFLAG_RDTUN,
261     &cxgb_use_16k_clusters, 0, "use 16kB clusters for the jumbo queue ");
262 
263 static int nfilters = -1;
264 SYSCTL_INT(_hw_cxgb, OID_AUTO, nfilters, CTLFLAG_RDTUN,
265     &nfilters, 0, "max number of entries in the filter table");
266 
267 enum {
268 	MAX_TXQ_ENTRIES      = 16384,
269 	MAX_CTRL_TXQ_ENTRIES = 1024,
270 	MAX_RSPQ_ENTRIES     = 16384,
271 	MAX_RX_BUFFERS       = 16384,
272 	MAX_RX_JUMBO_BUFFERS = 16384,
273 	MIN_TXQ_ENTRIES      = 4,
274 	MIN_CTRL_TXQ_ENTRIES = 4,
275 	MIN_RSPQ_ENTRIES     = 32,
276 	MIN_FL_ENTRIES       = 32,
277 	MIN_FL_JUMBO_ENTRIES = 32
278 };
279 
280 struct filter_info {
281 	u32 sip;
282 	u32 sip_mask;
283 	u32 dip;
284 	u16 sport;
285 	u16 dport;
286 	u32 vlan:12;
287 	u32 vlan_prio:3;
288 	u32 mac_hit:1;
289 	u32 mac_idx:4;
290 	u32 mac_vld:1;
291 	u32 pkt_type:2;
292 	u32 report_filter_id:1;
293 	u32 pass:1;
294 	u32 rss:1;
295 	u32 qset:3;
296 	u32 locked:1;
297 	u32 valid:1;
298 };
299 
300 enum { FILTER_NO_VLAN_PRI = 7 };
301 
302 #define EEPROM_MAGIC 0x38E2F10C
303 
304 #define PORT_MASK ((1 << MAX_NPORTS) - 1)
305 
306 
307 static int set_eeprom(struct port_info *pi, const uint8_t *data, int len, int offset);
308 
309 
310 static __inline char
311 t3rev2char(struct adapter *adapter)
312 {
313 	char rev = 'z';
314 
315 	switch(adapter->params.rev) {
316 	case T3_REV_A:
317 		rev = 'a';
318 		break;
319 	case T3_REV_B:
320 	case T3_REV_B2:
321 		rev = 'b';
322 		break;
323 	case T3_REV_C:
324 		rev = 'c';
325 		break;
326 	}
327 	return rev;
328 }
329 
330 static struct cxgb_ident *
331 cxgb_get_ident(device_t dev)
332 {
333 	struct cxgb_ident *id;
334 
335 	for (id = cxgb_identifiers; id->desc != NULL; id++) {
336 		if ((id->vendor == pci_get_vendor(dev)) &&
337 		    (id->device == pci_get_device(dev))) {
338 			return (id);
339 		}
340 	}
341 	return (NULL);
342 }
343 
344 static const struct adapter_info *
345 cxgb_get_adapter_info(device_t dev)
346 {
347 	struct cxgb_ident *id;
348 	const struct adapter_info *ai;
349 
350 	id = cxgb_get_ident(dev);
351 	if (id == NULL)
352 		return (NULL);
353 
354 	ai = t3_get_adapter_info(id->index);
355 
356 	return (ai);
357 }
358 
359 static int
360 cxgb_controller_probe(device_t dev)
361 {
362 	const struct adapter_info *ai;
363 	const char *ports;
364 	int nports;
365 
366 	ai = cxgb_get_adapter_info(dev);
367 	if (ai == NULL)
368 		return (ENXIO);
369 
370 	nports = ai->nports0 + ai->nports1;
371 	if (nports == 1)
372 		ports = "port";
373 	else
374 		ports = "ports";
375 
376 	device_set_descf(dev, "%s, %d %s", ai->desc, nports, ports);
377 	return (BUS_PROBE_DEFAULT);
378 }
379 
380 #define FW_FNAME "cxgb_t3fw"
381 #define TPEEPROM_NAME "cxgb_t3%c_tp_eeprom"
382 #define TPSRAM_NAME "cxgb_t3%c_protocol_sram"
383 
384 static int
385 upgrade_fw(adapter_t *sc)
386 {
387 	const struct firmware *fw;
388 	int status;
389 	u32 vers;
390 
391 	if ((fw = firmware_get(FW_FNAME)) == NULL)  {
392 		device_printf(sc->dev, "Could not find firmware image %s\n", FW_FNAME);
393 		return (ENOENT);
394 	} else
395 		device_printf(sc->dev, "installing firmware on card\n");
396 	status = t3_load_fw(sc, (const uint8_t *)fw->data, fw->datasize);
397 
398 	if (status != 0) {
399 		device_printf(sc->dev, "failed to install firmware: %d\n",
400 		    status);
401 	} else {
402 		t3_get_fw_version(sc, &vers);
403 		snprintf(&sc->fw_version[0], sizeof(sc->fw_version), "%d.%d.%d",
404 		    G_FW_VERSION_MAJOR(vers), G_FW_VERSION_MINOR(vers),
405 		    G_FW_VERSION_MICRO(vers));
406 	}
407 
408 	firmware_put(fw, FIRMWARE_UNLOAD);
409 
410 	return (status);
411 }
412 
413 /*
414  * The cxgb_controller_attach function is responsible for the initial
415  * bringup of the device.  Its responsibilities include:
416  *
417  *  1. Determine if the device supports MSI or MSI-X.
418  *  2. Allocate bus resources so that we can access the Base Address Register
419  *  3. Create and initialize mutexes for the controller and its control
420  *     logic such as SGE and MDIO.
421  *  4. Call hardware specific setup routine for the adapter as a whole.
422  *  5. Allocate the BAR for doing MSI-X.
423  *  6. Setup the line interrupt iff MSI-X is not supported.
424  *  7. Create the driver's taskq.
425  *  8. Start one task queue service thread.
426  *  9. Check if the firmware and SRAM are up-to-date.  They will be
427  *     auto-updated later (before FULL_INIT_DONE), if required.
428  * 10. Create a child device for each MAC (port)
429  * 11. Initialize T3 private state.
430  * 12. Trigger the LED
431  * 13. Setup offload iff supported.
432  * 14. Reset/restart the tick callout.
433  * 15. Attach sysctls
434  *
435  * NOTE: Any modification or deviation from this list MUST be reflected in
436  * the above comment.  Failure to do so will result in problems on various
437  * error conditions including link flapping.
438  */
439 static int
440 cxgb_controller_attach(device_t dev)
441 {
442 	device_t child;
443 	const struct adapter_info *ai;
444 	struct adapter *sc;
445 	int i, error = 0;
446 	uint32_t vers;
447 	int port_qsets = 1;
448 	int msi_needed, reg;
449 
450 	sc = device_get_softc(dev);
451 	sc->dev = dev;
452 	sc->msi_count = 0;
453 	ai = cxgb_get_adapter_info(dev);
454 
455 	snprintf(sc->lockbuf, ADAPTER_LOCK_NAME_LEN, "cxgb controller lock %d",
456 	    device_get_unit(dev));
457 	ADAPTER_LOCK_INIT(sc, sc->lockbuf);
458 
459 	snprintf(sc->reglockbuf, ADAPTER_LOCK_NAME_LEN, "SGE reg lock %d",
460 	    device_get_unit(dev));
461 	snprintf(sc->mdiolockbuf, ADAPTER_LOCK_NAME_LEN, "cxgb mdio lock %d",
462 	    device_get_unit(dev));
463 	snprintf(sc->elmerlockbuf, ADAPTER_LOCK_NAME_LEN, "cxgb elmer lock %d",
464 	    device_get_unit(dev));
465 
466 	MTX_INIT(&sc->sge.reg_lock, sc->reglockbuf, NULL, MTX_SPIN);
467 	MTX_INIT(&sc->mdio_lock, sc->mdiolockbuf, NULL, MTX_DEF);
468 	MTX_INIT(&sc->elmer_lock, sc->elmerlockbuf, NULL, MTX_DEF);
469 
470 	mtx_lock(&t3_list_lock);
471 	SLIST_INSERT_HEAD(&t3_list, sc, link);
472 	mtx_unlock(&t3_list_lock);
473 
474 	/* find the PCIe link width and set max read request to 4KB*/
475 	if (pci_find_cap(dev, PCIY_EXPRESS, &reg) == 0) {
476 		uint16_t lnk;
477 
478 		lnk = pci_read_config(dev, reg + PCIER_LINK_STA, 2);
479 		sc->link_width = (lnk & PCIEM_LINK_STA_WIDTH) >> 4;
480 		if (sc->link_width < 8 &&
481 		    (ai->caps & SUPPORTED_10000baseT_Full)) {
482 			device_printf(sc->dev,
483 			    "PCIe x%d Link, expect reduced performance\n",
484 			    sc->link_width);
485 		}
486 
487 		pci_set_max_read_req(dev, 4096);
488 	}
489 
490 	touch_bars(dev);
491 	pci_enable_busmaster(dev);
492 	/*
493 	 * Allocate the registers and make them available to the driver.
494 	 * The registers that we care about for NIC mode are in BAR 0
495 	 */
496 	sc->regs_rid = PCIR_BAR(0);
497 	if ((sc->regs_res = bus_alloc_resource_any(dev, SYS_RES_MEMORY,
498 	    &sc->regs_rid, RF_ACTIVE)) == NULL) {
499 		device_printf(dev, "Cannot allocate BAR region 0\n");
500 		error = ENXIO;
501 		goto out;
502 	}
503 
504 	sc->bt = rman_get_bustag(sc->regs_res);
505 	sc->bh = rman_get_bushandle(sc->regs_res);
506 	sc->mmio_len = rman_get_size(sc->regs_res);
507 
508 	for (i = 0; i < MAX_NPORTS; i++)
509 		sc->port[i].adapter = sc;
510 
511 	if (t3_prep_adapter(sc, ai, 1) < 0) {
512 		printf("prep adapter failed\n");
513 		error = ENODEV;
514 		goto out;
515 	}
516 
517 	sc->udbs_rid = PCIR_BAR(2);
518 	sc->udbs_res = NULL;
519 	if (is_offload(sc) &&
520 	    ((sc->udbs_res = bus_alloc_resource_any(dev, SYS_RES_MEMORY,
521 		   &sc->udbs_rid, RF_ACTIVE)) == NULL)) {
522 		device_printf(dev, "Cannot allocate BAR region 1\n");
523 		error = ENXIO;
524 		goto out;
525 	}
526 
527         /* Allocate the BAR for doing MSI-X.  If it succeeds, try to allocate
528 	 * enough messages for the queue sets.  If that fails, try falling
529 	 * back to MSI.  If that fails, then try falling back to the legacy
530 	 * interrupt pin model.
531 	 */
532 	sc->msix_regs_rid = 0x20;
533 	if ((msi_allowed >= 2) &&
534 	    (sc->msix_regs_res = bus_alloc_resource_any(dev, SYS_RES_MEMORY,
535 	    &sc->msix_regs_rid, RF_ACTIVE)) != NULL) {
536 
537 		if (multiq)
538 			port_qsets = min(SGE_QSETS/sc->params.nports, mp_ncpus);
539 		msi_needed = sc->msi_count = sc->params.nports * port_qsets + 1;
540 
541 		if (pci_msix_count(dev) == 0 ||
542 		    (error = pci_alloc_msix(dev, &sc->msi_count)) != 0 ||
543 		    sc->msi_count != msi_needed) {
544 			device_printf(dev, "alloc msix failed - "
545 				      "msi_count=%d, msi_needed=%d, err=%d; "
546 				      "will try MSI\n", sc->msi_count,
547 				      msi_needed, error);
548 			sc->msi_count = 0;
549 			port_qsets = 1;
550 			pci_release_msi(dev);
551 			bus_release_resource(dev, SYS_RES_MEMORY,
552 			    sc->msix_regs_rid, sc->msix_regs_res);
553 			sc->msix_regs_res = NULL;
554 		} else {
555 			sc->flags |= USING_MSIX;
556 			sc->cxgb_intr = cxgb_async_intr;
557 			device_printf(dev,
558 				      "using MSI-X interrupts (%u vectors)\n",
559 				      sc->msi_count);
560 		}
561 	}
562 
563 	if ((msi_allowed >= 1) && (sc->msi_count == 0)) {
564 		sc->msi_count = 1;
565 		if ((error = pci_alloc_msi(dev, &sc->msi_count)) != 0) {
566 			device_printf(dev, "alloc msi failed - "
567 				      "err=%d; will try INTx\n", error);
568 			sc->msi_count = 0;
569 			port_qsets = 1;
570 			pci_release_msi(dev);
571 		} else {
572 			sc->flags |= USING_MSI;
573 			sc->cxgb_intr = t3_intr_msi;
574 			device_printf(dev, "using MSI interrupts\n");
575 		}
576 	}
577 	if (sc->msi_count == 0) {
578 		device_printf(dev, "using line interrupts\n");
579 		sc->cxgb_intr = t3b_intr;
580 	}
581 
582 	/* Create a private taskqueue thread for handling driver events */
583 	sc->tq = taskqueue_create("cxgb_taskq", M_NOWAIT,
584 	    taskqueue_thread_enqueue, &sc->tq);
585 	if (sc->tq == NULL) {
586 		device_printf(dev, "failed to allocate controller task queue\n");
587 		goto out;
588 	}
589 
590 	taskqueue_start_threads(&sc->tq, 1, PI_NET, "%s taskq",
591 	    device_get_nameunit(dev));
592 	TASK_INIT(&sc->tick_task, 0, cxgb_tick_handler, sc);
593 
594 
595 	/* Create a periodic callout for checking adapter status */
596 	callout_init(&sc->cxgb_tick_ch, 1);
597 
598 	if (t3_check_fw_version(sc) < 0 || force_fw_update) {
599 		/*
600 		 * Warn user that a firmware update will be attempted in init.
601 		 */
602 		device_printf(dev, "firmware needs to be updated to version %d.%d.%d\n",
603 		    FW_VERSION_MAJOR, FW_VERSION_MINOR, FW_VERSION_MICRO);
604 		sc->flags &= ~FW_UPTODATE;
605 	} else {
606 		sc->flags |= FW_UPTODATE;
607 	}
608 
609 	if (t3_check_tpsram_version(sc) < 0) {
610 		/*
611 		 * Warn user that a firmware update will be attempted in init.
612 		 */
613 		device_printf(dev, "SRAM needs to be updated to version %c-%d.%d.%d\n",
614 		    t3rev2char(sc), TP_VERSION_MAJOR, TP_VERSION_MINOR, TP_VERSION_MICRO);
615 		sc->flags &= ~TPS_UPTODATE;
616 	} else {
617 		sc->flags |= TPS_UPTODATE;
618 	}
619 
620 	/*
621 	 * Create a child device for each MAC.  The ethernet attachment
622 	 * will be done in these children.
623 	 */
624 	for (i = 0; i < (sc)->params.nports; i++) {
625 		struct port_info *pi;
626 
627 		if ((child = device_add_child(dev, "cxgb", -1)) == NULL) {
628 			device_printf(dev, "failed to add child port\n");
629 			error = EINVAL;
630 			goto out;
631 		}
632 		pi = &sc->port[i];
633 		pi->adapter = sc;
634 		pi->nqsets = port_qsets;
635 		pi->first_qset = i*port_qsets;
636 		pi->port_id = i;
637 		pi->tx_chan = i >= ai->nports0;
638 		pi->txpkt_intf = pi->tx_chan ? 2 * (i - ai->nports0) + 1 : 2 * i;
639 		sc->rxpkt_map[pi->txpkt_intf] = i;
640 		sc->port[i].tx_chan = i >= ai->nports0;
641 		sc->portdev[i] = child;
642 		device_set_softc(child, pi);
643 	}
644 	bus_attach_children(dev);
645 
646 	/* initialize sge private state */
647 	t3_sge_init_adapter(sc);
648 
649 	t3_led_ready(sc);
650 
651 	error = t3_get_fw_version(sc, &vers);
652 	if (error)
653 		goto out;
654 
655 	snprintf(&sc->fw_version[0], sizeof(sc->fw_version), "%d.%d.%d",
656 	    G_FW_VERSION_MAJOR(vers), G_FW_VERSION_MINOR(vers),
657 	    G_FW_VERSION_MICRO(vers));
658 
659 	device_set_descf(dev, "%s %sNIC\t E/C: %s S/N: %s",
660 	    ai->desc, is_offload(sc) ? "R" : "",
661 	    sc->params.vpd.ec, sc->params.vpd.sn);
662 
663 	snprintf(&sc->port_types[0], sizeof(sc->port_types), "%x%x%x%x",
664 		 sc->params.vpd.port_type[0], sc->params.vpd.port_type[1],
665 		 sc->params.vpd.port_type[2], sc->params.vpd.port_type[3]);
666 
667 	device_printf(sc->dev, "Firmware Version %s\n", &sc->fw_version[0]);
668 	callout_reset(&sc->cxgb_tick_ch, hz, cxgb_tick, sc);
669 	t3_add_attach_sysctls(sc);
670 
671 #ifdef TCP_OFFLOAD
672 	for (i = 0; i < NUM_CPL_HANDLERS; i++)
673 		sc->cpl_handler[i] = cpl_not_handled;
674 #endif
675 
676 	t3_intr_clear(sc);
677 	error = cxgb_setup_interrupts(sc);
678 out:
679 	if (error)
680 		cxgb_free(sc);
681 
682 	return (error);
683 }
684 
685 /*
686  * The cxgb_controller_detach routine is called with the device is
687  * unloaded from the system.
688  */
689 
690 static int
691 cxgb_controller_detach(device_t dev)
692 {
693 	struct adapter *sc;
694 
695 	sc = device_get_softc(dev);
696 
697 	cxgb_free(sc);
698 
699 	return (0);
700 }
701 
702 /*
703  * The cxgb_free() is called by the cxgb_controller_detach() routine
704  * to tear down the structures that were built up in
705  * cxgb_controller_attach(), and should be the final piece of work
706  * done when fully unloading the driver.
707  *
708  *
709  *  1. Shutting down the threads started by the cxgb_controller_attach()
710  *     routine.
711  *  2. Stopping the lower level device and all callouts (cxgb_down_locked()).
712  *  3. Detaching all of the port devices created during the
713  *     cxgb_controller_attach() routine.
714  *  4. Removing the device children created via cxgb_controller_attach().
715  *  5. Releasing PCI resources associated with the device.
716  *  6. Turning off the offload support, iff it was turned on.
717  *  7. Destroying the mutexes created in cxgb_controller_attach().
718  *
719  */
720 static void
721 cxgb_free(struct adapter *sc)
722 {
723 	int i, nqsets = 0;
724 
725 	ADAPTER_LOCK(sc);
726 	sc->flags |= CXGB_SHUTDOWN;
727 	ADAPTER_UNLOCK(sc);
728 
729 	/*
730 	 * Make sure all child devices are gone.
731 	 */
732 	bus_detach_children(sc->dev);
733 	for (i = 0; i < (sc)->params.nports; i++) {
734 		if (sc->portdev[i] &&
735 		    device_delete_child(sc->dev, sc->portdev[i]) != 0)
736 			device_printf(sc->dev, "failed to delete child port\n");
737 		nqsets += sc->port[i].nqsets;
738 	}
739 
740 	/*
741 	 * At this point, it is as if cxgb_port_detach has run on all ports, and
742 	 * cxgb_down has run on the adapter.  All interrupts have been silenced,
743 	 * all open devices have been closed.
744 	 */
745 	KASSERT(sc->open_device_map == 0, ("%s: device(s) still open (%x)",
746 					   __func__, sc->open_device_map));
747 	for (i = 0; i < sc->params.nports; i++) {
748 		KASSERT(sc->port[i].ifp == NULL, ("%s: port %i undead!",
749 						  __func__, i));
750 	}
751 
752 	/*
753 	 * Finish off the adapter's callouts.
754 	 */
755 	callout_drain(&sc->cxgb_tick_ch);
756 	callout_drain(&sc->sge_timer_ch);
757 
758 	/*
759 	 * Release resources grabbed under FULL_INIT_DONE by cxgb_up.  The
760 	 * sysctls are cleaned up by the kernel linker.
761 	 */
762 	if (sc->flags & FULL_INIT_DONE) {
763  		t3_free_sge_resources(sc, nqsets);
764  		sc->flags &= ~FULL_INIT_DONE;
765  	}
766 
767 	/*
768 	 * Release all interrupt resources.
769 	 */
770 	cxgb_teardown_interrupts(sc);
771 	if (sc->flags & (USING_MSI | USING_MSIX)) {
772 		device_printf(sc->dev, "releasing msi message(s)\n");
773 		pci_release_msi(sc->dev);
774 	} else {
775 		device_printf(sc->dev, "no msi message to release\n");
776 	}
777 
778 	if (sc->msix_regs_res != NULL) {
779 		bus_release_resource(sc->dev, SYS_RES_MEMORY, sc->msix_regs_rid,
780 		    sc->msix_regs_res);
781 	}
782 
783 	/*
784 	 * Free the adapter's taskqueue.
785 	 */
786 	if (sc->tq != NULL) {
787 		taskqueue_free(sc->tq);
788 		sc->tq = NULL;
789 	}
790 
791 	free(sc->filters, M_DEVBUF);
792 	t3_sge_free(sc);
793 
794 	if (sc->udbs_res != NULL)
795 		bus_release_resource(sc->dev, SYS_RES_MEMORY, sc->udbs_rid,
796 		    sc->udbs_res);
797 
798 	if (sc->regs_res != NULL)
799 		bus_release_resource(sc->dev, SYS_RES_MEMORY, sc->regs_rid,
800 		    sc->regs_res);
801 
802 	MTX_DESTROY(&sc->mdio_lock);
803 	MTX_DESTROY(&sc->sge.reg_lock);
804 	MTX_DESTROY(&sc->elmer_lock);
805 	mtx_lock(&t3_list_lock);
806 	SLIST_REMOVE(&t3_list, sc, adapter, link);
807 	mtx_unlock(&t3_list_lock);
808 	ADAPTER_LOCK_DEINIT(sc);
809 }
810 
811 /**
812  *	setup_sge_qsets - configure SGE Tx/Rx/response queues
813  *	@sc: the controller softc
814  *
815  *	Determines how many sets of SGE queues to use and initializes them.
816  *	We support multiple queue sets per port if we have MSI-X, otherwise
817  *	just one queue set per port.
818  */
819 static int
820 setup_sge_qsets(adapter_t *sc)
821 {
822 	int i, j, err, irq_idx = 0, qset_idx = 0;
823 	u_int ntxq = SGE_TXQ_PER_SET;
824 
825 	if ((err = t3_sge_alloc(sc)) != 0) {
826 		device_printf(sc->dev, "t3_sge_alloc returned %d\n", err);
827 		return (err);
828 	}
829 
830 	if (sc->params.rev > 0 && !(sc->flags & USING_MSI))
831 		irq_idx = -1;
832 
833 	for (i = 0; i < (sc)->params.nports; i++) {
834 		struct port_info *pi = &sc->port[i];
835 
836 		for (j = 0; j < pi->nqsets; j++, qset_idx++) {
837 			err = t3_sge_alloc_qset(sc, qset_idx, (sc)->params.nports,
838 			    (sc->flags & USING_MSIX) ? qset_idx + 1 : irq_idx,
839 			    &sc->params.sge.qset[qset_idx], ntxq, pi);
840 			if (err) {
841 				t3_free_sge_resources(sc, qset_idx);
842 				device_printf(sc->dev,
843 				    "t3_sge_alloc_qset failed with %d\n", err);
844 				return (err);
845 			}
846 		}
847 	}
848 
849 	sc->nqsets = qset_idx;
850 
851 	return (0);
852 }
853 
854 static void
855 cxgb_teardown_interrupts(adapter_t *sc)
856 {
857 	int i;
858 
859 	for (i = 0; i < SGE_QSETS; i++) {
860 		if (sc->msix_intr_tag[i] == NULL) {
861 
862 			/* Should have been setup fully or not at all */
863 			KASSERT(sc->msix_irq_res[i] == NULL &&
864 				sc->msix_irq_rid[i] == 0,
865 				("%s: half-done interrupt (%d).", __func__, i));
866 
867 			continue;
868 		}
869 
870 		bus_teardown_intr(sc->dev, sc->msix_irq_res[i],
871 				  sc->msix_intr_tag[i]);
872 		bus_release_resource(sc->dev, SYS_RES_IRQ, sc->msix_irq_rid[i],
873 				     sc->msix_irq_res[i]);
874 
875 		sc->msix_irq_res[i] = sc->msix_intr_tag[i] = NULL;
876 		sc->msix_irq_rid[i] = 0;
877 	}
878 
879 	if (sc->intr_tag) {
880 		KASSERT(sc->irq_res != NULL,
881 			("%s: half-done interrupt.", __func__));
882 
883 		bus_teardown_intr(sc->dev, sc->irq_res, sc->intr_tag);
884 		bus_release_resource(sc->dev, SYS_RES_IRQ, sc->irq_rid,
885 				     sc->irq_res);
886 
887 		sc->irq_res = sc->intr_tag = NULL;
888 		sc->irq_rid = 0;
889 	}
890 }
891 
892 static int
893 cxgb_setup_interrupts(adapter_t *sc)
894 {
895 	struct resource *res;
896 	void *tag;
897 	int i, rid, err, intr_flag = sc->flags & (USING_MSI | USING_MSIX);
898 
899 	sc->irq_rid = intr_flag ? 1 : 0;
900 	sc->irq_res = bus_alloc_resource_any(sc->dev, SYS_RES_IRQ, &sc->irq_rid,
901 					     RF_SHAREABLE | RF_ACTIVE);
902 	if (sc->irq_res == NULL) {
903 		device_printf(sc->dev, "Cannot allocate interrupt (%x, %u)\n",
904 			      intr_flag, sc->irq_rid);
905 		err = EINVAL;
906 		sc->irq_rid = 0;
907 	} else {
908 		err = bus_setup_intr(sc->dev, sc->irq_res,
909 		    INTR_MPSAFE | INTR_TYPE_NET, NULL,
910 		    sc->cxgb_intr, sc, &sc->intr_tag);
911 
912 		if (err) {
913 			device_printf(sc->dev,
914 				      "Cannot set up interrupt (%x, %u, %d)\n",
915 				      intr_flag, sc->irq_rid, err);
916 			bus_release_resource(sc->dev, SYS_RES_IRQ, sc->irq_rid,
917 					     sc->irq_res);
918 			sc->irq_res = sc->intr_tag = NULL;
919 			sc->irq_rid = 0;
920 		}
921 	}
922 
923 	/* That's all for INTx or MSI */
924 	if (!(intr_flag & USING_MSIX) || err)
925 		return (err);
926 
927 	bus_describe_intr(sc->dev, sc->irq_res, sc->intr_tag, "err");
928 	for (i = 0; i < sc->msi_count - 1; i++) {
929 		rid = i + 2;
930 		res = bus_alloc_resource_any(sc->dev, SYS_RES_IRQ, &rid,
931 					     RF_SHAREABLE | RF_ACTIVE);
932 		if (res == NULL) {
933 			device_printf(sc->dev, "Cannot allocate interrupt "
934 				      "for message %d\n", rid);
935 			err = EINVAL;
936 			break;
937 		}
938 
939 		err = bus_setup_intr(sc->dev, res, INTR_MPSAFE | INTR_TYPE_NET,
940 				     NULL, t3_intr_msix, &sc->sge.qs[i], &tag);
941 		if (err) {
942 			device_printf(sc->dev, "Cannot set up interrupt "
943 				      "for message %d (%d)\n", rid, err);
944 			bus_release_resource(sc->dev, SYS_RES_IRQ, rid, res);
945 			break;
946 		}
947 
948 		sc->msix_irq_rid[i] = rid;
949 		sc->msix_irq_res[i] = res;
950 		sc->msix_intr_tag[i] = tag;
951 		bus_describe_intr(sc->dev, res, tag, "qs%d", i);
952 	}
953 
954 	if (err)
955 		cxgb_teardown_interrupts(sc);
956 
957 	return (err);
958 }
959 
960 
961 static int
962 cxgb_port_probe(device_t dev)
963 {
964 	struct port_info *p;
965 	const char *desc;
966 
967 	p = device_get_softc(dev);
968 	desc = p->phy.desc;
969 	device_set_descf(dev, "Port %d %s", p->port_id, desc);
970 	return (0);
971 }
972 
973 
974 static int
975 cxgb_makedev(struct port_info *pi)
976 {
977 
978 	pi->port_cdev = make_dev(&cxgb_cdevsw, if_getdunit(pi->ifp),
979 	    UID_ROOT, GID_WHEEL, 0600, "%s", if_name(pi->ifp));
980 
981 	if (pi->port_cdev == NULL)
982 		return (ENOMEM);
983 
984 	pi->port_cdev->si_drv1 = (void *)pi;
985 
986 	return (0);
987 }
988 
989 #define CXGB_CAP (IFCAP_VLAN_HWTAGGING | IFCAP_VLAN_MTU | IFCAP_HWCSUM | \
990     IFCAP_VLAN_HWCSUM | IFCAP_TSO | IFCAP_JUMBO_MTU | IFCAP_LRO | \
991     IFCAP_VLAN_HWTSO | IFCAP_LINKSTATE | IFCAP_HWCSUM_IPV6)
992 #define CXGB_CAP_ENABLE CXGB_CAP
993 
994 static int
995 cxgb_port_attach(device_t dev)
996 {
997 	struct port_info *p;
998 	if_t ifp;
999 	int err;
1000 	struct adapter *sc;
1001 
1002 	p = device_get_softc(dev);
1003 	sc = p->adapter;
1004 	snprintf(p->lockbuf, PORT_NAME_LEN, "cxgb port lock %d:%d",
1005 	    device_get_unit(device_get_parent(dev)), p->port_id);
1006 	PORT_LOCK_INIT(p, p->lockbuf);
1007 
1008 	callout_init(&p->link_check_ch, 1);
1009 	TASK_INIT(&p->link_check_task, 0, check_link_status, p);
1010 
1011 	/* Allocate an ifnet object and set it up */
1012 	ifp = p->ifp = if_alloc(IFT_ETHER);
1013 	if_initname(ifp, device_get_name(dev), device_get_unit(dev));
1014 	if_setinitfn(ifp, cxgb_init);
1015 	if_setsoftc(ifp, p);
1016 	if_setflags(ifp, IFF_BROADCAST | IFF_SIMPLEX | IFF_MULTICAST);
1017 	if_setioctlfn(ifp, cxgb_ioctl);
1018 	if_settransmitfn(ifp, cxgb_transmit);
1019 	if_setqflushfn(ifp, cxgb_qflush);
1020 	if_setgetcounterfn(ifp, cxgb_get_counter);
1021 
1022 	if_setcapabilities(ifp, CXGB_CAP);
1023 #ifdef TCP_OFFLOAD
1024 	if (is_offload(sc))
1025 		if_setcapabilitiesbit(ifp, IFCAP_TOE4, 0);
1026 #endif
1027 	if_setcapenable(ifp, CXGB_CAP_ENABLE);
1028 	if_sethwassist(ifp, CSUM_TCP | CSUM_UDP | CSUM_IP | CSUM_TSO |
1029 	    CSUM_UDP_IPV6 | CSUM_TCP_IPV6);
1030 	if_sethwtsomax(ifp, IP_MAXPACKET);
1031 	if_sethwtsomaxsegcount(ifp, 36);
1032 	if_sethwtsomaxsegsize(ifp, 65536);
1033 
1034 	/*
1035 	 * Disable TSO on 4-port - it isn't supported by the firmware.
1036 	 */
1037 	if (sc->params.nports > 2) {
1038 		if_setcapabilitiesbit(ifp, 0, IFCAP_TSO | IFCAP_VLAN_HWTSO);
1039 		if_setcapenablebit(ifp, 0, IFCAP_TSO | IFCAP_VLAN_HWTSO);
1040 		if_sethwassistbits(ifp, 0, CSUM_TSO);
1041 	}
1042 
1043 	/* Create a list of media supported by this port */
1044 	ifmedia_init(&p->media, IFM_IMASK, cxgb_media_change,
1045 	    cxgb_media_status);
1046 	cxgb_build_medialist(p);
1047 
1048 	ether_ifattach(ifp, p->hw_addr);
1049 
1050 	/* Attach driver debugnet methods. */
1051 	DEBUGNET_SET(ifp, cxgb);
1052 
1053 #ifdef DEFAULT_JUMBO
1054 	if (sc->params.nports <= 2)
1055 		if_setmtu(ifp, ETHERMTU_JUMBO);
1056 #endif
1057 	if ((err = cxgb_makedev(p)) != 0) {
1058 		printf("makedev failed %d\n", err);
1059 		return (err);
1060 	}
1061 
1062 	t3_sge_init_port(p);
1063 
1064 	return (err);
1065 }
1066 
1067 /*
1068  * cxgb_port_detach() is called via the device_detach methods when
1069  * cxgb_free() calls the bus_detach_children.  It is responsible for
1070  * removing the device from the view of the kernel, i.e. from all
1071  * interfaces lists etc.  This routine is only called when the driver is
1072  * being unloaded, not when the link goes down.
1073  */
1074 static int
1075 cxgb_port_detach(device_t dev)
1076 {
1077 	struct port_info *p;
1078 	struct adapter *sc;
1079 	int i;
1080 
1081 	p = device_get_softc(dev);
1082 	sc = p->adapter;
1083 
1084 	/* Tell cxgb_ioctl and if_init that the port is going away */
1085 	ADAPTER_LOCK(sc);
1086 	SET_DOOMED(p);
1087 	wakeup(&sc->flags);
1088 	while (IS_BUSY(sc))
1089 		mtx_sleep(&sc->flags, &sc->lock, 0, "cxgbdtch", 0);
1090 	SET_BUSY(sc);
1091 	ADAPTER_UNLOCK(sc);
1092 
1093 	if (p->port_cdev != NULL)
1094 		destroy_dev(p->port_cdev);
1095 
1096 	cxgb_uninit_synchronized(p);
1097 	ether_ifdetach(p->ifp);
1098 
1099 	for (i = p->first_qset; i < p->first_qset + p->nqsets; i++) {
1100 		struct sge_qset *qs = &sc->sge.qs[i];
1101 		struct sge_txq *txq = &qs->txq[TXQ_ETH];
1102 
1103 		callout_drain(&txq->txq_watchdog);
1104 		callout_drain(&txq->txq_timer);
1105 	}
1106 
1107 	PORT_LOCK_DEINIT(p);
1108 	if_free(p->ifp);
1109 	p->ifp = NULL;
1110 
1111 	ADAPTER_LOCK(sc);
1112 	CLR_BUSY(sc);
1113 	wakeup_one(&sc->flags);
1114 	ADAPTER_UNLOCK(sc);
1115 	return (0);
1116 }
1117 
1118 void
1119 t3_fatal_err(struct adapter *sc)
1120 {
1121 	u_int fw_status[4];
1122 
1123 	if (sc->flags & FULL_INIT_DONE) {
1124 		t3_sge_stop(sc);
1125 		t3_write_reg(sc, A_XGM_TX_CTRL, 0);
1126 		t3_write_reg(sc, A_XGM_RX_CTRL, 0);
1127 		t3_write_reg(sc, XGM_REG(A_XGM_TX_CTRL, 1), 0);
1128 		t3_write_reg(sc, XGM_REG(A_XGM_RX_CTRL, 1), 0);
1129 		t3_intr_disable(sc);
1130 	}
1131 	device_printf(sc->dev,"encountered fatal error, operation suspended\n");
1132 	if (!t3_cim_ctl_blk_read(sc, 0xa0, 4, fw_status))
1133 		device_printf(sc->dev, "FW_ status: 0x%x, 0x%x, 0x%x, 0x%x\n",
1134 		    fw_status[0], fw_status[1], fw_status[2], fw_status[3]);
1135 }
1136 
1137 int
1138 t3_os_find_pci_capability(adapter_t *sc, int cap)
1139 {
1140 	device_t dev;
1141 	struct pci_devinfo *dinfo;
1142 	pcicfgregs *cfg;
1143 	uint32_t status;
1144 	uint8_t ptr;
1145 
1146 	dev = sc->dev;
1147 	dinfo = device_get_ivars(dev);
1148 	cfg = &dinfo->cfg;
1149 
1150 	status = pci_read_config(dev, PCIR_STATUS, 2);
1151 	if (!(status & PCIM_STATUS_CAPPRESENT))
1152 		return (0);
1153 
1154 	switch (cfg->hdrtype & PCIM_HDRTYPE) {
1155 	case 0:
1156 	case 1:
1157 		ptr = PCIR_CAP_PTR;
1158 		break;
1159 	case 2:
1160 		ptr = PCIR_CAP_PTR_2;
1161 		break;
1162 	default:
1163 		return (0);
1164 		break;
1165 	}
1166 	ptr = pci_read_config(dev, ptr, 1);
1167 
1168 	while (ptr != 0) {
1169 		if (pci_read_config(dev, ptr + PCICAP_ID, 1) == cap)
1170 			return (ptr);
1171 		ptr = pci_read_config(dev, ptr + PCICAP_NEXTPTR, 1);
1172 	}
1173 
1174 	return (0);
1175 }
1176 
1177 int
1178 t3_os_pci_save_state(struct adapter *sc)
1179 {
1180 	device_t dev;
1181 	struct pci_devinfo *dinfo;
1182 
1183 	dev = sc->dev;
1184 	dinfo = device_get_ivars(dev);
1185 
1186 	pci_cfg_save(dev, dinfo, 0);
1187 	return (0);
1188 }
1189 
1190 int
1191 t3_os_pci_restore_state(struct adapter *sc)
1192 {
1193 	device_t dev;
1194 	struct pci_devinfo *dinfo;
1195 
1196 	dev = sc->dev;
1197 	dinfo = device_get_ivars(dev);
1198 
1199 	pci_cfg_restore(dev, dinfo);
1200 	return (0);
1201 }
1202 
1203 /**
1204  *	t3_os_link_changed - handle link status changes
1205  *	@sc: the adapter associated with the link change
1206  *	@port_id: the port index whose link status has changed
1207  *	@link_status: the new status of the link
1208  *	@speed: the new speed setting
1209  *	@duplex: the new duplex setting
1210  *	@fc: the new flow-control setting
1211  *
1212  *	This is the OS-dependent handler for link status changes.  The OS
1213  *	neutral handler takes care of most of the processing for these events,
1214  *	then calls this handler for any OS-specific processing.
1215  */
1216 void
1217 t3_os_link_changed(adapter_t *adapter, int port_id, int link_status, int speed,
1218      int duplex, int fc, int mac_was_reset)
1219 {
1220 	struct port_info *pi = &adapter->port[port_id];
1221 	if_t ifp = pi->ifp;
1222 
1223 	/* no race with detach, so ifp should always be good */
1224 	KASSERT(ifp, ("%s: if detached.", __func__));
1225 
1226 	/* Reapply mac settings if they were lost due to a reset */
1227 	if (mac_was_reset) {
1228 		PORT_LOCK(pi);
1229 		cxgb_update_mac_settings(pi);
1230 		PORT_UNLOCK(pi);
1231 	}
1232 
1233 	if (link_status) {
1234 		if_setbaudrate(ifp, IF_Mbps(speed));
1235 		if_link_state_change(ifp, LINK_STATE_UP);
1236 	} else
1237 		if_link_state_change(ifp, LINK_STATE_DOWN);
1238 }
1239 
1240 /**
1241  *	t3_os_phymod_changed - handle PHY module changes
1242  *	@phy: the PHY reporting the module change
1243  *	@mod_type: new module type
1244  *
1245  *	This is the OS-dependent handler for PHY module changes.  It is
1246  *	invoked when a PHY module is removed or inserted for any OS-specific
1247  *	processing.
1248  */
1249 void t3_os_phymod_changed(struct adapter *adap, int port_id)
1250 {
1251 	static const char *mod_str[] = {
1252 		NULL, "SR", "LR", "LRM", "TWINAX", "TWINAX-L", "unknown"
1253 	};
1254 	struct port_info *pi = &adap->port[port_id];
1255 	int mod = pi->phy.modtype;
1256 
1257 	if (mod != pi->media.ifm_cur->ifm_data)
1258 		cxgb_build_medialist(pi);
1259 
1260 	if (mod == phy_modtype_none)
1261 		if_printf(pi->ifp, "PHY module unplugged\n");
1262 	else {
1263 		KASSERT(mod < ARRAY_SIZE(mod_str),
1264 			("invalid PHY module type %d", mod));
1265 		if_printf(pi->ifp, "%s PHY module inserted\n", mod_str[mod]);
1266 	}
1267 }
1268 
1269 void
1270 t3_os_set_hw_addr(adapter_t *adapter, int port_idx, u8 hw_addr[])
1271 {
1272 
1273 	/*
1274 	 * The ifnet might not be allocated before this gets called,
1275 	 * as this is called early on in attach by t3_prep_adapter
1276 	 * save the address off in the port structure
1277 	 */
1278 	if (cxgb_debug)
1279 		printf("set_hw_addr on idx %d addr %6D\n", port_idx, hw_addr, ":");
1280 	bcopy(hw_addr, adapter->port[port_idx].hw_addr, ETHER_ADDR_LEN);
1281 }
1282 
1283 /*
1284  * Programs the XGMAC based on the settings in the ifnet.  These settings
1285  * include MTU, MAC address, mcast addresses, etc.
1286  */
1287 static void
1288 cxgb_update_mac_settings(struct port_info *p)
1289 {
1290 	if_t ifp = p->ifp;
1291 	struct t3_rx_mode rm;
1292 	struct cmac *mac = &p->mac;
1293 	int mtu, hwtagging;
1294 
1295 	PORT_LOCK_ASSERT_OWNED(p);
1296 
1297 	bcopy(if_getlladdr(ifp), p->hw_addr, ETHER_ADDR_LEN);
1298 
1299 	mtu = if_getmtu(ifp);
1300 	if (if_getcapenable(ifp) & IFCAP_VLAN_MTU)
1301 		mtu += ETHER_VLAN_ENCAP_LEN;
1302 
1303 	hwtagging = (if_getcapenable(ifp) & IFCAP_VLAN_HWTAGGING) != 0;
1304 
1305 	t3_mac_set_mtu(mac, mtu);
1306 	t3_set_vlan_accel(p->adapter, 1 << p->tx_chan, hwtagging);
1307 	t3_mac_set_address(mac, 0, p->hw_addr);
1308 	t3_init_rx_mode(&rm, p);
1309 	t3_mac_set_rx_mode(mac, &rm);
1310 }
1311 
1312 
1313 static int
1314 await_mgmt_replies(struct adapter *adap, unsigned long init_cnt,
1315 			      unsigned long n)
1316 {
1317 	int attempts = 5;
1318 
1319 	while (adap->sge.qs[0].rspq.offload_pkts < init_cnt + n) {
1320 		if (!--attempts)
1321 			return (ETIMEDOUT);
1322 		t3_os_sleep(10);
1323 	}
1324 	return 0;
1325 }
1326 
1327 static int
1328 init_tp_parity(struct adapter *adap)
1329 {
1330 	int i;
1331 	struct mbuf *m;
1332 	struct cpl_set_tcb_field *greq;
1333 	unsigned long cnt = adap->sge.qs[0].rspq.offload_pkts;
1334 
1335 	t3_tp_set_offload_mode(adap, 1);
1336 
1337 	for (i = 0; i < 16; i++) {
1338 		struct cpl_smt_write_req *req;
1339 
1340 		m = m_gethdr(M_WAITOK, MT_DATA);
1341 		req = mtod(m, struct cpl_smt_write_req *);
1342 		m->m_len = m->m_pkthdr.len = sizeof(*req);
1343 		memset(req, 0, sizeof(*req));
1344 		req->wr.wrh_hi = htonl(V_WR_OP(FW_WROPCODE_FORWARD));
1345 		OPCODE_TID(req) = htonl(MK_OPCODE_TID(CPL_SMT_WRITE_REQ, i));
1346 		req->iff = i;
1347 		t3_mgmt_tx(adap, m);
1348 	}
1349 
1350 	for (i = 0; i < 2048; i++) {
1351 		struct cpl_l2t_write_req *req;
1352 
1353 		m = m_gethdr(M_WAITOK, MT_DATA);
1354 		req = mtod(m, struct cpl_l2t_write_req *);
1355 		m->m_len = m->m_pkthdr.len = sizeof(*req);
1356 		memset(req, 0, sizeof(*req));
1357 		req->wr.wrh_hi = htonl(V_WR_OP(FW_WROPCODE_FORWARD));
1358 		OPCODE_TID(req) = htonl(MK_OPCODE_TID(CPL_L2T_WRITE_REQ, i));
1359 		req->params = htonl(V_L2T_W_IDX(i));
1360 		t3_mgmt_tx(adap, m);
1361 	}
1362 
1363 	for (i = 0; i < 2048; i++) {
1364 		struct cpl_rte_write_req *req;
1365 
1366 		m = m_gethdr(M_WAITOK, MT_DATA);
1367 		req = mtod(m, struct cpl_rte_write_req *);
1368 		m->m_len = m->m_pkthdr.len = sizeof(*req);
1369 		memset(req, 0, sizeof(*req));
1370 		req->wr.wrh_hi = htonl(V_WR_OP(FW_WROPCODE_FORWARD));
1371 		OPCODE_TID(req) = htonl(MK_OPCODE_TID(CPL_RTE_WRITE_REQ, i));
1372 		req->l2t_idx = htonl(V_L2T_W_IDX(i));
1373 		t3_mgmt_tx(adap, m);
1374 	}
1375 
1376 	m = m_gethdr(M_WAITOK, MT_DATA);
1377 	greq = mtod(m, struct cpl_set_tcb_field *);
1378 	m->m_len = m->m_pkthdr.len = sizeof(*greq);
1379 	memset(greq, 0, sizeof(*greq));
1380 	greq->wr.wrh_hi = htonl(V_WR_OP(FW_WROPCODE_FORWARD));
1381 	OPCODE_TID(greq) = htonl(MK_OPCODE_TID(CPL_SET_TCB_FIELD, 0));
1382 	greq->mask = htobe64(1);
1383 	t3_mgmt_tx(adap, m);
1384 
1385 	i = await_mgmt_replies(adap, cnt, 16 + 2048 + 2048 + 1);
1386 	t3_tp_set_offload_mode(adap, 0);
1387 	return (i);
1388 }
1389 
1390 /**
1391  *	setup_rss - configure Receive Side Steering (per-queue connection demux)
1392  *	@adap: the adapter
1393  *
1394  *	Sets up RSS to distribute packets to multiple receive queues.  We
1395  *	configure the RSS CPU lookup table to distribute to the number of HW
1396  *	receive queues, and the response queue lookup table to narrow that
1397  *	down to the response queues actually configured for each port.
1398  *	We always configure the RSS mapping for two ports since the mapping
1399  *	table has plenty of entries.
1400  */
1401 static void
1402 setup_rss(adapter_t *adap)
1403 {
1404 	int i;
1405 	u_int nq[2];
1406 	uint8_t cpus[SGE_QSETS + 1];
1407 	uint16_t rspq_map[RSS_TABLE_SIZE];
1408 
1409 	for (i = 0; i < SGE_QSETS; ++i)
1410 		cpus[i] = i;
1411 	cpus[SGE_QSETS] = 0xff;
1412 
1413 	nq[0] = nq[1] = 0;
1414 	for_each_port(adap, i) {
1415 		const struct port_info *pi = adap2pinfo(adap, i);
1416 
1417 		nq[pi->tx_chan] += pi->nqsets;
1418 	}
1419 	for (i = 0; i < RSS_TABLE_SIZE / 2; ++i) {
1420 		rspq_map[i] = nq[0] ? i % nq[0] : 0;
1421 		rspq_map[i + RSS_TABLE_SIZE / 2] = nq[1] ? i % nq[1] + nq[0] : 0;
1422 	}
1423 
1424 	/* Calculate the reverse RSS map table */
1425 	for (i = 0; i < SGE_QSETS; ++i)
1426 		adap->rrss_map[i] = 0xff;
1427 	for (i = 0; i < RSS_TABLE_SIZE; ++i)
1428 		if (adap->rrss_map[rspq_map[i]] == 0xff)
1429 			adap->rrss_map[rspq_map[i]] = i;
1430 
1431 	t3_config_rss(adap, F_RQFEEDBACKENABLE | F_TNLLKPEN | F_TNLMAPEN |
1432 		      F_TNLPRTEN | F_TNL2TUPEN | F_TNL4TUPEN | F_OFDMAPEN |
1433 	              F_RRCPLMAPEN | V_RRCPLCPUSIZE(6) | F_HASHTOEPLITZ,
1434 	              cpus, rspq_map);
1435 
1436 }
1437 static void
1438 send_pktsched_cmd(struct adapter *adap, int sched, int qidx, int lo,
1439 			      int hi, int port)
1440 {
1441 	struct mbuf *m;
1442 	struct mngt_pktsched_wr *req;
1443 
1444 	m = m_gethdr(M_NOWAIT, MT_DATA);
1445 	if (m) {
1446 		req = mtod(m, struct mngt_pktsched_wr *);
1447 		req->wr.wrh_hi = htonl(V_WR_OP(FW_WROPCODE_MNGT));
1448 		req->mngt_opcode = FW_MNGTOPCODE_PKTSCHED_SET;
1449 		req->sched = sched;
1450 		req->idx = qidx;
1451 		req->min = lo;
1452 		req->max = hi;
1453 		req->binding = port;
1454 		m->m_len = m->m_pkthdr.len = sizeof(*req);
1455 		t3_mgmt_tx(adap, m);
1456 	}
1457 }
1458 
1459 static void
1460 bind_qsets(adapter_t *sc)
1461 {
1462 	int i, j;
1463 
1464 	for (i = 0; i < (sc)->params.nports; ++i) {
1465 		const struct port_info *pi = adap2pinfo(sc, i);
1466 
1467 		for (j = 0; j < pi->nqsets; ++j) {
1468 			send_pktsched_cmd(sc, 1, pi->first_qset + j, -1,
1469 					  -1, pi->tx_chan);
1470 
1471 		}
1472 	}
1473 }
1474 
1475 static void
1476 update_tpeeprom(struct adapter *adap)
1477 {
1478 	const struct firmware *tpeeprom;
1479 
1480 	uint32_t version;
1481 	unsigned int major, minor;
1482 	int ret, len;
1483 	char rev, name[32];
1484 
1485 	t3_seeprom_read(adap, TP_SRAM_OFFSET, &version);
1486 
1487 	major = G_TP_VERSION_MAJOR(version);
1488 	minor = G_TP_VERSION_MINOR(version);
1489 	if (major == TP_VERSION_MAJOR  && minor == TP_VERSION_MINOR)
1490 		return;
1491 
1492 	rev = t3rev2char(adap);
1493 	snprintf(name, sizeof(name), TPEEPROM_NAME, rev);
1494 
1495 	tpeeprom = firmware_get(name);
1496 	if (tpeeprom == NULL) {
1497 		device_printf(adap->dev,
1498 			      "could not load TP EEPROM: unable to load %s\n",
1499 			      name);
1500 		return;
1501 	}
1502 
1503 	len = tpeeprom->datasize - 4;
1504 
1505 	ret = t3_check_tpsram(adap, tpeeprom->data, tpeeprom->datasize);
1506 	if (ret)
1507 		goto release_tpeeprom;
1508 
1509 	if (len != TP_SRAM_LEN) {
1510 		device_printf(adap->dev,
1511 			      "%s length is wrong len=%d expected=%d\n", name,
1512 			      len, TP_SRAM_LEN);
1513 		return;
1514 	}
1515 
1516 	ret = set_eeprom(&adap->port[0], tpeeprom->data, tpeeprom->datasize,
1517 	    TP_SRAM_OFFSET);
1518 
1519 	if (!ret) {
1520 		device_printf(adap->dev,
1521 			"Protocol SRAM image updated in EEPROM to %d.%d.%d\n",
1522 			 TP_VERSION_MAJOR, TP_VERSION_MINOR, TP_VERSION_MICRO);
1523 	} else
1524 		device_printf(adap->dev,
1525 			      "Protocol SRAM image update in EEPROM failed\n");
1526 
1527 release_tpeeprom:
1528 	firmware_put(tpeeprom, FIRMWARE_UNLOAD);
1529 
1530 	return;
1531 }
1532 
1533 static int
1534 update_tpsram(struct adapter *adap)
1535 {
1536 	const struct firmware *tpsram;
1537 	int ret;
1538 	char rev, name[32];
1539 
1540 	rev = t3rev2char(adap);
1541 	snprintf(name, sizeof(name), TPSRAM_NAME, rev);
1542 
1543 	update_tpeeprom(adap);
1544 
1545 	tpsram = firmware_get(name);
1546 	if (tpsram == NULL){
1547 		device_printf(adap->dev, "could not load TP SRAM\n");
1548 		return (EINVAL);
1549 	} else
1550 		device_printf(adap->dev, "updating TP SRAM\n");
1551 
1552 	ret = t3_check_tpsram(adap, tpsram->data, tpsram->datasize);
1553 	if (ret)
1554 		goto release_tpsram;
1555 
1556 	ret = t3_set_proto_sram(adap, tpsram->data);
1557 	if (ret)
1558 		device_printf(adap->dev, "loading protocol SRAM failed\n");
1559 
1560 release_tpsram:
1561 	firmware_put(tpsram, FIRMWARE_UNLOAD);
1562 
1563 	return ret;
1564 }
1565 
1566 /**
1567  *	cxgb_up - enable the adapter
1568  *	@adap: adapter being enabled
1569  *
1570  *	Called when the first port is enabled, this function performs the
1571  *	actions necessary to make an adapter operational, such as completing
1572  *	the initialization of HW modules, and enabling interrupts.
1573  */
1574 static int
1575 cxgb_up(struct adapter *sc)
1576 {
1577 	int err = 0;
1578 	unsigned int mxf = t3_mc5_size(&sc->mc5) - MC5_MIN_TIDS;
1579 
1580 	KASSERT(sc->open_device_map == 0, ("%s: device(s) already open (%x)",
1581 					   __func__, sc->open_device_map));
1582 
1583 	if ((sc->flags & FULL_INIT_DONE) == 0) {
1584 
1585 		ADAPTER_LOCK_ASSERT_NOTOWNED(sc);
1586 
1587 		if ((sc->flags & FW_UPTODATE) == 0)
1588 			if ((err = upgrade_fw(sc)))
1589 				goto out;
1590 
1591 		if ((sc->flags & TPS_UPTODATE) == 0)
1592 			if ((err = update_tpsram(sc)))
1593 				goto out;
1594 
1595 		if (is_offload(sc) && nfilters != 0) {
1596 			sc->params.mc5.nservers = 0;
1597 
1598 			if (nfilters < 0)
1599 				sc->params.mc5.nfilters = mxf;
1600 			else
1601 				sc->params.mc5.nfilters = min(nfilters, mxf);
1602 		}
1603 
1604 		err = t3_init_hw(sc, 0);
1605 		if (err)
1606 			goto out;
1607 
1608 		t3_set_reg_field(sc, A_TP_PARA_REG5, 0, F_RXDDPOFFINIT);
1609 		t3_write_reg(sc, A_ULPRX_TDDP_PSZ, V_HPZ0(PAGE_SHIFT - 12));
1610 
1611 		err = setup_sge_qsets(sc);
1612 		if (err)
1613 			goto out;
1614 
1615 		alloc_filters(sc);
1616 		setup_rss(sc);
1617 
1618 		t3_add_configured_sysctls(sc);
1619 		sc->flags |= FULL_INIT_DONE;
1620 	}
1621 
1622 	t3_intr_clear(sc);
1623 	t3_sge_start(sc);
1624 	t3_intr_enable(sc);
1625 
1626 	if (sc->params.rev >= T3_REV_C && !(sc->flags & TP_PARITY_INIT) &&
1627 	    is_offload(sc) && init_tp_parity(sc) == 0)
1628 		sc->flags |= TP_PARITY_INIT;
1629 
1630 	if (sc->flags & TP_PARITY_INIT) {
1631 		t3_write_reg(sc, A_TP_INT_CAUSE, F_CMCACHEPERR | F_ARPLUTPERR);
1632 		t3_write_reg(sc, A_TP_INT_ENABLE, 0x7fbfffff);
1633 	}
1634 
1635 	if (!(sc->flags & QUEUES_BOUND)) {
1636 		bind_qsets(sc);
1637 		setup_hw_filters(sc);
1638 		sc->flags |= QUEUES_BOUND;
1639 	}
1640 
1641 	t3_sge_reset_adapter(sc);
1642 out:
1643 	return (err);
1644 }
1645 
1646 /*
1647  * Called when the last open device is closed.  Does NOT undo all of cxgb_up's
1648  * work.  Specifically, the resources grabbed under FULL_INIT_DONE are released
1649  * during controller_detach, not here.
1650  */
1651 static void
1652 cxgb_down(struct adapter *sc)
1653 {
1654 	t3_sge_stop(sc);
1655 	t3_intr_disable(sc);
1656 }
1657 
1658 /*
1659  * if_init for cxgb ports.
1660  */
1661 static void
1662 cxgb_init(void *arg)
1663 {
1664 	struct port_info *p = arg;
1665 	struct adapter *sc = p->adapter;
1666 
1667 	ADAPTER_LOCK(sc);
1668 	cxgb_init_locked(p); /* releases adapter lock */
1669 	ADAPTER_LOCK_ASSERT_NOTOWNED(sc);
1670 }
1671 
1672 static int
1673 cxgb_init_locked(struct port_info *p)
1674 {
1675 	struct adapter *sc = p->adapter;
1676 	if_t ifp = p->ifp;
1677 	struct cmac *mac = &p->mac;
1678 	int i, rc = 0, may_sleep = 0, gave_up_lock = 0;
1679 
1680 	ADAPTER_LOCK_ASSERT_OWNED(sc);
1681 
1682 	while (!IS_DOOMED(p) && IS_BUSY(sc)) {
1683 		gave_up_lock = 1;
1684 		if (mtx_sleep(&sc->flags, &sc->lock, PCATCH, "cxgbinit", 0)) {
1685 			rc = EINTR;
1686 			goto done;
1687 		}
1688 	}
1689 	if (IS_DOOMED(p)) {
1690 		rc = ENXIO;
1691 		goto done;
1692 	}
1693 	KASSERT(!IS_BUSY(sc), ("%s: controller busy.", __func__));
1694 
1695 	/*
1696 	 * The code that runs during one-time adapter initialization can sleep
1697 	 * so it's important not to hold any locks across it.
1698 	 */
1699 	may_sleep = sc->flags & FULL_INIT_DONE ? 0 : 1;
1700 
1701 	if (may_sleep) {
1702 		SET_BUSY(sc);
1703 		gave_up_lock = 1;
1704 		ADAPTER_UNLOCK(sc);
1705 	}
1706 
1707 	if (sc->open_device_map == 0 && ((rc = cxgb_up(sc)) != 0))
1708 			goto done;
1709 
1710 	PORT_LOCK(p);
1711 	if (isset(&sc->open_device_map, p->port_id) &&
1712 	    (if_getdrvflags(ifp) & IFF_DRV_RUNNING)) {
1713 		PORT_UNLOCK(p);
1714 		goto done;
1715 	}
1716 	t3_port_intr_enable(sc, p->port_id);
1717 	if (!mac->multiport)
1718 		t3_mac_init(mac);
1719 	cxgb_update_mac_settings(p);
1720 	t3_link_start(&p->phy, mac, &p->link_config);
1721 	t3_mac_enable(mac, MAC_DIRECTION_RX | MAC_DIRECTION_TX);
1722 	if_setdrvflagbits(ifp, IFF_DRV_RUNNING, IFF_DRV_OACTIVE);
1723 	PORT_UNLOCK(p);
1724 
1725 	for (i = p->first_qset; i < p->first_qset + p->nqsets; i++) {
1726 		struct sge_qset *qs = &sc->sge.qs[i];
1727 		struct sge_txq *txq = &qs->txq[TXQ_ETH];
1728 
1729 		callout_reset_on(&txq->txq_watchdog, hz, cxgb_tx_watchdog, qs,
1730 				 txq->txq_watchdog.c_cpu);
1731 	}
1732 
1733 	/* all ok */
1734 	setbit(&sc->open_device_map, p->port_id);
1735 	callout_reset(&p->link_check_ch,
1736 	    p->phy.caps & SUPPORTED_LINK_IRQ ?  hz * 3 : hz / 4,
1737 	    link_check_callout, p);
1738 
1739 done:
1740 	if (may_sleep) {
1741 		ADAPTER_LOCK(sc);
1742 		KASSERT(IS_BUSY(sc), ("%s: controller not busy.", __func__));
1743 		CLR_BUSY(sc);
1744 	}
1745 	if (gave_up_lock)
1746 		wakeup_one(&sc->flags);
1747 	ADAPTER_UNLOCK(sc);
1748 	return (rc);
1749 }
1750 
1751 static int
1752 cxgb_uninit_locked(struct port_info *p)
1753 {
1754 	struct adapter *sc = p->adapter;
1755 	int rc;
1756 
1757 	ADAPTER_LOCK_ASSERT_OWNED(sc);
1758 
1759 	while (!IS_DOOMED(p) && IS_BUSY(sc)) {
1760 		if (mtx_sleep(&sc->flags, &sc->lock, PCATCH, "cxgbunin", 0)) {
1761 			rc = EINTR;
1762 			goto done;
1763 		}
1764 	}
1765 	if (IS_DOOMED(p)) {
1766 		rc = ENXIO;
1767 		goto done;
1768 	}
1769 	KASSERT(!IS_BUSY(sc), ("%s: controller busy.", __func__));
1770 	SET_BUSY(sc);
1771 	ADAPTER_UNLOCK(sc);
1772 
1773 	rc = cxgb_uninit_synchronized(p);
1774 
1775 	ADAPTER_LOCK(sc);
1776 	KASSERT(IS_BUSY(sc), ("%s: controller not busy.", __func__));
1777 	CLR_BUSY(sc);
1778 	wakeup_one(&sc->flags);
1779 done:
1780 	ADAPTER_UNLOCK(sc);
1781 	return (rc);
1782 }
1783 
1784 /*
1785  * Called on "ifconfig down", and from port_detach
1786  */
1787 static int
1788 cxgb_uninit_synchronized(struct port_info *pi)
1789 {
1790 	struct adapter *sc = pi->adapter;
1791 	if_t ifp = pi->ifp;
1792 
1793 	/*
1794 	 * taskqueue_drain may cause a deadlock if the adapter lock is held.
1795 	 */
1796 	ADAPTER_LOCK_ASSERT_NOTOWNED(sc);
1797 
1798 	/*
1799 	 * Clear this port's bit from the open device map, and then drain all
1800 	 * the tasks that can access/manipulate this port's port_info or ifp.
1801 	 * We disable this port's interrupts here and so the slow/ext
1802 	 * interrupt tasks won't be enqueued.  The tick task will continue to
1803 	 * be enqueued every second but the runs after this drain will not see
1804 	 * this port in the open device map.
1805 	 *
1806 	 * A well behaved task must take open_device_map into account and ignore
1807 	 * ports that are not open.
1808 	 */
1809 	clrbit(&sc->open_device_map, pi->port_id);
1810 	t3_port_intr_disable(sc, pi->port_id);
1811 	taskqueue_drain(sc->tq, &sc->slow_intr_task);
1812 	taskqueue_drain(sc->tq, &sc->tick_task);
1813 
1814 	callout_drain(&pi->link_check_ch);
1815 	taskqueue_drain(sc->tq, &pi->link_check_task);
1816 
1817 	PORT_LOCK(pi);
1818 	if_setdrvflagbits(ifp, 0, IFF_DRV_RUNNING | IFF_DRV_OACTIVE);
1819 
1820 	/* disable pause frames */
1821 	t3_set_reg_field(sc, A_XGM_TX_CFG + pi->mac.offset, F_TXPAUSEEN, 0);
1822 
1823 	/* Reset RX FIFO HWM */
1824 	t3_set_reg_field(sc, A_XGM_RXFIFO_CFG +  pi->mac.offset,
1825 			 V_RXFIFOPAUSEHWM(M_RXFIFOPAUSEHWM), 0);
1826 
1827 	DELAY(100 * 1000);
1828 
1829 	/* Wait for TXFIFO empty */
1830 	t3_wait_op_done(sc, A_XGM_TXFIFO_CFG + pi->mac.offset,
1831 			F_TXFIFO_EMPTY, 1, 20, 5);
1832 
1833 	DELAY(100 * 1000);
1834 	t3_mac_disable(&pi->mac, MAC_DIRECTION_RX);
1835 
1836 	pi->phy.ops->power_down(&pi->phy, 1);
1837 
1838 	PORT_UNLOCK(pi);
1839 
1840 	pi->link_config.link_ok = 0;
1841 	t3_os_link_changed(sc, pi->port_id, 0, 0, 0, 0, 0);
1842 
1843 	if (sc->open_device_map == 0)
1844 		cxgb_down(pi->adapter);
1845 
1846 	return (0);
1847 }
1848 
1849 /*
1850  * Mark lro enabled or disabled in all qsets for this port
1851  */
1852 static int
1853 cxgb_set_lro(struct port_info *p, int enabled)
1854 {
1855 	int i;
1856 	struct adapter *adp = p->adapter;
1857 	struct sge_qset *q;
1858 
1859 	for (i = 0; i < p->nqsets; i++) {
1860 		q = &adp->sge.qs[p->first_qset + i];
1861 		q->lro.enabled = (enabled != 0);
1862 	}
1863 	return (0);
1864 }
1865 
1866 static int
1867 cxgb_ioctl(if_t ifp, unsigned long command, caddr_t data)
1868 {
1869 	struct port_info *p = if_getsoftc(ifp);
1870 	struct adapter *sc = p->adapter;
1871 	struct ifreq *ifr = (struct ifreq *)data;
1872 	int flags, error = 0, mtu;
1873 	uint32_t mask;
1874 
1875 	switch (command) {
1876 	case SIOCSIFMTU:
1877 		ADAPTER_LOCK(sc);
1878 		error = IS_DOOMED(p) ? ENXIO : (IS_BUSY(sc) ? EBUSY : 0);
1879 		if (error) {
1880 fail:
1881 			ADAPTER_UNLOCK(sc);
1882 			return (error);
1883 		}
1884 
1885 		mtu = ifr->ifr_mtu;
1886 		if ((mtu < ETHERMIN) || (mtu > ETHERMTU_JUMBO)) {
1887 			error = EINVAL;
1888 		} else {
1889 			if_setmtu(ifp, mtu);
1890 			PORT_LOCK(p);
1891 			cxgb_update_mac_settings(p);
1892 			PORT_UNLOCK(p);
1893 		}
1894 		ADAPTER_UNLOCK(sc);
1895 		break;
1896 	case SIOCSIFFLAGS:
1897 		ADAPTER_LOCK(sc);
1898 		if (IS_DOOMED(p)) {
1899 			error = ENXIO;
1900 			goto fail;
1901 		}
1902 		if (if_getflags(ifp) & IFF_UP) {
1903 			if (if_getdrvflags(ifp) & IFF_DRV_RUNNING) {
1904 				flags = p->if_flags;
1905 				if (((if_getflags(ifp) ^ flags) & IFF_PROMISC) ||
1906 				    ((if_getflags(ifp) ^ flags) & IFF_ALLMULTI)) {
1907 					if (IS_BUSY(sc)) {
1908 						error = EBUSY;
1909 						goto fail;
1910 					}
1911 					PORT_LOCK(p);
1912 					cxgb_update_mac_settings(p);
1913 					PORT_UNLOCK(p);
1914 				}
1915 				ADAPTER_UNLOCK(sc);
1916 			} else
1917 				error = cxgb_init_locked(p);
1918 			p->if_flags = if_getflags(ifp);
1919 		} else if (if_getdrvflags(ifp) & IFF_DRV_RUNNING)
1920 			error = cxgb_uninit_locked(p);
1921 		else
1922 			ADAPTER_UNLOCK(sc);
1923 
1924 		ADAPTER_LOCK_ASSERT_NOTOWNED(sc);
1925 		break;
1926 	case SIOCADDMULTI:
1927 	case SIOCDELMULTI:
1928 		ADAPTER_LOCK(sc);
1929 		error = IS_DOOMED(p) ? ENXIO : (IS_BUSY(sc) ? EBUSY : 0);
1930 		if (error)
1931 			goto fail;
1932 
1933 		if (if_getdrvflags(ifp) & IFF_DRV_RUNNING) {
1934 			PORT_LOCK(p);
1935 			cxgb_update_mac_settings(p);
1936 			PORT_UNLOCK(p);
1937 		}
1938 		ADAPTER_UNLOCK(sc);
1939 
1940 		break;
1941 	case SIOCSIFCAP:
1942 		ADAPTER_LOCK(sc);
1943 		error = IS_DOOMED(p) ? ENXIO : (IS_BUSY(sc) ? EBUSY : 0);
1944 		if (error)
1945 			goto fail;
1946 
1947 		mask = ifr->ifr_reqcap ^ if_getcapenable(ifp);
1948 		if (mask & IFCAP_TXCSUM) {
1949 			if_togglecapenable(ifp, IFCAP_TXCSUM);
1950 			if_togglehwassist(ifp, CSUM_TCP | CSUM_UDP | CSUM_IP);
1951 
1952 			if (IFCAP_TSO4 & if_getcapenable(ifp) &&
1953 			    !(IFCAP_TXCSUM & if_getcapenable(ifp))) {
1954 				mask &= ~IFCAP_TSO4;
1955 				if_setcapenablebit(ifp, 0, IFCAP_TSO4);
1956 				if_printf(ifp,
1957 				    "tso4 disabled due to -txcsum.\n");
1958 			}
1959 		}
1960 		if (mask & IFCAP_TXCSUM_IPV6) {
1961 			if_togglecapenable(ifp, IFCAP_TXCSUM_IPV6);
1962 			if_togglehwassist(ifp, CSUM_UDP_IPV6 | CSUM_TCP_IPV6);
1963 
1964 			if (IFCAP_TSO6 & if_getcapenable(ifp) &&
1965 			    !(IFCAP_TXCSUM_IPV6 & if_getcapenable(ifp))) {
1966 				mask &= ~IFCAP_TSO6;
1967 				if_setcapenablebit(ifp, 0, IFCAP_TSO6);
1968 				if_printf(ifp,
1969 				    "tso6 disabled due to -txcsum6.\n");
1970 			}
1971 		}
1972 		if (mask & IFCAP_RXCSUM)
1973 			if_togglecapenable(ifp, IFCAP_RXCSUM);
1974 		if (mask & IFCAP_RXCSUM_IPV6)
1975 			if_togglecapenable(ifp, IFCAP_RXCSUM_IPV6);
1976 
1977 		/*
1978 		 * Note that we leave CSUM_TSO alone (it is always set).  The
1979 		 * kernel takes both IFCAP_TSOx and CSUM_TSO into account before
1980 		 * sending a TSO request our way, so it's sufficient to toggle
1981 		 * IFCAP_TSOx only.
1982 		 */
1983 		if (mask & IFCAP_TSO4) {
1984 			if (!(IFCAP_TSO4 & if_getcapenable(ifp)) &&
1985 			    !(IFCAP_TXCSUM & if_getcapenable(ifp))) {
1986 				if_printf(ifp, "enable txcsum first.\n");
1987 				error = EAGAIN;
1988 				goto fail;
1989 			}
1990 			if_togglecapenable(ifp, IFCAP_TSO4);
1991 		}
1992 		if (mask & IFCAP_TSO6) {
1993 			if (!(IFCAP_TSO6 & if_getcapenable(ifp)) &&
1994 			    !(IFCAP_TXCSUM_IPV6 & if_getcapenable(ifp))) {
1995 				if_printf(ifp, "enable txcsum6 first.\n");
1996 				error = EAGAIN;
1997 				goto fail;
1998 			}
1999 			if_togglecapenable(ifp, IFCAP_TSO6);
2000 		}
2001 		if (mask & IFCAP_LRO) {
2002 			if_togglecapenable(ifp, IFCAP_LRO);
2003 
2004 			/* Safe to do this even if cxgb_up not called yet */
2005 			cxgb_set_lro(p, if_getcapenable(ifp) & IFCAP_LRO);
2006 		}
2007 #ifdef TCP_OFFLOAD
2008 		if (mask & IFCAP_TOE4) {
2009 			int enable = (if_getcapenable(ifp) ^ mask) & IFCAP_TOE4;
2010 
2011 			error = toe_capability(p, enable);
2012 			if (error == 0)
2013 				if_togglecapenable(ifp, mask);
2014 		}
2015 #endif
2016 		if (mask & IFCAP_VLAN_HWTAGGING) {
2017 			if_togglecapenable(ifp, IFCAP_VLAN_HWTAGGING);
2018 			if (if_getdrvflags(ifp) & IFF_DRV_RUNNING) {
2019 				PORT_LOCK(p);
2020 				cxgb_update_mac_settings(p);
2021 				PORT_UNLOCK(p);
2022 			}
2023 		}
2024 		if (mask & IFCAP_VLAN_MTU) {
2025 			if_togglecapenable(ifp, IFCAP_VLAN_MTU);
2026 			if (if_getdrvflags(ifp) & IFF_DRV_RUNNING) {
2027 				PORT_LOCK(p);
2028 				cxgb_update_mac_settings(p);
2029 				PORT_UNLOCK(p);
2030 			}
2031 		}
2032 		if (mask & IFCAP_VLAN_HWTSO)
2033 			if_togglecapenable(ifp, IFCAP_VLAN_HWTSO);
2034 		if (mask & IFCAP_VLAN_HWCSUM)
2035 			if_togglecapenable(ifp, IFCAP_VLAN_HWCSUM);
2036 
2037 #ifdef VLAN_CAPABILITIES
2038 		VLAN_CAPABILITIES(ifp);
2039 #endif
2040 		ADAPTER_UNLOCK(sc);
2041 		break;
2042 	case SIOCSIFMEDIA:
2043 	case SIOCGIFMEDIA:
2044 		error = ifmedia_ioctl(ifp, ifr, &p->media, command);
2045 		break;
2046 	default:
2047 		error = ether_ioctl(ifp, command, data);
2048 	}
2049 
2050 	return (error);
2051 }
2052 
2053 static int
2054 cxgb_media_change(if_t ifp)
2055 {
2056 	return (EOPNOTSUPP);
2057 }
2058 
2059 /*
2060  * Translates phy->modtype to the correct Ethernet media subtype.
2061  */
2062 static int
2063 cxgb_ifm_type(int mod)
2064 {
2065 	switch (mod) {
2066 	case phy_modtype_sr:
2067 		return (IFM_10G_SR);
2068 	case phy_modtype_lr:
2069 		return (IFM_10G_LR);
2070 	case phy_modtype_lrm:
2071 		return (IFM_10G_LRM);
2072 	case phy_modtype_twinax:
2073 		return (IFM_10G_TWINAX);
2074 	case phy_modtype_twinax_long:
2075 		return (IFM_10G_TWINAX_LONG);
2076 	case phy_modtype_none:
2077 		return (IFM_NONE);
2078 	case phy_modtype_unknown:
2079 		return (IFM_UNKNOWN);
2080 	}
2081 
2082 	KASSERT(0, ("%s: modtype %d unknown", __func__, mod));
2083 	return (IFM_UNKNOWN);
2084 }
2085 
2086 /*
2087  * Rebuilds the ifmedia list for this port, and sets the current media.
2088  */
2089 static void
2090 cxgb_build_medialist(struct port_info *p)
2091 {
2092 	struct cphy *phy = &p->phy;
2093 	struct ifmedia *media = &p->media;
2094 	int mod = phy->modtype;
2095 	int m = IFM_ETHER | IFM_FDX;
2096 
2097 	PORT_LOCK(p);
2098 
2099 	ifmedia_removeall(media);
2100 	if (phy->caps & SUPPORTED_TP && phy->caps & SUPPORTED_Autoneg) {
2101 		/* Copper (RJ45) */
2102 
2103 		if (phy->caps & SUPPORTED_10000baseT_Full)
2104 			ifmedia_add(media, m | IFM_10G_T, mod, NULL);
2105 
2106 		if (phy->caps & SUPPORTED_1000baseT_Full)
2107 			ifmedia_add(media, m | IFM_1000_T, mod, NULL);
2108 
2109 		if (phy->caps & SUPPORTED_100baseT_Full)
2110 			ifmedia_add(media, m | IFM_100_TX, mod, NULL);
2111 
2112 		if (phy->caps & SUPPORTED_10baseT_Full)
2113 			ifmedia_add(media, m | IFM_10_T, mod, NULL);
2114 
2115 		ifmedia_add(media, IFM_ETHER | IFM_AUTO, mod, NULL);
2116 		ifmedia_set(media, IFM_ETHER | IFM_AUTO);
2117 
2118 	} else if (phy->caps & SUPPORTED_TP) {
2119 		/* Copper (CX4) */
2120 
2121 		KASSERT(phy->caps & SUPPORTED_10000baseT_Full,
2122 			("%s: unexpected cap 0x%x", __func__, phy->caps));
2123 
2124 		ifmedia_add(media, m | IFM_10G_CX4, mod, NULL);
2125 		ifmedia_set(media, m | IFM_10G_CX4);
2126 
2127 	} else if (phy->caps & SUPPORTED_FIBRE &&
2128 		   phy->caps & SUPPORTED_10000baseT_Full) {
2129 		/* 10G optical (but includes SFP+ twinax) */
2130 
2131 		m |= cxgb_ifm_type(mod);
2132 		if (IFM_SUBTYPE(m) == IFM_NONE)
2133 			m &= ~IFM_FDX;
2134 
2135 		ifmedia_add(media, m, mod, NULL);
2136 		ifmedia_set(media, m);
2137 
2138 	} else if (phy->caps & SUPPORTED_FIBRE &&
2139 		   phy->caps & SUPPORTED_1000baseT_Full) {
2140 		/* 1G optical */
2141 
2142 		/* XXX: Lie and claim to be SX, could actually be any 1G-X */
2143 		ifmedia_add(media, m | IFM_1000_SX, mod, NULL);
2144 		ifmedia_set(media, m | IFM_1000_SX);
2145 
2146 	} else {
2147 		KASSERT(0, ("%s: don't know how to handle 0x%x.", __func__,
2148 			    phy->caps));
2149 	}
2150 
2151 	PORT_UNLOCK(p);
2152 }
2153 
2154 static void
2155 cxgb_media_status(if_t ifp, struct ifmediareq *ifmr)
2156 {
2157 	struct port_info *p = if_getsoftc(ifp);
2158 	struct ifmedia_entry *cur = p->media.ifm_cur;
2159 	int speed = p->link_config.speed;
2160 
2161 	if (cur->ifm_data != p->phy.modtype) {
2162 		cxgb_build_medialist(p);
2163 		cur = p->media.ifm_cur;
2164 	}
2165 
2166 	ifmr->ifm_status = IFM_AVALID;
2167 	if (!p->link_config.link_ok)
2168 		return;
2169 
2170 	ifmr->ifm_status |= IFM_ACTIVE;
2171 
2172 	/*
2173 	 * active and current will differ iff current media is autoselect.  That
2174 	 * can happen only for copper RJ45.
2175 	 */
2176 	if (IFM_SUBTYPE(cur->ifm_media) != IFM_AUTO)
2177 		return;
2178 	KASSERT(p->phy.caps & SUPPORTED_TP && p->phy.caps & SUPPORTED_Autoneg,
2179 		("%s: unexpected PHY caps 0x%x", __func__, p->phy.caps));
2180 
2181 	ifmr->ifm_active = IFM_ETHER | IFM_FDX;
2182 	if (speed == SPEED_10000)
2183 		ifmr->ifm_active |= IFM_10G_T;
2184 	else if (speed == SPEED_1000)
2185 		ifmr->ifm_active |= IFM_1000_T;
2186 	else if (speed == SPEED_100)
2187 		ifmr->ifm_active |= IFM_100_TX;
2188 	else if (speed == SPEED_10)
2189 		ifmr->ifm_active |= IFM_10_T;
2190 	else
2191 		KASSERT(0, ("%s: link up but speed unknown (%u)", __func__,
2192 			    speed));
2193 }
2194 
2195 static uint64_t
2196 cxgb_get_counter(if_t ifp, ift_counter c)
2197 {
2198 	struct port_info *pi = if_getsoftc(ifp);
2199 	struct adapter *sc = pi->adapter;
2200 	struct cmac *mac = &pi->mac;
2201 	struct mac_stats *mstats = &mac->stats;
2202 
2203 	cxgb_refresh_stats(pi);
2204 
2205 	switch (c) {
2206 	case IFCOUNTER_IPACKETS:
2207 		return (mstats->rx_frames);
2208 
2209 	case IFCOUNTER_IERRORS:
2210 		return (mstats->rx_jabber + mstats->rx_data_errs +
2211 		    mstats->rx_sequence_errs + mstats->rx_runt +
2212 		    mstats->rx_too_long + mstats->rx_mac_internal_errs +
2213 		    mstats->rx_short + mstats->rx_fcs_errs);
2214 
2215 	case IFCOUNTER_OPACKETS:
2216 		return (mstats->tx_frames);
2217 
2218 	case IFCOUNTER_OERRORS:
2219 		return (mstats->tx_excess_collisions + mstats->tx_underrun +
2220 		    mstats->tx_len_errs + mstats->tx_mac_internal_errs +
2221 		    mstats->tx_excess_deferral + mstats->tx_fcs_errs);
2222 
2223 	case IFCOUNTER_COLLISIONS:
2224 		return (mstats->tx_total_collisions);
2225 
2226 	case IFCOUNTER_IBYTES:
2227 		return (mstats->rx_octets);
2228 
2229 	case IFCOUNTER_OBYTES:
2230 		return (mstats->tx_octets);
2231 
2232 	case IFCOUNTER_IMCASTS:
2233 		return (mstats->rx_mcast_frames);
2234 
2235 	case IFCOUNTER_OMCASTS:
2236 		return (mstats->tx_mcast_frames);
2237 
2238 	case IFCOUNTER_IQDROPS:
2239 		return (mstats->rx_cong_drops);
2240 
2241 	case IFCOUNTER_OQDROPS: {
2242 		int i;
2243 		uint64_t drops;
2244 
2245 		drops = 0;
2246 		if (sc->flags & FULL_INIT_DONE) {
2247 			for (i = pi->first_qset; i < pi->first_qset + pi->nqsets; i++)
2248 				drops += sc->sge.qs[i].txq[TXQ_ETH].txq_mr->br_drops;
2249 		}
2250 
2251 		return (drops);
2252 
2253 	}
2254 
2255 	default:
2256 		return (if_get_counter_default(ifp, c));
2257 	}
2258 }
2259 
2260 static void
2261 cxgb_async_intr(void *data)
2262 {
2263 	adapter_t *sc = data;
2264 
2265 	t3_write_reg(sc, A_PL_INT_ENABLE0, 0);
2266 	(void) t3_read_reg(sc, A_PL_INT_ENABLE0);
2267 	taskqueue_enqueue(sc->tq, &sc->slow_intr_task);
2268 }
2269 
2270 static void
2271 link_check_callout(void *arg)
2272 {
2273 	struct port_info *pi = arg;
2274 	struct adapter *sc = pi->adapter;
2275 
2276 	if (!isset(&sc->open_device_map, pi->port_id))
2277 		return;
2278 
2279 	taskqueue_enqueue(sc->tq, &pi->link_check_task);
2280 }
2281 
2282 static void
2283 check_link_status(void *arg, int pending)
2284 {
2285 	struct port_info *pi = arg;
2286 	struct adapter *sc = pi->adapter;
2287 
2288 	if (!isset(&sc->open_device_map, pi->port_id))
2289 		return;
2290 
2291 	t3_link_changed(sc, pi->port_id);
2292 
2293 	if (pi->link_fault || !(pi->phy.caps & SUPPORTED_LINK_IRQ) ||
2294 	    pi->link_config.link_ok == 0)
2295 		callout_reset(&pi->link_check_ch, hz, link_check_callout, pi);
2296 }
2297 
2298 void
2299 t3_os_link_intr(struct port_info *pi)
2300 {
2301 	/*
2302 	 * Schedule a link check in the near future.  If the link is flapping
2303 	 * rapidly we'll keep resetting the callout and delaying the check until
2304 	 * things stabilize a bit.
2305 	 */
2306 	callout_reset(&pi->link_check_ch, hz / 4, link_check_callout, pi);
2307 }
2308 
2309 static void
2310 check_t3b2_mac(struct adapter *sc)
2311 {
2312 	int i;
2313 
2314 	if (sc->flags & CXGB_SHUTDOWN)
2315 		return;
2316 
2317 	for_each_port(sc, i) {
2318 		struct port_info *p = &sc->port[i];
2319 		int status;
2320 #ifdef INVARIANTS
2321 		if_t ifp = p->ifp;
2322 #endif
2323 
2324 		if (!isset(&sc->open_device_map, p->port_id) || p->link_fault ||
2325 		    !p->link_config.link_ok)
2326 			continue;
2327 
2328 		KASSERT(if_getdrvflags(ifp) & IFF_DRV_RUNNING,
2329 			("%s: state mismatch (drv_flags %x, device_map %x)",
2330 			 __func__, if_getdrvflags(ifp), sc->open_device_map));
2331 
2332 		PORT_LOCK(p);
2333 		status = t3b2_mac_watchdog_task(&p->mac);
2334 		if (status == 1)
2335 			p->mac.stats.num_toggled++;
2336 		else if (status == 2) {
2337 			struct cmac *mac = &p->mac;
2338 
2339 			cxgb_update_mac_settings(p);
2340 			t3_link_start(&p->phy, mac, &p->link_config);
2341 			t3_mac_enable(mac, MAC_DIRECTION_RX | MAC_DIRECTION_TX);
2342 			t3_port_intr_enable(sc, p->port_id);
2343 			p->mac.stats.num_resets++;
2344 		}
2345 		PORT_UNLOCK(p);
2346 	}
2347 }
2348 
2349 static void
2350 cxgb_tick(void *arg)
2351 {
2352 	adapter_t *sc = (adapter_t *)arg;
2353 
2354 	if (sc->flags & CXGB_SHUTDOWN)
2355 		return;
2356 
2357 	taskqueue_enqueue(sc->tq, &sc->tick_task);
2358 	callout_reset(&sc->cxgb_tick_ch, hz, cxgb_tick, sc);
2359 }
2360 
2361 void
2362 cxgb_refresh_stats(struct port_info *pi)
2363 {
2364 	struct timeval tv;
2365 	const struct timeval interval = {0, 250000};    /* 250ms */
2366 
2367 	getmicrotime(&tv);
2368 	timevalsub(&tv, &interval);
2369 	if (timevalcmp(&tv, &pi->last_refreshed, <))
2370 		return;
2371 
2372 	PORT_LOCK(pi);
2373 	t3_mac_update_stats(&pi->mac);
2374 	PORT_UNLOCK(pi);
2375 	getmicrotime(&pi->last_refreshed);
2376 }
2377 
2378 static void
2379 cxgb_tick_handler(void *arg, int count)
2380 {
2381 	adapter_t *sc = (adapter_t *)arg;
2382 	const struct adapter_params *p = &sc->params;
2383 	int i;
2384 	uint32_t cause, reset;
2385 
2386 	if (sc->flags & CXGB_SHUTDOWN || !(sc->flags & FULL_INIT_DONE))
2387 		return;
2388 
2389 	if (p->rev == T3_REV_B2 && p->nports < 4 && sc->open_device_map)
2390 		check_t3b2_mac(sc);
2391 
2392 	cause = t3_read_reg(sc, A_SG_INT_CAUSE) & (F_RSPQSTARVE | F_FLEMPTY);
2393 	if (cause) {
2394 		struct sge_qset *qs = &sc->sge.qs[0];
2395 		uint32_t mask, v;
2396 
2397 		v = t3_read_reg(sc, A_SG_RSPQ_FL_STATUS) & ~0xff00;
2398 
2399 		mask = 1;
2400 		for (i = 0; i < SGE_QSETS; i++) {
2401 			if (v & mask)
2402 				qs[i].rspq.starved++;
2403 			mask <<= 1;
2404 		}
2405 
2406 		mask <<= SGE_QSETS; /* skip RSPQXDISABLED */
2407 
2408 		for (i = 0; i < SGE_QSETS * 2; i++) {
2409 			if (v & mask) {
2410 				qs[i / 2].fl[i % 2].empty++;
2411 			}
2412 			mask <<= 1;
2413 		}
2414 
2415 		/* clear */
2416 		t3_write_reg(sc, A_SG_RSPQ_FL_STATUS, v);
2417 		t3_write_reg(sc, A_SG_INT_CAUSE, cause);
2418 	}
2419 
2420 	for (i = 0; i < sc->params.nports; i++) {
2421 		struct port_info *pi = &sc->port[i];
2422 		struct cmac *mac = &pi->mac;
2423 
2424 		if (!isset(&sc->open_device_map, pi->port_id))
2425 			continue;
2426 
2427 		cxgb_refresh_stats(pi);
2428 
2429 		if (mac->multiport)
2430 			continue;
2431 
2432 		/* Count rx fifo overflows, once per second */
2433 		cause = t3_read_reg(sc, A_XGM_INT_CAUSE + mac->offset);
2434 		reset = 0;
2435 		if (cause & F_RXFIFO_OVERFLOW) {
2436 			mac->stats.rx_fifo_ovfl++;
2437 			reset |= F_RXFIFO_OVERFLOW;
2438 		}
2439 		t3_write_reg(sc, A_XGM_INT_CAUSE + mac->offset, reset);
2440 	}
2441 }
2442 
2443 static void
2444 touch_bars(device_t dev)
2445 {
2446 	/*
2447 	 * Don't enable yet
2448 	 */
2449 #if !defined(__LP64__) && 0
2450 	u32 v;
2451 
2452 	pci_read_config_dword(pdev, PCI_BASE_ADDRESS_1, &v);
2453 	pci_write_config_dword(pdev, PCI_BASE_ADDRESS_1, v);
2454 	pci_read_config_dword(pdev, PCI_BASE_ADDRESS_3, &v);
2455 	pci_write_config_dword(pdev, PCI_BASE_ADDRESS_3, v);
2456 	pci_read_config_dword(pdev, PCI_BASE_ADDRESS_5, &v);
2457 	pci_write_config_dword(pdev, PCI_BASE_ADDRESS_5, v);
2458 #endif
2459 }
2460 
2461 static int
2462 set_eeprom(struct port_info *pi, const uint8_t *data, int len, int offset)
2463 {
2464 	uint8_t *buf;
2465 	int err = 0;
2466 	u32 aligned_offset, aligned_len, *p;
2467 	struct adapter *adapter = pi->adapter;
2468 
2469 
2470 	aligned_offset = offset & ~3;
2471 	aligned_len = (len + (offset & 3) + 3) & ~3;
2472 
2473 	if (aligned_offset != offset || aligned_len != len) {
2474 		buf = malloc(aligned_len, M_DEVBUF, M_WAITOK | M_ZERO);
2475 		err = t3_seeprom_read(adapter, aligned_offset, (u32 *)buf);
2476 		if (!err && aligned_len > 4)
2477 			err = t3_seeprom_read(adapter,
2478 					      aligned_offset + aligned_len - 4,
2479 					      (u32 *)&buf[aligned_len - 4]);
2480 		if (err)
2481 			goto out;
2482 		memcpy(buf + (offset & 3), data, len);
2483 	} else
2484 		buf = (uint8_t *)(uintptr_t)data;
2485 
2486 	err = t3_seeprom_wp(adapter, 0);
2487 	if (err)
2488 		goto out;
2489 
2490 	for (p = (u32 *)buf; !err && aligned_len; aligned_len -= 4, p++) {
2491 		err = t3_seeprom_write(adapter, aligned_offset, *p);
2492 		aligned_offset += 4;
2493 	}
2494 
2495 	if (!err)
2496 		err = t3_seeprom_wp(adapter, 1);
2497 out:
2498 	if (buf != data)
2499 		free(buf, M_DEVBUF);
2500 	return err;
2501 }
2502 
2503 
2504 static int
2505 in_range(int val, int lo, int hi)
2506 {
2507 	return val < 0 || (val <= hi && val >= lo);
2508 }
2509 
2510 static int
2511 cxgb_extension_open(struct cdev *dev, int flags, int fmp, struct thread *td)
2512 {
2513        return (0);
2514 }
2515 
2516 static int
2517 cxgb_extension_close(struct cdev *dev, int flags, int fmt, struct thread *td)
2518 {
2519        return (0);
2520 }
2521 
2522 static int
2523 cxgb_extension_ioctl(struct cdev *dev, unsigned long cmd, caddr_t data,
2524     int fflag, struct thread *td)
2525 {
2526 	int mmd, error = 0;
2527 	struct port_info *pi = dev->si_drv1;
2528 	adapter_t *sc = pi->adapter;
2529 
2530 #ifdef PRIV_SUPPORTED
2531 	if (priv_check(td, PRIV_DRIVER)) {
2532 		if (cxgb_debug)
2533 			printf("user does not have access to privileged ioctls\n");
2534 		return (EPERM);
2535 	}
2536 #else
2537 	if (suser(td)) {
2538 		if (cxgb_debug)
2539 			printf("user does not have access to privileged ioctls\n");
2540 		return (EPERM);
2541 	}
2542 #endif
2543 
2544 	switch (cmd) {
2545 	case CHELSIO_GET_MIIREG: {
2546 		uint32_t val;
2547 		struct cphy *phy = &pi->phy;
2548 		struct ch_mii_data *mid = (struct ch_mii_data *)data;
2549 
2550 		if (!phy->mdio_read)
2551 			return (EOPNOTSUPP);
2552 		if (is_10G(sc)) {
2553 			mmd = mid->phy_id >> 8;
2554 			if (!mmd)
2555 				mmd = MDIO_DEV_PCS;
2556 			else if (mmd > MDIO_DEV_VEND2)
2557 				return (EINVAL);
2558 
2559 			error = phy->mdio_read(sc, mid->phy_id & 0x1f, mmd,
2560 					     mid->reg_num, &val);
2561 		} else
2562 		        error = phy->mdio_read(sc, mid->phy_id & 0x1f, 0,
2563 					     mid->reg_num & 0x1f, &val);
2564 		if (error == 0)
2565 			mid->val_out = val;
2566 		break;
2567 	}
2568 	case CHELSIO_SET_MIIREG: {
2569 		struct cphy *phy = &pi->phy;
2570 		struct ch_mii_data *mid = (struct ch_mii_data *)data;
2571 
2572 		if (!phy->mdio_write)
2573 			return (EOPNOTSUPP);
2574 		if (is_10G(sc)) {
2575 			mmd = mid->phy_id >> 8;
2576 			if (!mmd)
2577 				mmd = MDIO_DEV_PCS;
2578 			else if (mmd > MDIO_DEV_VEND2)
2579 				return (EINVAL);
2580 
2581 			error = phy->mdio_write(sc, mid->phy_id & 0x1f,
2582 					      mmd, mid->reg_num, mid->val_in);
2583 		} else
2584 			error = phy->mdio_write(sc, mid->phy_id & 0x1f, 0,
2585 					      mid->reg_num & 0x1f,
2586 					      mid->val_in);
2587 		break;
2588 	}
2589 	case CHELSIO_SETREG: {
2590 		struct ch_reg *edata = (struct ch_reg *)data;
2591 		if ((edata->addr & 0x3) != 0 || edata->addr >= sc->mmio_len)
2592 			return (EFAULT);
2593 		t3_write_reg(sc, edata->addr, edata->val);
2594 		break;
2595 	}
2596 	case CHELSIO_GETREG: {
2597 		struct ch_reg *edata = (struct ch_reg *)data;
2598 		if ((edata->addr & 0x3) != 0 || edata->addr >= sc->mmio_len)
2599 			return (EFAULT);
2600 		edata->val = t3_read_reg(sc, edata->addr);
2601 		break;
2602 	}
2603 	case CHELSIO_GET_SGE_CONTEXT: {
2604 		struct ch_cntxt *ecntxt = (struct ch_cntxt *)data;
2605 		mtx_lock_spin(&sc->sge.reg_lock);
2606 		switch (ecntxt->cntxt_type) {
2607 		case CNTXT_TYPE_EGRESS:
2608 			error = -t3_sge_read_ecntxt(sc, ecntxt->cntxt_id,
2609 			    ecntxt->data);
2610 			break;
2611 		case CNTXT_TYPE_FL:
2612 			error = -t3_sge_read_fl(sc, ecntxt->cntxt_id,
2613 			    ecntxt->data);
2614 			break;
2615 		case CNTXT_TYPE_RSP:
2616 			error = -t3_sge_read_rspq(sc, ecntxt->cntxt_id,
2617 			    ecntxt->data);
2618 			break;
2619 		case CNTXT_TYPE_CQ:
2620 			error = -t3_sge_read_cq(sc, ecntxt->cntxt_id,
2621 			    ecntxt->data);
2622 			break;
2623 		default:
2624 			error = EINVAL;
2625 			break;
2626 		}
2627 		mtx_unlock_spin(&sc->sge.reg_lock);
2628 		break;
2629 	}
2630 	case CHELSIO_GET_SGE_DESC: {
2631 		struct ch_desc *edesc = (struct ch_desc *)data;
2632 		int ret;
2633 		if (edesc->queue_num >= SGE_QSETS * 6)
2634 			return (EINVAL);
2635 		ret = t3_get_desc(&sc->sge.qs[edesc->queue_num / 6],
2636 		    edesc->queue_num % 6, edesc->idx, edesc->data);
2637 		if (ret < 0)
2638 			return (EINVAL);
2639 		edesc->size = ret;
2640 		break;
2641 	}
2642 	case CHELSIO_GET_QSET_PARAMS: {
2643 		struct qset_params *q;
2644 		struct ch_qset_params *t = (struct ch_qset_params *)data;
2645 		int q1 = pi->first_qset;
2646 		int nqsets = pi->nqsets;
2647 		int i;
2648 
2649 		if (t->qset_idx >= nqsets)
2650 			return EINVAL;
2651 
2652 		i = q1 + t->qset_idx;
2653 		q = &sc->params.sge.qset[i];
2654 		t->rspq_size   = q->rspq_size;
2655 		t->txq_size[0] = q->txq_size[0];
2656 		t->txq_size[1] = q->txq_size[1];
2657 		t->txq_size[2] = q->txq_size[2];
2658 		t->fl_size[0]  = q->fl_size;
2659 		t->fl_size[1]  = q->jumbo_size;
2660 		t->polling     = q->polling;
2661 		t->lro         = q->lro;
2662 		t->intr_lat    = q->coalesce_usecs;
2663 		t->cong_thres  = q->cong_thres;
2664 		t->qnum        = i;
2665 
2666 		if ((sc->flags & FULL_INIT_DONE) == 0)
2667 			t->vector = 0;
2668 		else if (sc->flags & USING_MSIX)
2669 			t->vector = rman_get_start(sc->msix_irq_res[i]);
2670 		else
2671 			t->vector = rman_get_start(sc->irq_res);
2672 
2673 		break;
2674 	}
2675 	case CHELSIO_GET_QSET_NUM: {
2676 		struct ch_reg *edata = (struct ch_reg *)data;
2677 		edata->val = pi->nqsets;
2678 		break;
2679 	}
2680 	case CHELSIO_LOAD_FW: {
2681 		uint8_t *fw_data;
2682 		uint32_t vers;
2683 		struct ch_mem_range *t = (struct ch_mem_range *)data;
2684 
2685 		/*
2686 		 * You're allowed to load a firmware only before FULL_INIT_DONE
2687 		 *
2688 		 * FW_UPTODATE is also set so the rest of the initialization
2689 		 * will not overwrite what was loaded here.  This gives you the
2690 		 * flexibility to load any firmware (and maybe shoot yourself in
2691 		 * the foot).
2692 		 */
2693 
2694 		ADAPTER_LOCK(sc);
2695 		if (sc->open_device_map || sc->flags & FULL_INIT_DONE) {
2696 			ADAPTER_UNLOCK(sc);
2697 			return (EBUSY);
2698 		}
2699 
2700 		fw_data = malloc(t->len, M_DEVBUF, M_NOWAIT);
2701 		if (!fw_data)
2702 			error = ENOMEM;
2703 		else
2704 			error = copyin(t->buf, fw_data, t->len);
2705 
2706 		if (!error)
2707 			error = -t3_load_fw(sc, fw_data, t->len);
2708 
2709 		if (t3_get_fw_version(sc, &vers) == 0) {
2710 			snprintf(&sc->fw_version[0], sizeof(sc->fw_version),
2711 			    "%d.%d.%d", G_FW_VERSION_MAJOR(vers),
2712 			    G_FW_VERSION_MINOR(vers), G_FW_VERSION_MICRO(vers));
2713 		}
2714 
2715 		if (!error)
2716 			sc->flags |= FW_UPTODATE;
2717 
2718 		free(fw_data, M_DEVBUF);
2719 		ADAPTER_UNLOCK(sc);
2720 		break;
2721 	}
2722 	case CHELSIO_LOAD_BOOT: {
2723 		uint8_t *boot_data;
2724 		struct ch_mem_range *t = (struct ch_mem_range *)data;
2725 
2726 		boot_data = malloc(t->len, M_DEVBUF, M_NOWAIT);
2727 		if (!boot_data)
2728 			return ENOMEM;
2729 
2730 		error = copyin(t->buf, boot_data, t->len);
2731 		if (!error)
2732 			error = -t3_load_boot(sc, boot_data, t->len);
2733 
2734 		free(boot_data, M_DEVBUF);
2735 		break;
2736 	}
2737 	case CHELSIO_GET_PM: {
2738 		struct ch_pm *m = (struct ch_pm *)data;
2739 		struct tp_params *p = &sc->params.tp;
2740 
2741 		if (!is_offload(sc))
2742 			return (EOPNOTSUPP);
2743 
2744 		m->tx_pg_sz = p->tx_pg_size;
2745 		m->tx_num_pg = p->tx_num_pgs;
2746 		m->rx_pg_sz  = p->rx_pg_size;
2747 		m->rx_num_pg = p->rx_num_pgs;
2748 		m->pm_total  = p->pmtx_size + p->chan_rx_size * p->nchan;
2749 
2750 		break;
2751 	}
2752 	case CHELSIO_SET_PM: {
2753 		struct ch_pm *m = (struct ch_pm *)data;
2754 		struct tp_params *p = &sc->params.tp;
2755 
2756 		if (!is_offload(sc))
2757 			return (EOPNOTSUPP);
2758 		if (sc->flags & FULL_INIT_DONE)
2759 			return (EBUSY);
2760 
2761 		if (!m->rx_pg_sz || (m->rx_pg_sz & (m->rx_pg_sz - 1)) ||
2762 		    !m->tx_pg_sz || (m->tx_pg_sz & (m->tx_pg_sz - 1)))
2763 			return (EINVAL);	/* not power of 2 */
2764 		if (!(m->rx_pg_sz & 0x14000))
2765 			return (EINVAL);	/* not 16KB or 64KB */
2766 		if (!(m->tx_pg_sz & 0x1554000))
2767 			return (EINVAL);
2768 		if (m->tx_num_pg == -1)
2769 			m->tx_num_pg = p->tx_num_pgs;
2770 		if (m->rx_num_pg == -1)
2771 			m->rx_num_pg = p->rx_num_pgs;
2772 		if (m->tx_num_pg % 24 || m->rx_num_pg % 24)
2773 			return (EINVAL);
2774 		if (m->rx_num_pg * m->rx_pg_sz > p->chan_rx_size ||
2775 		    m->tx_num_pg * m->tx_pg_sz > p->chan_tx_size)
2776 			return (EINVAL);
2777 
2778 		p->rx_pg_size = m->rx_pg_sz;
2779 		p->tx_pg_size = m->tx_pg_sz;
2780 		p->rx_num_pgs = m->rx_num_pg;
2781 		p->tx_num_pgs = m->tx_num_pg;
2782 		break;
2783 	}
2784 	case CHELSIO_SETMTUTAB: {
2785 		struct ch_mtus *m = (struct ch_mtus *)data;
2786 		int i;
2787 
2788 		if (!is_offload(sc))
2789 			return (EOPNOTSUPP);
2790 		if (offload_running(sc))
2791 			return (EBUSY);
2792 		if (m->nmtus != NMTUS)
2793 			return (EINVAL);
2794 		if (m->mtus[0] < 81)         /* accommodate SACK */
2795 			return (EINVAL);
2796 
2797 		/*
2798 		 * MTUs must be in ascending order
2799 		 */
2800 		for (i = 1; i < NMTUS; ++i)
2801 			if (m->mtus[i] < m->mtus[i - 1])
2802 				return (EINVAL);
2803 
2804 		memcpy(sc->params.mtus, m->mtus, sizeof(sc->params.mtus));
2805 		break;
2806 	}
2807 	case CHELSIO_GETMTUTAB: {
2808 		struct ch_mtus *m = (struct ch_mtus *)data;
2809 
2810 		if (!is_offload(sc))
2811 			return (EOPNOTSUPP);
2812 
2813 		memcpy(m->mtus, sc->params.mtus, sizeof(m->mtus));
2814 		m->nmtus = NMTUS;
2815 		break;
2816 	}
2817 	case CHELSIO_GET_MEM: {
2818 		struct ch_mem_range *t = (struct ch_mem_range *)data;
2819 		struct mc7 *mem;
2820 		uint8_t *useraddr;
2821 		u64 buf[32];
2822 
2823 		/*
2824 		 * Use these to avoid modifying len/addr in the return
2825 		 * struct
2826 		 */
2827 		uint32_t len = t->len, addr = t->addr;
2828 
2829 		if (!is_offload(sc))
2830 			return (EOPNOTSUPP);
2831 		if (!(sc->flags & FULL_INIT_DONE))
2832 			return (EIO);         /* need the memory controllers */
2833 		if ((addr & 0x7) || (len & 0x7))
2834 			return (EINVAL);
2835 		if (t->mem_id == MEM_CM)
2836 			mem = &sc->cm;
2837 		else if (t->mem_id == MEM_PMRX)
2838 			mem = &sc->pmrx;
2839 		else if (t->mem_id == MEM_PMTX)
2840 			mem = &sc->pmtx;
2841 		else
2842 			return (EINVAL);
2843 
2844 		/*
2845 		 * Version scheme:
2846 		 * bits 0..9: chip version
2847 		 * bits 10..15: chip revision
2848 		 */
2849 		t->version = 3 | (sc->params.rev << 10);
2850 
2851 		/*
2852 		 * Read 256 bytes at a time as len can be large and we don't
2853 		 * want to use huge intermediate buffers.
2854 		 */
2855 		useraddr = (uint8_t *)t->buf;
2856 		while (len) {
2857 			unsigned int chunk = min(len, sizeof(buf));
2858 
2859 			error = t3_mc7_bd_read(mem, addr / 8, chunk / 8, buf);
2860 			if (error)
2861 				return (-error);
2862 			if (copyout(buf, useraddr, chunk))
2863 				return (EFAULT);
2864 			useraddr += chunk;
2865 			addr += chunk;
2866 			len -= chunk;
2867 		}
2868 		break;
2869 	}
2870 	case CHELSIO_READ_TCAM_WORD: {
2871 		struct ch_tcam_word *t = (struct ch_tcam_word *)data;
2872 
2873 		if (!is_offload(sc))
2874 			return (EOPNOTSUPP);
2875 		if (!(sc->flags & FULL_INIT_DONE))
2876 			return (EIO);         /* need MC5 */
2877 		return -t3_read_mc5_range(&sc->mc5, t->addr, 1, t->buf);
2878 		break;
2879 	}
2880 	case CHELSIO_SET_TRACE_FILTER: {
2881 		struct ch_trace *t = (struct ch_trace *)data;
2882 		const struct trace_params *tp;
2883 
2884 		tp = (const struct trace_params *)&t->sip;
2885 		if (t->config_tx)
2886 			t3_config_trace_filter(sc, tp, 0, t->invert_match,
2887 					       t->trace_tx);
2888 		if (t->config_rx)
2889 			t3_config_trace_filter(sc, tp, 1, t->invert_match,
2890 					       t->trace_rx);
2891 		break;
2892 	}
2893 	case CHELSIO_SET_PKTSCHED: {
2894 		struct ch_pktsched_params *p = (struct ch_pktsched_params *)data;
2895 		if (sc->open_device_map == 0)
2896 			return (EAGAIN);
2897 		send_pktsched_cmd(sc, p->sched, p->idx, p->min, p->max,
2898 		    p->binding);
2899 		break;
2900 	}
2901 	case CHELSIO_IFCONF_GETREGS: {
2902 		struct ch_ifconf_regs *regs = (struct ch_ifconf_regs *)data;
2903 		int reglen = cxgb_get_regs_len();
2904 		uint8_t *buf = malloc(reglen, M_DEVBUF, M_NOWAIT);
2905 		if (buf == NULL) {
2906 			return (ENOMEM);
2907 		}
2908 		if (regs->len > reglen)
2909 			regs->len = reglen;
2910 		else if (regs->len < reglen)
2911 			error = ENOBUFS;
2912 
2913 		if (!error) {
2914 			cxgb_get_regs(sc, regs, buf);
2915 			error = copyout(buf, regs->data, reglen);
2916 		}
2917 		free(buf, M_DEVBUF);
2918 
2919 		break;
2920 	}
2921 	case CHELSIO_SET_HW_SCHED: {
2922 		struct ch_hw_sched *t = (struct ch_hw_sched *)data;
2923 		unsigned int ticks_per_usec = core_ticks_per_usec(sc);
2924 
2925 		if ((sc->flags & FULL_INIT_DONE) == 0)
2926 			return (EAGAIN);       /* need TP to be initialized */
2927 		if (t->sched >= NTX_SCHED || !in_range(t->mode, 0, 1) ||
2928 		    !in_range(t->channel, 0, 1) ||
2929 		    !in_range(t->kbps, 0, 10000000) ||
2930 		    !in_range(t->class_ipg, 0, 10000 * 65535 / ticks_per_usec) ||
2931 		    !in_range(t->flow_ipg, 0,
2932 			      dack_ticks_to_usec(sc, 0x7ff)))
2933 			return (EINVAL);
2934 
2935 		if (t->kbps >= 0) {
2936 			error = t3_config_sched(sc, t->kbps, t->sched);
2937 			if (error < 0)
2938 				return (-error);
2939 		}
2940 		if (t->class_ipg >= 0)
2941 			t3_set_sched_ipg(sc, t->sched, t->class_ipg);
2942 		if (t->flow_ipg >= 0) {
2943 			t->flow_ipg *= 1000;     /* us -> ns */
2944 			t3_set_pace_tbl(sc, &t->flow_ipg, t->sched, 1);
2945 		}
2946 		if (t->mode >= 0) {
2947 			int bit = 1 << (S_TX_MOD_TIMER_MODE + t->sched);
2948 
2949 			t3_set_reg_field(sc, A_TP_TX_MOD_QUEUE_REQ_MAP,
2950 					 bit, t->mode ? bit : 0);
2951 		}
2952 		if (t->channel >= 0)
2953 			t3_set_reg_field(sc, A_TP_TX_MOD_QUEUE_REQ_MAP,
2954 					 1 << t->sched, t->channel << t->sched);
2955 		break;
2956 	}
2957 	case CHELSIO_GET_EEPROM: {
2958 		int i;
2959 		struct ch_eeprom *e = (struct ch_eeprom *)data;
2960 		uint8_t *buf;
2961 
2962 		if (e->offset & 3 || e->offset >= EEPROMSIZE ||
2963 		    e->len > EEPROMSIZE || e->offset + e->len > EEPROMSIZE) {
2964 			return (EINVAL);
2965 		}
2966 
2967 		buf = malloc(EEPROMSIZE, M_DEVBUF, M_NOWAIT);
2968 		if (buf == NULL) {
2969 			return (ENOMEM);
2970 		}
2971 		e->magic = EEPROM_MAGIC;
2972 		for (i = e->offset & ~3; !error && i < e->offset + e->len; i += 4)
2973 			error = -t3_seeprom_read(sc, i, (uint32_t *)&buf[i]);
2974 
2975 		if (!error)
2976 			error = copyout(buf + e->offset, e->data, e->len);
2977 
2978 		free(buf, M_DEVBUF);
2979 		break;
2980 	}
2981 	case CHELSIO_CLEAR_STATS: {
2982 		if (!(sc->flags & FULL_INIT_DONE))
2983 			return EAGAIN;
2984 
2985 		PORT_LOCK(pi);
2986 		t3_mac_update_stats(&pi->mac);
2987 		memset(&pi->mac.stats, 0, sizeof(pi->mac.stats));
2988 		PORT_UNLOCK(pi);
2989 		break;
2990 	}
2991 	case CHELSIO_GET_UP_LA: {
2992 		struct ch_up_la *la = (struct ch_up_la *)data;
2993 		uint8_t *buf = malloc(LA_BUFSIZE, M_DEVBUF, M_NOWAIT);
2994 		if (buf == NULL) {
2995 			return (ENOMEM);
2996 		}
2997 		if (la->bufsize < LA_BUFSIZE)
2998 			error = ENOBUFS;
2999 
3000 		if (!error)
3001 			error = -t3_get_up_la(sc, &la->stopped, &la->idx,
3002 					      &la->bufsize, buf);
3003 		if (!error)
3004 			error = copyout(buf, la->data, la->bufsize);
3005 
3006 		free(buf, M_DEVBUF);
3007 		break;
3008 	}
3009 	case CHELSIO_GET_UP_IOQS: {
3010 		struct ch_up_ioqs *ioqs = (struct ch_up_ioqs *)data;
3011 		uint8_t *buf = malloc(IOQS_BUFSIZE, M_DEVBUF, M_NOWAIT);
3012 		uint32_t *v;
3013 
3014 		if (buf == NULL) {
3015 			return (ENOMEM);
3016 		}
3017 		if (ioqs->bufsize < IOQS_BUFSIZE)
3018 			error = ENOBUFS;
3019 
3020 		if (!error)
3021 			error = -t3_get_up_ioqs(sc, &ioqs->bufsize, buf);
3022 
3023 		if (!error) {
3024 			v = (uint32_t *)buf;
3025 
3026 			ioqs->ioq_rx_enable = *v++;
3027 			ioqs->ioq_tx_enable = *v++;
3028 			ioqs->ioq_rx_status = *v++;
3029 			ioqs->ioq_tx_status = *v++;
3030 
3031 			error = copyout(v, ioqs->data, ioqs->bufsize);
3032 		}
3033 
3034 		free(buf, M_DEVBUF);
3035 		break;
3036 	}
3037 	case CHELSIO_SET_FILTER: {
3038 		struct ch_filter *f = (struct ch_filter *)data;
3039 		struct filter_info *p;
3040 		unsigned int nfilters = sc->params.mc5.nfilters;
3041 
3042 		if (!is_offload(sc))
3043 			return (EOPNOTSUPP);	/* No TCAM */
3044 		if (!(sc->flags & FULL_INIT_DONE))
3045 			return (EAGAIN);	/* mc5 not setup yet */
3046 		if (nfilters == 0)
3047 			return (EBUSY);		/* TOE will use TCAM */
3048 
3049 		/* sanity checks */
3050 		if (f->filter_id >= nfilters ||
3051 		    (f->val.dip && f->mask.dip != 0xffffffff) ||
3052 		    (f->val.sport && f->mask.sport != 0xffff) ||
3053 		    (f->val.dport && f->mask.dport != 0xffff) ||
3054 		    (f->val.vlan && f->mask.vlan != 0xfff) ||
3055 		    (f->val.vlan_prio &&
3056 			f->mask.vlan_prio != FILTER_NO_VLAN_PRI) ||
3057 		    (f->mac_addr_idx != 0xffff && f->mac_addr_idx > 15) ||
3058 		    f->qset >= SGE_QSETS ||
3059 		    sc->rrss_map[f->qset] >= RSS_TABLE_SIZE)
3060 			return (EINVAL);
3061 
3062 		/* Was allocated with M_WAITOK */
3063 		KASSERT(sc->filters, ("filter table NULL\n"));
3064 
3065 		p = &sc->filters[f->filter_id];
3066 		if (p->locked)
3067 			return (EPERM);
3068 
3069 		bzero(p, sizeof(*p));
3070 		p->sip = f->val.sip;
3071 		p->sip_mask = f->mask.sip;
3072 		p->dip = f->val.dip;
3073 		p->sport = f->val.sport;
3074 		p->dport = f->val.dport;
3075 		p->vlan = f->mask.vlan ? f->val.vlan : 0xfff;
3076 		p->vlan_prio = f->mask.vlan_prio ? (f->val.vlan_prio & 6) :
3077 		    FILTER_NO_VLAN_PRI;
3078 		p->mac_hit = f->mac_hit;
3079 		p->mac_vld = f->mac_addr_idx != 0xffff;
3080 		p->mac_idx = f->mac_addr_idx;
3081 		p->pkt_type = f->proto;
3082 		p->report_filter_id = f->want_filter_id;
3083 		p->pass = f->pass;
3084 		p->rss = f->rss;
3085 		p->qset = f->qset;
3086 
3087 		error = set_filter(sc, f->filter_id, p);
3088 		if (error == 0)
3089 			p->valid = 1;
3090 		break;
3091 	}
3092 	case CHELSIO_DEL_FILTER: {
3093 		struct ch_filter *f = (struct ch_filter *)data;
3094 		struct filter_info *p;
3095 		unsigned int nfilters = sc->params.mc5.nfilters;
3096 
3097 		if (!is_offload(sc))
3098 			return (EOPNOTSUPP);
3099 		if (!(sc->flags & FULL_INIT_DONE))
3100 			return (EAGAIN);
3101 		if (nfilters == 0 || sc->filters == NULL)
3102 			return (EINVAL);
3103 		if (f->filter_id >= nfilters)
3104 		       return (EINVAL);
3105 
3106 		p = &sc->filters[f->filter_id];
3107 		if (p->locked)
3108 			return (EPERM);
3109 		if (!p->valid)
3110 			return (EFAULT); /* Read "Bad address" as "Bad index" */
3111 
3112 		bzero(p, sizeof(*p));
3113 		p->sip = p->sip_mask = 0xffffffff;
3114 		p->vlan = 0xfff;
3115 		p->vlan_prio = FILTER_NO_VLAN_PRI;
3116 		p->pkt_type = 1;
3117 		error = set_filter(sc, f->filter_id, p);
3118 		break;
3119 	}
3120 	case CHELSIO_GET_FILTER: {
3121 		struct ch_filter *f = (struct ch_filter *)data;
3122 		struct filter_info *p;
3123 		unsigned int i, nfilters = sc->params.mc5.nfilters;
3124 
3125 		if (!is_offload(sc))
3126 			return (EOPNOTSUPP);
3127 		if (!(sc->flags & FULL_INIT_DONE))
3128 			return (EAGAIN);
3129 		if (nfilters == 0 || sc->filters == NULL)
3130 			return (EINVAL);
3131 
3132 		i = f->filter_id == 0xffffffff ? 0 : f->filter_id + 1;
3133 		for (; i < nfilters; i++) {
3134 			p = &sc->filters[i];
3135 			if (!p->valid)
3136 				continue;
3137 
3138 			bzero(f, sizeof(*f));
3139 
3140 			f->filter_id = i;
3141 			f->val.sip = p->sip;
3142 			f->mask.sip = p->sip_mask;
3143 			f->val.dip = p->dip;
3144 			f->mask.dip = p->dip ? 0xffffffff : 0;
3145 			f->val.sport = p->sport;
3146 			f->mask.sport = p->sport ? 0xffff : 0;
3147 			f->val.dport = p->dport;
3148 			f->mask.dport = p->dport ? 0xffff : 0;
3149 			f->val.vlan = p->vlan == 0xfff ? 0 : p->vlan;
3150 			f->mask.vlan = p->vlan == 0xfff ? 0 : 0xfff;
3151 			f->val.vlan_prio = p->vlan_prio == FILTER_NO_VLAN_PRI ?
3152 			    0 : p->vlan_prio;
3153 			f->mask.vlan_prio = p->vlan_prio == FILTER_NO_VLAN_PRI ?
3154 			    0 : FILTER_NO_VLAN_PRI;
3155 			f->mac_hit = p->mac_hit;
3156 			f->mac_addr_idx = p->mac_vld ? p->mac_idx : 0xffff;
3157 			f->proto = p->pkt_type;
3158 			f->want_filter_id = p->report_filter_id;
3159 			f->pass = p->pass;
3160 			f->rss = p->rss;
3161 			f->qset = p->qset;
3162 
3163 			break;
3164 		}
3165 
3166 		if (i == nfilters)
3167 			f->filter_id = 0xffffffff;
3168 		break;
3169 	}
3170 	default:
3171 		return (EOPNOTSUPP);
3172 		break;
3173 	}
3174 
3175 	return (error);
3176 }
3177 
3178 static __inline void
3179 reg_block_dump(struct adapter *ap, uint8_t *buf, unsigned int start,
3180     unsigned int end)
3181 {
3182 	uint32_t *p = (uint32_t *)(buf + start);
3183 
3184 	for ( ; start <= end; start += sizeof(uint32_t))
3185 		*p++ = t3_read_reg(ap, start);
3186 }
3187 
3188 #define T3_REGMAP_SIZE (3 * 1024)
3189 static int
3190 cxgb_get_regs_len(void)
3191 {
3192 	return T3_REGMAP_SIZE;
3193 }
3194 
3195 static void
3196 cxgb_get_regs(adapter_t *sc, struct ch_ifconf_regs *regs, uint8_t *buf)
3197 {
3198 
3199 	/*
3200 	 * Version scheme:
3201 	 * bits 0..9: chip version
3202 	 * bits 10..15: chip revision
3203 	 * bit 31: set for PCIe cards
3204 	 */
3205 	regs->version = 3 | (sc->params.rev << 10) | (is_pcie(sc) << 31);
3206 
3207 	/*
3208 	 * We skip the MAC statistics registers because they are clear-on-read.
3209 	 * Also reading multi-register stats would need to synchronize with the
3210 	 * periodic mac stats accumulation.  Hard to justify the complexity.
3211 	 */
3212 	memset(buf, 0, cxgb_get_regs_len());
3213 	reg_block_dump(sc, buf, 0, A_SG_RSPQ_CREDIT_RETURN);
3214 	reg_block_dump(sc, buf, A_SG_HI_DRB_HI_THRSH, A_ULPRX_PBL_ULIMIT);
3215 	reg_block_dump(sc, buf, A_ULPTX_CONFIG, A_MPS_INT_CAUSE);
3216 	reg_block_dump(sc, buf, A_CPL_SWITCH_CNTRL, A_CPL_MAP_TBL_DATA);
3217 	reg_block_dump(sc, buf, A_SMB_GLOBAL_TIME_CFG, A_XGM_SERDES_STAT3);
3218 	reg_block_dump(sc, buf, A_XGM_SERDES_STATUS0,
3219 		       XGM_REG(A_XGM_SERDES_STAT3, 1));
3220 	reg_block_dump(sc, buf, XGM_REG(A_XGM_SERDES_STATUS0, 1),
3221 		       XGM_REG(A_XGM_RX_SPI4_SOP_EOP_CNT, 1));
3222 }
3223 
3224 static int
3225 alloc_filters(struct adapter *sc)
3226 {
3227 	struct filter_info *p;
3228 	unsigned int nfilters = sc->params.mc5.nfilters;
3229 
3230 	if (nfilters == 0)
3231 		return (0);
3232 
3233 	p = malloc(sizeof(*p) * nfilters, M_DEVBUF, M_WAITOK | M_ZERO);
3234 	sc->filters = p;
3235 
3236 	p = &sc->filters[nfilters - 1];
3237 	p->vlan = 0xfff;
3238 	p->vlan_prio = FILTER_NO_VLAN_PRI;
3239 	p->pass = p->rss = p->valid = p->locked = 1;
3240 
3241 	return (0);
3242 }
3243 
3244 static int
3245 setup_hw_filters(struct adapter *sc)
3246 {
3247 	int i, rc;
3248 	unsigned int nfilters = sc->params.mc5.nfilters;
3249 
3250 	if (!sc->filters)
3251 		return (0);
3252 
3253 	t3_enable_filters(sc);
3254 
3255 	for (i = rc = 0; i < nfilters && !rc; i++) {
3256 		if (sc->filters[i].locked)
3257 			rc = set_filter(sc, i, &sc->filters[i]);
3258 	}
3259 
3260 	return (rc);
3261 }
3262 
3263 static int
3264 set_filter(struct adapter *sc, int id, const struct filter_info *f)
3265 {
3266 	int len;
3267 	struct mbuf *m;
3268 	struct ulp_txpkt *txpkt;
3269 	struct work_request_hdr *wr;
3270 	struct cpl_pass_open_req *oreq;
3271 	struct cpl_set_tcb_field *sreq;
3272 
3273 	len = sizeof(*wr) + sizeof(*oreq) + 2 * sizeof(*sreq);
3274 	KASSERT(len <= MHLEN, ("filter request too big for an mbuf"));
3275 
3276 	id += t3_mc5_size(&sc->mc5) - sc->params.mc5.nroutes -
3277 	      sc->params.mc5.nfilters;
3278 
3279 	m = m_gethdr(M_WAITOK, MT_DATA);
3280 	m->m_len = m->m_pkthdr.len = len;
3281 	bzero(mtod(m, char *), len);
3282 
3283 	wr = mtod(m, struct work_request_hdr *);
3284 	wr->wrh_hi = htonl(V_WR_OP(FW_WROPCODE_BYPASS) | F_WR_ATOMIC);
3285 
3286 	oreq = (struct cpl_pass_open_req *)(wr + 1);
3287 	txpkt = (struct ulp_txpkt *)oreq;
3288 	txpkt->cmd_dest = htonl(V_ULPTX_CMD(ULP_TXPKT));
3289 	txpkt->len = htonl(V_ULPTX_NFLITS(sizeof(*oreq) / 8));
3290 	OPCODE_TID(oreq) = htonl(MK_OPCODE_TID(CPL_PASS_OPEN_REQ, id));
3291 	oreq->local_port = htons(f->dport);
3292 	oreq->peer_port = htons(f->sport);
3293 	oreq->local_ip = htonl(f->dip);
3294 	oreq->peer_ip = htonl(f->sip);
3295 	oreq->peer_netmask = htonl(f->sip_mask);
3296 	oreq->opt0h = 0;
3297 	oreq->opt0l = htonl(F_NO_OFFLOAD);
3298 	oreq->opt1 = htonl(V_MAC_MATCH_VALID(f->mac_vld) |
3299 			 V_CONN_POLICY(CPL_CONN_POLICY_FILTER) |
3300 			 V_VLAN_PRI(f->vlan_prio >> 1) |
3301 			 V_VLAN_PRI_VALID(f->vlan_prio != FILTER_NO_VLAN_PRI) |
3302 			 V_PKT_TYPE(f->pkt_type) | V_OPT1_VLAN(f->vlan) |
3303 			 V_MAC_MATCH(f->mac_idx | (f->mac_hit << 4)));
3304 
3305 	sreq = (struct cpl_set_tcb_field *)(oreq + 1);
3306 	set_tcb_field_ulp(sreq, id, 1, 0x1800808000ULL,
3307 			  (f->report_filter_id << 15) | (1 << 23) |
3308 			  ((u64)f->pass << 35) | ((u64)!f->rss << 36));
3309 	set_tcb_field_ulp(sreq + 1, id, 0, 0xffffffff, (2 << 19) | 1);
3310 	t3_mgmt_tx(sc, m);
3311 
3312 	if (f->pass && !f->rss) {
3313 		len = sizeof(*sreq);
3314 		m = m_gethdr(M_WAITOK, MT_DATA);
3315 		m->m_len = m->m_pkthdr.len = len;
3316 		bzero(mtod(m, char *), len);
3317 		sreq = mtod(m, struct cpl_set_tcb_field *);
3318 		sreq->wr.wrh_hi = htonl(V_WR_OP(FW_WROPCODE_FORWARD));
3319 		mk_set_tcb_field(sreq, id, 25, 0x3f80000,
3320 				 (u64)sc->rrss_map[f->qset] << 19);
3321 		t3_mgmt_tx(sc, m);
3322 	}
3323 	return 0;
3324 }
3325 
3326 static inline void
3327 mk_set_tcb_field(struct cpl_set_tcb_field *req, unsigned int tid,
3328     unsigned int word, u64 mask, u64 val)
3329 {
3330 	OPCODE_TID(req) = htonl(MK_OPCODE_TID(CPL_SET_TCB_FIELD, tid));
3331 	req->reply = V_NO_REPLY(1);
3332 	req->cpu_idx = 0;
3333 	req->word = htons(word);
3334 	req->mask = htobe64(mask);
3335 	req->val = htobe64(val);
3336 }
3337 
3338 static inline void
3339 set_tcb_field_ulp(struct cpl_set_tcb_field *req, unsigned int tid,
3340     unsigned int word, u64 mask, u64 val)
3341 {
3342 	struct ulp_txpkt *txpkt = (struct ulp_txpkt *)req;
3343 
3344 	txpkt->cmd_dest = htonl(V_ULPTX_CMD(ULP_TXPKT));
3345 	txpkt->len = htonl(V_ULPTX_NFLITS(sizeof(*req) / 8));
3346 	mk_set_tcb_field(req, tid, word, mask, val);
3347 }
3348 
3349 void
3350 t3_iterate(void (*func)(struct adapter *, void *), void *arg)
3351 {
3352 	struct adapter *sc;
3353 
3354 	mtx_lock(&t3_list_lock);
3355 	SLIST_FOREACH(sc, &t3_list, link) {
3356 		/*
3357 		 * func should not make any assumptions about what state sc is
3358 		 * in - the only guarantee is that sc->sc_lock is a valid lock.
3359 		 */
3360 		func(sc, arg);
3361 	}
3362 	mtx_unlock(&t3_list_lock);
3363 }
3364 
3365 #ifdef TCP_OFFLOAD
3366 static int
3367 toe_capability(struct port_info *pi, int enable)
3368 {
3369 	int rc;
3370 	struct adapter *sc = pi->adapter;
3371 
3372 	ADAPTER_LOCK_ASSERT_OWNED(sc);
3373 
3374 	if (!is_offload(sc))
3375 		return (ENODEV);
3376 
3377 	if (enable) {
3378 		if (!(sc->flags & FULL_INIT_DONE)) {
3379 			log(LOG_WARNING,
3380 			    "You must enable a cxgb interface first\n");
3381 			return (EAGAIN);
3382 		}
3383 
3384 		if (isset(&sc->offload_map, pi->port_id))
3385 			return (0);
3386 
3387 		if (!(sc->flags & TOM_INIT_DONE)) {
3388 			rc = t3_activate_uld(sc, ULD_TOM);
3389 			if (rc == EAGAIN) {
3390 				log(LOG_WARNING,
3391 				    "You must kldload t3_tom.ko before trying "
3392 				    "to enable TOE on a cxgb interface.\n");
3393 			}
3394 			if (rc != 0)
3395 				return (rc);
3396 			KASSERT(sc->tom_softc != NULL,
3397 			    ("%s: TOM activated but softc NULL", __func__));
3398 			KASSERT(sc->flags & TOM_INIT_DONE,
3399 			    ("%s: TOM activated but flag not set", __func__));
3400 		}
3401 
3402 		setbit(&sc->offload_map, pi->port_id);
3403 
3404 		/*
3405 		 * XXX: Temporary code to allow iWARP to be enabled when TOE is
3406 		 * enabled on any port.  Need to figure out how to enable,
3407 		 * disable, load, and unload iWARP cleanly.
3408 		 */
3409 		if (!isset(&sc->offload_map, MAX_NPORTS) &&
3410 		    t3_activate_uld(sc, ULD_IWARP) == 0)
3411 			setbit(&sc->offload_map, MAX_NPORTS);
3412 	} else {
3413 		if (!isset(&sc->offload_map, pi->port_id))
3414 			return (0);
3415 
3416 		KASSERT(sc->flags & TOM_INIT_DONE,
3417 		    ("%s: TOM never initialized?", __func__));
3418 		clrbit(&sc->offload_map, pi->port_id);
3419 	}
3420 
3421 	return (0);
3422 }
3423 
3424 /*
3425  * Add an upper layer driver to the global list.
3426  */
3427 int
3428 t3_register_uld(struct uld_info *ui)
3429 {
3430 	int rc = 0;
3431 	struct uld_info *u;
3432 
3433 	mtx_lock(&t3_uld_list_lock);
3434 	SLIST_FOREACH(u, &t3_uld_list, link) {
3435 	    if (u->uld_id == ui->uld_id) {
3436 		    rc = EEXIST;
3437 		    goto done;
3438 	    }
3439 	}
3440 
3441 	SLIST_INSERT_HEAD(&t3_uld_list, ui, link);
3442 	ui->refcount = 0;
3443 done:
3444 	mtx_unlock(&t3_uld_list_lock);
3445 	return (rc);
3446 }
3447 
3448 int
3449 t3_unregister_uld(struct uld_info *ui)
3450 {
3451 	int rc = EINVAL;
3452 	struct uld_info *u;
3453 
3454 	mtx_lock(&t3_uld_list_lock);
3455 
3456 	SLIST_FOREACH(u, &t3_uld_list, link) {
3457 	    if (u == ui) {
3458 		    if (ui->refcount > 0) {
3459 			    rc = EBUSY;
3460 			    goto done;
3461 		    }
3462 
3463 		    SLIST_REMOVE(&t3_uld_list, ui, uld_info, link);
3464 		    rc = 0;
3465 		    goto done;
3466 	    }
3467 	}
3468 done:
3469 	mtx_unlock(&t3_uld_list_lock);
3470 	return (rc);
3471 }
3472 
3473 int
3474 t3_activate_uld(struct adapter *sc, int id)
3475 {
3476 	int rc = EAGAIN;
3477 	struct uld_info *ui;
3478 
3479 	mtx_lock(&t3_uld_list_lock);
3480 
3481 	SLIST_FOREACH(ui, &t3_uld_list, link) {
3482 		if (ui->uld_id == id) {
3483 			rc = ui->activate(sc);
3484 			if (rc == 0)
3485 				ui->refcount++;
3486 			goto done;
3487 		}
3488 	}
3489 done:
3490 	mtx_unlock(&t3_uld_list_lock);
3491 
3492 	return (rc);
3493 }
3494 
3495 int
3496 t3_deactivate_uld(struct adapter *sc, int id)
3497 {
3498 	int rc = EINVAL;
3499 	struct uld_info *ui;
3500 
3501 	mtx_lock(&t3_uld_list_lock);
3502 
3503 	SLIST_FOREACH(ui, &t3_uld_list, link) {
3504 		if (ui->uld_id == id) {
3505 			rc = ui->deactivate(sc);
3506 			if (rc == 0)
3507 				ui->refcount--;
3508 			goto done;
3509 		}
3510 	}
3511 done:
3512 	mtx_unlock(&t3_uld_list_lock);
3513 
3514 	return (rc);
3515 }
3516 
3517 static int
3518 cpl_not_handled(struct sge_qset *qs __unused, struct rsp_desc *r __unused,
3519     struct mbuf *m)
3520 {
3521 	m_freem(m);
3522 	return (EDOOFUS);
3523 }
3524 
3525 int
3526 t3_register_cpl_handler(struct adapter *sc, int opcode, cpl_handler_t h)
3527 {
3528 	uintptr_t *loc, new;
3529 
3530 	if (opcode >= NUM_CPL_HANDLERS)
3531 		return (EINVAL);
3532 
3533 	new = h ? (uintptr_t)h : (uintptr_t)cpl_not_handled;
3534 	loc = (uintptr_t *) &sc->cpl_handler[opcode];
3535 	atomic_store_rel_ptr(loc, new);
3536 
3537 	return (0);
3538 }
3539 #endif
3540 
3541 static int
3542 cxgbc_mod_event(module_t mod, int cmd, void *arg)
3543 {
3544 	int rc = 0;
3545 
3546 	switch (cmd) {
3547 	case MOD_LOAD:
3548 		mtx_init(&t3_list_lock, "T3 adapters", 0, MTX_DEF);
3549 		SLIST_INIT(&t3_list);
3550 #ifdef TCP_OFFLOAD
3551 		mtx_init(&t3_uld_list_lock, "T3 ULDs", 0, MTX_DEF);
3552 		SLIST_INIT(&t3_uld_list);
3553 #endif
3554 		break;
3555 
3556 	case MOD_UNLOAD:
3557 #ifdef TCP_OFFLOAD
3558 		mtx_lock(&t3_uld_list_lock);
3559 		if (!SLIST_EMPTY(&t3_uld_list)) {
3560 			rc = EBUSY;
3561 			mtx_unlock(&t3_uld_list_lock);
3562 			break;
3563 		}
3564 		mtx_unlock(&t3_uld_list_lock);
3565 		mtx_destroy(&t3_uld_list_lock);
3566 #endif
3567 		mtx_lock(&t3_list_lock);
3568 		if (!SLIST_EMPTY(&t3_list)) {
3569 			rc = EBUSY;
3570 			mtx_unlock(&t3_list_lock);
3571 			break;
3572 		}
3573 		mtx_unlock(&t3_list_lock);
3574 		mtx_destroy(&t3_list_lock);
3575 		break;
3576 	}
3577 
3578 	return (rc);
3579 }
3580 
3581 #ifdef DEBUGNET
3582 static void
3583 cxgb_debugnet_init(if_t ifp, int *nrxr, int *ncl, int *clsize)
3584 {
3585 	struct port_info *pi;
3586 	adapter_t *adap;
3587 
3588 	pi = if_getsoftc(ifp);
3589 	adap = pi->adapter;
3590 	ADAPTER_LOCK(adap);
3591 	*nrxr = adap->nqsets;
3592 	*ncl = adap->sge.qs[0].fl[1].size;
3593 	*clsize = adap->sge.qs[0].fl[1].buf_size;
3594 	ADAPTER_UNLOCK(adap);
3595 }
3596 
3597 static void
3598 cxgb_debugnet_event(if_t ifp, enum debugnet_ev event)
3599 {
3600 	struct port_info *pi;
3601 	struct sge_qset *qs;
3602 	int i;
3603 
3604 	pi = if_getsoftc(ifp);
3605 	if (event == DEBUGNET_START)
3606 		for (i = 0; i < pi->adapter->nqsets; i++) {
3607 			qs = &pi->adapter->sge.qs[i];
3608 
3609 			/* Need to reinit after debugnet_mbuf_start(). */
3610 			qs->fl[0].zone = zone_pack;
3611 			qs->fl[1].zone = zone_clust;
3612 			qs->lro.enabled = 0;
3613 		}
3614 }
3615 
3616 static int
3617 cxgb_debugnet_transmit(if_t ifp, struct mbuf *m)
3618 {
3619 	struct port_info *pi;
3620 	struct sge_qset *qs;
3621 
3622 	pi = if_getsoftc(ifp);
3623 	if ((if_getdrvflags(ifp) & (IFF_DRV_RUNNING | IFF_DRV_OACTIVE)) !=
3624 	    IFF_DRV_RUNNING)
3625 		return (ENOENT);
3626 
3627 	qs = &pi->adapter->sge.qs[pi->first_qset];
3628 	return (cxgb_debugnet_encap(qs, &m));
3629 }
3630 
3631 static int
3632 cxgb_debugnet_poll(if_t ifp, int count)
3633 {
3634 	struct port_info *pi;
3635 	adapter_t *adap;
3636 	int i;
3637 
3638 	pi = if_getsoftc(ifp);
3639 	if ((if_getdrvflags(ifp) & IFF_DRV_RUNNING) == 0)
3640 		return (ENOENT);
3641 
3642 	adap = pi->adapter;
3643 	for (i = 0; i < adap->nqsets; i++)
3644 		(void)cxgb_debugnet_poll_rx(adap, &adap->sge.qs[i]);
3645 	(void)cxgb_debugnet_poll_tx(&adap->sge.qs[pi->first_qset]);
3646 	return (0);
3647 }
3648 #endif /* DEBUGNET */
3649