xref: /titanic_52/usr/src/uts/common/io/ixgbe/ixgbe_main.c (revision 9ab815e1e50104cb1004a5ccca7a6da582994b57)
1 /*
2  * CDDL HEADER START
3  *
4  * The contents of this file are subject to the terms of the
5  * Common Development and Distribution License (the "License").
6  * You may not use this file except in compliance with the License.
7  *
8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9  * or http://www.opensolaris.org/os/licensing.
10  * See the License for the specific language governing permissions
11  * and limitations under the License.
12  *
13  * When distributing Covered Code, include this CDDL HEADER in each
14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15  * If applicable, add the following below this CDDL HEADER, with the
16  * fields enclosed by brackets "[]" replaced with your own identifying
17  * information: Portions Copyright [yyyy] [name of copyright owner]
18  *
19  * CDDL HEADER END
20  */
21 
22 /*
23  * Copyright(c) 2007-2010 Intel Corporation. All rights reserved.
24  */
25 
26 /*
27  * Copyright (c) 2008, 2010, Oracle and/or its affiliates. All rights reserved.
28  */
29 
30 #include "ixgbe_sw.h"
31 
32 static char ixgbe_ident[] = "Intel 10Gb Ethernet";
33 static char ixgbe_version[] = "ixgbe 1.1.7";
34 
35 /*
36  * Local function protoypes
37  */
38 static int ixgbe_register_mac(ixgbe_t *);
39 static int ixgbe_identify_hardware(ixgbe_t *);
40 static int ixgbe_regs_map(ixgbe_t *);
41 static void ixgbe_init_properties(ixgbe_t *);
42 static int ixgbe_init_driver_settings(ixgbe_t *);
43 static void ixgbe_init_locks(ixgbe_t *);
44 static void ixgbe_destroy_locks(ixgbe_t *);
45 static int ixgbe_init(ixgbe_t *);
46 static int ixgbe_chip_start(ixgbe_t *);
47 static void ixgbe_chip_stop(ixgbe_t *);
48 static int ixgbe_reset(ixgbe_t *);
49 static void ixgbe_tx_clean(ixgbe_t *);
50 static boolean_t ixgbe_tx_drain(ixgbe_t *);
51 static boolean_t ixgbe_rx_drain(ixgbe_t *);
52 static int ixgbe_alloc_rings(ixgbe_t *);
53 static void ixgbe_free_rings(ixgbe_t *);
54 static int ixgbe_alloc_rx_data(ixgbe_t *);
55 static void ixgbe_free_rx_data(ixgbe_t *);
56 static void ixgbe_setup_rings(ixgbe_t *);
57 static void ixgbe_setup_rx(ixgbe_t *);
58 static void ixgbe_setup_tx(ixgbe_t *);
59 static void ixgbe_setup_rx_ring(ixgbe_rx_ring_t *);
60 static void ixgbe_setup_tx_ring(ixgbe_tx_ring_t *);
61 static void ixgbe_setup_rss(ixgbe_t *);
62 static void ixgbe_setup_vmdq(ixgbe_t *);
63 static void ixgbe_setup_vmdq_rss(ixgbe_t *);
64 static void ixgbe_init_unicst(ixgbe_t *);
65 static int ixgbe_unicst_find(ixgbe_t *, const uint8_t *);
66 static void ixgbe_setup_multicst(ixgbe_t *);
67 static void ixgbe_get_hw_state(ixgbe_t *);
68 static void ixgbe_setup_vmdq_rss_conf(ixgbe_t *ixgbe);
69 static void ixgbe_get_conf(ixgbe_t *);
70 static void ixgbe_init_params(ixgbe_t *);
71 static int ixgbe_get_prop(ixgbe_t *, char *, int, int, int);
72 static void ixgbe_driver_link_check(ixgbe_t *);
73 static void ixgbe_sfp_check(void *);
74 static void ixgbe_overtemp_check(void *);
75 static void ixgbe_link_timer(void *);
76 static void ixgbe_local_timer(void *);
77 static void ixgbe_arm_watchdog_timer(ixgbe_t *);
78 static void ixgbe_restart_watchdog_timer(ixgbe_t *);
79 static void ixgbe_disable_adapter_interrupts(ixgbe_t *);
80 static void ixgbe_enable_adapter_interrupts(ixgbe_t *);
81 static boolean_t is_valid_mac_addr(uint8_t *);
82 static boolean_t ixgbe_stall_check(ixgbe_t *);
83 static boolean_t ixgbe_set_loopback_mode(ixgbe_t *, uint32_t);
84 static void ixgbe_set_internal_mac_loopback(ixgbe_t *);
85 static boolean_t ixgbe_find_mac_address(ixgbe_t *);
86 static int ixgbe_alloc_intrs(ixgbe_t *);
87 static int ixgbe_alloc_intr_handles(ixgbe_t *, int);
88 static int ixgbe_add_intr_handlers(ixgbe_t *);
89 static void ixgbe_map_rxring_to_vector(ixgbe_t *, int, int);
90 static void ixgbe_map_txring_to_vector(ixgbe_t *, int, int);
91 static void ixgbe_setup_ivar(ixgbe_t *, uint16_t, uint8_t, int8_t);
92 static void ixgbe_enable_ivar(ixgbe_t *, uint16_t, int8_t);
93 static void ixgbe_disable_ivar(ixgbe_t *, uint16_t, int8_t);
94 static uint32_t ixgbe_get_hw_rx_index(ixgbe_t *ixgbe, uint32_t sw_rx_index);
95 static int ixgbe_map_intrs_to_vectors(ixgbe_t *);
96 static void ixgbe_setup_adapter_vector(ixgbe_t *);
97 static void ixgbe_rem_intr_handlers(ixgbe_t *);
98 static void ixgbe_rem_intrs(ixgbe_t *);
99 static int ixgbe_enable_intrs(ixgbe_t *);
100 static int ixgbe_disable_intrs(ixgbe_t *);
101 static uint_t ixgbe_intr_legacy(void *, void *);
102 static uint_t ixgbe_intr_msi(void *, void *);
103 static uint_t ixgbe_intr_msix(void *, void *);
104 static void ixgbe_intr_rx_work(ixgbe_rx_ring_t *);
105 static void ixgbe_intr_tx_work(ixgbe_tx_ring_t *);
106 static void ixgbe_intr_other_work(ixgbe_t *, uint32_t);
107 static void ixgbe_get_driver_control(struct ixgbe_hw *);
108 static int ixgbe_addmac(void *, const uint8_t *);
109 static int ixgbe_remmac(void *, const uint8_t *);
110 static void ixgbe_release_driver_control(struct ixgbe_hw *);
111 
112 static int ixgbe_attach(dev_info_t *, ddi_attach_cmd_t);
113 static int ixgbe_detach(dev_info_t *, ddi_detach_cmd_t);
114 static int ixgbe_resume(dev_info_t *);
115 static int ixgbe_suspend(dev_info_t *);
116 static void ixgbe_unconfigure(dev_info_t *, ixgbe_t *);
117 static uint8_t *ixgbe_mc_table_itr(struct ixgbe_hw *, uint8_t **, uint32_t *);
118 static int ixgbe_cbfunc(dev_info_t *, ddi_cb_action_t, void *, void *, void *);
119 static int ixgbe_intr_cb_register(ixgbe_t *);
120 static int ixgbe_intr_adjust(ixgbe_t *, ddi_cb_action_t, int);
121 
122 static int ixgbe_fm_error_cb(dev_info_t *dip, ddi_fm_error_t *err,
123     const void *impl_data);
124 static void ixgbe_fm_init(ixgbe_t *);
125 static void ixgbe_fm_fini(ixgbe_t *);
126 
127 char *ixgbe_priv_props[] = {
128 	"_tx_copy_thresh",
129 	"_tx_recycle_thresh",
130 	"_tx_overload_thresh",
131 	"_tx_resched_thresh",
132 	"_rx_copy_thresh",
133 	"_rx_limit_per_intr",
134 	"_intr_throttling",
135 	"_adv_pause_cap",
136 	"_adv_asym_pause_cap",
137 	NULL
138 };
139 
140 #define	IXGBE_MAX_PRIV_PROPS \
141 	(sizeof (ixgbe_priv_props) / sizeof (mac_priv_prop_t))
142 
143 static struct cb_ops ixgbe_cb_ops = {
144 	nulldev,		/* cb_open */
145 	nulldev,		/* cb_close */
146 	nodev,			/* cb_strategy */
147 	nodev,			/* cb_print */
148 	nodev,			/* cb_dump */
149 	nodev,			/* cb_read */
150 	nodev,			/* cb_write */
151 	nodev,			/* cb_ioctl */
152 	nodev,			/* cb_devmap */
153 	nodev,			/* cb_mmap */
154 	nodev,			/* cb_segmap */
155 	nochpoll,		/* cb_chpoll */
156 	ddi_prop_op,		/* cb_prop_op */
157 	NULL,			/* cb_stream */
158 	D_MP | D_HOTPLUG,	/* cb_flag */
159 	CB_REV,			/* cb_rev */
160 	nodev,			/* cb_aread */
161 	nodev			/* cb_awrite */
162 };
163 
164 static struct dev_ops ixgbe_dev_ops = {
165 	DEVO_REV,		/* devo_rev */
166 	0,			/* devo_refcnt */
167 	NULL,			/* devo_getinfo */
168 	nulldev,		/* devo_identify */
169 	nulldev,		/* devo_probe */
170 	ixgbe_attach,		/* devo_attach */
171 	ixgbe_detach,		/* devo_detach */
172 	nodev,			/* devo_reset */
173 	&ixgbe_cb_ops,		/* devo_cb_ops */
174 	NULL,			/* devo_bus_ops */
175 	ddi_power,		/* devo_power */
176 	ddi_quiesce_not_supported,	/* devo_quiesce */
177 };
178 
179 static struct modldrv ixgbe_modldrv = {
180 	&mod_driverops,		/* Type of module.  This one is a driver */
181 	ixgbe_ident,		/* Discription string */
182 	&ixgbe_dev_ops		/* driver ops */
183 };
184 
185 static struct modlinkage ixgbe_modlinkage = {
186 	MODREV_1, &ixgbe_modldrv, NULL
187 };
188 
189 /*
190  * Access attributes for register mapping
191  */
192 ddi_device_acc_attr_t ixgbe_regs_acc_attr = {
193 	DDI_DEVICE_ATTR_V1,
194 	DDI_STRUCTURE_LE_ACC,
195 	DDI_STRICTORDER_ACC,
196 	DDI_FLAGERR_ACC
197 };
198 
199 /*
200  * Loopback property
201  */
202 static lb_property_t lb_normal = {
203 	normal,	"normal", IXGBE_LB_NONE
204 };
205 
206 static lb_property_t lb_mac = {
207 	internal, "MAC", IXGBE_LB_INTERNAL_MAC
208 };
209 
210 static lb_property_t lb_external = {
211 	external, "External", IXGBE_LB_EXTERNAL
212 };
213 
214 #define	IXGBE_M_CALLBACK_FLAGS \
215 	(MC_IOCTL | MC_GETCAPAB | MC_SETPROP | MC_GETPROP | MC_PROPINFO)
216 
217 static mac_callbacks_t ixgbe_m_callbacks = {
218 	IXGBE_M_CALLBACK_FLAGS,
219 	ixgbe_m_stat,
220 	ixgbe_m_start,
221 	ixgbe_m_stop,
222 	ixgbe_m_promisc,
223 	ixgbe_m_multicst,
224 	NULL,
225 	NULL,
226 	NULL,
227 	ixgbe_m_ioctl,
228 	ixgbe_m_getcapab,
229 	NULL,
230 	NULL,
231 	ixgbe_m_setprop,
232 	ixgbe_m_getprop,
233 	ixgbe_m_propinfo
234 };
235 
236 /*
237  * Initialize capabilities of each supported adapter type
238  */
239 static adapter_info_t ixgbe_82598eb_cap = {
240 	64,		/* maximum number of rx queues */
241 	1,		/* minimum number of rx queues */
242 	64,		/* default number of rx queues */
243 	16,		/* maximum number of rx groups */
244 	1,		/* minimum number of rx groups */
245 	1,		/* default number of rx groups */
246 	32,		/* maximum number of tx queues */
247 	1,		/* minimum number of tx queues */
248 	8,		/* default number of tx queues */
249 	16366,		/* maximum MTU size */
250 	0xFFFF,		/* maximum interrupt throttle rate */
251 	0,		/* minimum interrupt throttle rate */
252 	200,		/* default interrupt throttle rate */
253 	18,		/* maximum total msix vectors */
254 	16,		/* maximum number of ring vectors */
255 	2,		/* maximum number of other vectors */
256 	IXGBE_EICR_LSC,	/* "other" interrupt types handled */
257 	0,		/* "other" interrupt types enable mask */
258 	(IXGBE_FLAG_DCA_CAPABLE	/* capability flags */
259 	| IXGBE_FLAG_RSS_CAPABLE
260 	| IXGBE_FLAG_VMDQ_CAPABLE)
261 };
262 
263 static adapter_info_t ixgbe_82599eb_cap = {
264 	128,		/* maximum number of rx queues */
265 	1,		/* minimum number of rx queues */
266 	128,		/* default number of rx queues */
267 	64,		/* maximum number of rx groups */
268 	1,		/* minimum number of rx groups */
269 	1,		/* default number of rx groups */
270 	128,		/* maximum number of tx queues */
271 	1,		/* minimum number of tx queues */
272 	8,		/* default number of tx queues */
273 	15500,		/* maximum MTU size */
274 	0xFF8,		/* maximum interrupt throttle rate */
275 	0,		/* minimum interrupt throttle rate */
276 	200,		/* default interrupt throttle rate */
277 	64,		/* maximum total msix vectors */
278 	16,		/* maximum number of ring vectors */
279 	2,		/* maximum number of other vectors */
280 	(IXGBE_EICR_LSC
281 	| IXGBE_EICR_GPI_SDP1
282 	| IXGBE_EICR_GPI_SDP2), /* "other" interrupt types handled */
283 
284 	(IXGBE_SDP1_GPIEN
285 	| IXGBE_SDP2_GPIEN), /* "other" interrupt types enable mask */
286 
287 	(IXGBE_FLAG_DCA_CAPABLE
288 	| IXGBE_FLAG_RSS_CAPABLE
289 	| IXGBE_FLAG_VMDQ_CAPABLE
290 	| IXGBE_FLAG_RSC_CAPABLE
291 	| IXGBE_FLAG_SFP_PLUG_CAPABLE) /* capability flags */
292 };
293 
294 /*
295  * Module Initialization Functions.
296  */
297 
298 int
299 _init(void)
300 {
301 	int status;
302 
303 	mac_init_ops(&ixgbe_dev_ops, MODULE_NAME);
304 
305 	status = mod_install(&ixgbe_modlinkage);
306 
307 	if (status != DDI_SUCCESS) {
308 		mac_fini_ops(&ixgbe_dev_ops);
309 	}
310 
311 	return (status);
312 }
313 
314 int
315 _fini(void)
316 {
317 	int status;
318 
319 	status = mod_remove(&ixgbe_modlinkage);
320 
321 	if (status == DDI_SUCCESS) {
322 		mac_fini_ops(&ixgbe_dev_ops);
323 	}
324 
325 	return (status);
326 }
327 
328 int
329 _info(struct modinfo *modinfop)
330 {
331 	int status;
332 
333 	status = mod_info(&ixgbe_modlinkage, modinfop);
334 
335 	return (status);
336 }
337 
338 /*
339  * ixgbe_attach - Driver attach.
340  *
341  * This function is the device specific initialization entry
342  * point. This entry point is required and must be written.
343  * The DDI_ATTACH command must be provided in the attach entry
344  * point. When attach() is called with cmd set to DDI_ATTACH,
345  * all normal kernel services (such as kmem_alloc(9F)) are
346  * available for use by the driver.
347  *
348  * The attach() function will be called once for each instance
349  * of  the  device  on  the  system with cmd set to DDI_ATTACH.
350  * Until attach() succeeds, the only driver entry points which
351  * may be called are open(9E) and getinfo(9E).
352  */
353 static int
354 ixgbe_attach(dev_info_t *devinfo, ddi_attach_cmd_t cmd)
355 {
356 	ixgbe_t *ixgbe;
357 	struct ixgbe_osdep *osdep;
358 	struct ixgbe_hw *hw;
359 	int instance;
360 	char taskqname[32];
361 
362 	/*
363 	 * Check the command and perform corresponding operations
364 	 */
365 	switch (cmd) {
366 	default:
367 		return (DDI_FAILURE);
368 
369 	case DDI_RESUME:
370 		return (ixgbe_resume(devinfo));
371 
372 	case DDI_ATTACH:
373 		break;
374 	}
375 
376 	/* Get the device instance */
377 	instance = ddi_get_instance(devinfo);
378 
379 	/* Allocate memory for the instance data structure */
380 	ixgbe = kmem_zalloc(sizeof (ixgbe_t), KM_SLEEP);
381 
382 	ixgbe->dip = devinfo;
383 	ixgbe->instance = instance;
384 
385 	hw = &ixgbe->hw;
386 	osdep = &ixgbe->osdep;
387 	hw->back = osdep;
388 	osdep->ixgbe = ixgbe;
389 
390 	/* Attach the instance pointer to the dev_info data structure */
391 	ddi_set_driver_private(devinfo, ixgbe);
392 
393 	/*
394 	 * Initialize for fma support
395 	 */
396 	ixgbe->fm_capabilities = ixgbe_get_prop(ixgbe, PROP_FM_CAPABLE,
397 	    0, 0x0f, DDI_FM_EREPORT_CAPABLE | DDI_FM_ACCCHK_CAPABLE |
398 	    DDI_FM_DMACHK_CAPABLE | DDI_FM_ERRCB_CAPABLE);
399 	ixgbe_fm_init(ixgbe);
400 	ixgbe->attach_progress |= ATTACH_PROGRESS_FM_INIT;
401 
402 	/*
403 	 * Map PCI config space registers
404 	 */
405 	if (pci_config_setup(devinfo, &osdep->cfg_handle) != DDI_SUCCESS) {
406 		ixgbe_error(ixgbe, "Failed to map PCI configurations");
407 		goto attach_fail;
408 	}
409 	ixgbe->attach_progress |= ATTACH_PROGRESS_PCI_CONFIG;
410 
411 	/*
412 	 * Identify the chipset family
413 	 */
414 	if (ixgbe_identify_hardware(ixgbe) != IXGBE_SUCCESS) {
415 		ixgbe_error(ixgbe, "Failed to identify hardware");
416 		goto attach_fail;
417 	}
418 
419 	/*
420 	 * Map device registers
421 	 */
422 	if (ixgbe_regs_map(ixgbe) != IXGBE_SUCCESS) {
423 		ixgbe_error(ixgbe, "Failed to map device registers");
424 		goto attach_fail;
425 	}
426 	ixgbe->attach_progress |= ATTACH_PROGRESS_REGS_MAP;
427 
428 	/*
429 	 * Initialize driver parameters
430 	 */
431 	ixgbe_init_properties(ixgbe);
432 	ixgbe->attach_progress |= ATTACH_PROGRESS_PROPS;
433 
434 	/*
435 	 * Register interrupt callback
436 	 */
437 	if (ixgbe_intr_cb_register(ixgbe) != IXGBE_SUCCESS) {
438 		ixgbe_error(ixgbe, "Failed to register interrupt callback");
439 		goto attach_fail;
440 	}
441 
442 	/*
443 	 * Allocate interrupts
444 	 */
445 	if (ixgbe_alloc_intrs(ixgbe) != IXGBE_SUCCESS) {
446 		ixgbe_error(ixgbe, "Failed to allocate interrupts");
447 		goto attach_fail;
448 	}
449 	ixgbe->attach_progress |= ATTACH_PROGRESS_ALLOC_INTR;
450 
451 	/*
452 	 * Allocate rx/tx rings based on the ring numbers.
453 	 * The actual numbers of rx/tx rings are decided by the number of
454 	 * allocated interrupt vectors, so we should allocate the rings after
455 	 * interrupts are allocated.
456 	 */
457 	if (ixgbe_alloc_rings(ixgbe) != IXGBE_SUCCESS) {
458 		ixgbe_error(ixgbe, "Failed to allocate rx and tx rings");
459 		goto attach_fail;
460 	}
461 	ixgbe->attach_progress |= ATTACH_PROGRESS_ALLOC_RINGS;
462 
463 	/*
464 	 * Map rings to interrupt vectors
465 	 */
466 	if (ixgbe_map_intrs_to_vectors(ixgbe) != IXGBE_SUCCESS) {
467 		ixgbe_error(ixgbe, "Failed to map interrupts to vectors");
468 		goto attach_fail;
469 	}
470 
471 	/*
472 	 * Add interrupt handlers
473 	 */
474 	if (ixgbe_add_intr_handlers(ixgbe) != IXGBE_SUCCESS) {
475 		ixgbe_error(ixgbe, "Failed to add interrupt handlers");
476 		goto attach_fail;
477 	}
478 	ixgbe->attach_progress |= ATTACH_PROGRESS_ADD_INTR;
479 
480 	/*
481 	 * Create a taskq for sfp-change
482 	 */
483 	(void) sprintf(taskqname, "ixgbe%d_sfp_taskq", instance);
484 	if ((ixgbe->sfp_taskq = ddi_taskq_create(devinfo, taskqname,
485 	    1, TASKQ_DEFAULTPRI, 0)) == NULL) {
486 		ixgbe_error(ixgbe, "sfp_taskq create failed");
487 		goto attach_fail;
488 	}
489 	ixgbe->attach_progress |= ATTACH_PROGRESS_SFP_TASKQ;
490 
491 	/*
492 	 * Create a taskq for over-temp
493 	 */
494 	(void) sprintf(taskqname, "ixgbe%d_overtemp_taskq", instance);
495 	if ((ixgbe->overtemp_taskq = ddi_taskq_create(devinfo, taskqname,
496 	    1, TASKQ_DEFAULTPRI, 0)) == NULL) {
497 		ixgbe_error(ixgbe, "overtemp_taskq create failed");
498 		goto attach_fail;
499 	}
500 	ixgbe->attach_progress |= ATTACH_PROGRESS_OVERTEMP_TASKQ;
501 
502 	/*
503 	 * Initialize driver parameters
504 	 */
505 	if (ixgbe_init_driver_settings(ixgbe) != IXGBE_SUCCESS) {
506 		ixgbe_error(ixgbe, "Failed to initialize driver settings");
507 		goto attach_fail;
508 	}
509 
510 	/*
511 	 * Initialize mutexes for this device.
512 	 * Do this before enabling the interrupt handler and
513 	 * register the softint to avoid the condition where
514 	 * interrupt handler can try using uninitialized mutex.
515 	 */
516 	ixgbe_init_locks(ixgbe);
517 	ixgbe->attach_progress |= ATTACH_PROGRESS_LOCKS;
518 
519 	/*
520 	 * Initialize chipset hardware
521 	 */
522 	if (ixgbe_init(ixgbe) != IXGBE_SUCCESS) {
523 		ixgbe_error(ixgbe, "Failed to initialize adapter");
524 		goto attach_fail;
525 	}
526 	ixgbe->link_check_complete = B_FALSE;
527 	ixgbe->link_check_hrtime = gethrtime() +
528 	    (IXGBE_LINK_UP_TIME * 100000000ULL);
529 	ixgbe->attach_progress |= ATTACH_PROGRESS_INIT;
530 
531 	if (ixgbe_check_acc_handle(ixgbe->osdep.cfg_handle) != DDI_FM_OK) {
532 		ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_LOST);
533 		goto attach_fail;
534 	}
535 
536 	/*
537 	 * Initialize statistics
538 	 */
539 	if (ixgbe_init_stats(ixgbe) != IXGBE_SUCCESS) {
540 		ixgbe_error(ixgbe, "Failed to initialize statistics");
541 		goto attach_fail;
542 	}
543 	ixgbe->attach_progress |= ATTACH_PROGRESS_STATS;
544 
545 	/*
546 	 * Register the driver to the MAC
547 	 */
548 	if (ixgbe_register_mac(ixgbe) != IXGBE_SUCCESS) {
549 		ixgbe_error(ixgbe, "Failed to register MAC");
550 		goto attach_fail;
551 	}
552 	mac_link_update(ixgbe->mac_hdl, LINK_STATE_UNKNOWN);
553 	ixgbe->attach_progress |= ATTACH_PROGRESS_MAC;
554 
555 	ixgbe->periodic_id = ddi_periodic_add(ixgbe_link_timer, ixgbe,
556 	    IXGBE_CYCLIC_PERIOD, DDI_IPL_0);
557 	if (ixgbe->periodic_id == 0) {
558 		ixgbe_error(ixgbe, "Failed to add the link check timer");
559 		goto attach_fail;
560 	}
561 	ixgbe->attach_progress |= ATTACH_PROGRESS_LINK_TIMER;
562 
563 	/*
564 	 * Now that mutex locks are initialized, and the chip is also
565 	 * initialized, enable interrupts.
566 	 */
567 	if (ixgbe_enable_intrs(ixgbe) != IXGBE_SUCCESS) {
568 		ixgbe_error(ixgbe, "Failed to enable DDI interrupts");
569 		goto attach_fail;
570 	}
571 	ixgbe->attach_progress |= ATTACH_PROGRESS_ENABLE_INTR;
572 
573 	ixgbe_log(ixgbe, "%s, %s", ixgbe_ident, ixgbe_version);
574 	atomic_or_32(&ixgbe->ixgbe_state, IXGBE_INITIALIZED);
575 
576 	return (DDI_SUCCESS);
577 
578 attach_fail:
579 	ixgbe_unconfigure(devinfo, ixgbe);
580 	return (DDI_FAILURE);
581 }
582 
583 /*
584  * ixgbe_detach - Driver detach.
585  *
586  * The detach() function is the complement of the attach routine.
587  * If cmd is set to DDI_DETACH, detach() is used to remove  the
588  * state  associated  with  a  given  instance of a device node
589  * prior to the removal of that instance from the system.
590  *
591  * The detach() function will be called once for each  instance
592  * of the device for which there has been a successful attach()
593  * once there are no longer  any  opens  on  the  device.
594  *
595  * Interrupts routine are disabled, All memory allocated by this
596  * driver are freed.
597  */
598 static int
599 ixgbe_detach(dev_info_t *devinfo, ddi_detach_cmd_t cmd)
600 {
601 	ixgbe_t *ixgbe;
602 
603 	/*
604 	 * Check detach command
605 	 */
606 	switch (cmd) {
607 	default:
608 		return (DDI_FAILURE);
609 
610 	case DDI_SUSPEND:
611 		return (ixgbe_suspend(devinfo));
612 
613 	case DDI_DETACH:
614 		break;
615 	}
616 
617 	/*
618 	 * Get the pointer to the driver private data structure
619 	 */
620 	ixgbe = (ixgbe_t *)ddi_get_driver_private(devinfo);
621 	if (ixgbe == NULL)
622 		return (DDI_FAILURE);
623 
624 	/*
625 	 * If the device is still running, it needs to be stopped first.
626 	 * This check is necessary because under some specific circumstances,
627 	 * the detach routine can be called without stopping the interface
628 	 * first.
629 	 */
630 	if (ixgbe->ixgbe_state & IXGBE_STARTED) {
631 		atomic_and_32(&ixgbe->ixgbe_state, ~IXGBE_STARTED);
632 		mutex_enter(&ixgbe->gen_lock);
633 		ixgbe_stop(ixgbe, B_TRUE);
634 		mutex_exit(&ixgbe->gen_lock);
635 		/* Disable and stop the watchdog timer */
636 		ixgbe_disable_watchdog_timer(ixgbe);
637 	}
638 
639 	/*
640 	 * Check if there are still rx buffers held by the upper layer.
641 	 * If so, fail the detach.
642 	 */
643 	if (!ixgbe_rx_drain(ixgbe))
644 		return (DDI_FAILURE);
645 
646 	/*
647 	 * Do the remaining unconfigure routines
648 	 */
649 	ixgbe_unconfigure(devinfo, ixgbe);
650 
651 	return (DDI_SUCCESS);
652 }
653 
654 static void
655 ixgbe_unconfigure(dev_info_t *devinfo, ixgbe_t *ixgbe)
656 {
657 	/*
658 	 * Disable interrupt
659 	 */
660 	if (ixgbe->attach_progress & ATTACH_PROGRESS_ENABLE_INTR) {
661 		(void) ixgbe_disable_intrs(ixgbe);
662 	}
663 
664 	/*
665 	 * remove the link check timer
666 	 */
667 	if (ixgbe->attach_progress & ATTACH_PROGRESS_LINK_TIMER) {
668 		if (ixgbe->periodic_id != NULL) {
669 			ddi_periodic_delete(ixgbe->periodic_id);
670 			ixgbe->periodic_id = NULL;
671 		}
672 	}
673 
674 	/*
675 	 * Unregister MAC
676 	 */
677 	if (ixgbe->attach_progress & ATTACH_PROGRESS_MAC) {
678 		(void) mac_unregister(ixgbe->mac_hdl);
679 	}
680 
681 	/*
682 	 * Free statistics
683 	 */
684 	if (ixgbe->attach_progress & ATTACH_PROGRESS_STATS) {
685 		kstat_delete((kstat_t *)ixgbe->ixgbe_ks);
686 	}
687 
688 	/*
689 	 * Remove interrupt handlers
690 	 */
691 	if (ixgbe->attach_progress & ATTACH_PROGRESS_ADD_INTR) {
692 		ixgbe_rem_intr_handlers(ixgbe);
693 	}
694 
695 	/*
696 	 * Remove taskq for sfp-status-change
697 	 */
698 	if (ixgbe->attach_progress & ATTACH_PROGRESS_SFP_TASKQ) {
699 		ddi_taskq_destroy(ixgbe->sfp_taskq);
700 	}
701 
702 	/*
703 	 * Remove taskq for over-temp
704 	 */
705 	if (ixgbe->attach_progress & ATTACH_PROGRESS_OVERTEMP_TASKQ) {
706 		ddi_taskq_destroy(ixgbe->overtemp_taskq);
707 	}
708 
709 	/*
710 	 * Remove interrupts
711 	 */
712 	if (ixgbe->attach_progress & ATTACH_PROGRESS_ALLOC_INTR) {
713 		ixgbe_rem_intrs(ixgbe);
714 	}
715 
716 	/*
717 	 * Unregister interrupt callback handler
718 	 */
719 	(void) ddi_cb_unregister(ixgbe->cb_hdl);
720 
721 	/*
722 	 * Remove driver properties
723 	 */
724 	if (ixgbe->attach_progress & ATTACH_PROGRESS_PROPS) {
725 		(void) ddi_prop_remove_all(devinfo);
726 	}
727 
728 	/*
729 	 * Stop the chipset
730 	 */
731 	if (ixgbe->attach_progress & ATTACH_PROGRESS_INIT) {
732 		mutex_enter(&ixgbe->gen_lock);
733 		ixgbe_chip_stop(ixgbe);
734 		mutex_exit(&ixgbe->gen_lock);
735 	}
736 
737 	/*
738 	 * Free register handle
739 	 */
740 	if (ixgbe->attach_progress & ATTACH_PROGRESS_REGS_MAP) {
741 		if (ixgbe->osdep.reg_handle != NULL)
742 			ddi_regs_map_free(&ixgbe->osdep.reg_handle);
743 	}
744 
745 	/*
746 	 * Free PCI config handle
747 	 */
748 	if (ixgbe->attach_progress & ATTACH_PROGRESS_PCI_CONFIG) {
749 		if (ixgbe->osdep.cfg_handle != NULL)
750 			pci_config_teardown(&ixgbe->osdep.cfg_handle);
751 	}
752 
753 	/*
754 	 * Free locks
755 	 */
756 	if (ixgbe->attach_progress & ATTACH_PROGRESS_LOCKS) {
757 		ixgbe_destroy_locks(ixgbe);
758 	}
759 
760 	/*
761 	 * Free the rx/tx rings
762 	 */
763 	if (ixgbe->attach_progress & ATTACH_PROGRESS_ALLOC_RINGS) {
764 		ixgbe_free_rings(ixgbe);
765 	}
766 
767 	/*
768 	 * Unregister FMA capabilities
769 	 */
770 	if (ixgbe->attach_progress & ATTACH_PROGRESS_FM_INIT) {
771 		ixgbe_fm_fini(ixgbe);
772 	}
773 
774 	/*
775 	 * Free the driver data structure
776 	 */
777 	kmem_free(ixgbe, sizeof (ixgbe_t));
778 
779 	ddi_set_driver_private(devinfo, NULL);
780 }
781 
782 /*
783  * ixgbe_register_mac - Register the driver and its function pointers with
784  * the GLD interface.
785  */
786 static int
787 ixgbe_register_mac(ixgbe_t *ixgbe)
788 {
789 	struct ixgbe_hw *hw = &ixgbe->hw;
790 	mac_register_t *mac;
791 	int status;
792 
793 	if ((mac = mac_alloc(MAC_VERSION)) == NULL)
794 		return (IXGBE_FAILURE);
795 
796 	mac->m_type_ident = MAC_PLUGIN_IDENT_ETHER;
797 	mac->m_driver = ixgbe;
798 	mac->m_dip = ixgbe->dip;
799 	mac->m_src_addr = hw->mac.addr;
800 	mac->m_callbacks = &ixgbe_m_callbacks;
801 	mac->m_min_sdu = 0;
802 	mac->m_max_sdu = ixgbe->default_mtu;
803 	mac->m_margin = VLAN_TAGSZ;
804 	mac->m_priv_props = ixgbe_priv_props;
805 	mac->m_v12n = MAC_VIRT_LEVEL1;
806 
807 	status = mac_register(mac, &ixgbe->mac_hdl);
808 
809 	mac_free(mac);
810 
811 	return ((status == 0) ? IXGBE_SUCCESS : IXGBE_FAILURE);
812 }
813 
814 /*
815  * ixgbe_identify_hardware - Identify the type of the chipset.
816  */
817 static int
818 ixgbe_identify_hardware(ixgbe_t *ixgbe)
819 {
820 	struct ixgbe_hw *hw = &ixgbe->hw;
821 	struct ixgbe_osdep *osdep = &ixgbe->osdep;
822 
823 	/*
824 	 * Get the device id
825 	 */
826 	hw->vendor_id =
827 	    pci_config_get16(osdep->cfg_handle, PCI_CONF_VENID);
828 	hw->device_id =
829 	    pci_config_get16(osdep->cfg_handle, PCI_CONF_DEVID);
830 	hw->revision_id =
831 	    pci_config_get8(osdep->cfg_handle, PCI_CONF_REVID);
832 	hw->subsystem_device_id =
833 	    pci_config_get16(osdep->cfg_handle, PCI_CONF_SUBSYSID);
834 	hw->subsystem_vendor_id =
835 	    pci_config_get16(osdep->cfg_handle, PCI_CONF_SUBVENID);
836 
837 	/*
838 	 * Set the mac type of the adapter based on the device id
839 	 */
840 	if (ixgbe_set_mac_type(hw) != IXGBE_SUCCESS) {
841 		return (IXGBE_FAILURE);
842 	}
843 
844 	/*
845 	 * Install adapter capabilities
846 	 */
847 	switch (hw->mac.type) {
848 	case ixgbe_mac_82598EB:
849 		IXGBE_DEBUGLOG_0(ixgbe, "identify 82598 adapter\n");
850 		ixgbe->capab = &ixgbe_82598eb_cap;
851 
852 		if (ixgbe_get_media_type(hw) == ixgbe_media_type_copper) {
853 			ixgbe->capab->flags |= IXGBE_FLAG_FAN_FAIL_CAPABLE;
854 			ixgbe->capab->other_intr |= IXGBE_EICR_GPI_SDP1;
855 			ixgbe->capab->other_gpie |= IXGBE_SDP1_GPIEN;
856 		}
857 		break;
858 
859 	case ixgbe_mac_82599EB:
860 		IXGBE_DEBUGLOG_0(ixgbe, "identify 82599 adapter\n");
861 		ixgbe->capab = &ixgbe_82599eb_cap;
862 
863 		if (hw->device_id == IXGBE_DEV_ID_82599_T3_LOM) {
864 			ixgbe->capab->flags |= IXGBE_FLAG_TEMP_SENSOR_CAPABLE;
865 			ixgbe->capab->other_intr |= IXGBE_EICR_GPI_SDP0;
866 			ixgbe->capab->other_gpie |= IXGBE_SDP0_GPIEN;
867 		}
868 		break;
869 
870 	default:
871 		IXGBE_DEBUGLOG_1(ixgbe,
872 		    "adapter not supported in ixgbe_identify_hardware(): %d\n",
873 		    hw->mac.type);
874 		return (IXGBE_FAILURE);
875 	}
876 
877 	return (IXGBE_SUCCESS);
878 }
879 
880 /*
881  * ixgbe_regs_map - Map the device registers.
882  *
883  */
884 static int
885 ixgbe_regs_map(ixgbe_t *ixgbe)
886 {
887 	dev_info_t *devinfo = ixgbe->dip;
888 	struct ixgbe_hw *hw = &ixgbe->hw;
889 	struct ixgbe_osdep *osdep = &ixgbe->osdep;
890 	off_t mem_size;
891 
892 	/*
893 	 * First get the size of device registers to be mapped.
894 	 */
895 	if (ddi_dev_regsize(devinfo, IXGBE_ADAPTER_REGSET, &mem_size)
896 	    != DDI_SUCCESS) {
897 		return (IXGBE_FAILURE);
898 	}
899 
900 	/*
901 	 * Call ddi_regs_map_setup() to map registers
902 	 */
903 	if ((ddi_regs_map_setup(devinfo, IXGBE_ADAPTER_REGSET,
904 	    (caddr_t *)&hw->hw_addr, 0,
905 	    mem_size, &ixgbe_regs_acc_attr,
906 	    &osdep->reg_handle)) != DDI_SUCCESS) {
907 		return (IXGBE_FAILURE);
908 	}
909 
910 	return (IXGBE_SUCCESS);
911 }
912 
913 /*
914  * ixgbe_init_properties - Initialize driver properties.
915  */
916 static void
917 ixgbe_init_properties(ixgbe_t *ixgbe)
918 {
919 	/*
920 	 * Get conf file properties, including link settings
921 	 * jumbo frames, ring number, descriptor number, etc.
922 	 */
923 	ixgbe_get_conf(ixgbe);
924 
925 	ixgbe_init_params(ixgbe);
926 }
927 
928 /*
929  * ixgbe_init_driver_settings - Initialize driver settings.
930  *
931  * The settings include hardware function pointers, bus information,
932  * rx/tx rings settings, link state, and any other parameters that
933  * need to be setup during driver initialization.
934  */
935 static int
936 ixgbe_init_driver_settings(ixgbe_t *ixgbe)
937 {
938 	struct ixgbe_hw *hw = &ixgbe->hw;
939 	dev_info_t *devinfo = ixgbe->dip;
940 	ixgbe_rx_ring_t *rx_ring;
941 	ixgbe_rx_group_t *rx_group;
942 	ixgbe_tx_ring_t *tx_ring;
943 	uint32_t rx_size;
944 	uint32_t tx_size;
945 	uint32_t ring_per_group;
946 	int i;
947 
948 	/*
949 	 * Initialize chipset specific hardware function pointers
950 	 */
951 	if (ixgbe_init_shared_code(hw) != IXGBE_SUCCESS) {
952 		return (IXGBE_FAILURE);
953 	}
954 
955 	/*
956 	 * Get the system page size
957 	 */
958 	ixgbe->sys_page_size = ddi_ptob(devinfo, (ulong_t)1);
959 
960 	/*
961 	 * Set rx buffer size
962 	 *
963 	 * The IP header alignment room is counted in the calculation.
964 	 * The rx buffer size is in unit of 1K that is required by the
965 	 * chipset hardware.
966 	 */
967 	rx_size = ixgbe->max_frame_size + IPHDR_ALIGN_ROOM;
968 	ixgbe->rx_buf_size = ((rx_size >> 10) +
969 	    ((rx_size & (((uint32_t)1 << 10) - 1)) > 0 ? 1 : 0)) << 10;
970 
971 	/*
972 	 * Set tx buffer size
973 	 */
974 	tx_size = ixgbe->max_frame_size;
975 	ixgbe->tx_buf_size = ((tx_size >> 10) +
976 	    ((tx_size & (((uint32_t)1 << 10) - 1)) > 0 ? 1 : 0)) << 10;
977 
978 	/*
979 	 * Initialize rx/tx rings/groups parameters
980 	 */
981 	ring_per_group = ixgbe->num_rx_rings / ixgbe->num_rx_groups;
982 	for (i = 0; i < ixgbe->num_rx_rings; i++) {
983 		rx_ring = &ixgbe->rx_rings[i];
984 		rx_ring->index = i;
985 		rx_ring->ixgbe = ixgbe;
986 		rx_ring->group_index = i / ring_per_group;
987 		rx_ring->hw_index = ixgbe_get_hw_rx_index(ixgbe, i);
988 	}
989 
990 	for (i = 0; i < ixgbe->num_rx_groups; i++) {
991 		rx_group = &ixgbe->rx_groups[i];
992 		rx_group->index = i;
993 		rx_group->ixgbe = ixgbe;
994 	}
995 
996 	for (i = 0; i < ixgbe->num_tx_rings; i++) {
997 		tx_ring = &ixgbe->tx_rings[i];
998 		tx_ring->index = i;
999 		tx_ring->ixgbe = ixgbe;
1000 		if (ixgbe->tx_head_wb_enable)
1001 			tx_ring->tx_recycle = ixgbe_tx_recycle_head_wb;
1002 		else
1003 			tx_ring->tx_recycle = ixgbe_tx_recycle_legacy;
1004 
1005 		tx_ring->ring_size = ixgbe->tx_ring_size;
1006 		tx_ring->free_list_size = ixgbe->tx_ring_size +
1007 		    (ixgbe->tx_ring_size >> 1);
1008 	}
1009 
1010 	/*
1011 	 * Initialize values of interrupt throttling rate
1012 	 */
1013 	for (i = 1; i < MAX_INTR_VECTOR; i++)
1014 		ixgbe->intr_throttling[i] = ixgbe->intr_throttling[0];
1015 
1016 	/*
1017 	 * The initial link state should be "unknown"
1018 	 */
1019 	ixgbe->link_state = LINK_STATE_UNKNOWN;
1020 
1021 	return (IXGBE_SUCCESS);
1022 }
1023 
1024 /*
1025  * ixgbe_init_locks - Initialize locks.
1026  */
1027 static void
1028 ixgbe_init_locks(ixgbe_t *ixgbe)
1029 {
1030 	ixgbe_rx_ring_t *rx_ring;
1031 	ixgbe_tx_ring_t *tx_ring;
1032 	int i;
1033 
1034 	for (i = 0; i < ixgbe->num_rx_rings; i++) {
1035 		rx_ring = &ixgbe->rx_rings[i];
1036 		mutex_init(&rx_ring->rx_lock, NULL,
1037 		    MUTEX_DRIVER, DDI_INTR_PRI(ixgbe->intr_pri));
1038 	}
1039 
1040 	for (i = 0; i < ixgbe->num_tx_rings; i++) {
1041 		tx_ring = &ixgbe->tx_rings[i];
1042 		mutex_init(&tx_ring->tx_lock, NULL,
1043 		    MUTEX_DRIVER, DDI_INTR_PRI(ixgbe->intr_pri));
1044 		mutex_init(&tx_ring->recycle_lock, NULL,
1045 		    MUTEX_DRIVER, DDI_INTR_PRI(ixgbe->intr_pri));
1046 		mutex_init(&tx_ring->tcb_head_lock, NULL,
1047 		    MUTEX_DRIVER, DDI_INTR_PRI(ixgbe->intr_pri));
1048 		mutex_init(&tx_ring->tcb_tail_lock, NULL,
1049 		    MUTEX_DRIVER, DDI_INTR_PRI(ixgbe->intr_pri));
1050 	}
1051 
1052 	mutex_init(&ixgbe->gen_lock, NULL,
1053 	    MUTEX_DRIVER, DDI_INTR_PRI(ixgbe->intr_pri));
1054 
1055 	mutex_init(&ixgbe->watchdog_lock, NULL,
1056 	    MUTEX_DRIVER, DDI_INTR_PRI(ixgbe->intr_pri));
1057 }
1058 
1059 /*
1060  * ixgbe_destroy_locks - Destroy locks.
1061  */
1062 static void
1063 ixgbe_destroy_locks(ixgbe_t *ixgbe)
1064 {
1065 	ixgbe_rx_ring_t *rx_ring;
1066 	ixgbe_tx_ring_t *tx_ring;
1067 	int i;
1068 
1069 	for (i = 0; i < ixgbe->num_rx_rings; i++) {
1070 		rx_ring = &ixgbe->rx_rings[i];
1071 		mutex_destroy(&rx_ring->rx_lock);
1072 	}
1073 
1074 	for (i = 0; i < ixgbe->num_tx_rings; i++) {
1075 		tx_ring = &ixgbe->tx_rings[i];
1076 		mutex_destroy(&tx_ring->tx_lock);
1077 		mutex_destroy(&tx_ring->recycle_lock);
1078 		mutex_destroy(&tx_ring->tcb_head_lock);
1079 		mutex_destroy(&tx_ring->tcb_tail_lock);
1080 	}
1081 
1082 	mutex_destroy(&ixgbe->gen_lock);
1083 	mutex_destroy(&ixgbe->watchdog_lock);
1084 }
1085 
1086 static int
1087 ixgbe_resume(dev_info_t *devinfo)
1088 {
1089 	ixgbe_t *ixgbe;
1090 	int i;
1091 
1092 	ixgbe = (ixgbe_t *)ddi_get_driver_private(devinfo);
1093 	if (ixgbe == NULL)
1094 		return (DDI_FAILURE);
1095 
1096 	mutex_enter(&ixgbe->gen_lock);
1097 
1098 	if (ixgbe->ixgbe_state & IXGBE_STARTED) {
1099 		if (ixgbe_start(ixgbe, B_FALSE) != IXGBE_SUCCESS) {
1100 			mutex_exit(&ixgbe->gen_lock);
1101 			return (DDI_FAILURE);
1102 		}
1103 
1104 		/*
1105 		 * Enable and start the watchdog timer
1106 		 */
1107 		ixgbe_enable_watchdog_timer(ixgbe);
1108 	}
1109 
1110 	atomic_and_32(&ixgbe->ixgbe_state, ~IXGBE_SUSPENDED);
1111 
1112 	if (ixgbe->ixgbe_state & IXGBE_STARTED) {
1113 		for (i = 0; i < ixgbe->num_tx_rings; i++) {
1114 			mac_tx_ring_update(ixgbe->mac_hdl,
1115 			    ixgbe->tx_rings[i].ring_handle);
1116 		}
1117 	}
1118 
1119 	mutex_exit(&ixgbe->gen_lock);
1120 
1121 	return (DDI_SUCCESS);
1122 }
1123 
1124 static int
1125 ixgbe_suspend(dev_info_t *devinfo)
1126 {
1127 	ixgbe_t *ixgbe;
1128 
1129 	ixgbe = (ixgbe_t *)ddi_get_driver_private(devinfo);
1130 	if (ixgbe == NULL)
1131 		return (DDI_FAILURE);
1132 
1133 	mutex_enter(&ixgbe->gen_lock);
1134 
1135 	atomic_or_32(&ixgbe->ixgbe_state, IXGBE_SUSPENDED);
1136 	if (!(ixgbe->ixgbe_state & IXGBE_STARTED)) {
1137 		mutex_exit(&ixgbe->gen_lock);
1138 		return (DDI_SUCCESS);
1139 	}
1140 	ixgbe_stop(ixgbe, B_FALSE);
1141 
1142 	mutex_exit(&ixgbe->gen_lock);
1143 
1144 	/*
1145 	 * Disable and stop the watchdog timer
1146 	 */
1147 	ixgbe_disable_watchdog_timer(ixgbe);
1148 
1149 	return (DDI_SUCCESS);
1150 }
1151 
1152 /*
1153  * ixgbe_init - Initialize the device.
1154  */
1155 static int
1156 ixgbe_init(ixgbe_t *ixgbe)
1157 {
1158 	struct ixgbe_hw *hw = &ixgbe->hw;
1159 
1160 	mutex_enter(&ixgbe->gen_lock);
1161 
1162 	/*
1163 	 * Reset chipset to put the hardware in a known state
1164 	 * before we try to do anything with the eeprom.
1165 	 */
1166 	if (ixgbe_reset_hw(hw) != IXGBE_SUCCESS) {
1167 		ixgbe_fm_ereport(ixgbe, DDI_FM_DEVICE_INVAL_STATE);
1168 		goto init_fail;
1169 	}
1170 
1171 	/*
1172 	 * Need to init eeprom before validating the checksum.
1173 	 */
1174 	if (ixgbe_init_eeprom_params(hw) < 0) {
1175 		ixgbe_error(ixgbe,
1176 		    "Unable to intitialize the eeprom interface.");
1177 		ixgbe_fm_ereport(ixgbe, DDI_FM_DEVICE_INVAL_STATE);
1178 		goto init_fail;
1179 	}
1180 
1181 	/*
1182 	 * NVM validation
1183 	 */
1184 	if (ixgbe_validate_eeprom_checksum(hw, NULL) < 0) {
1185 		/*
1186 		 * Some PCI-E parts fail the first check due to
1187 		 * the link being in sleep state.  Call it again,
1188 		 * if it fails a second time it's a real issue.
1189 		 */
1190 		if (ixgbe_validate_eeprom_checksum(hw, NULL) < 0) {
1191 			ixgbe_error(ixgbe,
1192 			    "Invalid NVM checksum. Please contact "
1193 			    "the vendor to update the NVM.");
1194 			ixgbe_fm_ereport(ixgbe, DDI_FM_DEVICE_INVAL_STATE);
1195 			goto init_fail;
1196 		}
1197 	}
1198 
1199 	/*
1200 	 * Setup default flow control thresholds - enable/disable
1201 	 * & flow control type is controlled by ixgbe.conf
1202 	 */
1203 	hw->fc.high_water = DEFAULT_FCRTH;
1204 	hw->fc.low_water = DEFAULT_FCRTL;
1205 	hw->fc.pause_time = DEFAULT_FCPAUSE;
1206 	hw->fc.send_xon = B_TRUE;
1207 
1208 	/*
1209 	 * Initialize link settings
1210 	 */
1211 	(void) ixgbe_driver_setup_link(ixgbe, B_FALSE);
1212 
1213 	/*
1214 	 * Initialize the chipset hardware
1215 	 */
1216 	if (ixgbe_chip_start(ixgbe) != IXGBE_SUCCESS) {
1217 		ixgbe_fm_ereport(ixgbe, DDI_FM_DEVICE_INVAL_STATE);
1218 		goto init_fail;
1219 	}
1220 
1221 	if (ixgbe_check_acc_handle(ixgbe->osdep.reg_handle) != DDI_FM_OK) {
1222 		goto init_fail;
1223 	}
1224 
1225 	mutex_exit(&ixgbe->gen_lock);
1226 	return (IXGBE_SUCCESS);
1227 
1228 init_fail:
1229 	/*
1230 	 * Reset PHY
1231 	 */
1232 	(void) ixgbe_reset_phy(hw);
1233 
1234 	mutex_exit(&ixgbe->gen_lock);
1235 	ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_LOST);
1236 	return (IXGBE_FAILURE);
1237 }
1238 
1239 /*
1240  * ixgbe_chip_start - Initialize and start the chipset hardware.
1241  */
1242 static int
1243 ixgbe_chip_start(ixgbe_t *ixgbe)
1244 {
1245 	struct ixgbe_hw *hw = &ixgbe->hw;
1246 	int ret_val, i;
1247 
1248 	ASSERT(mutex_owned(&ixgbe->gen_lock));
1249 
1250 	/*
1251 	 * Get the mac address
1252 	 * This function should handle SPARC case correctly.
1253 	 */
1254 	if (!ixgbe_find_mac_address(ixgbe)) {
1255 		ixgbe_error(ixgbe, "Failed to get the mac address");
1256 		return (IXGBE_FAILURE);
1257 	}
1258 
1259 	/*
1260 	 * Validate the mac address
1261 	 */
1262 	(void) ixgbe_init_rx_addrs(hw);
1263 	if (!is_valid_mac_addr(hw->mac.addr)) {
1264 		ixgbe_error(ixgbe, "Invalid mac address");
1265 		return (IXGBE_FAILURE);
1266 	}
1267 
1268 	/*
1269 	 * Configure/Initialize hardware
1270 	 */
1271 	ret_val = ixgbe_init_hw(hw);
1272 	if (ret_val != IXGBE_SUCCESS) {
1273 		if (ret_val == IXGBE_ERR_EEPROM_VERSION) {
1274 			ixgbe_error(ixgbe,
1275 			    "This 82599 device is pre-release and contains"
1276 			    " outdated firmware, please contact your hardware"
1277 			    " vendor for a replacement.");
1278 		} else {
1279 			ixgbe_error(ixgbe, "Failed to initialize hardware");
1280 			return (IXGBE_FAILURE);
1281 		}
1282 	}
1283 
1284 	/*
1285 	 * Re-enable relaxed ordering for performance.  It is disabled
1286 	 * by default in the hardware init.
1287 	 */
1288 	if (ixgbe->relax_order_enable == B_TRUE)
1289 		ixgbe_enable_relaxed_ordering(hw);
1290 
1291 	/*
1292 	 * Setup adapter interrupt vectors
1293 	 */
1294 	ixgbe_setup_adapter_vector(ixgbe);
1295 
1296 	/*
1297 	 * Initialize unicast addresses.
1298 	 */
1299 	ixgbe_init_unicst(ixgbe);
1300 
1301 	/*
1302 	 * Setup and initialize the mctable structures.
1303 	 */
1304 	ixgbe_setup_multicst(ixgbe);
1305 
1306 	/*
1307 	 * Set interrupt throttling rate
1308 	 */
1309 	for (i = 0; i < ixgbe->intr_cnt; i++) {
1310 		IXGBE_WRITE_REG(hw, IXGBE_EITR(i), ixgbe->intr_throttling[i]);
1311 	}
1312 
1313 	/*
1314 	 * Save the state of the phy
1315 	 */
1316 	ixgbe_get_hw_state(ixgbe);
1317 
1318 	/*
1319 	 * Make sure driver has control
1320 	 */
1321 	ixgbe_get_driver_control(hw);
1322 
1323 	return (IXGBE_SUCCESS);
1324 }
1325 
1326 /*
1327  * ixgbe_chip_stop - Stop the chipset hardware
1328  */
1329 static void
1330 ixgbe_chip_stop(ixgbe_t *ixgbe)
1331 {
1332 	struct ixgbe_hw *hw = &ixgbe->hw;
1333 
1334 	ASSERT(mutex_owned(&ixgbe->gen_lock));
1335 
1336 	/*
1337 	 * Tell firmware driver is no longer in control
1338 	 */
1339 	ixgbe_release_driver_control(hw);
1340 
1341 	/*
1342 	 * Reset the chipset
1343 	 */
1344 	(void) ixgbe_reset_hw(hw);
1345 
1346 	/*
1347 	 * Reset PHY
1348 	 */
1349 	(void) ixgbe_reset_phy(hw);
1350 }
1351 
1352 /*
1353  * ixgbe_reset - Reset the chipset and re-start the driver.
1354  *
1355  * It involves stopping and re-starting the chipset,
1356  * and re-configuring the rx/tx rings.
1357  */
1358 static int
1359 ixgbe_reset(ixgbe_t *ixgbe)
1360 {
1361 	int i;
1362 
1363 	/*
1364 	 * Disable and stop the watchdog timer
1365 	 */
1366 	ixgbe_disable_watchdog_timer(ixgbe);
1367 
1368 	mutex_enter(&ixgbe->gen_lock);
1369 
1370 	ASSERT(ixgbe->ixgbe_state & IXGBE_STARTED);
1371 	atomic_and_32(&ixgbe->ixgbe_state, ~IXGBE_STARTED);
1372 
1373 	ixgbe_stop(ixgbe, B_FALSE);
1374 
1375 	if (ixgbe_start(ixgbe, B_FALSE) != IXGBE_SUCCESS) {
1376 		mutex_exit(&ixgbe->gen_lock);
1377 		return (IXGBE_FAILURE);
1378 	}
1379 
1380 	/*
1381 	 * After resetting, need to recheck the link status.
1382 	 */
1383 	ixgbe->link_check_complete = B_FALSE;
1384 	ixgbe->link_check_hrtime = gethrtime() +
1385 	    (IXGBE_LINK_UP_TIME * 100000000ULL);
1386 
1387 	atomic_or_32(&ixgbe->ixgbe_state, IXGBE_STARTED);
1388 
1389 	if (!(ixgbe->ixgbe_state & IXGBE_SUSPENDED)) {
1390 		for (i = 0; i < ixgbe->num_tx_rings; i++) {
1391 			mac_tx_ring_update(ixgbe->mac_hdl,
1392 			    ixgbe->tx_rings[i].ring_handle);
1393 		}
1394 	}
1395 
1396 	mutex_exit(&ixgbe->gen_lock);
1397 
1398 	/*
1399 	 * Enable and start the watchdog timer
1400 	 */
1401 	ixgbe_enable_watchdog_timer(ixgbe);
1402 
1403 	return (IXGBE_SUCCESS);
1404 }
1405 
1406 /*
1407  * ixgbe_tx_clean - Clean the pending transmit packets and DMA resources.
1408  */
1409 static void
1410 ixgbe_tx_clean(ixgbe_t *ixgbe)
1411 {
1412 	ixgbe_tx_ring_t *tx_ring;
1413 	tx_control_block_t *tcb;
1414 	link_list_t pending_list;
1415 	uint32_t desc_num;
1416 	int i, j;
1417 
1418 	LINK_LIST_INIT(&pending_list);
1419 
1420 	for (i = 0; i < ixgbe->num_tx_rings; i++) {
1421 		tx_ring = &ixgbe->tx_rings[i];
1422 
1423 		mutex_enter(&tx_ring->recycle_lock);
1424 
1425 		/*
1426 		 * Clean the pending tx data - the pending packets in the
1427 		 * work_list that have no chances to be transmitted again.
1428 		 *
1429 		 * We must ensure the chipset is stopped or the link is down
1430 		 * before cleaning the transmit packets.
1431 		 */
1432 		desc_num = 0;
1433 		for (j = 0; j < tx_ring->ring_size; j++) {
1434 			tcb = tx_ring->work_list[j];
1435 			if (tcb != NULL) {
1436 				desc_num += tcb->desc_num;
1437 
1438 				tx_ring->work_list[j] = NULL;
1439 
1440 				ixgbe_free_tcb(tcb);
1441 
1442 				LIST_PUSH_TAIL(&pending_list, &tcb->link);
1443 			}
1444 		}
1445 
1446 		if (desc_num > 0) {
1447 			atomic_add_32(&tx_ring->tbd_free, desc_num);
1448 			ASSERT(tx_ring->tbd_free == tx_ring->ring_size);
1449 
1450 			/*
1451 			 * Reset the head and tail pointers of the tbd ring;
1452 			 * Reset the writeback head if it's enable.
1453 			 */
1454 			tx_ring->tbd_head = 0;
1455 			tx_ring->tbd_tail = 0;
1456 			if (ixgbe->tx_head_wb_enable)
1457 				*tx_ring->tbd_head_wb = 0;
1458 
1459 			IXGBE_WRITE_REG(&ixgbe->hw,
1460 			    IXGBE_TDH(tx_ring->index), 0);
1461 			IXGBE_WRITE_REG(&ixgbe->hw,
1462 			    IXGBE_TDT(tx_ring->index), 0);
1463 		}
1464 
1465 		mutex_exit(&tx_ring->recycle_lock);
1466 
1467 		/*
1468 		 * Add the tx control blocks in the pending list to
1469 		 * the free list.
1470 		 */
1471 		ixgbe_put_free_list(tx_ring, &pending_list);
1472 	}
1473 }
1474 
1475 /*
1476  * ixgbe_tx_drain - Drain the tx rings to allow pending packets to be
1477  * transmitted.
1478  */
1479 static boolean_t
1480 ixgbe_tx_drain(ixgbe_t *ixgbe)
1481 {
1482 	ixgbe_tx_ring_t *tx_ring;
1483 	boolean_t done;
1484 	int i, j;
1485 
1486 	/*
1487 	 * Wait for a specific time to allow pending tx packets
1488 	 * to be transmitted.
1489 	 *
1490 	 * Check the counter tbd_free to see if transmission is done.
1491 	 * No lock protection is needed here.
1492 	 *
1493 	 * Return B_TRUE if all pending packets have been transmitted;
1494 	 * Otherwise return B_FALSE;
1495 	 */
1496 	for (i = 0; i < TX_DRAIN_TIME; i++) {
1497 
1498 		done = B_TRUE;
1499 		for (j = 0; j < ixgbe->num_tx_rings; j++) {
1500 			tx_ring = &ixgbe->tx_rings[j];
1501 			done = done &&
1502 			    (tx_ring->tbd_free == tx_ring->ring_size);
1503 		}
1504 
1505 		if (done)
1506 			break;
1507 
1508 		msec_delay(1);
1509 	}
1510 
1511 	return (done);
1512 }
1513 
1514 /*
1515  * ixgbe_rx_drain - Wait for all rx buffers to be released by upper layer.
1516  */
1517 static boolean_t
1518 ixgbe_rx_drain(ixgbe_t *ixgbe)
1519 {
1520 	boolean_t done = B_TRUE;
1521 	int i;
1522 
1523 	/*
1524 	 * Polling the rx free list to check if those rx buffers held by
1525 	 * the upper layer are released.
1526 	 *
1527 	 * Check the counter rcb_free to see if all pending buffers are
1528 	 * released. No lock protection is needed here.
1529 	 *
1530 	 * Return B_TRUE if all pending buffers have been released;
1531 	 * Otherwise return B_FALSE;
1532 	 */
1533 	for (i = 0; i < RX_DRAIN_TIME; i++) {
1534 		done = (ixgbe->rcb_pending == 0);
1535 
1536 		if (done)
1537 			break;
1538 
1539 		msec_delay(1);
1540 	}
1541 
1542 	return (done);
1543 }
1544 
1545 /*
1546  * ixgbe_start - Start the driver/chipset.
1547  */
1548 int
1549 ixgbe_start(ixgbe_t *ixgbe, boolean_t alloc_buffer)
1550 {
1551 	int i;
1552 
1553 	ASSERT(mutex_owned(&ixgbe->gen_lock));
1554 
1555 	if (alloc_buffer) {
1556 		if (ixgbe_alloc_rx_data(ixgbe) != IXGBE_SUCCESS) {
1557 			ixgbe_error(ixgbe,
1558 			    "Failed to allocate software receive rings");
1559 			return (IXGBE_FAILURE);
1560 		}
1561 
1562 		/* Allocate buffers for all the rx/tx rings */
1563 		if (ixgbe_alloc_dma(ixgbe) != IXGBE_SUCCESS) {
1564 			ixgbe_error(ixgbe, "Failed to allocate DMA resource");
1565 			return (IXGBE_FAILURE);
1566 		}
1567 
1568 		ixgbe->tx_ring_init = B_TRUE;
1569 	} else {
1570 		ixgbe->tx_ring_init = B_FALSE;
1571 	}
1572 
1573 	for (i = 0; i < ixgbe->num_rx_rings; i++)
1574 		mutex_enter(&ixgbe->rx_rings[i].rx_lock);
1575 	for (i = 0; i < ixgbe->num_tx_rings; i++)
1576 		mutex_enter(&ixgbe->tx_rings[i].tx_lock);
1577 
1578 	/*
1579 	 * Start the chipset hardware
1580 	 */
1581 	if (ixgbe_chip_start(ixgbe) != IXGBE_SUCCESS) {
1582 		ixgbe_fm_ereport(ixgbe, DDI_FM_DEVICE_INVAL_STATE);
1583 		goto start_failure;
1584 	}
1585 
1586 	if (ixgbe_check_acc_handle(ixgbe->osdep.reg_handle) != DDI_FM_OK) {
1587 		goto start_failure;
1588 	}
1589 
1590 	/*
1591 	 * Setup the rx/tx rings
1592 	 */
1593 	ixgbe_setup_rings(ixgbe);
1594 
1595 	/*
1596 	 * ixgbe_start() will be called when resetting, however if reset
1597 	 * happens, we need to clear the ERROR, STALL and OVERTEMP flags
1598 	 * before enabling the interrupts.
1599 	 */
1600 	atomic_and_32(&ixgbe->ixgbe_state, ~(IXGBE_ERROR
1601 	    | IXGBE_STALL| IXGBE_OVERTEMP));
1602 
1603 	/*
1604 	 * Enable adapter interrupts
1605 	 * The interrupts must be enabled after the driver state is START
1606 	 */
1607 	ixgbe_enable_adapter_interrupts(ixgbe);
1608 
1609 	for (i = ixgbe->num_tx_rings - 1; i >= 0; i--)
1610 		mutex_exit(&ixgbe->tx_rings[i].tx_lock);
1611 	for (i = ixgbe->num_rx_rings - 1; i >= 0; i--)
1612 		mutex_exit(&ixgbe->rx_rings[i].rx_lock);
1613 
1614 	return (IXGBE_SUCCESS);
1615 
1616 start_failure:
1617 	for (i = ixgbe->num_tx_rings - 1; i >= 0; i--)
1618 		mutex_exit(&ixgbe->tx_rings[i].tx_lock);
1619 	for (i = ixgbe->num_rx_rings - 1; i >= 0; i--)
1620 		mutex_exit(&ixgbe->rx_rings[i].rx_lock);
1621 
1622 	ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_LOST);
1623 
1624 	return (IXGBE_FAILURE);
1625 }
1626 
1627 /*
1628  * ixgbe_stop - Stop the driver/chipset.
1629  */
1630 void
1631 ixgbe_stop(ixgbe_t *ixgbe, boolean_t free_buffer)
1632 {
1633 	int i;
1634 
1635 	ASSERT(mutex_owned(&ixgbe->gen_lock));
1636 
1637 	/*
1638 	 * Disable the adapter interrupts
1639 	 */
1640 	ixgbe_disable_adapter_interrupts(ixgbe);
1641 
1642 	/*
1643 	 * Drain the pending tx packets
1644 	 */
1645 	(void) ixgbe_tx_drain(ixgbe);
1646 
1647 	for (i = 0; i < ixgbe->num_rx_rings; i++)
1648 		mutex_enter(&ixgbe->rx_rings[i].rx_lock);
1649 	for (i = 0; i < ixgbe->num_tx_rings; i++)
1650 		mutex_enter(&ixgbe->tx_rings[i].tx_lock);
1651 
1652 	/*
1653 	 * Stop the chipset hardware
1654 	 */
1655 	ixgbe_chip_stop(ixgbe);
1656 
1657 	if (ixgbe_check_acc_handle(ixgbe->osdep.reg_handle) != DDI_FM_OK) {
1658 		ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_LOST);
1659 	}
1660 
1661 	/*
1662 	 * Clean the pending tx data/resources
1663 	 */
1664 	ixgbe_tx_clean(ixgbe);
1665 
1666 	for (i = ixgbe->num_tx_rings - 1; i >= 0; i--)
1667 		mutex_exit(&ixgbe->tx_rings[i].tx_lock);
1668 	for (i = ixgbe->num_rx_rings - 1; i >= 0; i--)
1669 		mutex_exit(&ixgbe->rx_rings[i].rx_lock);
1670 
1671 	if (ixgbe->link_state == LINK_STATE_UP) {
1672 		ixgbe->link_state = LINK_STATE_UNKNOWN;
1673 		mac_link_update(ixgbe->mac_hdl, ixgbe->link_state);
1674 	}
1675 
1676 	if (free_buffer) {
1677 		/*
1678 		 * Release the DMA/memory resources of rx/tx rings
1679 		 */
1680 		ixgbe_free_dma(ixgbe);
1681 		ixgbe_free_rx_data(ixgbe);
1682 	}
1683 }
1684 
1685 /*
1686  * ixgbe_cbfunc - Driver interface for generic DDI callbacks
1687  */
1688 /* ARGSUSED */
1689 static int
1690 ixgbe_cbfunc(dev_info_t *dip, ddi_cb_action_t cbaction, void *cbarg,
1691     void *arg1, void *arg2)
1692 {
1693 	ixgbe_t *ixgbe = (ixgbe_t *)arg1;
1694 
1695 	switch (cbaction) {
1696 	/* IRM callback */
1697 	int count;
1698 	case DDI_CB_INTR_ADD:
1699 	case DDI_CB_INTR_REMOVE:
1700 		count = (int)(uintptr_t)cbarg;
1701 		ASSERT(ixgbe->intr_type == DDI_INTR_TYPE_MSIX);
1702 		DTRACE_PROBE2(ixgbe__irm__callback, int, count,
1703 		    int, ixgbe->intr_cnt);
1704 		if (ixgbe_intr_adjust(ixgbe, cbaction, count) !=
1705 		    DDI_SUCCESS) {
1706 			ixgbe_error(ixgbe,
1707 			    "IRM CB: Failed to adjust interrupts");
1708 			goto cb_fail;
1709 		}
1710 		break;
1711 	default:
1712 		IXGBE_DEBUGLOG_1(ixgbe, "DDI CB: action 0x%x NOT supported",
1713 		    cbaction);
1714 		return (DDI_ENOTSUP);
1715 	}
1716 	return (DDI_SUCCESS);
1717 cb_fail:
1718 	return (DDI_FAILURE);
1719 }
1720 
1721 /*
1722  * ixgbe_intr_adjust - Adjust interrupt to respond to IRM request.
1723  */
1724 static int
1725 ixgbe_intr_adjust(ixgbe_t *ixgbe, ddi_cb_action_t cbaction, int count)
1726 {
1727 	int i, rc, actual;
1728 
1729 	if (count == 0)
1730 		return (DDI_SUCCESS);
1731 
1732 	if ((cbaction == DDI_CB_INTR_ADD &&
1733 	    ixgbe->intr_cnt + count > ixgbe->intr_cnt_max) ||
1734 	    (cbaction == DDI_CB_INTR_REMOVE &&
1735 	    ixgbe->intr_cnt - count < ixgbe->intr_cnt_min))
1736 		return (DDI_FAILURE);
1737 
1738 	if (!(ixgbe->ixgbe_state & IXGBE_STARTED)) {
1739 		return (DDI_FAILURE);
1740 	}
1741 
1742 	for (i = 0; i < ixgbe->num_rx_rings; i++)
1743 		mac_ring_intr_set(ixgbe->rx_rings[i].ring_handle, NULL);
1744 	for (i = 0; i < ixgbe->num_tx_rings; i++)
1745 		mac_ring_intr_set(ixgbe->tx_rings[i].ring_handle, NULL);
1746 
1747 	mutex_enter(&ixgbe->gen_lock);
1748 	ixgbe->ixgbe_state &= ~IXGBE_STARTED;
1749 	ixgbe->ixgbe_state |= IXGBE_INTR_ADJUST;
1750 	ixgbe->ixgbe_state |= IXGBE_SUSPENDED;
1751 	mac_link_update(ixgbe->mac_hdl, LINK_STATE_UNKNOWN);
1752 
1753 	ixgbe_stop(ixgbe, B_FALSE);
1754 	/*
1755 	 * Disable interrupts
1756 	 */
1757 	if (ixgbe->attach_progress & ATTACH_PROGRESS_ENABLE_INTR) {
1758 		rc = ixgbe_disable_intrs(ixgbe);
1759 		ASSERT(rc == IXGBE_SUCCESS);
1760 	}
1761 	ixgbe->attach_progress &= ~ATTACH_PROGRESS_ENABLE_INTR;
1762 
1763 	/*
1764 	 * Remove interrupt handlers
1765 	 */
1766 	if (ixgbe->attach_progress & ATTACH_PROGRESS_ADD_INTR) {
1767 		ixgbe_rem_intr_handlers(ixgbe);
1768 	}
1769 	ixgbe->attach_progress &= ~ATTACH_PROGRESS_ADD_INTR;
1770 
1771 	/*
1772 	 * Clear vect_map
1773 	 */
1774 	bzero(&ixgbe->vect_map, sizeof (ixgbe->vect_map));
1775 	switch (cbaction) {
1776 	case DDI_CB_INTR_ADD:
1777 		rc = ddi_intr_alloc(ixgbe->dip, ixgbe->htable,
1778 		    DDI_INTR_TYPE_MSIX, ixgbe->intr_cnt, count, &actual,
1779 		    DDI_INTR_ALLOC_NORMAL);
1780 		if (rc != DDI_SUCCESS || actual != count) {
1781 			ixgbe_log(ixgbe, "Adjust interrupts failed."
1782 			    "return: %d, irm cb size: %d, actual: %d",
1783 			    rc, count, actual);
1784 			goto intr_adjust_fail;
1785 		}
1786 		ixgbe->intr_cnt += count;
1787 		break;
1788 
1789 	case DDI_CB_INTR_REMOVE:
1790 		for (i = ixgbe->intr_cnt - count;
1791 		    i < ixgbe->intr_cnt; i ++) {
1792 			rc = ddi_intr_free(ixgbe->htable[i]);
1793 			ixgbe->htable[i] = NULL;
1794 			if (rc != DDI_SUCCESS) {
1795 				ixgbe_log(ixgbe, "Adjust interrupts failed."
1796 				    "return: %d, irm cb size: %d, actual: %d",
1797 				    rc, count, actual);
1798 				goto intr_adjust_fail;
1799 			}
1800 		}
1801 		ixgbe->intr_cnt -= count;
1802 		break;
1803 	}
1804 
1805 	/*
1806 	 * Get priority for first vector, assume remaining are all the same
1807 	 */
1808 	rc = ddi_intr_get_pri(ixgbe->htable[0], &ixgbe->intr_pri);
1809 	if (rc != DDI_SUCCESS) {
1810 		ixgbe_log(ixgbe,
1811 		    "Get interrupt priority failed: %d", rc);
1812 		goto intr_adjust_fail;
1813 	}
1814 	rc = ddi_intr_get_cap(ixgbe->htable[0], &ixgbe->intr_cap);
1815 	if (rc != DDI_SUCCESS) {
1816 		ixgbe_log(ixgbe, "Get interrupt cap failed: %d", rc);
1817 		goto intr_adjust_fail;
1818 	}
1819 	ixgbe->attach_progress |= ATTACH_PROGRESS_ALLOC_INTR;
1820 
1821 	/*
1822 	 * Map rings to interrupt vectors
1823 	 */
1824 	if (ixgbe_map_intrs_to_vectors(ixgbe) != IXGBE_SUCCESS) {
1825 		ixgbe_error(ixgbe,
1826 		    "IRM CB: Failed to map interrupts to vectors");
1827 		goto intr_adjust_fail;
1828 	}
1829 
1830 	/*
1831 	 * Add interrupt handlers
1832 	 */
1833 	if (ixgbe_add_intr_handlers(ixgbe) != IXGBE_SUCCESS) {
1834 		ixgbe_error(ixgbe, "IRM CB: Failed to add interrupt handlers");
1835 		goto intr_adjust_fail;
1836 	}
1837 	ixgbe->attach_progress |= ATTACH_PROGRESS_ADD_INTR;
1838 
1839 	/*
1840 	 * Now that mutex locks are initialized, and the chip is also
1841 	 * initialized, enable interrupts.
1842 	 */
1843 	if (ixgbe_enable_intrs(ixgbe) != IXGBE_SUCCESS) {
1844 		ixgbe_error(ixgbe, "IRM CB: Failed to enable DDI interrupts");
1845 		goto intr_adjust_fail;
1846 	}
1847 	ixgbe->attach_progress |= ATTACH_PROGRESS_ENABLE_INTR;
1848 	if (ixgbe_start(ixgbe, B_FALSE) != IXGBE_SUCCESS) {
1849 		ixgbe_error(ixgbe, "IRM CB: Failed to start");
1850 		goto intr_adjust_fail;
1851 	}
1852 	ixgbe->ixgbe_state &= ~IXGBE_INTR_ADJUST;
1853 	ixgbe->ixgbe_state &= ~IXGBE_SUSPENDED;
1854 	ixgbe->ixgbe_state |= IXGBE_STARTED;
1855 	mutex_exit(&ixgbe->gen_lock);
1856 
1857 	for (i = 0; i < ixgbe->num_rx_rings; i++) {
1858 		mac_ring_intr_set(ixgbe->rx_rings[i].ring_handle,
1859 		    ixgbe->htable[ixgbe->rx_rings[i].intr_vector]);
1860 	}
1861 	for (i = 0; i < ixgbe->num_tx_rings; i++) {
1862 		mac_ring_intr_set(ixgbe->tx_rings[i].ring_handle,
1863 		    ixgbe->htable[ixgbe->tx_rings[i].intr_vector]);
1864 	}
1865 
1866 	/* Wakeup all Tx rings */
1867 	for (i = 0; i < ixgbe->num_tx_rings; i++) {
1868 		mac_tx_ring_update(ixgbe->mac_hdl,
1869 		    ixgbe->tx_rings[i].ring_handle);
1870 	}
1871 
1872 	IXGBE_DEBUGLOG_3(ixgbe,
1873 	    "IRM CB: interrupts new value: 0x%x(0x%x:0x%x).",
1874 	    ixgbe->intr_cnt, ixgbe->intr_cnt_min, ixgbe->intr_cnt_max);
1875 	return (DDI_SUCCESS);
1876 
1877 intr_adjust_fail:
1878 	ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_LOST);
1879 	mutex_exit(&ixgbe->gen_lock);
1880 	return (DDI_FAILURE);
1881 }
1882 
1883 /*
1884  * ixgbe_intr_cb_register - Register interrupt callback function.
1885  */
1886 static int
1887 ixgbe_intr_cb_register(ixgbe_t *ixgbe)
1888 {
1889 	if (ddi_cb_register(ixgbe->dip, DDI_CB_FLAG_INTR, ixgbe_cbfunc,
1890 	    ixgbe, NULL, &ixgbe->cb_hdl) != DDI_SUCCESS) {
1891 		return (IXGBE_FAILURE);
1892 	}
1893 	IXGBE_DEBUGLOG_0(ixgbe, "Interrupt callback function registered.");
1894 	return (IXGBE_SUCCESS);
1895 }
1896 
1897 /*
1898  * ixgbe_alloc_rings - Allocate memory space for rx/tx rings.
1899  */
1900 static int
1901 ixgbe_alloc_rings(ixgbe_t *ixgbe)
1902 {
1903 	/*
1904 	 * Allocate memory space for rx rings
1905 	 */
1906 	ixgbe->rx_rings = kmem_zalloc(
1907 	    sizeof (ixgbe_rx_ring_t) * ixgbe->num_rx_rings,
1908 	    KM_NOSLEEP);
1909 
1910 	if (ixgbe->rx_rings == NULL) {
1911 		return (IXGBE_FAILURE);
1912 	}
1913 
1914 	/*
1915 	 * Allocate memory space for tx rings
1916 	 */
1917 	ixgbe->tx_rings = kmem_zalloc(
1918 	    sizeof (ixgbe_tx_ring_t) * ixgbe->num_tx_rings,
1919 	    KM_NOSLEEP);
1920 
1921 	if (ixgbe->tx_rings == NULL) {
1922 		kmem_free(ixgbe->rx_rings,
1923 		    sizeof (ixgbe_rx_ring_t) * ixgbe->num_rx_rings);
1924 		ixgbe->rx_rings = NULL;
1925 		return (IXGBE_FAILURE);
1926 	}
1927 
1928 	/*
1929 	 * Allocate memory space for rx ring groups
1930 	 */
1931 	ixgbe->rx_groups = kmem_zalloc(
1932 	    sizeof (ixgbe_rx_group_t) * ixgbe->num_rx_groups,
1933 	    KM_NOSLEEP);
1934 
1935 	if (ixgbe->rx_groups == NULL) {
1936 		kmem_free(ixgbe->rx_rings,
1937 		    sizeof (ixgbe_rx_ring_t) * ixgbe->num_rx_rings);
1938 		kmem_free(ixgbe->tx_rings,
1939 		    sizeof (ixgbe_tx_ring_t) * ixgbe->num_tx_rings);
1940 		ixgbe->rx_rings = NULL;
1941 		ixgbe->tx_rings = NULL;
1942 		return (IXGBE_FAILURE);
1943 	}
1944 
1945 	return (IXGBE_SUCCESS);
1946 }
1947 
1948 /*
1949  * ixgbe_free_rings - Free the memory space of rx/tx rings.
1950  */
1951 static void
1952 ixgbe_free_rings(ixgbe_t *ixgbe)
1953 {
1954 	if (ixgbe->rx_rings != NULL) {
1955 		kmem_free(ixgbe->rx_rings,
1956 		    sizeof (ixgbe_rx_ring_t) * ixgbe->num_rx_rings);
1957 		ixgbe->rx_rings = NULL;
1958 	}
1959 
1960 	if (ixgbe->tx_rings != NULL) {
1961 		kmem_free(ixgbe->tx_rings,
1962 		    sizeof (ixgbe_tx_ring_t) * ixgbe->num_tx_rings);
1963 		ixgbe->tx_rings = NULL;
1964 	}
1965 
1966 	if (ixgbe->rx_groups != NULL) {
1967 		kmem_free(ixgbe->rx_groups,
1968 		    sizeof (ixgbe_rx_group_t) * ixgbe->num_rx_groups);
1969 		ixgbe->rx_groups = NULL;
1970 	}
1971 }
1972 
1973 static int
1974 ixgbe_alloc_rx_data(ixgbe_t *ixgbe)
1975 {
1976 	ixgbe_rx_ring_t *rx_ring;
1977 	int i;
1978 
1979 	for (i = 0; i < ixgbe->num_rx_rings; i++) {
1980 		rx_ring = &ixgbe->rx_rings[i];
1981 		if (ixgbe_alloc_rx_ring_data(rx_ring) != IXGBE_SUCCESS)
1982 			goto alloc_rx_rings_failure;
1983 	}
1984 	return (IXGBE_SUCCESS);
1985 
1986 alloc_rx_rings_failure:
1987 	ixgbe_free_rx_data(ixgbe);
1988 	return (IXGBE_FAILURE);
1989 }
1990 
1991 static void
1992 ixgbe_free_rx_data(ixgbe_t *ixgbe)
1993 {
1994 	ixgbe_rx_ring_t *rx_ring;
1995 	ixgbe_rx_data_t *rx_data;
1996 	int i;
1997 
1998 	for (i = 0; i < ixgbe->num_rx_rings; i++) {
1999 		rx_ring = &ixgbe->rx_rings[i];
2000 
2001 		mutex_enter(&ixgbe->rx_pending_lock);
2002 		rx_data = rx_ring->rx_data;
2003 
2004 		if (rx_data != NULL) {
2005 			rx_data->flag |= IXGBE_RX_STOPPED;
2006 
2007 			if (rx_data->rcb_pending == 0) {
2008 				ixgbe_free_rx_ring_data(rx_data);
2009 				rx_ring->rx_data = NULL;
2010 			}
2011 		}
2012 
2013 		mutex_exit(&ixgbe->rx_pending_lock);
2014 	}
2015 }
2016 
2017 /*
2018  * ixgbe_setup_rings - Setup rx/tx rings.
2019  */
2020 static void
2021 ixgbe_setup_rings(ixgbe_t *ixgbe)
2022 {
2023 	/*
2024 	 * Setup the rx/tx rings, including the following:
2025 	 *
2026 	 * 1. Setup the descriptor ring and the control block buffers;
2027 	 * 2. Initialize necessary registers for receive/transmit;
2028 	 * 3. Initialize software pointers/parameters for receive/transmit;
2029 	 */
2030 	ixgbe_setup_rx(ixgbe);
2031 
2032 	ixgbe_setup_tx(ixgbe);
2033 }
2034 
2035 static void
2036 ixgbe_setup_rx_ring(ixgbe_rx_ring_t *rx_ring)
2037 {
2038 	ixgbe_t *ixgbe = rx_ring->ixgbe;
2039 	ixgbe_rx_data_t *rx_data = rx_ring->rx_data;
2040 	struct ixgbe_hw *hw = &ixgbe->hw;
2041 	rx_control_block_t *rcb;
2042 	union ixgbe_adv_rx_desc	*rbd;
2043 	uint32_t size;
2044 	uint32_t buf_low;
2045 	uint32_t buf_high;
2046 	uint32_t reg_val;
2047 	int i;
2048 
2049 	ASSERT(mutex_owned(&rx_ring->rx_lock));
2050 	ASSERT(mutex_owned(&ixgbe->gen_lock));
2051 
2052 	for (i = 0; i < ixgbe->rx_ring_size; i++) {
2053 		rcb = rx_data->work_list[i];
2054 		rbd = &rx_data->rbd_ring[i];
2055 
2056 		rbd->read.pkt_addr = rcb->rx_buf.dma_address;
2057 		rbd->read.hdr_addr = NULL;
2058 	}
2059 
2060 	/*
2061 	 * Initialize the length register
2062 	 */
2063 	size = rx_data->ring_size * sizeof (union ixgbe_adv_rx_desc);
2064 	IXGBE_WRITE_REG(hw, IXGBE_RDLEN(rx_ring->hw_index), size);
2065 
2066 	/*
2067 	 * Initialize the base address registers
2068 	 */
2069 	buf_low = (uint32_t)rx_data->rbd_area.dma_address;
2070 	buf_high = (uint32_t)(rx_data->rbd_area.dma_address >> 32);
2071 	IXGBE_WRITE_REG(hw, IXGBE_RDBAH(rx_ring->hw_index), buf_high);
2072 	IXGBE_WRITE_REG(hw, IXGBE_RDBAL(rx_ring->hw_index), buf_low);
2073 
2074 	/*
2075 	 * Setup head & tail pointers
2076 	 */
2077 	IXGBE_WRITE_REG(hw, IXGBE_RDT(rx_ring->hw_index),
2078 	    rx_data->ring_size - 1);
2079 	IXGBE_WRITE_REG(hw, IXGBE_RDH(rx_ring->hw_index), 0);
2080 
2081 	rx_data->rbd_next = 0;
2082 	rx_data->lro_first = 0;
2083 
2084 	/*
2085 	 * Setup the Receive Descriptor Control Register (RXDCTL)
2086 	 * PTHRESH=32 descriptors (half the internal cache)
2087 	 * HTHRESH=0 descriptors (to minimize latency on fetch)
2088 	 * WTHRESH defaults to 1 (writeback each descriptor)
2089 	 */
2090 	reg_val = IXGBE_READ_REG(hw, IXGBE_RXDCTL(rx_ring->hw_index));
2091 	reg_val |= IXGBE_RXDCTL_ENABLE;	/* enable queue */
2092 
2093 	/* Not a valid value for 82599 */
2094 	if (hw->mac.type < ixgbe_mac_82599EB) {
2095 		reg_val |= 0x0020;	/* pthresh */
2096 	}
2097 	IXGBE_WRITE_REG(hw, IXGBE_RXDCTL(rx_ring->hw_index), reg_val);
2098 
2099 	if (hw->mac.type == ixgbe_mac_82599EB) {
2100 		reg_val = IXGBE_READ_REG(hw, IXGBE_RDRXCTL);
2101 		reg_val |= (IXGBE_RDRXCTL_CRCSTRIP | IXGBE_RDRXCTL_AGGDIS);
2102 		IXGBE_WRITE_REG(hw, IXGBE_RDRXCTL, reg_val);
2103 	}
2104 
2105 	/*
2106 	 * Setup the Split and Replication Receive Control Register.
2107 	 * Set the rx buffer size and the advanced descriptor type.
2108 	 */
2109 	reg_val = (ixgbe->rx_buf_size >> IXGBE_SRRCTL_BSIZEPKT_SHIFT) |
2110 	    IXGBE_SRRCTL_DESCTYPE_ADV_ONEBUF;
2111 	reg_val |= IXGBE_SRRCTL_DROP_EN;
2112 	IXGBE_WRITE_REG(hw, IXGBE_SRRCTL(rx_ring->hw_index), reg_val);
2113 }
2114 
2115 static void
2116 ixgbe_setup_rx(ixgbe_t *ixgbe)
2117 {
2118 	ixgbe_rx_ring_t *rx_ring;
2119 	struct ixgbe_hw *hw = &ixgbe->hw;
2120 	uint32_t reg_val;
2121 	uint32_t ring_mapping;
2122 	uint32_t i, index;
2123 	uint32_t psrtype_rss_bit;
2124 
2125 	/* PSRTYPE must be configured for 82599 */
2126 	if (ixgbe->classify_mode != IXGBE_CLASSIFY_VMDQ &&
2127 	    ixgbe->classify_mode != IXGBE_CLASSIFY_VMDQ_RSS) {
2128 		reg_val = IXGBE_PSRTYPE_TCPHDR | IXGBE_PSRTYPE_UDPHDR |
2129 		    IXGBE_PSRTYPE_IPV4HDR | IXGBE_PSRTYPE_IPV6HDR;
2130 		reg_val |= IXGBE_PSRTYPE_L2HDR;
2131 		reg_val |= 0x80000000;
2132 		IXGBE_WRITE_REG(hw, IXGBE_PSRTYPE(0), reg_val);
2133 	} else {
2134 		if (ixgbe->num_rx_groups > 32) {
2135 			psrtype_rss_bit = 0x20000000;
2136 		} else {
2137 			psrtype_rss_bit = 0x40000000;
2138 		}
2139 		for (i = 0; i < ixgbe->capab->max_rx_grp_num; i++) {
2140 			reg_val = IXGBE_PSRTYPE_TCPHDR | IXGBE_PSRTYPE_UDPHDR |
2141 			    IXGBE_PSRTYPE_IPV4HDR | IXGBE_PSRTYPE_IPV6HDR;
2142 			reg_val |= IXGBE_PSRTYPE_L2HDR;
2143 			reg_val |= psrtype_rss_bit;
2144 			IXGBE_WRITE_REG(hw, IXGBE_PSRTYPE(i), reg_val);
2145 		}
2146 	}
2147 
2148 	/*
2149 	 * Set filter control in FCTRL to accept broadcast packets and do
2150 	 * not pass pause frames to host.  Flow control settings are already
2151 	 * in this register, so preserve them.
2152 	 */
2153 	reg_val = IXGBE_READ_REG(hw, IXGBE_FCTRL);
2154 	reg_val |= IXGBE_FCTRL_BAM;	/* broadcast accept mode */
2155 	reg_val |= IXGBE_FCTRL_DPF;	/* discard pause frames */
2156 	IXGBE_WRITE_REG(hw, IXGBE_FCTRL, reg_val);
2157 
2158 	/*
2159 	 * Hardware checksum settings
2160 	 */
2161 	if (ixgbe->rx_hcksum_enable) {
2162 		reg_val = IXGBE_RXCSUM_IPPCSE;	/* IP checksum */
2163 		IXGBE_WRITE_REG(hw, IXGBE_RXCSUM, reg_val);
2164 	}
2165 
2166 	/*
2167 	 * Setup VMDq and RSS for multiple receive queues
2168 	 */
2169 	switch (ixgbe->classify_mode) {
2170 	case IXGBE_CLASSIFY_RSS:
2171 		/*
2172 		 * One group, only RSS is needed when more than
2173 		 * one ring enabled.
2174 		 */
2175 		ixgbe_setup_rss(ixgbe);
2176 		break;
2177 
2178 	case IXGBE_CLASSIFY_VMDQ:
2179 		/*
2180 		 * Multiple groups, each group has one ring,
2181 		 * only VMDq is needed.
2182 		 */
2183 		ixgbe_setup_vmdq(ixgbe);
2184 		break;
2185 
2186 	case IXGBE_CLASSIFY_VMDQ_RSS:
2187 		/*
2188 		 * Multiple groups and multiple rings, both
2189 		 * VMDq and RSS are needed.
2190 		 */
2191 		ixgbe_setup_vmdq_rss(ixgbe);
2192 		break;
2193 
2194 	default:
2195 		break;
2196 	}
2197 
2198 	/*
2199 	 * Enable the receive unit.  This must be done after filter
2200 	 * control is set in FCTRL.
2201 	 */
2202 	reg_val = (IXGBE_RXCTRL_RXEN	/* Enable Receive Unit */
2203 	    | IXGBE_RXCTRL_DMBYPS);	/* descriptor monitor bypass */
2204 	IXGBE_WRITE_REG(hw, IXGBE_RXCTRL, reg_val);
2205 
2206 	/*
2207 	 * ixgbe_setup_rx_ring must be called after configuring RXCTRL
2208 	 */
2209 	for (i = 0; i < ixgbe->num_rx_rings; i++) {
2210 		rx_ring = &ixgbe->rx_rings[i];
2211 		ixgbe_setup_rx_ring(rx_ring);
2212 	}
2213 
2214 	/*
2215 	 * Setup the per-ring statistics mapping.
2216 	 */
2217 	ring_mapping = 0;
2218 	for (i = 0; i < ixgbe->num_rx_rings; i++) {
2219 		index = ixgbe->rx_rings[i].hw_index;
2220 		ring_mapping = IXGBE_READ_REG(hw, IXGBE_RQSMR(index >> 2));
2221 		ring_mapping |= (i & 0xF) << (8 * (index & 0x3));
2222 		IXGBE_WRITE_REG(hw, IXGBE_RQSMR(index >> 2), ring_mapping);
2223 	}
2224 
2225 	/*
2226 	 * The Max Frame Size in MHADD/MAXFRS will be internally increased
2227 	 * by four bytes if the packet has a VLAN field, so includes MTU,
2228 	 * ethernet header and frame check sequence.
2229 	 * Register is MAXFRS in 82599.
2230 	 */
2231 	reg_val = (ixgbe->default_mtu + sizeof (struct ether_header)
2232 	    + ETHERFCSL) << IXGBE_MHADD_MFS_SHIFT;
2233 	IXGBE_WRITE_REG(hw, IXGBE_MHADD, reg_val);
2234 
2235 	/*
2236 	 * Setup Jumbo Frame enable bit
2237 	 */
2238 	if (ixgbe->default_mtu > ETHERMTU) {
2239 		reg_val = IXGBE_READ_REG(hw, IXGBE_HLREG0);
2240 		reg_val |= IXGBE_HLREG0_JUMBOEN;
2241 		IXGBE_WRITE_REG(hw, IXGBE_HLREG0, reg_val);
2242 	}
2243 
2244 	/*
2245 	 * Setup RSC for multiple receive queues.
2246 	 */
2247 	if (ixgbe->lro_enable) {
2248 		for (i = 0; i < ixgbe->num_rx_rings; i++) {
2249 			/*
2250 			 * Make sure rx_buf_size * MAXDESC not greater
2251 			 * than 65535.
2252 			 * Intel recommends 4 for MAXDESC field value.
2253 			 */
2254 			reg_val = IXGBE_READ_REG(hw, IXGBE_RSCCTL(i));
2255 			reg_val |= IXGBE_RSCCTL_RSCEN;
2256 			if (ixgbe->rx_buf_size == IXGBE_PKG_BUF_16k)
2257 				reg_val |= IXGBE_RSCCTL_MAXDESC_1;
2258 			else
2259 				reg_val |= IXGBE_RSCCTL_MAXDESC_4;
2260 			IXGBE_WRITE_REG(hw,  IXGBE_RSCCTL(i), reg_val);
2261 		}
2262 
2263 		reg_val = IXGBE_READ_REG(hw, IXGBE_RSCDBU);
2264 		reg_val |= IXGBE_RSCDBU_RSCACKDIS;
2265 		IXGBE_WRITE_REG(hw, IXGBE_RSCDBU, reg_val);
2266 
2267 		reg_val = IXGBE_READ_REG(hw, IXGBE_RDRXCTL);
2268 		reg_val |= IXGBE_RDRXCTL_RSCACKC;
2269 		reg_val |= IXGBE_RDRXCTL_FCOE_WRFIX;
2270 		reg_val &= ~IXGBE_RDRXCTL_RSCFRSTSIZE;
2271 
2272 		IXGBE_WRITE_REG(hw, IXGBE_RDRXCTL, reg_val);
2273 	}
2274 }
2275 
2276 static void
2277 ixgbe_setup_tx_ring(ixgbe_tx_ring_t *tx_ring)
2278 {
2279 	ixgbe_t *ixgbe = tx_ring->ixgbe;
2280 	struct ixgbe_hw *hw = &ixgbe->hw;
2281 	uint32_t size;
2282 	uint32_t buf_low;
2283 	uint32_t buf_high;
2284 	uint32_t reg_val;
2285 
2286 	ASSERT(mutex_owned(&tx_ring->tx_lock));
2287 	ASSERT(mutex_owned(&ixgbe->gen_lock));
2288 
2289 	/*
2290 	 * Initialize the length register
2291 	 */
2292 	size = tx_ring->ring_size * sizeof (union ixgbe_adv_tx_desc);
2293 	IXGBE_WRITE_REG(hw, IXGBE_TDLEN(tx_ring->index), size);
2294 
2295 	/*
2296 	 * Initialize the base address registers
2297 	 */
2298 	buf_low = (uint32_t)tx_ring->tbd_area.dma_address;
2299 	buf_high = (uint32_t)(tx_ring->tbd_area.dma_address >> 32);
2300 	IXGBE_WRITE_REG(hw, IXGBE_TDBAL(tx_ring->index), buf_low);
2301 	IXGBE_WRITE_REG(hw, IXGBE_TDBAH(tx_ring->index), buf_high);
2302 
2303 	/*
2304 	 * Setup head & tail pointers
2305 	 */
2306 	IXGBE_WRITE_REG(hw, IXGBE_TDH(tx_ring->index), 0);
2307 	IXGBE_WRITE_REG(hw, IXGBE_TDT(tx_ring->index), 0);
2308 
2309 	/*
2310 	 * Setup head write-back
2311 	 */
2312 	if (ixgbe->tx_head_wb_enable) {
2313 		/*
2314 		 * The memory of the head write-back is allocated using
2315 		 * the extra tbd beyond the tail of the tbd ring.
2316 		 */
2317 		tx_ring->tbd_head_wb = (uint32_t *)
2318 		    ((uintptr_t)tx_ring->tbd_area.address + size);
2319 		*tx_ring->tbd_head_wb = 0;
2320 
2321 		buf_low = (uint32_t)
2322 		    (tx_ring->tbd_area.dma_address + size);
2323 		buf_high = (uint32_t)
2324 		    ((tx_ring->tbd_area.dma_address + size) >> 32);
2325 
2326 		/* Set the head write-back enable bit */
2327 		buf_low |= IXGBE_TDWBAL_HEAD_WB_ENABLE;
2328 
2329 		IXGBE_WRITE_REG(hw, IXGBE_TDWBAL(tx_ring->index), buf_low);
2330 		IXGBE_WRITE_REG(hw, IXGBE_TDWBAH(tx_ring->index), buf_high);
2331 
2332 		/*
2333 		 * Turn off relaxed ordering for head write back or it will
2334 		 * cause problems with the tx recycling
2335 		 */
2336 		reg_val = IXGBE_READ_REG(hw,
2337 		    IXGBE_DCA_TXCTRL(tx_ring->index));
2338 		reg_val &= ~IXGBE_DCA_TXCTRL_TX_WB_RO_EN;
2339 		IXGBE_WRITE_REG(hw,
2340 		    IXGBE_DCA_TXCTRL(tx_ring->index), reg_val);
2341 	} else {
2342 		tx_ring->tbd_head_wb = NULL;
2343 	}
2344 
2345 	tx_ring->tbd_head = 0;
2346 	tx_ring->tbd_tail = 0;
2347 	tx_ring->tbd_free = tx_ring->ring_size;
2348 
2349 	if (ixgbe->tx_ring_init == B_TRUE) {
2350 		tx_ring->tcb_head = 0;
2351 		tx_ring->tcb_tail = 0;
2352 		tx_ring->tcb_free = tx_ring->free_list_size;
2353 	}
2354 
2355 	/*
2356 	 * Initialize the s/w context structure
2357 	 */
2358 	bzero(&tx_ring->tx_context, sizeof (ixgbe_tx_context_t));
2359 }
2360 
2361 static void
2362 ixgbe_setup_tx(ixgbe_t *ixgbe)
2363 {
2364 	struct ixgbe_hw *hw = &ixgbe->hw;
2365 	ixgbe_tx_ring_t *tx_ring;
2366 	uint32_t reg_val;
2367 	uint32_t ring_mapping;
2368 	int i;
2369 
2370 	for (i = 0; i < ixgbe->num_tx_rings; i++) {
2371 		tx_ring = &ixgbe->tx_rings[i];
2372 		ixgbe_setup_tx_ring(tx_ring);
2373 	}
2374 
2375 	/*
2376 	 * Setup the per-ring statistics mapping.
2377 	 */
2378 	ring_mapping = 0;
2379 	for (i = 0; i < ixgbe->num_tx_rings; i++) {
2380 		ring_mapping |= (i & 0xF) << (8 * (i & 0x3));
2381 		if ((i & 0x3) == 0x3) {
2382 			switch (hw->mac.type) {
2383 			case ixgbe_mac_82598EB:
2384 				IXGBE_WRITE_REG(hw, IXGBE_TQSMR(i >> 2),
2385 				    ring_mapping);
2386 				break;
2387 
2388 			case ixgbe_mac_82599EB:
2389 				IXGBE_WRITE_REG(hw, IXGBE_TQSM(i >> 2),
2390 				    ring_mapping);
2391 				break;
2392 
2393 			default:
2394 				break;
2395 			}
2396 
2397 			ring_mapping = 0;
2398 		}
2399 	}
2400 	if (i & 0x3) {
2401 		switch (hw->mac.type) {
2402 		case ixgbe_mac_82598EB:
2403 			IXGBE_WRITE_REG(hw, IXGBE_TQSMR(i >> 2), ring_mapping);
2404 			break;
2405 
2406 		case ixgbe_mac_82599EB:
2407 			IXGBE_WRITE_REG(hw, IXGBE_TQSM(i >> 2), ring_mapping);
2408 			break;
2409 
2410 		default:
2411 			break;
2412 		}
2413 	}
2414 
2415 	/*
2416 	 * Enable CRC appending and TX padding (for short tx frames)
2417 	 */
2418 	reg_val = IXGBE_READ_REG(hw, IXGBE_HLREG0);
2419 	reg_val |= IXGBE_HLREG0_TXCRCEN | IXGBE_HLREG0_TXPADEN;
2420 	IXGBE_WRITE_REG(hw, IXGBE_HLREG0, reg_val);
2421 
2422 	/*
2423 	 * enable DMA for 82599 parts
2424 	 */
2425 	if (hw->mac.type == ixgbe_mac_82599EB) {
2426 	/* DMATXCTL.TE must be set after all Tx config is complete */
2427 		reg_val = IXGBE_READ_REG(hw, IXGBE_DMATXCTL);
2428 		reg_val |= IXGBE_DMATXCTL_TE;
2429 		IXGBE_WRITE_REG(hw, IXGBE_DMATXCTL, reg_val);
2430 	}
2431 
2432 	/*
2433 	 * Enabling tx queues ..
2434 	 * For 82599 must be done after DMATXCTL.TE is set
2435 	 */
2436 	for (i = 0; i < ixgbe->num_tx_rings; i++) {
2437 		tx_ring = &ixgbe->tx_rings[i];
2438 		reg_val = IXGBE_READ_REG(hw, IXGBE_TXDCTL(tx_ring->index));
2439 		reg_val |= IXGBE_TXDCTL_ENABLE;
2440 		IXGBE_WRITE_REG(hw, IXGBE_TXDCTL(tx_ring->index), reg_val);
2441 	}
2442 }
2443 
2444 /*
2445  * ixgbe_setup_rss - Setup receive-side scaling feature.
2446  */
2447 static void
2448 ixgbe_setup_rss(ixgbe_t *ixgbe)
2449 {
2450 	struct ixgbe_hw *hw = &ixgbe->hw;
2451 	uint32_t i, mrqc, rxcsum;
2452 	uint32_t random;
2453 	uint32_t reta;
2454 	uint32_t ring_per_group;
2455 
2456 	/*
2457 	 * Fill out redirection table
2458 	 */
2459 	reta = 0;
2460 	ring_per_group = ixgbe->num_rx_rings / ixgbe->num_rx_groups;
2461 
2462 	for (i = 0; i < 128; i++) {
2463 		reta = (reta << 8) | (i % ring_per_group) |
2464 		    ((i % ring_per_group) << 4);
2465 		if ((i & 3) == 3)
2466 			IXGBE_WRITE_REG(hw, IXGBE_RETA(i >> 2), reta);
2467 	}
2468 
2469 	/*
2470 	 * Fill out hash function seeds with a random constant
2471 	 */
2472 	for (i = 0; i < 10; i++) {
2473 		(void) random_get_pseudo_bytes((uint8_t *)&random,
2474 		    sizeof (uint32_t));
2475 		IXGBE_WRITE_REG(hw, IXGBE_RSSRK(i), random);
2476 	}
2477 
2478 	/*
2479 	 * Enable RSS & perform hash on these packet types
2480 	 */
2481 	mrqc = IXGBE_MRQC_RSSEN |
2482 	    IXGBE_MRQC_RSS_FIELD_IPV4 |
2483 	    IXGBE_MRQC_RSS_FIELD_IPV4_TCP |
2484 	    IXGBE_MRQC_RSS_FIELD_IPV4_UDP |
2485 	    IXGBE_MRQC_RSS_FIELD_IPV6_EX_TCP |
2486 	    IXGBE_MRQC_RSS_FIELD_IPV6_EX |
2487 	    IXGBE_MRQC_RSS_FIELD_IPV6 |
2488 	    IXGBE_MRQC_RSS_FIELD_IPV6_TCP |
2489 	    IXGBE_MRQC_RSS_FIELD_IPV6_UDP |
2490 	    IXGBE_MRQC_RSS_FIELD_IPV6_EX_UDP;
2491 	IXGBE_WRITE_REG(hw, IXGBE_MRQC, mrqc);
2492 
2493 	/*
2494 	 * Disable Packet Checksum to enable RSS for multiple receive queues.
2495 	 * It is an adapter hardware limitation that Packet Checksum is
2496 	 * mutually exclusive with RSS.
2497 	 */
2498 	rxcsum = IXGBE_READ_REG(hw, IXGBE_RXCSUM);
2499 	rxcsum |= IXGBE_RXCSUM_PCSD;
2500 	rxcsum &= ~IXGBE_RXCSUM_IPPCSE;
2501 	IXGBE_WRITE_REG(hw, IXGBE_RXCSUM, rxcsum);
2502 }
2503 
2504 /*
2505  * ixgbe_setup_vmdq - Setup MAC classification feature
2506  */
2507 static void
2508 ixgbe_setup_vmdq(ixgbe_t *ixgbe)
2509 {
2510 	struct ixgbe_hw *hw = &ixgbe->hw;
2511 	uint32_t vmdctl, i, vtctl;
2512 
2513 	/*
2514 	 * Setup the VMDq Control register, enable VMDq based on
2515 	 * packet destination MAC address:
2516 	 */
2517 	switch (hw->mac.type) {
2518 	case ixgbe_mac_82598EB:
2519 		/*
2520 		 * VMDq Enable = 1;
2521 		 * VMDq Filter = 0; MAC filtering
2522 		 * Default VMDq output index = 0;
2523 		 */
2524 		vmdctl = IXGBE_VMD_CTL_VMDQ_EN;
2525 		IXGBE_WRITE_REG(hw, IXGBE_VMD_CTL, vmdctl);
2526 		break;
2527 
2528 	case ixgbe_mac_82599EB:
2529 		/*
2530 		 * Enable VMDq-only.
2531 		 */
2532 		vmdctl = IXGBE_MRQC_VMDQEN;
2533 		IXGBE_WRITE_REG(hw, IXGBE_MRQC, vmdctl);
2534 
2535 		for (i = 0; i < hw->mac.num_rar_entries; i++) {
2536 			IXGBE_WRITE_REG(hw, IXGBE_MPSAR_LO(i), 0);
2537 			IXGBE_WRITE_REG(hw, IXGBE_MPSAR_HI(i), 0);
2538 		}
2539 
2540 		/*
2541 		 * Enable Virtualization and Replication.
2542 		 */
2543 		vtctl = IXGBE_VT_CTL_VT_ENABLE | IXGBE_VT_CTL_REPLEN;
2544 		IXGBE_WRITE_REG(hw, IXGBE_VT_CTL, vtctl);
2545 
2546 		/*
2547 		 * Enable receiving packets to all VFs
2548 		 */
2549 		IXGBE_WRITE_REG(hw, IXGBE_VFRE(0), IXGBE_VFRE_ENABLE_ALL);
2550 		IXGBE_WRITE_REG(hw, IXGBE_VFRE(1), IXGBE_VFRE_ENABLE_ALL);
2551 		break;
2552 
2553 	default:
2554 		break;
2555 	}
2556 }
2557 
2558 /*
2559  * ixgbe_setup_vmdq_rss - Setup both vmdq feature and rss feature.
2560  */
2561 static void
2562 ixgbe_setup_vmdq_rss(ixgbe_t *ixgbe)
2563 {
2564 	struct ixgbe_hw *hw = &ixgbe->hw;
2565 	uint32_t i, mrqc, rxcsum;
2566 	uint32_t random;
2567 	uint32_t reta;
2568 	uint32_t ring_per_group;
2569 	uint32_t vmdctl, vtctl;
2570 
2571 	/*
2572 	 * Fill out redirection table
2573 	 */
2574 	reta = 0;
2575 	ring_per_group = ixgbe->num_rx_rings / ixgbe->num_rx_groups;
2576 	for (i = 0; i < 128; i++) {
2577 		reta = (reta << 8) | (i % ring_per_group) |
2578 		    ((i % ring_per_group) << 4);
2579 		if ((i & 3) == 3)
2580 			IXGBE_WRITE_REG(hw, IXGBE_RETA(i >> 2), reta);
2581 	}
2582 
2583 	/*
2584 	 * Fill out hash function seeds with a random constant
2585 	 */
2586 	for (i = 0; i < 10; i++) {
2587 		(void) random_get_pseudo_bytes((uint8_t *)&random,
2588 		    sizeof (uint32_t));
2589 		IXGBE_WRITE_REG(hw, IXGBE_RSSRK(i), random);
2590 	}
2591 
2592 	/*
2593 	 * Enable and setup RSS and VMDq
2594 	 */
2595 	switch (hw->mac.type) {
2596 	case ixgbe_mac_82598EB:
2597 		/*
2598 		 * Enable RSS & Setup RSS Hash functions
2599 		 */
2600 		mrqc = IXGBE_MRQC_RSSEN |
2601 		    IXGBE_MRQC_RSS_FIELD_IPV4 |
2602 		    IXGBE_MRQC_RSS_FIELD_IPV4_TCP |
2603 		    IXGBE_MRQC_RSS_FIELD_IPV4_UDP |
2604 		    IXGBE_MRQC_RSS_FIELD_IPV6_EX_TCP |
2605 		    IXGBE_MRQC_RSS_FIELD_IPV6_EX |
2606 		    IXGBE_MRQC_RSS_FIELD_IPV6 |
2607 		    IXGBE_MRQC_RSS_FIELD_IPV6_TCP |
2608 		    IXGBE_MRQC_RSS_FIELD_IPV6_UDP |
2609 		    IXGBE_MRQC_RSS_FIELD_IPV6_EX_UDP;
2610 		IXGBE_WRITE_REG(hw, IXGBE_MRQC, mrqc);
2611 
2612 		/*
2613 		 * Enable and Setup VMDq
2614 		 * VMDq Filter = 0; MAC filtering
2615 		 * Default VMDq output index = 0;
2616 		 */
2617 		vmdctl = IXGBE_VMD_CTL_VMDQ_EN;
2618 		IXGBE_WRITE_REG(hw, IXGBE_VMD_CTL, vmdctl);
2619 		break;
2620 
2621 	case ixgbe_mac_82599EB:
2622 		/*
2623 		 * Enable RSS & Setup RSS Hash functions
2624 		 */
2625 		mrqc = IXGBE_MRQC_RSS_FIELD_IPV4 |
2626 		    IXGBE_MRQC_RSS_FIELD_IPV4_TCP |
2627 		    IXGBE_MRQC_RSS_FIELD_IPV4_UDP |
2628 		    IXGBE_MRQC_RSS_FIELD_IPV6_EX_TCP |
2629 		    IXGBE_MRQC_RSS_FIELD_IPV6_EX |
2630 		    IXGBE_MRQC_RSS_FIELD_IPV6 |
2631 		    IXGBE_MRQC_RSS_FIELD_IPV6_TCP |
2632 		    IXGBE_MRQC_RSS_FIELD_IPV6_UDP |
2633 		    IXGBE_MRQC_RSS_FIELD_IPV6_EX_UDP;
2634 
2635 		/*
2636 		 * Enable VMDq+RSS.
2637 		 */
2638 		if (ixgbe->num_rx_groups > 32)  {
2639 			mrqc = mrqc | IXGBE_MRQC_VMDQRSS64EN;
2640 		} else {
2641 			mrqc = mrqc | IXGBE_MRQC_VMDQRSS32EN;
2642 		}
2643 
2644 		IXGBE_WRITE_REG(hw, IXGBE_MRQC, mrqc);
2645 
2646 		for (i = 0; i < hw->mac.num_rar_entries; i++) {
2647 			IXGBE_WRITE_REG(hw, IXGBE_MPSAR_LO(i), 0);
2648 			IXGBE_WRITE_REG(hw, IXGBE_MPSAR_HI(i), 0);
2649 		}
2650 		break;
2651 
2652 	default:
2653 		break;
2654 
2655 	}
2656 
2657 	/*
2658 	 * Disable Packet Checksum to enable RSS for multiple receive queues.
2659 	 * It is an adapter hardware limitation that Packet Checksum is
2660 	 * mutually exclusive with RSS.
2661 	 */
2662 	rxcsum = IXGBE_READ_REG(hw, IXGBE_RXCSUM);
2663 	rxcsum |= IXGBE_RXCSUM_PCSD;
2664 	rxcsum &= ~IXGBE_RXCSUM_IPPCSE;
2665 	IXGBE_WRITE_REG(hw, IXGBE_RXCSUM, rxcsum);
2666 
2667 	if (hw->mac.type == ixgbe_mac_82599EB) {
2668 		/*
2669 		 * Enable Virtualization and Replication.
2670 		 */
2671 		vtctl = IXGBE_VT_CTL_VT_ENABLE | IXGBE_VT_CTL_REPLEN;
2672 		IXGBE_WRITE_REG(hw, IXGBE_VT_CTL, vtctl);
2673 
2674 		/*
2675 		 * Enable receiving packets to all VFs
2676 		 */
2677 		IXGBE_WRITE_REG(hw, IXGBE_VFRE(0), IXGBE_VFRE_ENABLE_ALL);
2678 		IXGBE_WRITE_REG(hw, IXGBE_VFRE(1), IXGBE_VFRE_ENABLE_ALL);
2679 	}
2680 }
2681 
2682 /*
2683  * ixgbe_init_unicst - Initialize the unicast addresses.
2684  */
2685 static void
2686 ixgbe_init_unicst(ixgbe_t *ixgbe)
2687 {
2688 	struct ixgbe_hw *hw = &ixgbe->hw;
2689 	uint8_t *mac_addr;
2690 	int slot;
2691 	/*
2692 	 * Here we should consider two situations:
2693 	 *
2694 	 * 1. Chipset is initialized at the first time,
2695 	 *    Clear all the multiple unicast addresses.
2696 	 *
2697 	 * 2. Chipset is reset
2698 	 *    Recover the multiple unicast addresses from the
2699 	 *    software data structure to the RAR registers.
2700 	 */
2701 	if (!ixgbe->unicst_init) {
2702 		/*
2703 		 * Initialize the multiple unicast addresses
2704 		 */
2705 		ixgbe->unicst_total = hw->mac.num_rar_entries;
2706 		ixgbe->unicst_avail = ixgbe->unicst_total;
2707 		for (slot = 0; slot < ixgbe->unicst_total; slot++) {
2708 			mac_addr = ixgbe->unicst_addr[slot].mac.addr;
2709 			bzero(mac_addr, ETHERADDRL);
2710 			(void) ixgbe_set_rar(hw, slot, mac_addr, NULL, NULL);
2711 			ixgbe->unicst_addr[slot].mac.set = 0;
2712 		}
2713 		ixgbe->unicst_init = B_TRUE;
2714 	} else {
2715 		/* Re-configure the RAR registers */
2716 		for (slot = 0; slot < ixgbe->unicst_total; slot++) {
2717 			mac_addr = ixgbe->unicst_addr[slot].mac.addr;
2718 			if (ixgbe->unicst_addr[slot].mac.set == 1) {
2719 				(void) ixgbe_set_rar(hw, slot, mac_addr,
2720 				    ixgbe->unicst_addr[slot].mac.group_index,
2721 				    IXGBE_RAH_AV);
2722 			} else {
2723 				bzero(mac_addr, ETHERADDRL);
2724 				(void) ixgbe_set_rar(hw, slot, mac_addr,
2725 				    NULL, NULL);
2726 			}
2727 		}
2728 	}
2729 }
2730 
2731 /*
2732  * ixgbe_unicst_find - Find the slot for the specified unicast address
2733  */
2734 int
2735 ixgbe_unicst_find(ixgbe_t *ixgbe, const uint8_t *mac_addr)
2736 {
2737 	int slot;
2738 
2739 	ASSERT(mutex_owned(&ixgbe->gen_lock));
2740 
2741 	for (slot = 0; slot < ixgbe->unicst_total; slot++) {
2742 		if (bcmp(ixgbe->unicst_addr[slot].mac.addr,
2743 		    mac_addr, ETHERADDRL) == 0)
2744 			return (slot);
2745 	}
2746 
2747 	return (-1);
2748 }
2749 
2750 /*
2751  * ixgbe_multicst_add - Add a multicst address.
2752  */
2753 int
2754 ixgbe_multicst_add(ixgbe_t *ixgbe, const uint8_t *multiaddr)
2755 {
2756 	ASSERT(mutex_owned(&ixgbe->gen_lock));
2757 
2758 	if ((multiaddr[0] & 01) == 0) {
2759 		return (EINVAL);
2760 	}
2761 
2762 	if (ixgbe->mcast_count >= MAX_NUM_MULTICAST_ADDRESSES) {
2763 		return (ENOENT);
2764 	}
2765 
2766 	bcopy(multiaddr,
2767 	    &ixgbe->mcast_table[ixgbe->mcast_count], ETHERADDRL);
2768 	ixgbe->mcast_count++;
2769 
2770 	/*
2771 	 * Update the multicast table in the hardware
2772 	 */
2773 	ixgbe_setup_multicst(ixgbe);
2774 
2775 	if (ixgbe_check_acc_handle(ixgbe->osdep.reg_handle) != DDI_FM_OK) {
2776 		ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_DEGRADED);
2777 		return (EIO);
2778 	}
2779 
2780 	return (0);
2781 }
2782 
2783 /*
2784  * ixgbe_multicst_remove - Remove a multicst address.
2785  */
2786 int
2787 ixgbe_multicst_remove(ixgbe_t *ixgbe, const uint8_t *multiaddr)
2788 {
2789 	int i;
2790 
2791 	ASSERT(mutex_owned(&ixgbe->gen_lock));
2792 
2793 	for (i = 0; i < ixgbe->mcast_count; i++) {
2794 		if (bcmp(multiaddr, &ixgbe->mcast_table[i],
2795 		    ETHERADDRL) == 0) {
2796 			for (i++; i < ixgbe->mcast_count; i++) {
2797 				ixgbe->mcast_table[i - 1] =
2798 				    ixgbe->mcast_table[i];
2799 			}
2800 			ixgbe->mcast_count--;
2801 			break;
2802 		}
2803 	}
2804 
2805 	/*
2806 	 * Update the multicast table in the hardware
2807 	 */
2808 	ixgbe_setup_multicst(ixgbe);
2809 
2810 	if (ixgbe_check_acc_handle(ixgbe->osdep.reg_handle) != DDI_FM_OK) {
2811 		ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_DEGRADED);
2812 		return (EIO);
2813 	}
2814 
2815 	return (0);
2816 }
2817 
2818 /*
2819  * ixgbe_setup_multicast - Setup multicast data structures.
2820  *
2821  * This routine initializes all of the multicast related structures
2822  * and save them in the hardware registers.
2823  */
2824 static void
2825 ixgbe_setup_multicst(ixgbe_t *ixgbe)
2826 {
2827 	uint8_t *mc_addr_list;
2828 	uint32_t mc_addr_count;
2829 	struct ixgbe_hw *hw = &ixgbe->hw;
2830 
2831 	ASSERT(mutex_owned(&ixgbe->gen_lock));
2832 
2833 	ASSERT(ixgbe->mcast_count <= MAX_NUM_MULTICAST_ADDRESSES);
2834 
2835 	mc_addr_list = (uint8_t *)ixgbe->mcast_table;
2836 	mc_addr_count = ixgbe->mcast_count;
2837 
2838 	/*
2839 	 * Update the multicast addresses to the MTA registers
2840 	 */
2841 	(void) ixgbe_update_mc_addr_list(hw, mc_addr_list, mc_addr_count,
2842 	    ixgbe_mc_table_itr);
2843 }
2844 
2845 /*
2846  * ixgbe_setup_vmdq_rss_conf - Configure vmdq and rss (number and mode).
2847  *
2848  * Configure the rx classification mode (vmdq & rss) and vmdq & rss numbers.
2849  * Different chipsets may have different allowed configuration of vmdq and rss.
2850  */
2851 static void
2852 ixgbe_setup_vmdq_rss_conf(ixgbe_t *ixgbe)
2853 {
2854 	struct ixgbe_hw *hw = &ixgbe->hw;
2855 	uint32_t ring_per_group;
2856 
2857 	switch (hw->mac.type) {
2858 	case ixgbe_mac_82598EB:
2859 		/*
2860 		 * 82598 supports the following combination:
2861 		 * vmdq no. x rss no.
2862 		 * [5..16]  x 1
2863 		 * [1..4]   x [1..16]
2864 		 * However 8 rss queue per pool (vmdq) is sufficient for
2865 		 * most cases.
2866 		 */
2867 		ring_per_group = ixgbe->num_rx_rings / ixgbe->num_rx_groups;
2868 		if (ixgbe->num_rx_groups > 4) {
2869 			ixgbe->num_rx_rings = ixgbe->num_rx_groups;
2870 		} else {
2871 			ixgbe->num_rx_rings = ixgbe->num_rx_groups *
2872 			    min(8, ring_per_group);
2873 		}
2874 
2875 		break;
2876 
2877 	case ixgbe_mac_82599EB:
2878 		/*
2879 		 * 82599 supports the following combination:
2880 		 * vmdq no. x rss no.
2881 		 * [33..64] x [1..2]
2882 		 * [2..32]  x [1..4]
2883 		 * 1 x [1..16]
2884 		 * However 8 rss queue per pool (vmdq) is sufficient for
2885 		 * most cases.
2886 		 */
2887 		ring_per_group = ixgbe->num_rx_rings / ixgbe->num_rx_groups;
2888 		if (ixgbe->num_rx_groups == 1) {
2889 			ixgbe->num_rx_rings = min(8, ring_per_group);
2890 		} else if (ixgbe->num_rx_groups <= 32) {
2891 			ixgbe->num_rx_rings = ixgbe->num_rx_groups *
2892 			    min(4, ring_per_group);
2893 		} else if (ixgbe->num_rx_groups <= 64) {
2894 			ixgbe->num_rx_rings = ixgbe->num_rx_groups *
2895 			    min(2, ring_per_group);
2896 		}
2897 		break;
2898 
2899 	default:
2900 		break;
2901 	}
2902 
2903 	ring_per_group = ixgbe->num_rx_rings / ixgbe->num_rx_groups;
2904 
2905 	if (ixgbe->num_rx_groups == 1 && ring_per_group == 1) {
2906 		ixgbe->classify_mode = IXGBE_CLASSIFY_NONE;
2907 	} else if (ixgbe->num_rx_groups != 1 && ring_per_group == 1) {
2908 		ixgbe->classify_mode = IXGBE_CLASSIFY_VMDQ;
2909 	} else if (ixgbe->num_rx_groups != 1 && ring_per_group != 1) {
2910 		ixgbe->classify_mode = IXGBE_CLASSIFY_VMDQ_RSS;
2911 	} else {
2912 		ixgbe->classify_mode = IXGBE_CLASSIFY_RSS;
2913 	}
2914 
2915 	IXGBE_DEBUGLOG_2(ixgbe, "rx group number:%d, rx ring number:%d",
2916 	    ixgbe->num_rx_groups, ixgbe->num_rx_rings);
2917 }
2918 
2919 /*
2920  * ixgbe_get_conf - Get driver configurations set in driver.conf.
2921  *
2922  * This routine gets user-configured values out of the configuration
2923  * file ixgbe.conf.
2924  *
2925  * For each configurable value, there is a minimum, a maximum, and a
2926  * default.
2927  * If user does not configure a value, use the default.
2928  * If user configures below the minimum, use the minumum.
2929  * If user configures above the maximum, use the maxumum.
2930  */
2931 static void
2932 ixgbe_get_conf(ixgbe_t *ixgbe)
2933 {
2934 	struct ixgbe_hw *hw = &ixgbe->hw;
2935 	uint32_t flow_control;
2936 
2937 	/*
2938 	 * ixgbe driver supports the following user configurations:
2939 	 *
2940 	 * Jumbo frame configuration:
2941 	 *    default_mtu
2942 	 *
2943 	 * Ethernet flow control configuration:
2944 	 *    flow_control
2945 	 *
2946 	 * Multiple rings configurations:
2947 	 *    tx_queue_number
2948 	 *    tx_ring_size
2949 	 *    rx_queue_number
2950 	 *    rx_ring_size
2951 	 *
2952 	 * Call ixgbe_get_prop() to get the value for a specific
2953 	 * configuration parameter.
2954 	 */
2955 
2956 	/*
2957 	 * Jumbo frame configuration - max_frame_size controls host buffer
2958 	 * allocation, so includes MTU, ethernet header, vlan tag and
2959 	 * frame check sequence.
2960 	 */
2961 	ixgbe->default_mtu = ixgbe_get_prop(ixgbe, PROP_DEFAULT_MTU,
2962 	    MIN_MTU, ixgbe->capab->max_mtu, DEFAULT_MTU);
2963 
2964 	ixgbe->max_frame_size = ixgbe->default_mtu +
2965 	    sizeof (struct ether_vlan_header) + ETHERFCSL;
2966 
2967 	/*
2968 	 * Ethernet flow control configuration
2969 	 */
2970 	flow_control = ixgbe_get_prop(ixgbe, PROP_FLOW_CONTROL,
2971 	    ixgbe_fc_none, 3, ixgbe_fc_none);
2972 	if (flow_control == 3)
2973 		flow_control = ixgbe_fc_default;
2974 
2975 	/*
2976 	 * fc.requested mode is what the user requests.  After autoneg,
2977 	 * fc.current_mode will be the flow_control mode that was negotiated.
2978 	 */
2979 	hw->fc.requested_mode = flow_control;
2980 
2981 	/*
2982 	 * Multiple rings configurations
2983 	 */
2984 	ixgbe->num_tx_rings = ixgbe_get_prop(ixgbe, PROP_TX_QUEUE_NUM,
2985 	    ixgbe->capab->min_tx_que_num,
2986 	    ixgbe->capab->max_tx_que_num,
2987 	    ixgbe->capab->def_tx_que_num);
2988 	ixgbe->tx_ring_size = ixgbe_get_prop(ixgbe, PROP_TX_RING_SIZE,
2989 	    MIN_TX_RING_SIZE, MAX_TX_RING_SIZE, DEFAULT_TX_RING_SIZE);
2990 
2991 	ixgbe->num_rx_rings = ixgbe_get_prop(ixgbe, PROP_RX_QUEUE_NUM,
2992 	    ixgbe->capab->min_rx_que_num,
2993 	    ixgbe->capab->max_rx_que_num,
2994 	    ixgbe->capab->def_rx_que_num);
2995 	ixgbe->rx_ring_size = ixgbe_get_prop(ixgbe, PROP_RX_RING_SIZE,
2996 	    MIN_RX_RING_SIZE, MAX_RX_RING_SIZE, DEFAULT_RX_RING_SIZE);
2997 
2998 	/*
2999 	 * Multiple groups configuration
3000 	 */
3001 	ixgbe->num_rx_groups = ixgbe_get_prop(ixgbe, PROP_RX_GROUP_NUM,
3002 	    ixgbe->capab->min_rx_grp_num, ixgbe->capab->max_rx_grp_num,
3003 	    ixgbe->capab->def_rx_grp_num);
3004 
3005 	ixgbe->mr_enable = ixgbe_get_prop(ixgbe, PROP_MR_ENABLE,
3006 	    0, 1, DEFAULT_MR_ENABLE);
3007 
3008 	if (ixgbe->mr_enable == B_FALSE) {
3009 		ixgbe->num_tx_rings = 1;
3010 		ixgbe->num_rx_rings = 1;
3011 		ixgbe->num_rx_groups = 1;
3012 		ixgbe->classify_mode = IXGBE_CLASSIFY_NONE;
3013 	} else {
3014 		ixgbe->num_rx_rings = ixgbe->num_rx_groups *
3015 		    max(ixgbe->num_rx_rings / ixgbe->num_rx_groups, 1);
3016 		/*
3017 		 * The combination of num_rx_rings and num_rx_groups
3018 		 * may be not supported by h/w. We need to adjust
3019 		 * them to appropriate values.
3020 		 */
3021 		ixgbe_setup_vmdq_rss_conf(ixgbe);
3022 	}
3023 
3024 	/*
3025 	 * Tunable used to force an interrupt type. The only use is
3026 	 * for testing of the lesser interrupt types.
3027 	 * 0 = don't force interrupt type
3028 	 * 1 = force interrupt type MSI-X
3029 	 * 2 = force interrupt type MSI
3030 	 * 3 = force interrupt type Legacy
3031 	 */
3032 	ixgbe->intr_force = ixgbe_get_prop(ixgbe, PROP_INTR_FORCE,
3033 	    IXGBE_INTR_NONE, IXGBE_INTR_LEGACY, IXGBE_INTR_NONE);
3034 
3035 	ixgbe->tx_hcksum_enable = ixgbe_get_prop(ixgbe, PROP_TX_HCKSUM_ENABLE,
3036 	    0, 1, DEFAULT_TX_HCKSUM_ENABLE);
3037 	ixgbe->rx_hcksum_enable = ixgbe_get_prop(ixgbe, PROP_RX_HCKSUM_ENABLE,
3038 	    0, 1, DEFAULT_RX_HCKSUM_ENABLE);
3039 	ixgbe->lso_enable = ixgbe_get_prop(ixgbe, PROP_LSO_ENABLE,
3040 	    0, 1, DEFAULT_LSO_ENABLE);
3041 	ixgbe->lro_enable = ixgbe_get_prop(ixgbe, PROP_LRO_ENABLE,
3042 	    0, 1, DEFAULT_LRO_ENABLE);
3043 	ixgbe->tx_head_wb_enable = ixgbe_get_prop(ixgbe, PROP_TX_HEAD_WB_ENABLE,
3044 	    0, 1, DEFAULT_TX_HEAD_WB_ENABLE);
3045 	ixgbe->relax_order_enable = ixgbe_get_prop(ixgbe,
3046 	    PROP_RELAX_ORDER_ENABLE, 0, 1, DEFAULT_RELAX_ORDER_ENABLE);
3047 
3048 	/* Head Write Back not recommended for 82599 */
3049 	if (hw->mac.type >= ixgbe_mac_82599EB) {
3050 		ixgbe->tx_head_wb_enable = B_FALSE;
3051 	}
3052 
3053 	/*
3054 	 * ixgbe LSO needs the tx h/w checksum support.
3055 	 * LSO will be disabled if tx h/w checksum is not
3056 	 * enabled.
3057 	 */
3058 	if (ixgbe->tx_hcksum_enable == B_FALSE) {
3059 		ixgbe->lso_enable = B_FALSE;
3060 	}
3061 
3062 	/*
3063 	 * ixgbe LRO needs the rx h/w checksum support.
3064 	 * LRO will be disabled if rx h/w checksum is not
3065 	 * enabled.
3066 	 */
3067 	if (ixgbe->rx_hcksum_enable == B_FALSE) {
3068 		ixgbe->lro_enable = B_FALSE;
3069 	}
3070 
3071 	/*
3072 	 * ixgbe LRO only been supported by 82599 now
3073 	 */
3074 	if (hw->mac.type != ixgbe_mac_82599EB) {
3075 		ixgbe->lro_enable = B_FALSE;
3076 	}
3077 	ixgbe->tx_copy_thresh = ixgbe_get_prop(ixgbe, PROP_TX_COPY_THRESHOLD,
3078 	    MIN_TX_COPY_THRESHOLD, MAX_TX_COPY_THRESHOLD,
3079 	    DEFAULT_TX_COPY_THRESHOLD);
3080 	ixgbe->tx_recycle_thresh = ixgbe_get_prop(ixgbe,
3081 	    PROP_TX_RECYCLE_THRESHOLD, MIN_TX_RECYCLE_THRESHOLD,
3082 	    MAX_TX_RECYCLE_THRESHOLD, DEFAULT_TX_RECYCLE_THRESHOLD);
3083 	ixgbe->tx_overload_thresh = ixgbe_get_prop(ixgbe,
3084 	    PROP_TX_OVERLOAD_THRESHOLD, MIN_TX_OVERLOAD_THRESHOLD,
3085 	    MAX_TX_OVERLOAD_THRESHOLD, DEFAULT_TX_OVERLOAD_THRESHOLD);
3086 	ixgbe->tx_resched_thresh = ixgbe_get_prop(ixgbe,
3087 	    PROP_TX_RESCHED_THRESHOLD, MIN_TX_RESCHED_THRESHOLD,
3088 	    MAX_TX_RESCHED_THRESHOLD, DEFAULT_TX_RESCHED_THRESHOLD);
3089 
3090 	ixgbe->rx_copy_thresh = ixgbe_get_prop(ixgbe, PROP_RX_COPY_THRESHOLD,
3091 	    MIN_RX_COPY_THRESHOLD, MAX_RX_COPY_THRESHOLD,
3092 	    DEFAULT_RX_COPY_THRESHOLD);
3093 	ixgbe->rx_limit_per_intr = ixgbe_get_prop(ixgbe, PROP_RX_LIMIT_PER_INTR,
3094 	    MIN_RX_LIMIT_PER_INTR, MAX_RX_LIMIT_PER_INTR,
3095 	    DEFAULT_RX_LIMIT_PER_INTR);
3096 
3097 	ixgbe->intr_throttling[0] = ixgbe_get_prop(ixgbe, PROP_INTR_THROTTLING,
3098 	    ixgbe->capab->min_intr_throttle,
3099 	    ixgbe->capab->max_intr_throttle,
3100 	    ixgbe->capab->def_intr_throttle);
3101 	/*
3102 	 * 82599 requires the interupt throttling rate is
3103 	 * a multiple of 8. This is enforced by the register
3104 	 * definiton.
3105 	 */
3106 	if (hw->mac.type == ixgbe_mac_82599EB)
3107 		ixgbe->intr_throttling[0] = ixgbe->intr_throttling[0] & 0xFF8;
3108 }
3109 
3110 static void
3111 ixgbe_init_params(ixgbe_t *ixgbe)
3112 {
3113 	ixgbe->param_en_10000fdx_cap = 1;
3114 	ixgbe->param_en_1000fdx_cap = 1;
3115 	ixgbe->param_en_100fdx_cap = 1;
3116 	ixgbe->param_adv_10000fdx_cap = 1;
3117 	ixgbe->param_adv_1000fdx_cap = 1;
3118 	ixgbe->param_adv_100fdx_cap = 1;
3119 
3120 	ixgbe->param_pause_cap = 1;
3121 	ixgbe->param_asym_pause_cap = 1;
3122 	ixgbe->param_rem_fault = 0;
3123 
3124 	ixgbe->param_adv_autoneg_cap = 1;
3125 	ixgbe->param_adv_pause_cap = 1;
3126 	ixgbe->param_adv_asym_pause_cap = 1;
3127 	ixgbe->param_adv_rem_fault = 0;
3128 
3129 	ixgbe->param_lp_10000fdx_cap = 0;
3130 	ixgbe->param_lp_1000fdx_cap = 0;
3131 	ixgbe->param_lp_100fdx_cap = 0;
3132 	ixgbe->param_lp_autoneg_cap = 0;
3133 	ixgbe->param_lp_pause_cap = 0;
3134 	ixgbe->param_lp_asym_pause_cap = 0;
3135 	ixgbe->param_lp_rem_fault = 0;
3136 }
3137 
3138 /*
3139  * ixgbe_get_prop - Get a property value out of the configuration file
3140  * ixgbe.conf.
3141  *
3142  * Caller provides the name of the property, a default value, a minimum
3143  * value, and a maximum value.
3144  *
3145  * Return configured value of the property, with default, minimum and
3146  * maximum properly applied.
3147  */
3148 static int
3149 ixgbe_get_prop(ixgbe_t *ixgbe,
3150     char *propname,	/* name of the property */
3151     int minval,		/* minimum acceptable value */
3152     int maxval,		/* maximim acceptable value */
3153     int defval)		/* default value */
3154 {
3155 	int value;
3156 
3157 	/*
3158 	 * Call ddi_prop_get_int() to read the conf settings
3159 	 */
3160 	value = ddi_prop_get_int(DDI_DEV_T_ANY, ixgbe->dip,
3161 	    DDI_PROP_DONTPASS, propname, defval);
3162 	if (value > maxval)
3163 		value = maxval;
3164 
3165 	if (value < minval)
3166 		value = minval;
3167 
3168 	return (value);
3169 }
3170 
3171 /*
3172  * ixgbe_driver_setup_link - Using the link properties to setup the link.
3173  */
3174 int
3175 ixgbe_driver_setup_link(ixgbe_t *ixgbe, boolean_t setup_hw)
3176 {
3177 	u32 autoneg_advertised = 0;
3178 
3179 	/*
3180 	 * No half duplex support with 10Gb parts
3181 	 */
3182 	if (ixgbe->param_adv_10000fdx_cap == 1)
3183 		autoneg_advertised |= IXGBE_LINK_SPEED_10GB_FULL;
3184 
3185 	if (ixgbe->param_adv_1000fdx_cap == 1)
3186 		autoneg_advertised |= IXGBE_LINK_SPEED_1GB_FULL;
3187 
3188 	if (ixgbe->param_adv_100fdx_cap == 1)
3189 		autoneg_advertised |= IXGBE_LINK_SPEED_100_FULL;
3190 
3191 	if (ixgbe->param_adv_autoneg_cap == 1 && autoneg_advertised == 0) {
3192 		ixgbe_notice(ixgbe, "Invalid link settings. Setup link "
3193 		    "to autonegotiation with full link capabilities.");
3194 
3195 		autoneg_advertised = IXGBE_LINK_SPEED_10GB_FULL |
3196 		    IXGBE_LINK_SPEED_1GB_FULL |
3197 		    IXGBE_LINK_SPEED_100_FULL;
3198 	}
3199 
3200 	if (setup_hw) {
3201 		if (ixgbe_setup_link(&ixgbe->hw, autoneg_advertised,
3202 		    ixgbe->param_adv_autoneg_cap, B_TRUE) != IXGBE_SUCCESS) {
3203 			ixgbe_notice(ixgbe, "Setup link failed on this "
3204 			    "device.");
3205 			return (IXGBE_FAILURE);
3206 		}
3207 	}
3208 
3209 	return (IXGBE_SUCCESS);
3210 }
3211 
3212 /*
3213  * ixgbe_driver_link_check - Link status processing.
3214  *
3215  * This function can be called in both kernel context and interrupt context
3216  */
3217 static void
3218 ixgbe_driver_link_check(ixgbe_t *ixgbe)
3219 {
3220 	struct ixgbe_hw *hw = &ixgbe->hw;
3221 	ixgbe_link_speed speed = IXGBE_LINK_SPEED_UNKNOWN;
3222 	boolean_t link_up = B_FALSE;
3223 	boolean_t link_changed = B_FALSE;
3224 
3225 	ASSERT(mutex_owned(&ixgbe->gen_lock));
3226 
3227 	(void) ixgbe_check_link(hw, &speed, &link_up, false);
3228 	if (link_up) {
3229 		ixgbe->link_check_complete = B_TRUE;
3230 
3231 		/* Link is up, enable flow control settings */
3232 		(void) ixgbe_fc_enable(hw, 0);
3233 
3234 		/*
3235 		 * The Link is up, check whether it was marked as down earlier
3236 		 */
3237 		if (ixgbe->link_state != LINK_STATE_UP) {
3238 			switch (speed) {
3239 			case IXGBE_LINK_SPEED_10GB_FULL:
3240 				ixgbe->link_speed = SPEED_10GB;
3241 				break;
3242 			case IXGBE_LINK_SPEED_1GB_FULL:
3243 				ixgbe->link_speed = SPEED_1GB;
3244 				break;
3245 			case IXGBE_LINK_SPEED_100_FULL:
3246 				ixgbe->link_speed = SPEED_100;
3247 			}
3248 			ixgbe->link_duplex = LINK_DUPLEX_FULL;
3249 			ixgbe->link_state = LINK_STATE_UP;
3250 			link_changed = B_TRUE;
3251 		}
3252 	} else {
3253 		if (ixgbe->link_check_complete == B_TRUE ||
3254 		    (ixgbe->link_check_complete == B_FALSE &&
3255 		    gethrtime() >= ixgbe->link_check_hrtime)) {
3256 			/*
3257 			 * The link is really down
3258 			 */
3259 			ixgbe->link_check_complete = B_TRUE;
3260 
3261 			if (ixgbe->link_state != LINK_STATE_DOWN) {
3262 				ixgbe->link_speed = 0;
3263 				ixgbe->link_duplex = LINK_DUPLEX_UNKNOWN;
3264 				ixgbe->link_state = LINK_STATE_DOWN;
3265 				link_changed = B_TRUE;
3266 			}
3267 		}
3268 	}
3269 
3270 	/*
3271 	 * If we are in an interrupt context, need to re-enable the
3272 	 * interrupt, which was automasked
3273 	 */
3274 	if (servicing_interrupt() != 0) {
3275 		ixgbe->eims |= IXGBE_EICR_LSC;
3276 		IXGBE_WRITE_REG(hw, IXGBE_EIMS, ixgbe->eims);
3277 	}
3278 
3279 	if (link_changed) {
3280 		mac_link_update(ixgbe->mac_hdl, ixgbe->link_state);
3281 	}
3282 }
3283 
3284 /*
3285  * ixgbe_sfp_check - sfp module processing done in taskq only for 82599.
3286  */
3287 static void
3288 ixgbe_sfp_check(void *arg)
3289 {
3290 	ixgbe_t *ixgbe = (ixgbe_t *)arg;
3291 	uint32_t eicr = ixgbe->eicr;
3292 	struct ixgbe_hw *hw = &ixgbe->hw;
3293 
3294 	mutex_enter(&ixgbe->gen_lock);
3295 	if (eicr & IXGBE_EICR_GPI_SDP1) {
3296 		/* clear the interrupt */
3297 		IXGBE_WRITE_REG(hw, IXGBE_EICR, IXGBE_EICR_GPI_SDP1);
3298 
3299 		/* if link up, do multispeed fiber setup */
3300 		(void) ixgbe_setup_link(hw, IXGBE_LINK_SPEED_82599_AUTONEG,
3301 		    B_TRUE, B_TRUE);
3302 		ixgbe_driver_link_check(ixgbe);
3303 		ixgbe_get_hw_state(ixgbe);
3304 	} else if (eicr & IXGBE_EICR_GPI_SDP2) {
3305 		/* clear the interrupt */
3306 		IXGBE_WRITE_REG(hw, IXGBE_EICR, IXGBE_EICR_GPI_SDP2);
3307 
3308 		/* if link up, do sfp module setup */
3309 		(void) hw->mac.ops.setup_sfp(hw);
3310 
3311 		/* do multispeed fiber setup */
3312 		(void) ixgbe_setup_link(hw, IXGBE_LINK_SPEED_82599_AUTONEG,
3313 		    B_TRUE, B_TRUE);
3314 		ixgbe_driver_link_check(ixgbe);
3315 		ixgbe_get_hw_state(ixgbe);
3316 	}
3317 	mutex_exit(&ixgbe->gen_lock);
3318 
3319 	/*
3320 	 * We need to fully re-check the link later.
3321 	 */
3322 	ixgbe->link_check_complete = B_FALSE;
3323 	ixgbe->link_check_hrtime = gethrtime() +
3324 	    (IXGBE_LINK_UP_TIME * 100000000ULL);
3325 }
3326 
3327 /*
3328  * ixgbe_overtemp_check - overtemp module processing done in taskq
3329  *
3330  * This routine will only be called on adapters with temperature sensor.
3331  * The indication of over-temperature can be either SDP0 interrupt or the link
3332  * status change interrupt.
3333  */
3334 static void
3335 ixgbe_overtemp_check(void *arg)
3336 {
3337 	ixgbe_t *ixgbe = (ixgbe_t *)arg;
3338 	struct ixgbe_hw *hw = &ixgbe->hw;
3339 	uint32_t eicr = ixgbe->eicr;
3340 	ixgbe_link_speed speed;
3341 	boolean_t link_up;
3342 
3343 	mutex_enter(&ixgbe->gen_lock);
3344 
3345 	/* make sure we know current state of link */
3346 	(void) ixgbe_check_link(hw, &speed, &link_up, false);
3347 
3348 	/* check over-temp condition */
3349 	if (((eicr & IXGBE_EICR_GPI_SDP0) && (!link_up)) ||
3350 	    (eicr & IXGBE_EICR_LSC)) {
3351 		if (hw->phy.ops.check_overtemp(hw) == IXGBE_ERR_OVERTEMP) {
3352 			atomic_or_32(&ixgbe->ixgbe_state, IXGBE_OVERTEMP);
3353 
3354 			/*
3355 			 * Disable the adapter interrupts
3356 			 */
3357 			ixgbe_disable_adapter_interrupts(ixgbe);
3358 
3359 			/*
3360 			 * Disable Rx/Tx units
3361 			 */
3362 			(void) ixgbe_stop_adapter(hw);
3363 
3364 			ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_LOST);
3365 			ixgbe_error(ixgbe,
3366 			    "Problem: Network adapter has been stopped "
3367 			    "because it has overheated");
3368 			ixgbe_error(ixgbe,
3369 			    "Action: Restart the computer. "
3370 			    "If the problem persists, power off the system "
3371 			    "and replace the adapter");
3372 		}
3373 	}
3374 
3375 	/* write to clear the interrupt */
3376 	IXGBE_WRITE_REG(hw, IXGBE_EICR, eicr);
3377 
3378 	mutex_exit(&ixgbe->gen_lock);
3379 }
3380 
3381 /*
3382  * ixgbe_link_timer - timer for link status detection
3383  */
3384 static void
3385 ixgbe_link_timer(void *arg)
3386 {
3387 	ixgbe_t *ixgbe = (ixgbe_t *)arg;
3388 
3389 	mutex_enter(&ixgbe->gen_lock);
3390 	ixgbe_driver_link_check(ixgbe);
3391 	mutex_exit(&ixgbe->gen_lock);
3392 }
3393 
3394 /*
3395  * ixgbe_local_timer - Driver watchdog function.
3396  *
3397  * This function will handle the transmit stall check and other routines.
3398  */
3399 static void
3400 ixgbe_local_timer(void *arg)
3401 {
3402 	ixgbe_t *ixgbe = (ixgbe_t *)arg;
3403 
3404 	if (ixgbe->ixgbe_state & IXGBE_OVERTEMP)
3405 		goto out;
3406 
3407 	if (ixgbe->ixgbe_state & IXGBE_ERROR) {
3408 		ixgbe->reset_count++;
3409 		if (ixgbe_reset(ixgbe) == IXGBE_SUCCESS)
3410 			ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_RESTORED);
3411 		goto out;
3412 	}
3413 
3414 	if (ixgbe_stall_check(ixgbe)) {
3415 		atomic_or_32(&ixgbe->ixgbe_state, IXGBE_STALL);
3416 		ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_DEGRADED);
3417 
3418 		ixgbe->reset_count++;
3419 		if (ixgbe_reset(ixgbe) == IXGBE_SUCCESS)
3420 			ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_RESTORED);
3421 	}
3422 
3423 out:
3424 	ixgbe_restart_watchdog_timer(ixgbe);
3425 }
3426 
3427 /*
3428  * ixgbe_stall_check - Check for transmit stall.
3429  *
3430  * This function checks if the adapter is stalled (in transmit).
3431  *
3432  * It is called each time the watchdog timeout is invoked.
3433  * If the transmit descriptor reclaim continuously fails,
3434  * the watchdog value will increment by 1. If the watchdog
3435  * value exceeds the threshold, the ixgbe is assumed to
3436  * have stalled and need to be reset.
3437  */
3438 static boolean_t
3439 ixgbe_stall_check(ixgbe_t *ixgbe)
3440 {
3441 	ixgbe_tx_ring_t *tx_ring;
3442 	boolean_t result;
3443 	int i;
3444 
3445 	if (ixgbe->link_state != LINK_STATE_UP)
3446 		return (B_FALSE);
3447 
3448 	/*
3449 	 * If any tx ring is stalled, we'll reset the chipset
3450 	 */
3451 	result = B_FALSE;
3452 	for (i = 0; i < ixgbe->num_tx_rings; i++) {
3453 		tx_ring = &ixgbe->tx_rings[i];
3454 		if (tx_ring->tbd_free <= ixgbe->tx_recycle_thresh) {
3455 			tx_ring->tx_recycle(tx_ring);
3456 		}
3457 
3458 		if (tx_ring->recycle_fail > 0)
3459 			tx_ring->stall_watchdog++;
3460 		else
3461 			tx_ring->stall_watchdog = 0;
3462 
3463 		if (tx_ring->stall_watchdog >= STALL_WATCHDOG_TIMEOUT) {
3464 			result = B_TRUE;
3465 			break;
3466 		}
3467 	}
3468 
3469 	if (result) {
3470 		tx_ring->stall_watchdog = 0;
3471 		tx_ring->recycle_fail = 0;
3472 	}
3473 
3474 	return (result);
3475 }
3476 
3477 
3478 /*
3479  * is_valid_mac_addr - Check if the mac address is valid.
3480  */
3481 static boolean_t
3482 is_valid_mac_addr(uint8_t *mac_addr)
3483 {
3484 	const uint8_t addr_test1[6] = { 0, 0, 0, 0, 0, 0 };
3485 	const uint8_t addr_test2[6] =
3486 	    { 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF };
3487 
3488 	if (!(bcmp(addr_test1, mac_addr, ETHERADDRL)) ||
3489 	    !(bcmp(addr_test2, mac_addr, ETHERADDRL)))
3490 		return (B_FALSE);
3491 
3492 	return (B_TRUE);
3493 }
3494 
3495 static boolean_t
3496 ixgbe_find_mac_address(ixgbe_t *ixgbe)
3497 {
3498 #ifdef __sparc
3499 	struct ixgbe_hw *hw = &ixgbe->hw;
3500 	uchar_t *bytes;
3501 	struct ether_addr sysaddr;
3502 	uint_t nelts;
3503 	int err;
3504 	boolean_t found = B_FALSE;
3505 
3506 	/*
3507 	 * The "vendor's factory-set address" may already have
3508 	 * been extracted from the chip, but if the property
3509 	 * "local-mac-address" is set we use that instead.
3510 	 *
3511 	 * We check whether it looks like an array of 6
3512 	 * bytes (which it should, if OBP set it).  If we can't
3513 	 * make sense of it this way, we'll ignore it.
3514 	 */
3515 	err = ddi_prop_lookup_byte_array(DDI_DEV_T_ANY, ixgbe->dip,
3516 	    DDI_PROP_DONTPASS, "local-mac-address", &bytes, &nelts);
3517 	if (err == DDI_PROP_SUCCESS) {
3518 		if (nelts == ETHERADDRL) {
3519 			while (nelts--)
3520 				hw->mac.addr[nelts] = bytes[nelts];
3521 			found = B_TRUE;
3522 		}
3523 		ddi_prop_free(bytes);
3524 	}
3525 
3526 	/*
3527 	 * Look up the OBP property "local-mac-address?". If the user has set
3528 	 * 'local-mac-address? = false', use "the system address" instead.
3529 	 */
3530 	if (ddi_prop_lookup_byte_array(DDI_DEV_T_ANY, ixgbe->dip, 0,
3531 	    "local-mac-address?", &bytes, &nelts) == DDI_PROP_SUCCESS) {
3532 		if (strncmp("false", (caddr_t)bytes, (size_t)nelts) == 0) {
3533 			if (localetheraddr(NULL, &sysaddr) != 0) {
3534 				bcopy(&sysaddr, hw->mac.addr, ETHERADDRL);
3535 				found = B_TRUE;
3536 			}
3537 		}
3538 		ddi_prop_free(bytes);
3539 	}
3540 
3541 	/*
3542 	 * Finally(!), if there's a valid "mac-address" property (created
3543 	 * if we netbooted from this interface), we must use this instead
3544 	 * of any of the above to ensure that the NFS/install server doesn't
3545 	 * get confused by the address changing as Solaris takes over!
3546 	 */
3547 	err = ddi_prop_lookup_byte_array(DDI_DEV_T_ANY, ixgbe->dip,
3548 	    DDI_PROP_DONTPASS, "mac-address", &bytes, &nelts);
3549 	if (err == DDI_PROP_SUCCESS) {
3550 		if (nelts == ETHERADDRL) {
3551 			while (nelts--)
3552 				hw->mac.addr[nelts] = bytes[nelts];
3553 			found = B_TRUE;
3554 		}
3555 		ddi_prop_free(bytes);
3556 	}
3557 
3558 	if (found) {
3559 		bcopy(hw->mac.addr, hw->mac.perm_addr, ETHERADDRL);
3560 		return (B_TRUE);
3561 	}
3562 #else
3563 	_NOTE(ARGUNUSED(ixgbe));
3564 #endif
3565 
3566 	return (B_TRUE);
3567 }
3568 
3569 #pragma inline(ixgbe_arm_watchdog_timer)
3570 static void
3571 ixgbe_arm_watchdog_timer(ixgbe_t *ixgbe)
3572 {
3573 	/*
3574 	 * Fire a watchdog timer
3575 	 */
3576 	ixgbe->watchdog_tid =
3577 	    timeout(ixgbe_local_timer,
3578 	    (void *)ixgbe, 1 * drv_usectohz(1000000));
3579 
3580 }
3581 
3582 /*
3583  * ixgbe_enable_watchdog_timer - Enable and start the driver watchdog timer.
3584  */
3585 void
3586 ixgbe_enable_watchdog_timer(ixgbe_t *ixgbe)
3587 {
3588 	mutex_enter(&ixgbe->watchdog_lock);
3589 
3590 	if (!ixgbe->watchdog_enable) {
3591 		ixgbe->watchdog_enable = B_TRUE;
3592 		ixgbe->watchdog_start = B_TRUE;
3593 		ixgbe_arm_watchdog_timer(ixgbe);
3594 	}
3595 
3596 	mutex_exit(&ixgbe->watchdog_lock);
3597 }
3598 
3599 /*
3600  * ixgbe_disable_watchdog_timer - Disable and stop the driver watchdog timer.
3601  */
3602 void
3603 ixgbe_disable_watchdog_timer(ixgbe_t *ixgbe)
3604 {
3605 	timeout_id_t tid;
3606 
3607 	mutex_enter(&ixgbe->watchdog_lock);
3608 
3609 	ixgbe->watchdog_enable = B_FALSE;
3610 	ixgbe->watchdog_start = B_FALSE;
3611 	tid = ixgbe->watchdog_tid;
3612 	ixgbe->watchdog_tid = 0;
3613 
3614 	mutex_exit(&ixgbe->watchdog_lock);
3615 
3616 	if (tid != 0)
3617 		(void) untimeout(tid);
3618 }
3619 
3620 /*
3621  * ixgbe_start_watchdog_timer - Start the driver watchdog timer.
3622  */
3623 void
3624 ixgbe_start_watchdog_timer(ixgbe_t *ixgbe)
3625 {
3626 	mutex_enter(&ixgbe->watchdog_lock);
3627 
3628 	if (ixgbe->watchdog_enable) {
3629 		if (!ixgbe->watchdog_start) {
3630 			ixgbe->watchdog_start = B_TRUE;
3631 			ixgbe_arm_watchdog_timer(ixgbe);
3632 		}
3633 	}
3634 
3635 	mutex_exit(&ixgbe->watchdog_lock);
3636 }
3637 
3638 /*
3639  * ixgbe_restart_watchdog_timer - Restart the driver watchdog timer.
3640  */
3641 static void
3642 ixgbe_restart_watchdog_timer(ixgbe_t *ixgbe)
3643 {
3644 	mutex_enter(&ixgbe->watchdog_lock);
3645 
3646 	if (ixgbe->watchdog_start)
3647 		ixgbe_arm_watchdog_timer(ixgbe);
3648 
3649 	mutex_exit(&ixgbe->watchdog_lock);
3650 }
3651 
3652 /*
3653  * ixgbe_stop_watchdog_timer - Stop the driver watchdog timer.
3654  */
3655 void
3656 ixgbe_stop_watchdog_timer(ixgbe_t *ixgbe)
3657 {
3658 	timeout_id_t tid;
3659 
3660 	mutex_enter(&ixgbe->watchdog_lock);
3661 
3662 	ixgbe->watchdog_start = B_FALSE;
3663 	tid = ixgbe->watchdog_tid;
3664 	ixgbe->watchdog_tid = 0;
3665 
3666 	mutex_exit(&ixgbe->watchdog_lock);
3667 
3668 	if (tid != 0)
3669 		(void) untimeout(tid);
3670 }
3671 
3672 /*
3673  * ixgbe_disable_adapter_interrupts - Disable all adapter interrupts.
3674  */
3675 static void
3676 ixgbe_disable_adapter_interrupts(ixgbe_t *ixgbe)
3677 {
3678 	struct ixgbe_hw *hw = &ixgbe->hw;
3679 
3680 	/*
3681 	 * mask all interrupts off
3682 	 */
3683 	IXGBE_WRITE_REG(hw, IXGBE_EIMC, 0xffffffff);
3684 
3685 	/*
3686 	 * for MSI-X, also disable autoclear
3687 	 */
3688 	if (ixgbe->intr_type == DDI_INTR_TYPE_MSIX) {
3689 		IXGBE_WRITE_REG(hw, IXGBE_EIAC, 0x0);
3690 	}
3691 
3692 	IXGBE_WRITE_FLUSH(hw);
3693 }
3694 
3695 /*
3696  * ixgbe_enable_adapter_interrupts - Enable all hardware interrupts.
3697  */
3698 static void
3699 ixgbe_enable_adapter_interrupts(ixgbe_t *ixgbe)
3700 {
3701 	struct ixgbe_hw *hw = &ixgbe->hw;
3702 	uint32_t eiac, eiam;
3703 	uint32_t gpie = IXGBE_READ_REG(hw, IXGBE_GPIE);
3704 
3705 	/* interrupt types to enable */
3706 	ixgbe->eims = IXGBE_EIMS_ENABLE_MASK;	/* shared code default */
3707 	ixgbe->eims &= ~IXGBE_EIMS_TCP_TIMER;	/* minus tcp timer */
3708 	ixgbe->eims |= ixgbe->capab->other_intr; /* "other" interrupt types */
3709 
3710 	/* enable automask on "other" causes that this adapter can generate */
3711 	eiam = ixgbe->capab->other_intr;
3712 
3713 	/*
3714 	 * msi-x mode
3715 	 */
3716 	if (ixgbe->intr_type == DDI_INTR_TYPE_MSIX) {
3717 		/* enable autoclear but not on bits 29:20 */
3718 		eiac = (ixgbe->eims & ~IXGBE_OTHER_INTR);
3719 
3720 		/* general purpose interrupt enable */
3721 		gpie |= (IXGBE_GPIE_MSIX_MODE
3722 		    | IXGBE_GPIE_PBA_SUPPORT
3723 		    | IXGBE_GPIE_OCD
3724 		    | IXGBE_GPIE_EIAME);
3725 	/*
3726 	 * non-msi-x mode
3727 	 */
3728 	} else {
3729 
3730 		/* disable autoclear, leave gpie at default */
3731 		eiac = 0;
3732 
3733 		/*
3734 		 * General purpose interrupt enable.
3735 		 * For 82599, extended interrupt automask enable
3736 		 * only in MSI or MSI-X mode
3737 		 */
3738 		if ((hw->mac.type < ixgbe_mac_82599EB) ||
3739 		    (ixgbe->intr_type == DDI_INTR_TYPE_MSI)) {
3740 			gpie |= IXGBE_GPIE_EIAME;
3741 		}
3742 	}
3743 
3744 	/* Enable specific "other" interrupt types */
3745 	switch (hw->mac.type) {
3746 	case ixgbe_mac_82598EB:
3747 		gpie |= ixgbe->capab->other_gpie;
3748 		break;
3749 
3750 	case ixgbe_mac_82599EB:
3751 		gpie |= ixgbe->capab->other_gpie;
3752 
3753 		/* Enable RSC Delay 8us when LRO enabled  */
3754 		if (ixgbe->lro_enable) {
3755 			gpie |= (1 << IXGBE_GPIE_RSC_DELAY_SHIFT);
3756 		}
3757 		break;
3758 
3759 	default:
3760 		break;
3761 	}
3762 
3763 	/* write to interrupt control registers */
3764 	IXGBE_WRITE_REG(hw, IXGBE_EIMS, ixgbe->eims);
3765 	IXGBE_WRITE_REG(hw, IXGBE_EIAC, eiac);
3766 	IXGBE_WRITE_REG(hw, IXGBE_EIAM, eiam);
3767 	IXGBE_WRITE_REG(hw, IXGBE_GPIE, gpie);
3768 	IXGBE_WRITE_FLUSH(hw);
3769 }
3770 
3771 /*
3772  * ixgbe_loopback_ioctl - Loopback support.
3773  */
3774 enum ioc_reply
3775 ixgbe_loopback_ioctl(ixgbe_t *ixgbe, struct iocblk *iocp, mblk_t *mp)
3776 {
3777 	lb_info_sz_t *lbsp;
3778 	lb_property_t *lbpp;
3779 	uint32_t *lbmp;
3780 	uint32_t size;
3781 	uint32_t value;
3782 
3783 	if (mp->b_cont == NULL)
3784 		return (IOC_INVAL);
3785 
3786 	switch (iocp->ioc_cmd) {
3787 	default:
3788 		return (IOC_INVAL);
3789 
3790 	case LB_GET_INFO_SIZE:
3791 		size = sizeof (lb_info_sz_t);
3792 		if (iocp->ioc_count != size)
3793 			return (IOC_INVAL);
3794 
3795 		value = sizeof (lb_normal);
3796 		value += sizeof (lb_mac);
3797 		value += sizeof (lb_external);
3798 
3799 		lbsp = (lb_info_sz_t *)(uintptr_t)mp->b_cont->b_rptr;
3800 		*lbsp = value;
3801 		break;
3802 
3803 	case LB_GET_INFO:
3804 		value = sizeof (lb_normal);
3805 		value += sizeof (lb_mac);
3806 		value += sizeof (lb_external);
3807 
3808 		size = value;
3809 		if (iocp->ioc_count != size)
3810 			return (IOC_INVAL);
3811 
3812 		value = 0;
3813 		lbpp = (lb_property_t *)(uintptr_t)mp->b_cont->b_rptr;
3814 
3815 		lbpp[value++] = lb_normal;
3816 		lbpp[value++] = lb_mac;
3817 		lbpp[value++] = lb_external;
3818 		break;
3819 
3820 	case LB_GET_MODE:
3821 		size = sizeof (uint32_t);
3822 		if (iocp->ioc_count != size)
3823 			return (IOC_INVAL);
3824 
3825 		lbmp = (uint32_t *)(uintptr_t)mp->b_cont->b_rptr;
3826 		*lbmp = ixgbe->loopback_mode;
3827 		break;
3828 
3829 	case LB_SET_MODE:
3830 		size = 0;
3831 		if (iocp->ioc_count != sizeof (uint32_t))
3832 			return (IOC_INVAL);
3833 
3834 		lbmp = (uint32_t *)(uintptr_t)mp->b_cont->b_rptr;
3835 		if (!ixgbe_set_loopback_mode(ixgbe, *lbmp))
3836 			return (IOC_INVAL);
3837 		break;
3838 	}
3839 
3840 	iocp->ioc_count = size;
3841 	iocp->ioc_error = 0;
3842 
3843 	if (ixgbe_check_acc_handle(ixgbe->osdep.reg_handle) != DDI_FM_OK) {
3844 		ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_DEGRADED);
3845 		return (IOC_INVAL);
3846 	}
3847 
3848 	return (IOC_REPLY);
3849 }
3850 
3851 /*
3852  * ixgbe_set_loopback_mode - Setup loopback based on the loopback mode.
3853  */
3854 static boolean_t
3855 ixgbe_set_loopback_mode(ixgbe_t *ixgbe, uint32_t mode)
3856 {
3857 	if (mode == ixgbe->loopback_mode)
3858 		return (B_TRUE);
3859 
3860 	ixgbe->loopback_mode = mode;
3861 
3862 	if (mode == IXGBE_LB_NONE) {
3863 		/*
3864 		 * Reset the chip
3865 		 */
3866 		(void) ixgbe_reset(ixgbe);
3867 		return (B_TRUE);
3868 	}
3869 
3870 	mutex_enter(&ixgbe->gen_lock);
3871 
3872 	switch (mode) {
3873 	default:
3874 		mutex_exit(&ixgbe->gen_lock);
3875 		return (B_FALSE);
3876 
3877 	case IXGBE_LB_EXTERNAL:
3878 		break;
3879 
3880 	case IXGBE_LB_INTERNAL_MAC:
3881 		ixgbe_set_internal_mac_loopback(ixgbe);
3882 		break;
3883 	}
3884 
3885 	mutex_exit(&ixgbe->gen_lock);
3886 
3887 	return (B_TRUE);
3888 }
3889 
3890 /*
3891  * ixgbe_set_internal_mac_loopback - Set the internal MAC loopback mode.
3892  */
3893 static void
3894 ixgbe_set_internal_mac_loopback(ixgbe_t *ixgbe)
3895 {
3896 	struct ixgbe_hw *hw;
3897 	uint32_t reg;
3898 	uint8_t atlas;
3899 
3900 	hw = &ixgbe->hw;
3901 
3902 	/*
3903 	 * Setup MAC loopback
3904 	 */
3905 	reg = IXGBE_READ_REG(&ixgbe->hw, IXGBE_HLREG0);
3906 	reg |= IXGBE_HLREG0_LPBK;
3907 	IXGBE_WRITE_REG(&ixgbe->hw, IXGBE_HLREG0, reg);
3908 
3909 	reg = IXGBE_READ_REG(&ixgbe->hw, IXGBE_AUTOC);
3910 	reg &= ~IXGBE_AUTOC_LMS_MASK;
3911 	IXGBE_WRITE_REG(&ixgbe->hw, IXGBE_AUTOC, reg);
3912 
3913 	/*
3914 	 * Disable Atlas Tx lanes to keep packets in loopback and not on wire
3915 	 */
3916 	switch (hw->mac.type) {
3917 	case ixgbe_mac_82598EB:
3918 		(void) ixgbe_read_analog_reg8(&ixgbe->hw, IXGBE_ATLAS_PDN_LPBK,
3919 		    &atlas);
3920 		atlas |= IXGBE_ATLAS_PDN_TX_REG_EN;
3921 		(void) ixgbe_write_analog_reg8(&ixgbe->hw, IXGBE_ATLAS_PDN_LPBK,
3922 		    atlas);
3923 
3924 		(void) ixgbe_read_analog_reg8(&ixgbe->hw, IXGBE_ATLAS_PDN_10G,
3925 		    &atlas);
3926 		atlas |= IXGBE_ATLAS_PDN_TX_10G_QL_ALL;
3927 		(void) ixgbe_write_analog_reg8(&ixgbe->hw, IXGBE_ATLAS_PDN_10G,
3928 		    atlas);
3929 
3930 		(void) ixgbe_read_analog_reg8(&ixgbe->hw, IXGBE_ATLAS_PDN_1G,
3931 		    &atlas);
3932 		atlas |= IXGBE_ATLAS_PDN_TX_1G_QL_ALL;
3933 		(void) ixgbe_write_analog_reg8(&ixgbe->hw, IXGBE_ATLAS_PDN_1G,
3934 		    atlas);
3935 
3936 		(void) ixgbe_read_analog_reg8(&ixgbe->hw, IXGBE_ATLAS_PDN_AN,
3937 		    &atlas);
3938 		atlas |= IXGBE_ATLAS_PDN_TX_AN_QL_ALL;
3939 		(void) ixgbe_write_analog_reg8(&ixgbe->hw, IXGBE_ATLAS_PDN_AN,
3940 		    atlas);
3941 		break;
3942 
3943 	case ixgbe_mac_82599EB:
3944 		reg = IXGBE_READ_REG(&ixgbe->hw, IXGBE_AUTOC);
3945 		reg |= (IXGBE_AUTOC_FLU |
3946 		    IXGBE_AUTOC_10G_KX4);
3947 		IXGBE_WRITE_REG(&ixgbe->hw, IXGBE_AUTOC, reg);
3948 
3949 		(void) ixgbe_setup_link(&ixgbe->hw, IXGBE_LINK_SPEED_10GB_FULL,
3950 		    B_FALSE, B_TRUE);
3951 		break;
3952 
3953 	default:
3954 		break;
3955 	}
3956 }
3957 
3958 #pragma inline(ixgbe_intr_rx_work)
3959 /*
3960  * ixgbe_intr_rx_work - RX processing of ISR.
3961  */
3962 static void
3963 ixgbe_intr_rx_work(ixgbe_rx_ring_t *rx_ring)
3964 {
3965 	mblk_t *mp;
3966 
3967 	mutex_enter(&rx_ring->rx_lock);
3968 
3969 	mp = ixgbe_ring_rx(rx_ring, IXGBE_POLL_NULL);
3970 	mutex_exit(&rx_ring->rx_lock);
3971 
3972 	if (mp != NULL)
3973 		mac_rx_ring(rx_ring->ixgbe->mac_hdl, rx_ring->ring_handle, mp,
3974 		    rx_ring->ring_gen_num);
3975 }
3976 
3977 #pragma inline(ixgbe_intr_tx_work)
3978 /*
3979  * ixgbe_intr_tx_work - TX processing of ISR.
3980  */
3981 static void
3982 ixgbe_intr_tx_work(ixgbe_tx_ring_t *tx_ring)
3983 {
3984 	ixgbe_t *ixgbe = tx_ring->ixgbe;
3985 
3986 	/*
3987 	 * Recycle the tx descriptors
3988 	 */
3989 	tx_ring->tx_recycle(tx_ring);
3990 
3991 	/*
3992 	 * Schedule the re-transmit
3993 	 */
3994 	if (tx_ring->reschedule &&
3995 	    (tx_ring->tbd_free >= ixgbe->tx_resched_thresh)) {
3996 		tx_ring->reschedule = B_FALSE;
3997 		mac_tx_ring_update(tx_ring->ixgbe->mac_hdl,
3998 		    tx_ring->ring_handle);
3999 		IXGBE_DEBUG_STAT(tx_ring->stat_reschedule);
4000 	}
4001 }
4002 
4003 #pragma inline(ixgbe_intr_other_work)
4004 /*
4005  * ixgbe_intr_other_work - Process interrupt types other than tx/rx
4006  */
4007 static void
4008 ixgbe_intr_other_work(ixgbe_t *ixgbe, uint32_t eicr)
4009 {
4010 	ASSERT(mutex_owned(&ixgbe->gen_lock));
4011 
4012 	/*
4013 	 * handle link status change
4014 	 */
4015 	if (eicr & IXGBE_EICR_LSC) {
4016 		ixgbe_driver_link_check(ixgbe);
4017 		ixgbe_get_hw_state(ixgbe);
4018 	}
4019 
4020 	/*
4021 	 * check for fan failure on adapters with fans
4022 	 */
4023 	if ((ixgbe->capab->flags & IXGBE_FLAG_FAN_FAIL_CAPABLE) &&
4024 	    (eicr & IXGBE_EICR_GPI_SDP1)) {
4025 		atomic_or_32(&ixgbe->ixgbe_state, IXGBE_OVERTEMP);
4026 
4027 		/*
4028 		 * Disable the adapter interrupts
4029 		 */
4030 		ixgbe_disable_adapter_interrupts(ixgbe);
4031 
4032 		/*
4033 		 * Disable Rx/Tx units
4034 		 */
4035 		(void) ixgbe_stop_adapter(&ixgbe->hw);
4036 
4037 		ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_LOST);
4038 		ixgbe_error(ixgbe,
4039 		    "Problem: Network adapter has been stopped "
4040 		    "because the fan has stopped.\n");
4041 		ixgbe_error(ixgbe,
4042 		    "Action: Replace the adapter.\n");
4043 
4044 		/* re-enable the interrupt, which was automasked */
4045 		ixgbe->eims |= IXGBE_EICR_GPI_SDP1;
4046 	}
4047 
4048 	/*
4049 	 * Do SFP check for adapters with hot-plug capability
4050 	 */
4051 	if ((ixgbe->capab->flags & IXGBE_FLAG_SFP_PLUG_CAPABLE) &&
4052 	    ((eicr & IXGBE_EICR_GPI_SDP1) || (eicr & IXGBE_EICR_GPI_SDP2))) {
4053 		ixgbe->eicr = eicr;
4054 		if ((ddi_taskq_dispatch(ixgbe->sfp_taskq,
4055 		    ixgbe_sfp_check, (void *)ixgbe,
4056 		    DDI_NOSLEEP)) != DDI_SUCCESS) {
4057 			ixgbe_log(ixgbe, "No memory available to dispatch "
4058 			    "taskq for SFP check");
4059 		}
4060 	}
4061 
4062 	/*
4063 	 * Do over-temperature check for adapters with temp sensor
4064 	 */
4065 	if ((ixgbe->capab->flags & IXGBE_FLAG_TEMP_SENSOR_CAPABLE) &&
4066 	    ((eicr & IXGBE_EICR_GPI_SDP0) || (eicr & IXGBE_EICR_LSC))) {
4067 		ixgbe->eicr = eicr;
4068 		if ((ddi_taskq_dispatch(ixgbe->overtemp_taskq,
4069 		    ixgbe_overtemp_check, (void *)ixgbe,
4070 		    DDI_NOSLEEP)) != DDI_SUCCESS) {
4071 			ixgbe_log(ixgbe, "No memory available to dispatch "
4072 			    "taskq for overtemp check");
4073 		}
4074 	}
4075 }
4076 
4077 /*
4078  * ixgbe_intr_legacy - Interrupt handler for legacy interrupts.
4079  */
4080 static uint_t
4081 ixgbe_intr_legacy(void *arg1, void *arg2)
4082 {
4083 	ixgbe_t *ixgbe = (ixgbe_t *)arg1;
4084 	struct ixgbe_hw *hw = &ixgbe->hw;
4085 	ixgbe_tx_ring_t *tx_ring;
4086 	ixgbe_rx_ring_t *rx_ring;
4087 	uint32_t eicr;
4088 	mblk_t *mp;
4089 	boolean_t tx_reschedule;
4090 	uint_t result;
4091 
4092 	_NOTE(ARGUNUSED(arg2));
4093 
4094 	mutex_enter(&ixgbe->gen_lock);
4095 	if (ixgbe->ixgbe_state & IXGBE_SUSPENDED) {
4096 		mutex_exit(&ixgbe->gen_lock);
4097 		return (DDI_INTR_UNCLAIMED);
4098 	}
4099 
4100 	mp = NULL;
4101 	tx_reschedule = B_FALSE;
4102 
4103 	/*
4104 	 * Any bit set in eicr: claim this interrupt
4105 	 */
4106 	eicr = IXGBE_READ_REG(hw, IXGBE_EICR);
4107 
4108 	if (ixgbe_check_acc_handle(ixgbe->osdep.reg_handle) != DDI_FM_OK) {
4109 		mutex_exit(&ixgbe->gen_lock);
4110 		ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_DEGRADED);
4111 		atomic_or_32(&ixgbe->ixgbe_state, IXGBE_ERROR);
4112 		return (DDI_INTR_CLAIMED);
4113 	}
4114 
4115 	if (eicr) {
4116 		/*
4117 		 * For legacy interrupt, we have only one interrupt,
4118 		 * so we have only one rx ring and one tx ring enabled.
4119 		 */
4120 		ASSERT(ixgbe->num_rx_rings == 1);
4121 		ASSERT(ixgbe->num_tx_rings == 1);
4122 
4123 		/*
4124 		 * For legacy interrupt, rx rings[0] will use RTxQ[0].
4125 		 */
4126 		if (eicr & 0x1) {
4127 			ixgbe->eimc |= IXGBE_EICR_RTX_QUEUE;
4128 			IXGBE_WRITE_REG(hw, IXGBE_EIMC, ixgbe->eimc);
4129 			ixgbe->eims |= IXGBE_EICR_RTX_QUEUE;
4130 			/*
4131 			 * Clean the rx descriptors
4132 			 */
4133 			rx_ring = &ixgbe->rx_rings[0];
4134 			mp = ixgbe_ring_rx(rx_ring, IXGBE_POLL_NULL);
4135 		}
4136 
4137 		/*
4138 		 * For legacy interrupt, tx rings[0] will use RTxQ[1].
4139 		 */
4140 		if (eicr & 0x2) {
4141 			/*
4142 			 * Recycle the tx descriptors
4143 			 */
4144 			tx_ring = &ixgbe->tx_rings[0];
4145 			tx_ring->tx_recycle(tx_ring);
4146 
4147 			/*
4148 			 * Schedule the re-transmit
4149 			 */
4150 			tx_reschedule = (tx_ring->reschedule &&
4151 			    (tx_ring->tbd_free >= ixgbe->tx_resched_thresh));
4152 		}
4153 
4154 		/* any interrupt type other than tx/rx */
4155 		if (eicr & ixgbe->capab->other_intr) {
4156 			switch (hw->mac.type) {
4157 			case ixgbe_mac_82598EB:
4158 				ixgbe->eims &= ~(eicr & IXGBE_OTHER_INTR);
4159 				break;
4160 
4161 			case ixgbe_mac_82599EB:
4162 				ixgbe->eimc = IXGBE_82599_OTHER_INTR;
4163 				IXGBE_WRITE_REG(hw, IXGBE_EIMC, ixgbe->eimc);
4164 				break;
4165 
4166 			default:
4167 				break;
4168 			}
4169 			ixgbe_intr_other_work(ixgbe, eicr);
4170 			ixgbe->eims &= ~(eicr & IXGBE_OTHER_INTR);
4171 		}
4172 
4173 		mutex_exit(&ixgbe->gen_lock);
4174 
4175 		result = DDI_INTR_CLAIMED;
4176 	} else {
4177 		mutex_exit(&ixgbe->gen_lock);
4178 
4179 		/*
4180 		 * No interrupt cause bits set: don't claim this interrupt.
4181 		 */
4182 		result = DDI_INTR_UNCLAIMED;
4183 	}
4184 
4185 	/* re-enable the interrupts which were automasked */
4186 	IXGBE_WRITE_REG(hw, IXGBE_EIMS, ixgbe->eims);
4187 
4188 	/*
4189 	 * Do the following work outside of the gen_lock
4190 	 */
4191 	if (mp != NULL) {
4192 		mac_rx_ring(rx_ring->ixgbe->mac_hdl, rx_ring->ring_handle, mp,
4193 		    rx_ring->ring_gen_num);
4194 	}
4195 
4196 	if (tx_reschedule)  {
4197 		tx_ring->reschedule = B_FALSE;
4198 		mac_tx_ring_update(ixgbe->mac_hdl, tx_ring->ring_handle);
4199 		IXGBE_DEBUG_STAT(tx_ring->stat_reschedule);
4200 	}
4201 
4202 	return (result);
4203 }
4204 
4205 /*
4206  * ixgbe_intr_msi - Interrupt handler for MSI.
4207  */
4208 static uint_t
4209 ixgbe_intr_msi(void *arg1, void *arg2)
4210 {
4211 	ixgbe_t *ixgbe = (ixgbe_t *)arg1;
4212 	struct ixgbe_hw *hw = &ixgbe->hw;
4213 	uint32_t eicr;
4214 
4215 	_NOTE(ARGUNUSED(arg2));
4216 
4217 	eicr = IXGBE_READ_REG(hw, IXGBE_EICR);
4218 
4219 	if (ixgbe_check_acc_handle(ixgbe->osdep.reg_handle) != DDI_FM_OK) {
4220 		ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_DEGRADED);
4221 		atomic_or_32(&ixgbe->ixgbe_state, IXGBE_ERROR);
4222 		return (DDI_INTR_CLAIMED);
4223 	}
4224 
4225 	/*
4226 	 * For MSI interrupt, we have only one vector,
4227 	 * so we have only one rx ring and one tx ring enabled.
4228 	 */
4229 	ASSERT(ixgbe->num_rx_rings == 1);
4230 	ASSERT(ixgbe->num_tx_rings == 1);
4231 
4232 	/*
4233 	 * For MSI interrupt, rx rings[0] will use RTxQ[0].
4234 	 */
4235 	if (eicr & 0x1) {
4236 		ixgbe_intr_rx_work(&ixgbe->rx_rings[0]);
4237 	}
4238 
4239 	/*
4240 	 * For MSI interrupt, tx rings[0] will use RTxQ[1].
4241 	 */
4242 	if (eicr & 0x2) {
4243 		ixgbe_intr_tx_work(&ixgbe->tx_rings[0]);
4244 	}
4245 
4246 	/* any interrupt type other than tx/rx */
4247 	if (eicr & ixgbe->capab->other_intr) {
4248 		mutex_enter(&ixgbe->gen_lock);
4249 		switch (hw->mac.type) {
4250 		case ixgbe_mac_82598EB:
4251 			ixgbe->eims &= ~(eicr & IXGBE_OTHER_INTR);
4252 			break;
4253 
4254 		case ixgbe_mac_82599EB:
4255 			ixgbe->eimc = IXGBE_82599_OTHER_INTR;
4256 			IXGBE_WRITE_REG(hw, IXGBE_EIMC, ixgbe->eimc);
4257 			break;
4258 
4259 		default:
4260 			break;
4261 		}
4262 		ixgbe_intr_other_work(ixgbe, eicr);
4263 		ixgbe->eims &= ~(eicr & IXGBE_OTHER_INTR);
4264 		mutex_exit(&ixgbe->gen_lock);
4265 	}
4266 
4267 	/* re-enable the interrupts which were automasked */
4268 	IXGBE_WRITE_REG(hw, IXGBE_EIMS, ixgbe->eims);
4269 
4270 	return (DDI_INTR_CLAIMED);
4271 }
4272 
4273 /*
4274  * ixgbe_intr_msix - Interrupt handler for MSI-X.
4275  */
4276 static uint_t
4277 ixgbe_intr_msix(void *arg1, void *arg2)
4278 {
4279 	ixgbe_intr_vector_t *vect = (ixgbe_intr_vector_t *)arg1;
4280 	ixgbe_t *ixgbe = vect->ixgbe;
4281 	struct ixgbe_hw *hw = &ixgbe->hw;
4282 	uint32_t eicr;
4283 	int r_idx = 0;
4284 
4285 	_NOTE(ARGUNUSED(arg2));
4286 
4287 	/*
4288 	 * Clean each rx ring that has its bit set in the map
4289 	 */
4290 	r_idx = bt_getlowbit(vect->rx_map, 0, (ixgbe->num_rx_rings - 1));
4291 	while (r_idx >= 0) {
4292 		ixgbe_intr_rx_work(&ixgbe->rx_rings[r_idx]);
4293 		r_idx = bt_getlowbit(vect->rx_map, (r_idx + 1),
4294 		    (ixgbe->num_rx_rings - 1));
4295 	}
4296 
4297 	/*
4298 	 * Clean each tx ring that has its bit set in the map
4299 	 */
4300 	r_idx = bt_getlowbit(vect->tx_map, 0, (ixgbe->num_tx_rings - 1));
4301 	while (r_idx >= 0) {
4302 		ixgbe_intr_tx_work(&ixgbe->tx_rings[r_idx]);
4303 		r_idx = bt_getlowbit(vect->tx_map, (r_idx + 1),
4304 		    (ixgbe->num_tx_rings - 1));
4305 	}
4306 
4307 
4308 	/*
4309 	 * Clean other interrupt (link change) that has its bit set in the map
4310 	 */
4311 	if (BT_TEST(vect->other_map, 0) == 1) {
4312 		eicr = IXGBE_READ_REG(hw, IXGBE_EICR);
4313 
4314 		if (ixgbe_check_acc_handle(ixgbe->osdep.reg_handle) !=
4315 		    DDI_FM_OK) {
4316 			ddi_fm_service_impact(ixgbe->dip,
4317 			    DDI_SERVICE_DEGRADED);
4318 			atomic_or_32(&ixgbe->ixgbe_state, IXGBE_ERROR);
4319 			return (DDI_INTR_CLAIMED);
4320 		}
4321 
4322 		/*
4323 		 * Check "other" cause bits: any interrupt type other than tx/rx
4324 		 */
4325 		if (eicr & ixgbe->capab->other_intr) {
4326 			mutex_enter(&ixgbe->gen_lock);
4327 			switch (hw->mac.type) {
4328 			case ixgbe_mac_82598EB:
4329 				ixgbe->eims &= ~(eicr & IXGBE_OTHER_INTR);
4330 				ixgbe_intr_other_work(ixgbe, eicr);
4331 				break;
4332 
4333 			case ixgbe_mac_82599EB:
4334 				ixgbe->eims |= IXGBE_EICR_RTX_QUEUE;
4335 				ixgbe_intr_other_work(ixgbe, eicr);
4336 				break;
4337 
4338 			default:
4339 				break;
4340 			}
4341 			mutex_exit(&ixgbe->gen_lock);
4342 		}
4343 
4344 		/* re-enable the interrupts which were automasked */
4345 		IXGBE_WRITE_REG(hw, IXGBE_EIMS, ixgbe->eims);
4346 	}
4347 
4348 	return (DDI_INTR_CLAIMED);
4349 }
4350 
4351 /*
4352  * ixgbe_alloc_intrs - Allocate interrupts for the driver.
4353  *
4354  * Normal sequence is to try MSI-X; if not sucessful, try MSI;
4355  * if not successful, try Legacy.
4356  * ixgbe->intr_force can be used to force sequence to start with
4357  * any of the 3 types.
4358  * If MSI-X is not used, number of tx/rx rings is forced to 1.
4359  */
4360 static int
4361 ixgbe_alloc_intrs(ixgbe_t *ixgbe)
4362 {
4363 	dev_info_t *devinfo;
4364 	int intr_types;
4365 	int rc;
4366 
4367 	devinfo = ixgbe->dip;
4368 
4369 	/*
4370 	 * Get supported interrupt types
4371 	 */
4372 	rc = ddi_intr_get_supported_types(devinfo, &intr_types);
4373 
4374 	if (rc != DDI_SUCCESS) {
4375 		ixgbe_log(ixgbe,
4376 		    "Get supported interrupt types failed: %d", rc);
4377 		return (IXGBE_FAILURE);
4378 	}
4379 	IXGBE_DEBUGLOG_1(ixgbe, "Supported interrupt types: %x", intr_types);
4380 
4381 	ixgbe->intr_type = 0;
4382 
4383 	/*
4384 	 * Install MSI-X interrupts
4385 	 */
4386 	if ((intr_types & DDI_INTR_TYPE_MSIX) &&
4387 	    (ixgbe->intr_force <= IXGBE_INTR_MSIX)) {
4388 		rc = ixgbe_alloc_intr_handles(ixgbe, DDI_INTR_TYPE_MSIX);
4389 		if (rc == IXGBE_SUCCESS)
4390 			return (IXGBE_SUCCESS);
4391 
4392 		ixgbe_log(ixgbe,
4393 		    "Allocate MSI-X failed, trying MSI interrupts...");
4394 	}
4395 
4396 	/*
4397 	 * MSI-X not used, force rings and groups to 1
4398 	 */
4399 	ixgbe->num_rx_rings = 1;
4400 	ixgbe->num_rx_groups = 1;
4401 	ixgbe->num_tx_rings = 1;
4402 	ixgbe->classify_mode = IXGBE_CLASSIFY_NONE;
4403 	ixgbe_log(ixgbe,
4404 	    "MSI-X not used, force rings and groups number to 1");
4405 
4406 	/*
4407 	 * Install MSI interrupts
4408 	 */
4409 	if ((intr_types & DDI_INTR_TYPE_MSI) &&
4410 	    (ixgbe->intr_force <= IXGBE_INTR_MSI)) {
4411 		rc = ixgbe_alloc_intr_handles(ixgbe, DDI_INTR_TYPE_MSI);
4412 		if (rc == IXGBE_SUCCESS)
4413 			return (IXGBE_SUCCESS);
4414 
4415 		ixgbe_log(ixgbe,
4416 		    "Allocate MSI failed, trying Legacy interrupts...");
4417 	}
4418 
4419 	/*
4420 	 * Install legacy interrupts
4421 	 */
4422 	if (intr_types & DDI_INTR_TYPE_FIXED) {
4423 		rc = ixgbe_alloc_intr_handles(ixgbe, DDI_INTR_TYPE_FIXED);
4424 		if (rc == IXGBE_SUCCESS)
4425 			return (IXGBE_SUCCESS);
4426 
4427 		ixgbe_log(ixgbe,
4428 		    "Allocate Legacy interrupts failed");
4429 	}
4430 
4431 	/*
4432 	 * If none of the 3 types succeeded, return failure
4433 	 */
4434 	return (IXGBE_FAILURE);
4435 }
4436 
4437 /*
4438  * ixgbe_alloc_intr_handles - Allocate interrupt handles.
4439  *
4440  * For legacy and MSI, only 1 handle is needed.  For MSI-X,
4441  * if fewer than 2 handles are available, return failure.
4442  * Upon success, this maps the vectors to rx and tx rings for
4443  * interrupts.
4444  */
4445 static int
4446 ixgbe_alloc_intr_handles(ixgbe_t *ixgbe, int intr_type)
4447 {
4448 	dev_info_t *devinfo;
4449 	int request, count, actual;
4450 	int minimum;
4451 	int rc;
4452 	uint32_t ring_per_group;
4453 
4454 	devinfo = ixgbe->dip;
4455 
4456 	switch (intr_type) {
4457 	case DDI_INTR_TYPE_FIXED:
4458 		request = 1;	/* Request 1 legacy interrupt handle */
4459 		minimum = 1;
4460 		IXGBE_DEBUGLOG_0(ixgbe, "interrupt type: legacy");
4461 		break;
4462 
4463 	case DDI_INTR_TYPE_MSI:
4464 		request = 1;	/* Request 1 MSI interrupt handle */
4465 		minimum = 1;
4466 		IXGBE_DEBUGLOG_0(ixgbe, "interrupt type: MSI");
4467 		break;
4468 
4469 	case DDI_INTR_TYPE_MSIX:
4470 		/*
4471 		 * Best number of vectors for the adapter is
4472 		 * (# rx rings + # tx rings), however we will
4473 		 * limit the request number.
4474 		 */
4475 		request = min(16, ixgbe->num_rx_rings + ixgbe->num_tx_rings);
4476 		if (request > ixgbe->capab->max_ring_vect)
4477 			request = ixgbe->capab->max_ring_vect;
4478 		minimum = 1;
4479 		IXGBE_DEBUGLOG_0(ixgbe, "interrupt type: MSI-X");
4480 		break;
4481 
4482 	default:
4483 		ixgbe_log(ixgbe,
4484 		    "invalid call to ixgbe_alloc_intr_handles(): %d\n",
4485 		    intr_type);
4486 		return (IXGBE_FAILURE);
4487 	}
4488 	IXGBE_DEBUGLOG_2(ixgbe, "interrupt handles requested: %d  minimum: %d",
4489 	    request, minimum);
4490 
4491 	/*
4492 	 * Get number of supported interrupts
4493 	 */
4494 	rc = ddi_intr_get_nintrs(devinfo, intr_type, &count);
4495 	if ((rc != DDI_SUCCESS) || (count < minimum)) {
4496 		ixgbe_log(ixgbe,
4497 		    "Get interrupt number failed. Return: %d, count: %d",
4498 		    rc, count);
4499 		return (IXGBE_FAILURE);
4500 	}
4501 	IXGBE_DEBUGLOG_1(ixgbe, "interrupts supported: %d", count);
4502 
4503 	actual = 0;
4504 	ixgbe->intr_cnt = 0;
4505 	ixgbe->intr_cnt_max = 0;
4506 	ixgbe->intr_cnt_min = 0;
4507 
4508 	/*
4509 	 * Allocate an array of interrupt handles
4510 	 */
4511 	ixgbe->intr_size = request * sizeof (ddi_intr_handle_t);
4512 	ixgbe->htable = kmem_alloc(ixgbe->intr_size, KM_SLEEP);
4513 
4514 	rc = ddi_intr_alloc(devinfo, ixgbe->htable, intr_type, 0,
4515 	    request, &actual, DDI_INTR_ALLOC_NORMAL);
4516 	if (rc != DDI_SUCCESS) {
4517 		ixgbe_log(ixgbe, "Allocate interrupts failed. "
4518 		    "return: %d, request: %d, actual: %d",
4519 		    rc, request, actual);
4520 		goto alloc_handle_fail;
4521 	}
4522 	IXGBE_DEBUGLOG_1(ixgbe, "interrupts actually allocated: %d", actual);
4523 
4524 	/*
4525 	 * upper/lower limit of interrupts
4526 	 */
4527 	ixgbe->intr_cnt = actual;
4528 	ixgbe->intr_cnt_max = request;
4529 	ixgbe->intr_cnt_min = minimum;
4530 
4531 	/*
4532 	 * rss number per group should not exceed the rx interrupt number,
4533 	 * else need to adjust rx ring number.
4534 	 */
4535 	ring_per_group = ixgbe->num_rx_rings / ixgbe->num_rx_groups;
4536 	ASSERT((ixgbe->num_rx_rings % ixgbe->num_rx_groups) == 0);
4537 	if (actual < ring_per_group) {
4538 		ixgbe->num_rx_rings = ixgbe->num_rx_groups * actual;
4539 		ixgbe_setup_vmdq_rss_conf(ixgbe);
4540 	}
4541 
4542 	/*
4543 	 * Now we know the actual number of vectors.  Here we map the vector
4544 	 * to other, rx rings and tx ring.
4545 	 */
4546 	if (actual < minimum) {
4547 		ixgbe_log(ixgbe, "Insufficient interrupt handles available: %d",
4548 		    actual);
4549 		goto alloc_handle_fail;
4550 	}
4551 
4552 	/*
4553 	 * Get priority for first vector, assume remaining are all the same
4554 	 */
4555 	rc = ddi_intr_get_pri(ixgbe->htable[0], &ixgbe->intr_pri);
4556 	if (rc != DDI_SUCCESS) {
4557 		ixgbe_log(ixgbe,
4558 		    "Get interrupt priority failed: %d", rc);
4559 		goto alloc_handle_fail;
4560 	}
4561 
4562 	rc = ddi_intr_get_cap(ixgbe->htable[0], &ixgbe->intr_cap);
4563 	if (rc != DDI_SUCCESS) {
4564 		ixgbe_log(ixgbe,
4565 		    "Get interrupt cap failed: %d", rc);
4566 		goto alloc_handle_fail;
4567 	}
4568 
4569 	ixgbe->intr_type = intr_type;
4570 
4571 	return (IXGBE_SUCCESS);
4572 
4573 alloc_handle_fail:
4574 	ixgbe_rem_intrs(ixgbe);
4575 
4576 	return (IXGBE_FAILURE);
4577 }
4578 
4579 /*
4580  * ixgbe_add_intr_handlers - Add interrupt handlers based on the interrupt type.
4581  *
4582  * Before adding the interrupt handlers, the interrupt vectors have
4583  * been allocated, and the rx/tx rings have also been allocated.
4584  */
4585 static int
4586 ixgbe_add_intr_handlers(ixgbe_t *ixgbe)
4587 {
4588 	int vector = 0;
4589 	int rc;
4590 
4591 	switch (ixgbe->intr_type) {
4592 	case DDI_INTR_TYPE_MSIX:
4593 		/*
4594 		 * Add interrupt handler for all vectors
4595 		 */
4596 		for (vector = 0; vector < ixgbe->intr_cnt; vector++) {
4597 			/*
4598 			 * install pointer to vect_map[vector]
4599 			 */
4600 			rc = ddi_intr_add_handler(ixgbe->htable[vector],
4601 			    (ddi_intr_handler_t *)ixgbe_intr_msix,
4602 			    (void *)&ixgbe->vect_map[vector], NULL);
4603 
4604 			if (rc != DDI_SUCCESS) {
4605 				ixgbe_log(ixgbe,
4606 				    "Add interrupt handler failed. "
4607 				    "return: %d, vector: %d", rc, vector);
4608 				for (vector--; vector >= 0; vector--) {
4609 					(void) ddi_intr_remove_handler(
4610 					    ixgbe->htable[vector]);
4611 				}
4612 				return (IXGBE_FAILURE);
4613 			}
4614 		}
4615 
4616 		break;
4617 
4618 	case DDI_INTR_TYPE_MSI:
4619 		/*
4620 		 * Add interrupt handlers for the only vector
4621 		 */
4622 		rc = ddi_intr_add_handler(ixgbe->htable[vector],
4623 		    (ddi_intr_handler_t *)ixgbe_intr_msi,
4624 		    (void *)ixgbe, NULL);
4625 
4626 		if (rc != DDI_SUCCESS) {
4627 			ixgbe_log(ixgbe,
4628 			    "Add MSI interrupt handler failed: %d", rc);
4629 			return (IXGBE_FAILURE);
4630 		}
4631 
4632 		break;
4633 
4634 	case DDI_INTR_TYPE_FIXED:
4635 		/*
4636 		 * Add interrupt handlers for the only vector
4637 		 */
4638 		rc = ddi_intr_add_handler(ixgbe->htable[vector],
4639 		    (ddi_intr_handler_t *)ixgbe_intr_legacy,
4640 		    (void *)ixgbe, NULL);
4641 
4642 		if (rc != DDI_SUCCESS) {
4643 			ixgbe_log(ixgbe,
4644 			    "Add legacy interrupt handler failed: %d", rc);
4645 			return (IXGBE_FAILURE);
4646 		}
4647 
4648 		break;
4649 
4650 	default:
4651 		return (IXGBE_FAILURE);
4652 	}
4653 
4654 	return (IXGBE_SUCCESS);
4655 }
4656 
4657 #pragma inline(ixgbe_map_rxring_to_vector)
4658 /*
4659  * ixgbe_map_rxring_to_vector - Map given rx ring to given interrupt vector.
4660  */
4661 static void
4662 ixgbe_map_rxring_to_vector(ixgbe_t *ixgbe, int r_idx, int v_idx)
4663 {
4664 	/*
4665 	 * Set bit in map
4666 	 */
4667 	BT_SET(ixgbe->vect_map[v_idx].rx_map, r_idx);
4668 
4669 	/*
4670 	 * Count bits set
4671 	 */
4672 	ixgbe->vect_map[v_idx].rxr_cnt++;
4673 
4674 	/*
4675 	 * Remember bit position
4676 	 */
4677 	ixgbe->rx_rings[r_idx].intr_vector = v_idx;
4678 	ixgbe->rx_rings[r_idx].vect_bit = 1 << v_idx;
4679 }
4680 
4681 #pragma inline(ixgbe_map_txring_to_vector)
4682 /*
4683  * ixgbe_map_txring_to_vector - Map given tx ring to given interrupt vector.
4684  */
4685 static void
4686 ixgbe_map_txring_to_vector(ixgbe_t *ixgbe, int t_idx, int v_idx)
4687 {
4688 	/*
4689 	 * Set bit in map
4690 	 */
4691 	BT_SET(ixgbe->vect_map[v_idx].tx_map, t_idx);
4692 
4693 	/*
4694 	 * Count bits set
4695 	 */
4696 	ixgbe->vect_map[v_idx].txr_cnt++;
4697 
4698 	/*
4699 	 * Remember bit position
4700 	 */
4701 	ixgbe->tx_rings[t_idx].intr_vector = v_idx;
4702 	ixgbe->tx_rings[t_idx].vect_bit = 1 << v_idx;
4703 }
4704 
4705 /*
4706  * ixgbe_setup_ivar - Set the given entry in the given interrupt vector
4707  * allocation register (IVAR).
4708  * cause:
4709  *   -1 : other cause
4710  *    0 : rx
4711  *    1 : tx
4712  */
4713 static void
4714 ixgbe_setup_ivar(ixgbe_t *ixgbe, uint16_t intr_alloc_entry, uint8_t msix_vector,
4715     int8_t cause)
4716 {
4717 	struct ixgbe_hw *hw = &ixgbe->hw;
4718 	u32 ivar, index;
4719 
4720 	switch (hw->mac.type) {
4721 	case ixgbe_mac_82598EB:
4722 		msix_vector |= IXGBE_IVAR_ALLOC_VAL;
4723 		if (cause == -1) {
4724 			cause = 0;
4725 		}
4726 		index = (((cause * 64) + intr_alloc_entry) >> 2) & 0x1F;
4727 		ivar = IXGBE_READ_REG(hw, IXGBE_IVAR(index));
4728 		ivar &= ~(0xFF << (8 * (intr_alloc_entry & 0x3)));
4729 		ivar |= (msix_vector << (8 * (intr_alloc_entry & 0x3)));
4730 		IXGBE_WRITE_REG(hw, IXGBE_IVAR(index), ivar);
4731 		break;
4732 
4733 	case ixgbe_mac_82599EB:
4734 		if (cause == -1) {
4735 			/* other causes */
4736 			msix_vector |= IXGBE_IVAR_ALLOC_VAL;
4737 			index = (intr_alloc_entry & 1) * 8;
4738 			ivar = IXGBE_READ_REG(hw, IXGBE_IVAR_MISC);
4739 			ivar &= ~(0xFF << index);
4740 			ivar |= (msix_vector << index);
4741 			IXGBE_WRITE_REG(hw, IXGBE_IVAR_MISC, ivar);
4742 		} else {
4743 			/* tx or rx causes */
4744 			msix_vector |= IXGBE_IVAR_ALLOC_VAL;
4745 			index = ((16 * (intr_alloc_entry & 1)) + (8 * cause));
4746 			ivar = IXGBE_READ_REG(hw,
4747 			    IXGBE_IVAR(intr_alloc_entry >> 1));
4748 			ivar &= ~(0xFF << index);
4749 			ivar |= (msix_vector << index);
4750 			IXGBE_WRITE_REG(hw, IXGBE_IVAR(intr_alloc_entry >> 1),
4751 			    ivar);
4752 		}
4753 		break;
4754 
4755 	default:
4756 		break;
4757 	}
4758 }
4759 
4760 /*
4761  * ixgbe_enable_ivar - Enable the given entry by setting the VAL bit of
4762  * given interrupt vector allocation register (IVAR).
4763  * cause:
4764  *   -1 : other cause
4765  *    0 : rx
4766  *    1 : tx
4767  */
4768 static void
4769 ixgbe_enable_ivar(ixgbe_t *ixgbe, uint16_t intr_alloc_entry, int8_t cause)
4770 {
4771 	struct ixgbe_hw *hw = &ixgbe->hw;
4772 	u32 ivar, index;
4773 
4774 	switch (hw->mac.type) {
4775 	case ixgbe_mac_82598EB:
4776 		if (cause == -1) {
4777 			cause = 0;
4778 		}
4779 		index = (((cause * 64) + intr_alloc_entry) >> 2) & 0x1F;
4780 		ivar = IXGBE_READ_REG(hw, IXGBE_IVAR(index));
4781 		ivar |= (IXGBE_IVAR_ALLOC_VAL << (8 *
4782 		    (intr_alloc_entry & 0x3)));
4783 		IXGBE_WRITE_REG(hw, IXGBE_IVAR(index), ivar);
4784 		break;
4785 
4786 	case ixgbe_mac_82599EB:
4787 		if (cause == -1) {
4788 			/* other causes */
4789 			index = (intr_alloc_entry & 1) * 8;
4790 			ivar = IXGBE_READ_REG(hw, IXGBE_IVAR_MISC);
4791 			ivar |= (IXGBE_IVAR_ALLOC_VAL << index);
4792 			IXGBE_WRITE_REG(hw, IXGBE_IVAR_MISC, ivar);
4793 		} else {
4794 			/* tx or rx causes */
4795 			index = ((16 * (intr_alloc_entry & 1)) + (8 * cause));
4796 			ivar = IXGBE_READ_REG(hw,
4797 			    IXGBE_IVAR(intr_alloc_entry >> 1));
4798 			ivar |= (IXGBE_IVAR_ALLOC_VAL << index);
4799 			IXGBE_WRITE_REG(hw, IXGBE_IVAR(intr_alloc_entry >> 1),
4800 			    ivar);
4801 		}
4802 		break;
4803 
4804 	default:
4805 		break;
4806 	}
4807 }
4808 
4809 /*
4810  * ixgbe_disable_ivar - Disble the given entry by clearing the VAL bit of
4811  * given interrupt vector allocation register (IVAR).
4812  * cause:
4813  *   -1 : other cause
4814  *    0 : rx
4815  *    1 : tx
4816  */
4817 static void
4818 ixgbe_disable_ivar(ixgbe_t *ixgbe, uint16_t intr_alloc_entry, int8_t cause)
4819 {
4820 	struct ixgbe_hw *hw = &ixgbe->hw;
4821 	u32 ivar, index;
4822 
4823 	switch (hw->mac.type) {
4824 	case ixgbe_mac_82598EB:
4825 		if (cause == -1) {
4826 			cause = 0;
4827 		}
4828 		index = (((cause * 64) + intr_alloc_entry) >> 2) & 0x1F;
4829 		ivar = IXGBE_READ_REG(hw, IXGBE_IVAR(index));
4830 		ivar &= ~(IXGBE_IVAR_ALLOC_VAL<< (8 *
4831 		    (intr_alloc_entry & 0x3)));
4832 		IXGBE_WRITE_REG(hw, IXGBE_IVAR(index), ivar);
4833 		break;
4834 
4835 	case ixgbe_mac_82599EB:
4836 		if (cause == -1) {
4837 			/* other causes */
4838 			index = (intr_alloc_entry & 1) * 8;
4839 			ivar = IXGBE_READ_REG(hw, IXGBE_IVAR_MISC);
4840 			ivar &= ~(IXGBE_IVAR_ALLOC_VAL << index);
4841 			IXGBE_WRITE_REG(hw, IXGBE_IVAR_MISC, ivar);
4842 		} else {
4843 			/* tx or rx causes */
4844 			index = ((16 * (intr_alloc_entry & 1)) + (8 * cause));
4845 			ivar = IXGBE_READ_REG(hw,
4846 			    IXGBE_IVAR(intr_alloc_entry >> 1));
4847 			ivar &= ~(IXGBE_IVAR_ALLOC_VAL << index);
4848 			IXGBE_WRITE_REG(hw, IXGBE_IVAR(intr_alloc_entry >> 1),
4849 			    ivar);
4850 		}
4851 		break;
4852 
4853 	default:
4854 		break;
4855 	}
4856 }
4857 
4858 /*
4859  * Convert the rx ring index driver maintained to the rx ring index
4860  * in h/w.
4861  */
4862 static uint32_t
4863 ixgbe_get_hw_rx_index(ixgbe_t *ixgbe, uint32_t sw_rx_index)
4864 {
4865 
4866 	struct ixgbe_hw *hw = &ixgbe->hw;
4867 	uint32_t rx_ring_per_group, hw_rx_index;
4868 
4869 	if (ixgbe->classify_mode == IXGBE_CLASSIFY_RSS ||
4870 	    ixgbe->classify_mode == IXGBE_CLASSIFY_NONE) {
4871 		return (sw_rx_index);
4872 	} else if (ixgbe->classify_mode == IXGBE_CLASSIFY_VMDQ) {
4873 		switch (hw->mac.type) {
4874 		case ixgbe_mac_82598EB:
4875 			return (sw_rx_index);
4876 
4877 		case ixgbe_mac_82599EB:
4878 			return (sw_rx_index * 2);
4879 
4880 		default:
4881 			break;
4882 		}
4883 	} else if (ixgbe->classify_mode == IXGBE_CLASSIFY_VMDQ_RSS) {
4884 		rx_ring_per_group = ixgbe->num_rx_rings / ixgbe->num_rx_groups;
4885 
4886 		switch (hw->mac.type) {
4887 		case ixgbe_mac_82598EB:
4888 			hw_rx_index = (sw_rx_index / rx_ring_per_group) *
4889 			    16 + (sw_rx_index % rx_ring_per_group);
4890 			return (hw_rx_index);
4891 
4892 		case ixgbe_mac_82599EB:
4893 			if (ixgbe->num_rx_groups > 32) {
4894 				hw_rx_index = (sw_rx_index /
4895 				    rx_ring_per_group) * 2 +
4896 				    (sw_rx_index % rx_ring_per_group);
4897 			} else {
4898 				hw_rx_index = (sw_rx_index /
4899 				    rx_ring_per_group) * 4 +
4900 				    (sw_rx_index % rx_ring_per_group);
4901 			}
4902 			return (hw_rx_index);
4903 
4904 		default:
4905 			break;
4906 		}
4907 	}
4908 
4909 	/*
4910 	 * Should never reach. Just to make compiler happy.
4911 	 */
4912 	return (sw_rx_index);
4913 }
4914 
4915 /*
4916  * ixgbe_map_intrs_to_vectors - Map different interrupts to MSI-X vectors.
4917  *
4918  * For MSI-X, here will map rx interrupt, tx interrupt and other interrupt
4919  * to vector[0 - (intr_cnt -1)].
4920  */
4921 static int
4922 ixgbe_map_intrs_to_vectors(ixgbe_t *ixgbe)
4923 {
4924 	int i, vector = 0;
4925 
4926 	/* initialize vector map */
4927 	bzero(&ixgbe->vect_map, sizeof (ixgbe->vect_map));
4928 	for (i = 0; i < ixgbe->intr_cnt; i++) {
4929 		ixgbe->vect_map[i].ixgbe = ixgbe;
4930 	}
4931 
4932 	/*
4933 	 * non-MSI-X case is very simple: rx rings[0] on RTxQ[0],
4934 	 * tx rings[0] on RTxQ[1].
4935 	 */
4936 	if (ixgbe->intr_type != DDI_INTR_TYPE_MSIX) {
4937 		ixgbe_map_rxring_to_vector(ixgbe, 0, 0);
4938 		ixgbe_map_txring_to_vector(ixgbe, 0, 1);
4939 		return (IXGBE_SUCCESS);
4940 	}
4941 
4942 	/*
4943 	 * Interrupts/vectors mapping for MSI-X
4944 	 */
4945 
4946 	/*
4947 	 * Map other interrupt to vector 0,
4948 	 * Set bit in map and count the bits set.
4949 	 */
4950 	BT_SET(ixgbe->vect_map[vector].other_map, 0);
4951 	ixgbe->vect_map[vector].other_cnt++;
4952 
4953 	/*
4954 	 * Map rx ring interrupts to vectors
4955 	 */
4956 	for (i = 0; i < ixgbe->num_rx_rings; i++) {
4957 		ixgbe_map_rxring_to_vector(ixgbe, i, vector);
4958 		vector = (vector +1) % ixgbe->intr_cnt;
4959 	}
4960 
4961 	/*
4962 	 * Map tx ring interrupts to vectors
4963 	 */
4964 	for (i = 0; i < ixgbe->num_tx_rings; i++) {
4965 		ixgbe_map_txring_to_vector(ixgbe, i, vector);
4966 		vector = (vector +1) % ixgbe->intr_cnt;
4967 	}
4968 
4969 	return (IXGBE_SUCCESS);
4970 }
4971 
4972 /*
4973  * ixgbe_setup_adapter_vector - Setup the adapter interrupt vector(s).
4974  *
4975  * This relies on ring/vector mapping already set up in the
4976  * vect_map[] structures
4977  */
4978 static void
4979 ixgbe_setup_adapter_vector(ixgbe_t *ixgbe)
4980 {
4981 	struct ixgbe_hw *hw = &ixgbe->hw;
4982 	ixgbe_intr_vector_t *vect;	/* vector bitmap */
4983 	int r_idx;	/* ring index */
4984 	int v_idx;	/* vector index */
4985 	uint32_t hw_index;
4986 
4987 	/*
4988 	 * Clear any previous entries
4989 	 */
4990 	switch (hw->mac.type) {
4991 	case ixgbe_mac_82598EB:
4992 		for (v_idx = 0; v_idx < 25; v_idx++)
4993 			IXGBE_WRITE_REG(hw, IXGBE_IVAR(v_idx), 0);
4994 		break;
4995 
4996 	case ixgbe_mac_82599EB:
4997 		for (v_idx = 0; v_idx < 64; v_idx++)
4998 			IXGBE_WRITE_REG(hw, IXGBE_IVAR(v_idx), 0);
4999 		IXGBE_WRITE_REG(hw, IXGBE_IVAR_MISC, 0);
5000 		break;
5001 
5002 	default:
5003 		break;
5004 	}
5005 
5006 	/*
5007 	 * For non MSI-X interrupt, rx rings[0] will use RTxQ[0], and
5008 	 * tx rings[0] will use RTxQ[1].
5009 	 */
5010 	if (ixgbe->intr_type != DDI_INTR_TYPE_MSIX) {
5011 		ixgbe_setup_ivar(ixgbe, 0, 0, 0);
5012 		ixgbe_setup_ivar(ixgbe, 0, 1, 1);
5013 		return;
5014 	}
5015 
5016 	/*
5017 	 * For MSI-X interrupt, "Other" is always on vector[0].
5018 	 */
5019 	ixgbe_setup_ivar(ixgbe, IXGBE_IVAR_OTHER_CAUSES_INDEX, 0, -1);
5020 
5021 	/*
5022 	 * For each interrupt vector, populate the IVAR table
5023 	 */
5024 	for (v_idx = 0; v_idx < ixgbe->intr_cnt; v_idx++) {
5025 		vect = &ixgbe->vect_map[v_idx];
5026 
5027 		/*
5028 		 * For each rx ring bit set
5029 		 */
5030 		r_idx = bt_getlowbit(vect->rx_map, 0,
5031 		    (ixgbe->num_rx_rings - 1));
5032 
5033 		while (r_idx >= 0) {
5034 			hw_index = ixgbe->rx_rings[r_idx].hw_index;
5035 			ixgbe_setup_ivar(ixgbe, hw_index, v_idx, 0);
5036 			r_idx = bt_getlowbit(vect->rx_map, (r_idx + 1),
5037 			    (ixgbe->num_rx_rings - 1));
5038 		}
5039 
5040 		/*
5041 		 * For each tx ring bit set
5042 		 */
5043 		r_idx = bt_getlowbit(vect->tx_map, 0,
5044 		    (ixgbe->num_tx_rings - 1));
5045 
5046 		while (r_idx >= 0) {
5047 			ixgbe_setup_ivar(ixgbe, r_idx, v_idx, 1);
5048 			r_idx = bt_getlowbit(vect->tx_map, (r_idx + 1),
5049 			    (ixgbe->num_tx_rings - 1));
5050 		}
5051 	}
5052 }
5053 
5054 /*
5055  * ixgbe_rem_intr_handlers - Remove the interrupt handlers.
5056  */
5057 static void
5058 ixgbe_rem_intr_handlers(ixgbe_t *ixgbe)
5059 {
5060 	int i;
5061 	int rc;
5062 
5063 	for (i = 0; i < ixgbe->intr_cnt; i++) {
5064 		rc = ddi_intr_remove_handler(ixgbe->htable[i]);
5065 		if (rc != DDI_SUCCESS) {
5066 			IXGBE_DEBUGLOG_1(ixgbe,
5067 			    "Remove intr handler failed: %d", rc);
5068 		}
5069 	}
5070 }
5071 
5072 /*
5073  * ixgbe_rem_intrs - Remove the allocated interrupts.
5074  */
5075 static void
5076 ixgbe_rem_intrs(ixgbe_t *ixgbe)
5077 {
5078 	int i;
5079 	int rc;
5080 
5081 	for (i = 0; i < ixgbe->intr_cnt; i++) {
5082 		rc = ddi_intr_free(ixgbe->htable[i]);
5083 		if (rc != DDI_SUCCESS) {
5084 			IXGBE_DEBUGLOG_1(ixgbe,
5085 			    "Free intr failed: %d", rc);
5086 		}
5087 	}
5088 
5089 	kmem_free(ixgbe->htable, ixgbe->intr_size);
5090 	ixgbe->htable = NULL;
5091 }
5092 
5093 /*
5094  * ixgbe_enable_intrs - Enable all the ddi interrupts.
5095  */
5096 static int
5097 ixgbe_enable_intrs(ixgbe_t *ixgbe)
5098 {
5099 	int i;
5100 	int rc;
5101 
5102 	/*
5103 	 * Enable interrupts
5104 	 */
5105 	if (ixgbe->intr_cap & DDI_INTR_FLAG_BLOCK) {
5106 		/*
5107 		 * Call ddi_intr_block_enable() for MSI
5108 		 */
5109 		rc = ddi_intr_block_enable(ixgbe->htable, ixgbe->intr_cnt);
5110 		if (rc != DDI_SUCCESS) {
5111 			ixgbe_log(ixgbe,
5112 			    "Enable block intr failed: %d", rc);
5113 			return (IXGBE_FAILURE);
5114 		}
5115 	} else {
5116 		/*
5117 		 * Call ddi_intr_enable() for Legacy/MSI non block enable
5118 		 */
5119 		for (i = 0; i < ixgbe->intr_cnt; i++) {
5120 			rc = ddi_intr_enable(ixgbe->htable[i]);
5121 			if (rc != DDI_SUCCESS) {
5122 				ixgbe_log(ixgbe,
5123 				    "Enable intr failed: %d", rc);
5124 				return (IXGBE_FAILURE);
5125 			}
5126 		}
5127 	}
5128 
5129 	return (IXGBE_SUCCESS);
5130 }
5131 
5132 /*
5133  * ixgbe_disable_intrs - Disable all the interrupts.
5134  */
5135 static int
5136 ixgbe_disable_intrs(ixgbe_t *ixgbe)
5137 {
5138 	int i;
5139 	int rc;
5140 
5141 	/*
5142 	 * Disable all interrupts
5143 	 */
5144 	if (ixgbe->intr_cap & DDI_INTR_FLAG_BLOCK) {
5145 		rc = ddi_intr_block_disable(ixgbe->htable, ixgbe->intr_cnt);
5146 		if (rc != DDI_SUCCESS) {
5147 			ixgbe_log(ixgbe,
5148 			    "Disable block intr failed: %d", rc);
5149 			return (IXGBE_FAILURE);
5150 		}
5151 	} else {
5152 		for (i = 0; i < ixgbe->intr_cnt; i++) {
5153 			rc = ddi_intr_disable(ixgbe->htable[i]);
5154 			if (rc != DDI_SUCCESS) {
5155 				ixgbe_log(ixgbe,
5156 				    "Disable intr failed: %d", rc);
5157 				return (IXGBE_FAILURE);
5158 			}
5159 		}
5160 	}
5161 
5162 	return (IXGBE_SUCCESS);
5163 }
5164 
5165 /*
5166  * ixgbe_get_hw_state - Get and save parameters related to adapter hardware.
5167  */
5168 static void
5169 ixgbe_get_hw_state(ixgbe_t *ixgbe)
5170 {
5171 	struct ixgbe_hw *hw = &ixgbe->hw;
5172 	ixgbe_link_speed speed = IXGBE_LINK_SPEED_UNKNOWN;
5173 	boolean_t link_up = B_FALSE;
5174 	uint32_t pcs1g_anlp = 0;
5175 	uint32_t pcs1g_ana = 0;
5176 	boolean_t autoneg = B_FALSE;
5177 
5178 	ASSERT(mutex_owned(&ixgbe->gen_lock));
5179 	ixgbe->param_lp_1000fdx_cap = 0;
5180 	ixgbe->param_lp_100fdx_cap  = 0;
5181 
5182 	/* check for link, don't wait */
5183 	(void) ixgbe_check_link(hw, &speed, &link_up, false);
5184 	pcs1g_ana = IXGBE_READ_REG(hw, IXGBE_PCS1GANA);
5185 
5186 	if (link_up) {
5187 		pcs1g_anlp = IXGBE_READ_REG(hw, IXGBE_PCS1GANLP);
5188 
5189 		ixgbe->param_lp_1000fdx_cap =
5190 		    (pcs1g_anlp & IXGBE_PCS1GANLP_LPFD) ? 1 : 0;
5191 		ixgbe->param_lp_100fdx_cap =
5192 		    (pcs1g_anlp & IXGBE_PCS1GANLP_LPFD) ? 1 : 0;
5193 	}
5194 
5195 	(void) ixgbe_get_link_capabilities(hw, &speed, &autoneg);
5196 
5197 	ixgbe->param_adv_1000fdx_cap = ((pcs1g_ana & IXGBE_PCS1GANA_FDC) &&
5198 	    (speed & IXGBE_LINK_SPEED_1GB_FULL)) ? 1 : 0;
5199 	ixgbe->param_adv_100fdx_cap = ((pcs1g_ana & IXGBE_PCS1GANA_FDC) &&
5200 	    (speed & IXGBE_LINK_SPEED_100_FULL)) ? 1 : 0;
5201 }
5202 
5203 /*
5204  * ixgbe_get_driver_control - Notify that driver is in control of device.
5205  */
5206 static void
5207 ixgbe_get_driver_control(struct ixgbe_hw *hw)
5208 {
5209 	uint32_t ctrl_ext;
5210 
5211 	/*
5212 	 * Notify firmware that driver is in control of device
5213 	 */
5214 	ctrl_ext = IXGBE_READ_REG(hw, IXGBE_CTRL_EXT);
5215 	ctrl_ext |= IXGBE_CTRL_EXT_DRV_LOAD;
5216 	IXGBE_WRITE_REG(hw, IXGBE_CTRL_EXT, ctrl_ext);
5217 }
5218 
5219 /*
5220  * ixgbe_release_driver_control - Notify that driver is no longer in control
5221  * of device.
5222  */
5223 static void
5224 ixgbe_release_driver_control(struct ixgbe_hw *hw)
5225 {
5226 	uint32_t ctrl_ext;
5227 
5228 	/*
5229 	 * Notify firmware that driver is no longer in control of device
5230 	 */
5231 	ctrl_ext = IXGBE_READ_REG(hw, IXGBE_CTRL_EXT);
5232 	ctrl_ext &= ~IXGBE_CTRL_EXT_DRV_LOAD;
5233 	IXGBE_WRITE_REG(hw, IXGBE_CTRL_EXT, ctrl_ext);
5234 }
5235 
5236 /*
5237  * ixgbe_atomic_reserve - Atomic decrease operation.
5238  */
5239 int
5240 ixgbe_atomic_reserve(uint32_t *count_p, uint32_t n)
5241 {
5242 	uint32_t oldval;
5243 	uint32_t newval;
5244 
5245 	/*
5246 	 * ATOMICALLY
5247 	 */
5248 	do {
5249 		oldval = *count_p;
5250 		if (oldval < n)
5251 			return (-1);
5252 		newval = oldval - n;
5253 	} while (atomic_cas_32(count_p, oldval, newval) != oldval);
5254 
5255 	return (newval);
5256 }
5257 
5258 /*
5259  * ixgbe_mc_table_itr - Traverse the entries in the multicast table.
5260  */
5261 static uint8_t *
5262 ixgbe_mc_table_itr(struct ixgbe_hw *hw, uint8_t **upd_ptr, uint32_t *vmdq)
5263 {
5264 	uint8_t *addr = *upd_ptr;
5265 	uint8_t *new_ptr;
5266 
5267 	_NOTE(ARGUNUSED(hw));
5268 	_NOTE(ARGUNUSED(vmdq));
5269 
5270 	new_ptr = addr + IXGBE_ETH_LENGTH_OF_ADDRESS;
5271 	*upd_ptr = new_ptr;
5272 	return (addr);
5273 }
5274 
5275 /*
5276  * FMA support
5277  */
5278 int
5279 ixgbe_check_acc_handle(ddi_acc_handle_t handle)
5280 {
5281 	ddi_fm_error_t de;
5282 
5283 	ddi_fm_acc_err_get(handle, &de, DDI_FME_VERSION);
5284 	ddi_fm_acc_err_clear(handle, DDI_FME_VERSION);
5285 	return (de.fme_status);
5286 }
5287 
5288 int
5289 ixgbe_check_dma_handle(ddi_dma_handle_t handle)
5290 {
5291 	ddi_fm_error_t de;
5292 
5293 	ddi_fm_dma_err_get(handle, &de, DDI_FME_VERSION);
5294 	return (de.fme_status);
5295 }
5296 
5297 /*
5298  * ixgbe_fm_error_cb - The IO fault service error handling callback function.
5299  */
5300 static int
5301 ixgbe_fm_error_cb(dev_info_t *dip, ddi_fm_error_t *err, const void *impl_data)
5302 {
5303 	_NOTE(ARGUNUSED(impl_data));
5304 	/*
5305 	 * as the driver can always deal with an error in any dma or
5306 	 * access handle, we can just return the fme_status value.
5307 	 */
5308 	pci_ereport_post(dip, err, NULL);
5309 	return (err->fme_status);
5310 }
5311 
5312 static void
5313 ixgbe_fm_init(ixgbe_t *ixgbe)
5314 {
5315 	ddi_iblock_cookie_t iblk;
5316 	int fma_dma_flag;
5317 
5318 	/*
5319 	 * Only register with IO Fault Services if we have some capability
5320 	 */
5321 	if (ixgbe->fm_capabilities & DDI_FM_ACCCHK_CAPABLE) {
5322 		ixgbe_regs_acc_attr.devacc_attr_access = DDI_FLAGERR_ACC;
5323 	} else {
5324 		ixgbe_regs_acc_attr.devacc_attr_access = DDI_DEFAULT_ACC;
5325 	}
5326 
5327 	if (ixgbe->fm_capabilities & DDI_FM_DMACHK_CAPABLE) {
5328 		fma_dma_flag = 1;
5329 	} else {
5330 		fma_dma_flag = 0;
5331 	}
5332 
5333 	ixgbe_set_fma_flags(fma_dma_flag);
5334 
5335 	if (ixgbe->fm_capabilities) {
5336 
5337 		/*
5338 		 * Register capabilities with IO Fault Services
5339 		 */
5340 		ddi_fm_init(ixgbe->dip, &ixgbe->fm_capabilities, &iblk);
5341 
5342 		/*
5343 		 * Initialize pci ereport capabilities if ereport capable
5344 		 */
5345 		if (DDI_FM_EREPORT_CAP(ixgbe->fm_capabilities) ||
5346 		    DDI_FM_ERRCB_CAP(ixgbe->fm_capabilities))
5347 			pci_ereport_setup(ixgbe->dip);
5348 
5349 		/*
5350 		 * Register error callback if error callback capable
5351 		 */
5352 		if (DDI_FM_ERRCB_CAP(ixgbe->fm_capabilities))
5353 			ddi_fm_handler_register(ixgbe->dip,
5354 			    ixgbe_fm_error_cb, (void*) ixgbe);
5355 	}
5356 }
5357 
5358 static void
5359 ixgbe_fm_fini(ixgbe_t *ixgbe)
5360 {
5361 	/*
5362 	 * Only unregister FMA capabilities if they are registered
5363 	 */
5364 	if (ixgbe->fm_capabilities) {
5365 
5366 		/*
5367 		 * Release any resources allocated by pci_ereport_setup()
5368 		 */
5369 		if (DDI_FM_EREPORT_CAP(ixgbe->fm_capabilities) ||
5370 		    DDI_FM_ERRCB_CAP(ixgbe->fm_capabilities))
5371 			pci_ereport_teardown(ixgbe->dip);
5372 
5373 		/*
5374 		 * Un-register error callback if error callback capable
5375 		 */
5376 		if (DDI_FM_ERRCB_CAP(ixgbe->fm_capabilities))
5377 			ddi_fm_handler_unregister(ixgbe->dip);
5378 
5379 		/*
5380 		 * Unregister from IO Fault Service
5381 		 */
5382 		ddi_fm_fini(ixgbe->dip);
5383 	}
5384 }
5385 
5386 void
5387 ixgbe_fm_ereport(ixgbe_t *ixgbe, char *detail)
5388 {
5389 	uint64_t ena;
5390 	char buf[FM_MAX_CLASS];
5391 
5392 	(void) snprintf(buf, FM_MAX_CLASS, "%s.%s", DDI_FM_DEVICE, detail);
5393 	ena = fm_ena_generate(0, FM_ENA_FMT1);
5394 	if (DDI_FM_EREPORT_CAP(ixgbe->fm_capabilities)) {
5395 		ddi_fm_ereport_post(ixgbe->dip, buf, ena, DDI_NOSLEEP,
5396 		    FM_VERSION, DATA_TYPE_UINT8, FM_EREPORT_VERS0, NULL);
5397 	}
5398 }
5399 
5400 static int
5401 ixgbe_ring_start(mac_ring_driver_t rh, uint64_t mr_gen_num)
5402 {
5403 	ixgbe_rx_ring_t *rx_ring = (ixgbe_rx_ring_t *)rh;
5404 
5405 	mutex_enter(&rx_ring->rx_lock);
5406 	rx_ring->ring_gen_num = mr_gen_num;
5407 	mutex_exit(&rx_ring->rx_lock);
5408 	return (0);
5409 }
5410 
5411 /*
5412  * Get the global ring index by a ring index within a group.
5413  */
5414 static int
5415 ixgbe_get_rx_ring_index(ixgbe_t *ixgbe, int gindex, int rindex)
5416 {
5417 	ixgbe_rx_ring_t *rx_ring;
5418 	int i;
5419 
5420 	for (i = 0; i < ixgbe->num_rx_rings; i++) {
5421 		rx_ring = &ixgbe->rx_rings[i];
5422 		if (rx_ring->group_index == gindex)
5423 			rindex--;
5424 		if (rindex < 0)
5425 			return (i);
5426 	}
5427 
5428 	return (-1);
5429 }
5430 
5431 /*
5432  * Callback funtion for MAC layer to register all rings.
5433  */
5434 /* ARGSUSED */
5435 void
5436 ixgbe_fill_ring(void *arg, mac_ring_type_t rtype, const int group_index,
5437     const int ring_index, mac_ring_info_t *infop, mac_ring_handle_t rh)
5438 {
5439 	ixgbe_t *ixgbe = (ixgbe_t *)arg;
5440 	mac_intr_t *mintr = &infop->mri_intr;
5441 
5442 	switch (rtype) {
5443 	case MAC_RING_TYPE_RX: {
5444 		/*
5445 		 * 'index' is the ring index within the group.
5446 		 * Need to get the global ring index by searching in groups.
5447 		 */
5448 		int global_ring_index = ixgbe_get_rx_ring_index(
5449 		    ixgbe, group_index, ring_index);
5450 
5451 		ASSERT(global_ring_index >= 0);
5452 
5453 		ixgbe_rx_ring_t *rx_ring = &ixgbe->rx_rings[global_ring_index];
5454 		rx_ring->ring_handle = rh;
5455 
5456 		infop->mri_driver = (mac_ring_driver_t)rx_ring;
5457 		infop->mri_start = ixgbe_ring_start;
5458 		infop->mri_stop = NULL;
5459 		infop->mri_poll = ixgbe_ring_rx_poll;
5460 		infop->mri_stat = ixgbe_rx_ring_stat;
5461 
5462 		mintr->mi_handle = (mac_intr_handle_t)rx_ring;
5463 		mintr->mi_enable = ixgbe_rx_ring_intr_enable;
5464 		mintr->mi_disable = ixgbe_rx_ring_intr_disable;
5465 		if (ixgbe->intr_type &
5466 		    (DDI_INTR_TYPE_MSIX | DDI_INTR_TYPE_MSI)) {
5467 			mintr->mi_ddi_handle =
5468 			    ixgbe->htable[rx_ring->intr_vector];
5469 		}
5470 
5471 		break;
5472 	}
5473 	case MAC_RING_TYPE_TX: {
5474 		ASSERT(group_index == -1);
5475 		ASSERT(ring_index < ixgbe->num_tx_rings);
5476 
5477 		ixgbe_tx_ring_t *tx_ring = &ixgbe->tx_rings[ring_index];
5478 		tx_ring->ring_handle = rh;
5479 
5480 		infop->mri_driver = (mac_ring_driver_t)tx_ring;
5481 		infop->mri_start = NULL;
5482 		infop->mri_stop = NULL;
5483 		infop->mri_tx = ixgbe_ring_tx;
5484 		infop->mri_stat = ixgbe_tx_ring_stat;
5485 		if (ixgbe->intr_type &
5486 		    (DDI_INTR_TYPE_MSIX | DDI_INTR_TYPE_MSI)) {
5487 			mintr->mi_ddi_handle =
5488 			    ixgbe->htable[tx_ring->intr_vector];
5489 		}
5490 		break;
5491 	}
5492 	default:
5493 		break;
5494 	}
5495 }
5496 
5497 /*
5498  * Callback funtion for MAC layer to register all groups.
5499  */
5500 void
5501 ixgbe_fill_group(void *arg, mac_ring_type_t rtype, const int index,
5502     mac_group_info_t *infop, mac_group_handle_t gh)
5503 {
5504 	ixgbe_t *ixgbe = (ixgbe_t *)arg;
5505 
5506 	switch (rtype) {
5507 	case MAC_RING_TYPE_RX: {
5508 		ixgbe_rx_group_t *rx_group;
5509 
5510 		rx_group = &ixgbe->rx_groups[index];
5511 		rx_group->group_handle = gh;
5512 
5513 		infop->mgi_driver = (mac_group_driver_t)rx_group;
5514 		infop->mgi_start = NULL;
5515 		infop->mgi_stop = NULL;
5516 		infop->mgi_addmac = ixgbe_addmac;
5517 		infop->mgi_remmac = ixgbe_remmac;
5518 		infop->mgi_count = (ixgbe->num_rx_rings / ixgbe->num_rx_groups);
5519 
5520 		break;
5521 	}
5522 	case MAC_RING_TYPE_TX:
5523 		break;
5524 	default:
5525 		break;
5526 	}
5527 }
5528 
5529 /*
5530  * Enable interrupt on the specificed rx ring.
5531  */
5532 int
5533 ixgbe_rx_ring_intr_enable(mac_intr_handle_t intrh)
5534 {
5535 	ixgbe_rx_ring_t *rx_ring = (ixgbe_rx_ring_t *)intrh;
5536 	ixgbe_t *ixgbe = rx_ring->ixgbe;
5537 	int r_idx = rx_ring->index;
5538 	int hw_r_idx = rx_ring->hw_index;
5539 	int v_idx = rx_ring->intr_vector;
5540 
5541 	mutex_enter(&ixgbe->gen_lock);
5542 	if (ixgbe->ixgbe_state & IXGBE_INTR_ADJUST) {
5543 		mutex_exit(&ixgbe->gen_lock);
5544 		/*
5545 		 * Simply return 0.
5546 		 * Interrupts are being adjusted. ixgbe_intr_adjust()
5547 		 * will eventually re-enable the interrupt when it's
5548 		 * done with the adjustment.
5549 		 */
5550 		return (0);
5551 	}
5552 
5553 	/*
5554 	 * To enable interrupt by setting the VAL bit of given interrupt
5555 	 * vector allocation register (IVAR).
5556 	 */
5557 	ixgbe_enable_ivar(ixgbe, hw_r_idx, 0);
5558 
5559 	BT_SET(ixgbe->vect_map[v_idx].rx_map, r_idx);
5560 
5561 	/*
5562 	 * Trigger a Rx interrupt on this ring
5563 	 */
5564 	IXGBE_WRITE_REG(&ixgbe->hw, IXGBE_EICS, (1 << v_idx));
5565 	IXGBE_WRITE_FLUSH(&ixgbe->hw);
5566 
5567 	mutex_exit(&ixgbe->gen_lock);
5568 
5569 	return (0);
5570 }
5571 
5572 /*
5573  * Disable interrupt on the specificed rx ring.
5574  */
5575 int
5576 ixgbe_rx_ring_intr_disable(mac_intr_handle_t intrh)
5577 {
5578 	ixgbe_rx_ring_t *rx_ring = (ixgbe_rx_ring_t *)intrh;
5579 	ixgbe_t *ixgbe = rx_ring->ixgbe;
5580 	int r_idx = rx_ring->index;
5581 	int hw_r_idx = rx_ring->hw_index;
5582 	int v_idx = rx_ring->intr_vector;
5583 
5584 	mutex_enter(&ixgbe->gen_lock);
5585 	if (ixgbe->ixgbe_state & IXGBE_INTR_ADJUST) {
5586 		mutex_exit(&ixgbe->gen_lock);
5587 		/*
5588 		 * Simply return 0.
5589 		 * In the rare case where an interrupt is being
5590 		 * disabled while interrupts are being adjusted,
5591 		 * we don't fail the operation. No interrupts will
5592 		 * be generated while they are adjusted, and
5593 		 * ixgbe_intr_adjust() will cause the interrupts
5594 		 * to be re-enabled once it completes. Note that
5595 		 * in this case, packets may be delivered to the
5596 		 * stack via interrupts before xgbe_rx_ring_intr_enable()
5597 		 * is called again. This is acceptable since interrupt
5598 		 * adjustment is infrequent, and the stack will be
5599 		 * able to handle these packets.
5600 		 */
5601 		return (0);
5602 	}
5603 
5604 	/*
5605 	 * To disable interrupt by clearing the VAL bit of given interrupt
5606 	 * vector allocation register (IVAR).
5607 	 */
5608 	ixgbe_disable_ivar(ixgbe, hw_r_idx, 0);
5609 
5610 	BT_CLEAR(ixgbe->vect_map[v_idx].rx_map, r_idx);
5611 
5612 	mutex_exit(&ixgbe->gen_lock);
5613 
5614 	return (0);
5615 }
5616 
5617 /*
5618  * Add a mac address.
5619  */
5620 static int
5621 ixgbe_addmac(void *arg, const uint8_t *mac_addr)
5622 {
5623 	ixgbe_rx_group_t *rx_group = (ixgbe_rx_group_t *)arg;
5624 	ixgbe_t *ixgbe = rx_group->ixgbe;
5625 	struct ixgbe_hw *hw = &ixgbe->hw;
5626 	int slot, i;
5627 
5628 	mutex_enter(&ixgbe->gen_lock);
5629 
5630 	if (ixgbe->ixgbe_state & IXGBE_SUSPENDED) {
5631 		mutex_exit(&ixgbe->gen_lock);
5632 		return (ECANCELED);
5633 	}
5634 
5635 	if (ixgbe->unicst_avail == 0) {
5636 		/* no slots available */
5637 		mutex_exit(&ixgbe->gen_lock);
5638 		return (ENOSPC);
5639 	}
5640 
5641 	/*
5642 	 * The first ixgbe->num_rx_groups slots are reserved for each respective
5643 	 * group. The rest slots are shared by all groups. While adding a
5644 	 * MAC address, reserved slots are firstly checked then the shared
5645 	 * slots are searched.
5646 	 */
5647 	slot = -1;
5648 	if (ixgbe->unicst_addr[rx_group->index].mac.set == 1) {
5649 		for (i = ixgbe->num_rx_groups; i < ixgbe->unicst_total; i++) {
5650 			if (ixgbe->unicst_addr[i].mac.set == 0) {
5651 				slot = i;
5652 				break;
5653 			}
5654 		}
5655 	} else {
5656 		slot = rx_group->index;
5657 	}
5658 
5659 	if (slot == -1) {
5660 		/* no slots available */
5661 		mutex_exit(&ixgbe->gen_lock);
5662 		return (ENOSPC);
5663 	}
5664 
5665 	bcopy(mac_addr, ixgbe->unicst_addr[slot].mac.addr, ETHERADDRL);
5666 	(void) ixgbe_set_rar(hw, slot, ixgbe->unicst_addr[slot].mac.addr,
5667 	    rx_group->index, IXGBE_RAH_AV);
5668 	ixgbe->unicst_addr[slot].mac.set = 1;
5669 	ixgbe->unicst_addr[slot].mac.group_index = rx_group->index;
5670 	ixgbe->unicst_avail--;
5671 
5672 	mutex_exit(&ixgbe->gen_lock);
5673 
5674 	return (0);
5675 }
5676 
5677 /*
5678  * Remove a mac address.
5679  */
5680 static int
5681 ixgbe_remmac(void *arg, const uint8_t *mac_addr)
5682 {
5683 	ixgbe_rx_group_t *rx_group = (ixgbe_rx_group_t *)arg;
5684 	ixgbe_t *ixgbe = rx_group->ixgbe;
5685 	struct ixgbe_hw *hw = &ixgbe->hw;
5686 	int slot;
5687 
5688 	mutex_enter(&ixgbe->gen_lock);
5689 
5690 	if (ixgbe->ixgbe_state & IXGBE_SUSPENDED) {
5691 		mutex_exit(&ixgbe->gen_lock);
5692 		return (ECANCELED);
5693 	}
5694 
5695 	slot = ixgbe_unicst_find(ixgbe, mac_addr);
5696 	if (slot == -1) {
5697 		mutex_exit(&ixgbe->gen_lock);
5698 		return (EINVAL);
5699 	}
5700 
5701 	if (ixgbe->unicst_addr[slot].mac.set == 0) {
5702 		mutex_exit(&ixgbe->gen_lock);
5703 		return (EINVAL);
5704 	}
5705 
5706 	bzero(ixgbe->unicst_addr[slot].mac.addr, ETHERADDRL);
5707 	(void) ixgbe_clear_rar(hw, slot);
5708 	ixgbe->unicst_addr[slot].mac.set = 0;
5709 	ixgbe->unicst_avail++;
5710 
5711 	mutex_exit(&ixgbe->gen_lock);
5712 
5713 	return (0);
5714 }
5715