1 /*
2 * CDDL HEADER START
3 *
4 * The contents of this file are subject to the terms of the
5 * Common Development and Distribution License (the "License").
6 * You may not use this file except in compliance with the License.
7 *
8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9 * or http://www.opensolaris.org/os/licensing.
10 * See the License for the specific language governing permissions
11 * and limitations under the License.
12 *
13 * When distributing Covered Code, include this CDDL HEADER in each
14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15 * If applicable, add the following below this CDDL HEADER, with the
16 * fields enclosed by brackets "[]" replaced with your own identifying
17 * information: Portions Copyright [yyyy] [name of copyright owner]
18 *
19 * CDDL HEADER END
20 */
21
22 /*
23 * Copyright(c) 2007-2010 Intel Corporation. All rights reserved.
24 */
25
26 /*
27 * Copyright (c) 2008, 2010, Oracle and/or its affiliates. All rights reserved.
28 * Copyright (c) 2017, Joyent, Inc.
29 * Copyright 2012 Nexenta Systems, Inc. All rights reserved.
30 * Copyright (c) 2013 Saso Kiselkov. All rights reserved.
31 * Copyright (c) 2013 OSN Online Service Nuernberg GmbH. All rights reserved.
32 * Copyright 2016 OmniTI Computer Consulting, Inc. All rights reserved.
33 */
34
35 #include "ixgbe_sw.h"
36
37 static char ixgbe_ident[] = "Intel 10Gb Ethernet";
38
39 /*
40 * Local function protoypes
41 */
42 static int ixgbe_register_mac(ixgbe_t *);
43 static int ixgbe_identify_hardware(ixgbe_t *);
44 static int ixgbe_regs_map(ixgbe_t *);
45 static void ixgbe_init_properties(ixgbe_t *);
46 static int ixgbe_init_driver_settings(ixgbe_t *);
47 static void ixgbe_init_locks(ixgbe_t *);
48 static void ixgbe_destroy_locks(ixgbe_t *);
49 static int ixgbe_init(ixgbe_t *);
50 static int ixgbe_chip_start(ixgbe_t *);
51 static void ixgbe_chip_stop(ixgbe_t *);
52 static int ixgbe_reset(ixgbe_t *);
53 static void ixgbe_tx_clean(ixgbe_t *);
54 static boolean_t ixgbe_tx_drain(ixgbe_t *);
55 static boolean_t ixgbe_rx_drain(ixgbe_t *);
56 static int ixgbe_alloc_rings(ixgbe_t *);
57 static void ixgbe_free_rings(ixgbe_t *);
58 static int ixgbe_alloc_rx_data(ixgbe_t *);
59 static void ixgbe_free_rx_data(ixgbe_t *);
60 static void ixgbe_setup_rings(ixgbe_t *);
61 static void ixgbe_setup_rx(ixgbe_t *);
62 static void ixgbe_setup_tx(ixgbe_t *);
63 static void ixgbe_setup_rx_ring(ixgbe_rx_ring_t *);
64 static void ixgbe_setup_tx_ring(ixgbe_tx_ring_t *);
65 static void ixgbe_setup_rss(ixgbe_t *);
66 static void ixgbe_setup_vmdq(ixgbe_t *);
67 static void ixgbe_setup_vmdq_rss(ixgbe_t *);
68 static void ixgbe_setup_rss_table(ixgbe_t *);
69 static void ixgbe_init_unicst(ixgbe_t *);
70 static int ixgbe_unicst_find(ixgbe_t *, const uint8_t *);
71 static void ixgbe_setup_multicst(ixgbe_t *);
72 static void ixgbe_get_hw_state(ixgbe_t *);
73 static void ixgbe_setup_vmdq_rss_conf(ixgbe_t *ixgbe);
74 static void ixgbe_get_conf(ixgbe_t *);
75 static void ixgbe_init_params(ixgbe_t *);
76 static int ixgbe_get_prop(ixgbe_t *, char *, int, int, int);
77 static void ixgbe_driver_link_check(ixgbe_t *);
78 static void ixgbe_sfp_check(void *);
79 static void ixgbe_overtemp_check(void *);
80 static void ixgbe_phy_check(void *);
81 static void ixgbe_link_timer(void *);
82 static void ixgbe_local_timer(void *);
83 static void ixgbe_arm_watchdog_timer(ixgbe_t *);
84 static void ixgbe_restart_watchdog_timer(ixgbe_t *);
85 static void ixgbe_disable_adapter_interrupts(ixgbe_t *);
86 static void ixgbe_enable_adapter_interrupts(ixgbe_t *);
87 static boolean_t is_valid_mac_addr(uint8_t *);
88 static boolean_t ixgbe_stall_check(ixgbe_t *);
89 static boolean_t ixgbe_set_loopback_mode(ixgbe_t *, uint32_t);
90 static void ixgbe_set_internal_mac_loopback(ixgbe_t *);
91 static boolean_t ixgbe_find_mac_address(ixgbe_t *);
92 static int ixgbe_alloc_intrs(ixgbe_t *);
93 static int ixgbe_alloc_intr_handles(ixgbe_t *, int);
94 static int ixgbe_add_intr_handlers(ixgbe_t *);
95 static void ixgbe_map_rxring_to_vector(ixgbe_t *, int, int);
96 static void ixgbe_map_txring_to_vector(ixgbe_t *, int, int);
97 static void ixgbe_setup_ivar(ixgbe_t *, uint16_t, uint8_t, int8_t);
98 static void ixgbe_enable_ivar(ixgbe_t *, uint16_t, int8_t);
99 static void ixgbe_disable_ivar(ixgbe_t *, uint16_t, int8_t);
100 static uint32_t ixgbe_get_hw_rx_index(ixgbe_t *ixgbe, uint32_t sw_rx_index);
101 static int ixgbe_map_intrs_to_vectors(ixgbe_t *);
102 static void ixgbe_setup_adapter_vector(ixgbe_t *);
103 static void ixgbe_rem_intr_handlers(ixgbe_t *);
104 static void ixgbe_rem_intrs(ixgbe_t *);
105 static int ixgbe_enable_intrs(ixgbe_t *);
106 static int ixgbe_disable_intrs(ixgbe_t *);
107 static uint_t ixgbe_intr_legacy(void *, void *);
108 static uint_t ixgbe_intr_msi(void *, void *);
109 static uint_t ixgbe_intr_msix(void *, void *);
110 static void ixgbe_intr_rx_work(ixgbe_rx_ring_t *);
111 static void ixgbe_intr_tx_work(ixgbe_tx_ring_t *);
112 static void ixgbe_intr_other_work(ixgbe_t *, uint32_t);
113 static void ixgbe_get_driver_control(struct ixgbe_hw *);
114 static int ixgbe_addmac(void *, const uint8_t *);
115 static int ixgbe_remmac(void *, const uint8_t *);
116 static void ixgbe_release_driver_control(struct ixgbe_hw *);
117
118 static int ixgbe_attach(dev_info_t *, ddi_attach_cmd_t);
119 static int ixgbe_detach(dev_info_t *, ddi_detach_cmd_t);
120 static int ixgbe_resume(dev_info_t *);
121 static int ixgbe_suspend(dev_info_t *);
122 static int ixgbe_quiesce(dev_info_t *);
123 static void ixgbe_unconfigure(dev_info_t *, ixgbe_t *);
124 static uint8_t *ixgbe_mc_table_itr(struct ixgbe_hw *, uint8_t **, uint32_t *);
125 static int ixgbe_cbfunc(dev_info_t *, ddi_cb_action_t, void *, void *, void *);
126 static int ixgbe_intr_cb_register(ixgbe_t *);
127 static int ixgbe_intr_adjust(ixgbe_t *, ddi_cb_action_t, int);
128
129 static int ixgbe_fm_error_cb(dev_info_t *dip, ddi_fm_error_t *err,
130 const void *impl_data);
131 static void ixgbe_fm_init(ixgbe_t *);
132 static void ixgbe_fm_fini(ixgbe_t *);
133
134 char *ixgbe_priv_props[] = {
135 "_tx_copy_thresh",
136 "_tx_recycle_thresh",
137 "_tx_overload_thresh",
138 "_tx_resched_thresh",
139 "_rx_copy_thresh",
140 "_rx_limit_per_intr",
141 "_intr_throttling",
142 "_adv_pause_cap",
143 "_adv_asym_pause_cap",
144 NULL
145 };
146
147 #define IXGBE_MAX_PRIV_PROPS \
148 (sizeof (ixgbe_priv_props) / sizeof (mac_priv_prop_t))
149
150 static struct cb_ops ixgbe_cb_ops = {
151 nulldev, /* cb_open */
152 nulldev, /* cb_close */
153 nodev, /* cb_strategy */
154 nodev, /* cb_print */
155 nodev, /* cb_dump */
156 nodev, /* cb_read */
157 nodev, /* cb_write */
158 nodev, /* cb_ioctl */
159 nodev, /* cb_devmap */
160 nodev, /* cb_mmap */
161 nodev, /* cb_segmap */
162 nochpoll, /* cb_chpoll */
163 ddi_prop_op, /* cb_prop_op */
164 NULL, /* cb_stream */
165 D_MP | D_HOTPLUG, /* cb_flag */
166 CB_REV, /* cb_rev */
167 nodev, /* cb_aread */
168 nodev /* cb_awrite */
169 };
170
171 static struct dev_ops ixgbe_dev_ops = {
172 DEVO_REV, /* devo_rev */
173 0, /* devo_refcnt */
174 NULL, /* devo_getinfo */
175 nulldev, /* devo_identify */
176 nulldev, /* devo_probe */
177 ixgbe_attach, /* devo_attach */
178 ixgbe_detach, /* devo_detach */
179 nodev, /* devo_reset */
180 &ixgbe_cb_ops, /* devo_cb_ops */
181 NULL, /* devo_bus_ops */
182 ddi_power, /* devo_power */
183 ixgbe_quiesce, /* devo_quiesce */
184 };
185
186 static struct modldrv ixgbe_modldrv = {
187 &mod_driverops, /* Type of module. This one is a driver */
188 ixgbe_ident, /* Discription string */
189 &ixgbe_dev_ops /* driver ops */
190 };
191
192 static struct modlinkage ixgbe_modlinkage = {
193 MODREV_1, &ixgbe_modldrv, NULL
194 };
195
196 /*
197 * Access attributes for register mapping
198 */
199 ddi_device_acc_attr_t ixgbe_regs_acc_attr = {
200 DDI_DEVICE_ATTR_V1,
201 DDI_STRUCTURE_LE_ACC,
202 DDI_STRICTORDER_ACC,
203 DDI_FLAGERR_ACC
204 };
205
206 /*
207 * Loopback property
208 */
209 static lb_property_t lb_normal = {
210 normal, "normal", IXGBE_LB_NONE
211 };
212
213 static lb_property_t lb_mac = {
214 internal, "MAC", IXGBE_LB_INTERNAL_MAC
215 };
216
217 static lb_property_t lb_external = {
218 external, "External", IXGBE_LB_EXTERNAL
219 };
220
221 #define IXGBE_M_CALLBACK_FLAGS \
222 (MC_IOCTL | MC_GETCAPAB | MC_SETPROP | MC_GETPROP | MC_PROPINFO)
223
224 static mac_callbacks_t ixgbe_m_callbacks = {
225 IXGBE_M_CALLBACK_FLAGS,
226 ixgbe_m_stat,
227 ixgbe_m_start,
228 ixgbe_m_stop,
229 ixgbe_m_promisc,
230 ixgbe_m_multicst,
231 NULL,
232 NULL,
233 NULL,
234 ixgbe_m_ioctl,
235 ixgbe_m_getcapab,
236 NULL,
237 NULL,
238 ixgbe_m_setprop,
239 ixgbe_m_getprop,
240 ixgbe_m_propinfo
241 };
242
243 /*
244 * Initialize capabilities of each supported adapter type
245 */
246 static adapter_info_t ixgbe_82598eb_cap = {
247 64, /* maximum number of rx queues */
248 1, /* minimum number of rx queues */
249 64, /* default number of rx queues */
250 16, /* maximum number of rx groups */
251 1, /* minimum number of rx groups */
252 1, /* default number of rx groups */
253 32, /* maximum number of tx queues */
254 1, /* minimum number of tx queues */
255 8, /* default number of tx queues */
256 16366, /* maximum MTU size */
257 0xFFFF, /* maximum interrupt throttle rate */
258 0, /* minimum interrupt throttle rate */
259 200, /* default interrupt throttle rate */
260 18, /* maximum total msix vectors */
261 16, /* maximum number of ring vectors */
262 2, /* maximum number of other vectors */
263 IXGBE_EICR_LSC, /* "other" interrupt types handled */
264 0, /* "other" interrupt types enable mask */
265 (IXGBE_FLAG_DCA_CAPABLE /* capability flags */
266 | IXGBE_FLAG_RSS_CAPABLE
267 | IXGBE_FLAG_VMDQ_CAPABLE)
268 };
269
270 static adapter_info_t ixgbe_82599eb_cap = {
271 128, /* maximum number of rx queues */
272 1, /* minimum number of rx queues */
273 128, /* default number of rx queues */
274 64, /* maximum number of rx groups */
275 1, /* minimum number of rx groups */
276 1, /* default number of rx groups */
277 128, /* maximum number of tx queues */
278 1, /* minimum number of tx queues */
279 8, /* default number of tx queues */
280 15500, /* maximum MTU size */
281 0xFF8, /* maximum interrupt throttle rate */
282 0, /* minimum interrupt throttle rate */
283 200, /* default interrupt throttle rate */
284 64, /* maximum total msix vectors */
285 16, /* maximum number of ring vectors */
286 2, /* maximum number of other vectors */
287 (IXGBE_EICR_LSC
288 | IXGBE_EICR_GPI_SDP1
289 | IXGBE_EICR_GPI_SDP2), /* "other" interrupt types handled */
290
291 (IXGBE_SDP1_GPIEN
292 | IXGBE_SDP2_GPIEN), /* "other" interrupt types enable mask */
293
294 (IXGBE_FLAG_DCA_CAPABLE
295 | IXGBE_FLAG_RSS_CAPABLE
296 | IXGBE_FLAG_VMDQ_CAPABLE
297 | IXGBE_FLAG_RSC_CAPABLE
298 | IXGBE_FLAG_SFP_PLUG_CAPABLE) /* capability flags */
299 };
300
301 static adapter_info_t ixgbe_X540_cap = {
302 128, /* maximum number of rx queues */
303 1, /* minimum number of rx queues */
304 128, /* default number of rx queues */
305 64, /* maximum number of rx groups */
306 1, /* minimum number of rx groups */
307 1, /* default number of rx groups */
308 128, /* maximum number of tx queues */
309 1, /* minimum number of tx queues */
310 8, /* default number of tx queues */
311 15500, /* maximum MTU size */
312 0xFF8, /* maximum interrupt throttle rate */
313 0, /* minimum interrupt throttle rate */
314 200, /* default interrupt throttle rate */
315 64, /* maximum total msix vectors */
316 16, /* maximum number of ring vectors */
317 2, /* maximum number of other vectors */
318 (IXGBE_EICR_LSC
319 | IXGBE_EICR_GPI_SDP1_X540
320 | IXGBE_EICR_GPI_SDP2_X540), /* "other" interrupt types handled */
321
322 (IXGBE_SDP1_GPIEN_X540
323 | IXGBE_SDP2_GPIEN_X540), /* "other" interrupt types enable mask */
324
325 (IXGBE_FLAG_DCA_CAPABLE
326 | IXGBE_FLAG_RSS_CAPABLE
327 | IXGBE_FLAG_VMDQ_CAPABLE
328 | IXGBE_FLAG_RSC_CAPABLE) /* capability flags */
329 };
330
331 static adapter_info_t ixgbe_X550_cap = {
332 128, /* maximum number of rx queues */
333 1, /* minimum number of rx queues */
334 128, /* default number of rx queues */
335 64, /* maximum number of rx groups */
336 1, /* minimum number of rx groups */
337 1, /* default number of rx groups */
338 128, /* maximum number of tx queues */
339 1, /* minimum number of tx queues */
340 8, /* default number of tx queues */
341 15500, /* maximum MTU size */
342 0xFF8, /* maximum interrupt throttle rate */
343 0, /* minimum interrupt throttle rate */
344 0x200, /* default interrupt throttle rate */
345 64, /* maximum total msix vectors */
346 16, /* maximum number of ring vectors */
347 2, /* maximum number of other vectors */
348 IXGBE_EICR_LSC, /* "other" interrupt types handled */
349 0, /* "other" interrupt types enable mask */
350 (IXGBE_FLAG_RSS_CAPABLE
351 | IXGBE_FLAG_VMDQ_CAPABLE
352 | IXGBE_FLAG_RSC_CAPABLE) /* capability flags */
353 };
354
355 /*
356 * Module Initialization Functions.
357 */
358
359 int
_init(void)360 _init(void)
361 {
362 int status;
363
364 mac_init_ops(&ixgbe_dev_ops, MODULE_NAME);
365
366 status = mod_install(&ixgbe_modlinkage);
367
368 if (status != DDI_SUCCESS) {
369 mac_fini_ops(&ixgbe_dev_ops);
370 }
371
372 return (status);
373 }
374
375 int
_fini(void)376 _fini(void)
377 {
378 int status;
379
380 status = mod_remove(&ixgbe_modlinkage);
381
382 if (status == DDI_SUCCESS) {
383 mac_fini_ops(&ixgbe_dev_ops);
384 }
385
386 return (status);
387 }
388
389 int
_info(struct modinfo * modinfop)390 _info(struct modinfo *modinfop)
391 {
392 int status;
393
394 status = mod_info(&ixgbe_modlinkage, modinfop);
395
396 return (status);
397 }
398
399 /*
400 * ixgbe_attach - Driver attach.
401 *
402 * This function is the device specific initialization entry
403 * point. This entry point is required and must be written.
404 * The DDI_ATTACH command must be provided in the attach entry
405 * point. When attach() is called with cmd set to DDI_ATTACH,
406 * all normal kernel services (such as kmem_alloc(9F)) are
407 * available for use by the driver.
408 *
409 * The attach() function will be called once for each instance
410 * of the device on the system with cmd set to DDI_ATTACH.
411 * Until attach() succeeds, the only driver entry points which
412 * may be called are open(9E) and getinfo(9E).
413 */
414 static int
ixgbe_attach(dev_info_t * devinfo,ddi_attach_cmd_t cmd)415 ixgbe_attach(dev_info_t *devinfo, ddi_attach_cmd_t cmd)
416 {
417 ixgbe_t *ixgbe;
418 struct ixgbe_osdep *osdep;
419 struct ixgbe_hw *hw;
420 int instance;
421 char taskqname[32];
422
423 /*
424 * Check the command and perform corresponding operations
425 */
426 switch (cmd) {
427 default:
428 return (DDI_FAILURE);
429
430 case DDI_RESUME:
431 return (ixgbe_resume(devinfo));
432
433 case DDI_ATTACH:
434 break;
435 }
436
437 /* Get the device instance */
438 instance = ddi_get_instance(devinfo);
439
440 /* Allocate memory for the instance data structure */
441 ixgbe = kmem_zalloc(sizeof (ixgbe_t), KM_SLEEP);
442
443 ixgbe->dip = devinfo;
444 ixgbe->instance = instance;
445
446 hw = &ixgbe->hw;
447 osdep = &ixgbe->osdep;
448 hw->back = osdep;
449 osdep->ixgbe = ixgbe;
450
451 /* Attach the instance pointer to the dev_info data structure */
452 ddi_set_driver_private(devinfo, ixgbe);
453
454 /*
455 * Initialize for FMA support
456 */
457 ixgbe->fm_capabilities = ixgbe_get_prop(ixgbe, PROP_FM_CAPABLE,
458 0, 0x0f, DDI_FM_EREPORT_CAPABLE | DDI_FM_ACCCHK_CAPABLE |
459 DDI_FM_DMACHK_CAPABLE | DDI_FM_ERRCB_CAPABLE);
460 ixgbe_fm_init(ixgbe);
461 ixgbe->attach_progress |= ATTACH_PROGRESS_FM_INIT;
462
463 /*
464 * Map PCI config space registers
465 */
466 if (pci_config_setup(devinfo, &osdep->cfg_handle) != DDI_SUCCESS) {
467 ixgbe_error(ixgbe, "Failed to map PCI configurations");
468 goto attach_fail;
469 }
470 ixgbe->attach_progress |= ATTACH_PROGRESS_PCI_CONFIG;
471
472 /*
473 * Identify the chipset family
474 */
475 if (ixgbe_identify_hardware(ixgbe) != IXGBE_SUCCESS) {
476 ixgbe_error(ixgbe, "Failed to identify hardware");
477 goto attach_fail;
478 }
479
480 /*
481 * Map device registers
482 */
483 if (ixgbe_regs_map(ixgbe) != IXGBE_SUCCESS) {
484 ixgbe_error(ixgbe, "Failed to map device registers");
485 goto attach_fail;
486 }
487 ixgbe->attach_progress |= ATTACH_PROGRESS_REGS_MAP;
488
489 /*
490 * Initialize driver parameters
491 */
492 ixgbe_init_properties(ixgbe);
493 ixgbe->attach_progress |= ATTACH_PROGRESS_PROPS;
494
495 /*
496 * Register interrupt callback
497 */
498 if (ixgbe_intr_cb_register(ixgbe) != IXGBE_SUCCESS) {
499 ixgbe_error(ixgbe, "Failed to register interrupt callback");
500 goto attach_fail;
501 }
502
503 /*
504 * Allocate interrupts
505 */
506 if (ixgbe_alloc_intrs(ixgbe) != IXGBE_SUCCESS) {
507 ixgbe_error(ixgbe, "Failed to allocate interrupts");
508 goto attach_fail;
509 }
510 ixgbe->attach_progress |= ATTACH_PROGRESS_ALLOC_INTR;
511
512 /*
513 * Allocate rx/tx rings based on the ring numbers.
514 * The actual numbers of rx/tx rings are decided by the number of
515 * allocated interrupt vectors, so we should allocate the rings after
516 * interrupts are allocated.
517 */
518 if (ixgbe_alloc_rings(ixgbe) != IXGBE_SUCCESS) {
519 ixgbe_error(ixgbe, "Failed to allocate rx and tx rings");
520 goto attach_fail;
521 }
522 ixgbe->attach_progress |= ATTACH_PROGRESS_ALLOC_RINGS;
523
524 /*
525 * Map rings to interrupt vectors
526 */
527 if (ixgbe_map_intrs_to_vectors(ixgbe) != IXGBE_SUCCESS) {
528 ixgbe_error(ixgbe, "Failed to map interrupts to vectors");
529 goto attach_fail;
530 }
531
532 /*
533 * Add interrupt handlers
534 */
535 if (ixgbe_add_intr_handlers(ixgbe) != IXGBE_SUCCESS) {
536 ixgbe_error(ixgbe, "Failed to add interrupt handlers");
537 goto attach_fail;
538 }
539 ixgbe->attach_progress |= ATTACH_PROGRESS_ADD_INTR;
540
541 /*
542 * Create a taskq for sfp-change
543 */
544 (void) sprintf(taskqname, "ixgbe%d_sfp_taskq", instance);
545 if ((ixgbe->sfp_taskq = ddi_taskq_create(devinfo, taskqname,
546 1, TASKQ_DEFAULTPRI, 0)) == NULL) {
547 ixgbe_error(ixgbe, "sfp_taskq create failed");
548 goto attach_fail;
549 }
550 ixgbe->attach_progress |= ATTACH_PROGRESS_SFP_TASKQ;
551
552 /*
553 * Create a taskq for over-temp
554 */
555 (void) sprintf(taskqname, "ixgbe%d_overtemp_taskq", instance);
556 if ((ixgbe->overtemp_taskq = ddi_taskq_create(devinfo, taskqname,
557 1, TASKQ_DEFAULTPRI, 0)) == NULL) {
558 ixgbe_error(ixgbe, "overtemp_taskq create failed");
559 goto attach_fail;
560 }
561 ixgbe->attach_progress |= ATTACH_PROGRESS_OVERTEMP_TASKQ;
562
563 /*
564 * Create a taskq for processing external PHY interrupts
565 */
566 (void) sprintf(taskqname, "ixgbe%d_phy_taskq", instance);
567 if ((ixgbe->phy_taskq = ddi_taskq_create(devinfo, taskqname,
568 1, TASKQ_DEFAULTPRI, 0)) == NULL) {
569 ixgbe_error(ixgbe, "phy_taskq create failed");
570 goto attach_fail;
571 }
572 ixgbe->attach_progress |= ATTACH_PROGRESS_PHY_TASKQ;
573
574 /*
575 * Initialize driver parameters
576 */
577 if (ixgbe_init_driver_settings(ixgbe) != IXGBE_SUCCESS) {
578 ixgbe_error(ixgbe, "Failed to initialize driver settings");
579 goto attach_fail;
580 }
581
582 /*
583 * Initialize mutexes for this device.
584 * Do this before enabling the interrupt handler and
585 * register the softint to avoid the condition where
586 * interrupt handler can try using uninitialized mutex.
587 */
588 ixgbe_init_locks(ixgbe);
589 ixgbe->attach_progress |= ATTACH_PROGRESS_LOCKS;
590
591 /*
592 * Initialize chipset hardware
593 */
594 if (ixgbe_init(ixgbe) != IXGBE_SUCCESS) {
595 ixgbe_error(ixgbe, "Failed to initialize adapter");
596 goto attach_fail;
597 }
598 ixgbe->link_check_complete = B_FALSE;
599 ixgbe->link_check_hrtime = gethrtime() +
600 (IXGBE_LINK_UP_TIME * 100000000ULL);
601 ixgbe->attach_progress |= ATTACH_PROGRESS_INIT;
602
603 if (ixgbe_check_acc_handle(ixgbe->osdep.cfg_handle) != DDI_FM_OK) {
604 ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_LOST);
605 goto attach_fail;
606 }
607
608 /*
609 * Initialize adapter capabilities
610 */
611 ixgbe_init_params(ixgbe);
612
613 /*
614 * Initialize statistics
615 */
616 if (ixgbe_init_stats(ixgbe) != IXGBE_SUCCESS) {
617 ixgbe_error(ixgbe, "Failed to initialize statistics");
618 goto attach_fail;
619 }
620 ixgbe->attach_progress |= ATTACH_PROGRESS_STATS;
621
622 /*
623 * Register the driver to the MAC
624 */
625 if (ixgbe_register_mac(ixgbe) != IXGBE_SUCCESS) {
626 ixgbe_error(ixgbe, "Failed to register MAC");
627 goto attach_fail;
628 }
629 mac_link_update(ixgbe->mac_hdl, LINK_STATE_UNKNOWN);
630 ixgbe->attach_progress |= ATTACH_PROGRESS_MAC;
631
632 ixgbe->periodic_id = ddi_periodic_add(ixgbe_link_timer, ixgbe,
633 IXGBE_CYCLIC_PERIOD, DDI_IPL_0);
634 if (ixgbe->periodic_id == 0) {
635 ixgbe_error(ixgbe, "Failed to add the link check timer");
636 goto attach_fail;
637 }
638 ixgbe->attach_progress |= ATTACH_PROGRESS_LINK_TIMER;
639
640 /*
641 * Now that mutex locks are initialized, and the chip is also
642 * initialized, enable interrupts.
643 */
644 if (ixgbe_enable_intrs(ixgbe) != IXGBE_SUCCESS) {
645 ixgbe_error(ixgbe, "Failed to enable DDI interrupts");
646 goto attach_fail;
647 }
648 ixgbe->attach_progress |= ATTACH_PROGRESS_ENABLE_INTR;
649
650 ixgbe_log(ixgbe, "%s", ixgbe_ident);
651 atomic_or_32(&ixgbe->ixgbe_state, IXGBE_INITIALIZED);
652
653 return (DDI_SUCCESS);
654
655 attach_fail:
656 ixgbe_unconfigure(devinfo, ixgbe);
657 return (DDI_FAILURE);
658 }
659
660 /*
661 * ixgbe_detach - Driver detach.
662 *
663 * The detach() function is the complement of the attach routine.
664 * If cmd is set to DDI_DETACH, detach() is used to remove the
665 * state associated with a given instance of a device node
666 * prior to the removal of that instance from the system.
667 *
668 * The detach() function will be called once for each instance
669 * of the device for which there has been a successful attach()
670 * once there are no longer any opens on the device.
671 *
672 * Interrupts routine are disabled, All memory allocated by this
673 * driver are freed.
674 */
675 static int
ixgbe_detach(dev_info_t * devinfo,ddi_detach_cmd_t cmd)676 ixgbe_detach(dev_info_t *devinfo, ddi_detach_cmd_t cmd)
677 {
678 ixgbe_t *ixgbe;
679
680 /*
681 * Check detach command
682 */
683 switch (cmd) {
684 default:
685 return (DDI_FAILURE);
686
687 case DDI_SUSPEND:
688 return (ixgbe_suspend(devinfo));
689
690 case DDI_DETACH:
691 break;
692 }
693
694 /*
695 * Get the pointer to the driver private data structure
696 */
697 ixgbe = (ixgbe_t *)ddi_get_driver_private(devinfo);
698 if (ixgbe == NULL)
699 return (DDI_FAILURE);
700
701 /*
702 * If the device is still running, it needs to be stopped first.
703 * This check is necessary because under some specific circumstances,
704 * the detach routine can be called without stopping the interface
705 * first.
706 */
707 if (ixgbe->ixgbe_state & IXGBE_STARTED) {
708 atomic_and_32(&ixgbe->ixgbe_state, ~IXGBE_STARTED);
709 mutex_enter(&ixgbe->gen_lock);
710 ixgbe_stop(ixgbe, B_TRUE);
711 mutex_exit(&ixgbe->gen_lock);
712 /* Disable and stop the watchdog timer */
713 ixgbe_disable_watchdog_timer(ixgbe);
714 }
715
716 /*
717 * Check if there are still rx buffers held by the upper layer.
718 * If so, fail the detach.
719 */
720 if (!ixgbe_rx_drain(ixgbe))
721 return (DDI_FAILURE);
722
723 /*
724 * Do the remaining unconfigure routines
725 */
726 ixgbe_unconfigure(devinfo, ixgbe);
727
728 return (DDI_SUCCESS);
729 }
730
731 /*
732 * quiesce(9E) entry point.
733 *
734 * This function is called when the system is single-threaded at high
735 * PIL with preemption disabled. Therefore, this function must not be
736 * blocked.
737 *
738 * This function returns DDI_SUCCESS on success, or DDI_FAILURE on failure.
739 * DDI_FAILURE indicates an error condition and should almost never happen.
740 */
741 static int
ixgbe_quiesce(dev_info_t * devinfo)742 ixgbe_quiesce(dev_info_t *devinfo)
743 {
744 ixgbe_t *ixgbe;
745 struct ixgbe_hw *hw;
746
747 ixgbe = (ixgbe_t *)ddi_get_driver_private(devinfo);
748
749 if (ixgbe == NULL)
750 return (DDI_FAILURE);
751
752 hw = &ixgbe->hw;
753
754 /*
755 * Disable the adapter interrupts
756 */
757 ixgbe_disable_adapter_interrupts(ixgbe);
758
759 /*
760 * Tell firmware driver is no longer in control
761 */
762 ixgbe_release_driver_control(hw);
763
764 /*
765 * Reset the chipset
766 */
767 (void) ixgbe_reset_hw(hw);
768
769 /*
770 * Reset PHY
771 */
772 (void) ixgbe_reset_phy(hw);
773
774 return (DDI_SUCCESS);
775 }
776
777 static void
ixgbe_unconfigure(dev_info_t * devinfo,ixgbe_t * ixgbe)778 ixgbe_unconfigure(dev_info_t *devinfo, ixgbe_t *ixgbe)
779 {
780 /*
781 * Disable interrupt
782 */
783 if (ixgbe->attach_progress & ATTACH_PROGRESS_ENABLE_INTR) {
784 (void) ixgbe_disable_intrs(ixgbe);
785 }
786
787 /*
788 * remove the link check timer
789 */
790 if (ixgbe->attach_progress & ATTACH_PROGRESS_LINK_TIMER) {
791 if (ixgbe->periodic_id != NULL) {
792 ddi_periodic_delete(ixgbe->periodic_id);
793 ixgbe->periodic_id = NULL;
794 }
795 }
796
797 /*
798 * Unregister MAC
799 */
800 if (ixgbe->attach_progress & ATTACH_PROGRESS_MAC) {
801 (void) mac_unregister(ixgbe->mac_hdl);
802 }
803
804 /*
805 * Free statistics
806 */
807 if (ixgbe->attach_progress & ATTACH_PROGRESS_STATS) {
808 kstat_delete((kstat_t *)ixgbe->ixgbe_ks);
809 }
810
811 /*
812 * Remove interrupt handlers
813 */
814 if (ixgbe->attach_progress & ATTACH_PROGRESS_ADD_INTR) {
815 ixgbe_rem_intr_handlers(ixgbe);
816 }
817
818 /*
819 * Remove taskq for sfp-status-change
820 */
821 if (ixgbe->attach_progress & ATTACH_PROGRESS_SFP_TASKQ) {
822 ddi_taskq_destroy(ixgbe->sfp_taskq);
823 }
824
825 /*
826 * Remove taskq for over-temp
827 */
828 if (ixgbe->attach_progress & ATTACH_PROGRESS_OVERTEMP_TASKQ) {
829 ddi_taskq_destroy(ixgbe->overtemp_taskq);
830 }
831
832 /*
833 * Remove taskq for external PHYs
834 */
835 if (ixgbe->attach_progress & ATTACH_PROGRESS_PHY_TASKQ) {
836 ddi_taskq_destroy(ixgbe->phy_taskq);
837 }
838
839 /*
840 * Remove interrupts
841 */
842 if (ixgbe->attach_progress & ATTACH_PROGRESS_ALLOC_INTR) {
843 ixgbe_rem_intrs(ixgbe);
844 }
845
846 /*
847 * Unregister interrupt callback handler
848 */
849 if (ixgbe->cb_hdl != NULL) {
850 (void) ddi_cb_unregister(ixgbe->cb_hdl);
851 }
852
853 /*
854 * Remove driver properties
855 */
856 if (ixgbe->attach_progress & ATTACH_PROGRESS_PROPS) {
857 (void) ddi_prop_remove_all(devinfo);
858 }
859
860 /*
861 * Stop the chipset
862 */
863 if (ixgbe->attach_progress & ATTACH_PROGRESS_INIT) {
864 mutex_enter(&ixgbe->gen_lock);
865 ixgbe_chip_stop(ixgbe);
866 mutex_exit(&ixgbe->gen_lock);
867 }
868
869 /*
870 * Free register handle
871 */
872 if (ixgbe->attach_progress & ATTACH_PROGRESS_REGS_MAP) {
873 if (ixgbe->osdep.reg_handle != NULL)
874 ddi_regs_map_free(&ixgbe->osdep.reg_handle);
875 }
876
877 /*
878 * Free PCI config handle
879 */
880 if (ixgbe->attach_progress & ATTACH_PROGRESS_PCI_CONFIG) {
881 if (ixgbe->osdep.cfg_handle != NULL)
882 pci_config_teardown(&ixgbe->osdep.cfg_handle);
883 }
884
885 /*
886 * Free locks
887 */
888 if (ixgbe->attach_progress & ATTACH_PROGRESS_LOCKS) {
889 ixgbe_destroy_locks(ixgbe);
890 }
891
892 /*
893 * Free the rx/tx rings
894 */
895 if (ixgbe->attach_progress & ATTACH_PROGRESS_ALLOC_RINGS) {
896 ixgbe_free_rings(ixgbe);
897 }
898
899 /*
900 * Unregister FMA capabilities
901 */
902 if (ixgbe->attach_progress & ATTACH_PROGRESS_FM_INIT) {
903 ixgbe_fm_fini(ixgbe);
904 }
905
906 /*
907 * Free the driver data structure
908 */
909 kmem_free(ixgbe, sizeof (ixgbe_t));
910
911 ddi_set_driver_private(devinfo, NULL);
912 }
913
914 /*
915 * ixgbe_register_mac - Register the driver and its function pointers with
916 * the GLD interface.
917 */
918 static int
ixgbe_register_mac(ixgbe_t * ixgbe)919 ixgbe_register_mac(ixgbe_t *ixgbe)
920 {
921 struct ixgbe_hw *hw = &ixgbe->hw;
922 mac_register_t *mac;
923 int status;
924
925 if ((mac = mac_alloc(MAC_VERSION)) == NULL)
926 return (IXGBE_FAILURE);
927
928 mac->m_type_ident = MAC_PLUGIN_IDENT_ETHER;
929 mac->m_driver = ixgbe;
930 mac->m_dip = ixgbe->dip;
931 mac->m_src_addr = hw->mac.addr;
932 mac->m_callbacks = &ixgbe_m_callbacks;
933 mac->m_min_sdu = 0;
934 mac->m_max_sdu = ixgbe->default_mtu;
935 mac->m_margin = VLAN_TAGSZ;
936 mac->m_priv_props = ixgbe_priv_props;
937 mac->m_v12n = MAC_VIRT_LEVEL1;
938
939 status = mac_register(mac, &ixgbe->mac_hdl);
940
941 mac_free(mac);
942
943 return ((status == 0) ? IXGBE_SUCCESS : IXGBE_FAILURE);
944 }
945
946 /*
947 * ixgbe_identify_hardware - Identify the type of the chipset.
948 */
949 static int
ixgbe_identify_hardware(ixgbe_t * ixgbe)950 ixgbe_identify_hardware(ixgbe_t *ixgbe)
951 {
952 struct ixgbe_hw *hw = &ixgbe->hw;
953 struct ixgbe_osdep *osdep = &ixgbe->osdep;
954
955 /*
956 * Get the device id
957 */
958 hw->vendor_id =
959 pci_config_get16(osdep->cfg_handle, PCI_CONF_VENID);
960 hw->device_id =
961 pci_config_get16(osdep->cfg_handle, PCI_CONF_DEVID);
962 hw->revision_id =
963 pci_config_get8(osdep->cfg_handle, PCI_CONF_REVID);
964 hw->subsystem_device_id =
965 pci_config_get16(osdep->cfg_handle, PCI_CONF_SUBSYSID);
966 hw->subsystem_vendor_id =
967 pci_config_get16(osdep->cfg_handle, PCI_CONF_SUBVENID);
968
969 /*
970 * Set the mac type of the adapter based on the device id
971 */
972 if (ixgbe_set_mac_type(hw) != IXGBE_SUCCESS) {
973 return (IXGBE_FAILURE);
974 }
975
976 /*
977 * Install adapter capabilities
978 */
979 switch (hw->mac.type) {
980 case ixgbe_mac_82598EB:
981 IXGBE_DEBUGLOG_0(ixgbe, "identify 82598 adapter\n");
982 ixgbe->capab = &ixgbe_82598eb_cap;
983
984 if (ixgbe_get_media_type(hw) == ixgbe_media_type_copper) {
985 ixgbe->capab->flags |= IXGBE_FLAG_FAN_FAIL_CAPABLE;
986 ixgbe->capab->other_intr |= IXGBE_EICR_GPI_SDP1;
987 ixgbe->capab->other_gpie |= IXGBE_SDP1_GPIEN;
988 }
989 break;
990
991 case ixgbe_mac_82599EB:
992 IXGBE_DEBUGLOG_0(ixgbe, "identify 82599 adapter\n");
993 ixgbe->capab = &ixgbe_82599eb_cap;
994
995 if (hw->device_id == IXGBE_DEV_ID_82599_T3_LOM) {
996 ixgbe->capab->flags |= IXGBE_FLAG_TEMP_SENSOR_CAPABLE;
997 ixgbe->capab->other_intr |= IXGBE_EICR_GPI_SDP0;
998 ixgbe->capab->other_gpie |= IXGBE_SDP0_GPIEN;
999 }
1000 break;
1001
1002 case ixgbe_mac_X540:
1003 IXGBE_DEBUGLOG_0(ixgbe, "identify X540 adapter\n");
1004 ixgbe->capab = &ixgbe_X540_cap;
1005 /*
1006 * For now, X540 is all set in its capab structure.
1007 * As other X540 variants show up, things can change here.
1008 */
1009 break;
1010
1011 case ixgbe_mac_X550:
1012 case ixgbe_mac_X550EM_x:
1013 IXGBE_DEBUGLOG_0(ixgbe, "identify X550 adapter\n");
1014 ixgbe->capab = &ixgbe_X550_cap;
1015
1016 if (hw->device_id == IXGBE_DEV_ID_X550EM_X_SFP)
1017 ixgbe->capab->flags |= IXGBE_FLAG_SFP_PLUG_CAPABLE;
1018
1019 /*
1020 * Link detection on X552 SFP+ and X552/X557-AT
1021 */
1022 if (hw->device_id == IXGBE_DEV_ID_X550EM_X_SFP ||
1023 hw->device_id == IXGBE_DEV_ID_X550EM_X_10G_T) {
1024 ixgbe->capab->other_intr |=
1025 IXGBE_EIMS_GPI_SDP0_BY_MAC(hw);
1026 ixgbe->capab->other_gpie |= IXGBE_SDP0_GPIEN_X540;
1027 }
1028 break;
1029
1030 default:
1031 IXGBE_DEBUGLOG_1(ixgbe,
1032 "adapter not supported in ixgbe_identify_hardware(): %d\n",
1033 hw->mac.type);
1034 return (IXGBE_FAILURE);
1035 }
1036
1037 return (IXGBE_SUCCESS);
1038 }
1039
1040 /*
1041 * ixgbe_regs_map - Map the device registers.
1042 *
1043 */
1044 static int
ixgbe_regs_map(ixgbe_t * ixgbe)1045 ixgbe_regs_map(ixgbe_t *ixgbe)
1046 {
1047 dev_info_t *devinfo = ixgbe->dip;
1048 struct ixgbe_hw *hw = &ixgbe->hw;
1049 struct ixgbe_osdep *osdep = &ixgbe->osdep;
1050 off_t mem_size;
1051
1052 /*
1053 * First get the size of device registers to be mapped.
1054 */
1055 if (ddi_dev_regsize(devinfo, IXGBE_ADAPTER_REGSET, &mem_size)
1056 != DDI_SUCCESS) {
1057 return (IXGBE_FAILURE);
1058 }
1059
1060 /*
1061 * Call ddi_regs_map_setup() to map registers
1062 */
1063 if ((ddi_regs_map_setup(devinfo, IXGBE_ADAPTER_REGSET,
1064 (caddr_t *)&hw->hw_addr, 0,
1065 mem_size, &ixgbe_regs_acc_attr,
1066 &osdep->reg_handle)) != DDI_SUCCESS) {
1067 return (IXGBE_FAILURE);
1068 }
1069
1070 return (IXGBE_SUCCESS);
1071 }
1072
1073 /*
1074 * ixgbe_init_properties - Initialize driver properties.
1075 */
1076 static void
ixgbe_init_properties(ixgbe_t * ixgbe)1077 ixgbe_init_properties(ixgbe_t *ixgbe)
1078 {
1079 /*
1080 * Get conf file properties, including link settings
1081 * jumbo frames, ring number, descriptor number, etc.
1082 */
1083 ixgbe_get_conf(ixgbe);
1084 }
1085
1086 /*
1087 * ixgbe_init_driver_settings - Initialize driver settings.
1088 *
1089 * The settings include hardware function pointers, bus information,
1090 * rx/tx rings settings, link state, and any other parameters that
1091 * need to be setup during driver initialization.
1092 */
1093 static int
ixgbe_init_driver_settings(ixgbe_t * ixgbe)1094 ixgbe_init_driver_settings(ixgbe_t *ixgbe)
1095 {
1096 struct ixgbe_hw *hw = &ixgbe->hw;
1097 dev_info_t *devinfo = ixgbe->dip;
1098 ixgbe_rx_ring_t *rx_ring;
1099 ixgbe_rx_group_t *rx_group;
1100 ixgbe_tx_ring_t *tx_ring;
1101 uint32_t rx_size;
1102 uint32_t tx_size;
1103 uint32_t ring_per_group;
1104 int i;
1105
1106 /*
1107 * Initialize chipset specific hardware function pointers
1108 */
1109 if (ixgbe_init_shared_code(hw) != IXGBE_SUCCESS) {
1110 return (IXGBE_FAILURE);
1111 }
1112
1113 /*
1114 * Get the system page size
1115 */
1116 ixgbe->sys_page_size = ddi_ptob(devinfo, (ulong_t)1);
1117
1118 /*
1119 * Set rx buffer size
1120 *
1121 * The IP header alignment room is counted in the calculation.
1122 * The rx buffer size is in unit of 1K that is required by the
1123 * chipset hardware.
1124 */
1125 rx_size = ixgbe->max_frame_size + IPHDR_ALIGN_ROOM;
1126 ixgbe->rx_buf_size = ((rx_size >> 10) +
1127 ((rx_size & (((uint32_t)1 << 10) - 1)) > 0 ? 1 : 0)) << 10;
1128
1129 /*
1130 * Set tx buffer size
1131 */
1132 tx_size = ixgbe->max_frame_size;
1133 ixgbe->tx_buf_size = ((tx_size >> 10) +
1134 ((tx_size & (((uint32_t)1 << 10) - 1)) > 0 ? 1 : 0)) << 10;
1135
1136 /*
1137 * Initialize rx/tx rings/groups parameters
1138 */
1139 ring_per_group = ixgbe->num_rx_rings / ixgbe->num_rx_groups;
1140 for (i = 0; i < ixgbe->num_rx_rings; i++) {
1141 rx_ring = &ixgbe->rx_rings[i];
1142 rx_ring->index = i;
1143 rx_ring->ixgbe = ixgbe;
1144 rx_ring->group_index = i / ring_per_group;
1145 rx_ring->hw_index = ixgbe_get_hw_rx_index(ixgbe, i);
1146 }
1147
1148 for (i = 0; i < ixgbe->num_rx_groups; i++) {
1149 rx_group = &ixgbe->rx_groups[i];
1150 rx_group->index = i;
1151 rx_group->ixgbe = ixgbe;
1152 }
1153
1154 for (i = 0; i < ixgbe->num_tx_rings; i++) {
1155 tx_ring = &ixgbe->tx_rings[i];
1156 tx_ring->index = i;
1157 tx_ring->ixgbe = ixgbe;
1158 if (ixgbe->tx_head_wb_enable)
1159 tx_ring->tx_recycle = ixgbe_tx_recycle_head_wb;
1160 else
1161 tx_ring->tx_recycle = ixgbe_tx_recycle_legacy;
1162
1163 tx_ring->ring_size = ixgbe->tx_ring_size;
1164 tx_ring->free_list_size = ixgbe->tx_ring_size +
1165 (ixgbe->tx_ring_size >> 1);
1166 }
1167
1168 /*
1169 * Initialize values of interrupt throttling rate
1170 */
1171 for (i = 1; i < MAX_INTR_VECTOR; i++)
1172 ixgbe->intr_throttling[i] = ixgbe->intr_throttling[0];
1173
1174 /*
1175 * The initial link state should be "unknown"
1176 */
1177 ixgbe->link_state = LINK_STATE_UNKNOWN;
1178
1179 return (IXGBE_SUCCESS);
1180 }
1181
1182 /*
1183 * ixgbe_init_locks - Initialize locks.
1184 */
1185 static void
ixgbe_init_locks(ixgbe_t * ixgbe)1186 ixgbe_init_locks(ixgbe_t *ixgbe)
1187 {
1188 ixgbe_rx_ring_t *rx_ring;
1189 ixgbe_tx_ring_t *tx_ring;
1190 int i;
1191
1192 for (i = 0; i < ixgbe->num_rx_rings; i++) {
1193 rx_ring = &ixgbe->rx_rings[i];
1194 mutex_init(&rx_ring->rx_lock, NULL,
1195 MUTEX_DRIVER, DDI_INTR_PRI(ixgbe->intr_pri));
1196 }
1197
1198 for (i = 0; i < ixgbe->num_tx_rings; i++) {
1199 tx_ring = &ixgbe->tx_rings[i];
1200 mutex_init(&tx_ring->tx_lock, NULL,
1201 MUTEX_DRIVER, DDI_INTR_PRI(ixgbe->intr_pri));
1202 mutex_init(&tx_ring->recycle_lock, NULL,
1203 MUTEX_DRIVER, DDI_INTR_PRI(ixgbe->intr_pri));
1204 mutex_init(&tx_ring->tcb_head_lock, NULL,
1205 MUTEX_DRIVER, DDI_INTR_PRI(ixgbe->intr_pri));
1206 mutex_init(&tx_ring->tcb_tail_lock, NULL,
1207 MUTEX_DRIVER, DDI_INTR_PRI(ixgbe->intr_pri));
1208 }
1209
1210 mutex_init(&ixgbe->gen_lock, NULL,
1211 MUTEX_DRIVER, DDI_INTR_PRI(ixgbe->intr_pri));
1212
1213 mutex_init(&ixgbe->watchdog_lock, NULL,
1214 MUTEX_DRIVER, DDI_INTR_PRI(ixgbe->intr_pri));
1215 }
1216
1217 /*
1218 * ixgbe_destroy_locks - Destroy locks.
1219 */
1220 static void
ixgbe_destroy_locks(ixgbe_t * ixgbe)1221 ixgbe_destroy_locks(ixgbe_t *ixgbe)
1222 {
1223 ixgbe_rx_ring_t *rx_ring;
1224 ixgbe_tx_ring_t *tx_ring;
1225 int i;
1226
1227 for (i = 0; i < ixgbe->num_rx_rings; i++) {
1228 rx_ring = &ixgbe->rx_rings[i];
1229 mutex_destroy(&rx_ring->rx_lock);
1230 }
1231
1232 for (i = 0; i < ixgbe->num_tx_rings; i++) {
1233 tx_ring = &ixgbe->tx_rings[i];
1234 mutex_destroy(&tx_ring->tx_lock);
1235 mutex_destroy(&tx_ring->recycle_lock);
1236 mutex_destroy(&tx_ring->tcb_head_lock);
1237 mutex_destroy(&tx_ring->tcb_tail_lock);
1238 }
1239
1240 mutex_destroy(&ixgbe->gen_lock);
1241 mutex_destroy(&ixgbe->watchdog_lock);
1242 }
1243
1244 static int
ixgbe_resume(dev_info_t * devinfo)1245 ixgbe_resume(dev_info_t *devinfo)
1246 {
1247 ixgbe_t *ixgbe;
1248 int i;
1249
1250 ixgbe = (ixgbe_t *)ddi_get_driver_private(devinfo);
1251 if (ixgbe == NULL)
1252 return (DDI_FAILURE);
1253
1254 mutex_enter(&ixgbe->gen_lock);
1255
1256 if (ixgbe->ixgbe_state & IXGBE_STARTED) {
1257 if (ixgbe_start(ixgbe, B_FALSE) != IXGBE_SUCCESS) {
1258 mutex_exit(&ixgbe->gen_lock);
1259 return (DDI_FAILURE);
1260 }
1261
1262 /*
1263 * Enable and start the watchdog timer
1264 */
1265 ixgbe_enable_watchdog_timer(ixgbe);
1266 }
1267
1268 atomic_and_32(&ixgbe->ixgbe_state, ~IXGBE_SUSPENDED);
1269
1270 if (ixgbe->ixgbe_state & IXGBE_STARTED) {
1271 for (i = 0; i < ixgbe->num_tx_rings; i++) {
1272 mac_tx_ring_update(ixgbe->mac_hdl,
1273 ixgbe->tx_rings[i].ring_handle);
1274 }
1275 }
1276
1277 mutex_exit(&ixgbe->gen_lock);
1278
1279 return (DDI_SUCCESS);
1280 }
1281
1282 static int
ixgbe_suspend(dev_info_t * devinfo)1283 ixgbe_suspend(dev_info_t *devinfo)
1284 {
1285 ixgbe_t *ixgbe;
1286
1287 ixgbe = (ixgbe_t *)ddi_get_driver_private(devinfo);
1288 if (ixgbe == NULL)
1289 return (DDI_FAILURE);
1290
1291 mutex_enter(&ixgbe->gen_lock);
1292
1293 atomic_or_32(&ixgbe->ixgbe_state, IXGBE_SUSPENDED);
1294 if (!(ixgbe->ixgbe_state & IXGBE_STARTED)) {
1295 mutex_exit(&ixgbe->gen_lock);
1296 return (DDI_SUCCESS);
1297 }
1298 ixgbe_stop(ixgbe, B_FALSE);
1299
1300 mutex_exit(&ixgbe->gen_lock);
1301
1302 /*
1303 * Disable and stop the watchdog timer
1304 */
1305 ixgbe_disable_watchdog_timer(ixgbe);
1306
1307 return (DDI_SUCCESS);
1308 }
1309
1310 /*
1311 * ixgbe_init - Initialize the device.
1312 */
1313 static int
ixgbe_init(ixgbe_t * ixgbe)1314 ixgbe_init(ixgbe_t *ixgbe)
1315 {
1316 struct ixgbe_hw *hw = &ixgbe->hw;
1317 u8 pbanum[IXGBE_PBANUM_LENGTH];
1318 int rv;
1319
1320 mutex_enter(&ixgbe->gen_lock);
1321
1322 /*
1323 * Configure/Initialize hardware
1324 */
1325 rv = ixgbe_init_hw(hw);
1326 if (rv != IXGBE_SUCCESS) {
1327 switch (rv) {
1328
1329 /*
1330 * The first three errors are not prohibitive to us progressing
1331 * further, and are maily advisory in nature. In the case of a
1332 * SFP module not being present or not deemed supported by the
1333 * common code, we adivse the operator of this fact but carry on
1334 * instead of failing hard, as SFPs can be inserted or replaced
1335 * while the driver is running. In the case of a unknown error,
1336 * we fail-hard, logging the reason and emitting a FMA event.
1337 */
1338 case IXGBE_ERR_EEPROM_VERSION:
1339 ixgbe_error(ixgbe,
1340 "This Intel 10Gb Ethernet device is pre-release and"
1341 " contains outdated firmware. Please contact your"
1342 " hardware vendor for a replacement.");
1343 break;
1344 case IXGBE_ERR_SFP_NOT_PRESENT:
1345 ixgbe_error(ixgbe,
1346 "No SFP+ module detected on this interface. Please "
1347 "install a supported SFP+ module for this "
1348 "interface to become operational.");
1349 break;
1350 case IXGBE_ERR_SFP_NOT_SUPPORTED:
1351 ixgbe_error(ixgbe,
1352 "Unsupported SFP+ module detected. Please replace "
1353 "it with a supported SFP+ module per Intel "
1354 "documentation, or bypass this check with "
1355 "allow_unsupported_sfp=1 in ixgbe.conf.");
1356 break;
1357 default:
1358 ixgbe_error(ixgbe,
1359 "Failed to initialize hardware. ixgbe_init_hw "
1360 "returned %d", rv);
1361 ixgbe_fm_ereport(ixgbe, DDI_FM_DEVICE_INVAL_STATE);
1362 goto init_fail;
1363 }
1364 }
1365
1366 /*
1367 * Need to init eeprom before validating the checksum.
1368 */
1369 if (ixgbe_init_eeprom_params(hw) < 0) {
1370 ixgbe_error(ixgbe,
1371 "Unable to intitialize the eeprom interface.");
1372 ixgbe_fm_ereport(ixgbe, DDI_FM_DEVICE_INVAL_STATE);
1373 goto init_fail;
1374 }
1375
1376 /*
1377 * NVM validation
1378 */
1379 if (ixgbe_validate_eeprom_checksum(hw, NULL) < 0) {
1380 /*
1381 * Some PCI-E parts fail the first check due to
1382 * the link being in sleep state. Call it again,
1383 * if it fails a second time it's a real issue.
1384 */
1385 if (ixgbe_validate_eeprom_checksum(hw, NULL) < 0) {
1386 ixgbe_error(ixgbe,
1387 "Invalid NVM checksum. Please contact "
1388 "the vendor to update the NVM.");
1389 ixgbe_fm_ereport(ixgbe, DDI_FM_DEVICE_INVAL_STATE);
1390 goto init_fail;
1391 }
1392 }
1393
1394 /*
1395 * Setup default flow control thresholds - enable/disable
1396 * & flow control type is controlled by ixgbe.conf
1397 */
1398 hw->fc.high_water[0] = DEFAULT_FCRTH;
1399 hw->fc.low_water[0] = DEFAULT_FCRTL;
1400 hw->fc.pause_time = DEFAULT_FCPAUSE;
1401 hw->fc.send_xon = B_TRUE;
1402
1403 /*
1404 * Initialize flow control
1405 */
1406 (void) ixgbe_start_hw(hw);
1407
1408 /*
1409 * Initialize link settings
1410 */
1411 (void) ixgbe_driver_setup_link(ixgbe, B_FALSE);
1412
1413 /*
1414 * Initialize the chipset hardware
1415 */
1416 if (ixgbe_chip_start(ixgbe) != IXGBE_SUCCESS) {
1417 ixgbe_fm_ereport(ixgbe, DDI_FM_DEVICE_INVAL_STATE);
1418 goto init_fail;
1419 }
1420
1421 /*
1422 * Read identifying information and place in devinfo.
1423 */
1424 pbanum[0] = '\0';
1425 (void) ixgbe_read_pba_string(hw, pbanum, sizeof (pbanum));
1426 if (*pbanum != '\0') {
1427 (void) ddi_prop_update_string(DDI_DEV_T_NONE, ixgbe->dip,
1428 "printed-board-assembly", (char *)pbanum);
1429 }
1430
1431 if (ixgbe_check_acc_handle(ixgbe->osdep.reg_handle) != DDI_FM_OK) {
1432 goto init_fail;
1433 }
1434
1435 mutex_exit(&ixgbe->gen_lock);
1436 return (IXGBE_SUCCESS);
1437
1438 init_fail:
1439 /*
1440 * Reset PHY
1441 */
1442 (void) ixgbe_reset_phy(hw);
1443
1444 mutex_exit(&ixgbe->gen_lock);
1445 ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_LOST);
1446 return (IXGBE_FAILURE);
1447 }
1448
1449 /*
1450 * ixgbe_chip_start - Initialize and start the chipset hardware.
1451 */
1452 static int
ixgbe_chip_start(ixgbe_t * ixgbe)1453 ixgbe_chip_start(ixgbe_t *ixgbe)
1454 {
1455 struct ixgbe_hw *hw = &ixgbe->hw;
1456 int i;
1457
1458 ASSERT(mutex_owned(&ixgbe->gen_lock));
1459
1460 /*
1461 * Get the mac address
1462 * This function should handle SPARC case correctly.
1463 */
1464 if (!ixgbe_find_mac_address(ixgbe)) {
1465 ixgbe_error(ixgbe, "Failed to get the mac address");
1466 return (IXGBE_FAILURE);
1467 }
1468
1469 /*
1470 * Validate the mac address
1471 */
1472 (void) ixgbe_init_rx_addrs(hw);
1473 if (!is_valid_mac_addr(hw->mac.addr)) {
1474 ixgbe_error(ixgbe, "Invalid mac address");
1475 return (IXGBE_FAILURE);
1476 }
1477
1478 /*
1479 * Re-enable relaxed ordering for performance. It is disabled
1480 * by default in the hardware init.
1481 */
1482 if (ixgbe->relax_order_enable == B_TRUE)
1483 ixgbe_enable_relaxed_ordering(hw);
1484
1485 /*
1486 * Setup adapter interrupt vectors
1487 */
1488 ixgbe_setup_adapter_vector(ixgbe);
1489
1490 /*
1491 * Initialize unicast addresses.
1492 */
1493 ixgbe_init_unicst(ixgbe);
1494
1495 /*
1496 * Setup and initialize the mctable structures.
1497 */
1498 ixgbe_setup_multicst(ixgbe);
1499
1500 /*
1501 * Set interrupt throttling rate
1502 */
1503 for (i = 0; i < ixgbe->intr_cnt; i++) {
1504 IXGBE_WRITE_REG(hw, IXGBE_EITR(i), ixgbe->intr_throttling[i]);
1505 }
1506
1507 /*
1508 * Disable Wake-on-LAN
1509 */
1510 IXGBE_WRITE_REG(hw, IXGBE_WUC, 0);
1511
1512 /*
1513 * Some adapters offer Energy Efficient Ethernet (EEE) support.
1514 * Due to issues with EEE in e1000g/igb, we disable this by default
1515 * as a precautionary measure.
1516 *
1517 * Currently, the only known adapter which supports EEE in the ixgbe
1518 * line is 8086,15AB (IXGBE_DEV_ID_X550EM_X_KR), and only after the
1519 * first revision of it, as well as any X550 with MAC type 6 (non-EM)
1520 */
1521 (void) ixgbe_setup_eee(hw, B_FALSE);
1522
1523 /*
1524 * Turn on any present SFP Tx laser
1525 */
1526 ixgbe_enable_tx_laser(hw);
1527
1528 /*
1529 * Power on the PHY
1530 */
1531 (void) ixgbe_set_phy_power(hw, B_TRUE);
1532
1533 /*
1534 * Save the state of the PHY
1535 */
1536 ixgbe_get_hw_state(ixgbe);
1537
1538 /*
1539 * Make sure driver has control
1540 */
1541 ixgbe_get_driver_control(hw);
1542
1543 return (IXGBE_SUCCESS);
1544 }
1545
1546 /*
1547 * ixgbe_chip_stop - Stop the chipset hardware
1548 */
1549 static void
ixgbe_chip_stop(ixgbe_t * ixgbe)1550 ixgbe_chip_stop(ixgbe_t *ixgbe)
1551 {
1552 struct ixgbe_hw *hw = &ixgbe->hw;
1553 int rv;
1554
1555 ASSERT(mutex_owned(&ixgbe->gen_lock));
1556
1557 /*
1558 * Stop interupt generation and disable Tx unit
1559 */
1560 hw->adapter_stopped = B_FALSE;
1561 (void) ixgbe_stop_adapter(hw);
1562
1563 /*
1564 * Reset the chipset
1565 */
1566 (void) ixgbe_reset_hw(hw);
1567
1568 /*
1569 * Reset PHY
1570 */
1571 (void) ixgbe_reset_phy(hw);
1572
1573 /*
1574 * Enter LPLU (Low Power, Link Up) mode, if available. Avoid resetting
1575 * the PHY while doing so. Else, just power down the PHY.
1576 */
1577 if (hw->phy.ops.enter_lplu != NULL) {
1578 hw->phy.reset_disable = B_TRUE;
1579 rv = hw->phy.ops.enter_lplu(hw);
1580 if (rv != IXGBE_SUCCESS)
1581 ixgbe_error(ixgbe, "Error while entering LPLU: %d", rv);
1582 hw->phy.reset_disable = B_FALSE;
1583 } else {
1584 (void) ixgbe_set_phy_power(hw, B_FALSE);
1585 }
1586
1587 /*
1588 * Turn off any present SFP Tx laser
1589 * Expected for health and safety reasons
1590 */
1591 ixgbe_disable_tx_laser(hw);
1592
1593 /*
1594 * Tell firmware driver is no longer in control
1595 */
1596 ixgbe_release_driver_control(hw);
1597
1598 }
1599
1600 /*
1601 * ixgbe_reset - Reset the chipset and re-start the driver.
1602 *
1603 * It involves stopping and re-starting the chipset,
1604 * and re-configuring the rx/tx rings.
1605 */
1606 static int
ixgbe_reset(ixgbe_t * ixgbe)1607 ixgbe_reset(ixgbe_t *ixgbe)
1608 {
1609 int i;
1610
1611 /*
1612 * Disable and stop the watchdog timer
1613 */
1614 ixgbe_disable_watchdog_timer(ixgbe);
1615
1616 mutex_enter(&ixgbe->gen_lock);
1617
1618 ASSERT(ixgbe->ixgbe_state & IXGBE_STARTED);
1619 atomic_and_32(&ixgbe->ixgbe_state, ~IXGBE_STARTED);
1620
1621 ixgbe_stop(ixgbe, B_FALSE);
1622
1623 if (ixgbe_start(ixgbe, B_FALSE) != IXGBE_SUCCESS) {
1624 mutex_exit(&ixgbe->gen_lock);
1625 return (IXGBE_FAILURE);
1626 }
1627
1628 /*
1629 * After resetting, need to recheck the link status.
1630 */
1631 ixgbe->link_check_complete = B_FALSE;
1632 ixgbe->link_check_hrtime = gethrtime() +
1633 (IXGBE_LINK_UP_TIME * 100000000ULL);
1634
1635 atomic_or_32(&ixgbe->ixgbe_state, IXGBE_STARTED);
1636
1637 if (!(ixgbe->ixgbe_state & IXGBE_SUSPENDED)) {
1638 for (i = 0; i < ixgbe->num_tx_rings; i++) {
1639 mac_tx_ring_update(ixgbe->mac_hdl,
1640 ixgbe->tx_rings[i].ring_handle);
1641 }
1642 }
1643
1644 mutex_exit(&ixgbe->gen_lock);
1645
1646 /*
1647 * Enable and start the watchdog timer
1648 */
1649 ixgbe_enable_watchdog_timer(ixgbe);
1650
1651 return (IXGBE_SUCCESS);
1652 }
1653
1654 /*
1655 * ixgbe_tx_clean - Clean the pending transmit packets and DMA resources.
1656 */
1657 static void
ixgbe_tx_clean(ixgbe_t * ixgbe)1658 ixgbe_tx_clean(ixgbe_t *ixgbe)
1659 {
1660 ixgbe_tx_ring_t *tx_ring;
1661 tx_control_block_t *tcb;
1662 link_list_t pending_list;
1663 uint32_t desc_num;
1664 int i, j;
1665
1666 LINK_LIST_INIT(&pending_list);
1667
1668 for (i = 0; i < ixgbe->num_tx_rings; i++) {
1669 tx_ring = &ixgbe->tx_rings[i];
1670
1671 mutex_enter(&tx_ring->recycle_lock);
1672
1673 /*
1674 * Clean the pending tx data - the pending packets in the
1675 * work_list that have no chances to be transmitted again.
1676 *
1677 * We must ensure the chipset is stopped or the link is down
1678 * before cleaning the transmit packets.
1679 */
1680 desc_num = 0;
1681 for (j = 0; j < tx_ring->ring_size; j++) {
1682 tcb = tx_ring->work_list[j];
1683 if (tcb != NULL) {
1684 desc_num += tcb->desc_num;
1685
1686 tx_ring->work_list[j] = NULL;
1687
1688 ixgbe_free_tcb(tcb);
1689
1690 LIST_PUSH_TAIL(&pending_list, &tcb->link);
1691 }
1692 }
1693
1694 if (desc_num > 0) {
1695 atomic_add_32(&tx_ring->tbd_free, desc_num);
1696 ASSERT(tx_ring->tbd_free == tx_ring->ring_size);
1697
1698 /*
1699 * Reset the head and tail pointers of the tbd ring;
1700 * Reset the writeback head if it's enable.
1701 */
1702 tx_ring->tbd_head = 0;
1703 tx_ring->tbd_tail = 0;
1704 if (ixgbe->tx_head_wb_enable)
1705 *tx_ring->tbd_head_wb = 0;
1706
1707 IXGBE_WRITE_REG(&ixgbe->hw,
1708 IXGBE_TDH(tx_ring->index), 0);
1709 IXGBE_WRITE_REG(&ixgbe->hw,
1710 IXGBE_TDT(tx_ring->index), 0);
1711 }
1712
1713 mutex_exit(&tx_ring->recycle_lock);
1714
1715 /*
1716 * Add the tx control blocks in the pending list to
1717 * the free list.
1718 */
1719 ixgbe_put_free_list(tx_ring, &pending_list);
1720 }
1721 }
1722
1723 /*
1724 * ixgbe_tx_drain - Drain the tx rings to allow pending packets to be
1725 * transmitted.
1726 */
1727 static boolean_t
ixgbe_tx_drain(ixgbe_t * ixgbe)1728 ixgbe_tx_drain(ixgbe_t *ixgbe)
1729 {
1730 ixgbe_tx_ring_t *tx_ring;
1731 boolean_t done;
1732 int i, j;
1733
1734 /*
1735 * Wait for a specific time to allow pending tx packets
1736 * to be transmitted.
1737 *
1738 * Check the counter tbd_free to see if transmission is done.
1739 * No lock protection is needed here.
1740 *
1741 * Return B_TRUE if all pending packets have been transmitted;
1742 * Otherwise return B_FALSE;
1743 */
1744 for (i = 0; i < TX_DRAIN_TIME; i++) {
1745
1746 done = B_TRUE;
1747 for (j = 0; j < ixgbe->num_tx_rings; j++) {
1748 tx_ring = &ixgbe->tx_rings[j];
1749 done = done &&
1750 (tx_ring->tbd_free == tx_ring->ring_size);
1751 }
1752
1753 if (done)
1754 break;
1755
1756 msec_delay(1);
1757 }
1758
1759 return (done);
1760 }
1761
1762 /*
1763 * ixgbe_rx_drain - Wait for all rx buffers to be released by upper layer.
1764 */
1765 static boolean_t
ixgbe_rx_drain(ixgbe_t * ixgbe)1766 ixgbe_rx_drain(ixgbe_t *ixgbe)
1767 {
1768 boolean_t done = B_TRUE;
1769 int i;
1770
1771 /*
1772 * Polling the rx free list to check if those rx buffers held by
1773 * the upper layer are released.
1774 *
1775 * Check the counter rcb_free to see if all pending buffers are
1776 * released. No lock protection is needed here.
1777 *
1778 * Return B_TRUE if all pending buffers have been released;
1779 * Otherwise return B_FALSE;
1780 */
1781 for (i = 0; i < RX_DRAIN_TIME; i++) {
1782 done = (ixgbe->rcb_pending == 0);
1783
1784 if (done)
1785 break;
1786
1787 msec_delay(1);
1788 }
1789
1790 return (done);
1791 }
1792
1793 /*
1794 * ixgbe_start - Start the driver/chipset.
1795 */
1796 int
ixgbe_start(ixgbe_t * ixgbe,boolean_t alloc_buffer)1797 ixgbe_start(ixgbe_t *ixgbe, boolean_t alloc_buffer)
1798 {
1799 struct ixgbe_hw *hw = &ixgbe->hw;
1800 int i;
1801
1802 ASSERT(mutex_owned(&ixgbe->gen_lock));
1803
1804 if (alloc_buffer) {
1805 if (ixgbe_alloc_rx_data(ixgbe) != IXGBE_SUCCESS) {
1806 ixgbe_error(ixgbe,
1807 "Failed to allocate software receive rings");
1808 return (IXGBE_FAILURE);
1809 }
1810
1811 /* Allocate buffers for all the rx/tx rings */
1812 if (ixgbe_alloc_dma(ixgbe) != IXGBE_SUCCESS) {
1813 ixgbe_error(ixgbe, "Failed to allocate DMA resource");
1814 return (IXGBE_FAILURE);
1815 }
1816
1817 ixgbe->tx_ring_init = B_TRUE;
1818 } else {
1819 ixgbe->tx_ring_init = B_FALSE;
1820 }
1821
1822 for (i = 0; i < ixgbe->num_rx_rings; i++)
1823 mutex_enter(&ixgbe->rx_rings[i].rx_lock);
1824 for (i = 0; i < ixgbe->num_tx_rings; i++)
1825 mutex_enter(&ixgbe->tx_rings[i].tx_lock);
1826
1827 /*
1828 * Start the chipset hardware
1829 */
1830 if (ixgbe_chip_start(ixgbe) != IXGBE_SUCCESS) {
1831 ixgbe_fm_ereport(ixgbe, DDI_FM_DEVICE_INVAL_STATE);
1832 goto start_failure;
1833 }
1834
1835 /*
1836 * Configure link now for X550
1837 *
1838 * X550 possesses a LPLU (Low-Power Link Up) mode which keeps the
1839 * resting state of the adapter at a 1Gb FDX speed. Prior to the X550,
1840 * the resting state of the link would be the maximum speed that
1841 * autonegotiation will allow (usually 10Gb, infrastructure allowing)
1842 * so we never bothered with explicitly setting the link to 10Gb as it
1843 * would already be at that state on driver attach. With X550, we must
1844 * trigger a re-negotiation of the link in order to switch from a LPLU
1845 * 1Gb link to 10Gb (cable and link partner permitting.)
1846 */
1847 if (hw->mac.type == ixgbe_mac_X550 ||
1848 hw->mac.type == ixgbe_mac_X550EM_x) {
1849 (void) ixgbe_driver_setup_link(ixgbe, B_TRUE);
1850 ixgbe_get_hw_state(ixgbe);
1851 }
1852
1853 if (ixgbe_check_acc_handle(ixgbe->osdep.reg_handle) != DDI_FM_OK) {
1854 goto start_failure;
1855 }
1856
1857 /*
1858 * Setup the rx/tx rings
1859 */
1860 ixgbe_setup_rings(ixgbe);
1861
1862 /*
1863 * ixgbe_start() will be called when resetting, however if reset
1864 * happens, we need to clear the ERROR, STALL and OVERTEMP flags
1865 * before enabling the interrupts.
1866 */
1867 atomic_and_32(&ixgbe->ixgbe_state, ~(IXGBE_ERROR
1868 | IXGBE_STALL| IXGBE_OVERTEMP));
1869
1870 /*
1871 * Enable adapter interrupts
1872 * The interrupts must be enabled after the driver state is START
1873 */
1874 ixgbe_enable_adapter_interrupts(ixgbe);
1875
1876 for (i = ixgbe->num_tx_rings - 1; i >= 0; i--)
1877 mutex_exit(&ixgbe->tx_rings[i].tx_lock);
1878 for (i = ixgbe->num_rx_rings - 1; i >= 0; i--)
1879 mutex_exit(&ixgbe->rx_rings[i].rx_lock);
1880
1881 return (IXGBE_SUCCESS);
1882
1883 start_failure:
1884 for (i = ixgbe->num_tx_rings - 1; i >= 0; i--)
1885 mutex_exit(&ixgbe->tx_rings[i].tx_lock);
1886 for (i = ixgbe->num_rx_rings - 1; i >= 0; i--)
1887 mutex_exit(&ixgbe->rx_rings[i].rx_lock);
1888
1889 ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_LOST);
1890
1891 return (IXGBE_FAILURE);
1892 }
1893
1894 /*
1895 * ixgbe_stop - Stop the driver/chipset.
1896 */
1897 void
ixgbe_stop(ixgbe_t * ixgbe,boolean_t free_buffer)1898 ixgbe_stop(ixgbe_t *ixgbe, boolean_t free_buffer)
1899 {
1900 int i;
1901
1902 ASSERT(mutex_owned(&ixgbe->gen_lock));
1903
1904 /*
1905 * Disable the adapter interrupts
1906 */
1907 ixgbe_disable_adapter_interrupts(ixgbe);
1908
1909 /*
1910 * Drain the pending tx packets
1911 */
1912 (void) ixgbe_tx_drain(ixgbe);
1913
1914 for (i = 0; i < ixgbe->num_rx_rings; i++)
1915 mutex_enter(&ixgbe->rx_rings[i].rx_lock);
1916 for (i = 0; i < ixgbe->num_tx_rings; i++)
1917 mutex_enter(&ixgbe->tx_rings[i].tx_lock);
1918
1919 /*
1920 * Stop the chipset hardware
1921 */
1922 ixgbe_chip_stop(ixgbe);
1923
1924 if (ixgbe_check_acc_handle(ixgbe->osdep.reg_handle) != DDI_FM_OK) {
1925 ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_LOST);
1926 }
1927
1928 /*
1929 * Clean the pending tx data/resources
1930 */
1931 ixgbe_tx_clean(ixgbe);
1932
1933 for (i = ixgbe->num_tx_rings - 1; i >= 0; i--)
1934 mutex_exit(&ixgbe->tx_rings[i].tx_lock);
1935 for (i = ixgbe->num_rx_rings - 1; i >= 0; i--)
1936 mutex_exit(&ixgbe->rx_rings[i].rx_lock);
1937
1938 if (ixgbe->link_state == LINK_STATE_UP) {
1939 ixgbe->link_state = LINK_STATE_UNKNOWN;
1940 mac_link_update(ixgbe->mac_hdl, ixgbe->link_state);
1941 }
1942
1943 if (free_buffer) {
1944 /*
1945 * Release the DMA/memory resources of rx/tx rings
1946 */
1947 ixgbe_free_dma(ixgbe);
1948 ixgbe_free_rx_data(ixgbe);
1949 }
1950 }
1951
1952 /*
1953 * ixgbe_cbfunc - Driver interface for generic DDI callbacks
1954 */
1955 /* ARGSUSED */
1956 static int
ixgbe_cbfunc(dev_info_t * dip,ddi_cb_action_t cbaction,void * cbarg,void * arg1,void * arg2)1957 ixgbe_cbfunc(dev_info_t *dip, ddi_cb_action_t cbaction, void *cbarg,
1958 void *arg1, void *arg2)
1959 {
1960 ixgbe_t *ixgbe = (ixgbe_t *)arg1;
1961
1962 switch (cbaction) {
1963 /* IRM callback */
1964 int count;
1965 case DDI_CB_INTR_ADD:
1966 case DDI_CB_INTR_REMOVE:
1967 count = (int)(uintptr_t)cbarg;
1968 ASSERT(ixgbe->intr_type == DDI_INTR_TYPE_MSIX);
1969 DTRACE_PROBE2(ixgbe__irm__callback, int, count,
1970 int, ixgbe->intr_cnt);
1971 if (ixgbe_intr_adjust(ixgbe, cbaction, count) !=
1972 DDI_SUCCESS) {
1973 ixgbe_error(ixgbe,
1974 "IRM CB: Failed to adjust interrupts");
1975 goto cb_fail;
1976 }
1977 break;
1978 default:
1979 IXGBE_DEBUGLOG_1(ixgbe, "DDI CB: action 0x%x NOT supported",
1980 cbaction);
1981 return (DDI_ENOTSUP);
1982 }
1983 return (DDI_SUCCESS);
1984 cb_fail:
1985 return (DDI_FAILURE);
1986 }
1987
1988 /*
1989 * ixgbe_intr_adjust - Adjust interrupt to respond to IRM request.
1990 */
1991 static int
ixgbe_intr_adjust(ixgbe_t * ixgbe,ddi_cb_action_t cbaction,int count)1992 ixgbe_intr_adjust(ixgbe_t *ixgbe, ddi_cb_action_t cbaction, int count)
1993 {
1994 int i, rc, actual;
1995
1996 if (count == 0)
1997 return (DDI_SUCCESS);
1998
1999 if ((cbaction == DDI_CB_INTR_ADD &&
2000 ixgbe->intr_cnt + count > ixgbe->intr_cnt_max) ||
2001 (cbaction == DDI_CB_INTR_REMOVE &&
2002 ixgbe->intr_cnt - count < ixgbe->intr_cnt_min))
2003 return (DDI_FAILURE);
2004
2005 if (!(ixgbe->ixgbe_state & IXGBE_STARTED)) {
2006 return (DDI_FAILURE);
2007 }
2008
2009 for (i = 0; i < ixgbe->num_rx_rings; i++)
2010 mac_ring_intr_set(ixgbe->rx_rings[i].ring_handle, NULL);
2011 for (i = 0; i < ixgbe->num_tx_rings; i++)
2012 mac_ring_intr_set(ixgbe->tx_rings[i].ring_handle, NULL);
2013
2014 mutex_enter(&ixgbe->gen_lock);
2015 ixgbe->ixgbe_state &= ~IXGBE_STARTED;
2016 ixgbe->ixgbe_state |= IXGBE_INTR_ADJUST;
2017 ixgbe->ixgbe_state |= IXGBE_SUSPENDED;
2018 mac_link_update(ixgbe->mac_hdl, LINK_STATE_UNKNOWN);
2019
2020 ixgbe_stop(ixgbe, B_FALSE);
2021 /*
2022 * Disable interrupts
2023 */
2024 if (ixgbe->attach_progress & ATTACH_PROGRESS_ENABLE_INTR) {
2025 rc = ixgbe_disable_intrs(ixgbe);
2026 ASSERT(rc == IXGBE_SUCCESS);
2027 }
2028 ixgbe->attach_progress &= ~ATTACH_PROGRESS_ENABLE_INTR;
2029
2030 /*
2031 * Remove interrupt handlers
2032 */
2033 if (ixgbe->attach_progress & ATTACH_PROGRESS_ADD_INTR) {
2034 ixgbe_rem_intr_handlers(ixgbe);
2035 }
2036 ixgbe->attach_progress &= ~ATTACH_PROGRESS_ADD_INTR;
2037
2038 /*
2039 * Clear vect_map
2040 */
2041 bzero(&ixgbe->vect_map, sizeof (ixgbe->vect_map));
2042 switch (cbaction) {
2043 case DDI_CB_INTR_ADD:
2044 rc = ddi_intr_alloc(ixgbe->dip, ixgbe->htable,
2045 DDI_INTR_TYPE_MSIX, ixgbe->intr_cnt, count, &actual,
2046 DDI_INTR_ALLOC_NORMAL);
2047 if (rc != DDI_SUCCESS || actual != count) {
2048 ixgbe_log(ixgbe, "Adjust interrupts failed."
2049 "return: %d, irm cb size: %d, actual: %d",
2050 rc, count, actual);
2051 goto intr_adjust_fail;
2052 }
2053 ixgbe->intr_cnt += count;
2054 break;
2055
2056 case DDI_CB_INTR_REMOVE:
2057 for (i = ixgbe->intr_cnt - count;
2058 i < ixgbe->intr_cnt; i ++) {
2059 rc = ddi_intr_free(ixgbe->htable[i]);
2060 ixgbe->htable[i] = NULL;
2061 if (rc != DDI_SUCCESS) {
2062 ixgbe_log(ixgbe, "Adjust interrupts failed."
2063 "return: %d, irm cb size: %d, actual: %d",
2064 rc, count, actual);
2065 goto intr_adjust_fail;
2066 }
2067 }
2068 ixgbe->intr_cnt -= count;
2069 break;
2070 }
2071
2072 /*
2073 * Get priority for first vector, assume remaining are all the same
2074 */
2075 rc = ddi_intr_get_pri(ixgbe->htable[0], &ixgbe->intr_pri);
2076 if (rc != DDI_SUCCESS) {
2077 ixgbe_log(ixgbe,
2078 "Get interrupt priority failed: %d", rc);
2079 goto intr_adjust_fail;
2080 }
2081 rc = ddi_intr_get_cap(ixgbe->htable[0], &ixgbe->intr_cap);
2082 if (rc != DDI_SUCCESS) {
2083 ixgbe_log(ixgbe, "Get interrupt cap failed: %d", rc);
2084 goto intr_adjust_fail;
2085 }
2086 ixgbe->attach_progress |= ATTACH_PROGRESS_ALLOC_INTR;
2087
2088 /*
2089 * Map rings to interrupt vectors
2090 */
2091 if (ixgbe_map_intrs_to_vectors(ixgbe) != IXGBE_SUCCESS) {
2092 ixgbe_error(ixgbe,
2093 "IRM CB: Failed to map interrupts to vectors");
2094 goto intr_adjust_fail;
2095 }
2096
2097 /*
2098 * Add interrupt handlers
2099 */
2100 if (ixgbe_add_intr_handlers(ixgbe) != IXGBE_SUCCESS) {
2101 ixgbe_error(ixgbe, "IRM CB: Failed to add interrupt handlers");
2102 goto intr_adjust_fail;
2103 }
2104 ixgbe->attach_progress |= ATTACH_PROGRESS_ADD_INTR;
2105
2106 /*
2107 * Now that mutex locks are initialized, and the chip is also
2108 * initialized, enable interrupts.
2109 */
2110 if (ixgbe_enable_intrs(ixgbe) != IXGBE_SUCCESS) {
2111 ixgbe_error(ixgbe, "IRM CB: Failed to enable DDI interrupts");
2112 goto intr_adjust_fail;
2113 }
2114 ixgbe->attach_progress |= ATTACH_PROGRESS_ENABLE_INTR;
2115 if (ixgbe_start(ixgbe, B_FALSE) != IXGBE_SUCCESS) {
2116 ixgbe_error(ixgbe, "IRM CB: Failed to start");
2117 goto intr_adjust_fail;
2118 }
2119 ixgbe->ixgbe_state &= ~IXGBE_INTR_ADJUST;
2120 ixgbe->ixgbe_state &= ~IXGBE_SUSPENDED;
2121 ixgbe->ixgbe_state |= IXGBE_STARTED;
2122 mutex_exit(&ixgbe->gen_lock);
2123
2124 for (i = 0; i < ixgbe->num_rx_rings; i++) {
2125 mac_ring_intr_set(ixgbe->rx_rings[i].ring_handle,
2126 ixgbe->htable[ixgbe->rx_rings[i].intr_vector]);
2127 }
2128 for (i = 0; i < ixgbe->num_tx_rings; i++) {
2129 mac_ring_intr_set(ixgbe->tx_rings[i].ring_handle,
2130 ixgbe->htable[ixgbe->tx_rings[i].intr_vector]);
2131 }
2132
2133 /* Wakeup all Tx rings */
2134 for (i = 0; i < ixgbe->num_tx_rings; i++) {
2135 mac_tx_ring_update(ixgbe->mac_hdl,
2136 ixgbe->tx_rings[i].ring_handle);
2137 }
2138
2139 IXGBE_DEBUGLOG_3(ixgbe,
2140 "IRM CB: interrupts new value: 0x%x(0x%x:0x%x).",
2141 ixgbe->intr_cnt, ixgbe->intr_cnt_min, ixgbe->intr_cnt_max);
2142 return (DDI_SUCCESS);
2143
2144 intr_adjust_fail:
2145 ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_LOST);
2146 mutex_exit(&ixgbe->gen_lock);
2147 return (DDI_FAILURE);
2148 }
2149
2150 /*
2151 * ixgbe_intr_cb_register - Register interrupt callback function.
2152 */
2153 static int
ixgbe_intr_cb_register(ixgbe_t * ixgbe)2154 ixgbe_intr_cb_register(ixgbe_t *ixgbe)
2155 {
2156 if (ddi_cb_register(ixgbe->dip, DDI_CB_FLAG_INTR, ixgbe_cbfunc,
2157 ixgbe, NULL, &ixgbe->cb_hdl) != DDI_SUCCESS) {
2158 return (IXGBE_FAILURE);
2159 }
2160 IXGBE_DEBUGLOG_0(ixgbe, "Interrupt callback function registered.");
2161 return (IXGBE_SUCCESS);
2162 }
2163
2164 /*
2165 * ixgbe_alloc_rings - Allocate memory space for rx/tx rings.
2166 */
2167 static int
ixgbe_alloc_rings(ixgbe_t * ixgbe)2168 ixgbe_alloc_rings(ixgbe_t *ixgbe)
2169 {
2170 /*
2171 * Allocate memory space for rx rings
2172 */
2173 ixgbe->rx_rings = kmem_zalloc(
2174 sizeof (ixgbe_rx_ring_t) * ixgbe->num_rx_rings,
2175 KM_NOSLEEP);
2176
2177 if (ixgbe->rx_rings == NULL) {
2178 return (IXGBE_FAILURE);
2179 }
2180
2181 /*
2182 * Allocate memory space for tx rings
2183 */
2184 ixgbe->tx_rings = kmem_zalloc(
2185 sizeof (ixgbe_tx_ring_t) * ixgbe->num_tx_rings,
2186 KM_NOSLEEP);
2187
2188 if (ixgbe->tx_rings == NULL) {
2189 kmem_free(ixgbe->rx_rings,
2190 sizeof (ixgbe_rx_ring_t) * ixgbe->num_rx_rings);
2191 ixgbe->rx_rings = NULL;
2192 return (IXGBE_FAILURE);
2193 }
2194
2195 /*
2196 * Allocate memory space for rx ring groups
2197 */
2198 ixgbe->rx_groups = kmem_zalloc(
2199 sizeof (ixgbe_rx_group_t) * ixgbe->num_rx_groups,
2200 KM_NOSLEEP);
2201
2202 if (ixgbe->rx_groups == NULL) {
2203 kmem_free(ixgbe->rx_rings,
2204 sizeof (ixgbe_rx_ring_t) * ixgbe->num_rx_rings);
2205 kmem_free(ixgbe->tx_rings,
2206 sizeof (ixgbe_tx_ring_t) * ixgbe->num_tx_rings);
2207 ixgbe->rx_rings = NULL;
2208 ixgbe->tx_rings = NULL;
2209 return (IXGBE_FAILURE);
2210 }
2211
2212 return (IXGBE_SUCCESS);
2213 }
2214
2215 /*
2216 * ixgbe_free_rings - Free the memory space of rx/tx rings.
2217 */
2218 static void
ixgbe_free_rings(ixgbe_t * ixgbe)2219 ixgbe_free_rings(ixgbe_t *ixgbe)
2220 {
2221 if (ixgbe->rx_rings != NULL) {
2222 kmem_free(ixgbe->rx_rings,
2223 sizeof (ixgbe_rx_ring_t) * ixgbe->num_rx_rings);
2224 ixgbe->rx_rings = NULL;
2225 }
2226
2227 if (ixgbe->tx_rings != NULL) {
2228 kmem_free(ixgbe->tx_rings,
2229 sizeof (ixgbe_tx_ring_t) * ixgbe->num_tx_rings);
2230 ixgbe->tx_rings = NULL;
2231 }
2232
2233 if (ixgbe->rx_groups != NULL) {
2234 kmem_free(ixgbe->rx_groups,
2235 sizeof (ixgbe_rx_group_t) * ixgbe->num_rx_groups);
2236 ixgbe->rx_groups = NULL;
2237 }
2238 }
2239
2240 static int
ixgbe_alloc_rx_data(ixgbe_t * ixgbe)2241 ixgbe_alloc_rx_data(ixgbe_t *ixgbe)
2242 {
2243 ixgbe_rx_ring_t *rx_ring;
2244 int i;
2245
2246 for (i = 0; i < ixgbe->num_rx_rings; i++) {
2247 rx_ring = &ixgbe->rx_rings[i];
2248 if (ixgbe_alloc_rx_ring_data(rx_ring) != IXGBE_SUCCESS)
2249 goto alloc_rx_rings_failure;
2250 }
2251 return (IXGBE_SUCCESS);
2252
2253 alloc_rx_rings_failure:
2254 ixgbe_free_rx_data(ixgbe);
2255 return (IXGBE_FAILURE);
2256 }
2257
2258 static void
ixgbe_free_rx_data(ixgbe_t * ixgbe)2259 ixgbe_free_rx_data(ixgbe_t *ixgbe)
2260 {
2261 ixgbe_rx_ring_t *rx_ring;
2262 ixgbe_rx_data_t *rx_data;
2263 int i;
2264
2265 for (i = 0; i < ixgbe->num_rx_rings; i++) {
2266 rx_ring = &ixgbe->rx_rings[i];
2267
2268 mutex_enter(&ixgbe->rx_pending_lock);
2269 rx_data = rx_ring->rx_data;
2270
2271 if (rx_data != NULL) {
2272 rx_data->flag |= IXGBE_RX_STOPPED;
2273
2274 if (rx_data->rcb_pending == 0) {
2275 ixgbe_free_rx_ring_data(rx_data);
2276 rx_ring->rx_data = NULL;
2277 }
2278 }
2279
2280 mutex_exit(&ixgbe->rx_pending_lock);
2281 }
2282 }
2283
2284 /*
2285 * ixgbe_setup_rings - Setup rx/tx rings.
2286 */
2287 static void
ixgbe_setup_rings(ixgbe_t * ixgbe)2288 ixgbe_setup_rings(ixgbe_t *ixgbe)
2289 {
2290 /*
2291 * Setup the rx/tx rings, including the following:
2292 *
2293 * 1. Setup the descriptor ring and the control block buffers;
2294 * 2. Initialize necessary registers for receive/transmit;
2295 * 3. Initialize software pointers/parameters for receive/transmit;
2296 */
2297 ixgbe_setup_rx(ixgbe);
2298
2299 ixgbe_setup_tx(ixgbe);
2300 }
2301
2302 static void
ixgbe_setup_rx_ring(ixgbe_rx_ring_t * rx_ring)2303 ixgbe_setup_rx_ring(ixgbe_rx_ring_t *rx_ring)
2304 {
2305 ixgbe_t *ixgbe = rx_ring->ixgbe;
2306 ixgbe_rx_data_t *rx_data = rx_ring->rx_data;
2307 struct ixgbe_hw *hw = &ixgbe->hw;
2308 rx_control_block_t *rcb;
2309 union ixgbe_adv_rx_desc *rbd;
2310 uint32_t size;
2311 uint32_t buf_low;
2312 uint32_t buf_high;
2313 uint32_t reg_val;
2314 int i;
2315
2316 ASSERT(mutex_owned(&rx_ring->rx_lock));
2317 ASSERT(mutex_owned(&ixgbe->gen_lock));
2318
2319 for (i = 0; i < ixgbe->rx_ring_size; i++) {
2320 rcb = rx_data->work_list[i];
2321 rbd = &rx_data->rbd_ring[i];
2322
2323 rbd->read.pkt_addr = rcb->rx_buf.dma_address;
2324 rbd->read.hdr_addr = NULL;
2325 }
2326
2327 /*
2328 * Initialize the length register
2329 */
2330 size = rx_data->ring_size * sizeof (union ixgbe_adv_rx_desc);
2331 IXGBE_WRITE_REG(hw, IXGBE_RDLEN(rx_ring->hw_index), size);
2332
2333 /*
2334 * Initialize the base address registers
2335 */
2336 buf_low = (uint32_t)rx_data->rbd_area.dma_address;
2337 buf_high = (uint32_t)(rx_data->rbd_area.dma_address >> 32);
2338 IXGBE_WRITE_REG(hw, IXGBE_RDBAH(rx_ring->hw_index), buf_high);
2339 IXGBE_WRITE_REG(hw, IXGBE_RDBAL(rx_ring->hw_index), buf_low);
2340
2341 /*
2342 * Setup head & tail pointers
2343 */
2344 IXGBE_WRITE_REG(hw, IXGBE_RDT(rx_ring->hw_index),
2345 rx_data->ring_size - 1);
2346 IXGBE_WRITE_REG(hw, IXGBE_RDH(rx_ring->hw_index), 0);
2347
2348 rx_data->rbd_next = 0;
2349 rx_data->lro_first = 0;
2350
2351 /*
2352 * Setup the Receive Descriptor Control Register (RXDCTL)
2353 * PTHRESH=32 descriptors (half the internal cache)
2354 * HTHRESH=0 descriptors (to minimize latency on fetch)
2355 * WTHRESH defaults to 1 (writeback each descriptor)
2356 */
2357 reg_val = IXGBE_READ_REG(hw, IXGBE_RXDCTL(rx_ring->hw_index));
2358 reg_val |= IXGBE_RXDCTL_ENABLE; /* enable queue */
2359
2360 /* Not a valid value for 82599, X540 or X550 */
2361 if (hw->mac.type == ixgbe_mac_82598EB) {
2362 reg_val |= 0x0020; /* pthresh */
2363 }
2364 IXGBE_WRITE_REG(hw, IXGBE_RXDCTL(rx_ring->hw_index), reg_val);
2365
2366 if (hw->mac.type == ixgbe_mac_82599EB ||
2367 hw->mac.type == ixgbe_mac_X540 ||
2368 hw->mac.type == ixgbe_mac_X550 ||
2369 hw->mac.type == ixgbe_mac_X550EM_x) {
2370 reg_val = IXGBE_READ_REG(hw, IXGBE_RDRXCTL);
2371 reg_val |= (IXGBE_RDRXCTL_CRCSTRIP | IXGBE_RDRXCTL_AGGDIS);
2372 IXGBE_WRITE_REG(hw, IXGBE_RDRXCTL, reg_val);
2373 }
2374
2375 /*
2376 * Setup the Split and Replication Receive Control Register.
2377 * Set the rx buffer size and the advanced descriptor type.
2378 */
2379 reg_val = (ixgbe->rx_buf_size >> IXGBE_SRRCTL_BSIZEPKT_SHIFT) |
2380 IXGBE_SRRCTL_DESCTYPE_ADV_ONEBUF;
2381 reg_val |= IXGBE_SRRCTL_DROP_EN;
2382 IXGBE_WRITE_REG(hw, IXGBE_SRRCTL(rx_ring->hw_index), reg_val);
2383 }
2384
2385 static void
ixgbe_setup_rx(ixgbe_t * ixgbe)2386 ixgbe_setup_rx(ixgbe_t *ixgbe)
2387 {
2388 ixgbe_rx_ring_t *rx_ring;
2389 struct ixgbe_hw *hw = &ixgbe->hw;
2390 uint32_t reg_val;
2391 uint32_t ring_mapping;
2392 uint32_t i, index;
2393 uint32_t psrtype_rss_bit;
2394
2395 /*
2396 * Ensure that Rx is disabled while setting up
2397 * the Rx unit and Rx descriptor ring(s)
2398 */
2399 ixgbe_disable_rx(hw);
2400
2401 /* PSRTYPE must be configured for 82599 */
2402 if (ixgbe->classify_mode != IXGBE_CLASSIFY_VMDQ &&
2403 ixgbe->classify_mode != IXGBE_CLASSIFY_VMDQ_RSS) {
2404 reg_val = IXGBE_PSRTYPE_TCPHDR | IXGBE_PSRTYPE_UDPHDR |
2405 IXGBE_PSRTYPE_IPV4HDR | IXGBE_PSRTYPE_IPV6HDR;
2406 reg_val |= IXGBE_PSRTYPE_L2HDR;
2407 reg_val |= 0x80000000;
2408 IXGBE_WRITE_REG(hw, IXGBE_PSRTYPE(0), reg_val);
2409 } else {
2410 if (ixgbe->num_rx_groups > 32) {
2411 psrtype_rss_bit = 0x20000000;
2412 } else {
2413 psrtype_rss_bit = 0x40000000;
2414 }
2415 for (i = 0; i < ixgbe->capab->max_rx_grp_num; i++) {
2416 reg_val = IXGBE_PSRTYPE_TCPHDR | IXGBE_PSRTYPE_UDPHDR |
2417 IXGBE_PSRTYPE_IPV4HDR | IXGBE_PSRTYPE_IPV6HDR;
2418 reg_val |= IXGBE_PSRTYPE_L2HDR;
2419 reg_val |= psrtype_rss_bit;
2420 IXGBE_WRITE_REG(hw, IXGBE_PSRTYPE(i), reg_val);
2421 }
2422 }
2423
2424 /*
2425 * Set filter control in FCTRL to determine types of packets are passed
2426 * up to the driver.
2427 * - Pass broadcast packets.
2428 * - Do not pass flow control pause frames (82598-specific)
2429 */
2430 reg_val = IXGBE_READ_REG(hw, IXGBE_FCTRL);
2431 reg_val |= IXGBE_FCTRL_BAM; /* Broadcast Accept Mode */
2432 if (hw->mac.type == ixgbe_mac_82598EB) {
2433 reg_val |= IXGBE_FCTRL_DPF; /* Discard Pause Frames */
2434 }
2435 IXGBE_WRITE_REG(hw, IXGBE_FCTRL, reg_val);
2436
2437 /*
2438 * Hardware checksum settings
2439 */
2440 if (ixgbe->rx_hcksum_enable) {
2441 reg_val = IXGBE_READ_REG(hw, IXGBE_RXCSUM);
2442 reg_val |= IXGBE_RXCSUM_IPPCSE; /* IP checksum */
2443 IXGBE_WRITE_REG(hw, IXGBE_RXCSUM, reg_val);
2444 }
2445
2446 /*
2447 * Setup VMDq and RSS for multiple receive queues
2448 */
2449 switch (ixgbe->classify_mode) {
2450 case IXGBE_CLASSIFY_RSS:
2451 /*
2452 * One group, only RSS is needed when more than
2453 * one ring enabled.
2454 */
2455 ixgbe_setup_rss(ixgbe);
2456 break;
2457
2458 case IXGBE_CLASSIFY_VMDQ:
2459 /*
2460 * Multiple groups, each group has one ring,
2461 * only VMDq is needed.
2462 */
2463 ixgbe_setup_vmdq(ixgbe);
2464 break;
2465
2466 case IXGBE_CLASSIFY_VMDQ_RSS:
2467 /*
2468 * Multiple groups and multiple rings, both
2469 * VMDq and RSS are needed.
2470 */
2471 ixgbe_setup_vmdq_rss(ixgbe);
2472 break;
2473
2474 default:
2475 break;
2476 }
2477
2478 /*
2479 * Enable the receive unit. This must be done after filter
2480 * control is set in FCTRL. On 82598, we disable the descriptor monitor.
2481 * 82598 is the only adapter which defines this RXCTRL option.
2482 */
2483 reg_val = IXGBE_READ_REG(hw, IXGBE_RXCTRL);
2484 if (hw->mac.type == ixgbe_mac_82598EB)
2485 reg_val |= IXGBE_RXCTRL_DMBYPS; /* descriptor monitor bypass */
2486 reg_val |= IXGBE_RXCTRL_RXEN;
2487 (void) ixgbe_enable_rx_dma(hw, reg_val);
2488
2489 /*
2490 * ixgbe_setup_rx_ring must be called after configuring RXCTRL
2491 */
2492 for (i = 0; i < ixgbe->num_rx_rings; i++) {
2493 rx_ring = &ixgbe->rx_rings[i];
2494 ixgbe_setup_rx_ring(rx_ring);
2495 }
2496
2497 /*
2498 * Setup the per-ring statistics mapping.
2499 */
2500 ring_mapping = 0;
2501 for (i = 0; i < ixgbe->num_rx_rings; i++) {
2502 index = ixgbe->rx_rings[i].hw_index;
2503 ring_mapping = IXGBE_READ_REG(hw, IXGBE_RQSMR(index >> 2));
2504 ring_mapping |= (i & 0xF) << (8 * (index & 0x3));
2505 IXGBE_WRITE_REG(hw, IXGBE_RQSMR(index >> 2), ring_mapping);
2506 }
2507
2508 /*
2509 * The Max Frame Size in MHADD/MAXFRS will be internally increased
2510 * by four bytes if the packet has a VLAN field, so includes MTU,
2511 * ethernet header and frame check sequence.
2512 * Register is MAXFRS in 82599.
2513 */
2514 reg_val = IXGBE_READ_REG(hw, IXGBE_MHADD);
2515 reg_val &= ~IXGBE_MHADD_MFS_MASK;
2516 reg_val |= (ixgbe->default_mtu + sizeof (struct ether_header)
2517 + ETHERFCSL) << IXGBE_MHADD_MFS_SHIFT;
2518 IXGBE_WRITE_REG(hw, IXGBE_MHADD, reg_val);
2519
2520 /*
2521 * Setup Jumbo Frame enable bit
2522 */
2523 reg_val = IXGBE_READ_REG(hw, IXGBE_HLREG0);
2524 if (ixgbe->default_mtu > ETHERMTU)
2525 reg_val |= IXGBE_HLREG0_JUMBOEN;
2526 else
2527 reg_val &= ~IXGBE_HLREG0_JUMBOEN;
2528 IXGBE_WRITE_REG(hw, IXGBE_HLREG0, reg_val);
2529
2530 /*
2531 * Setup RSC for multiple receive queues.
2532 */
2533 if (ixgbe->lro_enable) {
2534 for (i = 0; i < ixgbe->num_rx_rings; i++) {
2535 /*
2536 * Make sure rx_buf_size * MAXDESC not greater
2537 * than 65535.
2538 * Intel recommends 4 for MAXDESC field value.
2539 */
2540 reg_val = IXGBE_READ_REG(hw, IXGBE_RSCCTL(i));
2541 reg_val |= IXGBE_RSCCTL_RSCEN;
2542 if (ixgbe->rx_buf_size == IXGBE_PKG_BUF_16k)
2543 reg_val |= IXGBE_RSCCTL_MAXDESC_1;
2544 else
2545 reg_val |= IXGBE_RSCCTL_MAXDESC_4;
2546 IXGBE_WRITE_REG(hw, IXGBE_RSCCTL(i), reg_val);
2547 }
2548
2549 reg_val = IXGBE_READ_REG(hw, IXGBE_RSCDBU);
2550 reg_val |= IXGBE_RSCDBU_RSCACKDIS;
2551 IXGBE_WRITE_REG(hw, IXGBE_RSCDBU, reg_val);
2552
2553 reg_val = IXGBE_READ_REG(hw, IXGBE_RDRXCTL);
2554 reg_val |= IXGBE_RDRXCTL_RSCACKC;
2555 reg_val |= IXGBE_RDRXCTL_FCOE_WRFIX;
2556 reg_val &= ~IXGBE_RDRXCTL_RSCFRSTSIZE;
2557
2558 IXGBE_WRITE_REG(hw, IXGBE_RDRXCTL, reg_val);
2559 }
2560 }
2561
2562 static void
ixgbe_setup_tx_ring(ixgbe_tx_ring_t * tx_ring)2563 ixgbe_setup_tx_ring(ixgbe_tx_ring_t *tx_ring)
2564 {
2565 ixgbe_t *ixgbe = tx_ring->ixgbe;
2566 struct ixgbe_hw *hw = &ixgbe->hw;
2567 uint32_t size;
2568 uint32_t buf_low;
2569 uint32_t buf_high;
2570 uint32_t reg_val;
2571
2572 ASSERT(mutex_owned(&tx_ring->tx_lock));
2573 ASSERT(mutex_owned(&ixgbe->gen_lock));
2574
2575 /*
2576 * Initialize the length register
2577 */
2578 size = tx_ring->ring_size * sizeof (union ixgbe_adv_tx_desc);
2579 IXGBE_WRITE_REG(hw, IXGBE_TDLEN(tx_ring->index), size);
2580
2581 /*
2582 * Initialize the base address registers
2583 */
2584 buf_low = (uint32_t)tx_ring->tbd_area.dma_address;
2585 buf_high = (uint32_t)(tx_ring->tbd_area.dma_address >> 32);
2586 IXGBE_WRITE_REG(hw, IXGBE_TDBAL(tx_ring->index), buf_low);
2587 IXGBE_WRITE_REG(hw, IXGBE_TDBAH(tx_ring->index), buf_high);
2588
2589 /*
2590 * Setup head & tail pointers
2591 */
2592 IXGBE_WRITE_REG(hw, IXGBE_TDH(tx_ring->index), 0);
2593 IXGBE_WRITE_REG(hw, IXGBE_TDT(tx_ring->index), 0);
2594
2595 /*
2596 * Setup head write-back
2597 */
2598 if (ixgbe->tx_head_wb_enable) {
2599 /*
2600 * The memory of the head write-back is allocated using
2601 * the extra tbd beyond the tail of the tbd ring.
2602 */
2603 tx_ring->tbd_head_wb = (uint32_t *)
2604 ((uintptr_t)tx_ring->tbd_area.address + size);
2605 *tx_ring->tbd_head_wb = 0;
2606
2607 buf_low = (uint32_t)
2608 (tx_ring->tbd_area.dma_address + size);
2609 buf_high = (uint32_t)
2610 ((tx_ring->tbd_area.dma_address + size) >> 32);
2611
2612 /* Set the head write-back enable bit */
2613 buf_low |= IXGBE_TDWBAL_HEAD_WB_ENABLE;
2614
2615 IXGBE_WRITE_REG(hw, IXGBE_TDWBAL(tx_ring->index), buf_low);
2616 IXGBE_WRITE_REG(hw, IXGBE_TDWBAH(tx_ring->index), buf_high);
2617
2618 /*
2619 * Turn off relaxed ordering for head write back or it will
2620 * cause problems with the tx recycling
2621 */
2622
2623 reg_val = (hw->mac.type == ixgbe_mac_82598EB) ?
2624 IXGBE_READ_REG(hw, IXGBE_DCA_TXCTRL(tx_ring->index)) :
2625 IXGBE_READ_REG(hw, IXGBE_DCA_TXCTRL_82599(tx_ring->index));
2626 reg_val &= ~IXGBE_DCA_TXCTRL_DESC_WRO_EN;
2627 if (hw->mac.type == ixgbe_mac_82598EB) {
2628 IXGBE_WRITE_REG(hw,
2629 IXGBE_DCA_TXCTRL(tx_ring->index), reg_val);
2630 } else {
2631 IXGBE_WRITE_REG(hw,
2632 IXGBE_DCA_TXCTRL_82599(tx_ring->index), reg_val);
2633 }
2634 } else {
2635 tx_ring->tbd_head_wb = NULL;
2636 }
2637
2638 tx_ring->tbd_head = 0;
2639 tx_ring->tbd_tail = 0;
2640 tx_ring->tbd_free = tx_ring->ring_size;
2641
2642 if (ixgbe->tx_ring_init == B_TRUE) {
2643 tx_ring->tcb_head = 0;
2644 tx_ring->tcb_tail = 0;
2645 tx_ring->tcb_free = tx_ring->free_list_size;
2646 }
2647
2648 /*
2649 * Initialize the s/w context structure
2650 */
2651 bzero(&tx_ring->tx_context, sizeof (ixgbe_tx_context_t));
2652 }
2653
2654 static void
ixgbe_setup_tx(ixgbe_t * ixgbe)2655 ixgbe_setup_tx(ixgbe_t *ixgbe)
2656 {
2657 struct ixgbe_hw *hw = &ixgbe->hw;
2658 ixgbe_tx_ring_t *tx_ring;
2659 uint32_t reg_val;
2660 uint32_t ring_mapping;
2661 int i;
2662
2663 for (i = 0; i < ixgbe->num_tx_rings; i++) {
2664 tx_ring = &ixgbe->tx_rings[i];
2665 ixgbe_setup_tx_ring(tx_ring);
2666 }
2667
2668 /*
2669 * Setup the per-ring statistics mapping.
2670 */
2671 ring_mapping = 0;
2672 for (i = 0; i < ixgbe->num_tx_rings; i++) {
2673 ring_mapping |= (i & 0xF) << (8 * (i & 0x3));
2674 if ((i & 0x3) == 0x3) {
2675 switch (hw->mac.type) {
2676 case ixgbe_mac_82598EB:
2677 IXGBE_WRITE_REG(hw, IXGBE_TQSMR(i >> 2),
2678 ring_mapping);
2679 break;
2680
2681 case ixgbe_mac_82599EB:
2682 case ixgbe_mac_X540:
2683 case ixgbe_mac_X550:
2684 case ixgbe_mac_X550EM_x:
2685 IXGBE_WRITE_REG(hw, IXGBE_TQSM(i >> 2),
2686 ring_mapping);
2687 break;
2688
2689 default:
2690 break;
2691 }
2692
2693 ring_mapping = 0;
2694 }
2695 }
2696 if (i & 0x3) {
2697 switch (hw->mac.type) {
2698 case ixgbe_mac_82598EB:
2699 IXGBE_WRITE_REG(hw, IXGBE_TQSMR(i >> 2), ring_mapping);
2700 break;
2701
2702 case ixgbe_mac_82599EB:
2703 case ixgbe_mac_X540:
2704 case ixgbe_mac_X550:
2705 case ixgbe_mac_X550EM_x:
2706 IXGBE_WRITE_REG(hw, IXGBE_TQSM(i >> 2), ring_mapping);
2707 break;
2708
2709 default:
2710 break;
2711 }
2712 }
2713
2714 /*
2715 * Enable CRC appending and TX padding (for short tx frames)
2716 */
2717 reg_val = IXGBE_READ_REG(hw, IXGBE_HLREG0);
2718 reg_val |= IXGBE_HLREG0_TXCRCEN | IXGBE_HLREG0_TXPADEN;
2719 IXGBE_WRITE_REG(hw, IXGBE_HLREG0, reg_val);
2720
2721 /*
2722 * enable DMA for 82599, X540 and X550 parts
2723 */
2724 if (hw->mac.type == ixgbe_mac_82599EB ||
2725 hw->mac.type == ixgbe_mac_X540 ||
2726 hw->mac.type == ixgbe_mac_X550 ||
2727 hw->mac.type == ixgbe_mac_X550EM_x) {
2728 /* DMATXCTL.TE must be set after all Tx config is complete */
2729 reg_val = IXGBE_READ_REG(hw, IXGBE_DMATXCTL);
2730 reg_val |= IXGBE_DMATXCTL_TE;
2731 IXGBE_WRITE_REG(hw, IXGBE_DMATXCTL, reg_val);
2732
2733 /* Disable arbiter to set MTQC */
2734 reg_val = IXGBE_READ_REG(hw, IXGBE_RTTDCS);
2735 reg_val |= IXGBE_RTTDCS_ARBDIS;
2736 IXGBE_WRITE_REG(hw, IXGBE_RTTDCS, reg_val);
2737 IXGBE_WRITE_REG(hw, IXGBE_MTQC, IXGBE_MTQC_64Q_1PB);
2738 reg_val &= ~IXGBE_RTTDCS_ARBDIS;
2739 IXGBE_WRITE_REG(hw, IXGBE_RTTDCS, reg_val);
2740 }
2741
2742 /*
2743 * Enabling tx queues ..
2744 * For 82599 must be done after DMATXCTL.TE is set
2745 */
2746 for (i = 0; i < ixgbe->num_tx_rings; i++) {
2747 tx_ring = &ixgbe->tx_rings[i];
2748 reg_val = IXGBE_READ_REG(hw, IXGBE_TXDCTL(tx_ring->index));
2749 reg_val |= IXGBE_TXDCTL_ENABLE;
2750 IXGBE_WRITE_REG(hw, IXGBE_TXDCTL(tx_ring->index), reg_val);
2751 }
2752 }
2753
2754 /*
2755 * ixgbe_setup_rss - Setup receive-side scaling feature.
2756 */
2757 static void
ixgbe_setup_rss(ixgbe_t * ixgbe)2758 ixgbe_setup_rss(ixgbe_t *ixgbe)
2759 {
2760 struct ixgbe_hw *hw = &ixgbe->hw;
2761 uint32_t mrqc;
2762
2763 /*
2764 * Initialize RETA/ERETA table
2765 */
2766 ixgbe_setup_rss_table(ixgbe);
2767
2768 /*
2769 * Enable RSS & perform hash on these packet types
2770 */
2771 mrqc = IXGBE_MRQC_RSSEN |
2772 IXGBE_MRQC_RSS_FIELD_IPV4 |
2773 IXGBE_MRQC_RSS_FIELD_IPV4_TCP |
2774 IXGBE_MRQC_RSS_FIELD_IPV4_UDP |
2775 IXGBE_MRQC_RSS_FIELD_IPV6_EX_TCP |
2776 IXGBE_MRQC_RSS_FIELD_IPV6_EX |
2777 IXGBE_MRQC_RSS_FIELD_IPV6 |
2778 IXGBE_MRQC_RSS_FIELD_IPV6_TCP |
2779 IXGBE_MRQC_RSS_FIELD_IPV6_UDP |
2780 IXGBE_MRQC_RSS_FIELD_IPV6_EX_UDP;
2781 IXGBE_WRITE_REG(hw, IXGBE_MRQC, mrqc);
2782 }
2783
2784 /*
2785 * ixgbe_setup_vmdq - Setup MAC classification feature
2786 */
2787 static void
ixgbe_setup_vmdq(ixgbe_t * ixgbe)2788 ixgbe_setup_vmdq(ixgbe_t *ixgbe)
2789 {
2790 struct ixgbe_hw *hw = &ixgbe->hw;
2791 uint32_t vmdctl, i, vtctl;
2792
2793 /*
2794 * Setup the VMDq Control register, enable VMDq based on
2795 * packet destination MAC address:
2796 */
2797 switch (hw->mac.type) {
2798 case ixgbe_mac_82598EB:
2799 /*
2800 * VMDq Enable = 1;
2801 * VMDq Filter = 0; MAC filtering
2802 * Default VMDq output index = 0;
2803 */
2804 vmdctl = IXGBE_VMD_CTL_VMDQ_EN;
2805 IXGBE_WRITE_REG(hw, IXGBE_VMD_CTL, vmdctl);
2806 break;
2807
2808 case ixgbe_mac_82599EB:
2809 case ixgbe_mac_X540:
2810 case ixgbe_mac_X550:
2811 case ixgbe_mac_X550EM_x:
2812 /*
2813 * Enable VMDq-only.
2814 */
2815 vmdctl = IXGBE_MRQC_VMDQEN;
2816 IXGBE_WRITE_REG(hw, IXGBE_MRQC, vmdctl);
2817
2818 for (i = 0; i < hw->mac.num_rar_entries; i++) {
2819 IXGBE_WRITE_REG(hw, IXGBE_MPSAR_LO(i), 0);
2820 IXGBE_WRITE_REG(hw, IXGBE_MPSAR_HI(i), 0);
2821 }
2822
2823 /*
2824 * Enable Virtualization and Replication.
2825 */
2826 vtctl = IXGBE_VT_CTL_VT_ENABLE | IXGBE_VT_CTL_REPLEN;
2827 IXGBE_WRITE_REG(hw, IXGBE_VT_CTL, vtctl);
2828
2829 /*
2830 * Enable receiving packets to all VFs
2831 */
2832 IXGBE_WRITE_REG(hw, IXGBE_VFRE(0), IXGBE_VFRE_ENABLE_ALL);
2833 IXGBE_WRITE_REG(hw, IXGBE_VFRE(1), IXGBE_VFRE_ENABLE_ALL);
2834 break;
2835
2836 default:
2837 break;
2838 }
2839 }
2840
2841 /*
2842 * ixgbe_setup_vmdq_rss - Setup both vmdq feature and rss feature.
2843 */
2844 static void
ixgbe_setup_vmdq_rss(ixgbe_t * ixgbe)2845 ixgbe_setup_vmdq_rss(ixgbe_t *ixgbe)
2846 {
2847 struct ixgbe_hw *hw = &ixgbe->hw;
2848 uint32_t i, mrqc;
2849 uint32_t vtctl, vmdctl;
2850
2851 /*
2852 * Initialize RETA/ERETA table
2853 */
2854 ixgbe_setup_rss_table(ixgbe);
2855
2856 /*
2857 * Enable and setup RSS and VMDq
2858 */
2859 switch (hw->mac.type) {
2860 case ixgbe_mac_82598EB:
2861 /*
2862 * Enable RSS & Setup RSS Hash functions
2863 */
2864 mrqc = IXGBE_MRQC_RSSEN |
2865 IXGBE_MRQC_RSS_FIELD_IPV4 |
2866 IXGBE_MRQC_RSS_FIELD_IPV4_TCP |
2867 IXGBE_MRQC_RSS_FIELD_IPV4_UDP |
2868 IXGBE_MRQC_RSS_FIELD_IPV6_EX_TCP |
2869 IXGBE_MRQC_RSS_FIELD_IPV6_EX |
2870 IXGBE_MRQC_RSS_FIELD_IPV6 |
2871 IXGBE_MRQC_RSS_FIELD_IPV6_TCP |
2872 IXGBE_MRQC_RSS_FIELD_IPV6_UDP |
2873 IXGBE_MRQC_RSS_FIELD_IPV6_EX_UDP;
2874 IXGBE_WRITE_REG(hw, IXGBE_MRQC, mrqc);
2875
2876 /*
2877 * Enable and Setup VMDq
2878 * VMDq Filter = 0; MAC filtering
2879 * Default VMDq output index = 0;
2880 */
2881 vmdctl = IXGBE_VMD_CTL_VMDQ_EN;
2882 IXGBE_WRITE_REG(hw, IXGBE_VMD_CTL, vmdctl);
2883 break;
2884
2885 case ixgbe_mac_82599EB:
2886 case ixgbe_mac_X540:
2887 case ixgbe_mac_X550:
2888 case ixgbe_mac_X550EM_x:
2889 /*
2890 * Enable RSS & Setup RSS Hash functions
2891 */
2892 mrqc = IXGBE_MRQC_RSS_FIELD_IPV4 |
2893 IXGBE_MRQC_RSS_FIELD_IPV4_TCP |
2894 IXGBE_MRQC_RSS_FIELD_IPV4_UDP |
2895 IXGBE_MRQC_RSS_FIELD_IPV6_EX_TCP |
2896 IXGBE_MRQC_RSS_FIELD_IPV6_EX |
2897 IXGBE_MRQC_RSS_FIELD_IPV6 |
2898 IXGBE_MRQC_RSS_FIELD_IPV6_TCP |
2899 IXGBE_MRQC_RSS_FIELD_IPV6_UDP |
2900 IXGBE_MRQC_RSS_FIELD_IPV6_EX_UDP;
2901
2902 /*
2903 * Enable VMDq+RSS.
2904 */
2905 if (ixgbe->num_rx_groups > 32) {
2906 mrqc = mrqc | IXGBE_MRQC_VMDQRSS64EN;
2907 } else {
2908 mrqc = mrqc | IXGBE_MRQC_VMDQRSS32EN;
2909 }
2910
2911 IXGBE_WRITE_REG(hw, IXGBE_MRQC, mrqc);
2912
2913 for (i = 0; i < hw->mac.num_rar_entries; i++) {
2914 IXGBE_WRITE_REG(hw, IXGBE_MPSAR_LO(i), 0);
2915 IXGBE_WRITE_REG(hw, IXGBE_MPSAR_HI(i), 0);
2916 }
2917 break;
2918
2919 default:
2920 break;
2921
2922 }
2923
2924 if (hw->mac.type == ixgbe_mac_82599EB ||
2925 hw->mac.type == ixgbe_mac_X540 ||
2926 hw->mac.type == ixgbe_mac_X550 ||
2927 hw->mac.type == ixgbe_mac_X550EM_x) {
2928 /*
2929 * Enable Virtualization and Replication.
2930 */
2931 vtctl = IXGBE_VT_CTL_VT_ENABLE | IXGBE_VT_CTL_REPLEN;
2932 IXGBE_WRITE_REG(hw, IXGBE_VT_CTL, vtctl);
2933
2934 /*
2935 * Enable receiving packets to all VFs
2936 */
2937 IXGBE_WRITE_REG(hw, IXGBE_VFRE(0), IXGBE_VFRE_ENABLE_ALL);
2938 IXGBE_WRITE_REG(hw, IXGBE_VFRE(1), IXGBE_VFRE_ENABLE_ALL);
2939 }
2940 }
2941
2942 /*
2943 * ixgbe_setup_rss_table - Setup RSS table
2944 */
2945 static void
ixgbe_setup_rss_table(ixgbe_t * ixgbe)2946 ixgbe_setup_rss_table(ixgbe_t *ixgbe)
2947 {
2948 struct ixgbe_hw *hw = &ixgbe->hw;
2949 uint32_t i, j;
2950 uint32_t random;
2951 uint32_t reta;
2952 uint32_t ring_per_group;
2953 uint32_t ring;
2954 uint32_t table_size;
2955 uint32_t index_mult;
2956 uint32_t rxcsum;
2957
2958 /*
2959 * Set multiplier for RETA setup and table size based on MAC type.
2960 * RETA table sizes vary by model:
2961 *
2962 * 82598, 82599, X540: 128 table entries.
2963 * X550: 512 table entries.
2964 */
2965 index_mult = 0x1;
2966 table_size = 128;
2967 switch (ixgbe->hw.mac.type) {
2968 case ixgbe_mac_82598EB:
2969 index_mult = 0x11;
2970 break;
2971 case ixgbe_mac_X550:
2972 case ixgbe_mac_X550EM_x:
2973 table_size = 512;
2974 break;
2975 default:
2976 break;
2977 }
2978
2979 /*
2980 * Fill out RSS redirection table. The configuation of the indices is
2981 * hardware-dependent.
2982 *
2983 * 82598: 8 bits wide containing two 4 bit RSS indices
2984 * 82599, X540: 8 bits wide containing one 4 bit RSS index
2985 * X550: 8 bits wide containing one 6 bit RSS index
2986 */
2987 reta = 0;
2988 ring_per_group = ixgbe->num_rx_rings / ixgbe->num_rx_groups;
2989
2990 for (i = 0, j = 0; i < table_size; i++, j++) {
2991 if (j == ring_per_group) j = 0;
2992
2993 /*
2994 * The low 8 bits are for hash value (n+0);
2995 * The next 8 bits are for hash value (n+1), etc.
2996 */
2997 ring = (j * index_mult);
2998 reta = reta >> 8;
2999 reta = reta | (((uint32_t)ring) << 24);
3000
3001 if ((i & 3) == 3) {
3002 /*
3003 * The first 128 table entries are programmed into the
3004 * RETA register, with any beyond that (eg; on X550)
3005 * into ERETA.
3006 */
3007 if (i < 128)
3008 IXGBE_WRITE_REG(hw, IXGBE_RETA(i >> 2), reta);
3009 else
3010 IXGBE_WRITE_REG(hw, IXGBE_ERETA((i >> 2) - 32),
3011 reta);
3012 reta = 0;
3013 }
3014 }
3015
3016 /*
3017 * Fill out hash function seeds with a random constant
3018 */
3019 for (i = 0; i < 10; i++) {
3020 (void) random_get_pseudo_bytes((uint8_t *)&random,
3021 sizeof (uint32_t));
3022 IXGBE_WRITE_REG(hw, IXGBE_RSSRK(i), random);
3023 }
3024
3025 /*
3026 * Disable Packet Checksum to enable RSS for multiple receive queues.
3027 * It is an adapter hardware limitation that Packet Checksum is
3028 * mutually exclusive with RSS.
3029 */
3030 rxcsum = IXGBE_READ_REG(hw, IXGBE_RXCSUM);
3031 rxcsum |= IXGBE_RXCSUM_PCSD;
3032 rxcsum &= ~IXGBE_RXCSUM_IPPCSE;
3033 IXGBE_WRITE_REG(hw, IXGBE_RXCSUM, rxcsum);
3034 }
3035
3036 /*
3037 * ixgbe_init_unicst - Initialize the unicast addresses.
3038 */
3039 static void
ixgbe_init_unicst(ixgbe_t * ixgbe)3040 ixgbe_init_unicst(ixgbe_t *ixgbe)
3041 {
3042 struct ixgbe_hw *hw = &ixgbe->hw;
3043 uint8_t *mac_addr;
3044 int slot;
3045 /*
3046 * Here we should consider two situations:
3047 *
3048 * 1. Chipset is initialized at the first time,
3049 * Clear all the multiple unicast addresses.
3050 *
3051 * 2. Chipset is reset
3052 * Recover the multiple unicast addresses from the
3053 * software data structure to the RAR registers.
3054 */
3055 if (!ixgbe->unicst_init) {
3056 /*
3057 * Initialize the multiple unicast addresses
3058 */
3059 ixgbe->unicst_total = hw->mac.num_rar_entries;
3060 ixgbe->unicst_avail = ixgbe->unicst_total;
3061 for (slot = 0; slot < ixgbe->unicst_total; slot++) {
3062 mac_addr = ixgbe->unicst_addr[slot].mac.addr;
3063 bzero(mac_addr, ETHERADDRL);
3064 (void) ixgbe_set_rar(hw, slot, mac_addr, NULL, NULL);
3065 ixgbe->unicst_addr[slot].mac.set = 0;
3066 }
3067 ixgbe->unicst_init = B_TRUE;
3068 } else {
3069 /* Re-configure the RAR registers */
3070 for (slot = 0; slot < ixgbe->unicst_total; slot++) {
3071 mac_addr = ixgbe->unicst_addr[slot].mac.addr;
3072 if (ixgbe->unicst_addr[slot].mac.set == 1) {
3073 (void) ixgbe_set_rar(hw, slot, mac_addr,
3074 ixgbe->unicst_addr[slot].mac.group_index,
3075 IXGBE_RAH_AV);
3076 } else {
3077 bzero(mac_addr, ETHERADDRL);
3078 (void) ixgbe_set_rar(hw, slot, mac_addr,
3079 NULL, NULL);
3080 }
3081 }
3082 }
3083 }
3084
3085 /*
3086 * ixgbe_unicst_find - Find the slot for the specified unicast address
3087 */
3088 int
ixgbe_unicst_find(ixgbe_t * ixgbe,const uint8_t * mac_addr)3089 ixgbe_unicst_find(ixgbe_t *ixgbe, const uint8_t *mac_addr)
3090 {
3091 int slot;
3092
3093 ASSERT(mutex_owned(&ixgbe->gen_lock));
3094
3095 for (slot = 0; slot < ixgbe->unicst_total; slot++) {
3096 if (bcmp(ixgbe->unicst_addr[slot].mac.addr,
3097 mac_addr, ETHERADDRL) == 0)
3098 return (slot);
3099 }
3100
3101 return (-1);
3102 }
3103
3104 /*
3105 * ixgbe_multicst_add - Add a multicst address.
3106 */
3107 int
ixgbe_multicst_add(ixgbe_t * ixgbe,const uint8_t * multiaddr)3108 ixgbe_multicst_add(ixgbe_t *ixgbe, const uint8_t *multiaddr)
3109 {
3110 ASSERT(mutex_owned(&ixgbe->gen_lock));
3111
3112 if ((multiaddr[0] & 01) == 0) {
3113 return (EINVAL);
3114 }
3115
3116 if (ixgbe->mcast_count >= MAX_NUM_MULTICAST_ADDRESSES) {
3117 return (ENOENT);
3118 }
3119
3120 bcopy(multiaddr,
3121 &ixgbe->mcast_table[ixgbe->mcast_count], ETHERADDRL);
3122 ixgbe->mcast_count++;
3123
3124 /*
3125 * Update the multicast table in the hardware
3126 */
3127 ixgbe_setup_multicst(ixgbe);
3128
3129 if (ixgbe_check_acc_handle(ixgbe->osdep.reg_handle) != DDI_FM_OK) {
3130 ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_DEGRADED);
3131 return (EIO);
3132 }
3133
3134 return (0);
3135 }
3136
3137 /*
3138 * ixgbe_multicst_remove - Remove a multicst address.
3139 */
3140 int
ixgbe_multicst_remove(ixgbe_t * ixgbe,const uint8_t * multiaddr)3141 ixgbe_multicst_remove(ixgbe_t *ixgbe, const uint8_t *multiaddr)
3142 {
3143 int i;
3144
3145 ASSERT(mutex_owned(&ixgbe->gen_lock));
3146
3147 for (i = 0; i < ixgbe->mcast_count; i++) {
3148 if (bcmp(multiaddr, &ixgbe->mcast_table[i],
3149 ETHERADDRL) == 0) {
3150 for (i++; i < ixgbe->mcast_count; i++) {
3151 ixgbe->mcast_table[i - 1] =
3152 ixgbe->mcast_table[i];
3153 }
3154 ixgbe->mcast_count--;
3155 break;
3156 }
3157 }
3158
3159 /*
3160 * Update the multicast table in the hardware
3161 */
3162 ixgbe_setup_multicst(ixgbe);
3163
3164 if (ixgbe_check_acc_handle(ixgbe->osdep.reg_handle) != DDI_FM_OK) {
3165 ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_DEGRADED);
3166 return (EIO);
3167 }
3168
3169 return (0);
3170 }
3171
3172 /*
3173 * ixgbe_setup_multicast - Setup multicast data structures.
3174 *
3175 * This routine initializes all of the multicast related structures
3176 * and save them in the hardware registers.
3177 */
3178 static void
ixgbe_setup_multicst(ixgbe_t * ixgbe)3179 ixgbe_setup_multicst(ixgbe_t *ixgbe)
3180 {
3181 uint8_t *mc_addr_list;
3182 uint32_t mc_addr_count;
3183 struct ixgbe_hw *hw = &ixgbe->hw;
3184
3185 ASSERT(mutex_owned(&ixgbe->gen_lock));
3186
3187 ASSERT(ixgbe->mcast_count <= MAX_NUM_MULTICAST_ADDRESSES);
3188
3189 mc_addr_list = (uint8_t *)ixgbe->mcast_table;
3190 mc_addr_count = ixgbe->mcast_count;
3191
3192 /*
3193 * Update the multicast addresses to the MTA registers
3194 */
3195 (void) ixgbe_update_mc_addr_list(hw, mc_addr_list, mc_addr_count,
3196 ixgbe_mc_table_itr, TRUE);
3197 }
3198
3199 /*
3200 * ixgbe_setup_vmdq_rss_conf - Configure vmdq and rss (number and mode).
3201 *
3202 * Configure the rx classification mode (vmdq & rss) and vmdq & rss numbers.
3203 * Different chipsets may have different allowed configuration of vmdq and rss.
3204 */
3205 static void
ixgbe_setup_vmdq_rss_conf(ixgbe_t * ixgbe)3206 ixgbe_setup_vmdq_rss_conf(ixgbe_t *ixgbe)
3207 {
3208 struct ixgbe_hw *hw = &ixgbe->hw;
3209 uint32_t ring_per_group;
3210
3211 switch (hw->mac.type) {
3212 case ixgbe_mac_82598EB:
3213 /*
3214 * 82598 supports the following combination:
3215 * vmdq no. x rss no.
3216 * [5..16] x 1
3217 * [1..4] x [1..16]
3218 * However 8 rss queue per pool (vmdq) is sufficient for
3219 * most cases.
3220 */
3221 ring_per_group = ixgbe->num_rx_rings / ixgbe->num_rx_groups;
3222 if (ixgbe->num_rx_groups > 4) {
3223 ixgbe->num_rx_rings = ixgbe->num_rx_groups;
3224 } else {
3225 ixgbe->num_rx_rings = ixgbe->num_rx_groups *
3226 min(8, ring_per_group);
3227 }
3228
3229 break;
3230
3231 case ixgbe_mac_82599EB:
3232 case ixgbe_mac_X540:
3233 case ixgbe_mac_X550:
3234 case ixgbe_mac_X550EM_x:
3235 /*
3236 * 82599 supports the following combination:
3237 * vmdq no. x rss no.
3238 * [33..64] x [1..2]
3239 * [2..32] x [1..4]
3240 * 1 x [1..16]
3241 * However 8 rss queue per pool (vmdq) is sufficient for
3242 * most cases.
3243 *
3244 * For now, treat X540 and X550 like the 82599.
3245 */
3246 ring_per_group = ixgbe->num_rx_rings / ixgbe->num_rx_groups;
3247 if (ixgbe->num_rx_groups == 1) {
3248 ixgbe->num_rx_rings = min(8, ring_per_group);
3249 } else if (ixgbe->num_rx_groups <= 32) {
3250 ixgbe->num_rx_rings = ixgbe->num_rx_groups *
3251 min(4, ring_per_group);
3252 } else if (ixgbe->num_rx_groups <= 64) {
3253 ixgbe->num_rx_rings = ixgbe->num_rx_groups *
3254 min(2, ring_per_group);
3255 }
3256 break;
3257
3258 default:
3259 break;
3260 }
3261
3262 ring_per_group = ixgbe->num_rx_rings / ixgbe->num_rx_groups;
3263
3264 if (ixgbe->num_rx_groups == 1 && ring_per_group == 1) {
3265 ixgbe->classify_mode = IXGBE_CLASSIFY_NONE;
3266 } else if (ixgbe->num_rx_groups != 1 && ring_per_group == 1) {
3267 ixgbe->classify_mode = IXGBE_CLASSIFY_VMDQ;
3268 } else if (ixgbe->num_rx_groups != 1 && ring_per_group != 1) {
3269 ixgbe->classify_mode = IXGBE_CLASSIFY_VMDQ_RSS;
3270 } else {
3271 ixgbe->classify_mode = IXGBE_CLASSIFY_RSS;
3272 }
3273
3274 IXGBE_DEBUGLOG_2(ixgbe, "rx group number:%d, rx ring number:%d",
3275 ixgbe->num_rx_groups, ixgbe->num_rx_rings);
3276 }
3277
3278 /*
3279 * ixgbe_get_conf - Get driver configurations set in driver.conf.
3280 *
3281 * This routine gets user-configured values out of the configuration
3282 * file ixgbe.conf.
3283 *
3284 * For each configurable value, there is a minimum, a maximum, and a
3285 * default.
3286 * If user does not configure a value, use the default.
3287 * If user configures below the minimum, use the minumum.
3288 * If user configures above the maximum, use the maxumum.
3289 */
3290 static void
ixgbe_get_conf(ixgbe_t * ixgbe)3291 ixgbe_get_conf(ixgbe_t *ixgbe)
3292 {
3293 struct ixgbe_hw *hw = &ixgbe->hw;
3294 uint32_t flow_control;
3295
3296 /*
3297 * ixgbe driver supports the following user configurations:
3298 *
3299 * Jumbo frame configuration:
3300 * default_mtu
3301 *
3302 * Ethernet flow control configuration:
3303 * flow_control
3304 *
3305 * Multiple rings configurations:
3306 * tx_queue_number
3307 * tx_ring_size
3308 * rx_queue_number
3309 * rx_ring_size
3310 *
3311 * Call ixgbe_get_prop() to get the value for a specific
3312 * configuration parameter.
3313 */
3314
3315 /*
3316 * Jumbo frame configuration - max_frame_size controls host buffer
3317 * allocation, so includes MTU, ethernet header, vlan tag and
3318 * frame check sequence.
3319 */
3320 ixgbe->default_mtu = ixgbe_get_prop(ixgbe, PROP_DEFAULT_MTU,
3321 MIN_MTU, ixgbe->capab->max_mtu, DEFAULT_MTU);
3322
3323 ixgbe->max_frame_size = ixgbe->default_mtu +
3324 sizeof (struct ether_vlan_header) + ETHERFCSL;
3325
3326 /*
3327 * Ethernet flow control configuration
3328 */
3329 flow_control = ixgbe_get_prop(ixgbe, PROP_FLOW_CONTROL,
3330 ixgbe_fc_none, 3, ixgbe_fc_none);
3331 if (flow_control == 3)
3332 flow_control = ixgbe_fc_default;
3333
3334 /*
3335 * fc.requested mode is what the user requests. After autoneg,
3336 * fc.current_mode will be the flow_control mode that was negotiated.
3337 */
3338 hw->fc.requested_mode = flow_control;
3339
3340 /*
3341 * Multiple rings configurations
3342 */
3343 ixgbe->num_tx_rings = ixgbe_get_prop(ixgbe, PROP_TX_QUEUE_NUM,
3344 ixgbe->capab->min_tx_que_num,
3345 ixgbe->capab->max_tx_que_num,
3346 ixgbe->capab->def_tx_que_num);
3347 ixgbe->tx_ring_size = ixgbe_get_prop(ixgbe, PROP_TX_RING_SIZE,
3348 MIN_TX_RING_SIZE, MAX_TX_RING_SIZE, DEFAULT_TX_RING_SIZE);
3349
3350 ixgbe->num_rx_rings = ixgbe_get_prop(ixgbe, PROP_RX_QUEUE_NUM,
3351 ixgbe->capab->min_rx_que_num,
3352 ixgbe->capab->max_rx_que_num,
3353 ixgbe->capab->def_rx_que_num);
3354 ixgbe->rx_ring_size = ixgbe_get_prop(ixgbe, PROP_RX_RING_SIZE,
3355 MIN_RX_RING_SIZE, MAX_RX_RING_SIZE, DEFAULT_RX_RING_SIZE);
3356
3357 /*
3358 * Multiple groups configuration
3359 */
3360 ixgbe->num_rx_groups = ixgbe_get_prop(ixgbe, PROP_RX_GROUP_NUM,
3361 ixgbe->capab->min_rx_grp_num, ixgbe->capab->max_rx_grp_num,
3362 ixgbe->capab->def_rx_grp_num);
3363
3364 ixgbe->mr_enable = ixgbe_get_prop(ixgbe, PROP_MR_ENABLE,
3365 0, 1, DEFAULT_MR_ENABLE);
3366
3367 if (ixgbe->mr_enable == B_FALSE) {
3368 ixgbe->num_tx_rings = 1;
3369 ixgbe->num_rx_rings = 1;
3370 ixgbe->num_rx_groups = 1;
3371 ixgbe->classify_mode = IXGBE_CLASSIFY_NONE;
3372 } else {
3373 ixgbe->num_rx_rings = ixgbe->num_rx_groups *
3374 max(ixgbe->num_rx_rings / ixgbe->num_rx_groups, 1);
3375 /*
3376 * The combination of num_rx_rings and num_rx_groups
3377 * may be not supported by h/w. We need to adjust
3378 * them to appropriate values.
3379 */
3380 ixgbe_setup_vmdq_rss_conf(ixgbe);
3381 }
3382
3383 /*
3384 * Tunable used to force an interrupt type. The only use is
3385 * for testing of the lesser interrupt types.
3386 * 0 = don't force interrupt type
3387 * 1 = force interrupt type MSI-X
3388 * 2 = force interrupt type MSI
3389 * 3 = force interrupt type Legacy
3390 */
3391 ixgbe->intr_force = ixgbe_get_prop(ixgbe, PROP_INTR_FORCE,
3392 IXGBE_INTR_NONE, IXGBE_INTR_LEGACY, IXGBE_INTR_NONE);
3393
3394 ixgbe->tx_hcksum_enable = ixgbe_get_prop(ixgbe, PROP_TX_HCKSUM_ENABLE,
3395 0, 1, DEFAULT_TX_HCKSUM_ENABLE);
3396 ixgbe->rx_hcksum_enable = ixgbe_get_prop(ixgbe, PROP_RX_HCKSUM_ENABLE,
3397 0, 1, DEFAULT_RX_HCKSUM_ENABLE);
3398 ixgbe->lso_enable = ixgbe_get_prop(ixgbe, PROP_LSO_ENABLE,
3399 0, 1, DEFAULT_LSO_ENABLE);
3400 ixgbe->lro_enable = ixgbe_get_prop(ixgbe, PROP_LRO_ENABLE,
3401 0, 1, DEFAULT_LRO_ENABLE);
3402 ixgbe->tx_head_wb_enable = ixgbe_get_prop(ixgbe, PROP_TX_HEAD_WB_ENABLE,
3403 0, 1, DEFAULT_TX_HEAD_WB_ENABLE);
3404 ixgbe->relax_order_enable = ixgbe_get_prop(ixgbe,
3405 PROP_RELAX_ORDER_ENABLE, 0, 1, DEFAULT_RELAX_ORDER_ENABLE);
3406
3407 /* Head Write Back not recommended for 82599, X540 and X550 */
3408 if (hw->mac.type == ixgbe_mac_82599EB ||
3409 hw->mac.type == ixgbe_mac_X540 ||
3410 hw->mac.type == ixgbe_mac_X550 ||
3411 hw->mac.type == ixgbe_mac_X550EM_x) {
3412 ixgbe->tx_head_wb_enable = B_FALSE;
3413 }
3414
3415 /*
3416 * ixgbe LSO needs the tx h/w checksum support.
3417 * LSO will be disabled if tx h/w checksum is not
3418 * enabled.
3419 */
3420 if (ixgbe->tx_hcksum_enable == B_FALSE) {
3421 ixgbe->lso_enable = B_FALSE;
3422 }
3423
3424 /*
3425 * ixgbe LRO needs the rx h/w checksum support.
3426 * LRO will be disabled if rx h/w checksum is not
3427 * enabled.
3428 */
3429 if (ixgbe->rx_hcksum_enable == B_FALSE) {
3430 ixgbe->lro_enable = B_FALSE;
3431 }
3432
3433 /*
3434 * ixgbe LRO only supported by 82599, X540 and X550
3435 */
3436 if (hw->mac.type == ixgbe_mac_82598EB) {
3437 ixgbe->lro_enable = B_FALSE;
3438 }
3439 ixgbe->tx_copy_thresh = ixgbe_get_prop(ixgbe, PROP_TX_COPY_THRESHOLD,
3440 MIN_TX_COPY_THRESHOLD, MAX_TX_COPY_THRESHOLD,
3441 DEFAULT_TX_COPY_THRESHOLD);
3442 ixgbe->tx_recycle_thresh = ixgbe_get_prop(ixgbe,
3443 PROP_TX_RECYCLE_THRESHOLD, MIN_TX_RECYCLE_THRESHOLD,
3444 MAX_TX_RECYCLE_THRESHOLD, DEFAULT_TX_RECYCLE_THRESHOLD);
3445 ixgbe->tx_overload_thresh = ixgbe_get_prop(ixgbe,
3446 PROP_TX_OVERLOAD_THRESHOLD, MIN_TX_OVERLOAD_THRESHOLD,
3447 MAX_TX_OVERLOAD_THRESHOLD, DEFAULT_TX_OVERLOAD_THRESHOLD);
3448 ixgbe->tx_resched_thresh = ixgbe_get_prop(ixgbe,
3449 PROP_TX_RESCHED_THRESHOLD, MIN_TX_RESCHED_THRESHOLD,
3450 MAX_TX_RESCHED_THRESHOLD, DEFAULT_TX_RESCHED_THRESHOLD);
3451
3452 ixgbe->rx_copy_thresh = ixgbe_get_prop(ixgbe, PROP_RX_COPY_THRESHOLD,
3453 MIN_RX_COPY_THRESHOLD, MAX_RX_COPY_THRESHOLD,
3454 DEFAULT_RX_COPY_THRESHOLD);
3455 ixgbe->rx_limit_per_intr = ixgbe_get_prop(ixgbe, PROP_RX_LIMIT_PER_INTR,
3456 MIN_RX_LIMIT_PER_INTR, MAX_RX_LIMIT_PER_INTR,
3457 DEFAULT_RX_LIMIT_PER_INTR);
3458
3459 ixgbe->intr_throttling[0] = ixgbe_get_prop(ixgbe, PROP_INTR_THROTTLING,
3460 ixgbe->capab->min_intr_throttle,
3461 ixgbe->capab->max_intr_throttle,
3462 ixgbe->capab->def_intr_throttle);
3463 /*
3464 * 82599, X540 and X550 require the interrupt throttling rate is
3465 * a multiple of 8. This is enforced by the register definiton.
3466 */
3467 if (hw->mac.type == ixgbe_mac_82599EB ||
3468 hw->mac.type == ixgbe_mac_X540 ||
3469 hw->mac.type == ixgbe_mac_X550 ||
3470 hw->mac.type == ixgbe_mac_X550EM_x)
3471 ixgbe->intr_throttling[0] = ixgbe->intr_throttling[0] & 0xFF8;
3472
3473 hw->allow_unsupported_sfp = ixgbe_get_prop(ixgbe,
3474 PROP_ALLOW_UNSUPPORTED_SFP, 0, 1, DEFAULT_ALLOW_UNSUPPORTED_SFP);
3475 }
3476
3477 static void
ixgbe_init_params(ixgbe_t * ixgbe)3478 ixgbe_init_params(ixgbe_t *ixgbe)
3479 {
3480 struct ixgbe_hw *hw = &ixgbe->hw;
3481 ixgbe_link_speed speeds_supported = 0;
3482 boolean_t negotiate;
3483
3484 /*
3485 * Get a list of speeds the adapter supports. If the hw struct hasn't
3486 * been populated with this information yet, retrieve it from the
3487 * adapter and save it to our own variable.
3488 *
3489 * On certain adapters, such as ones which use SFPs, the contents of
3490 * hw->phy.speeds_supported (and hw->phy.autoneg_advertised) are not
3491 * updated, so we must rely on calling ixgbe_get_link_capabilities()
3492 * in order to ascertain the speeds which we are capable of supporting,
3493 * and in the case of SFP-equipped adapters, which speed we are
3494 * advertising. If ixgbe_get_link_capabilities() fails for some reason,
3495 * we'll go with a default list of speeds as a last resort.
3496 */
3497 speeds_supported = hw->phy.speeds_supported;
3498
3499 if (speeds_supported == 0) {
3500 if (ixgbe_get_link_capabilities(hw, &speeds_supported,
3501 &negotiate) != IXGBE_SUCCESS) {
3502 if (hw->mac.type == ixgbe_mac_82598EB) {
3503 speeds_supported =
3504 IXGBE_LINK_SPEED_82598_AUTONEG;
3505 } else {
3506 speeds_supported =
3507 IXGBE_LINK_SPEED_82599_AUTONEG;
3508 }
3509 }
3510 }
3511 ixgbe->speeds_supported = speeds_supported;
3512
3513 /*
3514 * By default, all supported speeds are enabled and advertised.
3515 */
3516 if (speeds_supported & IXGBE_LINK_SPEED_10GB_FULL) {
3517 ixgbe->param_en_10000fdx_cap = 1;
3518 ixgbe->param_adv_10000fdx_cap = 1;
3519 } else {
3520 ixgbe->param_en_10000fdx_cap = 0;
3521 ixgbe->param_adv_10000fdx_cap = 0;
3522 }
3523
3524 if (speeds_supported & IXGBE_LINK_SPEED_5GB_FULL) {
3525 ixgbe->param_en_5000fdx_cap = 1;
3526 ixgbe->param_adv_5000fdx_cap = 1;
3527 } else {
3528 ixgbe->param_en_5000fdx_cap = 0;
3529 ixgbe->param_adv_5000fdx_cap = 0;
3530 }
3531
3532 if (speeds_supported & IXGBE_LINK_SPEED_2_5GB_FULL) {
3533 ixgbe->param_en_2500fdx_cap = 1;
3534 ixgbe->param_adv_2500fdx_cap = 1;
3535 } else {
3536 ixgbe->param_en_2500fdx_cap = 0;
3537 ixgbe->param_adv_2500fdx_cap = 0;
3538 }
3539
3540 if (speeds_supported & IXGBE_LINK_SPEED_1GB_FULL) {
3541 ixgbe->param_en_1000fdx_cap = 1;
3542 ixgbe->param_adv_1000fdx_cap = 1;
3543 } else {
3544 ixgbe->param_en_1000fdx_cap = 0;
3545 ixgbe->param_adv_1000fdx_cap = 0;
3546 }
3547
3548 if (speeds_supported & IXGBE_LINK_SPEED_100_FULL) {
3549 ixgbe->param_en_100fdx_cap = 1;
3550 ixgbe->param_adv_100fdx_cap = 1;
3551 } else {
3552 ixgbe->param_en_100fdx_cap = 0;
3553 ixgbe->param_adv_100fdx_cap = 0;
3554 }
3555
3556 ixgbe->param_pause_cap = 1;
3557 ixgbe->param_asym_pause_cap = 1;
3558 ixgbe->param_rem_fault = 0;
3559
3560 ixgbe->param_adv_autoneg_cap = 1;
3561 ixgbe->param_adv_pause_cap = 1;
3562 ixgbe->param_adv_asym_pause_cap = 1;
3563 ixgbe->param_adv_rem_fault = 0;
3564
3565 ixgbe->param_lp_10000fdx_cap = 0;
3566 ixgbe->param_lp_5000fdx_cap = 0;
3567 ixgbe->param_lp_2500fdx_cap = 0;
3568 ixgbe->param_lp_1000fdx_cap = 0;
3569 ixgbe->param_lp_100fdx_cap = 0;
3570 ixgbe->param_lp_autoneg_cap = 0;
3571 ixgbe->param_lp_pause_cap = 0;
3572 ixgbe->param_lp_asym_pause_cap = 0;
3573 ixgbe->param_lp_rem_fault = 0;
3574 }
3575
3576 /*
3577 * ixgbe_get_prop - Get a property value out of the configuration file
3578 * ixgbe.conf.
3579 *
3580 * Caller provides the name of the property, a default value, a minimum
3581 * value, and a maximum value.
3582 *
3583 * Return configured value of the property, with default, minimum and
3584 * maximum properly applied.
3585 */
3586 static int
ixgbe_get_prop(ixgbe_t * ixgbe,char * propname,int minval,int maxval,int defval)3587 ixgbe_get_prop(ixgbe_t *ixgbe,
3588 char *propname, /* name of the property */
3589 int minval, /* minimum acceptable value */
3590 int maxval, /* maximim acceptable value */
3591 int defval) /* default value */
3592 {
3593 int value;
3594
3595 /*
3596 * Call ddi_prop_get_int() to read the conf settings
3597 */
3598 value = ddi_prop_get_int(DDI_DEV_T_ANY, ixgbe->dip,
3599 DDI_PROP_DONTPASS, propname, defval);
3600 if (value > maxval)
3601 value = maxval;
3602
3603 if (value < minval)
3604 value = minval;
3605
3606 return (value);
3607 }
3608
3609 /*
3610 * ixgbe_driver_setup_link - Using the link properties to setup the link.
3611 */
3612 int
ixgbe_driver_setup_link(ixgbe_t * ixgbe,boolean_t setup_hw)3613 ixgbe_driver_setup_link(ixgbe_t *ixgbe, boolean_t setup_hw)
3614 {
3615 struct ixgbe_hw *hw = &ixgbe->hw;
3616 ixgbe_link_speed advertised = 0;
3617
3618 /*
3619 * Assemble a list of enabled speeds to auto-negotiate with.
3620 */
3621 if (ixgbe->param_en_10000fdx_cap == 1)
3622 advertised |= IXGBE_LINK_SPEED_10GB_FULL;
3623
3624 if (ixgbe->param_en_5000fdx_cap == 1)
3625 advertised |= IXGBE_LINK_SPEED_5GB_FULL;
3626
3627 if (ixgbe->param_en_2500fdx_cap == 1)
3628 advertised |= IXGBE_LINK_SPEED_2_5GB_FULL;
3629
3630 if (ixgbe->param_en_1000fdx_cap == 1)
3631 advertised |= IXGBE_LINK_SPEED_1GB_FULL;
3632
3633 if (ixgbe->param_en_100fdx_cap == 1)
3634 advertised |= IXGBE_LINK_SPEED_100_FULL;
3635
3636 /*
3637 * As a last resort, autoneg with a default list of speeds.
3638 */
3639 if (ixgbe->param_adv_autoneg_cap == 1 && advertised == 0) {
3640 ixgbe_notice(ixgbe, "Invalid link settings. Setting link "
3641 "to autonegotiate with full capabilities.");
3642
3643 if (hw->mac.type == ixgbe_mac_82598EB)
3644 advertised = IXGBE_LINK_SPEED_82598_AUTONEG;
3645 else
3646 advertised = IXGBE_LINK_SPEED_82599_AUTONEG;
3647 }
3648
3649 if (setup_hw) {
3650 if (ixgbe_setup_link(&ixgbe->hw, advertised,
3651 ixgbe->param_adv_autoneg_cap) != IXGBE_SUCCESS) {
3652 ixgbe_notice(ixgbe, "Setup link failed on this "
3653 "device.");
3654 return (IXGBE_FAILURE);
3655 }
3656 }
3657
3658 return (IXGBE_SUCCESS);
3659 }
3660
3661 /*
3662 * ixgbe_driver_link_check - Link status processing.
3663 *
3664 * This function can be called in both kernel context and interrupt context
3665 */
3666 static void
ixgbe_driver_link_check(ixgbe_t * ixgbe)3667 ixgbe_driver_link_check(ixgbe_t *ixgbe)
3668 {
3669 struct ixgbe_hw *hw = &ixgbe->hw;
3670 ixgbe_link_speed speed = IXGBE_LINK_SPEED_UNKNOWN;
3671 boolean_t link_up = B_FALSE;
3672 boolean_t link_changed = B_FALSE;
3673
3674 ASSERT(mutex_owned(&ixgbe->gen_lock));
3675
3676 (void) ixgbe_check_link(hw, &speed, &link_up, B_FALSE);
3677 if (link_up) {
3678 ixgbe->link_check_complete = B_TRUE;
3679
3680 /* Link is up, enable flow control settings */
3681 (void) ixgbe_fc_enable(hw);
3682
3683 /*
3684 * The Link is up, check whether it was marked as down earlier
3685 */
3686 if (ixgbe->link_state != LINK_STATE_UP) {
3687 switch (speed) {
3688 case IXGBE_LINK_SPEED_10GB_FULL:
3689 ixgbe->link_speed = SPEED_10GB;
3690 break;
3691 case IXGBE_LINK_SPEED_5GB_FULL:
3692 ixgbe->link_speed = SPEED_5GB;
3693 break;
3694 case IXGBE_LINK_SPEED_2_5GB_FULL:
3695 ixgbe->link_speed = SPEED_2_5GB;
3696 break;
3697 case IXGBE_LINK_SPEED_1GB_FULL:
3698 ixgbe->link_speed = SPEED_1GB;
3699 break;
3700 case IXGBE_LINK_SPEED_100_FULL:
3701 ixgbe->link_speed = SPEED_100;
3702 }
3703 ixgbe->link_duplex = LINK_DUPLEX_FULL;
3704 ixgbe->link_state = LINK_STATE_UP;
3705 link_changed = B_TRUE;
3706 }
3707 } else {
3708 if (ixgbe->link_check_complete == B_TRUE ||
3709 (ixgbe->link_check_complete == B_FALSE &&
3710 gethrtime() >= ixgbe->link_check_hrtime)) {
3711 /*
3712 * The link is really down
3713 */
3714 ixgbe->link_check_complete = B_TRUE;
3715
3716 if (ixgbe->link_state != LINK_STATE_DOWN) {
3717 ixgbe->link_speed = 0;
3718 ixgbe->link_duplex = LINK_DUPLEX_UNKNOWN;
3719 ixgbe->link_state = LINK_STATE_DOWN;
3720 link_changed = B_TRUE;
3721 }
3722 }
3723 }
3724
3725 /*
3726 * If we are in an interrupt context, need to re-enable the
3727 * interrupt, which was automasked
3728 */
3729 if (servicing_interrupt() != 0) {
3730 ixgbe->eims |= IXGBE_EICR_LSC;
3731 IXGBE_WRITE_REG(hw, IXGBE_EIMS, ixgbe->eims);
3732 }
3733
3734 if (link_changed) {
3735 mac_link_update(ixgbe->mac_hdl, ixgbe->link_state);
3736 }
3737 }
3738
3739 /*
3740 * ixgbe_sfp_check - sfp module processing done in taskq only for 82599.
3741 */
3742 static void
ixgbe_sfp_check(void * arg)3743 ixgbe_sfp_check(void *arg)
3744 {
3745 ixgbe_t *ixgbe = (ixgbe_t *)arg;
3746 uint32_t eicr = ixgbe->eicr;
3747 struct ixgbe_hw *hw = &ixgbe->hw;
3748
3749 mutex_enter(&ixgbe->gen_lock);
3750 (void) hw->phy.ops.identify_sfp(hw);
3751 if (eicr & IXGBE_EICR_GPI_SDP1_BY_MAC(hw)) {
3752 /* clear the interrupt */
3753 IXGBE_WRITE_REG(hw, IXGBE_EICR, IXGBE_EICR_GPI_SDP1_BY_MAC(hw));
3754
3755 /* if link up, do multispeed fiber setup */
3756 (void) ixgbe_setup_link(hw, IXGBE_LINK_SPEED_82599_AUTONEG,
3757 B_TRUE);
3758 ixgbe_driver_link_check(ixgbe);
3759 ixgbe_get_hw_state(ixgbe);
3760 } else if (eicr & IXGBE_EICR_GPI_SDP2_BY_MAC(hw)) {
3761 /* clear the interrupt */
3762 IXGBE_WRITE_REG(hw, IXGBE_EICR, IXGBE_EICR_GPI_SDP2_BY_MAC(hw));
3763
3764 /* if link up, do sfp module setup */
3765 (void) hw->mac.ops.setup_sfp(hw);
3766
3767 /* do multispeed fiber setup */
3768 (void) ixgbe_setup_link(hw, IXGBE_LINK_SPEED_82599_AUTONEG,
3769 B_TRUE);
3770 ixgbe_driver_link_check(ixgbe);
3771 ixgbe_get_hw_state(ixgbe);
3772 }
3773 mutex_exit(&ixgbe->gen_lock);
3774
3775 /*
3776 * We need to fully re-check the link later.
3777 */
3778 ixgbe->link_check_complete = B_FALSE;
3779 ixgbe->link_check_hrtime = gethrtime() +
3780 (IXGBE_LINK_UP_TIME * 100000000ULL);
3781 }
3782
3783 /*
3784 * ixgbe_overtemp_check - overtemp module processing done in taskq
3785 *
3786 * This routine will only be called on adapters with temperature sensor.
3787 * The indication of over-temperature can be either SDP0 interrupt or the link
3788 * status change interrupt.
3789 */
3790 static void
ixgbe_overtemp_check(void * arg)3791 ixgbe_overtemp_check(void *arg)
3792 {
3793 ixgbe_t *ixgbe = (ixgbe_t *)arg;
3794 struct ixgbe_hw *hw = &ixgbe->hw;
3795 uint32_t eicr = ixgbe->eicr;
3796 ixgbe_link_speed speed;
3797 boolean_t link_up;
3798
3799 mutex_enter(&ixgbe->gen_lock);
3800
3801 /* make sure we know current state of link */
3802 (void) ixgbe_check_link(hw, &speed, &link_up, B_FALSE);
3803
3804 /* check over-temp condition */
3805 if (((eicr & IXGBE_EICR_GPI_SDP0_BY_MAC(hw)) && (!link_up)) ||
3806 (eicr & IXGBE_EICR_LSC)) {
3807 if (hw->phy.ops.check_overtemp(hw) == IXGBE_ERR_OVERTEMP) {
3808 atomic_or_32(&ixgbe->ixgbe_state, IXGBE_OVERTEMP);
3809
3810 /*
3811 * Disable the adapter interrupts
3812 */
3813 ixgbe_disable_adapter_interrupts(ixgbe);
3814
3815 /*
3816 * Disable Rx/Tx units
3817 */
3818 (void) ixgbe_stop_adapter(hw);
3819
3820 ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_LOST);
3821 ixgbe_error(ixgbe,
3822 "Problem: Network adapter has been stopped "
3823 "because it has overheated");
3824 ixgbe_error(ixgbe,
3825 "Action: Restart the computer. "
3826 "If the problem persists, power off the system "
3827 "and replace the adapter");
3828 }
3829 }
3830
3831 /* write to clear the interrupt */
3832 IXGBE_WRITE_REG(hw, IXGBE_EICR, eicr);
3833
3834 mutex_exit(&ixgbe->gen_lock);
3835 }
3836
3837 /*
3838 * ixgbe_phy_check - taskq to process interrupts from an external PHY
3839 *
3840 * This routine will only be called on adapters with external PHYs
3841 * (such as X550) that may be trying to raise our attention to some event.
3842 * Currently, this is limited to claiming PHY overtemperature and link status
3843 * change (LSC) events, however this may expand to include other things in
3844 * future adapters.
3845 */
3846 static void
ixgbe_phy_check(void * arg)3847 ixgbe_phy_check(void *arg)
3848 {
3849 ixgbe_t *ixgbe = (ixgbe_t *)arg;
3850 struct ixgbe_hw *hw = &ixgbe->hw;
3851 int rv;
3852
3853 mutex_enter(&ixgbe->gen_lock);
3854
3855 /*
3856 * X550 baseT PHY overtemp and LSC events are handled here.
3857 *
3858 * If an overtemp event occurs, it will be reflected in the
3859 * return value of phy.ops.handle_lasi() and the common code will
3860 * automatically power off the baseT PHY. This is our cue to trigger
3861 * an FMA event.
3862 *
3863 * If a link status change event occurs, phy.ops.handle_lasi() will
3864 * automatically initiate a link setup between the integrated KR PHY
3865 * and the external X557 PHY to ensure that the link speed between
3866 * them matches the link speed of the baseT link.
3867 */
3868 rv = ixgbe_handle_lasi(hw);
3869
3870 if (rv == IXGBE_ERR_OVERTEMP) {
3871 atomic_or_32(&ixgbe->ixgbe_state, IXGBE_OVERTEMP);
3872
3873 /*
3874 * Disable the adapter interrupts
3875 */
3876 ixgbe_disable_adapter_interrupts(ixgbe);
3877
3878 /*
3879 * Disable Rx/Tx units
3880 */
3881 (void) ixgbe_stop_adapter(hw);
3882
3883 ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_LOST);
3884 ixgbe_error(ixgbe,
3885 "Problem: Network adapter has been stopped due to a "
3886 "overtemperature event being detected.");
3887 ixgbe_error(ixgbe,
3888 "Action: Shut down or restart the computer. If the issue "
3889 "persists, please take action in accordance with the "
3890 "recommendations from your system vendor.");
3891 }
3892
3893 mutex_exit(&ixgbe->gen_lock);
3894 }
3895
3896 /*
3897 * ixgbe_link_timer - timer for link status detection
3898 */
3899 static void
ixgbe_link_timer(void * arg)3900 ixgbe_link_timer(void *arg)
3901 {
3902 ixgbe_t *ixgbe = (ixgbe_t *)arg;
3903
3904 mutex_enter(&ixgbe->gen_lock);
3905 ixgbe_driver_link_check(ixgbe);
3906 mutex_exit(&ixgbe->gen_lock);
3907 }
3908
3909 /*
3910 * ixgbe_local_timer - Driver watchdog function.
3911 *
3912 * This function will handle the transmit stall check and other routines.
3913 */
3914 static void
ixgbe_local_timer(void * arg)3915 ixgbe_local_timer(void *arg)
3916 {
3917 ixgbe_t *ixgbe = (ixgbe_t *)arg;
3918
3919 if (ixgbe->ixgbe_state & IXGBE_OVERTEMP)
3920 goto out;
3921
3922 if (ixgbe->ixgbe_state & IXGBE_ERROR) {
3923 ixgbe->reset_count++;
3924 if (ixgbe_reset(ixgbe) == IXGBE_SUCCESS)
3925 ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_RESTORED);
3926 goto out;
3927 }
3928
3929 if (ixgbe_stall_check(ixgbe)) {
3930 atomic_or_32(&ixgbe->ixgbe_state, IXGBE_STALL);
3931 ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_DEGRADED);
3932
3933 ixgbe->reset_count++;
3934 if (ixgbe_reset(ixgbe) == IXGBE_SUCCESS)
3935 ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_RESTORED);
3936 }
3937
3938 out:
3939 ixgbe_restart_watchdog_timer(ixgbe);
3940 }
3941
3942 /*
3943 * ixgbe_stall_check - Check for transmit stall.
3944 *
3945 * This function checks if the adapter is stalled (in transmit).
3946 *
3947 * It is called each time the watchdog timeout is invoked.
3948 * If the transmit descriptor reclaim continuously fails,
3949 * the watchdog value will increment by 1. If the watchdog
3950 * value exceeds the threshold, the ixgbe is assumed to
3951 * have stalled and need to be reset.
3952 */
3953 static boolean_t
ixgbe_stall_check(ixgbe_t * ixgbe)3954 ixgbe_stall_check(ixgbe_t *ixgbe)
3955 {
3956 ixgbe_tx_ring_t *tx_ring;
3957 boolean_t result;
3958 int i;
3959
3960 if (ixgbe->link_state != LINK_STATE_UP)
3961 return (B_FALSE);
3962
3963 /*
3964 * If any tx ring is stalled, we'll reset the chipset
3965 */
3966 result = B_FALSE;
3967 for (i = 0; i < ixgbe->num_tx_rings; i++) {
3968 tx_ring = &ixgbe->tx_rings[i];
3969 if (tx_ring->tbd_free <= ixgbe->tx_recycle_thresh) {
3970 tx_ring->tx_recycle(tx_ring);
3971 }
3972
3973 if (tx_ring->recycle_fail > 0)
3974 tx_ring->stall_watchdog++;
3975 else
3976 tx_ring->stall_watchdog = 0;
3977
3978 if (tx_ring->stall_watchdog >= STALL_WATCHDOG_TIMEOUT) {
3979 result = B_TRUE;
3980 break;
3981 }
3982 }
3983
3984 if (result) {
3985 tx_ring->stall_watchdog = 0;
3986 tx_ring->recycle_fail = 0;
3987 }
3988
3989 return (result);
3990 }
3991
3992
3993 /*
3994 * is_valid_mac_addr - Check if the mac address is valid.
3995 */
3996 static boolean_t
is_valid_mac_addr(uint8_t * mac_addr)3997 is_valid_mac_addr(uint8_t *mac_addr)
3998 {
3999 const uint8_t addr_test1[6] = { 0, 0, 0, 0, 0, 0 };
4000 const uint8_t addr_test2[6] =
4001 { 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF };
4002
4003 if (!(bcmp(addr_test1, mac_addr, ETHERADDRL)) ||
4004 !(bcmp(addr_test2, mac_addr, ETHERADDRL)))
4005 return (B_FALSE);
4006
4007 return (B_TRUE);
4008 }
4009
4010 static boolean_t
ixgbe_find_mac_address(ixgbe_t * ixgbe)4011 ixgbe_find_mac_address(ixgbe_t *ixgbe)
4012 {
4013 #ifdef __sparc
4014 struct ixgbe_hw *hw = &ixgbe->hw;
4015 uchar_t *bytes;
4016 struct ether_addr sysaddr;
4017 uint_t nelts;
4018 int err;
4019 boolean_t found = B_FALSE;
4020
4021 /*
4022 * The "vendor's factory-set address" may already have
4023 * been extracted from the chip, but if the property
4024 * "local-mac-address" is set we use that instead.
4025 *
4026 * We check whether it looks like an array of 6
4027 * bytes (which it should, if OBP set it). If we can't
4028 * make sense of it this way, we'll ignore it.
4029 */
4030 err = ddi_prop_lookup_byte_array(DDI_DEV_T_ANY, ixgbe->dip,
4031 DDI_PROP_DONTPASS, "local-mac-address", &bytes, &nelts);
4032 if (err == DDI_PROP_SUCCESS) {
4033 if (nelts == ETHERADDRL) {
4034 while (nelts--)
4035 hw->mac.addr[nelts] = bytes[nelts];
4036 found = B_TRUE;
4037 }
4038 ddi_prop_free(bytes);
4039 }
4040
4041 /*
4042 * Look up the OBP property "local-mac-address?". If the user has set
4043 * 'local-mac-address? = false', use "the system address" instead.
4044 */
4045 if (ddi_prop_lookup_byte_array(DDI_DEV_T_ANY, ixgbe->dip, 0,
4046 "local-mac-address?", &bytes, &nelts) == DDI_PROP_SUCCESS) {
4047 if (strncmp("false", (caddr_t)bytes, (size_t)nelts) == 0) {
4048 if (localetheraddr(NULL, &sysaddr) != 0) {
4049 bcopy(&sysaddr, hw->mac.addr, ETHERADDRL);
4050 found = B_TRUE;
4051 }
4052 }
4053 ddi_prop_free(bytes);
4054 }
4055
4056 /*
4057 * Finally(!), if there's a valid "mac-address" property (created
4058 * if we netbooted from this interface), we must use this instead
4059 * of any of the above to ensure that the NFS/install server doesn't
4060 * get confused by the address changing as illumos takes over!
4061 */
4062 err = ddi_prop_lookup_byte_array(DDI_DEV_T_ANY, ixgbe->dip,
4063 DDI_PROP_DONTPASS, "mac-address", &bytes, &nelts);
4064 if (err == DDI_PROP_SUCCESS) {
4065 if (nelts == ETHERADDRL) {
4066 while (nelts--)
4067 hw->mac.addr[nelts] = bytes[nelts];
4068 found = B_TRUE;
4069 }
4070 ddi_prop_free(bytes);
4071 }
4072
4073 if (found) {
4074 bcopy(hw->mac.addr, hw->mac.perm_addr, ETHERADDRL);
4075 return (B_TRUE);
4076 }
4077 #else
4078 _NOTE(ARGUNUSED(ixgbe));
4079 #endif
4080
4081 return (B_TRUE);
4082 }
4083
4084 #pragma inline(ixgbe_arm_watchdog_timer)
4085 static void
ixgbe_arm_watchdog_timer(ixgbe_t * ixgbe)4086 ixgbe_arm_watchdog_timer(ixgbe_t *ixgbe)
4087 {
4088 /*
4089 * Fire a watchdog timer
4090 */
4091 ixgbe->watchdog_tid =
4092 timeout(ixgbe_local_timer,
4093 (void *)ixgbe, 1 * drv_usectohz(1000000));
4094
4095 }
4096
4097 /*
4098 * ixgbe_enable_watchdog_timer - Enable and start the driver watchdog timer.
4099 */
4100 void
ixgbe_enable_watchdog_timer(ixgbe_t * ixgbe)4101 ixgbe_enable_watchdog_timer(ixgbe_t *ixgbe)
4102 {
4103 mutex_enter(&ixgbe->watchdog_lock);
4104
4105 if (!ixgbe->watchdog_enable) {
4106 ixgbe->watchdog_enable = B_TRUE;
4107 ixgbe->watchdog_start = B_TRUE;
4108 ixgbe_arm_watchdog_timer(ixgbe);
4109 }
4110
4111 mutex_exit(&ixgbe->watchdog_lock);
4112 }
4113
4114 /*
4115 * ixgbe_disable_watchdog_timer - Disable and stop the driver watchdog timer.
4116 */
4117 void
ixgbe_disable_watchdog_timer(ixgbe_t * ixgbe)4118 ixgbe_disable_watchdog_timer(ixgbe_t *ixgbe)
4119 {
4120 timeout_id_t tid;
4121
4122 mutex_enter(&ixgbe->watchdog_lock);
4123
4124 ixgbe->watchdog_enable = B_FALSE;
4125 ixgbe->watchdog_start = B_FALSE;
4126 tid = ixgbe->watchdog_tid;
4127 ixgbe->watchdog_tid = 0;
4128
4129 mutex_exit(&ixgbe->watchdog_lock);
4130
4131 if (tid != 0)
4132 (void) untimeout(tid);
4133 }
4134
4135 /*
4136 * ixgbe_start_watchdog_timer - Start the driver watchdog timer.
4137 */
4138 void
ixgbe_start_watchdog_timer(ixgbe_t * ixgbe)4139 ixgbe_start_watchdog_timer(ixgbe_t *ixgbe)
4140 {
4141 mutex_enter(&ixgbe->watchdog_lock);
4142
4143 if (ixgbe->watchdog_enable) {
4144 if (!ixgbe->watchdog_start) {
4145 ixgbe->watchdog_start = B_TRUE;
4146 ixgbe_arm_watchdog_timer(ixgbe);
4147 }
4148 }
4149
4150 mutex_exit(&ixgbe->watchdog_lock);
4151 }
4152
4153 /*
4154 * ixgbe_restart_watchdog_timer - Restart the driver watchdog timer.
4155 */
4156 static void
ixgbe_restart_watchdog_timer(ixgbe_t * ixgbe)4157 ixgbe_restart_watchdog_timer(ixgbe_t *ixgbe)
4158 {
4159 mutex_enter(&ixgbe->watchdog_lock);
4160
4161 if (ixgbe->watchdog_start)
4162 ixgbe_arm_watchdog_timer(ixgbe);
4163
4164 mutex_exit(&ixgbe->watchdog_lock);
4165 }
4166
4167 /*
4168 * ixgbe_stop_watchdog_timer - Stop the driver watchdog timer.
4169 */
4170 void
ixgbe_stop_watchdog_timer(ixgbe_t * ixgbe)4171 ixgbe_stop_watchdog_timer(ixgbe_t *ixgbe)
4172 {
4173 timeout_id_t tid;
4174
4175 mutex_enter(&ixgbe->watchdog_lock);
4176
4177 ixgbe->watchdog_start = B_FALSE;
4178 tid = ixgbe->watchdog_tid;
4179 ixgbe->watchdog_tid = 0;
4180
4181 mutex_exit(&ixgbe->watchdog_lock);
4182
4183 if (tid != 0)
4184 (void) untimeout(tid);
4185 }
4186
4187 /*
4188 * ixgbe_disable_adapter_interrupts - Disable all adapter interrupts.
4189 */
4190 static void
ixgbe_disable_adapter_interrupts(ixgbe_t * ixgbe)4191 ixgbe_disable_adapter_interrupts(ixgbe_t *ixgbe)
4192 {
4193 struct ixgbe_hw *hw = &ixgbe->hw;
4194
4195 /*
4196 * mask all interrupts off
4197 */
4198 IXGBE_WRITE_REG(hw, IXGBE_EIMC, 0xffffffff);
4199
4200 /*
4201 * for MSI-X, also disable autoclear
4202 */
4203 if (ixgbe->intr_type == DDI_INTR_TYPE_MSIX) {
4204 IXGBE_WRITE_REG(hw, IXGBE_EIAC, 0x0);
4205 }
4206
4207 IXGBE_WRITE_FLUSH(hw);
4208 }
4209
4210 /*
4211 * ixgbe_enable_adapter_interrupts - Enable all hardware interrupts.
4212 */
4213 static void
ixgbe_enable_adapter_interrupts(ixgbe_t * ixgbe)4214 ixgbe_enable_adapter_interrupts(ixgbe_t *ixgbe)
4215 {
4216 struct ixgbe_hw *hw = &ixgbe->hw;
4217 uint32_t eiac, eiam;
4218 uint32_t gpie = IXGBE_READ_REG(hw, IXGBE_GPIE);
4219
4220 /* interrupt types to enable */
4221 ixgbe->eims = IXGBE_EIMS_ENABLE_MASK; /* shared code default */
4222 ixgbe->eims &= ~IXGBE_EIMS_TCP_TIMER; /* minus tcp timer */
4223 ixgbe->eims |= ixgbe->capab->other_intr; /* "other" interrupt types */
4224
4225 /* enable automask on "other" causes that this adapter can generate */
4226 eiam = ixgbe->capab->other_intr;
4227
4228 /*
4229 * msi-x mode
4230 */
4231 if (ixgbe->intr_type == DDI_INTR_TYPE_MSIX) {
4232 /* enable autoclear but not on bits 29:20 */
4233 eiac = (ixgbe->eims & ~IXGBE_OTHER_INTR);
4234
4235 /* general purpose interrupt enable */
4236 gpie |= (IXGBE_GPIE_MSIX_MODE
4237 | IXGBE_GPIE_PBA_SUPPORT
4238 | IXGBE_GPIE_OCD
4239 | IXGBE_GPIE_EIAME);
4240 /*
4241 * non-msi-x mode
4242 */
4243 } else {
4244
4245 /* disable autoclear, leave gpie at default */
4246 eiac = 0;
4247
4248 /*
4249 * General purpose interrupt enable.
4250 * For 82599, X540 and X550, extended interrupt
4251 * automask enable only in MSI or MSI-X mode
4252 */
4253 if ((hw->mac.type == ixgbe_mac_82598EB) ||
4254 (ixgbe->intr_type == DDI_INTR_TYPE_MSI)) {
4255 gpie |= IXGBE_GPIE_EIAME;
4256 }
4257 }
4258
4259 /* Enable specific "other" interrupt types */
4260 switch (hw->mac.type) {
4261 case ixgbe_mac_82598EB:
4262 gpie |= ixgbe->capab->other_gpie;
4263 break;
4264
4265 case ixgbe_mac_82599EB:
4266 case ixgbe_mac_X540:
4267 case ixgbe_mac_X550:
4268 case ixgbe_mac_X550EM_x:
4269 gpie |= ixgbe->capab->other_gpie;
4270
4271 /* Enable RSC Delay 8us when LRO enabled */
4272 if (ixgbe->lro_enable) {
4273 gpie |= (1 << IXGBE_GPIE_RSC_DELAY_SHIFT);
4274 }
4275 break;
4276
4277 default:
4278 break;
4279 }
4280
4281 /* write to interrupt control registers */
4282 IXGBE_WRITE_REG(hw, IXGBE_EIMS, ixgbe->eims);
4283 IXGBE_WRITE_REG(hw, IXGBE_EIAC, eiac);
4284 IXGBE_WRITE_REG(hw, IXGBE_EIAM, eiam);
4285 IXGBE_WRITE_REG(hw, IXGBE_GPIE, gpie);
4286 IXGBE_WRITE_FLUSH(hw);
4287 }
4288
4289 /*
4290 * ixgbe_loopback_ioctl - Loopback support.
4291 */
4292 enum ioc_reply
ixgbe_loopback_ioctl(ixgbe_t * ixgbe,struct iocblk * iocp,mblk_t * mp)4293 ixgbe_loopback_ioctl(ixgbe_t *ixgbe, struct iocblk *iocp, mblk_t *mp)
4294 {
4295 lb_info_sz_t *lbsp;
4296 lb_property_t *lbpp;
4297 uint32_t *lbmp;
4298 uint32_t size;
4299 uint32_t value;
4300
4301 if (mp->b_cont == NULL)
4302 return (IOC_INVAL);
4303
4304 switch (iocp->ioc_cmd) {
4305 default:
4306 return (IOC_INVAL);
4307
4308 case LB_GET_INFO_SIZE:
4309 size = sizeof (lb_info_sz_t);
4310 if (iocp->ioc_count != size)
4311 return (IOC_INVAL);
4312
4313 value = sizeof (lb_normal);
4314 value += sizeof (lb_mac);
4315 value += sizeof (lb_external);
4316
4317 lbsp = (lb_info_sz_t *)(uintptr_t)mp->b_cont->b_rptr;
4318 *lbsp = value;
4319 break;
4320
4321 case LB_GET_INFO:
4322 value = sizeof (lb_normal);
4323 value += sizeof (lb_mac);
4324 value += sizeof (lb_external);
4325
4326 size = value;
4327 if (iocp->ioc_count != size)
4328 return (IOC_INVAL);
4329
4330 value = 0;
4331 lbpp = (lb_property_t *)(uintptr_t)mp->b_cont->b_rptr;
4332
4333 lbpp[value++] = lb_normal;
4334 lbpp[value++] = lb_mac;
4335 lbpp[value++] = lb_external;
4336 break;
4337
4338 case LB_GET_MODE:
4339 size = sizeof (uint32_t);
4340 if (iocp->ioc_count != size)
4341 return (IOC_INVAL);
4342
4343 lbmp = (uint32_t *)(uintptr_t)mp->b_cont->b_rptr;
4344 *lbmp = ixgbe->loopback_mode;
4345 break;
4346
4347 case LB_SET_MODE:
4348 size = 0;
4349 if (iocp->ioc_count != sizeof (uint32_t))
4350 return (IOC_INVAL);
4351
4352 lbmp = (uint32_t *)(uintptr_t)mp->b_cont->b_rptr;
4353 if (!ixgbe_set_loopback_mode(ixgbe, *lbmp))
4354 return (IOC_INVAL);
4355 break;
4356 }
4357
4358 iocp->ioc_count = size;
4359 iocp->ioc_error = 0;
4360
4361 if (ixgbe_check_acc_handle(ixgbe->osdep.reg_handle) != DDI_FM_OK) {
4362 ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_DEGRADED);
4363 return (IOC_INVAL);
4364 }
4365
4366 return (IOC_REPLY);
4367 }
4368
4369 /*
4370 * ixgbe_set_loopback_mode - Setup loopback based on the loopback mode.
4371 */
4372 static boolean_t
ixgbe_set_loopback_mode(ixgbe_t * ixgbe,uint32_t mode)4373 ixgbe_set_loopback_mode(ixgbe_t *ixgbe, uint32_t mode)
4374 {
4375 if (mode == ixgbe->loopback_mode)
4376 return (B_TRUE);
4377
4378 ixgbe->loopback_mode = mode;
4379
4380 if (mode == IXGBE_LB_NONE) {
4381 /*
4382 * Reset the chip
4383 */
4384 (void) ixgbe_reset(ixgbe);
4385 return (B_TRUE);
4386 }
4387
4388 mutex_enter(&ixgbe->gen_lock);
4389
4390 switch (mode) {
4391 default:
4392 mutex_exit(&ixgbe->gen_lock);
4393 return (B_FALSE);
4394
4395 case IXGBE_LB_EXTERNAL:
4396 break;
4397
4398 case IXGBE_LB_INTERNAL_MAC:
4399 ixgbe_set_internal_mac_loopback(ixgbe);
4400 break;
4401 }
4402
4403 mutex_exit(&ixgbe->gen_lock);
4404
4405 return (B_TRUE);
4406 }
4407
4408 /*
4409 * ixgbe_set_internal_mac_loopback - Set the internal MAC loopback mode.
4410 */
4411 static void
ixgbe_set_internal_mac_loopback(ixgbe_t * ixgbe)4412 ixgbe_set_internal_mac_loopback(ixgbe_t *ixgbe)
4413 {
4414 struct ixgbe_hw *hw;
4415 uint32_t reg;
4416 uint8_t atlas;
4417
4418 hw = &ixgbe->hw;
4419
4420 /*
4421 * Setup MAC loopback
4422 */
4423 reg = IXGBE_READ_REG(&ixgbe->hw, IXGBE_HLREG0);
4424 reg |= IXGBE_HLREG0_LPBK;
4425 IXGBE_WRITE_REG(&ixgbe->hw, IXGBE_HLREG0, reg);
4426
4427 reg = IXGBE_READ_REG(&ixgbe->hw, IXGBE_AUTOC);
4428 reg &= ~IXGBE_AUTOC_LMS_MASK;
4429 IXGBE_WRITE_REG(&ixgbe->hw, IXGBE_AUTOC, reg);
4430
4431 /*
4432 * Disable Atlas Tx lanes to keep packets in loopback and not on wire
4433 */
4434 switch (hw->mac.type) {
4435 case ixgbe_mac_82598EB:
4436 (void) ixgbe_read_analog_reg8(&ixgbe->hw, IXGBE_ATLAS_PDN_LPBK,
4437 &atlas);
4438 atlas |= IXGBE_ATLAS_PDN_TX_REG_EN;
4439 (void) ixgbe_write_analog_reg8(&ixgbe->hw, IXGBE_ATLAS_PDN_LPBK,
4440 atlas);
4441
4442 (void) ixgbe_read_analog_reg8(&ixgbe->hw, IXGBE_ATLAS_PDN_10G,
4443 &atlas);
4444 atlas |= IXGBE_ATLAS_PDN_TX_10G_QL_ALL;
4445 (void) ixgbe_write_analog_reg8(&ixgbe->hw, IXGBE_ATLAS_PDN_10G,
4446 atlas);
4447
4448 (void) ixgbe_read_analog_reg8(&ixgbe->hw, IXGBE_ATLAS_PDN_1G,
4449 &atlas);
4450 atlas |= IXGBE_ATLAS_PDN_TX_1G_QL_ALL;
4451 (void) ixgbe_write_analog_reg8(&ixgbe->hw, IXGBE_ATLAS_PDN_1G,
4452 atlas);
4453
4454 (void) ixgbe_read_analog_reg8(&ixgbe->hw, IXGBE_ATLAS_PDN_AN,
4455 &atlas);
4456 atlas |= IXGBE_ATLAS_PDN_TX_AN_QL_ALL;
4457 (void) ixgbe_write_analog_reg8(&ixgbe->hw, IXGBE_ATLAS_PDN_AN,
4458 atlas);
4459 break;
4460
4461 case ixgbe_mac_82599EB:
4462 case ixgbe_mac_X540:
4463 case ixgbe_mac_X550:
4464 case ixgbe_mac_X550EM_x:
4465 reg = IXGBE_READ_REG(&ixgbe->hw, IXGBE_AUTOC);
4466 reg |= (IXGBE_AUTOC_FLU |
4467 IXGBE_AUTOC_10G_KX4);
4468 IXGBE_WRITE_REG(&ixgbe->hw, IXGBE_AUTOC, reg);
4469
4470 (void) ixgbe_setup_link(&ixgbe->hw, IXGBE_LINK_SPEED_10GB_FULL,
4471 B_FALSE);
4472 break;
4473
4474 default:
4475 break;
4476 }
4477 }
4478
4479 #pragma inline(ixgbe_intr_rx_work)
4480 /*
4481 * ixgbe_intr_rx_work - RX processing of ISR.
4482 */
4483 static void
ixgbe_intr_rx_work(ixgbe_rx_ring_t * rx_ring)4484 ixgbe_intr_rx_work(ixgbe_rx_ring_t *rx_ring)
4485 {
4486 mblk_t *mp;
4487
4488 mutex_enter(&rx_ring->rx_lock);
4489
4490 mp = ixgbe_ring_rx(rx_ring, IXGBE_POLL_NULL);
4491 mutex_exit(&rx_ring->rx_lock);
4492
4493 if (mp != NULL)
4494 mac_rx_ring(rx_ring->ixgbe->mac_hdl, rx_ring->ring_handle, mp,
4495 rx_ring->ring_gen_num);
4496 }
4497
4498 #pragma inline(ixgbe_intr_tx_work)
4499 /*
4500 * ixgbe_intr_tx_work - TX processing of ISR.
4501 */
4502 static void
ixgbe_intr_tx_work(ixgbe_tx_ring_t * tx_ring)4503 ixgbe_intr_tx_work(ixgbe_tx_ring_t *tx_ring)
4504 {
4505 ixgbe_t *ixgbe = tx_ring->ixgbe;
4506
4507 /*
4508 * Recycle the tx descriptors
4509 */
4510 tx_ring->tx_recycle(tx_ring);
4511
4512 /*
4513 * Schedule the re-transmit
4514 */
4515 if (tx_ring->reschedule &&
4516 (tx_ring->tbd_free >= ixgbe->tx_resched_thresh)) {
4517 tx_ring->reschedule = B_FALSE;
4518 mac_tx_ring_update(tx_ring->ixgbe->mac_hdl,
4519 tx_ring->ring_handle);
4520 tx_ring->stat_reschedule++;
4521 }
4522 }
4523
4524 #pragma inline(ixgbe_intr_other_work)
4525 /*
4526 * ixgbe_intr_other_work - Process interrupt types other than tx/rx
4527 */
4528 static void
ixgbe_intr_other_work(ixgbe_t * ixgbe,uint32_t eicr)4529 ixgbe_intr_other_work(ixgbe_t *ixgbe, uint32_t eicr)
4530 {
4531 struct ixgbe_hw *hw = &ixgbe->hw;
4532
4533 ASSERT(mutex_owned(&ixgbe->gen_lock));
4534
4535 /*
4536 * handle link status change
4537 */
4538 if (eicr & IXGBE_EICR_LSC) {
4539 ixgbe_driver_link_check(ixgbe);
4540 ixgbe_get_hw_state(ixgbe);
4541 }
4542
4543 /*
4544 * check for fan failure on adapters with fans
4545 */
4546 if ((ixgbe->capab->flags & IXGBE_FLAG_FAN_FAIL_CAPABLE) &&
4547 (eicr & IXGBE_EICR_GPI_SDP1)) {
4548 atomic_or_32(&ixgbe->ixgbe_state, IXGBE_OVERTEMP);
4549
4550 /*
4551 * Disable the adapter interrupts
4552 */
4553 ixgbe_disable_adapter_interrupts(ixgbe);
4554
4555 /*
4556 * Disable Rx/Tx units
4557 */
4558 (void) ixgbe_stop_adapter(&ixgbe->hw);
4559
4560 ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_LOST);
4561 ixgbe_error(ixgbe,
4562 "Problem: Network adapter has been stopped "
4563 "because the fan has stopped.\n");
4564 ixgbe_error(ixgbe,
4565 "Action: Replace the adapter.\n");
4566
4567 /* re-enable the interrupt, which was automasked */
4568 ixgbe->eims |= IXGBE_EICR_GPI_SDP1;
4569 }
4570
4571 /*
4572 * Do SFP check for adapters with hot-plug capability
4573 */
4574 if ((ixgbe->capab->flags & IXGBE_FLAG_SFP_PLUG_CAPABLE) &&
4575 ((eicr & IXGBE_EICR_GPI_SDP1_BY_MAC(hw)) ||
4576 (eicr & IXGBE_EICR_GPI_SDP2_BY_MAC(hw)))) {
4577 ixgbe->eicr = eicr;
4578 if ((ddi_taskq_dispatch(ixgbe->sfp_taskq,
4579 ixgbe_sfp_check, (void *)ixgbe,
4580 DDI_NOSLEEP)) != DDI_SUCCESS) {
4581 ixgbe_log(ixgbe, "No memory available to dispatch "
4582 "taskq for SFP check");
4583 }
4584 }
4585
4586 /*
4587 * Do over-temperature check for adapters with temp sensor
4588 */
4589 if ((ixgbe->capab->flags & IXGBE_FLAG_TEMP_SENSOR_CAPABLE) &&
4590 ((eicr & IXGBE_EICR_GPI_SDP0_BY_MAC(hw)) ||
4591 (eicr & IXGBE_EICR_LSC))) {
4592 ixgbe->eicr = eicr;
4593 if ((ddi_taskq_dispatch(ixgbe->overtemp_taskq,
4594 ixgbe_overtemp_check, (void *)ixgbe,
4595 DDI_NOSLEEP)) != DDI_SUCCESS) {
4596 ixgbe_log(ixgbe, "No memory available to dispatch "
4597 "taskq for overtemp check");
4598 }
4599 }
4600
4601 /*
4602 * Process an external PHY interrupt
4603 */
4604 if (hw->device_id == IXGBE_DEV_ID_X550EM_X_10G_T &&
4605 (eicr & IXGBE_EICR_GPI_SDP0_X540)) {
4606 ixgbe->eicr = eicr;
4607 if ((ddi_taskq_dispatch(ixgbe->phy_taskq,
4608 ixgbe_phy_check, (void *)ixgbe,
4609 DDI_NOSLEEP)) != DDI_SUCCESS) {
4610 ixgbe_log(ixgbe, "No memory available to dispatch "
4611 "taskq for PHY check");
4612 }
4613 }
4614 }
4615
4616 /*
4617 * ixgbe_intr_legacy - Interrupt handler for legacy interrupts.
4618 */
4619 static uint_t
ixgbe_intr_legacy(void * arg1,void * arg2)4620 ixgbe_intr_legacy(void *arg1, void *arg2)
4621 {
4622 ixgbe_t *ixgbe = (ixgbe_t *)arg1;
4623 struct ixgbe_hw *hw = &ixgbe->hw;
4624 ixgbe_tx_ring_t *tx_ring;
4625 ixgbe_rx_ring_t *rx_ring;
4626 uint32_t eicr;
4627 mblk_t *mp;
4628 boolean_t tx_reschedule;
4629 uint_t result;
4630
4631 _NOTE(ARGUNUSED(arg2));
4632
4633 mutex_enter(&ixgbe->gen_lock);
4634 if (ixgbe->ixgbe_state & IXGBE_SUSPENDED) {
4635 mutex_exit(&ixgbe->gen_lock);
4636 return (DDI_INTR_UNCLAIMED);
4637 }
4638
4639 mp = NULL;
4640 tx_reschedule = B_FALSE;
4641
4642 /*
4643 * Any bit set in eicr: claim this interrupt
4644 */
4645 eicr = IXGBE_READ_REG(hw, IXGBE_EICR);
4646
4647 if (ixgbe_check_acc_handle(ixgbe->osdep.reg_handle) != DDI_FM_OK) {
4648 mutex_exit(&ixgbe->gen_lock);
4649 ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_DEGRADED);
4650 atomic_or_32(&ixgbe->ixgbe_state, IXGBE_ERROR);
4651 return (DDI_INTR_CLAIMED);
4652 }
4653
4654 if (eicr) {
4655 /*
4656 * For legacy interrupt, we have only one interrupt,
4657 * so we have only one rx ring and one tx ring enabled.
4658 */
4659 ASSERT(ixgbe->num_rx_rings == 1);
4660 ASSERT(ixgbe->num_tx_rings == 1);
4661
4662 /*
4663 * For legacy interrupt, rx rings[0] will use RTxQ[0].
4664 */
4665 if (eicr & 0x1) {
4666 ixgbe->eimc |= IXGBE_EICR_RTX_QUEUE;
4667 IXGBE_WRITE_REG(hw, IXGBE_EIMC, ixgbe->eimc);
4668 ixgbe->eims |= IXGBE_EICR_RTX_QUEUE;
4669 /*
4670 * Clean the rx descriptors
4671 */
4672 rx_ring = &ixgbe->rx_rings[0];
4673 mp = ixgbe_ring_rx(rx_ring, IXGBE_POLL_NULL);
4674 }
4675
4676 /*
4677 * For legacy interrupt, tx rings[0] will use RTxQ[1].
4678 */
4679 if (eicr & 0x2) {
4680 /*
4681 * Recycle the tx descriptors
4682 */
4683 tx_ring = &ixgbe->tx_rings[0];
4684 tx_ring->tx_recycle(tx_ring);
4685
4686 /*
4687 * Schedule the re-transmit
4688 */
4689 tx_reschedule = (tx_ring->reschedule &&
4690 (tx_ring->tbd_free >= ixgbe->tx_resched_thresh));
4691 }
4692
4693 /* any interrupt type other than tx/rx */
4694 if (eicr & ixgbe->capab->other_intr) {
4695 switch (hw->mac.type) {
4696 case ixgbe_mac_82598EB:
4697 ixgbe->eims &= ~(eicr & IXGBE_OTHER_INTR);
4698 break;
4699
4700 case ixgbe_mac_82599EB:
4701 case ixgbe_mac_X540:
4702 case ixgbe_mac_X550:
4703 case ixgbe_mac_X550EM_x:
4704 ixgbe->eimc = IXGBE_82599_OTHER_INTR;
4705 IXGBE_WRITE_REG(hw, IXGBE_EIMC, ixgbe->eimc);
4706 break;
4707
4708 default:
4709 break;
4710 }
4711 ixgbe_intr_other_work(ixgbe, eicr);
4712 ixgbe->eims &= ~(eicr & IXGBE_OTHER_INTR);
4713 }
4714
4715 mutex_exit(&ixgbe->gen_lock);
4716
4717 result = DDI_INTR_CLAIMED;
4718 } else {
4719 mutex_exit(&ixgbe->gen_lock);
4720
4721 /*
4722 * No interrupt cause bits set: don't claim this interrupt.
4723 */
4724 result = DDI_INTR_UNCLAIMED;
4725 }
4726
4727 /* re-enable the interrupts which were automasked */
4728 IXGBE_WRITE_REG(hw, IXGBE_EIMS, ixgbe->eims);
4729
4730 /*
4731 * Do the following work outside of the gen_lock
4732 */
4733 if (mp != NULL) {
4734 mac_rx_ring(rx_ring->ixgbe->mac_hdl, rx_ring->ring_handle, mp,
4735 rx_ring->ring_gen_num);
4736 }
4737
4738 if (tx_reschedule) {
4739 tx_ring->reschedule = B_FALSE;
4740 mac_tx_ring_update(ixgbe->mac_hdl, tx_ring->ring_handle);
4741 tx_ring->stat_reschedule++;
4742 }
4743
4744 return (result);
4745 }
4746
4747 /*
4748 * ixgbe_intr_msi - Interrupt handler for MSI.
4749 */
4750 static uint_t
ixgbe_intr_msi(void * arg1,void * arg2)4751 ixgbe_intr_msi(void *arg1, void *arg2)
4752 {
4753 ixgbe_t *ixgbe = (ixgbe_t *)arg1;
4754 struct ixgbe_hw *hw = &ixgbe->hw;
4755 uint32_t eicr;
4756
4757 _NOTE(ARGUNUSED(arg2));
4758
4759 eicr = IXGBE_READ_REG(hw, IXGBE_EICR);
4760
4761 if (ixgbe_check_acc_handle(ixgbe->osdep.reg_handle) != DDI_FM_OK) {
4762 ddi_fm_service_impact(ixgbe->dip, DDI_SERVICE_DEGRADED);
4763 atomic_or_32(&ixgbe->ixgbe_state, IXGBE_ERROR);
4764 return (DDI_INTR_CLAIMED);
4765 }
4766
4767 /*
4768 * For MSI interrupt, we have only one vector,
4769 * so we have only one rx ring and one tx ring enabled.
4770 */
4771 ASSERT(ixgbe->num_rx_rings == 1);
4772 ASSERT(ixgbe->num_tx_rings == 1);
4773
4774 /*
4775 * For MSI interrupt, rx rings[0] will use RTxQ[0].
4776 */
4777 if (eicr & 0x1) {
4778 ixgbe_intr_rx_work(&ixgbe->rx_rings[0]);
4779 }
4780
4781 /*
4782 * For MSI interrupt, tx rings[0] will use RTxQ[1].
4783 */
4784 if (eicr & 0x2) {
4785 ixgbe_intr_tx_work(&ixgbe->tx_rings[0]);
4786 }
4787
4788 /* any interrupt type other than tx/rx */
4789 if (eicr & ixgbe->capab->other_intr) {
4790 mutex_enter(&ixgbe->gen_lock);
4791 switch (hw->mac.type) {
4792 case ixgbe_mac_82598EB:
4793 ixgbe->eims &= ~(eicr & IXGBE_OTHER_INTR);
4794 break;
4795
4796 case ixgbe_mac_82599EB:
4797 case ixgbe_mac_X540:
4798 case ixgbe_mac_X550:
4799 case ixgbe_mac_X550EM_x:
4800 ixgbe->eimc = IXGBE_82599_OTHER_INTR;
4801 IXGBE_WRITE_REG(hw, IXGBE_EIMC, ixgbe->eimc);
4802 break;
4803
4804 default:
4805 break;
4806 }
4807 ixgbe_intr_other_work(ixgbe, eicr);
4808 ixgbe->eims &= ~(eicr & IXGBE_OTHER_INTR);
4809 mutex_exit(&ixgbe->gen_lock);
4810 }
4811
4812 /* re-enable the interrupts which were automasked */
4813 IXGBE_WRITE_REG(hw, IXGBE_EIMS, ixgbe->eims);
4814
4815 return (DDI_INTR_CLAIMED);
4816 }
4817
4818 /*
4819 * ixgbe_intr_msix - Interrupt handler for MSI-X.
4820 */
4821 static uint_t
ixgbe_intr_msix(void * arg1,void * arg2)4822 ixgbe_intr_msix(void *arg1, void *arg2)
4823 {
4824 ixgbe_intr_vector_t *vect = (ixgbe_intr_vector_t *)arg1;
4825 ixgbe_t *ixgbe = vect->ixgbe;
4826 struct ixgbe_hw *hw = &ixgbe->hw;
4827 uint32_t eicr;
4828 int r_idx = 0;
4829
4830 _NOTE(ARGUNUSED(arg2));
4831
4832 /*
4833 * Clean each rx ring that has its bit set in the map
4834 */
4835 r_idx = bt_getlowbit(vect->rx_map, 0, (ixgbe->num_rx_rings - 1));
4836 while (r_idx >= 0) {
4837 ixgbe_intr_rx_work(&ixgbe->rx_rings[r_idx]);
4838 r_idx = bt_getlowbit(vect->rx_map, (r_idx + 1),
4839 (ixgbe->num_rx_rings - 1));
4840 }
4841
4842 /*
4843 * Clean each tx ring that has its bit set in the map
4844 */
4845 r_idx = bt_getlowbit(vect->tx_map, 0, (ixgbe->num_tx_rings - 1));
4846 while (r_idx >= 0) {
4847 ixgbe_intr_tx_work(&ixgbe->tx_rings[r_idx]);
4848 r_idx = bt_getlowbit(vect->tx_map, (r_idx + 1),
4849 (ixgbe->num_tx_rings - 1));
4850 }
4851
4852
4853 /*
4854 * Clean other interrupt (link change) that has its bit set in the map
4855 */
4856 if (BT_TEST(vect->other_map, 0) == 1) {
4857 eicr = IXGBE_READ_REG(hw, IXGBE_EICR);
4858
4859 if (ixgbe_check_acc_handle(ixgbe->osdep.reg_handle) !=
4860 DDI_FM_OK) {
4861 ddi_fm_service_impact(ixgbe->dip,
4862 DDI_SERVICE_DEGRADED);
4863 atomic_or_32(&ixgbe->ixgbe_state, IXGBE_ERROR);
4864 return (DDI_INTR_CLAIMED);
4865 }
4866
4867 /*
4868 * Check "other" cause bits: any interrupt type other than tx/rx
4869 */
4870 if (eicr & ixgbe->capab->other_intr) {
4871 mutex_enter(&ixgbe->gen_lock);
4872 switch (hw->mac.type) {
4873 case ixgbe_mac_82598EB:
4874 ixgbe->eims &= ~(eicr & IXGBE_OTHER_INTR);
4875 ixgbe_intr_other_work(ixgbe, eicr);
4876 break;
4877
4878 case ixgbe_mac_82599EB:
4879 case ixgbe_mac_X540:
4880 case ixgbe_mac_X550:
4881 case ixgbe_mac_X550EM_x:
4882 ixgbe->eims |= IXGBE_EICR_RTX_QUEUE;
4883 ixgbe_intr_other_work(ixgbe, eicr);
4884 break;
4885
4886 default:
4887 break;
4888 }
4889 mutex_exit(&ixgbe->gen_lock);
4890 }
4891
4892 /* re-enable the interrupts which were automasked */
4893 IXGBE_WRITE_REG(hw, IXGBE_EIMS, ixgbe->eims);
4894 }
4895
4896 return (DDI_INTR_CLAIMED);
4897 }
4898
4899 /*
4900 * ixgbe_alloc_intrs - Allocate interrupts for the driver.
4901 *
4902 * Normal sequence is to try MSI-X; if not sucessful, try MSI;
4903 * if not successful, try Legacy.
4904 * ixgbe->intr_force can be used to force sequence to start with
4905 * any of the 3 types.
4906 * If MSI-X is not used, number of tx/rx rings is forced to 1.
4907 */
4908 static int
ixgbe_alloc_intrs(ixgbe_t * ixgbe)4909 ixgbe_alloc_intrs(ixgbe_t *ixgbe)
4910 {
4911 dev_info_t *devinfo;
4912 int intr_types;
4913 int rc;
4914
4915 devinfo = ixgbe->dip;
4916
4917 /*
4918 * Get supported interrupt types
4919 */
4920 rc = ddi_intr_get_supported_types(devinfo, &intr_types);
4921
4922 if (rc != DDI_SUCCESS) {
4923 ixgbe_log(ixgbe,
4924 "Get supported interrupt types failed: %d", rc);
4925 return (IXGBE_FAILURE);
4926 }
4927 IXGBE_DEBUGLOG_1(ixgbe, "Supported interrupt types: %x", intr_types);
4928
4929 ixgbe->intr_type = 0;
4930
4931 /*
4932 * Install MSI-X interrupts
4933 */
4934 if ((intr_types & DDI_INTR_TYPE_MSIX) &&
4935 (ixgbe->intr_force <= IXGBE_INTR_MSIX)) {
4936 rc = ixgbe_alloc_intr_handles(ixgbe, DDI_INTR_TYPE_MSIX);
4937 if (rc == IXGBE_SUCCESS)
4938 return (IXGBE_SUCCESS);
4939
4940 ixgbe_log(ixgbe,
4941 "Allocate MSI-X failed, trying MSI interrupts...");
4942 }
4943
4944 /*
4945 * MSI-X not used, force rings and groups to 1
4946 */
4947 ixgbe->num_rx_rings = 1;
4948 ixgbe->num_rx_groups = 1;
4949 ixgbe->num_tx_rings = 1;
4950 ixgbe->classify_mode = IXGBE_CLASSIFY_NONE;
4951 ixgbe_log(ixgbe,
4952 "MSI-X not used, force rings and groups number to 1");
4953
4954 /*
4955 * Install MSI interrupts
4956 */
4957 if ((intr_types & DDI_INTR_TYPE_MSI) &&
4958 (ixgbe->intr_force <= IXGBE_INTR_MSI)) {
4959 rc = ixgbe_alloc_intr_handles(ixgbe, DDI_INTR_TYPE_MSI);
4960 if (rc == IXGBE_SUCCESS)
4961 return (IXGBE_SUCCESS);
4962
4963 ixgbe_log(ixgbe,
4964 "Allocate MSI failed, trying Legacy interrupts...");
4965 }
4966
4967 /*
4968 * Install legacy interrupts
4969 */
4970 if (intr_types & DDI_INTR_TYPE_FIXED) {
4971 /*
4972 * Disallow legacy interrupts for X550. X550 has a silicon
4973 * bug which prevents Shared Legacy interrupts from working.
4974 * For details, please reference:
4975 *
4976 * Intel Ethernet Controller X550 Specification Update rev. 2.1
4977 * May 2016, erratum 22: PCIe Interrupt Status Bit
4978 */
4979 if (ixgbe->hw.mac.type == ixgbe_mac_X550 ||
4980 ixgbe->hw.mac.type == ixgbe_mac_X550EM_x ||
4981 ixgbe->hw.mac.type == ixgbe_mac_X550_vf ||
4982 ixgbe->hw.mac.type == ixgbe_mac_X550EM_x_vf) {
4983 ixgbe_log(ixgbe,
4984 "Legacy interrupts are not supported on this "
4985 "adapter. Please use MSI or MSI-X instead.");
4986 return (IXGBE_FAILURE);
4987 }
4988 rc = ixgbe_alloc_intr_handles(ixgbe, DDI_INTR_TYPE_FIXED);
4989 if (rc == IXGBE_SUCCESS)
4990 return (IXGBE_SUCCESS);
4991
4992 ixgbe_log(ixgbe,
4993 "Allocate Legacy interrupts failed");
4994 }
4995
4996 /*
4997 * If none of the 3 types succeeded, return failure
4998 */
4999 return (IXGBE_FAILURE);
5000 }
5001
5002 /*
5003 * ixgbe_alloc_intr_handles - Allocate interrupt handles.
5004 *
5005 * For legacy and MSI, only 1 handle is needed. For MSI-X,
5006 * if fewer than 2 handles are available, return failure.
5007 * Upon success, this maps the vectors to rx and tx rings for
5008 * interrupts.
5009 */
5010 static int
ixgbe_alloc_intr_handles(ixgbe_t * ixgbe,int intr_type)5011 ixgbe_alloc_intr_handles(ixgbe_t *ixgbe, int intr_type)
5012 {
5013 dev_info_t *devinfo;
5014 int request, count, actual;
5015 int minimum;
5016 int rc;
5017 uint32_t ring_per_group;
5018
5019 devinfo = ixgbe->dip;
5020
5021 switch (intr_type) {
5022 case DDI_INTR_TYPE_FIXED:
5023 request = 1; /* Request 1 legacy interrupt handle */
5024 minimum = 1;
5025 IXGBE_DEBUGLOG_0(ixgbe, "interrupt type: legacy");
5026 break;
5027
5028 case DDI_INTR_TYPE_MSI:
5029 request = 1; /* Request 1 MSI interrupt handle */
5030 minimum = 1;
5031 IXGBE_DEBUGLOG_0(ixgbe, "interrupt type: MSI");
5032 break;
5033
5034 case DDI_INTR_TYPE_MSIX:
5035 /*
5036 * Best number of vectors for the adapter is
5037 * (# rx rings + # tx rings), however we will
5038 * limit the request number.
5039 */
5040 request = min(16, ixgbe->num_rx_rings + ixgbe->num_tx_rings);
5041 if (request > ixgbe->capab->max_ring_vect)
5042 request = ixgbe->capab->max_ring_vect;
5043 minimum = 1;
5044 IXGBE_DEBUGLOG_0(ixgbe, "interrupt type: MSI-X");
5045 break;
5046
5047 default:
5048 ixgbe_log(ixgbe,
5049 "invalid call to ixgbe_alloc_intr_handles(): %d\n",
5050 intr_type);
5051 return (IXGBE_FAILURE);
5052 }
5053 IXGBE_DEBUGLOG_2(ixgbe, "interrupt handles requested: %d minimum: %d",
5054 request, minimum);
5055
5056 /*
5057 * Get number of supported interrupts
5058 */
5059 rc = ddi_intr_get_nintrs(devinfo, intr_type, &count);
5060 if ((rc != DDI_SUCCESS) || (count < minimum)) {
5061 ixgbe_log(ixgbe,
5062 "Get interrupt number failed. Return: %d, count: %d",
5063 rc, count);
5064 return (IXGBE_FAILURE);
5065 }
5066 IXGBE_DEBUGLOG_1(ixgbe, "interrupts supported: %d", count);
5067
5068 actual = 0;
5069 ixgbe->intr_cnt = 0;
5070 ixgbe->intr_cnt_max = 0;
5071 ixgbe->intr_cnt_min = 0;
5072
5073 /*
5074 * Allocate an array of interrupt handles
5075 */
5076 ixgbe->intr_size = request * sizeof (ddi_intr_handle_t);
5077 ixgbe->htable = kmem_alloc(ixgbe->intr_size, KM_SLEEP);
5078
5079 rc = ddi_intr_alloc(devinfo, ixgbe->htable, intr_type, 0,
5080 request, &actual, DDI_INTR_ALLOC_NORMAL);
5081 if (rc != DDI_SUCCESS) {
5082 ixgbe_log(ixgbe, "Allocate interrupts failed. "
5083 "return: %d, request: %d, actual: %d",
5084 rc, request, actual);
5085 goto alloc_handle_fail;
5086 }
5087 IXGBE_DEBUGLOG_1(ixgbe, "interrupts actually allocated: %d", actual);
5088
5089 /*
5090 * upper/lower limit of interrupts
5091 */
5092 ixgbe->intr_cnt = actual;
5093 ixgbe->intr_cnt_max = request;
5094 ixgbe->intr_cnt_min = minimum;
5095
5096 /*
5097 * rss number per group should not exceed the rx interrupt number,
5098 * else need to adjust rx ring number.
5099 */
5100 ring_per_group = ixgbe->num_rx_rings / ixgbe->num_rx_groups;
5101 ASSERT((ixgbe->num_rx_rings % ixgbe->num_rx_groups) == 0);
5102 if (actual < ring_per_group) {
5103 ixgbe->num_rx_rings = ixgbe->num_rx_groups * actual;
5104 ixgbe_setup_vmdq_rss_conf(ixgbe);
5105 }
5106
5107 /*
5108 * Now we know the actual number of vectors. Here we map the vector
5109 * to other, rx rings and tx ring.
5110 */
5111 if (actual < minimum) {
5112 ixgbe_log(ixgbe, "Insufficient interrupt handles available: %d",
5113 actual);
5114 goto alloc_handle_fail;
5115 }
5116
5117 /*
5118 * Get priority for first vector, assume remaining are all the same
5119 */
5120 rc = ddi_intr_get_pri(ixgbe->htable[0], &ixgbe->intr_pri);
5121 if (rc != DDI_SUCCESS) {
5122 ixgbe_log(ixgbe,
5123 "Get interrupt priority failed: %d", rc);
5124 goto alloc_handle_fail;
5125 }
5126
5127 rc = ddi_intr_get_cap(ixgbe->htable[0], &ixgbe->intr_cap);
5128 if (rc != DDI_SUCCESS) {
5129 ixgbe_log(ixgbe,
5130 "Get interrupt cap failed: %d", rc);
5131 goto alloc_handle_fail;
5132 }
5133
5134 ixgbe->intr_type = intr_type;
5135
5136 return (IXGBE_SUCCESS);
5137
5138 alloc_handle_fail:
5139 ixgbe_rem_intrs(ixgbe);
5140
5141 return (IXGBE_FAILURE);
5142 }
5143
5144 /*
5145 * ixgbe_add_intr_handlers - Add interrupt handlers based on the interrupt type.
5146 *
5147 * Before adding the interrupt handlers, the interrupt vectors have
5148 * been allocated, and the rx/tx rings have also been allocated.
5149 */
5150 static int
ixgbe_add_intr_handlers(ixgbe_t * ixgbe)5151 ixgbe_add_intr_handlers(ixgbe_t *ixgbe)
5152 {
5153 int vector = 0;
5154 int rc;
5155
5156 switch (ixgbe->intr_type) {
5157 case DDI_INTR_TYPE_MSIX:
5158 /*
5159 * Add interrupt handler for all vectors
5160 */
5161 for (vector = 0; vector < ixgbe->intr_cnt; vector++) {
5162 /*
5163 * install pointer to vect_map[vector]
5164 */
5165 rc = ddi_intr_add_handler(ixgbe->htable[vector],
5166 (ddi_intr_handler_t *)ixgbe_intr_msix,
5167 (void *)&ixgbe->vect_map[vector], NULL);
5168
5169 if (rc != DDI_SUCCESS) {
5170 ixgbe_log(ixgbe,
5171 "Add interrupt handler failed. "
5172 "return: %d, vector: %d", rc, vector);
5173 for (vector--; vector >= 0; vector--) {
5174 (void) ddi_intr_remove_handler(
5175 ixgbe->htable[vector]);
5176 }
5177 return (IXGBE_FAILURE);
5178 }
5179 }
5180
5181 break;
5182
5183 case DDI_INTR_TYPE_MSI:
5184 /*
5185 * Add interrupt handlers for the only vector
5186 */
5187 rc = ddi_intr_add_handler(ixgbe->htable[vector],
5188 (ddi_intr_handler_t *)ixgbe_intr_msi,
5189 (void *)ixgbe, NULL);
5190
5191 if (rc != DDI_SUCCESS) {
5192 ixgbe_log(ixgbe,
5193 "Add MSI interrupt handler failed: %d", rc);
5194 return (IXGBE_FAILURE);
5195 }
5196
5197 break;
5198
5199 case DDI_INTR_TYPE_FIXED:
5200 /*
5201 * Add interrupt handlers for the only vector
5202 */
5203 rc = ddi_intr_add_handler(ixgbe->htable[vector],
5204 (ddi_intr_handler_t *)ixgbe_intr_legacy,
5205 (void *)ixgbe, NULL);
5206
5207 if (rc != DDI_SUCCESS) {
5208 ixgbe_log(ixgbe,
5209 "Add legacy interrupt handler failed: %d", rc);
5210 return (IXGBE_FAILURE);
5211 }
5212
5213 break;
5214
5215 default:
5216 return (IXGBE_FAILURE);
5217 }
5218
5219 return (IXGBE_SUCCESS);
5220 }
5221
5222 #pragma inline(ixgbe_map_rxring_to_vector)
5223 /*
5224 * ixgbe_map_rxring_to_vector - Map given rx ring to given interrupt vector.
5225 */
5226 static void
ixgbe_map_rxring_to_vector(ixgbe_t * ixgbe,int r_idx,int v_idx)5227 ixgbe_map_rxring_to_vector(ixgbe_t *ixgbe, int r_idx, int v_idx)
5228 {
5229 /*
5230 * Set bit in map
5231 */
5232 BT_SET(ixgbe->vect_map[v_idx].rx_map, r_idx);
5233
5234 /*
5235 * Count bits set
5236 */
5237 ixgbe->vect_map[v_idx].rxr_cnt++;
5238
5239 /*
5240 * Remember bit position
5241 */
5242 ixgbe->rx_rings[r_idx].intr_vector = v_idx;
5243 ixgbe->rx_rings[r_idx].vect_bit = 1 << v_idx;
5244 }
5245
5246 #pragma inline(ixgbe_map_txring_to_vector)
5247 /*
5248 * ixgbe_map_txring_to_vector - Map given tx ring to given interrupt vector.
5249 */
5250 static void
ixgbe_map_txring_to_vector(ixgbe_t * ixgbe,int t_idx,int v_idx)5251 ixgbe_map_txring_to_vector(ixgbe_t *ixgbe, int t_idx, int v_idx)
5252 {
5253 /*
5254 * Set bit in map
5255 */
5256 BT_SET(ixgbe->vect_map[v_idx].tx_map, t_idx);
5257
5258 /*
5259 * Count bits set
5260 */
5261 ixgbe->vect_map[v_idx].txr_cnt++;
5262
5263 /*
5264 * Remember bit position
5265 */
5266 ixgbe->tx_rings[t_idx].intr_vector = v_idx;
5267 ixgbe->tx_rings[t_idx].vect_bit = 1 << v_idx;
5268 }
5269
5270 /*
5271 * ixgbe_setup_ivar - Set the given entry in the given interrupt vector
5272 * allocation register (IVAR).
5273 * cause:
5274 * -1 : other cause
5275 * 0 : rx
5276 * 1 : tx
5277 */
5278 static void
ixgbe_setup_ivar(ixgbe_t * ixgbe,uint16_t intr_alloc_entry,uint8_t msix_vector,int8_t cause)5279 ixgbe_setup_ivar(ixgbe_t *ixgbe, uint16_t intr_alloc_entry, uint8_t msix_vector,
5280 int8_t cause)
5281 {
5282 struct ixgbe_hw *hw = &ixgbe->hw;
5283 u32 ivar, index;
5284
5285 switch (hw->mac.type) {
5286 case ixgbe_mac_82598EB:
5287 msix_vector |= IXGBE_IVAR_ALLOC_VAL;
5288 if (cause == -1) {
5289 cause = 0;
5290 }
5291 index = (((cause * 64) + intr_alloc_entry) >> 2) & 0x1F;
5292 ivar = IXGBE_READ_REG(hw, IXGBE_IVAR(index));
5293 ivar &= ~(0xFF << (8 * (intr_alloc_entry & 0x3)));
5294 ivar |= (msix_vector << (8 * (intr_alloc_entry & 0x3)));
5295 IXGBE_WRITE_REG(hw, IXGBE_IVAR(index), ivar);
5296 break;
5297
5298 case ixgbe_mac_82599EB:
5299 case ixgbe_mac_X540:
5300 case ixgbe_mac_X550:
5301 case ixgbe_mac_X550EM_x:
5302 if (cause == -1) {
5303 /* other causes */
5304 msix_vector |= IXGBE_IVAR_ALLOC_VAL;
5305 index = (intr_alloc_entry & 1) * 8;
5306 ivar = IXGBE_READ_REG(hw, IXGBE_IVAR_MISC);
5307 ivar &= ~(0xFF << index);
5308 ivar |= (msix_vector << index);
5309 IXGBE_WRITE_REG(hw, IXGBE_IVAR_MISC, ivar);
5310 } else {
5311 /* tx or rx causes */
5312 msix_vector |= IXGBE_IVAR_ALLOC_VAL;
5313 index = ((16 * (intr_alloc_entry & 1)) + (8 * cause));
5314 ivar = IXGBE_READ_REG(hw,
5315 IXGBE_IVAR(intr_alloc_entry >> 1));
5316 ivar &= ~(0xFF << index);
5317 ivar |= (msix_vector << index);
5318 IXGBE_WRITE_REG(hw, IXGBE_IVAR(intr_alloc_entry >> 1),
5319 ivar);
5320 }
5321 break;
5322
5323 default:
5324 break;
5325 }
5326 }
5327
5328 /*
5329 * ixgbe_enable_ivar - Enable the given entry by setting the VAL bit of
5330 * given interrupt vector allocation register (IVAR).
5331 * cause:
5332 * -1 : other cause
5333 * 0 : rx
5334 * 1 : tx
5335 */
5336 static void
ixgbe_enable_ivar(ixgbe_t * ixgbe,uint16_t intr_alloc_entry,int8_t cause)5337 ixgbe_enable_ivar(ixgbe_t *ixgbe, uint16_t intr_alloc_entry, int8_t cause)
5338 {
5339 struct ixgbe_hw *hw = &ixgbe->hw;
5340 u32 ivar, index;
5341
5342 switch (hw->mac.type) {
5343 case ixgbe_mac_82598EB:
5344 if (cause == -1) {
5345 cause = 0;
5346 }
5347 index = (((cause * 64) + intr_alloc_entry) >> 2) & 0x1F;
5348 ivar = IXGBE_READ_REG(hw, IXGBE_IVAR(index));
5349 ivar |= (IXGBE_IVAR_ALLOC_VAL << (8 *
5350 (intr_alloc_entry & 0x3)));
5351 IXGBE_WRITE_REG(hw, IXGBE_IVAR(index), ivar);
5352 break;
5353
5354 case ixgbe_mac_82599EB:
5355 case ixgbe_mac_X540:
5356 case ixgbe_mac_X550:
5357 case ixgbe_mac_X550EM_x:
5358 if (cause == -1) {
5359 /* other causes */
5360 index = (intr_alloc_entry & 1) * 8;
5361 ivar = IXGBE_READ_REG(hw, IXGBE_IVAR_MISC);
5362 ivar |= (IXGBE_IVAR_ALLOC_VAL << index);
5363 IXGBE_WRITE_REG(hw, IXGBE_IVAR_MISC, ivar);
5364 } else {
5365 /* tx or rx causes */
5366 index = ((16 * (intr_alloc_entry & 1)) + (8 * cause));
5367 ivar = IXGBE_READ_REG(hw,
5368 IXGBE_IVAR(intr_alloc_entry >> 1));
5369 ivar |= (IXGBE_IVAR_ALLOC_VAL << index);
5370 IXGBE_WRITE_REG(hw, IXGBE_IVAR(intr_alloc_entry >> 1),
5371 ivar);
5372 }
5373 break;
5374
5375 default:
5376 break;
5377 }
5378 }
5379
5380 /*
5381 * ixgbe_disable_ivar - Disble the given entry by clearing the VAL bit of
5382 * given interrupt vector allocation register (IVAR).
5383 * cause:
5384 * -1 : other cause
5385 * 0 : rx
5386 * 1 : tx
5387 */
5388 static void
ixgbe_disable_ivar(ixgbe_t * ixgbe,uint16_t intr_alloc_entry,int8_t cause)5389 ixgbe_disable_ivar(ixgbe_t *ixgbe, uint16_t intr_alloc_entry, int8_t cause)
5390 {
5391 struct ixgbe_hw *hw = &ixgbe->hw;
5392 u32 ivar, index;
5393
5394 switch (hw->mac.type) {
5395 case ixgbe_mac_82598EB:
5396 if (cause == -1) {
5397 cause = 0;
5398 }
5399 index = (((cause * 64) + intr_alloc_entry) >> 2) & 0x1F;
5400 ivar = IXGBE_READ_REG(hw, IXGBE_IVAR(index));
5401 ivar &= ~(IXGBE_IVAR_ALLOC_VAL<< (8 *
5402 (intr_alloc_entry & 0x3)));
5403 IXGBE_WRITE_REG(hw, IXGBE_IVAR(index), ivar);
5404 break;
5405
5406 case ixgbe_mac_82599EB:
5407 case ixgbe_mac_X540:
5408 case ixgbe_mac_X550:
5409 case ixgbe_mac_X550EM_x:
5410 if (cause == -1) {
5411 /* other causes */
5412 index = (intr_alloc_entry & 1) * 8;
5413 ivar = IXGBE_READ_REG(hw, IXGBE_IVAR_MISC);
5414 ivar &= ~(IXGBE_IVAR_ALLOC_VAL << index);
5415 IXGBE_WRITE_REG(hw, IXGBE_IVAR_MISC, ivar);
5416 } else {
5417 /* tx or rx causes */
5418 index = ((16 * (intr_alloc_entry & 1)) + (8 * cause));
5419 ivar = IXGBE_READ_REG(hw,
5420 IXGBE_IVAR(intr_alloc_entry >> 1));
5421 ivar &= ~(IXGBE_IVAR_ALLOC_VAL << index);
5422 IXGBE_WRITE_REG(hw, IXGBE_IVAR(intr_alloc_entry >> 1),
5423 ivar);
5424 }
5425 break;
5426
5427 default:
5428 break;
5429 }
5430 }
5431
5432 /*
5433 * Convert the rx ring index driver maintained to the rx ring index
5434 * in h/w.
5435 */
5436 static uint32_t
ixgbe_get_hw_rx_index(ixgbe_t * ixgbe,uint32_t sw_rx_index)5437 ixgbe_get_hw_rx_index(ixgbe_t *ixgbe, uint32_t sw_rx_index)
5438 {
5439
5440 struct ixgbe_hw *hw = &ixgbe->hw;
5441 uint32_t rx_ring_per_group, hw_rx_index;
5442
5443 if (ixgbe->classify_mode == IXGBE_CLASSIFY_RSS ||
5444 ixgbe->classify_mode == IXGBE_CLASSIFY_NONE) {
5445 return (sw_rx_index);
5446 } else if (ixgbe->classify_mode == IXGBE_CLASSIFY_VMDQ) {
5447 switch (hw->mac.type) {
5448 case ixgbe_mac_82598EB:
5449 return (sw_rx_index);
5450
5451 case ixgbe_mac_82599EB:
5452 case ixgbe_mac_X540:
5453 case ixgbe_mac_X550:
5454 case ixgbe_mac_X550EM_x:
5455 return (sw_rx_index * 2);
5456
5457 default:
5458 break;
5459 }
5460 } else if (ixgbe->classify_mode == IXGBE_CLASSIFY_VMDQ_RSS) {
5461 rx_ring_per_group = ixgbe->num_rx_rings / ixgbe->num_rx_groups;
5462
5463 switch (hw->mac.type) {
5464 case ixgbe_mac_82598EB:
5465 hw_rx_index = (sw_rx_index / rx_ring_per_group) *
5466 16 + (sw_rx_index % rx_ring_per_group);
5467 return (hw_rx_index);
5468
5469 case ixgbe_mac_82599EB:
5470 case ixgbe_mac_X540:
5471 case ixgbe_mac_X550:
5472 case ixgbe_mac_X550EM_x:
5473 if (ixgbe->num_rx_groups > 32) {
5474 hw_rx_index = (sw_rx_index /
5475 rx_ring_per_group) * 2 +
5476 (sw_rx_index % rx_ring_per_group);
5477 } else {
5478 hw_rx_index = (sw_rx_index /
5479 rx_ring_per_group) * 4 +
5480 (sw_rx_index % rx_ring_per_group);
5481 }
5482 return (hw_rx_index);
5483
5484 default:
5485 break;
5486 }
5487 }
5488
5489 /*
5490 * Should never reach. Just to make compiler happy.
5491 */
5492 return (sw_rx_index);
5493 }
5494
5495 /*
5496 * ixgbe_map_intrs_to_vectors - Map different interrupts to MSI-X vectors.
5497 *
5498 * For MSI-X, here will map rx interrupt, tx interrupt and other interrupt
5499 * to vector[0 - (intr_cnt -1)].
5500 */
5501 static int
ixgbe_map_intrs_to_vectors(ixgbe_t * ixgbe)5502 ixgbe_map_intrs_to_vectors(ixgbe_t *ixgbe)
5503 {
5504 int i, vector = 0;
5505
5506 /* initialize vector map */
5507 bzero(&ixgbe->vect_map, sizeof (ixgbe->vect_map));
5508 for (i = 0; i < ixgbe->intr_cnt; i++) {
5509 ixgbe->vect_map[i].ixgbe = ixgbe;
5510 }
5511
5512 /*
5513 * non-MSI-X case is very simple: rx rings[0] on RTxQ[0],
5514 * tx rings[0] on RTxQ[1].
5515 */
5516 if (ixgbe->intr_type != DDI_INTR_TYPE_MSIX) {
5517 ixgbe_map_rxring_to_vector(ixgbe, 0, 0);
5518 ixgbe_map_txring_to_vector(ixgbe, 0, 1);
5519 return (IXGBE_SUCCESS);
5520 }
5521
5522 /*
5523 * Interrupts/vectors mapping for MSI-X
5524 */
5525
5526 /*
5527 * Map other interrupt to vector 0,
5528 * Set bit in map and count the bits set.
5529 */
5530 BT_SET(ixgbe->vect_map[vector].other_map, 0);
5531 ixgbe->vect_map[vector].other_cnt++;
5532
5533 /*
5534 * Map rx ring interrupts to vectors
5535 */
5536 for (i = 0; i < ixgbe->num_rx_rings; i++) {
5537 ixgbe_map_rxring_to_vector(ixgbe, i, vector);
5538 vector = (vector +1) % ixgbe->intr_cnt;
5539 }
5540
5541 /*
5542 * Map tx ring interrupts to vectors
5543 */
5544 for (i = 0; i < ixgbe->num_tx_rings; i++) {
5545 ixgbe_map_txring_to_vector(ixgbe, i, vector);
5546 vector = (vector +1) % ixgbe->intr_cnt;
5547 }
5548
5549 return (IXGBE_SUCCESS);
5550 }
5551
5552 /*
5553 * ixgbe_setup_adapter_vector - Setup the adapter interrupt vector(s).
5554 *
5555 * This relies on ring/vector mapping already set up in the
5556 * vect_map[] structures
5557 */
5558 static void
ixgbe_setup_adapter_vector(ixgbe_t * ixgbe)5559 ixgbe_setup_adapter_vector(ixgbe_t *ixgbe)
5560 {
5561 struct ixgbe_hw *hw = &ixgbe->hw;
5562 ixgbe_intr_vector_t *vect; /* vector bitmap */
5563 int r_idx; /* ring index */
5564 int v_idx; /* vector index */
5565 uint32_t hw_index;
5566
5567 /*
5568 * Clear any previous entries
5569 */
5570 switch (hw->mac.type) {
5571 case ixgbe_mac_82598EB:
5572 for (v_idx = 0; v_idx < 25; v_idx++)
5573 IXGBE_WRITE_REG(hw, IXGBE_IVAR(v_idx), 0);
5574 break;
5575
5576 case ixgbe_mac_82599EB:
5577 case ixgbe_mac_X540:
5578 case ixgbe_mac_X550:
5579 case ixgbe_mac_X550EM_x:
5580 for (v_idx = 0; v_idx < 64; v_idx++)
5581 IXGBE_WRITE_REG(hw, IXGBE_IVAR(v_idx), 0);
5582 IXGBE_WRITE_REG(hw, IXGBE_IVAR_MISC, 0);
5583 break;
5584
5585 default:
5586 break;
5587 }
5588
5589 /*
5590 * For non MSI-X interrupt, rx rings[0] will use RTxQ[0], and
5591 * tx rings[0] will use RTxQ[1].
5592 */
5593 if (ixgbe->intr_type != DDI_INTR_TYPE_MSIX) {
5594 ixgbe_setup_ivar(ixgbe, 0, 0, 0);
5595 ixgbe_setup_ivar(ixgbe, 0, 1, 1);
5596 return;
5597 }
5598
5599 /*
5600 * For MSI-X interrupt, "Other" is always on vector[0].
5601 */
5602 ixgbe_setup_ivar(ixgbe, IXGBE_IVAR_OTHER_CAUSES_INDEX, 0, -1);
5603
5604 /*
5605 * For each interrupt vector, populate the IVAR table
5606 */
5607 for (v_idx = 0; v_idx < ixgbe->intr_cnt; v_idx++) {
5608 vect = &ixgbe->vect_map[v_idx];
5609
5610 /*
5611 * For each rx ring bit set
5612 */
5613 r_idx = bt_getlowbit(vect->rx_map, 0,
5614 (ixgbe->num_rx_rings - 1));
5615
5616 while (r_idx >= 0) {
5617 hw_index = ixgbe->rx_rings[r_idx].hw_index;
5618 ixgbe_setup_ivar(ixgbe, hw_index, v_idx, 0);
5619 r_idx = bt_getlowbit(vect->rx_map, (r_idx + 1),
5620 (ixgbe->num_rx_rings - 1));
5621 }
5622
5623 /*
5624 * For each tx ring bit set
5625 */
5626 r_idx = bt_getlowbit(vect->tx_map, 0,
5627 (ixgbe->num_tx_rings - 1));
5628
5629 while (r_idx >= 0) {
5630 ixgbe_setup_ivar(ixgbe, r_idx, v_idx, 1);
5631 r_idx = bt_getlowbit(vect->tx_map, (r_idx + 1),
5632 (ixgbe->num_tx_rings - 1));
5633 }
5634 }
5635 }
5636
5637 /*
5638 * ixgbe_rem_intr_handlers - Remove the interrupt handlers.
5639 */
5640 static void
ixgbe_rem_intr_handlers(ixgbe_t * ixgbe)5641 ixgbe_rem_intr_handlers(ixgbe_t *ixgbe)
5642 {
5643 int i;
5644 int rc;
5645
5646 for (i = 0; i < ixgbe->intr_cnt; i++) {
5647 rc = ddi_intr_remove_handler(ixgbe->htable[i]);
5648 if (rc != DDI_SUCCESS) {
5649 IXGBE_DEBUGLOG_1(ixgbe,
5650 "Remove intr handler failed: %d", rc);
5651 }
5652 }
5653 }
5654
5655 /*
5656 * ixgbe_rem_intrs - Remove the allocated interrupts.
5657 */
5658 static void
ixgbe_rem_intrs(ixgbe_t * ixgbe)5659 ixgbe_rem_intrs(ixgbe_t *ixgbe)
5660 {
5661 int i;
5662 int rc;
5663
5664 for (i = 0; i < ixgbe->intr_cnt; i++) {
5665 rc = ddi_intr_free(ixgbe->htable[i]);
5666 if (rc != DDI_SUCCESS) {
5667 IXGBE_DEBUGLOG_1(ixgbe,
5668 "Free intr failed: %d", rc);
5669 }
5670 }
5671
5672 kmem_free(ixgbe->htable, ixgbe->intr_size);
5673 ixgbe->htable = NULL;
5674 }
5675
5676 /*
5677 * ixgbe_enable_intrs - Enable all the ddi interrupts.
5678 */
5679 static int
ixgbe_enable_intrs(ixgbe_t * ixgbe)5680 ixgbe_enable_intrs(ixgbe_t *ixgbe)
5681 {
5682 int i;
5683 int rc;
5684
5685 /*
5686 * Enable interrupts
5687 */
5688 if (ixgbe->intr_cap & DDI_INTR_FLAG_BLOCK) {
5689 /*
5690 * Call ddi_intr_block_enable() for MSI
5691 */
5692 rc = ddi_intr_block_enable(ixgbe->htable, ixgbe->intr_cnt);
5693 if (rc != DDI_SUCCESS) {
5694 ixgbe_log(ixgbe,
5695 "Enable block intr failed: %d", rc);
5696 return (IXGBE_FAILURE);
5697 }
5698 } else {
5699 /*
5700 * Call ddi_intr_enable() for Legacy/MSI non block enable
5701 */
5702 for (i = 0; i < ixgbe->intr_cnt; i++) {
5703 rc = ddi_intr_enable(ixgbe->htable[i]);
5704 if (rc != DDI_SUCCESS) {
5705 ixgbe_log(ixgbe,
5706 "Enable intr failed: %d", rc);
5707 return (IXGBE_FAILURE);
5708 }
5709 }
5710 }
5711
5712 return (IXGBE_SUCCESS);
5713 }
5714
5715 /*
5716 * ixgbe_disable_intrs - Disable all the interrupts.
5717 */
5718 static int
ixgbe_disable_intrs(ixgbe_t * ixgbe)5719 ixgbe_disable_intrs(ixgbe_t *ixgbe)
5720 {
5721 int i;
5722 int rc;
5723
5724 /*
5725 * Disable all interrupts
5726 */
5727 if (ixgbe->intr_cap & DDI_INTR_FLAG_BLOCK) {
5728 rc = ddi_intr_block_disable(ixgbe->htable, ixgbe->intr_cnt);
5729 if (rc != DDI_SUCCESS) {
5730 ixgbe_log(ixgbe,
5731 "Disable block intr failed: %d", rc);
5732 return (IXGBE_FAILURE);
5733 }
5734 } else {
5735 for (i = 0; i < ixgbe->intr_cnt; i++) {
5736 rc = ddi_intr_disable(ixgbe->htable[i]);
5737 if (rc != DDI_SUCCESS) {
5738 ixgbe_log(ixgbe,
5739 "Disable intr failed: %d", rc);
5740 return (IXGBE_FAILURE);
5741 }
5742 }
5743 }
5744
5745 return (IXGBE_SUCCESS);
5746 }
5747
5748 /*
5749 * ixgbe_get_hw_state - Get and save parameters related to adapter hardware.
5750 */
5751 static void
ixgbe_get_hw_state(ixgbe_t * ixgbe)5752 ixgbe_get_hw_state(ixgbe_t *ixgbe)
5753 {
5754 struct ixgbe_hw *hw = &ixgbe->hw;
5755 ixgbe_link_speed speed = 0;
5756 boolean_t link_up = B_FALSE;
5757 uint32_t pcs1g_anlp = 0;
5758
5759 ASSERT(mutex_owned(&ixgbe->gen_lock));
5760 ixgbe->param_lp_1000fdx_cap = 0;
5761 ixgbe->param_lp_100fdx_cap = 0;
5762
5763 /* check for link, don't wait */
5764 (void) ixgbe_check_link(hw, &speed, &link_up, B_FALSE);
5765
5766 /*
5767 * Update the observed Link Partner's capabilities. Not all adapters
5768 * can provide full information on the LP's capable speeds, so we
5769 * provide what we can.
5770 */
5771 if (link_up) {
5772 pcs1g_anlp = IXGBE_READ_REG(hw, IXGBE_PCS1GANLP);
5773
5774 ixgbe->param_lp_1000fdx_cap =
5775 (pcs1g_anlp & IXGBE_PCS1GANLP_LPFD) ? 1 : 0;
5776 ixgbe->param_lp_100fdx_cap =
5777 (pcs1g_anlp & IXGBE_PCS1GANLP_LPFD) ? 1 : 0;
5778 }
5779
5780 /*
5781 * Update GLD's notion of the adapter's currently advertised speeds.
5782 * Since the common code doesn't always record the current autonegotiate
5783 * settings in the phy struct for all parts (specifically, adapters with
5784 * SFPs) we first test to see if it is 0, and if so, we fall back to
5785 * using the adapter's speed capabilities which we saved during instance
5786 * init in ixgbe_init_params().
5787 *
5788 * Adapters with SFPs will always be shown as advertising all of their
5789 * supported speeds, and adapters with baseT PHYs (where the phy struct
5790 * is maintained by the common code) will always have a factual view of
5791 * their currently-advertised speeds. In the case of SFPs, this is
5792 * acceptable as we default to advertising all speeds that the adapter
5793 * claims to support, and those properties are immutable; unlike on
5794 * baseT (copper) PHYs, where speeds can be enabled or disabled at will.
5795 */
5796 speed = hw->phy.autoneg_advertised;
5797 if (speed == 0)
5798 speed = ixgbe->speeds_supported;
5799
5800 ixgbe->param_adv_10000fdx_cap =
5801 (speed & IXGBE_LINK_SPEED_10GB_FULL) ? 1 : 0;
5802 ixgbe->param_adv_5000fdx_cap =
5803 (speed & IXGBE_LINK_SPEED_5GB_FULL) ? 1 : 0;
5804 ixgbe->param_adv_2500fdx_cap =
5805 (speed & IXGBE_LINK_SPEED_2_5GB_FULL) ? 1 : 0;
5806 ixgbe->param_adv_1000fdx_cap =
5807 (speed & IXGBE_LINK_SPEED_1GB_FULL) ? 1 : 0;
5808 ixgbe->param_adv_100fdx_cap =
5809 (speed & IXGBE_LINK_SPEED_100_FULL) ? 1 : 0;
5810 }
5811
5812 /*
5813 * ixgbe_get_driver_control - Notify that driver is in control of device.
5814 */
5815 static void
ixgbe_get_driver_control(struct ixgbe_hw * hw)5816 ixgbe_get_driver_control(struct ixgbe_hw *hw)
5817 {
5818 uint32_t ctrl_ext;
5819
5820 /*
5821 * Notify firmware that driver is in control of device
5822 */
5823 ctrl_ext = IXGBE_READ_REG(hw, IXGBE_CTRL_EXT);
5824 ctrl_ext |= IXGBE_CTRL_EXT_DRV_LOAD;
5825 IXGBE_WRITE_REG(hw, IXGBE_CTRL_EXT, ctrl_ext);
5826 }
5827
5828 /*
5829 * ixgbe_release_driver_control - Notify that driver is no longer in control
5830 * of device.
5831 */
5832 static void
ixgbe_release_driver_control(struct ixgbe_hw * hw)5833 ixgbe_release_driver_control(struct ixgbe_hw *hw)
5834 {
5835 uint32_t ctrl_ext;
5836
5837 /*
5838 * Notify firmware that driver is no longer in control of device
5839 */
5840 ctrl_ext = IXGBE_READ_REG(hw, IXGBE_CTRL_EXT);
5841 ctrl_ext &= ~IXGBE_CTRL_EXT_DRV_LOAD;
5842 IXGBE_WRITE_REG(hw, IXGBE_CTRL_EXT, ctrl_ext);
5843 }
5844
5845 /*
5846 * ixgbe_atomic_reserve - Atomic decrease operation.
5847 */
5848 int
ixgbe_atomic_reserve(uint32_t * count_p,uint32_t n)5849 ixgbe_atomic_reserve(uint32_t *count_p, uint32_t n)
5850 {
5851 uint32_t oldval;
5852 uint32_t newval;
5853
5854 /*
5855 * ATOMICALLY
5856 */
5857 do {
5858 oldval = *count_p;
5859 if (oldval < n)
5860 return (-1);
5861 newval = oldval - n;
5862 } while (atomic_cas_32(count_p, oldval, newval) != oldval);
5863
5864 return (newval);
5865 }
5866
5867 /*
5868 * ixgbe_mc_table_itr - Traverse the entries in the multicast table.
5869 */
5870 static uint8_t *
ixgbe_mc_table_itr(struct ixgbe_hw * hw,uint8_t ** upd_ptr,uint32_t * vmdq)5871 ixgbe_mc_table_itr(struct ixgbe_hw *hw, uint8_t **upd_ptr, uint32_t *vmdq)
5872 {
5873 uint8_t *addr = *upd_ptr;
5874 uint8_t *new_ptr;
5875
5876 _NOTE(ARGUNUSED(hw));
5877 _NOTE(ARGUNUSED(vmdq));
5878
5879 new_ptr = addr + IXGBE_ETH_LENGTH_OF_ADDRESS;
5880 *upd_ptr = new_ptr;
5881 return (addr);
5882 }
5883
5884 /*
5885 * FMA support
5886 */
5887 int
ixgbe_check_acc_handle(ddi_acc_handle_t handle)5888 ixgbe_check_acc_handle(ddi_acc_handle_t handle)
5889 {
5890 ddi_fm_error_t de;
5891
5892 ddi_fm_acc_err_get(handle, &de, DDI_FME_VERSION);
5893 ddi_fm_acc_err_clear(handle, DDI_FME_VERSION);
5894 return (de.fme_status);
5895 }
5896
5897 int
ixgbe_check_dma_handle(ddi_dma_handle_t handle)5898 ixgbe_check_dma_handle(ddi_dma_handle_t handle)
5899 {
5900 ddi_fm_error_t de;
5901
5902 ddi_fm_dma_err_get(handle, &de, DDI_FME_VERSION);
5903 return (de.fme_status);
5904 }
5905
5906 /*
5907 * ixgbe_fm_error_cb - The IO fault service error handling callback function.
5908 */
5909 static int
ixgbe_fm_error_cb(dev_info_t * dip,ddi_fm_error_t * err,const void * impl_data)5910 ixgbe_fm_error_cb(dev_info_t *dip, ddi_fm_error_t *err, const void *impl_data)
5911 {
5912 _NOTE(ARGUNUSED(impl_data));
5913 /*
5914 * as the driver can always deal with an error in any dma or
5915 * access handle, we can just return the fme_status value.
5916 */
5917 pci_ereport_post(dip, err, NULL);
5918 return (err->fme_status);
5919 }
5920
5921 static void
ixgbe_fm_init(ixgbe_t * ixgbe)5922 ixgbe_fm_init(ixgbe_t *ixgbe)
5923 {
5924 ddi_iblock_cookie_t iblk;
5925 int fma_dma_flag;
5926
5927 /*
5928 * Only register with IO Fault Services if we have some capability
5929 */
5930 if (ixgbe->fm_capabilities & DDI_FM_ACCCHK_CAPABLE) {
5931 ixgbe_regs_acc_attr.devacc_attr_access = DDI_FLAGERR_ACC;
5932 } else {
5933 ixgbe_regs_acc_attr.devacc_attr_access = DDI_DEFAULT_ACC;
5934 }
5935
5936 if (ixgbe->fm_capabilities & DDI_FM_DMACHK_CAPABLE) {
5937 fma_dma_flag = 1;
5938 } else {
5939 fma_dma_flag = 0;
5940 }
5941
5942 ixgbe_set_fma_flags(fma_dma_flag);
5943
5944 if (ixgbe->fm_capabilities) {
5945
5946 /*
5947 * Register capabilities with IO Fault Services
5948 */
5949 ddi_fm_init(ixgbe->dip, &ixgbe->fm_capabilities, &iblk);
5950
5951 /*
5952 * Initialize pci ereport capabilities if ereport capable
5953 */
5954 if (DDI_FM_EREPORT_CAP(ixgbe->fm_capabilities) ||
5955 DDI_FM_ERRCB_CAP(ixgbe->fm_capabilities))
5956 pci_ereport_setup(ixgbe->dip);
5957
5958 /*
5959 * Register error callback if error callback capable
5960 */
5961 if (DDI_FM_ERRCB_CAP(ixgbe->fm_capabilities))
5962 ddi_fm_handler_register(ixgbe->dip,
5963 ixgbe_fm_error_cb, (void*) ixgbe);
5964 }
5965 }
5966
5967 static void
ixgbe_fm_fini(ixgbe_t * ixgbe)5968 ixgbe_fm_fini(ixgbe_t *ixgbe)
5969 {
5970 /*
5971 * Only unregister FMA capabilities if they are registered
5972 */
5973 if (ixgbe->fm_capabilities) {
5974
5975 /*
5976 * Release any resources allocated by pci_ereport_setup()
5977 */
5978 if (DDI_FM_EREPORT_CAP(ixgbe->fm_capabilities) ||
5979 DDI_FM_ERRCB_CAP(ixgbe->fm_capabilities))
5980 pci_ereport_teardown(ixgbe->dip);
5981
5982 /*
5983 * Un-register error callback if error callback capable
5984 */
5985 if (DDI_FM_ERRCB_CAP(ixgbe->fm_capabilities))
5986 ddi_fm_handler_unregister(ixgbe->dip);
5987
5988 /*
5989 * Unregister from IO Fault Service
5990 */
5991 ddi_fm_fini(ixgbe->dip);
5992 }
5993 }
5994
5995 void
ixgbe_fm_ereport(ixgbe_t * ixgbe,char * detail)5996 ixgbe_fm_ereport(ixgbe_t *ixgbe, char *detail)
5997 {
5998 uint64_t ena;
5999 char buf[FM_MAX_CLASS];
6000
6001 (void) snprintf(buf, FM_MAX_CLASS, "%s.%s", DDI_FM_DEVICE, detail);
6002 ena = fm_ena_generate(0, FM_ENA_FMT1);
6003 if (DDI_FM_EREPORT_CAP(ixgbe->fm_capabilities)) {
6004 ddi_fm_ereport_post(ixgbe->dip, buf, ena, DDI_NOSLEEP,
6005 FM_VERSION, DATA_TYPE_UINT8, FM_EREPORT_VERS0, NULL);
6006 }
6007 }
6008
6009 static int
ixgbe_ring_start(mac_ring_driver_t rh,uint64_t mr_gen_num)6010 ixgbe_ring_start(mac_ring_driver_t rh, uint64_t mr_gen_num)
6011 {
6012 ixgbe_rx_ring_t *rx_ring = (ixgbe_rx_ring_t *)rh;
6013
6014 mutex_enter(&rx_ring->rx_lock);
6015 rx_ring->ring_gen_num = mr_gen_num;
6016 mutex_exit(&rx_ring->rx_lock);
6017 return (0);
6018 }
6019
6020 /*
6021 * Get the global ring index by a ring index within a group.
6022 */
6023 static int
ixgbe_get_rx_ring_index(ixgbe_t * ixgbe,int gindex,int rindex)6024 ixgbe_get_rx_ring_index(ixgbe_t *ixgbe, int gindex, int rindex)
6025 {
6026 ixgbe_rx_ring_t *rx_ring;
6027 int i;
6028
6029 for (i = 0; i < ixgbe->num_rx_rings; i++) {
6030 rx_ring = &ixgbe->rx_rings[i];
6031 if (rx_ring->group_index == gindex)
6032 rindex--;
6033 if (rindex < 0)
6034 return (i);
6035 }
6036
6037 return (-1);
6038 }
6039
6040 /*
6041 * Callback funtion for MAC layer to register all rings.
6042 */
6043 /* ARGSUSED */
6044 void
ixgbe_fill_ring(void * arg,mac_ring_type_t rtype,const int group_index,const int ring_index,mac_ring_info_t * infop,mac_ring_handle_t rh)6045 ixgbe_fill_ring(void *arg, mac_ring_type_t rtype, const int group_index,
6046 const int ring_index, mac_ring_info_t *infop, mac_ring_handle_t rh)
6047 {
6048 ixgbe_t *ixgbe = (ixgbe_t *)arg;
6049 mac_intr_t *mintr = &infop->mri_intr;
6050
6051 switch (rtype) {
6052 case MAC_RING_TYPE_RX: {
6053 /*
6054 * 'index' is the ring index within the group.
6055 * Need to get the global ring index by searching in groups.
6056 */
6057 int global_ring_index = ixgbe_get_rx_ring_index(
6058 ixgbe, group_index, ring_index);
6059
6060 ASSERT(global_ring_index >= 0);
6061
6062 ixgbe_rx_ring_t *rx_ring = &ixgbe->rx_rings[global_ring_index];
6063 rx_ring->ring_handle = rh;
6064
6065 infop->mri_driver = (mac_ring_driver_t)rx_ring;
6066 infop->mri_start = ixgbe_ring_start;
6067 infop->mri_stop = NULL;
6068 infop->mri_poll = ixgbe_ring_rx_poll;
6069 infop->mri_stat = ixgbe_rx_ring_stat;
6070
6071 mintr->mi_handle = (mac_intr_handle_t)rx_ring;
6072 mintr->mi_enable = ixgbe_rx_ring_intr_enable;
6073 mintr->mi_disable = ixgbe_rx_ring_intr_disable;
6074 if (ixgbe->intr_type &
6075 (DDI_INTR_TYPE_MSIX | DDI_INTR_TYPE_MSI)) {
6076 mintr->mi_ddi_handle =
6077 ixgbe->htable[rx_ring->intr_vector];
6078 }
6079
6080 break;
6081 }
6082 case MAC_RING_TYPE_TX: {
6083 ASSERT(group_index == -1);
6084 ASSERT(ring_index < ixgbe->num_tx_rings);
6085
6086 ixgbe_tx_ring_t *tx_ring = &ixgbe->tx_rings[ring_index];
6087 tx_ring->ring_handle = rh;
6088
6089 infop->mri_driver = (mac_ring_driver_t)tx_ring;
6090 infop->mri_start = NULL;
6091 infop->mri_stop = NULL;
6092 infop->mri_tx = ixgbe_ring_tx;
6093 infop->mri_stat = ixgbe_tx_ring_stat;
6094 if (ixgbe->intr_type &
6095 (DDI_INTR_TYPE_MSIX | DDI_INTR_TYPE_MSI)) {
6096 mintr->mi_ddi_handle =
6097 ixgbe->htable[tx_ring->intr_vector];
6098 }
6099 break;
6100 }
6101 default:
6102 break;
6103 }
6104 }
6105
6106 /*
6107 * Callback funtion for MAC layer to register all groups.
6108 */
6109 void
ixgbe_fill_group(void * arg,mac_ring_type_t rtype,const int index,mac_group_info_t * infop,mac_group_handle_t gh)6110 ixgbe_fill_group(void *arg, mac_ring_type_t rtype, const int index,
6111 mac_group_info_t *infop, mac_group_handle_t gh)
6112 {
6113 ixgbe_t *ixgbe = (ixgbe_t *)arg;
6114
6115 switch (rtype) {
6116 case MAC_RING_TYPE_RX: {
6117 ixgbe_rx_group_t *rx_group;
6118
6119 rx_group = &ixgbe->rx_groups[index];
6120 rx_group->group_handle = gh;
6121
6122 infop->mgi_driver = (mac_group_driver_t)rx_group;
6123 infop->mgi_start = NULL;
6124 infop->mgi_stop = NULL;
6125 infop->mgi_addmac = ixgbe_addmac;
6126 infop->mgi_remmac = ixgbe_remmac;
6127 infop->mgi_count = (ixgbe->num_rx_rings / ixgbe->num_rx_groups);
6128
6129 break;
6130 }
6131 case MAC_RING_TYPE_TX:
6132 break;
6133 default:
6134 break;
6135 }
6136 }
6137
6138 /*
6139 * Enable interrupt on the specificed rx ring.
6140 */
6141 int
ixgbe_rx_ring_intr_enable(mac_intr_handle_t intrh)6142 ixgbe_rx_ring_intr_enable(mac_intr_handle_t intrh)
6143 {
6144 ixgbe_rx_ring_t *rx_ring = (ixgbe_rx_ring_t *)intrh;
6145 ixgbe_t *ixgbe = rx_ring->ixgbe;
6146 int r_idx = rx_ring->index;
6147 int hw_r_idx = rx_ring->hw_index;
6148 int v_idx = rx_ring->intr_vector;
6149
6150 mutex_enter(&ixgbe->gen_lock);
6151 if (ixgbe->ixgbe_state & IXGBE_INTR_ADJUST) {
6152 mutex_exit(&ixgbe->gen_lock);
6153 /*
6154 * Simply return 0.
6155 * Interrupts are being adjusted. ixgbe_intr_adjust()
6156 * will eventually re-enable the interrupt when it's
6157 * done with the adjustment.
6158 */
6159 return (0);
6160 }
6161
6162 /*
6163 * To enable interrupt by setting the VAL bit of given interrupt
6164 * vector allocation register (IVAR).
6165 */
6166 ixgbe_enable_ivar(ixgbe, hw_r_idx, 0);
6167
6168 BT_SET(ixgbe->vect_map[v_idx].rx_map, r_idx);
6169
6170 /*
6171 * Trigger a Rx interrupt on this ring
6172 */
6173 IXGBE_WRITE_REG(&ixgbe->hw, IXGBE_EICS, (1 << v_idx));
6174 IXGBE_WRITE_FLUSH(&ixgbe->hw);
6175
6176 mutex_exit(&ixgbe->gen_lock);
6177
6178 return (0);
6179 }
6180
6181 /*
6182 * Disable interrupt on the specificed rx ring.
6183 */
6184 int
ixgbe_rx_ring_intr_disable(mac_intr_handle_t intrh)6185 ixgbe_rx_ring_intr_disable(mac_intr_handle_t intrh)
6186 {
6187 ixgbe_rx_ring_t *rx_ring = (ixgbe_rx_ring_t *)intrh;
6188 ixgbe_t *ixgbe = rx_ring->ixgbe;
6189 int r_idx = rx_ring->index;
6190 int hw_r_idx = rx_ring->hw_index;
6191 int v_idx = rx_ring->intr_vector;
6192
6193 mutex_enter(&ixgbe->gen_lock);
6194 if (ixgbe->ixgbe_state & IXGBE_INTR_ADJUST) {
6195 mutex_exit(&ixgbe->gen_lock);
6196 /*
6197 * Simply return 0.
6198 * In the rare case where an interrupt is being
6199 * disabled while interrupts are being adjusted,
6200 * we don't fail the operation. No interrupts will
6201 * be generated while they are adjusted, and
6202 * ixgbe_intr_adjust() will cause the interrupts
6203 * to be re-enabled once it completes. Note that
6204 * in this case, packets may be delivered to the
6205 * stack via interrupts before xgbe_rx_ring_intr_enable()
6206 * is called again. This is acceptable since interrupt
6207 * adjustment is infrequent, and the stack will be
6208 * able to handle these packets.
6209 */
6210 return (0);
6211 }
6212
6213 /*
6214 * To disable interrupt by clearing the VAL bit of given interrupt
6215 * vector allocation register (IVAR).
6216 */
6217 ixgbe_disable_ivar(ixgbe, hw_r_idx, 0);
6218
6219 BT_CLEAR(ixgbe->vect_map[v_idx].rx_map, r_idx);
6220
6221 mutex_exit(&ixgbe->gen_lock);
6222
6223 return (0);
6224 }
6225
6226 /*
6227 * Add a mac address.
6228 */
6229 static int
ixgbe_addmac(void * arg,const uint8_t * mac_addr)6230 ixgbe_addmac(void *arg, const uint8_t *mac_addr)
6231 {
6232 ixgbe_rx_group_t *rx_group = (ixgbe_rx_group_t *)arg;
6233 ixgbe_t *ixgbe = rx_group->ixgbe;
6234 struct ixgbe_hw *hw = &ixgbe->hw;
6235 int slot, i;
6236
6237 mutex_enter(&ixgbe->gen_lock);
6238
6239 if (ixgbe->ixgbe_state & IXGBE_SUSPENDED) {
6240 mutex_exit(&ixgbe->gen_lock);
6241 return (ECANCELED);
6242 }
6243
6244 if (ixgbe->unicst_avail == 0) {
6245 /* no slots available */
6246 mutex_exit(&ixgbe->gen_lock);
6247 return (ENOSPC);
6248 }
6249
6250 /*
6251 * The first ixgbe->num_rx_groups slots are reserved for each respective
6252 * group. The rest slots are shared by all groups. While adding a
6253 * MAC address, reserved slots are firstly checked then the shared
6254 * slots are searched.
6255 */
6256 slot = -1;
6257 if (ixgbe->unicst_addr[rx_group->index].mac.set == 1) {
6258 for (i = ixgbe->num_rx_groups; i < ixgbe->unicst_total; i++) {
6259 if (ixgbe->unicst_addr[i].mac.set == 0) {
6260 slot = i;
6261 break;
6262 }
6263 }
6264 } else {
6265 slot = rx_group->index;
6266 }
6267
6268 if (slot == -1) {
6269 /* no slots available */
6270 mutex_exit(&ixgbe->gen_lock);
6271 return (ENOSPC);
6272 }
6273
6274 bcopy(mac_addr, ixgbe->unicst_addr[slot].mac.addr, ETHERADDRL);
6275 (void) ixgbe_set_rar(hw, slot, ixgbe->unicst_addr[slot].mac.addr,
6276 rx_group->index, IXGBE_RAH_AV);
6277 ixgbe->unicst_addr[slot].mac.set = 1;
6278 ixgbe->unicst_addr[slot].mac.group_index = rx_group->index;
6279 ixgbe->unicst_avail--;
6280
6281 mutex_exit(&ixgbe->gen_lock);
6282
6283 return (0);
6284 }
6285
6286 /*
6287 * Remove a mac address.
6288 */
6289 static int
ixgbe_remmac(void * arg,const uint8_t * mac_addr)6290 ixgbe_remmac(void *arg, const uint8_t *mac_addr)
6291 {
6292 ixgbe_rx_group_t *rx_group = (ixgbe_rx_group_t *)arg;
6293 ixgbe_t *ixgbe = rx_group->ixgbe;
6294 struct ixgbe_hw *hw = &ixgbe->hw;
6295 int slot;
6296
6297 mutex_enter(&ixgbe->gen_lock);
6298
6299 if (ixgbe->ixgbe_state & IXGBE_SUSPENDED) {
6300 mutex_exit(&ixgbe->gen_lock);
6301 return (ECANCELED);
6302 }
6303
6304 slot = ixgbe_unicst_find(ixgbe, mac_addr);
6305 if (slot == -1) {
6306 mutex_exit(&ixgbe->gen_lock);
6307 return (EINVAL);
6308 }
6309
6310 if (ixgbe->unicst_addr[slot].mac.set == 0) {
6311 mutex_exit(&ixgbe->gen_lock);
6312 return (EINVAL);
6313 }
6314
6315 bzero(ixgbe->unicst_addr[slot].mac.addr, ETHERADDRL);
6316 (void) ixgbe_clear_rar(hw, slot);
6317 ixgbe->unicst_addr[slot].mac.set = 0;
6318 ixgbe->unicst_avail++;
6319
6320 mutex_exit(&ixgbe->gen_lock);
6321
6322 return (0);
6323 }
6324