1 /* 2 * Copyright (c) 2007 Mellanox Technologies. All rights reserved. 3 * 4 * This software is available to you under a choice of one of two 5 * licenses. You may choose to be licensed under the terms of the GNU 6 * General Public License (GPL) Version 2, available from the file 7 * COPYING in the main directory of this source tree, or the 8 * OpenIB.org BSD license below: 9 * 10 * Redistribution and use in source and binary forms, with or 11 * without modification, are permitted provided that the following 12 * conditions are met: 13 * 14 * - Redistributions of source code must retain the above 15 * copyright notice, this list of conditions and the following 16 * disclaimer. 17 * 18 * - Redistributions in binary form must reproduce the above 19 * copyright notice, this list of conditions and the following 20 * disclaimer in the documentation and/or other materials 21 * provided with the distribution. 22 * 23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS 27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN 28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 30 * SOFTWARE. 31 * 32 */ 33 34 #include <linux/etherdevice.h> 35 #include <linux/tcp.h> 36 #include <linux/if_vlan.h> 37 #include <linux/delay.h> 38 #include <linux/slab.h> 39 #include <linux/hash.h> 40 #include <net/ip.h> 41 #include <net/busy_poll.h> 42 #include <net/vxlan.h> 43 44 #include <linux/mlx4/driver.h> 45 #include <linux/mlx4/device.h> 46 #include <linux/mlx4/cmd.h> 47 #include <linux/mlx4/cq.h> 48 49 #include "mlx4_en.h" 50 #include "en_port.h" 51 52 int mlx4_en_setup_tc(struct net_device *dev, u8 up) 53 { 54 struct mlx4_en_priv *priv = netdev_priv(dev); 55 int i; 56 unsigned int offset = 0; 57 58 if (up && up != MLX4_EN_NUM_UP) 59 return -EINVAL; 60 61 netdev_set_num_tc(dev, up); 62 63 /* Partition Tx queues evenly amongst UP's */ 64 for (i = 0; i < up; i++) { 65 netdev_set_tc_queue(dev, i, priv->num_tx_rings_p_up, offset); 66 offset += priv->num_tx_rings_p_up; 67 } 68 69 return 0; 70 } 71 72 #ifdef CONFIG_NET_RX_BUSY_POLL 73 /* must be called with local_bh_disable()d */ 74 static int mlx4_en_low_latency_recv(struct napi_struct *napi) 75 { 76 struct mlx4_en_cq *cq = container_of(napi, struct mlx4_en_cq, napi); 77 struct net_device *dev = cq->dev; 78 struct mlx4_en_priv *priv = netdev_priv(dev); 79 struct mlx4_en_rx_ring *rx_ring = priv->rx_ring[cq->ring]; 80 int done; 81 82 if (!priv->port_up) 83 return LL_FLUSH_FAILED; 84 85 if (!mlx4_en_cq_lock_poll(cq)) 86 return LL_FLUSH_BUSY; 87 88 done = mlx4_en_process_rx_cq(dev, cq, 4); 89 if (likely(done)) 90 rx_ring->cleaned += done; 91 else 92 rx_ring->misses++; 93 94 mlx4_en_cq_unlock_poll(cq); 95 96 return done; 97 } 98 #endif /* CONFIG_NET_RX_BUSY_POLL */ 99 100 #ifdef CONFIG_RFS_ACCEL 101 102 struct mlx4_en_filter { 103 struct list_head next; 104 struct work_struct work; 105 106 u8 ip_proto; 107 __be32 src_ip; 108 __be32 dst_ip; 109 __be16 src_port; 110 __be16 dst_port; 111 112 int rxq_index; 113 struct mlx4_en_priv *priv; 114 u32 flow_id; /* RFS infrastructure id */ 115 int id; /* mlx4_en driver id */ 116 u64 reg_id; /* Flow steering API id */ 117 u8 activated; /* Used to prevent expiry before filter 118 * is attached 119 */ 120 struct hlist_node filter_chain; 121 }; 122 123 static void mlx4_en_filter_rfs_expire(struct mlx4_en_priv *priv); 124 125 static enum mlx4_net_trans_rule_id mlx4_ip_proto_to_trans_rule_id(u8 ip_proto) 126 { 127 switch (ip_proto) { 128 case IPPROTO_UDP: 129 return MLX4_NET_TRANS_RULE_ID_UDP; 130 case IPPROTO_TCP: 131 return MLX4_NET_TRANS_RULE_ID_TCP; 132 default: 133 return MLX4_NET_TRANS_RULE_NUM; 134 } 135 }; 136 137 static void mlx4_en_filter_work(struct work_struct *work) 138 { 139 struct mlx4_en_filter *filter = container_of(work, 140 struct mlx4_en_filter, 141 work); 142 struct mlx4_en_priv *priv = filter->priv; 143 struct mlx4_spec_list spec_tcp_udp = { 144 .id = mlx4_ip_proto_to_trans_rule_id(filter->ip_proto), 145 { 146 .tcp_udp = { 147 .dst_port = filter->dst_port, 148 .dst_port_msk = (__force __be16)-1, 149 .src_port = filter->src_port, 150 .src_port_msk = (__force __be16)-1, 151 }, 152 }, 153 }; 154 struct mlx4_spec_list spec_ip = { 155 .id = MLX4_NET_TRANS_RULE_ID_IPV4, 156 { 157 .ipv4 = { 158 .dst_ip = filter->dst_ip, 159 .dst_ip_msk = (__force __be32)-1, 160 .src_ip = filter->src_ip, 161 .src_ip_msk = (__force __be32)-1, 162 }, 163 }, 164 }; 165 struct mlx4_spec_list spec_eth = { 166 .id = MLX4_NET_TRANS_RULE_ID_ETH, 167 }; 168 struct mlx4_net_trans_rule rule = { 169 .list = LIST_HEAD_INIT(rule.list), 170 .queue_mode = MLX4_NET_TRANS_Q_LIFO, 171 .exclusive = 1, 172 .allow_loopback = 1, 173 .promisc_mode = MLX4_FS_REGULAR, 174 .port = priv->port, 175 .priority = MLX4_DOMAIN_RFS, 176 }; 177 int rc; 178 __be64 mac_mask = cpu_to_be64(MLX4_MAC_MASK << 16); 179 180 if (spec_tcp_udp.id >= MLX4_NET_TRANS_RULE_NUM) { 181 en_warn(priv, "RFS: ignoring unsupported ip protocol (%d)\n", 182 filter->ip_proto); 183 goto ignore; 184 } 185 list_add_tail(&spec_eth.list, &rule.list); 186 list_add_tail(&spec_ip.list, &rule.list); 187 list_add_tail(&spec_tcp_udp.list, &rule.list); 188 189 rule.qpn = priv->rss_map.qps[filter->rxq_index].qpn; 190 memcpy(spec_eth.eth.dst_mac, priv->dev->dev_addr, ETH_ALEN); 191 memcpy(spec_eth.eth.dst_mac_msk, &mac_mask, ETH_ALEN); 192 193 filter->activated = 0; 194 195 if (filter->reg_id) { 196 rc = mlx4_flow_detach(priv->mdev->dev, filter->reg_id); 197 if (rc && rc != -ENOENT) 198 en_err(priv, "Error detaching flow. rc = %d\n", rc); 199 } 200 201 rc = mlx4_flow_attach(priv->mdev->dev, &rule, &filter->reg_id); 202 if (rc) 203 en_err(priv, "Error attaching flow. err = %d\n", rc); 204 205 ignore: 206 mlx4_en_filter_rfs_expire(priv); 207 208 filter->activated = 1; 209 } 210 211 static inline struct hlist_head * 212 filter_hash_bucket(struct mlx4_en_priv *priv, __be32 src_ip, __be32 dst_ip, 213 __be16 src_port, __be16 dst_port) 214 { 215 unsigned long l; 216 int bucket_idx; 217 218 l = (__force unsigned long)src_port | 219 ((__force unsigned long)dst_port << 2); 220 l ^= (__force unsigned long)(src_ip ^ dst_ip); 221 222 bucket_idx = hash_long(l, MLX4_EN_FILTER_HASH_SHIFT); 223 224 return &priv->filter_hash[bucket_idx]; 225 } 226 227 static struct mlx4_en_filter * 228 mlx4_en_filter_alloc(struct mlx4_en_priv *priv, int rxq_index, __be32 src_ip, 229 __be32 dst_ip, u8 ip_proto, __be16 src_port, 230 __be16 dst_port, u32 flow_id) 231 { 232 struct mlx4_en_filter *filter = NULL; 233 234 filter = kzalloc(sizeof(struct mlx4_en_filter), GFP_ATOMIC); 235 if (!filter) 236 return NULL; 237 238 filter->priv = priv; 239 filter->rxq_index = rxq_index; 240 INIT_WORK(&filter->work, mlx4_en_filter_work); 241 242 filter->src_ip = src_ip; 243 filter->dst_ip = dst_ip; 244 filter->ip_proto = ip_proto; 245 filter->src_port = src_port; 246 filter->dst_port = dst_port; 247 248 filter->flow_id = flow_id; 249 250 filter->id = priv->last_filter_id++ % RPS_NO_FILTER; 251 252 list_add_tail(&filter->next, &priv->filters); 253 hlist_add_head(&filter->filter_chain, 254 filter_hash_bucket(priv, src_ip, dst_ip, src_port, 255 dst_port)); 256 257 return filter; 258 } 259 260 static void mlx4_en_filter_free(struct mlx4_en_filter *filter) 261 { 262 struct mlx4_en_priv *priv = filter->priv; 263 int rc; 264 265 list_del(&filter->next); 266 267 rc = mlx4_flow_detach(priv->mdev->dev, filter->reg_id); 268 if (rc && rc != -ENOENT) 269 en_err(priv, "Error detaching flow. rc = %d\n", rc); 270 271 kfree(filter); 272 } 273 274 static inline struct mlx4_en_filter * 275 mlx4_en_filter_find(struct mlx4_en_priv *priv, __be32 src_ip, __be32 dst_ip, 276 u8 ip_proto, __be16 src_port, __be16 dst_port) 277 { 278 struct mlx4_en_filter *filter; 279 struct mlx4_en_filter *ret = NULL; 280 281 hlist_for_each_entry(filter, 282 filter_hash_bucket(priv, src_ip, dst_ip, 283 src_port, dst_port), 284 filter_chain) { 285 if (filter->src_ip == src_ip && 286 filter->dst_ip == dst_ip && 287 filter->ip_proto == ip_proto && 288 filter->src_port == src_port && 289 filter->dst_port == dst_port) { 290 ret = filter; 291 break; 292 } 293 } 294 295 return ret; 296 } 297 298 static int 299 mlx4_en_filter_rfs(struct net_device *net_dev, const struct sk_buff *skb, 300 u16 rxq_index, u32 flow_id) 301 { 302 struct mlx4_en_priv *priv = netdev_priv(net_dev); 303 struct mlx4_en_filter *filter; 304 const struct iphdr *ip; 305 const __be16 *ports; 306 u8 ip_proto; 307 __be32 src_ip; 308 __be32 dst_ip; 309 __be16 src_port; 310 __be16 dst_port; 311 int nhoff = skb_network_offset(skb); 312 int ret = 0; 313 314 if (skb->protocol != htons(ETH_P_IP)) 315 return -EPROTONOSUPPORT; 316 317 ip = (const struct iphdr *)(skb->data + nhoff); 318 if (ip_is_fragment(ip)) 319 return -EPROTONOSUPPORT; 320 321 if ((ip->protocol != IPPROTO_TCP) && (ip->protocol != IPPROTO_UDP)) 322 return -EPROTONOSUPPORT; 323 ports = (const __be16 *)(skb->data + nhoff + 4 * ip->ihl); 324 325 ip_proto = ip->protocol; 326 src_ip = ip->saddr; 327 dst_ip = ip->daddr; 328 src_port = ports[0]; 329 dst_port = ports[1]; 330 331 spin_lock_bh(&priv->filters_lock); 332 filter = mlx4_en_filter_find(priv, src_ip, dst_ip, ip_proto, 333 src_port, dst_port); 334 if (filter) { 335 if (filter->rxq_index == rxq_index) 336 goto out; 337 338 filter->rxq_index = rxq_index; 339 } else { 340 filter = mlx4_en_filter_alloc(priv, rxq_index, 341 src_ip, dst_ip, ip_proto, 342 src_port, dst_port, flow_id); 343 if (!filter) { 344 ret = -ENOMEM; 345 goto err; 346 } 347 } 348 349 queue_work(priv->mdev->workqueue, &filter->work); 350 351 out: 352 ret = filter->id; 353 err: 354 spin_unlock_bh(&priv->filters_lock); 355 356 return ret; 357 } 358 359 void mlx4_en_cleanup_filters(struct mlx4_en_priv *priv) 360 { 361 struct mlx4_en_filter *filter, *tmp; 362 LIST_HEAD(del_list); 363 364 spin_lock_bh(&priv->filters_lock); 365 list_for_each_entry_safe(filter, tmp, &priv->filters, next) { 366 list_move(&filter->next, &del_list); 367 hlist_del(&filter->filter_chain); 368 } 369 spin_unlock_bh(&priv->filters_lock); 370 371 list_for_each_entry_safe(filter, tmp, &del_list, next) { 372 cancel_work_sync(&filter->work); 373 mlx4_en_filter_free(filter); 374 } 375 } 376 377 static void mlx4_en_filter_rfs_expire(struct mlx4_en_priv *priv) 378 { 379 struct mlx4_en_filter *filter = NULL, *tmp, *last_filter = NULL; 380 LIST_HEAD(del_list); 381 int i = 0; 382 383 spin_lock_bh(&priv->filters_lock); 384 list_for_each_entry_safe(filter, tmp, &priv->filters, next) { 385 if (i > MLX4_EN_FILTER_EXPIRY_QUOTA) 386 break; 387 388 if (filter->activated && 389 !work_pending(&filter->work) && 390 rps_may_expire_flow(priv->dev, 391 filter->rxq_index, filter->flow_id, 392 filter->id)) { 393 list_move(&filter->next, &del_list); 394 hlist_del(&filter->filter_chain); 395 } else 396 last_filter = filter; 397 398 i++; 399 } 400 401 if (last_filter && (&last_filter->next != priv->filters.next)) 402 list_move(&priv->filters, &last_filter->next); 403 404 spin_unlock_bh(&priv->filters_lock); 405 406 list_for_each_entry_safe(filter, tmp, &del_list, next) 407 mlx4_en_filter_free(filter); 408 } 409 #endif 410 411 static int mlx4_en_vlan_rx_add_vid(struct net_device *dev, 412 __be16 proto, u16 vid) 413 { 414 struct mlx4_en_priv *priv = netdev_priv(dev); 415 struct mlx4_en_dev *mdev = priv->mdev; 416 int err; 417 int idx; 418 419 en_dbg(HW, priv, "adding VLAN:%d\n", vid); 420 421 set_bit(vid, priv->active_vlans); 422 423 /* Add VID to port VLAN filter */ 424 mutex_lock(&mdev->state_lock); 425 if (mdev->device_up && priv->port_up) { 426 err = mlx4_SET_VLAN_FLTR(mdev->dev, priv); 427 if (err) 428 en_err(priv, "Failed configuring VLAN filter\n"); 429 } 430 if (mlx4_register_vlan(mdev->dev, priv->port, vid, &idx)) 431 en_dbg(HW, priv, "failed adding vlan %d\n", vid); 432 mutex_unlock(&mdev->state_lock); 433 434 return 0; 435 } 436 437 static int mlx4_en_vlan_rx_kill_vid(struct net_device *dev, 438 __be16 proto, u16 vid) 439 { 440 struct mlx4_en_priv *priv = netdev_priv(dev); 441 struct mlx4_en_dev *mdev = priv->mdev; 442 int err; 443 444 en_dbg(HW, priv, "Killing VID:%d\n", vid); 445 446 clear_bit(vid, priv->active_vlans); 447 448 /* Remove VID from port VLAN filter */ 449 mutex_lock(&mdev->state_lock); 450 mlx4_unregister_vlan(mdev->dev, priv->port, vid); 451 452 if (mdev->device_up && priv->port_up) { 453 err = mlx4_SET_VLAN_FLTR(mdev->dev, priv); 454 if (err) 455 en_err(priv, "Failed configuring VLAN filter\n"); 456 } 457 mutex_unlock(&mdev->state_lock); 458 459 return 0; 460 } 461 462 static void mlx4_en_u64_to_mac(unsigned char dst_mac[ETH_ALEN + 2], u64 src_mac) 463 { 464 int i; 465 for (i = ETH_ALEN - 1; i >= 0; --i) { 466 dst_mac[i] = src_mac & 0xff; 467 src_mac >>= 8; 468 } 469 memset(&dst_mac[ETH_ALEN], 0, 2); 470 } 471 472 473 static int mlx4_en_tunnel_steer_add(struct mlx4_en_priv *priv, unsigned char *addr, 474 int qpn, u64 *reg_id) 475 { 476 int err; 477 478 if (priv->mdev->dev->caps.tunnel_offload_mode != MLX4_TUNNEL_OFFLOAD_MODE_VXLAN || 479 priv->mdev->dev->caps.dmfs_high_steer_mode == MLX4_STEERING_DMFS_A0_STATIC) 480 return 0; /* do nothing */ 481 482 err = mlx4_tunnel_steer_add(priv->mdev->dev, addr, priv->port, qpn, 483 MLX4_DOMAIN_NIC, reg_id); 484 if (err) { 485 en_err(priv, "failed to add vxlan steering rule, err %d\n", err); 486 return err; 487 } 488 en_dbg(DRV, priv, "added vxlan steering rule, mac %pM reg_id %llx\n", addr, *reg_id); 489 return 0; 490 } 491 492 493 static int mlx4_en_uc_steer_add(struct mlx4_en_priv *priv, 494 unsigned char *mac, int *qpn, u64 *reg_id) 495 { 496 struct mlx4_en_dev *mdev = priv->mdev; 497 struct mlx4_dev *dev = mdev->dev; 498 int err; 499 500 switch (dev->caps.steering_mode) { 501 case MLX4_STEERING_MODE_B0: { 502 struct mlx4_qp qp; 503 u8 gid[16] = {0}; 504 505 qp.qpn = *qpn; 506 memcpy(&gid[10], mac, ETH_ALEN); 507 gid[5] = priv->port; 508 509 err = mlx4_unicast_attach(dev, &qp, gid, 0, MLX4_PROT_ETH); 510 break; 511 } 512 case MLX4_STEERING_MODE_DEVICE_MANAGED: { 513 struct mlx4_spec_list spec_eth = { {NULL} }; 514 __be64 mac_mask = cpu_to_be64(MLX4_MAC_MASK << 16); 515 516 struct mlx4_net_trans_rule rule = { 517 .queue_mode = MLX4_NET_TRANS_Q_FIFO, 518 .exclusive = 0, 519 .allow_loopback = 1, 520 .promisc_mode = MLX4_FS_REGULAR, 521 .priority = MLX4_DOMAIN_NIC, 522 }; 523 524 rule.port = priv->port; 525 rule.qpn = *qpn; 526 INIT_LIST_HEAD(&rule.list); 527 528 spec_eth.id = MLX4_NET_TRANS_RULE_ID_ETH; 529 memcpy(spec_eth.eth.dst_mac, mac, ETH_ALEN); 530 memcpy(spec_eth.eth.dst_mac_msk, &mac_mask, ETH_ALEN); 531 list_add_tail(&spec_eth.list, &rule.list); 532 533 err = mlx4_flow_attach(dev, &rule, reg_id); 534 break; 535 } 536 default: 537 return -EINVAL; 538 } 539 if (err) 540 en_warn(priv, "Failed Attaching Unicast\n"); 541 542 return err; 543 } 544 545 static void mlx4_en_uc_steer_release(struct mlx4_en_priv *priv, 546 unsigned char *mac, int qpn, u64 reg_id) 547 { 548 struct mlx4_en_dev *mdev = priv->mdev; 549 struct mlx4_dev *dev = mdev->dev; 550 551 switch (dev->caps.steering_mode) { 552 case MLX4_STEERING_MODE_B0: { 553 struct mlx4_qp qp; 554 u8 gid[16] = {0}; 555 556 qp.qpn = qpn; 557 memcpy(&gid[10], mac, ETH_ALEN); 558 gid[5] = priv->port; 559 560 mlx4_unicast_detach(dev, &qp, gid, MLX4_PROT_ETH); 561 break; 562 } 563 case MLX4_STEERING_MODE_DEVICE_MANAGED: { 564 mlx4_flow_detach(dev, reg_id); 565 break; 566 } 567 default: 568 en_err(priv, "Invalid steering mode.\n"); 569 } 570 } 571 572 static int mlx4_en_get_qp(struct mlx4_en_priv *priv) 573 { 574 struct mlx4_en_dev *mdev = priv->mdev; 575 struct mlx4_dev *dev = mdev->dev; 576 struct mlx4_mac_entry *entry; 577 int index = 0; 578 int err = 0; 579 u64 reg_id = 0; 580 int *qpn = &priv->base_qpn; 581 u64 mac = mlx4_mac_to_u64(priv->dev->dev_addr); 582 583 en_dbg(DRV, priv, "Registering MAC: %pM for adding\n", 584 priv->dev->dev_addr); 585 index = mlx4_register_mac(dev, priv->port, mac); 586 if (index < 0) { 587 err = index; 588 en_err(priv, "Failed adding MAC: %pM\n", 589 priv->dev->dev_addr); 590 return err; 591 } 592 593 if (dev->caps.steering_mode == MLX4_STEERING_MODE_A0) { 594 int base_qpn = mlx4_get_base_qpn(dev, priv->port); 595 *qpn = base_qpn + index; 596 return 0; 597 } 598 599 err = mlx4_qp_reserve_range(dev, 1, 1, qpn, MLX4_RESERVE_A0_QP); 600 en_dbg(DRV, priv, "Reserved qp %d\n", *qpn); 601 if (err) { 602 en_err(priv, "Failed to reserve qp for mac registration\n"); 603 goto qp_err; 604 } 605 606 err = mlx4_en_uc_steer_add(priv, priv->dev->dev_addr, qpn, ®_id); 607 if (err) 608 goto steer_err; 609 610 err = mlx4_en_tunnel_steer_add(priv, priv->dev->dev_addr, *qpn, 611 &priv->tunnel_reg_id); 612 if (err) 613 goto tunnel_err; 614 615 entry = kmalloc(sizeof(*entry), GFP_KERNEL); 616 if (!entry) { 617 err = -ENOMEM; 618 goto alloc_err; 619 } 620 memcpy(entry->mac, priv->dev->dev_addr, sizeof(entry->mac)); 621 memcpy(priv->current_mac, entry->mac, sizeof(priv->current_mac)); 622 entry->reg_id = reg_id; 623 624 hlist_add_head_rcu(&entry->hlist, 625 &priv->mac_hash[entry->mac[MLX4_EN_MAC_HASH_IDX]]); 626 627 return 0; 628 629 alloc_err: 630 if (priv->tunnel_reg_id) 631 mlx4_flow_detach(priv->mdev->dev, priv->tunnel_reg_id); 632 tunnel_err: 633 mlx4_en_uc_steer_release(priv, priv->dev->dev_addr, *qpn, reg_id); 634 635 steer_err: 636 mlx4_qp_release_range(dev, *qpn, 1); 637 638 qp_err: 639 mlx4_unregister_mac(dev, priv->port, mac); 640 return err; 641 } 642 643 static void mlx4_en_put_qp(struct mlx4_en_priv *priv) 644 { 645 struct mlx4_en_dev *mdev = priv->mdev; 646 struct mlx4_dev *dev = mdev->dev; 647 int qpn = priv->base_qpn; 648 u64 mac; 649 650 if (dev->caps.steering_mode == MLX4_STEERING_MODE_A0) { 651 mac = mlx4_mac_to_u64(priv->dev->dev_addr); 652 en_dbg(DRV, priv, "Registering MAC: %pM for deleting\n", 653 priv->dev->dev_addr); 654 mlx4_unregister_mac(dev, priv->port, mac); 655 } else { 656 struct mlx4_mac_entry *entry; 657 struct hlist_node *tmp; 658 struct hlist_head *bucket; 659 unsigned int i; 660 661 for (i = 0; i < MLX4_EN_MAC_HASH_SIZE; ++i) { 662 bucket = &priv->mac_hash[i]; 663 hlist_for_each_entry_safe(entry, tmp, bucket, hlist) { 664 mac = mlx4_mac_to_u64(entry->mac); 665 en_dbg(DRV, priv, "Registering MAC: %pM for deleting\n", 666 entry->mac); 667 mlx4_en_uc_steer_release(priv, entry->mac, 668 qpn, entry->reg_id); 669 670 mlx4_unregister_mac(dev, priv->port, mac); 671 hlist_del_rcu(&entry->hlist); 672 kfree_rcu(entry, rcu); 673 } 674 } 675 676 if (priv->tunnel_reg_id) { 677 mlx4_flow_detach(priv->mdev->dev, priv->tunnel_reg_id); 678 priv->tunnel_reg_id = 0; 679 } 680 681 en_dbg(DRV, priv, "Releasing qp: port %d, qpn %d\n", 682 priv->port, qpn); 683 mlx4_qp_release_range(dev, qpn, 1); 684 priv->flags &= ~MLX4_EN_FLAG_FORCE_PROMISC; 685 } 686 } 687 688 static int mlx4_en_replace_mac(struct mlx4_en_priv *priv, int qpn, 689 unsigned char *new_mac, unsigned char *prev_mac) 690 { 691 struct mlx4_en_dev *mdev = priv->mdev; 692 struct mlx4_dev *dev = mdev->dev; 693 int err = 0; 694 u64 new_mac_u64 = mlx4_mac_to_u64(new_mac); 695 696 if (dev->caps.steering_mode != MLX4_STEERING_MODE_A0) { 697 struct hlist_head *bucket; 698 unsigned int mac_hash; 699 struct mlx4_mac_entry *entry; 700 struct hlist_node *tmp; 701 u64 prev_mac_u64 = mlx4_mac_to_u64(prev_mac); 702 703 bucket = &priv->mac_hash[prev_mac[MLX4_EN_MAC_HASH_IDX]]; 704 hlist_for_each_entry_safe(entry, tmp, bucket, hlist) { 705 if (ether_addr_equal_64bits(entry->mac, prev_mac)) { 706 mlx4_en_uc_steer_release(priv, entry->mac, 707 qpn, entry->reg_id); 708 mlx4_unregister_mac(dev, priv->port, 709 prev_mac_u64); 710 hlist_del_rcu(&entry->hlist); 711 synchronize_rcu(); 712 memcpy(entry->mac, new_mac, ETH_ALEN); 713 entry->reg_id = 0; 714 mac_hash = new_mac[MLX4_EN_MAC_HASH_IDX]; 715 hlist_add_head_rcu(&entry->hlist, 716 &priv->mac_hash[mac_hash]); 717 mlx4_register_mac(dev, priv->port, new_mac_u64); 718 err = mlx4_en_uc_steer_add(priv, new_mac, 719 &qpn, 720 &entry->reg_id); 721 if (err) 722 return err; 723 if (priv->tunnel_reg_id) { 724 mlx4_flow_detach(priv->mdev->dev, priv->tunnel_reg_id); 725 priv->tunnel_reg_id = 0; 726 } 727 err = mlx4_en_tunnel_steer_add(priv, new_mac, qpn, 728 &priv->tunnel_reg_id); 729 return err; 730 } 731 } 732 return -EINVAL; 733 } 734 735 return __mlx4_replace_mac(dev, priv->port, qpn, new_mac_u64); 736 } 737 738 static int mlx4_en_do_set_mac(struct mlx4_en_priv *priv, 739 unsigned char new_mac[ETH_ALEN + 2]) 740 { 741 int err = 0; 742 743 if (priv->port_up) { 744 /* Remove old MAC and insert the new one */ 745 err = mlx4_en_replace_mac(priv, priv->base_qpn, 746 new_mac, priv->current_mac); 747 if (err) 748 en_err(priv, "Failed changing HW MAC address\n"); 749 } else 750 en_dbg(HW, priv, "Port is down while registering mac, exiting...\n"); 751 752 if (!err) 753 memcpy(priv->current_mac, new_mac, sizeof(priv->current_mac)); 754 755 return err; 756 } 757 758 static int mlx4_en_set_mac(struct net_device *dev, void *addr) 759 { 760 struct mlx4_en_priv *priv = netdev_priv(dev); 761 struct mlx4_en_dev *mdev = priv->mdev; 762 struct sockaddr *saddr = addr; 763 unsigned char new_mac[ETH_ALEN + 2]; 764 int err; 765 766 if (!is_valid_ether_addr(saddr->sa_data)) 767 return -EADDRNOTAVAIL; 768 769 mutex_lock(&mdev->state_lock); 770 memcpy(new_mac, saddr->sa_data, ETH_ALEN); 771 err = mlx4_en_do_set_mac(priv, new_mac); 772 if (!err) 773 memcpy(dev->dev_addr, saddr->sa_data, ETH_ALEN); 774 mutex_unlock(&mdev->state_lock); 775 776 return err; 777 } 778 779 static void mlx4_en_clear_list(struct net_device *dev) 780 { 781 struct mlx4_en_priv *priv = netdev_priv(dev); 782 struct mlx4_en_mc_list *tmp, *mc_to_del; 783 784 list_for_each_entry_safe(mc_to_del, tmp, &priv->mc_list, list) { 785 list_del(&mc_to_del->list); 786 kfree(mc_to_del); 787 } 788 } 789 790 static void mlx4_en_cache_mclist(struct net_device *dev) 791 { 792 struct mlx4_en_priv *priv = netdev_priv(dev); 793 struct netdev_hw_addr *ha; 794 struct mlx4_en_mc_list *tmp; 795 796 mlx4_en_clear_list(dev); 797 netdev_for_each_mc_addr(ha, dev) { 798 tmp = kzalloc(sizeof(struct mlx4_en_mc_list), GFP_ATOMIC); 799 if (!tmp) { 800 mlx4_en_clear_list(dev); 801 return; 802 } 803 memcpy(tmp->addr, ha->addr, ETH_ALEN); 804 list_add_tail(&tmp->list, &priv->mc_list); 805 } 806 } 807 808 static void update_mclist_flags(struct mlx4_en_priv *priv, 809 struct list_head *dst, 810 struct list_head *src) 811 { 812 struct mlx4_en_mc_list *dst_tmp, *src_tmp, *new_mc; 813 bool found; 814 815 /* Find all the entries that should be removed from dst, 816 * These are the entries that are not found in src 817 */ 818 list_for_each_entry(dst_tmp, dst, list) { 819 found = false; 820 list_for_each_entry(src_tmp, src, list) { 821 if (ether_addr_equal(dst_tmp->addr, src_tmp->addr)) { 822 found = true; 823 break; 824 } 825 } 826 if (!found) 827 dst_tmp->action = MCLIST_REM; 828 } 829 830 /* Add entries that exist in src but not in dst 831 * mark them as need to add 832 */ 833 list_for_each_entry(src_tmp, src, list) { 834 found = false; 835 list_for_each_entry(dst_tmp, dst, list) { 836 if (ether_addr_equal(dst_tmp->addr, src_tmp->addr)) { 837 dst_tmp->action = MCLIST_NONE; 838 found = true; 839 break; 840 } 841 } 842 if (!found) { 843 new_mc = kmemdup(src_tmp, 844 sizeof(struct mlx4_en_mc_list), 845 GFP_KERNEL); 846 if (!new_mc) 847 return; 848 849 new_mc->action = MCLIST_ADD; 850 list_add_tail(&new_mc->list, dst); 851 } 852 } 853 } 854 855 static void mlx4_en_set_rx_mode(struct net_device *dev) 856 { 857 struct mlx4_en_priv *priv = netdev_priv(dev); 858 859 if (!priv->port_up) 860 return; 861 862 queue_work(priv->mdev->workqueue, &priv->rx_mode_task); 863 } 864 865 static void mlx4_en_set_promisc_mode(struct mlx4_en_priv *priv, 866 struct mlx4_en_dev *mdev) 867 { 868 int err = 0; 869 870 if (!(priv->flags & MLX4_EN_FLAG_PROMISC)) { 871 if (netif_msg_rx_status(priv)) 872 en_warn(priv, "Entering promiscuous mode\n"); 873 priv->flags |= MLX4_EN_FLAG_PROMISC; 874 875 /* Enable promiscouos mode */ 876 switch (mdev->dev->caps.steering_mode) { 877 case MLX4_STEERING_MODE_DEVICE_MANAGED: 878 err = mlx4_flow_steer_promisc_add(mdev->dev, 879 priv->port, 880 priv->base_qpn, 881 MLX4_FS_ALL_DEFAULT); 882 if (err) 883 en_err(priv, "Failed enabling promiscuous mode\n"); 884 priv->flags |= MLX4_EN_FLAG_MC_PROMISC; 885 break; 886 887 case MLX4_STEERING_MODE_B0: 888 err = mlx4_unicast_promisc_add(mdev->dev, 889 priv->base_qpn, 890 priv->port); 891 if (err) 892 en_err(priv, "Failed enabling unicast promiscuous mode\n"); 893 894 /* Add the default qp number as multicast 895 * promisc 896 */ 897 if (!(priv->flags & MLX4_EN_FLAG_MC_PROMISC)) { 898 err = mlx4_multicast_promisc_add(mdev->dev, 899 priv->base_qpn, 900 priv->port); 901 if (err) 902 en_err(priv, "Failed enabling multicast promiscuous mode\n"); 903 priv->flags |= MLX4_EN_FLAG_MC_PROMISC; 904 } 905 break; 906 907 case MLX4_STEERING_MODE_A0: 908 err = mlx4_SET_PORT_qpn_calc(mdev->dev, 909 priv->port, 910 priv->base_qpn, 911 1); 912 if (err) 913 en_err(priv, "Failed enabling promiscuous mode\n"); 914 break; 915 } 916 917 /* Disable port multicast filter (unconditionally) */ 918 err = mlx4_SET_MCAST_FLTR(mdev->dev, priv->port, 0, 919 0, MLX4_MCAST_DISABLE); 920 if (err) 921 en_err(priv, "Failed disabling multicast filter\n"); 922 } 923 } 924 925 static void mlx4_en_clear_promisc_mode(struct mlx4_en_priv *priv, 926 struct mlx4_en_dev *mdev) 927 { 928 int err = 0; 929 930 if (netif_msg_rx_status(priv)) 931 en_warn(priv, "Leaving promiscuous mode\n"); 932 priv->flags &= ~MLX4_EN_FLAG_PROMISC; 933 934 /* Disable promiscouos mode */ 935 switch (mdev->dev->caps.steering_mode) { 936 case MLX4_STEERING_MODE_DEVICE_MANAGED: 937 err = mlx4_flow_steer_promisc_remove(mdev->dev, 938 priv->port, 939 MLX4_FS_ALL_DEFAULT); 940 if (err) 941 en_err(priv, "Failed disabling promiscuous mode\n"); 942 priv->flags &= ~MLX4_EN_FLAG_MC_PROMISC; 943 break; 944 945 case MLX4_STEERING_MODE_B0: 946 err = mlx4_unicast_promisc_remove(mdev->dev, 947 priv->base_qpn, 948 priv->port); 949 if (err) 950 en_err(priv, "Failed disabling unicast promiscuous mode\n"); 951 /* Disable Multicast promisc */ 952 if (priv->flags & MLX4_EN_FLAG_MC_PROMISC) { 953 err = mlx4_multicast_promisc_remove(mdev->dev, 954 priv->base_qpn, 955 priv->port); 956 if (err) 957 en_err(priv, "Failed disabling multicast promiscuous mode\n"); 958 priv->flags &= ~MLX4_EN_FLAG_MC_PROMISC; 959 } 960 break; 961 962 case MLX4_STEERING_MODE_A0: 963 err = mlx4_SET_PORT_qpn_calc(mdev->dev, 964 priv->port, 965 priv->base_qpn, 0); 966 if (err) 967 en_err(priv, "Failed disabling promiscuous mode\n"); 968 break; 969 } 970 } 971 972 static void mlx4_en_do_multicast(struct mlx4_en_priv *priv, 973 struct net_device *dev, 974 struct mlx4_en_dev *mdev) 975 { 976 struct mlx4_en_mc_list *mclist, *tmp; 977 u64 mcast_addr = 0; 978 u8 mc_list[16] = {0}; 979 int err = 0; 980 981 /* Enable/disable the multicast filter according to IFF_ALLMULTI */ 982 if (dev->flags & IFF_ALLMULTI) { 983 err = mlx4_SET_MCAST_FLTR(mdev->dev, priv->port, 0, 984 0, MLX4_MCAST_DISABLE); 985 if (err) 986 en_err(priv, "Failed disabling multicast filter\n"); 987 988 /* Add the default qp number as multicast promisc */ 989 if (!(priv->flags & MLX4_EN_FLAG_MC_PROMISC)) { 990 switch (mdev->dev->caps.steering_mode) { 991 case MLX4_STEERING_MODE_DEVICE_MANAGED: 992 err = mlx4_flow_steer_promisc_add(mdev->dev, 993 priv->port, 994 priv->base_qpn, 995 MLX4_FS_MC_DEFAULT); 996 break; 997 998 case MLX4_STEERING_MODE_B0: 999 err = mlx4_multicast_promisc_add(mdev->dev, 1000 priv->base_qpn, 1001 priv->port); 1002 break; 1003 1004 case MLX4_STEERING_MODE_A0: 1005 break; 1006 } 1007 if (err) 1008 en_err(priv, "Failed entering multicast promisc mode\n"); 1009 priv->flags |= MLX4_EN_FLAG_MC_PROMISC; 1010 } 1011 } else { 1012 /* Disable Multicast promisc */ 1013 if (priv->flags & MLX4_EN_FLAG_MC_PROMISC) { 1014 switch (mdev->dev->caps.steering_mode) { 1015 case MLX4_STEERING_MODE_DEVICE_MANAGED: 1016 err = mlx4_flow_steer_promisc_remove(mdev->dev, 1017 priv->port, 1018 MLX4_FS_MC_DEFAULT); 1019 break; 1020 1021 case MLX4_STEERING_MODE_B0: 1022 err = mlx4_multicast_promisc_remove(mdev->dev, 1023 priv->base_qpn, 1024 priv->port); 1025 break; 1026 1027 case MLX4_STEERING_MODE_A0: 1028 break; 1029 } 1030 if (err) 1031 en_err(priv, "Failed disabling multicast promiscuous mode\n"); 1032 priv->flags &= ~MLX4_EN_FLAG_MC_PROMISC; 1033 } 1034 1035 err = mlx4_SET_MCAST_FLTR(mdev->dev, priv->port, 0, 1036 0, MLX4_MCAST_DISABLE); 1037 if (err) 1038 en_err(priv, "Failed disabling multicast filter\n"); 1039 1040 /* Flush mcast filter and init it with broadcast address */ 1041 mlx4_SET_MCAST_FLTR(mdev->dev, priv->port, ETH_BCAST, 1042 1, MLX4_MCAST_CONFIG); 1043 1044 /* Update multicast list - we cache all addresses so they won't 1045 * change while HW is updated holding the command semaphor */ 1046 netif_addr_lock_bh(dev); 1047 mlx4_en_cache_mclist(dev); 1048 netif_addr_unlock_bh(dev); 1049 list_for_each_entry(mclist, &priv->mc_list, list) { 1050 mcast_addr = mlx4_mac_to_u64(mclist->addr); 1051 mlx4_SET_MCAST_FLTR(mdev->dev, priv->port, 1052 mcast_addr, 0, MLX4_MCAST_CONFIG); 1053 } 1054 err = mlx4_SET_MCAST_FLTR(mdev->dev, priv->port, 0, 1055 0, MLX4_MCAST_ENABLE); 1056 if (err) 1057 en_err(priv, "Failed enabling multicast filter\n"); 1058 1059 update_mclist_flags(priv, &priv->curr_list, &priv->mc_list); 1060 list_for_each_entry_safe(mclist, tmp, &priv->curr_list, list) { 1061 if (mclist->action == MCLIST_REM) { 1062 /* detach this address and delete from list */ 1063 memcpy(&mc_list[10], mclist->addr, ETH_ALEN); 1064 mc_list[5] = priv->port; 1065 err = mlx4_multicast_detach(mdev->dev, 1066 &priv->rss_map.indir_qp, 1067 mc_list, 1068 MLX4_PROT_ETH, 1069 mclist->reg_id); 1070 if (err) 1071 en_err(priv, "Fail to detach multicast address\n"); 1072 1073 if (mclist->tunnel_reg_id) { 1074 err = mlx4_flow_detach(priv->mdev->dev, mclist->tunnel_reg_id); 1075 if (err) 1076 en_err(priv, "Failed to detach multicast address\n"); 1077 } 1078 1079 /* remove from list */ 1080 list_del(&mclist->list); 1081 kfree(mclist); 1082 } else if (mclist->action == MCLIST_ADD) { 1083 /* attach the address */ 1084 memcpy(&mc_list[10], mclist->addr, ETH_ALEN); 1085 /* needed for B0 steering support */ 1086 mc_list[5] = priv->port; 1087 err = mlx4_multicast_attach(mdev->dev, 1088 &priv->rss_map.indir_qp, 1089 mc_list, 1090 priv->port, 0, 1091 MLX4_PROT_ETH, 1092 &mclist->reg_id); 1093 if (err) 1094 en_err(priv, "Fail to attach multicast address\n"); 1095 1096 err = mlx4_en_tunnel_steer_add(priv, &mc_list[10], priv->base_qpn, 1097 &mclist->tunnel_reg_id); 1098 if (err) 1099 en_err(priv, "Failed to attach multicast address\n"); 1100 } 1101 } 1102 } 1103 } 1104 1105 static void mlx4_en_do_uc_filter(struct mlx4_en_priv *priv, 1106 struct net_device *dev, 1107 struct mlx4_en_dev *mdev) 1108 { 1109 struct netdev_hw_addr *ha; 1110 struct mlx4_mac_entry *entry; 1111 struct hlist_node *tmp; 1112 bool found; 1113 u64 mac; 1114 int err = 0; 1115 struct hlist_head *bucket; 1116 unsigned int i; 1117 int removed = 0; 1118 u32 prev_flags; 1119 1120 /* Note that we do not need to protect our mac_hash traversal with rcu, 1121 * since all modification code is protected by mdev->state_lock 1122 */ 1123 1124 /* find what to remove */ 1125 for (i = 0; i < MLX4_EN_MAC_HASH_SIZE; ++i) { 1126 bucket = &priv->mac_hash[i]; 1127 hlist_for_each_entry_safe(entry, tmp, bucket, hlist) { 1128 found = false; 1129 netdev_for_each_uc_addr(ha, dev) { 1130 if (ether_addr_equal_64bits(entry->mac, 1131 ha->addr)) { 1132 found = true; 1133 break; 1134 } 1135 } 1136 1137 /* MAC address of the port is not in uc list */ 1138 if (ether_addr_equal_64bits(entry->mac, 1139 priv->current_mac)) 1140 found = true; 1141 1142 if (!found) { 1143 mac = mlx4_mac_to_u64(entry->mac); 1144 mlx4_en_uc_steer_release(priv, entry->mac, 1145 priv->base_qpn, 1146 entry->reg_id); 1147 mlx4_unregister_mac(mdev->dev, priv->port, mac); 1148 1149 hlist_del_rcu(&entry->hlist); 1150 kfree_rcu(entry, rcu); 1151 en_dbg(DRV, priv, "Removed MAC %pM on port:%d\n", 1152 entry->mac, priv->port); 1153 ++removed; 1154 } 1155 } 1156 } 1157 1158 /* if we didn't remove anything, there is no use in trying to add 1159 * again once we are in a forced promisc mode state 1160 */ 1161 if ((priv->flags & MLX4_EN_FLAG_FORCE_PROMISC) && 0 == removed) 1162 return; 1163 1164 prev_flags = priv->flags; 1165 priv->flags &= ~MLX4_EN_FLAG_FORCE_PROMISC; 1166 1167 /* find what to add */ 1168 netdev_for_each_uc_addr(ha, dev) { 1169 found = false; 1170 bucket = &priv->mac_hash[ha->addr[MLX4_EN_MAC_HASH_IDX]]; 1171 hlist_for_each_entry(entry, bucket, hlist) { 1172 if (ether_addr_equal_64bits(entry->mac, ha->addr)) { 1173 found = true; 1174 break; 1175 } 1176 } 1177 1178 if (!found) { 1179 entry = kmalloc(sizeof(*entry), GFP_KERNEL); 1180 if (!entry) { 1181 en_err(priv, "Failed adding MAC %pM on port:%d (out of memory)\n", 1182 ha->addr, priv->port); 1183 priv->flags |= MLX4_EN_FLAG_FORCE_PROMISC; 1184 break; 1185 } 1186 mac = mlx4_mac_to_u64(ha->addr); 1187 memcpy(entry->mac, ha->addr, ETH_ALEN); 1188 err = mlx4_register_mac(mdev->dev, priv->port, mac); 1189 if (err < 0) { 1190 en_err(priv, "Failed registering MAC %pM on port %d: %d\n", 1191 ha->addr, priv->port, err); 1192 kfree(entry); 1193 priv->flags |= MLX4_EN_FLAG_FORCE_PROMISC; 1194 break; 1195 } 1196 err = mlx4_en_uc_steer_add(priv, ha->addr, 1197 &priv->base_qpn, 1198 &entry->reg_id); 1199 if (err) { 1200 en_err(priv, "Failed adding MAC %pM on port %d: %d\n", 1201 ha->addr, priv->port, err); 1202 mlx4_unregister_mac(mdev->dev, priv->port, mac); 1203 kfree(entry); 1204 priv->flags |= MLX4_EN_FLAG_FORCE_PROMISC; 1205 break; 1206 } else { 1207 unsigned int mac_hash; 1208 en_dbg(DRV, priv, "Added MAC %pM on port:%d\n", 1209 ha->addr, priv->port); 1210 mac_hash = ha->addr[MLX4_EN_MAC_HASH_IDX]; 1211 bucket = &priv->mac_hash[mac_hash]; 1212 hlist_add_head_rcu(&entry->hlist, bucket); 1213 } 1214 } 1215 } 1216 1217 if (priv->flags & MLX4_EN_FLAG_FORCE_PROMISC) { 1218 en_warn(priv, "Forcing promiscuous mode on port:%d\n", 1219 priv->port); 1220 } else if (prev_flags & MLX4_EN_FLAG_FORCE_PROMISC) { 1221 en_warn(priv, "Stop forcing promiscuous mode on port:%d\n", 1222 priv->port); 1223 } 1224 } 1225 1226 static void mlx4_en_do_set_rx_mode(struct work_struct *work) 1227 { 1228 struct mlx4_en_priv *priv = container_of(work, struct mlx4_en_priv, 1229 rx_mode_task); 1230 struct mlx4_en_dev *mdev = priv->mdev; 1231 struct net_device *dev = priv->dev; 1232 1233 mutex_lock(&mdev->state_lock); 1234 if (!mdev->device_up) { 1235 en_dbg(HW, priv, "Card is not up, ignoring rx mode change.\n"); 1236 goto out; 1237 } 1238 if (!priv->port_up) { 1239 en_dbg(HW, priv, "Port is down, ignoring rx mode change.\n"); 1240 goto out; 1241 } 1242 1243 if (!netif_carrier_ok(dev)) { 1244 if (!mlx4_en_QUERY_PORT(mdev, priv->port)) { 1245 if (priv->port_state.link_state) { 1246 priv->last_link_state = MLX4_DEV_EVENT_PORT_UP; 1247 netif_carrier_on(dev); 1248 en_dbg(LINK, priv, "Link Up\n"); 1249 } 1250 } 1251 } 1252 1253 if (dev->priv_flags & IFF_UNICAST_FLT) 1254 mlx4_en_do_uc_filter(priv, dev, mdev); 1255 1256 /* Promsicuous mode: disable all filters */ 1257 if ((dev->flags & IFF_PROMISC) || 1258 (priv->flags & MLX4_EN_FLAG_FORCE_PROMISC)) { 1259 mlx4_en_set_promisc_mode(priv, mdev); 1260 goto out; 1261 } 1262 1263 /* Not in promiscuous mode */ 1264 if (priv->flags & MLX4_EN_FLAG_PROMISC) 1265 mlx4_en_clear_promisc_mode(priv, mdev); 1266 1267 mlx4_en_do_multicast(priv, dev, mdev); 1268 out: 1269 mutex_unlock(&mdev->state_lock); 1270 } 1271 1272 #ifdef CONFIG_NET_POLL_CONTROLLER 1273 static void mlx4_en_netpoll(struct net_device *dev) 1274 { 1275 struct mlx4_en_priv *priv = netdev_priv(dev); 1276 struct mlx4_en_cq *cq; 1277 int i; 1278 1279 for (i = 0; i < priv->rx_ring_num; i++) { 1280 cq = priv->rx_cq[i]; 1281 napi_schedule(&cq->napi); 1282 } 1283 } 1284 #endif 1285 1286 static void mlx4_en_tx_timeout(struct net_device *dev) 1287 { 1288 struct mlx4_en_priv *priv = netdev_priv(dev); 1289 struct mlx4_en_dev *mdev = priv->mdev; 1290 int i; 1291 1292 if (netif_msg_timer(priv)) 1293 en_warn(priv, "Tx timeout called on port:%d\n", priv->port); 1294 1295 for (i = 0; i < priv->tx_ring_num; i++) { 1296 if (!netif_tx_queue_stopped(netdev_get_tx_queue(dev, i))) 1297 continue; 1298 en_warn(priv, "TX timeout on queue: %d, QP: 0x%x, CQ: 0x%x, Cons: 0x%x, Prod: 0x%x\n", 1299 i, priv->tx_ring[i]->qpn, priv->tx_ring[i]->cqn, 1300 priv->tx_ring[i]->cons, priv->tx_ring[i]->prod); 1301 } 1302 1303 priv->port_stats.tx_timeout++; 1304 en_dbg(DRV, priv, "Scheduling watchdog\n"); 1305 queue_work(mdev->workqueue, &priv->watchdog_task); 1306 } 1307 1308 1309 static struct net_device_stats *mlx4_en_get_stats(struct net_device *dev) 1310 { 1311 struct mlx4_en_priv *priv = netdev_priv(dev); 1312 1313 spin_lock_bh(&priv->stats_lock); 1314 memcpy(&priv->ret_stats, &priv->stats, sizeof(priv->stats)); 1315 spin_unlock_bh(&priv->stats_lock); 1316 1317 return &priv->ret_stats; 1318 } 1319 1320 static void mlx4_en_set_default_moderation(struct mlx4_en_priv *priv) 1321 { 1322 struct mlx4_en_cq *cq; 1323 int i; 1324 1325 /* If we haven't received a specific coalescing setting 1326 * (module param), we set the moderation parameters as follows: 1327 * - moder_cnt is set to the number of mtu sized packets to 1328 * satisfy our coalescing target. 1329 * - moder_time is set to a fixed value. 1330 */ 1331 priv->rx_frames = MLX4_EN_RX_COAL_TARGET; 1332 priv->rx_usecs = MLX4_EN_RX_COAL_TIME; 1333 priv->tx_frames = MLX4_EN_TX_COAL_PKTS; 1334 priv->tx_usecs = MLX4_EN_TX_COAL_TIME; 1335 en_dbg(INTR, priv, "Default coalesing params for mtu:%d - rx_frames:%d rx_usecs:%d\n", 1336 priv->dev->mtu, priv->rx_frames, priv->rx_usecs); 1337 1338 /* Setup cq moderation params */ 1339 for (i = 0; i < priv->rx_ring_num; i++) { 1340 cq = priv->rx_cq[i]; 1341 cq->moder_cnt = priv->rx_frames; 1342 cq->moder_time = priv->rx_usecs; 1343 priv->last_moder_time[i] = MLX4_EN_AUTO_CONF; 1344 priv->last_moder_packets[i] = 0; 1345 priv->last_moder_bytes[i] = 0; 1346 } 1347 1348 for (i = 0; i < priv->tx_ring_num; i++) { 1349 cq = priv->tx_cq[i]; 1350 cq->moder_cnt = priv->tx_frames; 1351 cq->moder_time = priv->tx_usecs; 1352 } 1353 1354 /* Reset auto-moderation params */ 1355 priv->pkt_rate_low = MLX4_EN_RX_RATE_LOW; 1356 priv->rx_usecs_low = MLX4_EN_RX_COAL_TIME_LOW; 1357 priv->pkt_rate_high = MLX4_EN_RX_RATE_HIGH; 1358 priv->rx_usecs_high = MLX4_EN_RX_COAL_TIME_HIGH; 1359 priv->sample_interval = MLX4_EN_SAMPLE_INTERVAL; 1360 priv->adaptive_rx_coal = 1; 1361 priv->last_moder_jiffies = 0; 1362 priv->last_moder_tx_packets = 0; 1363 } 1364 1365 static void mlx4_en_auto_moderation(struct mlx4_en_priv *priv) 1366 { 1367 unsigned long period = (unsigned long) (jiffies - priv->last_moder_jiffies); 1368 struct mlx4_en_cq *cq; 1369 unsigned long packets; 1370 unsigned long rate; 1371 unsigned long avg_pkt_size; 1372 unsigned long rx_packets; 1373 unsigned long rx_bytes; 1374 unsigned long rx_pkt_diff; 1375 int moder_time; 1376 int ring, err; 1377 1378 if (!priv->adaptive_rx_coal || period < priv->sample_interval * HZ) 1379 return; 1380 1381 for (ring = 0; ring < priv->rx_ring_num; ring++) { 1382 spin_lock_bh(&priv->stats_lock); 1383 rx_packets = priv->rx_ring[ring]->packets; 1384 rx_bytes = priv->rx_ring[ring]->bytes; 1385 spin_unlock_bh(&priv->stats_lock); 1386 1387 rx_pkt_diff = ((unsigned long) (rx_packets - 1388 priv->last_moder_packets[ring])); 1389 packets = rx_pkt_diff; 1390 rate = packets * HZ / period; 1391 avg_pkt_size = packets ? ((unsigned long) (rx_bytes - 1392 priv->last_moder_bytes[ring])) / packets : 0; 1393 1394 /* Apply auto-moderation only when packet rate 1395 * exceeds a rate that it matters */ 1396 if (rate > (MLX4_EN_RX_RATE_THRESH / priv->rx_ring_num) && 1397 avg_pkt_size > MLX4_EN_AVG_PKT_SMALL) { 1398 if (rate < priv->pkt_rate_low) 1399 moder_time = priv->rx_usecs_low; 1400 else if (rate > priv->pkt_rate_high) 1401 moder_time = priv->rx_usecs_high; 1402 else 1403 moder_time = (rate - priv->pkt_rate_low) * 1404 (priv->rx_usecs_high - priv->rx_usecs_low) / 1405 (priv->pkt_rate_high - priv->pkt_rate_low) + 1406 priv->rx_usecs_low; 1407 } else { 1408 moder_time = priv->rx_usecs_low; 1409 } 1410 1411 if (moder_time != priv->last_moder_time[ring]) { 1412 priv->last_moder_time[ring] = moder_time; 1413 cq = priv->rx_cq[ring]; 1414 cq->moder_time = moder_time; 1415 cq->moder_cnt = priv->rx_frames; 1416 err = mlx4_en_set_cq_moder(priv, cq); 1417 if (err) 1418 en_err(priv, "Failed modifying moderation for cq:%d\n", 1419 ring); 1420 } 1421 priv->last_moder_packets[ring] = rx_packets; 1422 priv->last_moder_bytes[ring] = rx_bytes; 1423 } 1424 1425 priv->last_moder_jiffies = jiffies; 1426 } 1427 1428 static void mlx4_en_do_get_stats(struct work_struct *work) 1429 { 1430 struct delayed_work *delay = to_delayed_work(work); 1431 struct mlx4_en_priv *priv = container_of(delay, struct mlx4_en_priv, 1432 stats_task); 1433 struct mlx4_en_dev *mdev = priv->mdev; 1434 int err; 1435 1436 mutex_lock(&mdev->state_lock); 1437 if (mdev->device_up) { 1438 if (priv->port_up) { 1439 err = mlx4_en_DUMP_ETH_STATS(mdev, priv->port, 0); 1440 if (err) 1441 en_dbg(HW, priv, "Could not update stats\n"); 1442 1443 mlx4_en_auto_moderation(priv); 1444 } 1445 1446 queue_delayed_work(mdev->workqueue, &priv->stats_task, STATS_DELAY); 1447 } 1448 if (mdev->mac_removed[MLX4_MAX_PORTS + 1 - priv->port]) { 1449 mlx4_en_do_set_mac(priv, priv->current_mac); 1450 mdev->mac_removed[MLX4_MAX_PORTS + 1 - priv->port] = 0; 1451 } 1452 mutex_unlock(&mdev->state_lock); 1453 } 1454 1455 /* mlx4_en_service_task - Run service task for tasks that needed to be done 1456 * periodically 1457 */ 1458 static void mlx4_en_service_task(struct work_struct *work) 1459 { 1460 struct delayed_work *delay = to_delayed_work(work); 1461 struct mlx4_en_priv *priv = container_of(delay, struct mlx4_en_priv, 1462 service_task); 1463 struct mlx4_en_dev *mdev = priv->mdev; 1464 1465 mutex_lock(&mdev->state_lock); 1466 if (mdev->device_up) { 1467 if (mdev->dev->caps.flags2 & MLX4_DEV_CAP_FLAG2_TS) 1468 mlx4_en_ptp_overflow_check(mdev); 1469 1470 queue_delayed_work(mdev->workqueue, &priv->service_task, 1471 SERVICE_TASK_DELAY); 1472 } 1473 mutex_unlock(&mdev->state_lock); 1474 } 1475 1476 static void mlx4_en_linkstate(struct work_struct *work) 1477 { 1478 struct mlx4_en_priv *priv = container_of(work, struct mlx4_en_priv, 1479 linkstate_task); 1480 struct mlx4_en_dev *mdev = priv->mdev; 1481 int linkstate = priv->link_state; 1482 1483 mutex_lock(&mdev->state_lock); 1484 /* If observable port state changed set carrier state and 1485 * report to system log */ 1486 if (priv->last_link_state != linkstate) { 1487 if (linkstate == MLX4_DEV_EVENT_PORT_DOWN) { 1488 en_info(priv, "Link Down\n"); 1489 netif_carrier_off(priv->dev); 1490 } else { 1491 en_info(priv, "Link Up\n"); 1492 netif_carrier_on(priv->dev); 1493 } 1494 } 1495 priv->last_link_state = linkstate; 1496 mutex_unlock(&mdev->state_lock); 1497 } 1498 1499 static int mlx4_en_init_affinity_hint(struct mlx4_en_priv *priv, int ring_idx) 1500 { 1501 struct mlx4_en_rx_ring *ring = priv->rx_ring[ring_idx]; 1502 int numa_node = priv->mdev->dev->numa_node; 1503 int ret = 0; 1504 1505 if (!zalloc_cpumask_var(&ring->affinity_mask, GFP_KERNEL)) 1506 return -ENOMEM; 1507 1508 ret = cpumask_set_cpu_local_first(ring_idx, numa_node, 1509 ring->affinity_mask); 1510 if (ret) 1511 free_cpumask_var(ring->affinity_mask); 1512 1513 return ret; 1514 } 1515 1516 static void mlx4_en_free_affinity_hint(struct mlx4_en_priv *priv, int ring_idx) 1517 { 1518 free_cpumask_var(priv->rx_ring[ring_idx]->affinity_mask); 1519 } 1520 1521 int mlx4_en_start_port(struct net_device *dev) 1522 { 1523 struct mlx4_en_priv *priv = netdev_priv(dev); 1524 struct mlx4_en_dev *mdev = priv->mdev; 1525 struct mlx4_en_cq *cq; 1526 struct mlx4_en_tx_ring *tx_ring; 1527 int rx_index = 0; 1528 int tx_index = 0; 1529 int err = 0; 1530 int i; 1531 int j; 1532 u8 mc_list[16] = {0}; 1533 1534 if (priv->port_up) { 1535 en_dbg(DRV, priv, "start port called while port already up\n"); 1536 return 0; 1537 } 1538 1539 INIT_LIST_HEAD(&priv->mc_list); 1540 INIT_LIST_HEAD(&priv->curr_list); 1541 INIT_LIST_HEAD(&priv->ethtool_list); 1542 memset(&priv->ethtool_rules[0], 0, 1543 sizeof(struct ethtool_flow_id) * MAX_NUM_OF_FS_RULES); 1544 1545 /* Calculate Rx buf size */ 1546 dev->mtu = min(dev->mtu, priv->max_mtu); 1547 mlx4_en_calc_rx_buf(dev); 1548 en_dbg(DRV, priv, "Rx buf size:%d\n", priv->rx_skb_size); 1549 1550 /* Configure rx cq's and rings */ 1551 err = mlx4_en_activate_rx_rings(priv); 1552 if (err) { 1553 en_err(priv, "Failed to activate RX rings\n"); 1554 return err; 1555 } 1556 for (i = 0; i < priv->rx_ring_num; i++) { 1557 cq = priv->rx_cq[i]; 1558 1559 mlx4_en_cq_init_lock(cq); 1560 1561 err = mlx4_en_init_affinity_hint(priv, i); 1562 if (err) { 1563 en_err(priv, "Failed preparing IRQ affinity hint\n"); 1564 goto cq_err; 1565 } 1566 1567 err = mlx4_en_activate_cq(priv, cq, i); 1568 if (err) { 1569 en_err(priv, "Failed activating Rx CQ\n"); 1570 mlx4_en_free_affinity_hint(priv, i); 1571 goto cq_err; 1572 } 1573 1574 for (j = 0; j < cq->size; j++) { 1575 struct mlx4_cqe *cqe = NULL; 1576 1577 cqe = mlx4_en_get_cqe(cq->buf, j, priv->cqe_size) + 1578 priv->cqe_factor; 1579 cqe->owner_sr_opcode = MLX4_CQE_OWNER_MASK; 1580 } 1581 1582 err = mlx4_en_set_cq_moder(priv, cq); 1583 if (err) { 1584 en_err(priv, "Failed setting cq moderation parameters\n"); 1585 mlx4_en_deactivate_cq(priv, cq); 1586 mlx4_en_free_affinity_hint(priv, i); 1587 goto cq_err; 1588 } 1589 mlx4_en_arm_cq(priv, cq); 1590 priv->rx_ring[i]->cqn = cq->mcq.cqn; 1591 ++rx_index; 1592 } 1593 1594 /* Set qp number */ 1595 en_dbg(DRV, priv, "Getting qp number for port %d\n", priv->port); 1596 err = mlx4_en_get_qp(priv); 1597 if (err) { 1598 en_err(priv, "Failed getting eth qp\n"); 1599 goto cq_err; 1600 } 1601 mdev->mac_removed[priv->port] = 0; 1602 1603 err = mlx4_en_config_rss_steer(priv); 1604 if (err) { 1605 en_err(priv, "Failed configuring rss steering\n"); 1606 goto mac_err; 1607 } 1608 1609 err = mlx4_en_create_drop_qp(priv); 1610 if (err) 1611 goto rss_err; 1612 1613 /* Configure tx cq's and rings */ 1614 for (i = 0; i < priv->tx_ring_num; i++) { 1615 /* Configure cq */ 1616 cq = priv->tx_cq[i]; 1617 err = mlx4_en_activate_cq(priv, cq, i); 1618 if (err) { 1619 en_err(priv, "Failed allocating Tx CQ\n"); 1620 goto tx_err; 1621 } 1622 err = mlx4_en_set_cq_moder(priv, cq); 1623 if (err) { 1624 en_err(priv, "Failed setting cq moderation parameters\n"); 1625 mlx4_en_deactivate_cq(priv, cq); 1626 goto tx_err; 1627 } 1628 en_dbg(DRV, priv, "Resetting index of collapsed CQ:%d to -1\n", i); 1629 cq->buf->wqe_index = cpu_to_be16(0xffff); 1630 1631 /* Configure ring */ 1632 tx_ring = priv->tx_ring[i]; 1633 err = mlx4_en_activate_tx_ring(priv, tx_ring, cq->mcq.cqn, 1634 i / priv->num_tx_rings_p_up); 1635 if (err) { 1636 en_err(priv, "Failed allocating Tx ring\n"); 1637 mlx4_en_deactivate_cq(priv, cq); 1638 goto tx_err; 1639 } 1640 tx_ring->tx_queue = netdev_get_tx_queue(dev, i); 1641 1642 /* Arm CQ for TX completions */ 1643 mlx4_en_arm_cq(priv, cq); 1644 1645 /* Set initial ownership of all Tx TXBBs to SW (1) */ 1646 for (j = 0; j < tx_ring->buf_size; j += STAMP_STRIDE) 1647 *((u32 *) (tx_ring->buf + j)) = 0xffffffff; 1648 ++tx_index; 1649 } 1650 1651 /* Configure port */ 1652 err = mlx4_SET_PORT_general(mdev->dev, priv->port, 1653 priv->rx_skb_size + ETH_FCS_LEN, 1654 priv->prof->tx_pause, 1655 priv->prof->tx_ppp, 1656 priv->prof->rx_pause, 1657 priv->prof->rx_ppp); 1658 if (err) { 1659 en_err(priv, "Failed setting port general configurations for port %d, with error %d\n", 1660 priv->port, err); 1661 goto tx_err; 1662 } 1663 /* Set default qp number */ 1664 err = mlx4_SET_PORT_qpn_calc(mdev->dev, priv->port, priv->base_qpn, 0); 1665 if (err) { 1666 en_err(priv, "Failed setting default qp numbers\n"); 1667 goto tx_err; 1668 } 1669 1670 if (mdev->dev->caps.tunnel_offload_mode == MLX4_TUNNEL_OFFLOAD_MODE_VXLAN) { 1671 err = mlx4_SET_PORT_VXLAN(mdev->dev, priv->port, VXLAN_STEER_BY_OUTER_MAC, 1); 1672 if (err) { 1673 en_err(priv, "Failed setting port L2 tunnel configuration, err %d\n", 1674 err); 1675 goto tx_err; 1676 } 1677 } 1678 1679 /* Init port */ 1680 en_dbg(HW, priv, "Initializing port\n"); 1681 err = mlx4_INIT_PORT(mdev->dev, priv->port); 1682 if (err) { 1683 en_err(priv, "Failed Initializing port\n"); 1684 goto tx_err; 1685 } 1686 1687 /* Attach rx QP to bradcast address */ 1688 memset(&mc_list[10], 0xff, ETH_ALEN); 1689 mc_list[5] = priv->port; /* needed for B0 steering support */ 1690 if (mlx4_multicast_attach(mdev->dev, &priv->rss_map.indir_qp, mc_list, 1691 priv->port, 0, MLX4_PROT_ETH, 1692 &priv->broadcast_id)) 1693 mlx4_warn(mdev, "Failed Attaching Broadcast\n"); 1694 1695 /* Must redo promiscuous mode setup. */ 1696 priv->flags &= ~(MLX4_EN_FLAG_PROMISC | MLX4_EN_FLAG_MC_PROMISC); 1697 1698 /* Schedule multicast task to populate multicast list */ 1699 queue_work(mdev->workqueue, &priv->rx_mode_task); 1700 1701 #ifdef CONFIG_MLX4_EN_VXLAN 1702 if (priv->mdev->dev->caps.tunnel_offload_mode == MLX4_TUNNEL_OFFLOAD_MODE_VXLAN) 1703 vxlan_get_rx_port(dev); 1704 #endif 1705 priv->port_up = true; 1706 netif_tx_start_all_queues(dev); 1707 netif_device_attach(dev); 1708 1709 return 0; 1710 1711 tx_err: 1712 while (tx_index--) { 1713 mlx4_en_deactivate_tx_ring(priv, priv->tx_ring[tx_index]); 1714 mlx4_en_deactivate_cq(priv, priv->tx_cq[tx_index]); 1715 } 1716 mlx4_en_destroy_drop_qp(priv); 1717 rss_err: 1718 mlx4_en_release_rss_steer(priv); 1719 mac_err: 1720 mlx4_en_put_qp(priv); 1721 cq_err: 1722 while (rx_index--) { 1723 mlx4_en_deactivate_cq(priv, priv->rx_cq[rx_index]); 1724 mlx4_en_free_affinity_hint(priv, i); 1725 } 1726 for (i = 0; i < priv->rx_ring_num; i++) 1727 mlx4_en_deactivate_rx_ring(priv, priv->rx_ring[i]); 1728 1729 return err; /* need to close devices */ 1730 } 1731 1732 1733 void mlx4_en_stop_port(struct net_device *dev, int detach) 1734 { 1735 struct mlx4_en_priv *priv = netdev_priv(dev); 1736 struct mlx4_en_dev *mdev = priv->mdev; 1737 struct mlx4_en_mc_list *mclist, *tmp; 1738 struct ethtool_flow_id *flow, *tmp_flow; 1739 int i; 1740 u8 mc_list[16] = {0}; 1741 1742 if (!priv->port_up) { 1743 en_dbg(DRV, priv, "stop port called while port already down\n"); 1744 return; 1745 } 1746 1747 /* close port*/ 1748 mlx4_CLOSE_PORT(mdev->dev, priv->port); 1749 1750 /* Synchronize with tx routine */ 1751 netif_tx_lock_bh(dev); 1752 if (detach) 1753 netif_device_detach(dev); 1754 netif_tx_stop_all_queues(dev); 1755 netif_tx_unlock_bh(dev); 1756 1757 netif_tx_disable(dev); 1758 1759 /* Set port as not active */ 1760 priv->port_up = false; 1761 1762 /* Promsicuous mode */ 1763 if (mdev->dev->caps.steering_mode == 1764 MLX4_STEERING_MODE_DEVICE_MANAGED) { 1765 priv->flags &= ~(MLX4_EN_FLAG_PROMISC | 1766 MLX4_EN_FLAG_MC_PROMISC); 1767 mlx4_flow_steer_promisc_remove(mdev->dev, 1768 priv->port, 1769 MLX4_FS_ALL_DEFAULT); 1770 mlx4_flow_steer_promisc_remove(mdev->dev, 1771 priv->port, 1772 MLX4_FS_MC_DEFAULT); 1773 } else if (priv->flags & MLX4_EN_FLAG_PROMISC) { 1774 priv->flags &= ~MLX4_EN_FLAG_PROMISC; 1775 1776 /* Disable promiscouos mode */ 1777 mlx4_unicast_promisc_remove(mdev->dev, priv->base_qpn, 1778 priv->port); 1779 1780 /* Disable Multicast promisc */ 1781 if (priv->flags & MLX4_EN_FLAG_MC_PROMISC) { 1782 mlx4_multicast_promisc_remove(mdev->dev, priv->base_qpn, 1783 priv->port); 1784 priv->flags &= ~MLX4_EN_FLAG_MC_PROMISC; 1785 } 1786 } 1787 1788 /* Detach All multicasts */ 1789 memset(&mc_list[10], 0xff, ETH_ALEN); 1790 mc_list[5] = priv->port; /* needed for B0 steering support */ 1791 mlx4_multicast_detach(mdev->dev, &priv->rss_map.indir_qp, mc_list, 1792 MLX4_PROT_ETH, priv->broadcast_id); 1793 list_for_each_entry(mclist, &priv->curr_list, list) { 1794 memcpy(&mc_list[10], mclist->addr, ETH_ALEN); 1795 mc_list[5] = priv->port; 1796 mlx4_multicast_detach(mdev->dev, &priv->rss_map.indir_qp, 1797 mc_list, MLX4_PROT_ETH, mclist->reg_id); 1798 if (mclist->tunnel_reg_id) 1799 mlx4_flow_detach(mdev->dev, mclist->tunnel_reg_id); 1800 } 1801 mlx4_en_clear_list(dev); 1802 list_for_each_entry_safe(mclist, tmp, &priv->curr_list, list) { 1803 list_del(&mclist->list); 1804 kfree(mclist); 1805 } 1806 1807 /* Flush multicast filter */ 1808 mlx4_SET_MCAST_FLTR(mdev->dev, priv->port, 0, 1, MLX4_MCAST_CONFIG); 1809 1810 /* Remove flow steering rules for the port*/ 1811 if (mdev->dev->caps.steering_mode == 1812 MLX4_STEERING_MODE_DEVICE_MANAGED) { 1813 ASSERT_RTNL(); 1814 list_for_each_entry_safe(flow, tmp_flow, 1815 &priv->ethtool_list, list) { 1816 mlx4_flow_detach(mdev->dev, flow->id); 1817 list_del(&flow->list); 1818 } 1819 } 1820 1821 mlx4_en_destroy_drop_qp(priv); 1822 1823 /* Free TX Rings */ 1824 for (i = 0; i < priv->tx_ring_num; i++) { 1825 mlx4_en_deactivate_tx_ring(priv, priv->tx_ring[i]); 1826 mlx4_en_deactivate_cq(priv, priv->tx_cq[i]); 1827 } 1828 msleep(10); 1829 1830 for (i = 0; i < priv->tx_ring_num; i++) 1831 mlx4_en_free_tx_buf(dev, priv->tx_ring[i]); 1832 1833 /* Free RSS qps */ 1834 mlx4_en_release_rss_steer(priv); 1835 1836 /* Unregister Mac address for the port */ 1837 mlx4_en_put_qp(priv); 1838 if (!(mdev->dev->caps.flags2 & MLX4_DEV_CAP_FLAG2_REASSIGN_MAC_EN)) 1839 mdev->mac_removed[priv->port] = 1; 1840 1841 /* Free RX Rings */ 1842 for (i = 0; i < priv->rx_ring_num; i++) { 1843 struct mlx4_en_cq *cq = priv->rx_cq[i]; 1844 1845 local_bh_disable(); 1846 while (!mlx4_en_cq_lock_napi(cq)) { 1847 pr_info("CQ %d locked\n", i); 1848 mdelay(1); 1849 } 1850 local_bh_enable(); 1851 1852 napi_synchronize(&cq->napi); 1853 mlx4_en_deactivate_rx_ring(priv, priv->rx_ring[i]); 1854 mlx4_en_deactivate_cq(priv, cq); 1855 1856 mlx4_en_free_affinity_hint(priv, i); 1857 } 1858 } 1859 1860 static void mlx4_en_restart(struct work_struct *work) 1861 { 1862 struct mlx4_en_priv *priv = container_of(work, struct mlx4_en_priv, 1863 watchdog_task); 1864 struct mlx4_en_dev *mdev = priv->mdev; 1865 struct net_device *dev = priv->dev; 1866 1867 en_dbg(DRV, priv, "Watchdog task called for port %d\n", priv->port); 1868 1869 mutex_lock(&mdev->state_lock); 1870 if (priv->port_up) { 1871 mlx4_en_stop_port(dev, 1); 1872 if (mlx4_en_start_port(dev)) 1873 en_err(priv, "Failed restarting port %d\n", priv->port); 1874 } 1875 mutex_unlock(&mdev->state_lock); 1876 } 1877 1878 static void mlx4_en_clear_stats(struct net_device *dev) 1879 { 1880 struct mlx4_en_priv *priv = netdev_priv(dev); 1881 struct mlx4_en_dev *mdev = priv->mdev; 1882 int i; 1883 1884 if (mlx4_en_DUMP_ETH_STATS(mdev, priv->port, 1)) 1885 en_dbg(HW, priv, "Failed dumping statistics\n"); 1886 1887 memset(&priv->stats, 0, sizeof(priv->stats)); 1888 memset(&priv->pstats, 0, sizeof(priv->pstats)); 1889 memset(&priv->pkstats, 0, sizeof(priv->pkstats)); 1890 memset(&priv->port_stats, 0, sizeof(priv->port_stats)); 1891 1892 for (i = 0; i < priv->tx_ring_num; i++) { 1893 priv->tx_ring[i]->bytes = 0; 1894 priv->tx_ring[i]->packets = 0; 1895 priv->tx_ring[i]->tx_csum = 0; 1896 } 1897 for (i = 0; i < priv->rx_ring_num; i++) { 1898 priv->rx_ring[i]->bytes = 0; 1899 priv->rx_ring[i]->packets = 0; 1900 priv->rx_ring[i]->csum_ok = 0; 1901 priv->rx_ring[i]->csum_none = 0; 1902 priv->rx_ring[i]->csum_complete = 0; 1903 } 1904 } 1905 1906 static int mlx4_en_open(struct net_device *dev) 1907 { 1908 struct mlx4_en_priv *priv = netdev_priv(dev); 1909 struct mlx4_en_dev *mdev = priv->mdev; 1910 int err = 0; 1911 1912 mutex_lock(&mdev->state_lock); 1913 1914 if (!mdev->device_up) { 1915 en_err(priv, "Cannot open - device down/disabled\n"); 1916 err = -EBUSY; 1917 goto out; 1918 } 1919 1920 /* Reset HW statistics and SW counters */ 1921 mlx4_en_clear_stats(dev); 1922 1923 err = mlx4_en_start_port(dev); 1924 if (err) 1925 en_err(priv, "Failed starting port:%d\n", priv->port); 1926 1927 out: 1928 mutex_unlock(&mdev->state_lock); 1929 return err; 1930 } 1931 1932 1933 static int mlx4_en_close(struct net_device *dev) 1934 { 1935 struct mlx4_en_priv *priv = netdev_priv(dev); 1936 struct mlx4_en_dev *mdev = priv->mdev; 1937 1938 en_dbg(IFDOWN, priv, "Close port called\n"); 1939 1940 mutex_lock(&mdev->state_lock); 1941 1942 mlx4_en_stop_port(dev, 0); 1943 netif_carrier_off(dev); 1944 1945 mutex_unlock(&mdev->state_lock); 1946 return 0; 1947 } 1948 1949 void mlx4_en_free_resources(struct mlx4_en_priv *priv) 1950 { 1951 int i; 1952 1953 #ifdef CONFIG_RFS_ACCEL 1954 free_irq_cpu_rmap(priv->dev->rx_cpu_rmap); 1955 priv->dev->rx_cpu_rmap = NULL; 1956 #endif 1957 1958 for (i = 0; i < priv->tx_ring_num; i++) { 1959 if (priv->tx_ring && priv->tx_ring[i]) 1960 mlx4_en_destroy_tx_ring(priv, &priv->tx_ring[i]); 1961 if (priv->tx_cq && priv->tx_cq[i]) 1962 mlx4_en_destroy_cq(priv, &priv->tx_cq[i]); 1963 } 1964 1965 for (i = 0; i < priv->rx_ring_num; i++) { 1966 if (priv->rx_ring[i]) 1967 mlx4_en_destroy_rx_ring(priv, &priv->rx_ring[i], 1968 priv->prof->rx_ring_size, priv->stride); 1969 if (priv->rx_cq[i]) 1970 mlx4_en_destroy_cq(priv, &priv->rx_cq[i]); 1971 } 1972 1973 if (priv->base_tx_qpn) { 1974 mlx4_qp_release_range(priv->mdev->dev, priv->base_tx_qpn, priv->tx_ring_num); 1975 priv->base_tx_qpn = 0; 1976 } 1977 } 1978 1979 int mlx4_en_alloc_resources(struct mlx4_en_priv *priv) 1980 { 1981 struct mlx4_en_port_profile *prof = priv->prof; 1982 int i; 1983 int node; 1984 1985 /* Create tx Rings */ 1986 for (i = 0; i < priv->tx_ring_num; i++) { 1987 node = cpu_to_node(i % num_online_cpus()); 1988 if (mlx4_en_create_cq(priv, &priv->tx_cq[i], 1989 prof->tx_ring_size, i, TX, node)) 1990 goto err; 1991 1992 if (mlx4_en_create_tx_ring(priv, &priv->tx_ring[i], 1993 prof->tx_ring_size, TXBB_SIZE, 1994 node, i)) 1995 goto err; 1996 } 1997 1998 /* Create rx Rings */ 1999 for (i = 0; i < priv->rx_ring_num; i++) { 2000 node = cpu_to_node(i % num_online_cpus()); 2001 if (mlx4_en_create_cq(priv, &priv->rx_cq[i], 2002 prof->rx_ring_size, i, RX, node)) 2003 goto err; 2004 2005 if (mlx4_en_create_rx_ring(priv, &priv->rx_ring[i], 2006 prof->rx_ring_size, priv->stride, 2007 node)) 2008 goto err; 2009 } 2010 2011 #ifdef CONFIG_RFS_ACCEL 2012 if (priv->mdev->dev->caps.comp_pool) { 2013 priv->dev->rx_cpu_rmap = alloc_irq_cpu_rmap(priv->mdev->dev->caps.comp_pool); 2014 if (!priv->dev->rx_cpu_rmap) 2015 goto err; 2016 } 2017 #endif 2018 2019 return 0; 2020 2021 err: 2022 en_err(priv, "Failed to allocate NIC resources\n"); 2023 for (i = 0; i < priv->rx_ring_num; i++) { 2024 if (priv->rx_ring[i]) 2025 mlx4_en_destroy_rx_ring(priv, &priv->rx_ring[i], 2026 prof->rx_ring_size, 2027 priv->stride); 2028 if (priv->rx_cq[i]) 2029 mlx4_en_destroy_cq(priv, &priv->rx_cq[i]); 2030 } 2031 for (i = 0; i < priv->tx_ring_num; i++) { 2032 if (priv->tx_ring[i]) 2033 mlx4_en_destroy_tx_ring(priv, &priv->tx_ring[i]); 2034 if (priv->tx_cq[i]) 2035 mlx4_en_destroy_cq(priv, &priv->tx_cq[i]); 2036 } 2037 return -ENOMEM; 2038 } 2039 2040 2041 void mlx4_en_destroy_netdev(struct net_device *dev) 2042 { 2043 struct mlx4_en_priv *priv = netdev_priv(dev); 2044 struct mlx4_en_dev *mdev = priv->mdev; 2045 2046 en_dbg(DRV, priv, "Destroying netdev on port:%d\n", priv->port); 2047 2048 /* Unregister device - this will close the port if it was up */ 2049 if (priv->registered) 2050 unregister_netdev(dev); 2051 2052 if (priv->allocated) 2053 mlx4_free_hwq_res(mdev->dev, &priv->res, MLX4_EN_PAGE_SIZE); 2054 2055 cancel_delayed_work(&priv->stats_task); 2056 cancel_delayed_work(&priv->service_task); 2057 /* flush any pending task for this netdev */ 2058 flush_workqueue(mdev->workqueue); 2059 2060 /* Detach the netdev so tasks would not attempt to access it */ 2061 mutex_lock(&mdev->state_lock); 2062 mdev->pndev[priv->port] = NULL; 2063 mdev->upper[priv->port] = NULL; 2064 mutex_unlock(&mdev->state_lock); 2065 2066 mlx4_en_free_resources(priv); 2067 2068 kfree(priv->tx_ring); 2069 kfree(priv->tx_cq); 2070 2071 free_netdev(dev); 2072 } 2073 2074 static int mlx4_en_change_mtu(struct net_device *dev, int new_mtu) 2075 { 2076 struct mlx4_en_priv *priv = netdev_priv(dev); 2077 struct mlx4_en_dev *mdev = priv->mdev; 2078 int err = 0; 2079 2080 en_dbg(DRV, priv, "Change MTU called - current:%d new:%d\n", 2081 dev->mtu, new_mtu); 2082 2083 if ((new_mtu < MLX4_EN_MIN_MTU) || (new_mtu > priv->max_mtu)) { 2084 en_err(priv, "Bad MTU size:%d.\n", new_mtu); 2085 return -EPERM; 2086 } 2087 dev->mtu = new_mtu; 2088 2089 if (netif_running(dev)) { 2090 mutex_lock(&mdev->state_lock); 2091 if (!mdev->device_up) { 2092 /* NIC is probably restarting - let watchdog task reset 2093 * the port */ 2094 en_dbg(DRV, priv, "Change MTU called with card down!?\n"); 2095 } else { 2096 mlx4_en_stop_port(dev, 1); 2097 err = mlx4_en_start_port(dev); 2098 if (err) { 2099 en_err(priv, "Failed restarting port:%d\n", 2100 priv->port); 2101 queue_work(mdev->workqueue, &priv->watchdog_task); 2102 } 2103 } 2104 mutex_unlock(&mdev->state_lock); 2105 } 2106 return 0; 2107 } 2108 2109 static int mlx4_en_hwtstamp_set(struct net_device *dev, struct ifreq *ifr) 2110 { 2111 struct mlx4_en_priv *priv = netdev_priv(dev); 2112 struct mlx4_en_dev *mdev = priv->mdev; 2113 struct hwtstamp_config config; 2114 2115 if (copy_from_user(&config, ifr->ifr_data, sizeof(config))) 2116 return -EFAULT; 2117 2118 /* reserved for future extensions */ 2119 if (config.flags) 2120 return -EINVAL; 2121 2122 /* device doesn't support time stamping */ 2123 if (!(mdev->dev->caps.flags2 & MLX4_DEV_CAP_FLAG2_TS)) 2124 return -EINVAL; 2125 2126 /* TX HW timestamp */ 2127 switch (config.tx_type) { 2128 case HWTSTAMP_TX_OFF: 2129 case HWTSTAMP_TX_ON: 2130 break; 2131 default: 2132 return -ERANGE; 2133 } 2134 2135 /* RX HW timestamp */ 2136 switch (config.rx_filter) { 2137 case HWTSTAMP_FILTER_NONE: 2138 break; 2139 case HWTSTAMP_FILTER_ALL: 2140 case HWTSTAMP_FILTER_SOME: 2141 case HWTSTAMP_FILTER_PTP_V1_L4_EVENT: 2142 case HWTSTAMP_FILTER_PTP_V1_L4_SYNC: 2143 case HWTSTAMP_FILTER_PTP_V1_L4_DELAY_REQ: 2144 case HWTSTAMP_FILTER_PTP_V2_L4_EVENT: 2145 case HWTSTAMP_FILTER_PTP_V2_L4_SYNC: 2146 case HWTSTAMP_FILTER_PTP_V2_L4_DELAY_REQ: 2147 case HWTSTAMP_FILTER_PTP_V2_L2_EVENT: 2148 case HWTSTAMP_FILTER_PTP_V2_L2_SYNC: 2149 case HWTSTAMP_FILTER_PTP_V2_L2_DELAY_REQ: 2150 case HWTSTAMP_FILTER_PTP_V2_EVENT: 2151 case HWTSTAMP_FILTER_PTP_V2_SYNC: 2152 case HWTSTAMP_FILTER_PTP_V2_DELAY_REQ: 2153 config.rx_filter = HWTSTAMP_FILTER_ALL; 2154 break; 2155 default: 2156 return -ERANGE; 2157 } 2158 2159 if (mlx4_en_reset_config(dev, config, dev->features)) { 2160 config.tx_type = HWTSTAMP_TX_OFF; 2161 config.rx_filter = HWTSTAMP_FILTER_NONE; 2162 } 2163 2164 return copy_to_user(ifr->ifr_data, &config, 2165 sizeof(config)) ? -EFAULT : 0; 2166 } 2167 2168 static int mlx4_en_hwtstamp_get(struct net_device *dev, struct ifreq *ifr) 2169 { 2170 struct mlx4_en_priv *priv = netdev_priv(dev); 2171 2172 return copy_to_user(ifr->ifr_data, &priv->hwtstamp_config, 2173 sizeof(priv->hwtstamp_config)) ? -EFAULT : 0; 2174 } 2175 2176 static int mlx4_en_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd) 2177 { 2178 switch (cmd) { 2179 case SIOCSHWTSTAMP: 2180 return mlx4_en_hwtstamp_set(dev, ifr); 2181 case SIOCGHWTSTAMP: 2182 return mlx4_en_hwtstamp_get(dev, ifr); 2183 default: 2184 return -EOPNOTSUPP; 2185 } 2186 } 2187 2188 static int mlx4_en_set_features(struct net_device *netdev, 2189 netdev_features_t features) 2190 { 2191 struct mlx4_en_priv *priv = netdev_priv(netdev); 2192 int ret = 0; 2193 2194 if (DEV_FEATURE_CHANGED(netdev, features, NETIF_F_HW_VLAN_CTAG_RX)) { 2195 en_info(priv, "Turn %s RX vlan strip offload\n", 2196 (features & NETIF_F_HW_VLAN_CTAG_RX) ? "ON" : "OFF"); 2197 ret = mlx4_en_reset_config(netdev, priv->hwtstamp_config, 2198 features); 2199 if (ret) 2200 return ret; 2201 } 2202 2203 if (DEV_FEATURE_CHANGED(netdev, features, NETIF_F_HW_VLAN_CTAG_TX)) 2204 en_info(priv, "Turn %s TX vlan strip offload\n", 2205 (features & NETIF_F_HW_VLAN_CTAG_TX) ? "ON" : "OFF"); 2206 2207 if (features & NETIF_F_LOOPBACK) 2208 priv->ctrl_flags |= cpu_to_be32(MLX4_WQE_CTRL_FORCE_LOOPBACK); 2209 else 2210 priv->ctrl_flags &= 2211 cpu_to_be32(~MLX4_WQE_CTRL_FORCE_LOOPBACK); 2212 2213 mlx4_en_update_loopback_state(netdev, features); 2214 2215 return 0; 2216 2217 } 2218 2219 static int mlx4_en_set_vf_mac(struct net_device *dev, int queue, u8 *mac) 2220 { 2221 struct mlx4_en_priv *en_priv = netdev_priv(dev); 2222 struct mlx4_en_dev *mdev = en_priv->mdev; 2223 u64 mac_u64 = mlx4_mac_to_u64(mac); 2224 2225 if (!is_valid_ether_addr(mac)) 2226 return -EINVAL; 2227 2228 return mlx4_set_vf_mac(mdev->dev, en_priv->port, queue, mac_u64); 2229 } 2230 2231 static int mlx4_en_set_vf_vlan(struct net_device *dev, int vf, u16 vlan, u8 qos) 2232 { 2233 struct mlx4_en_priv *en_priv = netdev_priv(dev); 2234 struct mlx4_en_dev *mdev = en_priv->mdev; 2235 2236 return mlx4_set_vf_vlan(mdev->dev, en_priv->port, vf, vlan, qos); 2237 } 2238 2239 static int mlx4_en_set_vf_spoofchk(struct net_device *dev, int vf, bool setting) 2240 { 2241 struct mlx4_en_priv *en_priv = netdev_priv(dev); 2242 struct mlx4_en_dev *mdev = en_priv->mdev; 2243 2244 return mlx4_set_vf_spoofchk(mdev->dev, en_priv->port, vf, setting); 2245 } 2246 2247 static int mlx4_en_get_vf_config(struct net_device *dev, int vf, struct ifla_vf_info *ivf) 2248 { 2249 struct mlx4_en_priv *en_priv = netdev_priv(dev); 2250 struct mlx4_en_dev *mdev = en_priv->mdev; 2251 2252 return mlx4_get_vf_config(mdev->dev, en_priv->port, vf, ivf); 2253 } 2254 2255 static int mlx4_en_set_vf_link_state(struct net_device *dev, int vf, int link_state) 2256 { 2257 struct mlx4_en_priv *en_priv = netdev_priv(dev); 2258 struct mlx4_en_dev *mdev = en_priv->mdev; 2259 2260 return mlx4_set_vf_link_state(mdev->dev, en_priv->port, vf, link_state); 2261 } 2262 2263 #define PORT_ID_BYTE_LEN 8 2264 static int mlx4_en_get_phys_port_id(struct net_device *dev, 2265 struct netdev_phys_item_id *ppid) 2266 { 2267 struct mlx4_en_priv *priv = netdev_priv(dev); 2268 struct mlx4_dev *mdev = priv->mdev->dev; 2269 int i; 2270 u64 phys_port_id = mdev->caps.phys_port_id[priv->port]; 2271 2272 if (!phys_port_id) 2273 return -EOPNOTSUPP; 2274 2275 ppid->id_len = sizeof(phys_port_id); 2276 for (i = PORT_ID_BYTE_LEN - 1; i >= 0; --i) { 2277 ppid->id[i] = phys_port_id & 0xff; 2278 phys_port_id >>= 8; 2279 } 2280 return 0; 2281 } 2282 2283 #ifdef CONFIG_MLX4_EN_VXLAN 2284 static void mlx4_en_add_vxlan_offloads(struct work_struct *work) 2285 { 2286 int ret; 2287 struct mlx4_en_priv *priv = container_of(work, struct mlx4_en_priv, 2288 vxlan_add_task); 2289 2290 ret = mlx4_config_vxlan_port(priv->mdev->dev, priv->vxlan_port); 2291 if (ret) 2292 goto out; 2293 2294 ret = mlx4_SET_PORT_VXLAN(priv->mdev->dev, priv->port, 2295 VXLAN_STEER_BY_OUTER_MAC, 1); 2296 out: 2297 if (ret) { 2298 en_err(priv, "failed setting L2 tunnel configuration ret %d\n", ret); 2299 return; 2300 } 2301 2302 /* set offloads */ 2303 priv->dev->hw_enc_features |= NETIF_F_IP_CSUM | NETIF_F_RXCSUM | 2304 NETIF_F_TSO | NETIF_F_GSO_UDP_TUNNEL; 2305 priv->dev->hw_features |= NETIF_F_GSO_UDP_TUNNEL; 2306 priv->dev->features |= NETIF_F_GSO_UDP_TUNNEL; 2307 } 2308 2309 static void mlx4_en_del_vxlan_offloads(struct work_struct *work) 2310 { 2311 int ret; 2312 struct mlx4_en_priv *priv = container_of(work, struct mlx4_en_priv, 2313 vxlan_del_task); 2314 /* unset offloads */ 2315 priv->dev->hw_enc_features &= ~(NETIF_F_IP_CSUM | NETIF_F_RXCSUM | 2316 NETIF_F_TSO | NETIF_F_GSO_UDP_TUNNEL); 2317 priv->dev->hw_features &= ~NETIF_F_GSO_UDP_TUNNEL; 2318 priv->dev->features &= ~NETIF_F_GSO_UDP_TUNNEL; 2319 2320 ret = mlx4_SET_PORT_VXLAN(priv->mdev->dev, priv->port, 2321 VXLAN_STEER_BY_OUTER_MAC, 0); 2322 if (ret) 2323 en_err(priv, "failed setting L2 tunnel configuration ret %d\n", ret); 2324 2325 priv->vxlan_port = 0; 2326 } 2327 2328 static void mlx4_en_add_vxlan_port(struct net_device *dev, 2329 sa_family_t sa_family, __be16 port) 2330 { 2331 struct mlx4_en_priv *priv = netdev_priv(dev); 2332 __be16 current_port; 2333 2334 if (priv->mdev->dev->caps.tunnel_offload_mode != MLX4_TUNNEL_OFFLOAD_MODE_VXLAN) 2335 return; 2336 2337 if (sa_family == AF_INET6) 2338 return; 2339 2340 current_port = priv->vxlan_port; 2341 if (current_port && current_port != port) { 2342 en_warn(priv, "vxlan port %d configured, can't add port %d\n", 2343 ntohs(current_port), ntohs(port)); 2344 return; 2345 } 2346 2347 priv->vxlan_port = port; 2348 queue_work(priv->mdev->workqueue, &priv->vxlan_add_task); 2349 } 2350 2351 static void mlx4_en_del_vxlan_port(struct net_device *dev, 2352 sa_family_t sa_family, __be16 port) 2353 { 2354 struct mlx4_en_priv *priv = netdev_priv(dev); 2355 __be16 current_port; 2356 2357 if (priv->mdev->dev->caps.tunnel_offload_mode != MLX4_TUNNEL_OFFLOAD_MODE_VXLAN) 2358 return; 2359 2360 if (sa_family == AF_INET6) 2361 return; 2362 2363 current_port = priv->vxlan_port; 2364 if (current_port != port) { 2365 en_dbg(DRV, priv, "vxlan port %d isn't configured, ignoring\n", ntohs(port)); 2366 return; 2367 } 2368 2369 queue_work(priv->mdev->workqueue, &priv->vxlan_del_task); 2370 } 2371 2372 static netdev_features_t mlx4_en_features_check(struct sk_buff *skb, 2373 struct net_device *dev, 2374 netdev_features_t features) 2375 { 2376 return vxlan_features_check(skb, features); 2377 } 2378 #endif 2379 2380 static const struct net_device_ops mlx4_netdev_ops = { 2381 .ndo_open = mlx4_en_open, 2382 .ndo_stop = mlx4_en_close, 2383 .ndo_start_xmit = mlx4_en_xmit, 2384 .ndo_select_queue = mlx4_en_select_queue, 2385 .ndo_get_stats = mlx4_en_get_stats, 2386 .ndo_set_rx_mode = mlx4_en_set_rx_mode, 2387 .ndo_set_mac_address = mlx4_en_set_mac, 2388 .ndo_validate_addr = eth_validate_addr, 2389 .ndo_change_mtu = mlx4_en_change_mtu, 2390 .ndo_do_ioctl = mlx4_en_ioctl, 2391 .ndo_tx_timeout = mlx4_en_tx_timeout, 2392 .ndo_vlan_rx_add_vid = mlx4_en_vlan_rx_add_vid, 2393 .ndo_vlan_rx_kill_vid = mlx4_en_vlan_rx_kill_vid, 2394 #ifdef CONFIG_NET_POLL_CONTROLLER 2395 .ndo_poll_controller = mlx4_en_netpoll, 2396 #endif 2397 .ndo_set_features = mlx4_en_set_features, 2398 .ndo_setup_tc = mlx4_en_setup_tc, 2399 #ifdef CONFIG_RFS_ACCEL 2400 .ndo_rx_flow_steer = mlx4_en_filter_rfs, 2401 #endif 2402 #ifdef CONFIG_NET_RX_BUSY_POLL 2403 .ndo_busy_poll = mlx4_en_low_latency_recv, 2404 #endif 2405 .ndo_get_phys_port_id = mlx4_en_get_phys_port_id, 2406 #ifdef CONFIG_MLX4_EN_VXLAN 2407 .ndo_add_vxlan_port = mlx4_en_add_vxlan_port, 2408 .ndo_del_vxlan_port = mlx4_en_del_vxlan_port, 2409 .ndo_features_check = mlx4_en_features_check, 2410 #endif 2411 }; 2412 2413 static const struct net_device_ops mlx4_netdev_ops_master = { 2414 .ndo_open = mlx4_en_open, 2415 .ndo_stop = mlx4_en_close, 2416 .ndo_start_xmit = mlx4_en_xmit, 2417 .ndo_select_queue = mlx4_en_select_queue, 2418 .ndo_get_stats = mlx4_en_get_stats, 2419 .ndo_set_rx_mode = mlx4_en_set_rx_mode, 2420 .ndo_set_mac_address = mlx4_en_set_mac, 2421 .ndo_validate_addr = eth_validate_addr, 2422 .ndo_change_mtu = mlx4_en_change_mtu, 2423 .ndo_tx_timeout = mlx4_en_tx_timeout, 2424 .ndo_vlan_rx_add_vid = mlx4_en_vlan_rx_add_vid, 2425 .ndo_vlan_rx_kill_vid = mlx4_en_vlan_rx_kill_vid, 2426 .ndo_set_vf_mac = mlx4_en_set_vf_mac, 2427 .ndo_set_vf_vlan = mlx4_en_set_vf_vlan, 2428 .ndo_set_vf_spoofchk = mlx4_en_set_vf_spoofchk, 2429 .ndo_set_vf_link_state = mlx4_en_set_vf_link_state, 2430 .ndo_get_vf_config = mlx4_en_get_vf_config, 2431 #ifdef CONFIG_NET_POLL_CONTROLLER 2432 .ndo_poll_controller = mlx4_en_netpoll, 2433 #endif 2434 .ndo_set_features = mlx4_en_set_features, 2435 .ndo_setup_tc = mlx4_en_setup_tc, 2436 #ifdef CONFIG_RFS_ACCEL 2437 .ndo_rx_flow_steer = mlx4_en_filter_rfs, 2438 #endif 2439 .ndo_get_phys_port_id = mlx4_en_get_phys_port_id, 2440 #ifdef CONFIG_MLX4_EN_VXLAN 2441 .ndo_add_vxlan_port = mlx4_en_add_vxlan_port, 2442 .ndo_del_vxlan_port = mlx4_en_del_vxlan_port, 2443 .ndo_features_check = mlx4_en_features_check, 2444 #endif 2445 }; 2446 2447 struct mlx4_en_bond { 2448 struct work_struct work; 2449 struct mlx4_en_priv *priv; 2450 int is_bonded; 2451 struct mlx4_port_map port_map; 2452 }; 2453 2454 static void mlx4_en_bond_work(struct work_struct *work) 2455 { 2456 struct mlx4_en_bond *bond = container_of(work, 2457 struct mlx4_en_bond, 2458 work); 2459 int err = 0; 2460 struct mlx4_dev *dev = bond->priv->mdev->dev; 2461 2462 if (bond->is_bonded) { 2463 if (!mlx4_is_bonded(dev)) { 2464 err = mlx4_bond(dev); 2465 if (err) 2466 en_err(bond->priv, "Fail to bond device\n"); 2467 } 2468 if (!err) { 2469 err = mlx4_port_map_set(dev, &bond->port_map); 2470 if (err) 2471 en_err(bond->priv, "Fail to set port map [%d][%d]: %d\n", 2472 bond->port_map.port1, 2473 bond->port_map.port2, 2474 err); 2475 } 2476 } else if (mlx4_is_bonded(dev)) { 2477 err = mlx4_unbond(dev); 2478 if (err) 2479 en_err(bond->priv, "Fail to unbond device\n"); 2480 } 2481 dev_put(bond->priv->dev); 2482 kfree(bond); 2483 } 2484 2485 static int mlx4_en_queue_bond_work(struct mlx4_en_priv *priv, int is_bonded, 2486 u8 v2p_p1, u8 v2p_p2) 2487 { 2488 struct mlx4_en_bond *bond = NULL; 2489 2490 bond = kzalloc(sizeof(*bond), GFP_ATOMIC); 2491 if (!bond) 2492 return -ENOMEM; 2493 2494 INIT_WORK(&bond->work, mlx4_en_bond_work); 2495 bond->priv = priv; 2496 bond->is_bonded = is_bonded; 2497 bond->port_map.port1 = v2p_p1; 2498 bond->port_map.port2 = v2p_p2; 2499 dev_hold(priv->dev); 2500 queue_work(priv->mdev->workqueue, &bond->work); 2501 return 0; 2502 } 2503 2504 int mlx4_en_netdev_event(struct notifier_block *this, 2505 unsigned long event, void *ptr) 2506 { 2507 struct net_device *ndev = netdev_notifier_info_to_dev(ptr); 2508 u8 port = 0; 2509 struct mlx4_en_dev *mdev; 2510 struct mlx4_dev *dev; 2511 int i, num_eth_ports = 0; 2512 bool do_bond = true; 2513 struct mlx4_en_priv *priv; 2514 u8 v2p_port1 = 0; 2515 u8 v2p_port2 = 0; 2516 2517 if (!net_eq(dev_net(ndev), &init_net)) 2518 return NOTIFY_DONE; 2519 2520 mdev = container_of(this, struct mlx4_en_dev, nb); 2521 dev = mdev->dev; 2522 2523 /* Go into this mode only when two network devices set on two ports 2524 * of the same mlx4 device are slaves of the same bonding master 2525 */ 2526 mlx4_foreach_port(i, dev, MLX4_PORT_TYPE_ETH) { 2527 ++num_eth_ports; 2528 if (!port && (mdev->pndev[i] == ndev)) 2529 port = i; 2530 mdev->upper[i] = mdev->pndev[i] ? 2531 netdev_master_upper_dev_get(mdev->pndev[i]) : NULL; 2532 /* condition not met: network device is a slave */ 2533 if (!mdev->upper[i]) 2534 do_bond = false; 2535 if (num_eth_ports < 2) 2536 continue; 2537 /* condition not met: same master */ 2538 if (mdev->upper[i] != mdev->upper[i-1]) 2539 do_bond = false; 2540 } 2541 /* condition not met: 2 salves */ 2542 do_bond = (num_eth_ports == 2) ? do_bond : false; 2543 2544 /* handle only events that come with enough info */ 2545 if ((do_bond && (event != NETDEV_BONDING_INFO)) || !port) 2546 return NOTIFY_DONE; 2547 2548 priv = netdev_priv(ndev); 2549 if (do_bond) { 2550 struct netdev_notifier_bonding_info *notifier_info = ptr; 2551 struct netdev_bonding_info *bonding_info = 2552 ¬ifier_info->bonding_info; 2553 2554 /* required mode 1, 2 or 4 */ 2555 if ((bonding_info->master.bond_mode != BOND_MODE_ACTIVEBACKUP) && 2556 (bonding_info->master.bond_mode != BOND_MODE_XOR) && 2557 (bonding_info->master.bond_mode != BOND_MODE_8023AD)) 2558 do_bond = false; 2559 2560 /* require exactly 2 slaves */ 2561 if (bonding_info->master.num_slaves != 2) 2562 do_bond = false; 2563 2564 /* calc v2p */ 2565 if (do_bond) { 2566 if (bonding_info->master.bond_mode == 2567 BOND_MODE_ACTIVEBACKUP) { 2568 /* in active-backup mode virtual ports are 2569 * mapped to the physical port of the active 2570 * slave */ 2571 if (bonding_info->slave.state == 2572 BOND_STATE_BACKUP) { 2573 if (port == 1) { 2574 v2p_port1 = 2; 2575 v2p_port2 = 2; 2576 } else { 2577 v2p_port1 = 1; 2578 v2p_port2 = 1; 2579 } 2580 } else { /* BOND_STATE_ACTIVE */ 2581 if (port == 1) { 2582 v2p_port1 = 1; 2583 v2p_port2 = 1; 2584 } else { 2585 v2p_port1 = 2; 2586 v2p_port2 = 2; 2587 } 2588 } 2589 } else { /* Active-Active */ 2590 /* in active-active mode a virtual port is 2591 * mapped to the native physical port if and only 2592 * if the physical port is up */ 2593 __s8 link = bonding_info->slave.link; 2594 2595 if (port == 1) 2596 v2p_port2 = 2; 2597 else 2598 v2p_port1 = 1; 2599 if ((link == BOND_LINK_UP) || 2600 (link == BOND_LINK_FAIL)) { 2601 if (port == 1) 2602 v2p_port1 = 1; 2603 else 2604 v2p_port2 = 2; 2605 } else { /* BOND_LINK_DOWN || BOND_LINK_BACK */ 2606 if (port == 1) 2607 v2p_port1 = 2; 2608 else 2609 v2p_port2 = 1; 2610 } 2611 } 2612 } 2613 } 2614 2615 mlx4_en_queue_bond_work(priv, do_bond, 2616 v2p_port1, v2p_port2); 2617 2618 return NOTIFY_DONE; 2619 } 2620 2621 int mlx4_en_init_netdev(struct mlx4_en_dev *mdev, int port, 2622 struct mlx4_en_port_profile *prof) 2623 { 2624 struct net_device *dev; 2625 struct mlx4_en_priv *priv; 2626 int i; 2627 int err; 2628 u64 mac_u64; 2629 2630 dev = alloc_etherdev_mqs(sizeof(struct mlx4_en_priv), 2631 MAX_TX_RINGS, MAX_RX_RINGS); 2632 if (dev == NULL) 2633 return -ENOMEM; 2634 2635 netif_set_real_num_tx_queues(dev, prof->tx_ring_num); 2636 netif_set_real_num_rx_queues(dev, prof->rx_ring_num); 2637 2638 SET_NETDEV_DEV(dev, &mdev->dev->persist->pdev->dev); 2639 dev->dev_port = port - 1; 2640 2641 /* 2642 * Initialize driver private data 2643 */ 2644 2645 priv = netdev_priv(dev); 2646 memset(priv, 0, sizeof(struct mlx4_en_priv)); 2647 spin_lock_init(&priv->stats_lock); 2648 INIT_WORK(&priv->rx_mode_task, mlx4_en_do_set_rx_mode); 2649 INIT_WORK(&priv->watchdog_task, mlx4_en_restart); 2650 INIT_WORK(&priv->linkstate_task, mlx4_en_linkstate); 2651 INIT_DELAYED_WORK(&priv->stats_task, mlx4_en_do_get_stats); 2652 INIT_DELAYED_WORK(&priv->service_task, mlx4_en_service_task); 2653 #ifdef CONFIG_MLX4_EN_VXLAN 2654 INIT_WORK(&priv->vxlan_add_task, mlx4_en_add_vxlan_offloads); 2655 INIT_WORK(&priv->vxlan_del_task, mlx4_en_del_vxlan_offloads); 2656 #endif 2657 #ifdef CONFIG_RFS_ACCEL 2658 INIT_LIST_HEAD(&priv->filters); 2659 spin_lock_init(&priv->filters_lock); 2660 #endif 2661 2662 priv->dev = dev; 2663 priv->mdev = mdev; 2664 priv->ddev = &mdev->pdev->dev; 2665 priv->prof = prof; 2666 priv->port = port; 2667 priv->port_up = false; 2668 priv->flags = prof->flags; 2669 priv->pflags = MLX4_EN_PRIV_FLAGS_BLUEFLAME; 2670 priv->ctrl_flags = cpu_to_be32(MLX4_WQE_CTRL_CQ_UPDATE | 2671 MLX4_WQE_CTRL_SOLICITED); 2672 priv->num_tx_rings_p_up = mdev->profile.num_tx_rings_p_up; 2673 priv->tx_ring_num = prof->tx_ring_num; 2674 priv->tx_work_limit = MLX4_EN_DEFAULT_TX_WORK; 2675 netdev_rss_key_fill(priv->rss_key, sizeof(priv->rss_key)); 2676 2677 priv->tx_ring = kzalloc(sizeof(struct mlx4_en_tx_ring *) * MAX_TX_RINGS, 2678 GFP_KERNEL); 2679 if (!priv->tx_ring) { 2680 err = -ENOMEM; 2681 goto out; 2682 } 2683 priv->tx_cq = kzalloc(sizeof(struct mlx4_en_cq *) * MAX_TX_RINGS, 2684 GFP_KERNEL); 2685 if (!priv->tx_cq) { 2686 err = -ENOMEM; 2687 goto out; 2688 } 2689 priv->rx_ring_num = prof->rx_ring_num; 2690 priv->cqe_factor = (mdev->dev->caps.cqe_size == 64) ? 1 : 0; 2691 priv->cqe_size = mdev->dev->caps.cqe_size; 2692 priv->mac_index = -1; 2693 priv->msg_enable = MLX4_EN_MSG_LEVEL; 2694 #ifdef CONFIG_MLX4_EN_DCB 2695 if (!mlx4_is_slave(priv->mdev->dev)) { 2696 if (mdev->dev->caps.flags & MLX4_DEV_CAP_FLAG_SET_ETH_SCHED) { 2697 dev->dcbnl_ops = &mlx4_en_dcbnl_ops; 2698 } else { 2699 en_info(priv, "enabling only PFC DCB ops\n"); 2700 dev->dcbnl_ops = &mlx4_en_dcbnl_pfc_ops; 2701 } 2702 } 2703 #endif 2704 2705 for (i = 0; i < MLX4_EN_MAC_HASH_SIZE; ++i) 2706 INIT_HLIST_HEAD(&priv->mac_hash[i]); 2707 2708 /* Query for default mac and max mtu */ 2709 priv->max_mtu = mdev->dev->caps.eth_mtu_cap[priv->port]; 2710 2711 if (mdev->dev->caps.rx_checksum_flags_port[priv->port] & 2712 MLX4_RX_CSUM_MODE_VAL_NON_TCP_UDP) 2713 priv->flags |= MLX4_EN_FLAG_RX_CSUM_NON_TCP_UDP; 2714 2715 /* Set default MAC */ 2716 dev->addr_len = ETH_ALEN; 2717 mlx4_en_u64_to_mac(dev->dev_addr, mdev->dev->caps.def_mac[priv->port]); 2718 if (!is_valid_ether_addr(dev->dev_addr)) { 2719 if (mlx4_is_slave(priv->mdev->dev)) { 2720 eth_hw_addr_random(dev); 2721 en_warn(priv, "Assigned random MAC address %pM\n", dev->dev_addr); 2722 mac_u64 = mlx4_mac_to_u64(dev->dev_addr); 2723 mdev->dev->caps.def_mac[priv->port] = mac_u64; 2724 } else { 2725 en_err(priv, "Port: %d, invalid mac burned: %pM, quiting\n", 2726 priv->port, dev->dev_addr); 2727 err = -EINVAL; 2728 goto out; 2729 } 2730 } 2731 2732 memcpy(priv->current_mac, dev->dev_addr, sizeof(priv->current_mac)); 2733 2734 priv->stride = roundup_pow_of_two(sizeof(struct mlx4_en_rx_desc) + 2735 DS_SIZE * MLX4_EN_MAX_RX_FRAGS); 2736 err = mlx4_en_alloc_resources(priv); 2737 if (err) 2738 goto out; 2739 2740 /* Initialize time stamping config */ 2741 priv->hwtstamp_config.flags = 0; 2742 priv->hwtstamp_config.tx_type = HWTSTAMP_TX_OFF; 2743 priv->hwtstamp_config.rx_filter = HWTSTAMP_FILTER_NONE; 2744 2745 /* Allocate page for receive rings */ 2746 err = mlx4_alloc_hwq_res(mdev->dev, &priv->res, 2747 MLX4_EN_PAGE_SIZE, MLX4_EN_PAGE_SIZE); 2748 if (err) { 2749 en_err(priv, "Failed to allocate page for rx qps\n"); 2750 goto out; 2751 } 2752 priv->allocated = 1; 2753 2754 /* 2755 * Initialize netdev entry points 2756 */ 2757 if (mlx4_is_master(priv->mdev->dev)) 2758 dev->netdev_ops = &mlx4_netdev_ops_master; 2759 else 2760 dev->netdev_ops = &mlx4_netdev_ops; 2761 dev->watchdog_timeo = MLX4_EN_WATCHDOG_TIMEOUT; 2762 netif_set_real_num_tx_queues(dev, priv->tx_ring_num); 2763 netif_set_real_num_rx_queues(dev, priv->rx_ring_num); 2764 2765 dev->ethtool_ops = &mlx4_en_ethtool_ops; 2766 2767 /* 2768 * Set driver features 2769 */ 2770 dev->hw_features = NETIF_F_SG | NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM; 2771 if (mdev->LSO_support) 2772 dev->hw_features |= NETIF_F_TSO | NETIF_F_TSO6; 2773 2774 dev->vlan_features = dev->hw_features; 2775 2776 dev->hw_features |= NETIF_F_RXCSUM | NETIF_F_RXHASH; 2777 dev->features = dev->hw_features | NETIF_F_HIGHDMA | 2778 NETIF_F_HW_VLAN_CTAG_TX | NETIF_F_HW_VLAN_CTAG_RX | 2779 NETIF_F_HW_VLAN_CTAG_FILTER; 2780 dev->hw_features |= NETIF_F_LOOPBACK | 2781 NETIF_F_HW_VLAN_CTAG_TX | NETIF_F_HW_VLAN_CTAG_RX; 2782 2783 if (mdev->dev->caps.steering_mode == 2784 MLX4_STEERING_MODE_DEVICE_MANAGED && 2785 mdev->dev->caps.dmfs_high_steer_mode != MLX4_STEERING_DMFS_A0_STATIC) 2786 dev->hw_features |= NETIF_F_NTUPLE; 2787 2788 if (mdev->dev->caps.steering_mode != MLX4_STEERING_MODE_A0) 2789 dev->priv_flags |= IFF_UNICAST_FLT; 2790 2791 /* Setting a default hash function value */ 2792 if (mdev->dev->caps.flags2 & MLX4_DEV_CAP_FLAG2_RSS_TOP) { 2793 priv->rss_hash_fn = ETH_RSS_HASH_TOP; 2794 } else if (mdev->dev->caps.flags2 & MLX4_DEV_CAP_FLAG2_RSS_XOR) { 2795 priv->rss_hash_fn = ETH_RSS_HASH_XOR; 2796 } else { 2797 en_warn(priv, 2798 "No RSS hash capabilities exposed, using Toeplitz\n"); 2799 priv->rss_hash_fn = ETH_RSS_HASH_TOP; 2800 } 2801 2802 mdev->pndev[port] = dev; 2803 mdev->upper[port] = NULL; 2804 2805 netif_carrier_off(dev); 2806 mlx4_en_set_default_moderation(priv); 2807 2808 en_warn(priv, "Using %d TX rings\n", prof->tx_ring_num); 2809 en_warn(priv, "Using %d RX rings\n", prof->rx_ring_num); 2810 2811 mlx4_en_update_loopback_state(priv->dev, priv->dev->features); 2812 2813 /* Configure port */ 2814 mlx4_en_calc_rx_buf(dev); 2815 err = mlx4_SET_PORT_general(mdev->dev, priv->port, 2816 priv->rx_skb_size + ETH_FCS_LEN, 2817 prof->tx_pause, prof->tx_ppp, 2818 prof->rx_pause, prof->rx_ppp); 2819 if (err) { 2820 en_err(priv, "Failed setting port general configurations for port %d, with error %d\n", 2821 priv->port, err); 2822 goto out; 2823 } 2824 2825 if (mdev->dev->caps.tunnel_offload_mode == MLX4_TUNNEL_OFFLOAD_MODE_VXLAN) { 2826 err = mlx4_SET_PORT_VXLAN(mdev->dev, priv->port, VXLAN_STEER_BY_OUTER_MAC, 1); 2827 if (err) { 2828 en_err(priv, "Failed setting port L2 tunnel configuration, err %d\n", 2829 err); 2830 goto out; 2831 } 2832 } 2833 2834 /* Init port */ 2835 en_warn(priv, "Initializing port\n"); 2836 err = mlx4_INIT_PORT(mdev->dev, priv->port); 2837 if (err) { 2838 en_err(priv, "Failed Initializing port\n"); 2839 goto out; 2840 } 2841 queue_delayed_work(mdev->workqueue, &priv->stats_task, STATS_DELAY); 2842 2843 if (mdev->dev->caps.flags2 & MLX4_DEV_CAP_FLAG2_TS) 2844 queue_delayed_work(mdev->workqueue, &priv->service_task, 2845 SERVICE_TASK_DELAY); 2846 2847 mlx4_set_stats_bitmap(mdev->dev, &priv->stats_bitmap); 2848 2849 err = register_netdev(dev); 2850 if (err) { 2851 en_err(priv, "Netdev registration failed for port %d\n", port); 2852 goto out; 2853 } 2854 2855 priv->registered = 1; 2856 2857 return 0; 2858 2859 out: 2860 mlx4_en_destroy_netdev(dev); 2861 return err; 2862 } 2863 2864 int mlx4_en_reset_config(struct net_device *dev, 2865 struct hwtstamp_config ts_config, 2866 netdev_features_t features) 2867 { 2868 struct mlx4_en_priv *priv = netdev_priv(dev); 2869 struct mlx4_en_dev *mdev = priv->mdev; 2870 int port_up = 0; 2871 int err = 0; 2872 2873 if (priv->hwtstamp_config.tx_type == ts_config.tx_type && 2874 priv->hwtstamp_config.rx_filter == ts_config.rx_filter && 2875 !DEV_FEATURE_CHANGED(dev, features, NETIF_F_HW_VLAN_CTAG_RX)) 2876 return 0; /* Nothing to change */ 2877 2878 if (DEV_FEATURE_CHANGED(dev, features, NETIF_F_HW_VLAN_CTAG_RX) && 2879 (features & NETIF_F_HW_VLAN_CTAG_RX) && 2880 (priv->hwtstamp_config.rx_filter != HWTSTAMP_FILTER_NONE)) { 2881 en_warn(priv, "Can't turn ON rx vlan offload while time-stamping rx filter is ON\n"); 2882 return -EINVAL; 2883 } 2884 2885 mutex_lock(&mdev->state_lock); 2886 if (priv->port_up) { 2887 port_up = 1; 2888 mlx4_en_stop_port(dev, 1); 2889 } 2890 2891 mlx4_en_free_resources(priv); 2892 2893 en_warn(priv, "Changing device configuration rx filter(%x) rx vlan(%x)\n", 2894 ts_config.rx_filter, !!(features & NETIF_F_HW_VLAN_CTAG_RX)); 2895 2896 priv->hwtstamp_config.tx_type = ts_config.tx_type; 2897 priv->hwtstamp_config.rx_filter = ts_config.rx_filter; 2898 2899 if (DEV_FEATURE_CHANGED(dev, features, NETIF_F_HW_VLAN_CTAG_RX)) { 2900 if (features & NETIF_F_HW_VLAN_CTAG_RX) 2901 dev->features |= NETIF_F_HW_VLAN_CTAG_RX; 2902 else 2903 dev->features &= ~NETIF_F_HW_VLAN_CTAG_RX; 2904 } else if (ts_config.rx_filter == HWTSTAMP_FILTER_NONE) { 2905 /* RX time-stamping is OFF, update the RX vlan offload 2906 * to the latest wanted state 2907 */ 2908 if (dev->wanted_features & NETIF_F_HW_VLAN_CTAG_RX) 2909 dev->features |= NETIF_F_HW_VLAN_CTAG_RX; 2910 else 2911 dev->features &= ~NETIF_F_HW_VLAN_CTAG_RX; 2912 } 2913 2914 /* RX vlan offload and RX time-stamping can't co-exist ! 2915 * Regardless of the caller's choice, 2916 * Turn Off RX vlan offload in case of time-stamping is ON 2917 */ 2918 if (ts_config.rx_filter != HWTSTAMP_FILTER_NONE) { 2919 if (dev->features & NETIF_F_HW_VLAN_CTAG_RX) 2920 en_warn(priv, "Turning off RX vlan offload since RX time-stamping is ON\n"); 2921 dev->features &= ~NETIF_F_HW_VLAN_CTAG_RX; 2922 } 2923 2924 err = mlx4_en_alloc_resources(priv); 2925 if (err) { 2926 en_err(priv, "Failed reallocating port resources\n"); 2927 goto out; 2928 } 2929 if (port_up) { 2930 err = mlx4_en_start_port(dev); 2931 if (err) 2932 en_err(priv, "Failed starting port\n"); 2933 } 2934 2935 out: 2936 mutex_unlock(&mdev->state_lock); 2937 netdev_features_change(dev); 2938 return err; 2939 } 2940