1 /* Copyright (c) 2014 Mahesh Bandewar <maheshb@google.com> 2 * 3 * This program is free software; you can redistribute it and/or 4 * modify it under the terms of the GNU General Public License as 5 * published by the Free Software Foundation; either version 2 of 6 * the License, or (at your option) any later version. 7 * 8 */ 9 10 #include "ipvlan.h" 11 12 static u32 ipvl_nf_hook_refcnt = 0; 13 14 static struct nf_hook_ops ipvl_nfops[] __read_mostly = { 15 { 16 .hook = ipvlan_nf_input, 17 .pf = NFPROTO_IPV4, 18 .hooknum = NF_INET_LOCAL_IN, 19 .priority = INT_MAX, 20 }, 21 { 22 .hook = ipvlan_nf_input, 23 .pf = NFPROTO_IPV6, 24 .hooknum = NF_INET_LOCAL_IN, 25 .priority = INT_MAX, 26 }, 27 }; 28 29 static const struct l3mdev_ops ipvl_l3mdev_ops = { 30 .l3mdev_l3_rcv = ipvlan_l3_rcv, 31 }; 32 33 static void ipvlan_adjust_mtu(struct ipvl_dev *ipvlan, struct net_device *dev) 34 { 35 ipvlan->dev->mtu = dev->mtu; 36 } 37 38 static int ipvlan_register_nf_hook(void) 39 { 40 int err = 0; 41 42 if (!ipvl_nf_hook_refcnt) { 43 err = _nf_register_hooks(ipvl_nfops, ARRAY_SIZE(ipvl_nfops)); 44 if (!err) 45 ipvl_nf_hook_refcnt = 1; 46 } else { 47 ipvl_nf_hook_refcnt++; 48 } 49 50 return err; 51 } 52 53 static void ipvlan_unregister_nf_hook(void) 54 { 55 WARN_ON(!ipvl_nf_hook_refcnt); 56 57 ipvl_nf_hook_refcnt--; 58 if (!ipvl_nf_hook_refcnt) 59 _nf_unregister_hooks(ipvl_nfops, ARRAY_SIZE(ipvl_nfops)); 60 } 61 62 static int ipvlan_set_port_mode(struct ipvl_port *port, u16 nval) 63 { 64 struct ipvl_dev *ipvlan; 65 struct net_device *mdev = port->dev; 66 int err = 0; 67 68 ASSERT_RTNL(); 69 if (port->mode != nval) { 70 if (nval == IPVLAN_MODE_L3S) { 71 /* New mode is L3S */ 72 err = ipvlan_register_nf_hook(); 73 if (!err) { 74 mdev->l3mdev_ops = &ipvl_l3mdev_ops; 75 mdev->priv_flags |= IFF_L3MDEV_MASTER; 76 } else 77 return err; 78 } else if (port->mode == IPVLAN_MODE_L3S) { 79 /* Old mode was L3S */ 80 mdev->priv_flags &= ~IFF_L3MDEV_MASTER; 81 ipvlan_unregister_nf_hook(); 82 mdev->l3mdev_ops = NULL; 83 } 84 list_for_each_entry(ipvlan, &port->ipvlans, pnode) { 85 if (nval == IPVLAN_MODE_L3 || nval == IPVLAN_MODE_L3S) 86 ipvlan->dev->flags |= IFF_NOARP; 87 else 88 ipvlan->dev->flags &= ~IFF_NOARP; 89 } 90 port->mode = nval; 91 } 92 return err; 93 } 94 95 static int ipvlan_port_create(struct net_device *dev) 96 { 97 struct ipvl_port *port; 98 int err, idx; 99 100 if (dev->type != ARPHRD_ETHER || dev->flags & IFF_LOOPBACK) { 101 netdev_err(dev, "Master is either lo or non-ether device\n"); 102 return -EINVAL; 103 } 104 105 if (netif_is_macvlan_port(dev)) { 106 netdev_err(dev, "Master is a macvlan port.\n"); 107 return -EBUSY; 108 } 109 110 port = kzalloc(sizeof(struct ipvl_port), GFP_KERNEL); 111 if (!port) 112 return -ENOMEM; 113 114 port->dev = dev; 115 port->mode = IPVLAN_MODE_L3; 116 INIT_LIST_HEAD(&port->ipvlans); 117 for (idx = 0; idx < IPVLAN_HASH_SIZE; idx++) 118 INIT_HLIST_HEAD(&port->hlhead[idx]); 119 120 skb_queue_head_init(&port->backlog); 121 INIT_WORK(&port->wq, ipvlan_process_multicast); 122 123 err = netdev_rx_handler_register(dev, ipvlan_handle_frame, port); 124 if (err) 125 goto err; 126 127 dev->priv_flags |= IFF_IPVLAN_MASTER; 128 return 0; 129 130 err: 131 kfree(port); 132 return err; 133 } 134 135 static void ipvlan_port_destroy(struct net_device *dev) 136 { 137 struct ipvl_port *port = ipvlan_port_get_rtnl(dev); 138 139 dev->priv_flags &= ~IFF_IPVLAN_MASTER; 140 if (port->mode == IPVLAN_MODE_L3S) { 141 dev->priv_flags &= ~IFF_L3MDEV_MASTER; 142 ipvlan_unregister_nf_hook(); 143 dev->l3mdev_ops = NULL; 144 } 145 netdev_rx_handler_unregister(dev); 146 cancel_work_sync(&port->wq); 147 __skb_queue_purge(&port->backlog); 148 kfree(port); 149 } 150 151 #define IPVLAN_FEATURES \ 152 (NETIF_F_SG | NETIF_F_HW_CSUM | NETIF_F_HIGHDMA | NETIF_F_FRAGLIST | \ 153 NETIF_F_GSO | NETIF_F_TSO | NETIF_F_UFO | NETIF_F_GSO_ROBUST | \ 154 NETIF_F_TSO_ECN | NETIF_F_TSO6 | NETIF_F_GRO | NETIF_F_RXCSUM | \ 155 NETIF_F_HW_VLAN_CTAG_FILTER | NETIF_F_HW_VLAN_STAG_FILTER) 156 157 #define IPVLAN_STATE_MASK \ 158 ((1<<__LINK_STATE_NOCARRIER) | (1<<__LINK_STATE_DORMANT)) 159 160 static int ipvlan_init(struct net_device *dev) 161 { 162 struct ipvl_dev *ipvlan = netdev_priv(dev); 163 const struct net_device *phy_dev = ipvlan->phy_dev; 164 struct ipvl_port *port = ipvlan->port; 165 166 dev->state = (dev->state & ~IPVLAN_STATE_MASK) | 167 (phy_dev->state & IPVLAN_STATE_MASK); 168 dev->features = phy_dev->features & IPVLAN_FEATURES; 169 dev->features |= NETIF_F_LLTX; 170 dev->gso_max_size = phy_dev->gso_max_size; 171 dev->gso_max_segs = phy_dev->gso_max_segs; 172 dev->hard_header_len = phy_dev->hard_header_len; 173 174 netdev_lockdep_set_classes(dev); 175 176 ipvlan->pcpu_stats = alloc_percpu(struct ipvl_pcpu_stats); 177 if (!ipvlan->pcpu_stats) 178 return -ENOMEM; 179 180 port->count += 1; 181 182 return 0; 183 } 184 185 static void ipvlan_uninit(struct net_device *dev) 186 { 187 struct ipvl_dev *ipvlan = netdev_priv(dev); 188 struct ipvl_port *port = ipvlan->port; 189 190 free_percpu(ipvlan->pcpu_stats); 191 192 port->count -= 1; 193 if (!port->count) 194 ipvlan_port_destroy(port->dev); 195 } 196 197 static int ipvlan_open(struct net_device *dev) 198 { 199 struct ipvl_dev *ipvlan = netdev_priv(dev); 200 struct net_device *phy_dev = ipvlan->phy_dev; 201 struct ipvl_addr *addr; 202 203 if (ipvlan->port->mode == IPVLAN_MODE_L3 || 204 ipvlan->port->mode == IPVLAN_MODE_L3S) 205 dev->flags |= IFF_NOARP; 206 else 207 dev->flags &= ~IFF_NOARP; 208 209 list_for_each_entry(addr, &ipvlan->addrs, anode) 210 ipvlan_ht_addr_add(ipvlan, addr); 211 212 return dev_uc_add(phy_dev, phy_dev->dev_addr); 213 } 214 215 static int ipvlan_stop(struct net_device *dev) 216 { 217 struct ipvl_dev *ipvlan = netdev_priv(dev); 218 struct net_device *phy_dev = ipvlan->phy_dev; 219 struct ipvl_addr *addr; 220 221 dev_uc_unsync(phy_dev, dev); 222 dev_mc_unsync(phy_dev, dev); 223 224 dev_uc_del(phy_dev, phy_dev->dev_addr); 225 226 list_for_each_entry(addr, &ipvlan->addrs, anode) 227 ipvlan_ht_addr_del(addr); 228 229 return 0; 230 } 231 232 static netdev_tx_t ipvlan_start_xmit(struct sk_buff *skb, 233 struct net_device *dev) 234 { 235 const struct ipvl_dev *ipvlan = netdev_priv(dev); 236 int skblen = skb->len; 237 int ret; 238 239 ret = ipvlan_queue_xmit(skb, dev); 240 if (likely(ret == NET_XMIT_SUCCESS || ret == NET_XMIT_CN)) { 241 struct ipvl_pcpu_stats *pcptr; 242 243 pcptr = this_cpu_ptr(ipvlan->pcpu_stats); 244 245 u64_stats_update_begin(&pcptr->syncp); 246 pcptr->tx_pkts++; 247 pcptr->tx_bytes += skblen; 248 u64_stats_update_end(&pcptr->syncp); 249 } else { 250 this_cpu_inc(ipvlan->pcpu_stats->tx_drps); 251 } 252 return ret; 253 } 254 255 static netdev_features_t ipvlan_fix_features(struct net_device *dev, 256 netdev_features_t features) 257 { 258 struct ipvl_dev *ipvlan = netdev_priv(dev); 259 260 return features & (ipvlan->sfeatures | ~IPVLAN_FEATURES); 261 } 262 263 static void ipvlan_change_rx_flags(struct net_device *dev, int change) 264 { 265 struct ipvl_dev *ipvlan = netdev_priv(dev); 266 struct net_device *phy_dev = ipvlan->phy_dev; 267 268 if (change & IFF_ALLMULTI) 269 dev_set_allmulti(phy_dev, dev->flags & IFF_ALLMULTI? 1 : -1); 270 } 271 272 static void ipvlan_set_multicast_mac_filter(struct net_device *dev) 273 { 274 struct ipvl_dev *ipvlan = netdev_priv(dev); 275 276 if (dev->flags & (IFF_PROMISC | IFF_ALLMULTI)) { 277 bitmap_fill(ipvlan->mac_filters, IPVLAN_MAC_FILTER_SIZE); 278 } else { 279 struct netdev_hw_addr *ha; 280 DECLARE_BITMAP(mc_filters, IPVLAN_MAC_FILTER_SIZE); 281 282 bitmap_zero(mc_filters, IPVLAN_MAC_FILTER_SIZE); 283 netdev_for_each_mc_addr(ha, dev) 284 __set_bit(ipvlan_mac_hash(ha->addr), mc_filters); 285 286 /* Turn-on broadcast bit irrespective of address family, 287 * since broadcast is deferred to a work-queue, hence no 288 * impact on fast-path processing. 289 */ 290 __set_bit(ipvlan_mac_hash(dev->broadcast), mc_filters); 291 292 bitmap_copy(ipvlan->mac_filters, mc_filters, 293 IPVLAN_MAC_FILTER_SIZE); 294 } 295 dev_uc_sync(ipvlan->phy_dev, dev); 296 dev_mc_sync(ipvlan->phy_dev, dev); 297 } 298 299 static struct rtnl_link_stats64 *ipvlan_get_stats64(struct net_device *dev, 300 struct rtnl_link_stats64 *s) 301 { 302 struct ipvl_dev *ipvlan = netdev_priv(dev); 303 304 if (ipvlan->pcpu_stats) { 305 struct ipvl_pcpu_stats *pcptr; 306 u64 rx_pkts, rx_bytes, rx_mcast, tx_pkts, tx_bytes; 307 u32 rx_errs = 0, tx_drps = 0; 308 u32 strt; 309 int idx; 310 311 for_each_possible_cpu(idx) { 312 pcptr = per_cpu_ptr(ipvlan->pcpu_stats, idx); 313 do { 314 strt= u64_stats_fetch_begin_irq(&pcptr->syncp); 315 rx_pkts = pcptr->rx_pkts; 316 rx_bytes = pcptr->rx_bytes; 317 rx_mcast = pcptr->rx_mcast; 318 tx_pkts = pcptr->tx_pkts; 319 tx_bytes = pcptr->tx_bytes; 320 } while (u64_stats_fetch_retry_irq(&pcptr->syncp, 321 strt)); 322 323 s->rx_packets += rx_pkts; 324 s->rx_bytes += rx_bytes; 325 s->multicast += rx_mcast; 326 s->tx_packets += tx_pkts; 327 s->tx_bytes += tx_bytes; 328 329 /* u32 values are updated without syncp protection. */ 330 rx_errs += pcptr->rx_errs; 331 tx_drps += pcptr->tx_drps; 332 } 333 s->rx_errors = rx_errs; 334 s->rx_dropped = rx_errs; 335 s->tx_dropped = tx_drps; 336 } 337 return s; 338 } 339 340 static int ipvlan_vlan_rx_add_vid(struct net_device *dev, __be16 proto, u16 vid) 341 { 342 struct ipvl_dev *ipvlan = netdev_priv(dev); 343 struct net_device *phy_dev = ipvlan->phy_dev; 344 345 return vlan_vid_add(phy_dev, proto, vid); 346 } 347 348 static int ipvlan_vlan_rx_kill_vid(struct net_device *dev, __be16 proto, 349 u16 vid) 350 { 351 struct ipvl_dev *ipvlan = netdev_priv(dev); 352 struct net_device *phy_dev = ipvlan->phy_dev; 353 354 vlan_vid_del(phy_dev, proto, vid); 355 return 0; 356 } 357 358 static int ipvlan_get_iflink(const struct net_device *dev) 359 { 360 struct ipvl_dev *ipvlan = netdev_priv(dev); 361 362 return ipvlan->phy_dev->ifindex; 363 } 364 365 static const struct net_device_ops ipvlan_netdev_ops = { 366 .ndo_init = ipvlan_init, 367 .ndo_uninit = ipvlan_uninit, 368 .ndo_open = ipvlan_open, 369 .ndo_stop = ipvlan_stop, 370 .ndo_start_xmit = ipvlan_start_xmit, 371 .ndo_fix_features = ipvlan_fix_features, 372 .ndo_change_rx_flags = ipvlan_change_rx_flags, 373 .ndo_set_rx_mode = ipvlan_set_multicast_mac_filter, 374 .ndo_get_stats64 = ipvlan_get_stats64, 375 .ndo_vlan_rx_add_vid = ipvlan_vlan_rx_add_vid, 376 .ndo_vlan_rx_kill_vid = ipvlan_vlan_rx_kill_vid, 377 .ndo_get_iflink = ipvlan_get_iflink, 378 }; 379 380 static int ipvlan_hard_header(struct sk_buff *skb, struct net_device *dev, 381 unsigned short type, const void *daddr, 382 const void *saddr, unsigned len) 383 { 384 const struct ipvl_dev *ipvlan = netdev_priv(dev); 385 struct net_device *phy_dev = ipvlan->phy_dev; 386 387 /* TODO Probably use a different field than dev_addr so that the 388 * mac-address on the virtual device is portable and can be carried 389 * while the packets use the mac-addr on the physical device. 390 */ 391 return dev_hard_header(skb, phy_dev, type, daddr, 392 saddr ? : dev->dev_addr, len); 393 } 394 395 static const struct header_ops ipvlan_header_ops = { 396 .create = ipvlan_hard_header, 397 .parse = eth_header_parse, 398 .cache = eth_header_cache, 399 .cache_update = eth_header_cache_update, 400 }; 401 402 static int ipvlan_ethtool_get_link_ksettings(struct net_device *dev, 403 struct ethtool_link_ksettings *cmd) 404 { 405 const struct ipvl_dev *ipvlan = netdev_priv(dev); 406 407 return __ethtool_get_link_ksettings(ipvlan->phy_dev, cmd); 408 } 409 410 static void ipvlan_ethtool_get_drvinfo(struct net_device *dev, 411 struct ethtool_drvinfo *drvinfo) 412 { 413 strlcpy(drvinfo->driver, IPVLAN_DRV, sizeof(drvinfo->driver)); 414 strlcpy(drvinfo->version, IPV_DRV_VER, sizeof(drvinfo->version)); 415 } 416 417 static u32 ipvlan_ethtool_get_msglevel(struct net_device *dev) 418 { 419 const struct ipvl_dev *ipvlan = netdev_priv(dev); 420 421 return ipvlan->msg_enable; 422 } 423 424 static void ipvlan_ethtool_set_msglevel(struct net_device *dev, u32 value) 425 { 426 struct ipvl_dev *ipvlan = netdev_priv(dev); 427 428 ipvlan->msg_enable = value; 429 } 430 431 static const struct ethtool_ops ipvlan_ethtool_ops = { 432 .get_link = ethtool_op_get_link, 433 .get_link_ksettings = ipvlan_ethtool_get_link_ksettings, 434 .get_drvinfo = ipvlan_ethtool_get_drvinfo, 435 .get_msglevel = ipvlan_ethtool_get_msglevel, 436 .set_msglevel = ipvlan_ethtool_set_msglevel, 437 }; 438 439 static int ipvlan_nl_changelink(struct net_device *dev, 440 struct nlattr *tb[], struct nlattr *data[]) 441 { 442 struct ipvl_dev *ipvlan = netdev_priv(dev); 443 struct ipvl_port *port = ipvlan_port_get_rtnl(ipvlan->phy_dev); 444 int err = 0; 445 446 if (data && data[IFLA_IPVLAN_MODE]) { 447 u16 nmode = nla_get_u16(data[IFLA_IPVLAN_MODE]); 448 449 err = ipvlan_set_port_mode(port, nmode); 450 } 451 return err; 452 } 453 454 static size_t ipvlan_nl_getsize(const struct net_device *dev) 455 { 456 return (0 457 + nla_total_size(2) /* IFLA_IPVLAN_MODE */ 458 ); 459 } 460 461 static int ipvlan_nl_validate(struct nlattr *tb[], struct nlattr *data[]) 462 { 463 if (data && data[IFLA_IPVLAN_MODE]) { 464 u16 mode = nla_get_u16(data[IFLA_IPVLAN_MODE]); 465 466 if (mode < IPVLAN_MODE_L2 || mode >= IPVLAN_MODE_MAX) 467 return -EINVAL; 468 } 469 return 0; 470 } 471 472 static int ipvlan_nl_fillinfo(struct sk_buff *skb, 473 const struct net_device *dev) 474 { 475 struct ipvl_dev *ipvlan = netdev_priv(dev); 476 struct ipvl_port *port = ipvlan_port_get_rtnl(ipvlan->phy_dev); 477 int ret = -EINVAL; 478 479 if (!port) 480 goto err; 481 482 ret = -EMSGSIZE; 483 if (nla_put_u16(skb, IFLA_IPVLAN_MODE, port->mode)) 484 goto err; 485 486 return 0; 487 488 err: 489 return ret; 490 } 491 492 static int ipvlan_link_new(struct net *src_net, struct net_device *dev, 493 struct nlattr *tb[], struct nlattr *data[]) 494 { 495 struct ipvl_dev *ipvlan = netdev_priv(dev); 496 struct ipvl_port *port; 497 struct net_device *phy_dev; 498 int err; 499 u16 mode = IPVLAN_MODE_L3; 500 bool create = false; 501 502 if (!tb[IFLA_LINK]) 503 return -EINVAL; 504 505 phy_dev = __dev_get_by_index(src_net, nla_get_u32(tb[IFLA_LINK])); 506 if (!phy_dev) 507 return -ENODEV; 508 509 if (netif_is_ipvlan(phy_dev)) { 510 struct ipvl_dev *tmp = netdev_priv(phy_dev); 511 512 phy_dev = tmp->phy_dev; 513 } else if (!netif_is_ipvlan_port(phy_dev)) { 514 err = ipvlan_port_create(phy_dev); 515 if (err < 0) 516 return err; 517 create = true; 518 } 519 520 if (data && data[IFLA_IPVLAN_MODE]) 521 mode = nla_get_u16(data[IFLA_IPVLAN_MODE]); 522 523 port = ipvlan_port_get_rtnl(phy_dev); 524 ipvlan->phy_dev = phy_dev; 525 ipvlan->dev = dev; 526 ipvlan->port = port; 527 ipvlan->sfeatures = IPVLAN_FEATURES; 528 ipvlan_adjust_mtu(ipvlan, phy_dev); 529 INIT_LIST_HEAD(&ipvlan->addrs); 530 531 /* TODO Probably put random address here to be presented to the 532 * world but keep using the physical-dev address for the outgoing 533 * packets. 534 */ 535 memcpy(dev->dev_addr, phy_dev->dev_addr, ETH_ALEN); 536 537 dev->priv_flags |= IFF_IPVLAN_SLAVE; 538 539 err = register_netdevice(dev); 540 if (err < 0) 541 goto destroy_ipvlan_port; 542 543 err = netdev_upper_dev_link(phy_dev, dev); 544 if (err) { 545 goto unregister_netdev; 546 } 547 err = ipvlan_set_port_mode(port, mode); 548 if (err) { 549 goto unlink_netdev; 550 } 551 552 list_add_tail_rcu(&ipvlan->pnode, &port->ipvlans); 553 netif_stacked_transfer_operstate(phy_dev, dev); 554 return 0; 555 556 unlink_netdev: 557 netdev_upper_dev_unlink(phy_dev, dev); 558 unregister_netdev: 559 unregister_netdevice(dev); 560 destroy_ipvlan_port: 561 if (create) 562 ipvlan_port_destroy(phy_dev); 563 return err; 564 } 565 566 static void ipvlan_link_delete(struct net_device *dev, struct list_head *head) 567 { 568 struct ipvl_dev *ipvlan = netdev_priv(dev); 569 struct ipvl_addr *addr, *next; 570 571 list_for_each_entry_safe(addr, next, &ipvlan->addrs, anode) { 572 ipvlan_ht_addr_del(addr); 573 list_del(&addr->anode); 574 kfree_rcu(addr, rcu); 575 } 576 577 list_del_rcu(&ipvlan->pnode); 578 unregister_netdevice_queue(dev, head); 579 netdev_upper_dev_unlink(ipvlan->phy_dev, dev); 580 } 581 582 static void ipvlan_link_setup(struct net_device *dev) 583 { 584 ether_setup(dev); 585 586 dev->priv_flags &= ~(IFF_XMIT_DST_RELEASE | IFF_TX_SKB_SHARING); 587 dev->priv_flags |= IFF_UNICAST_FLT | IFF_NO_QUEUE; 588 dev->netdev_ops = &ipvlan_netdev_ops; 589 dev->destructor = free_netdev; 590 dev->header_ops = &ipvlan_header_ops; 591 dev->ethtool_ops = &ipvlan_ethtool_ops; 592 } 593 594 static const struct nla_policy ipvlan_nl_policy[IFLA_IPVLAN_MAX + 1] = 595 { 596 [IFLA_IPVLAN_MODE] = { .type = NLA_U16 }, 597 }; 598 599 static struct rtnl_link_ops ipvlan_link_ops = { 600 .kind = "ipvlan", 601 .priv_size = sizeof(struct ipvl_dev), 602 603 .get_size = ipvlan_nl_getsize, 604 .policy = ipvlan_nl_policy, 605 .validate = ipvlan_nl_validate, 606 .fill_info = ipvlan_nl_fillinfo, 607 .changelink = ipvlan_nl_changelink, 608 .maxtype = IFLA_IPVLAN_MAX, 609 610 .setup = ipvlan_link_setup, 611 .newlink = ipvlan_link_new, 612 .dellink = ipvlan_link_delete, 613 }; 614 615 static int ipvlan_link_register(struct rtnl_link_ops *ops) 616 { 617 return rtnl_link_register(ops); 618 } 619 620 static int ipvlan_device_event(struct notifier_block *unused, 621 unsigned long event, void *ptr) 622 { 623 struct net_device *dev = netdev_notifier_info_to_dev(ptr); 624 struct ipvl_dev *ipvlan, *next; 625 struct ipvl_port *port; 626 LIST_HEAD(lst_kill); 627 628 if (!netif_is_ipvlan_port(dev)) 629 return NOTIFY_DONE; 630 631 port = ipvlan_port_get_rtnl(dev); 632 633 switch (event) { 634 case NETDEV_CHANGE: 635 list_for_each_entry(ipvlan, &port->ipvlans, pnode) 636 netif_stacked_transfer_operstate(ipvlan->phy_dev, 637 ipvlan->dev); 638 break; 639 640 case NETDEV_UNREGISTER: 641 if (dev->reg_state != NETREG_UNREGISTERING) 642 break; 643 644 list_for_each_entry_safe(ipvlan, next, &port->ipvlans, 645 pnode) 646 ipvlan->dev->rtnl_link_ops->dellink(ipvlan->dev, 647 &lst_kill); 648 unregister_netdevice_many(&lst_kill); 649 break; 650 651 case NETDEV_FEAT_CHANGE: 652 list_for_each_entry(ipvlan, &port->ipvlans, pnode) { 653 ipvlan->dev->features = dev->features & IPVLAN_FEATURES; 654 ipvlan->dev->gso_max_size = dev->gso_max_size; 655 ipvlan->dev->gso_max_segs = dev->gso_max_segs; 656 netdev_features_change(ipvlan->dev); 657 } 658 break; 659 660 case NETDEV_CHANGEMTU: 661 list_for_each_entry(ipvlan, &port->ipvlans, pnode) 662 ipvlan_adjust_mtu(ipvlan, dev); 663 break; 664 665 case NETDEV_PRE_TYPE_CHANGE: 666 /* Forbid underlying device to change its type. */ 667 return NOTIFY_BAD; 668 } 669 return NOTIFY_DONE; 670 } 671 672 static int ipvlan_add_addr6(struct ipvl_dev *ipvlan, struct in6_addr *ip6_addr) 673 { 674 struct ipvl_addr *addr; 675 676 if (ipvlan_addr_busy(ipvlan->port, ip6_addr, true)) { 677 netif_err(ipvlan, ifup, ipvlan->dev, 678 "Failed to add IPv6=%pI6c addr for %s intf\n", 679 ip6_addr, ipvlan->dev->name); 680 return -EINVAL; 681 } 682 addr = kzalloc(sizeof(struct ipvl_addr), GFP_ATOMIC); 683 if (!addr) 684 return -ENOMEM; 685 686 addr->master = ipvlan; 687 memcpy(&addr->ip6addr, ip6_addr, sizeof(struct in6_addr)); 688 addr->atype = IPVL_IPV6; 689 list_add_tail(&addr->anode, &ipvlan->addrs); 690 691 /* If the interface is not up, the address will be added to the hash 692 * list by ipvlan_open. 693 */ 694 if (netif_running(ipvlan->dev)) 695 ipvlan_ht_addr_add(ipvlan, addr); 696 697 return 0; 698 } 699 700 static void ipvlan_del_addr6(struct ipvl_dev *ipvlan, struct in6_addr *ip6_addr) 701 { 702 struct ipvl_addr *addr; 703 704 addr = ipvlan_find_addr(ipvlan, ip6_addr, true); 705 if (!addr) 706 return; 707 708 ipvlan_ht_addr_del(addr); 709 list_del(&addr->anode); 710 kfree_rcu(addr, rcu); 711 712 return; 713 } 714 715 static int ipvlan_addr6_event(struct notifier_block *unused, 716 unsigned long event, void *ptr) 717 { 718 struct inet6_ifaddr *if6 = (struct inet6_ifaddr *)ptr; 719 struct net_device *dev = (struct net_device *)if6->idev->dev; 720 struct ipvl_dev *ipvlan = netdev_priv(dev); 721 722 /* FIXME IPv6 autoconf calls us from bh without RTNL */ 723 if (in_softirq()) 724 return NOTIFY_DONE; 725 726 if (!netif_is_ipvlan(dev)) 727 return NOTIFY_DONE; 728 729 if (!ipvlan || !ipvlan->port) 730 return NOTIFY_DONE; 731 732 switch (event) { 733 case NETDEV_UP: 734 if (ipvlan_add_addr6(ipvlan, &if6->addr)) 735 return NOTIFY_BAD; 736 break; 737 738 case NETDEV_DOWN: 739 ipvlan_del_addr6(ipvlan, &if6->addr); 740 break; 741 } 742 743 return NOTIFY_OK; 744 } 745 746 static int ipvlan_add_addr4(struct ipvl_dev *ipvlan, struct in_addr *ip4_addr) 747 { 748 struct ipvl_addr *addr; 749 750 if (ipvlan_addr_busy(ipvlan->port, ip4_addr, false)) { 751 netif_err(ipvlan, ifup, ipvlan->dev, 752 "Failed to add IPv4=%pI4 on %s intf.\n", 753 ip4_addr, ipvlan->dev->name); 754 return -EINVAL; 755 } 756 addr = kzalloc(sizeof(struct ipvl_addr), GFP_KERNEL); 757 if (!addr) 758 return -ENOMEM; 759 760 addr->master = ipvlan; 761 memcpy(&addr->ip4addr, ip4_addr, sizeof(struct in_addr)); 762 addr->atype = IPVL_IPV4; 763 list_add_tail(&addr->anode, &ipvlan->addrs); 764 765 /* If the interface is not up, the address will be added to the hash 766 * list by ipvlan_open. 767 */ 768 if (netif_running(ipvlan->dev)) 769 ipvlan_ht_addr_add(ipvlan, addr); 770 771 return 0; 772 } 773 774 static void ipvlan_del_addr4(struct ipvl_dev *ipvlan, struct in_addr *ip4_addr) 775 { 776 struct ipvl_addr *addr; 777 778 addr = ipvlan_find_addr(ipvlan, ip4_addr, false); 779 if (!addr) 780 return; 781 782 ipvlan_ht_addr_del(addr); 783 list_del(&addr->anode); 784 kfree_rcu(addr, rcu); 785 786 return; 787 } 788 789 static int ipvlan_addr4_event(struct notifier_block *unused, 790 unsigned long event, void *ptr) 791 { 792 struct in_ifaddr *if4 = (struct in_ifaddr *)ptr; 793 struct net_device *dev = (struct net_device *)if4->ifa_dev->dev; 794 struct ipvl_dev *ipvlan = netdev_priv(dev); 795 struct in_addr ip4_addr; 796 797 if (!netif_is_ipvlan(dev)) 798 return NOTIFY_DONE; 799 800 if (!ipvlan || !ipvlan->port) 801 return NOTIFY_DONE; 802 803 switch (event) { 804 case NETDEV_UP: 805 ip4_addr.s_addr = if4->ifa_address; 806 if (ipvlan_add_addr4(ipvlan, &ip4_addr)) 807 return NOTIFY_BAD; 808 break; 809 810 case NETDEV_DOWN: 811 ip4_addr.s_addr = if4->ifa_address; 812 ipvlan_del_addr4(ipvlan, &ip4_addr); 813 break; 814 } 815 816 return NOTIFY_OK; 817 } 818 819 static struct notifier_block ipvlan_addr4_notifier_block __read_mostly = { 820 .notifier_call = ipvlan_addr4_event, 821 }; 822 823 static struct notifier_block ipvlan_notifier_block __read_mostly = { 824 .notifier_call = ipvlan_device_event, 825 }; 826 827 static struct notifier_block ipvlan_addr6_notifier_block __read_mostly = { 828 .notifier_call = ipvlan_addr6_event, 829 }; 830 831 static int __init ipvlan_init_module(void) 832 { 833 int err; 834 835 ipvlan_init_secret(); 836 register_netdevice_notifier(&ipvlan_notifier_block); 837 register_inet6addr_notifier(&ipvlan_addr6_notifier_block); 838 register_inetaddr_notifier(&ipvlan_addr4_notifier_block); 839 840 err = ipvlan_link_register(&ipvlan_link_ops); 841 if (err < 0) 842 goto error; 843 844 return 0; 845 error: 846 unregister_inetaddr_notifier(&ipvlan_addr4_notifier_block); 847 unregister_inet6addr_notifier(&ipvlan_addr6_notifier_block); 848 unregister_netdevice_notifier(&ipvlan_notifier_block); 849 return err; 850 } 851 852 static void __exit ipvlan_cleanup_module(void) 853 { 854 rtnl_link_unregister(&ipvlan_link_ops); 855 unregister_netdevice_notifier(&ipvlan_notifier_block); 856 unregister_inetaddr_notifier(&ipvlan_addr4_notifier_block); 857 unregister_inet6addr_notifier(&ipvlan_addr6_notifier_block); 858 } 859 860 module_init(ipvlan_init_module); 861 module_exit(ipvlan_cleanup_module); 862 863 MODULE_LICENSE("GPL"); 864 MODULE_AUTHOR("Mahesh Bandewar <maheshb@google.com>"); 865 MODULE_DESCRIPTION("Driver for L3 (IPv6/IPv4) based VLANs"); 866 MODULE_ALIAS_RTNL_LINK("ipvlan"); 867