1 // SPDX-License-Identifier: GPL-2.0-or-later 2 /* 3 * IPv6 Address [auto]configuration 4 * Linux INET6 implementation 5 * 6 * Authors: 7 * Pedro Roque <roque@di.fc.ul.pt> 8 * Alexey Kuznetsov <kuznet@ms2.inr.ac.ru> 9 */ 10 11 /* 12 * Changes: 13 * 14 * Janos Farkas : delete timer on ifdown 15 * <chexum@bankinf.banki.hu> 16 * Andi Kleen : kill double kfree on module 17 * unload. 18 * Maciej W. Rozycki : FDDI support 19 * sekiya@USAGI : Don't send too many RS 20 * packets. 21 * yoshfuji@USAGI : Fixed interval between DAD 22 * packets. 23 * YOSHIFUJI Hideaki @USAGI : improved accuracy of 24 * address validation timer. 25 * YOSHIFUJI Hideaki @USAGI : Privacy Extensions (RFC3041) 26 * support. 27 * Yuji SEKIYA @USAGI : Don't assign a same IPv6 28 * address on a same interface. 29 * YOSHIFUJI Hideaki @USAGI : ARCnet support 30 * YOSHIFUJI Hideaki @USAGI : convert /proc/net/if_inet6 to 31 * seq_file. 32 * YOSHIFUJI Hideaki @USAGI : improved source address 33 * selection; consider scope, 34 * status etc. 35 */ 36 37 #define pr_fmt(fmt) "IPv6: " fmt 38 39 #include <linux/errno.h> 40 #include <linux/types.h> 41 #include <linux/kernel.h> 42 #include <linux/sched/signal.h> 43 #include <linux/socket.h> 44 #include <linux/sockios.h> 45 #include <linux/net.h> 46 #include <linux/inet.h> 47 #include <linux/in6.h> 48 #include <linux/netdevice.h> 49 #include <linux/if_addr.h> 50 #include <linux/if_arp.h> 51 #include <linux/if_arcnet.h> 52 #include <linux/if_infiniband.h> 53 #include <linux/route.h> 54 #include <linux/inetdevice.h> 55 #include <linux/init.h> 56 #include <linux/slab.h> 57 #ifdef CONFIG_SYSCTL 58 #include <linux/sysctl.h> 59 #endif 60 #include <linux/capability.h> 61 #include <linux/delay.h> 62 #include <linux/notifier.h> 63 #include <linux/string.h> 64 #include <linux/hash.h> 65 66 #include <net/ip_tunnels.h> 67 #include <net/net_namespace.h> 68 #include <net/sock.h> 69 #include <net/snmp.h> 70 71 #include <net/6lowpan.h> 72 #include <net/firewire.h> 73 #include <net/ipv6.h> 74 #include <net/protocol.h> 75 #include <net/ndisc.h> 76 #include <net/ip6_route.h> 77 #include <net/addrconf.h> 78 #include <net/tcp.h> 79 #include <net/ip.h> 80 #include <net/netlink.h> 81 #include <net/pkt_sched.h> 82 #include <net/l3mdev.h> 83 #include <net/netdev_lock.h> 84 #include <linux/if_tunnel.h> 85 #include <linux/rtnetlink.h> 86 #include <linux/netconf.h> 87 #include <linux/random.h> 88 #include <linux/uaccess.h> 89 #include <linux/unaligned.h> 90 91 #include <linux/proc_fs.h> 92 #include <linux/seq_file.h> 93 #include <linux/export.h> 94 #include <linux/ioam6.h> 95 96 #define IPV6_MAX_STRLEN \ 97 sizeof("ffff:ffff:ffff:ffff:ffff:ffff:255.255.255.255") 98 99 static inline u32 cstamp_delta(unsigned long cstamp) 100 { 101 return (cstamp - INITIAL_JIFFIES) * 100UL / HZ; 102 } 103 104 static inline s32 rfc3315_s14_backoff_init(s32 irt) 105 { 106 /* multiply 'initial retransmission time' by 0.9 .. 1.1 */ 107 u64 tmp = get_random_u32_inclusive(900000, 1100000) * (u64)irt; 108 do_div(tmp, 1000000); 109 return (s32)tmp; 110 } 111 112 static inline s32 rfc3315_s14_backoff_update(s32 rt, s32 mrt) 113 { 114 /* multiply 'retransmission timeout' by 1.9 .. 2.1 */ 115 u64 tmp = get_random_u32_inclusive(1900000, 2100000) * (u64)rt; 116 do_div(tmp, 1000000); 117 if ((s32)tmp > mrt) { 118 /* multiply 'maximum retransmission time' by 0.9 .. 1.1 */ 119 tmp = get_random_u32_inclusive(900000, 1100000) * (u64)mrt; 120 do_div(tmp, 1000000); 121 } 122 return (s32)tmp; 123 } 124 125 #ifdef CONFIG_SYSCTL 126 static int addrconf_sysctl_register(struct inet6_dev *idev); 127 static void addrconf_sysctl_unregister(struct inet6_dev *idev); 128 #else 129 static inline int addrconf_sysctl_register(struct inet6_dev *idev) 130 { 131 return 0; 132 } 133 134 static inline void addrconf_sysctl_unregister(struct inet6_dev *idev) 135 { 136 } 137 #endif 138 139 static void ipv6_gen_rnd_iid(struct in6_addr *addr); 140 141 static int ipv6_generate_eui64(u8 *eui, struct net_device *dev); 142 static int ipv6_count_addresses(const struct inet6_dev *idev); 143 static int ipv6_generate_stable_address(struct in6_addr *addr, 144 u8 dad_count, 145 const struct inet6_dev *idev); 146 147 #define IN6_ADDR_HSIZE_SHIFT 8 148 #define IN6_ADDR_HSIZE (1 << IN6_ADDR_HSIZE_SHIFT) 149 150 static void addrconf_verify(struct net *net); 151 static void addrconf_verify_rtnl(struct net *net); 152 153 static struct workqueue_struct *addrconf_wq; 154 155 static void addrconf_join_anycast(struct inet6_ifaddr *ifp); 156 static void addrconf_leave_anycast(struct inet6_ifaddr *ifp); 157 158 static void addrconf_type_change(struct net_device *dev, 159 unsigned long event); 160 static int addrconf_ifdown(struct net_device *dev, bool unregister); 161 162 static struct fib6_info *addrconf_get_prefix_route(const struct in6_addr *pfx, 163 int plen, 164 const struct net_device *dev, 165 u32 flags, u32 noflags, 166 bool no_gw); 167 168 static void addrconf_dad_start(struct inet6_ifaddr *ifp); 169 static void addrconf_dad_work(struct work_struct *w); 170 static void addrconf_dad_completed(struct inet6_ifaddr *ifp, bool bump_id, 171 bool send_na); 172 static void addrconf_dad_run(struct inet6_dev *idev, bool restart); 173 static void addrconf_rs_timer(struct timer_list *t); 174 static void __ipv6_ifa_notify(int event, struct inet6_ifaddr *ifa); 175 static void ipv6_ifa_notify(int event, struct inet6_ifaddr *ifa); 176 177 static void inet6_prefix_notify(int event, struct inet6_dev *idev, 178 struct prefix_info *pinfo); 179 180 static struct ipv6_devconf ipv6_devconf __read_mostly = { 181 .forwarding = 0, 182 .hop_limit = IPV6_DEFAULT_HOPLIMIT, 183 .mtu6 = IPV6_MIN_MTU, 184 .accept_ra = 1, 185 .accept_redirects = 1, 186 .autoconf = 1, 187 .force_mld_version = 0, 188 .mldv1_unsolicited_report_interval = 10 * HZ, 189 .mldv2_unsolicited_report_interval = HZ, 190 .dad_transmits = 1, 191 .rtr_solicits = MAX_RTR_SOLICITATIONS, 192 .rtr_solicit_interval = RTR_SOLICITATION_INTERVAL, 193 .rtr_solicit_max_interval = RTR_SOLICITATION_MAX_INTERVAL, 194 .rtr_solicit_delay = MAX_RTR_SOLICITATION_DELAY, 195 .use_tempaddr = 0, 196 .temp_valid_lft = TEMP_VALID_LIFETIME, 197 .temp_prefered_lft = TEMP_PREFERRED_LIFETIME, 198 .regen_min_advance = REGEN_MIN_ADVANCE, 199 .regen_max_retry = REGEN_MAX_RETRY, 200 .max_desync_factor = MAX_DESYNC_FACTOR, 201 .max_addresses = IPV6_MAX_ADDRESSES, 202 .accept_ra_defrtr = 1, 203 .ra_defrtr_metric = IP6_RT_PRIO_USER, 204 .accept_ra_from_local = 0, 205 .accept_ra_min_hop_limit= 1, 206 .accept_ra_min_lft = 0, 207 .accept_ra_pinfo = 1, 208 #ifdef CONFIG_IPV6_ROUTER_PREF 209 .accept_ra_rtr_pref = 1, 210 .rtr_probe_interval = 60 * HZ, 211 #ifdef CONFIG_IPV6_ROUTE_INFO 212 .accept_ra_rt_info_min_plen = 0, 213 .accept_ra_rt_info_max_plen = 0, 214 #endif 215 #endif 216 .proxy_ndp = 0, 217 .accept_source_route = 0, /* we do not accept RH0 by default. */ 218 .disable_ipv6 = 0, 219 .accept_dad = 0, 220 .suppress_frag_ndisc = 1, 221 .accept_ra_mtu = 1, 222 .stable_secret = { 223 .initialized = false, 224 }, 225 .use_oif_addrs_only = 0, 226 .ignore_routes_with_linkdown = 0, 227 .keep_addr_on_down = 0, 228 .seg6_enabled = 0, 229 #ifdef CONFIG_IPV6_SEG6_HMAC 230 .seg6_require_hmac = 0, 231 #endif 232 .enhanced_dad = 1, 233 .addr_gen_mode = IN6_ADDR_GEN_MODE_EUI64, 234 .disable_policy = 0, 235 .rpl_seg_enabled = 0, 236 .ioam6_enabled = 0, 237 .ioam6_id = IOAM6_DEFAULT_IF_ID, 238 .ioam6_id_wide = IOAM6_DEFAULT_IF_ID_WIDE, 239 .ndisc_evict_nocarrier = 1, 240 .ra_honor_pio_life = 0, 241 .ra_honor_pio_pflag = 0, 242 }; 243 244 static struct ipv6_devconf ipv6_devconf_dflt __read_mostly = { 245 .forwarding = 0, 246 .hop_limit = IPV6_DEFAULT_HOPLIMIT, 247 .mtu6 = IPV6_MIN_MTU, 248 .accept_ra = 1, 249 .accept_redirects = 1, 250 .autoconf = 1, 251 .force_mld_version = 0, 252 .mldv1_unsolicited_report_interval = 10 * HZ, 253 .mldv2_unsolicited_report_interval = HZ, 254 .dad_transmits = 1, 255 .rtr_solicits = MAX_RTR_SOLICITATIONS, 256 .rtr_solicit_interval = RTR_SOLICITATION_INTERVAL, 257 .rtr_solicit_max_interval = RTR_SOLICITATION_MAX_INTERVAL, 258 .rtr_solicit_delay = MAX_RTR_SOLICITATION_DELAY, 259 .use_tempaddr = 0, 260 .temp_valid_lft = TEMP_VALID_LIFETIME, 261 .temp_prefered_lft = TEMP_PREFERRED_LIFETIME, 262 .regen_min_advance = REGEN_MIN_ADVANCE, 263 .regen_max_retry = REGEN_MAX_RETRY, 264 .max_desync_factor = MAX_DESYNC_FACTOR, 265 .max_addresses = IPV6_MAX_ADDRESSES, 266 .accept_ra_defrtr = 1, 267 .ra_defrtr_metric = IP6_RT_PRIO_USER, 268 .accept_ra_from_local = 0, 269 .accept_ra_min_hop_limit= 1, 270 .accept_ra_min_lft = 0, 271 .accept_ra_pinfo = 1, 272 #ifdef CONFIG_IPV6_ROUTER_PREF 273 .accept_ra_rtr_pref = 1, 274 .rtr_probe_interval = 60 * HZ, 275 #ifdef CONFIG_IPV6_ROUTE_INFO 276 .accept_ra_rt_info_min_plen = 0, 277 .accept_ra_rt_info_max_plen = 0, 278 #endif 279 #endif 280 .proxy_ndp = 0, 281 .accept_source_route = 0, /* we do not accept RH0 by default. */ 282 .disable_ipv6 = 0, 283 .accept_dad = 1, 284 .suppress_frag_ndisc = 1, 285 .accept_ra_mtu = 1, 286 .stable_secret = { 287 .initialized = false, 288 }, 289 .use_oif_addrs_only = 0, 290 .ignore_routes_with_linkdown = 0, 291 .keep_addr_on_down = 0, 292 .seg6_enabled = 0, 293 #ifdef CONFIG_IPV6_SEG6_HMAC 294 .seg6_require_hmac = 0, 295 #endif 296 .enhanced_dad = 1, 297 .addr_gen_mode = IN6_ADDR_GEN_MODE_EUI64, 298 .disable_policy = 0, 299 .rpl_seg_enabled = 0, 300 .ioam6_enabled = 0, 301 .ioam6_id = IOAM6_DEFAULT_IF_ID, 302 .ioam6_id_wide = IOAM6_DEFAULT_IF_ID_WIDE, 303 .ndisc_evict_nocarrier = 1, 304 .ra_honor_pio_life = 0, 305 .ra_honor_pio_pflag = 0, 306 }; 307 308 /* Check if link is ready: is it up and is a valid qdisc available */ 309 static inline bool addrconf_link_ready(const struct net_device *dev) 310 { 311 return netif_oper_up(dev) && !qdisc_tx_is_noop(dev); 312 } 313 314 static void addrconf_del_rs_timer(struct inet6_dev *idev) 315 { 316 if (timer_delete(&idev->rs_timer)) 317 __in6_dev_put(idev); 318 } 319 320 static void addrconf_del_dad_work(struct inet6_ifaddr *ifp) 321 { 322 if (cancel_delayed_work(&ifp->dad_work)) 323 __in6_ifa_put(ifp); 324 } 325 326 static void addrconf_mod_rs_timer(struct inet6_dev *idev, 327 unsigned long when) 328 { 329 if (!mod_timer(&idev->rs_timer, jiffies + when)) 330 in6_dev_hold(idev); 331 } 332 333 static void addrconf_mod_dad_work(struct inet6_ifaddr *ifp, 334 unsigned long delay) 335 { 336 in6_ifa_hold(ifp); 337 if (mod_delayed_work(addrconf_wq, &ifp->dad_work, delay)) 338 in6_ifa_put(ifp); 339 } 340 341 static int snmp6_alloc_dev(struct inet6_dev *idev) 342 { 343 int i; 344 345 idev->stats.ipv6 = alloc_percpu_gfp(struct ipstats_mib, GFP_KERNEL_ACCOUNT); 346 if (!idev->stats.ipv6) 347 goto err_ip; 348 349 for_each_possible_cpu(i) { 350 struct ipstats_mib *addrconf_stats; 351 addrconf_stats = per_cpu_ptr(idev->stats.ipv6, i); 352 u64_stats_init(&addrconf_stats->syncp); 353 } 354 355 356 idev->stats.icmpv6dev = kzalloc(sizeof(struct icmpv6_mib_device), 357 GFP_KERNEL); 358 if (!idev->stats.icmpv6dev) 359 goto err_icmp; 360 idev->stats.icmpv6msgdev = kzalloc(sizeof(struct icmpv6msg_mib_device), 361 GFP_KERNEL_ACCOUNT); 362 if (!idev->stats.icmpv6msgdev) 363 goto err_icmpmsg; 364 365 return 0; 366 367 err_icmpmsg: 368 kfree(idev->stats.icmpv6dev); 369 err_icmp: 370 free_percpu(idev->stats.ipv6); 371 err_ip: 372 return -ENOMEM; 373 } 374 375 static struct inet6_dev *ipv6_add_dev(struct net_device *dev) 376 { 377 struct inet6_dev *ndev; 378 int err = -ENOMEM; 379 380 ASSERT_RTNL(); 381 netdev_ops_assert_locked(dev); 382 383 if (dev->mtu < IPV6_MIN_MTU && dev != blackhole_netdev) 384 return ERR_PTR(-EINVAL); 385 386 ndev = kzalloc(sizeof(*ndev), GFP_KERNEL_ACCOUNT); 387 if (!ndev) 388 return ERR_PTR(err); 389 390 rwlock_init(&ndev->lock); 391 ndev->dev = dev; 392 INIT_LIST_HEAD(&ndev->addr_list); 393 timer_setup(&ndev->rs_timer, addrconf_rs_timer, 0); 394 memcpy(&ndev->cnf, dev_net(dev)->ipv6.devconf_dflt, sizeof(ndev->cnf)); 395 396 if (ndev->cnf.stable_secret.initialized) 397 ndev->cnf.addr_gen_mode = IN6_ADDR_GEN_MODE_STABLE_PRIVACY; 398 399 ndev->cnf.mtu6 = dev->mtu; 400 ndev->ra_mtu = 0; 401 ndev->nd_parms = neigh_parms_alloc(dev, &nd_tbl); 402 if (!ndev->nd_parms) { 403 kfree(ndev); 404 return ERR_PTR(err); 405 } 406 if (ndev->cnf.forwarding) 407 netif_disable_lro(dev); 408 /* We refer to the device */ 409 netdev_hold(dev, &ndev->dev_tracker, GFP_KERNEL); 410 411 if (snmp6_alloc_dev(ndev) < 0) { 412 netdev_dbg(dev, "%s: cannot allocate memory for statistics\n", 413 __func__); 414 neigh_parms_release(&nd_tbl, ndev->nd_parms); 415 netdev_put(dev, &ndev->dev_tracker); 416 kfree(ndev); 417 return ERR_PTR(err); 418 } 419 420 if (dev != blackhole_netdev) { 421 if (snmp6_register_dev(ndev) < 0) { 422 netdev_dbg(dev, "%s: cannot create /proc/net/dev_snmp6/%s\n", 423 __func__, dev->name); 424 goto err_release; 425 } 426 } 427 /* One reference from device. */ 428 refcount_set(&ndev->refcnt, 1); 429 430 if (dev->flags & (IFF_NOARP | IFF_LOOPBACK)) 431 ndev->cnf.accept_dad = -1; 432 433 #if IS_ENABLED(CONFIG_IPV6_SIT) 434 if (dev->type == ARPHRD_SIT && (dev->priv_flags & IFF_ISATAP)) { 435 pr_info("%s: Disabled Multicast RS\n", dev->name); 436 ndev->cnf.rtr_solicits = 0; 437 } 438 #endif 439 440 INIT_LIST_HEAD(&ndev->tempaddr_list); 441 ndev->desync_factor = U32_MAX; 442 if ((dev->flags&IFF_LOOPBACK) || 443 dev->type == ARPHRD_TUNNEL || 444 dev->type == ARPHRD_TUNNEL6 || 445 dev->type == ARPHRD_SIT || 446 dev->type == ARPHRD_NONE) { 447 ndev->cnf.use_tempaddr = -1; 448 } 449 450 ndev->token = in6addr_any; 451 452 if (netif_running(dev) && addrconf_link_ready(dev)) 453 ndev->if_flags |= IF_READY; 454 455 ipv6_mc_init_dev(ndev); 456 ndev->tstamp = jiffies; 457 if (dev != blackhole_netdev) { 458 err = addrconf_sysctl_register(ndev); 459 if (err) { 460 ipv6_mc_destroy_dev(ndev); 461 snmp6_unregister_dev(ndev); 462 goto err_release; 463 } 464 } 465 /* protected by rtnl_lock */ 466 rcu_assign_pointer(dev->ip6_ptr, ndev); 467 468 if (dev != blackhole_netdev) { 469 /* Join interface-local all-node multicast group */ 470 ipv6_dev_mc_inc(dev, &in6addr_interfacelocal_allnodes); 471 472 /* Join all-node multicast group */ 473 ipv6_dev_mc_inc(dev, &in6addr_linklocal_allnodes); 474 475 /* Join all-router multicast group if forwarding is set */ 476 if (ndev->cnf.forwarding && (dev->flags & IFF_MULTICAST)) 477 ipv6_dev_mc_inc(dev, &in6addr_linklocal_allrouters); 478 } 479 return ndev; 480 481 err_release: 482 neigh_parms_release(&nd_tbl, ndev->nd_parms); 483 ndev->dead = 1; 484 in6_dev_finish_destroy(ndev); 485 return ERR_PTR(err); 486 } 487 488 static struct inet6_dev *ipv6_find_idev(struct net_device *dev) 489 { 490 struct inet6_dev *idev; 491 492 ASSERT_RTNL(); 493 494 idev = __in6_dev_get(dev); 495 if (!idev) { 496 idev = ipv6_add_dev(dev); 497 if (IS_ERR(idev)) 498 return idev; 499 } 500 501 if (dev->flags&IFF_UP) 502 ipv6_mc_up(idev); 503 return idev; 504 } 505 506 static int inet6_netconf_msgsize_devconf(int type) 507 { 508 int size = NLMSG_ALIGN(sizeof(struct netconfmsg)) 509 + nla_total_size(4); /* NETCONFA_IFINDEX */ 510 bool all = false; 511 512 if (type == NETCONFA_ALL) 513 all = true; 514 515 if (all || type == NETCONFA_FORWARDING) 516 size += nla_total_size(4); 517 #ifdef CONFIG_IPV6_MROUTE 518 if (all || type == NETCONFA_MC_FORWARDING) 519 size += nla_total_size(4); 520 #endif 521 if (all || type == NETCONFA_PROXY_NEIGH) 522 size += nla_total_size(4); 523 524 if (all || type == NETCONFA_IGNORE_ROUTES_WITH_LINKDOWN) 525 size += nla_total_size(4); 526 527 return size; 528 } 529 530 static int inet6_netconf_fill_devconf(struct sk_buff *skb, int ifindex, 531 struct ipv6_devconf *devconf, u32 portid, 532 u32 seq, int event, unsigned int flags, 533 int type) 534 { 535 struct nlmsghdr *nlh; 536 struct netconfmsg *ncm; 537 bool all = false; 538 539 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct netconfmsg), 540 flags); 541 if (!nlh) 542 return -EMSGSIZE; 543 544 if (type == NETCONFA_ALL) 545 all = true; 546 547 ncm = nlmsg_data(nlh); 548 ncm->ncm_family = AF_INET6; 549 550 if (nla_put_s32(skb, NETCONFA_IFINDEX, ifindex) < 0) 551 goto nla_put_failure; 552 553 if (!devconf) 554 goto out; 555 556 if ((all || type == NETCONFA_FORWARDING) && 557 nla_put_s32(skb, NETCONFA_FORWARDING, 558 READ_ONCE(devconf->forwarding)) < 0) 559 goto nla_put_failure; 560 #ifdef CONFIG_IPV6_MROUTE 561 if ((all || type == NETCONFA_MC_FORWARDING) && 562 nla_put_s32(skb, NETCONFA_MC_FORWARDING, 563 atomic_read(&devconf->mc_forwarding)) < 0) 564 goto nla_put_failure; 565 #endif 566 if ((all || type == NETCONFA_PROXY_NEIGH) && 567 nla_put_s32(skb, NETCONFA_PROXY_NEIGH, 568 READ_ONCE(devconf->proxy_ndp)) < 0) 569 goto nla_put_failure; 570 571 if ((all || type == NETCONFA_IGNORE_ROUTES_WITH_LINKDOWN) && 572 nla_put_s32(skb, NETCONFA_IGNORE_ROUTES_WITH_LINKDOWN, 573 READ_ONCE(devconf->ignore_routes_with_linkdown)) < 0) 574 goto nla_put_failure; 575 576 out: 577 nlmsg_end(skb, nlh); 578 return 0; 579 580 nla_put_failure: 581 nlmsg_cancel(skb, nlh); 582 return -EMSGSIZE; 583 } 584 585 void inet6_netconf_notify_devconf(struct net *net, int event, int type, 586 int ifindex, struct ipv6_devconf *devconf) 587 { 588 struct sk_buff *skb; 589 int err = -ENOBUFS; 590 591 skb = nlmsg_new(inet6_netconf_msgsize_devconf(type), GFP_KERNEL); 592 if (!skb) 593 goto errout; 594 595 err = inet6_netconf_fill_devconf(skb, ifindex, devconf, 0, 0, 596 event, 0, type); 597 if (err < 0) { 598 /* -EMSGSIZE implies BUG in inet6_netconf_msgsize_devconf() */ 599 WARN_ON(err == -EMSGSIZE); 600 kfree_skb(skb); 601 goto errout; 602 } 603 rtnl_notify(skb, net, 0, RTNLGRP_IPV6_NETCONF, NULL, GFP_KERNEL); 604 return; 605 errout: 606 rtnl_set_sk_err(net, RTNLGRP_IPV6_NETCONF, err); 607 } 608 609 static const struct nla_policy devconf_ipv6_policy[NETCONFA_MAX+1] = { 610 [NETCONFA_IFINDEX] = { .len = sizeof(int) }, 611 [NETCONFA_FORWARDING] = { .len = sizeof(int) }, 612 [NETCONFA_PROXY_NEIGH] = { .len = sizeof(int) }, 613 [NETCONFA_IGNORE_ROUTES_WITH_LINKDOWN] = { .len = sizeof(int) }, 614 }; 615 616 static int inet6_netconf_valid_get_req(struct sk_buff *skb, 617 const struct nlmsghdr *nlh, 618 struct nlattr **tb, 619 struct netlink_ext_ack *extack) 620 { 621 int i, err; 622 623 if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(struct netconfmsg))) { 624 NL_SET_ERR_MSG_MOD(extack, "Invalid header for netconf get request"); 625 return -EINVAL; 626 } 627 628 if (!netlink_strict_get_check(skb)) 629 return nlmsg_parse_deprecated(nlh, sizeof(struct netconfmsg), 630 tb, NETCONFA_MAX, 631 devconf_ipv6_policy, extack); 632 633 err = nlmsg_parse_deprecated_strict(nlh, sizeof(struct netconfmsg), 634 tb, NETCONFA_MAX, 635 devconf_ipv6_policy, extack); 636 if (err) 637 return err; 638 639 for (i = 0; i <= NETCONFA_MAX; i++) { 640 if (!tb[i]) 641 continue; 642 643 switch (i) { 644 case NETCONFA_IFINDEX: 645 break; 646 default: 647 NL_SET_ERR_MSG_MOD(extack, "Unsupported attribute in netconf get request"); 648 return -EINVAL; 649 } 650 } 651 652 return 0; 653 } 654 655 static int inet6_netconf_get_devconf(struct sk_buff *in_skb, 656 struct nlmsghdr *nlh, 657 struct netlink_ext_ack *extack) 658 { 659 struct net *net = sock_net(in_skb->sk); 660 struct nlattr *tb[NETCONFA_MAX+1]; 661 struct inet6_dev *in6_dev = NULL; 662 struct net_device *dev = NULL; 663 struct sk_buff *skb; 664 struct ipv6_devconf *devconf; 665 int ifindex; 666 int err; 667 668 err = inet6_netconf_valid_get_req(in_skb, nlh, tb, extack); 669 if (err < 0) 670 return err; 671 672 if (!tb[NETCONFA_IFINDEX]) 673 return -EINVAL; 674 675 err = -EINVAL; 676 ifindex = nla_get_s32(tb[NETCONFA_IFINDEX]); 677 switch (ifindex) { 678 case NETCONFA_IFINDEX_ALL: 679 devconf = net->ipv6.devconf_all; 680 break; 681 case NETCONFA_IFINDEX_DEFAULT: 682 devconf = net->ipv6.devconf_dflt; 683 break; 684 default: 685 dev = dev_get_by_index(net, ifindex); 686 if (!dev) 687 return -EINVAL; 688 in6_dev = in6_dev_get(dev); 689 if (!in6_dev) 690 goto errout; 691 devconf = &in6_dev->cnf; 692 break; 693 } 694 695 err = -ENOBUFS; 696 skb = nlmsg_new(inet6_netconf_msgsize_devconf(NETCONFA_ALL), GFP_KERNEL); 697 if (!skb) 698 goto errout; 699 700 err = inet6_netconf_fill_devconf(skb, ifindex, devconf, 701 NETLINK_CB(in_skb).portid, 702 nlh->nlmsg_seq, RTM_NEWNETCONF, 0, 703 NETCONFA_ALL); 704 if (err < 0) { 705 /* -EMSGSIZE implies BUG in inet6_netconf_msgsize_devconf() */ 706 WARN_ON(err == -EMSGSIZE); 707 kfree_skb(skb); 708 goto errout; 709 } 710 err = rtnl_unicast(skb, net, NETLINK_CB(in_skb).portid); 711 errout: 712 if (in6_dev) 713 in6_dev_put(in6_dev); 714 dev_put(dev); 715 return err; 716 } 717 718 /* Combine dev_addr_genid and dev_base_seq to detect changes. 719 */ 720 static u32 inet6_base_seq(const struct net *net) 721 { 722 u32 res = atomic_read(&net->ipv6.dev_addr_genid) + 723 READ_ONCE(net->dev_base_seq); 724 725 /* Must not return 0 (see nl_dump_check_consistent()). 726 * Chose a value far away from 0. 727 */ 728 if (!res) 729 res = 0x80000000; 730 return res; 731 } 732 733 static int inet6_netconf_dump_devconf(struct sk_buff *skb, 734 struct netlink_callback *cb) 735 { 736 const struct nlmsghdr *nlh = cb->nlh; 737 struct net *net = sock_net(skb->sk); 738 struct { 739 unsigned long ifindex; 740 unsigned int all_default; 741 } *ctx = (void *)cb->ctx; 742 struct net_device *dev; 743 struct inet6_dev *idev; 744 int err = 0; 745 746 if (cb->strict_check) { 747 struct netlink_ext_ack *extack = cb->extack; 748 struct netconfmsg *ncm; 749 750 if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*ncm))) { 751 NL_SET_ERR_MSG_MOD(extack, "Invalid header for netconf dump request"); 752 return -EINVAL; 753 } 754 755 if (nlmsg_attrlen(nlh, sizeof(*ncm))) { 756 NL_SET_ERR_MSG_MOD(extack, "Invalid data after header in netconf dump request"); 757 return -EINVAL; 758 } 759 } 760 761 rcu_read_lock(); 762 for_each_netdev_dump(net, dev, ctx->ifindex) { 763 idev = __in6_dev_get(dev); 764 if (!idev) 765 continue; 766 err = inet6_netconf_fill_devconf(skb, dev->ifindex, 767 &idev->cnf, 768 NETLINK_CB(cb->skb).portid, 769 nlh->nlmsg_seq, 770 RTM_NEWNETCONF, 771 NLM_F_MULTI, 772 NETCONFA_ALL); 773 if (err < 0) 774 goto done; 775 } 776 if (ctx->all_default == 0) { 777 err = inet6_netconf_fill_devconf(skb, NETCONFA_IFINDEX_ALL, 778 net->ipv6.devconf_all, 779 NETLINK_CB(cb->skb).portid, 780 nlh->nlmsg_seq, 781 RTM_NEWNETCONF, NLM_F_MULTI, 782 NETCONFA_ALL); 783 if (err < 0) 784 goto done; 785 ctx->all_default++; 786 } 787 if (ctx->all_default == 1) { 788 err = inet6_netconf_fill_devconf(skb, NETCONFA_IFINDEX_DEFAULT, 789 net->ipv6.devconf_dflt, 790 NETLINK_CB(cb->skb).portid, 791 nlh->nlmsg_seq, 792 RTM_NEWNETCONF, NLM_F_MULTI, 793 NETCONFA_ALL); 794 if (err < 0) 795 goto done; 796 ctx->all_default++; 797 } 798 done: 799 rcu_read_unlock(); 800 return err; 801 } 802 803 #ifdef CONFIG_SYSCTL 804 static void dev_forward_change(struct inet6_dev *idev) 805 { 806 struct net_device *dev; 807 struct inet6_ifaddr *ifa; 808 LIST_HEAD(tmp_addr_list); 809 810 if (!idev) 811 return; 812 dev = idev->dev; 813 if (idev->cnf.forwarding) 814 dev_disable_lro(dev); 815 if (dev->flags & IFF_MULTICAST) { 816 if (idev->cnf.forwarding) { 817 ipv6_dev_mc_inc(dev, &in6addr_linklocal_allrouters); 818 ipv6_dev_mc_inc(dev, &in6addr_interfacelocal_allrouters); 819 ipv6_dev_mc_inc(dev, &in6addr_sitelocal_allrouters); 820 } else { 821 ipv6_dev_mc_dec(dev, &in6addr_linklocal_allrouters); 822 ipv6_dev_mc_dec(dev, &in6addr_interfacelocal_allrouters); 823 ipv6_dev_mc_dec(dev, &in6addr_sitelocal_allrouters); 824 } 825 } 826 827 read_lock_bh(&idev->lock); 828 list_for_each_entry(ifa, &idev->addr_list, if_list) { 829 if (ifa->flags&IFA_F_TENTATIVE) 830 continue; 831 list_add_tail(&ifa->if_list_aux, &tmp_addr_list); 832 } 833 read_unlock_bh(&idev->lock); 834 835 while (!list_empty(&tmp_addr_list)) { 836 ifa = list_first_entry(&tmp_addr_list, 837 struct inet6_ifaddr, if_list_aux); 838 list_del(&ifa->if_list_aux); 839 if (idev->cnf.forwarding) 840 addrconf_join_anycast(ifa); 841 else 842 addrconf_leave_anycast(ifa); 843 } 844 845 inet6_netconf_notify_devconf(dev_net(dev), RTM_NEWNETCONF, 846 NETCONFA_FORWARDING, 847 dev->ifindex, &idev->cnf); 848 } 849 850 851 static void addrconf_forward_change(struct net *net, __s32 newf) 852 { 853 struct net_device *dev; 854 struct inet6_dev *idev; 855 856 for_each_netdev(net, dev) { 857 idev = __in6_dev_get_rtnl_net(dev); 858 if (idev) { 859 int changed = (!idev->cnf.forwarding) ^ (!newf); 860 861 WRITE_ONCE(idev->cnf.forwarding, newf); 862 if (changed) 863 dev_forward_change(idev); 864 } 865 } 866 } 867 868 static int addrconf_fixup_forwarding(const struct ctl_table *table, int *p, int newf) 869 { 870 struct net *net = (struct net *)table->extra2; 871 int old; 872 873 if (!rtnl_net_trylock(net)) 874 return restart_syscall(); 875 876 old = *p; 877 WRITE_ONCE(*p, newf); 878 879 if (p == &net->ipv6.devconf_dflt->forwarding) { 880 if ((!newf) ^ (!old)) 881 inet6_netconf_notify_devconf(net, RTM_NEWNETCONF, 882 NETCONFA_FORWARDING, 883 NETCONFA_IFINDEX_DEFAULT, 884 net->ipv6.devconf_dflt); 885 rtnl_net_unlock(net); 886 return 0; 887 } 888 889 if (p == &net->ipv6.devconf_all->forwarding) { 890 int old_dflt = net->ipv6.devconf_dflt->forwarding; 891 892 WRITE_ONCE(net->ipv6.devconf_dflt->forwarding, newf); 893 if ((!newf) ^ (!old_dflt)) 894 inet6_netconf_notify_devconf(net, RTM_NEWNETCONF, 895 NETCONFA_FORWARDING, 896 NETCONFA_IFINDEX_DEFAULT, 897 net->ipv6.devconf_dflt); 898 899 addrconf_forward_change(net, newf); 900 if ((!newf) ^ (!old)) 901 inet6_netconf_notify_devconf(net, RTM_NEWNETCONF, 902 NETCONFA_FORWARDING, 903 NETCONFA_IFINDEX_ALL, 904 net->ipv6.devconf_all); 905 } else if ((!newf) ^ (!old)) 906 dev_forward_change((struct inet6_dev *)table->extra1); 907 rtnl_net_unlock(net); 908 909 if (newf) 910 rt6_purge_dflt_routers(net); 911 return 1; 912 } 913 914 static void addrconf_linkdown_change(struct net *net, __s32 newf) 915 { 916 struct net_device *dev; 917 struct inet6_dev *idev; 918 919 for_each_netdev(net, dev) { 920 idev = __in6_dev_get_rtnl_net(dev); 921 if (idev) { 922 int changed = (!idev->cnf.ignore_routes_with_linkdown) ^ (!newf); 923 924 WRITE_ONCE(idev->cnf.ignore_routes_with_linkdown, newf); 925 if (changed) 926 inet6_netconf_notify_devconf(dev_net(dev), 927 RTM_NEWNETCONF, 928 NETCONFA_IGNORE_ROUTES_WITH_LINKDOWN, 929 dev->ifindex, 930 &idev->cnf); 931 } 932 } 933 } 934 935 static int addrconf_fixup_linkdown(const struct ctl_table *table, int *p, int newf) 936 { 937 struct net *net = (struct net *)table->extra2; 938 int old; 939 940 if (!rtnl_net_trylock(net)) 941 return restart_syscall(); 942 943 old = *p; 944 WRITE_ONCE(*p, newf); 945 946 if (p == &net->ipv6.devconf_dflt->ignore_routes_with_linkdown) { 947 if ((!newf) ^ (!old)) 948 inet6_netconf_notify_devconf(net, 949 RTM_NEWNETCONF, 950 NETCONFA_IGNORE_ROUTES_WITH_LINKDOWN, 951 NETCONFA_IFINDEX_DEFAULT, 952 net->ipv6.devconf_dflt); 953 rtnl_net_unlock(net); 954 return 0; 955 } 956 957 if (p == &net->ipv6.devconf_all->ignore_routes_with_linkdown) { 958 WRITE_ONCE(net->ipv6.devconf_dflt->ignore_routes_with_linkdown, newf); 959 addrconf_linkdown_change(net, newf); 960 if ((!newf) ^ (!old)) 961 inet6_netconf_notify_devconf(net, 962 RTM_NEWNETCONF, 963 NETCONFA_IGNORE_ROUTES_WITH_LINKDOWN, 964 NETCONFA_IFINDEX_ALL, 965 net->ipv6.devconf_all); 966 } 967 968 rtnl_net_unlock(net); 969 970 return 1; 971 } 972 973 #endif 974 975 /* Nobody refers to this ifaddr, destroy it */ 976 void inet6_ifa_finish_destroy(struct inet6_ifaddr *ifp) 977 { 978 WARN_ON(!hlist_unhashed(&ifp->addr_lst)); 979 980 #ifdef NET_REFCNT_DEBUG 981 pr_debug("%s\n", __func__); 982 #endif 983 984 in6_dev_put(ifp->idev); 985 986 if (cancel_delayed_work(&ifp->dad_work)) 987 pr_notice("delayed DAD work was pending while freeing ifa=%p\n", 988 ifp); 989 990 if (ifp->state != INET6_IFADDR_STATE_DEAD) { 991 pr_warn("Freeing alive inet6 address %p\n", ifp); 992 return; 993 } 994 995 kfree_rcu(ifp, rcu); 996 } 997 998 static void 999 ipv6_link_dev_addr(struct inet6_dev *idev, struct inet6_ifaddr *ifp) 1000 { 1001 struct list_head *p; 1002 int ifp_scope = ipv6_addr_src_scope(&ifp->addr); 1003 1004 /* 1005 * Each device address list is sorted in order of scope - 1006 * global before linklocal. 1007 */ 1008 list_for_each(p, &idev->addr_list) { 1009 struct inet6_ifaddr *ifa 1010 = list_entry(p, struct inet6_ifaddr, if_list); 1011 if (ifp_scope >= ipv6_addr_src_scope(&ifa->addr)) 1012 break; 1013 } 1014 1015 list_add_tail_rcu(&ifp->if_list, p); 1016 } 1017 1018 static u32 inet6_addr_hash(const struct net *net, const struct in6_addr *addr) 1019 { 1020 u32 val = __ipv6_addr_jhash(addr, net_hash_mix(net)); 1021 1022 return hash_32(val, IN6_ADDR_HSIZE_SHIFT); 1023 } 1024 1025 static bool ipv6_chk_same_addr(struct net *net, const struct in6_addr *addr, 1026 struct net_device *dev, unsigned int hash) 1027 { 1028 struct inet6_ifaddr *ifp; 1029 1030 hlist_for_each_entry(ifp, &net->ipv6.inet6_addr_lst[hash], addr_lst) { 1031 if (ipv6_addr_equal(&ifp->addr, addr)) { 1032 if (!dev || ifp->idev->dev == dev) 1033 return true; 1034 } 1035 } 1036 return false; 1037 } 1038 1039 static int ipv6_add_addr_hash(struct net_device *dev, struct inet6_ifaddr *ifa) 1040 { 1041 struct net *net = dev_net(dev); 1042 unsigned int hash = inet6_addr_hash(net, &ifa->addr); 1043 int err = 0; 1044 1045 spin_lock_bh(&net->ipv6.addrconf_hash_lock); 1046 1047 /* Ignore adding duplicate addresses on an interface */ 1048 if (ipv6_chk_same_addr(net, &ifa->addr, dev, hash)) { 1049 netdev_dbg(dev, "ipv6_add_addr: already assigned\n"); 1050 err = -EEXIST; 1051 } else { 1052 hlist_add_head_rcu(&ifa->addr_lst, &net->ipv6.inet6_addr_lst[hash]); 1053 } 1054 1055 spin_unlock_bh(&net->ipv6.addrconf_hash_lock); 1056 1057 return err; 1058 } 1059 1060 /* On success it returns ifp with increased reference count */ 1061 1062 static struct inet6_ifaddr * 1063 ipv6_add_addr(struct inet6_dev *idev, struct ifa6_config *cfg, 1064 bool can_block, struct netlink_ext_ack *extack) 1065 { 1066 gfp_t gfp_flags = can_block ? GFP_KERNEL : GFP_ATOMIC; 1067 int addr_type = ipv6_addr_type(cfg->pfx); 1068 struct net *net = dev_net(idev->dev); 1069 struct inet6_ifaddr *ifa = NULL; 1070 struct fib6_info *f6i = NULL; 1071 int err = 0; 1072 1073 if (addr_type == IPV6_ADDR_ANY) { 1074 NL_SET_ERR_MSG_MOD(extack, "Invalid address"); 1075 return ERR_PTR(-EADDRNOTAVAIL); 1076 } else if (addr_type & IPV6_ADDR_MULTICAST && 1077 !(cfg->ifa_flags & IFA_F_MCAUTOJOIN)) { 1078 NL_SET_ERR_MSG_MOD(extack, "Cannot assign multicast address without \"IFA_F_MCAUTOJOIN\" flag"); 1079 return ERR_PTR(-EADDRNOTAVAIL); 1080 } else if (!(idev->dev->flags & IFF_LOOPBACK) && 1081 !netif_is_l3_master(idev->dev) && 1082 addr_type & IPV6_ADDR_LOOPBACK) { 1083 NL_SET_ERR_MSG_MOD(extack, "Cannot assign loopback address on this device"); 1084 return ERR_PTR(-EADDRNOTAVAIL); 1085 } 1086 1087 if (idev->dead) { 1088 NL_SET_ERR_MSG_MOD(extack, "device is going away"); 1089 err = -ENODEV; 1090 goto out; 1091 } 1092 1093 if (idev->cnf.disable_ipv6) { 1094 NL_SET_ERR_MSG_MOD(extack, "IPv6 is disabled on this device"); 1095 err = -EACCES; 1096 goto out; 1097 } 1098 1099 /* validator notifier needs to be blocking; 1100 * do not call in atomic context 1101 */ 1102 if (can_block) { 1103 struct in6_validator_info i6vi = { 1104 .i6vi_addr = *cfg->pfx, 1105 .i6vi_dev = idev, 1106 .extack = extack, 1107 }; 1108 1109 err = inet6addr_validator_notifier_call_chain(NETDEV_UP, &i6vi); 1110 err = notifier_to_errno(err); 1111 if (err < 0) 1112 goto out; 1113 } 1114 1115 ifa = kzalloc(sizeof(*ifa), gfp_flags | __GFP_ACCOUNT); 1116 if (!ifa) { 1117 err = -ENOBUFS; 1118 goto out; 1119 } 1120 1121 f6i = addrconf_f6i_alloc(net, idev, cfg->pfx, false, gfp_flags, extack); 1122 if (IS_ERR(f6i)) { 1123 err = PTR_ERR(f6i); 1124 f6i = NULL; 1125 goto out; 1126 } 1127 1128 neigh_parms_data_state_setall(idev->nd_parms); 1129 1130 ifa->addr = *cfg->pfx; 1131 if (cfg->peer_pfx) 1132 ifa->peer_addr = *cfg->peer_pfx; 1133 1134 spin_lock_init(&ifa->lock); 1135 INIT_DELAYED_WORK(&ifa->dad_work, addrconf_dad_work); 1136 INIT_HLIST_NODE(&ifa->addr_lst); 1137 ifa->scope = cfg->scope; 1138 ifa->prefix_len = cfg->plen; 1139 ifa->rt_priority = cfg->rt_priority; 1140 ifa->flags = cfg->ifa_flags; 1141 ifa->ifa_proto = cfg->ifa_proto; 1142 /* No need to add the TENTATIVE flag for addresses with NODAD */ 1143 if (!(cfg->ifa_flags & IFA_F_NODAD)) 1144 ifa->flags |= IFA_F_TENTATIVE; 1145 ifa->valid_lft = cfg->valid_lft; 1146 ifa->prefered_lft = cfg->preferred_lft; 1147 ifa->cstamp = ifa->tstamp = jiffies; 1148 ifa->tokenized = false; 1149 1150 ifa->rt = f6i; 1151 1152 ifa->idev = idev; 1153 in6_dev_hold(idev); 1154 1155 /* For caller */ 1156 refcount_set(&ifa->refcnt, 1); 1157 1158 rcu_read_lock(); 1159 1160 err = ipv6_add_addr_hash(idev->dev, ifa); 1161 if (err < 0) { 1162 rcu_read_unlock(); 1163 goto out; 1164 } 1165 1166 write_lock_bh(&idev->lock); 1167 1168 /* Add to inet6_dev unicast addr list. */ 1169 ipv6_link_dev_addr(idev, ifa); 1170 1171 if (ifa->flags&IFA_F_TEMPORARY) { 1172 list_add(&ifa->tmp_list, &idev->tempaddr_list); 1173 in6_ifa_hold(ifa); 1174 } 1175 1176 in6_ifa_hold(ifa); 1177 write_unlock_bh(&idev->lock); 1178 1179 rcu_read_unlock(); 1180 1181 inet6addr_notifier_call_chain(NETDEV_UP, ifa); 1182 out: 1183 if (unlikely(err < 0)) { 1184 fib6_info_release(f6i); 1185 1186 if (ifa) { 1187 if (ifa->idev) 1188 in6_dev_put(ifa->idev); 1189 kfree(ifa); 1190 } 1191 ifa = ERR_PTR(err); 1192 } 1193 1194 return ifa; 1195 } 1196 1197 enum cleanup_prefix_rt_t { 1198 CLEANUP_PREFIX_RT_NOP, /* no cleanup action for prefix route */ 1199 CLEANUP_PREFIX_RT_DEL, /* delete the prefix route */ 1200 CLEANUP_PREFIX_RT_EXPIRE, /* update the lifetime of the prefix route */ 1201 }; 1202 1203 /* 1204 * Check, whether the prefix for ifp would still need a prefix route 1205 * after deleting ifp. The function returns one of the CLEANUP_PREFIX_RT_* 1206 * constants. 1207 * 1208 * 1) we don't purge prefix if address was not permanent. 1209 * prefix is managed by its own lifetime. 1210 * 2) we also don't purge, if the address was IFA_F_NOPREFIXROUTE. 1211 * 3) if there are no addresses, delete prefix. 1212 * 4) if there are still other permanent address(es), 1213 * corresponding prefix is still permanent. 1214 * 5) if there are still other addresses with IFA_F_NOPREFIXROUTE, 1215 * don't purge the prefix, assume user space is managing it. 1216 * 6) otherwise, update prefix lifetime to the 1217 * longest valid lifetime among the corresponding 1218 * addresses on the device. 1219 * Note: subsequent RA will update lifetime. 1220 **/ 1221 static enum cleanup_prefix_rt_t 1222 check_cleanup_prefix_route(struct inet6_ifaddr *ifp, unsigned long *expires) 1223 { 1224 struct inet6_ifaddr *ifa; 1225 struct inet6_dev *idev = ifp->idev; 1226 unsigned long lifetime; 1227 enum cleanup_prefix_rt_t action = CLEANUP_PREFIX_RT_DEL; 1228 1229 *expires = jiffies; 1230 1231 list_for_each_entry(ifa, &idev->addr_list, if_list) { 1232 if (ifa == ifp) 1233 continue; 1234 if (ifa->prefix_len != ifp->prefix_len || 1235 !ipv6_prefix_equal(&ifa->addr, &ifp->addr, 1236 ifp->prefix_len)) 1237 continue; 1238 if (ifa->flags & (IFA_F_PERMANENT | IFA_F_NOPREFIXROUTE)) 1239 return CLEANUP_PREFIX_RT_NOP; 1240 1241 action = CLEANUP_PREFIX_RT_EXPIRE; 1242 1243 spin_lock(&ifa->lock); 1244 1245 lifetime = addrconf_timeout_fixup(ifa->valid_lft, HZ); 1246 /* 1247 * Note: Because this address is 1248 * not permanent, lifetime < 1249 * LONG_MAX / HZ here. 1250 */ 1251 if (time_before(*expires, ifa->tstamp + lifetime * HZ)) 1252 *expires = ifa->tstamp + lifetime * HZ; 1253 spin_unlock(&ifa->lock); 1254 } 1255 1256 return action; 1257 } 1258 1259 static void 1260 cleanup_prefix_route(struct inet6_ifaddr *ifp, unsigned long expires, 1261 bool del_rt, bool del_peer) 1262 { 1263 struct fib6_table *table; 1264 struct fib6_info *f6i; 1265 1266 f6i = addrconf_get_prefix_route(del_peer ? &ifp->peer_addr : &ifp->addr, 1267 ifp->prefix_len, 1268 ifp->idev->dev, 0, RTF_DEFAULT, true); 1269 if (f6i) { 1270 if (del_rt) 1271 ip6_del_rt(dev_net(ifp->idev->dev), f6i, false); 1272 else { 1273 if (!(f6i->fib6_flags & RTF_EXPIRES)) { 1274 table = f6i->fib6_table; 1275 spin_lock_bh(&table->tb6_lock); 1276 1277 fib6_set_expires(f6i, expires); 1278 fib6_add_gc_list(f6i); 1279 1280 spin_unlock_bh(&table->tb6_lock); 1281 } 1282 fib6_info_release(f6i); 1283 } 1284 } 1285 } 1286 1287 1288 /* This function wants to get referenced ifp and releases it before return */ 1289 1290 static void ipv6_del_addr(struct inet6_ifaddr *ifp) 1291 { 1292 enum cleanup_prefix_rt_t action = CLEANUP_PREFIX_RT_NOP; 1293 struct net *net = dev_net(ifp->idev->dev); 1294 unsigned long expires; 1295 int state; 1296 1297 ASSERT_RTNL(); 1298 1299 spin_lock_bh(&ifp->lock); 1300 state = ifp->state; 1301 ifp->state = INET6_IFADDR_STATE_DEAD; 1302 spin_unlock_bh(&ifp->lock); 1303 1304 if (state == INET6_IFADDR_STATE_DEAD) 1305 goto out; 1306 1307 spin_lock_bh(&net->ipv6.addrconf_hash_lock); 1308 hlist_del_init_rcu(&ifp->addr_lst); 1309 spin_unlock_bh(&net->ipv6.addrconf_hash_lock); 1310 1311 write_lock_bh(&ifp->idev->lock); 1312 1313 if (ifp->flags&IFA_F_TEMPORARY) { 1314 list_del(&ifp->tmp_list); 1315 if (ifp->ifpub) { 1316 in6_ifa_put(ifp->ifpub); 1317 ifp->ifpub = NULL; 1318 } 1319 __in6_ifa_put(ifp); 1320 } 1321 1322 if (ifp->flags & IFA_F_PERMANENT && !(ifp->flags & IFA_F_NOPREFIXROUTE)) 1323 action = check_cleanup_prefix_route(ifp, &expires); 1324 1325 list_del_rcu(&ifp->if_list); 1326 __in6_ifa_put(ifp); 1327 1328 write_unlock_bh(&ifp->idev->lock); 1329 1330 addrconf_del_dad_work(ifp); 1331 1332 ipv6_ifa_notify(RTM_DELADDR, ifp); 1333 1334 inet6addr_notifier_call_chain(NETDEV_DOWN, ifp); 1335 1336 if (action != CLEANUP_PREFIX_RT_NOP) { 1337 cleanup_prefix_route(ifp, expires, 1338 action == CLEANUP_PREFIX_RT_DEL, false); 1339 } 1340 1341 /* clean up prefsrc entries */ 1342 rt6_remove_prefsrc(ifp); 1343 out: 1344 in6_ifa_put(ifp); 1345 } 1346 1347 static unsigned long ipv6_get_regen_advance(const struct inet6_dev *idev) 1348 { 1349 return READ_ONCE(idev->cnf.regen_min_advance) + 1350 READ_ONCE(idev->cnf.regen_max_retry) * 1351 READ_ONCE(idev->cnf.dad_transmits) * 1352 max(NEIGH_VAR(idev->nd_parms, RETRANS_TIME), HZ/100) / HZ; 1353 } 1354 1355 static int ipv6_create_tempaddr(struct inet6_ifaddr *ifp, bool block) 1356 { 1357 struct inet6_dev *idev = ifp->idev; 1358 unsigned long tmp_tstamp, age; 1359 unsigned long regen_advance; 1360 unsigned long now = jiffies; 1361 u32 if_public_preferred_lft; 1362 s32 cnf_temp_preferred_lft; 1363 struct inet6_ifaddr *ift; 1364 struct ifa6_config cfg; 1365 long max_desync_factor; 1366 struct in6_addr addr; 1367 int ret = 0; 1368 1369 write_lock_bh(&idev->lock); 1370 1371 retry: 1372 in6_dev_hold(idev); 1373 if (READ_ONCE(idev->cnf.use_tempaddr) <= 0) { 1374 write_unlock_bh(&idev->lock); 1375 pr_info("%s: use_tempaddr is disabled\n", __func__); 1376 in6_dev_put(idev); 1377 ret = -1; 1378 goto out; 1379 } 1380 spin_lock_bh(&ifp->lock); 1381 if (ifp->regen_count++ >= READ_ONCE(idev->cnf.regen_max_retry)) { 1382 WRITE_ONCE(idev->cnf.use_tempaddr, -1); /*XXX*/ 1383 spin_unlock_bh(&ifp->lock); 1384 write_unlock_bh(&idev->lock); 1385 pr_warn("%s: regeneration time exceeded - disabled temporary address support\n", 1386 __func__); 1387 in6_dev_put(idev); 1388 ret = -1; 1389 goto out; 1390 } 1391 in6_ifa_hold(ifp); 1392 memcpy(addr.s6_addr, ifp->addr.s6_addr, 8); 1393 ipv6_gen_rnd_iid(&addr); 1394 1395 age = (now - ifp->tstamp) / HZ; 1396 1397 regen_advance = ipv6_get_regen_advance(idev); 1398 1399 /* recalculate max_desync_factor each time and update 1400 * idev->desync_factor if it's larger 1401 */ 1402 cnf_temp_preferred_lft = READ_ONCE(idev->cnf.temp_prefered_lft); 1403 max_desync_factor = min_t(long, 1404 READ_ONCE(idev->cnf.max_desync_factor), 1405 cnf_temp_preferred_lft - regen_advance); 1406 1407 if (unlikely(idev->desync_factor > max_desync_factor)) { 1408 if (max_desync_factor > 0) { 1409 get_random_bytes(&idev->desync_factor, 1410 sizeof(idev->desync_factor)); 1411 idev->desync_factor %= max_desync_factor; 1412 } else { 1413 idev->desync_factor = 0; 1414 } 1415 } 1416 1417 if_public_preferred_lft = ifp->prefered_lft; 1418 1419 memset(&cfg, 0, sizeof(cfg)); 1420 cfg.valid_lft = min_t(__u32, ifp->valid_lft, 1421 READ_ONCE(idev->cnf.temp_valid_lft) + age); 1422 cfg.preferred_lft = cnf_temp_preferred_lft + age - idev->desync_factor; 1423 cfg.preferred_lft = min_t(__u32, if_public_preferred_lft, cfg.preferred_lft); 1424 cfg.preferred_lft = min_t(__u32, cfg.valid_lft, cfg.preferred_lft); 1425 1426 cfg.plen = ifp->prefix_len; 1427 tmp_tstamp = ifp->tstamp; 1428 spin_unlock_bh(&ifp->lock); 1429 1430 write_unlock_bh(&idev->lock); 1431 1432 /* From RFC 4941: 1433 * 1434 * A temporary address is created only if this calculated Preferred 1435 * Lifetime is greater than REGEN_ADVANCE time units. In 1436 * particular, an implementation must not create a temporary address 1437 * with a zero Preferred Lifetime. 1438 * 1439 * ... 1440 * 1441 * When creating a temporary address, the lifetime values MUST be 1442 * derived from the corresponding prefix as follows: 1443 * 1444 * ... 1445 * 1446 * * Its Preferred Lifetime is the lower of the Preferred Lifetime 1447 * of the public address or TEMP_PREFERRED_LIFETIME - 1448 * DESYNC_FACTOR. 1449 * 1450 * To comply with the RFC's requirements, clamp the preferred lifetime 1451 * to a minimum of regen_advance, unless that would exceed valid_lft or 1452 * ifp->prefered_lft. 1453 * 1454 * Use age calculation as in addrconf_verify to avoid unnecessary 1455 * temporary addresses being generated. 1456 */ 1457 age = (now - tmp_tstamp + ADDRCONF_TIMER_FUZZ_MINUS) / HZ; 1458 if (cfg.preferred_lft <= regen_advance + age) { 1459 cfg.preferred_lft = regen_advance + age + 1; 1460 if (cfg.preferred_lft > cfg.valid_lft || 1461 cfg.preferred_lft > if_public_preferred_lft) { 1462 in6_ifa_put(ifp); 1463 in6_dev_put(idev); 1464 ret = -1; 1465 goto out; 1466 } 1467 } 1468 1469 cfg.ifa_flags = IFA_F_TEMPORARY; 1470 /* set in addrconf_prefix_rcv() */ 1471 if (ifp->flags & IFA_F_OPTIMISTIC) 1472 cfg.ifa_flags |= IFA_F_OPTIMISTIC; 1473 1474 cfg.pfx = &addr; 1475 cfg.scope = ipv6_addr_scope(cfg.pfx); 1476 1477 ift = ipv6_add_addr(idev, &cfg, block, NULL); 1478 if (IS_ERR(ift)) { 1479 in6_ifa_put(ifp); 1480 in6_dev_put(idev); 1481 pr_info("%s: retry temporary address regeneration\n", __func__); 1482 write_lock_bh(&idev->lock); 1483 goto retry; 1484 } 1485 1486 spin_lock_bh(&ift->lock); 1487 ift->ifpub = ifp; 1488 ift->cstamp = now; 1489 ift->tstamp = tmp_tstamp; 1490 spin_unlock_bh(&ift->lock); 1491 1492 addrconf_dad_start(ift); 1493 in6_ifa_put(ift); 1494 in6_dev_put(idev); 1495 out: 1496 return ret; 1497 } 1498 1499 /* 1500 * Choose an appropriate source address (RFC3484) 1501 */ 1502 enum { 1503 IPV6_SADDR_RULE_INIT = 0, 1504 IPV6_SADDR_RULE_LOCAL, 1505 IPV6_SADDR_RULE_SCOPE, 1506 IPV6_SADDR_RULE_PREFERRED, 1507 #ifdef CONFIG_IPV6_MIP6 1508 IPV6_SADDR_RULE_HOA, 1509 #endif 1510 IPV6_SADDR_RULE_OIF, 1511 IPV6_SADDR_RULE_LABEL, 1512 IPV6_SADDR_RULE_PRIVACY, 1513 IPV6_SADDR_RULE_ORCHID, 1514 IPV6_SADDR_RULE_PREFIX, 1515 #ifdef CONFIG_IPV6_OPTIMISTIC_DAD 1516 IPV6_SADDR_RULE_NOT_OPTIMISTIC, 1517 #endif 1518 IPV6_SADDR_RULE_MAX 1519 }; 1520 1521 struct ipv6_saddr_score { 1522 int rule; 1523 int addr_type; 1524 struct inet6_ifaddr *ifa; 1525 DECLARE_BITMAP(scorebits, IPV6_SADDR_RULE_MAX); 1526 int scopedist; 1527 int matchlen; 1528 }; 1529 1530 struct ipv6_saddr_dst { 1531 const struct in6_addr *addr; 1532 int ifindex; 1533 int scope; 1534 int label; 1535 unsigned int prefs; 1536 }; 1537 1538 static inline int ipv6_saddr_preferred(int type) 1539 { 1540 if (type & (IPV6_ADDR_MAPPED|IPV6_ADDR_COMPATv4|IPV6_ADDR_LOOPBACK)) 1541 return 1; 1542 return 0; 1543 } 1544 1545 static bool ipv6_use_optimistic_addr(const struct net *net, 1546 const struct inet6_dev *idev) 1547 { 1548 #ifdef CONFIG_IPV6_OPTIMISTIC_DAD 1549 if (!idev) 1550 return false; 1551 if (!READ_ONCE(net->ipv6.devconf_all->optimistic_dad) && 1552 !READ_ONCE(idev->cnf.optimistic_dad)) 1553 return false; 1554 if (!READ_ONCE(net->ipv6.devconf_all->use_optimistic) && 1555 !READ_ONCE(idev->cnf.use_optimistic)) 1556 return false; 1557 1558 return true; 1559 #else 1560 return false; 1561 #endif 1562 } 1563 1564 static bool ipv6_allow_optimistic_dad(const struct net *net, 1565 const struct inet6_dev *idev) 1566 { 1567 #ifdef CONFIG_IPV6_OPTIMISTIC_DAD 1568 if (!idev) 1569 return false; 1570 if (!READ_ONCE(net->ipv6.devconf_all->optimistic_dad) && 1571 !READ_ONCE(idev->cnf.optimistic_dad)) 1572 return false; 1573 1574 return true; 1575 #else 1576 return false; 1577 #endif 1578 } 1579 1580 static int ipv6_get_saddr_eval(struct net *net, 1581 struct ipv6_saddr_score *score, 1582 struct ipv6_saddr_dst *dst, 1583 int i) 1584 { 1585 int ret; 1586 1587 if (i <= score->rule) { 1588 switch (i) { 1589 case IPV6_SADDR_RULE_SCOPE: 1590 ret = score->scopedist; 1591 break; 1592 case IPV6_SADDR_RULE_PREFIX: 1593 ret = score->matchlen; 1594 break; 1595 default: 1596 ret = !!test_bit(i, score->scorebits); 1597 } 1598 goto out; 1599 } 1600 1601 switch (i) { 1602 case IPV6_SADDR_RULE_INIT: 1603 /* Rule 0: remember if hiscore is not ready yet */ 1604 ret = !!score->ifa; 1605 break; 1606 case IPV6_SADDR_RULE_LOCAL: 1607 /* Rule 1: Prefer same address */ 1608 ret = ipv6_addr_equal(&score->ifa->addr, dst->addr); 1609 break; 1610 case IPV6_SADDR_RULE_SCOPE: 1611 /* Rule 2: Prefer appropriate scope 1612 * 1613 * ret 1614 * ^ 1615 * -1 | d 15 1616 * ---+--+-+---> scope 1617 * | 1618 * | d is scope of the destination. 1619 * B-d | \ 1620 * | \ <- smaller scope is better if 1621 * B-15 | \ if scope is enough for destination. 1622 * | ret = B - scope (-1 <= scope >= d <= 15). 1623 * d-C-1 | / 1624 * |/ <- greater is better 1625 * -C / if scope is not enough for destination. 1626 * /| ret = scope - C (-1 <= d < scope <= 15). 1627 * 1628 * d - C - 1 < B -15 (for all -1 <= d <= 15). 1629 * C > d + 14 - B >= 15 + 14 - B = 29 - B. 1630 * Assume B = 0 and we get C > 29. 1631 */ 1632 ret = __ipv6_addr_src_scope(score->addr_type); 1633 if (ret >= dst->scope) 1634 ret = -ret; 1635 else 1636 ret -= 128; /* 30 is enough */ 1637 score->scopedist = ret; 1638 break; 1639 case IPV6_SADDR_RULE_PREFERRED: 1640 { 1641 /* Rule 3: Avoid deprecated and optimistic addresses */ 1642 u8 avoid = IFA_F_DEPRECATED; 1643 1644 if (!ipv6_use_optimistic_addr(net, score->ifa->idev)) 1645 avoid |= IFA_F_OPTIMISTIC; 1646 ret = ipv6_saddr_preferred(score->addr_type) || 1647 !(score->ifa->flags & avoid); 1648 break; 1649 } 1650 #ifdef CONFIG_IPV6_MIP6 1651 case IPV6_SADDR_RULE_HOA: 1652 { 1653 /* Rule 4: Prefer home address */ 1654 int prefhome = !(dst->prefs & IPV6_PREFER_SRC_COA); 1655 ret = !(score->ifa->flags & IFA_F_HOMEADDRESS) ^ prefhome; 1656 break; 1657 } 1658 #endif 1659 case IPV6_SADDR_RULE_OIF: 1660 /* Rule 5: Prefer outgoing interface */ 1661 ret = (!dst->ifindex || 1662 dst->ifindex == score->ifa->idev->dev->ifindex); 1663 break; 1664 case IPV6_SADDR_RULE_LABEL: 1665 /* Rule 6: Prefer matching label */ 1666 ret = ipv6_addr_label(net, 1667 &score->ifa->addr, score->addr_type, 1668 score->ifa->idev->dev->ifindex) == dst->label; 1669 break; 1670 case IPV6_SADDR_RULE_PRIVACY: 1671 { 1672 /* Rule 7: Prefer public address 1673 * Note: prefer temporary address if use_tempaddr >= 2 1674 */ 1675 int preftmp = dst->prefs & (IPV6_PREFER_SRC_PUBLIC|IPV6_PREFER_SRC_TMP) ? 1676 !!(dst->prefs & IPV6_PREFER_SRC_TMP) : 1677 READ_ONCE(score->ifa->idev->cnf.use_tempaddr) >= 2; 1678 ret = (!(score->ifa->flags & IFA_F_TEMPORARY)) ^ preftmp; 1679 break; 1680 } 1681 case IPV6_SADDR_RULE_ORCHID: 1682 /* Rule 8-: Prefer ORCHID vs ORCHID or 1683 * non-ORCHID vs non-ORCHID 1684 */ 1685 ret = !(ipv6_addr_orchid(&score->ifa->addr) ^ 1686 ipv6_addr_orchid(dst->addr)); 1687 break; 1688 case IPV6_SADDR_RULE_PREFIX: 1689 /* Rule 8: Use longest matching prefix */ 1690 ret = ipv6_addr_diff(&score->ifa->addr, dst->addr); 1691 if (ret > score->ifa->prefix_len) 1692 ret = score->ifa->prefix_len; 1693 score->matchlen = ret; 1694 break; 1695 #ifdef CONFIG_IPV6_OPTIMISTIC_DAD 1696 case IPV6_SADDR_RULE_NOT_OPTIMISTIC: 1697 /* Optimistic addresses still have lower precedence than other 1698 * preferred addresses. 1699 */ 1700 ret = !(score->ifa->flags & IFA_F_OPTIMISTIC); 1701 break; 1702 #endif 1703 default: 1704 ret = 0; 1705 } 1706 1707 if (ret) 1708 __set_bit(i, score->scorebits); 1709 score->rule = i; 1710 out: 1711 return ret; 1712 } 1713 1714 static int __ipv6_dev_get_saddr(struct net *net, 1715 struct ipv6_saddr_dst *dst, 1716 struct inet6_dev *idev, 1717 struct ipv6_saddr_score *scores, 1718 int hiscore_idx) 1719 { 1720 struct ipv6_saddr_score *score = &scores[1 - hiscore_idx], *hiscore = &scores[hiscore_idx]; 1721 1722 list_for_each_entry_rcu(score->ifa, &idev->addr_list, if_list) { 1723 int i; 1724 1725 /* 1726 * - Tentative Address (RFC2462 section 5.4) 1727 * - A tentative address is not considered 1728 * "assigned to an interface" in the traditional 1729 * sense, unless it is also flagged as optimistic. 1730 * - Candidate Source Address (section 4) 1731 * - In any case, anycast addresses, multicast 1732 * addresses, and the unspecified address MUST 1733 * NOT be included in a candidate set. 1734 */ 1735 if ((score->ifa->flags & IFA_F_TENTATIVE) && 1736 (!(score->ifa->flags & IFA_F_OPTIMISTIC))) 1737 continue; 1738 1739 score->addr_type = __ipv6_addr_type(&score->ifa->addr); 1740 1741 if (unlikely(score->addr_type == IPV6_ADDR_ANY || 1742 score->addr_type & IPV6_ADDR_MULTICAST)) { 1743 net_dbg_ratelimited("ADDRCONF: unspecified / multicast address assigned as unicast address on %s", 1744 idev->dev->name); 1745 continue; 1746 } 1747 1748 score->rule = -1; 1749 bitmap_zero(score->scorebits, IPV6_SADDR_RULE_MAX); 1750 1751 for (i = 0; i < IPV6_SADDR_RULE_MAX; i++) { 1752 int minihiscore, miniscore; 1753 1754 minihiscore = ipv6_get_saddr_eval(net, hiscore, dst, i); 1755 miniscore = ipv6_get_saddr_eval(net, score, dst, i); 1756 1757 if (minihiscore > miniscore) { 1758 if (i == IPV6_SADDR_RULE_SCOPE && 1759 score->scopedist > 0) { 1760 /* 1761 * special case: 1762 * each remaining entry 1763 * has too small (not enough) 1764 * scope, because ifa entries 1765 * are sorted by their scope 1766 * values. 1767 */ 1768 goto out; 1769 } 1770 break; 1771 } else if (minihiscore < miniscore) { 1772 swap(hiscore, score); 1773 hiscore_idx = 1 - hiscore_idx; 1774 1775 /* restore our iterator */ 1776 score->ifa = hiscore->ifa; 1777 1778 break; 1779 } 1780 } 1781 } 1782 out: 1783 return hiscore_idx; 1784 } 1785 1786 static int ipv6_get_saddr_master(struct net *net, 1787 const struct net_device *dst_dev, 1788 const struct net_device *master, 1789 struct ipv6_saddr_dst *dst, 1790 struct ipv6_saddr_score *scores, 1791 int hiscore_idx) 1792 { 1793 struct inet6_dev *idev; 1794 1795 idev = __in6_dev_get(dst_dev); 1796 if (idev) 1797 hiscore_idx = __ipv6_dev_get_saddr(net, dst, idev, 1798 scores, hiscore_idx); 1799 1800 idev = __in6_dev_get(master); 1801 if (idev) 1802 hiscore_idx = __ipv6_dev_get_saddr(net, dst, idev, 1803 scores, hiscore_idx); 1804 1805 return hiscore_idx; 1806 } 1807 1808 int ipv6_dev_get_saddr(struct net *net, const struct net_device *dst_dev, 1809 const struct in6_addr *daddr, unsigned int prefs, 1810 struct in6_addr *saddr) 1811 { 1812 struct ipv6_saddr_score scores[2], *hiscore; 1813 struct ipv6_saddr_dst dst; 1814 struct inet6_dev *idev; 1815 struct net_device *dev; 1816 int dst_type; 1817 bool use_oif_addr = false; 1818 int hiscore_idx = 0; 1819 int ret = 0; 1820 1821 dst_type = __ipv6_addr_type(daddr); 1822 dst.addr = daddr; 1823 dst.ifindex = dst_dev ? dst_dev->ifindex : 0; 1824 dst.scope = __ipv6_addr_src_scope(dst_type); 1825 dst.label = ipv6_addr_label(net, daddr, dst_type, dst.ifindex); 1826 dst.prefs = prefs; 1827 1828 scores[hiscore_idx].rule = -1; 1829 scores[hiscore_idx].ifa = NULL; 1830 1831 rcu_read_lock(); 1832 1833 /* Candidate Source Address (section 4) 1834 * - multicast and link-local destination address, 1835 * the set of candidate source address MUST only 1836 * include addresses assigned to interfaces 1837 * belonging to the same link as the outgoing 1838 * interface. 1839 * (- For site-local destination addresses, the 1840 * set of candidate source addresses MUST only 1841 * include addresses assigned to interfaces 1842 * belonging to the same site as the outgoing 1843 * interface.) 1844 * - "It is RECOMMENDED that the candidate source addresses 1845 * be the set of unicast addresses assigned to the 1846 * interface that will be used to send to the destination 1847 * (the 'outgoing' interface)." (RFC 6724) 1848 */ 1849 if (dst_dev) { 1850 idev = __in6_dev_get(dst_dev); 1851 if ((dst_type & IPV6_ADDR_MULTICAST) || 1852 dst.scope <= IPV6_ADDR_SCOPE_LINKLOCAL || 1853 (idev && READ_ONCE(idev->cnf.use_oif_addrs_only))) { 1854 use_oif_addr = true; 1855 } 1856 } 1857 1858 if (use_oif_addr) { 1859 if (idev) 1860 hiscore_idx = __ipv6_dev_get_saddr(net, &dst, idev, scores, hiscore_idx); 1861 } else { 1862 const struct net_device *master; 1863 int master_idx = 0; 1864 1865 /* if dst_dev exists and is enslaved to an L3 device, then 1866 * prefer addresses from dst_dev and then the master over 1867 * any other enslaved devices in the L3 domain. 1868 */ 1869 master = l3mdev_master_dev_rcu(dst_dev); 1870 if (master) { 1871 master_idx = master->ifindex; 1872 1873 hiscore_idx = ipv6_get_saddr_master(net, dst_dev, 1874 master, &dst, 1875 scores, hiscore_idx); 1876 1877 if (scores[hiscore_idx].ifa && 1878 scores[hiscore_idx].scopedist >= 0) 1879 goto out; 1880 } 1881 1882 for_each_netdev_rcu(net, dev) { 1883 /* only consider addresses on devices in the 1884 * same L3 domain 1885 */ 1886 if (l3mdev_master_ifindex_rcu(dev) != master_idx) 1887 continue; 1888 idev = __in6_dev_get(dev); 1889 if (!idev) 1890 continue; 1891 hiscore_idx = __ipv6_dev_get_saddr(net, &dst, idev, scores, hiscore_idx); 1892 } 1893 } 1894 1895 out: 1896 hiscore = &scores[hiscore_idx]; 1897 if (!hiscore->ifa) 1898 ret = -EADDRNOTAVAIL; 1899 else 1900 *saddr = hiscore->ifa->addr; 1901 1902 rcu_read_unlock(); 1903 return ret; 1904 } 1905 EXPORT_SYMBOL(ipv6_dev_get_saddr); 1906 1907 static int __ipv6_get_lladdr(struct inet6_dev *idev, struct in6_addr *addr, 1908 u32 banned_flags) 1909 { 1910 struct inet6_ifaddr *ifp; 1911 int err = -EADDRNOTAVAIL; 1912 1913 list_for_each_entry_reverse(ifp, &idev->addr_list, if_list) { 1914 if (ifp->scope > IFA_LINK) 1915 break; 1916 if (ifp->scope == IFA_LINK && 1917 !(ifp->flags & banned_flags)) { 1918 *addr = ifp->addr; 1919 err = 0; 1920 break; 1921 } 1922 } 1923 return err; 1924 } 1925 1926 int ipv6_get_lladdr(struct net_device *dev, struct in6_addr *addr, 1927 u32 banned_flags) 1928 { 1929 struct inet6_dev *idev; 1930 int err = -EADDRNOTAVAIL; 1931 1932 rcu_read_lock(); 1933 idev = __in6_dev_get(dev); 1934 if (idev) { 1935 read_lock_bh(&idev->lock); 1936 err = __ipv6_get_lladdr(idev, addr, banned_flags); 1937 read_unlock_bh(&idev->lock); 1938 } 1939 rcu_read_unlock(); 1940 return err; 1941 } 1942 1943 static int ipv6_count_addresses(const struct inet6_dev *idev) 1944 { 1945 const struct inet6_ifaddr *ifp; 1946 int cnt = 0; 1947 1948 rcu_read_lock(); 1949 list_for_each_entry_rcu(ifp, &idev->addr_list, if_list) 1950 cnt++; 1951 rcu_read_unlock(); 1952 return cnt; 1953 } 1954 1955 int ipv6_chk_addr(struct net *net, const struct in6_addr *addr, 1956 const struct net_device *dev, int strict) 1957 { 1958 return ipv6_chk_addr_and_flags(net, addr, dev, !dev, 1959 strict, IFA_F_TENTATIVE); 1960 } 1961 EXPORT_SYMBOL(ipv6_chk_addr); 1962 1963 /* device argument is used to find the L3 domain of interest. If 1964 * skip_dev_check is set, then the ifp device is not checked against 1965 * the passed in dev argument. So the 2 cases for addresses checks are: 1966 * 1. does the address exist in the L3 domain that dev is part of 1967 * (skip_dev_check = true), or 1968 * 1969 * 2. does the address exist on the specific device 1970 * (skip_dev_check = false) 1971 */ 1972 static struct net_device * 1973 __ipv6_chk_addr_and_flags(struct net *net, const struct in6_addr *addr, 1974 const struct net_device *dev, bool skip_dev_check, 1975 int strict, u32 banned_flags) 1976 { 1977 unsigned int hash = inet6_addr_hash(net, addr); 1978 struct net_device *l3mdev, *ndev; 1979 struct inet6_ifaddr *ifp; 1980 u32 ifp_flags; 1981 1982 rcu_read_lock(); 1983 1984 l3mdev = l3mdev_master_dev_rcu(dev); 1985 if (skip_dev_check) 1986 dev = NULL; 1987 1988 hlist_for_each_entry_rcu(ifp, &net->ipv6.inet6_addr_lst[hash], addr_lst) { 1989 ndev = ifp->idev->dev; 1990 1991 if (l3mdev_master_dev_rcu(ndev) != l3mdev) 1992 continue; 1993 1994 /* Decouple optimistic from tentative for evaluation here. 1995 * Ban optimistic addresses explicitly, when required. 1996 */ 1997 ifp_flags = (ifp->flags&IFA_F_OPTIMISTIC) 1998 ? (ifp->flags&~IFA_F_TENTATIVE) 1999 : ifp->flags; 2000 if (ipv6_addr_equal(&ifp->addr, addr) && 2001 !(ifp_flags&banned_flags) && 2002 (!dev || ndev == dev || 2003 !(ifp->scope&(IFA_LINK|IFA_HOST) || strict))) { 2004 rcu_read_unlock(); 2005 return ndev; 2006 } 2007 } 2008 2009 rcu_read_unlock(); 2010 return NULL; 2011 } 2012 2013 int ipv6_chk_addr_and_flags(struct net *net, const struct in6_addr *addr, 2014 const struct net_device *dev, bool skip_dev_check, 2015 int strict, u32 banned_flags) 2016 { 2017 return __ipv6_chk_addr_and_flags(net, addr, dev, skip_dev_check, 2018 strict, banned_flags) ? 1 : 0; 2019 } 2020 EXPORT_SYMBOL(ipv6_chk_addr_and_flags); 2021 2022 2023 /* Compares an address/prefix_len with addresses on device @dev. 2024 * If one is found it returns true. 2025 */ 2026 bool ipv6_chk_custom_prefix(const struct in6_addr *addr, 2027 const unsigned int prefix_len, struct net_device *dev) 2028 { 2029 const struct inet6_ifaddr *ifa; 2030 const struct inet6_dev *idev; 2031 bool ret = false; 2032 2033 rcu_read_lock(); 2034 idev = __in6_dev_get(dev); 2035 if (idev) { 2036 list_for_each_entry_rcu(ifa, &idev->addr_list, if_list) { 2037 ret = ipv6_prefix_equal(addr, &ifa->addr, prefix_len); 2038 if (ret) 2039 break; 2040 } 2041 } 2042 rcu_read_unlock(); 2043 2044 return ret; 2045 } 2046 EXPORT_SYMBOL(ipv6_chk_custom_prefix); 2047 2048 int ipv6_chk_prefix(const struct in6_addr *addr, struct net_device *dev) 2049 { 2050 const struct inet6_ifaddr *ifa; 2051 const struct inet6_dev *idev; 2052 int onlink; 2053 2054 onlink = 0; 2055 rcu_read_lock(); 2056 idev = __in6_dev_get(dev); 2057 if (idev) { 2058 list_for_each_entry_rcu(ifa, &idev->addr_list, if_list) { 2059 onlink = ipv6_prefix_equal(addr, &ifa->addr, 2060 ifa->prefix_len); 2061 if (onlink) 2062 break; 2063 } 2064 } 2065 rcu_read_unlock(); 2066 return onlink; 2067 } 2068 EXPORT_SYMBOL(ipv6_chk_prefix); 2069 2070 /** 2071 * ipv6_dev_find - find the first device with a given source address. 2072 * @net: the net namespace 2073 * @addr: the source address 2074 * @dev: used to find the L3 domain of interest 2075 * 2076 * The caller should be protected by RCU, or RTNL. 2077 */ 2078 struct net_device *ipv6_dev_find(struct net *net, const struct in6_addr *addr, 2079 struct net_device *dev) 2080 { 2081 return __ipv6_chk_addr_and_flags(net, addr, dev, !dev, 1, 2082 IFA_F_TENTATIVE); 2083 } 2084 EXPORT_SYMBOL(ipv6_dev_find); 2085 2086 struct inet6_ifaddr *ipv6_get_ifaddr(struct net *net, const struct in6_addr *addr, 2087 struct net_device *dev, int strict) 2088 { 2089 unsigned int hash = inet6_addr_hash(net, addr); 2090 struct inet6_ifaddr *ifp, *result = NULL; 2091 2092 rcu_read_lock(); 2093 hlist_for_each_entry_rcu(ifp, &net->ipv6.inet6_addr_lst[hash], addr_lst) { 2094 if (ipv6_addr_equal(&ifp->addr, addr)) { 2095 if (!dev || ifp->idev->dev == dev || 2096 !(ifp->scope&(IFA_LINK|IFA_HOST) || strict)) { 2097 if (in6_ifa_hold_safe(ifp)) { 2098 result = ifp; 2099 break; 2100 } 2101 } 2102 } 2103 } 2104 rcu_read_unlock(); 2105 2106 return result; 2107 } 2108 2109 /* Gets referenced address, destroys ifaddr */ 2110 2111 static void addrconf_dad_stop(struct inet6_ifaddr *ifp, int dad_failed) 2112 { 2113 if (dad_failed) 2114 ifp->flags |= IFA_F_DADFAILED; 2115 2116 if (ifp->flags&IFA_F_TEMPORARY) { 2117 struct inet6_ifaddr *ifpub; 2118 spin_lock_bh(&ifp->lock); 2119 ifpub = ifp->ifpub; 2120 if (ifpub) { 2121 in6_ifa_hold(ifpub); 2122 spin_unlock_bh(&ifp->lock); 2123 ipv6_create_tempaddr(ifpub, true); 2124 in6_ifa_put(ifpub); 2125 } else { 2126 spin_unlock_bh(&ifp->lock); 2127 } 2128 ipv6_del_addr(ifp); 2129 } else if (ifp->flags&IFA_F_PERMANENT || !dad_failed) { 2130 spin_lock_bh(&ifp->lock); 2131 addrconf_del_dad_work(ifp); 2132 ifp->flags |= IFA_F_TENTATIVE; 2133 if (dad_failed) 2134 ifp->flags &= ~IFA_F_OPTIMISTIC; 2135 spin_unlock_bh(&ifp->lock); 2136 if (dad_failed) 2137 ipv6_ifa_notify(0, ifp); 2138 in6_ifa_put(ifp); 2139 } else { 2140 ipv6_del_addr(ifp); 2141 } 2142 } 2143 2144 static int addrconf_dad_end(struct inet6_ifaddr *ifp) 2145 { 2146 int err = -ENOENT; 2147 2148 spin_lock_bh(&ifp->lock); 2149 if (ifp->state == INET6_IFADDR_STATE_DAD) { 2150 ifp->state = INET6_IFADDR_STATE_POSTDAD; 2151 err = 0; 2152 } 2153 spin_unlock_bh(&ifp->lock); 2154 2155 return err; 2156 } 2157 2158 void addrconf_dad_failure(struct sk_buff *skb, struct inet6_ifaddr *ifp) 2159 { 2160 struct inet6_dev *idev = ifp->idev; 2161 struct net *net = dev_net(idev->dev); 2162 int max_addresses; 2163 2164 if (addrconf_dad_end(ifp)) { 2165 in6_ifa_put(ifp); 2166 return; 2167 } 2168 2169 net_info_ratelimited("%s: IPv6 duplicate address %pI6c used by %pM detected!\n", 2170 ifp->idev->dev->name, &ifp->addr, eth_hdr(skb)->h_source); 2171 2172 spin_lock_bh(&ifp->lock); 2173 2174 if (ifp->flags & IFA_F_STABLE_PRIVACY) { 2175 struct in6_addr new_addr; 2176 struct inet6_ifaddr *ifp2; 2177 int retries = ifp->stable_privacy_retry + 1; 2178 struct ifa6_config cfg = { 2179 .pfx = &new_addr, 2180 .plen = ifp->prefix_len, 2181 .ifa_flags = ifp->flags, 2182 .valid_lft = ifp->valid_lft, 2183 .preferred_lft = ifp->prefered_lft, 2184 .scope = ifp->scope, 2185 }; 2186 2187 if (retries > net->ipv6.sysctl.idgen_retries) { 2188 net_info_ratelimited("%s: privacy stable address generation failed because of DAD conflicts!\n", 2189 ifp->idev->dev->name); 2190 goto errdad; 2191 } 2192 2193 new_addr = ifp->addr; 2194 if (ipv6_generate_stable_address(&new_addr, retries, 2195 idev)) 2196 goto errdad; 2197 2198 spin_unlock_bh(&ifp->lock); 2199 2200 max_addresses = READ_ONCE(idev->cnf.max_addresses); 2201 if (max_addresses && 2202 ipv6_count_addresses(idev) >= max_addresses) 2203 goto lock_errdad; 2204 2205 net_info_ratelimited("%s: generating new stable privacy address because of DAD conflict\n", 2206 ifp->idev->dev->name); 2207 2208 ifp2 = ipv6_add_addr(idev, &cfg, false, NULL); 2209 if (IS_ERR(ifp2)) 2210 goto lock_errdad; 2211 2212 spin_lock_bh(&ifp2->lock); 2213 ifp2->stable_privacy_retry = retries; 2214 ifp2->state = INET6_IFADDR_STATE_PREDAD; 2215 spin_unlock_bh(&ifp2->lock); 2216 2217 addrconf_mod_dad_work(ifp2, net->ipv6.sysctl.idgen_delay); 2218 in6_ifa_put(ifp2); 2219 lock_errdad: 2220 spin_lock_bh(&ifp->lock); 2221 } 2222 2223 errdad: 2224 /* transition from _POSTDAD to _ERRDAD */ 2225 ifp->state = INET6_IFADDR_STATE_ERRDAD; 2226 spin_unlock_bh(&ifp->lock); 2227 2228 addrconf_mod_dad_work(ifp, 0); 2229 in6_ifa_put(ifp); 2230 } 2231 2232 /* Join to solicited addr multicast group. 2233 * caller must hold RTNL */ 2234 void addrconf_join_solict(struct net_device *dev, const struct in6_addr *addr) 2235 { 2236 struct in6_addr maddr; 2237 2238 if (dev->flags&(IFF_LOOPBACK|IFF_NOARP)) 2239 return; 2240 2241 addrconf_addr_solict_mult(addr, &maddr); 2242 ipv6_dev_mc_inc(dev, &maddr); 2243 } 2244 2245 /* caller must hold RTNL */ 2246 void addrconf_leave_solict(struct inet6_dev *idev, const struct in6_addr *addr) 2247 { 2248 struct in6_addr maddr; 2249 2250 if (idev->dev->flags&(IFF_LOOPBACK|IFF_NOARP)) 2251 return; 2252 2253 addrconf_addr_solict_mult(addr, &maddr); 2254 __ipv6_dev_mc_dec(idev, &maddr); 2255 } 2256 2257 /* caller must hold RTNL */ 2258 static void addrconf_join_anycast(struct inet6_ifaddr *ifp) 2259 { 2260 struct in6_addr addr; 2261 2262 if (ifp->prefix_len >= 127) /* RFC 6164 */ 2263 return; 2264 ipv6_addr_prefix(&addr, &ifp->addr, ifp->prefix_len); 2265 if (ipv6_addr_any(&addr)) 2266 return; 2267 __ipv6_dev_ac_inc(ifp->idev, &addr); 2268 } 2269 2270 /* caller must hold RTNL */ 2271 static void addrconf_leave_anycast(struct inet6_ifaddr *ifp) 2272 { 2273 struct in6_addr addr; 2274 2275 if (ifp->prefix_len >= 127) /* RFC 6164 */ 2276 return; 2277 ipv6_addr_prefix(&addr, &ifp->addr, ifp->prefix_len); 2278 if (ipv6_addr_any(&addr)) 2279 return; 2280 __ipv6_dev_ac_dec(ifp->idev, &addr); 2281 } 2282 2283 static int addrconf_ifid_6lowpan(u8 *eui, struct net_device *dev) 2284 { 2285 switch (dev->addr_len) { 2286 case ETH_ALEN: 2287 memcpy(eui, dev->dev_addr, 3); 2288 eui[3] = 0xFF; 2289 eui[4] = 0xFE; 2290 memcpy(eui + 5, dev->dev_addr + 3, 3); 2291 break; 2292 case EUI64_ADDR_LEN: 2293 memcpy(eui, dev->dev_addr, EUI64_ADDR_LEN); 2294 eui[0] ^= 2; 2295 break; 2296 default: 2297 return -1; 2298 } 2299 2300 return 0; 2301 } 2302 2303 static int addrconf_ifid_ieee1394(u8 *eui, struct net_device *dev) 2304 { 2305 const union fwnet_hwaddr *ha; 2306 2307 if (dev->addr_len != FWNET_ALEN) 2308 return -1; 2309 2310 ha = (const union fwnet_hwaddr *)dev->dev_addr; 2311 2312 memcpy(eui, &ha->uc.uniq_id, sizeof(ha->uc.uniq_id)); 2313 eui[0] ^= 2; 2314 return 0; 2315 } 2316 2317 static int addrconf_ifid_arcnet(u8 *eui, struct net_device *dev) 2318 { 2319 /* XXX: inherit EUI-64 from other interface -- yoshfuji */ 2320 if (dev->addr_len != ARCNET_ALEN) 2321 return -1; 2322 memset(eui, 0, 7); 2323 eui[7] = *(u8 *)dev->dev_addr; 2324 return 0; 2325 } 2326 2327 static int addrconf_ifid_infiniband(u8 *eui, struct net_device *dev) 2328 { 2329 if (dev->addr_len != INFINIBAND_ALEN) 2330 return -1; 2331 memcpy(eui, dev->dev_addr + 12, 8); 2332 eui[0] |= 2; 2333 return 0; 2334 } 2335 2336 static int __ipv6_isatap_ifid(u8 *eui, __be32 addr) 2337 { 2338 if (addr == 0) 2339 return -1; 2340 eui[0] = (ipv4_is_zeronet(addr) || ipv4_is_private_10(addr) || 2341 ipv4_is_loopback(addr) || ipv4_is_linklocal_169(addr) || 2342 ipv4_is_private_172(addr) || ipv4_is_test_192(addr) || 2343 ipv4_is_anycast_6to4(addr) || ipv4_is_private_192(addr) || 2344 ipv4_is_test_198(addr) || ipv4_is_multicast(addr) || 2345 ipv4_is_lbcast(addr)) ? 0x00 : 0x02; 2346 eui[1] = 0; 2347 eui[2] = 0x5E; 2348 eui[3] = 0xFE; 2349 memcpy(eui + 4, &addr, 4); 2350 return 0; 2351 } 2352 2353 static int addrconf_ifid_sit(u8 *eui, struct net_device *dev) 2354 { 2355 if (dev->priv_flags & IFF_ISATAP) 2356 return __ipv6_isatap_ifid(eui, *(__be32 *)dev->dev_addr); 2357 return -1; 2358 } 2359 2360 static int addrconf_ifid_gre(u8 *eui, struct net_device *dev) 2361 { 2362 return __ipv6_isatap_ifid(eui, *(__be32 *)dev->dev_addr); 2363 } 2364 2365 static int addrconf_ifid_ip6tnl(u8 *eui, struct net_device *dev) 2366 { 2367 memcpy(eui, dev->perm_addr, 3); 2368 memcpy(eui + 5, dev->perm_addr + 3, 3); 2369 eui[3] = 0xFF; 2370 eui[4] = 0xFE; 2371 eui[0] ^= 2; 2372 return 0; 2373 } 2374 2375 static int ipv6_generate_eui64(u8 *eui, struct net_device *dev) 2376 { 2377 switch (dev->type) { 2378 case ARPHRD_ETHER: 2379 case ARPHRD_FDDI: 2380 return addrconf_ifid_eui48(eui, dev); 2381 case ARPHRD_ARCNET: 2382 return addrconf_ifid_arcnet(eui, dev); 2383 case ARPHRD_INFINIBAND: 2384 return addrconf_ifid_infiniband(eui, dev); 2385 case ARPHRD_SIT: 2386 return addrconf_ifid_sit(eui, dev); 2387 case ARPHRD_IPGRE: 2388 case ARPHRD_TUNNEL: 2389 return addrconf_ifid_gre(eui, dev); 2390 case ARPHRD_6LOWPAN: 2391 return addrconf_ifid_6lowpan(eui, dev); 2392 case ARPHRD_IEEE1394: 2393 return addrconf_ifid_ieee1394(eui, dev); 2394 case ARPHRD_TUNNEL6: 2395 case ARPHRD_IP6GRE: 2396 case ARPHRD_RAWIP: 2397 return addrconf_ifid_ip6tnl(eui, dev); 2398 } 2399 return -1; 2400 } 2401 2402 static int ipv6_inherit_eui64(u8 *eui, struct inet6_dev *idev) 2403 { 2404 int err = -1; 2405 struct inet6_ifaddr *ifp; 2406 2407 read_lock_bh(&idev->lock); 2408 list_for_each_entry_reverse(ifp, &idev->addr_list, if_list) { 2409 if (ifp->scope > IFA_LINK) 2410 break; 2411 if (ifp->scope == IFA_LINK && !(ifp->flags&IFA_F_TENTATIVE)) { 2412 memcpy(eui, ifp->addr.s6_addr+8, 8); 2413 err = 0; 2414 break; 2415 } 2416 } 2417 read_unlock_bh(&idev->lock); 2418 return err; 2419 } 2420 2421 /* Generation of a randomized Interface Identifier 2422 * draft-ietf-6man-rfc4941bis, Section 3.3.1 2423 */ 2424 2425 static void ipv6_gen_rnd_iid(struct in6_addr *addr) 2426 { 2427 regen: 2428 get_random_bytes(&addr->s6_addr[8], 8); 2429 2430 /* <draft-ietf-6man-rfc4941bis-08.txt>, Section 3.3.1: 2431 * check if generated address is not inappropriate: 2432 * 2433 * - Reserved IPv6 Interface Identifiers 2434 * - XXX: already assigned to an address on the device 2435 */ 2436 2437 /* Subnet-router anycast: 0000:0000:0000:0000 */ 2438 if (!(addr->s6_addr32[2] | addr->s6_addr32[3])) 2439 goto regen; 2440 2441 /* IANA Ethernet block: 0200:5EFF:FE00:0000-0200:5EFF:FE00:5212 2442 * Proxy Mobile IPv6: 0200:5EFF:FE00:5213 2443 * IANA Ethernet block: 0200:5EFF:FE00:5214-0200:5EFF:FEFF:FFFF 2444 */ 2445 if (ntohl(addr->s6_addr32[2]) == 0x02005eff && 2446 (ntohl(addr->s6_addr32[3]) & 0Xff000000) == 0xfe000000) 2447 goto regen; 2448 2449 /* Reserved subnet anycast addresses */ 2450 if (ntohl(addr->s6_addr32[2]) == 0xfdffffff && 2451 ntohl(addr->s6_addr32[3]) >= 0Xffffff80) 2452 goto regen; 2453 } 2454 2455 /* 2456 * Add prefix route. 2457 */ 2458 2459 static void 2460 addrconf_prefix_route(struct in6_addr *pfx, int plen, u32 metric, 2461 struct net_device *dev, unsigned long expires, 2462 u32 flags, gfp_t gfp_flags) 2463 { 2464 struct fib6_config cfg = { 2465 .fc_table = l3mdev_fib_table(dev) ? : RT6_TABLE_PREFIX, 2466 .fc_metric = metric ? : IP6_RT_PRIO_ADDRCONF, 2467 .fc_ifindex = dev->ifindex, 2468 .fc_expires = expires, 2469 .fc_dst_len = plen, 2470 .fc_flags = RTF_UP | flags, 2471 .fc_nlinfo.nl_net = dev_net(dev), 2472 .fc_protocol = RTPROT_KERNEL, 2473 .fc_type = RTN_UNICAST, 2474 }; 2475 2476 cfg.fc_dst = *pfx; 2477 2478 /* Prevent useless cloning on PtP SIT. 2479 This thing is done here expecting that the whole 2480 class of non-broadcast devices need not cloning. 2481 */ 2482 #if IS_ENABLED(CONFIG_IPV6_SIT) 2483 if (dev->type == ARPHRD_SIT && (dev->flags & IFF_POINTOPOINT)) 2484 cfg.fc_flags |= RTF_NONEXTHOP; 2485 #endif 2486 2487 ip6_route_add(&cfg, gfp_flags, NULL); 2488 } 2489 2490 2491 static struct fib6_info *addrconf_get_prefix_route(const struct in6_addr *pfx, 2492 int plen, 2493 const struct net_device *dev, 2494 u32 flags, u32 noflags, 2495 bool no_gw) 2496 { 2497 struct fib6_node *fn; 2498 struct fib6_info *rt = NULL; 2499 struct fib6_table *table; 2500 u32 tb_id = l3mdev_fib_table(dev) ? : RT6_TABLE_PREFIX; 2501 2502 table = fib6_get_table(dev_net(dev), tb_id); 2503 if (!table) 2504 return NULL; 2505 2506 rcu_read_lock(); 2507 fn = fib6_locate(&table->tb6_root, pfx, plen, NULL, 0, true); 2508 if (!fn) 2509 goto out; 2510 2511 for_each_fib6_node_rt_rcu(fn) { 2512 /* prefix routes only use builtin fib6_nh */ 2513 if (rt->nh) 2514 continue; 2515 2516 if (rt->fib6_nh->fib_nh_dev->ifindex != dev->ifindex) 2517 continue; 2518 if (no_gw && rt->fib6_nh->fib_nh_gw_family) 2519 continue; 2520 if ((rt->fib6_flags & flags) != flags) 2521 continue; 2522 if ((rt->fib6_flags & noflags) != 0) 2523 continue; 2524 if (!fib6_info_hold_safe(rt)) 2525 continue; 2526 break; 2527 } 2528 out: 2529 rcu_read_unlock(); 2530 return rt; 2531 } 2532 2533 2534 /* Create "default" multicast route to the interface */ 2535 2536 static void addrconf_add_mroute(struct net_device *dev) 2537 { 2538 struct fib6_config cfg = { 2539 .fc_table = l3mdev_fib_table(dev) ? : RT6_TABLE_LOCAL, 2540 .fc_metric = IP6_RT_PRIO_ADDRCONF, 2541 .fc_ifindex = dev->ifindex, 2542 .fc_dst_len = 8, 2543 .fc_flags = RTF_UP, 2544 .fc_type = RTN_MULTICAST, 2545 .fc_nlinfo.nl_net = dev_net(dev), 2546 .fc_protocol = RTPROT_KERNEL, 2547 }; 2548 2549 ipv6_addr_set(&cfg.fc_dst, htonl(0xFF000000), 0, 0, 0); 2550 2551 ip6_route_add(&cfg, GFP_KERNEL, NULL); 2552 } 2553 2554 static struct inet6_dev *addrconf_add_dev(struct net_device *dev) 2555 { 2556 struct inet6_dev *idev; 2557 2558 ASSERT_RTNL(); 2559 2560 idev = ipv6_find_idev(dev); 2561 if (IS_ERR(idev)) 2562 return idev; 2563 2564 if (idev->cnf.disable_ipv6) 2565 return ERR_PTR(-EACCES); 2566 2567 /* Add default multicast route */ 2568 if (!(dev->flags & IFF_LOOPBACK) && !netif_is_l3_master(dev)) 2569 addrconf_add_mroute(dev); 2570 2571 return idev; 2572 } 2573 2574 static void delete_tempaddrs(struct inet6_dev *idev, 2575 struct inet6_ifaddr *ifp) 2576 { 2577 struct inet6_ifaddr *ift, *tmp; 2578 2579 write_lock_bh(&idev->lock); 2580 list_for_each_entry_safe(ift, tmp, &idev->tempaddr_list, tmp_list) { 2581 if (ift->ifpub != ifp) 2582 continue; 2583 2584 in6_ifa_hold(ift); 2585 write_unlock_bh(&idev->lock); 2586 ipv6_del_addr(ift); 2587 write_lock_bh(&idev->lock); 2588 } 2589 write_unlock_bh(&idev->lock); 2590 } 2591 2592 static void manage_tempaddrs(struct inet6_dev *idev, 2593 struct inet6_ifaddr *ifp, 2594 __u32 valid_lft, __u32 prefered_lft, 2595 bool create, unsigned long now) 2596 { 2597 u32 flags; 2598 struct inet6_ifaddr *ift; 2599 2600 read_lock_bh(&idev->lock); 2601 /* update all temporary addresses in the list */ 2602 list_for_each_entry(ift, &idev->tempaddr_list, tmp_list) { 2603 int age, max_valid, max_prefered; 2604 2605 if (ifp != ift->ifpub) 2606 continue; 2607 2608 /* RFC 4941 section 3.3: 2609 * If a received option will extend the lifetime of a public 2610 * address, the lifetimes of temporary addresses should 2611 * be extended, subject to the overall constraint that no 2612 * temporary addresses should ever remain "valid" or "preferred" 2613 * for a time longer than (TEMP_VALID_LIFETIME) or 2614 * (TEMP_PREFERRED_LIFETIME - DESYNC_FACTOR), respectively. 2615 */ 2616 age = (now - ift->cstamp) / HZ; 2617 max_valid = READ_ONCE(idev->cnf.temp_valid_lft) - age; 2618 if (max_valid < 0) 2619 max_valid = 0; 2620 2621 max_prefered = READ_ONCE(idev->cnf.temp_prefered_lft) - 2622 idev->desync_factor - age; 2623 if (max_prefered < 0) 2624 max_prefered = 0; 2625 2626 if (valid_lft > max_valid) 2627 valid_lft = max_valid; 2628 2629 if (prefered_lft > max_prefered) 2630 prefered_lft = max_prefered; 2631 2632 spin_lock(&ift->lock); 2633 flags = ift->flags; 2634 ift->valid_lft = valid_lft; 2635 ift->prefered_lft = prefered_lft; 2636 ift->tstamp = now; 2637 if (prefered_lft > 0) 2638 ift->flags &= ~IFA_F_DEPRECATED; 2639 2640 spin_unlock(&ift->lock); 2641 if (!(flags&IFA_F_TENTATIVE)) 2642 ipv6_ifa_notify(0, ift); 2643 } 2644 2645 /* Also create a temporary address if it's enabled but no temporary 2646 * address currently exists. 2647 * However, we get called with valid_lft == 0, prefered_lft == 0, create == false 2648 * as part of cleanup (ie. deleting the mngtmpaddr). 2649 * We don't want that to result in creating a new temporary ip address. 2650 */ 2651 if (list_empty(&idev->tempaddr_list) && (valid_lft || prefered_lft)) 2652 create = true; 2653 2654 if (create && READ_ONCE(idev->cnf.use_tempaddr) > 0) { 2655 /* When a new public address is created as described 2656 * in [ADDRCONF], also create a new temporary address. 2657 */ 2658 read_unlock_bh(&idev->lock); 2659 ipv6_create_tempaddr(ifp, false); 2660 } else { 2661 read_unlock_bh(&idev->lock); 2662 } 2663 } 2664 2665 static bool is_addr_mode_generate_stable(struct inet6_dev *idev) 2666 { 2667 return idev->cnf.addr_gen_mode == IN6_ADDR_GEN_MODE_STABLE_PRIVACY || 2668 idev->cnf.addr_gen_mode == IN6_ADDR_GEN_MODE_RANDOM; 2669 } 2670 2671 int addrconf_prefix_rcv_add_addr(struct net *net, struct net_device *dev, 2672 const struct prefix_info *pinfo, 2673 struct inet6_dev *in6_dev, 2674 const struct in6_addr *addr, int addr_type, 2675 u32 addr_flags, bool sllao, bool tokenized, 2676 __u32 valid_lft, u32 prefered_lft) 2677 { 2678 struct inet6_ifaddr *ifp = ipv6_get_ifaddr(net, addr, dev, 1); 2679 int create = 0, update_lft = 0; 2680 2681 if (!ifp && valid_lft) { 2682 int max_addresses = READ_ONCE(in6_dev->cnf.max_addresses); 2683 struct ifa6_config cfg = { 2684 .pfx = addr, 2685 .plen = pinfo->prefix_len, 2686 .ifa_flags = addr_flags, 2687 .valid_lft = valid_lft, 2688 .preferred_lft = prefered_lft, 2689 .scope = addr_type & IPV6_ADDR_SCOPE_MASK, 2690 .ifa_proto = IFAPROT_KERNEL_RA 2691 }; 2692 2693 #ifdef CONFIG_IPV6_OPTIMISTIC_DAD 2694 if ((READ_ONCE(net->ipv6.devconf_all->optimistic_dad) || 2695 READ_ONCE(in6_dev->cnf.optimistic_dad)) && 2696 !net->ipv6.devconf_all->forwarding && sllao) 2697 cfg.ifa_flags |= IFA_F_OPTIMISTIC; 2698 #endif 2699 2700 /* Do not allow to create too much of autoconfigured 2701 * addresses; this would be too easy way to crash kernel. 2702 */ 2703 if (!max_addresses || 2704 ipv6_count_addresses(in6_dev) < max_addresses) 2705 ifp = ipv6_add_addr(in6_dev, &cfg, false, NULL); 2706 2707 if (IS_ERR_OR_NULL(ifp)) 2708 return -1; 2709 2710 create = 1; 2711 spin_lock_bh(&ifp->lock); 2712 ifp->flags |= IFA_F_MANAGETEMPADDR; 2713 ifp->cstamp = jiffies; 2714 ifp->tokenized = tokenized; 2715 spin_unlock_bh(&ifp->lock); 2716 addrconf_dad_start(ifp); 2717 } 2718 2719 if (ifp) { 2720 u32 flags; 2721 unsigned long now; 2722 u32 stored_lft; 2723 2724 /* update lifetime (RFC2462 5.5.3 e) */ 2725 spin_lock_bh(&ifp->lock); 2726 now = jiffies; 2727 if (ifp->valid_lft > (now - ifp->tstamp) / HZ) 2728 stored_lft = ifp->valid_lft - (now - ifp->tstamp) / HZ; 2729 else 2730 stored_lft = 0; 2731 2732 /* RFC4862 Section 5.5.3e: 2733 * "Note that the preferred lifetime of the 2734 * corresponding address is always reset to 2735 * the Preferred Lifetime in the received 2736 * Prefix Information option, regardless of 2737 * whether the valid lifetime is also reset or 2738 * ignored." 2739 * 2740 * So we should always update prefered_lft here. 2741 */ 2742 update_lft = !create && stored_lft; 2743 2744 if (update_lft && !READ_ONCE(in6_dev->cnf.ra_honor_pio_life)) { 2745 const u32 minimum_lft = min_t(u32, 2746 stored_lft, MIN_VALID_LIFETIME); 2747 valid_lft = max(valid_lft, minimum_lft); 2748 } 2749 2750 if (update_lft) { 2751 ifp->valid_lft = valid_lft; 2752 ifp->prefered_lft = prefered_lft; 2753 WRITE_ONCE(ifp->tstamp, now); 2754 flags = ifp->flags; 2755 ifp->flags &= ~IFA_F_DEPRECATED; 2756 spin_unlock_bh(&ifp->lock); 2757 2758 if (!(flags&IFA_F_TENTATIVE)) 2759 ipv6_ifa_notify(0, ifp); 2760 } else 2761 spin_unlock_bh(&ifp->lock); 2762 2763 manage_tempaddrs(in6_dev, ifp, valid_lft, prefered_lft, 2764 create, now); 2765 2766 in6_ifa_put(ifp); 2767 addrconf_verify(net); 2768 } 2769 2770 return 0; 2771 } 2772 EXPORT_SYMBOL_GPL(addrconf_prefix_rcv_add_addr); 2773 2774 void addrconf_prefix_rcv(struct net_device *dev, u8 *opt, int len, bool sllao) 2775 { 2776 struct prefix_info *pinfo; 2777 struct fib6_table *table; 2778 __u32 valid_lft; 2779 __u32 prefered_lft; 2780 int addr_type, err; 2781 u32 addr_flags = 0; 2782 struct inet6_dev *in6_dev; 2783 struct net *net = dev_net(dev); 2784 bool ignore_autoconf = false; 2785 2786 pinfo = (struct prefix_info *) opt; 2787 2788 if (len < sizeof(struct prefix_info)) { 2789 netdev_dbg(dev, "addrconf: prefix option too short\n"); 2790 return; 2791 } 2792 2793 /* 2794 * Validation checks ([ADDRCONF], page 19) 2795 */ 2796 2797 addr_type = ipv6_addr_type(&pinfo->prefix); 2798 2799 if (addr_type & (IPV6_ADDR_MULTICAST|IPV6_ADDR_LINKLOCAL)) 2800 return; 2801 2802 valid_lft = ntohl(pinfo->valid); 2803 prefered_lft = ntohl(pinfo->prefered); 2804 2805 if (prefered_lft > valid_lft) { 2806 net_warn_ratelimited("addrconf: prefix option has invalid lifetime\n"); 2807 return; 2808 } 2809 2810 in6_dev = in6_dev_get(dev); 2811 2812 if (!in6_dev) { 2813 net_dbg_ratelimited("addrconf: device %s not configured\n", 2814 dev->name); 2815 return; 2816 } 2817 2818 if (valid_lft != 0 && valid_lft < in6_dev->cnf.accept_ra_min_lft) 2819 goto put; 2820 2821 /* 2822 * Two things going on here: 2823 * 1) Add routes for on-link prefixes 2824 * 2) Configure prefixes with the auto flag set 2825 */ 2826 2827 if (pinfo->onlink) { 2828 struct fib6_info *rt; 2829 unsigned long rt_expires; 2830 2831 /* Avoid arithmetic overflow. Really, we could 2832 * save rt_expires in seconds, likely valid_lft, 2833 * but it would require division in fib gc, that it 2834 * not good. 2835 */ 2836 if (HZ > USER_HZ) 2837 rt_expires = addrconf_timeout_fixup(valid_lft, HZ); 2838 else 2839 rt_expires = addrconf_timeout_fixup(valid_lft, USER_HZ); 2840 2841 if (addrconf_finite_timeout(rt_expires)) 2842 rt_expires *= HZ; 2843 2844 rt = addrconf_get_prefix_route(&pinfo->prefix, 2845 pinfo->prefix_len, 2846 dev, 2847 RTF_ADDRCONF | RTF_PREFIX_RT, 2848 RTF_DEFAULT, true); 2849 2850 if (rt) { 2851 /* Autoconf prefix route */ 2852 if (valid_lft == 0) { 2853 ip6_del_rt(net, rt, false); 2854 rt = NULL; 2855 } else { 2856 table = rt->fib6_table; 2857 spin_lock_bh(&table->tb6_lock); 2858 2859 if (addrconf_finite_timeout(rt_expires)) { 2860 /* not infinity */ 2861 fib6_set_expires(rt, jiffies + rt_expires); 2862 fib6_add_gc_list(rt); 2863 } else { 2864 fib6_clean_expires(rt); 2865 fib6_remove_gc_list(rt); 2866 } 2867 2868 spin_unlock_bh(&table->tb6_lock); 2869 } 2870 } else if (valid_lft) { 2871 clock_t expires = 0; 2872 int flags = RTF_ADDRCONF | RTF_PREFIX_RT; 2873 if (addrconf_finite_timeout(rt_expires)) { 2874 /* not infinity */ 2875 flags |= RTF_EXPIRES; 2876 expires = jiffies_to_clock_t(rt_expires); 2877 } 2878 addrconf_prefix_route(&pinfo->prefix, pinfo->prefix_len, 2879 0, dev, expires, flags, 2880 GFP_ATOMIC); 2881 } 2882 fib6_info_release(rt); 2883 } 2884 2885 /* Try to figure out our local address for this prefix */ 2886 2887 ignore_autoconf = READ_ONCE(in6_dev->cnf.ra_honor_pio_pflag) && pinfo->preferpd; 2888 if (pinfo->autoconf && in6_dev->cnf.autoconf && !ignore_autoconf) { 2889 struct in6_addr addr; 2890 bool tokenized = false, dev_addr_generated = false; 2891 2892 if (pinfo->prefix_len == 64) { 2893 memcpy(&addr, &pinfo->prefix, 8); 2894 2895 if (!ipv6_addr_any(&in6_dev->token)) { 2896 read_lock_bh(&in6_dev->lock); 2897 memcpy(addr.s6_addr + 8, 2898 in6_dev->token.s6_addr + 8, 8); 2899 read_unlock_bh(&in6_dev->lock); 2900 tokenized = true; 2901 } else if (is_addr_mode_generate_stable(in6_dev) && 2902 !ipv6_generate_stable_address(&addr, 0, 2903 in6_dev)) { 2904 addr_flags |= IFA_F_STABLE_PRIVACY; 2905 goto ok; 2906 } else if (ipv6_generate_eui64(addr.s6_addr + 8, dev) && 2907 ipv6_inherit_eui64(addr.s6_addr + 8, in6_dev)) { 2908 goto put; 2909 } else { 2910 dev_addr_generated = true; 2911 } 2912 goto ok; 2913 } 2914 net_dbg_ratelimited("IPv6 addrconf: prefix with wrong length %d\n", 2915 pinfo->prefix_len); 2916 goto put; 2917 2918 ok: 2919 err = addrconf_prefix_rcv_add_addr(net, dev, pinfo, in6_dev, 2920 &addr, addr_type, 2921 addr_flags, sllao, 2922 tokenized, valid_lft, 2923 prefered_lft); 2924 if (err) 2925 goto put; 2926 2927 /* Ignore error case here because previous prefix add addr was 2928 * successful which will be notified. 2929 */ 2930 ndisc_ops_prefix_rcv_add_addr(net, dev, pinfo, in6_dev, &addr, 2931 addr_type, addr_flags, sllao, 2932 tokenized, valid_lft, 2933 prefered_lft, 2934 dev_addr_generated); 2935 } 2936 inet6_prefix_notify(RTM_NEWPREFIX, in6_dev, pinfo); 2937 put: 2938 in6_dev_put(in6_dev); 2939 } 2940 2941 static int addrconf_set_sit_dstaddr(struct net *net, struct net_device *dev, 2942 struct in6_ifreq *ireq) 2943 { 2944 struct ip_tunnel_parm_kern p = { }; 2945 int err; 2946 2947 if (!(ipv6_addr_type(&ireq->ifr6_addr) & IPV6_ADDR_COMPATv4)) 2948 return -EADDRNOTAVAIL; 2949 2950 p.iph.daddr = ireq->ifr6_addr.s6_addr32[3]; 2951 p.iph.version = 4; 2952 p.iph.ihl = 5; 2953 p.iph.protocol = IPPROTO_IPV6; 2954 p.iph.ttl = 64; 2955 2956 if (!dev->netdev_ops->ndo_tunnel_ctl) 2957 return -EOPNOTSUPP; 2958 err = dev->netdev_ops->ndo_tunnel_ctl(dev, &p, SIOCADDTUNNEL); 2959 if (err) 2960 return err; 2961 2962 dev = __dev_get_by_name(net, p.name); 2963 if (!dev) 2964 return -ENOBUFS; 2965 return dev_open(dev, NULL); 2966 } 2967 2968 /* 2969 * Set destination address. 2970 * Special case for SIT interfaces where we create a new "virtual" 2971 * device. 2972 */ 2973 int addrconf_set_dstaddr(struct net *net, void __user *arg) 2974 { 2975 struct net_device *dev; 2976 struct in6_ifreq ireq; 2977 int err = -ENODEV; 2978 2979 if (!IS_ENABLED(CONFIG_IPV6_SIT)) 2980 return -ENODEV; 2981 if (copy_from_user(&ireq, arg, sizeof(struct in6_ifreq))) 2982 return -EFAULT; 2983 2984 rtnl_net_lock(net); 2985 dev = __dev_get_by_index(net, ireq.ifr6_ifindex); 2986 if (dev && dev->type == ARPHRD_SIT) 2987 err = addrconf_set_sit_dstaddr(net, dev, &ireq); 2988 rtnl_net_unlock(net); 2989 return err; 2990 } 2991 2992 static int ipv6_mc_config(struct sock *sk, bool join, 2993 const struct in6_addr *addr, int ifindex) 2994 { 2995 int ret; 2996 2997 ASSERT_RTNL(); 2998 2999 lock_sock(sk); 3000 if (join) 3001 ret = ipv6_sock_mc_join(sk, ifindex, addr); 3002 else 3003 ret = ipv6_sock_mc_drop(sk, ifindex, addr); 3004 release_sock(sk); 3005 3006 return ret; 3007 } 3008 3009 /* 3010 * Manual configuration of address on an interface 3011 */ 3012 static int inet6_addr_add(struct net *net, struct net_device *dev, 3013 struct ifa6_config *cfg, clock_t expires, u32 flags, 3014 struct netlink_ext_ack *extack) 3015 { 3016 struct inet6_ifaddr *ifp; 3017 struct inet6_dev *idev; 3018 3019 ASSERT_RTNL_NET(net); 3020 3021 if (cfg->plen > 128) { 3022 NL_SET_ERR_MSG_MOD(extack, "Invalid prefix length"); 3023 return -EINVAL; 3024 } 3025 3026 if (cfg->ifa_flags & IFA_F_MANAGETEMPADDR && cfg->plen != 64) { 3027 NL_SET_ERR_MSG_MOD(extack, "address with \"mngtmpaddr\" flag must have a prefix length of 64"); 3028 return -EINVAL; 3029 } 3030 3031 idev = addrconf_add_dev(dev); 3032 if (IS_ERR(idev)) { 3033 NL_SET_ERR_MSG_MOD(extack, "IPv6 is disabled on this device"); 3034 return PTR_ERR(idev); 3035 } 3036 3037 if (cfg->ifa_flags & IFA_F_MCAUTOJOIN) { 3038 int ret = ipv6_mc_config(net->ipv6.mc_autojoin_sk, 3039 true, cfg->pfx, dev->ifindex); 3040 3041 if (ret < 0) { 3042 NL_SET_ERR_MSG_MOD(extack, "Multicast auto join failed"); 3043 return ret; 3044 } 3045 } 3046 3047 cfg->scope = ipv6_addr_scope(cfg->pfx); 3048 3049 ifp = ipv6_add_addr(idev, cfg, true, extack); 3050 if (!IS_ERR(ifp)) { 3051 if (!(cfg->ifa_flags & IFA_F_NOPREFIXROUTE)) { 3052 addrconf_prefix_route(&ifp->addr, ifp->prefix_len, 3053 ifp->rt_priority, dev, expires, 3054 flags, GFP_KERNEL); 3055 } 3056 3057 /* Send a netlink notification if DAD is enabled and 3058 * optimistic flag is not set 3059 */ 3060 if (!(ifp->flags & (IFA_F_OPTIMISTIC | IFA_F_NODAD))) 3061 ipv6_ifa_notify(0, ifp); 3062 /* 3063 * Note that section 3.1 of RFC 4429 indicates 3064 * that the Optimistic flag should not be set for 3065 * manually configured addresses 3066 */ 3067 addrconf_dad_start(ifp); 3068 if (cfg->ifa_flags & IFA_F_MANAGETEMPADDR) 3069 manage_tempaddrs(idev, ifp, cfg->valid_lft, 3070 cfg->preferred_lft, true, jiffies); 3071 in6_ifa_put(ifp); 3072 addrconf_verify_rtnl(net); 3073 return 0; 3074 } else if (cfg->ifa_flags & IFA_F_MCAUTOJOIN) { 3075 ipv6_mc_config(net->ipv6.mc_autojoin_sk, false, 3076 cfg->pfx, dev->ifindex); 3077 } 3078 3079 return PTR_ERR(ifp); 3080 } 3081 3082 static int inet6_addr_del(struct net *net, int ifindex, u32 ifa_flags, 3083 const struct in6_addr *pfx, unsigned int plen, 3084 struct netlink_ext_ack *extack) 3085 { 3086 struct inet6_ifaddr *ifp; 3087 struct inet6_dev *idev; 3088 struct net_device *dev; 3089 3090 if (plen > 128) { 3091 NL_SET_ERR_MSG_MOD(extack, "Invalid prefix length"); 3092 return -EINVAL; 3093 } 3094 3095 dev = __dev_get_by_index(net, ifindex); 3096 if (!dev) { 3097 NL_SET_ERR_MSG_MOD(extack, "Unable to find the interface"); 3098 return -ENODEV; 3099 } 3100 3101 idev = __in6_dev_get_rtnl_net(dev); 3102 if (!idev) { 3103 NL_SET_ERR_MSG_MOD(extack, "IPv6 is disabled on this device"); 3104 return -ENXIO; 3105 } 3106 3107 read_lock_bh(&idev->lock); 3108 list_for_each_entry(ifp, &idev->addr_list, if_list) { 3109 if (ifp->prefix_len == plen && 3110 ipv6_addr_equal(pfx, &ifp->addr)) { 3111 in6_ifa_hold(ifp); 3112 read_unlock_bh(&idev->lock); 3113 3114 ipv6_del_addr(ifp); 3115 3116 if (!(ifp->flags & IFA_F_TEMPORARY) && 3117 (ifp->flags & IFA_F_MANAGETEMPADDR)) 3118 delete_tempaddrs(idev, ifp); 3119 3120 addrconf_verify_rtnl(net); 3121 if (ipv6_addr_is_multicast(pfx)) { 3122 ipv6_mc_config(net->ipv6.mc_autojoin_sk, 3123 false, pfx, dev->ifindex); 3124 } 3125 return 0; 3126 } 3127 } 3128 read_unlock_bh(&idev->lock); 3129 3130 NL_SET_ERR_MSG_MOD(extack, "address not found"); 3131 return -EADDRNOTAVAIL; 3132 } 3133 3134 3135 int addrconf_add_ifaddr(struct net *net, void __user *arg) 3136 { 3137 struct ifa6_config cfg = { 3138 .ifa_flags = IFA_F_PERMANENT, 3139 .preferred_lft = INFINITY_LIFE_TIME, 3140 .valid_lft = INFINITY_LIFE_TIME, 3141 }; 3142 struct net_device *dev; 3143 struct in6_ifreq ireq; 3144 int err; 3145 3146 if (!ns_capable(net->user_ns, CAP_NET_ADMIN)) 3147 return -EPERM; 3148 3149 if (copy_from_user(&ireq, arg, sizeof(struct in6_ifreq))) 3150 return -EFAULT; 3151 3152 cfg.pfx = &ireq.ifr6_addr; 3153 cfg.plen = ireq.ifr6_prefixlen; 3154 3155 rtnl_net_lock(net); 3156 dev = __dev_get_by_index(net, ireq.ifr6_ifindex); 3157 if (dev) { 3158 netdev_lock_ops(dev); 3159 err = inet6_addr_add(net, dev, &cfg, 0, 0, NULL); 3160 netdev_unlock_ops(dev); 3161 } else { 3162 err = -ENODEV; 3163 } 3164 rtnl_net_unlock(net); 3165 return err; 3166 } 3167 3168 int addrconf_del_ifaddr(struct net *net, void __user *arg) 3169 { 3170 struct in6_ifreq ireq; 3171 int err; 3172 3173 if (!ns_capable(net->user_ns, CAP_NET_ADMIN)) 3174 return -EPERM; 3175 3176 if (copy_from_user(&ireq, arg, sizeof(struct in6_ifreq))) 3177 return -EFAULT; 3178 3179 rtnl_net_lock(net); 3180 err = inet6_addr_del(net, ireq.ifr6_ifindex, 0, &ireq.ifr6_addr, 3181 ireq.ifr6_prefixlen, NULL); 3182 rtnl_net_unlock(net); 3183 return err; 3184 } 3185 3186 static void add_addr(struct inet6_dev *idev, const struct in6_addr *addr, 3187 int plen, int scope, u8 proto) 3188 { 3189 struct inet6_ifaddr *ifp; 3190 struct ifa6_config cfg = { 3191 .pfx = addr, 3192 .plen = plen, 3193 .ifa_flags = IFA_F_PERMANENT, 3194 .valid_lft = INFINITY_LIFE_TIME, 3195 .preferred_lft = INFINITY_LIFE_TIME, 3196 .scope = scope, 3197 .ifa_proto = proto 3198 }; 3199 3200 ifp = ipv6_add_addr(idev, &cfg, true, NULL); 3201 if (!IS_ERR(ifp)) { 3202 spin_lock_bh(&ifp->lock); 3203 ifp->flags &= ~IFA_F_TENTATIVE; 3204 spin_unlock_bh(&ifp->lock); 3205 rt_genid_bump_ipv6(dev_net(idev->dev)); 3206 ipv6_ifa_notify(RTM_NEWADDR, ifp); 3207 in6_ifa_put(ifp); 3208 } 3209 } 3210 3211 #if IS_ENABLED(CONFIG_IPV6_SIT) || IS_ENABLED(CONFIG_NET_IPGRE) || IS_ENABLED(CONFIG_IPV6_GRE) 3212 static void add_v4_addrs(struct inet6_dev *idev) 3213 { 3214 struct in6_addr addr; 3215 struct net_device *dev; 3216 struct net *net = dev_net(idev->dev); 3217 int scope, plen; 3218 u32 pflags = 0; 3219 3220 ASSERT_RTNL(); 3221 3222 memset(&addr, 0, sizeof(struct in6_addr)); 3223 memcpy(&addr.s6_addr32[3], idev->dev->dev_addr, 4); 3224 3225 if (!(idev->dev->flags & IFF_POINTOPOINT) && idev->dev->type == ARPHRD_SIT) { 3226 scope = IPV6_ADDR_COMPATv4; 3227 plen = 96; 3228 pflags |= RTF_NONEXTHOP; 3229 } else { 3230 if (idev->cnf.addr_gen_mode == IN6_ADDR_GEN_MODE_NONE) 3231 return; 3232 3233 addr.s6_addr32[0] = htonl(0xfe800000); 3234 scope = IFA_LINK; 3235 plen = 64; 3236 } 3237 3238 if (addr.s6_addr32[3]) { 3239 add_addr(idev, &addr, plen, scope, IFAPROT_UNSPEC); 3240 addrconf_prefix_route(&addr, plen, 0, idev->dev, 0, pflags, 3241 GFP_KERNEL); 3242 return; 3243 } 3244 3245 for_each_netdev(net, dev) { 3246 struct in_device *in_dev = __in_dev_get_rtnl(dev); 3247 if (in_dev && (dev->flags & IFF_UP)) { 3248 struct in_ifaddr *ifa; 3249 int flag = scope; 3250 3251 in_dev_for_each_ifa_rtnl(ifa, in_dev) { 3252 addr.s6_addr32[3] = ifa->ifa_local; 3253 3254 if (ifa->ifa_scope == RT_SCOPE_LINK) 3255 continue; 3256 if (ifa->ifa_scope >= RT_SCOPE_HOST) { 3257 if (idev->dev->flags&IFF_POINTOPOINT) 3258 continue; 3259 flag |= IFA_HOST; 3260 } 3261 3262 add_addr(idev, &addr, plen, flag, 3263 IFAPROT_UNSPEC); 3264 addrconf_prefix_route(&addr, plen, 0, idev->dev, 3265 0, pflags, GFP_KERNEL); 3266 } 3267 } 3268 } 3269 } 3270 #endif 3271 3272 static void init_loopback(struct net_device *dev) 3273 { 3274 struct inet6_dev *idev; 3275 3276 /* ::1 */ 3277 3278 ASSERT_RTNL(); 3279 3280 idev = ipv6_find_idev(dev); 3281 if (IS_ERR(idev)) { 3282 pr_debug("%s: add_dev failed\n", __func__); 3283 return; 3284 } 3285 3286 add_addr(idev, &in6addr_loopback, 128, IFA_HOST, IFAPROT_KERNEL_LO); 3287 } 3288 3289 void addrconf_add_linklocal(struct inet6_dev *idev, 3290 const struct in6_addr *addr, u32 flags) 3291 { 3292 struct ifa6_config cfg = { 3293 .pfx = addr, 3294 .plen = 64, 3295 .ifa_flags = flags | IFA_F_PERMANENT, 3296 .valid_lft = INFINITY_LIFE_TIME, 3297 .preferred_lft = INFINITY_LIFE_TIME, 3298 .scope = IFA_LINK, 3299 .ifa_proto = IFAPROT_KERNEL_LL 3300 }; 3301 struct inet6_ifaddr *ifp; 3302 3303 #ifdef CONFIG_IPV6_OPTIMISTIC_DAD 3304 if ((READ_ONCE(dev_net(idev->dev)->ipv6.devconf_all->optimistic_dad) || 3305 READ_ONCE(idev->cnf.optimistic_dad)) && 3306 !dev_net(idev->dev)->ipv6.devconf_all->forwarding) 3307 cfg.ifa_flags |= IFA_F_OPTIMISTIC; 3308 #endif 3309 3310 ifp = ipv6_add_addr(idev, &cfg, true, NULL); 3311 if (!IS_ERR(ifp)) { 3312 addrconf_prefix_route(&ifp->addr, ifp->prefix_len, 0, idev->dev, 3313 0, 0, GFP_ATOMIC); 3314 addrconf_dad_start(ifp); 3315 in6_ifa_put(ifp); 3316 } 3317 } 3318 EXPORT_SYMBOL_GPL(addrconf_add_linklocal); 3319 3320 static bool ipv6_reserved_interfaceid(struct in6_addr address) 3321 { 3322 if ((address.s6_addr32[2] | address.s6_addr32[3]) == 0) 3323 return true; 3324 3325 if (address.s6_addr32[2] == htonl(0x02005eff) && 3326 ((address.s6_addr32[3] & htonl(0xfe000000)) == htonl(0xfe000000))) 3327 return true; 3328 3329 if (address.s6_addr32[2] == htonl(0xfdffffff) && 3330 ((address.s6_addr32[3] & htonl(0xffffff80)) == htonl(0xffffff80))) 3331 return true; 3332 3333 return false; 3334 } 3335 3336 static int ipv6_generate_stable_address(struct in6_addr *address, 3337 u8 dad_count, 3338 const struct inet6_dev *idev) 3339 { 3340 static DEFINE_SPINLOCK(lock); 3341 static __u32 digest[SHA1_DIGEST_WORDS]; 3342 static __u32 workspace[SHA1_WORKSPACE_WORDS]; 3343 3344 static union { 3345 char __data[SHA1_BLOCK_SIZE]; 3346 struct { 3347 struct in6_addr secret; 3348 __be32 prefix[2]; 3349 unsigned char hwaddr[MAX_ADDR_LEN]; 3350 u8 dad_count; 3351 } __packed; 3352 } data; 3353 3354 struct in6_addr secret; 3355 struct in6_addr temp; 3356 struct net *net = dev_net(idev->dev); 3357 3358 BUILD_BUG_ON(sizeof(data.__data) != sizeof(data)); 3359 3360 if (idev->cnf.stable_secret.initialized) 3361 secret = idev->cnf.stable_secret.secret; 3362 else if (net->ipv6.devconf_dflt->stable_secret.initialized) 3363 secret = net->ipv6.devconf_dflt->stable_secret.secret; 3364 else 3365 return -1; 3366 3367 retry: 3368 spin_lock_bh(&lock); 3369 3370 sha1_init_raw(digest); 3371 memset(&data, 0, sizeof(data)); 3372 memset(workspace, 0, sizeof(workspace)); 3373 memcpy(data.hwaddr, idev->dev->perm_addr, idev->dev->addr_len); 3374 data.prefix[0] = address->s6_addr32[0]; 3375 data.prefix[1] = address->s6_addr32[1]; 3376 data.secret = secret; 3377 data.dad_count = dad_count; 3378 3379 sha1_transform(digest, data.__data, workspace); 3380 3381 temp = *address; 3382 temp.s6_addr32[2] = (__force __be32)digest[0]; 3383 temp.s6_addr32[3] = (__force __be32)digest[1]; 3384 3385 spin_unlock_bh(&lock); 3386 3387 if (ipv6_reserved_interfaceid(temp)) { 3388 dad_count++; 3389 if (dad_count > dev_net(idev->dev)->ipv6.sysctl.idgen_retries) 3390 return -1; 3391 goto retry; 3392 } 3393 3394 *address = temp; 3395 return 0; 3396 } 3397 3398 static void ipv6_gen_mode_random_init(struct inet6_dev *idev) 3399 { 3400 struct ipv6_stable_secret *s = &idev->cnf.stable_secret; 3401 3402 if (s->initialized) 3403 return; 3404 s = &idev->cnf.stable_secret; 3405 get_random_bytes(&s->secret, sizeof(s->secret)); 3406 s->initialized = true; 3407 } 3408 3409 static void addrconf_addr_gen(struct inet6_dev *idev, bool prefix_route) 3410 { 3411 struct in6_addr addr; 3412 3413 /* no link local addresses on L3 master devices */ 3414 if (netif_is_l3_master(idev->dev)) 3415 return; 3416 3417 /* no link local addresses on devices flagged as slaves */ 3418 if (idev->dev->priv_flags & IFF_NO_ADDRCONF) 3419 return; 3420 3421 ipv6_addr_set(&addr, htonl(0xFE800000), 0, 0, 0); 3422 3423 switch (idev->cnf.addr_gen_mode) { 3424 case IN6_ADDR_GEN_MODE_RANDOM: 3425 ipv6_gen_mode_random_init(idev); 3426 fallthrough; 3427 case IN6_ADDR_GEN_MODE_STABLE_PRIVACY: 3428 if (!ipv6_generate_stable_address(&addr, 0, idev)) 3429 addrconf_add_linklocal(idev, &addr, 3430 IFA_F_STABLE_PRIVACY); 3431 else if (prefix_route) 3432 addrconf_prefix_route(&addr, 64, 0, idev->dev, 3433 0, 0, GFP_KERNEL); 3434 break; 3435 case IN6_ADDR_GEN_MODE_EUI64: 3436 /* addrconf_add_linklocal also adds a prefix_route and we 3437 * only need to care about prefix routes if ipv6_generate_eui64 3438 * couldn't generate one. 3439 */ 3440 if (ipv6_generate_eui64(addr.s6_addr + 8, idev->dev) == 0) 3441 addrconf_add_linklocal(idev, &addr, 0); 3442 else if (prefix_route) 3443 addrconf_prefix_route(&addr, 64, 0, idev->dev, 3444 0, 0, GFP_KERNEL); 3445 break; 3446 case IN6_ADDR_GEN_MODE_NONE: 3447 default: 3448 /* will not add any link local address */ 3449 break; 3450 } 3451 } 3452 3453 static void addrconf_dev_config(struct net_device *dev) 3454 { 3455 struct inet6_dev *idev; 3456 3457 ASSERT_RTNL(); 3458 3459 if ((dev->type != ARPHRD_ETHER) && 3460 (dev->type != ARPHRD_FDDI) && 3461 (dev->type != ARPHRD_ARCNET) && 3462 (dev->type != ARPHRD_INFINIBAND) && 3463 (dev->type != ARPHRD_IEEE1394) && 3464 (dev->type != ARPHRD_TUNNEL6) && 3465 (dev->type != ARPHRD_6LOWPAN) && 3466 (dev->type != ARPHRD_TUNNEL) && 3467 (dev->type != ARPHRD_NONE) && 3468 (dev->type != ARPHRD_RAWIP)) { 3469 /* Alas, we support only Ethernet autoconfiguration. */ 3470 idev = __in6_dev_get(dev); 3471 if (!IS_ERR_OR_NULL(idev) && dev->flags & IFF_UP && 3472 dev->flags & IFF_MULTICAST) 3473 ipv6_mc_up(idev); 3474 return; 3475 } 3476 3477 idev = addrconf_add_dev(dev); 3478 if (IS_ERR(idev)) 3479 return; 3480 3481 /* this device type has no EUI support */ 3482 if (dev->type == ARPHRD_NONE && 3483 idev->cnf.addr_gen_mode == IN6_ADDR_GEN_MODE_EUI64) 3484 WRITE_ONCE(idev->cnf.addr_gen_mode, 3485 IN6_ADDR_GEN_MODE_RANDOM); 3486 3487 addrconf_addr_gen(idev, false); 3488 } 3489 3490 #if IS_ENABLED(CONFIG_IPV6_SIT) 3491 static void addrconf_sit_config(struct net_device *dev) 3492 { 3493 struct inet6_dev *idev; 3494 3495 ASSERT_RTNL(); 3496 3497 /* 3498 * Configure the tunnel with one of our IPv4 3499 * addresses... we should configure all of 3500 * our v4 addrs in the tunnel 3501 */ 3502 3503 idev = ipv6_find_idev(dev); 3504 if (IS_ERR(idev)) { 3505 pr_debug("%s: add_dev failed\n", __func__); 3506 return; 3507 } 3508 3509 if (dev->priv_flags & IFF_ISATAP) { 3510 addrconf_addr_gen(idev, false); 3511 return; 3512 } 3513 3514 add_v4_addrs(idev); 3515 3516 if (dev->flags&IFF_POINTOPOINT) 3517 addrconf_add_mroute(dev); 3518 } 3519 #endif 3520 3521 #if IS_ENABLED(CONFIG_NET_IPGRE) || IS_ENABLED(CONFIG_IPV6_GRE) 3522 static void addrconf_gre_config(struct net_device *dev) 3523 { 3524 struct inet6_dev *idev; 3525 3526 ASSERT_RTNL(); 3527 3528 idev = addrconf_add_dev(dev); 3529 if (IS_ERR(idev)) 3530 return; 3531 3532 /* Generate the IPv6 link-local address using addrconf_addr_gen(), 3533 * unless we have an IPv4 GRE device not bound to an IP address and 3534 * which is in EUI64 mode (as __ipv6_isatap_ifid() would fail in this 3535 * case). Such devices fall back to add_v4_addrs() instead. 3536 */ 3537 if (!(dev->type == ARPHRD_IPGRE && *(__be32 *)dev->dev_addr == 0 && 3538 idev->cnf.addr_gen_mode == IN6_ADDR_GEN_MODE_EUI64)) { 3539 addrconf_addr_gen(idev, true); 3540 return; 3541 } 3542 3543 add_v4_addrs(idev); 3544 } 3545 #endif 3546 3547 static void addrconf_init_auto_addrs(struct net_device *dev) 3548 { 3549 switch (dev->type) { 3550 #if IS_ENABLED(CONFIG_IPV6_SIT) 3551 case ARPHRD_SIT: 3552 addrconf_sit_config(dev); 3553 break; 3554 #endif 3555 #if IS_ENABLED(CONFIG_NET_IPGRE) || IS_ENABLED(CONFIG_IPV6_GRE) 3556 case ARPHRD_IP6GRE: 3557 case ARPHRD_IPGRE: 3558 addrconf_gre_config(dev); 3559 break; 3560 #endif 3561 case ARPHRD_LOOPBACK: 3562 init_loopback(dev); 3563 break; 3564 3565 default: 3566 addrconf_dev_config(dev); 3567 break; 3568 } 3569 } 3570 3571 static int fixup_permanent_addr(struct net *net, 3572 struct inet6_dev *idev, 3573 struct inet6_ifaddr *ifp) 3574 { 3575 /* !fib6_node means the host route was removed from the 3576 * FIB, for example, if 'lo' device is taken down. In that 3577 * case regenerate the host route. 3578 */ 3579 if (!ifp->rt || !ifp->rt->fib6_node) { 3580 struct fib6_info *f6i, *prev; 3581 3582 f6i = addrconf_f6i_alloc(net, idev, &ifp->addr, false, 3583 GFP_ATOMIC, NULL); 3584 if (IS_ERR(f6i)) 3585 return PTR_ERR(f6i); 3586 3587 /* ifp->rt can be accessed outside of rtnl */ 3588 spin_lock(&ifp->lock); 3589 prev = ifp->rt; 3590 ifp->rt = f6i; 3591 spin_unlock(&ifp->lock); 3592 3593 fib6_info_release(prev); 3594 } 3595 3596 if (!(ifp->flags & IFA_F_NOPREFIXROUTE)) { 3597 addrconf_prefix_route(&ifp->addr, ifp->prefix_len, 3598 ifp->rt_priority, idev->dev, 0, 0, 3599 GFP_ATOMIC); 3600 } 3601 3602 if (ifp->state == INET6_IFADDR_STATE_PREDAD) 3603 addrconf_dad_start(ifp); 3604 3605 return 0; 3606 } 3607 3608 static void addrconf_permanent_addr(struct net *net, struct net_device *dev) 3609 { 3610 struct inet6_ifaddr *ifp, *tmp; 3611 struct inet6_dev *idev; 3612 3613 idev = __in6_dev_get(dev); 3614 if (!idev) 3615 return; 3616 3617 write_lock_bh(&idev->lock); 3618 3619 list_for_each_entry_safe(ifp, tmp, &idev->addr_list, if_list) { 3620 if ((ifp->flags & IFA_F_PERMANENT) && 3621 fixup_permanent_addr(net, idev, ifp) < 0) { 3622 write_unlock_bh(&idev->lock); 3623 in6_ifa_hold(ifp); 3624 ipv6_del_addr(ifp); 3625 write_lock_bh(&idev->lock); 3626 3627 net_info_ratelimited("%s: Failed to add prefix route for address %pI6c; dropping\n", 3628 idev->dev->name, &ifp->addr); 3629 } 3630 } 3631 3632 write_unlock_bh(&idev->lock); 3633 } 3634 3635 static int addrconf_notify(struct notifier_block *this, unsigned long event, 3636 void *ptr) 3637 { 3638 struct net_device *dev = netdev_notifier_info_to_dev(ptr); 3639 struct netdev_notifier_change_info *change_info; 3640 struct netdev_notifier_changeupper_info *info; 3641 struct inet6_dev *idev = __in6_dev_get(dev); 3642 struct net *net = dev_net(dev); 3643 int run_pending = 0; 3644 int err; 3645 3646 switch (event) { 3647 case NETDEV_REGISTER: 3648 if (!idev && dev->mtu >= IPV6_MIN_MTU) { 3649 idev = ipv6_add_dev(dev); 3650 if (IS_ERR(idev)) 3651 return notifier_from_errno(PTR_ERR(idev)); 3652 } 3653 break; 3654 3655 case NETDEV_CHANGEMTU: 3656 /* if MTU under IPV6_MIN_MTU stop IPv6 on this interface. */ 3657 if (dev->mtu < IPV6_MIN_MTU) { 3658 addrconf_ifdown(dev, dev != net->loopback_dev); 3659 break; 3660 } 3661 3662 if (idev) { 3663 rt6_mtu_change(dev, dev->mtu); 3664 WRITE_ONCE(idev->cnf.mtu6, dev->mtu); 3665 break; 3666 } 3667 3668 /* allocate new idev */ 3669 idev = ipv6_add_dev(dev); 3670 if (IS_ERR(idev)) 3671 break; 3672 3673 /* device is still not ready */ 3674 if (!(idev->if_flags & IF_READY)) 3675 break; 3676 3677 run_pending = 1; 3678 fallthrough; 3679 case NETDEV_UP: 3680 case NETDEV_CHANGE: 3681 if (idev && idev->cnf.disable_ipv6) 3682 break; 3683 3684 if (dev->priv_flags & IFF_NO_ADDRCONF) { 3685 if (event == NETDEV_UP && !IS_ERR_OR_NULL(idev) && 3686 dev->flags & IFF_UP && dev->flags & IFF_MULTICAST) 3687 ipv6_mc_up(idev); 3688 break; 3689 } 3690 3691 if (event == NETDEV_UP) { 3692 /* restore routes for permanent addresses */ 3693 addrconf_permanent_addr(net, dev); 3694 3695 if (!addrconf_link_ready(dev)) { 3696 /* device is not ready yet. */ 3697 pr_debug("ADDRCONF(NETDEV_UP): %s: link is not ready\n", 3698 dev->name); 3699 break; 3700 } 3701 3702 if (!idev && dev->mtu >= IPV6_MIN_MTU) 3703 idev = ipv6_add_dev(dev); 3704 3705 if (!IS_ERR_OR_NULL(idev)) { 3706 idev->if_flags |= IF_READY; 3707 run_pending = 1; 3708 } 3709 } else if (event == NETDEV_CHANGE) { 3710 if (!addrconf_link_ready(dev)) { 3711 /* device is still not ready. */ 3712 rt6_sync_down_dev(dev, event); 3713 break; 3714 } 3715 3716 if (!IS_ERR_OR_NULL(idev)) { 3717 if (idev->if_flags & IF_READY) { 3718 /* device is already configured - 3719 * but resend MLD reports, we might 3720 * have roamed and need to update 3721 * multicast snooping switches 3722 */ 3723 ipv6_mc_up(idev); 3724 change_info = ptr; 3725 if (change_info->flags_changed & IFF_NOARP) 3726 addrconf_dad_run(idev, true); 3727 rt6_sync_up(dev, RTNH_F_LINKDOWN); 3728 break; 3729 } 3730 idev->if_flags |= IF_READY; 3731 } 3732 3733 pr_debug("ADDRCONF(NETDEV_CHANGE): %s: link becomes ready\n", 3734 dev->name); 3735 3736 run_pending = 1; 3737 } 3738 3739 addrconf_init_auto_addrs(dev); 3740 3741 if (!IS_ERR_OR_NULL(idev)) { 3742 if (run_pending) 3743 addrconf_dad_run(idev, false); 3744 3745 /* Device has an address by now */ 3746 rt6_sync_up(dev, RTNH_F_DEAD); 3747 3748 /* 3749 * If the MTU changed during the interface down, 3750 * when the interface up, the changed MTU must be 3751 * reflected in the idev as well as routers. 3752 */ 3753 if (idev->cnf.mtu6 != dev->mtu && 3754 dev->mtu >= IPV6_MIN_MTU) { 3755 rt6_mtu_change(dev, dev->mtu); 3756 WRITE_ONCE(idev->cnf.mtu6, dev->mtu); 3757 } 3758 WRITE_ONCE(idev->tstamp, jiffies); 3759 inet6_ifinfo_notify(RTM_NEWLINK, idev); 3760 3761 /* 3762 * If the changed mtu during down is lower than 3763 * IPV6_MIN_MTU stop IPv6 on this interface. 3764 */ 3765 if (dev->mtu < IPV6_MIN_MTU) 3766 addrconf_ifdown(dev, dev != net->loopback_dev); 3767 } 3768 break; 3769 3770 case NETDEV_DOWN: 3771 case NETDEV_UNREGISTER: 3772 /* 3773 * Remove all addresses from this interface. 3774 */ 3775 addrconf_ifdown(dev, event != NETDEV_DOWN); 3776 break; 3777 3778 case NETDEV_CHANGENAME: 3779 if (idev) { 3780 snmp6_unregister_dev(idev); 3781 addrconf_sysctl_unregister(idev); 3782 err = addrconf_sysctl_register(idev); 3783 if (err) 3784 return notifier_from_errno(err); 3785 err = snmp6_register_dev(idev); 3786 if (err) { 3787 addrconf_sysctl_unregister(idev); 3788 return notifier_from_errno(err); 3789 } 3790 } 3791 break; 3792 3793 case NETDEV_PRE_TYPE_CHANGE: 3794 case NETDEV_POST_TYPE_CHANGE: 3795 if (idev) 3796 addrconf_type_change(dev, event); 3797 break; 3798 3799 case NETDEV_CHANGEUPPER: 3800 info = ptr; 3801 3802 /* flush all routes if dev is linked to or unlinked from 3803 * an L3 master device (e.g., VRF) 3804 */ 3805 if (info->upper_dev && netif_is_l3_master(info->upper_dev)) 3806 addrconf_ifdown(dev, false); 3807 } 3808 3809 return NOTIFY_OK; 3810 } 3811 3812 /* 3813 * addrconf module should be notified of a device going up 3814 */ 3815 static struct notifier_block ipv6_dev_notf = { 3816 .notifier_call = addrconf_notify, 3817 .priority = ADDRCONF_NOTIFY_PRIORITY, 3818 }; 3819 3820 static void addrconf_type_change(struct net_device *dev, unsigned long event) 3821 { 3822 struct inet6_dev *idev; 3823 ASSERT_RTNL(); 3824 3825 idev = __in6_dev_get(dev); 3826 3827 if (event == NETDEV_POST_TYPE_CHANGE) 3828 ipv6_mc_remap(idev); 3829 else if (event == NETDEV_PRE_TYPE_CHANGE) 3830 ipv6_mc_unmap(idev); 3831 } 3832 3833 static bool addr_is_local(const struct in6_addr *addr) 3834 { 3835 return ipv6_addr_type(addr) & 3836 (IPV6_ADDR_LINKLOCAL | IPV6_ADDR_LOOPBACK); 3837 } 3838 3839 static int addrconf_ifdown(struct net_device *dev, bool unregister) 3840 { 3841 unsigned long event = unregister ? NETDEV_UNREGISTER : NETDEV_DOWN; 3842 struct net *net = dev_net(dev); 3843 struct inet6_dev *idev; 3844 struct inet6_ifaddr *ifa; 3845 LIST_HEAD(tmp_addr_list); 3846 bool keep_addr = false; 3847 bool was_ready; 3848 int state, i; 3849 3850 ASSERT_RTNL(); 3851 3852 rt6_disable_ip(dev, event); 3853 3854 idev = __in6_dev_get(dev); 3855 if (!idev) 3856 return -ENODEV; 3857 3858 /* 3859 * Step 1: remove reference to ipv6 device from parent device. 3860 * Do not dev_put! 3861 */ 3862 if (unregister) { 3863 idev->dead = 1; 3864 3865 /* protected by rtnl_lock */ 3866 RCU_INIT_POINTER(dev->ip6_ptr, NULL); 3867 3868 /* Step 1.5: remove snmp6 entry */ 3869 snmp6_unregister_dev(idev); 3870 3871 } 3872 3873 /* combine the user config with event to determine if permanent 3874 * addresses are to be removed from address hash table 3875 */ 3876 if (!unregister && !idev->cnf.disable_ipv6) { 3877 /* aggregate the system setting and interface setting */ 3878 int _keep_addr = READ_ONCE(net->ipv6.devconf_all->keep_addr_on_down); 3879 3880 if (!_keep_addr) 3881 _keep_addr = READ_ONCE(idev->cnf.keep_addr_on_down); 3882 3883 keep_addr = (_keep_addr > 0); 3884 } 3885 3886 /* Step 2: clear hash table */ 3887 for (i = 0; i < IN6_ADDR_HSIZE; i++) { 3888 struct hlist_head *h = &net->ipv6.inet6_addr_lst[i]; 3889 3890 spin_lock_bh(&net->ipv6.addrconf_hash_lock); 3891 restart: 3892 hlist_for_each_entry_rcu(ifa, h, addr_lst) { 3893 if (ifa->idev == idev) { 3894 addrconf_del_dad_work(ifa); 3895 /* combined flag + permanent flag decide if 3896 * address is retained on a down event 3897 */ 3898 if (!keep_addr || 3899 !(ifa->flags & IFA_F_PERMANENT) || 3900 addr_is_local(&ifa->addr)) { 3901 hlist_del_init_rcu(&ifa->addr_lst); 3902 goto restart; 3903 } 3904 } 3905 } 3906 spin_unlock_bh(&net->ipv6.addrconf_hash_lock); 3907 } 3908 3909 write_lock_bh(&idev->lock); 3910 3911 addrconf_del_rs_timer(idev); 3912 3913 /* Step 2: clear flags for stateless addrconf, repeated down 3914 * detection 3915 */ 3916 was_ready = idev->if_flags & IF_READY; 3917 if (!unregister) 3918 idev->if_flags &= ~(IF_RS_SENT|IF_RA_RCVD|IF_READY); 3919 3920 /* Step 3: clear tempaddr list */ 3921 while (!list_empty(&idev->tempaddr_list)) { 3922 ifa = list_first_entry(&idev->tempaddr_list, 3923 struct inet6_ifaddr, tmp_list); 3924 list_del(&ifa->tmp_list); 3925 write_unlock_bh(&idev->lock); 3926 spin_lock_bh(&ifa->lock); 3927 3928 if (ifa->ifpub) { 3929 in6_ifa_put(ifa->ifpub); 3930 ifa->ifpub = NULL; 3931 } 3932 spin_unlock_bh(&ifa->lock); 3933 in6_ifa_put(ifa); 3934 write_lock_bh(&idev->lock); 3935 } 3936 3937 list_for_each_entry(ifa, &idev->addr_list, if_list) 3938 list_add_tail(&ifa->if_list_aux, &tmp_addr_list); 3939 write_unlock_bh(&idev->lock); 3940 3941 while (!list_empty(&tmp_addr_list)) { 3942 struct fib6_info *rt = NULL; 3943 bool keep; 3944 3945 ifa = list_first_entry(&tmp_addr_list, 3946 struct inet6_ifaddr, if_list_aux); 3947 list_del(&ifa->if_list_aux); 3948 3949 addrconf_del_dad_work(ifa); 3950 3951 keep = keep_addr && (ifa->flags & IFA_F_PERMANENT) && 3952 !addr_is_local(&ifa->addr); 3953 3954 spin_lock_bh(&ifa->lock); 3955 3956 if (keep) { 3957 /* set state to skip the notifier below */ 3958 state = INET6_IFADDR_STATE_DEAD; 3959 ifa->state = INET6_IFADDR_STATE_PREDAD; 3960 if (!(ifa->flags & IFA_F_NODAD)) 3961 ifa->flags |= IFA_F_TENTATIVE; 3962 3963 rt = ifa->rt; 3964 ifa->rt = NULL; 3965 } else { 3966 state = ifa->state; 3967 ifa->state = INET6_IFADDR_STATE_DEAD; 3968 } 3969 3970 spin_unlock_bh(&ifa->lock); 3971 3972 if (rt) 3973 ip6_del_rt(net, rt, false); 3974 3975 if (state != INET6_IFADDR_STATE_DEAD) { 3976 __ipv6_ifa_notify(RTM_DELADDR, ifa); 3977 inet6addr_notifier_call_chain(NETDEV_DOWN, ifa); 3978 } else { 3979 if (idev->cnf.forwarding) 3980 addrconf_leave_anycast(ifa); 3981 addrconf_leave_solict(ifa->idev, &ifa->addr); 3982 } 3983 3984 if (!keep) { 3985 write_lock_bh(&idev->lock); 3986 list_del_rcu(&ifa->if_list); 3987 write_unlock_bh(&idev->lock); 3988 in6_ifa_put(ifa); 3989 } 3990 } 3991 3992 /* Step 5: Discard anycast and multicast list */ 3993 if (unregister) { 3994 ipv6_ac_destroy_dev(idev); 3995 ipv6_mc_destroy_dev(idev); 3996 } else if (was_ready) { 3997 ipv6_mc_down(idev); 3998 } 3999 4000 WRITE_ONCE(idev->tstamp, jiffies); 4001 idev->ra_mtu = 0; 4002 4003 /* Last: Shot the device (if unregistered) */ 4004 if (unregister) { 4005 addrconf_sysctl_unregister(idev); 4006 neigh_parms_release(&nd_tbl, idev->nd_parms); 4007 neigh_ifdown(&nd_tbl, dev); 4008 in6_dev_put(idev); 4009 } 4010 return 0; 4011 } 4012 4013 static void addrconf_rs_timer(struct timer_list *t) 4014 { 4015 struct inet6_dev *idev = timer_container_of(idev, t, rs_timer); 4016 struct net_device *dev = idev->dev; 4017 struct in6_addr lladdr; 4018 int rtr_solicits; 4019 4020 write_lock(&idev->lock); 4021 if (idev->dead || !(idev->if_flags & IF_READY)) 4022 goto out; 4023 4024 if (!ipv6_accept_ra(idev)) 4025 goto out; 4026 4027 /* Announcement received after solicitation was sent */ 4028 if (idev->if_flags & IF_RA_RCVD) 4029 goto out; 4030 4031 rtr_solicits = READ_ONCE(idev->cnf.rtr_solicits); 4032 4033 if (idev->rs_probes++ < rtr_solicits || rtr_solicits < 0) { 4034 write_unlock(&idev->lock); 4035 if (!ipv6_get_lladdr(dev, &lladdr, IFA_F_TENTATIVE)) 4036 ndisc_send_rs(dev, &lladdr, 4037 &in6addr_linklocal_allrouters); 4038 else 4039 goto put; 4040 4041 write_lock(&idev->lock); 4042 idev->rs_interval = rfc3315_s14_backoff_update( 4043 idev->rs_interval, 4044 READ_ONCE(idev->cnf.rtr_solicit_max_interval)); 4045 /* The wait after the last probe can be shorter */ 4046 addrconf_mod_rs_timer(idev, (idev->rs_probes == 4047 READ_ONCE(idev->cnf.rtr_solicits)) ? 4048 READ_ONCE(idev->cnf.rtr_solicit_delay) : 4049 idev->rs_interval); 4050 } else { 4051 /* 4052 * Note: we do not support deprecated "all on-link" 4053 * assumption any longer. 4054 */ 4055 pr_debug("%s: no IPv6 routers present\n", idev->dev->name); 4056 } 4057 4058 out: 4059 write_unlock(&idev->lock); 4060 put: 4061 in6_dev_put(idev); 4062 } 4063 4064 /* 4065 * Duplicate Address Detection 4066 */ 4067 static void addrconf_dad_kick(struct inet6_ifaddr *ifp) 4068 { 4069 struct inet6_dev *idev = ifp->idev; 4070 unsigned long rand_num; 4071 u64 nonce; 4072 4073 if (ifp->flags & IFA_F_OPTIMISTIC) 4074 rand_num = 0; 4075 else 4076 rand_num = get_random_u32_below( 4077 READ_ONCE(idev->cnf.rtr_solicit_delay) ? : 1); 4078 4079 nonce = 0; 4080 if (READ_ONCE(idev->cnf.enhanced_dad) || 4081 READ_ONCE(dev_net(idev->dev)->ipv6.devconf_all->enhanced_dad)) { 4082 do 4083 get_random_bytes(&nonce, 6); 4084 while (nonce == 0); 4085 } 4086 ifp->dad_nonce = nonce; 4087 ifp->dad_probes = READ_ONCE(idev->cnf.dad_transmits); 4088 addrconf_mod_dad_work(ifp, rand_num); 4089 } 4090 4091 static void addrconf_dad_begin(struct inet6_ifaddr *ifp) 4092 { 4093 struct inet6_dev *idev = ifp->idev; 4094 struct net_device *dev = idev->dev; 4095 bool bump_id, notify = false; 4096 struct net *net; 4097 4098 addrconf_join_solict(dev, &ifp->addr); 4099 4100 read_lock_bh(&idev->lock); 4101 spin_lock(&ifp->lock); 4102 if (ifp->state == INET6_IFADDR_STATE_DEAD) 4103 goto out; 4104 4105 net = dev_net(dev); 4106 if (dev->flags&(IFF_NOARP|IFF_LOOPBACK) || 4107 (READ_ONCE(net->ipv6.devconf_all->accept_dad) < 1 && 4108 READ_ONCE(idev->cnf.accept_dad) < 1) || 4109 !(ifp->flags&IFA_F_TENTATIVE) || 4110 ifp->flags & IFA_F_NODAD) { 4111 bool send_na = false; 4112 4113 if (ifp->flags & IFA_F_TENTATIVE && 4114 !(ifp->flags & IFA_F_OPTIMISTIC)) 4115 send_na = true; 4116 bump_id = ifp->flags & IFA_F_TENTATIVE; 4117 ifp->flags &= ~(IFA_F_TENTATIVE|IFA_F_OPTIMISTIC|IFA_F_DADFAILED); 4118 spin_unlock(&ifp->lock); 4119 read_unlock_bh(&idev->lock); 4120 4121 addrconf_dad_completed(ifp, bump_id, send_na); 4122 return; 4123 } 4124 4125 if (!(idev->if_flags & IF_READY)) { 4126 spin_unlock(&ifp->lock); 4127 read_unlock_bh(&idev->lock); 4128 /* 4129 * If the device is not ready: 4130 * - keep it tentative if it is a permanent address. 4131 * - otherwise, kill it. 4132 */ 4133 in6_ifa_hold(ifp); 4134 addrconf_dad_stop(ifp, 0); 4135 return; 4136 } 4137 4138 /* 4139 * Optimistic nodes can start receiving 4140 * Frames right away 4141 */ 4142 if (ifp->flags & IFA_F_OPTIMISTIC) { 4143 ip6_ins_rt(net, ifp->rt); 4144 if (ipv6_use_optimistic_addr(net, idev)) { 4145 /* Because optimistic nodes can use this address, 4146 * notify listeners. If DAD fails, RTM_DELADDR is sent. 4147 */ 4148 notify = true; 4149 } 4150 } 4151 4152 addrconf_dad_kick(ifp); 4153 out: 4154 spin_unlock(&ifp->lock); 4155 read_unlock_bh(&idev->lock); 4156 if (notify) 4157 ipv6_ifa_notify(RTM_NEWADDR, ifp); 4158 } 4159 4160 static void addrconf_dad_start(struct inet6_ifaddr *ifp) 4161 { 4162 bool begin_dad = false; 4163 4164 spin_lock_bh(&ifp->lock); 4165 if (ifp->state != INET6_IFADDR_STATE_DEAD) { 4166 ifp->state = INET6_IFADDR_STATE_PREDAD; 4167 begin_dad = true; 4168 } 4169 spin_unlock_bh(&ifp->lock); 4170 4171 if (begin_dad) 4172 addrconf_mod_dad_work(ifp, 0); 4173 } 4174 4175 static void addrconf_dad_work(struct work_struct *w) 4176 { 4177 struct inet6_ifaddr *ifp = container_of(to_delayed_work(w), 4178 struct inet6_ifaddr, 4179 dad_work); 4180 struct inet6_dev *idev = ifp->idev; 4181 bool bump_id, disable_ipv6 = false; 4182 struct in6_addr mcaddr; 4183 struct net *net; 4184 4185 enum { 4186 DAD_PROCESS, 4187 DAD_BEGIN, 4188 DAD_ABORT, 4189 } action = DAD_PROCESS; 4190 4191 net = dev_net(idev->dev); 4192 4193 rtnl_net_lock(net); 4194 4195 spin_lock_bh(&ifp->lock); 4196 if (ifp->state == INET6_IFADDR_STATE_PREDAD) { 4197 action = DAD_BEGIN; 4198 ifp->state = INET6_IFADDR_STATE_DAD; 4199 } else if (ifp->state == INET6_IFADDR_STATE_ERRDAD) { 4200 action = DAD_ABORT; 4201 ifp->state = INET6_IFADDR_STATE_POSTDAD; 4202 4203 if ((READ_ONCE(net->ipv6.devconf_all->accept_dad) > 1 || 4204 READ_ONCE(idev->cnf.accept_dad) > 1) && 4205 !idev->cnf.disable_ipv6 && 4206 !(ifp->flags & IFA_F_STABLE_PRIVACY)) { 4207 struct in6_addr addr; 4208 4209 addr.s6_addr32[0] = htonl(0xfe800000); 4210 addr.s6_addr32[1] = 0; 4211 4212 if (!ipv6_generate_eui64(addr.s6_addr + 8, idev->dev) && 4213 ipv6_addr_equal(&ifp->addr, &addr)) { 4214 /* DAD failed for link-local based on MAC */ 4215 WRITE_ONCE(idev->cnf.disable_ipv6, 1); 4216 4217 pr_info("%s: IPv6 being disabled!\n", 4218 ifp->idev->dev->name); 4219 disable_ipv6 = true; 4220 } 4221 } 4222 } 4223 spin_unlock_bh(&ifp->lock); 4224 4225 if (action == DAD_BEGIN) { 4226 addrconf_dad_begin(ifp); 4227 goto out; 4228 } else if (action == DAD_ABORT) { 4229 in6_ifa_hold(ifp); 4230 addrconf_dad_stop(ifp, 1); 4231 if (disable_ipv6) 4232 addrconf_ifdown(idev->dev, false); 4233 goto out; 4234 } 4235 4236 if (!ifp->dad_probes && addrconf_dad_end(ifp)) 4237 goto out; 4238 4239 write_lock_bh(&idev->lock); 4240 if (idev->dead || !(idev->if_flags & IF_READY)) { 4241 write_unlock_bh(&idev->lock); 4242 goto out; 4243 } 4244 4245 spin_lock(&ifp->lock); 4246 if (ifp->state == INET6_IFADDR_STATE_DEAD) { 4247 spin_unlock(&ifp->lock); 4248 write_unlock_bh(&idev->lock); 4249 goto out; 4250 } 4251 4252 if (ifp->dad_probes == 0) { 4253 bool send_na = false; 4254 4255 /* 4256 * DAD was successful 4257 */ 4258 4259 if (ifp->flags & IFA_F_TENTATIVE && 4260 !(ifp->flags & IFA_F_OPTIMISTIC)) 4261 send_na = true; 4262 bump_id = ifp->flags & IFA_F_TENTATIVE; 4263 ifp->flags &= ~(IFA_F_TENTATIVE|IFA_F_OPTIMISTIC|IFA_F_DADFAILED); 4264 spin_unlock(&ifp->lock); 4265 write_unlock_bh(&idev->lock); 4266 4267 addrconf_dad_completed(ifp, bump_id, send_na); 4268 4269 goto out; 4270 } 4271 4272 ifp->dad_probes--; 4273 addrconf_mod_dad_work(ifp, 4274 max(NEIGH_VAR(ifp->idev->nd_parms, RETRANS_TIME), 4275 HZ/100)); 4276 spin_unlock(&ifp->lock); 4277 write_unlock_bh(&idev->lock); 4278 4279 /* send a neighbour solicitation for our addr */ 4280 addrconf_addr_solict_mult(&ifp->addr, &mcaddr); 4281 ndisc_send_ns(ifp->idev->dev, &ifp->addr, &mcaddr, &in6addr_any, 4282 ifp->dad_nonce); 4283 out: 4284 in6_ifa_put(ifp); 4285 rtnl_net_unlock(net); 4286 } 4287 4288 /* ifp->idev must be at least read locked */ 4289 static bool ipv6_lonely_lladdr(struct inet6_ifaddr *ifp) 4290 { 4291 struct inet6_ifaddr *ifpiter; 4292 struct inet6_dev *idev = ifp->idev; 4293 4294 list_for_each_entry_reverse(ifpiter, &idev->addr_list, if_list) { 4295 if (ifpiter->scope > IFA_LINK) 4296 break; 4297 if (ifp != ifpiter && ifpiter->scope == IFA_LINK && 4298 (ifpiter->flags & (IFA_F_PERMANENT|IFA_F_TENTATIVE| 4299 IFA_F_OPTIMISTIC|IFA_F_DADFAILED)) == 4300 IFA_F_PERMANENT) 4301 return false; 4302 } 4303 return true; 4304 } 4305 4306 static void addrconf_dad_completed(struct inet6_ifaddr *ifp, bool bump_id, 4307 bool send_na) 4308 { 4309 struct net_device *dev = ifp->idev->dev; 4310 struct in6_addr lladdr; 4311 bool send_rs, send_mld; 4312 4313 addrconf_del_dad_work(ifp); 4314 4315 /* 4316 * Configure the address for reception. Now it is valid. 4317 */ 4318 4319 ipv6_ifa_notify(RTM_NEWADDR, ifp); 4320 4321 /* If added prefix is link local and we are prepared to process 4322 router advertisements, start sending router solicitations. 4323 */ 4324 4325 read_lock_bh(&ifp->idev->lock); 4326 send_mld = ifp->scope == IFA_LINK && ipv6_lonely_lladdr(ifp); 4327 send_rs = send_mld && 4328 ipv6_accept_ra(ifp->idev) && 4329 READ_ONCE(ifp->idev->cnf.rtr_solicits) != 0 && 4330 (dev->flags & IFF_LOOPBACK) == 0 && 4331 (dev->type != ARPHRD_TUNNEL) && 4332 !netif_is_team_port(dev); 4333 read_unlock_bh(&ifp->idev->lock); 4334 4335 /* While dad is in progress mld report's source address is in6_addrany. 4336 * Resend with proper ll now. 4337 */ 4338 if (send_mld) 4339 ipv6_mc_dad_complete(ifp->idev); 4340 4341 /* send unsolicited NA if enabled */ 4342 if (send_na && 4343 (READ_ONCE(ifp->idev->cnf.ndisc_notify) || 4344 READ_ONCE(dev_net(dev)->ipv6.devconf_all->ndisc_notify))) { 4345 ndisc_send_na(dev, &in6addr_linklocal_allnodes, &ifp->addr, 4346 /*router=*/ !!ifp->idev->cnf.forwarding, 4347 /*solicited=*/ false, /*override=*/ true, 4348 /*inc_opt=*/ true); 4349 } 4350 4351 if (send_rs) { 4352 /* 4353 * If a host as already performed a random delay 4354 * [...] as part of DAD [...] there is no need 4355 * to delay again before sending the first RS 4356 */ 4357 if (ipv6_get_lladdr(dev, &lladdr, IFA_F_TENTATIVE)) 4358 return; 4359 ndisc_send_rs(dev, &lladdr, &in6addr_linklocal_allrouters); 4360 4361 write_lock_bh(&ifp->idev->lock); 4362 spin_lock(&ifp->lock); 4363 ifp->idev->rs_interval = rfc3315_s14_backoff_init( 4364 READ_ONCE(ifp->idev->cnf.rtr_solicit_interval)); 4365 ifp->idev->rs_probes = 1; 4366 ifp->idev->if_flags |= IF_RS_SENT; 4367 addrconf_mod_rs_timer(ifp->idev, ifp->idev->rs_interval); 4368 spin_unlock(&ifp->lock); 4369 write_unlock_bh(&ifp->idev->lock); 4370 } 4371 4372 if (bump_id) 4373 rt_genid_bump_ipv6(dev_net(dev)); 4374 4375 /* Make sure that a new temporary address will be created 4376 * before this temporary address becomes deprecated. 4377 */ 4378 if (ifp->flags & IFA_F_TEMPORARY) 4379 addrconf_verify_rtnl(dev_net(dev)); 4380 } 4381 4382 static void addrconf_dad_run(struct inet6_dev *idev, bool restart) 4383 { 4384 struct inet6_ifaddr *ifp; 4385 4386 read_lock_bh(&idev->lock); 4387 list_for_each_entry(ifp, &idev->addr_list, if_list) { 4388 spin_lock(&ifp->lock); 4389 if ((ifp->flags & IFA_F_TENTATIVE && 4390 ifp->state == INET6_IFADDR_STATE_DAD) || restart) { 4391 if (restart) 4392 ifp->state = INET6_IFADDR_STATE_PREDAD; 4393 addrconf_dad_kick(ifp); 4394 } 4395 spin_unlock(&ifp->lock); 4396 } 4397 read_unlock_bh(&idev->lock); 4398 } 4399 4400 #ifdef CONFIG_PROC_FS 4401 struct if6_iter_state { 4402 struct seq_net_private p; 4403 int bucket; 4404 int offset; 4405 }; 4406 4407 static struct inet6_ifaddr *if6_get_first(struct seq_file *seq, loff_t pos) 4408 { 4409 struct if6_iter_state *state = seq->private; 4410 struct net *net = seq_file_net(seq); 4411 struct inet6_ifaddr *ifa = NULL; 4412 int p = 0; 4413 4414 /* initial bucket if pos is 0 */ 4415 if (pos == 0) { 4416 state->bucket = 0; 4417 state->offset = 0; 4418 } 4419 4420 for (; state->bucket < IN6_ADDR_HSIZE; ++state->bucket) { 4421 hlist_for_each_entry_rcu(ifa, &net->ipv6.inet6_addr_lst[state->bucket], 4422 addr_lst) { 4423 /* sync with offset */ 4424 if (p < state->offset) { 4425 p++; 4426 continue; 4427 } 4428 return ifa; 4429 } 4430 4431 /* prepare for next bucket */ 4432 state->offset = 0; 4433 p = 0; 4434 } 4435 return NULL; 4436 } 4437 4438 static struct inet6_ifaddr *if6_get_next(struct seq_file *seq, 4439 struct inet6_ifaddr *ifa) 4440 { 4441 struct if6_iter_state *state = seq->private; 4442 struct net *net = seq_file_net(seq); 4443 4444 hlist_for_each_entry_continue_rcu(ifa, addr_lst) { 4445 state->offset++; 4446 return ifa; 4447 } 4448 4449 state->offset = 0; 4450 while (++state->bucket < IN6_ADDR_HSIZE) { 4451 hlist_for_each_entry_rcu(ifa, 4452 &net->ipv6.inet6_addr_lst[state->bucket], addr_lst) { 4453 return ifa; 4454 } 4455 } 4456 4457 return NULL; 4458 } 4459 4460 static void *if6_seq_start(struct seq_file *seq, loff_t *pos) 4461 __acquires(rcu) 4462 { 4463 rcu_read_lock(); 4464 return if6_get_first(seq, *pos); 4465 } 4466 4467 static void *if6_seq_next(struct seq_file *seq, void *v, loff_t *pos) 4468 { 4469 struct inet6_ifaddr *ifa; 4470 4471 ifa = if6_get_next(seq, v); 4472 ++*pos; 4473 return ifa; 4474 } 4475 4476 static void if6_seq_stop(struct seq_file *seq, void *v) 4477 __releases(rcu) 4478 { 4479 rcu_read_unlock(); 4480 } 4481 4482 static int if6_seq_show(struct seq_file *seq, void *v) 4483 { 4484 struct inet6_ifaddr *ifp = (struct inet6_ifaddr *)v; 4485 seq_printf(seq, "%pi6 %02x %02x %02x %02x %8s\n", 4486 &ifp->addr, 4487 ifp->idev->dev->ifindex, 4488 ifp->prefix_len, 4489 ifp->scope, 4490 (u8) ifp->flags, 4491 ifp->idev->dev->name); 4492 return 0; 4493 } 4494 4495 static const struct seq_operations if6_seq_ops = { 4496 .start = if6_seq_start, 4497 .next = if6_seq_next, 4498 .show = if6_seq_show, 4499 .stop = if6_seq_stop, 4500 }; 4501 4502 static int __net_init if6_proc_net_init(struct net *net) 4503 { 4504 if (!proc_create_net("if_inet6", 0444, net->proc_net, &if6_seq_ops, 4505 sizeof(struct if6_iter_state))) 4506 return -ENOMEM; 4507 return 0; 4508 } 4509 4510 static void __net_exit if6_proc_net_exit(struct net *net) 4511 { 4512 remove_proc_entry("if_inet6", net->proc_net); 4513 } 4514 4515 static struct pernet_operations if6_proc_net_ops = { 4516 .init = if6_proc_net_init, 4517 .exit = if6_proc_net_exit, 4518 }; 4519 4520 int __init if6_proc_init(void) 4521 { 4522 return register_pernet_subsys(&if6_proc_net_ops); 4523 } 4524 4525 void if6_proc_exit(void) 4526 { 4527 unregister_pernet_subsys(&if6_proc_net_ops); 4528 } 4529 #endif /* CONFIG_PROC_FS */ 4530 4531 #if IS_ENABLED(CONFIG_IPV6_MIP6) 4532 /* Check if address is a home address configured on any interface. */ 4533 int ipv6_chk_home_addr(struct net *net, const struct in6_addr *addr) 4534 { 4535 unsigned int hash = inet6_addr_hash(net, addr); 4536 struct inet6_ifaddr *ifp = NULL; 4537 int ret = 0; 4538 4539 rcu_read_lock(); 4540 hlist_for_each_entry_rcu(ifp, &net->ipv6.inet6_addr_lst[hash], addr_lst) { 4541 if (ipv6_addr_equal(&ifp->addr, addr) && 4542 (ifp->flags & IFA_F_HOMEADDRESS)) { 4543 ret = 1; 4544 break; 4545 } 4546 } 4547 rcu_read_unlock(); 4548 return ret; 4549 } 4550 #endif 4551 4552 /* RFC6554 has some algorithm to avoid loops in segment routing by 4553 * checking if the segments contains any of a local interface address. 4554 * 4555 * Quote: 4556 * 4557 * To detect loops in the SRH, a router MUST determine if the SRH 4558 * includes multiple addresses assigned to any interface on that router. 4559 * If such addresses appear more than once and are separated by at least 4560 * one address not assigned to that router. 4561 */ 4562 int ipv6_chk_rpl_srh_loop(struct net *net, const struct in6_addr *segs, 4563 unsigned char nsegs) 4564 { 4565 const struct in6_addr *addr; 4566 int i, ret = 0, found = 0; 4567 struct inet6_ifaddr *ifp; 4568 bool separated = false; 4569 unsigned int hash; 4570 bool hash_found; 4571 4572 rcu_read_lock(); 4573 for (i = 0; i < nsegs; i++) { 4574 addr = &segs[i]; 4575 hash = inet6_addr_hash(net, addr); 4576 4577 hash_found = false; 4578 hlist_for_each_entry_rcu(ifp, &net->ipv6.inet6_addr_lst[hash], addr_lst) { 4579 4580 if (ipv6_addr_equal(&ifp->addr, addr)) { 4581 hash_found = true; 4582 break; 4583 } 4584 } 4585 4586 if (hash_found) { 4587 if (found > 1 && separated) { 4588 ret = 1; 4589 break; 4590 } 4591 4592 separated = false; 4593 found++; 4594 } else { 4595 separated = true; 4596 } 4597 } 4598 rcu_read_unlock(); 4599 4600 return ret; 4601 } 4602 4603 /* 4604 * Periodic address status verification 4605 */ 4606 4607 static void addrconf_verify_rtnl(struct net *net) 4608 { 4609 unsigned long now, next, next_sec, next_sched; 4610 struct inet6_ifaddr *ifp; 4611 int i; 4612 4613 ASSERT_RTNL(); 4614 4615 rcu_read_lock_bh(); 4616 now = jiffies; 4617 next = round_jiffies_up(now + ADDR_CHECK_FREQUENCY); 4618 4619 cancel_delayed_work(&net->ipv6.addr_chk_work); 4620 4621 for (i = 0; i < IN6_ADDR_HSIZE; i++) { 4622 restart: 4623 hlist_for_each_entry_rcu_bh(ifp, &net->ipv6.inet6_addr_lst[i], addr_lst) { 4624 unsigned long age; 4625 4626 /* When setting preferred_lft to a value not zero or 4627 * infinity, while valid_lft is infinity 4628 * IFA_F_PERMANENT has a non-infinity life time. 4629 */ 4630 if ((ifp->flags & IFA_F_PERMANENT) && 4631 (ifp->prefered_lft == INFINITY_LIFE_TIME)) 4632 continue; 4633 4634 spin_lock(&ifp->lock); 4635 /* We try to batch several events at once. */ 4636 age = (now - ifp->tstamp + ADDRCONF_TIMER_FUZZ_MINUS) / HZ; 4637 4638 if ((ifp->flags&IFA_F_TEMPORARY) && 4639 !(ifp->flags&IFA_F_TENTATIVE) && 4640 ifp->prefered_lft != INFINITY_LIFE_TIME && 4641 !ifp->regen_count && ifp->ifpub) { 4642 /* This is a non-regenerated temporary addr. */ 4643 4644 unsigned long regen_advance = ipv6_get_regen_advance(ifp->idev); 4645 4646 if (age + regen_advance >= ifp->prefered_lft) { 4647 struct inet6_ifaddr *ifpub = ifp->ifpub; 4648 if (time_before(ifp->tstamp + ifp->prefered_lft * HZ, next)) 4649 next = ifp->tstamp + ifp->prefered_lft * HZ; 4650 4651 ifp->regen_count++; 4652 in6_ifa_hold(ifp); 4653 in6_ifa_hold(ifpub); 4654 spin_unlock(&ifp->lock); 4655 4656 spin_lock(&ifpub->lock); 4657 ifpub->regen_count = 0; 4658 spin_unlock(&ifpub->lock); 4659 rcu_read_unlock_bh(); 4660 ipv6_create_tempaddr(ifpub, true); 4661 in6_ifa_put(ifpub); 4662 in6_ifa_put(ifp); 4663 rcu_read_lock_bh(); 4664 goto restart; 4665 } else if (time_before(ifp->tstamp + ifp->prefered_lft * HZ - regen_advance * HZ, next)) 4666 next = ifp->tstamp + ifp->prefered_lft * HZ - regen_advance * HZ; 4667 } 4668 4669 if (ifp->valid_lft != INFINITY_LIFE_TIME && 4670 age >= ifp->valid_lft) { 4671 spin_unlock(&ifp->lock); 4672 in6_ifa_hold(ifp); 4673 rcu_read_unlock_bh(); 4674 ipv6_del_addr(ifp); 4675 rcu_read_lock_bh(); 4676 goto restart; 4677 } else if (ifp->prefered_lft == INFINITY_LIFE_TIME) { 4678 spin_unlock(&ifp->lock); 4679 continue; 4680 } else if (age >= ifp->prefered_lft) { 4681 /* jiffies - ifp->tstamp > age >= ifp->prefered_lft */ 4682 int deprecate = 0; 4683 4684 if (!(ifp->flags&IFA_F_DEPRECATED)) { 4685 deprecate = 1; 4686 ifp->flags |= IFA_F_DEPRECATED; 4687 } 4688 4689 if ((ifp->valid_lft != INFINITY_LIFE_TIME) && 4690 (time_before(ifp->tstamp + ifp->valid_lft * HZ, next))) 4691 next = ifp->tstamp + ifp->valid_lft * HZ; 4692 4693 spin_unlock(&ifp->lock); 4694 4695 if (deprecate) { 4696 in6_ifa_hold(ifp); 4697 4698 ipv6_ifa_notify(0, ifp); 4699 in6_ifa_put(ifp); 4700 goto restart; 4701 } 4702 } else { 4703 /* ifp->prefered_lft <= ifp->valid_lft */ 4704 if (time_before(ifp->tstamp + ifp->prefered_lft * HZ, next)) 4705 next = ifp->tstamp + ifp->prefered_lft * HZ; 4706 spin_unlock(&ifp->lock); 4707 } 4708 } 4709 } 4710 4711 next_sec = round_jiffies_up(next); 4712 next_sched = next; 4713 4714 /* If rounded timeout is accurate enough, accept it. */ 4715 if (time_before(next_sec, next + ADDRCONF_TIMER_FUZZ)) 4716 next_sched = next_sec; 4717 4718 /* And minimum interval is ADDRCONF_TIMER_FUZZ_MAX. */ 4719 if (time_before(next_sched, jiffies + ADDRCONF_TIMER_FUZZ_MAX)) 4720 next_sched = jiffies + ADDRCONF_TIMER_FUZZ_MAX; 4721 4722 pr_debug("now = %lu, schedule = %lu, rounded schedule = %lu => %lu\n", 4723 now, next, next_sec, next_sched); 4724 mod_delayed_work(addrconf_wq, &net->ipv6.addr_chk_work, next_sched - now); 4725 rcu_read_unlock_bh(); 4726 } 4727 4728 static void addrconf_verify_work(struct work_struct *w) 4729 { 4730 struct net *net = container_of(to_delayed_work(w), struct net, 4731 ipv6.addr_chk_work); 4732 4733 rtnl_net_lock(net); 4734 addrconf_verify_rtnl(net); 4735 rtnl_net_unlock(net); 4736 } 4737 4738 static void addrconf_verify(struct net *net) 4739 { 4740 mod_delayed_work(addrconf_wq, &net->ipv6.addr_chk_work, 0); 4741 } 4742 4743 static struct in6_addr *extract_addr(struct nlattr *addr, struct nlattr *local, 4744 struct in6_addr **peer_pfx) 4745 { 4746 struct in6_addr *pfx = NULL; 4747 4748 *peer_pfx = NULL; 4749 4750 if (addr) 4751 pfx = nla_data(addr); 4752 4753 if (local) { 4754 if (pfx && nla_memcmp(local, pfx, sizeof(*pfx))) 4755 *peer_pfx = pfx; 4756 pfx = nla_data(local); 4757 } 4758 4759 return pfx; 4760 } 4761 4762 static const struct nla_policy ifa_ipv6_policy[IFA_MAX+1] = { 4763 [IFA_ADDRESS] = { .len = sizeof(struct in6_addr) }, 4764 [IFA_LOCAL] = { .len = sizeof(struct in6_addr) }, 4765 [IFA_CACHEINFO] = { .len = sizeof(struct ifa_cacheinfo) }, 4766 [IFA_FLAGS] = { .len = sizeof(u32) }, 4767 [IFA_RT_PRIORITY] = { .len = sizeof(u32) }, 4768 [IFA_TARGET_NETNSID] = { .type = NLA_S32 }, 4769 [IFA_PROTO] = { .type = NLA_U8 }, 4770 }; 4771 4772 static int 4773 inet6_rtm_deladdr(struct sk_buff *skb, struct nlmsghdr *nlh, 4774 struct netlink_ext_ack *extack) 4775 { 4776 struct net *net = sock_net(skb->sk); 4777 struct ifaddrmsg *ifm; 4778 struct nlattr *tb[IFA_MAX+1]; 4779 struct in6_addr *pfx, *peer_pfx; 4780 u32 ifa_flags; 4781 int err; 4782 4783 err = nlmsg_parse_deprecated(nlh, sizeof(*ifm), tb, IFA_MAX, 4784 ifa_ipv6_policy, extack); 4785 if (err < 0) 4786 return err; 4787 4788 ifm = nlmsg_data(nlh); 4789 pfx = extract_addr(tb[IFA_ADDRESS], tb[IFA_LOCAL], &peer_pfx); 4790 if (!pfx) 4791 return -EINVAL; 4792 4793 ifa_flags = nla_get_u32_default(tb[IFA_FLAGS], ifm->ifa_flags); 4794 4795 /* We ignore other flags so far. */ 4796 ifa_flags &= IFA_F_MANAGETEMPADDR; 4797 4798 rtnl_net_lock(net); 4799 err = inet6_addr_del(net, ifm->ifa_index, ifa_flags, pfx, 4800 ifm->ifa_prefixlen, extack); 4801 rtnl_net_unlock(net); 4802 4803 return err; 4804 } 4805 4806 static int modify_prefix_route(struct net *net, struct inet6_ifaddr *ifp, 4807 unsigned long expires, u32 flags, 4808 bool modify_peer) 4809 { 4810 struct fib6_table *table; 4811 struct fib6_info *f6i; 4812 u32 prio; 4813 4814 f6i = addrconf_get_prefix_route(modify_peer ? &ifp->peer_addr : &ifp->addr, 4815 ifp->prefix_len, 4816 ifp->idev->dev, 0, RTF_DEFAULT, true); 4817 if (!f6i) 4818 return -ENOENT; 4819 4820 prio = ifp->rt_priority ? : IP6_RT_PRIO_ADDRCONF; 4821 if (f6i->fib6_metric != prio) { 4822 /* delete old one */ 4823 ip6_del_rt(dev_net(ifp->idev->dev), f6i, false); 4824 4825 /* add new one */ 4826 addrconf_prefix_route(modify_peer ? &ifp->peer_addr : &ifp->addr, 4827 ifp->prefix_len, 4828 ifp->rt_priority, ifp->idev->dev, 4829 expires, flags, GFP_KERNEL); 4830 return 0; 4831 } 4832 if (f6i != net->ipv6.fib6_null_entry) { 4833 table = f6i->fib6_table; 4834 spin_lock_bh(&table->tb6_lock); 4835 4836 if (!(flags & RTF_EXPIRES)) { 4837 fib6_clean_expires(f6i); 4838 fib6_remove_gc_list(f6i); 4839 } else { 4840 fib6_set_expires(f6i, expires); 4841 fib6_add_gc_list(f6i); 4842 } 4843 4844 spin_unlock_bh(&table->tb6_lock); 4845 } 4846 fib6_info_release(f6i); 4847 4848 return 0; 4849 } 4850 4851 static int inet6_addr_modify(struct net *net, struct inet6_ifaddr *ifp, 4852 struct ifa6_config *cfg, clock_t expires, 4853 u32 flags) 4854 { 4855 bool was_managetempaddr; 4856 bool new_peer = false; 4857 bool had_prefixroute; 4858 4859 ASSERT_RTNL_NET(net); 4860 4861 if (cfg->ifa_flags & IFA_F_MANAGETEMPADDR && 4862 (ifp->flags & IFA_F_TEMPORARY || ifp->prefix_len != 64)) 4863 return -EINVAL; 4864 4865 if (!(ifp->flags & IFA_F_TENTATIVE) || ifp->flags & IFA_F_DADFAILED) 4866 cfg->ifa_flags &= ~IFA_F_OPTIMISTIC; 4867 4868 if (cfg->peer_pfx && 4869 memcmp(&ifp->peer_addr, cfg->peer_pfx, sizeof(struct in6_addr))) { 4870 if (!ipv6_addr_any(&ifp->peer_addr)) 4871 cleanup_prefix_route(ifp, expires, true, true); 4872 new_peer = true; 4873 } 4874 4875 spin_lock_bh(&ifp->lock); 4876 was_managetempaddr = ifp->flags & IFA_F_MANAGETEMPADDR; 4877 had_prefixroute = ifp->flags & IFA_F_PERMANENT && 4878 !(ifp->flags & IFA_F_NOPREFIXROUTE); 4879 ifp->flags &= ~(IFA_F_DEPRECATED | IFA_F_PERMANENT | IFA_F_NODAD | 4880 IFA_F_HOMEADDRESS | IFA_F_MANAGETEMPADDR | 4881 IFA_F_NOPREFIXROUTE); 4882 ifp->flags |= cfg->ifa_flags; 4883 WRITE_ONCE(ifp->tstamp, jiffies); 4884 WRITE_ONCE(ifp->valid_lft, cfg->valid_lft); 4885 WRITE_ONCE(ifp->prefered_lft, cfg->preferred_lft); 4886 WRITE_ONCE(ifp->ifa_proto, cfg->ifa_proto); 4887 4888 if (cfg->rt_priority && cfg->rt_priority != ifp->rt_priority) 4889 WRITE_ONCE(ifp->rt_priority, cfg->rt_priority); 4890 4891 if (new_peer) 4892 ifp->peer_addr = *cfg->peer_pfx; 4893 4894 spin_unlock_bh(&ifp->lock); 4895 if (!(ifp->flags&IFA_F_TENTATIVE)) 4896 ipv6_ifa_notify(0, ifp); 4897 4898 if (!(cfg->ifa_flags & IFA_F_NOPREFIXROUTE)) { 4899 int rc = -ENOENT; 4900 4901 if (had_prefixroute) 4902 rc = modify_prefix_route(net, ifp, expires, flags, false); 4903 4904 /* prefix route could have been deleted; if so restore it */ 4905 if (rc == -ENOENT) { 4906 addrconf_prefix_route(&ifp->addr, ifp->prefix_len, 4907 ifp->rt_priority, ifp->idev->dev, 4908 expires, flags, GFP_KERNEL); 4909 } 4910 4911 if (had_prefixroute && !ipv6_addr_any(&ifp->peer_addr)) 4912 rc = modify_prefix_route(net, ifp, expires, flags, true); 4913 4914 if (rc == -ENOENT && !ipv6_addr_any(&ifp->peer_addr)) { 4915 addrconf_prefix_route(&ifp->peer_addr, ifp->prefix_len, 4916 ifp->rt_priority, ifp->idev->dev, 4917 expires, flags, GFP_KERNEL); 4918 } 4919 } else if (had_prefixroute) { 4920 enum cleanup_prefix_rt_t action; 4921 unsigned long rt_expires; 4922 4923 write_lock_bh(&ifp->idev->lock); 4924 action = check_cleanup_prefix_route(ifp, &rt_expires); 4925 write_unlock_bh(&ifp->idev->lock); 4926 4927 if (action != CLEANUP_PREFIX_RT_NOP) { 4928 cleanup_prefix_route(ifp, rt_expires, 4929 action == CLEANUP_PREFIX_RT_DEL, false); 4930 } 4931 } 4932 4933 if (was_managetempaddr || ifp->flags & IFA_F_MANAGETEMPADDR) { 4934 if (was_managetempaddr && !(ifp->flags & IFA_F_MANAGETEMPADDR)) 4935 delete_tempaddrs(ifp->idev, ifp); 4936 else 4937 manage_tempaddrs(ifp->idev, ifp, cfg->valid_lft, 4938 cfg->preferred_lft, !was_managetempaddr, 4939 jiffies); 4940 } 4941 4942 addrconf_verify_rtnl(net); 4943 4944 return 0; 4945 } 4946 4947 static int 4948 inet6_rtm_newaddr(struct sk_buff *skb, struct nlmsghdr *nlh, 4949 struct netlink_ext_ack *extack) 4950 { 4951 struct net *net = sock_net(skb->sk); 4952 struct nlattr *tb[IFA_MAX+1]; 4953 struct in6_addr *peer_pfx; 4954 struct inet6_ifaddr *ifa; 4955 struct net_device *dev; 4956 struct inet6_dev *idev; 4957 struct ifa6_config cfg; 4958 struct ifaddrmsg *ifm; 4959 unsigned long timeout; 4960 clock_t expires; 4961 u32 flags; 4962 int err; 4963 4964 err = nlmsg_parse_deprecated(nlh, sizeof(*ifm), tb, IFA_MAX, 4965 ifa_ipv6_policy, extack); 4966 if (err < 0) 4967 return err; 4968 4969 memset(&cfg, 0, sizeof(cfg)); 4970 4971 ifm = nlmsg_data(nlh); 4972 cfg.pfx = extract_addr(tb[IFA_ADDRESS], tb[IFA_LOCAL], &peer_pfx); 4973 if (!cfg.pfx) 4974 return -EINVAL; 4975 4976 cfg.peer_pfx = peer_pfx; 4977 cfg.plen = ifm->ifa_prefixlen; 4978 if (tb[IFA_RT_PRIORITY]) 4979 cfg.rt_priority = nla_get_u32(tb[IFA_RT_PRIORITY]); 4980 4981 if (tb[IFA_PROTO]) 4982 cfg.ifa_proto = nla_get_u8(tb[IFA_PROTO]); 4983 4984 cfg.ifa_flags = nla_get_u32_default(tb[IFA_FLAGS], ifm->ifa_flags); 4985 4986 /* We ignore other flags so far. */ 4987 cfg.ifa_flags &= IFA_F_NODAD | IFA_F_HOMEADDRESS | 4988 IFA_F_MANAGETEMPADDR | IFA_F_NOPREFIXROUTE | 4989 IFA_F_MCAUTOJOIN | IFA_F_OPTIMISTIC; 4990 4991 cfg.ifa_flags |= IFA_F_PERMANENT; 4992 cfg.valid_lft = INFINITY_LIFE_TIME; 4993 cfg.preferred_lft = INFINITY_LIFE_TIME; 4994 expires = 0; 4995 flags = 0; 4996 4997 if (tb[IFA_CACHEINFO]) { 4998 struct ifa_cacheinfo *ci; 4999 5000 ci = nla_data(tb[IFA_CACHEINFO]); 5001 cfg.valid_lft = ci->ifa_valid; 5002 cfg.preferred_lft = ci->ifa_prefered; 5003 5004 if (!cfg.valid_lft || cfg.preferred_lft > cfg.valid_lft) { 5005 NL_SET_ERR_MSG_MOD(extack, "address lifetime invalid"); 5006 return -EINVAL; 5007 } 5008 5009 timeout = addrconf_timeout_fixup(cfg.valid_lft, HZ); 5010 if (addrconf_finite_timeout(timeout)) { 5011 cfg.ifa_flags &= ~IFA_F_PERMANENT; 5012 cfg.valid_lft = timeout; 5013 expires = jiffies_to_clock_t(timeout * HZ); 5014 flags = RTF_EXPIRES; 5015 } 5016 5017 timeout = addrconf_timeout_fixup(cfg.preferred_lft, HZ); 5018 if (addrconf_finite_timeout(timeout)) { 5019 if (timeout == 0) 5020 cfg.ifa_flags |= IFA_F_DEPRECATED; 5021 5022 cfg.preferred_lft = timeout; 5023 } 5024 } 5025 5026 rtnl_net_lock(net); 5027 5028 dev = __dev_get_by_index(net, ifm->ifa_index); 5029 if (!dev) { 5030 NL_SET_ERR_MSG_MOD(extack, "Unable to find the interface"); 5031 err = -ENODEV; 5032 goto unlock_rtnl; 5033 } 5034 5035 netdev_lock_ops(dev); 5036 idev = ipv6_find_idev(dev); 5037 if (IS_ERR(idev)) { 5038 err = PTR_ERR(idev); 5039 goto unlock; 5040 } 5041 5042 if (!ipv6_allow_optimistic_dad(net, idev)) 5043 cfg.ifa_flags &= ~IFA_F_OPTIMISTIC; 5044 5045 if (cfg.ifa_flags & IFA_F_NODAD && 5046 cfg.ifa_flags & IFA_F_OPTIMISTIC) { 5047 NL_SET_ERR_MSG(extack, "IFA_F_NODAD and IFA_F_OPTIMISTIC are mutually exclusive"); 5048 err = -EINVAL; 5049 goto unlock; 5050 } 5051 5052 ifa = ipv6_get_ifaddr(net, cfg.pfx, dev, 1); 5053 if (!ifa) { 5054 /* 5055 * It would be best to check for !NLM_F_CREATE here but 5056 * userspace already relies on not having to provide this. 5057 */ 5058 err = inet6_addr_add(net, dev, &cfg, expires, flags, extack); 5059 goto unlock; 5060 } 5061 5062 if (nlh->nlmsg_flags & NLM_F_EXCL || 5063 !(nlh->nlmsg_flags & NLM_F_REPLACE)) { 5064 NL_SET_ERR_MSG_MOD(extack, "address already assigned"); 5065 err = -EEXIST; 5066 } else { 5067 err = inet6_addr_modify(net, ifa, &cfg, expires, flags); 5068 } 5069 5070 in6_ifa_put(ifa); 5071 unlock: 5072 netdev_unlock_ops(dev); 5073 unlock_rtnl: 5074 rtnl_net_unlock(net); 5075 5076 return err; 5077 } 5078 5079 static void put_ifaddrmsg(struct nlmsghdr *nlh, u8 prefixlen, u32 flags, 5080 u8 scope, int ifindex) 5081 { 5082 struct ifaddrmsg *ifm; 5083 5084 ifm = nlmsg_data(nlh); 5085 ifm->ifa_family = AF_INET6; 5086 ifm->ifa_prefixlen = prefixlen; 5087 ifm->ifa_flags = flags; 5088 ifm->ifa_scope = scope; 5089 ifm->ifa_index = ifindex; 5090 } 5091 5092 static int put_cacheinfo(struct sk_buff *skb, unsigned long cstamp, 5093 unsigned long tstamp, u32 preferred, u32 valid) 5094 { 5095 struct ifa_cacheinfo ci; 5096 5097 ci.cstamp = cstamp_delta(cstamp); 5098 ci.tstamp = cstamp_delta(tstamp); 5099 ci.ifa_prefered = preferred; 5100 ci.ifa_valid = valid; 5101 5102 return nla_put(skb, IFA_CACHEINFO, sizeof(ci), &ci); 5103 } 5104 5105 static inline int rt_scope(int ifa_scope) 5106 { 5107 if (ifa_scope & IFA_HOST) 5108 return RT_SCOPE_HOST; 5109 else if (ifa_scope & IFA_LINK) 5110 return RT_SCOPE_LINK; 5111 else if (ifa_scope & IFA_SITE) 5112 return RT_SCOPE_SITE; 5113 else 5114 return RT_SCOPE_UNIVERSE; 5115 } 5116 5117 static inline int inet6_ifaddr_msgsize(void) 5118 { 5119 return NLMSG_ALIGN(sizeof(struct ifaddrmsg)) 5120 + nla_total_size(16) /* IFA_LOCAL */ 5121 + nla_total_size(16) /* IFA_ADDRESS */ 5122 + nla_total_size(sizeof(struct ifa_cacheinfo)) 5123 + nla_total_size(4) /* IFA_FLAGS */ 5124 + nla_total_size(1) /* IFA_PROTO */ 5125 + nla_total_size(4) /* IFA_RT_PRIORITY */; 5126 } 5127 5128 static int inet6_fill_ifaddr(struct sk_buff *skb, 5129 const struct inet6_ifaddr *ifa, 5130 struct inet6_fill_args *args) 5131 { 5132 struct nlmsghdr *nlh; 5133 u32 preferred, valid; 5134 u32 flags, priority; 5135 u8 proto; 5136 5137 nlh = nlmsg_put(skb, args->portid, args->seq, args->event, 5138 sizeof(struct ifaddrmsg), args->flags); 5139 if (!nlh) 5140 return -EMSGSIZE; 5141 5142 flags = READ_ONCE(ifa->flags); 5143 put_ifaddrmsg(nlh, ifa->prefix_len, ifa->flags, rt_scope(ifa->scope), 5144 ifa->idev->dev->ifindex); 5145 5146 if (args->netnsid >= 0 && 5147 nla_put_s32(skb, IFA_TARGET_NETNSID, args->netnsid)) 5148 goto error; 5149 5150 preferred = READ_ONCE(ifa->prefered_lft); 5151 valid = READ_ONCE(ifa->valid_lft); 5152 5153 if (!((flags & IFA_F_PERMANENT) && 5154 (preferred == INFINITY_LIFE_TIME))) { 5155 if (preferred != INFINITY_LIFE_TIME) { 5156 long tval = (jiffies - READ_ONCE(ifa->tstamp)) / HZ; 5157 5158 if (preferred > tval) 5159 preferred -= tval; 5160 else 5161 preferred = 0; 5162 if (valid != INFINITY_LIFE_TIME) { 5163 if (valid > tval) 5164 valid -= tval; 5165 else 5166 valid = 0; 5167 } 5168 } 5169 } else { 5170 preferred = INFINITY_LIFE_TIME; 5171 valid = INFINITY_LIFE_TIME; 5172 } 5173 5174 if (!ipv6_addr_any(&ifa->peer_addr)) { 5175 if (nla_put_in6_addr(skb, IFA_LOCAL, &ifa->addr) < 0 || 5176 nla_put_in6_addr(skb, IFA_ADDRESS, &ifa->peer_addr) < 0) 5177 goto error; 5178 } else { 5179 if (nla_put_in6_addr(skb, IFA_ADDRESS, &ifa->addr) < 0) 5180 goto error; 5181 } 5182 5183 priority = READ_ONCE(ifa->rt_priority); 5184 if (priority && nla_put_u32(skb, IFA_RT_PRIORITY, priority)) 5185 goto error; 5186 5187 if (put_cacheinfo(skb, ifa->cstamp, READ_ONCE(ifa->tstamp), 5188 preferred, valid) < 0) 5189 goto error; 5190 5191 if (nla_put_u32(skb, IFA_FLAGS, flags) < 0) 5192 goto error; 5193 5194 proto = READ_ONCE(ifa->ifa_proto); 5195 if (proto && nla_put_u8(skb, IFA_PROTO, proto)) 5196 goto error; 5197 5198 nlmsg_end(skb, nlh); 5199 return 0; 5200 5201 error: 5202 nlmsg_cancel(skb, nlh); 5203 return -EMSGSIZE; 5204 } 5205 5206 int inet6_fill_ifmcaddr(struct sk_buff *skb, 5207 const struct ifmcaddr6 *ifmca, 5208 struct inet6_fill_args *args) 5209 { 5210 int ifindex = ifmca->idev->dev->ifindex; 5211 u8 scope = RT_SCOPE_UNIVERSE; 5212 struct nlmsghdr *nlh; 5213 5214 if (!args->force_rt_scope_universe && 5215 ipv6_addr_scope(&ifmca->mca_addr) & IFA_SITE) 5216 scope = RT_SCOPE_SITE; 5217 5218 nlh = nlmsg_put(skb, args->portid, args->seq, args->event, 5219 sizeof(struct ifaddrmsg), args->flags); 5220 if (!nlh) 5221 return -EMSGSIZE; 5222 5223 if (args->netnsid >= 0 && 5224 nla_put_s32(skb, IFA_TARGET_NETNSID, args->netnsid)) { 5225 nlmsg_cancel(skb, nlh); 5226 return -EMSGSIZE; 5227 } 5228 5229 put_ifaddrmsg(nlh, 128, IFA_F_PERMANENT, scope, ifindex); 5230 if (nla_put_in6_addr(skb, IFA_MULTICAST, &ifmca->mca_addr) < 0 || 5231 put_cacheinfo(skb, ifmca->mca_cstamp, READ_ONCE(ifmca->mca_tstamp), 5232 INFINITY_LIFE_TIME, INFINITY_LIFE_TIME) < 0) { 5233 nlmsg_cancel(skb, nlh); 5234 return -EMSGSIZE; 5235 } 5236 5237 nlmsg_end(skb, nlh); 5238 return 0; 5239 } 5240 5241 int inet6_fill_ifacaddr(struct sk_buff *skb, 5242 const struct ifacaddr6 *ifaca, 5243 struct inet6_fill_args *args) 5244 { 5245 struct net_device *dev = fib6_info_nh_dev(ifaca->aca_rt); 5246 int ifindex = dev ? dev->ifindex : 1; 5247 u8 scope = RT_SCOPE_UNIVERSE; 5248 struct nlmsghdr *nlh; 5249 5250 if (ipv6_addr_scope(&ifaca->aca_addr) & IFA_SITE) 5251 scope = RT_SCOPE_SITE; 5252 5253 nlh = nlmsg_put(skb, args->portid, args->seq, args->event, 5254 sizeof(struct ifaddrmsg), args->flags); 5255 if (!nlh) 5256 return -EMSGSIZE; 5257 5258 if (args->netnsid >= 0 && 5259 nla_put_s32(skb, IFA_TARGET_NETNSID, args->netnsid)) { 5260 nlmsg_cancel(skb, nlh); 5261 return -EMSGSIZE; 5262 } 5263 5264 put_ifaddrmsg(nlh, 128, IFA_F_PERMANENT, scope, ifindex); 5265 if (nla_put_in6_addr(skb, IFA_ANYCAST, &ifaca->aca_addr) < 0 || 5266 put_cacheinfo(skb, ifaca->aca_cstamp, READ_ONCE(ifaca->aca_tstamp), 5267 INFINITY_LIFE_TIME, INFINITY_LIFE_TIME) < 0) { 5268 nlmsg_cancel(skb, nlh); 5269 return -EMSGSIZE; 5270 } 5271 5272 nlmsg_end(skb, nlh); 5273 return 0; 5274 } 5275 5276 /* called with rcu_read_lock() */ 5277 static int in6_dump_addrs(const struct inet6_dev *idev, struct sk_buff *skb, 5278 struct netlink_callback *cb, int *s_ip_idx, 5279 struct inet6_fill_args *fillargs) 5280 { 5281 const struct ifmcaddr6 *ifmca; 5282 const struct ifacaddr6 *ifaca; 5283 int ip_idx = 0; 5284 int err = 0; 5285 5286 switch (fillargs->type) { 5287 case UNICAST_ADDR: { 5288 const struct inet6_ifaddr *ifa; 5289 fillargs->event = RTM_NEWADDR; 5290 5291 /* unicast address incl. temp addr */ 5292 list_for_each_entry_rcu(ifa, &idev->addr_list, if_list) { 5293 if (ip_idx < *s_ip_idx) 5294 goto next; 5295 err = inet6_fill_ifaddr(skb, ifa, fillargs); 5296 if (err < 0) 5297 break; 5298 nl_dump_check_consistent(cb, nlmsg_hdr(skb)); 5299 next: 5300 ip_idx++; 5301 } 5302 break; 5303 } 5304 case MULTICAST_ADDR: 5305 fillargs->event = RTM_GETMULTICAST; 5306 5307 /* multicast address */ 5308 for (ifmca = rcu_dereference(idev->mc_list); 5309 ifmca; 5310 ifmca = rcu_dereference(ifmca->next), ip_idx++) { 5311 if (ip_idx < *s_ip_idx) 5312 continue; 5313 err = inet6_fill_ifmcaddr(skb, ifmca, fillargs); 5314 if (err < 0) 5315 break; 5316 } 5317 break; 5318 case ANYCAST_ADDR: 5319 fillargs->event = RTM_GETANYCAST; 5320 /* anycast address */ 5321 for (ifaca = rcu_dereference(idev->ac_list); ifaca; 5322 ifaca = rcu_dereference(ifaca->aca_next), ip_idx++) { 5323 if (ip_idx < *s_ip_idx) 5324 continue; 5325 err = inet6_fill_ifacaddr(skb, ifaca, fillargs); 5326 if (err < 0) 5327 break; 5328 } 5329 break; 5330 default: 5331 break; 5332 } 5333 *s_ip_idx = err ? ip_idx : 0; 5334 return err; 5335 } 5336 5337 static int inet6_valid_dump_ifaddr_req(const struct nlmsghdr *nlh, 5338 struct inet6_fill_args *fillargs, 5339 struct net **tgt_net, struct sock *sk, 5340 struct netlink_callback *cb) 5341 { 5342 struct netlink_ext_ack *extack = cb->extack; 5343 struct nlattr *tb[IFA_MAX+1]; 5344 struct ifaddrmsg *ifm; 5345 int err, i; 5346 5347 ifm = nlmsg_payload(nlh, sizeof(*ifm)); 5348 if (!ifm) { 5349 NL_SET_ERR_MSG_MOD(extack, "Invalid header for address dump request"); 5350 return -EINVAL; 5351 } 5352 5353 if (ifm->ifa_prefixlen || ifm->ifa_flags || ifm->ifa_scope) { 5354 NL_SET_ERR_MSG_MOD(extack, "Invalid values in header for address dump request"); 5355 return -EINVAL; 5356 } 5357 5358 fillargs->ifindex = ifm->ifa_index; 5359 if (fillargs->ifindex) { 5360 cb->answer_flags |= NLM_F_DUMP_FILTERED; 5361 fillargs->flags |= NLM_F_DUMP_FILTERED; 5362 } 5363 5364 err = nlmsg_parse_deprecated_strict(nlh, sizeof(*ifm), tb, IFA_MAX, 5365 ifa_ipv6_policy, extack); 5366 if (err < 0) 5367 return err; 5368 5369 for (i = 0; i <= IFA_MAX; ++i) { 5370 if (!tb[i]) 5371 continue; 5372 5373 if (i == IFA_TARGET_NETNSID) { 5374 struct net *net; 5375 5376 fillargs->netnsid = nla_get_s32(tb[i]); 5377 net = rtnl_get_net_ns_capable(sk, fillargs->netnsid); 5378 if (IS_ERR(net)) { 5379 fillargs->netnsid = -1; 5380 NL_SET_ERR_MSG_MOD(extack, "Invalid target network namespace id"); 5381 return PTR_ERR(net); 5382 } 5383 *tgt_net = net; 5384 } else { 5385 NL_SET_ERR_MSG_MOD(extack, "Unsupported attribute in dump request"); 5386 return -EINVAL; 5387 } 5388 } 5389 5390 return 0; 5391 } 5392 5393 static int inet6_dump_addr(struct sk_buff *skb, struct netlink_callback *cb, 5394 enum addr_type_t type) 5395 { 5396 struct net *tgt_net = sock_net(skb->sk); 5397 const struct nlmsghdr *nlh = cb->nlh; 5398 struct inet6_fill_args fillargs = { 5399 .portid = NETLINK_CB(cb->skb).portid, 5400 .seq = cb->nlh->nlmsg_seq, 5401 .flags = NLM_F_MULTI, 5402 .netnsid = -1, 5403 .type = type, 5404 .force_rt_scope_universe = false, 5405 }; 5406 struct { 5407 unsigned long ifindex; 5408 int ip_idx; 5409 } *ctx = (void *)cb->ctx; 5410 struct net_device *dev; 5411 struct inet6_dev *idev; 5412 int err = 0; 5413 5414 rcu_read_lock(); 5415 if (cb->strict_check) { 5416 err = inet6_valid_dump_ifaddr_req(nlh, &fillargs, &tgt_net, 5417 skb->sk, cb); 5418 if (err < 0) 5419 goto done; 5420 5421 err = 0; 5422 if (fillargs.ifindex) { 5423 dev = dev_get_by_index_rcu(tgt_net, fillargs.ifindex); 5424 if (!dev) { 5425 err = -ENODEV; 5426 goto done; 5427 } 5428 idev = __in6_dev_get(dev); 5429 if (idev) 5430 err = in6_dump_addrs(idev, skb, cb, 5431 &ctx->ip_idx, 5432 &fillargs); 5433 goto done; 5434 } 5435 } 5436 5437 cb->seq = inet6_base_seq(tgt_net); 5438 for_each_netdev_dump(tgt_net, dev, ctx->ifindex) { 5439 idev = __in6_dev_get(dev); 5440 if (!idev) 5441 continue; 5442 err = in6_dump_addrs(idev, skb, cb, &ctx->ip_idx, 5443 &fillargs); 5444 if (err < 0) 5445 goto done; 5446 } 5447 done: 5448 rcu_read_unlock(); 5449 if (fillargs.netnsid >= 0) 5450 put_net(tgt_net); 5451 5452 return err; 5453 } 5454 5455 static int inet6_dump_ifaddr(struct sk_buff *skb, struct netlink_callback *cb) 5456 { 5457 enum addr_type_t type = UNICAST_ADDR; 5458 5459 return inet6_dump_addr(skb, cb, type); 5460 } 5461 5462 static int inet6_dump_ifmcaddr(struct sk_buff *skb, struct netlink_callback *cb) 5463 { 5464 enum addr_type_t type = MULTICAST_ADDR; 5465 5466 return inet6_dump_addr(skb, cb, type); 5467 } 5468 5469 5470 static int inet6_dump_ifacaddr(struct sk_buff *skb, struct netlink_callback *cb) 5471 { 5472 enum addr_type_t type = ANYCAST_ADDR; 5473 5474 return inet6_dump_addr(skb, cb, type); 5475 } 5476 5477 static int inet6_rtm_valid_getaddr_req(struct sk_buff *skb, 5478 const struct nlmsghdr *nlh, 5479 struct nlattr **tb, 5480 struct netlink_ext_ack *extack) 5481 { 5482 struct ifaddrmsg *ifm; 5483 int i, err; 5484 5485 ifm = nlmsg_payload(nlh, sizeof(*ifm)); 5486 if (!ifm) { 5487 NL_SET_ERR_MSG_MOD(extack, "Invalid header for get address request"); 5488 return -EINVAL; 5489 } 5490 5491 if (!netlink_strict_get_check(skb)) 5492 return nlmsg_parse_deprecated(nlh, sizeof(*ifm), tb, IFA_MAX, 5493 ifa_ipv6_policy, extack); 5494 5495 if (ifm->ifa_prefixlen || ifm->ifa_flags || ifm->ifa_scope) { 5496 NL_SET_ERR_MSG_MOD(extack, "Invalid values in header for get address request"); 5497 return -EINVAL; 5498 } 5499 5500 err = nlmsg_parse_deprecated_strict(nlh, sizeof(*ifm), tb, IFA_MAX, 5501 ifa_ipv6_policy, extack); 5502 if (err) 5503 return err; 5504 5505 for (i = 0; i <= IFA_MAX; i++) { 5506 if (!tb[i]) 5507 continue; 5508 5509 switch (i) { 5510 case IFA_TARGET_NETNSID: 5511 case IFA_ADDRESS: 5512 case IFA_LOCAL: 5513 break; 5514 default: 5515 NL_SET_ERR_MSG_MOD(extack, "Unsupported attribute in get address request"); 5516 return -EINVAL; 5517 } 5518 } 5519 5520 return 0; 5521 } 5522 5523 static int inet6_rtm_getaddr(struct sk_buff *in_skb, struct nlmsghdr *nlh, 5524 struct netlink_ext_ack *extack) 5525 { 5526 struct net *tgt_net = sock_net(in_skb->sk); 5527 struct inet6_fill_args fillargs = { 5528 .portid = NETLINK_CB(in_skb).portid, 5529 .seq = nlh->nlmsg_seq, 5530 .event = RTM_NEWADDR, 5531 .flags = 0, 5532 .netnsid = -1, 5533 .force_rt_scope_universe = false, 5534 }; 5535 struct ifaddrmsg *ifm; 5536 struct nlattr *tb[IFA_MAX+1]; 5537 struct in6_addr *addr = NULL, *peer; 5538 struct net_device *dev = NULL; 5539 struct inet6_ifaddr *ifa; 5540 struct sk_buff *skb; 5541 int err; 5542 5543 err = inet6_rtm_valid_getaddr_req(in_skb, nlh, tb, extack); 5544 if (err < 0) 5545 return err; 5546 5547 if (tb[IFA_TARGET_NETNSID]) { 5548 fillargs.netnsid = nla_get_s32(tb[IFA_TARGET_NETNSID]); 5549 5550 tgt_net = rtnl_get_net_ns_capable(NETLINK_CB(in_skb).sk, 5551 fillargs.netnsid); 5552 if (IS_ERR(tgt_net)) 5553 return PTR_ERR(tgt_net); 5554 } 5555 5556 addr = extract_addr(tb[IFA_ADDRESS], tb[IFA_LOCAL], &peer); 5557 if (!addr) { 5558 err = -EINVAL; 5559 goto errout; 5560 } 5561 ifm = nlmsg_data(nlh); 5562 if (ifm->ifa_index) 5563 dev = dev_get_by_index(tgt_net, ifm->ifa_index); 5564 5565 ifa = ipv6_get_ifaddr(tgt_net, addr, dev, 1); 5566 if (!ifa) { 5567 err = -EADDRNOTAVAIL; 5568 goto errout; 5569 } 5570 5571 skb = nlmsg_new(inet6_ifaddr_msgsize(), GFP_KERNEL); 5572 if (!skb) { 5573 err = -ENOBUFS; 5574 goto errout_ifa; 5575 } 5576 5577 err = inet6_fill_ifaddr(skb, ifa, &fillargs); 5578 if (err < 0) { 5579 /* -EMSGSIZE implies BUG in inet6_ifaddr_msgsize() */ 5580 WARN_ON(err == -EMSGSIZE); 5581 kfree_skb(skb); 5582 goto errout_ifa; 5583 } 5584 err = rtnl_unicast(skb, tgt_net, NETLINK_CB(in_skb).portid); 5585 errout_ifa: 5586 in6_ifa_put(ifa); 5587 errout: 5588 dev_put(dev); 5589 if (fillargs.netnsid >= 0) 5590 put_net(tgt_net); 5591 5592 return err; 5593 } 5594 5595 static void inet6_ifa_notify(int event, struct inet6_ifaddr *ifa) 5596 { 5597 struct sk_buff *skb; 5598 struct net *net = dev_net(ifa->idev->dev); 5599 struct inet6_fill_args fillargs = { 5600 .portid = 0, 5601 .seq = 0, 5602 .event = event, 5603 .flags = 0, 5604 .netnsid = -1, 5605 .force_rt_scope_universe = false, 5606 }; 5607 int err = -ENOBUFS; 5608 5609 skb = nlmsg_new(inet6_ifaddr_msgsize(), GFP_ATOMIC); 5610 if (!skb) 5611 goto errout; 5612 5613 err = inet6_fill_ifaddr(skb, ifa, &fillargs); 5614 if (err < 0) { 5615 /* -EMSGSIZE implies BUG in inet6_ifaddr_msgsize() */ 5616 WARN_ON(err == -EMSGSIZE); 5617 kfree_skb(skb); 5618 goto errout; 5619 } 5620 rtnl_notify(skb, net, 0, RTNLGRP_IPV6_IFADDR, NULL, GFP_ATOMIC); 5621 return; 5622 errout: 5623 rtnl_set_sk_err(net, RTNLGRP_IPV6_IFADDR, err); 5624 } 5625 5626 static void ipv6_store_devconf(const struct ipv6_devconf *cnf, 5627 __s32 *array, int bytes) 5628 { 5629 BUG_ON(bytes < (DEVCONF_MAX * 4)); 5630 5631 memset(array, 0, bytes); 5632 array[DEVCONF_FORWARDING] = READ_ONCE(cnf->forwarding); 5633 array[DEVCONF_HOPLIMIT] = READ_ONCE(cnf->hop_limit); 5634 array[DEVCONF_MTU6] = READ_ONCE(cnf->mtu6); 5635 array[DEVCONF_ACCEPT_RA] = READ_ONCE(cnf->accept_ra); 5636 array[DEVCONF_ACCEPT_REDIRECTS] = READ_ONCE(cnf->accept_redirects); 5637 array[DEVCONF_AUTOCONF] = READ_ONCE(cnf->autoconf); 5638 array[DEVCONF_DAD_TRANSMITS] = READ_ONCE(cnf->dad_transmits); 5639 array[DEVCONF_RTR_SOLICITS] = READ_ONCE(cnf->rtr_solicits); 5640 array[DEVCONF_RTR_SOLICIT_INTERVAL] = 5641 jiffies_to_msecs(READ_ONCE(cnf->rtr_solicit_interval)); 5642 array[DEVCONF_RTR_SOLICIT_MAX_INTERVAL] = 5643 jiffies_to_msecs(READ_ONCE(cnf->rtr_solicit_max_interval)); 5644 array[DEVCONF_RTR_SOLICIT_DELAY] = 5645 jiffies_to_msecs(READ_ONCE(cnf->rtr_solicit_delay)); 5646 array[DEVCONF_FORCE_MLD_VERSION] = READ_ONCE(cnf->force_mld_version); 5647 array[DEVCONF_MLDV1_UNSOLICITED_REPORT_INTERVAL] = 5648 jiffies_to_msecs(READ_ONCE(cnf->mldv1_unsolicited_report_interval)); 5649 array[DEVCONF_MLDV2_UNSOLICITED_REPORT_INTERVAL] = 5650 jiffies_to_msecs(READ_ONCE(cnf->mldv2_unsolicited_report_interval)); 5651 array[DEVCONF_USE_TEMPADDR] = READ_ONCE(cnf->use_tempaddr); 5652 array[DEVCONF_TEMP_VALID_LFT] = READ_ONCE(cnf->temp_valid_lft); 5653 array[DEVCONF_TEMP_PREFERED_LFT] = READ_ONCE(cnf->temp_prefered_lft); 5654 array[DEVCONF_REGEN_MAX_RETRY] = READ_ONCE(cnf->regen_max_retry); 5655 array[DEVCONF_MAX_DESYNC_FACTOR] = READ_ONCE(cnf->max_desync_factor); 5656 array[DEVCONF_MAX_ADDRESSES] = READ_ONCE(cnf->max_addresses); 5657 array[DEVCONF_ACCEPT_RA_DEFRTR] = READ_ONCE(cnf->accept_ra_defrtr); 5658 array[DEVCONF_RA_DEFRTR_METRIC] = READ_ONCE(cnf->ra_defrtr_metric); 5659 array[DEVCONF_ACCEPT_RA_MIN_HOP_LIMIT] = 5660 READ_ONCE(cnf->accept_ra_min_hop_limit); 5661 array[DEVCONF_ACCEPT_RA_PINFO] = READ_ONCE(cnf->accept_ra_pinfo); 5662 #ifdef CONFIG_IPV6_ROUTER_PREF 5663 array[DEVCONF_ACCEPT_RA_RTR_PREF] = READ_ONCE(cnf->accept_ra_rtr_pref); 5664 array[DEVCONF_RTR_PROBE_INTERVAL] = 5665 jiffies_to_msecs(READ_ONCE(cnf->rtr_probe_interval)); 5666 #ifdef CONFIG_IPV6_ROUTE_INFO 5667 array[DEVCONF_ACCEPT_RA_RT_INFO_MIN_PLEN] = 5668 READ_ONCE(cnf->accept_ra_rt_info_min_plen); 5669 array[DEVCONF_ACCEPT_RA_RT_INFO_MAX_PLEN] = 5670 READ_ONCE(cnf->accept_ra_rt_info_max_plen); 5671 #endif 5672 #endif 5673 array[DEVCONF_PROXY_NDP] = READ_ONCE(cnf->proxy_ndp); 5674 array[DEVCONF_ACCEPT_SOURCE_ROUTE] = 5675 READ_ONCE(cnf->accept_source_route); 5676 #ifdef CONFIG_IPV6_OPTIMISTIC_DAD 5677 array[DEVCONF_OPTIMISTIC_DAD] = READ_ONCE(cnf->optimistic_dad); 5678 array[DEVCONF_USE_OPTIMISTIC] = READ_ONCE(cnf->use_optimistic); 5679 #endif 5680 #ifdef CONFIG_IPV6_MROUTE 5681 array[DEVCONF_MC_FORWARDING] = atomic_read(&cnf->mc_forwarding); 5682 #endif 5683 array[DEVCONF_DISABLE_IPV6] = READ_ONCE(cnf->disable_ipv6); 5684 array[DEVCONF_ACCEPT_DAD] = READ_ONCE(cnf->accept_dad); 5685 array[DEVCONF_FORCE_TLLAO] = READ_ONCE(cnf->force_tllao); 5686 array[DEVCONF_NDISC_NOTIFY] = READ_ONCE(cnf->ndisc_notify); 5687 array[DEVCONF_SUPPRESS_FRAG_NDISC] = 5688 READ_ONCE(cnf->suppress_frag_ndisc); 5689 array[DEVCONF_ACCEPT_RA_FROM_LOCAL] = 5690 READ_ONCE(cnf->accept_ra_from_local); 5691 array[DEVCONF_ACCEPT_RA_MTU] = READ_ONCE(cnf->accept_ra_mtu); 5692 array[DEVCONF_IGNORE_ROUTES_WITH_LINKDOWN] = 5693 READ_ONCE(cnf->ignore_routes_with_linkdown); 5694 /* we omit DEVCONF_STABLE_SECRET for now */ 5695 array[DEVCONF_USE_OIF_ADDRS_ONLY] = READ_ONCE(cnf->use_oif_addrs_only); 5696 array[DEVCONF_DROP_UNICAST_IN_L2_MULTICAST] = 5697 READ_ONCE(cnf->drop_unicast_in_l2_multicast); 5698 array[DEVCONF_DROP_UNSOLICITED_NA] = READ_ONCE(cnf->drop_unsolicited_na); 5699 array[DEVCONF_KEEP_ADDR_ON_DOWN] = READ_ONCE(cnf->keep_addr_on_down); 5700 array[DEVCONF_SEG6_ENABLED] = READ_ONCE(cnf->seg6_enabled); 5701 #ifdef CONFIG_IPV6_SEG6_HMAC 5702 array[DEVCONF_SEG6_REQUIRE_HMAC] = READ_ONCE(cnf->seg6_require_hmac); 5703 #endif 5704 array[DEVCONF_ENHANCED_DAD] = READ_ONCE(cnf->enhanced_dad); 5705 array[DEVCONF_ADDR_GEN_MODE] = READ_ONCE(cnf->addr_gen_mode); 5706 array[DEVCONF_DISABLE_POLICY] = READ_ONCE(cnf->disable_policy); 5707 array[DEVCONF_NDISC_TCLASS] = READ_ONCE(cnf->ndisc_tclass); 5708 array[DEVCONF_RPL_SEG_ENABLED] = READ_ONCE(cnf->rpl_seg_enabled); 5709 array[DEVCONF_IOAM6_ENABLED] = READ_ONCE(cnf->ioam6_enabled); 5710 array[DEVCONF_IOAM6_ID] = READ_ONCE(cnf->ioam6_id); 5711 array[DEVCONF_IOAM6_ID_WIDE] = READ_ONCE(cnf->ioam6_id_wide); 5712 array[DEVCONF_NDISC_EVICT_NOCARRIER] = 5713 READ_ONCE(cnf->ndisc_evict_nocarrier); 5714 array[DEVCONF_ACCEPT_UNTRACKED_NA] = 5715 READ_ONCE(cnf->accept_untracked_na); 5716 array[DEVCONF_ACCEPT_RA_MIN_LFT] = READ_ONCE(cnf->accept_ra_min_lft); 5717 } 5718 5719 static inline size_t inet6_ifla6_size(void) 5720 { 5721 return nla_total_size(4) /* IFLA_INET6_FLAGS */ 5722 + nla_total_size(sizeof(struct ifla_cacheinfo)) 5723 + nla_total_size(DEVCONF_MAX * 4) /* IFLA_INET6_CONF */ 5724 + nla_total_size(IPSTATS_MIB_MAX * 8) /* IFLA_INET6_STATS */ 5725 + nla_total_size(ICMP6_MIB_MAX * 8) /* IFLA_INET6_ICMP6STATS */ 5726 + nla_total_size(sizeof(struct in6_addr)) /* IFLA_INET6_TOKEN */ 5727 + nla_total_size(1) /* IFLA_INET6_ADDR_GEN_MODE */ 5728 + nla_total_size(4) /* IFLA_INET6_RA_MTU */ 5729 + 0; 5730 } 5731 5732 static inline size_t inet6_if_nlmsg_size(void) 5733 { 5734 return NLMSG_ALIGN(sizeof(struct ifinfomsg)) 5735 + nla_total_size(IFNAMSIZ) /* IFLA_IFNAME */ 5736 + nla_total_size(MAX_ADDR_LEN) /* IFLA_ADDRESS */ 5737 + nla_total_size(4) /* IFLA_MTU */ 5738 + nla_total_size(4) /* IFLA_LINK */ 5739 + nla_total_size(1) /* IFLA_OPERSTATE */ 5740 + nla_total_size(inet6_ifla6_size()); /* IFLA_PROTINFO */ 5741 } 5742 5743 static inline void __snmp6_fill_statsdev(u64 *stats, atomic_long_t *mib, 5744 int bytes) 5745 { 5746 int i; 5747 int pad = bytes - sizeof(u64) * ICMP6_MIB_MAX; 5748 BUG_ON(pad < 0); 5749 5750 /* Use put_unaligned() because stats may not be aligned for u64. */ 5751 put_unaligned(ICMP6_MIB_MAX, &stats[0]); 5752 for (i = 1; i < ICMP6_MIB_MAX; i++) 5753 put_unaligned(atomic_long_read(&mib[i]), &stats[i]); 5754 5755 memset(&stats[ICMP6_MIB_MAX], 0, pad); 5756 } 5757 5758 static inline void __snmp6_fill_stats64(u64 *stats, void __percpu *mib, 5759 int bytes, size_t syncpoff) 5760 { 5761 int i, c; 5762 u64 buff[IPSTATS_MIB_MAX]; 5763 int pad = bytes - sizeof(u64) * IPSTATS_MIB_MAX; 5764 5765 BUG_ON(pad < 0); 5766 5767 memset(buff, 0, sizeof(buff)); 5768 buff[0] = IPSTATS_MIB_MAX; 5769 5770 for_each_possible_cpu(c) { 5771 for (i = 1; i < IPSTATS_MIB_MAX; i++) 5772 buff[i] += snmp_get_cpu_field64(mib, c, i, syncpoff); 5773 } 5774 5775 memcpy(stats, buff, IPSTATS_MIB_MAX * sizeof(u64)); 5776 memset(&stats[IPSTATS_MIB_MAX], 0, pad); 5777 } 5778 5779 static void snmp6_fill_stats(u64 *stats, struct inet6_dev *idev, int attrtype, 5780 int bytes) 5781 { 5782 switch (attrtype) { 5783 case IFLA_INET6_STATS: 5784 __snmp6_fill_stats64(stats, idev->stats.ipv6, bytes, 5785 offsetof(struct ipstats_mib, syncp)); 5786 break; 5787 case IFLA_INET6_ICMP6STATS: 5788 __snmp6_fill_statsdev(stats, idev->stats.icmpv6dev->mibs, bytes); 5789 break; 5790 } 5791 } 5792 5793 static int inet6_fill_ifla6_stats_attrs(struct sk_buff *skb, 5794 struct inet6_dev *idev) 5795 { 5796 struct nlattr *nla; 5797 5798 nla = nla_reserve(skb, IFLA_INET6_STATS, IPSTATS_MIB_MAX * sizeof(u64)); 5799 if (!nla) 5800 goto nla_put_failure; 5801 snmp6_fill_stats(nla_data(nla), idev, IFLA_INET6_STATS, nla_len(nla)); 5802 5803 nla = nla_reserve(skb, IFLA_INET6_ICMP6STATS, ICMP6_MIB_MAX * sizeof(u64)); 5804 if (!nla) 5805 goto nla_put_failure; 5806 snmp6_fill_stats(nla_data(nla), idev, IFLA_INET6_ICMP6STATS, nla_len(nla)); 5807 5808 return 0; 5809 5810 nla_put_failure: 5811 return -EMSGSIZE; 5812 } 5813 5814 static int inet6_fill_ifla6_attrs(struct sk_buff *skb, struct inet6_dev *idev, 5815 u32 ext_filter_mask) 5816 { 5817 struct ifla_cacheinfo ci; 5818 struct nlattr *nla; 5819 u32 ra_mtu; 5820 5821 if (nla_put_u32(skb, IFLA_INET6_FLAGS, READ_ONCE(idev->if_flags))) 5822 goto nla_put_failure; 5823 ci.max_reasm_len = IPV6_MAXPLEN; 5824 ci.tstamp = cstamp_delta(READ_ONCE(idev->tstamp)); 5825 ci.reachable_time = jiffies_to_msecs(idev->nd_parms->reachable_time); 5826 ci.retrans_time = jiffies_to_msecs(NEIGH_VAR(idev->nd_parms, RETRANS_TIME)); 5827 if (nla_put(skb, IFLA_INET6_CACHEINFO, sizeof(ci), &ci)) 5828 goto nla_put_failure; 5829 nla = nla_reserve(skb, IFLA_INET6_CONF, DEVCONF_MAX * sizeof(s32)); 5830 if (!nla) 5831 goto nla_put_failure; 5832 ipv6_store_devconf(&idev->cnf, nla_data(nla), nla_len(nla)); 5833 5834 /* XXX - MC not implemented */ 5835 5836 if (!(ext_filter_mask & RTEXT_FILTER_SKIP_STATS)) { 5837 if (inet6_fill_ifla6_stats_attrs(skb, idev) < 0) 5838 goto nla_put_failure; 5839 } 5840 5841 nla = nla_reserve(skb, IFLA_INET6_TOKEN, sizeof(struct in6_addr)); 5842 if (!nla) 5843 goto nla_put_failure; 5844 read_lock_bh(&idev->lock); 5845 memcpy(nla_data(nla), idev->token.s6_addr, nla_len(nla)); 5846 read_unlock_bh(&idev->lock); 5847 5848 if (nla_put_u8(skb, IFLA_INET6_ADDR_GEN_MODE, 5849 READ_ONCE(idev->cnf.addr_gen_mode))) 5850 goto nla_put_failure; 5851 5852 ra_mtu = READ_ONCE(idev->ra_mtu); 5853 if (ra_mtu && nla_put_u32(skb, IFLA_INET6_RA_MTU, ra_mtu)) 5854 goto nla_put_failure; 5855 5856 return 0; 5857 5858 nla_put_failure: 5859 return -EMSGSIZE; 5860 } 5861 5862 static size_t inet6_get_link_af_size(const struct net_device *dev, 5863 u32 ext_filter_mask) 5864 { 5865 if (!__in6_dev_get(dev)) 5866 return 0; 5867 5868 return inet6_ifla6_size(); 5869 } 5870 5871 static int inet6_fill_link_af(struct sk_buff *skb, const struct net_device *dev, 5872 u32 ext_filter_mask) 5873 { 5874 struct inet6_dev *idev = __in6_dev_get(dev); 5875 5876 if (!idev) 5877 return -ENODATA; 5878 5879 if (inet6_fill_ifla6_attrs(skb, idev, ext_filter_mask) < 0) 5880 return -EMSGSIZE; 5881 5882 return 0; 5883 } 5884 5885 static int inet6_set_iftoken(struct inet6_dev *idev, struct in6_addr *token, 5886 struct netlink_ext_ack *extack) 5887 { 5888 struct inet6_ifaddr *ifp; 5889 struct net_device *dev = idev->dev; 5890 bool clear_token, update_rs = false; 5891 struct in6_addr ll_addr; 5892 5893 ASSERT_RTNL(); 5894 5895 if (!token) 5896 return -EINVAL; 5897 5898 if (dev->flags & IFF_LOOPBACK) { 5899 NL_SET_ERR_MSG_MOD(extack, "Device is loopback"); 5900 return -EINVAL; 5901 } 5902 5903 if (dev->flags & IFF_NOARP) { 5904 NL_SET_ERR_MSG_MOD(extack, 5905 "Device does not do neighbour discovery"); 5906 return -EINVAL; 5907 } 5908 5909 if (!ipv6_accept_ra(idev)) { 5910 NL_SET_ERR_MSG_MOD(extack, 5911 "Router advertisement is disabled on device"); 5912 return -EINVAL; 5913 } 5914 5915 if (READ_ONCE(idev->cnf.rtr_solicits) == 0) { 5916 NL_SET_ERR_MSG(extack, 5917 "Router solicitation is disabled on device"); 5918 return -EINVAL; 5919 } 5920 5921 write_lock_bh(&idev->lock); 5922 5923 BUILD_BUG_ON(sizeof(token->s6_addr) != 16); 5924 memcpy(idev->token.s6_addr + 8, token->s6_addr + 8, 8); 5925 5926 write_unlock_bh(&idev->lock); 5927 5928 clear_token = ipv6_addr_any(token); 5929 if (clear_token) 5930 goto update_lft; 5931 5932 if (!idev->dead && (idev->if_flags & IF_READY) && 5933 !ipv6_get_lladdr(dev, &ll_addr, IFA_F_TENTATIVE | 5934 IFA_F_OPTIMISTIC)) { 5935 /* If we're not ready, then normal ifup will take care 5936 * of this. Otherwise, we need to request our rs here. 5937 */ 5938 ndisc_send_rs(dev, &ll_addr, &in6addr_linklocal_allrouters); 5939 update_rs = true; 5940 } 5941 5942 update_lft: 5943 write_lock_bh(&idev->lock); 5944 5945 if (update_rs) { 5946 idev->if_flags |= IF_RS_SENT; 5947 idev->rs_interval = rfc3315_s14_backoff_init( 5948 READ_ONCE(idev->cnf.rtr_solicit_interval)); 5949 idev->rs_probes = 1; 5950 addrconf_mod_rs_timer(idev, idev->rs_interval); 5951 } 5952 5953 /* Well, that's kinda nasty ... */ 5954 list_for_each_entry(ifp, &idev->addr_list, if_list) { 5955 spin_lock(&ifp->lock); 5956 if (ifp->tokenized) { 5957 ifp->valid_lft = 0; 5958 ifp->prefered_lft = 0; 5959 } 5960 spin_unlock(&ifp->lock); 5961 } 5962 5963 write_unlock_bh(&idev->lock); 5964 inet6_ifinfo_notify(RTM_NEWLINK, idev); 5965 addrconf_verify_rtnl(dev_net(dev)); 5966 return 0; 5967 } 5968 5969 static const struct nla_policy inet6_af_policy[IFLA_INET6_MAX + 1] = { 5970 [IFLA_INET6_ADDR_GEN_MODE] = { .type = NLA_U8 }, 5971 [IFLA_INET6_TOKEN] = { .len = sizeof(struct in6_addr) }, 5972 [IFLA_INET6_RA_MTU] = { .type = NLA_REJECT, 5973 .reject_message = 5974 "IFLA_INET6_RA_MTU can not be set" }, 5975 }; 5976 5977 static int check_addr_gen_mode(int mode) 5978 { 5979 if (mode != IN6_ADDR_GEN_MODE_EUI64 && 5980 mode != IN6_ADDR_GEN_MODE_NONE && 5981 mode != IN6_ADDR_GEN_MODE_STABLE_PRIVACY && 5982 mode != IN6_ADDR_GEN_MODE_RANDOM) 5983 return -EINVAL; 5984 return 1; 5985 } 5986 5987 static int check_stable_privacy(struct inet6_dev *idev, struct net *net, 5988 int mode) 5989 { 5990 if (mode == IN6_ADDR_GEN_MODE_STABLE_PRIVACY && 5991 !idev->cnf.stable_secret.initialized && 5992 !net->ipv6.devconf_dflt->stable_secret.initialized) 5993 return -EINVAL; 5994 return 1; 5995 } 5996 5997 static int inet6_validate_link_af(const struct net_device *dev, 5998 const struct nlattr *nla, 5999 struct netlink_ext_ack *extack) 6000 { 6001 struct nlattr *tb[IFLA_INET6_MAX + 1]; 6002 struct inet6_dev *idev = NULL; 6003 int err; 6004 6005 if (dev) { 6006 idev = __in6_dev_get(dev); 6007 if (!idev) 6008 return -EAFNOSUPPORT; 6009 } 6010 6011 err = nla_parse_nested_deprecated(tb, IFLA_INET6_MAX, nla, 6012 inet6_af_policy, extack); 6013 if (err) 6014 return err; 6015 6016 if (!tb[IFLA_INET6_TOKEN] && !tb[IFLA_INET6_ADDR_GEN_MODE]) 6017 return -EINVAL; 6018 6019 if (tb[IFLA_INET6_ADDR_GEN_MODE]) { 6020 u8 mode = nla_get_u8(tb[IFLA_INET6_ADDR_GEN_MODE]); 6021 6022 if (check_addr_gen_mode(mode) < 0) 6023 return -EINVAL; 6024 if (dev && check_stable_privacy(idev, dev_net(dev), mode) < 0) 6025 return -EINVAL; 6026 } 6027 6028 return 0; 6029 } 6030 6031 static int inet6_set_link_af(struct net_device *dev, const struct nlattr *nla, 6032 struct netlink_ext_ack *extack) 6033 { 6034 struct inet6_dev *idev = __in6_dev_get(dev); 6035 struct nlattr *tb[IFLA_INET6_MAX + 1]; 6036 int err; 6037 6038 if (!idev) 6039 return -EAFNOSUPPORT; 6040 6041 if (nla_parse_nested_deprecated(tb, IFLA_INET6_MAX, nla, NULL, NULL) < 0) 6042 return -EINVAL; 6043 6044 if (tb[IFLA_INET6_TOKEN]) { 6045 err = inet6_set_iftoken(idev, nla_data(tb[IFLA_INET6_TOKEN]), 6046 extack); 6047 if (err) 6048 return err; 6049 } 6050 6051 if (tb[IFLA_INET6_ADDR_GEN_MODE]) { 6052 u8 mode = nla_get_u8(tb[IFLA_INET6_ADDR_GEN_MODE]); 6053 6054 WRITE_ONCE(idev->cnf.addr_gen_mode, mode); 6055 } 6056 6057 return 0; 6058 } 6059 6060 static int inet6_fill_ifinfo(struct sk_buff *skb, struct inet6_dev *idev, 6061 u32 portid, u32 seq, int event, unsigned int flags) 6062 { 6063 struct net_device *dev = idev->dev; 6064 struct ifinfomsg *hdr; 6065 struct nlmsghdr *nlh; 6066 int ifindex, iflink; 6067 void *protoinfo; 6068 6069 nlh = nlmsg_put(skb, portid, seq, event, sizeof(*hdr), flags); 6070 if (!nlh) 6071 return -EMSGSIZE; 6072 6073 hdr = nlmsg_data(nlh); 6074 hdr->ifi_family = AF_INET6; 6075 hdr->__ifi_pad = 0; 6076 hdr->ifi_type = dev->type; 6077 ifindex = READ_ONCE(dev->ifindex); 6078 hdr->ifi_index = ifindex; 6079 hdr->ifi_flags = dev_get_flags(dev); 6080 hdr->ifi_change = 0; 6081 6082 iflink = dev_get_iflink(dev); 6083 if (nla_put_string(skb, IFLA_IFNAME, dev->name) || 6084 (dev->addr_len && 6085 nla_put(skb, IFLA_ADDRESS, dev->addr_len, dev->dev_addr)) || 6086 nla_put_u32(skb, IFLA_MTU, READ_ONCE(dev->mtu)) || 6087 (ifindex != iflink && 6088 nla_put_u32(skb, IFLA_LINK, iflink)) || 6089 nla_put_u8(skb, IFLA_OPERSTATE, 6090 netif_running(dev) ? READ_ONCE(dev->operstate) : IF_OPER_DOWN)) 6091 goto nla_put_failure; 6092 protoinfo = nla_nest_start_noflag(skb, IFLA_PROTINFO); 6093 if (!protoinfo) 6094 goto nla_put_failure; 6095 6096 if (inet6_fill_ifla6_attrs(skb, idev, 0) < 0) 6097 goto nla_put_failure; 6098 6099 nla_nest_end(skb, protoinfo); 6100 nlmsg_end(skb, nlh); 6101 return 0; 6102 6103 nla_put_failure: 6104 nlmsg_cancel(skb, nlh); 6105 return -EMSGSIZE; 6106 } 6107 6108 static int inet6_valid_dump_ifinfo(const struct nlmsghdr *nlh, 6109 struct netlink_ext_ack *extack) 6110 { 6111 struct ifinfomsg *ifm; 6112 6113 ifm = nlmsg_payload(nlh, sizeof(*ifm)); 6114 if (!ifm) { 6115 NL_SET_ERR_MSG_MOD(extack, "Invalid header for link dump request"); 6116 return -EINVAL; 6117 } 6118 6119 if (nlmsg_attrlen(nlh, sizeof(*ifm))) { 6120 NL_SET_ERR_MSG_MOD(extack, "Invalid data after header"); 6121 return -EINVAL; 6122 } 6123 6124 if (ifm->__ifi_pad || ifm->ifi_type || ifm->ifi_flags || 6125 ifm->ifi_change || ifm->ifi_index) { 6126 NL_SET_ERR_MSG_MOD(extack, "Invalid values in header for dump request"); 6127 return -EINVAL; 6128 } 6129 6130 return 0; 6131 } 6132 6133 static int inet6_dump_ifinfo(struct sk_buff *skb, struct netlink_callback *cb) 6134 { 6135 struct net *net = sock_net(skb->sk); 6136 struct { 6137 unsigned long ifindex; 6138 } *ctx = (void *)cb->ctx; 6139 struct net_device *dev; 6140 struct inet6_dev *idev; 6141 int err; 6142 6143 /* only requests using strict checking can pass data to 6144 * influence the dump 6145 */ 6146 if (cb->strict_check) { 6147 err = inet6_valid_dump_ifinfo(cb->nlh, cb->extack); 6148 6149 if (err < 0) 6150 return err; 6151 } 6152 6153 err = 0; 6154 rcu_read_lock(); 6155 for_each_netdev_dump(net, dev, ctx->ifindex) { 6156 idev = __in6_dev_get(dev); 6157 if (!idev) 6158 continue; 6159 err = inet6_fill_ifinfo(skb, idev, 6160 NETLINK_CB(cb->skb).portid, 6161 cb->nlh->nlmsg_seq, 6162 RTM_NEWLINK, NLM_F_MULTI); 6163 if (err < 0) 6164 break; 6165 } 6166 rcu_read_unlock(); 6167 6168 return err; 6169 } 6170 6171 void inet6_ifinfo_notify(int event, struct inet6_dev *idev) 6172 { 6173 struct sk_buff *skb; 6174 struct net *net = dev_net(idev->dev); 6175 int err = -ENOBUFS; 6176 6177 skb = nlmsg_new(inet6_if_nlmsg_size(), GFP_ATOMIC); 6178 if (!skb) 6179 goto errout; 6180 6181 err = inet6_fill_ifinfo(skb, idev, 0, 0, event, 0); 6182 if (err < 0) { 6183 /* -EMSGSIZE implies BUG in inet6_if_nlmsg_size() */ 6184 WARN_ON(err == -EMSGSIZE); 6185 kfree_skb(skb); 6186 goto errout; 6187 } 6188 rtnl_notify(skb, net, 0, RTNLGRP_IPV6_IFINFO, NULL, GFP_ATOMIC); 6189 return; 6190 errout: 6191 rtnl_set_sk_err(net, RTNLGRP_IPV6_IFINFO, err); 6192 } 6193 6194 static inline size_t inet6_prefix_nlmsg_size(void) 6195 { 6196 return NLMSG_ALIGN(sizeof(struct prefixmsg)) 6197 + nla_total_size(sizeof(struct in6_addr)) 6198 + nla_total_size(sizeof(struct prefix_cacheinfo)); 6199 } 6200 6201 static int inet6_fill_prefix(struct sk_buff *skb, struct inet6_dev *idev, 6202 struct prefix_info *pinfo, u32 portid, u32 seq, 6203 int event, unsigned int flags) 6204 { 6205 struct prefixmsg *pmsg; 6206 struct nlmsghdr *nlh; 6207 struct prefix_cacheinfo ci; 6208 6209 nlh = nlmsg_put(skb, portid, seq, event, sizeof(*pmsg), flags); 6210 if (!nlh) 6211 return -EMSGSIZE; 6212 6213 pmsg = nlmsg_data(nlh); 6214 pmsg->prefix_family = AF_INET6; 6215 pmsg->prefix_pad1 = 0; 6216 pmsg->prefix_pad2 = 0; 6217 pmsg->prefix_ifindex = idev->dev->ifindex; 6218 pmsg->prefix_len = pinfo->prefix_len; 6219 pmsg->prefix_type = pinfo->type; 6220 pmsg->prefix_pad3 = 0; 6221 pmsg->prefix_flags = pinfo->flags; 6222 6223 if (nla_put(skb, PREFIX_ADDRESS, sizeof(pinfo->prefix), &pinfo->prefix)) 6224 goto nla_put_failure; 6225 ci.preferred_time = ntohl(pinfo->prefered); 6226 ci.valid_time = ntohl(pinfo->valid); 6227 if (nla_put(skb, PREFIX_CACHEINFO, sizeof(ci), &ci)) 6228 goto nla_put_failure; 6229 nlmsg_end(skb, nlh); 6230 return 0; 6231 6232 nla_put_failure: 6233 nlmsg_cancel(skb, nlh); 6234 return -EMSGSIZE; 6235 } 6236 6237 static void inet6_prefix_notify(int event, struct inet6_dev *idev, 6238 struct prefix_info *pinfo) 6239 { 6240 struct sk_buff *skb; 6241 struct net *net = dev_net(idev->dev); 6242 int err = -ENOBUFS; 6243 6244 skb = nlmsg_new(inet6_prefix_nlmsg_size(), GFP_ATOMIC); 6245 if (!skb) 6246 goto errout; 6247 6248 err = inet6_fill_prefix(skb, idev, pinfo, 0, 0, event, 0); 6249 if (err < 0) { 6250 /* -EMSGSIZE implies BUG in inet6_prefix_nlmsg_size() */ 6251 WARN_ON(err == -EMSGSIZE); 6252 kfree_skb(skb); 6253 goto errout; 6254 } 6255 rtnl_notify(skb, net, 0, RTNLGRP_IPV6_PREFIX, NULL, GFP_ATOMIC); 6256 return; 6257 errout: 6258 rtnl_set_sk_err(net, RTNLGRP_IPV6_PREFIX, err); 6259 } 6260 6261 static void __ipv6_ifa_notify(int event, struct inet6_ifaddr *ifp) 6262 { 6263 struct net *net = dev_net(ifp->idev->dev); 6264 6265 if (event) 6266 ASSERT_RTNL(); 6267 6268 inet6_ifa_notify(event ? : RTM_NEWADDR, ifp); 6269 6270 switch (event) { 6271 case RTM_NEWADDR: 6272 /* 6273 * If the address was optimistic we inserted the route at the 6274 * start of our DAD process, so we don't need to do it again. 6275 * If the device was taken down in the middle of the DAD 6276 * cycle there is a race where we could get here without a 6277 * host route, so nothing to insert. That will be fixed when 6278 * the device is brought up. 6279 */ 6280 if (ifp->rt && !rcu_access_pointer(ifp->rt->fib6_node)) { 6281 ip6_ins_rt(net, ifp->rt); 6282 } else if (!ifp->rt && (ifp->idev->dev->flags & IFF_UP)) { 6283 pr_warn("BUG: Address %pI6c on device %s is missing its host route.\n", 6284 &ifp->addr, ifp->idev->dev->name); 6285 } 6286 6287 if (ifp->idev->cnf.forwarding) 6288 addrconf_join_anycast(ifp); 6289 if (!ipv6_addr_any(&ifp->peer_addr)) 6290 addrconf_prefix_route(&ifp->peer_addr, 128, 6291 ifp->rt_priority, ifp->idev->dev, 6292 0, 0, GFP_ATOMIC); 6293 break; 6294 case RTM_DELADDR: 6295 if (ifp->idev->cnf.forwarding) 6296 addrconf_leave_anycast(ifp); 6297 addrconf_leave_solict(ifp->idev, &ifp->addr); 6298 if (!ipv6_addr_any(&ifp->peer_addr)) { 6299 struct fib6_info *rt; 6300 6301 rt = addrconf_get_prefix_route(&ifp->peer_addr, 128, 6302 ifp->idev->dev, 0, 0, 6303 false); 6304 if (rt) 6305 ip6_del_rt(net, rt, false); 6306 } 6307 if (ifp->rt) { 6308 ip6_del_rt(net, ifp->rt, false); 6309 ifp->rt = NULL; 6310 } 6311 rt_genid_bump_ipv6(net); 6312 break; 6313 } 6314 atomic_inc(&net->ipv6.dev_addr_genid); 6315 } 6316 6317 static void ipv6_ifa_notify(int event, struct inet6_ifaddr *ifp) 6318 { 6319 if (likely(ifp->idev->dead == 0)) 6320 __ipv6_ifa_notify(event, ifp); 6321 } 6322 6323 #ifdef CONFIG_SYSCTL 6324 6325 static int addrconf_sysctl_forward(const struct ctl_table *ctl, int write, 6326 void *buffer, size_t *lenp, loff_t *ppos) 6327 { 6328 int *valp = ctl->data; 6329 int val = *valp; 6330 loff_t pos = *ppos; 6331 struct ctl_table lctl; 6332 int ret; 6333 6334 /* 6335 * ctl->data points to idev->cnf.forwarding, we should 6336 * not modify it until we get the rtnl lock. 6337 */ 6338 lctl = *ctl; 6339 lctl.data = &val; 6340 6341 ret = proc_dointvec(&lctl, write, buffer, lenp, ppos); 6342 6343 if (write) 6344 ret = addrconf_fixup_forwarding(ctl, valp, val); 6345 if (ret) 6346 *ppos = pos; 6347 return ret; 6348 } 6349 6350 static int addrconf_sysctl_mtu(const struct ctl_table *ctl, int write, 6351 void *buffer, size_t *lenp, loff_t *ppos) 6352 { 6353 struct inet6_dev *idev = ctl->extra1; 6354 int min_mtu = IPV6_MIN_MTU; 6355 struct ctl_table lctl; 6356 6357 lctl = *ctl; 6358 lctl.extra1 = &min_mtu; 6359 lctl.extra2 = idev ? &idev->dev->mtu : NULL; 6360 6361 return proc_dointvec_minmax(&lctl, write, buffer, lenp, ppos); 6362 } 6363 6364 static void dev_disable_change(struct inet6_dev *idev) 6365 { 6366 struct netdev_notifier_info info; 6367 6368 if (!idev || !idev->dev) 6369 return; 6370 6371 netdev_notifier_info_init(&info, idev->dev); 6372 if (idev->cnf.disable_ipv6) 6373 addrconf_notify(NULL, NETDEV_DOWN, &info); 6374 else 6375 addrconf_notify(NULL, NETDEV_UP, &info); 6376 } 6377 6378 static void addrconf_disable_change(struct net *net, __s32 newf) 6379 { 6380 struct net_device *dev; 6381 struct inet6_dev *idev; 6382 6383 for_each_netdev(net, dev) { 6384 idev = __in6_dev_get_rtnl_net(dev); 6385 if (idev) { 6386 int changed = (!idev->cnf.disable_ipv6) ^ (!newf); 6387 6388 WRITE_ONCE(idev->cnf.disable_ipv6, newf); 6389 if (changed) 6390 dev_disable_change(idev); 6391 } 6392 } 6393 } 6394 6395 static int addrconf_disable_ipv6(const struct ctl_table *table, int *p, int newf) 6396 { 6397 struct net *net = (struct net *)table->extra2; 6398 int old; 6399 6400 if (p == &net->ipv6.devconf_dflt->disable_ipv6) { 6401 WRITE_ONCE(*p, newf); 6402 return 0; 6403 } 6404 6405 if (!rtnl_net_trylock(net)) 6406 return restart_syscall(); 6407 6408 old = *p; 6409 WRITE_ONCE(*p, newf); 6410 6411 if (p == &net->ipv6.devconf_all->disable_ipv6) { 6412 WRITE_ONCE(net->ipv6.devconf_dflt->disable_ipv6, newf); 6413 addrconf_disable_change(net, newf); 6414 } else if ((!newf) ^ (!old)) { 6415 dev_disable_change((struct inet6_dev *)table->extra1); 6416 } 6417 6418 rtnl_net_unlock(net); 6419 return 0; 6420 } 6421 6422 static int addrconf_sysctl_disable(const struct ctl_table *ctl, int write, 6423 void *buffer, size_t *lenp, loff_t *ppos) 6424 { 6425 int *valp = ctl->data; 6426 int val = *valp; 6427 loff_t pos = *ppos; 6428 struct ctl_table lctl; 6429 int ret; 6430 6431 /* 6432 * ctl->data points to idev->cnf.disable_ipv6, we should 6433 * not modify it until we get the rtnl lock. 6434 */ 6435 lctl = *ctl; 6436 lctl.data = &val; 6437 6438 ret = proc_dointvec(&lctl, write, buffer, lenp, ppos); 6439 6440 if (write) 6441 ret = addrconf_disable_ipv6(ctl, valp, val); 6442 if (ret) 6443 *ppos = pos; 6444 return ret; 6445 } 6446 6447 static int addrconf_sysctl_proxy_ndp(const struct ctl_table *ctl, int write, 6448 void *buffer, size_t *lenp, loff_t *ppos) 6449 { 6450 int *valp = ctl->data; 6451 int ret; 6452 int old, new; 6453 6454 old = *valp; 6455 ret = proc_dointvec(ctl, write, buffer, lenp, ppos); 6456 new = *valp; 6457 6458 if (write && old != new) { 6459 struct net *net = ctl->extra2; 6460 6461 if (!rtnl_net_trylock(net)) 6462 return restart_syscall(); 6463 6464 if (valp == &net->ipv6.devconf_dflt->proxy_ndp) { 6465 inet6_netconf_notify_devconf(net, RTM_NEWNETCONF, 6466 NETCONFA_PROXY_NEIGH, 6467 NETCONFA_IFINDEX_DEFAULT, 6468 net->ipv6.devconf_dflt); 6469 } else if (valp == &net->ipv6.devconf_all->proxy_ndp) { 6470 inet6_netconf_notify_devconf(net, RTM_NEWNETCONF, 6471 NETCONFA_PROXY_NEIGH, 6472 NETCONFA_IFINDEX_ALL, 6473 net->ipv6.devconf_all); 6474 } else { 6475 struct inet6_dev *idev = ctl->extra1; 6476 6477 inet6_netconf_notify_devconf(net, RTM_NEWNETCONF, 6478 NETCONFA_PROXY_NEIGH, 6479 idev->dev->ifindex, 6480 &idev->cnf); 6481 } 6482 rtnl_net_unlock(net); 6483 } 6484 6485 return ret; 6486 } 6487 6488 static int addrconf_sysctl_addr_gen_mode(const struct ctl_table *ctl, int write, 6489 void *buffer, size_t *lenp, 6490 loff_t *ppos) 6491 { 6492 int ret = 0; 6493 u32 new_val; 6494 struct inet6_dev *idev = (struct inet6_dev *)ctl->extra1; 6495 struct net *net = (struct net *)ctl->extra2; 6496 struct ctl_table tmp = { 6497 .data = &new_val, 6498 .maxlen = sizeof(new_val), 6499 .mode = ctl->mode, 6500 }; 6501 6502 if (!rtnl_net_trylock(net)) 6503 return restart_syscall(); 6504 6505 new_val = *((u32 *)ctl->data); 6506 6507 ret = proc_douintvec(&tmp, write, buffer, lenp, ppos); 6508 if (ret != 0) 6509 goto out; 6510 6511 if (write) { 6512 if (check_addr_gen_mode(new_val) < 0) { 6513 ret = -EINVAL; 6514 goto out; 6515 } 6516 6517 if (idev) { 6518 if (check_stable_privacy(idev, net, new_val) < 0) { 6519 ret = -EINVAL; 6520 goto out; 6521 } 6522 6523 if (idev->cnf.addr_gen_mode != new_val) { 6524 WRITE_ONCE(idev->cnf.addr_gen_mode, new_val); 6525 netdev_lock_ops(idev->dev); 6526 addrconf_init_auto_addrs(idev->dev); 6527 netdev_unlock_ops(idev->dev); 6528 } 6529 } else if (&net->ipv6.devconf_all->addr_gen_mode == ctl->data) { 6530 struct net_device *dev; 6531 6532 WRITE_ONCE(net->ipv6.devconf_dflt->addr_gen_mode, new_val); 6533 for_each_netdev(net, dev) { 6534 idev = __in6_dev_get_rtnl_net(dev); 6535 if (idev && 6536 idev->cnf.addr_gen_mode != new_val) { 6537 WRITE_ONCE(idev->cnf.addr_gen_mode, 6538 new_val); 6539 netdev_lock_ops(idev->dev); 6540 addrconf_init_auto_addrs(idev->dev); 6541 netdev_unlock_ops(idev->dev); 6542 } 6543 } 6544 } 6545 6546 WRITE_ONCE(*((u32 *)ctl->data), new_val); 6547 } 6548 6549 out: 6550 rtnl_net_unlock(net); 6551 6552 return ret; 6553 } 6554 6555 static int addrconf_sysctl_stable_secret(const struct ctl_table *ctl, int write, 6556 void *buffer, size_t *lenp, 6557 loff_t *ppos) 6558 { 6559 int err; 6560 struct in6_addr addr; 6561 char str[IPV6_MAX_STRLEN]; 6562 struct ctl_table lctl = *ctl; 6563 struct net *net = ctl->extra2; 6564 struct ipv6_stable_secret *secret = ctl->data; 6565 6566 if (&net->ipv6.devconf_all->stable_secret == ctl->data) 6567 return -EIO; 6568 6569 lctl.maxlen = IPV6_MAX_STRLEN; 6570 lctl.data = str; 6571 6572 if (!rtnl_net_trylock(net)) 6573 return restart_syscall(); 6574 6575 if (!write && !secret->initialized) { 6576 err = -EIO; 6577 goto out; 6578 } 6579 6580 err = snprintf(str, sizeof(str), "%pI6", &secret->secret); 6581 if (err >= sizeof(str)) { 6582 err = -EIO; 6583 goto out; 6584 } 6585 6586 err = proc_dostring(&lctl, write, buffer, lenp, ppos); 6587 if (err || !write) 6588 goto out; 6589 6590 if (in6_pton(str, -1, addr.in6_u.u6_addr8, -1, NULL) != 1) { 6591 err = -EIO; 6592 goto out; 6593 } 6594 6595 secret->initialized = true; 6596 secret->secret = addr; 6597 6598 if (&net->ipv6.devconf_dflt->stable_secret == ctl->data) { 6599 struct net_device *dev; 6600 6601 for_each_netdev(net, dev) { 6602 struct inet6_dev *idev = __in6_dev_get_rtnl_net(dev); 6603 6604 if (idev) { 6605 WRITE_ONCE(idev->cnf.addr_gen_mode, 6606 IN6_ADDR_GEN_MODE_STABLE_PRIVACY); 6607 } 6608 } 6609 } else { 6610 struct inet6_dev *idev = ctl->extra1; 6611 6612 WRITE_ONCE(idev->cnf.addr_gen_mode, 6613 IN6_ADDR_GEN_MODE_STABLE_PRIVACY); 6614 } 6615 6616 out: 6617 rtnl_net_unlock(net); 6618 6619 return err; 6620 } 6621 6622 static 6623 int addrconf_sysctl_ignore_routes_with_linkdown(const struct ctl_table *ctl, 6624 int write, void *buffer, 6625 size_t *lenp, 6626 loff_t *ppos) 6627 { 6628 int *valp = ctl->data; 6629 int val = *valp; 6630 loff_t pos = *ppos; 6631 struct ctl_table lctl; 6632 int ret; 6633 6634 /* ctl->data points to idev->cnf.ignore_routes_when_linkdown 6635 * we should not modify it until we get the rtnl lock. 6636 */ 6637 lctl = *ctl; 6638 lctl.data = &val; 6639 6640 ret = proc_dointvec(&lctl, write, buffer, lenp, ppos); 6641 6642 if (write) 6643 ret = addrconf_fixup_linkdown(ctl, valp, val); 6644 if (ret) 6645 *ppos = pos; 6646 return ret; 6647 } 6648 6649 static 6650 void addrconf_set_nopolicy(struct rt6_info *rt, int action) 6651 { 6652 if (rt) { 6653 if (action) 6654 rt->dst.flags |= DST_NOPOLICY; 6655 else 6656 rt->dst.flags &= ~DST_NOPOLICY; 6657 } 6658 } 6659 6660 static 6661 void addrconf_disable_policy_idev(struct inet6_dev *idev, int val) 6662 { 6663 struct inet6_ifaddr *ifa; 6664 6665 read_lock_bh(&idev->lock); 6666 list_for_each_entry(ifa, &idev->addr_list, if_list) { 6667 spin_lock(&ifa->lock); 6668 if (ifa->rt) { 6669 /* host routes only use builtin fib6_nh */ 6670 struct fib6_nh *nh = ifa->rt->fib6_nh; 6671 int cpu; 6672 6673 rcu_read_lock(); 6674 ifa->rt->dst_nopolicy = val ? true : false; 6675 if (nh->rt6i_pcpu) { 6676 for_each_possible_cpu(cpu) { 6677 struct rt6_info **rtp; 6678 6679 rtp = per_cpu_ptr(nh->rt6i_pcpu, cpu); 6680 addrconf_set_nopolicy(*rtp, val); 6681 } 6682 } 6683 rcu_read_unlock(); 6684 } 6685 spin_unlock(&ifa->lock); 6686 } 6687 read_unlock_bh(&idev->lock); 6688 } 6689 6690 static 6691 int addrconf_disable_policy(const struct ctl_table *ctl, int *valp, int val) 6692 { 6693 struct net *net = (struct net *)ctl->extra2; 6694 struct inet6_dev *idev; 6695 6696 if (valp == &net->ipv6.devconf_dflt->disable_policy) { 6697 WRITE_ONCE(*valp, val); 6698 return 0; 6699 } 6700 6701 if (!rtnl_net_trylock(net)) 6702 return restart_syscall(); 6703 6704 WRITE_ONCE(*valp, val); 6705 6706 if (valp == &net->ipv6.devconf_all->disable_policy) { 6707 struct net_device *dev; 6708 6709 for_each_netdev(net, dev) { 6710 idev = __in6_dev_get_rtnl_net(dev); 6711 if (idev) 6712 addrconf_disable_policy_idev(idev, val); 6713 } 6714 } else { 6715 idev = (struct inet6_dev *)ctl->extra1; 6716 addrconf_disable_policy_idev(idev, val); 6717 } 6718 6719 rtnl_net_unlock(net); 6720 return 0; 6721 } 6722 6723 static int addrconf_sysctl_disable_policy(const struct ctl_table *ctl, int write, 6724 void *buffer, size_t *lenp, loff_t *ppos) 6725 { 6726 int *valp = ctl->data; 6727 int val = *valp; 6728 loff_t pos = *ppos; 6729 struct ctl_table lctl; 6730 int ret; 6731 6732 lctl = *ctl; 6733 lctl.data = &val; 6734 ret = proc_dointvec(&lctl, write, buffer, lenp, ppos); 6735 6736 if (write && (*valp != val)) 6737 ret = addrconf_disable_policy(ctl, valp, val); 6738 6739 if (ret) 6740 *ppos = pos; 6741 6742 return ret; 6743 } 6744 6745 static int minus_one = -1; 6746 static const int two_five_five = 255; 6747 static u32 ioam6_if_id_max = U16_MAX; 6748 6749 static const struct ctl_table addrconf_sysctl[] = { 6750 { 6751 .procname = "forwarding", 6752 .data = &ipv6_devconf.forwarding, 6753 .maxlen = sizeof(int), 6754 .mode = 0644, 6755 .proc_handler = addrconf_sysctl_forward, 6756 }, 6757 { 6758 .procname = "hop_limit", 6759 .data = &ipv6_devconf.hop_limit, 6760 .maxlen = sizeof(int), 6761 .mode = 0644, 6762 .proc_handler = proc_dointvec_minmax, 6763 .extra1 = (void *)SYSCTL_ONE, 6764 .extra2 = (void *)&two_five_five, 6765 }, 6766 { 6767 .procname = "mtu", 6768 .data = &ipv6_devconf.mtu6, 6769 .maxlen = sizeof(int), 6770 .mode = 0644, 6771 .proc_handler = addrconf_sysctl_mtu, 6772 }, 6773 { 6774 .procname = "accept_ra", 6775 .data = &ipv6_devconf.accept_ra, 6776 .maxlen = sizeof(int), 6777 .mode = 0644, 6778 .proc_handler = proc_dointvec, 6779 }, 6780 { 6781 .procname = "accept_redirects", 6782 .data = &ipv6_devconf.accept_redirects, 6783 .maxlen = sizeof(int), 6784 .mode = 0644, 6785 .proc_handler = proc_dointvec, 6786 }, 6787 { 6788 .procname = "autoconf", 6789 .data = &ipv6_devconf.autoconf, 6790 .maxlen = sizeof(int), 6791 .mode = 0644, 6792 .proc_handler = proc_dointvec, 6793 }, 6794 { 6795 .procname = "dad_transmits", 6796 .data = &ipv6_devconf.dad_transmits, 6797 .maxlen = sizeof(int), 6798 .mode = 0644, 6799 .proc_handler = proc_dointvec, 6800 }, 6801 { 6802 .procname = "router_solicitations", 6803 .data = &ipv6_devconf.rtr_solicits, 6804 .maxlen = sizeof(int), 6805 .mode = 0644, 6806 .proc_handler = proc_dointvec_minmax, 6807 .extra1 = &minus_one, 6808 }, 6809 { 6810 .procname = "router_solicitation_interval", 6811 .data = &ipv6_devconf.rtr_solicit_interval, 6812 .maxlen = sizeof(int), 6813 .mode = 0644, 6814 .proc_handler = proc_dointvec_jiffies, 6815 }, 6816 { 6817 .procname = "router_solicitation_max_interval", 6818 .data = &ipv6_devconf.rtr_solicit_max_interval, 6819 .maxlen = sizeof(int), 6820 .mode = 0644, 6821 .proc_handler = proc_dointvec_jiffies, 6822 }, 6823 { 6824 .procname = "router_solicitation_delay", 6825 .data = &ipv6_devconf.rtr_solicit_delay, 6826 .maxlen = sizeof(int), 6827 .mode = 0644, 6828 .proc_handler = proc_dointvec_jiffies, 6829 }, 6830 { 6831 .procname = "force_mld_version", 6832 .data = &ipv6_devconf.force_mld_version, 6833 .maxlen = sizeof(int), 6834 .mode = 0644, 6835 .proc_handler = proc_dointvec, 6836 }, 6837 { 6838 .procname = "mldv1_unsolicited_report_interval", 6839 .data = 6840 &ipv6_devconf.mldv1_unsolicited_report_interval, 6841 .maxlen = sizeof(int), 6842 .mode = 0644, 6843 .proc_handler = proc_dointvec_ms_jiffies, 6844 }, 6845 { 6846 .procname = "mldv2_unsolicited_report_interval", 6847 .data = 6848 &ipv6_devconf.mldv2_unsolicited_report_interval, 6849 .maxlen = sizeof(int), 6850 .mode = 0644, 6851 .proc_handler = proc_dointvec_ms_jiffies, 6852 }, 6853 { 6854 .procname = "use_tempaddr", 6855 .data = &ipv6_devconf.use_tempaddr, 6856 .maxlen = sizeof(int), 6857 .mode = 0644, 6858 .proc_handler = proc_dointvec, 6859 }, 6860 { 6861 .procname = "temp_valid_lft", 6862 .data = &ipv6_devconf.temp_valid_lft, 6863 .maxlen = sizeof(int), 6864 .mode = 0644, 6865 .proc_handler = proc_dointvec, 6866 }, 6867 { 6868 .procname = "temp_prefered_lft", 6869 .data = &ipv6_devconf.temp_prefered_lft, 6870 .maxlen = sizeof(int), 6871 .mode = 0644, 6872 .proc_handler = proc_dointvec, 6873 }, 6874 { 6875 .procname = "regen_min_advance", 6876 .data = &ipv6_devconf.regen_min_advance, 6877 .maxlen = sizeof(int), 6878 .mode = 0644, 6879 .proc_handler = proc_dointvec, 6880 }, 6881 { 6882 .procname = "regen_max_retry", 6883 .data = &ipv6_devconf.regen_max_retry, 6884 .maxlen = sizeof(int), 6885 .mode = 0644, 6886 .proc_handler = proc_dointvec, 6887 }, 6888 { 6889 .procname = "max_desync_factor", 6890 .data = &ipv6_devconf.max_desync_factor, 6891 .maxlen = sizeof(int), 6892 .mode = 0644, 6893 .proc_handler = proc_dointvec, 6894 }, 6895 { 6896 .procname = "max_addresses", 6897 .data = &ipv6_devconf.max_addresses, 6898 .maxlen = sizeof(int), 6899 .mode = 0644, 6900 .proc_handler = proc_dointvec, 6901 }, 6902 { 6903 .procname = "accept_ra_defrtr", 6904 .data = &ipv6_devconf.accept_ra_defrtr, 6905 .maxlen = sizeof(int), 6906 .mode = 0644, 6907 .proc_handler = proc_dointvec, 6908 }, 6909 { 6910 .procname = "ra_defrtr_metric", 6911 .data = &ipv6_devconf.ra_defrtr_metric, 6912 .maxlen = sizeof(u32), 6913 .mode = 0644, 6914 .proc_handler = proc_douintvec_minmax, 6915 .extra1 = (void *)SYSCTL_ONE, 6916 }, 6917 { 6918 .procname = "accept_ra_min_hop_limit", 6919 .data = &ipv6_devconf.accept_ra_min_hop_limit, 6920 .maxlen = sizeof(int), 6921 .mode = 0644, 6922 .proc_handler = proc_dointvec, 6923 }, 6924 { 6925 .procname = "accept_ra_min_lft", 6926 .data = &ipv6_devconf.accept_ra_min_lft, 6927 .maxlen = sizeof(int), 6928 .mode = 0644, 6929 .proc_handler = proc_dointvec, 6930 }, 6931 { 6932 .procname = "accept_ra_pinfo", 6933 .data = &ipv6_devconf.accept_ra_pinfo, 6934 .maxlen = sizeof(int), 6935 .mode = 0644, 6936 .proc_handler = proc_dointvec, 6937 }, 6938 { 6939 .procname = "ra_honor_pio_life", 6940 .data = &ipv6_devconf.ra_honor_pio_life, 6941 .maxlen = sizeof(u8), 6942 .mode = 0644, 6943 .proc_handler = proc_dou8vec_minmax, 6944 .extra1 = SYSCTL_ZERO, 6945 .extra2 = SYSCTL_ONE, 6946 }, 6947 { 6948 .procname = "ra_honor_pio_pflag", 6949 .data = &ipv6_devconf.ra_honor_pio_pflag, 6950 .maxlen = sizeof(u8), 6951 .mode = 0644, 6952 .proc_handler = proc_dou8vec_minmax, 6953 .extra1 = SYSCTL_ZERO, 6954 .extra2 = SYSCTL_ONE, 6955 }, 6956 #ifdef CONFIG_IPV6_ROUTER_PREF 6957 { 6958 .procname = "accept_ra_rtr_pref", 6959 .data = &ipv6_devconf.accept_ra_rtr_pref, 6960 .maxlen = sizeof(int), 6961 .mode = 0644, 6962 .proc_handler = proc_dointvec, 6963 }, 6964 { 6965 .procname = "router_probe_interval", 6966 .data = &ipv6_devconf.rtr_probe_interval, 6967 .maxlen = sizeof(int), 6968 .mode = 0644, 6969 .proc_handler = proc_dointvec_jiffies, 6970 }, 6971 #ifdef CONFIG_IPV6_ROUTE_INFO 6972 { 6973 .procname = "accept_ra_rt_info_min_plen", 6974 .data = &ipv6_devconf.accept_ra_rt_info_min_plen, 6975 .maxlen = sizeof(int), 6976 .mode = 0644, 6977 .proc_handler = proc_dointvec, 6978 }, 6979 { 6980 .procname = "accept_ra_rt_info_max_plen", 6981 .data = &ipv6_devconf.accept_ra_rt_info_max_plen, 6982 .maxlen = sizeof(int), 6983 .mode = 0644, 6984 .proc_handler = proc_dointvec, 6985 }, 6986 #endif 6987 #endif 6988 { 6989 .procname = "proxy_ndp", 6990 .data = &ipv6_devconf.proxy_ndp, 6991 .maxlen = sizeof(int), 6992 .mode = 0644, 6993 .proc_handler = addrconf_sysctl_proxy_ndp, 6994 }, 6995 { 6996 .procname = "accept_source_route", 6997 .data = &ipv6_devconf.accept_source_route, 6998 .maxlen = sizeof(int), 6999 .mode = 0644, 7000 .proc_handler = proc_dointvec, 7001 }, 7002 #ifdef CONFIG_IPV6_OPTIMISTIC_DAD 7003 { 7004 .procname = "optimistic_dad", 7005 .data = &ipv6_devconf.optimistic_dad, 7006 .maxlen = sizeof(int), 7007 .mode = 0644, 7008 .proc_handler = proc_dointvec, 7009 }, 7010 { 7011 .procname = "use_optimistic", 7012 .data = &ipv6_devconf.use_optimistic, 7013 .maxlen = sizeof(int), 7014 .mode = 0644, 7015 .proc_handler = proc_dointvec, 7016 }, 7017 #endif 7018 #ifdef CONFIG_IPV6_MROUTE 7019 { 7020 .procname = "mc_forwarding", 7021 .data = &ipv6_devconf.mc_forwarding, 7022 .maxlen = sizeof(int), 7023 .mode = 0444, 7024 .proc_handler = proc_dointvec, 7025 }, 7026 #endif 7027 { 7028 .procname = "disable_ipv6", 7029 .data = &ipv6_devconf.disable_ipv6, 7030 .maxlen = sizeof(int), 7031 .mode = 0644, 7032 .proc_handler = addrconf_sysctl_disable, 7033 }, 7034 { 7035 .procname = "accept_dad", 7036 .data = &ipv6_devconf.accept_dad, 7037 .maxlen = sizeof(int), 7038 .mode = 0644, 7039 .proc_handler = proc_dointvec, 7040 }, 7041 { 7042 .procname = "force_tllao", 7043 .data = &ipv6_devconf.force_tllao, 7044 .maxlen = sizeof(int), 7045 .mode = 0644, 7046 .proc_handler = proc_dointvec 7047 }, 7048 { 7049 .procname = "ndisc_notify", 7050 .data = &ipv6_devconf.ndisc_notify, 7051 .maxlen = sizeof(int), 7052 .mode = 0644, 7053 .proc_handler = proc_dointvec 7054 }, 7055 { 7056 .procname = "suppress_frag_ndisc", 7057 .data = &ipv6_devconf.suppress_frag_ndisc, 7058 .maxlen = sizeof(int), 7059 .mode = 0644, 7060 .proc_handler = proc_dointvec 7061 }, 7062 { 7063 .procname = "accept_ra_from_local", 7064 .data = &ipv6_devconf.accept_ra_from_local, 7065 .maxlen = sizeof(int), 7066 .mode = 0644, 7067 .proc_handler = proc_dointvec, 7068 }, 7069 { 7070 .procname = "accept_ra_mtu", 7071 .data = &ipv6_devconf.accept_ra_mtu, 7072 .maxlen = sizeof(int), 7073 .mode = 0644, 7074 .proc_handler = proc_dointvec, 7075 }, 7076 { 7077 .procname = "stable_secret", 7078 .data = &ipv6_devconf.stable_secret, 7079 .maxlen = IPV6_MAX_STRLEN, 7080 .mode = 0600, 7081 .proc_handler = addrconf_sysctl_stable_secret, 7082 }, 7083 { 7084 .procname = "use_oif_addrs_only", 7085 .data = &ipv6_devconf.use_oif_addrs_only, 7086 .maxlen = sizeof(int), 7087 .mode = 0644, 7088 .proc_handler = proc_dointvec, 7089 }, 7090 { 7091 .procname = "ignore_routes_with_linkdown", 7092 .data = &ipv6_devconf.ignore_routes_with_linkdown, 7093 .maxlen = sizeof(int), 7094 .mode = 0644, 7095 .proc_handler = addrconf_sysctl_ignore_routes_with_linkdown, 7096 }, 7097 { 7098 .procname = "drop_unicast_in_l2_multicast", 7099 .data = &ipv6_devconf.drop_unicast_in_l2_multicast, 7100 .maxlen = sizeof(int), 7101 .mode = 0644, 7102 .proc_handler = proc_dointvec, 7103 }, 7104 { 7105 .procname = "drop_unsolicited_na", 7106 .data = &ipv6_devconf.drop_unsolicited_na, 7107 .maxlen = sizeof(int), 7108 .mode = 0644, 7109 .proc_handler = proc_dointvec, 7110 }, 7111 { 7112 .procname = "keep_addr_on_down", 7113 .data = &ipv6_devconf.keep_addr_on_down, 7114 .maxlen = sizeof(int), 7115 .mode = 0644, 7116 .proc_handler = proc_dointvec, 7117 7118 }, 7119 { 7120 .procname = "seg6_enabled", 7121 .data = &ipv6_devconf.seg6_enabled, 7122 .maxlen = sizeof(int), 7123 .mode = 0644, 7124 .proc_handler = proc_dointvec, 7125 }, 7126 #ifdef CONFIG_IPV6_SEG6_HMAC 7127 { 7128 .procname = "seg6_require_hmac", 7129 .data = &ipv6_devconf.seg6_require_hmac, 7130 .maxlen = sizeof(int), 7131 .mode = 0644, 7132 .proc_handler = proc_dointvec, 7133 }, 7134 #endif 7135 { 7136 .procname = "enhanced_dad", 7137 .data = &ipv6_devconf.enhanced_dad, 7138 .maxlen = sizeof(int), 7139 .mode = 0644, 7140 .proc_handler = proc_dointvec, 7141 }, 7142 { 7143 .procname = "addr_gen_mode", 7144 .data = &ipv6_devconf.addr_gen_mode, 7145 .maxlen = sizeof(int), 7146 .mode = 0644, 7147 .proc_handler = addrconf_sysctl_addr_gen_mode, 7148 }, 7149 { 7150 .procname = "disable_policy", 7151 .data = &ipv6_devconf.disable_policy, 7152 .maxlen = sizeof(int), 7153 .mode = 0644, 7154 .proc_handler = addrconf_sysctl_disable_policy, 7155 }, 7156 { 7157 .procname = "ndisc_tclass", 7158 .data = &ipv6_devconf.ndisc_tclass, 7159 .maxlen = sizeof(int), 7160 .mode = 0644, 7161 .proc_handler = proc_dointvec_minmax, 7162 .extra1 = (void *)SYSCTL_ZERO, 7163 .extra2 = (void *)&two_five_five, 7164 }, 7165 { 7166 .procname = "rpl_seg_enabled", 7167 .data = &ipv6_devconf.rpl_seg_enabled, 7168 .maxlen = sizeof(int), 7169 .mode = 0644, 7170 .proc_handler = proc_dointvec, 7171 }, 7172 { 7173 .procname = "ioam6_enabled", 7174 .data = &ipv6_devconf.ioam6_enabled, 7175 .maxlen = sizeof(u8), 7176 .mode = 0644, 7177 .proc_handler = proc_dou8vec_minmax, 7178 .extra1 = (void *)SYSCTL_ZERO, 7179 .extra2 = (void *)SYSCTL_ONE, 7180 }, 7181 { 7182 .procname = "ioam6_id", 7183 .data = &ipv6_devconf.ioam6_id, 7184 .maxlen = sizeof(u32), 7185 .mode = 0644, 7186 .proc_handler = proc_douintvec_minmax, 7187 .extra1 = (void *)SYSCTL_ZERO, 7188 .extra2 = (void *)&ioam6_if_id_max, 7189 }, 7190 { 7191 .procname = "ioam6_id_wide", 7192 .data = &ipv6_devconf.ioam6_id_wide, 7193 .maxlen = sizeof(u32), 7194 .mode = 0644, 7195 .proc_handler = proc_douintvec, 7196 }, 7197 { 7198 .procname = "ndisc_evict_nocarrier", 7199 .data = &ipv6_devconf.ndisc_evict_nocarrier, 7200 .maxlen = sizeof(u8), 7201 .mode = 0644, 7202 .proc_handler = proc_dou8vec_minmax, 7203 .extra1 = (void *)SYSCTL_ZERO, 7204 .extra2 = (void *)SYSCTL_ONE, 7205 }, 7206 { 7207 .procname = "accept_untracked_na", 7208 .data = &ipv6_devconf.accept_untracked_na, 7209 .maxlen = sizeof(int), 7210 .mode = 0644, 7211 .proc_handler = proc_dointvec_minmax, 7212 .extra1 = SYSCTL_ZERO, 7213 .extra2 = SYSCTL_TWO, 7214 }, 7215 }; 7216 7217 static int __addrconf_sysctl_register(struct net *net, char *dev_name, 7218 struct inet6_dev *idev, struct ipv6_devconf *p) 7219 { 7220 size_t table_size = ARRAY_SIZE(addrconf_sysctl); 7221 int i, ifindex; 7222 struct ctl_table *table; 7223 char path[sizeof("net/ipv6/conf/") + IFNAMSIZ]; 7224 7225 table = kmemdup(addrconf_sysctl, sizeof(addrconf_sysctl), GFP_KERNEL_ACCOUNT); 7226 if (!table) 7227 goto out; 7228 7229 for (i = 0; i < table_size; i++) { 7230 table[i].data += (char *)p - (char *)&ipv6_devconf; 7231 /* If one of these is already set, then it is not safe to 7232 * overwrite either of them: this makes proc_dointvec_minmax 7233 * usable. 7234 */ 7235 if (!table[i].extra1 && !table[i].extra2) { 7236 table[i].extra1 = idev; /* embedded; no ref */ 7237 table[i].extra2 = net; 7238 } 7239 } 7240 7241 snprintf(path, sizeof(path), "net/ipv6/conf/%s", dev_name); 7242 7243 p->sysctl_header = register_net_sysctl_sz(net, path, table, 7244 table_size); 7245 if (!p->sysctl_header) 7246 goto free; 7247 7248 if (!strcmp(dev_name, "all")) 7249 ifindex = NETCONFA_IFINDEX_ALL; 7250 else if (!strcmp(dev_name, "default")) 7251 ifindex = NETCONFA_IFINDEX_DEFAULT; 7252 else 7253 ifindex = idev->dev->ifindex; 7254 inet6_netconf_notify_devconf(net, RTM_NEWNETCONF, NETCONFA_ALL, 7255 ifindex, p); 7256 return 0; 7257 7258 free: 7259 kfree(table); 7260 out: 7261 return -ENOBUFS; 7262 } 7263 7264 static void __addrconf_sysctl_unregister(struct net *net, 7265 struct ipv6_devconf *p, int ifindex) 7266 { 7267 const struct ctl_table *table; 7268 7269 if (!p->sysctl_header) 7270 return; 7271 7272 table = p->sysctl_header->ctl_table_arg; 7273 unregister_net_sysctl_table(p->sysctl_header); 7274 p->sysctl_header = NULL; 7275 kfree(table); 7276 7277 inet6_netconf_notify_devconf(net, RTM_DELNETCONF, 0, ifindex, NULL); 7278 } 7279 7280 static int addrconf_sysctl_register(struct inet6_dev *idev) 7281 { 7282 int err; 7283 7284 if (!sysctl_dev_name_is_allowed(idev->dev->name)) 7285 return -EINVAL; 7286 7287 err = neigh_sysctl_register(idev->dev, idev->nd_parms, 7288 &ndisc_ifinfo_sysctl_change); 7289 if (err) 7290 return err; 7291 err = __addrconf_sysctl_register(dev_net(idev->dev), idev->dev->name, 7292 idev, &idev->cnf); 7293 if (err) 7294 neigh_sysctl_unregister(idev->nd_parms); 7295 7296 return err; 7297 } 7298 7299 static void addrconf_sysctl_unregister(struct inet6_dev *idev) 7300 { 7301 __addrconf_sysctl_unregister(dev_net(idev->dev), &idev->cnf, 7302 idev->dev->ifindex); 7303 neigh_sysctl_unregister(idev->nd_parms); 7304 } 7305 7306 7307 #endif 7308 7309 static int __net_init addrconf_init_net(struct net *net) 7310 { 7311 int err = -ENOMEM; 7312 struct ipv6_devconf *all, *dflt; 7313 7314 spin_lock_init(&net->ipv6.addrconf_hash_lock); 7315 INIT_DEFERRABLE_WORK(&net->ipv6.addr_chk_work, addrconf_verify_work); 7316 net->ipv6.inet6_addr_lst = kcalloc(IN6_ADDR_HSIZE, 7317 sizeof(struct hlist_head), 7318 GFP_KERNEL); 7319 if (!net->ipv6.inet6_addr_lst) 7320 goto err_alloc_addr; 7321 7322 all = kmemdup(&ipv6_devconf, sizeof(ipv6_devconf), GFP_KERNEL); 7323 if (!all) 7324 goto err_alloc_all; 7325 7326 dflt = kmemdup(&ipv6_devconf_dflt, sizeof(ipv6_devconf_dflt), GFP_KERNEL); 7327 if (!dflt) 7328 goto err_alloc_dflt; 7329 7330 if (!net_eq(net, &init_net)) { 7331 switch (net_inherit_devconf()) { 7332 case 1: /* copy from init_net */ 7333 memcpy(all, init_net.ipv6.devconf_all, 7334 sizeof(ipv6_devconf)); 7335 memcpy(dflt, init_net.ipv6.devconf_dflt, 7336 sizeof(ipv6_devconf_dflt)); 7337 break; 7338 case 3: /* copy from the current netns */ 7339 memcpy(all, current->nsproxy->net_ns->ipv6.devconf_all, 7340 sizeof(ipv6_devconf)); 7341 memcpy(dflt, 7342 current->nsproxy->net_ns->ipv6.devconf_dflt, 7343 sizeof(ipv6_devconf_dflt)); 7344 break; 7345 case 0: 7346 case 2: 7347 /* use compiled values */ 7348 break; 7349 } 7350 } 7351 7352 /* these will be inherited by all namespaces */ 7353 dflt->autoconf = ipv6_defaults.autoconf; 7354 dflt->disable_ipv6 = ipv6_defaults.disable_ipv6; 7355 7356 dflt->stable_secret.initialized = false; 7357 all->stable_secret.initialized = false; 7358 7359 net->ipv6.devconf_all = all; 7360 net->ipv6.devconf_dflt = dflt; 7361 7362 #ifdef CONFIG_SYSCTL 7363 err = __addrconf_sysctl_register(net, "all", NULL, all); 7364 if (err < 0) 7365 goto err_reg_all; 7366 7367 err = __addrconf_sysctl_register(net, "default", NULL, dflt); 7368 if (err < 0) 7369 goto err_reg_dflt; 7370 #endif 7371 return 0; 7372 7373 #ifdef CONFIG_SYSCTL 7374 err_reg_dflt: 7375 __addrconf_sysctl_unregister(net, all, NETCONFA_IFINDEX_ALL); 7376 err_reg_all: 7377 kfree(dflt); 7378 net->ipv6.devconf_dflt = NULL; 7379 #endif 7380 err_alloc_dflt: 7381 kfree(all); 7382 net->ipv6.devconf_all = NULL; 7383 err_alloc_all: 7384 kfree(net->ipv6.inet6_addr_lst); 7385 err_alloc_addr: 7386 return err; 7387 } 7388 7389 static void __net_exit addrconf_exit_net(struct net *net) 7390 { 7391 int i; 7392 7393 #ifdef CONFIG_SYSCTL 7394 __addrconf_sysctl_unregister(net, net->ipv6.devconf_dflt, 7395 NETCONFA_IFINDEX_DEFAULT); 7396 __addrconf_sysctl_unregister(net, net->ipv6.devconf_all, 7397 NETCONFA_IFINDEX_ALL); 7398 #endif 7399 kfree(net->ipv6.devconf_dflt); 7400 net->ipv6.devconf_dflt = NULL; 7401 kfree(net->ipv6.devconf_all); 7402 net->ipv6.devconf_all = NULL; 7403 7404 cancel_delayed_work_sync(&net->ipv6.addr_chk_work); 7405 /* 7406 * Check hash table, then free it. 7407 */ 7408 for (i = 0; i < IN6_ADDR_HSIZE; i++) 7409 WARN_ON_ONCE(!hlist_empty(&net->ipv6.inet6_addr_lst[i])); 7410 7411 kfree(net->ipv6.inet6_addr_lst); 7412 net->ipv6.inet6_addr_lst = NULL; 7413 } 7414 7415 static struct pernet_operations addrconf_ops = { 7416 .init = addrconf_init_net, 7417 .exit = addrconf_exit_net, 7418 }; 7419 7420 static struct rtnl_af_ops inet6_ops __read_mostly = { 7421 .family = AF_INET6, 7422 .fill_link_af = inet6_fill_link_af, 7423 .get_link_af_size = inet6_get_link_af_size, 7424 .validate_link_af = inet6_validate_link_af, 7425 .set_link_af = inet6_set_link_af, 7426 }; 7427 7428 static const struct rtnl_msg_handler addrconf_rtnl_msg_handlers[] __initconst_or_module = { 7429 {.owner = THIS_MODULE, .protocol = PF_INET6, .msgtype = RTM_GETLINK, 7430 .dumpit = inet6_dump_ifinfo, .flags = RTNL_FLAG_DUMP_UNLOCKED}, 7431 {.owner = THIS_MODULE, .protocol = PF_INET6, .msgtype = RTM_NEWADDR, 7432 .doit = inet6_rtm_newaddr, .flags = RTNL_FLAG_DOIT_PERNET}, 7433 {.owner = THIS_MODULE, .protocol = PF_INET6, .msgtype = RTM_DELADDR, 7434 .doit = inet6_rtm_deladdr, .flags = RTNL_FLAG_DOIT_PERNET}, 7435 {.owner = THIS_MODULE, .protocol = PF_INET6, .msgtype = RTM_GETADDR, 7436 .doit = inet6_rtm_getaddr, .dumpit = inet6_dump_ifaddr, 7437 .flags = RTNL_FLAG_DOIT_UNLOCKED | RTNL_FLAG_DUMP_UNLOCKED}, 7438 {.owner = THIS_MODULE, .protocol = PF_INET6, .msgtype = RTM_GETMULTICAST, 7439 .dumpit = inet6_dump_ifmcaddr, 7440 .flags = RTNL_FLAG_DUMP_UNLOCKED}, 7441 {.owner = THIS_MODULE, .protocol = PF_INET6, .msgtype = RTM_GETANYCAST, 7442 .dumpit = inet6_dump_ifacaddr, 7443 .flags = RTNL_FLAG_DUMP_UNLOCKED}, 7444 {.owner = THIS_MODULE, .protocol = PF_INET6, .msgtype = RTM_GETNETCONF, 7445 .doit = inet6_netconf_get_devconf, .dumpit = inet6_netconf_dump_devconf, 7446 .flags = RTNL_FLAG_DOIT_UNLOCKED | RTNL_FLAG_DUMP_UNLOCKED}, 7447 }; 7448 7449 /* 7450 * Init / cleanup code 7451 */ 7452 7453 int __init addrconf_init(void) 7454 { 7455 struct inet6_dev *idev; 7456 int err; 7457 7458 err = ipv6_addr_label_init(); 7459 if (err < 0) { 7460 pr_crit("%s: cannot initialize default policy table: %d\n", 7461 __func__, err); 7462 goto out; 7463 } 7464 7465 err = register_pernet_subsys(&addrconf_ops); 7466 if (err < 0) 7467 goto out_addrlabel; 7468 7469 /* All works using addrconf_wq need to lock rtnl. */ 7470 addrconf_wq = create_singlethread_workqueue("ipv6_addrconf"); 7471 if (!addrconf_wq) { 7472 err = -ENOMEM; 7473 goto out_nowq; 7474 } 7475 7476 rtnl_net_lock(&init_net); 7477 idev = ipv6_add_dev(blackhole_netdev); 7478 rtnl_net_unlock(&init_net); 7479 if (IS_ERR(idev)) { 7480 err = PTR_ERR(idev); 7481 goto errlo; 7482 } 7483 7484 ip6_route_init_special_entries(); 7485 7486 register_netdevice_notifier(&ipv6_dev_notf); 7487 7488 addrconf_verify(&init_net); 7489 7490 err = rtnl_af_register(&inet6_ops); 7491 if (err) 7492 goto erraf; 7493 7494 err = rtnl_register_many(addrconf_rtnl_msg_handlers); 7495 if (err) 7496 goto errout; 7497 7498 err = ipv6_addr_label_rtnl_register(); 7499 if (err < 0) 7500 goto errout; 7501 7502 return 0; 7503 errout: 7504 rtnl_unregister_all(PF_INET6); 7505 rtnl_af_unregister(&inet6_ops); 7506 erraf: 7507 unregister_netdevice_notifier(&ipv6_dev_notf); 7508 errlo: 7509 destroy_workqueue(addrconf_wq); 7510 out_nowq: 7511 unregister_pernet_subsys(&addrconf_ops); 7512 out_addrlabel: 7513 ipv6_addr_label_cleanup(); 7514 out: 7515 return err; 7516 } 7517 7518 void addrconf_cleanup(void) 7519 { 7520 struct net_device *dev; 7521 7522 unregister_netdevice_notifier(&ipv6_dev_notf); 7523 unregister_pernet_subsys(&addrconf_ops); 7524 ipv6_addr_label_cleanup(); 7525 7526 rtnl_af_unregister(&inet6_ops); 7527 7528 rtnl_net_lock(&init_net); 7529 7530 /* clean dev list */ 7531 for_each_netdev(&init_net, dev) { 7532 if (!__in6_dev_get_rtnl_net(dev)) 7533 continue; 7534 addrconf_ifdown(dev, true); 7535 } 7536 addrconf_ifdown(init_net.loopback_dev, true); 7537 7538 rtnl_net_unlock(&init_net); 7539 7540 destroy_workqueue(addrconf_wq); 7541 } 7542