1 /* 2 * NET3 IP device support routines. 3 * 4 * Version: $Id: devinet.c,v 1.44 2001/10/31 21:55:54 davem Exp $ 5 * 6 * This program is free software; you can redistribute it and/or 7 * modify it under the terms of the GNU General Public License 8 * as published by the Free Software Foundation; either version 9 * 2 of the License, or (at your option) any later version. 10 * 11 * Derived from the IP parts of dev.c 1.0.19 12 * Authors: Ross Biro 13 * Fred N. van Kempen, <waltje@uWalt.NL.Mugnet.ORG> 14 * Mark Evans, <evansmp@uhura.aston.ac.uk> 15 * 16 * Additional Authors: 17 * Alan Cox, <gw4pts@gw4pts.ampr.org> 18 * Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru> 19 * 20 * Changes: 21 * Alexey Kuznetsov: pa_* fields are replaced with ifaddr 22 * lists. 23 * Cyrus Durgin: updated for kmod 24 * Matthias Andree: in devinet_ioctl, compare label and 25 * address (4.4BSD alias style support), 26 * fall back to comparing just the label 27 * if no match found. 28 */ 29 30 31 #include <asm/uaccess.h> 32 #include <asm/system.h> 33 #include <linux/bitops.h> 34 #include <linux/capability.h> 35 #include <linux/module.h> 36 #include <linux/types.h> 37 #include <linux/kernel.h> 38 #include <linux/string.h> 39 #include <linux/mm.h> 40 #include <linux/socket.h> 41 #include <linux/sockios.h> 42 #include <linux/in.h> 43 #include <linux/errno.h> 44 #include <linux/interrupt.h> 45 #include <linux/if_addr.h> 46 #include <linux/if_ether.h> 47 #include <linux/inet.h> 48 #include <linux/netdevice.h> 49 #include <linux/etherdevice.h> 50 #include <linux/skbuff.h> 51 #include <linux/init.h> 52 #include <linux/notifier.h> 53 #include <linux/inetdevice.h> 54 #include <linux/igmp.h> 55 #ifdef CONFIG_SYSCTL 56 #include <linux/sysctl.h> 57 #endif 58 #include <linux/kmod.h> 59 60 #include <net/arp.h> 61 #include <net/ip.h> 62 #include <net/route.h> 63 #include <net/ip_fib.h> 64 #include <net/rtnetlink.h> 65 66 struct ipv4_devconf ipv4_devconf = { 67 .data = { 68 [NET_IPV4_CONF_ACCEPT_REDIRECTS - 1] = 1, 69 [NET_IPV4_CONF_SEND_REDIRECTS - 1] = 1, 70 [NET_IPV4_CONF_SECURE_REDIRECTS - 1] = 1, 71 [NET_IPV4_CONF_SHARED_MEDIA - 1] = 1, 72 }, 73 }; 74 75 static struct ipv4_devconf ipv4_devconf_dflt = { 76 .data = { 77 [NET_IPV4_CONF_ACCEPT_REDIRECTS - 1] = 1, 78 [NET_IPV4_CONF_SEND_REDIRECTS - 1] = 1, 79 [NET_IPV4_CONF_SECURE_REDIRECTS - 1] = 1, 80 [NET_IPV4_CONF_SHARED_MEDIA - 1] = 1, 81 [NET_IPV4_CONF_ACCEPT_SOURCE_ROUTE - 1] = 1, 82 }, 83 }; 84 85 #define IPV4_DEVCONF_DFLT(attr) IPV4_DEVCONF(ipv4_devconf_dflt, attr) 86 87 static const struct nla_policy ifa_ipv4_policy[IFA_MAX+1] = { 88 [IFA_LOCAL] = { .type = NLA_U32 }, 89 [IFA_ADDRESS] = { .type = NLA_U32 }, 90 [IFA_BROADCAST] = { .type = NLA_U32 }, 91 [IFA_ANYCAST] = { .type = NLA_U32 }, 92 [IFA_LABEL] = { .type = NLA_STRING, .len = IFNAMSIZ - 1 }, 93 }; 94 95 static void rtmsg_ifa(int event, struct in_ifaddr *, struct nlmsghdr *, u32); 96 97 static BLOCKING_NOTIFIER_HEAD(inetaddr_chain); 98 static void inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap, 99 int destroy); 100 #ifdef CONFIG_SYSCTL 101 static void devinet_sysctl_register(struct in_device *in_dev, 102 struct ipv4_devconf *p); 103 static void devinet_sysctl_unregister(struct ipv4_devconf *p); 104 #endif 105 106 /* Locks all the inet devices. */ 107 108 static struct in_ifaddr *inet_alloc_ifa(void) 109 { 110 struct in_ifaddr *ifa = kzalloc(sizeof(*ifa), GFP_KERNEL); 111 112 if (ifa) { 113 INIT_RCU_HEAD(&ifa->rcu_head); 114 } 115 116 return ifa; 117 } 118 119 static void inet_rcu_free_ifa(struct rcu_head *head) 120 { 121 struct in_ifaddr *ifa = container_of(head, struct in_ifaddr, rcu_head); 122 if (ifa->ifa_dev) 123 in_dev_put(ifa->ifa_dev); 124 kfree(ifa); 125 } 126 127 static inline void inet_free_ifa(struct in_ifaddr *ifa) 128 { 129 call_rcu(&ifa->rcu_head, inet_rcu_free_ifa); 130 } 131 132 void in_dev_finish_destroy(struct in_device *idev) 133 { 134 struct net_device *dev = idev->dev; 135 136 BUG_TRAP(!idev->ifa_list); 137 BUG_TRAP(!idev->mc_list); 138 #ifdef NET_REFCNT_DEBUG 139 printk(KERN_DEBUG "in_dev_finish_destroy: %p=%s\n", 140 idev, dev ? dev->name : "NIL"); 141 #endif 142 dev_put(dev); 143 if (!idev->dead) 144 printk("Freeing alive in_device %p\n", idev); 145 else { 146 kfree(idev); 147 } 148 } 149 150 static struct in_device *inetdev_init(struct net_device *dev) 151 { 152 struct in_device *in_dev; 153 154 ASSERT_RTNL(); 155 156 in_dev = kzalloc(sizeof(*in_dev), GFP_KERNEL); 157 if (!in_dev) 158 goto out; 159 INIT_RCU_HEAD(&in_dev->rcu_head); 160 memcpy(&in_dev->cnf, &ipv4_devconf_dflt, sizeof(in_dev->cnf)); 161 in_dev->cnf.sysctl = NULL; 162 in_dev->dev = dev; 163 if ((in_dev->arp_parms = neigh_parms_alloc(dev, &arp_tbl)) == NULL) 164 goto out_kfree; 165 /* Reference in_dev->dev */ 166 dev_hold(dev); 167 #ifdef CONFIG_SYSCTL 168 neigh_sysctl_register(dev, in_dev->arp_parms, NET_IPV4, 169 NET_IPV4_NEIGH, "ipv4", NULL, NULL); 170 #endif 171 172 /* Account for reference dev->ip_ptr (below) */ 173 in_dev_hold(in_dev); 174 175 #ifdef CONFIG_SYSCTL 176 devinet_sysctl_register(in_dev, &in_dev->cnf); 177 #endif 178 ip_mc_init_dev(in_dev); 179 if (dev->flags & IFF_UP) 180 ip_mc_up(in_dev); 181 182 /* we can receive as soon as ip_ptr is set -- do this last */ 183 rcu_assign_pointer(dev->ip_ptr, in_dev); 184 out: 185 return in_dev; 186 out_kfree: 187 kfree(in_dev); 188 in_dev = NULL; 189 goto out; 190 } 191 192 static void in_dev_rcu_put(struct rcu_head *head) 193 { 194 struct in_device *idev = container_of(head, struct in_device, rcu_head); 195 in_dev_put(idev); 196 } 197 198 static void inetdev_destroy(struct in_device *in_dev) 199 { 200 struct in_ifaddr *ifa; 201 struct net_device *dev; 202 203 ASSERT_RTNL(); 204 205 dev = in_dev->dev; 206 207 in_dev->dead = 1; 208 209 ip_mc_destroy_dev(in_dev); 210 211 while ((ifa = in_dev->ifa_list) != NULL) { 212 inet_del_ifa(in_dev, &in_dev->ifa_list, 0); 213 inet_free_ifa(ifa); 214 } 215 216 #ifdef CONFIG_SYSCTL 217 devinet_sysctl_unregister(&in_dev->cnf); 218 #endif 219 220 dev->ip_ptr = NULL; 221 222 #ifdef CONFIG_SYSCTL 223 neigh_sysctl_unregister(in_dev->arp_parms); 224 #endif 225 neigh_parms_release(&arp_tbl, in_dev->arp_parms); 226 arp_ifdown(dev); 227 228 call_rcu(&in_dev->rcu_head, in_dev_rcu_put); 229 } 230 231 int inet_addr_onlink(struct in_device *in_dev, __be32 a, __be32 b) 232 { 233 rcu_read_lock(); 234 for_primary_ifa(in_dev) { 235 if (inet_ifa_match(a, ifa)) { 236 if (!b || inet_ifa_match(b, ifa)) { 237 rcu_read_unlock(); 238 return 1; 239 } 240 } 241 } endfor_ifa(in_dev); 242 rcu_read_unlock(); 243 return 0; 244 } 245 246 static void __inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap, 247 int destroy, struct nlmsghdr *nlh, u32 pid) 248 { 249 struct in_ifaddr *promote = NULL; 250 struct in_ifaddr *ifa, *ifa1 = *ifap; 251 struct in_ifaddr *last_prim = in_dev->ifa_list; 252 struct in_ifaddr *prev_prom = NULL; 253 int do_promote = IN_DEV_PROMOTE_SECONDARIES(in_dev); 254 255 ASSERT_RTNL(); 256 257 /* 1. Deleting primary ifaddr forces deletion all secondaries 258 * unless alias promotion is set 259 **/ 260 261 if (!(ifa1->ifa_flags & IFA_F_SECONDARY)) { 262 struct in_ifaddr **ifap1 = &ifa1->ifa_next; 263 264 while ((ifa = *ifap1) != NULL) { 265 if (!(ifa->ifa_flags & IFA_F_SECONDARY) && 266 ifa1->ifa_scope <= ifa->ifa_scope) 267 last_prim = ifa; 268 269 if (!(ifa->ifa_flags & IFA_F_SECONDARY) || 270 ifa1->ifa_mask != ifa->ifa_mask || 271 !inet_ifa_match(ifa1->ifa_address, ifa)) { 272 ifap1 = &ifa->ifa_next; 273 prev_prom = ifa; 274 continue; 275 } 276 277 if (!do_promote) { 278 *ifap1 = ifa->ifa_next; 279 280 rtmsg_ifa(RTM_DELADDR, ifa, nlh, pid); 281 blocking_notifier_call_chain(&inetaddr_chain, 282 NETDEV_DOWN, ifa); 283 inet_free_ifa(ifa); 284 } else { 285 promote = ifa; 286 break; 287 } 288 } 289 } 290 291 /* 2. Unlink it */ 292 293 *ifap = ifa1->ifa_next; 294 295 /* 3. Announce address deletion */ 296 297 /* Send message first, then call notifier. 298 At first sight, FIB update triggered by notifier 299 will refer to already deleted ifaddr, that could confuse 300 netlink listeners. It is not true: look, gated sees 301 that route deleted and if it still thinks that ifaddr 302 is valid, it will try to restore deleted routes... Grr. 303 So that, this order is correct. 304 */ 305 rtmsg_ifa(RTM_DELADDR, ifa1, nlh, pid); 306 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_DOWN, ifa1); 307 308 if (promote) { 309 310 if (prev_prom) { 311 prev_prom->ifa_next = promote->ifa_next; 312 promote->ifa_next = last_prim->ifa_next; 313 last_prim->ifa_next = promote; 314 } 315 316 promote->ifa_flags &= ~IFA_F_SECONDARY; 317 rtmsg_ifa(RTM_NEWADDR, promote, nlh, pid); 318 blocking_notifier_call_chain(&inetaddr_chain, 319 NETDEV_UP, promote); 320 for (ifa = promote->ifa_next; ifa; ifa = ifa->ifa_next) { 321 if (ifa1->ifa_mask != ifa->ifa_mask || 322 !inet_ifa_match(ifa1->ifa_address, ifa)) 323 continue; 324 fib_add_ifaddr(ifa); 325 } 326 327 } 328 if (destroy) 329 inet_free_ifa(ifa1); 330 } 331 332 static void inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap, 333 int destroy) 334 { 335 __inet_del_ifa(in_dev, ifap, destroy, NULL, 0); 336 } 337 338 static int __inet_insert_ifa(struct in_ifaddr *ifa, struct nlmsghdr *nlh, 339 u32 pid) 340 { 341 struct in_device *in_dev = ifa->ifa_dev; 342 struct in_ifaddr *ifa1, **ifap, **last_primary; 343 344 ASSERT_RTNL(); 345 346 if (!ifa->ifa_local) { 347 inet_free_ifa(ifa); 348 return 0; 349 } 350 351 ifa->ifa_flags &= ~IFA_F_SECONDARY; 352 last_primary = &in_dev->ifa_list; 353 354 for (ifap = &in_dev->ifa_list; (ifa1 = *ifap) != NULL; 355 ifap = &ifa1->ifa_next) { 356 if (!(ifa1->ifa_flags & IFA_F_SECONDARY) && 357 ifa->ifa_scope <= ifa1->ifa_scope) 358 last_primary = &ifa1->ifa_next; 359 if (ifa1->ifa_mask == ifa->ifa_mask && 360 inet_ifa_match(ifa1->ifa_address, ifa)) { 361 if (ifa1->ifa_local == ifa->ifa_local) { 362 inet_free_ifa(ifa); 363 return -EEXIST; 364 } 365 if (ifa1->ifa_scope != ifa->ifa_scope) { 366 inet_free_ifa(ifa); 367 return -EINVAL; 368 } 369 ifa->ifa_flags |= IFA_F_SECONDARY; 370 } 371 } 372 373 if (!(ifa->ifa_flags & IFA_F_SECONDARY)) { 374 net_srandom(ifa->ifa_local); 375 ifap = last_primary; 376 } 377 378 ifa->ifa_next = *ifap; 379 *ifap = ifa; 380 381 /* Send message first, then call notifier. 382 Notifier will trigger FIB update, so that 383 listeners of netlink will know about new ifaddr */ 384 rtmsg_ifa(RTM_NEWADDR, ifa, nlh, pid); 385 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_UP, ifa); 386 387 return 0; 388 } 389 390 static int inet_insert_ifa(struct in_ifaddr *ifa) 391 { 392 return __inet_insert_ifa(ifa, NULL, 0); 393 } 394 395 static int inet_set_ifa(struct net_device *dev, struct in_ifaddr *ifa) 396 { 397 struct in_device *in_dev = __in_dev_get_rtnl(dev); 398 399 ASSERT_RTNL(); 400 401 if (!in_dev) { 402 inet_free_ifa(ifa); 403 return -ENOBUFS; 404 } 405 ipv4_devconf_setall(in_dev); 406 if (ifa->ifa_dev != in_dev) { 407 BUG_TRAP(!ifa->ifa_dev); 408 in_dev_hold(in_dev); 409 ifa->ifa_dev = in_dev; 410 } 411 if (LOOPBACK(ifa->ifa_local)) 412 ifa->ifa_scope = RT_SCOPE_HOST; 413 return inet_insert_ifa(ifa); 414 } 415 416 struct in_device *inetdev_by_index(int ifindex) 417 { 418 struct net_device *dev; 419 struct in_device *in_dev = NULL; 420 read_lock(&dev_base_lock); 421 dev = __dev_get_by_index(&init_net, ifindex); 422 if (dev) 423 in_dev = in_dev_get(dev); 424 read_unlock(&dev_base_lock); 425 return in_dev; 426 } 427 428 /* Called only from RTNL semaphored context. No locks. */ 429 430 struct in_ifaddr *inet_ifa_byprefix(struct in_device *in_dev, __be32 prefix, 431 __be32 mask) 432 { 433 ASSERT_RTNL(); 434 435 for_primary_ifa(in_dev) { 436 if (ifa->ifa_mask == mask && inet_ifa_match(prefix, ifa)) 437 return ifa; 438 } endfor_ifa(in_dev); 439 return NULL; 440 } 441 442 static int inet_rtm_deladdr(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg) 443 { 444 struct nlattr *tb[IFA_MAX+1]; 445 struct in_device *in_dev; 446 struct ifaddrmsg *ifm; 447 struct in_ifaddr *ifa, **ifap; 448 int err = -EINVAL; 449 450 ASSERT_RTNL(); 451 452 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv4_policy); 453 if (err < 0) 454 goto errout; 455 456 ifm = nlmsg_data(nlh); 457 in_dev = inetdev_by_index(ifm->ifa_index); 458 if (in_dev == NULL) { 459 err = -ENODEV; 460 goto errout; 461 } 462 463 __in_dev_put(in_dev); 464 465 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL; 466 ifap = &ifa->ifa_next) { 467 if (tb[IFA_LOCAL] && 468 ifa->ifa_local != nla_get_be32(tb[IFA_LOCAL])) 469 continue; 470 471 if (tb[IFA_LABEL] && nla_strcmp(tb[IFA_LABEL], ifa->ifa_label)) 472 continue; 473 474 if (tb[IFA_ADDRESS] && 475 (ifm->ifa_prefixlen != ifa->ifa_prefixlen || 476 !inet_ifa_match(nla_get_be32(tb[IFA_ADDRESS]), ifa))) 477 continue; 478 479 __inet_del_ifa(in_dev, ifap, 1, nlh, NETLINK_CB(skb).pid); 480 return 0; 481 } 482 483 err = -EADDRNOTAVAIL; 484 errout: 485 return err; 486 } 487 488 static struct in_ifaddr *rtm_to_ifaddr(struct nlmsghdr *nlh) 489 { 490 struct nlattr *tb[IFA_MAX+1]; 491 struct in_ifaddr *ifa; 492 struct ifaddrmsg *ifm; 493 struct net_device *dev; 494 struct in_device *in_dev; 495 int err = -EINVAL; 496 497 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv4_policy); 498 if (err < 0) 499 goto errout; 500 501 ifm = nlmsg_data(nlh); 502 if (ifm->ifa_prefixlen > 32 || tb[IFA_LOCAL] == NULL) { 503 err = -EINVAL; 504 goto errout; 505 } 506 507 dev = __dev_get_by_index(&init_net, ifm->ifa_index); 508 if (dev == NULL) { 509 err = -ENODEV; 510 goto errout; 511 } 512 513 in_dev = __in_dev_get_rtnl(dev); 514 if (in_dev == NULL) { 515 err = -ENOBUFS; 516 goto errout; 517 } 518 519 ifa = inet_alloc_ifa(); 520 if (ifa == NULL) { 521 /* 522 * A potential indev allocation can be left alive, it stays 523 * assigned to its device and is destroy with it. 524 */ 525 err = -ENOBUFS; 526 goto errout; 527 } 528 529 ipv4_devconf_setall(in_dev); 530 in_dev_hold(in_dev); 531 532 if (tb[IFA_ADDRESS] == NULL) 533 tb[IFA_ADDRESS] = tb[IFA_LOCAL]; 534 535 ifa->ifa_prefixlen = ifm->ifa_prefixlen; 536 ifa->ifa_mask = inet_make_mask(ifm->ifa_prefixlen); 537 ifa->ifa_flags = ifm->ifa_flags; 538 ifa->ifa_scope = ifm->ifa_scope; 539 ifa->ifa_dev = in_dev; 540 541 ifa->ifa_local = nla_get_be32(tb[IFA_LOCAL]); 542 ifa->ifa_address = nla_get_be32(tb[IFA_ADDRESS]); 543 544 if (tb[IFA_BROADCAST]) 545 ifa->ifa_broadcast = nla_get_be32(tb[IFA_BROADCAST]); 546 547 if (tb[IFA_ANYCAST]) 548 ifa->ifa_anycast = nla_get_be32(tb[IFA_ANYCAST]); 549 550 if (tb[IFA_LABEL]) 551 nla_strlcpy(ifa->ifa_label, tb[IFA_LABEL], IFNAMSIZ); 552 else 553 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ); 554 555 return ifa; 556 557 errout: 558 return ERR_PTR(err); 559 } 560 561 static int inet_rtm_newaddr(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg) 562 { 563 struct in_ifaddr *ifa; 564 565 ASSERT_RTNL(); 566 567 ifa = rtm_to_ifaddr(nlh); 568 if (IS_ERR(ifa)) 569 return PTR_ERR(ifa); 570 571 return __inet_insert_ifa(ifa, nlh, NETLINK_CB(skb).pid); 572 } 573 574 /* 575 * Determine a default network mask, based on the IP address. 576 */ 577 578 static __inline__ int inet_abc_len(__be32 addr) 579 { 580 int rc = -1; /* Something else, probably a multicast. */ 581 582 if (ZERONET(addr)) 583 rc = 0; 584 else { 585 __u32 haddr = ntohl(addr); 586 587 if (IN_CLASSA(haddr)) 588 rc = 8; 589 else if (IN_CLASSB(haddr)) 590 rc = 16; 591 else if (IN_CLASSC(haddr)) 592 rc = 24; 593 } 594 595 return rc; 596 } 597 598 599 int devinet_ioctl(unsigned int cmd, void __user *arg) 600 { 601 struct ifreq ifr; 602 struct sockaddr_in sin_orig; 603 struct sockaddr_in *sin = (struct sockaddr_in *)&ifr.ifr_addr; 604 struct in_device *in_dev; 605 struct in_ifaddr **ifap = NULL; 606 struct in_ifaddr *ifa = NULL; 607 struct net_device *dev; 608 char *colon; 609 int ret = -EFAULT; 610 int tryaddrmatch = 0; 611 612 /* 613 * Fetch the caller's info block into kernel space 614 */ 615 616 if (copy_from_user(&ifr, arg, sizeof(struct ifreq))) 617 goto out; 618 ifr.ifr_name[IFNAMSIZ - 1] = 0; 619 620 /* save original address for comparison */ 621 memcpy(&sin_orig, sin, sizeof(*sin)); 622 623 colon = strchr(ifr.ifr_name, ':'); 624 if (colon) 625 *colon = 0; 626 627 #ifdef CONFIG_KMOD 628 dev_load(&init_net, ifr.ifr_name); 629 #endif 630 631 switch (cmd) { 632 case SIOCGIFADDR: /* Get interface address */ 633 case SIOCGIFBRDADDR: /* Get the broadcast address */ 634 case SIOCGIFDSTADDR: /* Get the destination address */ 635 case SIOCGIFNETMASK: /* Get the netmask for the interface */ 636 /* Note that these ioctls will not sleep, 637 so that we do not impose a lock. 638 One day we will be forced to put shlock here (I mean SMP) 639 */ 640 tryaddrmatch = (sin_orig.sin_family == AF_INET); 641 memset(sin, 0, sizeof(*sin)); 642 sin->sin_family = AF_INET; 643 break; 644 645 case SIOCSIFFLAGS: 646 ret = -EACCES; 647 if (!capable(CAP_NET_ADMIN)) 648 goto out; 649 break; 650 case SIOCSIFADDR: /* Set interface address (and family) */ 651 case SIOCSIFBRDADDR: /* Set the broadcast address */ 652 case SIOCSIFDSTADDR: /* Set the destination address */ 653 case SIOCSIFNETMASK: /* Set the netmask for the interface */ 654 ret = -EACCES; 655 if (!capable(CAP_NET_ADMIN)) 656 goto out; 657 ret = -EINVAL; 658 if (sin->sin_family != AF_INET) 659 goto out; 660 break; 661 default: 662 ret = -EINVAL; 663 goto out; 664 } 665 666 rtnl_lock(); 667 668 ret = -ENODEV; 669 if ((dev = __dev_get_by_name(&init_net, ifr.ifr_name)) == NULL) 670 goto done; 671 672 if (colon) 673 *colon = ':'; 674 675 if ((in_dev = __in_dev_get_rtnl(dev)) != NULL) { 676 if (tryaddrmatch) { 677 /* Matthias Andree */ 678 /* compare label and address (4.4BSD style) */ 679 /* note: we only do this for a limited set of ioctls 680 and only if the original address family was AF_INET. 681 This is checked above. */ 682 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL; 683 ifap = &ifa->ifa_next) { 684 if (!strcmp(ifr.ifr_name, ifa->ifa_label) && 685 sin_orig.sin_addr.s_addr == 686 ifa->ifa_address) { 687 break; /* found */ 688 } 689 } 690 } 691 /* we didn't get a match, maybe the application is 692 4.3BSD-style and passed in junk so we fall back to 693 comparing just the label */ 694 if (!ifa) { 695 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL; 696 ifap = &ifa->ifa_next) 697 if (!strcmp(ifr.ifr_name, ifa->ifa_label)) 698 break; 699 } 700 } 701 702 ret = -EADDRNOTAVAIL; 703 if (!ifa && cmd != SIOCSIFADDR && cmd != SIOCSIFFLAGS) 704 goto done; 705 706 switch (cmd) { 707 case SIOCGIFADDR: /* Get interface address */ 708 sin->sin_addr.s_addr = ifa->ifa_local; 709 goto rarok; 710 711 case SIOCGIFBRDADDR: /* Get the broadcast address */ 712 sin->sin_addr.s_addr = ifa->ifa_broadcast; 713 goto rarok; 714 715 case SIOCGIFDSTADDR: /* Get the destination address */ 716 sin->sin_addr.s_addr = ifa->ifa_address; 717 goto rarok; 718 719 case SIOCGIFNETMASK: /* Get the netmask for the interface */ 720 sin->sin_addr.s_addr = ifa->ifa_mask; 721 goto rarok; 722 723 case SIOCSIFFLAGS: 724 if (colon) { 725 ret = -EADDRNOTAVAIL; 726 if (!ifa) 727 break; 728 ret = 0; 729 if (!(ifr.ifr_flags & IFF_UP)) 730 inet_del_ifa(in_dev, ifap, 1); 731 break; 732 } 733 ret = dev_change_flags(dev, ifr.ifr_flags); 734 break; 735 736 case SIOCSIFADDR: /* Set interface address (and family) */ 737 ret = -EINVAL; 738 if (inet_abc_len(sin->sin_addr.s_addr) < 0) 739 break; 740 741 if (!ifa) { 742 ret = -ENOBUFS; 743 if ((ifa = inet_alloc_ifa()) == NULL) 744 break; 745 if (colon) 746 memcpy(ifa->ifa_label, ifr.ifr_name, IFNAMSIZ); 747 else 748 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ); 749 } else { 750 ret = 0; 751 if (ifa->ifa_local == sin->sin_addr.s_addr) 752 break; 753 inet_del_ifa(in_dev, ifap, 0); 754 ifa->ifa_broadcast = 0; 755 ifa->ifa_anycast = 0; 756 } 757 758 ifa->ifa_address = ifa->ifa_local = sin->sin_addr.s_addr; 759 760 if (!(dev->flags & IFF_POINTOPOINT)) { 761 ifa->ifa_prefixlen = inet_abc_len(ifa->ifa_address); 762 ifa->ifa_mask = inet_make_mask(ifa->ifa_prefixlen); 763 if ((dev->flags & IFF_BROADCAST) && 764 ifa->ifa_prefixlen < 31) 765 ifa->ifa_broadcast = ifa->ifa_address | 766 ~ifa->ifa_mask; 767 } else { 768 ifa->ifa_prefixlen = 32; 769 ifa->ifa_mask = inet_make_mask(32); 770 } 771 ret = inet_set_ifa(dev, ifa); 772 break; 773 774 case SIOCSIFBRDADDR: /* Set the broadcast address */ 775 ret = 0; 776 if (ifa->ifa_broadcast != sin->sin_addr.s_addr) { 777 inet_del_ifa(in_dev, ifap, 0); 778 ifa->ifa_broadcast = sin->sin_addr.s_addr; 779 inet_insert_ifa(ifa); 780 } 781 break; 782 783 case SIOCSIFDSTADDR: /* Set the destination address */ 784 ret = 0; 785 if (ifa->ifa_address == sin->sin_addr.s_addr) 786 break; 787 ret = -EINVAL; 788 if (inet_abc_len(sin->sin_addr.s_addr) < 0) 789 break; 790 ret = 0; 791 inet_del_ifa(in_dev, ifap, 0); 792 ifa->ifa_address = sin->sin_addr.s_addr; 793 inet_insert_ifa(ifa); 794 break; 795 796 case SIOCSIFNETMASK: /* Set the netmask for the interface */ 797 798 /* 799 * The mask we set must be legal. 800 */ 801 ret = -EINVAL; 802 if (bad_mask(sin->sin_addr.s_addr, 0)) 803 break; 804 ret = 0; 805 if (ifa->ifa_mask != sin->sin_addr.s_addr) { 806 __be32 old_mask = ifa->ifa_mask; 807 inet_del_ifa(in_dev, ifap, 0); 808 ifa->ifa_mask = sin->sin_addr.s_addr; 809 ifa->ifa_prefixlen = inet_mask_len(ifa->ifa_mask); 810 811 /* See if current broadcast address matches 812 * with current netmask, then recalculate 813 * the broadcast address. Otherwise it's a 814 * funny address, so don't touch it since 815 * the user seems to know what (s)he's doing... 816 */ 817 if ((dev->flags & IFF_BROADCAST) && 818 (ifa->ifa_prefixlen < 31) && 819 (ifa->ifa_broadcast == 820 (ifa->ifa_local|~old_mask))) { 821 ifa->ifa_broadcast = (ifa->ifa_local | 822 ~sin->sin_addr.s_addr); 823 } 824 inet_insert_ifa(ifa); 825 } 826 break; 827 } 828 done: 829 rtnl_unlock(); 830 out: 831 return ret; 832 rarok: 833 rtnl_unlock(); 834 ret = copy_to_user(arg, &ifr, sizeof(struct ifreq)) ? -EFAULT : 0; 835 goto out; 836 } 837 838 static int inet_gifconf(struct net_device *dev, char __user *buf, int len) 839 { 840 struct in_device *in_dev = __in_dev_get_rtnl(dev); 841 struct in_ifaddr *ifa; 842 struct ifreq ifr; 843 int done = 0; 844 845 if (!in_dev || (ifa = in_dev->ifa_list) == NULL) 846 goto out; 847 848 for (; ifa; ifa = ifa->ifa_next) { 849 if (!buf) { 850 done += sizeof(ifr); 851 continue; 852 } 853 if (len < (int) sizeof(ifr)) 854 break; 855 memset(&ifr, 0, sizeof(struct ifreq)); 856 if (ifa->ifa_label) 857 strcpy(ifr.ifr_name, ifa->ifa_label); 858 else 859 strcpy(ifr.ifr_name, dev->name); 860 861 (*(struct sockaddr_in *)&ifr.ifr_addr).sin_family = AF_INET; 862 (*(struct sockaddr_in *)&ifr.ifr_addr).sin_addr.s_addr = 863 ifa->ifa_local; 864 865 if (copy_to_user(buf, &ifr, sizeof(struct ifreq))) { 866 done = -EFAULT; 867 break; 868 } 869 buf += sizeof(struct ifreq); 870 len -= sizeof(struct ifreq); 871 done += sizeof(struct ifreq); 872 } 873 out: 874 return done; 875 } 876 877 __be32 inet_select_addr(const struct net_device *dev, __be32 dst, int scope) 878 { 879 __be32 addr = 0; 880 struct in_device *in_dev; 881 882 rcu_read_lock(); 883 in_dev = __in_dev_get_rcu(dev); 884 if (!in_dev) 885 goto no_in_dev; 886 887 for_primary_ifa(in_dev) { 888 if (ifa->ifa_scope > scope) 889 continue; 890 if (!dst || inet_ifa_match(dst, ifa)) { 891 addr = ifa->ifa_local; 892 break; 893 } 894 if (!addr) 895 addr = ifa->ifa_local; 896 } endfor_ifa(in_dev); 897 no_in_dev: 898 rcu_read_unlock(); 899 900 if (addr) 901 goto out; 902 903 /* Not loopback addresses on loopback should be preferred 904 in this case. It is importnat that lo is the first interface 905 in dev_base list. 906 */ 907 read_lock(&dev_base_lock); 908 rcu_read_lock(); 909 for_each_netdev(&init_net, dev) { 910 if ((in_dev = __in_dev_get_rcu(dev)) == NULL) 911 continue; 912 913 for_primary_ifa(in_dev) { 914 if (ifa->ifa_scope != RT_SCOPE_LINK && 915 ifa->ifa_scope <= scope) { 916 addr = ifa->ifa_local; 917 goto out_unlock_both; 918 } 919 } endfor_ifa(in_dev); 920 } 921 out_unlock_both: 922 read_unlock(&dev_base_lock); 923 rcu_read_unlock(); 924 out: 925 return addr; 926 } 927 928 static __be32 confirm_addr_indev(struct in_device *in_dev, __be32 dst, 929 __be32 local, int scope) 930 { 931 int same = 0; 932 __be32 addr = 0; 933 934 for_ifa(in_dev) { 935 if (!addr && 936 (local == ifa->ifa_local || !local) && 937 ifa->ifa_scope <= scope) { 938 addr = ifa->ifa_local; 939 if (same) 940 break; 941 } 942 if (!same) { 943 same = (!local || inet_ifa_match(local, ifa)) && 944 (!dst || inet_ifa_match(dst, ifa)); 945 if (same && addr) { 946 if (local || !dst) 947 break; 948 /* Is the selected addr into dst subnet? */ 949 if (inet_ifa_match(addr, ifa)) 950 break; 951 /* No, then can we use new local src? */ 952 if (ifa->ifa_scope <= scope) { 953 addr = ifa->ifa_local; 954 break; 955 } 956 /* search for large dst subnet for addr */ 957 same = 0; 958 } 959 } 960 } endfor_ifa(in_dev); 961 962 return same? addr : 0; 963 } 964 965 /* 966 * Confirm that local IP address exists using wildcards: 967 * - dev: only on this interface, 0=any interface 968 * - dst: only in the same subnet as dst, 0=any dst 969 * - local: address, 0=autoselect the local address 970 * - scope: maximum allowed scope value for the local address 971 */ 972 __be32 inet_confirm_addr(const struct net_device *dev, __be32 dst, __be32 local, int scope) 973 { 974 __be32 addr = 0; 975 struct in_device *in_dev; 976 977 if (dev) { 978 rcu_read_lock(); 979 if ((in_dev = __in_dev_get_rcu(dev))) 980 addr = confirm_addr_indev(in_dev, dst, local, scope); 981 rcu_read_unlock(); 982 983 return addr; 984 } 985 986 read_lock(&dev_base_lock); 987 rcu_read_lock(); 988 for_each_netdev(&init_net, dev) { 989 if ((in_dev = __in_dev_get_rcu(dev))) { 990 addr = confirm_addr_indev(in_dev, dst, local, scope); 991 if (addr) 992 break; 993 } 994 } 995 rcu_read_unlock(); 996 read_unlock(&dev_base_lock); 997 998 return addr; 999 } 1000 1001 /* 1002 * Device notifier 1003 */ 1004 1005 int register_inetaddr_notifier(struct notifier_block *nb) 1006 { 1007 return blocking_notifier_chain_register(&inetaddr_chain, nb); 1008 } 1009 1010 int unregister_inetaddr_notifier(struct notifier_block *nb) 1011 { 1012 return blocking_notifier_chain_unregister(&inetaddr_chain, nb); 1013 } 1014 1015 /* Rename ifa_labels for a device name change. Make some effort to preserve existing 1016 * alias numbering and to create unique labels if possible. 1017 */ 1018 static void inetdev_changename(struct net_device *dev, struct in_device *in_dev) 1019 { 1020 struct in_ifaddr *ifa; 1021 int named = 0; 1022 1023 for (ifa = in_dev->ifa_list; ifa; ifa = ifa->ifa_next) { 1024 char old[IFNAMSIZ], *dot; 1025 1026 memcpy(old, ifa->ifa_label, IFNAMSIZ); 1027 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ); 1028 if (named++ == 0) 1029 continue; 1030 dot = strchr(old, ':'); 1031 if (dot == NULL) { 1032 sprintf(old, ":%d", named); 1033 dot = old; 1034 } 1035 if (strlen(dot) + strlen(dev->name) < IFNAMSIZ) { 1036 strcat(ifa->ifa_label, dot); 1037 } else { 1038 strcpy(ifa->ifa_label + (IFNAMSIZ - strlen(dot) - 1), dot); 1039 } 1040 } 1041 } 1042 1043 /* Called only under RTNL semaphore */ 1044 1045 static int inetdev_event(struct notifier_block *this, unsigned long event, 1046 void *ptr) 1047 { 1048 struct net_device *dev = ptr; 1049 struct in_device *in_dev = __in_dev_get_rtnl(dev); 1050 1051 if (dev->nd_net != &init_net) 1052 return NOTIFY_DONE; 1053 1054 ASSERT_RTNL(); 1055 1056 if (!in_dev) { 1057 if (event == NETDEV_REGISTER) { 1058 in_dev = inetdev_init(dev); 1059 if (!in_dev) 1060 return notifier_from_errno(-ENOMEM); 1061 if (dev->flags & IFF_LOOPBACK) { 1062 IN_DEV_CONF_SET(in_dev, NOXFRM, 1); 1063 IN_DEV_CONF_SET(in_dev, NOPOLICY, 1); 1064 } 1065 } 1066 goto out; 1067 } 1068 1069 switch (event) { 1070 case NETDEV_REGISTER: 1071 printk(KERN_DEBUG "inetdev_event: bug\n"); 1072 dev->ip_ptr = NULL; 1073 break; 1074 case NETDEV_UP: 1075 if (dev->mtu < 68) 1076 break; 1077 if (dev->flags & IFF_LOOPBACK) { 1078 struct in_ifaddr *ifa; 1079 if ((ifa = inet_alloc_ifa()) != NULL) { 1080 ifa->ifa_local = 1081 ifa->ifa_address = htonl(INADDR_LOOPBACK); 1082 ifa->ifa_prefixlen = 8; 1083 ifa->ifa_mask = inet_make_mask(8); 1084 in_dev_hold(in_dev); 1085 ifa->ifa_dev = in_dev; 1086 ifa->ifa_scope = RT_SCOPE_HOST; 1087 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ); 1088 inet_insert_ifa(ifa); 1089 } 1090 } 1091 ip_mc_up(in_dev); 1092 break; 1093 case NETDEV_DOWN: 1094 ip_mc_down(in_dev); 1095 break; 1096 case NETDEV_CHANGEMTU: 1097 if (dev->mtu >= 68) 1098 break; 1099 /* MTU falled under 68, disable IP */ 1100 case NETDEV_UNREGISTER: 1101 inetdev_destroy(in_dev); 1102 break; 1103 case NETDEV_CHANGENAME: 1104 /* Do not notify about label change, this event is 1105 * not interesting to applications using netlink. 1106 */ 1107 inetdev_changename(dev, in_dev); 1108 1109 #ifdef CONFIG_SYSCTL 1110 devinet_sysctl_unregister(&in_dev->cnf); 1111 neigh_sysctl_unregister(in_dev->arp_parms); 1112 neigh_sysctl_register(dev, in_dev->arp_parms, NET_IPV4, 1113 NET_IPV4_NEIGH, "ipv4", NULL, NULL); 1114 devinet_sysctl_register(in_dev, &in_dev->cnf); 1115 #endif 1116 break; 1117 } 1118 out: 1119 return NOTIFY_DONE; 1120 } 1121 1122 static struct notifier_block ip_netdev_notifier = { 1123 .notifier_call =inetdev_event, 1124 }; 1125 1126 static inline size_t inet_nlmsg_size(void) 1127 { 1128 return NLMSG_ALIGN(sizeof(struct ifaddrmsg)) 1129 + nla_total_size(4) /* IFA_ADDRESS */ 1130 + nla_total_size(4) /* IFA_LOCAL */ 1131 + nla_total_size(4) /* IFA_BROADCAST */ 1132 + nla_total_size(4) /* IFA_ANYCAST */ 1133 + nla_total_size(IFNAMSIZ); /* IFA_LABEL */ 1134 } 1135 1136 static int inet_fill_ifaddr(struct sk_buff *skb, struct in_ifaddr *ifa, 1137 u32 pid, u32 seq, int event, unsigned int flags) 1138 { 1139 struct ifaddrmsg *ifm; 1140 struct nlmsghdr *nlh; 1141 1142 nlh = nlmsg_put(skb, pid, seq, event, sizeof(*ifm), flags); 1143 if (nlh == NULL) 1144 return -EMSGSIZE; 1145 1146 ifm = nlmsg_data(nlh); 1147 ifm->ifa_family = AF_INET; 1148 ifm->ifa_prefixlen = ifa->ifa_prefixlen; 1149 ifm->ifa_flags = ifa->ifa_flags|IFA_F_PERMANENT; 1150 ifm->ifa_scope = ifa->ifa_scope; 1151 ifm->ifa_index = ifa->ifa_dev->dev->ifindex; 1152 1153 if (ifa->ifa_address) 1154 NLA_PUT_BE32(skb, IFA_ADDRESS, ifa->ifa_address); 1155 1156 if (ifa->ifa_local) 1157 NLA_PUT_BE32(skb, IFA_LOCAL, ifa->ifa_local); 1158 1159 if (ifa->ifa_broadcast) 1160 NLA_PUT_BE32(skb, IFA_BROADCAST, ifa->ifa_broadcast); 1161 1162 if (ifa->ifa_anycast) 1163 NLA_PUT_BE32(skb, IFA_ANYCAST, ifa->ifa_anycast); 1164 1165 if (ifa->ifa_label[0]) 1166 NLA_PUT_STRING(skb, IFA_LABEL, ifa->ifa_label); 1167 1168 return nlmsg_end(skb, nlh); 1169 1170 nla_put_failure: 1171 nlmsg_cancel(skb, nlh); 1172 return -EMSGSIZE; 1173 } 1174 1175 static int inet_dump_ifaddr(struct sk_buff *skb, struct netlink_callback *cb) 1176 { 1177 int idx, ip_idx; 1178 struct net_device *dev; 1179 struct in_device *in_dev; 1180 struct in_ifaddr *ifa; 1181 int s_ip_idx, s_idx = cb->args[0]; 1182 1183 s_ip_idx = ip_idx = cb->args[1]; 1184 idx = 0; 1185 for_each_netdev(&init_net, dev) { 1186 if (idx < s_idx) 1187 goto cont; 1188 if (idx > s_idx) 1189 s_ip_idx = 0; 1190 if ((in_dev = __in_dev_get_rtnl(dev)) == NULL) 1191 goto cont; 1192 1193 for (ifa = in_dev->ifa_list, ip_idx = 0; ifa; 1194 ifa = ifa->ifa_next, ip_idx++) { 1195 if (ip_idx < s_ip_idx) 1196 continue; 1197 if (inet_fill_ifaddr(skb, ifa, NETLINK_CB(cb->skb).pid, 1198 cb->nlh->nlmsg_seq, 1199 RTM_NEWADDR, NLM_F_MULTI) <= 0) 1200 goto done; 1201 } 1202 cont: 1203 idx++; 1204 } 1205 1206 done: 1207 cb->args[0] = idx; 1208 cb->args[1] = ip_idx; 1209 1210 return skb->len; 1211 } 1212 1213 static void rtmsg_ifa(int event, struct in_ifaddr* ifa, struct nlmsghdr *nlh, 1214 u32 pid) 1215 { 1216 struct sk_buff *skb; 1217 u32 seq = nlh ? nlh->nlmsg_seq : 0; 1218 int err = -ENOBUFS; 1219 1220 skb = nlmsg_new(inet_nlmsg_size(), GFP_KERNEL); 1221 if (skb == NULL) 1222 goto errout; 1223 1224 err = inet_fill_ifaddr(skb, ifa, pid, seq, event, 0); 1225 if (err < 0) { 1226 /* -EMSGSIZE implies BUG in inet_nlmsg_size() */ 1227 WARN_ON(err == -EMSGSIZE); 1228 kfree_skb(skb); 1229 goto errout; 1230 } 1231 err = rtnl_notify(skb, pid, RTNLGRP_IPV4_IFADDR, nlh, GFP_KERNEL); 1232 errout: 1233 if (err < 0) 1234 rtnl_set_sk_err(RTNLGRP_IPV4_IFADDR, err); 1235 } 1236 1237 #ifdef CONFIG_SYSCTL 1238 1239 static void devinet_copy_dflt_conf(int i) 1240 { 1241 struct net_device *dev; 1242 1243 read_lock(&dev_base_lock); 1244 for_each_netdev(&init_net, dev) { 1245 struct in_device *in_dev; 1246 rcu_read_lock(); 1247 in_dev = __in_dev_get_rcu(dev); 1248 if (in_dev && !test_bit(i, in_dev->cnf.state)) 1249 in_dev->cnf.data[i] = ipv4_devconf_dflt.data[i]; 1250 rcu_read_unlock(); 1251 } 1252 read_unlock(&dev_base_lock); 1253 } 1254 1255 static int devinet_conf_proc(ctl_table *ctl, int write, 1256 struct file* filp, void __user *buffer, 1257 size_t *lenp, loff_t *ppos) 1258 { 1259 int ret = proc_dointvec(ctl, write, filp, buffer, lenp, ppos); 1260 1261 if (write) { 1262 struct ipv4_devconf *cnf = ctl->extra1; 1263 int i = (int *)ctl->data - cnf->data; 1264 1265 set_bit(i, cnf->state); 1266 1267 if (cnf == &ipv4_devconf_dflt) 1268 devinet_copy_dflt_conf(i); 1269 } 1270 1271 return ret; 1272 } 1273 1274 static int devinet_conf_sysctl(ctl_table *table, int __user *name, int nlen, 1275 void __user *oldval, size_t __user *oldlenp, 1276 void __user *newval, size_t newlen) 1277 { 1278 struct ipv4_devconf *cnf; 1279 int *valp = table->data; 1280 int new; 1281 int i; 1282 1283 if (!newval || !newlen) 1284 return 0; 1285 1286 if (newlen != sizeof(int)) 1287 return -EINVAL; 1288 1289 if (get_user(new, (int __user *)newval)) 1290 return -EFAULT; 1291 1292 if (new == *valp) 1293 return 0; 1294 1295 if (oldval && oldlenp) { 1296 size_t len; 1297 1298 if (get_user(len, oldlenp)) 1299 return -EFAULT; 1300 1301 if (len) { 1302 if (len > table->maxlen) 1303 len = table->maxlen; 1304 if (copy_to_user(oldval, valp, len)) 1305 return -EFAULT; 1306 if (put_user(len, oldlenp)) 1307 return -EFAULT; 1308 } 1309 } 1310 1311 *valp = new; 1312 1313 cnf = table->extra1; 1314 i = (int *)table->data - cnf->data; 1315 1316 set_bit(i, cnf->state); 1317 1318 if (cnf == &ipv4_devconf_dflt) 1319 devinet_copy_dflt_conf(i); 1320 1321 return 1; 1322 } 1323 1324 void inet_forward_change(void) 1325 { 1326 struct net_device *dev; 1327 int on = IPV4_DEVCONF_ALL(FORWARDING); 1328 1329 IPV4_DEVCONF_ALL(ACCEPT_REDIRECTS) = !on; 1330 IPV4_DEVCONF_DFLT(FORWARDING) = on; 1331 1332 read_lock(&dev_base_lock); 1333 for_each_netdev(&init_net, dev) { 1334 struct in_device *in_dev; 1335 rcu_read_lock(); 1336 in_dev = __in_dev_get_rcu(dev); 1337 if (in_dev) 1338 IN_DEV_CONF_SET(in_dev, FORWARDING, on); 1339 rcu_read_unlock(); 1340 } 1341 read_unlock(&dev_base_lock); 1342 1343 rt_cache_flush(0); 1344 } 1345 1346 static int devinet_sysctl_forward(ctl_table *ctl, int write, 1347 struct file* filp, void __user *buffer, 1348 size_t *lenp, loff_t *ppos) 1349 { 1350 int *valp = ctl->data; 1351 int val = *valp; 1352 int ret = proc_dointvec(ctl, write, filp, buffer, lenp, ppos); 1353 1354 if (write && *valp != val) { 1355 if (valp == &IPV4_DEVCONF_ALL(FORWARDING)) 1356 inet_forward_change(); 1357 else if (valp != &IPV4_DEVCONF_DFLT(FORWARDING)) 1358 rt_cache_flush(0); 1359 } 1360 1361 return ret; 1362 } 1363 1364 int ipv4_doint_and_flush(ctl_table *ctl, int write, 1365 struct file* filp, void __user *buffer, 1366 size_t *lenp, loff_t *ppos) 1367 { 1368 int *valp = ctl->data; 1369 int val = *valp; 1370 int ret = proc_dointvec(ctl, write, filp, buffer, lenp, ppos); 1371 1372 if (write && *valp != val) 1373 rt_cache_flush(0); 1374 1375 return ret; 1376 } 1377 1378 int ipv4_doint_and_flush_strategy(ctl_table *table, int __user *name, int nlen, 1379 void __user *oldval, size_t __user *oldlenp, 1380 void __user *newval, size_t newlen) 1381 { 1382 int ret = devinet_conf_sysctl(table, name, nlen, oldval, oldlenp, 1383 newval, newlen); 1384 1385 if (ret == 1) 1386 rt_cache_flush(0); 1387 1388 return ret; 1389 } 1390 1391 1392 #define DEVINET_SYSCTL_ENTRY(attr, name, mval, proc, sysctl) \ 1393 { \ 1394 .ctl_name = NET_IPV4_CONF_ ## attr, \ 1395 .procname = name, \ 1396 .data = ipv4_devconf.data + \ 1397 NET_IPV4_CONF_ ## attr - 1, \ 1398 .maxlen = sizeof(int), \ 1399 .mode = mval, \ 1400 .proc_handler = proc, \ 1401 .strategy = sysctl, \ 1402 .extra1 = &ipv4_devconf, \ 1403 } 1404 1405 #define DEVINET_SYSCTL_RW_ENTRY(attr, name) \ 1406 DEVINET_SYSCTL_ENTRY(attr, name, 0644, devinet_conf_proc, \ 1407 devinet_conf_sysctl) 1408 1409 #define DEVINET_SYSCTL_RO_ENTRY(attr, name) \ 1410 DEVINET_SYSCTL_ENTRY(attr, name, 0444, devinet_conf_proc, \ 1411 devinet_conf_sysctl) 1412 1413 #define DEVINET_SYSCTL_COMPLEX_ENTRY(attr, name, proc, sysctl) \ 1414 DEVINET_SYSCTL_ENTRY(attr, name, 0644, proc, sysctl) 1415 1416 #define DEVINET_SYSCTL_FLUSHING_ENTRY(attr, name) \ 1417 DEVINET_SYSCTL_COMPLEX_ENTRY(attr, name, ipv4_doint_and_flush, \ 1418 ipv4_doint_and_flush_strategy) 1419 1420 static struct devinet_sysctl_table { 1421 struct ctl_table_header *sysctl_header; 1422 ctl_table devinet_vars[__NET_IPV4_CONF_MAX]; 1423 ctl_table devinet_dev[2]; 1424 ctl_table devinet_conf_dir[2]; 1425 ctl_table devinet_proto_dir[2]; 1426 ctl_table devinet_root_dir[2]; 1427 } devinet_sysctl = { 1428 .devinet_vars = { 1429 DEVINET_SYSCTL_COMPLEX_ENTRY(FORWARDING, "forwarding", 1430 devinet_sysctl_forward, 1431 devinet_conf_sysctl), 1432 DEVINET_SYSCTL_RO_ENTRY(MC_FORWARDING, "mc_forwarding"), 1433 1434 DEVINET_SYSCTL_RW_ENTRY(ACCEPT_REDIRECTS, "accept_redirects"), 1435 DEVINET_SYSCTL_RW_ENTRY(SECURE_REDIRECTS, "secure_redirects"), 1436 DEVINET_SYSCTL_RW_ENTRY(SHARED_MEDIA, "shared_media"), 1437 DEVINET_SYSCTL_RW_ENTRY(RP_FILTER, "rp_filter"), 1438 DEVINET_SYSCTL_RW_ENTRY(SEND_REDIRECTS, "send_redirects"), 1439 DEVINET_SYSCTL_RW_ENTRY(ACCEPT_SOURCE_ROUTE, 1440 "accept_source_route"), 1441 DEVINET_SYSCTL_RW_ENTRY(PROXY_ARP, "proxy_arp"), 1442 DEVINET_SYSCTL_RW_ENTRY(MEDIUM_ID, "medium_id"), 1443 DEVINET_SYSCTL_RW_ENTRY(BOOTP_RELAY, "bootp_relay"), 1444 DEVINET_SYSCTL_RW_ENTRY(LOG_MARTIANS, "log_martians"), 1445 DEVINET_SYSCTL_RW_ENTRY(TAG, "tag"), 1446 DEVINET_SYSCTL_RW_ENTRY(ARPFILTER, "arp_filter"), 1447 DEVINET_SYSCTL_RW_ENTRY(ARP_ANNOUNCE, "arp_announce"), 1448 DEVINET_SYSCTL_RW_ENTRY(ARP_IGNORE, "arp_ignore"), 1449 DEVINET_SYSCTL_RW_ENTRY(ARP_ACCEPT, "arp_accept"), 1450 1451 DEVINET_SYSCTL_FLUSHING_ENTRY(NOXFRM, "disable_xfrm"), 1452 DEVINET_SYSCTL_FLUSHING_ENTRY(NOPOLICY, "disable_policy"), 1453 DEVINET_SYSCTL_FLUSHING_ENTRY(FORCE_IGMP_VERSION, 1454 "force_igmp_version"), 1455 DEVINET_SYSCTL_FLUSHING_ENTRY(PROMOTE_SECONDARIES, 1456 "promote_secondaries"), 1457 }, 1458 .devinet_dev = { 1459 { 1460 .ctl_name = NET_PROTO_CONF_ALL, 1461 .procname = "all", 1462 .mode = 0555, 1463 .child = devinet_sysctl.devinet_vars, 1464 }, 1465 }, 1466 .devinet_conf_dir = { 1467 { 1468 .ctl_name = NET_IPV4_CONF, 1469 .procname = "conf", 1470 .mode = 0555, 1471 .child = devinet_sysctl.devinet_dev, 1472 }, 1473 }, 1474 .devinet_proto_dir = { 1475 { 1476 .ctl_name = NET_IPV4, 1477 .procname = "ipv4", 1478 .mode = 0555, 1479 .child = devinet_sysctl.devinet_conf_dir, 1480 }, 1481 }, 1482 .devinet_root_dir = { 1483 { 1484 .ctl_name = CTL_NET, 1485 .procname = "net", 1486 .mode = 0555, 1487 .child = devinet_sysctl.devinet_proto_dir, 1488 }, 1489 }, 1490 }; 1491 1492 static void devinet_sysctl_register(struct in_device *in_dev, 1493 struct ipv4_devconf *p) 1494 { 1495 int i; 1496 struct net_device *dev = in_dev ? in_dev->dev : NULL; 1497 struct devinet_sysctl_table *t = kmemdup(&devinet_sysctl, sizeof(*t), 1498 GFP_KERNEL); 1499 char *dev_name = NULL; 1500 1501 if (!t) 1502 return; 1503 for (i = 0; i < ARRAY_SIZE(t->devinet_vars) - 1; i++) { 1504 t->devinet_vars[i].data += (char *)p - (char *)&ipv4_devconf; 1505 t->devinet_vars[i].extra1 = p; 1506 } 1507 1508 if (dev) { 1509 dev_name = dev->name; 1510 t->devinet_dev[0].ctl_name = dev->ifindex; 1511 } else { 1512 dev_name = "default"; 1513 t->devinet_dev[0].ctl_name = NET_PROTO_CONF_DEFAULT; 1514 } 1515 1516 /* 1517 * Make a copy of dev_name, because '.procname' is regarded as const 1518 * by sysctl and we wouldn't want anyone to change it under our feet 1519 * (see SIOCSIFNAME). 1520 */ 1521 dev_name = kstrdup(dev_name, GFP_KERNEL); 1522 if (!dev_name) 1523 goto free; 1524 1525 t->devinet_dev[0].procname = dev_name; 1526 t->devinet_dev[0].child = t->devinet_vars; 1527 t->devinet_conf_dir[0].child = t->devinet_dev; 1528 t->devinet_proto_dir[0].child = t->devinet_conf_dir; 1529 t->devinet_root_dir[0].child = t->devinet_proto_dir; 1530 1531 t->sysctl_header = register_sysctl_table(t->devinet_root_dir); 1532 if (!t->sysctl_header) 1533 goto free_procname; 1534 1535 p->sysctl = t; 1536 return; 1537 1538 /* error path */ 1539 free_procname: 1540 kfree(dev_name); 1541 free: 1542 kfree(t); 1543 return; 1544 } 1545 1546 static void devinet_sysctl_unregister(struct ipv4_devconf *p) 1547 { 1548 if (p->sysctl) { 1549 struct devinet_sysctl_table *t = p->sysctl; 1550 p->sysctl = NULL; 1551 unregister_sysctl_table(t->sysctl_header); 1552 kfree(t->devinet_dev[0].procname); 1553 kfree(t); 1554 } 1555 } 1556 #endif 1557 1558 void __init devinet_init(void) 1559 { 1560 register_gifconf(PF_INET, inet_gifconf); 1561 register_netdevice_notifier(&ip_netdev_notifier); 1562 1563 rtnl_register(PF_INET, RTM_NEWADDR, inet_rtm_newaddr, NULL); 1564 rtnl_register(PF_INET, RTM_DELADDR, inet_rtm_deladdr, NULL); 1565 rtnl_register(PF_INET, RTM_GETADDR, NULL, inet_dump_ifaddr); 1566 #ifdef CONFIG_SYSCTL 1567 devinet_sysctl.sysctl_header = 1568 register_sysctl_table(devinet_sysctl.devinet_root_dir); 1569 devinet_sysctl_register(NULL, &ipv4_devconf_dflt); 1570 #endif 1571 } 1572 1573 EXPORT_SYMBOL(in_dev_finish_destroy); 1574 EXPORT_SYMBOL(inet_select_addr); 1575 EXPORT_SYMBOL(inetdev_by_index); 1576 EXPORT_SYMBOL(register_inetaddr_notifier); 1577 EXPORT_SYMBOL(unregister_inetaddr_notifier); 1578