11da177e4SLinus Torvalds /* 21da177e4SLinus Torvalds * IP multicast routing support for mrouted 3.6/3.8 31da177e4SLinus Torvalds * 4113aa838SAlan Cox * (c) 1995 Alan Cox, <alan@lxorguk.ukuu.org.uk> 51da177e4SLinus Torvalds * Linux Consultancy and Custom Driver Development 61da177e4SLinus Torvalds * 71da177e4SLinus Torvalds * This program is free software; you can redistribute it and/or 81da177e4SLinus Torvalds * modify it under the terms of the GNU General Public License 91da177e4SLinus Torvalds * as published by the Free Software Foundation; either version 101da177e4SLinus Torvalds * 2 of the License, or (at your option) any later version. 111da177e4SLinus Torvalds * 121da177e4SLinus Torvalds * Fixes: 131da177e4SLinus Torvalds * Michael Chastain : Incorrect size of copying. 141da177e4SLinus Torvalds * Alan Cox : Added the cache manager code 151da177e4SLinus Torvalds * Alan Cox : Fixed the clone/copy bug and device race. 161da177e4SLinus Torvalds * Mike McLagan : Routing by source 171da177e4SLinus Torvalds * Malcolm Beattie : Buffer handling fixes. 181da177e4SLinus Torvalds * Alexey Kuznetsov : Double buffer free and other fixes. 191da177e4SLinus Torvalds * SVR Anand : Fixed several multicast bugs and problems. 201da177e4SLinus Torvalds * Alexey Kuznetsov : Status, optimisations and more. 211da177e4SLinus Torvalds * Brad Parker : Better behaviour on mrouted upcall 221da177e4SLinus Torvalds * overflow. 231da177e4SLinus Torvalds * Carlos Picoto : PIMv1 Support 241da177e4SLinus Torvalds * Pavlin Ivanov Radoslavov: PIMv2 Registers must checksum only PIM header 25f77f13e2SGilles Espinasse * Relax this requirement to work with older peers. 261da177e4SLinus Torvalds * 271da177e4SLinus Torvalds */ 281da177e4SLinus Torvalds 291da177e4SLinus Torvalds #include <asm/system.h> 301da177e4SLinus Torvalds #include <asm/uaccess.h> 311da177e4SLinus Torvalds #include <linux/types.h> 324fc268d2SRandy Dunlap #include <linux/capability.h> 331da177e4SLinus Torvalds #include <linux/errno.h> 341da177e4SLinus Torvalds #include <linux/timer.h> 351da177e4SLinus Torvalds #include <linux/mm.h> 361da177e4SLinus Torvalds #include <linux/kernel.h> 371da177e4SLinus Torvalds #include <linux/fcntl.h> 381da177e4SLinus Torvalds #include <linux/stat.h> 391da177e4SLinus Torvalds #include <linux/socket.h> 401da177e4SLinus Torvalds #include <linux/in.h> 411da177e4SLinus Torvalds #include <linux/inet.h> 421da177e4SLinus Torvalds #include <linux/netdevice.h> 431da177e4SLinus Torvalds #include <linux/inetdevice.h> 441da177e4SLinus Torvalds #include <linux/igmp.h> 451da177e4SLinus Torvalds #include <linux/proc_fs.h> 461da177e4SLinus Torvalds #include <linux/seq_file.h> 471da177e4SLinus Torvalds #include <linux/mroute.h> 481da177e4SLinus Torvalds #include <linux/init.h> 4946f25dffSKris Katterjohn #include <linux/if_ether.h> 505a0e3ad6STejun Heo #include <linux/slab.h> 51457c4cbcSEric W. Biederman #include <net/net_namespace.h> 521da177e4SLinus Torvalds #include <net/ip.h> 531da177e4SLinus Torvalds #include <net/protocol.h> 541da177e4SLinus Torvalds #include <linux/skbuff.h> 5514c85021SArnaldo Carvalho de Melo #include <net/route.h> 561da177e4SLinus Torvalds #include <net/sock.h> 571da177e4SLinus Torvalds #include <net/icmp.h> 581da177e4SLinus Torvalds #include <net/udp.h> 591da177e4SLinus Torvalds #include <net/raw.h> 601da177e4SLinus Torvalds #include <linux/notifier.h> 611da177e4SLinus Torvalds #include <linux/if_arp.h> 621da177e4SLinus Torvalds #include <linux/netfilter_ipv4.h> 63709b46e8SEric W. Biederman #include <linux/compat.h> 641da177e4SLinus Torvalds #include <net/ipip.h> 651da177e4SLinus Torvalds #include <net/checksum.h> 66dc5fc579SArnaldo Carvalho de Melo #include <net/netlink.h> 67f0ad0860SPatrick McHardy #include <net/fib_rules.h> 681da177e4SLinus Torvalds 691da177e4SLinus Torvalds #if defined(CONFIG_IP_PIMSM_V1) || defined(CONFIG_IP_PIMSM_V2) 701da177e4SLinus Torvalds #define CONFIG_IP_PIMSM 1 711da177e4SLinus Torvalds #endif 721da177e4SLinus Torvalds 730c12295aSPatrick McHardy struct mr_table { 74f0ad0860SPatrick McHardy struct list_head list; 758de53dfbSPatrick McHardy #ifdef CONFIG_NET_NS 768de53dfbSPatrick McHardy struct net *net; 778de53dfbSPatrick McHardy #endif 78f0ad0860SPatrick McHardy u32 id; 794c968709SEric Dumazet struct sock __rcu *mroute_sk; 800c12295aSPatrick McHardy struct timer_list ipmr_expire_timer; 810c12295aSPatrick McHardy struct list_head mfc_unres_queue; 820c12295aSPatrick McHardy struct list_head mfc_cache_array[MFC_LINES]; 830c12295aSPatrick McHardy struct vif_device vif_table[MAXVIFS]; 840c12295aSPatrick McHardy int maxvif; 850c12295aSPatrick McHardy atomic_t cache_resolve_queue_len; 860c12295aSPatrick McHardy int mroute_do_assert; 870c12295aSPatrick McHardy int mroute_do_pim; 880c12295aSPatrick McHardy #if defined(CONFIG_IP_PIMSM_V1) || defined(CONFIG_IP_PIMSM_V2) 890c12295aSPatrick McHardy int mroute_reg_vif_num; 900c12295aSPatrick McHardy #endif 910c12295aSPatrick McHardy }; 920c12295aSPatrick McHardy 93f0ad0860SPatrick McHardy struct ipmr_rule { 94f0ad0860SPatrick McHardy struct fib_rule common; 95f0ad0860SPatrick McHardy }; 96f0ad0860SPatrick McHardy 97f0ad0860SPatrick McHardy struct ipmr_result { 98f0ad0860SPatrick McHardy struct mr_table *mrt; 99f0ad0860SPatrick McHardy }; 100f0ad0860SPatrick McHardy 1011da177e4SLinus Torvalds /* Big lock, protecting vif table, mrt cache and mroute socket state. 102a8cb16ddSEric Dumazet * Note that the changes are semaphored via rtnl_lock. 1031da177e4SLinus Torvalds */ 1041da177e4SLinus Torvalds 1051da177e4SLinus Torvalds static DEFINE_RWLOCK(mrt_lock); 1061da177e4SLinus Torvalds 1071da177e4SLinus Torvalds /* 1081da177e4SLinus Torvalds * Multicast router control variables 1091da177e4SLinus Torvalds */ 1101da177e4SLinus Torvalds 1110c12295aSPatrick McHardy #define VIF_EXISTS(_mrt, _idx) ((_mrt)->vif_table[_idx].dev != NULL) 1121da177e4SLinus Torvalds 1131da177e4SLinus Torvalds /* Special spinlock for queue of unresolved entries */ 1141da177e4SLinus Torvalds static DEFINE_SPINLOCK(mfc_unres_lock); 1151da177e4SLinus Torvalds 1161da177e4SLinus Torvalds /* We return to original Alan's scheme. Hash table of resolved 117a8cb16ddSEric Dumazet * entries is changed only in process context and protected 118a8cb16ddSEric Dumazet * with weak lock mrt_lock. Queue of unresolved entries is protected 119a8cb16ddSEric Dumazet * with strong spinlock mfc_unres_lock. 120a8cb16ddSEric Dumazet * 121a8cb16ddSEric Dumazet * In this case data path is free of exclusive locks at all. 1221da177e4SLinus Torvalds */ 1231da177e4SLinus Torvalds 124e18b890bSChristoph Lameter static struct kmem_cache *mrt_cachep __read_mostly; 1251da177e4SLinus Torvalds 126f0ad0860SPatrick McHardy static struct mr_table *ipmr_new_table(struct net *net, u32 id); 1270c12295aSPatrick McHardy static int ip_mr_forward(struct net *net, struct mr_table *mrt, 1280c12295aSPatrick McHardy struct sk_buff *skb, struct mfc_cache *cache, 1290c12295aSPatrick McHardy int local); 1300c12295aSPatrick McHardy static int ipmr_cache_report(struct mr_table *mrt, 1314feb88e5SBenjamin Thery struct sk_buff *pkt, vifi_t vifi, int assert); 132cb6a4e46SPatrick McHardy static int __ipmr_fill_mroute(struct mr_table *mrt, struct sk_buff *skb, 133d658f8a0SPatrick McHardy struct mfc_cache *c, struct rtmsg *rtm); 134f0ad0860SPatrick McHardy static void ipmr_expire_process(unsigned long arg); 1351da177e4SLinus Torvalds 136f0ad0860SPatrick McHardy #ifdef CONFIG_IP_MROUTE_MULTIPLE_TABLES 137f0ad0860SPatrick McHardy #define ipmr_for_each_table(mrt, net) \ 138f0ad0860SPatrick McHardy list_for_each_entry_rcu(mrt, &net->ipv4.mr_tables, list) 139f0ad0860SPatrick McHardy 140f0ad0860SPatrick McHardy static struct mr_table *ipmr_get_table(struct net *net, u32 id) 141f0ad0860SPatrick McHardy { 142f0ad0860SPatrick McHardy struct mr_table *mrt; 143f0ad0860SPatrick McHardy 144f0ad0860SPatrick McHardy ipmr_for_each_table(mrt, net) { 145f0ad0860SPatrick McHardy if (mrt->id == id) 146f0ad0860SPatrick McHardy return mrt; 147f0ad0860SPatrick McHardy } 148f0ad0860SPatrick McHardy return NULL; 149f0ad0860SPatrick McHardy } 150f0ad0860SPatrick McHardy 151f0ad0860SPatrick McHardy static int ipmr_fib_lookup(struct net *net, struct flowi *flp, 152f0ad0860SPatrick McHardy struct mr_table **mrt) 153f0ad0860SPatrick McHardy { 154f0ad0860SPatrick McHardy struct ipmr_result res; 155f0ad0860SPatrick McHardy struct fib_lookup_arg arg = { .result = &res, }; 156f0ad0860SPatrick McHardy int err; 157f0ad0860SPatrick McHardy 158f0ad0860SPatrick McHardy err = fib_rules_lookup(net->ipv4.mr_rules_ops, flp, 0, &arg); 159f0ad0860SPatrick McHardy if (err < 0) 160f0ad0860SPatrick McHardy return err; 161f0ad0860SPatrick McHardy *mrt = res.mrt; 162f0ad0860SPatrick McHardy return 0; 163f0ad0860SPatrick McHardy } 164f0ad0860SPatrick McHardy 165f0ad0860SPatrick McHardy static int ipmr_rule_action(struct fib_rule *rule, struct flowi *flp, 166f0ad0860SPatrick McHardy int flags, struct fib_lookup_arg *arg) 167f0ad0860SPatrick McHardy { 168f0ad0860SPatrick McHardy struct ipmr_result *res = arg->result; 169f0ad0860SPatrick McHardy struct mr_table *mrt; 170f0ad0860SPatrick McHardy 171f0ad0860SPatrick McHardy switch (rule->action) { 172f0ad0860SPatrick McHardy case FR_ACT_TO_TBL: 173f0ad0860SPatrick McHardy break; 174f0ad0860SPatrick McHardy case FR_ACT_UNREACHABLE: 175f0ad0860SPatrick McHardy return -ENETUNREACH; 176f0ad0860SPatrick McHardy case FR_ACT_PROHIBIT: 177f0ad0860SPatrick McHardy return -EACCES; 178f0ad0860SPatrick McHardy case FR_ACT_BLACKHOLE: 179f0ad0860SPatrick McHardy default: 180f0ad0860SPatrick McHardy return -EINVAL; 181f0ad0860SPatrick McHardy } 182f0ad0860SPatrick McHardy 183f0ad0860SPatrick McHardy mrt = ipmr_get_table(rule->fr_net, rule->table); 184f0ad0860SPatrick McHardy if (mrt == NULL) 185f0ad0860SPatrick McHardy return -EAGAIN; 186f0ad0860SPatrick McHardy res->mrt = mrt; 187f0ad0860SPatrick McHardy return 0; 188f0ad0860SPatrick McHardy } 189f0ad0860SPatrick McHardy 190f0ad0860SPatrick McHardy static int ipmr_rule_match(struct fib_rule *rule, struct flowi *fl, int flags) 191f0ad0860SPatrick McHardy { 192f0ad0860SPatrick McHardy return 1; 193f0ad0860SPatrick McHardy } 194f0ad0860SPatrick McHardy 195f0ad0860SPatrick McHardy static const struct nla_policy ipmr_rule_policy[FRA_MAX + 1] = { 196f0ad0860SPatrick McHardy FRA_GENERIC_POLICY, 197f0ad0860SPatrick McHardy }; 198f0ad0860SPatrick McHardy 199f0ad0860SPatrick McHardy static int ipmr_rule_configure(struct fib_rule *rule, struct sk_buff *skb, 200f0ad0860SPatrick McHardy struct fib_rule_hdr *frh, struct nlattr **tb) 201f0ad0860SPatrick McHardy { 202f0ad0860SPatrick McHardy return 0; 203f0ad0860SPatrick McHardy } 204f0ad0860SPatrick McHardy 205f0ad0860SPatrick McHardy static int ipmr_rule_compare(struct fib_rule *rule, struct fib_rule_hdr *frh, 206f0ad0860SPatrick McHardy struct nlattr **tb) 207f0ad0860SPatrick McHardy { 208f0ad0860SPatrick McHardy return 1; 209f0ad0860SPatrick McHardy } 210f0ad0860SPatrick McHardy 211f0ad0860SPatrick McHardy static int ipmr_rule_fill(struct fib_rule *rule, struct sk_buff *skb, 212f0ad0860SPatrick McHardy struct fib_rule_hdr *frh) 213f0ad0860SPatrick McHardy { 214f0ad0860SPatrick McHardy frh->dst_len = 0; 215f0ad0860SPatrick McHardy frh->src_len = 0; 216f0ad0860SPatrick McHardy frh->tos = 0; 217f0ad0860SPatrick McHardy return 0; 218f0ad0860SPatrick McHardy } 219f0ad0860SPatrick McHardy 2203d0c9c4eSPatrick McHardy static const struct fib_rules_ops __net_initdata ipmr_rules_ops_template = { 22125239ceeSPatrick McHardy .family = RTNL_FAMILY_IPMR, 222f0ad0860SPatrick McHardy .rule_size = sizeof(struct ipmr_rule), 223f0ad0860SPatrick McHardy .addr_size = sizeof(u32), 224f0ad0860SPatrick McHardy .action = ipmr_rule_action, 225f0ad0860SPatrick McHardy .match = ipmr_rule_match, 226f0ad0860SPatrick McHardy .configure = ipmr_rule_configure, 227f0ad0860SPatrick McHardy .compare = ipmr_rule_compare, 228f0ad0860SPatrick McHardy .default_pref = fib_default_rule_pref, 229f0ad0860SPatrick McHardy .fill = ipmr_rule_fill, 230f0ad0860SPatrick McHardy .nlgroup = RTNLGRP_IPV4_RULE, 231f0ad0860SPatrick McHardy .policy = ipmr_rule_policy, 232f0ad0860SPatrick McHardy .owner = THIS_MODULE, 233f0ad0860SPatrick McHardy }; 234f0ad0860SPatrick McHardy 235f0ad0860SPatrick McHardy static int __net_init ipmr_rules_init(struct net *net) 236f0ad0860SPatrick McHardy { 237f0ad0860SPatrick McHardy struct fib_rules_ops *ops; 238f0ad0860SPatrick McHardy struct mr_table *mrt; 239f0ad0860SPatrick McHardy int err; 240f0ad0860SPatrick McHardy 241f0ad0860SPatrick McHardy ops = fib_rules_register(&ipmr_rules_ops_template, net); 242f0ad0860SPatrick McHardy if (IS_ERR(ops)) 243f0ad0860SPatrick McHardy return PTR_ERR(ops); 244f0ad0860SPatrick McHardy 245f0ad0860SPatrick McHardy INIT_LIST_HEAD(&net->ipv4.mr_tables); 246f0ad0860SPatrick McHardy 247f0ad0860SPatrick McHardy mrt = ipmr_new_table(net, RT_TABLE_DEFAULT); 248f0ad0860SPatrick McHardy if (mrt == NULL) { 249f0ad0860SPatrick McHardy err = -ENOMEM; 250f0ad0860SPatrick McHardy goto err1; 251f0ad0860SPatrick McHardy } 252f0ad0860SPatrick McHardy 253f0ad0860SPatrick McHardy err = fib_default_rule_add(ops, 0x7fff, RT_TABLE_DEFAULT, 0); 254f0ad0860SPatrick McHardy if (err < 0) 255f0ad0860SPatrick McHardy goto err2; 256f0ad0860SPatrick McHardy 257f0ad0860SPatrick McHardy net->ipv4.mr_rules_ops = ops; 258f0ad0860SPatrick McHardy return 0; 259f0ad0860SPatrick McHardy 260f0ad0860SPatrick McHardy err2: 261f0ad0860SPatrick McHardy kfree(mrt); 262f0ad0860SPatrick McHardy err1: 263f0ad0860SPatrick McHardy fib_rules_unregister(ops); 264f0ad0860SPatrick McHardy return err; 265f0ad0860SPatrick McHardy } 266f0ad0860SPatrick McHardy 267f0ad0860SPatrick McHardy static void __net_exit ipmr_rules_exit(struct net *net) 268f0ad0860SPatrick McHardy { 269f0ad0860SPatrick McHardy struct mr_table *mrt, *next; 270f0ad0860SPatrick McHardy 271035320d5SEric Dumazet list_for_each_entry_safe(mrt, next, &net->ipv4.mr_tables, list) { 272035320d5SEric Dumazet list_del(&mrt->list); 273f0ad0860SPatrick McHardy kfree(mrt); 274035320d5SEric Dumazet } 275f0ad0860SPatrick McHardy fib_rules_unregister(net->ipv4.mr_rules_ops); 276f0ad0860SPatrick McHardy } 277f0ad0860SPatrick McHardy #else 278f0ad0860SPatrick McHardy #define ipmr_for_each_table(mrt, net) \ 279f0ad0860SPatrick McHardy for (mrt = net->ipv4.mrt; mrt; mrt = NULL) 280f0ad0860SPatrick McHardy 281f0ad0860SPatrick McHardy static struct mr_table *ipmr_get_table(struct net *net, u32 id) 282f0ad0860SPatrick McHardy { 283f0ad0860SPatrick McHardy return net->ipv4.mrt; 284f0ad0860SPatrick McHardy } 285f0ad0860SPatrick McHardy 286f0ad0860SPatrick McHardy static int ipmr_fib_lookup(struct net *net, struct flowi *flp, 287f0ad0860SPatrick McHardy struct mr_table **mrt) 288f0ad0860SPatrick McHardy { 289f0ad0860SPatrick McHardy *mrt = net->ipv4.mrt; 290f0ad0860SPatrick McHardy return 0; 291f0ad0860SPatrick McHardy } 292f0ad0860SPatrick McHardy 293f0ad0860SPatrick McHardy static int __net_init ipmr_rules_init(struct net *net) 294f0ad0860SPatrick McHardy { 295f0ad0860SPatrick McHardy net->ipv4.mrt = ipmr_new_table(net, RT_TABLE_DEFAULT); 296f0ad0860SPatrick McHardy return net->ipv4.mrt ? 0 : -ENOMEM; 297f0ad0860SPatrick McHardy } 298f0ad0860SPatrick McHardy 299f0ad0860SPatrick McHardy static void __net_exit ipmr_rules_exit(struct net *net) 300f0ad0860SPatrick McHardy { 301f0ad0860SPatrick McHardy kfree(net->ipv4.mrt); 302f0ad0860SPatrick McHardy } 303f0ad0860SPatrick McHardy #endif 304f0ad0860SPatrick McHardy 305f0ad0860SPatrick McHardy static struct mr_table *ipmr_new_table(struct net *net, u32 id) 306f0ad0860SPatrick McHardy { 307f0ad0860SPatrick McHardy struct mr_table *mrt; 308f0ad0860SPatrick McHardy unsigned int i; 309f0ad0860SPatrick McHardy 310f0ad0860SPatrick McHardy mrt = ipmr_get_table(net, id); 311f0ad0860SPatrick McHardy if (mrt != NULL) 312f0ad0860SPatrick McHardy return mrt; 313f0ad0860SPatrick McHardy 314f0ad0860SPatrick McHardy mrt = kzalloc(sizeof(*mrt), GFP_KERNEL); 315f0ad0860SPatrick McHardy if (mrt == NULL) 316f0ad0860SPatrick McHardy return NULL; 3178de53dfbSPatrick McHardy write_pnet(&mrt->net, net); 318f0ad0860SPatrick McHardy mrt->id = id; 319f0ad0860SPatrick McHardy 320f0ad0860SPatrick McHardy /* Forwarding cache */ 321f0ad0860SPatrick McHardy for (i = 0; i < MFC_LINES; i++) 322f0ad0860SPatrick McHardy INIT_LIST_HEAD(&mrt->mfc_cache_array[i]); 323f0ad0860SPatrick McHardy 324f0ad0860SPatrick McHardy INIT_LIST_HEAD(&mrt->mfc_unres_queue); 325f0ad0860SPatrick McHardy 326f0ad0860SPatrick McHardy setup_timer(&mrt->ipmr_expire_timer, ipmr_expire_process, 327f0ad0860SPatrick McHardy (unsigned long)mrt); 328f0ad0860SPatrick McHardy 329f0ad0860SPatrick McHardy #ifdef CONFIG_IP_PIMSM 330f0ad0860SPatrick McHardy mrt->mroute_reg_vif_num = -1; 331f0ad0860SPatrick McHardy #endif 332f0ad0860SPatrick McHardy #ifdef CONFIG_IP_MROUTE_MULTIPLE_TABLES 333f0ad0860SPatrick McHardy list_add_tail_rcu(&mrt->list, &net->ipv4.mr_tables); 334f0ad0860SPatrick McHardy #endif 335f0ad0860SPatrick McHardy return mrt; 336f0ad0860SPatrick McHardy } 3371da177e4SLinus Torvalds 3381da177e4SLinus Torvalds /* Service routines creating virtual interfaces: DVMRP tunnels and PIMREG */ 3391da177e4SLinus Torvalds 340d607032dSWang Chen static void ipmr_del_tunnel(struct net_device *dev, struct vifctl *v) 341d607032dSWang Chen { 3424feb88e5SBenjamin Thery struct net *net = dev_net(dev); 3434feb88e5SBenjamin Thery 344d607032dSWang Chen dev_close(dev); 345d607032dSWang Chen 3464feb88e5SBenjamin Thery dev = __dev_get_by_name(net, "tunl0"); 347d607032dSWang Chen if (dev) { 3485bc3eb7eSStephen Hemminger const struct net_device_ops *ops = dev->netdev_ops; 349d607032dSWang Chen struct ifreq ifr; 350d607032dSWang Chen struct ip_tunnel_parm p; 351d607032dSWang Chen 352d607032dSWang Chen memset(&p, 0, sizeof(p)); 353d607032dSWang Chen p.iph.daddr = v->vifc_rmt_addr.s_addr; 354d607032dSWang Chen p.iph.saddr = v->vifc_lcl_addr.s_addr; 355d607032dSWang Chen p.iph.version = 4; 356d607032dSWang Chen p.iph.ihl = 5; 357d607032dSWang Chen p.iph.protocol = IPPROTO_IPIP; 358d607032dSWang Chen sprintf(p.name, "dvmrp%d", v->vifc_vifi); 359d607032dSWang Chen ifr.ifr_ifru.ifru_data = (__force void __user *)&p; 360d607032dSWang Chen 3615bc3eb7eSStephen Hemminger if (ops->ndo_do_ioctl) { 3625bc3eb7eSStephen Hemminger mm_segment_t oldfs = get_fs(); 3635bc3eb7eSStephen Hemminger 3645bc3eb7eSStephen Hemminger set_fs(KERNEL_DS); 3655bc3eb7eSStephen Hemminger ops->ndo_do_ioctl(dev, &ifr, SIOCDELTUNNEL); 366d607032dSWang Chen set_fs(oldfs); 367d607032dSWang Chen } 368d607032dSWang Chen } 3695bc3eb7eSStephen Hemminger } 370d607032dSWang Chen 3711da177e4SLinus Torvalds static 3724feb88e5SBenjamin Thery struct net_device *ipmr_new_tunnel(struct net *net, struct vifctl *v) 3731da177e4SLinus Torvalds { 3741da177e4SLinus Torvalds struct net_device *dev; 3751da177e4SLinus Torvalds 3764feb88e5SBenjamin Thery dev = __dev_get_by_name(net, "tunl0"); 3771da177e4SLinus Torvalds 3781da177e4SLinus Torvalds if (dev) { 3795bc3eb7eSStephen Hemminger const struct net_device_ops *ops = dev->netdev_ops; 3801da177e4SLinus Torvalds int err; 3811da177e4SLinus Torvalds struct ifreq ifr; 3821da177e4SLinus Torvalds struct ip_tunnel_parm p; 3831da177e4SLinus Torvalds struct in_device *in_dev; 3841da177e4SLinus Torvalds 3851da177e4SLinus Torvalds memset(&p, 0, sizeof(p)); 3861da177e4SLinus Torvalds p.iph.daddr = v->vifc_rmt_addr.s_addr; 3871da177e4SLinus Torvalds p.iph.saddr = v->vifc_lcl_addr.s_addr; 3881da177e4SLinus Torvalds p.iph.version = 4; 3891da177e4SLinus Torvalds p.iph.ihl = 5; 3901da177e4SLinus Torvalds p.iph.protocol = IPPROTO_IPIP; 3911da177e4SLinus Torvalds sprintf(p.name, "dvmrp%d", v->vifc_vifi); 392ba93ef74SStephen Hemminger ifr.ifr_ifru.ifru_data = (__force void __user *)&p; 3931da177e4SLinus Torvalds 3945bc3eb7eSStephen Hemminger if (ops->ndo_do_ioctl) { 3955bc3eb7eSStephen Hemminger mm_segment_t oldfs = get_fs(); 3965bc3eb7eSStephen Hemminger 3975bc3eb7eSStephen Hemminger set_fs(KERNEL_DS); 3985bc3eb7eSStephen Hemminger err = ops->ndo_do_ioctl(dev, &ifr, SIOCADDTUNNEL); 3991da177e4SLinus Torvalds set_fs(oldfs); 400a8cb16ddSEric Dumazet } else { 4015bc3eb7eSStephen Hemminger err = -EOPNOTSUPP; 402a8cb16ddSEric Dumazet } 4031da177e4SLinus Torvalds dev = NULL; 4041da177e4SLinus Torvalds 4054feb88e5SBenjamin Thery if (err == 0 && 4064feb88e5SBenjamin Thery (dev = __dev_get_by_name(net, p.name)) != NULL) { 4071da177e4SLinus Torvalds dev->flags |= IFF_MULTICAST; 4081da177e4SLinus Torvalds 409e5ed6399SHerbert Xu in_dev = __in_dev_get_rtnl(dev); 41071e27da9SHerbert Xu if (in_dev == NULL) 4111da177e4SLinus Torvalds goto failure; 41271e27da9SHerbert Xu 41371e27da9SHerbert Xu ipv4_devconf_setall(in_dev); 41471e27da9SHerbert Xu IPV4_DEVCONF(in_dev->cnf, RP_FILTER) = 0; 4151da177e4SLinus Torvalds 4161da177e4SLinus Torvalds if (dev_open(dev)) 4171da177e4SLinus Torvalds goto failure; 4187dc00c82SWang Chen dev_hold(dev); 4191da177e4SLinus Torvalds } 4201da177e4SLinus Torvalds } 4211da177e4SLinus Torvalds return dev; 4221da177e4SLinus Torvalds 4231da177e4SLinus Torvalds failure: 4241da177e4SLinus Torvalds /* allow the register to be completed before unregistering. */ 4251da177e4SLinus Torvalds rtnl_unlock(); 4261da177e4SLinus Torvalds rtnl_lock(); 4271da177e4SLinus Torvalds 4281da177e4SLinus Torvalds unregister_netdevice(dev); 4291da177e4SLinus Torvalds return NULL; 4301da177e4SLinus Torvalds } 4311da177e4SLinus Torvalds 4321da177e4SLinus Torvalds #ifdef CONFIG_IP_PIMSM 4331da177e4SLinus Torvalds 4346fef4c0cSStephen Hemminger static netdev_tx_t reg_vif_xmit(struct sk_buff *skb, struct net_device *dev) 4351da177e4SLinus Torvalds { 4364feb88e5SBenjamin Thery struct net *net = dev_net(dev); 437f0ad0860SPatrick McHardy struct mr_table *mrt; 438f0ad0860SPatrick McHardy struct flowi fl = { 439f0ad0860SPatrick McHardy .oif = dev->ifindex, 440f0ad0860SPatrick McHardy .iif = skb->skb_iif, 441f0ad0860SPatrick McHardy .mark = skb->mark, 442f0ad0860SPatrick McHardy }; 443f0ad0860SPatrick McHardy int err; 444f0ad0860SPatrick McHardy 445f0ad0860SPatrick McHardy err = ipmr_fib_lookup(net, &fl, &mrt); 446e40dbc51SBen Greear if (err < 0) { 447e40dbc51SBen Greear kfree_skb(skb); 448f0ad0860SPatrick McHardy return err; 449e40dbc51SBen Greear } 4504feb88e5SBenjamin Thery 4511da177e4SLinus Torvalds read_lock(&mrt_lock); 452cf3677aeSPavel Emelyanov dev->stats.tx_bytes += skb->len; 453cf3677aeSPavel Emelyanov dev->stats.tx_packets++; 4540c12295aSPatrick McHardy ipmr_cache_report(mrt, skb, mrt->mroute_reg_vif_num, IGMPMSG_WHOLEPKT); 4551da177e4SLinus Torvalds read_unlock(&mrt_lock); 4561da177e4SLinus Torvalds kfree_skb(skb); 4576ed10654SPatrick McHardy return NETDEV_TX_OK; 4581da177e4SLinus Torvalds } 4591da177e4SLinus Torvalds 460007c3838SStephen Hemminger static const struct net_device_ops reg_vif_netdev_ops = { 461007c3838SStephen Hemminger .ndo_start_xmit = reg_vif_xmit, 462007c3838SStephen Hemminger }; 463007c3838SStephen Hemminger 4641da177e4SLinus Torvalds static void reg_vif_setup(struct net_device *dev) 4651da177e4SLinus Torvalds { 4661da177e4SLinus Torvalds dev->type = ARPHRD_PIMREG; 46746f25dffSKris Katterjohn dev->mtu = ETH_DATA_LEN - sizeof(struct iphdr) - 8; 4681da177e4SLinus Torvalds dev->flags = IFF_NOARP; 469007c3838SStephen Hemminger dev->netdev_ops = ®_vif_netdev_ops, 4701da177e4SLinus Torvalds dev->destructor = free_netdev; 471403dbb97STom Goff dev->features |= NETIF_F_NETNS_LOCAL; 4721da177e4SLinus Torvalds } 4731da177e4SLinus Torvalds 474f0ad0860SPatrick McHardy static struct net_device *ipmr_reg_vif(struct net *net, struct mr_table *mrt) 4751da177e4SLinus Torvalds { 4761da177e4SLinus Torvalds struct net_device *dev; 4771da177e4SLinus Torvalds struct in_device *in_dev; 478f0ad0860SPatrick McHardy char name[IFNAMSIZ]; 4791da177e4SLinus Torvalds 480f0ad0860SPatrick McHardy if (mrt->id == RT_TABLE_DEFAULT) 481f0ad0860SPatrick McHardy sprintf(name, "pimreg"); 482f0ad0860SPatrick McHardy else 483f0ad0860SPatrick McHardy sprintf(name, "pimreg%u", mrt->id); 484f0ad0860SPatrick McHardy 485f0ad0860SPatrick McHardy dev = alloc_netdev(0, name, reg_vif_setup); 4861da177e4SLinus Torvalds 4871da177e4SLinus Torvalds if (dev == NULL) 4881da177e4SLinus Torvalds return NULL; 4891da177e4SLinus Torvalds 490403dbb97STom Goff dev_net_set(dev, net); 491403dbb97STom Goff 4921da177e4SLinus Torvalds if (register_netdevice(dev)) { 4931da177e4SLinus Torvalds free_netdev(dev); 4941da177e4SLinus Torvalds return NULL; 4951da177e4SLinus Torvalds } 4961da177e4SLinus Torvalds dev->iflink = 0; 4971da177e4SLinus Torvalds 49871e27da9SHerbert Xu rcu_read_lock(); 499a8cb16ddSEric Dumazet in_dev = __in_dev_get_rcu(dev); 500a8cb16ddSEric Dumazet if (!in_dev) { 50171e27da9SHerbert Xu rcu_read_unlock(); 5021da177e4SLinus Torvalds goto failure; 50371e27da9SHerbert Xu } 5041da177e4SLinus Torvalds 50571e27da9SHerbert Xu ipv4_devconf_setall(in_dev); 50671e27da9SHerbert Xu IPV4_DEVCONF(in_dev->cnf, RP_FILTER) = 0; 50771e27da9SHerbert Xu rcu_read_unlock(); 5081da177e4SLinus Torvalds 5091da177e4SLinus Torvalds if (dev_open(dev)) 5101da177e4SLinus Torvalds goto failure; 5111da177e4SLinus Torvalds 5127dc00c82SWang Chen dev_hold(dev); 5137dc00c82SWang Chen 5141da177e4SLinus Torvalds return dev; 5151da177e4SLinus Torvalds 5161da177e4SLinus Torvalds failure: 5171da177e4SLinus Torvalds /* allow the register to be completed before unregistering. */ 5181da177e4SLinus Torvalds rtnl_unlock(); 5191da177e4SLinus Torvalds rtnl_lock(); 5201da177e4SLinus Torvalds 5211da177e4SLinus Torvalds unregister_netdevice(dev); 5221da177e4SLinus Torvalds return NULL; 5231da177e4SLinus Torvalds } 5241da177e4SLinus Torvalds #endif 5251da177e4SLinus Torvalds 5261da177e4SLinus Torvalds /* 5271da177e4SLinus Torvalds * Delete a VIF entry 5287dc00c82SWang Chen * @notify: Set to 1, if the caller is a notifier_call 5291da177e4SLinus Torvalds */ 5301da177e4SLinus Torvalds 5310c12295aSPatrick McHardy static int vif_delete(struct mr_table *mrt, int vifi, int notify, 532d17fa6faSEric Dumazet struct list_head *head) 5331da177e4SLinus Torvalds { 5341da177e4SLinus Torvalds struct vif_device *v; 5351da177e4SLinus Torvalds struct net_device *dev; 5361da177e4SLinus Torvalds struct in_device *in_dev; 5371da177e4SLinus Torvalds 5380c12295aSPatrick McHardy if (vifi < 0 || vifi >= mrt->maxvif) 5391da177e4SLinus Torvalds return -EADDRNOTAVAIL; 5401da177e4SLinus Torvalds 5410c12295aSPatrick McHardy v = &mrt->vif_table[vifi]; 5421da177e4SLinus Torvalds 5431da177e4SLinus Torvalds write_lock_bh(&mrt_lock); 5441da177e4SLinus Torvalds dev = v->dev; 5451da177e4SLinus Torvalds v->dev = NULL; 5461da177e4SLinus Torvalds 5471da177e4SLinus Torvalds if (!dev) { 5481da177e4SLinus Torvalds write_unlock_bh(&mrt_lock); 5491da177e4SLinus Torvalds return -EADDRNOTAVAIL; 5501da177e4SLinus Torvalds } 5511da177e4SLinus Torvalds 5521da177e4SLinus Torvalds #ifdef CONFIG_IP_PIMSM 5530c12295aSPatrick McHardy if (vifi == mrt->mroute_reg_vif_num) 5540c12295aSPatrick McHardy mrt->mroute_reg_vif_num = -1; 5551da177e4SLinus Torvalds #endif 5561da177e4SLinus Torvalds 5570c12295aSPatrick McHardy if (vifi + 1 == mrt->maxvif) { 5581da177e4SLinus Torvalds int tmp; 559a8cb16ddSEric Dumazet 5601da177e4SLinus Torvalds for (tmp = vifi - 1; tmp >= 0; tmp--) { 5610c12295aSPatrick McHardy if (VIF_EXISTS(mrt, tmp)) 5621da177e4SLinus Torvalds break; 5631da177e4SLinus Torvalds } 5640c12295aSPatrick McHardy mrt->maxvif = tmp+1; 5651da177e4SLinus Torvalds } 5661da177e4SLinus Torvalds 5671da177e4SLinus Torvalds write_unlock_bh(&mrt_lock); 5681da177e4SLinus Torvalds 5691da177e4SLinus Torvalds dev_set_allmulti(dev, -1); 5701da177e4SLinus Torvalds 571a8cb16ddSEric Dumazet in_dev = __in_dev_get_rtnl(dev); 572a8cb16ddSEric Dumazet if (in_dev) { 57342f811b8SHerbert Xu IPV4_DEVCONF(in_dev->cnf, MC_FORWARDING)--; 5741da177e4SLinus Torvalds ip_rt_multicast_event(in_dev); 5751da177e4SLinus Torvalds } 5761da177e4SLinus Torvalds 5777dc00c82SWang Chen if (v->flags & (VIFF_TUNNEL | VIFF_REGISTER) && !notify) 578d17fa6faSEric Dumazet unregister_netdevice_queue(dev, head); 5791da177e4SLinus Torvalds 5801da177e4SLinus Torvalds dev_put(dev); 5811da177e4SLinus Torvalds return 0; 5821da177e4SLinus Torvalds } 5831da177e4SLinus Torvalds 584a8c9486bSEric Dumazet static void ipmr_cache_free_rcu(struct rcu_head *head) 585a8c9486bSEric Dumazet { 586a8c9486bSEric Dumazet struct mfc_cache *c = container_of(head, struct mfc_cache, rcu); 587a8c9486bSEric Dumazet 588a8c9486bSEric Dumazet kmem_cache_free(mrt_cachep, c); 589a8c9486bSEric Dumazet } 590a8c9486bSEric Dumazet 5915c0a66f5SBenjamin Thery static inline void ipmr_cache_free(struct mfc_cache *c) 5925c0a66f5SBenjamin Thery { 593a8c9486bSEric Dumazet call_rcu(&c->rcu, ipmr_cache_free_rcu); 5945c0a66f5SBenjamin Thery } 5955c0a66f5SBenjamin Thery 5961da177e4SLinus Torvalds /* Destroy an unresolved cache entry, killing queued skbs 597a8cb16ddSEric Dumazet * and reporting error to netlink readers. 5981da177e4SLinus Torvalds */ 5991da177e4SLinus Torvalds 6000c12295aSPatrick McHardy static void ipmr_destroy_unres(struct mr_table *mrt, struct mfc_cache *c) 6011da177e4SLinus Torvalds { 6028de53dfbSPatrick McHardy struct net *net = read_pnet(&mrt->net); 6031da177e4SLinus Torvalds struct sk_buff *skb; 6049ef1d4c7SPatrick McHardy struct nlmsgerr *e; 6051da177e4SLinus Torvalds 6060c12295aSPatrick McHardy atomic_dec(&mrt->cache_resolve_queue_len); 6071da177e4SLinus Torvalds 6081da177e4SLinus Torvalds while ((skb = skb_dequeue(&c->mfc_un.unres.unresolved))) { 609eddc9ec5SArnaldo Carvalho de Melo if (ip_hdr(skb)->version == 0) { 6101da177e4SLinus Torvalds struct nlmsghdr *nlh = (struct nlmsghdr *)skb_pull(skb, sizeof(struct iphdr)); 6111da177e4SLinus Torvalds nlh->nlmsg_type = NLMSG_ERROR; 6121da177e4SLinus Torvalds nlh->nlmsg_len = NLMSG_LENGTH(sizeof(struct nlmsgerr)); 6131da177e4SLinus Torvalds skb_trim(skb, nlh->nlmsg_len); 6149ef1d4c7SPatrick McHardy e = NLMSG_DATA(nlh); 6159ef1d4c7SPatrick McHardy e->error = -ETIMEDOUT; 6169ef1d4c7SPatrick McHardy memset(&e->msg, 0, sizeof(e->msg)); 6172942e900SThomas Graf 6184feb88e5SBenjamin Thery rtnl_unicast(skb, net, NETLINK_CB(skb).pid); 619a8cb16ddSEric Dumazet } else { 6201da177e4SLinus Torvalds kfree_skb(skb); 6211da177e4SLinus Torvalds } 622a8cb16ddSEric Dumazet } 6231da177e4SLinus Torvalds 6245c0a66f5SBenjamin Thery ipmr_cache_free(c); 6251da177e4SLinus Torvalds } 6261da177e4SLinus Torvalds 6271da177e4SLinus Torvalds 628e258beb2SPatrick McHardy /* Timer process for the unresolved queue. */ 6291da177e4SLinus Torvalds 630e258beb2SPatrick McHardy static void ipmr_expire_process(unsigned long arg) 6311da177e4SLinus Torvalds { 6320c12295aSPatrick McHardy struct mr_table *mrt = (struct mr_table *)arg; 6331da177e4SLinus Torvalds unsigned long now; 6341da177e4SLinus Torvalds unsigned long expires; 635862465f2SPatrick McHardy struct mfc_cache *c, *next; 6361da177e4SLinus Torvalds 6371da177e4SLinus Torvalds if (!spin_trylock(&mfc_unres_lock)) { 6380c12295aSPatrick McHardy mod_timer(&mrt->ipmr_expire_timer, jiffies+HZ/10); 6391da177e4SLinus Torvalds return; 6401da177e4SLinus Torvalds } 6411da177e4SLinus Torvalds 6420c12295aSPatrick McHardy if (list_empty(&mrt->mfc_unres_queue)) 6431da177e4SLinus Torvalds goto out; 6441da177e4SLinus Torvalds 6451da177e4SLinus Torvalds now = jiffies; 6461da177e4SLinus Torvalds expires = 10*HZ; 6471da177e4SLinus Torvalds 6480c12295aSPatrick McHardy list_for_each_entry_safe(c, next, &mrt->mfc_unres_queue, list) { 6491da177e4SLinus Torvalds if (time_after(c->mfc_un.unres.expires, now)) { 6501da177e4SLinus Torvalds unsigned long interval = c->mfc_un.unres.expires - now; 6511da177e4SLinus Torvalds if (interval < expires) 6521da177e4SLinus Torvalds expires = interval; 6531da177e4SLinus Torvalds continue; 6541da177e4SLinus Torvalds } 6551da177e4SLinus Torvalds 656862465f2SPatrick McHardy list_del(&c->list); 6570c12295aSPatrick McHardy ipmr_destroy_unres(mrt, c); 6581da177e4SLinus Torvalds } 6591da177e4SLinus Torvalds 6600c12295aSPatrick McHardy if (!list_empty(&mrt->mfc_unres_queue)) 6610c12295aSPatrick McHardy mod_timer(&mrt->ipmr_expire_timer, jiffies + expires); 6621da177e4SLinus Torvalds 6631da177e4SLinus Torvalds out: 6641da177e4SLinus Torvalds spin_unlock(&mfc_unres_lock); 6651da177e4SLinus Torvalds } 6661da177e4SLinus Torvalds 6671da177e4SLinus Torvalds /* Fill oifs list. It is called under write locked mrt_lock. */ 6681da177e4SLinus Torvalds 6690c12295aSPatrick McHardy static void ipmr_update_thresholds(struct mr_table *mrt, struct mfc_cache *cache, 670d658f8a0SPatrick McHardy unsigned char *ttls) 6711da177e4SLinus Torvalds { 6721da177e4SLinus Torvalds int vifi; 6731da177e4SLinus Torvalds 6741da177e4SLinus Torvalds cache->mfc_un.res.minvif = MAXVIFS; 6751da177e4SLinus Torvalds cache->mfc_un.res.maxvif = 0; 6761da177e4SLinus Torvalds memset(cache->mfc_un.res.ttls, 255, MAXVIFS); 6771da177e4SLinus Torvalds 6780c12295aSPatrick McHardy for (vifi = 0; vifi < mrt->maxvif; vifi++) { 6790c12295aSPatrick McHardy if (VIF_EXISTS(mrt, vifi) && 680cf958ae3SBenjamin Thery ttls[vifi] && ttls[vifi] < 255) { 6811da177e4SLinus Torvalds cache->mfc_un.res.ttls[vifi] = ttls[vifi]; 6821da177e4SLinus Torvalds if (cache->mfc_un.res.minvif > vifi) 6831da177e4SLinus Torvalds cache->mfc_un.res.minvif = vifi; 6841da177e4SLinus Torvalds if (cache->mfc_un.res.maxvif <= vifi) 6851da177e4SLinus Torvalds cache->mfc_un.res.maxvif = vifi + 1; 6861da177e4SLinus Torvalds } 6871da177e4SLinus Torvalds } 6881da177e4SLinus Torvalds } 6891da177e4SLinus Torvalds 6900c12295aSPatrick McHardy static int vif_add(struct net *net, struct mr_table *mrt, 6910c12295aSPatrick McHardy struct vifctl *vifc, int mrtsock) 6921da177e4SLinus Torvalds { 6931da177e4SLinus Torvalds int vifi = vifc->vifc_vifi; 6940c12295aSPatrick McHardy struct vif_device *v = &mrt->vif_table[vifi]; 6951da177e4SLinus Torvalds struct net_device *dev; 6961da177e4SLinus Torvalds struct in_device *in_dev; 697d607032dSWang Chen int err; 6981da177e4SLinus Torvalds 6991da177e4SLinus Torvalds /* Is vif busy ? */ 7000c12295aSPatrick McHardy if (VIF_EXISTS(mrt, vifi)) 7011da177e4SLinus Torvalds return -EADDRINUSE; 7021da177e4SLinus Torvalds 7031da177e4SLinus Torvalds switch (vifc->vifc_flags) { 7041da177e4SLinus Torvalds #ifdef CONFIG_IP_PIMSM 7051da177e4SLinus Torvalds case VIFF_REGISTER: 7061da177e4SLinus Torvalds /* 7071da177e4SLinus Torvalds * Special Purpose VIF in PIM 7081da177e4SLinus Torvalds * All the packets will be sent to the daemon 7091da177e4SLinus Torvalds */ 7100c12295aSPatrick McHardy if (mrt->mroute_reg_vif_num >= 0) 7111da177e4SLinus Torvalds return -EADDRINUSE; 712f0ad0860SPatrick McHardy dev = ipmr_reg_vif(net, mrt); 7131da177e4SLinus Torvalds if (!dev) 7141da177e4SLinus Torvalds return -ENOBUFS; 715d607032dSWang Chen err = dev_set_allmulti(dev, 1); 716d607032dSWang Chen if (err) { 717d607032dSWang Chen unregister_netdevice(dev); 7187dc00c82SWang Chen dev_put(dev); 719d607032dSWang Chen return err; 720d607032dSWang Chen } 7211da177e4SLinus Torvalds break; 7221da177e4SLinus Torvalds #endif 7231da177e4SLinus Torvalds case VIFF_TUNNEL: 7244feb88e5SBenjamin Thery dev = ipmr_new_tunnel(net, vifc); 7251da177e4SLinus Torvalds if (!dev) 7261da177e4SLinus Torvalds return -ENOBUFS; 727d607032dSWang Chen err = dev_set_allmulti(dev, 1); 728d607032dSWang Chen if (err) { 729d607032dSWang Chen ipmr_del_tunnel(dev, vifc); 7307dc00c82SWang Chen dev_put(dev); 731d607032dSWang Chen return err; 732d607032dSWang Chen } 7331da177e4SLinus Torvalds break; 734ee5e81f0SIlia K 735ee5e81f0SIlia K case VIFF_USE_IFINDEX: 7361da177e4SLinus Torvalds case 0: 737ee5e81f0SIlia K if (vifc->vifc_flags == VIFF_USE_IFINDEX) { 738ee5e81f0SIlia K dev = dev_get_by_index(net, vifc->vifc_lcl_ifindex); 73995ae6b22SEric Dumazet if (dev && __in_dev_get_rtnl(dev) == NULL) { 740ee5e81f0SIlia K dev_put(dev); 741ee5e81f0SIlia K return -EADDRNOTAVAIL; 742ee5e81f0SIlia K } 743a8cb16ddSEric Dumazet } else { 7444feb88e5SBenjamin Thery dev = ip_dev_find(net, vifc->vifc_lcl_addr.s_addr); 745a8cb16ddSEric Dumazet } 7461da177e4SLinus Torvalds if (!dev) 7471da177e4SLinus Torvalds return -EADDRNOTAVAIL; 748d607032dSWang Chen err = dev_set_allmulti(dev, 1); 7497dc00c82SWang Chen if (err) { 7507dc00c82SWang Chen dev_put(dev); 751d607032dSWang Chen return err; 7527dc00c82SWang Chen } 7531da177e4SLinus Torvalds break; 7541da177e4SLinus Torvalds default: 7551da177e4SLinus Torvalds return -EINVAL; 7561da177e4SLinus Torvalds } 7571da177e4SLinus Torvalds 758a8cb16ddSEric Dumazet in_dev = __in_dev_get_rtnl(dev); 759a8cb16ddSEric Dumazet if (!in_dev) { 760d0490cfdSDan Carpenter dev_put(dev); 7611da177e4SLinus Torvalds return -EADDRNOTAVAIL; 762d0490cfdSDan Carpenter } 76342f811b8SHerbert Xu IPV4_DEVCONF(in_dev->cnf, MC_FORWARDING)++; 7641da177e4SLinus Torvalds ip_rt_multicast_event(in_dev); 7651da177e4SLinus Torvalds 766a8cb16ddSEric Dumazet /* Fill in the VIF structures */ 767a8cb16ddSEric Dumazet 7681da177e4SLinus Torvalds v->rate_limit = vifc->vifc_rate_limit; 7691da177e4SLinus Torvalds v->local = vifc->vifc_lcl_addr.s_addr; 7701da177e4SLinus Torvalds v->remote = vifc->vifc_rmt_addr.s_addr; 7711da177e4SLinus Torvalds v->flags = vifc->vifc_flags; 7721da177e4SLinus Torvalds if (!mrtsock) 7731da177e4SLinus Torvalds v->flags |= VIFF_STATIC; 7741da177e4SLinus Torvalds v->threshold = vifc->vifc_threshold; 7751da177e4SLinus Torvalds v->bytes_in = 0; 7761da177e4SLinus Torvalds v->bytes_out = 0; 7771da177e4SLinus Torvalds v->pkt_in = 0; 7781da177e4SLinus Torvalds v->pkt_out = 0; 7791da177e4SLinus Torvalds v->link = dev->ifindex; 7801da177e4SLinus Torvalds if (v->flags & (VIFF_TUNNEL | VIFF_REGISTER)) 7811da177e4SLinus Torvalds v->link = dev->iflink; 7821da177e4SLinus Torvalds 7831da177e4SLinus Torvalds /* And finish update writing critical data */ 7841da177e4SLinus Torvalds write_lock_bh(&mrt_lock); 7851da177e4SLinus Torvalds v->dev = dev; 7861da177e4SLinus Torvalds #ifdef CONFIG_IP_PIMSM 7871da177e4SLinus Torvalds if (v->flags & VIFF_REGISTER) 7880c12295aSPatrick McHardy mrt->mroute_reg_vif_num = vifi; 7891da177e4SLinus Torvalds #endif 7900c12295aSPatrick McHardy if (vifi+1 > mrt->maxvif) 7910c12295aSPatrick McHardy mrt->maxvif = vifi+1; 7921da177e4SLinus Torvalds write_unlock_bh(&mrt_lock); 7931da177e4SLinus Torvalds return 0; 7941da177e4SLinus Torvalds } 7951da177e4SLinus Torvalds 796a8c9486bSEric Dumazet /* called with rcu_read_lock() */ 7970c12295aSPatrick McHardy static struct mfc_cache *ipmr_cache_find(struct mr_table *mrt, 7984feb88e5SBenjamin Thery __be32 origin, 7994feb88e5SBenjamin Thery __be32 mcastgrp) 8001da177e4SLinus Torvalds { 8011da177e4SLinus Torvalds int line = MFC_HASH(mcastgrp, origin); 8021da177e4SLinus Torvalds struct mfc_cache *c; 8031da177e4SLinus Torvalds 804a8c9486bSEric Dumazet list_for_each_entry_rcu(c, &mrt->mfc_cache_array[line], list) { 8051da177e4SLinus Torvalds if (c->mfc_origin == origin && c->mfc_mcastgrp == mcastgrp) 8061da177e4SLinus Torvalds return c; 8071da177e4SLinus Torvalds } 808862465f2SPatrick McHardy return NULL; 809862465f2SPatrick McHardy } 8101da177e4SLinus Torvalds 8111da177e4SLinus Torvalds /* 8121da177e4SLinus Torvalds * Allocate a multicast cache entry 8131da177e4SLinus Torvalds */ 814d658f8a0SPatrick McHardy static struct mfc_cache *ipmr_cache_alloc(void) 8151da177e4SLinus Torvalds { 816c3762229SRobert P. J. Day struct mfc_cache *c = kmem_cache_zalloc(mrt_cachep, GFP_KERNEL); 817a8c9486bSEric Dumazet 818a8c9486bSEric Dumazet if (c) 8191da177e4SLinus Torvalds c->mfc_un.res.minvif = MAXVIFS; 8201da177e4SLinus Torvalds return c; 8211da177e4SLinus Torvalds } 8221da177e4SLinus Torvalds 823d658f8a0SPatrick McHardy static struct mfc_cache *ipmr_cache_alloc_unres(void) 8241da177e4SLinus Torvalds { 825c3762229SRobert P. J. Day struct mfc_cache *c = kmem_cache_zalloc(mrt_cachep, GFP_ATOMIC); 826a8c9486bSEric Dumazet 827a8c9486bSEric Dumazet if (c) { 8281da177e4SLinus Torvalds skb_queue_head_init(&c->mfc_un.unres.unresolved); 8291da177e4SLinus Torvalds c->mfc_un.unres.expires = jiffies + 10*HZ; 830a8c9486bSEric Dumazet } 8311da177e4SLinus Torvalds return c; 8321da177e4SLinus Torvalds } 8331da177e4SLinus Torvalds 8341da177e4SLinus Torvalds /* 8351da177e4SLinus Torvalds * A cache entry has gone into a resolved state from queued 8361da177e4SLinus Torvalds */ 8371da177e4SLinus Torvalds 8380c12295aSPatrick McHardy static void ipmr_cache_resolve(struct net *net, struct mr_table *mrt, 8390c12295aSPatrick McHardy struct mfc_cache *uc, struct mfc_cache *c) 8401da177e4SLinus Torvalds { 8411da177e4SLinus Torvalds struct sk_buff *skb; 8429ef1d4c7SPatrick McHardy struct nlmsgerr *e; 8431da177e4SLinus Torvalds 844a8cb16ddSEric Dumazet /* Play the pending entries through our router */ 8451da177e4SLinus Torvalds 8461da177e4SLinus Torvalds while ((skb = __skb_dequeue(&uc->mfc_un.unres.unresolved))) { 847eddc9ec5SArnaldo Carvalho de Melo if (ip_hdr(skb)->version == 0) { 8481da177e4SLinus Torvalds struct nlmsghdr *nlh = (struct nlmsghdr *)skb_pull(skb, sizeof(struct iphdr)); 8491da177e4SLinus Torvalds 850cb6a4e46SPatrick McHardy if (__ipmr_fill_mroute(mrt, skb, c, NLMSG_DATA(nlh)) > 0) { 851a8cb16ddSEric Dumazet nlh->nlmsg_len = skb_tail_pointer(skb) - 852a8cb16ddSEric Dumazet (u8 *)nlh; 8531da177e4SLinus Torvalds } else { 8541da177e4SLinus Torvalds nlh->nlmsg_type = NLMSG_ERROR; 8551da177e4SLinus Torvalds nlh->nlmsg_len = NLMSG_LENGTH(sizeof(struct nlmsgerr)); 8561da177e4SLinus Torvalds skb_trim(skb, nlh->nlmsg_len); 8579ef1d4c7SPatrick McHardy e = NLMSG_DATA(nlh); 8589ef1d4c7SPatrick McHardy e->error = -EMSGSIZE; 8599ef1d4c7SPatrick McHardy memset(&e->msg, 0, sizeof(e->msg)); 8601da177e4SLinus Torvalds } 8612942e900SThomas Graf 862d658f8a0SPatrick McHardy rtnl_unicast(skb, net, NETLINK_CB(skb).pid); 863a8cb16ddSEric Dumazet } else { 8640c12295aSPatrick McHardy ip_mr_forward(net, mrt, skb, c, 0); 8651da177e4SLinus Torvalds } 8661da177e4SLinus Torvalds } 867a8cb16ddSEric Dumazet } 8681da177e4SLinus Torvalds 8691da177e4SLinus Torvalds /* 8701da177e4SLinus Torvalds * Bounce a cache query up to mrouted. We could use netlink for this but mrouted 8711da177e4SLinus Torvalds * expects the following bizarre scheme. 8721da177e4SLinus Torvalds * 8731da177e4SLinus Torvalds * Called under mrt_lock. 8741da177e4SLinus Torvalds */ 8751da177e4SLinus Torvalds 8760c12295aSPatrick McHardy static int ipmr_cache_report(struct mr_table *mrt, 8774feb88e5SBenjamin Thery struct sk_buff *pkt, vifi_t vifi, int assert) 8781da177e4SLinus Torvalds { 8791da177e4SLinus Torvalds struct sk_buff *skb; 880c9bdd4b5SArnaldo Carvalho de Melo const int ihl = ip_hdrlen(pkt); 8811da177e4SLinus Torvalds struct igmphdr *igmp; 8821da177e4SLinus Torvalds struct igmpmsg *msg; 8834c968709SEric Dumazet struct sock *mroute_sk; 8841da177e4SLinus Torvalds int ret; 8851da177e4SLinus Torvalds 8861da177e4SLinus Torvalds #ifdef CONFIG_IP_PIMSM 8871da177e4SLinus Torvalds if (assert == IGMPMSG_WHOLEPKT) 8881da177e4SLinus Torvalds skb = skb_realloc_headroom(pkt, sizeof(struct iphdr)); 8891da177e4SLinus Torvalds else 8901da177e4SLinus Torvalds #endif 8911da177e4SLinus Torvalds skb = alloc_skb(128, GFP_ATOMIC); 8921da177e4SLinus Torvalds 8931da177e4SLinus Torvalds if (!skb) 8941da177e4SLinus Torvalds return -ENOBUFS; 8951da177e4SLinus Torvalds 8961da177e4SLinus Torvalds #ifdef CONFIG_IP_PIMSM 8971da177e4SLinus Torvalds if (assert == IGMPMSG_WHOLEPKT) { 8981da177e4SLinus Torvalds /* Ugly, but we have no choice with this interface. 899a8cb16ddSEric Dumazet * Duplicate old header, fix ihl, length etc. 900a8cb16ddSEric Dumazet * And all this only to mangle msg->im_msgtype and 901a8cb16ddSEric Dumazet * to set msg->im_mbz to "mbz" :-) 9021da177e4SLinus Torvalds */ 903878c8145SArnaldo Carvalho de Melo skb_push(skb, sizeof(struct iphdr)); 904878c8145SArnaldo Carvalho de Melo skb_reset_network_header(skb); 905badff6d0SArnaldo Carvalho de Melo skb_reset_transport_header(skb); 9060272ffc4SArnaldo Carvalho de Melo msg = (struct igmpmsg *)skb_network_header(skb); 907d56f90a7SArnaldo Carvalho de Melo memcpy(msg, skb_network_header(pkt), sizeof(struct iphdr)); 9081da177e4SLinus Torvalds msg->im_msgtype = IGMPMSG_WHOLEPKT; 9091da177e4SLinus Torvalds msg->im_mbz = 0; 9100c12295aSPatrick McHardy msg->im_vif = mrt->mroute_reg_vif_num; 911eddc9ec5SArnaldo Carvalho de Melo ip_hdr(skb)->ihl = sizeof(struct iphdr) >> 2; 912eddc9ec5SArnaldo Carvalho de Melo ip_hdr(skb)->tot_len = htons(ntohs(ip_hdr(pkt)->tot_len) + 913eddc9ec5SArnaldo Carvalho de Melo sizeof(struct iphdr)); 9141da177e4SLinus Torvalds } else 9151da177e4SLinus Torvalds #endif 9161da177e4SLinus Torvalds { 9171da177e4SLinus Torvalds 918a8cb16ddSEric Dumazet /* Copy the IP header */ 9191da177e4SLinus Torvalds 92027a884dcSArnaldo Carvalho de Melo skb->network_header = skb->tail; 921ddc7b8e3SArnaldo Carvalho de Melo skb_put(skb, ihl); 92227d7ff46SArnaldo Carvalho de Melo skb_copy_to_linear_data(skb, pkt->data, ihl); 923eddc9ec5SArnaldo Carvalho de Melo ip_hdr(skb)->protocol = 0; /* Flag to the kernel this is a route add */ 924eddc9ec5SArnaldo Carvalho de Melo msg = (struct igmpmsg *)skb_network_header(skb); 9251da177e4SLinus Torvalds msg->im_vif = vifi; 926adf30907SEric Dumazet skb_dst_set(skb, dst_clone(skb_dst(pkt))); 9271da177e4SLinus Torvalds 928a8cb16ddSEric Dumazet /* Add our header */ 9291da177e4SLinus Torvalds 9301da177e4SLinus Torvalds igmp = (struct igmphdr *)skb_put(skb, sizeof(struct igmphdr)); 9311da177e4SLinus Torvalds igmp->type = 9321da177e4SLinus Torvalds msg->im_msgtype = assert; 9331da177e4SLinus Torvalds igmp->code = 0; 934eddc9ec5SArnaldo Carvalho de Melo ip_hdr(skb)->tot_len = htons(skb->len); /* Fix the length */ 935b0e380b1SArnaldo Carvalho de Melo skb->transport_header = skb->network_header; 9361da177e4SLinus Torvalds } 9371da177e4SLinus Torvalds 9384c968709SEric Dumazet rcu_read_lock(); 9394c968709SEric Dumazet mroute_sk = rcu_dereference(mrt->mroute_sk); 9404c968709SEric Dumazet if (mroute_sk == NULL) { 9414c968709SEric Dumazet rcu_read_unlock(); 9421da177e4SLinus Torvalds kfree_skb(skb); 9431da177e4SLinus Torvalds return -EINVAL; 9441da177e4SLinus Torvalds } 9451da177e4SLinus Torvalds 946a8cb16ddSEric Dumazet /* Deliver to mrouted */ 947a8cb16ddSEric Dumazet 9484c968709SEric Dumazet ret = sock_queue_rcv_skb(mroute_sk, skb); 9494c968709SEric Dumazet rcu_read_unlock(); 95070a269e6SBenjamin Thery if (ret < 0) { 9511da177e4SLinus Torvalds if (net_ratelimit()) 9521da177e4SLinus Torvalds printk(KERN_WARNING "mroute: pending queue full, dropping entries.\n"); 9531da177e4SLinus Torvalds kfree_skb(skb); 9541da177e4SLinus Torvalds } 9551da177e4SLinus Torvalds 9561da177e4SLinus Torvalds return ret; 9571da177e4SLinus Torvalds } 9581da177e4SLinus Torvalds 9591da177e4SLinus Torvalds /* 9601da177e4SLinus Torvalds * Queue a packet for resolution. It gets locked cache entry! 9611da177e4SLinus Torvalds */ 9621da177e4SLinus Torvalds 9631da177e4SLinus Torvalds static int 9640c12295aSPatrick McHardy ipmr_cache_unresolved(struct mr_table *mrt, vifi_t vifi, struct sk_buff *skb) 9651da177e4SLinus Torvalds { 966862465f2SPatrick McHardy bool found = false; 9671da177e4SLinus Torvalds int err; 9681da177e4SLinus Torvalds struct mfc_cache *c; 969eddc9ec5SArnaldo Carvalho de Melo const struct iphdr *iph = ip_hdr(skb); 9701da177e4SLinus Torvalds 9711da177e4SLinus Torvalds spin_lock_bh(&mfc_unres_lock); 9720c12295aSPatrick McHardy list_for_each_entry(c, &mrt->mfc_unres_queue, list) { 973e258beb2SPatrick McHardy if (c->mfc_mcastgrp == iph->daddr && 974862465f2SPatrick McHardy c->mfc_origin == iph->saddr) { 975862465f2SPatrick McHardy found = true; 9761da177e4SLinus Torvalds break; 9771da177e4SLinus Torvalds } 978862465f2SPatrick McHardy } 9791da177e4SLinus Torvalds 980862465f2SPatrick McHardy if (!found) { 981a8cb16ddSEric Dumazet /* Create a new entry if allowable */ 9821da177e4SLinus Torvalds 9830c12295aSPatrick McHardy if (atomic_read(&mrt->cache_resolve_queue_len) >= 10 || 984d658f8a0SPatrick McHardy (c = ipmr_cache_alloc_unres()) == NULL) { 9851da177e4SLinus Torvalds spin_unlock_bh(&mfc_unres_lock); 9861da177e4SLinus Torvalds 9871da177e4SLinus Torvalds kfree_skb(skb); 9881da177e4SLinus Torvalds return -ENOBUFS; 9891da177e4SLinus Torvalds } 9901da177e4SLinus Torvalds 991a8cb16ddSEric Dumazet /* Fill in the new cache entry */ 992a8cb16ddSEric Dumazet 9931da177e4SLinus Torvalds c->mfc_parent = -1; 994eddc9ec5SArnaldo Carvalho de Melo c->mfc_origin = iph->saddr; 995eddc9ec5SArnaldo Carvalho de Melo c->mfc_mcastgrp = iph->daddr; 9961da177e4SLinus Torvalds 997a8cb16ddSEric Dumazet /* Reflect first query at mrouted. */ 998a8cb16ddSEric Dumazet 9990c12295aSPatrick McHardy err = ipmr_cache_report(mrt, skb, vifi, IGMPMSG_NOCACHE); 10004feb88e5SBenjamin Thery if (err < 0) { 10011da177e4SLinus Torvalds /* If the report failed throw the cache entry 10021da177e4SLinus Torvalds out - Brad Parker 10031da177e4SLinus Torvalds */ 10041da177e4SLinus Torvalds spin_unlock_bh(&mfc_unres_lock); 10051da177e4SLinus Torvalds 10065c0a66f5SBenjamin Thery ipmr_cache_free(c); 10071da177e4SLinus Torvalds kfree_skb(skb); 10081da177e4SLinus Torvalds return err; 10091da177e4SLinus Torvalds } 10101da177e4SLinus Torvalds 10110c12295aSPatrick McHardy atomic_inc(&mrt->cache_resolve_queue_len); 10120c12295aSPatrick McHardy list_add(&c->list, &mrt->mfc_unres_queue); 10131da177e4SLinus Torvalds 1014278554bdSDavid S. Miller if (atomic_read(&mrt->cache_resolve_queue_len) == 1) 10150c12295aSPatrick McHardy mod_timer(&mrt->ipmr_expire_timer, c->mfc_un.unres.expires); 10161da177e4SLinus Torvalds } 10171da177e4SLinus Torvalds 1018a8cb16ddSEric Dumazet /* See if we can append the packet */ 1019a8cb16ddSEric Dumazet 10201da177e4SLinus Torvalds if (c->mfc_un.unres.unresolved.qlen > 3) { 10211da177e4SLinus Torvalds kfree_skb(skb); 10221da177e4SLinus Torvalds err = -ENOBUFS; 10231da177e4SLinus Torvalds } else { 10241da177e4SLinus Torvalds skb_queue_tail(&c->mfc_un.unres.unresolved, skb); 10251da177e4SLinus Torvalds err = 0; 10261da177e4SLinus Torvalds } 10271da177e4SLinus Torvalds 10281da177e4SLinus Torvalds spin_unlock_bh(&mfc_unres_lock); 10291da177e4SLinus Torvalds return err; 10301da177e4SLinus Torvalds } 10311da177e4SLinus Torvalds 10321da177e4SLinus Torvalds /* 10331da177e4SLinus Torvalds * MFC cache manipulation by user space mroute daemon 10341da177e4SLinus Torvalds */ 10351da177e4SLinus Torvalds 10360c12295aSPatrick McHardy static int ipmr_mfc_delete(struct mr_table *mrt, struct mfcctl *mfc) 10371da177e4SLinus Torvalds { 10381da177e4SLinus Torvalds int line; 1039862465f2SPatrick McHardy struct mfc_cache *c, *next; 10401da177e4SLinus Torvalds 10411da177e4SLinus Torvalds line = MFC_HASH(mfc->mfcc_mcastgrp.s_addr, mfc->mfcc_origin.s_addr); 10421da177e4SLinus Torvalds 10430c12295aSPatrick McHardy list_for_each_entry_safe(c, next, &mrt->mfc_cache_array[line], list) { 10441da177e4SLinus Torvalds if (c->mfc_origin == mfc->mfcc_origin.s_addr && 10451da177e4SLinus Torvalds c->mfc_mcastgrp == mfc->mfcc_mcastgrp.s_addr) { 1046a8c9486bSEric Dumazet list_del_rcu(&c->list); 10471da177e4SLinus Torvalds 10485c0a66f5SBenjamin Thery ipmr_cache_free(c); 10491da177e4SLinus Torvalds return 0; 10501da177e4SLinus Torvalds } 10511da177e4SLinus Torvalds } 10521da177e4SLinus Torvalds return -ENOENT; 10531da177e4SLinus Torvalds } 10541da177e4SLinus Torvalds 10550c12295aSPatrick McHardy static int ipmr_mfc_add(struct net *net, struct mr_table *mrt, 10560c12295aSPatrick McHardy struct mfcctl *mfc, int mrtsock) 10571da177e4SLinus Torvalds { 1058862465f2SPatrick McHardy bool found = false; 10591da177e4SLinus Torvalds int line; 1060862465f2SPatrick McHardy struct mfc_cache *uc, *c; 10611da177e4SLinus Torvalds 1062a50436f2SPatrick McHardy if (mfc->mfcc_parent >= MAXVIFS) 1063a50436f2SPatrick McHardy return -ENFILE; 1064a50436f2SPatrick McHardy 10651da177e4SLinus Torvalds line = MFC_HASH(mfc->mfcc_mcastgrp.s_addr, mfc->mfcc_origin.s_addr); 10661da177e4SLinus Torvalds 10670c12295aSPatrick McHardy list_for_each_entry(c, &mrt->mfc_cache_array[line], list) { 10681da177e4SLinus Torvalds if (c->mfc_origin == mfc->mfcc_origin.s_addr && 1069862465f2SPatrick McHardy c->mfc_mcastgrp == mfc->mfcc_mcastgrp.s_addr) { 1070862465f2SPatrick McHardy found = true; 10711da177e4SLinus Torvalds break; 10721da177e4SLinus Torvalds } 1073862465f2SPatrick McHardy } 10741da177e4SLinus Torvalds 1075862465f2SPatrick McHardy if (found) { 10761da177e4SLinus Torvalds write_lock_bh(&mrt_lock); 10771da177e4SLinus Torvalds c->mfc_parent = mfc->mfcc_parent; 10780c12295aSPatrick McHardy ipmr_update_thresholds(mrt, c, mfc->mfcc_ttls); 10791da177e4SLinus Torvalds if (!mrtsock) 10801da177e4SLinus Torvalds c->mfc_flags |= MFC_STATIC; 10811da177e4SLinus Torvalds write_unlock_bh(&mrt_lock); 10821da177e4SLinus Torvalds return 0; 10831da177e4SLinus Torvalds } 10841da177e4SLinus Torvalds 1085f97c1e0cSJoe Perches if (!ipv4_is_multicast(mfc->mfcc_mcastgrp.s_addr)) 10861da177e4SLinus Torvalds return -EINVAL; 10871da177e4SLinus Torvalds 1088d658f8a0SPatrick McHardy c = ipmr_cache_alloc(); 10891da177e4SLinus Torvalds if (c == NULL) 10901da177e4SLinus Torvalds return -ENOMEM; 10911da177e4SLinus Torvalds 10921da177e4SLinus Torvalds c->mfc_origin = mfc->mfcc_origin.s_addr; 10931da177e4SLinus Torvalds c->mfc_mcastgrp = mfc->mfcc_mcastgrp.s_addr; 10941da177e4SLinus Torvalds c->mfc_parent = mfc->mfcc_parent; 10950c12295aSPatrick McHardy ipmr_update_thresholds(mrt, c, mfc->mfcc_ttls); 10961da177e4SLinus Torvalds if (!mrtsock) 10971da177e4SLinus Torvalds c->mfc_flags |= MFC_STATIC; 10981da177e4SLinus Torvalds 1099a8c9486bSEric Dumazet list_add_rcu(&c->list, &mrt->mfc_cache_array[line]); 11001da177e4SLinus Torvalds 11011da177e4SLinus Torvalds /* 11021da177e4SLinus Torvalds * Check to see if we resolved a queued list. If so we 11031da177e4SLinus Torvalds * need to send on the frames and tidy up. 11041da177e4SLinus Torvalds */ 1105b0ebb739SPatrick McHardy found = false; 11061da177e4SLinus Torvalds spin_lock_bh(&mfc_unres_lock); 11070c12295aSPatrick McHardy list_for_each_entry(uc, &mrt->mfc_unres_queue, list) { 1108e258beb2SPatrick McHardy if (uc->mfc_origin == c->mfc_origin && 11091da177e4SLinus Torvalds uc->mfc_mcastgrp == c->mfc_mcastgrp) { 1110862465f2SPatrick McHardy list_del(&uc->list); 11110c12295aSPatrick McHardy atomic_dec(&mrt->cache_resolve_queue_len); 1112b0ebb739SPatrick McHardy found = true; 11131da177e4SLinus Torvalds break; 11141da177e4SLinus Torvalds } 11151da177e4SLinus Torvalds } 11160c12295aSPatrick McHardy if (list_empty(&mrt->mfc_unres_queue)) 11170c12295aSPatrick McHardy del_timer(&mrt->ipmr_expire_timer); 11181da177e4SLinus Torvalds spin_unlock_bh(&mfc_unres_lock); 11191da177e4SLinus Torvalds 1120b0ebb739SPatrick McHardy if (found) { 11210c12295aSPatrick McHardy ipmr_cache_resolve(net, mrt, uc, c); 11225c0a66f5SBenjamin Thery ipmr_cache_free(uc); 11231da177e4SLinus Torvalds } 11241da177e4SLinus Torvalds return 0; 11251da177e4SLinus Torvalds } 11261da177e4SLinus Torvalds 11271da177e4SLinus Torvalds /* 11281da177e4SLinus Torvalds * Close the multicast socket, and clear the vif tables etc 11291da177e4SLinus Torvalds */ 11301da177e4SLinus Torvalds 11310c12295aSPatrick McHardy static void mroute_clean_tables(struct mr_table *mrt) 11321da177e4SLinus Torvalds { 11331da177e4SLinus Torvalds int i; 1134d17fa6faSEric Dumazet LIST_HEAD(list); 1135862465f2SPatrick McHardy struct mfc_cache *c, *next; 11361da177e4SLinus Torvalds 1137a8cb16ddSEric Dumazet /* Shut down all active vif entries */ 1138a8cb16ddSEric Dumazet 11390c12295aSPatrick McHardy for (i = 0; i < mrt->maxvif; i++) { 11400c12295aSPatrick McHardy if (!(mrt->vif_table[i].flags & VIFF_STATIC)) 11410c12295aSPatrick McHardy vif_delete(mrt, i, 0, &list); 11421da177e4SLinus Torvalds } 1143d17fa6faSEric Dumazet unregister_netdevice_many(&list); 11441da177e4SLinus Torvalds 1145a8cb16ddSEric Dumazet /* Wipe the cache */ 1146a8cb16ddSEric Dumazet 11471da177e4SLinus Torvalds for (i = 0; i < MFC_LINES; i++) { 11480c12295aSPatrick McHardy list_for_each_entry_safe(c, next, &mrt->mfc_cache_array[i], list) { 1149862465f2SPatrick McHardy if (c->mfc_flags & MFC_STATIC) 11501da177e4SLinus Torvalds continue; 1151a8c9486bSEric Dumazet list_del_rcu(&c->list); 11525c0a66f5SBenjamin Thery ipmr_cache_free(c); 11531da177e4SLinus Torvalds } 11541da177e4SLinus Torvalds } 11551da177e4SLinus Torvalds 11560c12295aSPatrick McHardy if (atomic_read(&mrt->cache_resolve_queue_len) != 0) { 11571da177e4SLinus Torvalds spin_lock_bh(&mfc_unres_lock); 11580c12295aSPatrick McHardy list_for_each_entry_safe(c, next, &mrt->mfc_unres_queue, list) { 1159862465f2SPatrick McHardy list_del(&c->list); 11600c12295aSPatrick McHardy ipmr_destroy_unres(mrt, c); 11611da177e4SLinus Torvalds } 11621da177e4SLinus Torvalds spin_unlock_bh(&mfc_unres_lock); 11631da177e4SLinus Torvalds } 11641da177e4SLinus Torvalds } 11651da177e4SLinus Torvalds 11664c968709SEric Dumazet /* called from ip_ra_control(), before an RCU grace period, 11674c968709SEric Dumazet * we dont need to call synchronize_rcu() here 11684c968709SEric Dumazet */ 11691da177e4SLinus Torvalds static void mrtsock_destruct(struct sock *sk) 11701da177e4SLinus Torvalds { 11714feb88e5SBenjamin Thery struct net *net = sock_net(sk); 1172f0ad0860SPatrick McHardy struct mr_table *mrt; 11734feb88e5SBenjamin Thery 11741da177e4SLinus Torvalds rtnl_lock(); 1175f0ad0860SPatrick McHardy ipmr_for_each_table(mrt, net) { 11764c968709SEric Dumazet if (sk == rtnl_dereference(mrt->mroute_sk)) { 11774feb88e5SBenjamin Thery IPV4_DEVCONF_ALL(net, MC_FORWARDING)--; 11784c968709SEric Dumazet rcu_assign_pointer(mrt->mroute_sk, NULL); 11790c12295aSPatrick McHardy mroute_clean_tables(mrt); 11801da177e4SLinus Torvalds } 11811da177e4SLinus Torvalds } 11821da177e4SLinus Torvalds rtnl_unlock(); 11831da177e4SLinus Torvalds } 11841da177e4SLinus Torvalds 11851da177e4SLinus Torvalds /* 11861da177e4SLinus Torvalds * Socket options and virtual interface manipulation. The whole 11871da177e4SLinus Torvalds * virtual interface system is a complete heap, but unfortunately 11881da177e4SLinus Torvalds * that's how BSD mrouted happens to think. Maybe one day with a proper 11891da177e4SLinus Torvalds * MOSPF/PIM router set up we can clean this up. 11901da177e4SLinus Torvalds */ 11911da177e4SLinus Torvalds 1192b7058842SDavid S. Miller int ip_mroute_setsockopt(struct sock *sk, int optname, char __user *optval, unsigned int optlen) 11931da177e4SLinus Torvalds { 11941da177e4SLinus Torvalds int ret; 11951da177e4SLinus Torvalds struct vifctl vif; 11961da177e4SLinus Torvalds struct mfcctl mfc; 11974feb88e5SBenjamin Thery struct net *net = sock_net(sk); 1198f0ad0860SPatrick McHardy struct mr_table *mrt; 1199f0ad0860SPatrick McHardy 1200f0ad0860SPatrick McHardy mrt = ipmr_get_table(net, raw_sk(sk)->ipmr_table ? : RT_TABLE_DEFAULT); 1201f0ad0860SPatrick McHardy if (mrt == NULL) 1202f0ad0860SPatrick McHardy return -ENOENT; 12031da177e4SLinus Torvalds 1204132adf54SStephen Hemminger if (optname != MRT_INIT) { 12054c968709SEric Dumazet if (sk != rcu_dereference_raw(mrt->mroute_sk) && 12064c968709SEric Dumazet !capable(CAP_NET_ADMIN)) 12071da177e4SLinus Torvalds return -EACCES; 12081da177e4SLinus Torvalds } 12091da177e4SLinus Torvalds 1210132adf54SStephen Hemminger switch (optname) { 12111da177e4SLinus Torvalds case MRT_INIT: 12121da177e4SLinus Torvalds if (sk->sk_type != SOCK_RAW || 1213c720c7e8SEric Dumazet inet_sk(sk)->inet_num != IPPROTO_IGMP) 12141da177e4SLinus Torvalds return -EOPNOTSUPP; 12151da177e4SLinus Torvalds if (optlen != sizeof(int)) 12161da177e4SLinus Torvalds return -ENOPROTOOPT; 12171da177e4SLinus Torvalds 12181da177e4SLinus Torvalds rtnl_lock(); 12194c968709SEric Dumazet if (rtnl_dereference(mrt->mroute_sk)) { 12201da177e4SLinus Torvalds rtnl_unlock(); 12211da177e4SLinus Torvalds return -EADDRINUSE; 12221da177e4SLinus Torvalds } 12231da177e4SLinus Torvalds 12241da177e4SLinus Torvalds ret = ip_ra_control(sk, 1, mrtsock_destruct); 12251da177e4SLinus Torvalds if (ret == 0) { 12264c968709SEric Dumazet rcu_assign_pointer(mrt->mroute_sk, sk); 12274feb88e5SBenjamin Thery IPV4_DEVCONF_ALL(net, MC_FORWARDING)++; 12281da177e4SLinus Torvalds } 12291da177e4SLinus Torvalds rtnl_unlock(); 12301da177e4SLinus Torvalds return ret; 12311da177e4SLinus Torvalds case MRT_DONE: 12324c968709SEric Dumazet if (sk != rcu_dereference_raw(mrt->mroute_sk)) 12331da177e4SLinus Torvalds return -EACCES; 12341da177e4SLinus Torvalds return ip_ra_control(sk, 0, NULL); 12351da177e4SLinus Torvalds case MRT_ADD_VIF: 12361da177e4SLinus Torvalds case MRT_DEL_VIF: 12371da177e4SLinus Torvalds if (optlen != sizeof(vif)) 12381da177e4SLinus Torvalds return -EINVAL; 12391da177e4SLinus Torvalds if (copy_from_user(&vif, optval, sizeof(vif))) 12401da177e4SLinus Torvalds return -EFAULT; 12411da177e4SLinus Torvalds if (vif.vifc_vifi >= MAXVIFS) 12421da177e4SLinus Torvalds return -ENFILE; 12431da177e4SLinus Torvalds rtnl_lock(); 12441da177e4SLinus Torvalds if (optname == MRT_ADD_VIF) { 12454c968709SEric Dumazet ret = vif_add(net, mrt, &vif, 12464c968709SEric Dumazet sk == rtnl_dereference(mrt->mroute_sk)); 12471da177e4SLinus Torvalds } else { 12480c12295aSPatrick McHardy ret = vif_delete(mrt, vif.vifc_vifi, 0, NULL); 12491da177e4SLinus Torvalds } 12501da177e4SLinus Torvalds rtnl_unlock(); 12511da177e4SLinus Torvalds return ret; 12521da177e4SLinus Torvalds 12531da177e4SLinus Torvalds /* 12541da177e4SLinus Torvalds * Manipulate the forwarding caches. These live 12551da177e4SLinus Torvalds * in a sort of kernel/user symbiosis. 12561da177e4SLinus Torvalds */ 12571da177e4SLinus Torvalds case MRT_ADD_MFC: 12581da177e4SLinus Torvalds case MRT_DEL_MFC: 12591da177e4SLinus Torvalds if (optlen != sizeof(mfc)) 12601da177e4SLinus Torvalds return -EINVAL; 12611da177e4SLinus Torvalds if (copy_from_user(&mfc, optval, sizeof(mfc))) 12621da177e4SLinus Torvalds return -EFAULT; 12631da177e4SLinus Torvalds rtnl_lock(); 12641da177e4SLinus Torvalds if (optname == MRT_DEL_MFC) 12650c12295aSPatrick McHardy ret = ipmr_mfc_delete(mrt, &mfc); 12661da177e4SLinus Torvalds else 12674c968709SEric Dumazet ret = ipmr_mfc_add(net, mrt, &mfc, 12684c968709SEric Dumazet sk == rtnl_dereference(mrt->mroute_sk)); 12691da177e4SLinus Torvalds rtnl_unlock(); 12701da177e4SLinus Torvalds return ret; 12711da177e4SLinus Torvalds /* 12721da177e4SLinus Torvalds * Control PIM assert. 12731da177e4SLinus Torvalds */ 12741da177e4SLinus Torvalds case MRT_ASSERT: 12751da177e4SLinus Torvalds { 12761da177e4SLinus Torvalds int v; 12771da177e4SLinus Torvalds if (get_user(v, (int __user *)optval)) 12781da177e4SLinus Torvalds return -EFAULT; 12790c12295aSPatrick McHardy mrt->mroute_do_assert = (v) ? 1 : 0; 12801da177e4SLinus Torvalds return 0; 12811da177e4SLinus Torvalds } 12821da177e4SLinus Torvalds #ifdef CONFIG_IP_PIMSM 12831da177e4SLinus Torvalds case MRT_PIM: 12841da177e4SLinus Torvalds { 1285ba93ef74SStephen Hemminger int v; 1286ba93ef74SStephen Hemminger 12871da177e4SLinus Torvalds if (get_user(v, (int __user *)optval)) 12881da177e4SLinus Torvalds return -EFAULT; 12891da177e4SLinus Torvalds v = (v) ? 1 : 0; 1290ba93ef74SStephen Hemminger 12911da177e4SLinus Torvalds rtnl_lock(); 12921da177e4SLinus Torvalds ret = 0; 12930c12295aSPatrick McHardy if (v != mrt->mroute_do_pim) { 12940c12295aSPatrick McHardy mrt->mroute_do_pim = v; 12950c12295aSPatrick McHardy mrt->mroute_do_assert = v; 12961da177e4SLinus Torvalds } 12971da177e4SLinus Torvalds rtnl_unlock(); 12981da177e4SLinus Torvalds return ret; 12991da177e4SLinus Torvalds } 13001da177e4SLinus Torvalds #endif 1301f0ad0860SPatrick McHardy #ifdef CONFIG_IP_MROUTE_MULTIPLE_TABLES 1302f0ad0860SPatrick McHardy case MRT_TABLE: 1303f0ad0860SPatrick McHardy { 1304f0ad0860SPatrick McHardy u32 v; 1305f0ad0860SPatrick McHardy 1306f0ad0860SPatrick McHardy if (optlen != sizeof(u32)) 1307f0ad0860SPatrick McHardy return -EINVAL; 1308f0ad0860SPatrick McHardy if (get_user(v, (u32 __user *)optval)) 1309f0ad0860SPatrick McHardy return -EFAULT; 1310f0ad0860SPatrick McHardy 1311f0ad0860SPatrick McHardy rtnl_lock(); 1312f0ad0860SPatrick McHardy ret = 0; 13134c968709SEric Dumazet if (sk == rtnl_dereference(mrt->mroute_sk)) { 13144c968709SEric Dumazet ret = -EBUSY; 13154c968709SEric Dumazet } else { 1316f0ad0860SPatrick McHardy if (!ipmr_new_table(net, v)) 1317f0ad0860SPatrick McHardy ret = -ENOMEM; 1318f0ad0860SPatrick McHardy raw_sk(sk)->ipmr_table = v; 13194c968709SEric Dumazet } 1320f0ad0860SPatrick McHardy rtnl_unlock(); 1321f0ad0860SPatrick McHardy return ret; 1322f0ad0860SPatrick McHardy } 1323f0ad0860SPatrick McHardy #endif 13241da177e4SLinus Torvalds /* 13251da177e4SLinus Torvalds * Spurious command, or MRT_VERSION which you cannot 13261da177e4SLinus Torvalds * set. 13271da177e4SLinus Torvalds */ 13281da177e4SLinus Torvalds default: 13291da177e4SLinus Torvalds return -ENOPROTOOPT; 13301da177e4SLinus Torvalds } 13311da177e4SLinus Torvalds } 13321da177e4SLinus Torvalds 13331da177e4SLinus Torvalds /* 13341da177e4SLinus Torvalds * Getsock opt support for the multicast routing system. 13351da177e4SLinus Torvalds */ 13361da177e4SLinus Torvalds 13371da177e4SLinus Torvalds int ip_mroute_getsockopt(struct sock *sk, int optname, char __user *optval, int __user *optlen) 13381da177e4SLinus Torvalds { 13391da177e4SLinus Torvalds int olr; 13401da177e4SLinus Torvalds int val; 13414feb88e5SBenjamin Thery struct net *net = sock_net(sk); 1342f0ad0860SPatrick McHardy struct mr_table *mrt; 1343f0ad0860SPatrick McHardy 1344f0ad0860SPatrick McHardy mrt = ipmr_get_table(net, raw_sk(sk)->ipmr_table ? : RT_TABLE_DEFAULT); 1345f0ad0860SPatrick McHardy if (mrt == NULL) 1346f0ad0860SPatrick McHardy return -ENOENT; 13471da177e4SLinus Torvalds 13481da177e4SLinus Torvalds if (optname != MRT_VERSION && 13491da177e4SLinus Torvalds #ifdef CONFIG_IP_PIMSM 13501da177e4SLinus Torvalds optname != MRT_PIM && 13511da177e4SLinus Torvalds #endif 13521da177e4SLinus Torvalds optname != MRT_ASSERT) 13531da177e4SLinus Torvalds return -ENOPROTOOPT; 13541da177e4SLinus Torvalds 13551da177e4SLinus Torvalds if (get_user(olr, optlen)) 13561da177e4SLinus Torvalds return -EFAULT; 13571da177e4SLinus Torvalds 13581da177e4SLinus Torvalds olr = min_t(unsigned int, olr, sizeof(int)); 13591da177e4SLinus Torvalds if (olr < 0) 13601da177e4SLinus Torvalds return -EINVAL; 13611da177e4SLinus Torvalds 13621da177e4SLinus Torvalds if (put_user(olr, optlen)) 13631da177e4SLinus Torvalds return -EFAULT; 13641da177e4SLinus Torvalds if (optname == MRT_VERSION) 13651da177e4SLinus Torvalds val = 0x0305; 13661da177e4SLinus Torvalds #ifdef CONFIG_IP_PIMSM 13671da177e4SLinus Torvalds else if (optname == MRT_PIM) 13680c12295aSPatrick McHardy val = mrt->mroute_do_pim; 13691da177e4SLinus Torvalds #endif 13701da177e4SLinus Torvalds else 13710c12295aSPatrick McHardy val = mrt->mroute_do_assert; 13721da177e4SLinus Torvalds if (copy_to_user(optval, &val, olr)) 13731da177e4SLinus Torvalds return -EFAULT; 13741da177e4SLinus Torvalds return 0; 13751da177e4SLinus Torvalds } 13761da177e4SLinus Torvalds 13771da177e4SLinus Torvalds /* 13781da177e4SLinus Torvalds * The IP multicast ioctl support routines. 13791da177e4SLinus Torvalds */ 13801da177e4SLinus Torvalds 13811da177e4SLinus Torvalds int ipmr_ioctl(struct sock *sk, int cmd, void __user *arg) 13821da177e4SLinus Torvalds { 13831da177e4SLinus Torvalds struct sioc_sg_req sr; 13841da177e4SLinus Torvalds struct sioc_vif_req vr; 13851da177e4SLinus Torvalds struct vif_device *vif; 13861da177e4SLinus Torvalds struct mfc_cache *c; 13874feb88e5SBenjamin Thery struct net *net = sock_net(sk); 1388f0ad0860SPatrick McHardy struct mr_table *mrt; 1389f0ad0860SPatrick McHardy 1390f0ad0860SPatrick McHardy mrt = ipmr_get_table(net, raw_sk(sk)->ipmr_table ? : RT_TABLE_DEFAULT); 1391f0ad0860SPatrick McHardy if (mrt == NULL) 1392f0ad0860SPatrick McHardy return -ENOENT; 13931da177e4SLinus Torvalds 1394132adf54SStephen Hemminger switch (cmd) { 13951da177e4SLinus Torvalds case SIOCGETVIFCNT: 13961da177e4SLinus Torvalds if (copy_from_user(&vr, arg, sizeof(vr))) 13971da177e4SLinus Torvalds return -EFAULT; 13980c12295aSPatrick McHardy if (vr.vifi >= mrt->maxvif) 13991da177e4SLinus Torvalds return -EINVAL; 14001da177e4SLinus Torvalds read_lock(&mrt_lock); 14010c12295aSPatrick McHardy vif = &mrt->vif_table[vr.vifi]; 14020c12295aSPatrick McHardy if (VIF_EXISTS(mrt, vr.vifi)) { 14031da177e4SLinus Torvalds vr.icount = vif->pkt_in; 14041da177e4SLinus Torvalds vr.ocount = vif->pkt_out; 14051da177e4SLinus Torvalds vr.ibytes = vif->bytes_in; 14061da177e4SLinus Torvalds vr.obytes = vif->bytes_out; 14071da177e4SLinus Torvalds read_unlock(&mrt_lock); 14081da177e4SLinus Torvalds 14091da177e4SLinus Torvalds if (copy_to_user(arg, &vr, sizeof(vr))) 14101da177e4SLinus Torvalds return -EFAULT; 14111da177e4SLinus Torvalds return 0; 14121da177e4SLinus Torvalds } 14131da177e4SLinus Torvalds read_unlock(&mrt_lock); 14141da177e4SLinus Torvalds return -EADDRNOTAVAIL; 14151da177e4SLinus Torvalds case SIOCGETSGCNT: 14161da177e4SLinus Torvalds if (copy_from_user(&sr, arg, sizeof(sr))) 14171da177e4SLinus Torvalds return -EFAULT; 14181da177e4SLinus Torvalds 1419a8c9486bSEric Dumazet rcu_read_lock(); 14200c12295aSPatrick McHardy c = ipmr_cache_find(mrt, sr.src.s_addr, sr.grp.s_addr); 14211da177e4SLinus Torvalds if (c) { 14221da177e4SLinus Torvalds sr.pktcnt = c->mfc_un.res.pkt; 14231da177e4SLinus Torvalds sr.bytecnt = c->mfc_un.res.bytes; 14241da177e4SLinus Torvalds sr.wrong_if = c->mfc_un.res.wrong_if; 1425a8c9486bSEric Dumazet rcu_read_unlock(); 14261da177e4SLinus Torvalds 14271da177e4SLinus Torvalds if (copy_to_user(arg, &sr, sizeof(sr))) 14281da177e4SLinus Torvalds return -EFAULT; 14291da177e4SLinus Torvalds return 0; 14301da177e4SLinus Torvalds } 1431a8c9486bSEric Dumazet rcu_read_unlock(); 14321da177e4SLinus Torvalds return -EADDRNOTAVAIL; 14331da177e4SLinus Torvalds default: 14341da177e4SLinus Torvalds return -ENOIOCTLCMD; 14351da177e4SLinus Torvalds } 14361da177e4SLinus Torvalds } 14371da177e4SLinus Torvalds 1438709b46e8SEric W. Biederman #ifdef CONFIG_COMPAT 1439709b46e8SEric W. Biederman struct compat_sioc_sg_req { 1440709b46e8SEric W. Biederman struct in_addr src; 1441709b46e8SEric W. Biederman struct in_addr grp; 1442709b46e8SEric W. Biederman compat_ulong_t pktcnt; 1443709b46e8SEric W. Biederman compat_ulong_t bytecnt; 1444709b46e8SEric W. Biederman compat_ulong_t wrong_if; 1445709b46e8SEric W. Biederman }; 1446709b46e8SEric W. Biederman 1447709b46e8SEric W. Biederman int ipmr_compat_ioctl(struct sock *sk, unsigned int cmd, void __user *arg) 1448709b46e8SEric W. Biederman { 1449*0033d5adSDavid S. Miller struct compat_sioc_sg_req sr; 1450709b46e8SEric W. Biederman struct mfc_cache *c; 1451709b46e8SEric W. Biederman struct net *net = sock_net(sk); 1452709b46e8SEric W. Biederman struct mr_table *mrt; 1453709b46e8SEric W. Biederman 1454709b46e8SEric W. Biederman mrt = ipmr_get_table(net, raw_sk(sk)->ipmr_table ? : RT_TABLE_DEFAULT); 1455709b46e8SEric W. Biederman if (mrt == NULL) 1456709b46e8SEric W. Biederman return -ENOENT; 1457709b46e8SEric W. Biederman 1458709b46e8SEric W. Biederman switch (cmd) { 1459709b46e8SEric W. Biederman case SIOCGETSGCNT: 1460709b46e8SEric W. Biederman if (copy_from_user(&sr, arg, sizeof(sr))) 1461709b46e8SEric W. Biederman return -EFAULT; 1462709b46e8SEric W. Biederman 1463709b46e8SEric W. Biederman rcu_read_lock(); 1464709b46e8SEric W. Biederman c = ipmr_cache_find(mrt, sr.src.s_addr, sr.grp.s_addr); 1465709b46e8SEric W. Biederman if (c) { 1466709b46e8SEric W. Biederman sr.pktcnt = c->mfc_un.res.pkt; 1467709b46e8SEric W. Biederman sr.bytecnt = c->mfc_un.res.bytes; 1468709b46e8SEric W. Biederman sr.wrong_if = c->mfc_un.res.wrong_if; 1469709b46e8SEric W. Biederman rcu_read_unlock(); 1470709b46e8SEric W. Biederman 1471709b46e8SEric W. Biederman if (copy_to_user(arg, &sr, sizeof(sr))) 1472709b46e8SEric W. Biederman return -EFAULT; 1473709b46e8SEric W. Biederman return 0; 1474709b46e8SEric W. Biederman } 1475709b46e8SEric W. Biederman rcu_read_unlock(); 1476709b46e8SEric W. Biederman return -EADDRNOTAVAIL; 1477709b46e8SEric W. Biederman default: 1478709b46e8SEric W. Biederman return -ENOIOCTLCMD; 1479709b46e8SEric W. Biederman } 1480709b46e8SEric W. Biederman } 1481709b46e8SEric W. Biederman #endif 1482709b46e8SEric W. Biederman 14831da177e4SLinus Torvalds 14841da177e4SLinus Torvalds static int ipmr_device_event(struct notifier_block *this, unsigned long event, void *ptr) 14851da177e4SLinus Torvalds { 1486e9dc8653SEric W. Biederman struct net_device *dev = ptr; 14874feb88e5SBenjamin Thery struct net *net = dev_net(dev); 1488f0ad0860SPatrick McHardy struct mr_table *mrt; 14891da177e4SLinus Torvalds struct vif_device *v; 14901da177e4SLinus Torvalds int ct; 1491d17fa6faSEric Dumazet LIST_HEAD(list); 1492e9dc8653SEric W. Biederman 14931da177e4SLinus Torvalds if (event != NETDEV_UNREGISTER) 14941da177e4SLinus Torvalds return NOTIFY_DONE; 1495f0ad0860SPatrick McHardy 1496f0ad0860SPatrick McHardy ipmr_for_each_table(mrt, net) { 14970c12295aSPatrick McHardy v = &mrt->vif_table[0]; 14980c12295aSPatrick McHardy for (ct = 0; ct < mrt->maxvif; ct++, v++) { 1499e9dc8653SEric W. Biederman if (v->dev == dev) 15000c12295aSPatrick McHardy vif_delete(mrt, ct, 1, &list); 15011da177e4SLinus Torvalds } 15021da177e4SLinus Torvalds } 1503d17fa6faSEric Dumazet unregister_netdevice_many(&list); 15041da177e4SLinus Torvalds return NOTIFY_DONE; 15051da177e4SLinus Torvalds } 15061da177e4SLinus Torvalds 15071da177e4SLinus Torvalds 15081da177e4SLinus Torvalds static struct notifier_block ip_mr_notifier = { 15091da177e4SLinus Torvalds .notifier_call = ipmr_device_event, 15101da177e4SLinus Torvalds }; 15111da177e4SLinus Torvalds 15121da177e4SLinus Torvalds /* 15131da177e4SLinus Torvalds * Encapsulate a packet by attaching a valid IPIP header to it. 15141da177e4SLinus Torvalds * This avoids tunnel drivers and other mess and gives us the speed so 15151da177e4SLinus Torvalds * important for multicast video. 15161da177e4SLinus Torvalds */ 15171da177e4SLinus Torvalds 1518114c7844SAl Viro static void ip_encap(struct sk_buff *skb, __be32 saddr, __be32 daddr) 15191da177e4SLinus Torvalds { 15208856dfa3SArnaldo Carvalho de Melo struct iphdr *iph; 1521eddc9ec5SArnaldo Carvalho de Melo struct iphdr *old_iph = ip_hdr(skb); 15228856dfa3SArnaldo Carvalho de Melo 15238856dfa3SArnaldo Carvalho de Melo skb_push(skb, sizeof(struct iphdr)); 1524b0e380b1SArnaldo Carvalho de Melo skb->transport_header = skb->network_header; 15258856dfa3SArnaldo Carvalho de Melo skb_reset_network_header(skb); 1526eddc9ec5SArnaldo Carvalho de Melo iph = ip_hdr(skb); 15271da177e4SLinus Torvalds 15281da177e4SLinus Torvalds iph->version = 4; 1529e023dd64SArnaldo Carvalho de Melo iph->tos = old_iph->tos; 1530e023dd64SArnaldo Carvalho de Melo iph->ttl = old_iph->ttl; 15311da177e4SLinus Torvalds iph->frag_off = 0; 15321da177e4SLinus Torvalds iph->daddr = daddr; 15331da177e4SLinus Torvalds iph->saddr = saddr; 15341da177e4SLinus Torvalds iph->protocol = IPPROTO_IPIP; 15351da177e4SLinus Torvalds iph->ihl = 5; 15361da177e4SLinus Torvalds iph->tot_len = htons(skb->len); 1537adf30907SEric Dumazet ip_select_ident(iph, skb_dst(skb), NULL); 15381da177e4SLinus Torvalds ip_send_check(iph); 15391da177e4SLinus Torvalds 15401da177e4SLinus Torvalds memset(&(IPCB(skb)->opt), 0, sizeof(IPCB(skb)->opt)); 15411da177e4SLinus Torvalds nf_reset(skb); 15421da177e4SLinus Torvalds } 15431da177e4SLinus Torvalds 15441da177e4SLinus Torvalds static inline int ipmr_forward_finish(struct sk_buff *skb) 15451da177e4SLinus Torvalds { 15461da177e4SLinus Torvalds struct ip_options *opt = &(IPCB(skb)->opt); 15471da177e4SLinus Torvalds 1548adf30907SEric Dumazet IP_INC_STATS_BH(dev_net(skb_dst(skb)->dev), IPSTATS_MIB_OUTFORWDATAGRAMS); 15491da177e4SLinus Torvalds 15501da177e4SLinus Torvalds if (unlikely(opt->optlen)) 15511da177e4SLinus Torvalds ip_forward_options(skb); 15521da177e4SLinus Torvalds 15531da177e4SLinus Torvalds return dst_output(skb); 15541da177e4SLinus Torvalds } 15551da177e4SLinus Torvalds 15561da177e4SLinus Torvalds /* 15571da177e4SLinus Torvalds * Processing handlers for ipmr_forward 15581da177e4SLinus Torvalds */ 15591da177e4SLinus Torvalds 15600c12295aSPatrick McHardy static void ipmr_queue_xmit(struct net *net, struct mr_table *mrt, 15610c12295aSPatrick McHardy struct sk_buff *skb, struct mfc_cache *c, int vifi) 15621da177e4SLinus Torvalds { 1563eddc9ec5SArnaldo Carvalho de Melo const struct iphdr *iph = ip_hdr(skb); 15640c12295aSPatrick McHardy struct vif_device *vif = &mrt->vif_table[vifi]; 15651da177e4SLinus Torvalds struct net_device *dev; 15661da177e4SLinus Torvalds struct rtable *rt; 15671da177e4SLinus Torvalds int encap = 0; 15681da177e4SLinus Torvalds 15691da177e4SLinus Torvalds if (vif->dev == NULL) 15701da177e4SLinus Torvalds goto out_free; 15711da177e4SLinus Torvalds 15721da177e4SLinus Torvalds #ifdef CONFIG_IP_PIMSM 15731da177e4SLinus Torvalds if (vif->flags & VIFF_REGISTER) { 15741da177e4SLinus Torvalds vif->pkt_out++; 15751da177e4SLinus Torvalds vif->bytes_out += skb->len; 1576cf3677aeSPavel Emelyanov vif->dev->stats.tx_bytes += skb->len; 1577cf3677aeSPavel Emelyanov vif->dev->stats.tx_packets++; 15780c12295aSPatrick McHardy ipmr_cache_report(mrt, skb, vifi, IGMPMSG_WHOLEPKT); 157969ebbf58SIlpo Järvinen goto out_free; 15801da177e4SLinus Torvalds } 15811da177e4SLinus Torvalds #endif 15821da177e4SLinus Torvalds 15831da177e4SLinus Torvalds if (vif->flags & VIFF_TUNNEL) { 1584a8cb16ddSEric Dumazet struct flowi fl = { 1585a8cb16ddSEric Dumazet .oif = vif->link, 15865811662bSChangli Gao .fl4_dst = vif->remote, 15875811662bSChangli Gao .fl4_src = vif->local, 15885811662bSChangli Gao .fl4_tos = RT_TOS(iph->tos), 1589a8cb16ddSEric Dumazet .proto = IPPROTO_IPIP 1590a8cb16ddSEric Dumazet }; 1591a8cb16ddSEric Dumazet 15924feb88e5SBenjamin Thery if (ip_route_output_key(net, &rt, &fl)) 15931da177e4SLinus Torvalds goto out_free; 15941da177e4SLinus Torvalds encap = sizeof(struct iphdr); 15951da177e4SLinus Torvalds } else { 1596a8cb16ddSEric Dumazet struct flowi fl = { 1597a8cb16ddSEric Dumazet .oif = vif->link, 15985811662bSChangli Gao .fl4_dst = iph->daddr, 15995811662bSChangli Gao .fl4_tos = RT_TOS(iph->tos), 1600a8cb16ddSEric Dumazet .proto = IPPROTO_IPIP 1601a8cb16ddSEric Dumazet }; 1602a8cb16ddSEric Dumazet 16034feb88e5SBenjamin Thery if (ip_route_output_key(net, &rt, &fl)) 16041da177e4SLinus Torvalds goto out_free; 16051da177e4SLinus Torvalds } 16061da177e4SLinus Torvalds 1607d8d1f30bSChangli Gao dev = rt->dst.dev; 16081da177e4SLinus Torvalds 1609d8d1f30bSChangli Gao if (skb->len+encap > dst_mtu(&rt->dst) && (ntohs(iph->frag_off) & IP_DF)) { 16101da177e4SLinus Torvalds /* Do not fragment multicasts. Alas, IPv4 does not 1611a8cb16ddSEric Dumazet * allow to send ICMP, so that packets will disappear 1612a8cb16ddSEric Dumazet * to blackhole. 16131da177e4SLinus Torvalds */ 16141da177e4SLinus Torvalds 16157c73a6faSPavel Emelyanov IP_INC_STATS_BH(dev_net(dev), IPSTATS_MIB_FRAGFAILS); 16161da177e4SLinus Torvalds ip_rt_put(rt); 16171da177e4SLinus Torvalds goto out_free; 16181da177e4SLinus Torvalds } 16191da177e4SLinus Torvalds 1620d8d1f30bSChangli Gao encap += LL_RESERVED_SPACE(dev) + rt->dst.header_len; 16211da177e4SLinus Torvalds 16221da177e4SLinus Torvalds if (skb_cow(skb, encap)) { 16231da177e4SLinus Torvalds ip_rt_put(rt); 16241da177e4SLinus Torvalds goto out_free; 16251da177e4SLinus Torvalds } 16261da177e4SLinus Torvalds 16271da177e4SLinus Torvalds vif->pkt_out++; 16281da177e4SLinus Torvalds vif->bytes_out += skb->len; 16291da177e4SLinus Torvalds 1630adf30907SEric Dumazet skb_dst_drop(skb); 1631d8d1f30bSChangli Gao skb_dst_set(skb, &rt->dst); 1632eddc9ec5SArnaldo Carvalho de Melo ip_decrease_ttl(ip_hdr(skb)); 16331da177e4SLinus Torvalds 16341da177e4SLinus Torvalds /* FIXME: forward and output firewalls used to be called here. 1635a8cb16ddSEric Dumazet * What do we do with netfilter? -- RR 1636a8cb16ddSEric Dumazet */ 16371da177e4SLinus Torvalds if (vif->flags & VIFF_TUNNEL) { 16381da177e4SLinus Torvalds ip_encap(skb, vif->local, vif->remote); 16391da177e4SLinus Torvalds /* FIXME: extra output firewall step used to be here. --RR */ 16402f4c02d4SPavel Emelyanov vif->dev->stats.tx_packets++; 16412f4c02d4SPavel Emelyanov vif->dev->stats.tx_bytes += skb->len; 16421da177e4SLinus Torvalds } 16431da177e4SLinus Torvalds 16441da177e4SLinus Torvalds IPCB(skb)->flags |= IPSKB_FORWARDED; 16451da177e4SLinus Torvalds 16461da177e4SLinus Torvalds /* 16471da177e4SLinus Torvalds * RFC1584 teaches, that DVMRP/PIM router must deliver packets locally 16481da177e4SLinus Torvalds * not only before forwarding, but after forwarding on all output 16491da177e4SLinus Torvalds * interfaces. It is clear, if mrouter runs a multicasting 16501da177e4SLinus Torvalds * program, it should receive packets not depending to what interface 16511da177e4SLinus Torvalds * program is joined. 16521da177e4SLinus Torvalds * If we will not make it, the program will have to join on all 16531da177e4SLinus Torvalds * interfaces. On the other hand, multihoming host (or router, but 16541da177e4SLinus Torvalds * not mrouter) cannot join to more than one interface - it will 16551da177e4SLinus Torvalds * result in receiving multiple packets. 16561da177e4SLinus Torvalds */ 16579bbc768aSJan Engelhardt NF_HOOK(NFPROTO_IPV4, NF_INET_FORWARD, skb, skb->dev, dev, 16581da177e4SLinus Torvalds ipmr_forward_finish); 16591da177e4SLinus Torvalds return; 16601da177e4SLinus Torvalds 16611da177e4SLinus Torvalds out_free: 16621da177e4SLinus Torvalds kfree_skb(skb); 16631da177e4SLinus Torvalds } 16641da177e4SLinus Torvalds 16650c12295aSPatrick McHardy static int ipmr_find_vif(struct mr_table *mrt, struct net_device *dev) 16661da177e4SLinus Torvalds { 16671da177e4SLinus Torvalds int ct; 16680c12295aSPatrick McHardy 16690c12295aSPatrick McHardy for (ct = mrt->maxvif-1; ct >= 0; ct--) { 16700c12295aSPatrick McHardy if (mrt->vif_table[ct].dev == dev) 16711da177e4SLinus Torvalds break; 16721da177e4SLinus Torvalds } 16731da177e4SLinus Torvalds return ct; 16741da177e4SLinus Torvalds } 16751da177e4SLinus Torvalds 16761da177e4SLinus Torvalds /* "local" means that we should preserve one skb (for local delivery) */ 16771da177e4SLinus Torvalds 16780c12295aSPatrick McHardy static int ip_mr_forward(struct net *net, struct mr_table *mrt, 16790c12295aSPatrick McHardy struct sk_buff *skb, struct mfc_cache *cache, 16800c12295aSPatrick McHardy int local) 16811da177e4SLinus Torvalds { 16821da177e4SLinus Torvalds int psend = -1; 16831da177e4SLinus Torvalds int vif, ct; 16841da177e4SLinus Torvalds 16851da177e4SLinus Torvalds vif = cache->mfc_parent; 16861da177e4SLinus Torvalds cache->mfc_un.res.pkt++; 16871da177e4SLinus Torvalds cache->mfc_un.res.bytes += skb->len; 16881da177e4SLinus Torvalds 16891da177e4SLinus Torvalds /* 16901da177e4SLinus Torvalds * Wrong interface: drop packet and (maybe) send PIM assert. 16911da177e4SLinus Torvalds */ 16920c12295aSPatrick McHardy if (mrt->vif_table[vif].dev != skb->dev) { 16931da177e4SLinus Torvalds int true_vifi; 16941da177e4SLinus Torvalds 1695c7537967SDavid S. Miller if (rt_is_output_route(skb_rtable(skb))) { 16961da177e4SLinus Torvalds /* It is our own packet, looped back. 1697a8cb16ddSEric Dumazet * Very complicated situation... 1698a8cb16ddSEric Dumazet * 1699a8cb16ddSEric Dumazet * The best workaround until routing daemons will be 1700a8cb16ddSEric Dumazet * fixed is not to redistribute packet, if it was 1701a8cb16ddSEric Dumazet * send through wrong interface. It means, that 1702a8cb16ddSEric Dumazet * multicast applications WILL NOT work for 1703a8cb16ddSEric Dumazet * (S,G), which have default multicast route pointing 1704a8cb16ddSEric Dumazet * to wrong oif. In any case, it is not a good 1705a8cb16ddSEric Dumazet * idea to use multicasting applications on router. 17061da177e4SLinus Torvalds */ 17071da177e4SLinus Torvalds goto dont_forward; 17081da177e4SLinus Torvalds } 17091da177e4SLinus Torvalds 17101da177e4SLinus Torvalds cache->mfc_un.res.wrong_if++; 17110c12295aSPatrick McHardy true_vifi = ipmr_find_vif(mrt, skb->dev); 17121da177e4SLinus Torvalds 17130c12295aSPatrick McHardy if (true_vifi >= 0 && mrt->mroute_do_assert && 17141da177e4SLinus Torvalds /* pimsm uses asserts, when switching from RPT to SPT, 1715a8cb16ddSEric Dumazet * so that we cannot check that packet arrived on an oif. 1716a8cb16ddSEric Dumazet * It is bad, but otherwise we would need to move pretty 1717a8cb16ddSEric Dumazet * large chunk of pimd to kernel. Ough... --ANK 17181da177e4SLinus Torvalds */ 17190c12295aSPatrick McHardy (mrt->mroute_do_pim || 17206f9374a9SBenjamin Thery cache->mfc_un.res.ttls[true_vifi] < 255) && 17211da177e4SLinus Torvalds time_after(jiffies, 17221da177e4SLinus Torvalds cache->mfc_un.res.last_assert + MFC_ASSERT_THRESH)) { 17231da177e4SLinus Torvalds cache->mfc_un.res.last_assert = jiffies; 17240c12295aSPatrick McHardy ipmr_cache_report(mrt, skb, true_vifi, IGMPMSG_WRONGVIF); 17251da177e4SLinus Torvalds } 17261da177e4SLinus Torvalds goto dont_forward; 17271da177e4SLinus Torvalds } 17281da177e4SLinus Torvalds 17290c12295aSPatrick McHardy mrt->vif_table[vif].pkt_in++; 17300c12295aSPatrick McHardy mrt->vif_table[vif].bytes_in += skb->len; 17311da177e4SLinus Torvalds 17321da177e4SLinus Torvalds /* 17331da177e4SLinus Torvalds * Forward the frame 17341da177e4SLinus Torvalds */ 1735a8cb16ddSEric Dumazet for (ct = cache->mfc_un.res.maxvif - 1; 1736a8cb16ddSEric Dumazet ct >= cache->mfc_un.res.minvif; ct--) { 1737eddc9ec5SArnaldo Carvalho de Melo if (ip_hdr(skb)->ttl > cache->mfc_un.res.ttls[ct]) { 17381da177e4SLinus Torvalds if (psend != -1) { 17391da177e4SLinus Torvalds struct sk_buff *skb2 = skb_clone(skb, GFP_ATOMIC); 1740a8cb16ddSEric Dumazet 17411da177e4SLinus Torvalds if (skb2) 17420c12295aSPatrick McHardy ipmr_queue_xmit(net, mrt, skb2, cache, 17430c12295aSPatrick McHardy psend); 17441da177e4SLinus Torvalds } 17451da177e4SLinus Torvalds psend = ct; 17461da177e4SLinus Torvalds } 17471da177e4SLinus Torvalds } 17481da177e4SLinus Torvalds if (psend != -1) { 17491da177e4SLinus Torvalds if (local) { 17501da177e4SLinus Torvalds struct sk_buff *skb2 = skb_clone(skb, GFP_ATOMIC); 1751a8cb16ddSEric Dumazet 17521da177e4SLinus Torvalds if (skb2) 17530c12295aSPatrick McHardy ipmr_queue_xmit(net, mrt, skb2, cache, psend); 17541da177e4SLinus Torvalds } else { 17550c12295aSPatrick McHardy ipmr_queue_xmit(net, mrt, skb, cache, psend); 17561da177e4SLinus Torvalds return 0; 17571da177e4SLinus Torvalds } 17581da177e4SLinus Torvalds } 17591da177e4SLinus Torvalds 17601da177e4SLinus Torvalds dont_forward: 17611da177e4SLinus Torvalds if (!local) 17621da177e4SLinus Torvalds kfree_skb(skb); 17631da177e4SLinus Torvalds return 0; 17641da177e4SLinus Torvalds } 17651da177e4SLinus Torvalds 17661da177e4SLinus Torvalds 17671da177e4SLinus Torvalds /* 17681da177e4SLinus Torvalds * Multicast packets for forwarding arrive here 17694c968709SEric Dumazet * Called with rcu_read_lock(); 17701da177e4SLinus Torvalds */ 17711da177e4SLinus Torvalds 17721da177e4SLinus Torvalds int ip_mr_input(struct sk_buff *skb) 17731da177e4SLinus Torvalds { 17741da177e4SLinus Torvalds struct mfc_cache *cache; 17754feb88e5SBenjamin Thery struct net *net = dev_net(skb->dev); 1776511c3f92SEric Dumazet int local = skb_rtable(skb)->rt_flags & RTCF_LOCAL; 1777f0ad0860SPatrick McHardy struct mr_table *mrt; 1778f0ad0860SPatrick McHardy int err; 17791da177e4SLinus Torvalds 17801da177e4SLinus Torvalds /* Packet is looped back after forward, it should not be 1781a8cb16ddSEric Dumazet * forwarded second time, but still can be delivered locally. 17821da177e4SLinus Torvalds */ 17831da177e4SLinus Torvalds if (IPCB(skb)->flags & IPSKB_FORWARDED) 17841da177e4SLinus Torvalds goto dont_forward; 17851da177e4SLinus Torvalds 1786f0ad0860SPatrick McHardy err = ipmr_fib_lookup(net, &skb_rtable(skb)->fl, &mrt); 1787e40dbc51SBen Greear if (err < 0) { 1788e40dbc51SBen Greear kfree_skb(skb); 1789f0ad0860SPatrick McHardy return err; 1790e40dbc51SBen Greear } 1791f0ad0860SPatrick McHardy 17921da177e4SLinus Torvalds if (!local) { 17931da177e4SLinus Torvalds if (IPCB(skb)->opt.router_alert) { 17941da177e4SLinus Torvalds if (ip_call_ra_chain(skb)) 17951da177e4SLinus Torvalds return 0; 1796eddc9ec5SArnaldo Carvalho de Melo } else if (ip_hdr(skb)->protocol == IPPROTO_IGMP) { 17971da177e4SLinus Torvalds /* IGMPv1 (and broken IGMPv2 implementations sort of 17984c968709SEric Dumazet * Cisco IOS <= 11.2(8)) do not put router alert 17994c968709SEric Dumazet * option to IGMP packets destined to routable 18004c968709SEric Dumazet * groups. It is very bad, because it means 18014c968709SEric Dumazet * that we can forward NO IGMP messages. 18021da177e4SLinus Torvalds */ 18034c968709SEric Dumazet struct sock *mroute_sk; 18044c968709SEric Dumazet 18054c968709SEric Dumazet mroute_sk = rcu_dereference(mrt->mroute_sk); 18064c968709SEric Dumazet if (mroute_sk) { 18072715bcf9SPatrick McHardy nf_reset(skb); 18084c968709SEric Dumazet raw_rcv(mroute_sk, skb); 18091da177e4SLinus Torvalds return 0; 18101da177e4SLinus Torvalds } 18111da177e4SLinus Torvalds } 18121da177e4SLinus Torvalds } 18131da177e4SLinus Torvalds 1814a8c9486bSEric Dumazet /* already under rcu_read_lock() */ 18150c12295aSPatrick McHardy cache = ipmr_cache_find(mrt, ip_hdr(skb)->saddr, ip_hdr(skb)->daddr); 18161da177e4SLinus Torvalds 18171da177e4SLinus Torvalds /* 18181da177e4SLinus Torvalds * No usable cache entry 18191da177e4SLinus Torvalds */ 18201da177e4SLinus Torvalds if (cache == NULL) { 18211da177e4SLinus Torvalds int vif; 18221da177e4SLinus Torvalds 18231da177e4SLinus Torvalds if (local) { 18241da177e4SLinus Torvalds struct sk_buff *skb2 = skb_clone(skb, GFP_ATOMIC); 18251da177e4SLinus Torvalds ip_local_deliver(skb); 1826a8c9486bSEric Dumazet if (skb2 == NULL) 18271da177e4SLinus Torvalds return -ENOBUFS; 18281da177e4SLinus Torvalds skb = skb2; 18291da177e4SLinus Torvalds } 18301da177e4SLinus Torvalds 1831a8c9486bSEric Dumazet read_lock(&mrt_lock); 18320c12295aSPatrick McHardy vif = ipmr_find_vif(mrt, skb->dev); 18331da177e4SLinus Torvalds if (vif >= 0) { 18340eae88f3SEric Dumazet int err2 = ipmr_cache_unresolved(mrt, vif, skb); 18351da177e4SLinus Torvalds read_unlock(&mrt_lock); 18361da177e4SLinus Torvalds 18370eae88f3SEric Dumazet return err2; 18381da177e4SLinus Torvalds } 18391da177e4SLinus Torvalds read_unlock(&mrt_lock); 18401da177e4SLinus Torvalds kfree_skb(skb); 18411da177e4SLinus Torvalds return -ENODEV; 18421da177e4SLinus Torvalds } 18431da177e4SLinus Torvalds 1844a8c9486bSEric Dumazet read_lock(&mrt_lock); 18450c12295aSPatrick McHardy ip_mr_forward(net, mrt, skb, cache, local); 18461da177e4SLinus Torvalds read_unlock(&mrt_lock); 18471da177e4SLinus Torvalds 18481da177e4SLinus Torvalds if (local) 18491da177e4SLinus Torvalds return ip_local_deliver(skb); 18501da177e4SLinus Torvalds 18511da177e4SLinus Torvalds return 0; 18521da177e4SLinus Torvalds 18531da177e4SLinus Torvalds dont_forward: 18541da177e4SLinus Torvalds if (local) 18551da177e4SLinus Torvalds return ip_local_deliver(skb); 18561da177e4SLinus Torvalds kfree_skb(skb); 18571da177e4SLinus Torvalds return 0; 18581da177e4SLinus Torvalds } 18591da177e4SLinus Torvalds 1860b1879204SIlpo Järvinen #ifdef CONFIG_IP_PIMSM 186155747a0aSEric Dumazet /* called with rcu_read_lock() */ 1862f0ad0860SPatrick McHardy static int __pim_rcv(struct mr_table *mrt, struct sk_buff *skb, 1863f0ad0860SPatrick McHardy unsigned int pimlen) 18641da177e4SLinus Torvalds { 18651da177e4SLinus Torvalds struct net_device *reg_dev = NULL; 1866b1879204SIlpo Järvinen struct iphdr *encap; 18671da177e4SLinus Torvalds 1868b1879204SIlpo Järvinen encap = (struct iphdr *)(skb_transport_header(skb) + pimlen); 18691da177e4SLinus Torvalds /* 1870a8cb16ddSEric Dumazet * Check that: 1871a8cb16ddSEric Dumazet * a. packet is really sent to a multicast group 1872a8cb16ddSEric Dumazet * b. packet is not a NULL-REGISTER 1873a8cb16ddSEric Dumazet * c. packet is not truncated 18741da177e4SLinus Torvalds */ 1875f97c1e0cSJoe Perches if (!ipv4_is_multicast(encap->daddr) || 18761da177e4SLinus Torvalds encap->tot_len == 0 || 1877b1879204SIlpo Järvinen ntohs(encap->tot_len) + pimlen > skb->len) 1878b1879204SIlpo Järvinen return 1; 18791da177e4SLinus Torvalds 18801da177e4SLinus Torvalds read_lock(&mrt_lock); 18810c12295aSPatrick McHardy if (mrt->mroute_reg_vif_num >= 0) 18820c12295aSPatrick McHardy reg_dev = mrt->vif_table[mrt->mroute_reg_vif_num].dev; 18831da177e4SLinus Torvalds read_unlock(&mrt_lock); 18841da177e4SLinus Torvalds 18851da177e4SLinus Torvalds if (reg_dev == NULL) 1886b1879204SIlpo Järvinen return 1; 18871da177e4SLinus Torvalds 1888b0e380b1SArnaldo Carvalho de Melo skb->mac_header = skb->network_header; 18891da177e4SLinus Torvalds skb_pull(skb, (u8 *)encap - skb->data); 189031c7711bSArnaldo Carvalho de Melo skb_reset_network_header(skb); 18911da177e4SLinus Torvalds skb->protocol = htons(ETH_P_IP); 189255747a0aSEric Dumazet skb->ip_summed = CHECKSUM_NONE; 18931da177e4SLinus Torvalds skb->pkt_type = PACKET_HOST; 1894d19d56ddSEric Dumazet 1895d19d56ddSEric Dumazet skb_tunnel_rx(skb, reg_dev); 1896d19d56ddSEric Dumazet 18971da177e4SLinus Torvalds netif_rx(skb); 1898b1879204SIlpo Järvinen 189955747a0aSEric Dumazet return NET_RX_SUCCESS; 1900b1879204SIlpo Järvinen } 1901b1879204SIlpo Järvinen #endif 1902b1879204SIlpo Järvinen 1903b1879204SIlpo Järvinen #ifdef CONFIG_IP_PIMSM_V1 1904b1879204SIlpo Järvinen /* 1905b1879204SIlpo Järvinen * Handle IGMP messages of PIMv1 1906b1879204SIlpo Järvinen */ 1907b1879204SIlpo Järvinen 1908b1879204SIlpo Järvinen int pim_rcv_v1(struct sk_buff *skb) 1909b1879204SIlpo Järvinen { 1910b1879204SIlpo Järvinen struct igmphdr *pim; 19114feb88e5SBenjamin Thery struct net *net = dev_net(skb->dev); 1912f0ad0860SPatrick McHardy struct mr_table *mrt; 1913b1879204SIlpo Järvinen 1914b1879204SIlpo Järvinen if (!pskb_may_pull(skb, sizeof(*pim) + sizeof(struct iphdr))) 1915b1879204SIlpo Järvinen goto drop; 1916b1879204SIlpo Järvinen 1917b1879204SIlpo Järvinen pim = igmp_hdr(skb); 1918b1879204SIlpo Järvinen 1919f0ad0860SPatrick McHardy if (ipmr_fib_lookup(net, &skb_rtable(skb)->fl, &mrt) < 0) 1920f0ad0860SPatrick McHardy goto drop; 1921f0ad0860SPatrick McHardy 19220c12295aSPatrick McHardy if (!mrt->mroute_do_pim || 1923b1879204SIlpo Järvinen pim->group != PIM_V1_VERSION || pim->code != PIM_V1_REGISTER) 1924b1879204SIlpo Järvinen goto drop; 1925b1879204SIlpo Järvinen 1926f0ad0860SPatrick McHardy if (__pim_rcv(mrt, skb, sizeof(*pim))) { 19271da177e4SLinus Torvalds drop: 19281da177e4SLinus Torvalds kfree_skb(skb); 1929b1879204SIlpo Järvinen } 19301da177e4SLinus Torvalds return 0; 19311da177e4SLinus Torvalds } 19321da177e4SLinus Torvalds #endif 19331da177e4SLinus Torvalds 19341da177e4SLinus Torvalds #ifdef CONFIG_IP_PIMSM_V2 19351da177e4SLinus Torvalds static int pim_rcv(struct sk_buff *skb) 19361da177e4SLinus Torvalds { 19371da177e4SLinus Torvalds struct pimreghdr *pim; 1938f0ad0860SPatrick McHardy struct net *net = dev_net(skb->dev); 1939f0ad0860SPatrick McHardy struct mr_table *mrt; 19401da177e4SLinus Torvalds 1941b1879204SIlpo Järvinen if (!pskb_may_pull(skb, sizeof(*pim) + sizeof(struct iphdr))) 19421da177e4SLinus Torvalds goto drop; 19431da177e4SLinus Torvalds 19449c70220bSArnaldo Carvalho de Melo pim = (struct pimreghdr *)skb_transport_header(skb); 19451da177e4SLinus Torvalds if (pim->type != ((PIM_VERSION << 4) | (PIM_REGISTER)) || 19461da177e4SLinus Torvalds (pim->flags & PIM_NULL_REGISTER) || 19471da177e4SLinus Torvalds (ip_compute_csum((void *)pim, sizeof(*pim)) != 0 && 1948d3bc23e7SAl Viro csum_fold(skb_checksum(skb, 0, skb->len, 0)))) 19491da177e4SLinus Torvalds goto drop; 19501da177e4SLinus Torvalds 1951f0ad0860SPatrick McHardy if (ipmr_fib_lookup(net, &skb_rtable(skb)->fl, &mrt) < 0) 1952f0ad0860SPatrick McHardy goto drop; 1953f0ad0860SPatrick McHardy 1954f0ad0860SPatrick McHardy if (__pim_rcv(mrt, skb, sizeof(*pim))) { 19551da177e4SLinus Torvalds drop: 19561da177e4SLinus Torvalds kfree_skb(skb); 1957b1879204SIlpo Järvinen } 19581da177e4SLinus Torvalds return 0; 19591da177e4SLinus Torvalds } 19601da177e4SLinus Torvalds #endif 19611da177e4SLinus Torvalds 1962cb6a4e46SPatrick McHardy static int __ipmr_fill_mroute(struct mr_table *mrt, struct sk_buff *skb, 1963cb6a4e46SPatrick McHardy struct mfc_cache *c, struct rtmsg *rtm) 19641da177e4SLinus Torvalds { 19651da177e4SLinus Torvalds int ct; 19661da177e4SLinus Torvalds struct rtnexthop *nhp; 196727a884dcSArnaldo Carvalho de Melo u8 *b = skb_tail_pointer(skb); 19681da177e4SLinus Torvalds struct rtattr *mp_head; 19691da177e4SLinus Torvalds 19707438189bSNicolas Dichtel /* If cache is unresolved, don't try to parse IIF and OIF */ 1971ed0f160aSDan Carpenter if (c->mfc_parent >= MAXVIFS) 19727438189bSNicolas Dichtel return -ENOENT; 19737438189bSNicolas Dichtel 19740c12295aSPatrick McHardy if (VIF_EXISTS(mrt, c->mfc_parent)) 19750c12295aSPatrick McHardy RTA_PUT(skb, RTA_IIF, 4, &mrt->vif_table[c->mfc_parent].dev->ifindex); 19761da177e4SLinus Torvalds 19771da177e4SLinus Torvalds mp_head = (struct rtattr *)skb_put(skb, RTA_LENGTH(0)); 19781da177e4SLinus Torvalds 19791da177e4SLinus Torvalds for (ct = c->mfc_un.res.minvif; ct < c->mfc_un.res.maxvif; ct++) { 19800c12295aSPatrick McHardy if (VIF_EXISTS(mrt, ct) && c->mfc_un.res.ttls[ct] < 255) { 19811da177e4SLinus Torvalds if (skb_tailroom(skb) < RTA_ALIGN(RTA_ALIGN(sizeof(*nhp)) + 4)) 19821da177e4SLinus Torvalds goto rtattr_failure; 19831da177e4SLinus Torvalds nhp = (struct rtnexthop *)skb_put(skb, RTA_ALIGN(sizeof(*nhp))); 19841da177e4SLinus Torvalds nhp->rtnh_flags = 0; 19851da177e4SLinus Torvalds nhp->rtnh_hops = c->mfc_un.res.ttls[ct]; 19860c12295aSPatrick McHardy nhp->rtnh_ifindex = mrt->vif_table[ct].dev->ifindex; 19871da177e4SLinus Torvalds nhp->rtnh_len = sizeof(*nhp); 19881da177e4SLinus Torvalds } 19891da177e4SLinus Torvalds } 19901da177e4SLinus Torvalds mp_head->rta_type = RTA_MULTIPATH; 199127a884dcSArnaldo Carvalho de Melo mp_head->rta_len = skb_tail_pointer(skb) - (u8 *)mp_head; 19921da177e4SLinus Torvalds rtm->rtm_type = RTN_MULTICAST; 19931da177e4SLinus Torvalds return 1; 19941da177e4SLinus Torvalds 19951da177e4SLinus Torvalds rtattr_failure: 1996dc5fc579SArnaldo Carvalho de Melo nlmsg_trim(skb, b); 19971da177e4SLinus Torvalds return -EMSGSIZE; 19981da177e4SLinus Torvalds } 19991da177e4SLinus Torvalds 20004feb88e5SBenjamin Thery int ipmr_get_route(struct net *net, 20014feb88e5SBenjamin Thery struct sk_buff *skb, struct rtmsg *rtm, int nowait) 20021da177e4SLinus Torvalds { 20031da177e4SLinus Torvalds int err; 2004f0ad0860SPatrick McHardy struct mr_table *mrt; 20051da177e4SLinus Torvalds struct mfc_cache *cache; 2006511c3f92SEric Dumazet struct rtable *rt = skb_rtable(skb); 20071da177e4SLinus Torvalds 2008f0ad0860SPatrick McHardy mrt = ipmr_get_table(net, RT_TABLE_DEFAULT); 2009f0ad0860SPatrick McHardy if (mrt == NULL) 2010f0ad0860SPatrick McHardy return -ENOENT; 2011f0ad0860SPatrick McHardy 2012a8c9486bSEric Dumazet rcu_read_lock(); 20130c12295aSPatrick McHardy cache = ipmr_cache_find(mrt, rt->rt_src, rt->rt_dst); 20141da177e4SLinus Torvalds 20151da177e4SLinus Torvalds if (cache == NULL) { 201672287490SAlexey Kuznetsov struct sk_buff *skb2; 2017eddc9ec5SArnaldo Carvalho de Melo struct iphdr *iph; 20181da177e4SLinus Torvalds struct net_device *dev; 2019a8cb16ddSEric Dumazet int vif = -1; 20201da177e4SLinus Torvalds 20211da177e4SLinus Torvalds if (nowait) { 2022a8c9486bSEric Dumazet rcu_read_unlock(); 20231da177e4SLinus Torvalds return -EAGAIN; 20241da177e4SLinus Torvalds } 20251da177e4SLinus Torvalds 20261da177e4SLinus Torvalds dev = skb->dev; 2027a8c9486bSEric Dumazet read_lock(&mrt_lock); 2028a8cb16ddSEric Dumazet if (dev) 2029a8cb16ddSEric Dumazet vif = ipmr_find_vif(mrt, dev); 2030a8cb16ddSEric Dumazet if (vif < 0) { 20311da177e4SLinus Torvalds read_unlock(&mrt_lock); 2032a8c9486bSEric Dumazet rcu_read_unlock(); 20331da177e4SLinus Torvalds return -ENODEV; 20341da177e4SLinus Torvalds } 203572287490SAlexey Kuznetsov skb2 = skb_clone(skb, GFP_ATOMIC); 203672287490SAlexey Kuznetsov if (!skb2) { 203772287490SAlexey Kuznetsov read_unlock(&mrt_lock); 2038a8c9486bSEric Dumazet rcu_read_unlock(); 203972287490SAlexey Kuznetsov return -ENOMEM; 204072287490SAlexey Kuznetsov } 204172287490SAlexey Kuznetsov 2042e2d1bca7SArnaldo Carvalho de Melo skb_push(skb2, sizeof(struct iphdr)); 2043e2d1bca7SArnaldo Carvalho de Melo skb_reset_network_header(skb2); 2044eddc9ec5SArnaldo Carvalho de Melo iph = ip_hdr(skb2); 2045eddc9ec5SArnaldo Carvalho de Melo iph->ihl = sizeof(struct iphdr) >> 2; 2046eddc9ec5SArnaldo Carvalho de Melo iph->saddr = rt->rt_src; 2047eddc9ec5SArnaldo Carvalho de Melo iph->daddr = rt->rt_dst; 2048eddc9ec5SArnaldo Carvalho de Melo iph->version = 0; 20490c12295aSPatrick McHardy err = ipmr_cache_unresolved(mrt, vif, skb2); 20501da177e4SLinus Torvalds read_unlock(&mrt_lock); 2051a8c9486bSEric Dumazet rcu_read_unlock(); 20521da177e4SLinus Torvalds return err; 20531da177e4SLinus Torvalds } 20541da177e4SLinus Torvalds 2055a8c9486bSEric Dumazet read_lock(&mrt_lock); 20561da177e4SLinus Torvalds if (!nowait && (rtm->rtm_flags & RTM_F_NOTIFY)) 20571da177e4SLinus Torvalds cache->mfc_flags |= MFC_NOTIFY; 2058cb6a4e46SPatrick McHardy err = __ipmr_fill_mroute(mrt, skb, cache, rtm); 20591da177e4SLinus Torvalds read_unlock(&mrt_lock); 2060a8c9486bSEric Dumazet rcu_read_unlock(); 20611da177e4SLinus Torvalds return err; 20621da177e4SLinus Torvalds } 20631da177e4SLinus Torvalds 2064cb6a4e46SPatrick McHardy static int ipmr_fill_mroute(struct mr_table *mrt, struct sk_buff *skb, 2065cb6a4e46SPatrick McHardy u32 pid, u32 seq, struct mfc_cache *c) 2066cb6a4e46SPatrick McHardy { 2067cb6a4e46SPatrick McHardy struct nlmsghdr *nlh; 2068cb6a4e46SPatrick McHardy struct rtmsg *rtm; 2069cb6a4e46SPatrick McHardy 2070cb6a4e46SPatrick McHardy nlh = nlmsg_put(skb, pid, seq, RTM_NEWROUTE, sizeof(*rtm), NLM_F_MULTI); 2071cb6a4e46SPatrick McHardy if (nlh == NULL) 2072cb6a4e46SPatrick McHardy return -EMSGSIZE; 2073cb6a4e46SPatrick McHardy 2074cb6a4e46SPatrick McHardy rtm = nlmsg_data(nlh); 2075cb6a4e46SPatrick McHardy rtm->rtm_family = RTNL_FAMILY_IPMR; 2076cb6a4e46SPatrick McHardy rtm->rtm_dst_len = 32; 2077cb6a4e46SPatrick McHardy rtm->rtm_src_len = 32; 2078cb6a4e46SPatrick McHardy rtm->rtm_tos = 0; 2079cb6a4e46SPatrick McHardy rtm->rtm_table = mrt->id; 2080cb6a4e46SPatrick McHardy NLA_PUT_U32(skb, RTA_TABLE, mrt->id); 2081cb6a4e46SPatrick McHardy rtm->rtm_type = RTN_MULTICAST; 2082cb6a4e46SPatrick McHardy rtm->rtm_scope = RT_SCOPE_UNIVERSE; 2083cb6a4e46SPatrick McHardy rtm->rtm_protocol = RTPROT_UNSPEC; 2084cb6a4e46SPatrick McHardy rtm->rtm_flags = 0; 2085cb6a4e46SPatrick McHardy 2086cb6a4e46SPatrick McHardy NLA_PUT_BE32(skb, RTA_SRC, c->mfc_origin); 2087cb6a4e46SPatrick McHardy NLA_PUT_BE32(skb, RTA_DST, c->mfc_mcastgrp); 2088cb6a4e46SPatrick McHardy 2089cb6a4e46SPatrick McHardy if (__ipmr_fill_mroute(mrt, skb, c, rtm) < 0) 2090cb6a4e46SPatrick McHardy goto nla_put_failure; 2091cb6a4e46SPatrick McHardy 2092cb6a4e46SPatrick McHardy return nlmsg_end(skb, nlh); 2093cb6a4e46SPatrick McHardy 2094cb6a4e46SPatrick McHardy nla_put_failure: 2095cb6a4e46SPatrick McHardy nlmsg_cancel(skb, nlh); 2096cb6a4e46SPatrick McHardy return -EMSGSIZE; 2097cb6a4e46SPatrick McHardy } 2098cb6a4e46SPatrick McHardy 2099cb6a4e46SPatrick McHardy static int ipmr_rtm_dumproute(struct sk_buff *skb, struct netlink_callback *cb) 2100cb6a4e46SPatrick McHardy { 2101cb6a4e46SPatrick McHardy struct net *net = sock_net(skb->sk); 2102cb6a4e46SPatrick McHardy struct mr_table *mrt; 2103cb6a4e46SPatrick McHardy struct mfc_cache *mfc; 2104cb6a4e46SPatrick McHardy unsigned int t = 0, s_t; 2105cb6a4e46SPatrick McHardy unsigned int h = 0, s_h; 2106cb6a4e46SPatrick McHardy unsigned int e = 0, s_e; 2107cb6a4e46SPatrick McHardy 2108cb6a4e46SPatrick McHardy s_t = cb->args[0]; 2109cb6a4e46SPatrick McHardy s_h = cb->args[1]; 2110cb6a4e46SPatrick McHardy s_e = cb->args[2]; 2111cb6a4e46SPatrick McHardy 2112a8c9486bSEric Dumazet rcu_read_lock(); 2113cb6a4e46SPatrick McHardy ipmr_for_each_table(mrt, net) { 2114cb6a4e46SPatrick McHardy if (t < s_t) 2115cb6a4e46SPatrick McHardy goto next_table; 2116cb6a4e46SPatrick McHardy if (t > s_t) 2117cb6a4e46SPatrick McHardy s_h = 0; 2118cb6a4e46SPatrick McHardy for (h = s_h; h < MFC_LINES; h++) { 2119a8c9486bSEric Dumazet list_for_each_entry_rcu(mfc, &mrt->mfc_cache_array[h], list) { 2120cb6a4e46SPatrick McHardy if (e < s_e) 2121cb6a4e46SPatrick McHardy goto next_entry; 2122cb6a4e46SPatrick McHardy if (ipmr_fill_mroute(mrt, skb, 2123cb6a4e46SPatrick McHardy NETLINK_CB(cb->skb).pid, 2124cb6a4e46SPatrick McHardy cb->nlh->nlmsg_seq, 2125cb6a4e46SPatrick McHardy mfc) < 0) 2126cb6a4e46SPatrick McHardy goto done; 2127cb6a4e46SPatrick McHardy next_entry: 2128cb6a4e46SPatrick McHardy e++; 2129cb6a4e46SPatrick McHardy } 2130cb6a4e46SPatrick McHardy e = s_e = 0; 2131cb6a4e46SPatrick McHardy } 2132cb6a4e46SPatrick McHardy s_h = 0; 2133cb6a4e46SPatrick McHardy next_table: 2134cb6a4e46SPatrick McHardy t++; 2135cb6a4e46SPatrick McHardy } 2136cb6a4e46SPatrick McHardy done: 2137a8c9486bSEric Dumazet rcu_read_unlock(); 2138cb6a4e46SPatrick McHardy 2139cb6a4e46SPatrick McHardy cb->args[2] = e; 2140cb6a4e46SPatrick McHardy cb->args[1] = h; 2141cb6a4e46SPatrick McHardy cb->args[0] = t; 2142cb6a4e46SPatrick McHardy 2143cb6a4e46SPatrick McHardy return skb->len; 2144cb6a4e46SPatrick McHardy } 2145cb6a4e46SPatrick McHardy 21461da177e4SLinus Torvalds #ifdef CONFIG_PROC_FS 21471da177e4SLinus Torvalds /* 2148a8cb16ddSEric Dumazet * The /proc interfaces to multicast routing : 2149a8cb16ddSEric Dumazet * /proc/net/ip_mr_cache & /proc/net/ip_mr_vif 21501da177e4SLinus Torvalds */ 21511da177e4SLinus Torvalds struct ipmr_vif_iter { 2152f6bb4514SBenjamin Thery struct seq_net_private p; 2153f0ad0860SPatrick McHardy struct mr_table *mrt; 21541da177e4SLinus Torvalds int ct; 21551da177e4SLinus Torvalds }; 21561da177e4SLinus Torvalds 2157f6bb4514SBenjamin Thery static struct vif_device *ipmr_vif_seq_idx(struct net *net, 2158f6bb4514SBenjamin Thery struct ipmr_vif_iter *iter, 21591da177e4SLinus Torvalds loff_t pos) 21601da177e4SLinus Torvalds { 2161f0ad0860SPatrick McHardy struct mr_table *mrt = iter->mrt; 21620c12295aSPatrick McHardy 21630c12295aSPatrick McHardy for (iter->ct = 0; iter->ct < mrt->maxvif; ++iter->ct) { 21640c12295aSPatrick McHardy if (!VIF_EXISTS(mrt, iter->ct)) 21651da177e4SLinus Torvalds continue; 21661da177e4SLinus Torvalds if (pos-- == 0) 21670c12295aSPatrick McHardy return &mrt->vif_table[iter->ct]; 21681da177e4SLinus Torvalds } 21691da177e4SLinus Torvalds return NULL; 21701da177e4SLinus Torvalds } 21711da177e4SLinus Torvalds 21721da177e4SLinus Torvalds static void *ipmr_vif_seq_start(struct seq_file *seq, loff_t *pos) 2173ba93ef74SStephen Hemminger __acquires(mrt_lock) 21741da177e4SLinus Torvalds { 2175f0ad0860SPatrick McHardy struct ipmr_vif_iter *iter = seq->private; 2176f6bb4514SBenjamin Thery struct net *net = seq_file_net(seq); 2177f0ad0860SPatrick McHardy struct mr_table *mrt; 2178f0ad0860SPatrick McHardy 2179f0ad0860SPatrick McHardy mrt = ipmr_get_table(net, RT_TABLE_DEFAULT); 2180f0ad0860SPatrick McHardy if (mrt == NULL) 2181f0ad0860SPatrick McHardy return ERR_PTR(-ENOENT); 2182f0ad0860SPatrick McHardy 2183f0ad0860SPatrick McHardy iter->mrt = mrt; 2184f6bb4514SBenjamin Thery 21851da177e4SLinus Torvalds read_lock(&mrt_lock); 2186f6bb4514SBenjamin Thery return *pos ? ipmr_vif_seq_idx(net, seq->private, *pos - 1) 21871da177e4SLinus Torvalds : SEQ_START_TOKEN; 21881da177e4SLinus Torvalds } 21891da177e4SLinus Torvalds 21901da177e4SLinus Torvalds static void *ipmr_vif_seq_next(struct seq_file *seq, void *v, loff_t *pos) 21911da177e4SLinus Torvalds { 21921da177e4SLinus Torvalds struct ipmr_vif_iter *iter = seq->private; 2193f6bb4514SBenjamin Thery struct net *net = seq_file_net(seq); 2194f0ad0860SPatrick McHardy struct mr_table *mrt = iter->mrt; 21951da177e4SLinus Torvalds 21961da177e4SLinus Torvalds ++*pos; 21971da177e4SLinus Torvalds if (v == SEQ_START_TOKEN) 2198f6bb4514SBenjamin Thery return ipmr_vif_seq_idx(net, iter, 0); 21991da177e4SLinus Torvalds 22000c12295aSPatrick McHardy while (++iter->ct < mrt->maxvif) { 22010c12295aSPatrick McHardy if (!VIF_EXISTS(mrt, iter->ct)) 22021da177e4SLinus Torvalds continue; 22030c12295aSPatrick McHardy return &mrt->vif_table[iter->ct]; 22041da177e4SLinus Torvalds } 22051da177e4SLinus Torvalds return NULL; 22061da177e4SLinus Torvalds } 22071da177e4SLinus Torvalds 22081da177e4SLinus Torvalds static void ipmr_vif_seq_stop(struct seq_file *seq, void *v) 2209ba93ef74SStephen Hemminger __releases(mrt_lock) 22101da177e4SLinus Torvalds { 22111da177e4SLinus Torvalds read_unlock(&mrt_lock); 22121da177e4SLinus Torvalds } 22131da177e4SLinus Torvalds 22141da177e4SLinus Torvalds static int ipmr_vif_seq_show(struct seq_file *seq, void *v) 22151da177e4SLinus Torvalds { 2216f0ad0860SPatrick McHardy struct ipmr_vif_iter *iter = seq->private; 2217f0ad0860SPatrick McHardy struct mr_table *mrt = iter->mrt; 2218f6bb4514SBenjamin Thery 22191da177e4SLinus Torvalds if (v == SEQ_START_TOKEN) { 22201da177e4SLinus Torvalds seq_puts(seq, 22211da177e4SLinus Torvalds "Interface BytesIn PktsIn BytesOut PktsOut Flags Local Remote\n"); 22221da177e4SLinus Torvalds } else { 22231da177e4SLinus Torvalds const struct vif_device *vif = v; 22241da177e4SLinus Torvalds const char *name = vif->dev ? vif->dev->name : "none"; 22251da177e4SLinus Torvalds 22261da177e4SLinus Torvalds seq_printf(seq, 22271da177e4SLinus Torvalds "%2Zd %-10s %8ld %7ld %8ld %7ld %05X %08X %08X\n", 22280c12295aSPatrick McHardy vif - mrt->vif_table, 22291da177e4SLinus Torvalds name, vif->bytes_in, vif->pkt_in, 22301da177e4SLinus Torvalds vif->bytes_out, vif->pkt_out, 22311da177e4SLinus Torvalds vif->flags, vif->local, vif->remote); 22321da177e4SLinus Torvalds } 22331da177e4SLinus Torvalds return 0; 22341da177e4SLinus Torvalds } 22351da177e4SLinus Torvalds 2236f690808eSStephen Hemminger static const struct seq_operations ipmr_vif_seq_ops = { 22371da177e4SLinus Torvalds .start = ipmr_vif_seq_start, 22381da177e4SLinus Torvalds .next = ipmr_vif_seq_next, 22391da177e4SLinus Torvalds .stop = ipmr_vif_seq_stop, 22401da177e4SLinus Torvalds .show = ipmr_vif_seq_show, 22411da177e4SLinus Torvalds }; 22421da177e4SLinus Torvalds 22431da177e4SLinus Torvalds static int ipmr_vif_open(struct inode *inode, struct file *file) 22441da177e4SLinus Torvalds { 2245f6bb4514SBenjamin Thery return seq_open_net(inode, file, &ipmr_vif_seq_ops, 2246cf7732e4SPavel Emelyanov sizeof(struct ipmr_vif_iter)); 22471da177e4SLinus Torvalds } 22481da177e4SLinus Torvalds 22499a32144eSArjan van de Ven static const struct file_operations ipmr_vif_fops = { 22501da177e4SLinus Torvalds .owner = THIS_MODULE, 22511da177e4SLinus Torvalds .open = ipmr_vif_open, 22521da177e4SLinus Torvalds .read = seq_read, 22531da177e4SLinus Torvalds .llseek = seq_lseek, 2254f6bb4514SBenjamin Thery .release = seq_release_net, 22551da177e4SLinus Torvalds }; 22561da177e4SLinus Torvalds 22571da177e4SLinus Torvalds struct ipmr_mfc_iter { 2258f6bb4514SBenjamin Thery struct seq_net_private p; 2259f0ad0860SPatrick McHardy struct mr_table *mrt; 2260862465f2SPatrick McHardy struct list_head *cache; 22611da177e4SLinus Torvalds int ct; 22621da177e4SLinus Torvalds }; 22631da177e4SLinus Torvalds 22641da177e4SLinus Torvalds 2265f6bb4514SBenjamin Thery static struct mfc_cache *ipmr_mfc_seq_idx(struct net *net, 2266f6bb4514SBenjamin Thery struct ipmr_mfc_iter *it, loff_t pos) 22671da177e4SLinus Torvalds { 2268f0ad0860SPatrick McHardy struct mr_table *mrt = it->mrt; 22691da177e4SLinus Torvalds struct mfc_cache *mfc; 22701da177e4SLinus Torvalds 2271a8c9486bSEric Dumazet rcu_read_lock(); 2272862465f2SPatrick McHardy for (it->ct = 0; it->ct < MFC_LINES; it->ct++) { 22730c12295aSPatrick McHardy it->cache = &mrt->mfc_cache_array[it->ct]; 2274a8c9486bSEric Dumazet list_for_each_entry_rcu(mfc, it->cache, list) 22751da177e4SLinus Torvalds if (pos-- == 0) 22761da177e4SLinus Torvalds return mfc; 2277862465f2SPatrick McHardy } 2278a8c9486bSEric Dumazet rcu_read_unlock(); 22791da177e4SLinus Torvalds 22801da177e4SLinus Torvalds spin_lock_bh(&mfc_unres_lock); 22810c12295aSPatrick McHardy it->cache = &mrt->mfc_unres_queue; 2282862465f2SPatrick McHardy list_for_each_entry(mfc, it->cache, list) 2283e258beb2SPatrick McHardy if (pos-- == 0) 22841da177e4SLinus Torvalds return mfc; 22851da177e4SLinus Torvalds spin_unlock_bh(&mfc_unres_lock); 22861da177e4SLinus Torvalds 22871da177e4SLinus Torvalds it->cache = NULL; 22881da177e4SLinus Torvalds return NULL; 22891da177e4SLinus Torvalds } 22901da177e4SLinus Torvalds 22911da177e4SLinus Torvalds 22921da177e4SLinus Torvalds static void *ipmr_mfc_seq_start(struct seq_file *seq, loff_t *pos) 22931da177e4SLinus Torvalds { 22941da177e4SLinus Torvalds struct ipmr_mfc_iter *it = seq->private; 2295f6bb4514SBenjamin Thery struct net *net = seq_file_net(seq); 2296f0ad0860SPatrick McHardy struct mr_table *mrt; 2297f6bb4514SBenjamin Thery 2298f0ad0860SPatrick McHardy mrt = ipmr_get_table(net, RT_TABLE_DEFAULT); 2299f0ad0860SPatrick McHardy if (mrt == NULL) 2300f0ad0860SPatrick McHardy return ERR_PTR(-ENOENT); 2301f0ad0860SPatrick McHardy 2302f0ad0860SPatrick McHardy it->mrt = mrt; 23031da177e4SLinus Torvalds it->cache = NULL; 23041da177e4SLinus Torvalds it->ct = 0; 2305f6bb4514SBenjamin Thery return *pos ? ipmr_mfc_seq_idx(net, seq->private, *pos - 1) 23061da177e4SLinus Torvalds : SEQ_START_TOKEN; 23071da177e4SLinus Torvalds } 23081da177e4SLinus Torvalds 23091da177e4SLinus Torvalds static void *ipmr_mfc_seq_next(struct seq_file *seq, void *v, loff_t *pos) 23101da177e4SLinus Torvalds { 23111da177e4SLinus Torvalds struct mfc_cache *mfc = v; 23121da177e4SLinus Torvalds struct ipmr_mfc_iter *it = seq->private; 2313f6bb4514SBenjamin Thery struct net *net = seq_file_net(seq); 2314f0ad0860SPatrick McHardy struct mr_table *mrt = it->mrt; 23151da177e4SLinus Torvalds 23161da177e4SLinus Torvalds ++*pos; 23171da177e4SLinus Torvalds 23181da177e4SLinus Torvalds if (v == SEQ_START_TOKEN) 2319f6bb4514SBenjamin Thery return ipmr_mfc_seq_idx(net, seq->private, 0); 23201da177e4SLinus Torvalds 2321862465f2SPatrick McHardy if (mfc->list.next != it->cache) 2322862465f2SPatrick McHardy return list_entry(mfc->list.next, struct mfc_cache, list); 23231da177e4SLinus Torvalds 23240c12295aSPatrick McHardy if (it->cache == &mrt->mfc_unres_queue) 23251da177e4SLinus Torvalds goto end_of_list; 23261da177e4SLinus Torvalds 23270c12295aSPatrick McHardy BUG_ON(it->cache != &mrt->mfc_cache_array[it->ct]); 23281da177e4SLinus Torvalds 23291da177e4SLinus Torvalds while (++it->ct < MFC_LINES) { 23300c12295aSPatrick McHardy it->cache = &mrt->mfc_cache_array[it->ct]; 2331862465f2SPatrick McHardy if (list_empty(it->cache)) 2332862465f2SPatrick McHardy continue; 2333862465f2SPatrick McHardy return list_first_entry(it->cache, struct mfc_cache, list); 23341da177e4SLinus Torvalds } 23351da177e4SLinus Torvalds 23361da177e4SLinus Torvalds /* exhausted cache_array, show unresolved */ 2337a8c9486bSEric Dumazet rcu_read_unlock(); 23380c12295aSPatrick McHardy it->cache = &mrt->mfc_unres_queue; 23391da177e4SLinus Torvalds it->ct = 0; 23401da177e4SLinus Torvalds 23411da177e4SLinus Torvalds spin_lock_bh(&mfc_unres_lock); 2342862465f2SPatrick McHardy if (!list_empty(it->cache)) 2343862465f2SPatrick McHardy return list_first_entry(it->cache, struct mfc_cache, list); 23441da177e4SLinus Torvalds 23451da177e4SLinus Torvalds end_of_list: 23461da177e4SLinus Torvalds spin_unlock_bh(&mfc_unres_lock); 23471da177e4SLinus Torvalds it->cache = NULL; 23481da177e4SLinus Torvalds 23491da177e4SLinus Torvalds return NULL; 23501da177e4SLinus Torvalds } 23511da177e4SLinus Torvalds 23521da177e4SLinus Torvalds static void ipmr_mfc_seq_stop(struct seq_file *seq, void *v) 23531da177e4SLinus Torvalds { 23541da177e4SLinus Torvalds struct ipmr_mfc_iter *it = seq->private; 2355f0ad0860SPatrick McHardy struct mr_table *mrt = it->mrt; 23561da177e4SLinus Torvalds 23570c12295aSPatrick McHardy if (it->cache == &mrt->mfc_unres_queue) 23581da177e4SLinus Torvalds spin_unlock_bh(&mfc_unres_lock); 23590c12295aSPatrick McHardy else if (it->cache == &mrt->mfc_cache_array[it->ct]) 2360a8c9486bSEric Dumazet rcu_read_unlock(); 23611da177e4SLinus Torvalds } 23621da177e4SLinus Torvalds 23631da177e4SLinus Torvalds static int ipmr_mfc_seq_show(struct seq_file *seq, void *v) 23641da177e4SLinus Torvalds { 23651da177e4SLinus Torvalds int n; 23661da177e4SLinus Torvalds 23671da177e4SLinus Torvalds if (v == SEQ_START_TOKEN) { 23681da177e4SLinus Torvalds seq_puts(seq, 23691da177e4SLinus Torvalds "Group Origin Iif Pkts Bytes Wrong Oifs\n"); 23701da177e4SLinus Torvalds } else { 23711da177e4SLinus Torvalds const struct mfc_cache *mfc = v; 23721da177e4SLinus Torvalds const struct ipmr_mfc_iter *it = seq->private; 2373f0ad0860SPatrick McHardy const struct mr_table *mrt = it->mrt; 23741da177e4SLinus Torvalds 23750eae88f3SEric Dumazet seq_printf(seq, "%08X %08X %-3hd", 23760eae88f3SEric Dumazet (__force u32) mfc->mfc_mcastgrp, 23770eae88f3SEric Dumazet (__force u32) mfc->mfc_origin, 23781ea472e2SBenjamin Thery mfc->mfc_parent); 23791ea472e2SBenjamin Thery 23800c12295aSPatrick McHardy if (it->cache != &mrt->mfc_unres_queue) { 23811ea472e2SBenjamin Thery seq_printf(seq, " %8lu %8lu %8lu", 23821da177e4SLinus Torvalds mfc->mfc_un.res.pkt, 23831da177e4SLinus Torvalds mfc->mfc_un.res.bytes, 23841da177e4SLinus Torvalds mfc->mfc_un.res.wrong_if); 23851da177e4SLinus Torvalds for (n = mfc->mfc_un.res.minvif; 23861da177e4SLinus Torvalds n < mfc->mfc_un.res.maxvif; n++) { 23870c12295aSPatrick McHardy if (VIF_EXISTS(mrt, n) && 2388cf958ae3SBenjamin Thery mfc->mfc_un.res.ttls[n] < 255) 23891da177e4SLinus Torvalds seq_printf(seq, 23901da177e4SLinus Torvalds " %2d:%-3d", 23911da177e4SLinus Torvalds n, mfc->mfc_un.res.ttls[n]); 23921da177e4SLinus Torvalds } 23931ea472e2SBenjamin Thery } else { 23941ea472e2SBenjamin Thery /* unresolved mfc_caches don't contain 23951ea472e2SBenjamin Thery * pkt, bytes and wrong_if values 23961ea472e2SBenjamin Thery */ 23971ea472e2SBenjamin Thery seq_printf(seq, " %8lu %8lu %8lu", 0ul, 0ul, 0ul); 23981da177e4SLinus Torvalds } 23991da177e4SLinus Torvalds seq_putc(seq, '\n'); 24001da177e4SLinus Torvalds } 24011da177e4SLinus Torvalds return 0; 24021da177e4SLinus Torvalds } 24031da177e4SLinus Torvalds 2404f690808eSStephen Hemminger static const struct seq_operations ipmr_mfc_seq_ops = { 24051da177e4SLinus Torvalds .start = ipmr_mfc_seq_start, 24061da177e4SLinus Torvalds .next = ipmr_mfc_seq_next, 24071da177e4SLinus Torvalds .stop = ipmr_mfc_seq_stop, 24081da177e4SLinus Torvalds .show = ipmr_mfc_seq_show, 24091da177e4SLinus Torvalds }; 24101da177e4SLinus Torvalds 24111da177e4SLinus Torvalds static int ipmr_mfc_open(struct inode *inode, struct file *file) 24121da177e4SLinus Torvalds { 2413f6bb4514SBenjamin Thery return seq_open_net(inode, file, &ipmr_mfc_seq_ops, 2414cf7732e4SPavel Emelyanov sizeof(struct ipmr_mfc_iter)); 24151da177e4SLinus Torvalds } 24161da177e4SLinus Torvalds 24179a32144eSArjan van de Ven static const struct file_operations ipmr_mfc_fops = { 24181da177e4SLinus Torvalds .owner = THIS_MODULE, 24191da177e4SLinus Torvalds .open = ipmr_mfc_open, 24201da177e4SLinus Torvalds .read = seq_read, 24211da177e4SLinus Torvalds .llseek = seq_lseek, 2422f6bb4514SBenjamin Thery .release = seq_release_net, 24231da177e4SLinus Torvalds }; 24241da177e4SLinus Torvalds #endif 24251da177e4SLinus Torvalds 24261da177e4SLinus Torvalds #ifdef CONFIG_IP_PIMSM_V2 242732613090SAlexey Dobriyan static const struct net_protocol pim_protocol = { 24281da177e4SLinus Torvalds .handler = pim_rcv, 2429403dbb97STom Goff .netns_ok = 1, 24301da177e4SLinus Torvalds }; 24311da177e4SLinus Torvalds #endif 24321da177e4SLinus Torvalds 24331da177e4SLinus Torvalds 24341da177e4SLinus Torvalds /* 24351da177e4SLinus Torvalds * Setup for IP multicast routing 24361da177e4SLinus Torvalds */ 2437cf958ae3SBenjamin Thery static int __net_init ipmr_net_init(struct net *net) 2438cf958ae3SBenjamin Thery { 2439f0ad0860SPatrick McHardy int err; 2440cf958ae3SBenjamin Thery 2441f0ad0860SPatrick McHardy err = ipmr_rules_init(net); 2442f0ad0860SPatrick McHardy if (err < 0) 2443cf958ae3SBenjamin Thery goto fail; 2444f6bb4514SBenjamin Thery 2445f6bb4514SBenjamin Thery #ifdef CONFIG_PROC_FS 2446f6bb4514SBenjamin Thery err = -ENOMEM; 2447f6bb4514SBenjamin Thery if (!proc_net_fops_create(net, "ip_mr_vif", 0, &ipmr_vif_fops)) 2448f6bb4514SBenjamin Thery goto proc_vif_fail; 2449f6bb4514SBenjamin Thery if (!proc_net_fops_create(net, "ip_mr_cache", 0, &ipmr_mfc_fops)) 2450f6bb4514SBenjamin Thery goto proc_cache_fail; 2451f6bb4514SBenjamin Thery #endif 24522bb8b26cSBenjamin Thery return 0; 24532bb8b26cSBenjamin Thery 2454f6bb4514SBenjamin Thery #ifdef CONFIG_PROC_FS 2455f6bb4514SBenjamin Thery proc_cache_fail: 2456f6bb4514SBenjamin Thery proc_net_remove(net, "ip_mr_vif"); 2457f6bb4514SBenjamin Thery proc_vif_fail: 2458f0ad0860SPatrick McHardy ipmr_rules_exit(net); 2459f6bb4514SBenjamin Thery #endif 2460cf958ae3SBenjamin Thery fail: 2461cf958ae3SBenjamin Thery return err; 2462cf958ae3SBenjamin Thery } 2463cf958ae3SBenjamin Thery 2464cf958ae3SBenjamin Thery static void __net_exit ipmr_net_exit(struct net *net) 2465cf958ae3SBenjamin Thery { 2466f6bb4514SBenjamin Thery #ifdef CONFIG_PROC_FS 2467f6bb4514SBenjamin Thery proc_net_remove(net, "ip_mr_cache"); 2468f6bb4514SBenjamin Thery proc_net_remove(net, "ip_mr_vif"); 2469f6bb4514SBenjamin Thery #endif 2470f0ad0860SPatrick McHardy ipmr_rules_exit(net); 2471cf958ae3SBenjamin Thery } 2472cf958ae3SBenjamin Thery 2473cf958ae3SBenjamin Thery static struct pernet_operations ipmr_net_ops = { 2474cf958ae3SBenjamin Thery .init = ipmr_net_init, 2475cf958ae3SBenjamin Thery .exit = ipmr_net_exit, 2476cf958ae3SBenjamin Thery }; 24771da177e4SLinus Torvalds 247803d2f897SWang Chen int __init ip_mr_init(void) 24791da177e4SLinus Torvalds { 248003d2f897SWang Chen int err; 248103d2f897SWang Chen 24821da177e4SLinus Torvalds mrt_cachep = kmem_cache_create("ip_mrt_cache", 24831da177e4SLinus Torvalds sizeof(struct mfc_cache), 2484e5d679f3SAlexey Dobriyan 0, SLAB_HWCACHE_ALIGN | SLAB_PANIC, 248520c2df83SPaul Mundt NULL); 248603d2f897SWang Chen if (!mrt_cachep) 248703d2f897SWang Chen return -ENOMEM; 248803d2f897SWang Chen 2489cf958ae3SBenjamin Thery err = register_pernet_subsys(&ipmr_net_ops); 2490cf958ae3SBenjamin Thery if (err) 2491cf958ae3SBenjamin Thery goto reg_pernet_fail; 2492cf958ae3SBenjamin Thery 249303d2f897SWang Chen err = register_netdevice_notifier(&ip_mr_notifier); 249403d2f897SWang Chen if (err) 249503d2f897SWang Chen goto reg_notif_fail; 2496403dbb97STom Goff #ifdef CONFIG_IP_PIMSM_V2 2497403dbb97STom Goff if (inet_add_protocol(&pim_protocol, IPPROTO_PIM) < 0) { 2498403dbb97STom Goff printk(KERN_ERR "ip_mr_init: can't add PIM protocol\n"); 2499403dbb97STom Goff err = -EAGAIN; 2500403dbb97STom Goff goto add_proto_fail; 2501403dbb97STom Goff } 2502403dbb97STom Goff #endif 2503cb6a4e46SPatrick McHardy rtnl_register(RTNL_FAMILY_IPMR, RTM_GETROUTE, NULL, ipmr_rtm_dumproute); 250403d2f897SWang Chen return 0; 2505f6bb4514SBenjamin Thery 2506403dbb97STom Goff #ifdef CONFIG_IP_PIMSM_V2 2507403dbb97STom Goff add_proto_fail: 2508403dbb97STom Goff unregister_netdevice_notifier(&ip_mr_notifier); 2509403dbb97STom Goff #endif 2510c3e38896SBenjamin Thery reg_notif_fail: 2511cf958ae3SBenjamin Thery unregister_pernet_subsys(&ipmr_net_ops); 2512cf958ae3SBenjamin Thery reg_pernet_fail: 2513c3e38896SBenjamin Thery kmem_cache_destroy(mrt_cachep); 251403d2f897SWang Chen return err; 25151da177e4SLinus Torvalds } 2516