xref: /freebsd/sys/net/if.c (revision 5129159789cc9d7bc514e4546b88e3427695002d)
1 /*
2  * Copyright (c) 1980, 1986, 1993
3  *	The Regents of the University of California.  All rights reserved.
4  *
5  * Redistribution and use in source and binary forms, with or without
6  * modification, are permitted provided that the following conditions
7  * are met:
8  * 1. Redistributions of source code must retain the above copyright
9  *    notice, this list of conditions and the following disclaimer.
10  * 2. Redistributions in binary form must reproduce the above copyright
11  *    notice, this list of conditions and the following disclaimer in the
12  *    documentation and/or other materials provided with the distribution.
13  * 3. All advertising materials mentioning features or use of this software
14  *    must display the following acknowledgement:
15  *	This product includes software developed by the University of
16  *	California, Berkeley and its contributors.
17  * 4. Neither the name of the University nor the names of its contributors
18  *    may be used to endorse or promote products derived from this software
19  *    without specific prior written permission.
20  *
21  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
22  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
26  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
27  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
28  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
29  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
30  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
31  * SUCH DAMAGE.
32  *
33  *	@(#)if.c	8.3 (Berkeley) 1/4/94
34  * $FreeBSD$
35  */
36 
37 #include "opt_compat.h"
38 #include "opt_inet6.h"
39 
40 #include <sys/param.h>
41 #include <sys/malloc.h>
42 #include <sys/mbuf.h>
43 #include <sys/systm.h>
44 #include <sys/proc.h>
45 #include <sys/socket.h>
46 #include <sys/socketvar.h>
47 #include <sys/protosw.h>
48 #include <sys/kernel.h>
49 #include <sys/sockio.h>
50 #include <sys/syslog.h>
51 #include <sys/sysctl.h>
52 
53 #include <net/if.h>
54 #include <net/if_dl.h>
55 #include <net/radix.h>
56 #include <net/route.h>
57 
58 #ifdef INET6
59 /*XXX*/
60 #include <netinet/in.h>
61 #endif
62 
63 /*
64  * System initialization
65  */
66 
67 static int ifconf __P((u_long, caddr_t));
68 static void ifinit __P((void *));
69 static void if_qflush __P((struct ifqueue *));
70 static void if_slowtimo __P((void *));
71 static void link_rtrequest __P((int, struct rtentry *, struct sockaddr *));
72 static int  if_rtdel __P((struct radix_node *, void *));
73 
74 SYSINIT(interfaces, SI_SUB_PROTO_IF, SI_ORDER_FIRST, ifinit, NULL)
75 
76 MALLOC_DEFINE(M_IFADDR, "ifaddr", "interface address");
77 MALLOC_DEFINE(M_IFMADDR, "ether_multi", "link-level multicast address");
78 
79 int	ifqmaxlen = IFQ_MAXLEN;
80 struct	ifnethead ifnet;	/* depend on static init XXX */
81 
82 #ifdef INET6
83 /*
84  * XXX: declare here to avoid to include many inet6 related files..
85  * should be more generalized?
86  */
87 extern void	nd6_setmtu __P((struct ifnet *));
88 #endif
89 
90 /*
91  * Network interface utility routines.
92  *
93  * Routines with ifa_ifwith* names take sockaddr *'s as
94  * parameters.
95  */
96 /* ARGSUSED*/
97 void
98 ifinit(dummy)
99 	void *dummy;
100 {
101 	struct ifnet *ifp;
102 	int s;
103 
104 	s = splimp();
105 	for (ifp = ifnet.tqh_first; ifp; ifp = ifp->if_link.tqe_next)
106 		if (ifp->if_snd.ifq_maxlen == 0) {
107 			printf("%s%d XXX: driver didn't set ifq_maxlen\n",
108 			    ifp->if_name, ifp->if_unit);
109 			ifp->if_snd.ifq_maxlen = ifqmaxlen;
110 		}
111 	splx(s);
112 	if_slowtimo(0);
113 }
114 
115 int if_index = 0;
116 struct ifaddr **ifnet_addrs;
117 struct ifnet **ifindex2ifnet = NULL;
118 
119 
120 /*
121  * Attach an interface to the
122  * list of "active" interfaces.
123  */
124 void
125 if_attach(ifp)
126 	struct ifnet *ifp;
127 {
128 	unsigned socksize, ifasize;
129 	int namelen, masklen;
130 	char workbuf[64];
131 	register struct sockaddr_dl *sdl;
132 	register struct ifaddr *ifa;
133 	static int if_indexlim = 8;
134 	static int inited;
135 
136 	if (!inited) {
137 		TAILQ_INIT(&ifnet);
138 		inited = 1;
139 	}
140 
141 	TAILQ_INSERT_TAIL(&ifnet, ifp, if_link);
142 	ifp->if_index = ++if_index;
143 	/*
144 	 * XXX -
145 	 * The old code would work if the interface passed a pre-existing
146 	 * chain of ifaddrs to this code.  We don't trust our callers to
147 	 * properly initialize the tailq, however, so we no longer allow
148 	 * this unlikely case.
149 	 */
150 	TAILQ_INIT(&ifp->if_addrhead);
151 	TAILQ_INIT(&ifp->if_prefixhead);
152 	LIST_INIT(&ifp->if_multiaddrs);
153 	getmicrotime(&ifp->if_lastchange);
154 	if (ifnet_addrs == 0 || if_index >= if_indexlim) {
155 		unsigned n = (if_indexlim <<= 1) * sizeof(ifa);
156 		caddr_t q = malloc(n, M_IFADDR, M_WAITOK);
157 		bzero(q, n);
158 		if (ifnet_addrs) {
159 			bcopy((caddr_t)ifnet_addrs, (caddr_t)q, n/2);
160 			free((caddr_t)ifnet_addrs, M_IFADDR);
161 		}
162 		ifnet_addrs = (struct ifaddr **)q;
163 
164 		/* grow ifindex2ifnet */
165 		n = if_indexlim * sizeof(struct ifnet *);
166 		q = malloc(n, M_IFADDR, M_WAITOK);
167 		bzero(q, n);
168 		if (ifindex2ifnet) {
169 			bcopy((caddr_t)ifindex2ifnet, q, n/2);
170 			free((caddr_t)ifindex2ifnet, M_IFADDR);
171 		}
172 		ifindex2ifnet = (struct ifnet **)q;
173 	}
174 
175 	ifindex2ifnet[if_index] = ifp;
176 
177 	/*
178 	 * create a Link Level name for this device
179 	 */
180 	namelen = snprintf(workbuf, sizeof(workbuf),
181 	    "%s%d", ifp->if_name, ifp->if_unit);
182 #define _offsetof(t, m) ((int)((caddr_t)&((t *)0)->m))
183 	masklen = _offsetof(struct sockaddr_dl, sdl_data[0]) + namelen;
184 	socksize = masklen + ifp->if_addrlen;
185 #define ROUNDUP(a) (1 + (((a) - 1) | (sizeof(long) - 1)))
186 	if (socksize < sizeof(*sdl))
187 		socksize = sizeof(*sdl);
188 	socksize = ROUNDUP(socksize);
189 	ifasize = sizeof(*ifa) + 2 * socksize;
190 	ifa = (struct ifaddr *)malloc(ifasize, M_IFADDR, M_WAITOK);
191 	if (ifa) {
192 		bzero((caddr_t)ifa, ifasize);
193 		sdl = (struct sockaddr_dl *)(ifa + 1);
194 		sdl->sdl_len = socksize;
195 		sdl->sdl_family = AF_LINK;
196 		bcopy(workbuf, sdl->sdl_data, namelen);
197 		sdl->sdl_nlen = namelen;
198 		sdl->sdl_index = ifp->if_index;
199 		sdl->sdl_type = ifp->if_type;
200 		ifnet_addrs[if_index - 1] = ifa;
201 		ifa->ifa_ifp = ifp;
202 		ifa->ifa_rtrequest = link_rtrequest;
203 		ifa->ifa_addr = (struct sockaddr *)sdl;
204 		sdl = (struct sockaddr_dl *)(socksize + (caddr_t)sdl);
205 		ifa->ifa_netmask = (struct sockaddr *)sdl;
206 		sdl->sdl_len = masklen;
207 		while (namelen != 0)
208 			sdl->sdl_data[--namelen] = 0xff;
209 		TAILQ_INSERT_HEAD(&ifp->if_addrhead, ifa, ifa_link);
210 	}
211 }
212 
213 /*
214  * Detach an interface, removing it from the
215  * list of "active" interfaces.
216  */
217 void
218 if_detach(ifp)
219 	struct ifnet *ifp;
220 {
221 	struct ifaddr *ifa;
222 	struct radix_node_head	*rnh;
223 	int s;
224 	int i;
225 
226 	/*
227 	 * Remove routes and flush queues.
228 	 */
229 	s = splnet();
230 	if_down(ifp);
231 
232 	/*
233 	 * Remove address from ifnet_addrs[] and maybe decrement if_index.
234 	 * Clean up all addresses.
235 	 */
236 	ifnet_addrs[ifp->if_index - 1] = 0;
237 	while (if_index > 0 && ifnet_addrs[if_index - 1] == 0)
238 		if_index--;
239 
240 	for (ifa = TAILQ_FIRST(&ifp->if_addrhead); ifa;
241 	     ifa = TAILQ_FIRST(&ifp->if_addrhead)) {
242 		/* XXX: Ugly!! ad hoc just for INET */
243 		if (ifa->ifa_addr && ifa->ifa_addr->sa_family == AF_INET) {
244 			struct ifaliasreq ifr;
245 
246 			bzero(&ifr, sizeof(ifr));
247 			if (ifa->ifa_addr)
248 				ifr.ifra_addr = *ifa->ifa_addr;
249 			if (ifa->ifa_dstaddr)
250 				ifr.ifra_broadaddr = *ifa->ifa_dstaddr;
251 			if (in_control(NULL, SIOCDIFADDR, (caddr_t)&ifr, ifp,
252 			    NULL) == 0)
253 				continue;
254 		}
255 		TAILQ_REMOVE(&ifp->if_addrhead, ifa, ifa_link);
256 		IFAFREE(ifa);
257 	}
258 
259 	/*
260 	 * Delete all remaining routes using this interface
261 	 * Unfortuneatly the only way to do this is to slog through
262 	 * the entire routing table looking for routes which point
263 	 * to this interface...oh well...
264 	 */
265 	for (i = 1; i <= AF_MAX; i++) {
266 		if ((rnh = rt_tables[i]) == NULL)
267 			continue;
268 		(void) rnh->rnh_walktree(rnh, if_rtdel, ifp);
269 	}
270 
271 	TAILQ_REMOVE(&ifnet, ifp, if_link);
272 	splx(s);
273 }
274 
275 /*
276  * Delete Routes for a Network Interface
277  *
278  * Called for each routing entry via the rnh->rnh_walktree() call above
279  * to delete all route entries referencing a detaching network interface.
280  *
281  * Arguments:
282  *	rn	pointer to node in the routing table
283  *	arg	argument passed to rnh->rnh_walktree() - detaching interface
284  *
285  * Returns:
286  *	0	successful
287  *	errno	failed - reason indicated
288  *
289  */
290 static int
291 if_rtdel(rn, arg)
292 	struct radix_node	*rn;
293 	void			*arg;
294 {
295 	struct rtentry	*rt = (struct rtentry *)rn;
296 	struct ifnet	*ifp = arg;
297 	int		err;
298 
299 	if (rt->rt_ifp == ifp) {
300 
301 		/*
302 		 * Protect (sorta) against walktree recursion problems
303 		 * with cloned routes
304 		 */
305 		if ((rt->rt_flags & RTF_UP) == 0)
306 			return (0);
307 
308 		err = rtrequest(RTM_DELETE, rt_key(rt), rt->rt_gateway,
309 				rt_mask(rt), rt->rt_flags,
310 				(struct rtentry **) NULL);
311 		if (err) {
312 			log(LOG_WARNING, "if_rtdel: error %d\n", err);
313 		}
314 	}
315 
316 	return (0);
317 }
318 
319 /*
320  * Locate an interface based on a complete address.
321  */
322 /*ARGSUSED*/
323 struct ifaddr *
324 ifa_ifwithaddr(addr)
325 	register struct sockaddr *addr;
326 {
327 	register struct ifnet *ifp;
328 	register struct ifaddr *ifa;
329 
330 #define	equal(a1, a2) \
331   (bcmp((caddr_t)(a1), (caddr_t)(a2), ((struct sockaddr *)(a1))->sa_len) == 0)
332 	for (ifp = ifnet.tqh_first; ifp; ifp = ifp->if_link.tqe_next)
333 	    for (ifa = ifp->if_addrhead.tqh_first; ifa;
334 		 ifa = ifa->ifa_link.tqe_next) {
335 		if (ifa->ifa_addr->sa_family != addr->sa_family)
336 			continue;
337 		if (equal(addr, ifa->ifa_addr))
338 			return (ifa);
339 		if ((ifp->if_flags & IFF_BROADCAST) && ifa->ifa_broadaddr &&
340 		    /* IP6 doesn't have broadcast */
341 		    ifa->ifa_broadaddr->sa_len != 0 &&
342 		    equal(ifa->ifa_broadaddr, addr))
343 			return (ifa);
344 	}
345 	return ((struct ifaddr *)0);
346 }
347 /*
348  * Locate the point to point interface with a given destination address.
349  */
350 /*ARGSUSED*/
351 struct ifaddr *
352 ifa_ifwithdstaddr(addr)
353 	register struct sockaddr *addr;
354 {
355 	register struct ifnet *ifp;
356 	register struct ifaddr *ifa;
357 
358 	for (ifp = ifnet.tqh_first; ifp; ifp = ifp->if_link.tqe_next)
359 	    if (ifp->if_flags & IFF_POINTOPOINT)
360 		for (ifa = ifp->if_addrhead.tqh_first; ifa;
361 		     ifa = ifa->ifa_link.tqe_next) {
362 			if (ifa->ifa_addr->sa_family != addr->sa_family)
363 				continue;
364 			if (ifa->ifa_dstaddr && equal(addr, ifa->ifa_dstaddr))
365 				return (ifa);
366 	}
367 	return ((struct ifaddr *)0);
368 }
369 
370 /*
371  * Find an interface on a specific network.  If many, choice
372  * is most specific found.
373  */
374 struct ifaddr *
375 ifa_ifwithnet(addr)
376 	struct sockaddr *addr;
377 {
378 	register struct ifnet *ifp;
379 	register struct ifaddr *ifa;
380 	struct ifaddr *ifa_maybe = (struct ifaddr *) 0;
381 	u_int af = addr->sa_family;
382 	char *addr_data = addr->sa_data, *cplim;
383 
384 	/*
385 	 * AF_LINK addresses can be looked up directly by their index number,
386 	 * so do that if we can.
387 	 */
388 	if (af == AF_LINK) {
389 	    register struct sockaddr_dl *sdl = (struct sockaddr_dl *)addr;
390 	    if (sdl->sdl_index && sdl->sdl_index <= if_index)
391 		return (ifnet_addrs[sdl->sdl_index - 1]);
392 	}
393 
394 	/*
395 	 * Scan though each interface, looking for ones that have
396 	 * addresses in this address family.
397 	 */
398 	for (ifp = ifnet.tqh_first; ifp; ifp = ifp->if_link.tqe_next) {
399 		for (ifa = ifp->if_addrhead.tqh_first; ifa;
400 		     ifa = ifa->ifa_link.tqe_next) {
401 			register char *cp, *cp2, *cp3;
402 
403 			if (ifa->ifa_addr->sa_family != af)
404 next:				continue;
405 			if (
406 #ifdef INET6 /* XXX: for maching gif tunnel dst as routing entry gateway */
407 			    addr->sa_family != AF_INET6 &&
408 #endif
409 			    ifp->if_flags & IFF_POINTOPOINT) {
410 				/*
411 				 * This is a bit broken as it doesn't
412 				 * take into account that the remote end may
413 				 * be a single node in the network we are
414 				 * looking for.
415 				 * The trouble is that we don't know the
416 				 * netmask for the remote end.
417 				 */
418 				if (ifa->ifa_dstaddr != 0
419 				    && equal(addr, ifa->ifa_dstaddr))
420  					return (ifa);
421 			} else {
422 				/*
423 				 * if we have a special address handler,
424 				 * then use it instead of the generic one.
425 				 */
426 	          		if (ifa->ifa_claim_addr) {
427 					if ((*ifa->ifa_claim_addr)(ifa, addr)) {
428 						return (ifa);
429 					} else {
430 						continue;
431 					}
432 				}
433 
434 				/*
435 				 * Scan all the bits in the ifa's address.
436 				 * If a bit dissagrees with what we are
437 				 * looking for, mask it with the netmask
438 				 * to see if it really matters.
439 				 * (A byte at a time)
440 				 */
441 				if (ifa->ifa_netmask == 0)
442 					continue;
443 				cp = addr_data;
444 				cp2 = ifa->ifa_addr->sa_data;
445 				cp3 = ifa->ifa_netmask->sa_data;
446 				cplim = ifa->ifa_netmask->sa_len
447 					+ (char *)ifa->ifa_netmask;
448 				while (cp3 < cplim)
449 					if ((*cp++ ^ *cp2++) & *cp3++)
450 						goto next; /* next address! */
451 				/*
452 				 * If the netmask of what we just found
453 				 * is more specific than what we had before
454 				 * (if we had one) then remember the new one
455 				 * before continuing to search
456 				 * for an even better one.
457 				 */
458 				if (ifa_maybe == 0 ||
459 				    rn_refines((caddr_t)ifa->ifa_netmask,
460 				    (caddr_t)ifa_maybe->ifa_netmask))
461 					ifa_maybe = ifa;
462 			}
463 		}
464 	}
465 	return (ifa_maybe);
466 }
467 
468 /*
469  * Find an interface address specific to an interface best matching
470  * a given address.
471  */
472 struct ifaddr *
473 ifaof_ifpforaddr(addr, ifp)
474 	struct sockaddr *addr;
475 	register struct ifnet *ifp;
476 {
477 	register struct ifaddr *ifa;
478 	register char *cp, *cp2, *cp3;
479 	register char *cplim;
480 	struct ifaddr *ifa_maybe = 0;
481 	u_int af = addr->sa_family;
482 
483 	if (af >= AF_MAX)
484 		return (0);
485 	for (ifa = ifp->if_addrhead.tqh_first; ifa;
486 	     ifa = ifa->ifa_link.tqe_next) {
487 		if (ifa->ifa_addr->sa_family != af)
488 			continue;
489 		if (ifa_maybe == 0)
490 			ifa_maybe = ifa;
491 		if (ifa->ifa_netmask == 0) {
492 			if (equal(addr, ifa->ifa_addr) ||
493 			    (ifa->ifa_dstaddr && equal(addr, ifa->ifa_dstaddr)))
494 				return (ifa);
495 			continue;
496 		}
497 		if (ifp->if_flags & IFF_POINTOPOINT) {
498 			if (equal(addr, ifa->ifa_dstaddr))
499 				return (ifa);
500 		} else {
501 			cp = addr->sa_data;
502 			cp2 = ifa->ifa_addr->sa_data;
503 			cp3 = ifa->ifa_netmask->sa_data;
504 			cplim = ifa->ifa_netmask->sa_len + (char *)ifa->ifa_netmask;
505 			for (; cp3 < cplim; cp3++)
506 				if ((*cp++ ^ *cp2++) & *cp3)
507 					break;
508 			if (cp3 == cplim)
509 				return (ifa);
510 		}
511 	}
512 	return (ifa_maybe);
513 }
514 
515 #include <net/route.h>
516 
517 /*
518  * Default action when installing a route with a Link Level gateway.
519  * Lookup an appropriate real ifa to point to.
520  * This should be moved to /sys/net/link.c eventually.
521  */
522 static void
523 link_rtrequest(cmd, rt, sa)
524 	int cmd;
525 	register struct rtentry *rt;
526 	struct sockaddr *sa;
527 {
528 	register struct ifaddr *ifa;
529 	struct sockaddr *dst;
530 	struct ifnet *ifp;
531 
532 	if (cmd != RTM_ADD || ((ifa = rt->rt_ifa) == 0) ||
533 	    ((ifp = ifa->ifa_ifp) == 0) || ((dst = rt_key(rt)) == 0))
534 		return;
535 	ifa = ifaof_ifpforaddr(dst, ifp);
536 	if (ifa) {
537 		IFAFREE(rt->rt_ifa);
538 		rt->rt_ifa = ifa;
539 		ifa->ifa_refcnt++;
540 		if (ifa->ifa_rtrequest && ifa->ifa_rtrequest != link_rtrequest)
541 			ifa->ifa_rtrequest(cmd, rt, sa);
542 	}
543 }
544 
545 /*
546  * Mark an interface down and notify protocols of
547  * the transition.
548  * NOTE: must be called at splnet or eqivalent.
549  */
550 void
551 if_unroute(ifp, flag, fam)
552 	register struct ifnet *ifp;
553 	int flag, fam;
554 {
555 	register struct ifaddr *ifa;
556 
557 	ifp->if_flags &= ~flag;
558 	getmicrotime(&ifp->if_lastchange);
559 	TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link)
560 		if (fam == PF_UNSPEC || (fam == ifa->ifa_addr->sa_family))
561 			pfctlinput(PRC_IFDOWN, ifa->ifa_addr);
562 	if_qflush(&ifp->if_snd);
563 	rt_ifmsg(ifp);
564 }
565 
566 /*
567  * Mark an interface up and notify protocols of
568  * the transition.
569  * NOTE: must be called at splnet or eqivalent.
570  */
571 void
572 if_route(ifp, flag, fam)
573 	register struct ifnet *ifp;
574 	int flag, fam;
575 {
576 	register struct ifaddr *ifa;
577 
578 	ifp->if_flags |= flag;
579 	getmicrotime(&ifp->if_lastchange);
580 	TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link)
581 		if (fam == PF_UNSPEC || (fam == ifa->ifa_addr->sa_family))
582 			pfctlinput(PRC_IFUP, ifa->ifa_addr);
583 	rt_ifmsg(ifp);
584 #ifdef INET6
585 	in6_if_up(ifp);
586 #endif
587 }
588 
589 /*
590  * Mark an interface down and notify protocols of
591  * the transition.
592  * NOTE: must be called at splnet or eqivalent.
593  */
594 void
595 if_down(ifp)
596 	register struct ifnet *ifp;
597 {
598 
599 	if_unroute(ifp, IFF_UP, AF_UNSPEC);
600 }
601 
602 /*
603  * Mark an interface up and notify protocols of
604  * the transition.
605  * NOTE: must be called at splnet or eqivalent.
606  */
607 void
608 if_up(ifp)
609 	register struct ifnet *ifp;
610 {
611 
612 	if_route(ifp, IFF_UP, AF_UNSPEC);
613 }
614 
615 /*
616  * Flush an interface queue.
617  */
618 static void
619 if_qflush(ifq)
620 	register struct ifqueue *ifq;
621 {
622 	register struct mbuf *m, *n;
623 
624 	n = ifq->ifq_head;
625 	while ((m = n) != 0) {
626 		n = m->m_act;
627 		m_freem(m);
628 	}
629 	ifq->ifq_head = 0;
630 	ifq->ifq_tail = 0;
631 	ifq->ifq_len = 0;
632 }
633 
634 /*
635  * Handle interface watchdog timer routines.  Called
636  * from softclock, we decrement timers (if set) and
637  * call the appropriate interface routine on expiration.
638  */
639 static void
640 if_slowtimo(arg)
641 	void *arg;
642 {
643 	register struct ifnet *ifp;
644 	int s = splimp();
645 
646 	for (ifp = ifnet.tqh_first; ifp; ifp = ifp->if_link.tqe_next) {
647 		if (ifp->if_timer == 0 || --ifp->if_timer)
648 			continue;
649 		if (ifp->if_watchdog)
650 			(*ifp->if_watchdog)(ifp);
651 	}
652 	splx(s);
653 	timeout(if_slowtimo, (void *)0, hz / IFNET_SLOWHZ);
654 }
655 
656 /*
657  * Map interface name to
658  * interface structure pointer.
659  */
660 struct ifnet *
661 ifunit(char *name)
662 {
663 	char namebuf[IFNAMSIZ + 1];
664 	char *cp;
665 	struct ifnet *ifp;
666 	int unit;
667 	unsigned len, m;
668 	char c;
669 
670 	len = strlen(name);
671 	if (len < 2 || len > IFNAMSIZ)
672 		return NULL;
673 	cp = name + len - 1;
674 	c = *cp;
675 	if (c < '0' || c > '9')
676 		return NULL;		/* trailing garbage */
677 	unit = 0;
678 	m = 1;
679 	do {
680 		if (cp == name)
681 			return NULL;	/* no interface name */
682 		unit += (c - '0') * m;
683 		if (unit > 1000000)
684 			return NULL;	/* number is unreasonable */
685 		m *= 10;
686 		c = *--cp;
687 	} while (c >= '0' && c <= '9');
688 	len = cp - name + 1;
689 	bcopy(name, namebuf, len);
690 	namebuf[len] = '\0';
691 	/*
692 	 * Now search all the interfaces for this name/number
693 	 */
694 	for (ifp = ifnet.tqh_first; ifp; ifp = ifp->if_link.tqe_next) {
695 		if (strcmp(ifp->if_name, namebuf))
696 			continue;
697 		if (unit == ifp->if_unit)
698 			break;
699 	}
700 	return (ifp);
701 }
702 
703 
704 /*
705  * Map interface name in a sockaddr_dl to
706  * interface structure pointer.
707  */
708 struct ifnet *
709 if_withname(sa)
710 	struct sockaddr *sa;
711 {
712 	char ifname[IFNAMSIZ+1];
713 	struct sockaddr_dl *sdl = (struct sockaddr_dl *)sa;
714 
715 	if ( (sa->sa_family != AF_LINK) || (sdl->sdl_nlen == 0) ||
716 	     (sdl->sdl_nlen > IFNAMSIZ) )
717 		return NULL;
718 
719 	/*
720 	 * ifunit wants a null-terminated name.  It may not be null-terminated
721 	 * in the sockaddr.  We don't want to change the caller's sockaddr,
722 	 * and there might not be room to put the trailing null anyway, so we
723 	 * make a local copy that we know we can null terminate safely.
724 	 */
725 
726 	bcopy(sdl->sdl_data, ifname, sdl->sdl_nlen);
727 	ifname[sdl->sdl_nlen] = '\0';
728 	return ifunit(ifname);
729 }
730 
731 
732 /*
733  * Interface ioctls.
734  */
735 int
736 ifioctl(so, cmd, data, p)
737 	struct socket *so;
738 	u_long cmd;
739 	caddr_t data;
740 	struct proc *p;
741 {
742 	register struct ifnet *ifp;
743 	register struct ifreq *ifr;
744 	struct ifstat *ifs;
745 	int error;
746 	short oif_flags;
747 
748 	switch (cmd) {
749 
750 	case SIOCGIFCONF:
751 	case OSIOCGIFCONF:
752 		return (ifconf(cmd, data));
753 	}
754 	ifr = (struct ifreq *)data;
755 	ifp = ifunit(ifr->ifr_name);
756 	if (ifp == 0)
757 		return (ENXIO);
758 	switch (cmd) {
759 
760 	case SIOCGIFFLAGS:
761 		ifr->ifr_flags = ifp->if_flags;
762 		break;
763 
764 	case SIOCGIFMETRIC:
765 		ifr->ifr_metric = ifp->if_metric;
766 		break;
767 
768 	case SIOCGIFMTU:
769 		ifr->ifr_mtu = ifp->if_mtu;
770 		break;
771 
772 	case SIOCGIFPHYS:
773 		ifr->ifr_phys = ifp->if_physical;
774 		break;
775 
776 	case SIOCSIFFLAGS:
777 		error = suser(p);
778 		if (error)
779 			return (error);
780 		ifr->ifr_prevflags = ifp->if_flags;
781 		if (ifp->if_flags & IFF_SMART) {
782 			/* Smart drivers twiddle their own routes */
783 		} else if (ifp->if_flags & IFF_UP &&
784 		    (ifr->ifr_flags & IFF_UP) == 0) {
785 			int s = splimp();
786 			if_down(ifp);
787 			splx(s);
788 		} else if (ifr->ifr_flags & IFF_UP &&
789 		    (ifp->if_flags & IFF_UP) == 0) {
790 			int s = splimp();
791 			if_up(ifp);
792 			splx(s);
793 		}
794 		ifp->if_flags = (ifp->if_flags & IFF_CANTCHANGE) |
795 			(ifr->ifr_flags &~ IFF_CANTCHANGE);
796 		if (ifp->if_ioctl)
797 			(void) (*ifp->if_ioctl)(ifp, cmd, data);
798 		getmicrotime(&ifp->if_lastchange);
799 		break;
800 
801 	case SIOCSIFMETRIC:
802 		error = suser(p);
803 		if (error)
804 			return (error);
805 		ifp->if_metric = ifr->ifr_metric;
806 		getmicrotime(&ifp->if_lastchange);
807 		break;
808 
809 	case SIOCSIFPHYS:
810 		error = suser(p);
811 		if (error)
812 			return error;
813 		if (!ifp->if_ioctl)
814 		        return EOPNOTSUPP;
815 		error = (*ifp->if_ioctl)(ifp, cmd, data);
816 		if (error == 0)
817 			getmicrotime(&ifp->if_lastchange);
818 		return(error);
819 
820 	case SIOCSIFMTU:
821 	{
822 		u_long oldmtu = ifp->if_mtu;
823 
824 		error = suser(p);
825 		if (error)
826 			return (error);
827 		if (ifp->if_ioctl == NULL)
828 			return (EOPNOTSUPP);
829 		if (ifr->ifr_mtu < IF_MINMTU || ifr->ifr_mtu > IF_MAXMTU)
830 			return (EINVAL);
831 		error = (*ifp->if_ioctl)(ifp, cmd, data);
832 		if (error == 0)
833 			getmicrotime(&ifp->if_lastchange);
834 		/*
835 		 * If the link MTU changed, do network layer specific procedure.
836 		 */
837 		if (ifp->if_mtu != oldmtu) {
838 #ifdef INET6
839 			nd6_setmtu(ifp);
840 #endif
841 		}
842 		return (error);
843 	}
844 
845 	case SIOCADDMULTI:
846 	case SIOCDELMULTI:
847 		error = suser(p);
848 		if (error)
849 			return (error);
850 
851 		/* Don't allow group membership on non-multicast interfaces. */
852 		if ((ifp->if_flags & IFF_MULTICAST) == 0)
853 			return EOPNOTSUPP;
854 
855 		/* Don't let users screw up protocols' entries. */
856 		if (ifr->ifr_addr.sa_family != AF_LINK)
857 			return EINVAL;
858 
859 		if (cmd == SIOCADDMULTI) {
860 			struct ifmultiaddr *ifma;
861 			error = if_addmulti(ifp, &ifr->ifr_addr, &ifma);
862 		} else {
863 			error = if_delmulti(ifp, &ifr->ifr_addr);
864 		}
865 		if (error == 0)
866 			getmicrotime(&ifp->if_lastchange);
867 		return error;
868 
869         case SIOCSIFMEDIA:
870 	case SIOCSIFGENERIC:
871 		error = suser(p);
872 		if (error)
873 			return (error);
874 		if (ifp->if_ioctl == 0)
875 			return (EOPNOTSUPP);
876 		error = (*ifp->if_ioctl)(ifp, cmd, data);
877 		if (error == 0)
878 			getmicrotime(&ifp->if_lastchange);
879 		return error;
880 
881 	case SIOCGIFSTATUS:
882 		ifs = (struct ifstat *)data;
883 		ifs->ascii[0] = '\0';
884 
885 	case SIOCGIFMEDIA:
886 	case SIOCGIFGENERIC:
887 		if (ifp->if_ioctl == 0)
888 			return (EOPNOTSUPP);
889 		return ((*ifp->if_ioctl)(ifp, cmd, data));
890 
891 	default:
892 		oif_flags = ifp->if_flags;
893 		if (so->so_proto == 0)
894 			return (EOPNOTSUPP);
895 #ifndef COMPAT_43
896 		error = ((*so->so_proto->pr_usrreqs->pru_control)(so, cmd,
897 								 data,
898 								 ifp, p));
899 #else
900 	    {
901 		int ocmd = cmd;
902 
903 		switch (cmd) {
904 
905 		case SIOCSIFDSTADDR:
906 		case SIOCSIFADDR:
907 		case SIOCSIFBRDADDR:
908 		case SIOCSIFNETMASK:
909 #if BYTE_ORDER != BIG_ENDIAN
910 			if (ifr->ifr_addr.sa_family == 0 &&
911 			    ifr->ifr_addr.sa_len < 16) {
912 				ifr->ifr_addr.sa_family = ifr->ifr_addr.sa_len;
913 				ifr->ifr_addr.sa_len = 16;
914 			}
915 #else
916 			if (ifr->ifr_addr.sa_len == 0)
917 				ifr->ifr_addr.sa_len = 16;
918 #endif
919 			break;
920 
921 		case OSIOCGIFADDR:
922 			cmd = SIOCGIFADDR;
923 			break;
924 
925 		case OSIOCGIFDSTADDR:
926 			cmd = SIOCGIFDSTADDR;
927 			break;
928 
929 		case OSIOCGIFBRDADDR:
930 			cmd = SIOCGIFBRDADDR;
931 			break;
932 
933 		case OSIOCGIFNETMASK:
934 			cmd = SIOCGIFNETMASK;
935 		}
936 		error =  ((*so->so_proto->pr_usrreqs->pru_control)(so,
937 								   cmd,
938 								   data,
939 								   ifp, p));
940 		switch (ocmd) {
941 
942 		case OSIOCGIFADDR:
943 		case OSIOCGIFDSTADDR:
944 		case OSIOCGIFBRDADDR:
945 		case OSIOCGIFNETMASK:
946 			*(u_short *)&ifr->ifr_addr = ifr->ifr_addr.sa_family;
947 
948 		}
949 	    }
950 #endif /* COMPAT_43 */
951 
952 		if ((oif_flags ^ ifp->if_flags) & IFF_UP) {
953 #ifdef INET6
954 			if (ifp->if_flags & IFF_UP) {
955 				int s = splimp();
956 				in6_if_up(ifp);
957 				splx(s);
958 			}
959 #endif
960 		}
961 		return (error);
962 
963 	}
964 	return (0);
965 }
966 
967 /*
968  * Set/clear promiscuous mode on interface ifp based on the truth value
969  * of pswitch.  The calls are reference counted so that only the first
970  * "on" request actually has an effect, as does the final "off" request.
971  * Results are undefined if the "off" and "on" requests are not matched.
972  */
973 int
974 ifpromisc(ifp, pswitch)
975 	struct ifnet *ifp;
976 	int pswitch;
977 {
978 	struct ifreq ifr;
979 	int error;
980 
981 	if (pswitch) {
982 		/*
983 		 * If the device is not configured up, we cannot put it in
984 		 * promiscuous mode.
985 		 */
986 		if ((ifp->if_flags & IFF_UP) == 0)
987 			return (ENETDOWN);
988 		if (ifp->if_pcount++ != 0)
989 			return (0);
990 		ifp->if_flags |= IFF_PROMISC;
991 		log(LOG_INFO, "%s%d: promiscuous mode enabled\n",
992 		    ifp->if_name, ifp->if_unit);
993 	} else {
994 		if (--ifp->if_pcount > 0)
995 			return (0);
996 		ifp->if_flags &= ~IFF_PROMISC;
997 		log(LOG_INFO, "%s%d: promiscuous mode disabled\n",
998 		    ifp->if_name, ifp->if_unit);
999 	}
1000 	ifr.ifr_flags = ifp->if_flags;
1001 	error = (*ifp->if_ioctl)(ifp, SIOCSIFFLAGS, (caddr_t)&ifr);
1002 	if (error == 0)
1003 		rt_ifmsg(ifp);
1004 	return error;
1005 }
1006 
1007 /*
1008  * Return interface configuration
1009  * of system.  List may be used
1010  * in later ioctl's (above) to get
1011  * other information.
1012  */
1013 /*ARGSUSED*/
1014 static int
1015 ifconf(cmd, data)
1016 	u_long cmd;
1017 	caddr_t data;
1018 {
1019 	register struct ifconf *ifc = (struct ifconf *)data;
1020 	register struct ifnet *ifp = ifnet.tqh_first;
1021 	register struct ifaddr *ifa;
1022 	struct ifreq ifr, *ifrp;
1023 	int space = ifc->ifc_len, error = 0;
1024 
1025 	ifrp = ifc->ifc_req;
1026 	for (; space > sizeof (ifr) && ifp; ifp = ifp->if_link.tqe_next) {
1027 		char workbuf[64];
1028 		int ifnlen, addrs;
1029 
1030 		ifnlen = snprintf(workbuf, sizeof(workbuf),
1031 		    "%s%d", ifp->if_name, ifp->if_unit);
1032 		if(ifnlen + 1 > sizeof ifr.ifr_name) {
1033 			error = ENAMETOOLONG;
1034 		} else {
1035 			strcpy(ifr.ifr_name, workbuf);
1036 		}
1037 
1038 		addrs = 0;
1039 		ifa = ifp->if_addrhead.tqh_first;
1040 		for ( ; space > sizeof (ifr) && ifa;
1041 		    ifa = ifa->ifa_link.tqe_next) {
1042 			register struct sockaddr *sa = ifa->ifa_addr;
1043 			if (curproc->p_prison && prison_if(curproc, sa))
1044 				continue;
1045 			addrs++;
1046 #ifdef COMPAT_43
1047 			if (cmd == OSIOCGIFCONF) {
1048 				struct osockaddr *osa =
1049 					 (struct osockaddr *)&ifr.ifr_addr;
1050 				ifr.ifr_addr = *sa;
1051 				osa->sa_family = sa->sa_family;
1052 				error = copyout((caddr_t)&ifr, (caddr_t)ifrp,
1053 						sizeof (ifr));
1054 				ifrp++;
1055 			} else
1056 #endif
1057 			if (sa->sa_len <= sizeof(*sa)) {
1058 				ifr.ifr_addr = *sa;
1059 				error = copyout((caddr_t)&ifr, (caddr_t)ifrp,
1060 						sizeof (ifr));
1061 				ifrp++;
1062 			} else {
1063 				space -= sa->sa_len - sizeof(*sa);
1064 				if (space < sizeof (ifr))
1065 					break;
1066 				error = copyout((caddr_t)&ifr, (caddr_t)ifrp,
1067 						sizeof (ifr.ifr_name));
1068 				if (error == 0)
1069 				    error = copyout((caddr_t)sa,
1070 				      (caddr_t)&ifrp->ifr_addr, sa->sa_len);
1071 				ifrp = (struct ifreq *)
1072 					(sa->sa_len + (caddr_t)&ifrp->ifr_addr);
1073 			}
1074 			if (error)
1075 				break;
1076 			space -= sizeof (ifr);
1077 		}
1078 		if (!addrs) {
1079 			bzero((caddr_t)&ifr.ifr_addr, sizeof(ifr.ifr_addr));
1080 			error = copyout((caddr_t)&ifr, (caddr_t)ifrp,
1081 			    sizeof (ifr));
1082 			if (error)
1083 				break;
1084 			space -= sizeof (ifr), ifrp++;
1085 		}
1086 	}
1087 	ifc->ifc_len -= space;
1088 	return (error);
1089 }
1090 
1091 /*
1092  * Just like if_promisc(), but for all-multicast-reception mode.
1093  */
1094 int
1095 if_allmulti(ifp, onswitch)
1096 	struct ifnet *ifp;
1097 	int onswitch;
1098 {
1099 	int error = 0;
1100 	int s = splimp();
1101 
1102 	if (onswitch) {
1103 		if (ifp->if_amcount++ == 0) {
1104 			ifp->if_flags |= IFF_ALLMULTI;
1105 			error = ifp->if_ioctl(ifp, SIOCSIFFLAGS, 0);
1106 		}
1107 	} else {
1108 		if (ifp->if_amcount > 1) {
1109 			ifp->if_amcount--;
1110 		} else {
1111 			ifp->if_amcount = 0;
1112 			ifp->if_flags &= ~IFF_ALLMULTI;
1113 			error = ifp->if_ioctl(ifp, SIOCSIFFLAGS, 0);
1114 		}
1115 	}
1116 	splx(s);
1117 
1118 	if (error == 0)
1119 		rt_ifmsg(ifp);
1120 	return error;
1121 }
1122 
1123 /*
1124  * Add a multicast listenership to the interface in question.
1125  * The link layer provides a routine which converts
1126  */
1127 int
1128 if_addmulti(ifp, sa, retifma)
1129 	struct ifnet *ifp;	/* interface to manipulate */
1130 	struct sockaddr *sa;	/* address to add */
1131 	struct ifmultiaddr **retifma;
1132 {
1133 	struct sockaddr *llsa, *dupsa;
1134 	int error, s;
1135 	struct ifmultiaddr *ifma;
1136 
1137 	/*
1138 	 * If the matching multicast address already exists
1139 	 * then don't add a new one, just add a reference
1140 	 */
1141 	for (ifma = ifp->if_multiaddrs.lh_first; ifma;
1142 	     ifma = ifma->ifma_link.le_next) {
1143 		if (equal(sa, ifma->ifma_addr)) {
1144 			ifma->ifma_refcount++;
1145 			if (retifma)
1146 				*retifma = ifma;
1147 			return 0;
1148 		}
1149 	}
1150 
1151 	/*
1152 	 * Give the link layer a chance to accept/reject it, and also
1153 	 * find out which AF_LINK address this maps to, if it isn't one
1154 	 * already.
1155 	 */
1156 	if (ifp->if_resolvemulti) {
1157 		error = ifp->if_resolvemulti(ifp, &llsa, sa);
1158 		if (error) return error;
1159 	} else {
1160 		llsa = 0;
1161 	}
1162 
1163 	MALLOC(ifma, struct ifmultiaddr *, sizeof *ifma, M_IFMADDR, M_WAITOK);
1164 	MALLOC(dupsa, struct sockaddr *, sa->sa_len, M_IFMADDR, M_WAITOK);
1165 	bcopy(sa, dupsa, sa->sa_len);
1166 
1167 	ifma->ifma_addr = dupsa;
1168 	ifma->ifma_lladdr = llsa;
1169 	ifma->ifma_ifp = ifp;
1170 	ifma->ifma_refcount = 1;
1171 	ifma->ifma_protospec = 0;
1172 	rt_newmaddrmsg(RTM_NEWMADDR, ifma);
1173 
1174 	/*
1175 	 * Some network interfaces can scan the address list at
1176 	 * interrupt time; lock them out.
1177 	 */
1178 	s = splimp();
1179 	LIST_INSERT_HEAD(&ifp->if_multiaddrs, ifma, ifma_link);
1180 	splx(s);
1181 	*retifma = ifma;
1182 
1183 	if (llsa != 0) {
1184 		for (ifma = ifp->if_multiaddrs.lh_first; ifma;
1185 		     ifma = ifma->ifma_link.le_next) {
1186 			if (equal(ifma->ifma_addr, llsa))
1187 				break;
1188 		}
1189 		if (ifma) {
1190 			ifma->ifma_refcount++;
1191 		} else {
1192 			MALLOC(ifma, struct ifmultiaddr *, sizeof *ifma,
1193 			       M_IFMADDR, M_WAITOK);
1194 			MALLOC(dupsa, struct sockaddr *, llsa->sa_len,
1195 			       M_IFMADDR, M_WAITOK);
1196 			bcopy(llsa, dupsa, llsa->sa_len);
1197 			ifma->ifma_addr = dupsa;
1198 			ifma->ifma_ifp = ifp;
1199 			ifma->ifma_refcount = 1;
1200 			s = splimp();
1201 			LIST_INSERT_HEAD(&ifp->if_multiaddrs, ifma, ifma_link);
1202 			splx(s);
1203 		}
1204 	}
1205 	/*
1206 	 * We are certain we have added something, so call down to the
1207 	 * interface to let them know about it.
1208 	 */
1209 	s = splimp();
1210 	ifp->if_ioctl(ifp, SIOCADDMULTI, 0);
1211 	splx(s);
1212 
1213 	return 0;
1214 }
1215 
1216 /*
1217  * Remove a reference to a multicast address on this interface.  Yell
1218  * if the request does not match an existing membership.
1219  */
1220 int
1221 if_delmulti(ifp, sa)
1222 	struct ifnet *ifp;
1223 	struct sockaddr *sa;
1224 {
1225 	struct ifmultiaddr *ifma;
1226 	int s;
1227 
1228 	for (ifma = ifp->if_multiaddrs.lh_first; ifma;
1229 	     ifma = ifma->ifma_link.le_next)
1230 		if (equal(sa, ifma->ifma_addr))
1231 			break;
1232 	if (ifma == 0)
1233 		return ENOENT;
1234 
1235 	if (ifma->ifma_refcount > 1) {
1236 		ifma->ifma_refcount--;
1237 		return 0;
1238 	}
1239 
1240 	rt_newmaddrmsg(RTM_DELMADDR, ifma);
1241 	sa = ifma->ifma_lladdr;
1242 	s = splimp();
1243 	LIST_REMOVE(ifma, ifma_link);
1244 	splx(s);
1245 	free(ifma->ifma_addr, M_IFMADDR);
1246 	free(ifma, M_IFMADDR);
1247 	if (sa == 0)
1248 		return 0;
1249 
1250 	/*
1251 	 * Now look for the link-layer address which corresponds to
1252 	 * this network address.  It had been squirreled away in
1253 	 * ifma->ifma_lladdr for this purpose (so we don't have
1254 	 * to call ifp->if_resolvemulti() again), and we saved that
1255 	 * value in sa above.  If some nasty deleted the
1256 	 * link-layer address out from underneath us, we can deal because
1257 	 * the address we stored was is not the same as the one which was
1258 	 * in the record for the link-layer address.  (So we don't complain
1259 	 * in that case.)
1260 	 */
1261 	for (ifma = ifp->if_multiaddrs.lh_first; ifma;
1262 	     ifma = ifma->ifma_link.le_next)
1263 		if (equal(sa, ifma->ifma_addr))
1264 			break;
1265 	if (ifma == 0)
1266 		return 0;
1267 
1268 	if (ifma->ifma_refcount > 1) {
1269 		ifma->ifma_refcount--;
1270 		return 0;
1271 	}
1272 
1273 	s = splimp();
1274 	LIST_REMOVE(ifma, ifma_link);
1275 	ifp->if_ioctl(ifp, SIOCDELMULTI, 0);
1276 	splx(s);
1277 	free(ifma->ifma_addr, M_IFMADDR);
1278 	free(sa, M_IFMADDR);
1279 	free(ifma, M_IFMADDR);
1280 
1281 	return 0;
1282 }
1283 
1284 struct ifmultiaddr *
1285 ifmaof_ifpforaddr(sa, ifp)
1286 	struct sockaddr *sa;
1287 	struct ifnet *ifp;
1288 {
1289 	struct ifmultiaddr *ifma;
1290 
1291 	for (ifma = ifp->if_multiaddrs.lh_first; ifma;
1292 	     ifma = ifma->ifma_link.le_next)
1293 		if (equal(ifma->ifma_addr, sa))
1294 			break;
1295 
1296 	return ifma;
1297 }
1298 
1299 SYSCTL_NODE(_net, PF_LINK, link, CTLFLAG_RW, 0, "Link layers");
1300 SYSCTL_NODE(_net_link, 0, generic, CTLFLAG_RW, 0, "Generic link-management");
1301