xref: /freebsd/sys/net/if.c (revision af50ea380f6d56a33720eee1fd8b16e0766833c8)
1c398230bSWarner Losh /*-
2df8bae1dSRodney W. Grimes  * Copyright (c) 1980, 1986, 1993
3df8bae1dSRodney W. Grimes  *	The Regents of the University of California.  All rights reserved.
4df8bae1dSRodney W. Grimes  *
5df8bae1dSRodney W. Grimes  * Redistribution and use in source and binary forms, with or without
6df8bae1dSRodney W. Grimes  * modification, are permitted provided that the following conditions
7df8bae1dSRodney W. Grimes  * are met:
8df8bae1dSRodney W. Grimes  * 1. Redistributions of source code must retain the above copyright
9df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer.
10df8bae1dSRodney W. Grimes  * 2. Redistributions in binary form must reproduce the above copyright
11df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer in the
12df8bae1dSRodney W. Grimes  *    documentation and/or other materials provided with the distribution.
13df8bae1dSRodney W. Grimes  * 4. Neither the name of the University nor the names of its contributors
14df8bae1dSRodney W. Grimes  *    may be used to endorse or promote products derived from this software
15df8bae1dSRodney W. Grimes  *    without specific prior written permission.
16df8bae1dSRodney W. Grimes  *
17df8bae1dSRodney W. Grimes  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
18df8bae1dSRodney W. Grimes  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19df8bae1dSRodney W. Grimes  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20df8bae1dSRodney W. Grimes  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
21df8bae1dSRodney W. Grimes  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22df8bae1dSRodney W. Grimes  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23df8bae1dSRodney W. Grimes  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24df8bae1dSRodney W. Grimes  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25df8bae1dSRodney W. Grimes  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26df8bae1dSRodney W. Grimes  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27df8bae1dSRodney W. Grimes  * SUCH DAMAGE.
28df8bae1dSRodney W. Grimes  *
2966afbd68SRuslan Ermilov  *	@(#)if.c	8.5 (Berkeley) 1/9/95
30c3aac50fSPeter Wemm  * $FreeBSD$
31df8bae1dSRodney W. Grimes  */
32df8bae1dSRodney W. Grimes 
335591b823SEivind Eklund #include "opt_compat.h"
34cfa1ca9dSYoshinobu Inoue #include "opt_inet6.h"
350d0f9d1eSYoshinobu Inoue #include "opt_inet.h"
365591b823SEivind Eklund 
37df8bae1dSRodney W. Grimes #include <sys/param.h>
384dcf2bbbSBrooks Davis #include <sys/types.h>
39f13ad206SJonathan Lemon #include <sys/conf.h>
404d1d4912SBruce Evans #include <sys/malloc.h>
414dcf2bbbSBrooks Davis #include <sys/sbuf.h>
42d2b4566aSJonathan Lemon #include <sys/bus.h>
43df8bae1dSRodney W. Grimes #include <sys/mbuf.h>
44df8bae1dSRodney W. Grimes #include <sys/systm.h>
45acd3428bSRobert Watson #include <sys/priv.h>
46df8bae1dSRodney W. Grimes #include <sys/proc.h>
47df8bae1dSRodney W. Grimes #include <sys/socket.h>
48df8bae1dSRodney W. Grimes #include <sys/socketvar.h>
49df8bae1dSRodney W. Grimes #include <sys/protosw.h>
50df8bae1dSRodney W. Grimes #include <sys/kernel.h>
51653735c4SBjoern A. Zeeb #include <sys/lock.h>
5227d37320SRobert Watson #include <sys/refcount.h>
5321ca7b57SMarko Zec #include <sys/module.h>
54653735c4SBjoern A. Zeeb #include <sys/rwlock.h>
5551a53488SBruce Evans #include <sys/sockio.h>
56963e4c2aSGarrett Wollman #include <sys/syslog.h>
57602d513cSGarrett Wollman #include <sys/sysctl.h>
58af5e59bfSRobert Watson #include <sys/taskqueue.h>
5931b1bfe1SHajimu UMEMOTO #include <sys/domain.h>
6091421ba2SRobert Watson #include <sys/jail.h>
6135fd7bc0SBjoern A. Zeeb #include <sys/priv.h>
6235fd7bc0SBjoern A. Zeeb 
63fa882e87SBrooks Davis #include <machine/stdarg.h>
646e6b3f7cSQing Li #include <vm/uma.h>
65df8bae1dSRodney W. Grimes 
66df8bae1dSRodney W. Grimes #include <net/if.h>
675a97c9d4SBjoern A. Zeeb #include <net/if_arp.h>
68f889d2efSBrooks Davis #include <net/if_clone.h>
69df8bae1dSRodney W. Grimes #include <net/if_dl.h>
7066ce51ceSArchie Cobbs #include <net/if_types.h>
7130aad87dSBrooks Davis #include <net/if_var.h>
729448326fSPoul-Henning Kamp #include <net/radix.h>
735500d3beSWarner Losh #include <net/route.h>
744b79449eSBjoern A. Zeeb #include <net/vnet.h>
75df8bae1dSRodney W. Grimes 
760d0f9d1eSYoshinobu Inoue #if defined(INET) || defined(INET6)
7782cd038dSYoshinobu Inoue #include <netinet/in.h>
780d0f9d1eSYoshinobu Inoue #include <netinet/in_var.h>
793c914c54SAndre Oppermann #include <netinet/ip.h>
809963e8a5SWill Andrews #include <netinet/ip_carp.h>
813c914c54SAndre Oppermann #ifdef INET
823c914c54SAndre Oppermann #include <netinet/if_ether.h>
833c914c54SAndre Oppermann #endif /* INET */
843411310dSYoshinobu Inoue #ifdef INET6
85978ee2edSJun-ichiro itojun Hagino #include <netinet6/in6_var.h>
86978ee2edSJun-ichiro itojun Hagino #include <netinet6/in6_ifattach.h>
873c914c54SAndre Oppermann #endif /* INET6 */
883c914c54SAndre Oppermann #endif /* INET || INET6 */
8982cd038dSYoshinobu Inoue 
90aed55708SRobert Watson #include <security/mac/mac_framework.h>
91aed55708SRobert Watson 
929af74f3dSSergey Kandaurov #ifdef COMPAT_FREEBSD32
939af74f3dSSergey Kandaurov #include <sys/mount.h>
949af74f3dSSergey Kandaurov #include <compat/freebsd32/freebsd32.h>
959af74f3dSSergey Kandaurov #endif
969af74f3dSSergey Kandaurov 
976cb7f168SBrooks Davis struct ifindex_entry {
986cb7f168SBrooks Davis 	struct  ifnet *ife_ifnet;
996cb7f168SBrooks Davis };
1006cb7f168SBrooks Davis 
1015515c2e7SGleb Smirnoff SYSCTL_NODE(_net, PF_LINK, link, CTLFLAG_RW, 0, "Link layers");
1025515c2e7SGleb Smirnoff SYSCTL_NODE(_net_link, 0, generic, CTLFLAG_RW, 0, "Generic link-management");
1035515c2e7SGleb Smirnoff 
104e50d35e6SMaxim Sobolev TUNABLE_INT("net.link.ifqmaxlen", &ifqmaxlen);
105f88910cdSMatthew D Fleming SYSCTL_INT(_net_link, OID_AUTO, ifqmaxlen, CTLFLAG_RDTUN,
106e50d35e6SMaxim Sobolev     &ifqmaxlen, 0, "max send queue size");
107e50d35e6SMaxim Sobolev 
1085515c2e7SGleb Smirnoff /* Log link state change events */
1095515c2e7SGleb Smirnoff static int log_link_state_change = 1;
1105515c2e7SGleb Smirnoff 
1115515c2e7SGleb Smirnoff SYSCTL_INT(_net_link, OID_AUTO, log_link_state_change, CTLFLAG_RW,
1125515c2e7SGleb Smirnoff 	&log_link_state_change, 0,
1135515c2e7SGleb Smirnoff 	"log interface link state change events");
1145515c2e7SGleb Smirnoff 
115215940b3SXin LI /* Interface description */
116215940b3SXin LI static unsigned int ifdescr_maxlen = 1024;
117215940b3SXin LI SYSCTL_UINT(_net, OID_AUTO, ifdescr_maxlen, CTLFLAG_RW,
118215940b3SXin LI 	&ifdescr_maxlen, 0,
119215940b3SXin LI 	"administrative maximum length for interface description");
120215940b3SXin LI 
121d745c852SEd Schouten static MALLOC_DEFINE(M_IFDESCR, "ifdescr", "ifnet descriptions");
122215940b3SXin LI 
123215940b3SXin LI /* global sx for non-critical path ifdescr */
124215940b3SXin LI static struct sx ifdescr_sx;
125215940b3SXin LI SX_SYSINIT(ifdescr_sx, &ifdescr_sx, "ifnet descr");
126215940b3SXin LI 
1277702d401SAndrew Thompson void	(*bridge_linkstate_p)(struct ifnet *ifp);
1281c7899c7SGleb Smirnoff void	(*ng_ether_link_state_p)(struct ifnet *ifp, int state);
12918242d3bSAndrew Thompson void	(*lagg_linkstate_p)(struct ifnet *ifp, int state);
1309963e8a5SWill Andrews /* These are external hooks for CARP. */
13154bfbd51SWill Andrews void	(*carp_linkstate_p)(struct ifnet *ifp);
132f08535f8SGleb Smirnoff void	(*carp_demote_adj_p)(int, char *);
13324421c1cSGleb Smirnoff int	(*carp_master_p)(struct ifaddr *);
1349963e8a5SWill Andrews #if defined(INET) || defined(INET6)
13508b68b0eSGleb Smirnoff int	(*carp_forus_p)(struct ifnet *ifp, u_char *dhost);
1369963e8a5SWill Andrews int	(*carp_output_p)(struct ifnet *ifp, struct mbuf *m,
13747e8d432SGleb Smirnoff     const struct sockaddr *sa);
13808b68b0eSGleb Smirnoff int	(*carp_ioctl_p)(struct ifreq *, u_long, struct thread *);
13908b68b0eSGleb Smirnoff int	(*carp_attach_p)(struct ifaddr *, int);
14008b68b0eSGleb Smirnoff void	(*carp_detach_p)(struct ifaddr *);
1419963e8a5SWill Andrews #endif
1429963e8a5SWill Andrews #ifdef INET
14308b68b0eSGleb Smirnoff int	(*carp_iamatch_p)(struct ifaddr *, uint8_t **);
1449963e8a5SWill Andrews #endif
1459963e8a5SWill Andrews #ifdef INET6
1469963e8a5SWill Andrews struct ifaddr *(*carp_iamatch6_p)(struct ifnet *ifp, struct in6_addr *taddr6);
1479963e8a5SWill Andrews caddr_t	(*carp_macmatch6_p)(struct ifnet *ifp, struct mbuf *m,
1489963e8a5SWill Andrews     const struct in6_addr *taddr);
1499963e8a5SWill Andrews #endif
1501c7899c7SGleb Smirnoff 
1514cb655c0SMax Laier struct mbuf *(*tbr_dequeue_ptr)(struct ifaltq *, int) = NULL;
1524cb655c0SMax Laier 
153ec002feeSBruce M Simpson /*
154ec002feeSBruce M Simpson  * XXX: Style; these should be sorted alphabetically, and unprototyped
155ec002feeSBruce M Simpson  * static functions should be prototyped. Currently they are sorted by
156ec002feeSBruce M Simpson  * declaration order.
157ec002feeSBruce M Simpson  */
15831b1bfe1SHajimu UMEMOTO static void	if_attachdomain(void *);
15931b1bfe1SHajimu UMEMOTO static void	if_attachdomain1(struct ifnet *);
1600b59d917SJonathan Lemon static int	ifconf(u_long, caddr_t);
161ec002feeSBruce M Simpson static void	if_freemulti(struct ifmultiaddr *);
162f9132cebSJonathan Lemon static void	if_init(void *);
1638e937462SRobert Watson static void	if_grow(void);
1648614fb12SMax Laier static void	if_route(struct ifnet *, int flag, int fam);
1651a3b6859SYaroslav Tykhiy static int	if_setflag(struct ifnet *, int, int, int *, int);
166db7f0b97SKip Macy static int	if_transmit(struct ifnet *ifp, struct mbuf *m);
1678614fb12SMax Laier static void	if_unroute(struct ifnet *, int flag, int fam);
1688071913dSRuslan Ermilov static void	link_rtrequest(int, struct rtentry *, struct rt_addrinfo *);
1690b59d917SJonathan Lemon static int	if_rtdel(struct radix_node *, void *);
170f13ad206SJonathan Lemon static int	ifhwioctl(u_long, struct ifnet *, caddr_t, struct thread *);
171ec002feeSBruce M Simpson static int	if_delmulti_locked(struct ifnet *, struct ifmultiaddr *, int);
17268a3482fSGleb Smirnoff static void	do_link_state_change(void *, int);
1730dad3f0eSMax Laier static int	if_getgroup(struct ifgroupreq *, struct ifnet *);
1740dad3f0eSMax Laier static int	if_getgroupmembers(struct ifgroupreq *);
1758623f9fdSMax Laier static void	if_delgroups(struct ifnet *);
176e0c14af9SMarko Zec static void	if_attach_internal(struct ifnet *, int);
177e0c14af9SMarko Zec static void	if_detach_internal(struct ifnet *, int);
178db7f0b97SKip Macy 
17982cd038dSYoshinobu Inoue #ifdef INET6
/*
 * XXX: declared here to avoid including many inet6-related files;
 * should this be more generalized?
 */
184929ddbbbSAlfred Perlstein extern void	nd6_setmtu(struct ifnet *);
18582cd038dSYoshinobu Inoue #endif
18682cd038dSYoshinobu Inoue 
18782cea7e6SBjoern A. Zeeb VNET_DEFINE(int, if_index);
18882cea7e6SBjoern A. Zeeb int	ifqmaxlen = IFQ_MAXLEN;
189eddfbb76SRobert Watson VNET_DEFINE(struct ifnethead, ifnet);	/* depend on static init XXX */
190eddfbb76SRobert Watson VNET_DEFINE(struct ifgrouphead, ifg_head);
19182cea7e6SBjoern A. Zeeb 
1923e288e62SDimitry Andric static VNET_DEFINE(int, if_indexlim) = 8;
193eddfbb76SRobert Watson 
19477dfcdc4SRobert Watson /* Table of ifnet by index. */
195a38de013SBjoern A. Zeeb VNET_DEFINE(struct ifindex_entry *, ifindex_table);
196eddfbb76SRobert Watson 
1971e77c105SRobert Watson #define	V_if_indexlim		VNET(if_indexlim)
1981e77c105SRobert Watson #define	V_ifindex_table		VNET(ifindex_table)
19944e33a07SMarko Zec 
/*
 * The global network interface list (V_ifnet) and related state (such as
 * if_index, if_indexlim, and ifindex_table) are protected by an sxlock and
 * an rwlock.  Either may be acquired shared to stabilize the list, but both
 * must be acquired writable to modify the list.  This model allows us to
 * stabilize the interface list during interrupt thread processing, and also
 * to stabilize it over long-running ioctls, without introducing priority
 * inversions and deadlocks.
 */
209f89d4c3aSAndre Oppermann struct rwlock ifnet_rwlock;
21077dfcdc4SRobert Watson struct sx ifnet_sxlock;
21177dfcdc4SRobert Watson 
/*
 * The allocation of network interfaces is a rather non-atomic affair; we
 * need to select an index before we are ready to expose the interface for
 * use, so will use this pointer value to indicate reservation.
 *
 * The expansion is wrapped in parentheses so that it behaves as a single
 * primary expression wherever it is used (e.g. as the operand of sizeof
 * or next to a postfix operator).
 */
#define	IFNET_HOLD	((void *)(uintptr_t)(-1))
218ed2dabfcSRobert Watson 
219fc74a9f9SBrooks Davis static	if_com_alloc_t *if_com_alloc[256];
220fc74a9f9SBrooks Davis static	if_com_free_t *if_com_free[256];
2210b59d917SJonathan Lemon 
222d745c852SEd Schouten static MALLOC_DEFINE(M_IFNET, "ifnet", "interface internals");
2230b59d917SJonathan Lemon MALLOC_DEFINE(M_IFADDR, "ifaddr", "interface address");
2240b59d917SJonathan Lemon MALLOC_DEFINE(M_IFMADDR, "ether_multi", "link-level multicast address");
22530aad87dSBrooks Davis 
22621ca7b57SMarko Zec struct ifnet *
227d24c444cSKip Macy ifnet_byindex_locked(u_short idx)
22802f4879dSRobert Watson {
22902f4879dSRobert Watson 
23027d37320SRobert Watson 	if (idx > V_if_index)
23127d37320SRobert Watson 		return (NULL);
232ed2dabfcSRobert Watson 	if (V_ifindex_table[idx].ife_ifnet == IFNET_HOLD)
233ed2dabfcSRobert Watson 		return (NULL);
23427d37320SRobert Watson 	return (V_ifindex_table[idx].ife_ifnet);
235d24c444cSKip Macy }
236d24c444cSKip Macy 
237d24c444cSKip Macy struct ifnet *
238d24c444cSKip Macy ifnet_byindex(u_short idx)
239d24c444cSKip Macy {
240d24c444cSKip Macy 	struct ifnet *ifp;
241d24c444cSKip Macy 
24277dfcdc4SRobert Watson 	IFNET_RLOCK_NOSLEEP();
243d24c444cSKip Macy 	ifp = ifnet_byindex_locked(idx);
24477dfcdc4SRobert Watson 	IFNET_RUNLOCK_NOSLEEP();
24502f4879dSRobert Watson 	return (ifp);
24602f4879dSRobert Watson }
24702f4879dSRobert Watson 
24827d37320SRobert Watson struct ifnet *
24927d37320SRobert Watson ifnet_byindex_ref(u_short idx)
25027d37320SRobert Watson {
25127d37320SRobert Watson 	struct ifnet *ifp;
25227d37320SRobert Watson 
25377dfcdc4SRobert Watson 	IFNET_RLOCK_NOSLEEP();
25427d37320SRobert Watson 	ifp = ifnet_byindex_locked(idx);
255242a8e72SRobert Watson 	if (ifp == NULL || (ifp->if_flags & IFF_DYING)) {
25677dfcdc4SRobert Watson 		IFNET_RUNLOCK_NOSLEEP();
25727d37320SRobert Watson 		return (NULL);
25827d37320SRobert Watson 	}
25927d37320SRobert Watson 	if_ref(ifp);
26077dfcdc4SRobert Watson 	IFNET_RUNLOCK_NOSLEEP();
26127d37320SRobert Watson 	return (ifp);
26227d37320SRobert Watson }
26327d37320SRobert Watson 
26461f6986bSRobert Watson /*
26561f6986bSRobert Watson  * Allocate an ifindex array entry; return 0 on success or an error on
26661f6986bSRobert Watson  * failure.
26761f6986bSRobert Watson  */
26861f6986bSRobert Watson static int
269ed2dabfcSRobert Watson ifindex_alloc_locked(u_short *idxp)
27061f6986bSRobert Watson {
27161f6986bSRobert Watson 	u_short idx;
27261f6986bSRobert Watson 
27361f6986bSRobert Watson 	IFNET_WLOCK_ASSERT();
27461f6986bSRobert Watson 
2755f3b301aSJohn Baldwin retry:
27661f6986bSRobert Watson 	/*
277ed2dabfcSRobert Watson 	 * Try to find an empty slot below V_if_index.  If we fail, take the
27861f6986bSRobert Watson 	 * next slot.
27961f6986bSRobert Watson 	 */
28061f6986bSRobert Watson 	for (idx = 1; idx <= V_if_index; idx++) {
281ed2dabfcSRobert Watson 		if (V_ifindex_table[idx].ife_ifnet == NULL)
28261f6986bSRobert Watson 			break;
28361f6986bSRobert Watson 	}
28461f6986bSRobert Watson 
28561f6986bSRobert Watson 	/* Catch if_index overflow. */
28661f6986bSRobert Watson 	if (idx < 1)
28761f6986bSRobert Watson 		return (ENOSPC);
2885f3b301aSJohn Baldwin 	if (idx >= V_if_indexlim) {
2895f3b301aSJohn Baldwin 		if_grow();
2905f3b301aSJohn Baldwin 		goto retry;
2915f3b301aSJohn Baldwin 	}
29261f6986bSRobert Watson 	if (idx > V_if_index)
29361f6986bSRobert Watson 		V_if_index = idx;
29461f6986bSRobert Watson 	*idxp = idx;
29561f6986bSRobert Watson 	return (0);
29661f6986bSRobert Watson }
29761f6986bSRobert Watson 
298e0c14af9SMarko Zec static void
299ed2dabfcSRobert Watson ifindex_free_locked(u_short idx)
300ed2dabfcSRobert Watson {
301ed2dabfcSRobert Watson 
302ed2dabfcSRobert Watson 	IFNET_WLOCK_ASSERT();
303ed2dabfcSRobert Watson 
304ed2dabfcSRobert Watson 	V_ifindex_table[idx].ife_ifnet = NULL;
305ed2dabfcSRobert Watson 	while (V_if_index > 0 &&
306ed2dabfcSRobert Watson 	    V_ifindex_table[V_if_index].ife_ifnet == NULL)
307ed2dabfcSRobert Watson 		V_if_index--;
308ed2dabfcSRobert Watson }
309ed2dabfcSRobert Watson 
310ed2dabfcSRobert Watson static void
311ed2dabfcSRobert Watson ifindex_free(u_short idx)
312ed2dabfcSRobert Watson {
313ed2dabfcSRobert Watson 
314ed2dabfcSRobert Watson 	IFNET_WLOCK();
315ed2dabfcSRobert Watson 	ifindex_free_locked(idx);
316ed2dabfcSRobert Watson 	IFNET_WUNLOCK();
317ed2dabfcSRobert Watson }
318ed2dabfcSRobert Watson 
319ed2dabfcSRobert Watson static void
32077dfcdc4SRobert Watson ifnet_setbyindex_locked(u_short idx, struct ifnet *ifp)
32102f4879dSRobert Watson {
32202f4879dSRobert Watson 
32302f4879dSRobert Watson 	IFNET_WLOCK_ASSERT();
32402f4879dSRobert Watson 
325603724d3SBjoern A. Zeeb 	V_ifindex_table[idx].ife_ifnet = ifp;
32602f4879dSRobert Watson }
32702f4879dSRobert Watson 
32877dfcdc4SRobert Watson static void
32977dfcdc4SRobert Watson ifnet_setbyindex(u_short idx, struct ifnet *ifp)
33077dfcdc4SRobert Watson {
33177dfcdc4SRobert Watson 
33277dfcdc4SRobert Watson 	IFNET_WLOCK();
33377dfcdc4SRobert Watson 	ifnet_setbyindex_locked(idx, ifp);
33477dfcdc4SRobert Watson 	IFNET_WUNLOCK();
33577dfcdc4SRobert Watson }
33677dfcdc4SRobert Watson 
33702f4879dSRobert Watson struct ifaddr *
33802f4879dSRobert Watson ifaddr_byindex(u_short idx)
33902f4879dSRobert Watson {
34002f4879dSRobert Watson 	struct ifaddr *ifa;
34102f4879dSRobert Watson 
34277dfcdc4SRobert Watson 	IFNET_RLOCK_NOSLEEP();
343d24c444cSKip Macy 	ifa = ifnet_byindex_locked(idx)->if_addr;
3448c0fec80SRobert Watson 	if (ifa != NULL)
3458c0fec80SRobert Watson 		ifa_ref(ifa);
34677dfcdc4SRobert Watson 	IFNET_RUNLOCK_NOSLEEP();
34702f4879dSRobert Watson 	return (ifa);
34802f4879dSRobert Watson }
34902f4879dSRobert Watson 
350df8bae1dSRodney W. Grimes /*
351df8bae1dSRodney W. Grimes  * Network interface utility routines.
352df8bae1dSRodney W. Grimes  *
353df8bae1dSRodney W. Grimes  * Routines with ifa_ifwith* names take sockaddr *'s as
354df8bae1dSRodney W. Grimes  * parameters.
355df8bae1dSRodney W. Grimes  */
356a45cbf12SBrooks Davis 
357f9132cebSJonathan Lemon static void
358d0728d71SRobert Watson vnet_if_init(const void *unused __unused)
3591ed81b73SMarko Zec {
36044e33a07SMarko Zec 
361603724d3SBjoern A. Zeeb 	TAILQ_INIT(&V_ifnet);
362603724d3SBjoern A. Zeeb 	TAILQ_INIT(&V_ifg_head);
3635f3b301aSJohn Baldwin 	IFNET_WLOCK();
364f9132cebSJonathan Lemon 	if_grow();				/* create initial table */
3655f3b301aSJohn Baldwin 	IFNET_WUNLOCK();
366d0728d71SRobert Watson 	vnet_if_clone_init();
367f9132cebSJonathan Lemon }
3685f3b301aSJohn Baldwin VNET_SYSINIT(vnet_if_init, SI_SUB_INIT_IF, SI_ORDER_SECOND, vnet_if_init,
369d0728d71SRobert Watson     NULL);
370d0728d71SRobert Watson 
371d0728d71SRobert Watson /* ARGSUSED*/
372d0728d71SRobert Watson static void
373d0728d71SRobert Watson if_init(void *dummy __unused)
374d0728d71SRobert Watson {
375d0728d71SRobert Watson 
376d0728d71SRobert Watson 	IFNET_LOCK_INIT();
377d0728d71SRobert Watson 	if_clone_init();
378d0728d71SRobert Watson }
3795f3b301aSJohn Baldwin SYSINIT(interfaces, SI_SUB_INIT_IF, SI_ORDER_FIRST, if_init, NULL);
380d0728d71SRobert Watson 
381f9132cebSJonathan Lemon 
#ifdef VIMAGE
/*
 * Per-vnet teardown: check that no interfaces or interface groups remain
 * in this vnet, then release its ifindex table.
 */
static void
vnet_if_uninit(const void *unused __unused)
{

	VNET_ASSERT(TAILQ_EMPTY(&V_ifnet), ("%s:%d tailq &V_ifnet=%p "
	    "not empty", __func__, __LINE__, &V_ifnet));
	VNET_ASSERT(TAILQ_EMPTY(&V_ifg_head), ("%s:%d tailq &V_ifg_head=%p "
	    "not empty", __func__, __LINE__, &V_ifg_head));

	free(V_ifindex_table, M_IFNET);
}
VNET_SYSUNINIT(vnet_if_uninit, SI_SUB_INIT_IF, SI_ORDER_FIRST,
    vnet_if_uninit, NULL);
#endif /* VIMAGE */
397bc29160dSMarko Zec 
3988e937462SRobert Watson static void
399f9132cebSJonathan Lemon if_grow(void)
400f9132cebSJonathan Lemon {
4015f3b301aSJohn Baldwin 	int oldlim;
402f9132cebSJonathan Lemon 	u_int n;
403f9132cebSJonathan Lemon 	struct ifindex_entry *e;
404f9132cebSJonathan Lemon 
4055f3b301aSJohn Baldwin 	IFNET_WLOCK_ASSERT();
4065f3b301aSJohn Baldwin 	oldlim = V_if_indexlim;
4075f3b301aSJohn Baldwin 	IFNET_WUNLOCK();
4085f3b301aSJohn Baldwin 	n = (oldlim << 1) * sizeof(*e);
409fc74a9f9SBrooks Davis 	e = malloc(n, M_IFNET, M_WAITOK | M_ZERO);
4105f3b301aSJohn Baldwin 	IFNET_WLOCK();
4115f3b301aSJohn Baldwin 	if (V_if_indexlim != oldlim) {
4125f3b301aSJohn Baldwin 		free(e, M_IFNET);
4135f3b301aSJohn Baldwin 		return;
4145f3b301aSJohn Baldwin 	}
415603724d3SBjoern A. Zeeb 	if (V_ifindex_table != NULL) {
416603724d3SBjoern A. Zeeb 		memcpy((caddr_t)e, (caddr_t)V_ifindex_table, n/2);
417603724d3SBjoern A. Zeeb 		free((caddr_t)V_ifindex_table, M_IFNET);
418f9132cebSJonathan Lemon 	}
4195f3b301aSJohn Baldwin 	V_if_indexlim <<= 1;
420603724d3SBjoern A. Zeeb 	V_ifindex_table = e;
421f9132cebSJonathan Lemon }
422f9132cebSJonathan Lemon 
423df8bae1dSRodney W. Grimes /*
424a45cbf12SBrooks Davis  * Allocate a struct ifnet and an index for an interface.  A layer 2
425a45cbf12SBrooks Davis  * common structure will also be allocated if an allocation routine is
426a45cbf12SBrooks Davis  * registered for the passed type.
427fc74a9f9SBrooks Davis  */
428fc74a9f9SBrooks Davis struct ifnet *
429fc74a9f9SBrooks Davis if_alloc(u_char type)
430fc74a9f9SBrooks Davis {
431fc74a9f9SBrooks Davis 	struct ifnet *ifp;
43261f6986bSRobert Watson 	u_short idx;
433fc74a9f9SBrooks Davis 
434fc74a9f9SBrooks Davis 	ifp = malloc(sizeof(struct ifnet), M_IFNET, M_WAITOK|M_ZERO);
43561f6986bSRobert Watson 	IFNET_WLOCK();
436ed2dabfcSRobert Watson 	if (ifindex_alloc_locked(&idx) != 0) {
43761f6986bSRobert Watson 		IFNET_WUNLOCK();
438dc7c539eSBrooks Davis 		free(ifp, M_IFNET);
439dc7c539eSBrooks Davis 		return (NULL);
440dc7c539eSBrooks Davis 	}
441ed2dabfcSRobert Watson 	ifnet_setbyindex_locked(idx, IFNET_HOLD);
44261f6986bSRobert Watson 	IFNET_WUNLOCK();
44361f6986bSRobert Watson 	ifp->if_index = idx;
444fc74a9f9SBrooks Davis 	ifp->if_type = type;
44527d37320SRobert Watson 	ifp->if_alloctype = type;
446fc74a9f9SBrooks Davis 	if (if_com_alloc[type] != NULL) {
447fc74a9f9SBrooks Davis 		ifp->if_l2com = if_com_alloc[type](type, ifp);
44828ef2db4SBrooks Davis 		if (ifp->if_l2com == NULL) {
449fc74a9f9SBrooks Davis 			free(ifp, M_IFNET);
450ed2dabfcSRobert Watson 			ifindex_free(idx);
45128ef2db4SBrooks Davis 			return (NULL);
45228ef2db4SBrooks Davis 		}
453fc74a9f9SBrooks Davis 	}
45427d37320SRobert Watson 
45527d37320SRobert Watson 	IF_ADDR_LOCK_INIT(ifp);
456d6f157eaSRobert Watson 	TASK_INIT(&ifp->if_linktask, 0, do_link_state_change, ifp);
457d6f157eaSRobert Watson 	ifp->if_afdata_initialized = 0;
458e0c14af9SMarko Zec 	IF_AFDATA_LOCK_INIT(ifp);
459d6f157eaSRobert Watson 	TAILQ_INIT(&ifp->if_addrhead);
460d6f157eaSRobert Watson 	TAILQ_INIT(&ifp->if_multiaddrs);
461d6f157eaSRobert Watson 	TAILQ_INIT(&ifp->if_groups);
462d6f157eaSRobert Watson #ifdef MAC
463d6f157eaSRobert Watson 	mac_ifnet_init(ifp);
464d6f157eaSRobert Watson #endif
465d659538fSSam Leffler 	ifq_init(&ifp->if_snd, ifp);
466d6f157eaSRobert Watson 
46727d37320SRobert Watson 	refcount_init(&ifp->if_refcount, 1);	/* Index reference. */
46802f4879dSRobert Watson 	ifnet_setbyindex(ifp->if_index, ifp);
469fc74a9f9SBrooks Davis 	return (ifp);
470fc74a9f9SBrooks Davis }
471fc74a9f9SBrooks Davis 
472a45cbf12SBrooks Davis /*
4734c506522SGleb Smirnoff  * Do the actual work of freeing a struct ifnet, and layer 2 common
4744c506522SGleb Smirnoff  * structure.  This call is made when the last reference to an
475242a8e72SRobert Watson  * interface is released.
476a45cbf12SBrooks Davis  */
477242a8e72SRobert Watson static void
478242a8e72SRobert Watson if_free_internal(struct ifnet *ifp)
479fc74a9f9SBrooks Davis {
480fc74a9f9SBrooks Davis 
481242a8e72SRobert Watson 	KASSERT((ifp->if_flags & IFF_DYING),
482242a8e72SRobert Watson 	    ("if_free_internal: interface not dying"));
483fc74a9f9SBrooks Davis 
48427d37320SRobert Watson 	if (if_com_free[ifp->if_alloctype] != NULL)
48527d37320SRobert Watson 		if_com_free[ifp->if_alloctype](ifp->if_l2com,
48627d37320SRobert Watson 		    ifp->if_alloctype);
487fc74a9f9SBrooks Davis 
488d6f157eaSRobert Watson #ifdef MAC
489d6f157eaSRobert Watson 	mac_ifnet_destroy(ifp);
490d6f157eaSRobert Watson #endif /* MAC */
491215940b3SXin LI 	if (ifp->if_description != NULL)
492215940b3SXin LI 		free(ifp->if_description, M_IFDESCR);
493d6f157eaSRobert Watson 	IF_AFDATA_DESTROY(ifp);
49402f4879dSRobert Watson 	IF_ADDR_LOCK_DESTROY(ifp);
495d659538fSSam Leffler 	ifq_delete(&ifp->if_snd);
496fc74a9f9SBrooks Davis 	free(ifp, M_IFNET);
497c0c9ea90SSam Leffler }
498fc74a9f9SBrooks Davis 
499242a8e72SRobert Watson /*
500f26fa169SBrooks Davis  * Deregister an interface and free the associated storage.
501242a8e72SRobert Watson  */
502242a8e72SRobert Watson void
503f26fa169SBrooks Davis if_free(struct ifnet *ifp)
504242a8e72SRobert Watson {
505242a8e72SRobert Watson 
506242a8e72SRobert Watson 	ifp->if_flags |= IFF_DYING;			/* XXX: Locking */
5074c506522SGleb Smirnoff 
508719fb725SCraig Rodrigues 	CURVNET_SET_QUIET(ifp->if_vnet);
5094c506522SGleb Smirnoff 	IFNET_WLOCK();
5104c506522SGleb Smirnoff 	KASSERT(ifp == ifnet_byindex_locked(ifp->if_index),
5114c506522SGleb Smirnoff 	    ("%s: freeing unallocated ifnet", ifp->if_xname));
5124c506522SGleb Smirnoff 
5134c506522SGleb Smirnoff 	ifindex_free_locked(ifp->if_index);
5144c506522SGleb Smirnoff 	IFNET_WUNLOCK();
5154c506522SGleb Smirnoff 
516719fb725SCraig Rodrigues 	if (refcount_release(&ifp->if_refcount))
517242a8e72SRobert Watson 		if_free_internal(ifp);
518719fb725SCraig Rodrigues 	CURVNET_RESTORE();
519242a8e72SRobert Watson }
520242a8e72SRobert Watson 
521242a8e72SRobert Watson /*
522242a8e72SRobert Watson  * Interfaces to keep an ifnet type-stable despite the possibility of the
523242a8e72SRobert Watson  * driver calling if_free().  If there are additional references, we defer
524242a8e72SRobert Watson  * freeing the underlying data structure.
525242a8e72SRobert Watson  */
526db7f0b97SKip Macy void
52727d37320SRobert Watson if_ref(struct ifnet *ifp)
52827d37320SRobert Watson {
52927d37320SRobert Watson 
53027d37320SRobert Watson 	/* We don't assert the ifnet list lock here, but arguably should. */
53127d37320SRobert Watson 	refcount_acquire(&ifp->if_refcount);
53227d37320SRobert Watson }
53327d37320SRobert Watson 
53427d37320SRobert Watson void
53527d37320SRobert Watson if_rele(struct ifnet *ifp)
53627d37320SRobert Watson {
53727d37320SRobert Watson 
538242a8e72SRobert Watson 	if (!refcount_release(&ifp->if_refcount))
539242a8e72SRobert Watson 		return;
540242a8e72SRobert Watson 	if_free_internal(ifp);
54127d37320SRobert Watson }
54227d37320SRobert Watson 
54327d37320SRobert Watson void
544d659538fSSam Leffler ifq_init(struct ifaltq *ifq, struct ifnet *ifp)
545db7f0b97SKip Macy {
546db7f0b97SKip Macy 
547db7f0b97SKip Macy 	mtx_init(&ifq->ifq_mtx, ifp->if_xname, "if send queue", MTX_DEF);
548db7f0b97SKip Macy 
549db7f0b97SKip Macy 	if (ifq->ifq_maxlen == 0)
550db7f0b97SKip Macy 		ifq->ifq_maxlen = ifqmaxlen;
551db7f0b97SKip Macy 
552db7f0b97SKip Macy 	ifq->altq_type = 0;
553db7f0b97SKip Macy 	ifq->altq_disc = NULL;
554db7f0b97SKip Macy 	ifq->altq_flags &= ALTQF_CANTCHANGE;
555db7f0b97SKip Macy 	ifq->altq_tbr  = NULL;
556db7f0b97SKip Macy 	ifq->altq_ifp  = ifp;
557db7f0b97SKip Macy }
558db7f0b97SKip Macy 
559db7f0b97SKip Macy void
560d659538fSSam Leffler ifq_delete(struct ifaltq *ifq)
561db7f0b97SKip Macy {
562db7f0b97SKip Macy 	mtx_destroy(&ifq->ifq_mtx);
563db7f0b97SKip Macy }
564db7f0b97SKip Macy 
/*
 * Perform generic interface initialization tasks and attach the interface
 * to the list of "active" interfaces.  If the vmove flag is set on entry
 * to if_attach_internal(), only a limited subset of the initialization
 * tasks is performed, given that we are moving an already fully
 * initialized ifnet from one vnet to another.
 *
 * if_attach() is the public entry point and always requests the full
 * initialization (vmove == 0).
 *
 * XXX:
 *  - The decision to return void and thus require this function to
 *    succeed is questionable.
 *  - We should probably do more sanity checking.  For instance we don't
 *    do anything to ensure if_xname is unique or non-empty.
 */
void
if_attach(struct ifnet *ifp)
{

	if_attach_internal(ifp, 0);
}
584e0c14af9SMarko Zec 
585e0c14af9SMarko Zec static void
586e0c14af9SMarko Zec if_attach_internal(struct ifnet *ifp, int vmove)
587e0c14af9SMarko Zec {
588df8bae1dSRodney W. Grimes 	unsigned socksize, ifasize;
5891ce9bf88SPoul-Henning Kamp 	int namelen, masklen;
59072fd1b6aSDag-Erling Smørgrav 	struct sockaddr_dl *sdl;
59172fd1b6aSDag-Erling Smørgrav 	struct ifaddr *ifa;
592df8bae1dSRodney W. Grimes 
593fc74a9f9SBrooks Davis 	if (ifp->if_index == 0 || ifp != ifnet_byindex(ifp->if_index))
594fc74a9f9SBrooks Davis 		panic ("%s: BUG: if_attach called without if_alloc'd input()\n",
595fc74a9f9SBrooks Davis 		    ifp->if_xname);
596fc74a9f9SBrooks Davis 
597f6dfe47aSMarko Zec #ifdef VIMAGE
598f6dfe47aSMarko Zec 	ifp->if_vnet = curvnet;
599bc29160dSMarko Zec 	if (ifp->if_home_vnet == NULL)
600bc29160dSMarko Zec 		ifp->if_home_vnet = curvnet;
601f6dfe47aSMarko Zec #endif
602f6dfe47aSMarko Zec 
6030dad3f0eSMax Laier 	if_addgroup(ifp, IFG_ALL);
6040dad3f0eSMax Laier 
60598b9590eSPoul-Henning Kamp 	getmicrotime(&ifp->if_lastchange);
606bc9d2991SBrooks Davis 	ifp->if_data.ifi_epoch = time_uptime;
607fc74a9f9SBrooks Davis 	ifp->if_data.ifi_datalen = sizeof(struct if_data);
608d6f157eaSRobert Watson 
6097cc5b47fSKip Macy 	KASSERT((ifp->if_transmit == NULL && ifp->if_qflush == NULL) ||
6107cc5b47fSKip Macy 	    (ifp->if_transmit != NULL && ifp->if_qflush != NULL),
6117cc5b47fSKip Macy 	    ("transmit and qflush must both either be set or both be NULL"));
6127cc5b47fSKip Macy 	if (ifp->if_transmit == NULL) {
613db7f0b97SKip Macy 		ifp->if_transmit = if_transmit;
614db7f0b97SKip Macy 		ifp->if_qflush = if_qflush;
6157cc5b47fSKip Macy 	}
6167cc5b47fSKip Macy 
617e0c14af9SMarko Zec 	if (!vmove) {
618e70cd263SRobert Watson #ifdef MAC
61930d239bcSRobert Watson 		mac_ifnet_create(ifp);
620e70cd263SRobert Watson #endif
621e70cd263SRobert Watson 
622df8bae1dSRodney W. Grimes 		/*
623e0c14af9SMarko Zec 		 * Create a Link Level name for this device.
624df8bae1dSRodney W. Grimes 		 */
6259bf40edeSBrooks Davis 		namelen = strlen(ifp->if_xname);
62636c19a57SBrooks Davis 		/*
627e0c14af9SMarko Zec 		 * Always save enough space for any possiable name so we
628e0c14af9SMarko Zec 		 * can do a rename in place later.
62936c19a57SBrooks Davis 		 */
63036c19a57SBrooks Davis 		masklen = offsetof(struct sockaddr_dl, sdl_data[0]) + IFNAMSIZ;
631df8bae1dSRodney W. Grimes 		socksize = masklen + ifp->if_addrlen;
632df8bae1dSRodney W. Grimes 		if (socksize < sizeof(*sdl))
633df8bae1dSRodney W. Grimes 			socksize = sizeof(*sdl);
634ccb82468SBrooks Davis 		socksize = roundup2(socksize, sizeof(long));
635df8bae1dSRodney W. Grimes 		ifasize = sizeof(*ifa) + 2 * socksize;
63646758960SGleb Smirnoff 		ifa = ifa_alloc(ifasize, M_WAITOK);
637df8bae1dSRodney W. Grimes 		sdl = (struct sockaddr_dl *)(ifa + 1);
638df8bae1dSRodney W. Grimes 		sdl->sdl_len = socksize;
639df8bae1dSRodney W. Grimes 		sdl->sdl_family = AF_LINK;
6409bf40edeSBrooks Davis 		bcopy(ifp->if_xname, sdl->sdl_data, namelen);
6411ce9bf88SPoul-Henning Kamp 		sdl->sdl_nlen = namelen;
642df8bae1dSRodney W. Grimes 		sdl->sdl_index = ifp->if_index;
643df8bae1dSRodney W. Grimes 		sdl->sdl_type = ifp->if_type;
6444a0d6638SRuslan Ermilov 		ifp->if_addr = ifa;
645df8bae1dSRodney W. Grimes 		ifa->ifa_ifp = ifp;
646df8bae1dSRodney W. Grimes 		ifa->ifa_rtrequest = link_rtrequest;
647df8bae1dSRodney W. Grimes 		ifa->ifa_addr = (struct sockaddr *)sdl;
648df8bae1dSRodney W. Grimes 		sdl = (struct sockaddr_dl *)(socksize + (caddr_t)sdl);
649df8bae1dSRodney W. Grimes 		ifa->ifa_netmask = (struct sockaddr *)sdl;
650df8bae1dSRodney W. Grimes 		sdl->sdl_len = masklen;
651df8bae1dSRodney W. Grimes 		while (namelen != 0)
652df8bae1dSRodney W. Grimes 			sdl->sdl_data[--namelen] = 0xff;
65359562606SGarrett Wollman 		TAILQ_INSERT_HEAD(&ifp->if_addrhead, ifa, ifa_link);
654e0c14af9SMarko Zec 		/* Reliably crash if used uninitialized. */
655e0c14af9SMarko Zec 		ifp->if_broadcastaddr = NULL;
6563c914c54SAndre Oppermann 
6578aa99373SJohn Baldwin #if defined(INET) || defined(INET6)
6583c914c54SAndre Oppermann 		/* Initialize to max value. */
6593c914c54SAndre Oppermann 		if (ifp->if_hw_tsomax == 0)
6603c914c54SAndre Oppermann 			ifp->if_hw_tsomax = IP_MAXPACKET;
6613c914c54SAndre Oppermann 		KASSERT(ifp->if_hw_tsomax <= IP_MAXPACKET &&
6623c914c54SAndre Oppermann 		    ifp->if_hw_tsomax >= IP_MAXPACKET / 8,
6633c914c54SAndre Oppermann 		    ("%s: tsomax outside of range", __func__));
6648aa99373SJohn Baldwin #endif
665e0c14af9SMarko Zec 	}
66652db6805SMarko Zec #ifdef VIMAGE
66752db6805SMarko Zec 	else {
66852db6805SMarko Zec 		/*
66952db6805SMarko Zec 		 * Update the interface index in the link layer address
67052db6805SMarko Zec 		 * of the interface.
67152db6805SMarko Zec 		 */
67252db6805SMarko Zec 		for (ifa = ifp->if_addr; ifa != NULL;
67352db6805SMarko Zec 		    ifa = TAILQ_NEXT(ifa, ifa_link)) {
67452db6805SMarko Zec 			if (ifa->ifa_addr->sa_family == AF_LINK) {
67552db6805SMarko Zec 				sdl = (struct sockaddr_dl *)ifa->ifa_addr;
67652db6805SMarko Zec 				sdl->sdl_index = ifp->if_index;
67752db6805SMarko Zec 			}
67852db6805SMarko Zec 		}
67952db6805SMarko Zec 	}
68052db6805SMarko Zec #endif
681d94ccb09SBrooks Davis 
682457f48e6SGleb Smirnoff 	IFNET_WLOCK();
683603724d3SBjoern A. Zeeb 	TAILQ_INSERT_TAIL(&V_ifnet, ifp, if_link);
68421ca7b57SMarko Zec #ifdef VIMAGE
685006e9db4SRobert Watson 	curvnet->vnet_ifcnt++;
68621ca7b57SMarko Zec #endif
687457f48e6SGleb Smirnoff 	IFNET_WUNLOCK();
688457f48e6SGleb Smirnoff 
68969fb23b7SMax Laier 	if (domain_init_status >= 2)
69031b1bfe1SHajimu UMEMOTO 		if_attachdomain1(ifp);
69131b1bfe1SHajimu UMEMOTO 
69225a4adceSMax Laier 	EVENTHANDLER_INVOKE(ifnet_arrival_event, ifp);
69321ca7b57SMarko Zec 	if (IS_DEFAULT_VNET(curvnet))
694f3b90d48SAndrew Thompson 		devctl_notify("IFNET", ifp->if_xname, "ATTACH", NULL);
69525a4adceSMax Laier 
6967b6edd04SRuslan Ermilov 	/* Announce the interface. */
6977b6edd04SRuslan Ermilov 	rt_ifannouncemsg(ifp, IFAN_ARRIVAL);
698df8bae1dSRodney W. Grimes }
6996182fdbdSPeter Wemm 
70031b1bfe1SHajimu UMEMOTO static void
70172fd1b6aSDag-Erling Smørgrav if_attachdomain(void *dummy)
70231b1bfe1SHajimu UMEMOTO {
70331b1bfe1SHajimu UMEMOTO 	struct ifnet *ifp;
70431b1bfe1SHajimu UMEMOTO 
705603724d3SBjoern A. Zeeb 	TAILQ_FOREACH(ifp, &V_ifnet, if_link)
70631b1bfe1SHajimu UMEMOTO 		if_attachdomain1(ifp);
70731b1bfe1SHajimu UMEMOTO }
70869fb23b7SMax Laier SYSINIT(domainifattach, SI_SUB_PROTO_IFATTACHDOMAIN, SI_ORDER_SECOND,
70931b1bfe1SHajimu UMEMOTO     if_attachdomain, NULL);
71031b1bfe1SHajimu UMEMOTO 
71131b1bfe1SHajimu UMEMOTO static void
71272fd1b6aSDag-Erling Smørgrav if_attachdomain1(struct ifnet *ifp)
71331b1bfe1SHajimu UMEMOTO {
71431b1bfe1SHajimu UMEMOTO 	struct domain *dp;
71531b1bfe1SHajimu UMEMOTO 
716234a35c7SHajimu UMEMOTO 	/*
717234a35c7SHajimu UMEMOTO 	 * Since dp->dom_ifattach calls malloc() with M_WAITOK, we
718234a35c7SHajimu UMEMOTO 	 * cannot lock ifp->if_afdata initialization, entirely.
719234a35c7SHajimu UMEMOTO 	 */
720c9b652e3SAndre Oppermann 	if (IF_AFDATA_TRYLOCK(ifp) == 0)
721234a35c7SHajimu UMEMOTO 		return;
72269fb23b7SMax Laier 	if (ifp->if_afdata_initialized >= domain_init_status) {
723234a35c7SHajimu UMEMOTO 		IF_AFDATA_UNLOCK(ifp);
724813ee737SAndre Oppermann 		log(LOG_WARNING, "%s called more than once on %s\n",
725813ee737SAndre Oppermann 		    __func__, ifp->if_xname);
726234a35c7SHajimu UMEMOTO 		return;
727234a35c7SHajimu UMEMOTO 	}
72869fb23b7SMax Laier 	ifp->if_afdata_initialized = domain_init_status;
729234a35c7SHajimu UMEMOTO 	IF_AFDATA_UNLOCK(ifp);
730234a35c7SHajimu UMEMOTO 
73131b1bfe1SHajimu UMEMOTO 	/* address family dependent data region */
73231b1bfe1SHajimu UMEMOTO 	bzero(ifp->if_afdata, sizeof(ifp->if_afdata));
73331b1bfe1SHajimu UMEMOTO 	for (dp = domains; dp; dp = dp->dom_next) {
73431b1bfe1SHajimu UMEMOTO 		if (dp->dom_ifattach)
73531b1bfe1SHajimu UMEMOTO 			ifp->if_afdata[dp->dom_family] =
73631b1bfe1SHajimu UMEMOTO 			    (*dp->dom_ifattach)(ifp);
73731b1bfe1SHajimu UMEMOTO 	}
73831b1bfe1SHajimu UMEMOTO }
73931b1bfe1SHajimu UMEMOTO 
7406182fdbdSPeter Wemm /*
741ec002feeSBruce M Simpson  * Remove any unicast or broadcast network addresses from an interface.
74245778b37SPeter Edwards  */
74345778b37SPeter Edwards void
74445778b37SPeter Edwards if_purgeaddrs(struct ifnet *ifp)
74545778b37SPeter Edwards {
74645778b37SPeter Edwards 	struct ifaddr *ifa, *next;
74745778b37SPeter Edwards 
74845778b37SPeter Edwards 	TAILQ_FOREACH_SAFE(ifa, &ifp->if_addrhead, ifa_link, next) {
7494b97d7afSYaroslav Tykhiy 		if (ifa->ifa_addr->sa_family == AF_LINK)
75045778b37SPeter Edwards 			continue;
75145778b37SPeter Edwards #ifdef INET
75245778b37SPeter Edwards 		/* XXX: Ugly!! ad hoc just for INET */
7534b97d7afSYaroslav Tykhiy 		if (ifa->ifa_addr->sa_family == AF_INET) {
75445778b37SPeter Edwards 			struct ifaliasreq ifr;
75545778b37SPeter Edwards 
75645778b37SPeter Edwards 			bzero(&ifr, sizeof(ifr));
75745778b37SPeter Edwards 			ifr.ifra_addr = *ifa->ifa_addr;
75845778b37SPeter Edwards 			if (ifa->ifa_dstaddr)
75945778b37SPeter Edwards 				ifr.ifra_broadaddr = *ifa->ifa_dstaddr;
76045778b37SPeter Edwards 			if (in_control(NULL, SIOCDIFADDR, (caddr_t)&ifr, ifp,
76145778b37SPeter Edwards 			    NULL) == 0)
76245778b37SPeter Edwards 				continue;
76345778b37SPeter Edwards 		}
76445778b37SPeter Edwards #endif /* INET */
76545778b37SPeter Edwards #ifdef INET6
7664b97d7afSYaroslav Tykhiy 		if (ifa->ifa_addr->sa_family == AF_INET6) {
76745778b37SPeter Edwards 			in6_purgeaddr(ifa);
76845778b37SPeter Edwards 			/* ifp_addrhead is already updated */
76945778b37SPeter Edwards 			continue;
77045778b37SPeter Edwards 		}
77145778b37SPeter Edwards #endif /* INET6 */
77245778b37SPeter Edwards 		TAILQ_REMOVE(&ifp->if_addrhead, ifa, ifa_link);
7731099f828SRobert Watson 		ifa_free(ifa);
77445778b37SPeter Edwards 	}
77545778b37SPeter Edwards }
77645778b37SPeter Edwards 
77745778b37SPeter Edwards /*
77893ec7edcSShteryana Shopova  * Remove any multicast network addresses from an interface when an ifnet
77993ec7edcSShteryana Shopova  * is going away.
780ec002feeSBruce M Simpson  */
78193ec7edcSShteryana Shopova static void
782ec002feeSBruce M Simpson if_purgemaddrs(struct ifnet *ifp)
783ec002feeSBruce M Simpson {
784ec002feeSBruce M Simpson 	struct ifmultiaddr *ifma;
785ec002feeSBruce M Simpson 	struct ifmultiaddr *next;
786ec002feeSBruce M Simpson 
787137f91e8SJohn Baldwin 	IF_ADDR_WLOCK(ifp);
788ec002feeSBruce M Simpson 	TAILQ_FOREACH_SAFE(ifma, &ifp->if_multiaddrs, ifma_link, next)
789ec002feeSBruce M Simpson 		if_delmulti_locked(ifp, ifma, 1);
790137f91e8SJohn Baldwin 	IF_ADDR_WUNLOCK(ifp);
791ec002feeSBruce M Simpson }
792ec002feeSBruce M Simpson 
793ec002feeSBruce M Simpson /*
794e0c14af9SMarko Zec  * Detach an interface, removing it from the list of "active" interfaces.
795e0c14af9SMarko Zec  * If vmove flag is set on entry to if_detach_internal(), perform only a
796e0c14af9SMarko Zec  * limited subset of cleanup tasks, given that we are moving an ifnet from
797e0c14af9SMarko Zec  * one vnet to another, where it must be fully operational.
798b1c53bc9SRobert Watson  *
799b1c53bc9SRobert Watson  * XXXRW: There are some significant questions about event ordering, and
800b1c53bc9SRobert Watson  * how to prevent things from starting to use the interface during detach.
8016182fdbdSPeter Wemm  */
8026182fdbdSPeter Wemm void
80372fd1b6aSDag-Erling Smørgrav if_detach(struct ifnet *ifp)
8046182fdbdSPeter Wemm {
805e0c14af9SMarko Zec 
806719fb725SCraig Rodrigues 	CURVNET_SET_QUIET(ifp->if_vnet);
807e0c14af9SMarko Zec 	if_detach_internal(ifp, 0);
808719fb725SCraig Rodrigues 	CURVNET_RESTORE();
809e0c14af9SMarko Zec }
810e0c14af9SMarko Zec 
811e0c14af9SMarko Zec static void
812e0c14af9SMarko Zec if_detach_internal(struct ifnet *ifp, int vmove)
813e0c14af9SMarko Zec {
81445778b37SPeter Edwards 	struct ifaddr *ifa;
8155500d3beSWarner Losh 	struct radix_node_head	*rnh;
816e0c14af9SMarko Zec 	int i, j;
81731b1bfe1SHajimu UMEMOTO 	struct domain *dp;
8183f35d515SPeter Pentchev  	struct ifnet *iter;
819457f48e6SGleb Smirnoff  	int found = 0;
820457f48e6SGleb Smirnoff 
821457f48e6SGleb Smirnoff 	IFNET_WLOCK();
822603724d3SBjoern A. Zeeb 	TAILQ_FOREACH(iter, &V_ifnet, if_link)
823457f48e6SGleb Smirnoff 		if (iter == ifp) {
824603724d3SBjoern A. Zeeb 			TAILQ_REMOVE(&V_ifnet, ifp, if_link);
825457f48e6SGleb Smirnoff 			found = 1;
826457f48e6SGleb Smirnoff 			break;
827457f48e6SGleb Smirnoff 		}
82821ca7b57SMarko Zec #ifdef VIMAGE
82921ca7b57SMarko Zec 	if (found)
830006e9db4SRobert Watson 		curvnet->vnet_ifcnt--;
83121ca7b57SMarko Zec #endif
832457f48e6SGleb Smirnoff 	IFNET_WUNLOCK();
833e0c14af9SMarko Zec 	if (!found) {
834e0c14af9SMarko Zec 		if (vmove)
83558606037SBjoern A. Zeeb 			panic("%s: ifp=%p not on the ifnet tailq %p",
83658606037SBjoern A. Zeeb 			    __func__, ifp, &V_ifnet);
837e0c14af9SMarko Zec 		else
838e0c14af9SMarko Zec 			return; /* XXX this should panic as well? */
839e0c14af9SMarko Zec 	}
8406182fdbdSPeter Wemm 
84168a3482fSGleb Smirnoff 	/*
84268a3482fSGleb Smirnoff 	 * Remove/wait for pending events.
84368a3482fSGleb Smirnoff 	 */
84468a3482fSGleb Smirnoff 	taskqueue_drain(taskqueue_swi, &ifp->if_linktask);
84568a3482fSGleb Smirnoff 
8466182fdbdSPeter Wemm 	/*
8476182fdbdSPeter Wemm 	 * Remove routes and flush queues.
8486182fdbdSPeter Wemm 	 */
8496182fdbdSPeter Wemm 	if_down(ifp);
85002b199f1SMax Laier #ifdef ALTQ
85102b199f1SMax Laier 	if (ALTQ_IS_ENABLED(&ifp->if_snd))
85202b199f1SMax Laier 		altq_disable(&ifp->if_snd);
85302b199f1SMax Laier 	if (ALTQ_IS_ATTACHED(&ifp->if_snd))
85402b199f1SMax Laier 		altq_detach(&ifp->if_snd);
85502b199f1SMax Laier #endif
8566182fdbdSPeter Wemm 
85745778b37SPeter Edwards 	if_purgeaddrs(ifp);
8586182fdbdSPeter Wemm 
859b1c53bc9SRobert Watson #ifdef INET
860b1c53bc9SRobert Watson 	in_ifdetach(ifp);
861b1c53bc9SRobert Watson #endif
862b1c53bc9SRobert Watson 
86333841545SHajimu UMEMOTO #ifdef INET6
86433841545SHajimu UMEMOTO 	/*
86533841545SHajimu UMEMOTO 	 * Remove all IPv6 kernel structs related to ifp.  This should be done
86633841545SHajimu UMEMOTO 	 * before removing routing entries below, since IPv6 interface direct
86733841545SHajimu UMEMOTO 	 * routes are expected to be removed by the IPv6-specific kernel API.
86833841545SHajimu UMEMOTO 	 * Otherwise, the kernel will detect some inconsistency and bark it.
86933841545SHajimu UMEMOTO 	 */
87033841545SHajimu UMEMOTO 	in6_ifdetach(ifp);
87133841545SHajimu UMEMOTO #endif
872ec002feeSBruce M Simpson 	if_purgemaddrs(ifp);
873ec002feeSBruce M Simpson 
874e0c14af9SMarko Zec 	if (!vmove) {
875f4247b59SLuigi Rizzo 		/*
876111c6b61SRobert Watson 		 * Prevent further calls into the device driver via ifnet.
877111c6b61SRobert Watson 		 */
878111c6b61SRobert Watson 		if_dead(ifp);
879111c6b61SRobert Watson 
880111c6b61SRobert Watson 		/*
8814a0d6638SRuslan Ermilov 		 * Remove link ifaddr pointer and maybe decrement if_index.
882f4247b59SLuigi Rizzo 		 * Clean up all addresses.
883f4247b59SLuigi Rizzo 		 */
8844a0d6638SRuslan Ermilov 		ifp->if_addr = NULL;
885f4247b59SLuigi Rizzo 
886212bd869SHajimu UMEMOTO 		/* We can now free link ifaddr. */
8873f35d515SPeter Pentchev 		if (!TAILQ_EMPTY(&ifp->if_addrhead)) {
888212bd869SHajimu UMEMOTO 			ifa = TAILQ_FIRST(&ifp->if_addrhead);
889212bd869SHajimu UMEMOTO 			TAILQ_REMOVE(&ifp->if_addrhead, ifa, ifa_link);
8901099f828SRobert Watson 			ifa_free(ifa);
8913f35d515SPeter Pentchev 		}
892e0c14af9SMarko Zec 	}
893212bd869SHajimu UMEMOTO 
8945500d3beSWarner Losh 	/*
8955500d3beSWarner Losh 	 * Delete all remaining routes using this interface
8965500d3beSWarner Losh 	 * Unfortuneatly the only way to do this is to slog through
8975500d3beSWarner Losh 	 * the entire routing table looking for routes which point
8985500d3beSWarner Losh 	 * to this interface...oh well...
8995500d3beSWarner Losh 	 */
9005500d3beSWarner Losh 	for (i = 1; i <= AF_MAX; i++) {
9018b07e49aSJulian Elischer 		for (j = 0; j < rt_numfibs; j++) {
902c2c2a7c1SBjoern A. Zeeb 			rnh = rt_tables_get_rnh(j, i);
903c2c2a7c1SBjoern A. Zeeb 			if (rnh == NULL)
9045500d3beSWarner Losh 				continue;
905956b0b65SJeffrey Hsu 			RADIX_NODE_HEAD_LOCK(rnh);
9065500d3beSWarner Losh 			(void) rnh->rnh_walktree(rnh, if_rtdel, ifp);
907956b0b65SJeffrey Hsu 			RADIX_NODE_HEAD_UNLOCK(rnh);
9085500d3beSWarner Losh 		}
9098b07e49aSJulian Elischer 	}
9105500d3beSWarner Losh 
9117b6edd04SRuslan Ermilov 	/* Announce that the interface is gone. */
9127b6edd04SRuslan Ermilov 	rt_ifannouncemsg(ifp, IFAN_DEPARTURE);
91352023244SMax Laier 	EVENTHANDLER_INVOKE(ifnet_departure_event, ifp);
91421ca7b57SMarko Zec 	if (IS_DEFAULT_VNET(curvnet))
915f3b90d48SAndrew Thompson 		devctl_notify("IFNET", ifp->if_xname, "DETACH", NULL);
9168623f9fdSMax Laier 	if_delgroups(ifp);
9177b6edd04SRuslan Ermilov 
918d8c13659SBjoern A. Zeeb 	/*
919d8c13659SBjoern A. Zeeb 	 * We cannot hold the lock over dom_ifdetach calls as they might
920d8c13659SBjoern A. Zeeb 	 * sleep, for example trying to drain a callout, thus open up the
921d8c13659SBjoern A. Zeeb 	 * theoretical race with re-attaching.
922d8c13659SBjoern A. Zeeb 	 */
923234a35c7SHajimu UMEMOTO 	IF_AFDATA_LOCK(ifp);
924d8c13659SBjoern A. Zeeb 	i = ifp->if_afdata_initialized;
925d8c13659SBjoern A. Zeeb 	ifp->if_afdata_initialized = 0;
926d8c13659SBjoern A. Zeeb 	IF_AFDATA_UNLOCK(ifp);
927d8c13659SBjoern A. Zeeb 	for (dp = domains; i > 0 && dp; dp = dp->dom_next) {
92831b1bfe1SHajimu UMEMOTO 		if (dp->dom_ifdetach && ifp->if_afdata[dp->dom_family])
92931b1bfe1SHajimu UMEMOTO 			(*dp->dom_ifdetach)(ifp,
93031b1bfe1SHajimu UMEMOTO 			    ifp->if_afdata[dp->dom_family]);
93131b1bfe1SHajimu UMEMOTO 	}
9325500d3beSWarner Losh }
9335500d3beSWarner Losh 
934e0c14af9SMarko Zec #ifdef VIMAGE
935e0c14af9SMarko Zec /*
936e0c14af9SMarko Zec  * if_vmove() performs a limited version of if_detach() in current
937e0c14af9SMarko Zec  * vnet and if_attach()es the ifnet to the vnet specified as 2nd arg.
938e0c14af9SMarko Zec  * An attempt is made to shrink if_index in current vnet, find an
939e0c14af9SMarko Zec  * unused if_index in target vnet and calls if_grow() if necessary,
940e0c14af9SMarko Zec  * and finally find an unused if_xname for the target vnet.
941e0c14af9SMarko Zec  */
942e0c14af9SMarko Zec void
943e0c14af9SMarko Zec if_vmove(struct ifnet *ifp, struct vnet *new_vnet)
944e0c14af9SMarko Zec {
94561f6986bSRobert Watson 	u_short idx;
946e0c14af9SMarko Zec 
947e0c14af9SMarko Zec 	/*
948e0c14af9SMarko Zec 	 * Detach from current vnet, but preserve LLADDR info, do not
949e0c14af9SMarko Zec 	 * mark as dead etc. so that the ifnet can be reattached later.
950e0c14af9SMarko Zec 	 */
951e0c14af9SMarko Zec 	if_detach_internal(ifp, 1);
952e0c14af9SMarko Zec 
953e0c14af9SMarko Zec 	/*
95477dfcdc4SRobert Watson 	 * Unlink the ifnet from ifindex_table[] in current vnet, and shrink
95577dfcdc4SRobert Watson 	 * the if_index for that vnet if possible.
95677dfcdc4SRobert Watson 	 *
95777dfcdc4SRobert Watson 	 * NOTE: IFNET_WLOCK/IFNET_WUNLOCK() are assumed to be unvirtualized,
95877dfcdc4SRobert Watson 	 * or we'd lock on one vnet and unlock on another.
959e0c14af9SMarko Zec 	 */
960e0c14af9SMarko Zec 	IFNET_WLOCK();
961ed2dabfcSRobert Watson 	ifindex_free_locked(ifp->if_index);
962d3c351c5SMarko Zec 	IFNET_WUNLOCK();
963d3c351c5SMarko Zec 
964d3c351c5SMarko Zec 	/*
965d3c351c5SMarko Zec 	 * Perform interface-specific reassignment tasks, if provided by
966d3c351c5SMarko Zec 	 * the driver.
967d3c351c5SMarko Zec 	 */
968d3c351c5SMarko Zec 	if (ifp->if_reassign != NULL)
969d3c351c5SMarko Zec 		ifp->if_reassign(ifp, new_vnet, NULL);
970e0c14af9SMarko Zec 
971e0c14af9SMarko Zec 	/*
972e0c14af9SMarko Zec 	 * Switch to the context of the target vnet.
973e0c14af9SMarko Zec 	 */
974e0c14af9SMarko Zec 	CURVNET_SET_QUIET(new_vnet);
975e0c14af9SMarko Zec 
976d3c351c5SMarko Zec 	IFNET_WLOCK();
977ed2dabfcSRobert Watson 	if (ifindex_alloc_locked(&idx) != 0) {
97861f6986bSRobert Watson 		IFNET_WUNLOCK();
979e0c14af9SMarko Zec 		panic("if_index overflow");
98061f6986bSRobert Watson 	}
98161f6986bSRobert Watson 	ifp->if_index = idx;
98277dfcdc4SRobert Watson 	ifnet_setbyindex_locked(ifp->if_index, ifp);
983e0c14af9SMarko Zec 	IFNET_WUNLOCK();
984e0c14af9SMarko Zec 
985e0c14af9SMarko Zec 	if_attach_internal(ifp, 1);
986e0c14af9SMarko Zec 
987e0c14af9SMarko Zec 	CURVNET_RESTORE();
988e0c14af9SMarko Zec }
989be31e5e7SBjoern A. Zeeb 
990be31e5e7SBjoern A. Zeeb /*
991be31e5e7SBjoern A. Zeeb  * Move an ifnet to or from another child prison/vnet, specified by the jail id.
992be31e5e7SBjoern A. Zeeb  */
993be31e5e7SBjoern A. Zeeb static int
994be31e5e7SBjoern A. Zeeb if_vmove_loan(struct thread *td, struct ifnet *ifp, char *ifname, int jid)
995be31e5e7SBjoern A. Zeeb {
996be31e5e7SBjoern A. Zeeb 	struct prison *pr;
997be31e5e7SBjoern A. Zeeb 	struct ifnet *difp;
998be31e5e7SBjoern A. Zeeb 
999be31e5e7SBjoern A. Zeeb 	/* Try to find the prison within our visibility. */
1000be31e5e7SBjoern A. Zeeb 	sx_slock(&allprison_lock);
1001be31e5e7SBjoern A. Zeeb 	pr = prison_find_child(td->td_ucred->cr_prison, jid);
1002be31e5e7SBjoern A. Zeeb 	sx_sunlock(&allprison_lock);
1003be31e5e7SBjoern A. Zeeb 	if (pr == NULL)
1004be31e5e7SBjoern A. Zeeb 		return (ENXIO);
1005be31e5e7SBjoern A. Zeeb 	prison_hold_locked(pr);
1006be31e5e7SBjoern A. Zeeb 	mtx_unlock(&pr->pr_mtx);
1007be31e5e7SBjoern A. Zeeb 
1008be31e5e7SBjoern A. Zeeb 	/* Do not try to move the iface from and to the same prison. */
1009be31e5e7SBjoern A. Zeeb 	if (pr->pr_vnet == ifp->if_vnet) {
1010be31e5e7SBjoern A. Zeeb 		prison_free(pr);
1011be31e5e7SBjoern A. Zeeb 		return (EEXIST);
1012be31e5e7SBjoern A. Zeeb 	}
1013be31e5e7SBjoern A. Zeeb 
1014be31e5e7SBjoern A. Zeeb 	/* Make sure the named iface does not exists in the dst. prison/vnet. */
1015be31e5e7SBjoern A. Zeeb 	/* XXX Lock interfaces to avoid races. */
10169abb4862SMarko Zec 	CURVNET_SET_QUIET(pr->pr_vnet);
1017be31e5e7SBjoern A. Zeeb 	difp = ifunit(ifname);
1018be31e5e7SBjoern A. Zeeb 	CURVNET_RESTORE();
1019be31e5e7SBjoern A. Zeeb 	if (difp != NULL) {
1020be31e5e7SBjoern A. Zeeb 		prison_free(pr);
1021be31e5e7SBjoern A. Zeeb 		return (EEXIST);
1022be31e5e7SBjoern A. Zeeb 	}
1023be31e5e7SBjoern A. Zeeb 
1024be31e5e7SBjoern A. Zeeb 	/* Move the interface into the child jail/vnet. */
1025be31e5e7SBjoern A. Zeeb 	if_vmove(ifp, pr->pr_vnet);
1026be31e5e7SBjoern A. Zeeb 
1027be31e5e7SBjoern A. Zeeb 	/* Report the new if_xname back to the userland. */
1028be31e5e7SBjoern A. Zeeb 	sprintf(ifname, "%s", ifp->if_xname);
1029be31e5e7SBjoern A. Zeeb 
1030be31e5e7SBjoern A. Zeeb 	prison_free(pr);
1031be31e5e7SBjoern A. Zeeb 	return (0);
1032be31e5e7SBjoern A. Zeeb }
1033be31e5e7SBjoern A. Zeeb 
1034be31e5e7SBjoern A. Zeeb static int
1035be31e5e7SBjoern A. Zeeb if_vmove_reclaim(struct thread *td, char *ifname, int jid)
1036be31e5e7SBjoern A. Zeeb {
1037be31e5e7SBjoern A. Zeeb 	struct prison *pr;
1038be31e5e7SBjoern A. Zeeb 	struct vnet *vnet_dst;
1039be31e5e7SBjoern A. Zeeb 	struct ifnet *ifp;
1040be31e5e7SBjoern A. Zeeb 
1041be31e5e7SBjoern A. Zeeb 	/* Try to find the prison within our visibility. */
1042be31e5e7SBjoern A. Zeeb 	sx_slock(&allprison_lock);
1043be31e5e7SBjoern A. Zeeb 	pr = prison_find_child(td->td_ucred->cr_prison, jid);
1044be31e5e7SBjoern A. Zeeb 	sx_sunlock(&allprison_lock);
1045be31e5e7SBjoern A. Zeeb 	if (pr == NULL)
1046be31e5e7SBjoern A. Zeeb 		return (ENXIO);
1047be31e5e7SBjoern A. Zeeb 	prison_hold_locked(pr);
1048be31e5e7SBjoern A. Zeeb 	mtx_unlock(&pr->pr_mtx);
1049be31e5e7SBjoern A. Zeeb 
1050be31e5e7SBjoern A. Zeeb 	/* Make sure the named iface exists in the source prison/vnet. */
1051be31e5e7SBjoern A. Zeeb 	CURVNET_SET(pr->pr_vnet);
1052be31e5e7SBjoern A. Zeeb 	ifp = ifunit(ifname);		/* XXX Lock to avoid races. */
1053be31e5e7SBjoern A. Zeeb 	if (ifp == NULL) {
1054be31e5e7SBjoern A. Zeeb 		CURVNET_RESTORE();
1055be31e5e7SBjoern A. Zeeb 		prison_free(pr);
1056be31e5e7SBjoern A. Zeeb 		return (ENXIO);
1057be31e5e7SBjoern A. Zeeb 	}
1058be31e5e7SBjoern A. Zeeb 
1059be31e5e7SBjoern A. Zeeb 	/* Do not try to move the iface from and to the same prison. */
1060be31e5e7SBjoern A. Zeeb 	vnet_dst = TD_TO_VNET(td);
1061be31e5e7SBjoern A. Zeeb 	if (vnet_dst == ifp->if_vnet) {
1062be31e5e7SBjoern A. Zeeb 		CURVNET_RESTORE();
1063be31e5e7SBjoern A. Zeeb 		prison_free(pr);
1064be31e5e7SBjoern A. Zeeb 		return (EEXIST);
1065be31e5e7SBjoern A. Zeeb 	}
1066be31e5e7SBjoern A. Zeeb 
1067be31e5e7SBjoern A. Zeeb 	/* Get interface back from child jail/vnet. */
1068be31e5e7SBjoern A. Zeeb 	if_vmove(ifp, vnet_dst);
1069be31e5e7SBjoern A. Zeeb 	CURVNET_RESTORE();
1070be31e5e7SBjoern A. Zeeb 
1071be31e5e7SBjoern A. Zeeb 	/* Report the new if_xname back to the userland. */
1072be31e5e7SBjoern A. Zeeb 	sprintf(ifname, "%s", ifp->if_xname);
1073be31e5e7SBjoern A. Zeeb 
1074be31e5e7SBjoern A. Zeeb 	prison_free(pr);
1075be31e5e7SBjoern A. Zeeb 	return (0);
1076be31e5e7SBjoern A. Zeeb }
1077e0c14af9SMarko Zec #endif /* VIMAGE */
1078e0c14af9SMarko Zec 
10795500d3beSWarner Losh /*
10800dad3f0eSMax Laier  * Add a group to an interface
10810dad3f0eSMax Laier  */
10820dad3f0eSMax Laier int
10830dad3f0eSMax Laier if_addgroup(struct ifnet *ifp, const char *groupname)
10840dad3f0eSMax Laier {
10850dad3f0eSMax Laier 	struct ifg_list		*ifgl;
10860dad3f0eSMax Laier 	struct ifg_group	*ifg = NULL;
10870dad3f0eSMax Laier 	struct ifg_member	*ifgm;
1088d6d3f01eSGleb Smirnoff 	int 			 new = 0;
10890dad3f0eSMax Laier 
10900dad3f0eSMax Laier 	if (groupname[0] && groupname[strlen(groupname) - 1] >= '0' &&
10910dad3f0eSMax Laier 	    groupname[strlen(groupname) - 1] <= '9')
10920dad3f0eSMax Laier 		return (EINVAL);
10930dad3f0eSMax Laier 
10940dad3f0eSMax Laier 	IFNET_WLOCK();
10950dad3f0eSMax Laier 	TAILQ_FOREACH(ifgl, &ifp->if_groups, ifgl_next)
10960dad3f0eSMax Laier 		if (!strcmp(ifgl->ifgl_group->ifg_group, groupname)) {
10970dad3f0eSMax Laier 			IFNET_WUNLOCK();
10980dad3f0eSMax Laier 			return (EEXIST);
10990dad3f0eSMax Laier 		}
11000dad3f0eSMax Laier 
11010dad3f0eSMax Laier 	if ((ifgl = (struct ifg_list *)malloc(sizeof(struct ifg_list), M_TEMP,
11020dad3f0eSMax Laier 	    M_NOWAIT)) == NULL) {
11030dad3f0eSMax Laier 	    	IFNET_WUNLOCK();
11040dad3f0eSMax Laier 		return (ENOMEM);
11050dad3f0eSMax Laier 	}
11060dad3f0eSMax Laier 
11070dad3f0eSMax Laier 	if ((ifgm = (struct ifg_member *)malloc(sizeof(struct ifg_member),
11080dad3f0eSMax Laier 	    M_TEMP, M_NOWAIT)) == NULL) {
11090dad3f0eSMax Laier 		free(ifgl, M_TEMP);
11100dad3f0eSMax Laier 		IFNET_WUNLOCK();
11110dad3f0eSMax Laier 		return (ENOMEM);
11120dad3f0eSMax Laier 	}
11130dad3f0eSMax Laier 
1114603724d3SBjoern A. Zeeb 	TAILQ_FOREACH(ifg, &V_ifg_head, ifg_next)
11150dad3f0eSMax Laier 		if (!strcmp(ifg->ifg_group, groupname))
11160dad3f0eSMax Laier 			break;
11170dad3f0eSMax Laier 
11180dad3f0eSMax Laier 	if (ifg == NULL) {
11190dad3f0eSMax Laier 		if ((ifg = (struct ifg_group *)malloc(sizeof(struct ifg_group),
11200dad3f0eSMax Laier 		    M_TEMP, M_NOWAIT)) == NULL) {
11210dad3f0eSMax Laier 			free(ifgl, M_TEMP);
11220dad3f0eSMax Laier 			free(ifgm, M_TEMP);
11230dad3f0eSMax Laier 			IFNET_WUNLOCK();
11240dad3f0eSMax Laier 			return (ENOMEM);
11250dad3f0eSMax Laier 		}
11260dad3f0eSMax Laier 		strlcpy(ifg->ifg_group, groupname, sizeof(ifg->ifg_group));
11270dad3f0eSMax Laier 		ifg->ifg_refcnt = 0;
11280dad3f0eSMax Laier 		TAILQ_INIT(&ifg->ifg_members);
1129603724d3SBjoern A. Zeeb 		TAILQ_INSERT_TAIL(&V_ifg_head, ifg, ifg_next);
1130d6d3f01eSGleb Smirnoff 		new = 1;
11310dad3f0eSMax Laier 	}
11320dad3f0eSMax Laier 
11330dad3f0eSMax Laier 	ifg->ifg_refcnt++;
11340dad3f0eSMax Laier 	ifgl->ifgl_group = ifg;
11350dad3f0eSMax Laier 	ifgm->ifgm_ifp = ifp;
11360dad3f0eSMax Laier 
1137137f91e8SJohn Baldwin 	IF_ADDR_WLOCK(ifp);
11380dad3f0eSMax Laier 	TAILQ_INSERT_TAIL(&ifg->ifg_members, ifgm, ifgm_next);
11390dad3f0eSMax Laier 	TAILQ_INSERT_TAIL(&ifp->if_groups, ifgl, ifgl_next);
1140137f91e8SJohn Baldwin 	IF_ADDR_WUNLOCK(ifp);
11410dad3f0eSMax Laier 
11420dad3f0eSMax Laier 	IFNET_WUNLOCK();
11430dad3f0eSMax Laier 
1144d6d3f01eSGleb Smirnoff 	if (new)
1145d6d3f01eSGleb Smirnoff 		EVENTHANDLER_INVOKE(group_attach_event, ifg);
11460dad3f0eSMax Laier 	EVENTHANDLER_INVOKE(group_change_event, groupname);
11470dad3f0eSMax Laier 
11480dad3f0eSMax Laier 	return (0);
11490dad3f0eSMax Laier }
11500dad3f0eSMax Laier 
11510dad3f0eSMax Laier /*
11520dad3f0eSMax Laier  * Remove a group from an interface
11530dad3f0eSMax Laier  */
11540dad3f0eSMax Laier int
11550dad3f0eSMax Laier if_delgroup(struct ifnet *ifp, const char *groupname)
11560dad3f0eSMax Laier {
11570dad3f0eSMax Laier 	struct ifg_list		*ifgl;
11580dad3f0eSMax Laier 	struct ifg_member	*ifgm;
11590dad3f0eSMax Laier 
11600dad3f0eSMax Laier 	IFNET_WLOCK();
11610dad3f0eSMax Laier 	TAILQ_FOREACH(ifgl, &ifp->if_groups, ifgl_next)
11620dad3f0eSMax Laier 		if (!strcmp(ifgl->ifgl_group->ifg_group, groupname))
11630dad3f0eSMax Laier 			break;
11640dad3f0eSMax Laier 	if (ifgl == NULL) {
11650dad3f0eSMax Laier 		IFNET_WUNLOCK();
11660dad3f0eSMax Laier 		return (ENOENT);
11670dad3f0eSMax Laier 	}
11680dad3f0eSMax Laier 
1169137f91e8SJohn Baldwin 	IF_ADDR_WLOCK(ifp);
11700dad3f0eSMax Laier 	TAILQ_REMOVE(&ifp->if_groups, ifgl, ifgl_next);
1171137f91e8SJohn Baldwin 	IF_ADDR_WUNLOCK(ifp);
11720dad3f0eSMax Laier 
11730dad3f0eSMax Laier 	TAILQ_FOREACH(ifgm, &ifgl->ifgl_group->ifg_members, ifgm_next)
11740dad3f0eSMax Laier 		if (ifgm->ifgm_ifp == ifp)
11750dad3f0eSMax Laier 			break;
11760dad3f0eSMax Laier 
11770dad3f0eSMax Laier 	if (ifgm != NULL) {
11780dad3f0eSMax Laier 		TAILQ_REMOVE(&ifgl->ifgl_group->ifg_members, ifgm, ifgm_next);
11790dad3f0eSMax Laier 		free(ifgm, M_TEMP);
11800dad3f0eSMax Laier 	}
11810dad3f0eSMax Laier 
11820dad3f0eSMax Laier 	if (--ifgl->ifgl_group->ifg_refcnt == 0) {
1183603724d3SBjoern A. Zeeb 		TAILQ_REMOVE(&V_ifg_head, ifgl->ifgl_group, ifg_next);
1184d6d3f01eSGleb Smirnoff 		IFNET_WUNLOCK();
11850dad3f0eSMax Laier 		EVENTHANDLER_INVOKE(group_detach_event, ifgl->ifgl_group);
11860dad3f0eSMax Laier 		free(ifgl->ifgl_group, M_TEMP);
1187d6d3f01eSGleb Smirnoff 	} else
11880dad3f0eSMax Laier 		IFNET_WUNLOCK();
11890dad3f0eSMax Laier 
11900dad3f0eSMax Laier 	free(ifgl, M_TEMP);
11910dad3f0eSMax Laier 
11920dad3f0eSMax Laier 	EVENTHANDLER_INVOKE(group_change_event, groupname);
11930dad3f0eSMax Laier 
11940dad3f0eSMax Laier 	return (0);
11950dad3f0eSMax Laier }
11960dad3f0eSMax Laier 
11970dad3f0eSMax Laier /*
11988623f9fdSMax Laier  * Remove an interface from all groups
11998623f9fdSMax Laier  */
12008623f9fdSMax Laier static void
12018623f9fdSMax Laier if_delgroups(struct ifnet *ifp)
12028623f9fdSMax Laier {
12038623f9fdSMax Laier 	struct ifg_list		*ifgl;
12048623f9fdSMax Laier 	struct ifg_member	*ifgm;
12058623f9fdSMax Laier 	char groupname[IFNAMSIZ];
12068623f9fdSMax Laier 
12078623f9fdSMax Laier 	IFNET_WLOCK();
12088623f9fdSMax Laier 	while (!TAILQ_EMPTY(&ifp->if_groups)) {
12098623f9fdSMax Laier 		ifgl = TAILQ_FIRST(&ifp->if_groups);
12108623f9fdSMax Laier 
12118623f9fdSMax Laier 		strlcpy(groupname, ifgl->ifgl_group->ifg_group, IFNAMSIZ);
12128623f9fdSMax Laier 
1213137f91e8SJohn Baldwin 		IF_ADDR_WLOCK(ifp);
12148623f9fdSMax Laier 		TAILQ_REMOVE(&ifp->if_groups, ifgl, ifgl_next);
1215137f91e8SJohn Baldwin 		IF_ADDR_WUNLOCK(ifp);
12168623f9fdSMax Laier 
12178623f9fdSMax Laier 		TAILQ_FOREACH(ifgm, &ifgl->ifgl_group->ifg_members, ifgm_next)
12188623f9fdSMax Laier 			if (ifgm->ifgm_ifp == ifp)
12198623f9fdSMax Laier 				break;
12208623f9fdSMax Laier 
12218623f9fdSMax Laier 		if (ifgm != NULL) {
12228623f9fdSMax Laier 			TAILQ_REMOVE(&ifgl->ifgl_group->ifg_members, ifgm,
12238623f9fdSMax Laier 			    ifgm_next);
12248623f9fdSMax Laier 			free(ifgm, M_TEMP);
12258623f9fdSMax Laier 		}
12268623f9fdSMax Laier 
12278623f9fdSMax Laier 		if (--ifgl->ifgl_group->ifg_refcnt == 0) {
12288623f9fdSMax Laier 			TAILQ_REMOVE(&V_ifg_head, ifgl->ifgl_group, ifg_next);
1229d6d3f01eSGleb Smirnoff 			IFNET_WUNLOCK();
12308623f9fdSMax Laier 			EVENTHANDLER_INVOKE(group_detach_event,
12318623f9fdSMax Laier 			    ifgl->ifgl_group);
12328623f9fdSMax Laier 			free(ifgl->ifgl_group, M_TEMP);
1233d6d3f01eSGleb Smirnoff 		} else
12348623f9fdSMax Laier 			IFNET_WUNLOCK();
12358623f9fdSMax Laier 
12368623f9fdSMax Laier 		free(ifgl, M_TEMP);
12378623f9fdSMax Laier 
12388623f9fdSMax Laier 		EVENTHANDLER_INVOKE(group_change_event, groupname);
12398623f9fdSMax Laier 
12408623f9fdSMax Laier 		IFNET_WLOCK();
12418623f9fdSMax Laier 	}
12428623f9fdSMax Laier 	IFNET_WUNLOCK();
12438623f9fdSMax Laier }
12448623f9fdSMax Laier 
12458623f9fdSMax Laier /*
12460dad3f0eSMax Laier  * Stores all groups from an interface in memory pointed
12470dad3f0eSMax Laier  * to by data
12480dad3f0eSMax Laier  */
12490dad3f0eSMax Laier static int
12500dad3f0eSMax Laier if_getgroup(struct ifgroupreq *data, struct ifnet *ifp)
12510dad3f0eSMax Laier {
12520dad3f0eSMax Laier 	int			 len, error;
12530dad3f0eSMax Laier 	struct ifg_list		*ifgl;
12540dad3f0eSMax Laier 	struct ifg_req		 ifgrq, *ifgp;
12550dad3f0eSMax Laier 	struct ifgroupreq	*ifgr = data;
12560dad3f0eSMax Laier 
12570dad3f0eSMax Laier 	if (ifgr->ifgr_len == 0) {
1258137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
12590dad3f0eSMax Laier 		TAILQ_FOREACH(ifgl, &ifp->if_groups, ifgl_next)
12600dad3f0eSMax Laier 			ifgr->ifgr_len += sizeof(struct ifg_req);
1261137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
12620dad3f0eSMax Laier 		return (0);
12630dad3f0eSMax Laier 	}
12640dad3f0eSMax Laier 
12650dad3f0eSMax Laier 	len = ifgr->ifgr_len;
12660dad3f0eSMax Laier 	ifgp = ifgr->ifgr_groups;
12670dad3f0eSMax Laier 	/* XXX: wire */
1268137f91e8SJohn Baldwin 	IF_ADDR_RLOCK(ifp);
12690dad3f0eSMax Laier 	TAILQ_FOREACH(ifgl, &ifp->if_groups, ifgl_next) {
12700dad3f0eSMax Laier 		if (len < sizeof(ifgrq)) {
1271137f91e8SJohn Baldwin 			IF_ADDR_RUNLOCK(ifp);
12720dad3f0eSMax Laier 			return (EINVAL);
12730dad3f0eSMax Laier 		}
12740dad3f0eSMax Laier 		bzero(&ifgrq, sizeof ifgrq);
12750dad3f0eSMax Laier 		strlcpy(ifgrq.ifgrq_group, ifgl->ifgl_group->ifg_group,
12760dad3f0eSMax Laier 		    sizeof(ifgrq.ifgrq_group));
12770dad3f0eSMax Laier 		if ((error = copyout(&ifgrq, ifgp, sizeof(struct ifg_req)))) {
1278137f91e8SJohn Baldwin 		    	IF_ADDR_RUNLOCK(ifp);
12790dad3f0eSMax Laier 			return (error);
12800dad3f0eSMax Laier 		}
12810dad3f0eSMax Laier 		len -= sizeof(ifgrq);
12820dad3f0eSMax Laier 		ifgp++;
12830dad3f0eSMax Laier 	}
1284137f91e8SJohn Baldwin 	IF_ADDR_RUNLOCK(ifp);
12850dad3f0eSMax Laier 
12860dad3f0eSMax Laier 	return (0);
12870dad3f0eSMax Laier }
12880dad3f0eSMax Laier 
12890dad3f0eSMax Laier /*
12900dad3f0eSMax Laier  * Stores all members of a group in memory pointed to by data
12910dad3f0eSMax Laier  */
12920dad3f0eSMax Laier static int
12930dad3f0eSMax Laier if_getgroupmembers(struct ifgroupreq *data)
12940dad3f0eSMax Laier {
12950dad3f0eSMax Laier 	struct ifgroupreq	*ifgr = data;
12960dad3f0eSMax Laier 	struct ifg_group	*ifg;
12970dad3f0eSMax Laier 	struct ifg_member	*ifgm;
12980dad3f0eSMax Laier 	struct ifg_req		 ifgrq, *ifgp;
12990dad3f0eSMax Laier 	int			 len, error;
13000dad3f0eSMax Laier 
13010dad3f0eSMax Laier 	IFNET_RLOCK();
1302603724d3SBjoern A. Zeeb 	TAILQ_FOREACH(ifg, &V_ifg_head, ifg_next)
13030dad3f0eSMax Laier 		if (!strcmp(ifg->ifg_group, ifgr->ifgr_name))
13040dad3f0eSMax Laier 			break;
13050dad3f0eSMax Laier 	if (ifg == NULL) {
13060dad3f0eSMax Laier 		IFNET_RUNLOCK();
13070dad3f0eSMax Laier 		return (ENOENT);
13080dad3f0eSMax Laier 	}
13090dad3f0eSMax Laier 
13100dad3f0eSMax Laier 	if (ifgr->ifgr_len == 0) {
13110dad3f0eSMax Laier 		TAILQ_FOREACH(ifgm, &ifg->ifg_members, ifgm_next)
13120dad3f0eSMax Laier 			ifgr->ifgr_len += sizeof(ifgrq);
13130dad3f0eSMax Laier 		IFNET_RUNLOCK();
13140dad3f0eSMax Laier 		return (0);
13150dad3f0eSMax Laier 	}
13160dad3f0eSMax Laier 
13170dad3f0eSMax Laier 	len = ifgr->ifgr_len;
13180dad3f0eSMax Laier 	ifgp = ifgr->ifgr_groups;
13190dad3f0eSMax Laier 	TAILQ_FOREACH(ifgm, &ifg->ifg_members, ifgm_next) {
13200dad3f0eSMax Laier 		if (len < sizeof(ifgrq)) {
13210dad3f0eSMax Laier 			IFNET_RUNLOCK();
13220dad3f0eSMax Laier 			return (EINVAL);
13230dad3f0eSMax Laier 		}
13240dad3f0eSMax Laier 		bzero(&ifgrq, sizeof ifgrq);
13250dad3f0eSMax Laier 		strlcpy(ifgrq.ifgrq_member, ifgm->ifgm_ifp->if_xname,
13260dad3f0eSMax Laier 		    sizeof(ifgrq.ifgrq_member));
13270dad3f0eSMax Laier 		if ((error = copyout(&ifgrq, ifgp, sizeof(struct ifg_req)))) {
13280dad3f0eSMax Laier 			IFNET_RUNLOCK();
13290dad3f0eSMax Laier 			return (error);
13300dad3f0eSMax Laier 		}
13310dad3f0eSMax Laier 		len -= sizeof(ifgrq);
13320dad3f0eSMax Laier 		ifgp++;
13330dad3f0eSMax Laier 	}
13340dad3f0eSMax Laier 	IFNET_RUNLOCK();
13350dad3f0eSMax Laier 
13360dad3f0eSMax Laier 	return (0);
13370dad3f0eSMax Laier }
13380dad3f0eSMax Laier 
13390dad3f0eSMax Laier /*
13405500d3beSWarner Losh  * Delete Routes for a Network Interface
13415500d3beSWarner Losh  *
13425500d3beSWarner Losh  * Called for each routing entry via the rnh->rnh_walktree() call above
13435500d3beSWarner Losh  * to delete all route entries referencing a detaching network interface.
13445500d3beSWarner Losh  *
13455500d3beSWarner Losh  * Arguments:
13465500d3beSWarner Losh  *	rn	pointer to node in the routing table
13475500d3beSWarner Losh  *	arg	argument passed to rnh->rnh_walktree() - detaching interface
13485500d3beSWarner Losh  *
13495500d3beSWarner Losh  * Returns:
13505500d3beSWarner Losh  *	0	successful
13515500d3beSWarner Losh  *	errno	failed - reason indicated
13525500d3beSWarner Losh  *
13535500d3beSWarner Losh  */
13545500d3beSWarner Losh static int
135572fd1b6aSDag-Erling Smørgrav if_rtdel(struct radix_node *rn, void *arg)
13565500d3beSWarner Losh {
13575500d3beSWarner Losh 	struct rtentry	*rt = (struct rtentry *)rn;
13585500d3beSWarner Losh 	struct ifnet	*ifp = arg;
13595500d3beSWarner Losh 	int		err;
13605500d3beSWarner Losh 
13615500d3beSWarner Losh 	if (rt->rt_ifp == ifp) {
13625500d3beSWarner Losh 
13635500d3beSWarner Losh 		/*
13645500d3beSWarner Losh 		 * Protect (sorta) against walktree recursion problems
13655500d3beSWarner Losh 		 * with cloned routes
13665500d3beSWarner Losh 		 */
13675500d3beSWarner Losh 		if ((rt->rt_flags & RTF_UP) == 0)
13685500d3beSWarner Losh 			return (0);
13695500d3beSWarner Losh 
13708b07e49aSJulian Elischer 		err = rtrequest_fib(RTM_DELETE, rt_key(rt), rt->rt_gateway,
13713034f43fSAlexander V. Chernikov 				rt_mask(rt),
13723034f43fSAlexander V. Chernikov 				rt->rt_flags|RTF_RNH_LOCKED|RTF_PINNED,
13738b07e49aSJulian Elischer 				(struct rtentry **) NULL, rt->rt_fibnum);
13745500d3beSWarner Losh 		if (err) {
13755500d3beSWarner Losh 			log(LOG_WARNING, "if_rtdel: error %d\n", err);
13765500d3beSWarner Losh 		}
13775500d3beSWarner Losh 	}
13785500d3beSWarner Losh 
13795500d3beSWarner Losh 	return (0);
13806182fdbdSPeter Wemm }
13816182fdbdSPeter Wemm 
/*
 * Function wrappers around the struct ifnet address list locking
 * macros.  Kernel modules call these instead of the macros so that
 * they do not encode programming interface or binary interface
 * assumptions that may be violated when kernel-internal locking
 * approaches change.
 */

/* Acquire the interface address list read lock. */
void
if_addr_rlock(struct ifnet *ifp)
{
	IF_ADDR_RLOCK(ifp);
}
1394f9ef96caSRobert Watson 
/* Release the interface address list read lock. */
void
if_addr_runlock(struct ifnet *ifp)
{
	IF_ADDR_RUNLOCK(ifp);
}
1401f9ef96caSRobert Watson 
/*
 * Read-lock entry point for the "maddr" list; it takes the same
 * IF_ADDR read lock as if_addr_rlock().
 */
void
if_maddr_rlock(struct ifnet *ifp)
{
	IF_ADDR_RLOCK(ifp);
}
1408f9ef96caSRobert Watson 
/*
 * Read-unlock entry point for the "maddr" list; it drops the same
 * IF_ADDR read lock as if_addr_runlock().
 */
void
if_maddr_runlock(struct ifnet *ifp)
{
	IF_ADDR_RUNLOCK(ifp);
}
1415f9ef96caSRobert Watson 
1416f9ef96caSRobert Watson /*
1417e8aa8bddSGleb Smirnoff  * Initialization, destruction and refcounting functions for ifaddrs.
14181099f828SRobert Watson  */
141946758960SGleb Smirnoff struct ifaddr *
142046758960SGleb Smirnoff ifa_alloc(size_t size, int flags)
14211099f828SRobert Watson {
142246758960SGleb Smirnoff 	struct ifaddr *ifa;
142346758960SGleb Smirnoff 
142446758960SGleb Smirnoff 	KASSERT(size >= sizeof(struct ifaddr),
142546758960SGleb Smirnoff 	    ("%s: invalid size %zu", __func__, size));
142646758960SGleb Smirnoff 
142746758960SGleb Smirnoff 	ifa = malloc(size, M_IFADDR, M_ZERO | flags);
142846758960SGleb Smirnoff 	if (ifa == NULL)
142946758960SGleb Smirnoff 		return (NULL);
14301099f828SRobert Watson 
14317caf4ab7SGleb Smirnoff 	if ((ifa->ifa_opackets = counter_u64_alloc(flags)) == NULL)
14327caf4ab7SGleb Smirnoff 		goto fail;
14337caf4ab7SGleb Smirnoff 	if ((ifa->ifa_ipackets = counter_u64_alloc(flags)) == NULL)
14347caf4ab7SGleb Smirnoff 		goto fail;
14357caf4ab7SGleb Smirnoff 	if ((ifa->ifa_obytes = counter_u64_alloc(flags)) == NULL)
14367caf4ab7SGleb Smirnoff 		goto fail;
14377caf4ab7SGleb Smirnoff 	if ((ifa->ifa_ibytes = counter_u64_alloc(flags)) == NULL)
14387caf4ab7SGleb Smirnoff 		goto fail;
14397caf4ab7SGleb Smirnoff 
14401099f828SRobert Watson 	refcount_init(&ifa->ifa_refcnt, 1);
144146758960SGleb Smirnoff 
144246758960SGleb Smirnoff 	return (ifa);
14437caf4ab7SGleb Smirnoff 
14447caf4ab7SGleb Smirnoff fail:
14457caf4ab7SGleb Smirnoff 	/* free(NULL) is okay */
14467caf4ab7SGleb Smirnoff 	counter_u64_free(ifa->ifa_opackets);
14477caf4ab7SGleb Smirnoff 	counter_u64_free(ifa->ifa_ipackets);
14487caf4ab7SGleb Smirnoff 	counter_u64_free(ifa->ifa_obytes);
14497caf4ab7SGleb Smirnoff 	counter_u64_free(ifa->ifa_ibytes);
14507caf4ab7SGleb Smirnoff 	free(ifa, M_IFADDR);
14517caf4ab7SGleb Smirnoff 
14527caf4ab7SGleb Smirnoff 	return (NULL);
14531099f828SRobert Watson }
14541099f828SRobert Watson 
14551099f828SRobert Watson void
14561099f828SRobert Watson ifa_ref(struct ifaddr *ifa)
14571099f828SRobert Watson {
14581099f828SRobert Watson 
14591099f828SRobert Watson 	refcount_acquire(&ifa->ifa_refcnt);
14601099f828SRobert Watson }
14611099f828SRobert Watson 
14621099f828SRobert Watson void
14631099f828SRobert Watson ifa_free(struct ifaddr *ifa)
14641099f828SRobert Watson {
14651099f828SRobert Watson 
14661099f828SRobert Watson 	if (refcount_release(&ifa->ifa_refcnt)) {
14677caf4ab7SGleb Smirnoff 		counter_u64_free(ifa->ifa_opackets);
14687caf4ab7SGleb Smirnoff 		counter_u64_free(ifa->ifa_ipackets);
14697caf4ab7SGleb Smirnoff 		counter_u64_free(ifa->ifa_obytes);
14707caf4ab7SGleb Smirnoff 		counter_u64_free(ifa->ifa_ibytes);
14711099f828SRobert Watson 		free(ifa, M_IFADDR);
14721099f828SRobert Watson 	}
14731099f828SRobert Watson }
14741099f828SRobert Watson 
14759bb7d0f4SQing Li int
14769bb7d0f4SQing Li ifa_add_loopback_route(struct ifaddr *ifa, struct sockaddr *ia)
14779bb7d0f4SQing Li {
14789bb7d0f4SQing Li 	int error = 0;
14799bb7d0f4SQing Li 	struct rtentry *rt = NULL;
14809bb7d0f4SQing Li 	struct rt_addrinfo info;
14819bb7d0f4SQing Li 	static struct sockaddr_dl null_sdl = {sizeof(null_sdl), AF_LINK};
14829bb7d0f4SQing Li 
14839bb7d0f4SQing Li 	bzero(&info, sizeof(info));
14849bb7d0f4SQing Li 	info.rti_ifp = V_loif;
14859bb7d0f4SQing Li 	info.rti_flags = ifa->ifa_flags | RTF_HOST | RTF_STATIC;
14869bb7d0f4SQing Li 	info.rti_info[RTAX_DST] = ia;
14879bb7d0f4SQing Li 	info.rti_info[RTAX_GATEWAY] = (struct sockaddr *)&null_sdl;
14889bb7d0f4SQing Li 	error = rtrequest1_fib(RTM_ADD, &info, &rt, 0);
14899bb7d0f4SQing Li 
14909bb7d0f4SQing Li 	if (error == 0 && rt != NULL) {
14919bb7d0f4SQing Li 		RT_LOCK(rt);
14929bb7d0f4SQing Li 		((struct sockaddr_dl *)rt->rt_gateway)->sdl_type  =
149346e7f983SQing Li 			ifa->ifa_ifp->if_type;
14949bb7d0f4SQing Li 		((struct sockaddr_dl *)rt->rt_gateway)->sdl_index =
149546e7f983SQing Li 			ifa->ifa_ifp->if_index;
14969bb7d0f4SQing Li 		RT_REMREF(rt);
14979bb7d0f4SQing Li 		RT_UNLOCK(rt);
14989bb7d0f4SQing Li 	} else if (error != 0)
1499c0ba290bSGleb Smirnoff 		log(LOG_DEBUG, "%s: insertion failed: %u\n", __func__, error);
15009bb7d0f4SQing Li 
15019bb7d0f4SQing Li 	return (error);
15029bb7d0f4SQing Li }
15039bb7d0f4SQing Li 
15049bb7d0f4SQing Li int
15059bb7d0f4SQing Li ifa_del_loopback_route(struct ifaddr *ifa, struct sockaddr *ia)
15069bb7d0f4SQing Li {
15079bb7d0f4SQing Li 	int error = 0;
15089bb7d0f4SQing Li 	struct rt_addrinfo info;
15099bb7d0f4SQing Li 	struct sockaddr_dl null_sdl;
15109bb7d0f4SQing Li 
15119bb7d0f4SQing Li 	bzero(&null_sdl, sizeof(null_sdl));
15129bb7d0f4SQing Li 	null_sdl.sdl_len = sizeof(null_sdl);
15139bb7d0f4SQing Li 	null_sdl.sdl_family = AF_LINK;
15149bb7d0f4SQing Li 	null_sdl.sdl_type = ifa->ifa_ifp->if_type;
15159bb7d0f4SQing Li 	null_sdl.sdl_index = ifa->ifa_ifp->if_index;
15169bb7d0f4SQing Li 	bzero(&info, sizeof(info));
15179bb7d0f4SQing Li 	info.rti_flags = ifa->ifa_flags | RTF_HOST | RTF_STATIC;
15189bb7d0f4SQing Li 	info.rti_info[RTAX_DST] = ia;
15199bb7d0f4SQing Li 	info.rti_info[RTAX_GATEWAY] = (struct sockaddr *)&null_sdl;
15209bb7d0f4SQing Li 	error = rtrequest1_fib(RTM_DELETE, &info, NULL, 0);
15219bb7d0f4SQing Li 
15229bb7d0f4SQing Li 	if (error != 0)
1523c0ba290bSGleb Smirnoff 		log(LOG_DEBUG, "%s: deletion failed: %u\n", __func__, error);
15249bb7d0f4SQing Li 
15259bb7d0f4SQing Li 	return (error);
15269bb7d0f4SQing Li }
15279bb7d0f4SQing Li 
15289a6356bcSGleb Smirnoff int
15299a6356bcSGleb Smirnoff ifa_switch_loopback_route(struct ifaddr *ifa, struct sockaddr *sa)
15309a6356bcSGleb Smirnoff {
15319a6356bcSGleb Smirnoff 	struct rtentry *rt;
15329a6356bcSGleb Smirnoff 
15339a6356bcSGleb Smirnoff 	rt = rtalloc1_fib(sa, 0, 0, 0);
15349a6356bcSGleb Smirnoff 	if (rt == NULL) {
15359a6356bcSGleb Smirnoff 		log(LOG_DEBUG, "%s: fail", __func__);
15369a6356bcSGleb Smirnoff 		return (EHOSTUNREACH);
15379a6356bcSGleb Smirnoff 	}
15389a6356bcSGleb Smirnoff 	((struct sockaddr_dl *)rt->rt_gateway)->sdl_type =
15399a6356bcSGleb Smirnoff 	    ifa->ifa_ifp->if_type;
15409a6356bcSGleb Smirnoff 	((struct sockaddr_dl *)rt->rt_gateway)->sdl_index =
15419a6356bcSGleb Smirnoff 	    ifa->ifa_ifp->if_index;
15429a6356bcSGleb Smirnoff 	RTFREE_LOCKED(rt);
15439a6356bcSGleb Smirnoff 
15449a6356bcSGleb Smirnoff 	return (0);
15459a6356bcSGleb Smirnoff }
15469a6356bcSGleb Smirnoff 
/*
 * Socket address comparison helpers.
 *
 * sa_equal() compares two generic socket addresses byte for byte over
 * the length recorded in the first one.
 *
 * XXX: Because sockaddr_dl has deeper structure than the sockaddr
 * structs used to represent other address families, it needs a
 * different comparison: sa_dl_equal() requires equal total lengths and
 * then compares only the link-level address bytes, over the address
 * length recorded in the first argument.
 */
#define	sa_equal(x, y)							\
	(bcmp((x), (y), ((x))->sa_len) == 0)

#define	sa_dl_equal(x, y)						\
	((((struct sockaddr_dl *)(x))->sdl_len ==			\
	  ((struct sockaddr_dl *)(y))->sdl_len) &&			\
	 (bcmp(LLADDR((struct sockaddr_dl *)(x)),			\
	       LLADDR((struct sockaddr_dl *)(y)),			\
	       ((struct sockaddr_dl *)(x))->sdl_alen) == 0))
156219fc74fbSJeffrey Hsu 
156330aad87dSBrooks Davis /*
1564df8bae1dSRodney W. Grimes  * Locate an interface based on a complete address.
1565df8bae1dSRodney W. Grimes  */
1566df8bae1dSRodney W. Grimes /*ARGSUSED*/
15678896f83aSRobert Watson static struct ifaddr *
15688c0fec80SRobert Watson ifa_ifwithaddr_internal(struct sockaddr *addr, int getref)
1569df8bae1dSRodney W. Grimes {
15700b59d917SJonathan Lemon 	struct ifnet *ifp;
15710b59d917SJonathan Lemon 	struct ifaddr *ifa;
1572df8bae1dSRodney W. Grimes 
157377dfcdc4SRobert Watson 	IFNET_RLOCK_NOSLEEP();
1574ab5ed8a5SRobert Watson 	TAILQ_FOREACH(ifp, &V_ifnet, if_link) {
1575137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
157637d40066SPoul-Henning Kamp 		TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) {
1577df8bae1dSRodney W. Grimes 			if (ifa->ifa_addr->sa_family != addr->sa_family)
1578df8bae1dSRodney W. Grimes 				continue;
1579ab5ed8a5SRobert Watson 			if (sa_equal(addr, ifa->ifa_addr)) {
15808c0fec80SRobert Watson 				if (getref)
15818c0fec80SRobert Watson 					ifa_ref(ifa);
1582137f91e8SJohn Baldwin 				IF_ADDR_RUNLOCK(ifp);
15830b59d917SJonathan Lemon 				goto done;
1584ab5ed8a5SRobert Watson 			}
158582cd038dSYoshinobu Inoue 			/* IP6 doesn't have broadcast */
15860b59d917SJonathan Lemon 			if ((ifp->if_flags & IFF_BROADCAST) &&
15870b59d917SJonathan Lemon 			    ifa->ifa_broadaddr &&
158882cd038dSYoshinobu Inoue 			    ifa->ifa_broadaddr->sa_len != 0 &&
1589ab5ed8a5SRobert Watson 			    sa_equal(ifa->ifa_broadaddr, addr)) {
15908c0fec80SRobert Watson 				if (getref)
15918c0fec80SRobert Watson 					ifa_ref(ifa);
1592137f91e8SJohn Baldwin 				IF_ADDR_RUNLOCK(ifp);
15930b59d917SJonathan Lemon 				goto done;
15940b59d917SJonathan Lemon 			}
1595ab5ed8a5SRobert Watson 		}
1596137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
1597ab5ed8a5SRobert Watson 	}
15980b59d917SJonathan Lemon 	ifa = NULL;
15990b59d917SJonathan Lemon done:
160077dfcdc4SRobert Watson 	IFNET_RUNLOCK_NOSLEEP();
1601df8bae1dSRodney W. Grimes 	return (ifa);
1602df8bae1dSRodney W. Grimes }
16030b59d917SJonathan Lemon 
/*
 * Find the interface address matching 'addr'; the result, if any, is
 * returned with a reference held.
 */
struct ifaddr *
ifa_ifwithaddr(struct sockaddr *addr)
{
	struct ifaddr *found;

	found = ifa_ifwithaddr_internal(addr, 1);
	return (found);
}
16108896f83aSRobert Watson 
/*
 * Report whether some interface address matches 'addr'.  No reference
 * is taken; only the existence of a match is returned (1 or 0).
 */
int
ifa_ifwithaddr_check(struct sockaddr *addr)
{
	struct ifaddr *found;

	found = ifa_ifwithaddr_internal(addr, 0);
	return (found != NULL);
}
16178896f83aSRobert Watson 
1618df8bae1dSRodney W. Grimes /*
1619773725a2SAndre Oppermann  * Locate an interface based on the broadcast address.
1620773725a2SAndre Oppermann  */
1621773725a2SAndre Oppermann /* ARGSUSED */
1622773725a2SAndre Oppermann struct ifaddr *
1623773725a2SAndre Oppermann ifa_ifwithbroadaddr(struct sockaddr *addr)
1624773725a2SAndre Oppermann {
1625773725a2SAndre Oppermann 	struct ifnet *ifp;
1626773725a2SAndre Oppermann 	struct ifaddr *ifa;
1627773725a2SAndre Oppermann 
162877dfcdc4SRobert Watson 	IFNET_RLOCK_NOSLEEP();
1629ab5ed8a5SRobert Watson 	TAILQ_FOREACH(ifp, &V_ifnet, if_link) {
1630137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
1631773725a2SAndre Oppermann 		TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) {
1632773725a2SAndre Oppermann 			if (ifa->ifa_addr->sa_family != addr->sa_family)
1633773725a2SAndre Oppermann 				continue;
1634773725a2SAndre Oppermann 			if ((ifp->if_flags & IFF_BROADCAST) &&
1635773725a2SAndre Oppermann 			    ifa->ifa_broadaddr &&
1636773725a2SAndre Oppermann 			    ifa->ifa_broadaddr->sa_len != 0 &&
1637ab5ed8a5SRobert Watson 			    sa_equal(ifa->ifa_broadaddr, addr)) {
16388c0fec80SRobert Watson 				ifa_ref(ifa);
1639137f91e8SJohn Baldwin 				IF_ADDR_RUNLOCK(ifp);
1640773725a2SAndre Oppermann 				goto done;
1641773725a2SAndre Oppermann 			}
1642ab5ed8a5SRobert Watson 		}
1643137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
1644ab5ed8a5SRobert Watson 	}
1645773725a2SAndre Oppermann 	ifa = NULL;
1646773725a2SAndre Oppermann done:
164777dfcdc4SRobert Watson 	IFNET_RUNLOCK_NOSLEEP();
1648773725a2SAndre Oppermann 	return (ifa);
1649773725a2SAndre Oppermann }
1650773725a2SAndre Oppermann 
1651773725a2SAndre Oppermann /*
1652df8bae1dSRodney W. Grimes  * Locate the point to point interface with a given destination address.
1653df8bae1dSRodney W. Grimes  */
1654df8bae1dSRodney W. Grimes /*ARGSUSED*/
1655df8bae1dSRodney W. Grimes struct ifaddr *
165672fd1b6aSDag-Erling Smørgrav ifa_ifwithdstaddr(struct sockaddr *addr)
1657df8bae1dSRodney W. Grimes {
16580b59d917SJonathan Lemon 	struct ifnet *ifp;
16590b59d917SJonathan Lemon 	struct ifaddr *ifa;
1660df8bae1dSRodney W. Grimes 
166177dfcdc4SRobert Watson 	IFNET_RLOCK_NOSLEEP();
1662603724d3SBjoern A. Zeeb 	TAILQ_FOREACH(ifp, &V_ifnet, if_link) {
16630b59d917SJonathan Lemon 		if ((ifp->if_flags & IFF_POINTOPOINT) == 0)
16640b59d917SJonathan Lemon 			continue;
1665137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
166637d40066SPoul-Henning Kamp 		TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) {
1667df8bae1dSRodney W. Grimes 			if (ifa->ifa_addr->sa_family != addr->sa_family)
1668df8bae1dSRodney W. Grimes 				continue;
1669f0c04221SBjoern A. Zeeb 			if (ifa->ifa_dstaddr != NULL &&
1670ab5ed8a5SRobert Watson 			    sa_equal(addr, ifa->ifa_dstaddr)) {
16718c0fec80SRobert Watson 				ifa_ref(ifa);
1672137f91e8SJohn Baldwin 				IF_ADDR_RUNLOCK(ifp);
16730b59d917SJonathan Lemon 				goto done;
1674df8bae1dSRodney W. Grimes 			}
16750b59d917SJonathan Lemon 		}
1676137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
1677ab5ed8a5SRobert Watson 	}
16780b59d917SJonathan Lemon 	ifa = NULL;
16790b59d917SJonathan Lemon done:
168077dfcdc4SRobert Watson 	IFNET_RUNLOCK_NOSLEEP();
16810b59d917SJonathan Lemon 	return (ifa);
1682df8bae1dSRodney W. Grimes }
1683df8bae1dSRodney W. Grimes 
1684df8bae1dSRodney W. Grimes /*
1685df8bae1dSRodney W. Grimes  * Find an interface on a specific network.  If many, choice
1686df8bae1dSRodney W. Grimes  * is most specific found.
1687df8bae1dSRodney W. Grimes  */
1688df8bae1dSRodney W. Grimes struct ifaddr *
16890ed6142bSQing Li ifa_ifwithnet(struct sockaddr *addr, int ignore_ptp)
1690df8bae1dSRodney W. Grimes {
169172fd1b6aSDag-Erling Smørgrav 	struct ifnet *ifp;
169272fd1b6aSDag-Erling Smørgrav 	struct ifaddr *ifa;
16938c0fec80SRobert Watson 	struct ifaddr *ifa_maybe = NULL;
1694df8bae1dSRodney W. Grimes 	u_int af = addr->sa_family;
1695df8bae1dSRodney W. Grimes 	char *addr_data = addr->sa_data, *cplim;
1696df8bae1dSRodney W. Grimes 
16977e2a6151SJulian Elischer 	/*
16987e2a6151SJulian Elischer 	 * AF_LINK addresses can be looked up directly by their index number,
16997e2a6151SJulian Elischer 	 * so do that if we can.
17007e2a6151SJulian Elischer 	 */
1701df8bae1dSRodney W. Grimes 	if (af == AF_LINK) {
1702d1dd20beSSam Leffler 	    struct sockaddr_dl *sdl = (struct sockaddr_dl *)addr;
1703603724d3SBjoern A. Zeeb 	    if (sdl->sdl_index && sdl->sdl_index <= V_if_index)
1704f9132cebSJonathan Lemon 		return (ifaddr_byindex(sdl->sdl_index));
1705df8bae1dSRodney W. Grimes 	}
17067e2a6151SJulian Elischer 
17077e2a6151SJulian Elischer 	/*
17088c0fec80SRobert Watson 	 * Scan though each interface, looking for ones that have addresses
17098c0fec80SRobert Watson 	 * in this address family.  Maintain a reference on ifa_maybe once
1710137f91e8SJohn Baldwin 	 * we find one, as we release the IF_ADDR_RLOCK() that kept it stable
17118c0fec80SRobert Watson 	 * when we move onto the next interface.
17127e2a6151SJulian Elischer 	 */
171377dfcdc4SRobert Watson 	IFNET_RLOCK_NOSLEEP();
1714603724d3SBjoern A. Zeeb 	TAILQ_FOREACH(ifp, &V_ifnet, if_link) {
1715137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
171637d40066SPoul-Henning Kamp 		TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) {
171772fd1b6aSDag-Erling Smørgrav 			char *cp, *cp2, *cp3;
1718df8bae1dSRodney W. Grimes 
1719523a02aaSDavid Greenman 			if (ifa->ifa_addr->sa_family != af)
1720df8bae1dSRodney W. Grimes next:				continue;
17210ed6142bSQing Li 			if (af == AF_INET &&
17220ed6142bSQing Li 			    ifp->if_flags & IFF_POINTOPOINT && !ignore_ptp) {
17237e2a6151SJulian Elischer 				/*
17247e2a6151SJulian Elischer 				 * This is a bit broken as it doesn't
17257e2a6151SJulian Elischer 				 * take into account that the remote end may
17267e2a6151SJulian Elischer 				 * be a single node in the network we are
17277e2a6151SJulian Elischer 				 * looking for.
17287e2a6151SJulian Elischer 				 * The trouble is that we don't know the
17297e2a6151SJulian Elischer 				 * netmask for the remote end.
17307e2a6151SJulian Elischer 				 */
1731f0c04221SBjoern A. Zeeb 				if (ifa->ifa_dstaddr != NULL &&
1732ab5ed8a5SRobert Watson 				    sa_equal(addr, ifa->ifa_dstaddr)) {
17338c0fec80SRobert Watson 					ifa_ref(ifa);
1734137f91e8SJohn Baldwin 					IF_ADDR_RUNLOCK(ifp);
17350b59d917SJonathan Lemon 					goto done;
1736ab5ed8a5SRobert Watson 				}
17373740e2adSDavid Greenman 			} else {
17387e2a6151SJulian Elischer 				/*
17397ed8f465SJulian Elischer 				 * if we have a special address handler,
17407ed8f465SJulian Elischer 				 * then use it instead of the generic one.
17417ed8f465SJulian Elischer 				 */
17427ed8f465SJulian Elischer 				if (ifa->ifa_claim_addr) {
1743ab5ed8a5SRobert Watson 					if ((*ifa->ifa_claim_addr)(ifa, addr)) {
17448c0fec80SRobert Watson 						ifa_ref(ifa);
1745137f91e8SJohn Baldwin 						IF_ADDR_RUNLOCK(ifp);
17460b59d917SJonathan Lemon 						goto done;
1747ab5ed8a5SRobert Watson 					}
17487ed8f465SJulian Elischer 					continue;
17497ed8f465SJulian Elischer 				}
17507ed8f465SJulian Elischer 
17517ed8f465SJulian Elischer 				/*
17527e2a6151SJulian Elischer 				 * Scan all the bits in the ifa's address.
17537e2a6151SJulian Elischer 				 * If a bit dissagrees with what we are
17547e2a6151SJulian Elischer 				 * looking for, mask it with the netmask
17557e2a6151SJulian Elischer 				 * to see if it really matters.
17567e2a6151SJulian Elischer 				 * (A byte at a time)
17577e2a6151SJulian Elischer 				 */
1758523a02aaSDavid Greenman 				if (ifa->ifa_netmask == 0)
1759523a02aaSDavid Greenman 					continue;
1760df8bae1dSRodney W. Grimes 				cp = addr_data;
1761df8bae1dSRodney W. Grimes 				cp2 = ifa->ifa_addr->sa_data;
1762df8bae1dSRodney W. Grimes 				cp3 = ifa->ifa_netmask->sa_data;
17637e2a6151SJulian Elischer 				cplim = ifa->ifa_netmask->sa_len
17647e2a6151SJulian Elischer 					+ (char *)ifa->ifa_netmask;
1765df8bae1dSRodney W. Grimes 				while (cp3 < cplim)
1766df8bae1dSRodney W. Grimes 					if ((*cp++ ^ *cp2++) & *cp3++)
17677e2a6151SJulian Elischer 						goto next; /* next address! */
17687e2a6151SJulian Elischer 				/*
17697e2a6151SJulian Elischer 				 * If the netmask of what we just found
17707e2a6151SJulian Elischer 				 * is more specific than what we had before
177124421c1cSGleb Smirnoff 				 * (if we had one), or if the virtual status
177224421c1cSGleb Smirnoff 				 * of new prefix is better than of the old one,
177324421c1cSGleb Smirnoff 				 * then remember the new one before continuing
177424421c1cSGleb Smirnoff 				 * to search for an even better one.
17757e2a6151SJulian Elischer 				 */
17768c0fec80SRobert Watson 				if (ifa_maybe == NULL ||
177724421c1cSGleb Smirnoff 				    ifa_preferred(ifa_maybe, ifa) ||
1778df8bae1dSRodney W. Grimes 				    rn_refines((caddr_t)ifa->ifa_netmask,
17798c0fec80SRobert Watson 				    (caddr_t)ifa_maybe->ifa_netmask)) {
17808c0fec80SRobert Watson 					if (ifa_maybe != NULL)
17818c0fec80SRobert Watson 						ifa_free(ifa_maybe);
1782df8bae1dSRodney W. Grimes 					ifa_maybe = ifa;
17838c0fec80SRobert Watson 					ifa_ref(ifa_maybe);
17848c0fec80SRobert Watson 				}
1785df8bae1dSRodney W. Grimes 			}
1786b2af64fdSDavid Greenman 		}
1787137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
1788b2af64fdSDavid Greenman 	}
17890b59d917SJonathan Lemon 	ifa = ifa_maybe;
17908c0fec80SRobert Watson 	ifa_maybe = NULL;
17910b59d917SJonathan Lemon done:
179277dfcdc4SRobert Watson 	IFNET_RUNLOCK_NOSLEEP();
17938c0fec80SRobert Watson 	if (ifa_maybe != NULL)
17948c0fec80SRobert Watson 		ifa_free(ifa_maybe);
17950b59d917SJonathan Lemon 	return (ifa);
1796df8bae1dSRodney W. Grimes }
1797df8bae1dSRodney W. Grimes 
1798df8bae1dSRodney W. Grimes /*
1799df8bae1dSRodney W. Grimes  * Find an interface address specific to an interface best matching
1800df8bae1dSRodney W. Grimes  * a given address.
1801df8bae1dSRodney W. Grimes  */
1802df8bae1dSRodney W. Grimes struct ifaddr *
180372fd1b6aSDag-Erling Smørgrav ifaof_ifpforaddr(struct sockaddr *addr, struct ifnet *ifp)
1804df8bae1dSRodney W. Grimes {
180572fd1b6aSDag-Erling Smørgrav 	struct ifaddr *ifa;
180672fd1b6aSDag-Erling Smørgrav 	char *cp, *cp2, *cp3;
180772fd1b6aSDag-Erling Smørgrav 	char *cplim;
18088c0fec80SRobert Watson 	struct ifaddr *ifa_maybe = NULL;
1809df8bae1dSRodney W. Grimes 	u_int af = addr->sa_family;
1810df8bae1dSRodney W. Grimes 
1811df8bae1dSRodney W. Grimes 	if (af >= AF_MAX)
1812cd292f12SBjoern A. Zeeb 		return (NULL);
1813137f91e8SJohn Baldwin 	IF_ADDR_RLOCK(ifp);
181437d40066SPoul-Henning Kamp 	TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) {
1815df8bae1dSRodney W. Grimes 		if (ifa->ifa_addr->sa_family != af)
1816df8bae1dSRodney W. Grimes 			continue;
18178c0fec80SRobert Watson 		if (ifa_maybe == NULL)
1818df8bae1dSRodney W. Grimes 			ifa_maybe = ifa;
1819df8bae1dSRodney W. Grimes 		if (ifa->ifa_netmask == 0) {
1820d8d5b10eSRobert Watson 			if (sa_equal(addr, ifa->ifa_addr) ||
1821d8d5b10eSRobert Watson 			    (ifa->ifa_dstaddr &&
1822d8d5b10eSRobert Watson 			    sa_equal(addr, ifa->ifa_dstaddr)))
18232defe5cdSJonathan Lemon 				goto done;
1824df8bae1dSRodney W. Grimes 			continue;
1825df8bae1dSRodney W. Grimes 		}
1826b2af64fdSDavid Greenman 		if (ifp->if_flags & IFF_POINTOPOINT) {
1827d8d5b10eSRobert Watson 			if (sa_equal(addr, ifa->ifa_dstaddr))
1828a8637146SJonathan Lemon 				goto done;
18293740e2adSDavid Greenman 		} else {
1830df8bae1dSRodney W. Grimes 			cp = addr->sa_data;
1831df8bae1dSRodney W. Grimes 			cp2 = ifa->ifa_addr->sa_data;
1832df8bae1dSRodney W. Grimes 			cp3 = ifa->ifa_netmask->sa_data;
1833df8bae1dSRodney W. Grimes 			cplim = ifa->ifa_netmask->sa_len + (char *)ifa->ifa_netmask;
1834df8bae1dSRodney W. Grimes 			for (; cp3 < cplim; cp3++)
1835df8bae1dSRodney W. Grimes 				if ((*cp++ ^ *cp2++) & *cp3)
1836df8bae1dSRodney W. Grimes 					break;
1837df8bae1dSRodney W. Grimes 			if (cp3 == cplim)
18382defe5cdSJonathan Lemon 				goto done;
1839df8bae1dSRodney W. Grimes 		}
1840b2af64fdSDavid Greenman 	}
1841f9132cebSJonathan Lemon 	ifa = ifa_maybe;
1842f9132cebSJonathan Lemon done:
18438c0fec80SRobert Watson 	if (ifa != NULL)
18448c0fec80SRobert Watson 		ifa_ref(ifa);
1845137f91e8SJohn Baldwin 	IF_ADDR_RUNLOCK(ifp);
1846f9132cebSJonathan Lemon 	return (ifa);
1847df8bae1dSRodney W. Grimes }
1848df8bae1dSRodney W. Grimes 
184924421c1cSGleb Smirnoff /*
185024421c1cSGleb Smirnoff  * See whether new ifa is better than current one:
185124421c1cSGleb Smirnoff  * 1) A non-virtual one is preferred over virtual.
185224421c1cSGleb Smirnoff  * 2) A virtual in master state preferred over any other state.
185324421c1cSGleb Smirnoff  *
185424421c1cSGleb Smirnoff  * Used in several address selecting functions.
185524421c1cSGleb Smirnoff  */
185624421c1cSGleb Smirnoff int
185724421c1cSGleb Smirnoff ifa_preferred(struct ifaddr *cur, struct ifaddr *next)
185824421c1cSGleb Smirnoff {
185924421c1cSGleb Smirnoff 
186024421c1cSGleb Smirnoff 	return (cur->ifa_carp && (!next->ifa_carp ||
186124421c1cSGleb Smirnoff 	    ((*carp_master_p)(next) && !(*carp_master_p)(cur))));
186224421c1cSGleb Smirnoff }
186324421c1cSGleb Smirnoff 
18646e6b3f7cSQing Li #include <net/if_llatbl.h>
18656e6b3f7cSQing Li 
1866df8bae1dSRodney W. Grimes /*
1867df8bae1dSRodney W. Grimes  * Default action when installing a route with a Link Level gateway.
1868df8bae1dSRodney W. Grimes  * Lookup an appropriate real ifa to point to.
1869df8bae1dSRodney W. Grimes  * This should be moved to /sys/net/link.c eventually.
1870df8bae1dSRodney W. Grimes  */
18713bda9f9bSPoul-Henning Kamp static void
187272fd1b6aSDag-Erling Smørgrav link_rtrequest(int cmd, struct rtentry *rt, struct rt_addrinfo *info)
1873df8bae1dSRodney W. Grimes {
187472fd1b6aSDag-Erling Smørgrav 	struct ifaddr *ifa, *oifa;
1875df8bae1dSRodney W. Grimes 	struct sockaddr *dst;
1876df8bae1dSRodney W. Grimes 	struct ifnet *ifp;
1877df8bae1dSRodney W. Grimes 
1878d1dd20beSSam Leffler 	RT_LOCK_ASSERT(rt);
1879d1dd20beSSam Leffler 
1880df8bae1dSRodney W. Grimes 	if (cmd != RTM_ADD || ((ifa = rt->rt_ifa) == 0) ||
1881df8bae1dSRodney W. Grimes 	    ((ifp = ifa->ifa_ifp) == 0) || ((dst = rt_key(rt)) == 0))
1882df8bae1dSRodney W. Grimes 		return;
18839448326fSPoul-Henning Kamp 	ifa = ifaof_ifpforaddr(dst, ifp);
18849448326fSPoul-Henning Kamp 	if (ifa) {
1885d1dd20beSSam Leffler 		oifa = rt->rt_ifa;
1886df8bae1dSRodney W. Grimes 		rt->rt_ifa = ifa;
18871099f828SRobert Watson 		ifa_free(oifa);
1888df8bae1dSRodney W. Grimes 		if (ifa->ifa_rtrequest && ifa->ifa_rtrequest != link_rtrequest)
18898071913dSRuslan Ermilov 			ifa->ifa_rtrequest(cmd, rt, info);
1890df8bae1dSRodney W. Grimes 	}
1891df8bae1dSRodney W. Grimes }
1892df8bae1dSRodney W. Grimes 
1893df8bae1dSRodney W. Grimes /*
1894df8bae1dSRodney W. Grimes  * Mark an interface down and notify protocols of
1895df8bae1dSRodney W. Grimes  * the transition.
1896df8bae1dSRodney W. Grimes  */
18978614fb12SMax Laier static void
189872fd1b6aSDag-Erling Smørgrav if_unroute(struct ifnet *ifp, int flag, int fam)
1899df8bae1dSRodney W. Grimes {
190072fd1b6aSDag-Erling Smørgrav 	struct ifaddr *ifa;
1901df8bae1dSRodney W. Grimes 
1902292ee7beSRobert Watson 	KASSERT(flag == IFF_UP, ("if_unroute: flag != IFF_UP"));
1903292ee7beSRobert Watson 
1904e8c2601dSPoul-Henning Kamp 	ifp->if_flags &= ~flag;
190598b9590eSPoul-Henning Kamp 	getmicrotime(&ifp->if_lastchange);
1906e8c2601dSPoul-Henning Kamp 	TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link)
1907e8c2601dSPoul-Henning Kamp 		if (fam == PF_UNSPEC || (fam == ifa->ifa_addr->sa_family))
1908df8bae1dSRodney W. Grimes 			pfctlinput(PRC_IFDOWN, ifa->ifa_addr);
1909db7f0b97SKip Macy 	ifp->if_qflush(ifp);
1910db7f0b97SKip Macy 
1911a9771948SGleb Smirnoff 	if (ifp->if_carp)
191254bfbd51SWill Andrews 		(*carp_linkstate_p)(ifp);
1913df8bae1dSRodney W. Grimes 	rt_ifmsg(ifp);
1914df8bae1dSRodney W. Grimes }
1915df8bae1dSRodney W. Grimes 
1916df8bae1dSRodney W. Grimes /*
1917df8bae1dSRodney W. Grimes  * Mark an interface up and notify protocols of
1918df8bae1dSRodney W. Grimes  * the transition.
1919df8bae1dSRodney W. Grimes  */
19208614fb12SMax Laier static void
192172fd1b6aSDag-Erling Smørgrav if_route(struct ifnet *ifp, int flag, int fam)
1922df8bae1dSRodney W. Grimes {
192372fd1b6aSDag-Erling Smørgrav 	struct ifaddr *ifa;
1924df8bae1dSRodney W. Grimes 
1925292ee7beSRobert Watson 	KASSERT(flag == IFF_UP, ("if_route: flag != IFF_UP"));
1926292ee7beSRobert Watson 
1927e8c2601dSPoul-Henning Kamp 	ifp->if_flags |= flag;
192898b9590eSPoul-Henning Kamp 	getmicrotime(&ifp->if_lastchange);
1929e8c2601dSPoul-Henning Kamp 	TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link)
1930e8c2601dSPoul-Henning Kamp 		if (fam == PF_UNSPEC || (fam == ifa->ifa_addr->sa_family))
1931df8bae1dSRodney W. Grimes 			pfctlinput(PRC_IFUP, ifa->ifa_addr);
1932a9771948SGleb Smirnoff 	if (ifp->if_carp)
193354bfbd51SWill Andrews 		(*carp_linkstate_p)(ifp);
1934df8bae1dSRodney W. Grimes 	rt_ifmsg(ifp);
193582cd038dSYoshinobu Inoue #ifdef INET6
193682cd038dSYoshinobu Inoue 	in6_if_up(ifp);
193782cd038dSYoshinobu Inoue #endif
1938df8bae1dSRodney W. Grimes }
1939df8bae1dSRodney W. Grimes 
/*
 * Function-pointer hooks for VLAN support.  They are defined here without
 * an initializer; vlan_link_state_p is called from do_link_state_change()
 * when the interface has a vlan trunk attached.
 */
/* XXX: private from if_vlan */
void	(*vlan_link_state_p)(struct ifnet *);
/* XXX: private from if_vlan */
void	(*vlan_trunk_cap_p)(struct ifnet *);
struct ifnet	*(*vlan_trunkdev_p)(struct ifnet *);
struct ifnet	*(*vlan_devat_p)(struct ifnet *, uint16_t);
int	(*vlan_tag_p)(struct ifnet *, uint16_t *);
int	(*vlan_setcookie_p)(struct ifnet *, void *);
void	*(*vlan_cookie_p)(struct ifnet *);
194794f5c9cfSSam Leffler 
194894f5c9cfSSam Leffler /*
194968a3482fSGleb Smirnoff  * Handle a change in the interface link state. To avoid LORs
195068a3482fSGleb Smirnoff  * between driver lock and upper layer locks, as well as possible
195168a3482fSGleb Smirnoff  * recursions, we post event to taskqueue, and all job
195268a3482fSGleb Smirnoff  * is done in static do_link_state_change().
195394f5c9cfSSam Leffler  */
195494f5c9cfSSam Leffler void
195594f5c9cfSSam Leffler if_link_state_change(struct ifnet *ifp, int link_state)
195694f5c9cfSSam Leffler {
19574d96314fSGleb Smirnoff 	/* Return if state hasn't changed. */
19584d96314fSGleb Smirnoff 	if (ifp->if_link_state == link_state)
19594d96314fSGleb Smirnoff 		return;
19604d96314fSGleb Smirnoff 
196194f5c9cfSSam Leffler 	ifp->if_link_state = link_state;
19624d96314fSGleb Smirnoff 
196368a3482fSGleb Smirnoff 	taskqueue_enqueue(taskqueue_swi, &ifp->if_linktask);
196468a3482fSGleb Smirnoff }
196568a3482fSGleb Smirnoff 
196668a3482fSGleb Smirnoff static void
196768a3482fSGleb Smirnoff do_link_state_change(void *arg, int pending)
196868a3482fSGleb Smirnoff {
196968a3482fSGleb Smirnoff 	struct ifnet *ifp = (struct ifnet *)arg;
197068a3482fSGleb Smirnoff 	int link_state = ifp->if_link_state;
19718b615593SMarko Zec 	CURVNET_SET(ifp->if_vnet);
197268a3482fSGleb Smirnoff 
19734d96314fSGleb Smirnoff 	/* Notify that the link state has changed. */
197494f5c9cfSSam Leffler 	rt_ifmsg(ifp);
197575ee267cSGleb Smirnoff 	if (ifp->if_vlantrunk != NULL)
1976a6fffd6cSBrooks Davis 		(*vlan_link_state_p)(ifp);
19771c7899c7SGleb Smirnoff 
19781c7899c7SGleb Smirnoff 	if ((ifp->if_type == IFT_ETHER || ifp->if_type == IFT_L2VLAN) &&
19791c7899c7SGleb Smirnoff 	    IFP2AC(ifp)->ac_netgraph != NULL)
19801c7899c7SGleb Smirnoff 		(*ng_ether_link_state_p)(ifp, link_state);
19814d96314fSGleb Smirnoff 	if (ifp->if_carp)
198254bfbd51SWill Andrews 		(*carp_linkstate_p)(ifp);
1983ddf32010SAndrew Thompson 	if (ifp->if_bridge)
19847702d401SAndrew Thompson 		(*bridge_linkstate_p)(ifp);
1985ddf32010SAndrew Thompson 	if (ifp->if_lagg)
198618242d3bSAndrew Thompson 		(*lagg_linkstate_p)(ifp, link_state);
19878f867517SAndrew Thompson 
198821ca7b57SMarko Zec 	if (IS_DEFAULT_VNET(curvnet))
19899d80a330SBrooks Davis 		devctl_notify("IFNET", ifp->if_xname,
199021ca7b57SMarko Zec 		    (link_state == LINK_STATE_UP) ? "LINK_UP" : "LINK_DOWN",
199121ca7b57SMarko Zec 		    NULL);
199268a3482fSGleb Smirnoff 	if (pending > 1)
199368a3482fSGleb Smirnoff 		if_printf(ifp, "%d link states coalesced\n", pending);
19945515c2e7SGleb Smirnoff 	if (log_link_state_change)
19958b02df24SGleb Smirnoff 		log(LOG_NOTICE, "%s: link state changed to %s\n", ifp->if_xname,
19968b02df24SGleb Smirnoff 		    (link_state == LINK_STATE_UP) ? "UP" : "DOWN" );
1997e4cd31ddSJeff Roberson 	EVENTHANDLER_INVOKE(ifnet_link_event, ifp, ifp->if_link_state);
19988b615593SMarko Zec 	CURVNET_RESTORE();
199994f5c9cfSSam Leffler }
200094f5c9cfSSam Leffler 
2001df8bae1dSRodney W. Grimes /*
2002e8c2601dSPoul-Henning Kamp  * Mark an interface down and notify protocols of
2003e8c2601dSPoul-Henning Kamp  * the transition.
2004e8c2601dSPoul-Henning Kamp  */
2005e8c2601dSPoul-Henning Kamp void
200672fd1b6aSDag-Erling Smørgrav if_down(struct ifnet *ifp)
2007e8c2601dSPoul-Henning Kamp {
2008e8c2601dSPoul-Henning Kamp 
2009e8c2601dSPoul-Henning Kamp 	if_unroute(ifp, IFF_UP, AF_UNSPEC);
2010e8c2601dSPoul-Henning Kamp }
2011e8c2601dSPoul-Henning Kamp 
2012e8c2601dSPoul-Henning Kamp /*
2013e8c2601dSPoul-Henning Kamp  * Mark an interface up and notify protocols of
2014e8c2601dSPoul-Henning Kamp  * the transition.
2015e8c2601dSPoul-Henning Kamp  */
2016e8c2601dSPoul-Henning Kamp void
201772fd1b6aSDag-Erling Smørgrav if_up(struct ifnet *ifp)
2018e8c2601dSPoul-Henning Kamp {
2019e8c2601dSPoul-Henning Kamp 
2020e8c2601dSPoul-Henning Kamp 	if_route(ifp, IFF_UP, AF_UNSPEC);
2021e8c2601dSPoul-Henning Kamp }
2022e8c2601dSPoul-Henning Kamp 
2023e8c2601dSPoul-Henning Kamp /*
2024df8bae1dSRodney W. Grimes  * Flush an interface queue.
2025df8bae1dSRodney W. Grimes  */
20267cc5b47fSKip Macy void
2027db7f0b97SKip Macy if_qflush(struct ifnet *ifp)
2028df8bae1dSRodney W. Grimes {
202972fd1b6aSDag-Erling Smørgrav 	struct mbuf *m, *n;
2030db7f0b97SKip Macy 	struct ifaltq *ifq;
2031df8bae1dSRodney W. Grimes 
2032db7f0b97SKip Macy 	ifq = &ifp->if_snd;
20337b21048cSMax Laier 	IFQ_LOCK(ifq);
203402b199f1SMax Laier #ifdef ALTQ
203502b199f1SMax Laier 	if (ALTQ_IS_ENABLED(ifq))
203602b199f1SMax Laier 		ALTQ_PURGE(ifq);
203702b199f1SMax Laier #endif
2038df8bae1dSRodney W. Grimes 	n = ifq->ifq_head;
20399448326fSPoul-Henning Kamp 	while ((m = n) != 0) {
2040df8bae1dSRodney W. Grimes 		n = m->m_act;
2041df8bae1dSRodney W. Grimes 		m_freem(m);
2042df8bae1dSRodney W. Grimes 	}
2043df8bae1dSRodney W. Grimes 	ifq->ifq_head = 0;
2044df8bae1dSRodney W. Grimes 	ifq->ifq_tail = 0;
2045df8bae1dSRodney W. Grimes 	ifq->ifq_len = 0;
20467b21048cSMax Laier 	IFQ_UNLOCK(ifq);
2047df8bae1dSRodney W. Grimes }
2048df8bae1dSRodney W. Grimes 
2049df8bae1dSRodney W. Grimes /*
20506064c5d3SRobert Watson  * Map interface name to interface structure pointer, with or without
20516064c5d3SRobert Watson  * returning a reference.
2052df8bae1dSRodney W. Grimes  */
2053df8bae1dSRodney W. Grimes struct ifnet *
20546064c5d3SRobert Watson ifunit_ref(const char *name)
20556064c5d3SRobert Watson {
20566064c5d3SRobert Watson 	struct ifnet *ifp;
20576064c5d3SRobert Watson 
205877dfcdc4SRobert Watson 	IFNET_RLOCK_NOSLEEP();
20596064c5d3SRobert Watson 	TAILQ_FOREACH(ifp, &V_ifnet, if_link) {
20608bd015a1SRobert Watson 		if (strncmp(name, ifp->if_xname, IFNAMSIZ) == 0 &&
20618bd015a1SRobert Watson 		    !(ifp->if_flags & IFF_DYING))
20626064c5d3SRobert Watson 			break;
20636064c5d3SRobert Watson 	}
20646064c5d3SRobert Watson 	if (ifp != NULL)
20656064c5d3SRobert Watson 		if_ref(ifp);
206677dfcdc4SRobert Watson 	IFNET_RUNLOCK_NOSLEEP();
20676064c5d3SRobert Watson 	return (ifp);
20686064c5d3SRobert Watson }
20696064c5d3SRobert Watson 
20706064c5d3SRobert Watson struct ifnet *
207130aad87dSBrooks Davis ifunit(const char *name)
2072df8bae1dSRodney W. Grimes {
20738b7805e4SBoris Popov 	struct ifnet *ifp;
2074df8bae1dSRodney W. Grimes 
207577dfcdc4SRobert Watson 	IFNET_RLOCK_NOSLEEP();
2076603724d3SBjoern A. Zeeb 	TAILQ_FOREACH(ifp, &V_ifnet, if_link) {
207736c19a57SBrooks Davis 		if (strncmp(name, ifp->if_xname, IFNAMSIZ) == 0)
2078df8bae1dSRodney W. Grimes 			break;
2079df8bae1dSRodney W. Grimes 	}
208077dfcdc4SRobert Watson 	IFNET_RUNLOCK_NOSLEEP();
2081df8bae1dSRodney W. Grimes 	return (ifp);
2082df8bae1dSRodney W. Grimes }
2083df8bae1dSRodney W. Grimes 
208482cd038dSYoshinobu Inoue /*
2085f13ad206SJonathan Lemon  * Hardware specific interface ioctls.
2086df8bae1dSRodney W. Grimes  */
2087f13ad206SJonathan Lemon static int
2088f13ad206SJonathan Lemon ifhwioctl(u_long cmd, struct ifnet *ifp, caddr_t data, struct thread *td)
2089df8bae1dSRodney W. Grimes {
2090f13ad206SJonathan Lemon 	struct ifreq *ifr;
2091413dd0baSPoul-Henning Kamp 	struct ifstat *ifs;
2092f13ad206SJonathan Lemon 	int error = 0;
2093292ee7beSRobert Watson 	int new_flags, temp_flags;
209436c19a57SBrooks Davis 	size_t namelen, onamelen;
2095215940b3SXin LI 	size_t descrlen;
2096215940b3SXin LI 	char *descrbuf, *odescrbuf;
209736c19a57SBrooks Davis 	char new_name[IFNAMSIZ];
209836c19a57SBrooks Davis 	struct ifaddr *ifa;
209936c19a57SBrooks Davis 	struct sockaddr_dl *sdl;
2100df8bae1dSRodney W. Grimes 
2101df8bae1dSRodney W. Grimes 	ifr = (struct ifreq *)data;
210230aad87dSBrooks Davis 	switch (cmd) {
2103de593450SJonathan Lemon 	case SIOCGIFINDEX:
2104de593450SJonathan Lemon 		ifr->ifr_index = ifp->if_index;
2105de593450SJonathan Lemon 		break;
2106de593450SJonathan Lemon 
2107df8bae1dSRodney W. Grimes 	case SIOCGIFFLAGS:
2108292ee7beSRobert Watson 		temp_flags = ifp->if_flags | ifp->if_drv_flags;
2109292ee7beSRobert Watson 		ifr->ifr_flags = temp_flags & 0xffff;
2110292ee7beSRobert Watson 		ifr->ifr_flagshigh = temp_flags >> 16;
2111df8bae1dSRodney W. Grimes 		break;
2112df8bae1dSRodney W. Grimes 
2113016da741SJonathan Lemon 	case SIOCGIFCAP:
2114016da741SJonathan Lemon 		ifr->ifr_reqcap = ifp->if_capabilities;
2115016da741SJonathan Lemon 		ifr->ifr_curcap = ifp->if_capenable;
2116016da741SJonathan Lemon 		break;
2117016da741SJonathan Lemon 
21188f293a63SRobert Watson #ifdef MAC
21198f293a63SRobert Watson 	case SIOCGIFMAC:
212030d239bcSRobert Watson 		error = mac_ifnet_ioctl_get(td->td_ucred, ifr, ifp);
21218f293a63SRobert Watson 		break;
21228f293a63SRobert Watson #endif
21238f293a63SRobert Watson 
2124df8bae1dSRodney W. Grimes 	case SIOCGIFMETRIC:
2125df8bae1dSRodney W. Grimes 		ifr->ifr_metric = ifp->if_metric;
2126df8bae1dSRodney W. Grimes 		break;
2127df8bae1dSRodney W. Grimes 
2128a7028af7SDavid Greenman 	case SIOCGIFMTU:
2129a7028af7SDavid Greenman 		ifr->ifr_mtu = ifp->if_mtu;
2130a7028af7SDavid Greenman 		break;
2131a7028af7SDavid Greenman 
2132074c4a4eSGarrett Wollman 	case SIOCGIFPHYS:
2133074c4a4eSGarrett Wollman 		ifr->ifr_phys = ifp->if_physical;
2134074c4a4eSGarrett Wollman 		break;
2135074c4a4eSGarrett Wollman 
2136215940b3SXin LI 	case SIOCGIFDESCR:
2137215940b3SXin LI 		error = 0;
2138215940b3SXin LI 		sx_slock(&ifdescr_sx);
213957d84848SXin LI 		if (ifp->if_description == NULL)
2140215940b3SXin LI 			error = ENOMSG;
214157d84848SXin LI 		else {
2142215940b3SXin LI 			/* space for terminating nul */
2143215940b3SXin LI 			descrlen = strlen(ifp->if_description) + 1;
2144215940b3SXin LI 			if (ifr->ifr_buffer.length < descrlen)
214557d84848SXin LI 				ifr->ifr_buffer.buffer = NULL;
2146215940b3SXin LI 			else
2147215940b3SXin LI 				error = copyout(ifp->if_description,
2148215940b3SXin LI 				    ifr->ifr_buffer.buffer, descrlen);
2149215940b3SXin LI 			ifr->ifr_buffer.length = descrlen;
2150215940b3SXin LI 		}
2151215940b3SXin LI 		sx_sunlock(&ifdescr_sx);
2152215940b3SXin LI 		break;
2153215940b3SXin LI 
2154215940b3SXin LI 	case SIOCSIFDESCR:
2155215940b3SXin LI 		error = priv_check(td, PRIV_NET_SETIFDESCR);
2156215940b3SXin LI 		if (error)
2157215940b3SXin LI 			return (error);
2158215940b3SXin LI 
2159215940b3SXin LI 		/*
2160215940b3SXin LI 		 * Copy only (length-1) bytes to make sure that
2161215940b3SXin LI 		 * if_description is always nul terminated.  The
2162215940b3SXin LI 		 * length parameter is supposed to count the
2163215940b3SXin LI 		 * terminating nul in.
2164215940b3SXin LI 		 */
2165215940b3SXin LI 		if (ifr->ifr_buffer.length > ifdescr_maxlen)
2166215940b3SXin LI 			return (ENAMETOOLONG);
2167215940b3SXin LI 		else if (ifr->ifr_buffer.length == 0)
2168215940b3SXin LI 			descrbuf = NULL;
2169215940b3SXin LI 		else {
2170215940b3SXin LI 			descrbuf = malloc(ifr->ifr_buffer.length, M_IFDESCR,
2171215940b3SXin LI 			    M_WAITOK | M_ZERO);
2172215940b3SXin LI 			error = copyin(ifr->ifr_buffer.buffer, descrbuf,
2173215940b3SXin LI 			    ifr->ifr_buffer.length - 1);
2174215940b3SXin LI 			if (error) {
2175215940b3SXin LI 				free(descrbuf, M_IFDESCR);
2176215940b3SXin LI 				break;
2177215940b3SXin LI 			}
2178215940b3SXin LI 		}
2179215940b3SXin LI 
2180215940b3SXin LI 		sx_xlock(&ifdescr_sx);
2181215940b3SXin LI 		odescrbuf = ifp->if_description;
2182215940b3SXin LI 		ifp->if_description = descrbuf;
2183215940b3SXin LI 		sx_xunlock(&ifdescr_sx);
2184215940b3SXin LI 
2185215940b3SXin LI 		getmicrotime(&ifp->if_lastchange);
2186215940b3SXin LI 		free(odescrbuf, M_IFDESCR);
2187215940b3SXin LI 		break;
2188215940b3SXin LI 
218935fd7bc0SBjoern A. Zeeb 	case SIOCGIFFIB:
219035fd7bc0SBjoern A. Zeeb 		ifr->ifr_fib = ifp->if_fib;
219135fd7bc0SBjoern A. Zeeb 		break;
219235fd7bc0SBjoern A. Zeeb 
219335fd7bc0SBjoern A. Zeeb 	case SIOCSIFFIB:
219435fd7bc0SBjoern A. Zeeb 		error = priv_check(td, PRIV_NET_SETIFFIB);
219535fd7bc0SBjoern A. Zeeb 		if (error)
219635fd7bc0SBjoern A. Zeeb 			return (error);
219735fd7bc0SBjoern A. Zeeb 		if (ifr->ifr_fib >= rt_numfibs)
219835fd7bc0SBjoern A. Zeeb 			return (EINVAL);
219935fd7bc0SBjoern A. Zeeb 
220035fd7bc0SBjoern A. Zeeb 		ifp->if_fib = ifr->ifr_fib;
220135fd7bc0SBjoern A. Zeeb 		break;
220235fd7bc0SBjoern A. Zeeb 
2203df8bae1dSRodney W. Grimes 	case SIOCSIFFLAGS:
2204acd3428bSRobert Watson 		error = priv_check(td, PRIV_NET_SETIFFLAGS);
22059448326fSPoul-Henning Kamp 		if (error)
2206df8bae1dSRodney W. Grimes 			return (error);
2207292ee7beSRobert Watson 		/*
2208292ee7beSRobert Watson 		 * Currently, no driver owned flags pass the IFF_CANTCHANGE
2209292ee7beSRobert Watson 		 * check, so we don't need special handling here yet.
2210292ee7beSRobert Watson 		 */
221162f76486SMaxim Sobolev 		new_flags = (ifr->ifr_flags & 0xffff) |
221262f76486SMaxim Sobolev 		    (ifr->ifr_flagshigh << 16);
2213*af50ea38SGleb Smirnoff 		if (ifp->if_flags & IFF_UP &&
221462f76486SMaxim Sobolev 		    (new_flags & IFF_UP) == 0) {
2215df8bae1dSRodney W. Grimes 			if_down(ifp);
221662f76486SMaxim Sobolev 		} else if (new_flags & IFF_UP &&
2217cf4b9371SPoul-Henning Kamp 		    (ifp->if_flags & IFF_UP) == 0) {
2218df8bae1dSRodney W. Grimes 			if_up(ifp);
2219df8bae1dSRodney W. Grimes 		}
22207aebc5e8SYaroslav Tykhiy 		/* See if permanently promiscuous mode bit is about to flip */
22217aebc5e8SYaroslav Tykhiy 		if ((ifp->if_flags ^ new_flags) & IFF_PPROMISC) {
22227aebc5e8SYaroslav Tykhiy 			if (new_flags & IFF_PPROMISC)
22237aebc5e8SYaroslav Tykhiy 				ifp->if_flags |= IFF_PROMISC;
22247aebc5e8SYaroslav Tykhiy 			else if (ifp->if_pcount == 0)
22257aebc5e8SYaroslav Tykhiy 				ifp->if_flags &= ~IFF_PROMISC;
22267aebc5e8SYaroslav Tykhiy 			log(LOG_INFO, "%s: permanently promiscuous mode %s\n",
22277aebc5e8SYaroslav Tykhiy 			    ifp->if_xname,
22287aebc5e8SYaroslav Tykhiy 			    (new_flags & IFF_PPROMISC) ? "enabled" : "disabled");
22297aebc5e8SYaroslav Tykhiy 		}
2230df8bae1dSRodney W. Grimes 		ifp->if_flags = (ifp->if_flags & IFF_CANTCHANGE) |
223162f76486SMaxim Sobolev 			(new_flags &~ IFF_CANTCHANGE);
223231302ebfSRobert Watson 		if (ifp->if_ioctl) {
2233df8bae1dSRodney W. Grimes 			(void) (*ifp->if_ioctl)(ifp, cmd, data);
223431302ebfSRobert Watson 		}
223598b9590eSPoul-Henning Kamp 		getmicrotime(&ifp->if_lastchange);
2236df8bae1dSRodney W. Grimes 		break;
2237df8bae1dSRodney W. Grimes 
2238016da741SJonathan Lemon 	case SIOCSIFCAP:
2239acd3428bSRobert Watson 		error = priv_check(td, PRIV_NET_SETIFCAP);
2240016da741SJonathan Lemon 		if (error)
2241016da741SJonathan Lemon 			return (error);
2242efb4018bSYaroslav Tykhiy 		if (ifp->if_ioctl == NULL)
2243efb4018bSYaroslav Tykhiy 			return (EOPNOTSUPP);
2244016da741SJonathan Lemon 		if (ifr->ifr_reqcap & ~ifp->if_capabilities)
2245016da741SJonathan Lemon 			return (EINVAL);
2246efb4018bSYaroslav Tykhiy 		error = (*ifp->if_ioctl)(ifp, cmd, data);
2247efb4018bSYaroslav Tykhiy 		if (error == 0)
2248efb4018bSYaroslav Tykhiy 			getmicrotime(&ifp->if_lastchange);
2249016da741SJonathan Lemon 		break;
2250016da741SJonathan Lemon 
22518f293a63SRobert Watson #ifdef MAC
22528f293a63SRobert Watson 	case SIOCSIFMAC:
225330d239bcSRobert Watson 		error = mac_ifnet_ioctl_set(td->td_ucred, ifr, ifp);
22548f293a63SRobert Watson 		break;
22558f293a63SRobert Watson #endif
22568f293a63SRobert Watson 
225736c19a57SBrooks Davis 	case SIOCSIFNAME:
2258acd3428bSRobert Watson 		error = priv_check(td, PRIV_NET_SETIFNAME);
2259acd3428bSRobert Watson 		if (error)
226036c19a57SBrooks Davis 			return (error);
226136c19a57SBrooks Davis 		error = copyinstr(ifr->ifr_data, new_name, IFNAMSIZ, NULL);
2262bc1470f1SBrooks Davis 		if (error != 0)
226336c19a57SBrooks Davis 			return (error);
2264bc1470f1SBrooks Davis 		if (new_name[0] == '\0')
2265bc1470f1SBrooks Davis 			return (EINVAL);
226636c19a57SBrooks Davis 		if (ifunit(new_name) != NULL)
226736c19a57SBrooks Davis 			return (EEXIST);
226836c19a57SBrooks Davis 
22695428776eSJohn Baldwin 		/*
22705428776eSJohn Baldwin 		 * XXX: Locking.  Nothing else seems to lock if_flags,
22715428776eSJohn Baldwin 		 * and there are numerous other races with the
22725428776eSJohn Baldwin 		 * ifunit() checks not being atomic with namespace
22735428776eSJohn Baldwin 		 * changes (renames, vmoves, if_attach, etc).
22745428776eSJohn Baldwin 		 */
22755428776eSJohn Baldwin 		ifp->if_flags |= IFF_RENAMING;
22765428776eSJohn Baldwin 
227736c19a57SBrooks Davis 		/* Announce the departure of the interface. */
227836c19a57SBrooks Davis 		rt_ifannouncemsg(ifp, IFAN_DEPARTURE);
227952023244SMax Laier 		EVENTHANDLER_INVOKE(ifnet_departure_event, ifp);
228036c19a57SBrooks Davis 
228171672bb6SBrooks Davis 		log(LOG_INFO, "%s: changing name to '%s'\n",
228271672bb6SBrooks Davis 		    ifp->if_xname, new_name);
228371672bb6SBrooks Davis 
228467420bdaSGleb Smirnoff 		IF_ADDR_WLOCK(ifp);
228536c19a57SBrooks Davis 		strlcpy(ifp->if_xname, new_name, sizeof(ifp->if_xname));
22864a0d6638SRuslan Ermilov 		ifa = ifp->if_addr;
228736c19a57SBrooks Davis 		sdl = (struct sockaddr_dl *)ifa->ifa_addr;
228836c19a57SBrooks Davis 		namelen = strlen(new_name);
228936c19a57SBrooks Davis 		onamelen = sdl->sdl_nlen;
229036c19a57SBrooks Davis 		/*
229136c19a57SBrooks Davis 		 * Move the address if needed.  This is safe because we
229236c19a57SBrooks Davis 		 * allocate space for a name of length IFNAMSIZ when we
229336c19a57SBrooks Davis 		 * create this in if_attach().
229436c19a57SBrooks Davis 		 */
229536c19a57SBrooks Davis 		if (namelen != onamelen) {
229636c19a57SBrooks Davis 			bcopy(sdl->sdl_data + onamelen,
229736c19a57SBrooks Davis 			    sdl->sdl_data + namelen, sdl->sdl_alen);
229836c19a57SBrooks Davis 		}
229936c19a57SBrooks Davis 		bcopy(new_name, sdl->sdl_data, namelen);
230036c19a57SBrooks Davis 		sdl->sdl_nlen = namelen;
230136c19a57SBrooks Davis 		sdl = (struct sockaddr_dl *)ifa->ifa_netmask;
230236c19a57SBrooks Davis 		bzero(sdl->sdl_data, onamelen);
230336c19a57SBrooks Davis 		while (namelen != 0)
230436c19a57SBrooks Davis 			sdl->sdl_data[--namelen] = 0xff;
230567420bdaSGleb Smirnoff 		IF_ADDR_WUNLOCK(ifp);
230636c19a57SBrooks Davis 
230725a4adceSMax Laier 		EVENTHANDLER_INVOKE(ifnet_arrival_event, ifp);
230836c19a57SBrooks Davis 		/* Announce the return of the interface. */
230936c19a57SBrooks Davis 		rt_ifannouncemsg(ifp, IFAN_ARRIVAL);
23105428776eSJohn Baldwin 
23115428776eSJohn Baldwin 		ifp->if_flags &= ~IFF_RENAMING;
231236c19a57SBrooks Davis 		break;
231336c19a57SBrooks Davis 
2314679e1390SJamie Gritton #ifdef VIMAGE
2315679e1390SJamie Gritton 	case SIOCSIFVNET:
2316679e1390SJamie Gritton 		error = priv_check(td, PRIV_NET_SETIFVNET);
2317679e1390SJamie Gritton 		if (error)
2318679e1390SJamie Gritton 			return (error);
2319be31e5e7SBjoern A. Zeeb 		error = if_vmove_loan(td, ifp, ifr->ifr_name, ifr->ifr_jid);
2320679e1390SJamie Gritton 		break;
2321679e1390SJamie Gritton #endif
2322679e1390SJamie Gritton 
2323df8bae1dSRodney W. Grimes 	case SIOCSIFMETRIC:
2324acd3428bSRobert Watson 		error = priv_check(td, PRIV_NET_SETIFMETRIC);
23259448326fSPoul-Henning Kamp 		if (error)
2326df8bae1dSRodney W. Grimes 			return (error);
2327df8bae1dSRodney W. Grimes 		ifp->if_metric = ifr->ifr_metric;
232898b9590eSPoul-Henning Kamp 		getmicrotime(&ifp->if_lastchange);
2329df8bae1dSRodney W. Grimes 		break;
2330df8bae1dSRodney W. Grimes 
2331074c4a4eSGarrett Wollman 	case SIOCSIFPHYS:
2332acd3428bSRobert Watson 		error = priv_check(td, PRIV_NET_SETIFPHYS);
2333e39a0280SGary Palmer 		if (error)
2334913e410eSYaroslav Tykhiy 			return (error);
2335913e410eSYaroslav Tykhiy 		if (ifp->if_ioctl == NULL)
2336913e410eSYaroslav Tykhiy 			return (EOPNOTSUPP);
2337e39a0280SGary Palmer 		error = (*ifp->if_ioctl)(ifp, cmd, data);
2338e39a0280SGary Palmer 		if (error == 0)
233998b9590eSPoul-Henning Kamp 			getmicrotime(&ifp->if_lastchange);
2340913e410eSYaroslav Tykhiy 		break;
2341074c4a4eSGarrett Wollman 
2342a7028af7SDavid Greenman 	case SIOCSIFMTU:
234382cd038dSYoshinobu Inoue 	{
234482cd038dSYoshinobu Inoue 		u_long oldmtu = ifp->if_mtu;
234582cd038dSYoshinobu Inoue 
2346acd3428bSRobert Watson 		error = priv_check(td, PRIV_NET_SETIFMTU);
23479448326fSPoul-Henning Kamp 		if (error)
2348a7028af7SDavid Greenman 			return (error);
2349aab3beeeSBrian Somers 		if (ifr->ifr_mtu < IF_MINMTU || ifr->ifr_mtu > IF_MAXMTU)
235075ee03cbSDavid Greenman 			return (EINVAL);
2351f13ad206SJonathan Lemon 		if (ifp->if_ioctl == NULL)
2352f13ad206SJonathan Lemon 			return (EOPNOTSUPP);
2353e39a0280SGary Palmer 		error = (*ifp->if_ioctl)(ifp, cmd, data);
235448f71763SRuslan Ermilov 		if (error == 0) {
235598b9590eSPoul-Henning Kamp 			getmicrotime(&ifp->if_lastchange);
235648f71763SRuslan Ermilov 			rt_ifmsg(ifp);
235748f71763SRuslan Ermilov 		}
235882cd038dSYoshinobu Inoue 		/*
235982cd038dSYoshinobu Inoue 		 * If the link MTU changed, do network layer specific procedure.
236082cd038dSYoshinobu Inoue 		 */
236182cd038dSYoshinobu Inoue 		if (ifp->if_mtu != oldmtu) {
236282cd038dSYoshinobu Inoue #ifdef INET6
236382cd038dSYoshinobu Inoue 			nd6_setmtu(ifp);
236482cd038dSYoshinobu Inoue #endif
236582cd038dSYoshinobu Inoue 		}
2366f13ad206SJonathan Lemon 		break;
236782cd038dSYoshinobu Inoue 	}
2368a7028af7SDavid Greenman 
2369df8bae1dSRodney W. Grimes 	case SIOCADDMULTI:
2370df8bae1dSRodney W. Grimes 	case SIOCDELMULTI:
2371acd3428bSRobert Watson 		if (cmd == SIOCADDMULTI)
2372acd3428bSRobert Watson 			error = priv_check(td, PRIV_NET_ADDMULTI);
2373acd3428bSRobert Watson 		else
2374acd3428bSRobert Watson 			error = priv_check(td, PRIV_NET_DELMULTI);
23759448326fSPoul-Henning Kamp 		if (error)
2376df8bae1dSRodney W. Grimes 			return (error);
2377477180fbSGarrett Wollman 
2378477180fbSGarrett Wollman 		/* Don't allow group membership on non-multicast interfaces. */
2379477180fbSGarrett Wollman 		if ((ifp->if_flags & IFF_MULTICAST) == 0)
2380f13ad206SJonathan Lemon 			return (EOPNOTSUPP);
2381477180fbSGarrett Wollman 
2382477180fbSGarrett Wollman 		/* Don't let users screw up protocols' entries. */
2383477180fbSGarrett Wollman 		if (ifr->ifr_addr.sa_family != AF_LINK)
2384f13ad206SJonathan Lemon 			return (EINVAL);
2385477180fbSGarrett Wollman 
2386477180fbSGarrett Wollman 		if (cmd == SIOCADDMULTI) {
2387477180fbSGarrett Wollman 			struct ifmultiaddr *ifma;
2388ec002feeSBruce M Simpson 
2389ec002feeSBruce M Simpson 			/*
2390ec002feeSBruce M Simpson 			 * Userland is only permitted to join groups once
2391ec002feeSBruce M Simpson 			 * via the if_addmulti() KPI, because it cannot hold
2392ec002feeSBruce M Simpson 			 * struct ifmultiaddr * between calls. It may also
2393ec002feeSBruce M Simpson 			 * lose a race while we check if the membership
2394ec002feeSBruce M Simpson 			 * already exists.
2395ec002feeSBruce M Simpson 			 */
2396137f91e8SJohn Baldwin 			IF_ADDR_RLOCK(ifp);
2397ec002feeSBruce M Simpson 			ifma = if_findmulti(ifp, &ifr->ifr_addr);
2398137f91e8SJohn Baldwin 			IF_ADDR_RUNLOCK(ifp);
2399ec002feeSBruce M Simpson 			if (ifma != NULL)
2400ec002feeSBruce M Simpson 				error = EADDRINUSE;
2401ec002feeSBruce M Simpson 			else
2402477180fbSGarrett Wollman 				error = if_addmulti(ifp, &ifr->ifr_addr, &ifma);
2403477180fbSGarrett Wollman 		} else {
2404477180fbSGarrett Wollman 			error = if_delmulti(ifp, &ifr->ifr_addr);
2405477180fbSGarrett Wollman 		}
2406e39a0280SGary Palmer 		if (error == 0)
240798b9590eSPoul-Henning Kamp 			getmicrotime(&ifp->if_lastchange);
2408f13ad206SJonathan Lemon 		break;
2409df8bae1dSRodney W. Grimes 
241041b3e8e5SJun-ichiro itojun Hagino 	case SIOCSIFPHYADDR:
241141b3e8e5SJun-ichiro itojun Hagino 	case SIOCDIFPHYADDR:
241241b3e8e5SJun-ichiro itojun Hagino #ifdef INET6
241341b3e8e5SJun-ichiro itojun Hagino 	case SIOCSIFPHYADDR_IN6:
241441b3e8e5SJun-ichiro itojun Hagino #endif
241533841545SHajimu UMEMOTO 	case SIOCSLIFPHYADDR:
2416a912e453SPeter Wemm 	case SIOCSIFMEDIA:
2417d7189ec6SJoerg Wunsch 	case SIOCSIFGENERIC:
2418acd3428bSRobert Watson 		error = priv_check(td, PRIV_NET_HWIOCTL);
2419a912e453SPeter Wemm 		if (error)
2420a912e453SPeter Wemm 			return (error);
2421f13ad206SJonathan Lemon 		if (ifp->if_ioctl == NULL)
2422a912e453SPeter Wemm 			return (EOPNOTSUPP);
2423a912e453SPeter Wemm 		error = (*ifp->if_ioctl)(ifp, cmd, data);
2424a912e453SPeter Wemm 		if (error == 0)
242598b9590eSPoul-Henning Kamp 			getmicrotime(&ifp->if_lastchange);
2426f13ad206SJonathan Lemon 		break;
2427a912e453SPeter Wemm 
2428413dd0baSPoul-Henning Kamp 	case SIOCGIFSTATUS:
2429413dd0baSPoul-Henning Kamp 		ifs = (struct ifstat *)data;
2430413dd0baSPoul-Henning Kamp 		ifs->ascii[0] = '\0';
2431413dd0baSPoul-Henning Kamp 
243233841545SHajimu UMEMOTO 	case SIOCGIFPSRCADDR:
243333841545SHajimu UMEMOTO 	case SIOCGIFPDSTADDR:
243433841545SHajimu UMEMOTO 	case SIOCGLIFPHYADDR:
2435a912e453SPeter Wemm 	case SIOCGIFMEDIA:
2436d7189ec6SJoerg Wunsch 	case SIOCGIFGENERIC:
2437913e410eSYaroslav Tykhiy 		if (ifp->if_ioctl == NULL)
2438a912e453SPeter Wemm 			return (EOPNOTSUPP);
2439f13ad206SJonathan Lemon 		error = (*ifp->if_ioctl)(ifp, cmd, data);
2440f13ad206SJonathan Lemon 		break;
2441a912e453SPeter Wemm 
2442b106252cSBill Paul 	case SIOCSIFLLADDR:
2443acd3428bSRobert Watson 		error = priv_check(td, PRIV_NET_SETLLADDR);
2444b106252cSBill Paul 		if (error)
2445b106252cSBill Paul 			return (error);
2446f13ad206SJonathan Lemon 		error = if_setlladdr(ifp,
244766ce51ceSArchie Cobbs 		    ifr->ifr_addr.sa_data, ifr->ifr_addr.sa_len);
2448ea4ca115SAndrew Thompson 		EVENTHANDLER_INVOKE(iflladdr_event, ifp);
2449f13ad206SJonathan Lemon 		break;
245066ce51ceSArchie Cobbs 
24510dad3f0eSMax Laier 	case SIOCAIFGROUP:
24520dad3f0eSMax Laier 	{
24530dad3f0eSMax Laier 		struct ifgroupreq *ifgr = (struct ifgroupreq *)ifr;
24540dad3f0eSMax Laier 
2455acd3428bSRobert Watson 		error = priv_check(td, PRIV_NET_ADDIFGROUP);
24560dad3f0eSMax Laier 		if (error)
24570dad3f0eSMax Laier 			return (error);
24580dad3f0eSMax Laier 		if ((error = if_addgroup(ifp, ifgr->ifgr_group)))
24590dad3f0eSMax Laier 			return (error);
24600dad3f0eSMax Laier 		break;
24610dad3f0eSMax Laier 	}
24620dad3f0eSMax Laier 
24630dad3f0eSMax Laier 	case SIOCGIFGROUP:
24640dad3f0eSMax Laier 		if ((error = if_getgroup((struct ifgroupreq *)ifr, ifp)))
24650dad3f0eSMax Laier 			return (error);
24660dad3f0eSMax Laier 		break;
24670dad3f0eSMax Laier 
24680dad3f0eSMax Laier 	case SIOCDIFGROUP:
24690dad3f0eSMax Laier 	{
24700dad3f0eSMax Laier 		struct ifgroupreq *ifgr = (struct ifgroupreq *)ifr;
24710dad3f0eSMax Laier 
2472acd3428bSRobert Watson 		error = priv_check(td, PRIV_NET_DELIFGROUP);
24730dad3f0eSMax Laier 		if (error)
24740dad3f0eSMax Laier 			return (error);
24750dad3f0eSMax Laier 		if ((error = if_delgroup(ifp, ifgr->ifgr_group)))
24760dad3f0eSMax Laier 			return (error);
24770dad3f0eSMax Laier 		break;
24780dad3f0eSMax Laier 	}
24790dad3f0eSMax Laier 
2480df8bae1dSRodney W. Grimes 	default:
2481f13ad206SJonathan Lemon 		error = ENOIOCTL;
2482f13ad206SJonathan Lemon 		break;
2483f13ad206SJonathan Lemon 	}
2484f13ad206SJonathan Lemon 	return (error);
2485f13ad206SJonathan Lemon }
2486f13ad206SJonathan Lemon 
#ifdef COMPAT_FREEBSD32
/*
 * 32-bit layout of the SIOCGIFCONF argument: the members of the union are
 * carried as 32-bit integers.  SIOCGIFCONF32 is the request code built
 * from this layout.
 */
struct ifconf32 {
	int32_t		ifc_len;
	union {
		uint32_t	ifcu_buf;
		uint32_t	ifcu_req;
	} ifc_ifcu;
};

#define	SIOCGIFCONF32	_IOWR('i', 36, struct ifconf32)
#endif /* COMPAT_FREEBSD32 */
24979af74f3dSSergey Kandaurov 
2498f13ad206SJonathan Lemon /*
2499f13ad206SJonathan Lemon  * Interface ioctls.
2500f13ad206SJonathan Lemon  */
2501f13ad206SJonathan Lemon int
250272fd1b6aSDag-Erling Smørgrav ifioctl(struct socket *so, u_long cmd, caddr_t data, struct thread *td)
2503f13ad206SJonathan Lemon {
2504f13ad206SJonathan Lemon 	struct ifnet *ifp;
2505f13ad206SJonathan Lemon 	struct ifreq *ifr;
2506f13ad206SJonathan Lemon 	int error;
250762f76486SMaxim Sobolev 	int oif_flags;
2508f13ad206SJonathan Lemon 
25091fb51a12SBjoern A. Zeeb 	CURVNET_SET(so->so_vnet);
2510f13ad206SJonathan Lemon 	switch (cmd) {
2511f13ad206SJonathan Lemon 	case SIOCGIFCONF:
25121fb51a12SBjoern A. Zeeb 		error = ifconf(cmd, data);
25131fb51a12SBjoern A. Zeeb 		CURVNET_RESTORE();
25141fb51a12SBjoern A. Zeeb 		return (error);
25159af74f3dSSergey Kandaurov 
25169af74f3dSSergey Kandaurov #ifdef COMPAT_FREEBSD32
25179af74f3dSSergey Kandaurov 	case SIOCGIFCONF32:
25189af74f3dSSergey Kandaurov 		{
25199af74f3dSSergey Kandaurov 			struct ifconf32 *ifc32;
25209af74f3dSSergey Kandaurov 			struct ifconf ifc;
25219af74f3dSSergey Kandaurov 
25229af74f3dSSergey Kandaurov 			ifc32 = (struct ifconf32 *)data;
25239af74f3dSSergey Kandaurov 			ifc.ifc_len = ifc32->ifc_len;
25249af74f3dSSergey Kandaurov 			ifc.ifc_buf = PTRIN(ifc32->ifc_buf);
25259af74f3dSSergey Kandaurov 
25261fb51a12SBjoern A. Zeeb 			error = ifconf(SIOCGIFCONF, (void *)&ifc);
25271fb51a12SBjoern A. Zeeb 			CURVNET_RESTORE();
252823519598SSergey Kandaurov 			if (error == 0)
252923519598SSergey Kandaurov 				ifc32->ifc_len = ifc.ifc_len;
25301fb51a12SBjoern A. Zeeb 			return (error);
25319af74f3dSSergey Kandaurov 		}
25329af74f3dSSergey Kandaurov #endif
2533f13ad206SJonathan Lemon 	}
2534f13ad206SJonathan Lemon 	ifr = (struct ifreq *)data;
2535f13ad206SJonathan Lemon 
2536f13ad206SJonathan Lemon 	switch (cmd) {
2537feb08d06SMarko Zec #ifdef VIMAGE
2538679e1390SJamie Gritton 	case SIOCSIFRVNET:
2539679e1390SJamie Gritton 		error = priv_check(td, PRIV_NET_SETIFVNET);
25401fb51a12SBjoern A. Zeeb 		if (error == 0)
25411fb51a12SBjoern A. Zeeb 			error = if_vmove_reclaim(td, ifr->ifr_name,
25421fb51a12SBjoern A. Zeeb 			    ifr->ifr_jid);
25431fb51a12SBjoern A. Zeeb 		CURVNET_RESTORE();
2544679e1390SJamie Gritton 		return (error);
2545feb08d06SMarko Zec #endif
2546f13ad206SJonathan Lemon 	case SIOCIFCREATE:
25476b7330e2SSam Leffler 	case SIOCIFCREATE2:
2548acd3428bSRobert Watson 		error = priv_check(td, PRIV_NET_IFCREATE);
25491fb51a12SBjoern A. Zeeb 		if (error == 0)
25501fb51a12SBjoern A. Zeeb 			error = if_clone_create(ifr->ifr_name,
25511fb51a12SBjoern A. Zeeb 			    sizeof(ifr->ifr_name),
25521fb51a12SBjoern A. Zeeb 			    cmd == SIOCIFCREATE2 ? ifr->ifr_data : NULL);
25531fb51a12SBjoern A. Zeeb 		CURVNET_RESTORE();
25546b7330e2SSam Leffler 		return (error);
2555f13ad206SJonathan Lemon 	case SIOCIFDESTROY:
2556acd3428bSRobert Watson 		error = priv_check(td, PRIV_NET_IFDESTROY);
25571fb51a12SBjoern A. Zeeb 		if (error == 0)
25581fb51a12SBjoern A. Zeeb 			error = if_clone_destroy(ifr->ifr_name);
25591fb51a12SBjoern A. Zeeb 		CURVNET_RESTORE();
2560f13ad206SJonathan Lemon 		return (error);
2561f13ad206SJonathan Lemon 
2562f13ad206SJonathan Lemon 	case SIOCIFGCLONERS:
25631fb51a12SBjoern A. Zeeb 		error = if_clone_list((struct if_clonereq *)data);
25641fb51a12SBjoern A. Zeeb 		CURVNET_RESTORE();
25651fb51a12SBjoern A. Zeeb 		return (error);
25660dad3f0eSMax Laier 	case SIOCGIFGMEMB:
25671fb51a12SBjoern A. Zeeb 		error = if_getgroupmembers((struct ifgroupreq *)data);
25681fb51a12SBjoern A. Zeeb 		CURVNET_RESTORE();
25691fb51a12SBjoern A. Zeeb 		return (error);
257008b68b0eSGleb Smirnoff #if defined(INET) || defined(INET6)
257108b68b0eSGleb Smirnoff 	case SIOCSVH:
257208b68b0eSGleb Smirnoff 	case SIOCGVH:
257308b68b0eSGleb Smirnoff 		if (carp_ioctl_p == NULL)
257408b68b0eSGleb Smirnoff 			error = EPROTONOSUPPORT;
257508b68b0eSGleb Smirnoff 		else
257608b68b0eSGleb Smirnoff 			error = (*carp_ioctl_p)(ifr, cmd, td);
257708b68b0eSGleb Smirnoff 		CURVNET_RESTORE();
257808b68b0eSGleb Smirnoff 		return (error);
257908b68b0eSGleb Smirnoff #endif
2580f13ad206SJonathan Lemon 	}
2581f13ad206SJonathan Lemon 
25826064c5d3SRobert Watson 	ifp = ifunit_ref(ifr->ifr_name);
25831fb51a12SBjoern A. Zeeb 	if (ifp == NULL) {
25841fb51a12SBjoern A. Zeeb 		CURVNET_RESTORE();
2585f13ad206SJonathan Lemon 		return (ENXIO);
25861fb51a12SBjoern A. Zeeb 	}
2587f13ad206SJonathan Lemon 
2588f13ad206SJonathan Lemon 	error = ifhwioctl(cmd, ifp, data, td);
25896064c5d3SRobert Watson 	if (error != ENOIOCTL) {
25906064c5d3SRobert Watson 		if_rele(ifp);
25911fb51a12SBjoern A. Zeeb 		CURVNET_RESTORE();
2592f13ad206SJonathan Lemon 		return (error);
25936064c5d3SRobert Watson 	}
2594f13ad206SJonathan Lemon 
259582cd038dSYoshinobu Inoue 	oif_flags = ifp->if_flags;
25966064c5d3SRobert Watson 	if (so->so_proto == NULL) {
25976064c5d3SRobert Watson 		if_rele(ifp);
25981fb51a12SBjoern A. Zeeb 		CURVNET_RESTORE();
2599df8bae1dSRodney W. Grimes 		return (EOPNOTSUPP);
26006064c5d3SRobert Watson 	}
26011a05c762SDag-Erling Smørgrav 
26021a05c762SDag-Erling Smørgrav 	/*
26031a05c762SDag-Erling Smørgrav 	 * Pass the request on to the socket control method, and if the
26041a05c762SDag-Erling Smørgrav 	 * latter returns EOPNOTSUPP, directly to the interface.
26051a05c762SDag-Erling Smørgrav 	 *
26061a05c762SDag-Erling Smørgrav 	 * Make an exception for the legacy SIOCSIF* requests.  Drivers
26071a05c762SDag-Erling Smørgrav 	 * trust SIOCSIFADDR et al to come from an already privileged
26081a05c762SDag-Erling Smørgrav 	 * layer, and do not perform any credentials checks or input
26091a05c762SDag-Erling Smørgrav 	 * validation.
26101a05c762SDag-Erling Smørgrav 	 */
26115fb009bdSGleb Smirnoff 	error = ((*so->so_proto->pr_usrreqs->pru_control)(so, cmd, data,
2612b40ce416SJulian Elischer 	    ifp, td));
26131a05c762SDag-Erling Smørgrav 	if (error == EOPNOTSUPP && ifp != NULL && ifp->if_ioctl != NULL &&
26141a05c762SDag-Erling Smørgrav 	    cmd != SIOCSIFADDR && cmd != SIOCSIFBRDADDR &&
26151a05c762SDag-Erling Smørgrav 	    cmd != SIOCSIFDSTADDR && cmd != SIOCSIFNETMASK)
2616bc3977f1SJamie Gritton 		error = (*ifp->if_ioctl)(ifp, cmd, data);
261782cd038dSYoshinobu Inoue 
261882cd038dSYoshinobu Inoue 	if ((oif_flags ^ ifp->if_flags) & IFF_UP) {
261982cd038dSYoshinobu Inoue #ifdef INET6
2620c9b652e3SAndre Oppermann 		if (ifp->if_flags & IFF_UP)
262182cd038dSYoshinobu Inoue 			in6_if_up(ifp);
262282cd038dSYoshinobu Inoue #endif
2623df8bae1dSRodney W. Grimes 	}
26246064c5d3SRobert Watson 	if_rele(ifp);
26251fb51a12SBjoern A. Zeeb 	CURVNET_RESTORE();
2626df8bae1dSRodney W. Grimes 	return (error);
2627df8bae1dSRodney W. Grimes }
2628df8bae1dSRodney W. Grimes 
2629df8bae1dSRodney W. Grimes /*
2630292ee7beSRobert Watson  * The code common to handling reference counted flags,
26311a3b6859SYaroslav Tykhiy  * e.g., in ifpromisc() and if_allmulti().
2632b5c8bd59SYaroslav Tykhiy  * The "pflag" argument can specify a permanent mode flag to check,
26331a3b6859SYaroslav Tykhiy  * such as IFF_PPROMISC for promiscuous mode; should be 0 if none.
2634292ee7beSRobert Watson  *
2635292ee7beSRobert Watson  * Only to be used on stack-owned flags, not driver-owned flags.
26361a3b6859SYaroslav Tykhiy  */
26371a3b6859SYaroslav Tykhiy static int
26381a3b6859SYaroslav Tykhiy if_setflag(struct ifnet *ifp, int flag, int pflag, int *refcount, int onswitch)
26391a3b6859SYaroslav Tykhiy {
26401a3b6859SYaroslav Tykhiy 	struct ifreq ifr;
26411a3b6859SYaroslav Tykhiy 	int error;
26421a3b6859SYaroslav Tykhiy 	int oldflags, oldcount;
26431a3b6859SYaroslav Tykhiy 
26441a3b6859SYaroslav Tykhiy 	/* Sanity checks to catch programming errors */
2645b5c8bd59SYaroslav Tykhiy 	KASSERT((flag & (IFF_DRV_OACTIVE|IFF_DRV_RUNNING)) == 0,
2646b5c8bd59SYaroslav Tykhiy 	    ("%s: setting driver-owned flag %d", __func__, flag));
2647b5c8bd59SYaroslav Tykhiy 
2648b5c8bd59SYaroslav Tykhiy 	if (onswitch)
2649b5c8bd59SYaroslav Tykhiy 		KASSERT(*refcount >= 0,
2650b5c8bd59SYaroslav Tykhiy 		    ("%s: increment negative refcount %d for flag %d",
2651b5c8bd59SYaroslav Tykhiy 		    __func__, *refcount, flag));
2652b5c8bd59SYaroslav Tykhiy 	else
2653b5c8bd59SYaroslav Tykhiy 		KASSERT(*refcount > 0,
2654b5c8bd59SYaroslav Tykhiy 		    ("%s: decrement non-positive refcount %d for flag %d",
2655b5c8bd59SYaroslav Tykhiy 		    __func__, *refcount, flag));
26561a3b6859SYaroslav Tykhiy 
26571a3b6859SYaroslav Tykhiy 	/* In case this mode is permanent, just touch refcount */
26581a3b6859SYaroslav Tykhiy 	if (ifp->if_flags & pflag) {
26591a3b6859SYaroslav Tykhiy 		*refcount += onswitch ? 1 : -1;
26601a3b6859SYaroslav Tykhiy 		return (0);
26611a3b6859SYaroslav Tykhiy 	}
26621a3b6859SYaroslav Tykhiy 
26631a3b6859SYaroslav Tykhiy 	/* Save ifnet parameters for if_ioctl() may fail */
26641a3b6859SYaroslav Tykhiy 	oldcount = *refcount;
26651a3b6859SYaroslav Tykhiy 	oldflags = ifp->if_flags;
26661a3b6859SYaroslav Tykhiy 
26671a3b6859SYaroslav Tykhiy 	/*
26681a3b6859SYaroslav Tykhiy 	 * See if we aren't the only and touching refcount is enough.
26691a3b6859SYaroslav Tykhiy 	 * Actually toggle interface flag if we are the first or last.
26701a3b6859SYaroslav Tykhiy 	 */
26711a3b6859SYaroslav Tykhiy 	if (onswitch) {
26721a3b6859SYaroslav Tykhiy 		if ((*refcount)++)
26731a3b6859SYaroslav Tykhiy 			return (0);
26741a3b6859SYaroslav Tykhiy 		ifp->if_flags |= flag;
26751a3b6859SYaroslav Tykhiy 	} else {
26761a3b6859SYaroslav Tykhiy 		if (--(*refcount))
26771a3b6859SYaroslav Tykhiy 			return (0);
26781a3b6859SYaroslav Tykhiy 		ifp->if_flags &= ~flag;
26791a3b6859SYaroslav Tykhiy 	}
26801a3b6859SYaroslav Tykhiy 
26811a3b6859SYaroslav Tykhiy 	/* Call down the driver since we've changed interface flags */
26821a3b6859SYaroslav Tykhiy 	if (ifp->if_ioctl == NULL) {
26831a3b6859SYaroslav Tykhiy 		error = EOPNOTSUPP;
26841a3b6859SYaroslav Tykhiy 		goto recover;
26851a3b6859SYaroslav Tykhiy 	}
26861a3b6859SYaroslav Tykhiy 	ifr.ifr_flags = ifp->if_flags & 0xffff;
26871a3b6859SYaroslav Tykhiy 	ifr.ifr_flagshigh = ifp->if_flags >> 16;
26881a3b6859SYaroslav Tykhiy 	error = (*ifp->if_ioctl)(ifp, SIOCSIFFLAGS, (caddr_t)&ifr);
26891a3b6859SYaroslav Tykhiy 	if (error)
26901a3b6859SYaroslav Tykhiy 		goto recover;
26911a3b6859SYaroslav Tykhiy 	/* Notify userland that interface flags have changed */
26921a3b6859SYaroslav Tykhiy 	rt_ifmsg(ifp);
26931a3b6859SYaroslav Tykhiy 	return (0);
26941a3b6859SYaroslav Tykhiy 
26951a3b6859SYaroslav Tykhiy recover:
26961a3b6859SYaroslav Tykhiy 	/* Recover after driver error */
26971a3b6859SYaroslav Tykhiy 	*refcount = oldcount;
26981a3b6859SYaroslav Tykhiy 	ifp->if_flags = oldflags;
26991a3b6859SYaroslav Tykhiy 	return (error);
27001a3b6859SYaroslav Tykhiy }
27011a3b6859SYaroslav Tykhiy 
27021a3b6859SYaroslav Tykhiy /*
2703963e4c2aSGarrett Wollman  * Set/clear promiscuous mode on interface ifp based on the truth value
2704963e4c2aSGarrett Wollman  * of pswitch.  The calls are reference counted so that only the first
2705963e4c2aSGarrett Wollman  * "on" request actually has an effect, as does the final "off" request.
2706963e4c2aSGarrett Wollman  * Results are undefined if the "off" and "on" requests are not matched.
2707963e4c2aSGarrett Wollman  */
2708963e4c2aSGarrett Wollman int
270972fd1b6aSDag-Erling Smørgrav ifpromisc(struct ifnet *ifp, int pswitch)
2710963e4c2aSGarrett Wollman {
27114a26224cSGarrett Wollman 	int error;
27121a3b6859SYaroslav Tykhiy 	int oldflags = ifp->if_flags;
2713963e4c2aSGarrett Wollman 
27141a3b6859SYaroslav Tykhiy 	error = if_setflag(ifp, IFF_PROMISC, IFF_PPROMISC,
27151a3b6859SYaroslav Tykhiy 			   &ifp->if_pcount, pswitch);
27161a3b6859SYaroslav Tykhiy 	/* If promiscuous mode status has changed, log a message */
27171a3b6859SYaroslav Tykhiy 	if (error == 0 && ((ifp->if_flags ^ oldflags) & IFF_PROMISC))
27189bf40edeSBrooks Davis 		log(LOG_INFO, "%s: promiscuous mode %s\n",
27199bf40edeSBrooks Davis 		    ifp->if_xname,
27204f3c11a6SBill Fenner 		    (ifp->if_flags & IFF_PROMISC) ? "enabled" : "disabled");
27211a3b6859SYaroslav Tykhiy 	return (error);
2722963e4c2aSGarrett Wollman }
2723963e4c2aSGarrett Wollman 
2724963e4c2aSGarrett Wollman /*
2725df8bae1dSRodney W. Grimes  * Return interface configuration
2726df8bae1dSRodney W. Grimes  * of system.  List may be used
2727df8bae1dSRodney W. Grimes  * in later ioctl's (above) to get
2728df8bae1dSRodney W. Grimes  * other information.
2729df8bae1dSRodney W. Grimes  */
2730df8bae1dSRodney W. Grimes /*ARGSUSED*/
27313bda9f9bSPoul-Henning Kamp static int
273272fd1b6aSDag-Erling Smørgrav ifconf(u_long cmd, caddr_t data)
2733df8bae1dSRodney W. Grimes {
27340b59d917SJonathan Lemon 	struct ifconf *ifc = (struct ifconf *)data;
27350b59d917SJonathan Lemon 	struct ifnet *ifp;
27360b59d917SJonathan Lemon 	struct ifaddr *ifa;
27374dcf2bbbSBrooks Davis 	struct ifreq ifr;
27384dcf2bbbSBrooks Davis 	struct sbuf *sb;
27394dcf2bbbSBrooks Davis 	int error, full = 0, valid_len, max_len;
2740df8bae1dSRodney W. Grimes 
27414dcf2bbbSBrooks Davis 	/* Limit initial buffer size to MAXPHYS to avoid DoS from userspace. */
27424dcf2bbbSBrooks Davis 	max_len = MAXPHYS - 1;
27434dcf2bbbSBrooks Davis 
2744b0b4b28bSXin LI 	/* Prevent hostile input from being able to crash the system */
2745b0b4b28bSXin LI 	if (ifc->ifc_len <= 0)
2746b0b4b28bSXin LI 		return (EINVAL);
2747b0b4b28bSXin LI 
27484dcf2bbbSBrooks Davis again:
27494dcf2bbbSBrooks Davis 	if (ifc->ifc_len <= max_len) {
27504dcf2bbbSBrooks Davis 		max_len = ifc->ifc_len;
27514dcf2bbbSBrooks Davis 		full = 1;
27524dcf2bbbSBrooks Davis 	}
27534dcf2bbbSBrooks Davis 	sb = sbuf_new(NULL, NULL, max_len + 1, SBUF_FIXEDLEN);
27544dcf2bbbSBrooks Davis 	max_len = 0;
27554dcf2bbbSBrooks Davis 	valid_len = 0;
27564dcf2bbbSBrooks Davis 
275777dfcdc4SRobert Watson 	IFNET_RLOCK();
2758603724d3SBjoern A. Zeeb 	TAILQ_FOREACH(ifp, &V_ifnet, if_link) {
27599bf40edeSBrooks Davis 		int addrs;
27602624cf89SGarrett Wollman 
2761fbd24c5eSColin Percival 		/*
2762fbd24c5eSColin Percival 		 * Zero the ifr_name buffer to make sure we don't
2763fbd24c5eSColin Percival 		 * disclose the contents of the stack.
2764fbd24c5eSColin Percival 		 */
2765fbd24c5eSColin Percival 		memset(ifr.ifr_name, 0, sizeof(ifr.ifr_name));
2766fbd24c5eSColin Percival 
27679bf40edeSBrooks Davis 		if (strlcpy(ifr.ifr_name, ifp->if_xname, sizeof(ifr.ifr_name))
276862313e4cSSam Leffler 		    >= sizeof(ifr.ifr_name)) {
276962313e4cSSam Leffler 			sbuf_delete(sb);
277062313e4cSSam Leffler 			IFNET_RUNLOCK();
27714dcf2bbbSBrooks Davis 			return (ENAMETOOLONG);
277262313e4cSSam Leffler 		}
27732624cf89SGarrett Wollman 
277475c13541SPoul-Henning Kamp 		addrs = 0;
2775137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
27762defe5cdSJonathan Lemon 		TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) {
27772defe5cdSJonathan Lemon 			struct sockaddr *sa = ifa->ifa_addr;
27782defe5cdSJonathan Lemon 
2779b89e82ddSJamie Gritton 			if (prison_if(curthread->td_ucred, sa) != 0)
278075c13541SPoul-Henning Kamp 				continue;
278175c13541SPoul-Henning Kamp 			addrs++;
2782df8bae1dSRodney W. Grimes 			if (sa->sa_len <= sizeof(*sa)) {
2783df8bae1dSRodney W. Grimes 				ifr.ifr_addr = *sa;
27844dcf2bbbSBrooks Davis 				sbuf_bcat(sb, &ifr, sizeof(ifr));
27854dcf2bbbSBrooks Davis 				max_len += sizeof(ifr);
2786df8bae1dSRodney W. Grimes 			} else {
27874dcf2bbbSBrooks Davis 				sbuf_bcat(sb, &ifr,
27884dcf2bbbSBrooks Davis 				    offsetof(struct ifreq, ifr_addr));
27894dcf2bbbSBrooks Davis 				max_len += offsetof(struct ifreq, ifr_addr);
27904dcf2bbbSBrooks Davis 				sbuf_bcat(sb, sa, sa->sa_len);
27914dcf2bbbSBrooks Davis 				max_len += sa->sa_len;
2792df8bae1dSRodney W. Grimes 			}
27934dcf2bbbSBrooks Davis 
27944d369413SMatthew D Fleming 			if (sbuf_error(sb) == 0)
27954dcf2bbbSBrooks Davis 				valid_len = sbuf_len(sb);
2796df8bae1dSRodney W. Grimes 		}
2797137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
27984dcf2bbbSBrooks Davis 		if (addrs == 0) {
279975c13541SPoul-Henning Kamp 			bzero((caddr_t)&ifr.ifr_addr, sizeof(ifr.ifr_addr));
28004dcf2bbbSBrooks Davis 			sbuf_bcat(sb, &ifr, sizeof(ifr));
28014dcf2bbbSBrooks Davis 			max_len += sizeof(ifr);
28024dcf2bbbSBrooks Davis 
28034d369413SMatthew D Fleming 			if (sbuf_error(sb) == 0)
28044dcf2bbbSBrooks Davis 				valid_len = sbuf_len(sb);
280575c13541SPoul-Henning Kamp 		}
2806df8bae1dSRodney W. Grimes 	}
2807b30a244cSJeffrey Hsu 	IFNET_RUNLOCK();
28084dcf2bbbSBrooks Davis 
28094dcf2bbbSBrooks Davis 	/*
28104dcf2bbbSBrooks Davis 	 * If we didn't allocate enough space (uncommon), try again.  If
28114dcf2bbbSBrooks Davis 	 * we have already allocated as much space as we are allowed,
28124dcf2bbbSBrooks Davis 	 * return what we've got.
28134dcf2bbbSBrooks Davis 	 */
28144dcf2bbbSBrooks Davis 	if (valid_len != max_len && !full) {
28154dcf2bbbSBrooks Davis 		sbuf_delete(sb);
28164dcf2bbbSBrooks Davis 		goto again;
28174dcf2bbbSBrooks Davis 	}
28184dcf2bbbSBrooks Davis 
28194dcf2bbbSBrooks Davis 	ifc->ifc_len = valid_len;
28205ed8cedcSBrian Feldman 	sbuf_finish(sb);
28214dcf2bbbSBrooks Davis 	error = copyout(sbuf_data(sb), ifc->ifc_req, ifc->ifc_len);
28224dcf2bbbSBrooks Davis 	sbuf_delete(sb);
2823df8bae1dSRodney W. Grimes 	return (error);
2824df8bae1dSRodney W. Grimes }
2825df8bae1dSRodney W. Grimes 
28261158dfb7SGarrett Wollman /*
28278b25904eSGleb Smirnoff  * Just like ifpromisc(), but for all-multicast-reception mode.
28281158dfb7SGarrett Wollman  */
28291158dfb7SGarrett Wollman int
283072fd1b6aSDag-Erling Smørgrav if_allmulti(struct ifnet *ifp, int onswitch)
28311158dfb7SGarrett Wollman {
28321158dfb7SGarrett Wollman 
28331a3b6859SYaroslav Tykhiy 	return (if_setflag(ifp, IFF_ALLMULTI, 0, &ifp->if_amcount, onswitch));
28341158dfb7SGarrett Wollman }
28351158dfb7SGarrett Wollman 
28365896d124SBruce M Simpson struct ifmultiaddr *
2837c3b31afdSRobert Watson if_findmulti(struct ifnet *ifp, struct sockaddr *sa)
28381158dfb7SGarrett Wollman {
28391158dfb7SGarrett Wollman 	struct ifmultiaddr *ifma;
28401158dfb7SGarrett Wollman 
2841c3b31afdSRobert Watson 	IF_ADDR_LOCK_ASSERT(ifp);
2842c3b31afdSRobert Watson 
28436817526dSPoul-Henning Kamp 	TAILQ_FOREACH(ifma, &ifp->if_multiaddrs, ifma_link) {
284440d8a302SBruce M Simpson 		if (sa->sa_family == AF_LINK) {
284540d8a302SBruce M Simpson 			if (sa_dl_equal(ifma->ifma_addr, sa))
284640d8a302SBruce M Simpson 				break;
284740d8a302SBruce M Simpson 		} else {
2848c3b31afdSRobert Watson 			if (sa_equal(ifma->ifma_addr, sa))
2849c3b31afdSRobert Watson 				break;
28501158dfb7SGarrett Wollman 		}
285140d8a302SBruce M Simpson 	}
2852c3b31afdSRobert Watson 
2853c3b31afdSRobert Watson 	return ifma;
285457af7922SJulian Elischer }
28551158dfb7SGarrett Wollman 
28561158dfb7SGarrett Wollman /*
2857c3b31afdSRobert Watson  * Allocate a new ifmultiaddr and initialize based on passed arguments.  We
2858c3b31afdSRobert Watson  * make copies of passed sockaddrs.  The ifmultiaddr will not be added to
2859c3b31afdSRobert Watson  * the ifnet multicast address list here, so the caller must do that and
2860c3b31afdSRobert Watson  * other setup work (such as notifying the device driver).  The reference
2861c3b31afdSRobert Watson  * count is initialized to 1.
28621158dfb7SGarrett Wollman  */
2863c3b31afdSRobert Watson static struct ifmultiaddr *
2864c3b31afdSRobert Watson if_allocmulti(struct ifnet *ifp, struct sockaddr *sa, struct sockaddr *llsa,
2865c3b31afdSRobert Watson     int mflags)
2866c3b31afdSRobert Watson {
2867c3b31afdSRobert Watson 	struct ifmultiaddr *ifma;
2868c3b31afdSRobert Watson 	struct sockaddr *dupsa;
2869c3b31afdSRobert Watson 
28701ede983cSDag-Erling Smørgrav 	ifma = malloc(sizeof *ifma, M_IFMADDR, mflags |
2871c3b31afdSRobert Watson 	    M_ZERO);
2872c3b31afdSRobert Watson 	if (ifma == NULL)
2873c3b31afdSRobert Watson 		return (NULL);
2874c3b31afdSRobert Watson 
28751ede983cSDag-Erling Smørgrav 	dupsa = malloc(sa->sa_len, M_IFMADDR, mflags);
2876c3b31afdSRobert Watson 	if (dupsa == NULL) {
28771ede983cSDag-Erling Smørgrav 		free(ifma, M_IFMADDR);
2878c3b31afdSRobert Watson 		return (NULL);
28791158dfb7SGarrett Wollman 	}
28801158dfb7SGarrett Wollman 	bcopy(sa, dupsa, sa->sa_len);
28811158dfb7SGarrett Wollman 	ifma->ifma_addr = dupsa;
2882c3b31afdSRobert Watson 
28831158dfb7SGarrett Wollman 	ifma->ifma_ifp = ifp;
28841158dfb7SGarrett Wollman 	ifma->ifma_refcount = 1;
2885d4d22970SGleb Smirnoff 	ifma->ifma_protospec = NULL;
2886c3b31afdSRobert Watson 
2887c3b31afdSRobert Watson 	if (llsa == NULL) {
2888c3b31afdSRobert Watson 		ifma->ifma_lladdr = NULL;
2889c3b31afdSRobert Watson 		return (ifma);
2890c3b31afdSRobert Watson 	}
2891c3b31afdSRobert Watson 
28921ede983cSDag-Erling Smørgrav 	dupsa = malloc(llsa->sa_len, M_IFMADDR, mflags);
2893c3b31afdSRobert Watson 	if (dupsa == NULL) {
28941ede983cSDag-Erling Smørgrav 		free(ifma->ifma_addr, M_IFMADDR);
28951ede983cSDag-Erling Smørgrav 		free(ifma, M_IFMADDR);
2896c3b31afdSRobert Watson 		return (NULL);
2897c3b31afdSRobert Watson 	}
2898c3b31afdSRobert Watson 	bcopy(llsa, dupsa, llsa->sa_len);
2899c3b31afdSRobert Watson 	ifma->ifma_lladdr = dupsa;
2900c3b31afdSRobert Watson 
2901c3b31afdSRobert Watson 	return (ifma);
2902c3b31afdSRobert Watson }
2903373f88edSGarrett Wollman 
29041158dfb7SGarrett Wollman /*
2905c3b31afdSRobert Watson  * if_freemulti: free ifmultiaddr structure and possibly attached related
2906c3b31afdSRobert Watson  * addresses.  The caller is responsible for implementing reference
2907c3b31afdSRobert Watson  * counting, notifying the driver, handling routing messages, and releasing
2908c3b31afdSRobert Watson  * any dependent link layer state.
29091158dfb7SGarrett Wollman  */
2910c3b31afdSRobert Watson static void
2911c3b31afdSRobert Watson if_freemulti(struct ifmultiaddr *ifma)
2912c3b31afdSRobert Watson {
2913c3b31afdSRobert Watson 
2914ec002feeSBruce M Simpson 	KASSERT(ifma->ifma_refcount == 0, ("if_freemulti: refcount %d",
2915c3b31afdSRobert Watson 	    ifma->ifma_refcount));
2916c3b31afdSRobert Watson 	KASSERT(ifma->ifma_protospec == NULL,
2917c3b31afdSRobert Watson 	    ("if_freemulti: protospec not NULL"));
2918c3b31afdSRobert Watson 
2919c3b31afdSRobert Watson 	if (ifma->ifma_lladdr != NULL)
29201ede983cSDag-Erling Smørgrav 		free(ifma->ifma_lladdr, M_IFMADDR);
29211ede983cSDag-Erling Smørgrav 	free(ifma->ifma_addr, M_IFMADDR);
29221ede983cSDag-Erling Smørgrav 	free(ifma, M_IFMADDR);
2923c3b31afdSRobert Watson }
2924c3b31afdSRobert Watson 
2925c3b31afdSRobert Watson /*
2926c3b31afdSRobert Watson  * Register an additional multicast address with a network interface.
2927c3b31afdSRobert Watson  *
2928c3b31afdSRobert Watson  * - If the address is already present, bump the reference count on the
2929c3b31afdSRobert Watson  *   address and return.
2930c3b31afdSRobert Watson  * - If the address is not link-layer, look up a link layer address.
2931c3b31afdSRobert Watson  * - Allocate address structures for one or both addresses, and attach to the
2932c3b31afdSRobert Watson  *   multicast address list on the interface.  If automatically adding a link
2933c3b31afdSRobert Watson  *   layer address, the protocol address will own a reference to the link
2934c3b31afdSRobert Watson  *   layer address, to be freed when it is freed.
2935c3b31afdSRobert Watson  * - Notify the network device driver of an addition to the multicast address
2936c3b31afdSRobert Watson  *   list.
2937c3b31afdSRobert Watson  *
2938c3b31afdSRobert Watson  * 'sa' points to caller-owned memory with the desired multicast address.
2939c3b31afdSRobert Watson  *
2940c3b31afdSRobert Watson  * 'retifma' will be used to return a pointer to the resulting multicast
2941c3b31afdSRobert Watson  * address reference, if desired.
2942c3b31afdSRobert Watson  */
2943c3b31afdSRobert Watson int
2944c3b31afdSRobert Watson if_addmulti(struct ifnet *ifp, struct sockaddr *sa,
2945c3b31afdSRobert Watson     struct ifmultiaddr **retifma)
2946c3b31afdSRobert Watson {
2947c3b31afdSRobert Watson 	struct ifmultiaddr *ifma, *ll_ifma;
2948c3b31afdSRobert Watson 	struct sockaddr *llsa;
2949c3b31afdSRobert Watson 	int error;
2950c3b31afdSRobert Watson 
2951c3b31afdSRobert Watson 	/*
2952c3b31afdSRobert Watson 	 * If the address is already present, return a new reference to it;
2953c3b31afdSRobert Watson 	 * otherwise, allocate storage and set up a new address.
2954c3b31afdSRobert Watson 	 */
2955137f91e8SJohn Baldwin 	IF_ADDR_WLOCK(ifp);
2956c3b31afdSRobert Watson 	ifma = if_findmulti(ifp, sa);
2957c3b31afdSRobert Watson 	if (ifma != NULL) {
2958c3b31afdSRobert Watson 		ifma->ifma_refcount++;
2959c3b31afdSRobert Watson 		if (retifma != NULL)
2960c3b31afdSRobert Watson 			*retifma = ifma;
2961137f91e8SJohn Baldwin 		IF_ADDR_WUNLOCK(ifp);
2962c3b31afdSRobert Watson 		return (0);
2963c3b31afdSRobert Watson 	}
2964c3b31afdSRobert Watson 
2965c3b31afdSRobert Watson 	/*
2966c3b31afdSRobert Watson 	 * The address isn't already present; resolve the protocol address
2967c3b31afdSRobert Watson 	 * into a link layer address, and then look that up, bump its
2968c3b31afdSRobert Watson 	 * refcount or allocate an ifma for that also.  If 'llsa' was
2969c3b31afdSRobert Watson 	 * returned, we will need to free it later.
2970c3b31afdSRobert Watson 	 */
2971c3b31afdSRobert Watson 	llsa = NULL;
2972c3b31afdSRobert Watson 	ll_ifma = NULL;
2973c3b31afdSRobert Watson 	if (ifp->if_resolvemulti != NULL) {
2974c3b31afdSRobert Watson 		error = ifp->if_resolvemulti(ifp, &llsa, sa);
2975c3b31afdSRobert Watson 		if (error)
2976c3b31afdSRobert Watson 			goto unlock_out;
2977c3b31afdSRobert Watson 	}
2978c3b31afdSRobert Watson 
2979c3b31afdSRobert Watson 	/*
2980c3b31afdSRobert Watson 	 * Allocate the new address.  Don't hook it up yet, as we may also
2981c3b31afdSRobert Watson 	 * need to allocate a link layer multicast address.
2982c3b31afdSRobert Watson 	 */
2983c3b31afdSRobert Watson 	ifma = if_allocmulti(ifp, sa, llsa, M_NOWAIT);
2984c3b31afdSRobert Watson 	if (ifma == NULL) {
2985c3b31afdSRobert Watson 		error = ENOMEM;
2986c3b31afdSRobert Watson 		goto free_llsa_out;
2987c3b31afdSRobert Watson 	}
2988c3b31afdSRobert Watson 
2989c3b31afdSRobert Watson 	/*
2990c3b31afdSRobert Watson 	 * If a link layer address is found, we'll need to see if it's
2991c3b31afdSRobert Watson 	 * already present in the address list, or allocate is as well.
2992c3b31afdSRobert Watson 	 * When this block finishes, the link layer address will be on the
2993c3b31afdSRobert Watson 	 * list.
2994c3b31afdSRobert Watson 	 */
2995c3b31afdSRobert Watson 	if (llsa != NULL) {
2996c3b31afdSRobert Watson 		ll_ifma = if_findmulti(ifp, llsa);
2997c3b31afdSRobert Watson 		if (ll_ifma == NULL) {
2998c3b31afdSRobert Watson 			ll_ifma = if_allocmulti(ifp, llsa, NULL, M_NOWAIT);
2999c3b31afdSRobert Watson 			if (ll_ifma == NULL) {
3000ec002feeSBruce M Simpson 				--ifma->ifma_refcount;
3001c3b31afdSRobert Watson 				if_freemulti(ifma);
3002c3b31afdSRobert Watson 				error = ENOMEM;
3003c3b31afdSRobert Watson 				goto free_llsa_out;
3004c3b31afdSRobert Watson 			}
3005c3b31afdSRobert Watson 			TAILQ_INSERT_HEAD(&ifp->if_multiaddrs, ll_ifma,
3006c3b31afdSRobert Watson 			    ifma_link);
3007c3b31afdSRobert Watson 		} else
3008c3b31afdSRobert Watson 			ll_ifma->ifma_refcount++;
3009ec002feeSBruce M Simpson 		ifma->ifma_llifma = ll_ifma;
3010c3b31afdSRobert Watson 	}
3011c3b31afdSRobert Watson 
3012c3b31afdSRobert Watson 	/*
3013c3b31afdSRobert Watson 	 * We now have a new multicast address, ifma, and possibly a new or
3014c3b31afdSRobert Watson 	 * referenced link layer address.  Add the primary address to the
3015c3b31afdSRobert Watson 	 * ifnet address list.
3016c3b31afdSRobert Watson 	 */
30176817526dSPoul-Henning Kamp 	TAILQ_INSERT_HEAD(&ifp->if_multiaddrs, ifma, ifma_link);
3018c3b31afdSRobert Watson 
301913990766SJonathan Mini 	if (retifma != NULL)
3020373f88edSGarrett Wollman 		*retifma = ifma;
30211158dfb7SGarrett Wollman 
3022c3b31afdSRobert Watson 	/*
3023c3b31afdSRobert Watson 	 * Must generate the message while holding the lock so that 'ifma'
3024c3b31afdSRobert Watson 	 * pointer is still valid.
3025c3b31afdSRobert Watson 	 */
3026c3b31afdSRobert Watson 	rt_newmaddrmsg(RTM_NEWMADDR, ifma);
3027137f91e8SJohn Baldwin 	IF_ADDR_WUNLOCK(ifp);
3028c3b31afdSRobert Watson 
30291158dfb7SGarrett Wollman 	/*
30301158dfb7SGarrett Wollman 	 * We are certain we have added something, so call down to the
30311158dfb7SGarrett Wollman 	 * interface to let them know about it.
30321158dfb7SGarrett Wollman 	 */
30332432c31cSRobert Watson 	if (ifp->if_ioctl != NULL) {
30341a3b6859SYaroslav Tykhiy 		(void) (*ifp->if_ioctl)(ifp, SIOCADDMULTI, 0);
30351a3b6859SYaroslav Tykhiy 	}
30361158dfb7SGarrett Wollman 
3037c3b31afdSRobert Watson 	if (llsa != NULL)
30381ede983cSDag-Erling Smørgrav 		free(llsa, M_IFMADDR);
3039c3b31afdSRobert Watson 
3040c3b31afdSRobert Watson 	return (0);
3041c3b31afdSRobert Watson 
3042c3b31afdSRobert Watson free_llsa_out:
3043c3b31afdSRobert Watson 	if (llsa != NULL)
30441ede983cSDag-Erling Smørgrav 		free(llsa, M_IFMADDR);
3045c3b31afdSRobert Watson 
3046c3b31afdSRobert Watson unlock_out:
3047137f91e8SJohn Baldwin 	IF_ADDR_WUNLOCK(ifp);
3048c3b31afdSRobert Watson 	return (error);
30491158dfb7SGarrett Wollman }
30501158dfb7SGarrett Wollman 
30511158dfb7SGarrett Wollman /*
3052ec002feeSBruce M Simpson  * Delete a multicast group membership by network-layer group address.
3053ec002feeSBruce M Simpson  *
3054ec002feeSBruce M Simpson  * Returns ENOENT if the entry could not be found. If ifp no longer
3055ec002feeSBruce M Simpson  * exists, results are undefined. This entry point should only be used
3056ec002feeSBruce M Simpson  * from subsystems which do appropriate locking to hold ifp for the
3057ec002feeSBruce M Simpson  * duration of the call.
3058ec002feeSBruce M Simpson  * Network-layer protocol domains must use if_delmulti_ifma().
30591158dfb7SGarrett Wollman  */
30601158dfb7SGarrett Wollman int
306172fd1b6aSDag-Erling Smørgrav if_delmulti(struct ifnet *ifp, struct sockaddr *sa)
30621158dfb7SGarrett Wollman {
3063ec002feeSBruce M Simpson 	struct ifmultiaddr *ifma;
3064ec002feeSBruce M Simpson 	int lastref;
3065ec002feeSBruce M Simpson #ifdef INVARIANTS
3066ec002feeSBruce M Simpson 	struct ifnet *oifp;
3067ec002feeSBruce M Simpson 
306877dfcdc4SRobert Watson 	IFNET_RLOCK_NOSLEEP();
3069603724d3SBjoern A. Zeeb 	TAILQ_FOREACH(oifp, &V_ifnet, if_link)
3070ec002feeSBruce M Simpson 		if (ifp == oifp)
3071ec002feeSBruce M Simpson 			break;
3072ec002feeSBruce M Simpson 	if (ifp != oifp)
3073ec002feeSBruce M Simpson 		ifp = NULL;
307477dfcdc4SRobert Watson 	IFNET_RUNLOCK_NOSLEEP();
3075ec002feeSBruce M Simpson 
3076ec002feeSBruce M Simpson 	KASSERT(ifp != NULL, ("%s: ifnet went away", __func__));
3077ec002feeSBruce M Simpson #endif
3078ec002feeSBruce M Simpson 	if (ifp == NULL)
3079ec002feeSBruce M Simpson 		return (ENOENT);
30801158dfb7SGarrett Wollman 
3081137f91e8SJohn Baldwin 	IF_ADDR_WLOCK(ifp);
3082ec002feeSBruce M Simpson 	lastref = 0;
3083c3b31afdSRobert Watson 	ifma = if_findmulti(ifp, sa);
3084ec002feeSBruce M Simpson 	if (ifma != NULL)
3085ec002feeSBruce M Simpson 		lastref = if_delmulti_locked(ifp, ifma, 0);
3086137f91e8SJohn Baldwin 	IF_ADDR_WUNLOCK(ifp);
3087c3b31afdSRobert Watson 
3088ec002feeSBruce M Simpson 	if (ifma == NULL)
3089ec002feeSBruce M Simpson 		return (ENOENT);
3090ec002feeSBruce M Simpson 
3091ec002feeSBruce M Simpson 	if (lastref && ifp->if_ioctl != NULL) {
30921a3b6859SYaroslav Tykhiy 		(void)(*ifp->if_ioctl)(ifp, SIOCDELMULTI, 0);
309331302ebfSRobert Watson 	}
30941158dfb7SGarrett Wollman 
3095ec002feeSBruce M Simpson 	return (0);
3096ec002feeSBruce M Simpson }
3097ec002feeSBruce M Simpson 
3098ec002feeSBruce M Simpson /*
309993ec7edcSShteryana Shopova  * Delete all multicast group membership for an interface.
310093ec7edcSShteryana Shopova  * Should be used to quickly flush all multicast filters.
310193ec7edcSShteryana Shopova  */
310293ec7edcSShteryana Shopova void
310393ec7edcSShteryana Shopova if_delallmulti(struct ifnet *ifp)
310493ec7edcSShteryana Shopova {
310593ec7edcSShteryana Shopova 	struct ifmultiaddr *ifma;
310693ec7edcSShteryana Shopova 	struct ifmultiaddr *next;
310793ec7edcSShteryana Shopova 
3108137f91e8SJohn Baldwin 	IF_ADDR_WLOCK(ifp);
310993ec7edcSShteryana Shopova 	TAILQ_FOREACH_SAFE(ifma, &ifp->if_multiaddrs, ifma_link, next)
311093ec7edcSShteryana Shopova 		if_delmulti_locked(ifp, ifma, 0);
3111137f91e8SJohn Baldwin 	IF_ADDR_WUNLOCK(ifp);
311293ec7edcSShteryana Shopova }
311393ec7edcSShteryana Shopova 
311493ec7edcSShteryana Shopova /*
3115ec002feeSBruce M Simpson  * Delete a multicast group membership by group membership pointer.
3116ec002feeSBruce M Simpson  * Network-layer protocol domains must use this routine.
3117ec002feeSBruce M Simpson  *
3118e5adda3dSRobert Watson  * It is safe to call this routine if the ifp disappeared.
3119ec002feeSBruce M Simpson  */
3120ec002feeSBruce M Simpson void
3121ec002feeSBruce M Simpson if_delmulti_ifma(struct ifmultiaddr *ifma)
3122ec002feeSBruce M Simpson {
3123ec002feeSBruce M Simpson 	struct ifnet *ifp;
3124ec002feeSBruce M Simpson 	int lastref;
3125ec002feeSBruce M Simpson 
3126ec002feeSBruce M Simpson 	ifp = ifma->ifma_ifp;
3127ec002feeSBruce M Simpson #ifdef DIAGNOSTIC
3128ec002feeSBruce M Simpson 	if (ifp == NULL) {
3129ec002feeSBruce M Simpson 		printf("%s: ifma_ifp seems to be detached\n", __func__);
3130ec002feeSBruce M Simpson 	} else {
3131ec002feeSBruce M Simpson 		struct ifnet *oifp;
3132ec002feeSBruce M Simpson 
313377dfcdc4SRobert Watson 		IFNET_RLOCK_NOSLEEP();
3134603724d3SBjoern A. Zeeb 		TAILQ_FOREACH(oifp, &V_ifnet, if_link)
3135ec002feeSBruce M Simpson 			if (ifp == oifp)
3136ec002feeSBruce M Simpson 				break;
3137ec002feeSBruce M Simpson 		if (ifp != oifp) {
3138ec002feeSBruce M Simpson 			printf("%s: ifnet %p disappeared\n", __func__, ifp);
3139ec002feeSBruce M Simpson 			ifp = NULL;
3140ec002feeSBruce M Simpson 		}
314177dfcdc4SRobert Watson 		IFNET_RUNLOCK_NOSLEEP();
3142ec002feeSBruce M Simpson 	}
3143ec002feeSBruce M Simpson #endif
3144ec002feeSBruce M Simpson 	/*
3145ec002feeSBruce M Simpson 	 * If and only if the ifnet instance exists: Acquire the address lock.
3146ec002feeSBruce M Simpson 	 */
3147ec002feeSBruce M Simpson 	if (ifp != NULL)
3148137f91e8SJohn Baldwin 		IF_ADDR_WLOCK(ifp);
3149ec002feeSBruce M Simpson 
3150ec002feeSBruce M Simpson 	lastref = if_delmulti_locked(ifp, ifma, 0);
3151ec002feeSBruce M Simpson 
3152ec002feeSBruce M Simpson 	if (ifp != NULL) {
3153ec002feeSBruce M Simpson 		/*
3154ec002feeSBruce M Simpson 		 * If and only if the ifnet instance exists:
3155ec002feeSBruce M Simpson 		 *  Release the address lock.
3156ec002feeSBruce M Simpson 		 *  If the group was left: update the hardware hash filter.
3157ec002feeSBruce M Simpson 		 */
3158137f91e8SJohn Baldwin 		IF_ADDR_WUNLOCK(ifp);
3159ec002feeSBruce M Simpson 		if (lastref && ifp->if_ioctl != NULL) {
3160ec002feeSBruce M Simpson 			(void)(*ifp->if_ioctl)(ifp, SIOCDELMULTI, 0);
3161ec002feeSBruce M Simpson 		}
3162ec002feeSBruce M Simpson 	}
3163ec002feeSBruce M Simpson }
3164ec002feeSBruce M Simpson 
3165ec002feeSBruce M Simpson /*
3166ec002feeSBruce M Simpson  * Perform deletion of network-layer and/or link-layer multicast address.
3167ec002feeSBruce M Simpson  *
3168ec002feeSBruce M Simpson  * Return 0 if the reference count was decremented.
3169ec002feeSBruce M Simpson  * Return 1 if the final reference was released, indicating that the
3170ec002feeSBruce M Simpson  * hardware hash filter should be reprogrammed.
3171ec002feeSBruce M Simpson  */
3172ec002feeSBruce M Simpson static int
3173ec002feeSBruce M Simpson if_delmulti_locked(struct ifnet *ifp, struct ifmultiaddr *ifma, int detaching)
3174ec002feeSBruce M Simpson {
3175ec002feeSBruce M Simpson 	struct ifmultiaddr *ll_ifma;
3176ec002feeSBruce M Simpson 
3177ec002feeSBruce M Simpson 	if (ifp != NULL && ifma->ifma_ifp != NULL) {
3178ec002feeSBruce M Simpson 		KASSERT(ifma->ifma_ifp == ifp,
3179ec002feeSBruce M Simpson 		    ("%s: inconsistent ifp %p", __func__, ifp));
3180137f91e8SJohn Baldwin 		IF_ADDR_WLOCK_ASSERT(ifp);
3181ec002feeSBruce M Simpson 	}
3182ec002feeSBruce M Simpson 
3183ec002feeSBruce M Simpson 	ifp = ifma->ifma_ifp;
3184ec002feeSBruce M Simpson 
3185ec002feeSBruce M Simpson 	/*
3186ec002feeSBruce M Simpson 	 * If the ifnet is detaching, null out references to ifnet,
3187ec002feeSBruce M Simpson 	 * so that upper protocol layers will notice, and not attempt
318875ae0c01SBruce M Simpson 	 * to obtain locks for an ifnet which no longer exists. The
318975ae0c01SBruce M Simpson 	 * routing socket announcement must happen before the ifnet
319075ae0c01SBruce M Simpson 	 * instance is detached from the system.
3191ec002feeSBruce M Simpson 	 */
3192ec002feeSBruce M Simpson 	if (detaching) {
3193ec002feeSBruce M Simpson #ifdef DIAGNOSTIC
3194ec002feeSBruce M Simpson 		printf("%s: detaching ifnet instance %p\n", __func__, ifp);
3195ec002feeSBruce M Simpson #endif
319675ae0c01SBruce M Simpson 		/*
319775ae0c01SBruce M Simpson 		 * ifp may already be nulled out if we are being reentered
319875ae0c01SBruce M Simpson 		 * to delete the ll_ifma.
319975ae0c01SBruce M Simpson 		 */
320075ae0c01SBruce M Simpson 		if (ifp != NULL) {
320175ae0c01SBruce M Simpson 			rt_newmaddrmsg(RTM_DELMADDR, ifma);
3202ec002feeSBruce M Simpson 			ifma->ifma_ifp = NULL;
3203ec002feeSBruce M Simpson 		}
320475ae0c01SBruce M Simpson 	}
3205ec002feeSBruce M Simpson 
3206ec002feeSBruce M Simpson 	if (--ifma->ifma_refcount > 0)
32071158dfb7SGarrett Wollman 		return 0;
3208ec002feeSBruce M Simpson 
3209ec002feeSBruce M Simpson 	/*
3210ec002feeSBruce M Simpson 	 * If this ifma is a network-layer ifma, a link-layer ifma may
3211ec002feeSBruce M Simpson 	 * have been associated with it. Release it first if so.
3212ec002feeSBruce M Simpson 	 */
3213ec002feeSBruce M Simpson 	ll_ifma = ifma->ifma_llifma;
3214ec002feeSBruce M Simpson 	if (ll_ifma != NULL) {
3215ec002feeSBruce M Simpson 		KASSERT(ifma->ifma_lladdr != NULL,
3216ec002feeSBruce M Simpson 		    ("%s: llifma w/o lladdr", __func__));
3217ec002feeSBruce M Simpson 		if (detaching)
3218ec002feeSBruce M Simpson 			ll_ifma->ifma_ifp = NULL;	/* XXX */
3219ec002feeSBruce M Simpson 		if (--ll_ifma->ifma_refcount == 0) {
3220ec002feeSBruce M Simpson 			if (ifp != NULL) {
3221ec002feeSBruce M Simpson 				TAILQ_REMOVE(&ifp->if_multiaddrs, ll_ifma,
3222ec002feeSBruce M Simpson 				    ifma_link);
3223ec002feeSBruce M Simpson 			}
3224ec002feeSBruce M Simpson 			if_freemulti(ll_ifma);
3225ec002feeSBruce M Simpson 		}
3226ec002feeSBruce M Simpson 	}
3227ec002feeSBruce M Simpson 
3228ec002feeSBruce M Simpson 	if (ifp != NULL)
3229ec002feeSBruce M Simpson 		TAILQ_REMOVE(&ifp->if_multiaddrs, ifma, ifma_link);
3230ec002feeSBruce M Simpson 
3231ec002feeSBruce M Simpson 	if_freemulti(ifma);
3232ec002feeSBruce M Simpson 
3233ec002feeSBruce M Simpson 	/*
3234ec002feeSBruce M Simpson 	 * The last reference to this instance of struct ifmultiaddr
3235ec002feeSBruce M Simpson 	 * was released; the hardware should be notified of this change.
3236ec002feeSBruce M Simpson 	 */
3237ec002feeSBruce M Simpson 	return 1;
32381158dfb7SGarrett Wollman }
32391158dfb7SGarrett Wollman 
324066ce51ceSArchie Cobbs /*
324166ce51ceSArchie Cobbs  * Set the link layer address on an interface.
324266ce51ceSArchie Cobbs  *
324366ce51ceSArchie Cobbs  * At this time we only support certain types of interfaces,
324466ce51ceSArchie Cobbs  * and we don't allow the length of the address to change.
324566ce51ceSArchie Cobbs  */
324666ce51ceSArchie Cobbs int
324766ce51ceSArchie Cobbs if_setlladdr(struct ifnet *ifp, const u_char *lladdr, int len)
324866ce51ceSArchie Cobbs {
324966ce51ceSArchie Cobbs 	struct sockaddr_dl *sdl;
325066ce51ceSArchie Cobbs 	struct ifaddr *ifa;
3251d637e989SPeter Wemm 	struct ifreq ifr;
325266ce51ceSArchie Cobbs 
3253137f91e8SJohn Baldwin 	IF_ADDR_RLOCK(ifp);
32544a0d6638SRuslan Ermilov 	ifa = ifp->if_addr;
32553baaf297SRobert Watson 	if (ifa == NULL) {
3256137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
325766ce51ceSArchie Cobbs 		return (EINVAL);
32583baaf297SRobert Watson 	}
32593baaf297SRobert Watson 	ifa_ref(ifa);
3260137f91e8SJohn Baldwin 	IF_ADDR_RUNLOCK(ifp);
326166ce51ceSArchie Cobbs 	sdl = (struct sockaddr_dl *)ifa->ifa_addr;
32623baaf297SRobert Watson 	if (sdl == NULL) {
32633baaf297SRobert Watson 		ifa_free(ifa);
326466ce51ceSArchie Cobbs 		return (EINVAL);
32653baaf297SRobert Watson 	}
32663baaf297SRobert Watson 	if (len != sdl->sdl_alen) {	/* don't allow length to change */
32673baaf297SRobert Watson 		ifa_free(ifa);
326866ce51ceSArchie Cobbs 		return (EINVAL);
32693baaf297SRobert Watson 	}
327066ce51ceSArchie Cobbs 	switch (ifp->if_type) {
3271d09ed26fSRuslan Ermilov 	case IFT_ETHER:
327266ce51ceSArchie Cobbs 	case IFT_FDDI:
327366ce51ceSArchie Cobbs 	case IFT_XETHER:
327466ce51ceSArchie Cobbs 	case IFT_ISO88025:
3275b7bffa71SYaroslav Tykhiy 	case IFT_L2VLAN:
32768f867517SAndrew Thompson 	case IFT_BRIDGE:
32776cdcc159SMax Khon 	case IFT_ARCNET:
3278b47888ceSAndrew Thompson 	case IFT_IEEE8023ADLAG:
3279a51f44a7SSam Leffler 	case IFT_IEEE80211:
328066ce51ceSArchie Cobbs 		bcopy(lladdr, LLADDR(sdl), len);
32813baaf297SRobert Watson 		ifa_free(ifa);
328266ce51ceSArchie Cobbs 		break;
328366ce51ceSArchie Cobbs 	default:
32843baaf297SRobert Watson 		ifa_free(ifa);
328566ce51ceSArchie Cobbs 		return (ENODEV);
328666ce51ceSArchie Cobbs 	}
32873baaf297SRobert Watson 
328866ce51ceSArchie Cobbs 	/*
328966ce51ceSArchie Cobbs 	 * If the interface is already up, we need
329066ce51ceSArchie Cobbs 	 * to re-init it in order to reprogram its
329166ce51ceSArchie Cobbs 	 * address filter.
329266ce51ceSArchie Cobbs 	 */
329366ce51ceSArchie Cobbs 	if ((ifp->if_flags & IFF_UP) != 0) {
32941a3b6859SYaroslav Tykhiy 		if (ifp->if_ioctl) {
329566ce51ceSArchie Cobbs 			ifp->if_flags &= ~IFF_UP;
329662f76486SMaxim Sobolev 			ifr.ifr_flags = ifp->if_flags & 0xffff;
329762f76486SMaxim Sobolev 			ifr.ifr_flagshigh = ifp->if_flags >> 16;
3298ee0a4f7eSSUZUKI Shinsuke 			(*ifp->if_ioctl)(ifp, SIOCSIFFLAGS, (caddr_t)&ifr);
329966ce51ceSArchie Cobbs 			ifp->if_flags |= IFF_UP;
330062f76486SMaxim Sobolev 			ifr.ifr_flags = ifp->if_flags & 0xffff;
330162f76486SMaxim Sobolev 			ifr.ifr_flagshigh = ifp->if_flags >> 16;
3302ee0a4f7eSSUZUKI Shinsuke 			(*ifp->if_ioctl)(ifp, SIOCSIFFLAGS, (caddr_t)&ifr);
33031a3b6859SYaroslav Tykhiy 		}
3304b2c08f43SLuigi Rizzo #ifdef INET
3305b2c08f43SLuigi Rizzo 		/*
3306b2c08f43SLuigi Rizzo 		 * Also send gratuitous ARPs to notify other nodes about
3307b2c08f43SLuigi Rizzo 		 * the address change.
3308b2c08f43SLuigi Rizzo 		 */
3309b2c08f43SLuigi Rizzo 		TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) {
33104b97d7afSYaroslav Tykhiy 			if (ifa->ifa_addr->sa_family == AF_INET)
3311c0933269SPeter Wemm 				arp_ifinit(ifp, ifa);
3312b2c08f43SLuigi Rizzo 		}
3313b2c08f43SLuigi Rizzo #endif
331466ce51ceSArchie Cobbs 	}
331566ce51ceSArchie Cobbs 	return (0);
331666ce51ceSArchie Cobbs }
331766ce51ceSArchie Cobbs 
33189bf40edeSBrooks Davis /*
33199bf40edeSBrooks Davis  * The name argument must be a pointer to storage which will last as
33209bf40edeSBrooks Davis  * long as the interface does.  For physical devices, the result of
33219bf40edeSBrooks Davis  * device_get_name(dev) is a good choice and for pseudo-devices a
33229bf40edeSBrooks Davis  * static string works well.
33239bf40edeSBrooks Davis  */
33249bf40edeSBrooks Davis void
33259bf40edeSBrooks Davis if_initname(struct ifnet *ifp, const char *name, int unit)
33269bf40edeSBrooks Davis {
33279bf40edeSBrooks Davis 	ifp->if_dname = name;
33289bf40edeSBrooks Davis 	ifp->if_dunit = unit;
33299bf40edeSBrooks Davis 	if (unit != IF_DUNIT_NONE)
33309bf40edeSBrooks Davis 		snprintf(ifp->if_xname, IFNAMSIZ, "%s%d", name, unit);
33319bf40edeSBrooks Davis 	else
33329bf40edeSBrooks Davis 		strlcpy(ifp->if_xname, name, IFNAMSIZ);
33339bf40edeSBrooks Davis }
33349bf40edeSBrooks Davis 
3335fa882e87SBrooks Davis int
3336fa882e87SBrooks Davis if_printf(struct ifnet *ifp, const char * fmt, ...)
3337fa882e87SBrooks Davis {
3338fa882e87SBrooks Davis 	va_list ap;
3339fa882e87SBrooks Davis 	int retval;
3340fa882e87SBrooks Davis 
33419bf40edeSBrooks Davis 	retval = printf("%s: ", ifp->if_xname);
3342fa882e87SBrooks Davis 	va_start(ap, fmt);
3343fa882e87SBrooks Davis 	retval += vprintf(fmt, ap);
3344fa882e87SBrooks Davis 	va_end(ap);
3345fa882e87SBrooks Davis 	return (retval);
3346fa882e87SBrooks Davis }
3347fa882e87SBrooks Davis 
3348af5e59bfSRobert Watson void
3349af5e59bfSRobert Watson if_start(struct ifnet *ifp)
3350af5e59bfSRobert Watson {
3351af5e59bfSRobert Watson 
3352af5e59bfSRobert Watson 	(*(ifp)->if_start)(ifp);
3353af5e59bfSRobert Watson }
3354af5e59bfSRobert Watson 
/*
 * Backwards compatibility transmit routine for drivers that have not
 * implemented their own: pass the mbuf to IFQ_HANDOFF() and return the
 * status that macro stores.
 */
static int
if_transmit(struct ifnet *ifp, struct mbuf *m)
{
	int status;

	IFQ_HANDOFF(ifp, m, status);
	return (status);
}
3367db7f0b97SKip Macy 
33680b762445SRobert Watson int
33690b762445SRobert Watson if_handoff(struct ifqueue *ifq, struct mbuf *m, struct ifnet *ifp, int adjust)
33700b762445SRobert Watson {
33710b762445SRobert Watson 	int active = 0;
33720b762445SRobert Watson 
33730b762445SRobert Watson 	IF_LOCK(ifq);
33740b762445SRobert Watson 	if (_IF_QFULL(ifq)) {
33750b762445SRobert Watson 		_IF_DROP(ifq);
33760b762445SRobert Watson 		IF_UNLOCK(ifq);
33770b762445SRobert Watson 		m_freem(m);
33780b762445SRobert Watson 		return (0);
33790b762445SRobert Watson 	}
33800b762445SRobert Watson 	if (ifp != NULL) {
33810b762445SRobert Watson 		ifp->if_obytes += m->m_pkthdr.len + adjust;
33820b762445SRobert Watson 		if (m->m_flags & (M_BCAST|M_MCAST))
33830b762445SRobert Watson 			ifp->if_omcasts++;
3384292ee7beSRobert Watson 		active = ifp->if_drv_flags & IFF_DRV_OACTIVE;
33850b762445SRobert Watson 	}
33860b762445SRobert Watson 	_IF_ENQUEUE(ifq, m);
33870b762445SRobert Watson 	IF_UNLOCK(ifq);
33880b762445SRobert Watson 	if (ifp != NULL && !active)
3389e5adda3dSRobert Watson 		(*(ifp)->if_start)(ifp);
33900b762445SRobert Watson 	return (1);
33910b762445SRobert Watson }
3392fc74a9f9SBrooks Davis 
3393fc74a9f9SBrooks Davis void
3394fc74a9f9SBrooks Davis if_register_com_alloc(u_char type,
3395fc74a9f9SBrooks Davis     if_com_alloc_t *a, if_com_free_t *f)
3396fc74a9f9SBrooks Davis {
3397fc74a9f9SBrooks Davis 
3398fc74a9f9SBrooks Davis 	KASSERT(if_com_alloc[type] == NULL,
3399fc74a9f9SBrooks Davis 	    ("if_register_com_alloc: %d already registered", type));
3400fc74a9f9SBrooks Davis 	KASSERT(if_com_free[type] == NULL,
3401fc74a9f9SBrooks Davis 	    ("if_register_com_alloc: %d free already registered", type));
3402fc74a9f9SBrooks Davis 
3403fc74a9f9SBrooks Davis 	if_com_alloc[type] = a;
3404fc74a9f9SBrooks Davis 	if_com_free[type] = f;
3405fc74a9f9SBrooks Davis }
3406fc74a9f9SBrooks Davis 
3407fc74a9f9SBrooks Davis void
3408fc74a9f9SBrooks Davis if_deregister_com_alloc(u_char type)
3409fc74a9f9SBrooks Davis {
3410fc74a9f9SBrooks Davis 
3411affcaf78SMax Khon 	KASSERT(if_com_alloc[type] != NULL,
3412fc74a9f9SBrooks Davis 	    ("if_deregister_com_alloc: %d not registered", type));
3413affcaf78SMax Khon 	KASSERT(if_com_free[type] != NULL,
3414fc74a9f9SBrooks Davis 	    ("if_deregister_com_alloc: %d free not registered", type));
3415fc74a9f9SBrooks Davis 	if_com_alloc[type] = NULL;
3416fc74a9f9SBrooks Davis 	if_com_free[type] = NULL;
3417fc74a9f9SBrooks Davis }
3418