xref: /freebsd/sys/net/rtsock.c (revision 2d70c0ded1b1d6a066b246d07c4d2b1324fd7d93)
1c398230bSWarner Losh /*-
2df8bae1dSRodney W. Grimes  * Copyright (c) 1988, 1991, 1993
3df8bae1dSRodney W. Grimes  *	The Regents of the University of California.  All rights reserved.
4df8bae1dSRodney W. Grimes  *
5df8bae1dSRodney W. Grimes  * Redistribution and use in source and binary forms, with or without
6df8bae1dSRodney W. Grimes  * modification, are permitted provided that the following conditions
7df8bae1dSRodney W. Grimes  * are met:
8df8bae1dSRodney W. Grimes  * 1. Redistributions of source code must retain the above copyright
9df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer.
10df8bae1dSRodney W. Grimes  * 2. Redistributions in binary form must reproduce the above copyright
11df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer in the
12df8bae1dSRodney W. Grimes  *    documentation and/or other materials provided with the distribution.
13df8bae1dSRodney W. Grimes  * 4. Neither the name of the University nor the names of its contributors
14df8bae1dSRodney W. Grimes  *    may be used to endorse or promote products derived from this software
15df8bae1dSRodney W. Grimes  *    without specific prior written permission.
16df8bae1dSRodney W. Grimes  *
17df8bae1dSRodney W. Grimes  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
18df8bae1dSRodney W. Grimes  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19df8bae1dSRodney W. Grimes  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20df8bae1dSRodney W. Grimes  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
21df8bae1dSRodney W. Grimes  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22df8bae1dSRodney W. Grimes  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23df8bae1dSRodney W. Grimes  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24df8bae1dSRodney W. Grimes  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25df8bae1dSRodney W. Grimes  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26df8bae1dSRodney W. Grimes  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27df8bae1dSRodney W. Grimes  * SUCH DAMAGE.
28df8bae1dSRodney W. Grimes  *
2928070a0eSRuslan Ermilov  *	@(#)rtsock.c	8.7 (Berkeley) 10/12/95
30c3aac50fSPeter Wemm  * $FreeBSD$
31df8bae1dSRodney W. Grimes  */
32427a928aSKonstantin Belousov #include "opt_compat.h"
33e440aed9SQing Li #include "opt_mpath.h"
34413628a7SBjoern A. Zeeb #include "opt_inet.h"
35413628a7SBjoern A. Zeeb #include "opt_inet6.h"
36e440aed9SQing Li 
37df8bae1dSRodney W. Grimes #include <sys/param.h>
38960ed29cSSeigo Tanimura #include <sys/jail.h>
39413628a7SBjoern A. Zeeb #include <sys/kernel.h>
40d0728d71SRobert Watson #include <sys/domain.h>
41609ff41fSWarner Losh #include <sys/lock.h>
424d1d4912SBruce Evans #include <sys/malloc.h>
43df8bae1dSRodney W. Grimes #include <sys/mbuf.h>
44acd3428bSRobert Watson #include <sys/priv.h>
45960ed29cSSeigo Tanimura #include <sys/proc.h>
46960ed29cSSeigo Tanimura #include <sys/protosw.h>
473120b9d4SKip Macy #include <sys/rwlock.h>
48960ed29cSSeigo Tanimura #include <sys/signalvar.h>
49df8bae1dSRodney W. Grimes #include <sys/socket.h>
50df8bae1dSRodney W. Grimes #include <sys/socketvar.h>
51960ed29cSSeigo Tanimura #include <sys/sysctl.h>
52960ed29cSSeigo Tanimura #include <sys/systm.h>
53df8bae1dSRodney W. Grimes 
54df8bae1dSRodney W. Grimes #include <net/if.h>
5576039bc8SGleb Smirnoff #include <net/if_var.h>
568eca593cSQing Li #include <net/if_dl.h>
576e6b3f7cSQing Li #include <net/if_llatbl.h>
580ed6142bSQing Li #include <net/if_types.h>
59d989c7b3SRobert Watson #include <net/netisr.h>
60df8bae1dSRodney W. Grimes #include <net/raw_cb.h>
61960ed29cSSeigo Tanimura #include <net/route.h>
624b79449eSBjoern A. Zeeb #include <net/vnet.h>
63df8bae1dSRodney W. Grimes 
645a59cefcSBosko Milekic #include <netinet/in.h>
65c7ab6602SQing Li #include <netinet/if_ether.h>
6608b68b0eSGleb Smirnoff #include <netinet/ip_carp.h>
67413628a7SBjoern A. Zeeb #ifdef INET6
680bebb544SHiroki Sato #include <netinet6/ip6_var.h>
69413628a7SBjoern A. Zeeb #include <netinet6/scope6_var.h>
70413628a7SBjoern A. Zeeb #endif
715a59cefcSBosko Milekic 
72427a928aSKonstantin Belousov #ifdef COMPAT_FREEBSD32
73427a928aSKonstantin Belousov #include <sys/mount.h>
74427a928aSKonstantin Belousov #include <compat/freebsd32/freebsd32.h>
75427a928aSKonstantin Belousov 
76427a928aSKonstantin Belousov struct if_msghdr32 {
77427a928aSKonstantin Belousov 	uint16_t ifm_msglen;
78427a928aSKonstantin Belousov 	uint8_t	ifm_version;
79427a928aSKonstantin Belousov 	uint8_t	ifm_type;
80427a928aSKonstantin Belousov 	int32_t	ifm_addrs;
81427a928aSKonstantin Belousov 	int32_t	ifm_flags;
82427a928aSKonstantin Belousov 	uint16_t ifm_index;
83b245f96cSGleb Smirnoff 	struct	if_data ifm_data;
84427a928aSKonstantin Belousov };
856d076ae8SBjoern A. Zeeb 
866d076ae8SBjoern A. Zeeb struct if_msghdrl32 {
876d076ae8SBjoern A. Zeeb 	uint16_t ifm_msglen;
886d076ae8SBjoern A. Zeeb 	uint8_t	ifm_version;
896d076ae8SBjoern A. Zeeb 	uint8_t	ifm_type;
906d076ae8SBjoern A. Zeeb 	int32_t	ifm_addrs;
916d076ae8SBjoern A. Zeeb 	int32_t	ifm_flags;
926d076ae8SBjoern A. Zeeb 	uint16_t ifm_index;
936d076ae8SBjoern A. Zeeb 	uint16_t _ifm_spare1;
946d076ae8SBjoern A. Zeeb 	uint16_t ifm_len;
956d076ae8SBjoern A. Zeeb 	uint16_t ifm_data_off;
96b245f96cSGleb Smirnoff 	struct	if_data ifm_data;
976d076ae8SBjoern A. Zeeb };
986d076ae8SBjoern A. Zeeb 
996d076ae8SBjoern A. Zeeb struct ifa_msghdrl32 {
1006d076ae8SBjoern A. Zeeb 	uint16_t ifam_msglen;
1016d076ae8SBjoern A. Zeeb 	uint8_t	ifam_version;
1026d076ae8SBjoern A. Zeeb 	uint8_t	ifam_type;
1036d076ae8SBjoern A. Zeeb 	int32_t	ifam_addrs;
1046d076ae8SBjoern A. Zeeb 	int32_t	ifam_flags;
1056d076ae8SBjoern A. Zeeb 	uint16_t ifam_index;
1066d076ae8SBjoern A. Zeeb 	uint16_t _ifam_spare1;
1076d076ae8SBjoern A. Zeeb 	uint16_t ifam_len;
1086d076ae8SBjoern A. Zeeb 	uint16_t ifam_data_off;
1096d076ae8SBjoern A. Zeeb 	int32_t	ifam_metric;
110b245f96cSGleb Smirnoff 	struct	if_data ifam_data;
1116d076ae8SBjoern A. Zeeb };
1126d076ae8SBjoern A. Zeeb #endif /* COMPAT_FREEBSD32 */
113427a928aSKonstantin Belousov 
114a1c995b6SPoul-Henning Kamp MALLOC_DEFINE(M_RTABLE, "routetbl", "routing tables");
115a1c995b6SPoul-Henning Kamp 
116becc44d7SSam Leffler /* NB: these are not modified */
11752041295SPoul-Henning Kamp static struct	sockaddr route_src = { 2, PF_ROUTE, };
118076d0761SJulian Elischer static struct	sockaddr sa_zero   = { sizeof(sa_zero), AF_INET, };
119becc44d7SSam Leffler 
12008b68b0eSGleb Smirnoff /* These are external hooks for CARP. */
12108b68b0eSGleb Smirnoff int	(*carp_get_vhid_p)(struct ifaddr *);
12208b68b0eSGleb Smirnoff 
123528737fdSBjoern A. Zeeb /*
124528737fdSBjoern A. Zeeb  * Used by rtsock/raw_input callback code to decide whether to filter the update
125528737fdSBjoern A. Zeeb  * notification to a socket bound to a particular FIB.
126528737fdSBjoern A. Zeeb  */
127528737fdSBjoern A. Zeeb #define	RTS_FILTER_FIB	M_PROTO8
128528737fdSBjoern A. Zeeb 
/*
 * Counters of attached routing sockets.  rts_attach() bumps them and
 * rts_detach() drops them, both under RTSOCK_LOCK().
 */
typedef struct {
	int	ip_count;	/* sockets attached with AF_INET */
	int	ip6_count;	/* sockets attached with AF_INET6 */
	int	any_count;	/* all attached sockets */
} route_cb_t;
134c5d4eab6SMarko Zec static VNET_DEFINE(route_cb_t, route_cb);
135c5d4eab6SMarko Zec #define	V_route_cb VNET(route_cb)
136df8bae1dSRodney W. Grimes 
137aea8b30fSSam Leffler struct mtx rtsock_mtx;
138aea8b30fSSam Leffler MTX_SYSINIT(rtsock, &rtsock_mtx, "rtsock route_cb lock", MTX_DEF);
139aea8b30fSSam Leffler 
140aea8b30fSSam Leffler #define	RTSOCK_LOCK()	mtx_lock(&rtsock_mtx)
141aea8b30fSSam Leffler #define	RTSOCK_UNLOCK()	mtx_unlock(&rtsock_mtx)
142aea8b30fSSam Leffler #define	RTSOCK_LOCK_ASSERT()	mtx_assert(&rtsock_mtx, MA_OWNED)
143aea8b30fSSam Leffler 
1446472ac3dSEd Schouten static SYSCTL_NODE(_net, OID_AUTO, route, CTLFLAG_RD, 0, "");
145190a4c94SRobert Watson 
146df8bae1dSRodney W. Grimes struct walkarg {
14752041295SPoul-Henning Kamp 	int	w_tmemsize;
14852041295SPoul-Henning Kamp 	int	w_op, w_arg;
14952041295SPoul-Henning Kamp 	caddr_t	w_tmem;
15052041295SPoul-Henning Kamp 	struct sysctl_req *w_req;
151df8bae1dSRodney W. Grimes };
152df8bae1dSRodney W. Grimes 
153d989c7b3SRobert Watson static void	rts_input(struct mbuf *m);
1545dfc91d7SLuigi Rizzo static struct mbuf *rt_msg1(int type, struct rt_addrinfo *rtinfo);
1555dfc91d7SLuigi Rizzo static int	rt_msg2(int type, struct rt_addrinfo *rtinfo,
1565dfc91d7SLuigi Rizzo 			caddr_t cp, struct walkarg *w);
1575dfc91d7SLuigi Rizzo static int	rt_xaddrs(caddr_t cp, caddr_t cplim,
1585dfc91d7SLuigi Rizzo 			struct rt_addrinfo *rtinfo);
159929ddbbbSAlfred Perlstein static int	sysctl_dumpentry(struct radix_node *rn, void *vw);
160929ddbbbSAlfred Perlstein static int	sysctl_iflist(int af, struct walkarg *w);
16105b2efe0SBruce M Simpson static int	sysctl_ifmalist(int af, struct walkarg *w);
1625dfc91d7SLuigi Rizzo static int	route_output(struct mbuf *m, struct socket *so);
163e3a7aa6fSGleb Smirnoff static void	rt_setmetrics(const struct rt_msghdr *rtm, struct rtentry *rt);
164e3a7aa6fSGleb Smirnoff static void	rt_getmetrics(const struct rtentry *rt, struct rt_metrics *out);
1653ca1a2d6SMax Laier static void	rt_dispatch(struct mbuf *, sa_family_t);
166df8bae1dSRodney W. Grimes 
167d4b5cae4SRobert Watson static struct netisr_handler rtsock_nh = {
168d4b5cae4SRobert Watson 	.nh_name = "rtsock",
169d4b5cae4SRobert Watson 	.nh_handler = rts_input,
170d4b5cae4SRobert Watson 	.nh_proto = NETISR_ROUTE,
171d4b5cae4SRobert Watson 	.nh_policy = NETISR_POLICY_SOURCE,
172d4b5cae4SRobert Watson };
173d4b5cae4SRobert Watson 
174d4b5cae4SRobert Watson static int
175d4b5cae4SRobert Watson sysctl_route_netisr_maxqlen(SYSCTL_HANDLER_ARGS)
176d4b5cae4SRobert Watson {
177d4b5cae4SRobert Watson 	int error, qlimit;
178d4b5cae4SRobert Watson 
179d4b5cae4SRobert Watson 	netisr_getqlimit(&rtsock_nh, &qlimit);
180d4b5cae4SRobert Watson 	error = sysctl_handle_int(oidp, &qlimit, 0, req);
181d4b5cae4SRobert Watson         if (error || !req->newptr)
182d4b5cae4SRobert Watson                 return (error);
183d4b5cae4SRobert Watson 	if (qlimit < 1)
184d4b5cae4SRobert Watson 		return (EINVAL);
185d4b5cae4SRobert Watson 	return (netisr_setqlimit(&rtsock_nh, qlimit));
186d4b5cae4SRobert Watson }
187d4b5cae4SRobert Watson SYSCTL_PROC(_net_route, OID_AUTO, netisr_maxqlen, CTLTYPE_INT|CTLFLAG_RW,
188d4b5cae4SRobert Watson     0, 0, sysctl_route_netisr_maxqlen, "I",
189d4b5cae4SRobert Watson     "maximum routing socket dispatch queue length");
190d4b5cae4SRobert Watson 
191d989c7b3SRobert Watson static void
192d989c7b3SRobert Watson rts_init(void)
193d989c7b3SRobert Watson {
194b062951aSRobert Watson 	int tmp;
195d989c7b3SRobert Watson 
196b062951aSRobert Watson 	if (TUNABLE_INT_FETCH("net.route.netisr_maxqlen", &tmp))
197d4b5cae4SRobert Watson 		rtsock_nh.nh_qlimit = tmp;
198d4b5cae4SRobert Watson 	netisr_register(&rtsock_nh);
199d989c7b3SRobert Watson }
200237fdd78SRobert Watson SYSINIT(rtsock, SI_SUB_PROTO_DOMAIN, SI_ORDER_THIRD, rts_init, 0);
201d989c7b3SRobert Watson 
202528737fdSBjoern A. Zeeb static int
203528737fdSBjoern A. Zeeb raw_input_rts_cb(struct mbuf *m, struct sockproto *proto, struct sockaddr *src,
204528737fdSBjoern A. Zeeb     struct rawcb *rp)
205528737fdSBjoern A. Zeeb {
206528737fdSBjoern A. Zeeb 	int fibnum;
207528737fdSBjoern A. Zeeb 
208528737fdSBjoern A. Zeeb 	KASSERT(m != NULL, ("%s: m is NULL", __func__));
209528737fdSBjoern A. Zeeb 	KASSERT(proto != NULL, ("%s: proto is NULL", __func__));
210528737fdSBjoern A. Zeeb 	KASSERT(rp != NULL, ("%s: rp is NULL", __func__));
211528737fdSBjoern A. Zeeb 
212528737fdSBjoern A. Zeeb 	/* No filtering requested. */
213528737fdSBjoern A. Zeeb 	if ((m->m_flags & RTS_FILTER_FIB) == 0)
214528737fdSBjoern A. Zeeb 		return (0);
215528737fdSBjoern A. Zeeb 
216528737fdSBjoern A. Zeeb 	/* Check if it is a rts and the fib matches the one of the socket. */
217528737fdSBjoern A. Zeeb 	fibnum = M_GETFIB(m);
218528737fdSBjoern A. Zeeb 	if (proto->sp_family != PF_ROUTE ||
219528737fdSBjoern A. Zeeb 	    rp->rcb_socket == NULL ||
220528737fdSBjoern A. Zeeb 	    rp->rcb_socket->so_fibnum == fibnum)
221528737fdSBjoern A. Zeeb 		return (0);
222528737fdSBjoern A. Zeeb 
223528737fdSBjoern A. Zeeb 	/* Filtering requested and no match, the socket shall be skipped. */
224528737fdSBjoern A. Zeeb 	return (1);
225528737fdSBjoern A. Zeeb }
226528737fdSBjoern A. Zeeb 
227d989c7b3SRobert Watson static void
228d989c7b3SRobert Watson rts_input(struct mbuf *m)
229d989c7b3SRobert Watson {
230d989c7b3SRobert Watson 	struct sockproto route_proto;
231d989c7b3SRobert Watson 	unsigned short *family;
232d989c7b3SRobert Watson 	struct m_tag *tag;
233d989c7b3SRobert Watson 
234d989c7b3SRobert Watson 	route_proto.sp_family = PF_ROUTE;
235d989c7b3SRobert Watson 	tag = m_tag_find(m, PACKET_TAG_RTSOCKFAM, NULL);
236d989c7b3SRobert Watson 	if (tag != NULL) {
237d989c7b3SRobert Watson 		family = (unsigned short *)(tag + 1);
238d989c7b3SRobert Watson 		route_proto.sp_protocol = *family;
239d989c7b3SRobert Watson 		m_tag_delete(m, tag);
240d989c7b3SRobert Watson 	} else
241d989c7b3SRobert Watson 		route_proto.sp_protocol = 0;
242d989c7b3SRobert Watson 
243528737fdSBjoern A. Zeeb 	raw_input_ext(m, &route_proto, &route_src, raw_input_rts_cb);
244d989c7b3SRobert Watson }
245d989c7b3SRobert Watson 
246a29f300eSGarrett Wollman /*
247a29f300eSGarrett Wollman  * It really doesn't make any sense at all for this code to share much
248a29f300eSGarrett Wollman  * with raw_usrreq.c, since its functionality is so restricted.  XXX
249a29f300eSGarrett Wollman  */
250ac45e92fSRobert Watson static void
251a29f300eSGarrett Wollman rts_abort(struct socket *so)
252df8bae1dSRodney W. Grimes {
2537e994955SRobert Watson 
254ac45e92fSRobert Watson 	raw_usrreqs.pru_abort(so);
255df8bae1dSRodney W. Grimes }
256a29f300eSGarrett Wollman 
257a152f8a3SRobert Watson static void
258a152f8a3SRobert Watson rts_close(struct socket *so)
259a152f8a3SRobert Watson {
260a152f8a3SRobert Watson 
261a152f8a3SRobert Watson 	raw_usrreqs.pru_close(so);
262a152f8a3SRobert Watson }
263a152f8a3SRobert Watson 
264a29f300eSGarrett Wollman /* pru_accept is EOPNOTSUPP */
265a29f300eSGarrett Wollman 
266a29f300eSGarrett Wollman static int
267b40ce416SJulian Elischer rts_attach(struct socket *so, int proto, struct thread *td)
268a29f300eSGarrett Wollman {
269a29f300eSGarrett Wollman 	struct rawcb *rp;
270c9b652e3SAndre Oppermann 	int error;
271a29f300eSGarrett Wollman 
272bc725eafSRobert Watson 	KASSERT(so->so_pcb == NULL, ("rts_attach: so_pcb != NULL"));
273bc725eafSRobert Watson 
2747cc0979fSDavid Malone 	/* XXX */
2751ede983cSDag-Erling Smørgrav 	rp = malloc(sizeof *rp, M_PCB, M_WAITOK | M_ZERO);
2765dfc91d7SLuigi Rizzo 	if (rp == NULL)
277a29f300eSGarrett Wollman 		return ENOBUFS;
278a29f300eSGarrett Wollman 
279a29f300eSGarrett Wollman 	so->so_pcb = (caddr_t)rp;
2808b07e49aSJulian Elischer 	so->so_fibnum = td->td_proc->p_fibnum;
281162c0b2eSRuslan Ermilov 	error = raw_attach(so, proto);
282a29f300eSGarrett Wollman 	rp = sotorawcb(so);
283a29f300eSGarrett Wollman 	if (error) {
2847ba271aeSJonathan Chen 		so->so_pcb = NULL;
285a29f300eSGarrett Wollman 		free(rp, M_PCB);
286a29f300eSGarrett Wollman 		return error;
287a29f300eSGarrett Wollman 	}
288aea8b30fSSam Leffler 	RTSOCK_LOCK();
289a29f300eSGarrett Wollman 	switch(rp->rcb_proto.sp_protocol) {
290a29f300eSGarrett Wollman 	case AF_INET:
291c5d4eab6SMarko Zec 		V_route_cb.ip_count++;
292a29f300eSGarrett Wollman 		break;
293899ce4f4SYoshinobu Inoue 	case AF_INET6:
294c5d4eab6SMarko Zec 		V_route_cb.ip6_count++;
295899ce4f4SYoshinobu Inoue 		break;
296a29f300eSGarrett Wollman 	}
297c5d4eab6SMarko Zec 	V_route_cb.any_count++;
298aea8b30fSSam Leffler 	RTSOCK_UNLOCK();
29903e49181SSeigo Tanimura 	soisconnected(so);
300df8bae1dSRodney W. Grimes 	so->so_options |= SO_USELOOPBACK;
301a29f300eSGarrett Wollman 	return 0;
302df8bae1dSRodney W. Grimes }
303df8bae1dSRodney W. Grimes 
304a29f300eSGarrett Wollman static int
305b40ce416SJulian Elischer rts_bind(struct socket *so, struct sockaddr *nam, struct thread *td)
306a29f300eSGarrett Wollman {
3077e994955SRobert Watson 
3087e994955SRobert Watson 	return (raw_usrreqs.pru_bind(so, nam, td)); /* xxx just EINVAL */
309a29f300eSGarrett Wollman }
310a29f300eSGarrett Wollman 
311a29f300eSGarrett Wollman static int
312b40ce416SJulian Elischer rts_connect(struct socket *so, struct sockaddr *nam, struct thread *td)
313a29f300eSGarrett Wollman {
3147e994955SRobert Watson 
3157e994955SRobert Watson 	return (raw_usrreqs.pru_connect(so, nam, td)); /* XXX just EINVAL */
316a29f300eSGarrett Wollman }
317a29f300eSGarrett Wollman 
318a29f300eSGarrett Wollman /* pru_connect2 is EOPNOTSUPP */
319a29f300eSGarrett Wollman /* pru_control is EOPNOTSUPP */
320a29f300eSGarrett Wollman 
321bc725eafSRobert Watson static void
322a29f300eSGarrett Wollman rts_detach(struct socket *so)
323a29f300eSGarrett Wollman {
324a29f300eSGarrett Wollman 	struct rawcb *rp = sotorawcb(so);
325a29f300eSGarrett Wollman 
326bc725eafSRobert Watson 	KASSERT(rp != NULL, ("rts_detach: rp == NULL"));
327bc725eafSRobert Watson 
328aea8b30fSSam Leffler 	RTSOCK_LOCK();
329a29f300eSGarrett Wollman 	switch(rp->rcb_proto.sp_protocol) {
330a29f300eSGarrett Wollman 	case AF_INET:
331c5d4eab6SMarko Zec 		V_route_cb.ip_count--;
332a29f300eSGarrett Wollman 		break;
333899ce4f4SYoshinobu Inoue 	case AF_INET6:
334c5d4eab6SMarko Zec 		V_route_cb.ip6_count--;
335899ce4f4SYoshinobu Inoue 		break;
336a29f300eSGarrett Wollman 	}
337c5d4eab6SMarko Zec 	V_route_cb.any_count--;
338aea8b30fSSam Leffler 	RTSOCK_UNLOCK();
339bc725eafSRobert Watson 	raw_usrreqs.pru_detach(so);
340a29f300eSGarrett Wollman }
341a29f300eSGarrett Wollman 
342a29f300eSGarrett Wollman static int
343a29f300eSGarrett Wollman rts_disconnect(struct socket *so)
344a29f300eSGarrett Wollman {
3457e994955SRobert Watson 
3467e994955SRobert Watson 	return (raw_usrreqs.pru_disconnect(so));
347a29f300eSGarrett Wollman }
348a29f300eSGarrett Wollman 
349a29f300eSGarrett Wollman /* pru_listen is EOPNOTSUPP */
350a29f300eSGarrett Wollman 
351a29f300eSGarrett Wollman static int
35257bf258eSGarrett Wollman rts_peeraddr(struct socket *so, struct sockaddr **nam)
353a29f300eSGarrett Wollman {
3547e994955SRobert Watson 
3557e994955SRobert Watson 	return (raw_usrreqs.pru_peeraddr(so, nam));
356a29f300eSGarrett Wollman }
357a29f300eSGarrett Wollman 
358a29f300eSGarrett Wollman /* pru_rcvd is EOPNOTSUPP */
359a29f300eSGarrett Wollman /* pru_rcvoob is EOPNOTSUPP */
360a29f300eSGarrett Wollman 
361a29f300eSGarrett Wollman static int
36257bf258eSGarrett Wollman rts_send(struct socket *so, int flags, struct mbuf *m, struct sockaddr *nam,
363b40ce416SJulian Elischer 	 struct mbuf *control, struct thread *td)
364a29f300eSGarrett Wollman {
3657e994955SRobert Watson 
3667e994955SRobert Watson 	return (raw_usrreqs.pru_send(so, flags, m, nam, control, td));
367a29f300eSGarrett Wollman }
368a29f300eSGarrett Wollman 
369a29f300eSGarrett Wollman /* pru_sense is null */
370a29f300eSGarrett Wollman 
371a29f300eSGarrett Wollman static int
372a29f300eSGarrett Wollman rts_shutdown(struct socket *so)
373a29f300eSGarrett Wollman {
3747e994955SRobert Watson 
3757e994955SRobert Watson 	return (raw_usrreqs.pru_shutdown(so));
376a29f300eSGarrett Wollman }
377a29f300eSGarrett Wollman 
378a29f300eSGarrett Wollman static int
37957bf258eSGarrett Wollman rts_sockaddr(struct socket *so, struct sockaddr **nam)
380a29f300eSGarrett Wollman {
3817e994955SRobert Watson 
3827e994955SRobert Watson 	return (raw_usrreqs.pru_sockaddr(so, nam));
383a29f300eSGarrett Wollman }
384a29f300eSGarrett Wollman 
385a29f300eSGarrett Wollman static struct pr_usrreqs route_usrreqs = {
386756d52a1SPoul-Henning Kamp 	.pru_abort =		rts_abort,
387756d52a1SPoul-Henning Kamp 	.pru_attach =		rts_attach,
388756d52a1SPoul-Henning Kamp 	.pru_bind =		rts_bind,
389756d52a1SPoul-Henning Kamp 	.pru_connect =		rts_connect,
390756d52a1SPoul-Henning Kamp 	.pru_detach =		rts_detach,
391756d52a1SPoul-Henning Kamp 	.pru_disconnect =	rts_disconnect,
392756d52a1SPoul-Henning Kamp 	.pru_peeraddr =		rts_peeraddr,
393756d52a1SPoul-Henning Kamp 	.pru_send =		rts_send,
394756d52a1SPoul-Henning Kamp 	.pru_shutdown =		rts_shutdown,
395756d52a1SPoul-Henning Kamp 	.pru_sockaddr =		rts_sockaddr,
396a152f8a3SRobert Watson 	.pru_close =		rts_close,
397a29f300eSGarrett Wollman };
398a29f300eSGarrett Wollman 
#ifndef _SOCKADDR_UNION_DEFINED
#define	_SOCKADDR_UNION_DEFINED
/*
 * Storage able to hold any socket address format handled in this file:
 * the generic form, IPv4 and IPv6.  Guarded so that a definition made
 * elsewhere is not repeated.
 */
union sockaddr_union {
	struct sockaddr		sa;	/* generic view */
	struct sockaddr_in	sin;	/* AF_INET */
	struct sockaddr_in6	sin6;	/* AF_INET6 */
};
#endif /* _SOCKADDR_UNION_DEFINED */
410413628a7SBjoern A. Zeeb 
411413628a7SBjoern A. Zeeb static int
412413628a7SBjoern A. Zeeb rtm_get_jailed(struct rt_addrinfo *info, struct ifnet *ifp,
413413628a7SBjoern A. Zeeb     struct rtentry *rt, union sockaddr_union *saun, struct ucred *cred)
414413628a7SBjoern A. Zeeb {
415413628a7SBjoern A. Zeeb 
4169c79d243SJamie Gritton 	/* First, see if the returned address is part of the jail. */
4179c79d243SJamie Gritton 	if (prison_if(cred, rt->rt_ifa->ifa_addr) == 0) {
4189c79d243SJamie Gritton 		info->rti_info[RTAX_IFA] = rt->rt_ifa->ifa_addr;
4199c79d243SJamie Gritton 		return (0);
4209c79d243SJamie Gritton 	}
4219c79d243SJamie Gritton 
422413628a7SBjoern A. Zeeb 	switch (info->rti_info[RTAX_DST]->sa_family) {
423413628a7SBjoern A. Zeeb #ifdef INET
424413628a7SBjoern A. Zeeb 	case AF_INET:
425413628a7SBjoern A. Zeeb 	{
426413628a7SBjoern A. Zeeb 		struct in_addr ia;
427413628a7SBjoern A. Zeeb 		struct ifaddr *ifa;
428413628a7SBjoern A. Zeeb 		int found;
429413628a7SBjoern A. Zeeb 
430413628a7SBjoern A. Zeeb 		found = 0;
431413628a7SBjoern A. Zeeb 		/*
4329c79d243SJamie Gritton 		 * Try to find an address on the given outgoing interface
4339c79d243SJamie Gritton 		 * that belongs to the jail.
434413628a7SBjoern A. Zeeb 		 */
435137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
436413628a7SBjoern A. Zeeb 		TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) {
437413628a7SBjoern A. Zeeb 			struct sockaddr *sa;
438413628a7SBjoern A. Zeeb 			sa = ifa->ifa_addr;
439413628a7SBjoern A. Zeeb 			if (sa->sa_family != AF_INET)
440413628a7SBjoern A. Zeeb 				continue;
441413628a7SBjoern A. Zeeb 			ia = ((struct sockaddr_in *)sa)->sin_addr;
442b89e82ddSJamie Gritton 			if (prison_check_ip4(cred, &ia) == 0) {
443413628a7SBjoern A. Zeeb 				found = 1;
444413628a7SBjoern A. Zeeb 				break;
445413628a7SBjoern A. Zeeb 			}
446413628a7SBjoern A. Zeeb 		}
447137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
448413628a7SBjoern A. Zeeb 		if (!found) {
449413628a7SBjoern A. Zeeb 			/*
4509c79d243SJamie Gritton 			 * As a last resort return the 'default' jail address.
451413628a7SBjoern A. Zeeb 			 */
4520304c731SJamie Gritton 			ia = ((struct sockaddr_in *)rt->rt_ifa->ifa_addr)->
4530304c731SJamie Gritton 			    sin_addr;
4541cecba0fSBjoern A. Zeeb 			if (prison_get_ip4(cred, &ia) != 0)
455413628a7SBjoern A. Zeeb 				return (ESRCH);
456413628a7SBjoern A. Zeeb 		}
457413628a7SBjoern A. Zeeb 		bzero(&saun->sin, sizeof(struct sockaddr_in));
458413628a7SBjoern A. Zeeb 		saun->sin.sin_len = sizeof(struct sockaddr_in);
459413628a7SBjoern A. Zeeb 		saun->sin.sin_family = AF_INET;
460413628a7SBjoern A. Zeeb 		saun->sin.sin_addr.s_addr = ia.s_addr;
4619c79d243SJamie Gritton 		info->rti_info[RTAX_IFA] = (struct sockaddr *)&saun->sin;
462413628a7SBjoern A. Zeeb 		break;
463413628a7SBjoern A. Zeeb 	}
464413628a7SBjoern A. Zeeb #endif
465413628a7SBjoern A. Zeeb #ifdef INET6
466413628a7SBjoern A. Zeeb 	case AF_INET6:
467413628a7SBjoern A. Zeeb 	{
468413628a7SBjoern A. Zeeb 		struct in6_addr ia6;
469413628a7SBjoern A. Zeeb 		struct ifaddr *ifa;
470413628a7SBjoern A. Zeeb 		int found;
471413628a7SBjoern A. Zeeb 
472413628a7SBjoern A. Zeeb 		found = 0;
473413628a7SBjoern A. Zeeb 		/*
4749c79d243SJamie Gritton 		 * Try to find an address on the given outgoing interface
4759c79d243SJamie Gritton 		 * that belongs to the jail.
476413628a7SBjoern A. Zeeb 		 */
477137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
478413628a7SBjoern A. Zeeb 		TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) {
479413628a7SBjoern A. Zeeb 			struct sockaddr *sa;
480413628a7SBjoern A. Zeeb 			sa = ifa->ifa_addr;
481413628a7SBjoern A. Zeeb 			if (sa->sa_family != AF_INET6)
482413628a7SBjoern A. Zeeb 				continue;
483413628a7SBjoern A. Zeeb 			bcopy(&((struct sockaddr_in6 *)sa)->sin6_addr,
484413628a7SBjoern A. Zeeb 			    &ia6, sizeof(struct in6_addr));
485b89e82ddSJamie Gritton 			if (prison_check_ip6(cred, &ia6) == 0) {
486413628a7SBjoern A. Zeeb 				found = 1;
487413628a7SBjoern A. Zeeb 				break;
488413628a7SBjoern A. Zeeb 			}
489413628a7SBjoern A. Zeeb 		}
490137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
491413628a7SBjoern A. Zeeb 		if (!found) {
492413628a7SBjoern A. Zeeb 			/*
4939c79d243SJamie Gritton 			 * As a last resort return the 'default' jail address.
494413628a7SBjoern A. Zeeb 			 */
4950304c731SJamie Gritton 			ia6 = ((struct sockaddr_in6 *)rt->rt_ifa->ifa_addr)->
4960304c731SJamie Gritton 			    sin6_addr;
4971cecba0fSBjoern A. Zeeb 			if (prison_get_ip6(cred, &ia6) != 0)
498413628a7SBjoern A. Zeeb 				return (ESRCH);
499413628a7SBjoern A. Zeeb 		}
500413628a7SBjoern A. Zeeb 		bzero(&saun->sin6, sizeof(struct sockaddr_in6));
501413628a7SBjoern A. Zeeb 		saun->sin6.sin6_len = sizeof(struct sockaddr_in6);
502413628a7SBjoern A. Zeeb 		saun->sin6.sin6_family = AF_INET6;
5039c79d243SJamie Gritton 		bcopy(&ia6, &saun->sin6.sin6_addr, sizeof(struct in6_addr));
504413628a7SBjoern A. Zeeb 		if (sa6_recoverscope(&saun->sin6) != 0)
505413628a7SBjoern A. Zeeb 			return (ESRCH);
5069c79d243SJamie Gritton 		info->rti_info[RTAX_IFA] = (struct sockaddr *)&saun->sin6;
507413628a7SBjoern A. Zeeb 		break;
508413628a7SBjoern A. Zeeb 	}
509413628a7SBjoern A. Zeeb #endif
510413628a7SBjoern A. Zeeb 	default:
511413628a7SBjoern A. Zeeb 		return (ESRCH);
512413628a7SBjoern A. Zeeb 	}
513413628a7SBjoern A. Zeeb 	return (0);
514413628a7SBjoern A. Zeeb }
515413628a7SBjoern A. Zeeb 
516df8bae1dSRodney W. Grimes /*ARGSUSED*/
51752041295SPoul-Henning Kamp static int
5185dfc91d7SLuigi Rizzo route_output(struct mbuf *m, struct socket *so)
519df8bae1dSRodney W. Grimes {
520becc44d7SSam Leffler #define	sa_equal(a1, a2) (bcmp((a1), (a2), (a1)->sa_len) == 0)
5215dfc91d7SLuigi Rizzo 	struct rt_msghdr *rtm = NULL;
5225dfc91d7SLuigi Rizzo 	struct rtentry *rt = NULL;
52378a82810SGarrett Wollman 	struct radix_node_head *rnh;
524df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
5256bbfef90SHiroki Sato #ifdef INET6
5260bebb544SHiroki Sato 	struct sockaddr_storage ss;
5276bbfef90SHiroki Sato 	struct sockaddr_in6 *sin6;
5280bebb544SHiroki Sato 	int i, rti_need_deembed = 0;
5296bbfef90SHiroki Sato #endif
530df8bae1dSRodney W. Grimes 	int len, error = 0;
5315dfc91d7SLuigi Rizzo 	struct ifnet *ifp = NULL;
532413628a7SBjoern A. Zeeb 	union sockaddr_union saun;
5333ca1a2d6SMax Laier 	sa_family_t saf = AF_UNSPEC;
534df8bae1dSRodney W. Grimes 
535df8bae1dSRodney W. Grimes #define senderr(e) { error = e; goto flush;}
5365dfc91d7SLuigi Rizzo 	if (m == NULL || ((m->m_len < sizeof(long)) &&
5375dfc91d7SLuigi Rizzo 		       (m = m_pullup(m, sizeof(long))) == NULL))
538df8bae1dSRodney W. Grimes 		return (ENOBUFS);
539df8bae1dSRodney W. Grimes 	if ((m->m_flags & M_PKTHDR) == 0)
540df8bae1dSRodney W. Grimes 		panic("route_output");
541df8bae1dSRodney W. Grimes 	len = m->m_pkthdr.len;
542df8bae1dSRodney W. Grimes 	if (len < sizeof(*rtm) ||
543df8bae1dSRodney W. Grimes 	    len != mtod(m, struct rt_msghdr *)->rtm_msglen) {
5445dfc91d7SLuigi Rizzo 		info.rti_info[RTAX_DST] = NULL;
545df8bae1dSRodney W. Grimes 		senderr(EINVAL);
546df8bae1dSRodney W. Grimes 	}
547df8bae1dSRodney W. Grimes 	R_Malloc(rtm, struct rt_msghdr *, len);
5485dfc91d7SLuigi Rizzo 	if (rtm == NULL) {
5495dfc91d7SLuigi Rizzo 		info.rti_info[RTAX_DST] = NULL;
550df8bae1dSRodney W. Grimes 		senderr(ENOBUFS);
551df8bae1dSRodney W. Grimes 	}
552df8bae1dSRodney W. Grimes 	m_copydata(m, 0, len, (caddr_t)rtm);
553df8bae1dSRodney W. Grimes 	if (rtm->rtm_version != RTM_VERSION) {
5545dfc91d7SLuigi Rizzo 		info.rti_info[RTAX_DST] = NULL;
555df8bae1dSRodney W. Grimes 		senderr(EPROTONOSUPPORT);
556df8bae1dSRodney W. Grimes 	}
557df8bae1dSRodney W. Grimes 	rtm->rtm_pid = curproc->p_pid;
5588071913dSRuslan Ermilov 	bzero(&info, sizeof(info));
559df8bae1dSRodney W. Grimes 	info.rti_addrs = rtm->rtm_addrs;
5600bebb544SHiroki Sato 	/*
5610bebb544SHiroki Sato 	 * rt_xaddrs() performs s6_addr[2] := sin6_scope_id for AF_INET6
5620bebb544SHiroki Sato 	 * link-local address because rtrequest requires addresses with
5630bebb544SHiroki Sato 	 * embedded scope id.
5640bebb544SHiroki Sato 	 */
565076d0761SJulian Elischer 	if (rt_xaddrs((caddr_t)(rtm + 1), len + (caddr_t)rtm, &info)) {
5665dfc91d7SLuigi Rizzo 		info.rti_info[RTAX_DST] = NULL;
567076d0761SJulian Elischer 		senderr(EINVAL);
568076d0761SJulian Elischer 	}
5698071913dSRuslan Ermilov 	info.rti_flags = rtm->rtm_flags;
5705dfc91d7SLuigi Rizzo 	if (info.rti_info[RTAX_DST] == NULL ||
571becc44d7SSam Leffler 	    info.rti_info[RTAX_DST]->sa_family >= AF_MAX ||
5725dfc91d7SLuigi Rizzo 	    (info.rti_info[RTAX_GATEWAY] != NULL &&
573becc44d7SSam Leffler 	     info.rti_info[RTAX_GATEWAY]->sa_family >= AF_MAX))
574df8bae1dSRodney W. Grimes 		senderr(EINVAL);
5753ca1a2d6SMax Laier 	saf = info.rti_info[RTAX_DST]->sa_family;
576162c0b2eSRuslan Ermilov 	/*
577162c0b2eSRuslan Ermilov 	 * Verify that the caller has the appropriate privilege; RTM_GET
578162c0b2eSRuslan Ermilov 	 * is the only operation the non-superuser is allowed.
579162c0b2eSRuslan Ermilov 	 */
580acd3428bSRobert Watson 	if (rtm->rtm_type != RTM_GET) {
581acd3428bSRobert Watson 		error = priv_check(curthread, PRIV_NET_ROUTE);
582acd3428bSRobert Watson 		if (error)
583dadb6c3bSRuslan Ermilov 			senderr(error);
584acd3428bSRobert Watson 	}
585162c0b2eSRuslan Ermilov 
5869231d35fSQing Li 	/*
5879231d35fSQing Li 	 * The given gateway address may be an interface address.
5889231d35fSQing Li 	 * For example, issuing a "route change" command on a route
5899231d35fSQing Li 	 * entry that was created from a tunnel, and the gateway
5909231d35fSQing Li 	 * address given is the local end point. In this case the
5919231d35fSQing Li 	 * RTF_GATEWAY flag must be cleared or the destination will
5929231d35fSQing Li 	 * not be reachable even though there is no error message.
5939231d35fSQing Li 	 */
5949231d35fSQing Li 	if (info.rti_info[RTAX_GATEWAY] != NULL &&
5959231d35fSQing Li 	    info.rti_info[RTAX_GATEWAY]->sa_family != AF_LINK) {
5969231d35fSQing Li 		struct route gw_ro;
5979231d35fSQing Li 
5989231d35fSQing Li 		bzero(&gw_ro, sizeof(gw_ro));
5999231d35fSQing Li 		gw_ro.ro_dst = *info.rti_info[RTAX_GATEWAY];
6005311e988SQing Li 		rtalloc_ign_fib(&gw_ro, 0, so->so_fibnum);
6019231d35fSQing Li 		/*
6029231d35fSQing Li 		 * A host route through the loopback interface is
6039231d35fSQing Li 		 * installed for each interface adddress. In pre 8.0
6049231d35fSQing Li 		 * releases the interface address of a PPP link type
6059231d35fSQing Li 		 * is not reachable locally. This behavior is fixed as
6069231d35fSQing Li 		 * part of the new L2/L3 redesign and rewrite work. The
6079231d35fSQing Li 		 * signature of this interface address route is the
6089231d35fSQing Li 		 * AF_LINK sa_family type of the rt_gateway, and the
6099231d35fSQing Li 		 * rt_ifp has the IFF_LOOPBACK flag set.
6109231d35fSQing Li 		 */
6119231d35fSQing Li 		if (gw_ro.ro_rt != NULL &&
6129231d35fSQing Li 		    gw_ro.ro_rt->rt_gateway->sa_family == AF_LINK &&
613f672f56fSQing Li 		    gw_ro.ro_rt->rt_ifp->if_flags & IFF_LOOPBACK) {
6149231d35fSQing Li 			info.rti_flags &= ~RTF_GATEWAY;
615f672f56fSQing Li 			info.rti_flags |= RTF_GWFLAG_COMPAT;
616f672f56fSQing Li 		}
6179231d35fSQing Li 		if (gw_ro.ro_rt != NULL)
6189231d35fSQing Li 			RTFREE(gw_ro.ro_rt);
6199231d35fSQing Li 	}
6209231d35fSQing Li 
621df8bae1dSRodney W. Grimes 	switch (rtm->rtm_type) {
622becc44d7SSam Leffler 		struct rtentry *saved_nrt;
623df8bae1dSRodney W. Grimes 
624df8bae1dSRodney W. Grimes 	case RTM_ADD:
6255dfc91d7SLuigi Rizzo 		if (info.rti_info[RTAX_GATEWAY] == NULL)
626df8bae1dSRodney W. Grimes 			senderr(EINVAL);
6275dfc91d7SLuigi Rizzo 		saved_nrt = NULL;
6288eca593cSQing Li 
6296e6b3f7cSQing Li 		/* support for new ARP code */
6308eca593cSQing Li 		if (info.rti_info[RTAX_GATEWAY]->sa_family == AF_LINK &&
6318eca593cSQing Li 		    (rtm->rtm_flags & RTF_LLDATA) != 0) {
6326e6b3f7cSQing Li 			error = lla_rt_output(rtm, &info);
6330bebb544SHiroki Sato #ifdef INET6
6340bebb544SHiroki Sato 			if (error == 0)
6350bebb544SHiroki Sato 				rti_need_deembed = (V_deembed_scopeid) ? 1 : 0;
6360bebb544SHiroki Sato #endif
6376e6b3f7cSQing Li 			break;
6386e6b3f7cSQing Li 		}
6398b07e49aSJulian Elischer 		error = rtrequest1_fib(RTM_ADD, &info, &saved_nrt,
6408b07e49aSJulian Elischer 		    so->so_fibnum);
641df8bae1dSRodney W. Grimes 		if (error == 0 && saved_nrt) {
6420bebb544SHiroki Sato #ifdef INET6
6430bebb544SHiroki Sato 			rti_need_deembed = (V_deembed_scopeid) ? 1 : 0;
6440bebb544SHiroki Sato #endif
645d1dd20beSSam Leffler 			RT_LOCK(saved_nrt);
646e3a7aa6fSGleb Smirnoff 			rt_setmetrics(rtm, saved_nrt);
64722cafcf0SAndre Oppermann 			rtm->rtm_index = saved_nrt->rt_ifp->if_index;
6487138d65cSSam Leffler 			RT_REMREF(saved_nrt);
649d1dd20beSSam Leffler 			RT_UNLOCK(saved_nrt);
650df8bae1dSRodney W. Grimes 		}
651df8bae1dSRodney W. Grimes 		break;
652df8bae1dSRodney W. Grimes 
653df8bae1dSRodney W. Grimes 	case RTM_DELETE:
6545dfc91d7SLuigi Rizzo 		saved_nrt = NULL;
6556e6b3f7cSQing Li 		/* support for new ARP code */
6566e6b3f7cSQing Li 		if (info.rti_info[RTAX_GATEWAY] &&
6578eca593cSQing Li 		    (info.rti_info[RTAX_GATEWAY]->sa_family == AF_LINK) &&
6588eca593cSQing Li 		    (rtm->rtm_flags & RTF_LLDATA) != 0) {
6596e6b3f7cSQing Li 			error = lla_rt_output(rtm, &info);
6600bebb544SHiroki Sato #ifdef INET6
6610bebb544SHiroki Sato 			if (error == 0)
6620bebb544SHiroki Sato 				rti_need_deembed = (V_deembed_scopeid) ? 1 : 0;
6630bebb544SHiroki Sato #endif
6646e6b3f7cSQing Li 			break;
6656e6b3f7cSQing Li 		}
6668b07e49aSJulian Elischer 		error = rtrequest1_fib(RTM_DELETE, &info, &saved_nrt,
6678b07e49aSJulian Elischer 		    so->so_fibnum);
66878a82810SGarrett Wollman 		if (error == 0) {
669d1dd20beSSam Leffler 			RT_LOCK(saved_nrt);
67071eba915SRuslan Ermilov 			rt = saved_nrt;
67178a82810SGarrett Wollman 			goto report;
67278a82810SGarrett Wollman 		}
6730bebb544SHiroki Sato #ifdef INET6
6740bebb544SHiroki Sato 		/* rt_msg2() will not be used when RTM_DELETE fails. */
6750bebb544SHiroki Sato 		rti_need_deembed = (V_deembed_scopeid) ? 1 : 0;
6760bebb544SHiroki Sato #endif
677df8bae1dSRodney W. Grimes 		break;
678df8bae1dSRodney W. Grimes 
679df8bae1dSRodney W. Grimes 	case RTM_GET:
680df8bae1dSRodney W. Grimes 	case RTM_CHANGE:
681df8bae1dSRodney W. Grimes 	case RTM_LOCK:
682c2c2a7c1SBjoern A. Zeeb 		rnh = rt_tables_get_rnh(so->so_fibnum,
683c2c2a7c1SBjoern A. Zeeb 		    info.rti_info[RTAX_DST]->sa_family);
6845dfc91d7SLuigi Rizzo 		if (rnh == NULL)
68578a82810SGarrett Wollman 			senderr(EAFNOSUPPORT);
6865a2f4cbdSAlexander V. Chernikov 
6873120b9d4SKip Macy 		RADIX_NODE_HEAD_RLOCK(rnh);
6885a2f4cbdSAlexander V. Chernikov 
6895a2f4cbdSAlexander V. Chernikov 		if (info.rti_info[RTAX_NETMASK] == NULL &&
6905a2f4cbdSAlexander V. Chernikov 		    rtm->rtm_type == RTM_GET) {
6915a2f4cbdSAlexander V. Chernikov 			/*
6925a2f4cbdSAlexander V. Chernikov 			 * Provide logest prefix match for
6935a2f4cbdSAlexander V. Chernikov 			 * address lookup (no mask).
6945a2f4cbdSAlexander V. Chernikov 			 * 'route -n get addr'
6955a2f4cbdSAlexander V. Chernikov 			 */
6965a2f4cbdSAlexander V. Chernikov 			rt = (struct rtentry *) rnh->rnh_matchaddr(
6975a2f4cbdSAlexander V. Chernikov 			    info.rti_info[RTAX_DST], rnh);
6985a2f4cbdSAlexander V. Chernikov 		} else
6995a2f4cbdSAlexander V. Chernikov 			rt = (struct rtentry *) rnh->rnh_lookup(
7005a2f4cbdSAlexander V. Chernikov 			    info.rti_info[RTAX_DST],
701becc44d7SSam Leffler 			    info.rti_info[RTAX_NETMASK], rnh);
7025a2f4cbdSAlexander V. Chernikov 
7035a2f4cbdSAlexander V. Chernikov 		if (rt == NULL) {
7043120b9d4SKip Macy 			RADIX_NODE_HEAD_RUNLOCK(rnh);
705df8bae1dSRodney W. Grimes 			senderr(ESRCH);
70679188861SGleb Smirnoff 		}
707e440aed9SQing Li #ifdef RADIX_MPATH
708e440aed9SQing Li 		/*
709e440aed9SQing Li 		 * for RTM_CHANGE/LOCK, if we got multipath routes,
710e440aed9SQing Li 		 * we require users to specify a matching RTAX_GATEWAY.
711e440aed9SQing Li 		 *
712e440aed9SQing Li 		 * for RTM_GET, gate is optional even with multipath.
713e440aed9SQing Li 		 * if gate == NULL the first match is returned.
714e440aed9SQing Li 		 * (no need to call rt_mpath_matchgate if gate == NULL)
715e440aed9SQing Li 		 */
716e440aed9SQing Li 		if (rn_mpath_capable(rnh) &&
717e440aed9SQing Li 		    (rtm->rtm_type != RTM_GET || info.rti_info[RTAX_GATEWAY])) {
718e440aed9SQing Li 			rt = rt_mpath_matchgate(rt, info.rti_info[RTAX_GATEWAY]);
719e440aed9SQing Li 			if (!rt) {
7203120b9d4SKip Macy 				RADIX_NODE_HEAD_RUNLOCK(rnh);
721e440aed9SQing Li 				senderr(ESRCH);
722e440aed9SQing Li 			}
723e440aed9SQing Li 		}
724e440aed9SQing Li #endif
725c7ab6602SQing Li 		/*
726c7ab6602SQing Li 		 * If performing proxied L2 entry insertion, and
727c7ab6602SQing Li 		 * the actual PPP host entry is found, perform
728c7ab6602SQing Li 		 * another search to retrieve the prefix route of
729c7ab6602SQing Li 		 * the local end point of the PPP link.
730c7ab6602SQing Li 		 */
7310ed6142bSQing Li 		if (rtm->rtm_flags & RTF_ANNOUNCE) {
732c7ab6602SQing Li 			struct sockaddr laddr;
7330ed6142bSQing Li 
7340ed6142bSQing Li 			if (rt->rt_ifp != NULL &&
7350ed6142bSQing Li 			    rt->rt_ifp->if_type == IFT_PROPVIRTUAL) {
7360ed6142bSQing Li 				struct ifaddr *ifa;
7370ed6142bSQing Li 
7380ed6142bSQing Li 				ifa = ifa_ifwithnet(info.rti_info[RTAX_DST], 1);
7390ed6142bSQing Li 				if (ifa != NULL)
7400ed6142bSQing Li 					rt_maskedcopy(ifa->ifa_addr,
7410ed6142bSQing Li 						      &laddr,
7420ed6142bSQing Li 						      ifa->ifa_netmask);
7430ed6142bSQing Li 			} else
744c7ab6602SQing Li 				rt_maskedcopy(rt->rt_ifa->ifa_addr,
745c7ab6602SQing Li 					      &laddr,
746c7ab6602SQing Li 					      rt->rt_ifa->ifa_netmask);
747c7ab6602SQing Li 			/*
748c7ab6602SQing Li 			 * refactor rt and no lock operation necessary
749c7ab6602SQing Li 			 */
750c7ab6602SQing Li 			rt = (struct rtentry *)rnh->rnh_matchaddr(&laddr, rnh);
751c7ab6602SQing Li 			if (rt == NULL) {
752c7ab6602SQing Li 				RADIX_NODE_HEAD_RUNLOCK(rnh);
753c7ab6602SQing Li 				senderr(ESRCH);
754c7ab6602SQing Li 			}
755c7ab6602SQing Li 		}
756d1dd20beSSam Leffler 		RT_LOCK(rt);
7577138d65cSSam Leffler 		RT_ADDREF(rt);
7583120b9d4SKip Macy 		RADIX_NODE_HEAD_RUNLOCK(rnh);
759956b0b65SJeffrey Hsu 
760df8bae1dSRodney W. Grimes 		switch(rtm->rtm_type) {
761df8bae1dSRodney W. Grimes 
762df8bae1dSRodney W. Grimes 		case RTM_GET:
76378a82810SGarrett Wollman 		report:
764d1dd20beSSam Leffler 			RT_LOCK_ASSERT(rt);
765b89e82ddSJamie Gritton 			if ((rt->rt_flags & RTF_HOST) == 0
766de0bd6f7SBjoern A. Zeeb 			    ? jailed_without_vnet(curthread->td_ucred)
767b89e82ddSJamie Gritton 			    : prison_if(curthread->td_ucred,
768b89e82ddSJamie Gritton 			    rt_key(rt)) != 0) {
769813dd6aeSBjoern A. Zeeb 				RT_UNLOCK(rt);
770813dd6aeSBjoern A. Zeeb 				senderr(ESRCH);
771813dd6aeSBjoern A. Zeeb 			}
772becc44d7SSam Leffler 			info.rti_info[RTAX_DST] = rt_key(rt);
773becc44d7SSam Leffler 			info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
774becc44d7SSam Leffler 			info.rti_info[RTAX_NETMASK] = rt_mask(rt);
7756e6b3f7cSQing Li 			info.rti_info[RTAX_GENMASK] = 0;
776df8bae1dSRodney W. Grimes 			if (rtm->rtm_addrs & (RTA_IFP | RTA_IFA)) {
777df440948SPoul-Henning Kamp 				ifp = rt->rt_ifp;
778df440948SPoul-Henning Kamp 				if (ifp) {
7799b98ee2cSLuigi Rizzo 					info.rti_info[RTAX_IFP] =
7804a0d6638SRuslan Ermilov 					    ifp->if_addr->ifa_addr;
7819c79d243SJamie Gritton 					error = rtm_get_jailed(&info, ifp, rt,
7829c79d243SJamie Gritton 					    &saun, curthread->td_ucred);
783413628a7SBjoern A. Zeeb 					if (error != 0) {
784413628a7SBjoern A. Zeeb 						RT_UNLOCK(rt);
7859c79d243SJamie Gritton 						senderr(error);
786413628a7SBjoern A. Zeeb 					}
78728070a0eSRuslan Ermilov 					if (ifp->if_flags & IFF_POINTOPOINT)
788becc44d7SSam Leffler 						info.rti_info[RTAX_BRD] =
789becc44d7SSam Leffler 						    rt->rt_ifa->ifa_dstaddr;
790df8bae1dSRodney W. Grimes 					rtm->rtm_index = ifp->if_index;
791df8bae1dSRodney W. Grimes 				} else {
7925dfc91d7SLuigi Rizzo 					info.rti_info[RTAX_IFP] = NULL;
7935dfc91d7SLuigi Rizzo 					info.rti_info[RTAX_IFA] = NULL;
794df8bae1dSRodney W. Grimes 				}
79525029d6cSHartmut Brandt 			} else if ((ifp = rt->rt_ifp) != NULL) {
79625029d6cSHartmut Brandt 				rtm->rtm_index = ifp->if_index;
797df8bae1dSRodney W. Grimes 			}
798913af518SLuigi Rizzo 			len = rt_msg2(rtm->rtm_type, &info, NULL, NULL);
799df8bae1dSRodney W. Grimes 			if (len > rtm->rtm_msglen) {
800df8bae1dSRodney W. Grimes 				struct rt_msghdr *new_rtm;
801df8bae1dSRodney W. Grimes 				R_Malloc(new_rtm, struct rt_msghdr *, len);
8025dfc91d7SLuigi Rizzo 				if (new_rtm == NULL) {
803d1dd20beSSam Leffler 					RT_UNLOCK(rt);
804df8bae1dSRodney W. Grimes 					senderr(ENOBUFS);
805becc44d7SSam Leffler 				}
8066b96f1afSLuigi Rizzo 				bcopy(rtm, new_rtm, rtm->rtm_msglen);
807df8bae1dSRodney W. Grimes 				Free(rtm); rtm = new_rtm;
808df8bae1dSRodney W. Grimes 			}
809913af518SLuigi Rizzo 			(void)rt_msg2(rtm->rtm_type, &info, (caddr_t)rtm, NULL);
810f672f56fSQing Li 			if (rt->rt_flags & RTF_GWFLAG_COMPAT)
811f672f56fSQing Li 				rtm->rtm_flags = RTF_GATEWAY |
812f672f56fSQing Li 					(rt->rt_flags & ~RTF_GWFLAG_COMPAT);
813f672f56fSQing Li 			else
814df8bae1dSRodney W. Grimes 				rtm->rtm_flags = rt->rt_flags;
815e3a7aa6fSGleb Smirnoff 			rt_getmetrics(rt, &rtm->rtm_rmx);
816df8bae1dSRodney W. Grimes 			rtm->rtm_addrs = info.rti_addrs;
817df8bae1dSRodney W. Grimes 			break;
818df8bae1dSRodney W. Grimes 
819df8bae1dSRodney W. Grimes 		case RTM_CHANGE:
820becc44d7SSam Leffler 			/*
821becc44d7SSam Leffler 			 * New gateway could require new ifaddr, ifp;
822becc44d7SSam Leffler 			 * flags may also be different; ifp may be specified
823becc44d7SSam Leffler 			 * by ll sockaddr when protocol address is ambiguous
824becc44d7SSam Leffler 			 */
825becc44d7SSam Leffler 			if (((rt->rt_flags & RTF_GATEWAY) &&
826becc44d7SSam Leffler 			     info.rti_info[RTAX_GATEWAY] != NULL) ||
827becc44d7SSam Leffler 			    info.rti_info[RTAX_IFP] != NULL ||
828becc44d7SSam Leffler 			    (info.rti_info[RTAX_IFA] != NULL &&
829becc44d7SSam Leffler 			     !sa_equal(info.rti_info[RTAX_IFA],
830becc44d7SSam Leffler 				       rt->rt_ifa->ifa_addr))) {
831d1dd20beSSam Leffler 				RT_UNLOCK(rt);
8329b20205dSKip Macy 				RADIX_NODE_HEAD_LOCK(rnh);
833a5a3926cSAndrew Thompson 				error = rt_getifa_fib(&info, rt->rt_fibnum);
8348c0fec80SRobert Watson 				/*
8358c0fec80SRobert Watson 				 * XXXRW: Really we should release this
8368c0fec80SRobert Watson 				 * reference later, but this maintains
8378c0fec80SRobert Watson 				 * historical behavior.
8388c0fec80SRobert Watson 				 */
8398c0fec80SRobert Watson 				if (info.rti_ifa != NULL)
8408c0fec80SRobert Watson 					ifa_free(info.rti_ifa);
8419b20205dSKip Macy 				RADIX_NODE_HEAD_UNLOCK(rnh);
842a5a3926cSAndrew Thompson 				if (error != 0)
843a5a3926cSAndrew Thompson 					senderr(error);
844a11faa9fSGleb Smirnoff 				RT_LOCK(rt);
845becc44d7SSam Leffler 			}
8465de55821SGleb Smirnoff 			if (info.rti_ifa != NULL &&
8475de55821SGleb Smirnoff 			    info.rti_ifa != rt->rt_ifa &&
8485de55821SGleb Smirnoff 			    rt->rt_ifa != NULL &&
8499406b274SGleb Smirnoff 			    rt->rt_ifa->ifa_rtrequest != NULL) {
8509406b274SGleb Smirnoff 				rt->rt_ifa->ifa_rtrequest(RTM_DELETE, rt,
8519406b274SGleb Smirnoff 				    &info);
8521099f828SRobert Watson 				ifa_free(rt->rt_ifa);
8539406b274SGleb Smirnoff 			}
8549406b274SGleb Smirnoff 			if (info.rti_info[RTAX_GATEWAY] != NULL) {
8559b20205dSKip Macy 				RT_UNLOCK(rt);
8569b20205dSKip Macy 				RADIX_NODE_HEAD_LOCK(rnh);
8579b20205dSKip Macy 				RT_LOCK(rt);
8589b20205dSKip Macy 
8599b20205dSKip Macy 				error = rt_setgate(rt, rt_key(rt),
8609b20205dSKip Macy 				    info.rti_info[RTAX_GATEWAY]);
8619b20205dSKip Macy 				RADIX_NODE_HEAD_UNLOCK(rnh);
8629b20205dSKip Macy 				if (error != 0) {
863d1dd20beSSam Leffler 					RT_UNLOCK(rt);
8648071913dSRuslan Ermilov 					senderr(error);
865becc44d7SSam Leffler 				}
866f672f56fSQing Li 				rt->rt_flags &= ~RTF_GATEWAY;
8679231d35fSQing Li 				rt->rt_flags |= (RTF_GATEWAY & info.rti_flags);
86819fc74fbSJeffrey Hsu 			}
8695de55821SGleb Smirnoff 			if (info.rti_ifa != NULL &&
8705de55821SGleb Smirnoff 			    info.rti_ifa != rt->rt_ifa) {
8711099f828SRobert Watson 				ifa_ref(info.rti_ifa);
8725de55821SGleb Smirnoff 				rt->rt_ifa = info.rti_ifa;
8738071913dSRuslan Ermilov 				rt->rt_ifp = info.rti_ifp;
874df8bae1dSRodney W. Grimes 			}
87522cafcf0SAndre Oppermann 			/* Allow some flags to be toggled on change. */
876427ac07fSKip Macy 			rt->rt_flags = (rt->rt_flags & ~RTF_FMASK) |
877427ac07fSKip Macy 				    (rtm->rtm_flags & RTF_FMASK);
878e3a7aa6fSGleb Smirnoff 			rt_setmetrics(rtm, rt);
87922cafcf0SAndre Oppermann 			rtm->rtm_index = rt->rt_ifp->if_index;
880df8bae1dSRodney W. Grimes 			if (rt->rt_ifa && rt->rt_ifa->ifa_rtrequest)
8818071913dSRuslan Ermilov 			       rt->rt_ifa->ifa_rtrequest(RTM_ADD, rt, &info);
88293b0017fSPhilippe Charnier 			/* FALLTHROUGH */
883df8bae1dSRodney W. Grimes 		case RTM_LOCK:
88497d8d152SAndre Oppermann 			/* We don't support locks anymore */
885df8bae1dSRodney W. Grimes 			break;
886df8bae1dSRodney W. Grimes 		}
887d1dd20beSSam Leffler 		RT_UNLOCK(rt);
888df8bae1dSRodney W. Grimes 		break;
889df8bae1dSRodney W. Grimes 
890df8bae1dSRodney W. Grimes 	default:
891df8bae1dSRodney W. Grimes 		senderr(EOPNOTSUPP);
892df8bae1dSRodney W. Grimes 	}
893df8bae1dSRodney W. Grimes 
894df8bae1dSRodney W. Grimes flush:
895df8bae1dSRodney W. Grimes 	if (rtm) {
896df8bae1dSRodney W. Grimes 		if (error)
897df8bae1dSRodney W. Grimes 			rtm->rtm_errno = error;
898df8bae1dSRodney W. Grimes 		else
899df8bae1dSRodney W. Grimes 			rtm->rtm_flags |= RTF_DONE;
900df8bae1dSRodney W. Grimes 	}
901becc44d7SSam Leffler 	if (rt)		/* XXX can this be true? */
902becc44d7SSam Leffler 		RTFREE(rt);
903df8bae1dSRodney W. Grimes     {
9045dfc91d7SLuigi Rizzo 	struct rawcb *rp = NULL;
905df8bae1dSRodney W. Grimes 	/*
906df8bae1dSRodney W. Grimes 	 * Check to see if we don't want our own messages.
907df8bae1dSRodney W. Grimes 	 */
908df8bae1dSRodney W. Grimes 	if ((so->so_options & SO_USELOOPBACK) == 0) {
909c5d4eab6SMarko Zec 		if (V_route_cb.any_count <= 1) {
910df8bae1dSRodney W. Grimes 			if (rtm)
911df8bae1dSRodney W. Grimes 				Free(rtm);
912df8bae1dSRodney W. Grimes 			m_freem(m);
913df8bae1dSRodney W. Grimes 			return (error);
914df8bae1dSRodney W. Grimes 		}
915df8bae1dSRodney W. Grimes 		/* There is another listener, so construct message */
916df8bae1dSRodney W. Grimes 		rp = sotorawcb(so);
9174cc20ab1SSeigo Tanimura 	}
918df8bae1dSRodney W. Grimes 	if (rtm) {
9190bebb544SHiroki Sato #ifdef INET6
9200bebb544SHiroki Sato 		if (rti_need_deembed) {
9210bebb544SHiroki Sato 			/* sin6_scope_id is recovered before sending rtm. */
9220bebb544SHiroki Sato 			sin6 = (struct sockaddr_in6 *)&ss;
92312bdf23aSHiroki Sato 			for (i = 0; i < RTAX_MAX; i++) {
9240bebb544SHiroki Sato 				if (info.rti_info[i] == NULL)
9250bebb544SHiroki Sato 					continue;
9260bebb544SHiroki Sato 				if (info.rti_info[i]->sa_family != AF_INET6)
9270bebb544SHiroki Sato 					continue;
9280bebb544SHiroki Sato 				bcopy(info.rti_info[i], sin6, sizeof(*sin6));
9290bebb544SHiroki Sato 				if (sa6_recoverscope(sin6) == 0)
9300bebb544SHiroki Sato 					bcopy(sin6, info.rti_info[i],
9310bebb544SHiroki Sato 						    sizeof(*sin6));
9320bebb544SHiroki Sato 			}
9330bebb544SHiroki Sato 		}
9340bebb544SHiroki Sato #endif
935df8bae1dSRodney W. Grimes 		m_copyback(m, 0, rtm->rtm_msglen, (caddr_t)rtm);
93603311056SHajimu UMEMOTO 		if (m->m_pkthdr.len < rtm->rtm_msglen) {
93703311056SHajimu UMEMOTO 			m_freem(m);
93803311056SHajimu UMEMOTO 			m = NULL;
93903311056SHajimu UMEMOTO 		} else if (m->m_pkthdr.len > rtm->rtm_msglen)
94003311056SHajimu UMEMOTO 			m_adj(m, rtm->rtm_msglen - m->m_pkthdr.len);
941df8bae1dSRodney W. Grimes 	}
942becc44d7SSam Leffler 	if (m) {
943528737fdSBjoern A. Zeeb 		M_SETFIB(m, so->so_fibnum);
944528737fdSBjoern A. Zeeb 		m->m_flags |= RTS_FILTER_FIB;
945becc44d7SSam Leffler 		if (rp) {
946becc44d7SSam Leffler 			/*
947becc44d7SSam Leffler 			 * XXX insure we don't get a copy by
948becc44d7SSam Leffler 			 * invalidating our protocol
949becc44d7SSam Leffler 			 */
950becc44d7SSam Leffler 			unsigned short family = rp->rcb_proto.sp_family;
951becc44d7SSam Leffler 			rp->rcb_proto.sp_family = 0;
9523ca1a2d6SMax Laier 			rt_dispatch(m, saf);
953becc44d7SSam Leffler 			rp->rcb_proto.sp_family = family;
954becc44d7SSam Leffler 		} else
9553ca1a2d6SMax Laier 			rt_dispatch(m, saf);
956becc44d7SSam Leffler 	}
957826bf287SMax Laier 	/* info.rti_info[RTAX_DST] (used above) can point inside of rtm */
958826bf287SMax Laier 	if (rtm)
959826bf287SMax Laier 		Free(rtm);
960df8bae1dSRodney W. Grimes     }
961df8bae1dSRodney W. Grimes 	return (error);
962becc44d7SSam Leffler #undef	sa_equal
963df8bae1dSRodney W. Grimes }
964df8bae1dSRodney W. Grimes 
96552041295SPoul-Henning Kamp static void
966e3a7aa6fSGleb Smirnoff rt_setmetrics(const struct rt_msghdr *rtm, struct rtentry *rt)
967df8bae1dSRodney W. Grimes {
968e3a7aa6fSGleb Smirnoff 
969e3a7aa6fSGleb Smirnoff 	if (rtm->rtm_inits & RTV_MTU)
970e3a7aa6fSGleb Smirnoff 		rt->rt_mtu = rtm->rtm_rmx.rmx_mtu;
971e3a7aa6fSGleb Smirnoff 	if (rtm->rtm_inits & RTV_WEIGHT)
972e3a7aa6fSGleb Smirnoff 		rt->rt_weight = rtm->rtm_rmx.rmx_weight;
973e3a7aa6fSGleb Smirnoff 	/* Kernel -> userland timebase conversion. */
974e3a7aa6fSGleb Smirnoff 	if (rtm->rtm_inits & RTV_EXPIRE)
975e3a7aa6fSGleb Smirnoff 		rt->rt_expire = rtm->rtm_rmx.rmx_expire ?
976e3a7aa6fSGleb Smirnoff 		    rtm->rtm_rmx.rmx_expire - time_second + time_uptime : 0;
977df8bae1dSRodney W. Grimes }
978df8bae1dSRodney W. Grimes 
97997d8d152SAndre Oppermann static void
980e3a7aa6fSGleb Smirnoff rt_getmetrics(const struct rtentry *rt, struct rt_metrics *out)
98197d8d152SAndre Oppermann {
982e3a7aa6fSGleb Smirnoff 
98397d8d152SAndre Oppermann 	bzero(out, sizeof(*out));
984e3a7aa6fSGleb Smirnoff 	out->rmx_mtu = rt->rt_mtu;
985e3a7aa6fSGleb Smirnoff 	out->rmx_weight = rt->rt_weight;
986e3a7aa6fSGleb Smirnoff 	out->rmx_pksent = counter_u64_fetch(rt->rt_pksent);
987e27c3f48SOleg Bulyzhin 	/* Kernel -> userland timebase conversion. */
988e3a7aa6fSGleb Smirnoff 	out->rmx_expire = rt->rt_expire ?
989e3a7aa6fSGleb Smirnoff 	    rt->rt_expire - time_uptime + time_second : 0;
99097d8d152SAndre Oppermann }
99197d8d152SAndre Oppermann 
9927f33a738SJulian Elischer /*
9937f33a738SJulian Elischer  * Extract the addresses of the passed sockaddrs.
9947f33a738SJulian Elischer  * Do a little sanity checking so as to avoid bad memory references.
995076d0761SJulian Elischer  * This data is derived straight from userland.
9967f33a738SJulian Elischer  */
997076d0761SJulian Elischer static int
998becc44d7SSam Leffler rt_xaddrs(caddr_t cp, caddr_t cplim, struct rt_addrinfo *rtinfo)
999df8bae1dSRodney W. Grimes {
1000e74642dfSLuigi Rizzo 	struct sockaddr *sa;
1001e74642dfSLuigi Rizzo 	int i;
1002df8bae1dSRodney W. Grimes 
1003becc44d7SSam Leffler 	for (i = 0; i < RTAX_MAX && cp < cplim; i++) {
1004df8bae1dSRodney W. Grimes 		if ((rtinfo->rti_addrs & (1 << i)) == 0)
1005df8bae1dSRodney W. Grimes 			continue;
1006ff6d0a59SJulian Elischer 		sa = (struct sockaddr *)cp;
10077f33a738SJulian Elischer 		/*
1008076d0761SJulian Elischer 		 * It won't fit.
10097f33a738SJulian Elischer 		 */
1010becc44d7SSam Leffler 		if (cp + sa->sa_len > cplim)
1011076d0761SJulian Elischer 			return (EINVAL);
10127f33a738SJulian Elischer 		/*
10137f33a738SJulian Elischer 		 * there are no more.. quit now
10147f33a738SJulian Elischer 		 * If there are more bits, they are in error.
10157f33a738SJulian Elischer 		 * I've seen this. route(1) can evidently generate these.
10167f33a738SJulian Elischer 		 * This causes kernel to core dump.
1017076d0761SJulian Elischer 		 * for compatibility, If we see this, point to a safe address.
10187f33a738SJulian Elischer 		 */
1019076d0761SJulian Elischer 		if (sa->sa_len == 0) {
1020076d0761SJulian Elischer 			rtinfo->rti_info[i] = &sa_zero;
1021076d0761SJulian Elischer 			return (0); /* should be EINVAL but for compat */
1022df8bae1dSRodney W. Grimes 		}
1023076d0761SJulian Elischer 		/* accept it */
10240bebb544SHiroki Sato #ifdef INET6
10250bebb544SHiroki Sato 		if (sa->sa_family == AF_INET6)
10260bebb544SHiroki Sato 			sa6_embedscope((struct sockaddr_in6 *)sa,
10270bebb544SHiroki Sato 			    V_ip6_use_defzone);
10280bebb544SHiroki Sato #endif
1029076d0761SJulian Elischer 		rtinfo->rti_info[i] = sa;
1030e74642dfSLuigi Rizzo 		cp += SA_SIZE(sa);
1031076d0761SJulian Elischer 	}
1032076d0761SJulian Elischer 	return (0);
1033df8bae1dSRodney W. Grimes }
1034df8bae1dSRodney W. Grimes 
10356d076ae8SBjoern A. Zeeb /*
10366d076ae8SBjoern A. Zeeb  * Used by the routing socket.
10376d076ae8SBjoern A. Zeeb  */
1038df8bae1dSRodney W. Grimes static struct mbuf *
1039becc44d7SSam Leffler rt_msg1(int type, struct rt_addrinfo *rtinfo)
1040df8bae1dSRodney W. Grimes {
10415dfc91d7SLuigi Rizzo 	struct rt_msghdr *rtm;
10425dfc91d7SLuigi Rizzo 	struct mbuf *m;
10435dfc91d7SLuigi Rizzo 	int i;
10445dfc91d7SLuigi Rizzo 	struct sockaddr *sa;
10456bbfef90SHiroki Sato #ifdef INET6
10466bbfef90SHiroki Sato 	struct sockaddr_storage ss;
10476bbfef90SHiroki Sato 	struct sockaddr_in6 *sin6;
10486bbfef90SHiroki Sato #endif
1049df8bae1dSRodney W. Grimes 	int len, dlen;
1050df8bae1dSRodney W. Grimes 
1051df8bae1dSRodney W. Grimes 	switch (type) {
1052df8bae1dSRodney W. Grimes 
1053df8bae1dSRodney W. Grimes 	case RTM_DELADDR:
1054df8bae1dSRodney W. Grimes 	case RTM_NEWADDR:
1055df8bae1dSRodney W. Grimes 		len = sizeof(struct ifa_msghdr);
1056df8bae1dSRodney W. Grimes 		break;
1057df8bae1dSRodney W. Grimes 
1058477180fbSGarrett Wollman 	case RTM_DELMADDR:
1059477180fbSGarrett Wollman 	case RTM_NEWMADDR:
1060477180fbSGarrett Wollman 		len = sizeof(struct ifma_msghdr);
1061477180fbSGarrett Wollman 		break;
1062477180fbSGarrett Wollman 
1063df8bae1dSRodney W. Grimes 	case RTM_IFINFO:
1064df8bae1dSRodney W. Grimes 		len = sizeof(struct if_msghdr);
1065df8bae1dSRodney W. Grimes 		break;
1066df8bae1dSRodney W. Grimes 
10677b6edd04SRuslan Ermilov 	case RTM_IFANNOUNCE:
1068b83a279fSSam Leffler 	case RTM_IEEE80211:
10697b6edd04SRuslan Ermilov 		len = sizeof(struct if_announcemsghdr);
10707b6edd04SRuslan Ermilov 		break;
10717b6edd04SRuslan Ermilov 
1072df8bae1dSRodney W. Grimes 	default:
1073df8bae1dSRodney W. Grimes 		len = sizeof(struct rt_msghdr);
1074df8bae1dSRodney W. Grimes 	}
1075c69f77c3SGleb Smirnoff 
1076c69f77c3SGleb Smirnoff 	/* XXXGL: can we use MJUMPAGESIZE cluster here? */
1077c69f77c3SGleb Smirnoff 	KASSERT(len <= MCLBYTES, ("%s: message too big", __func__));
1078c69f77c3SGleb Smirnoff 	if (len > MHLEN)
1079c69f77c3SGleb Smirnoff 		m = m_getcl(M_NOWAIT, MT_DATA, M_PKTHDR);
1080c69f77c3SGleb Smirnoff 	else
1081eb1b1807SGleb Smirnoff 		m = m_gethdr(M_NOWAIT, MT_DATA);
10825dfc91d7SLuigi Rizzo 	if (m == NULL)
108333841545SHajimu UMEMOTO 		return (m);
1084c69f77c3SGleb Smirnoff 
1085df8bae1dSRodney W. Grimes 	m->m_pkthdr.len = m->m_len = len;
1086df8bae1dSRodney W. Grimes 	rtm = mtod(m, struct rt_msghdr *);
1087df8bae1dSRodney W. Grimes 	bzero((caddr_t)rtm, len);
1088df8bae1dSRodney W. Grimes 	for (i = 0; i < RTAX_MAX; i++) {
1089df8bae1dSRodney W. Grimes 		if ((sa = rtinfo->rti_info[i]) == NULL)
1090df8bae1dSRodney W. Grimes 			continue;
1091df8bae1dSRodney W. Grimes 		rtinfo->rti_addrs |= (1 << i);
1092e74642dfSLuigi Rizzo 		dlen = SA_SIZE(sa);
10936bbfef90SHiroki Sato #ifdef INET6
10945c9fa630SHiroki Sato 		if (V_deembed_scopeid && sa->sa_family == AF_INET6) {
10956bbfef90SHiroki Sato 			sin6 = (struct sockaddr_in6 *)&ss;
10966bbfef90SHiroki Sato 			bcopy(sa, sin6, sizeof(*sin6));
10976bbfef90SHiroki Sato 			if (sa6_recoverscope(sin6) == 0)
10986bbfef90SHiroki Sato 				sa = (struct sockaddr *)sin6;
10996bbfef90SHiroki Sato 		}
11006bbfef90SHiroki Sato #endif
1101df8bae1dSRodney W. Grimes 		m_copyback(m, len, dlen, (caddr_t)sa);
1102df8bae1dSRodney W. Grimes 		len += dlen;
1103df8bae1dSRodney W. Grimes 	}
1104df8bae1dSRodney W. Grimes 	if (m->m_pkthdr.len != len) {
1105df8bae1dSRodney W. Grimes 		m_freem(m);
1106df8bae1dSRodney W. Grimes 		return (NULL);
1107df8bae1dSRodney W. Grimes 	}
1108df8bae1dSRodney W. Grimes 	rtm->rtm_msglen = len;
1109df8bae1dSRodney W. Grimes 	rtm->rtm_version = RTM_VERSION;
1110df8bae1dSRodney W. Grimes 	rtm->rtm_type = type;
1111df8bae1dSRodney W. Grimes 	return (m);
1112df8bae1dSRodney W. Grimes }
1113df8bae1dSRodney W. Grimes 
11146d076ae8SBjoern A. Zeeb /*
11156d076ae8SBjoern A. Zeeb  * Used by the sysctl code and routing socket.
11166d076ae8SBjoern A. Zeeb  */
1117df8bae1dSRodney W. Grimes static int
1118becc44d7SSam Leffler rt_msg2(int type, struct rt_addrinfo *rtinfo, caddr_t cp, struct walkarg *w)
1119df8bae1dSRodney W. Grimes {
11205dfc91d7SLuigi Rizzo 	int i;
1121df8bae1dSRodney W. Grimes 	int len, dlen, second_time = 0;
1122df8bae1dSRodney W. Grimes 	caddr_t cp0;
11236bbfef90SHiroki Sato #ifdef INET6
11246bbfef90SHiroki Sato 	struct sockaddr_storage ss;
11256bbfef90SHiroki Sato 	struct sockaddr_in6 *sin6;
11266bbfef90SHiroki Sato #endif
1127df8bae1dSRodney W. Grimes 
1128df8bae1dSRodney W. Grimes 	rtinfo->rti_addrs = 0;
1129df8bae1dSRodney W. Grimes again:
1130df8bae1dSRodney W. Grimes 	switch (type) {
1131df8bae1dSRodney W. Grimes 
1132df8bae1dSRodney W. Grimes 	case RTM_DELADDR:
1133df8bae1dSRodney W. Grimes 	case RTM_NEWADDR:
11346d076ae8SBjoern A. Zeeb 		if (w != NULL && w->w_op == NET_RT_IFLISTL) {
11356d076ae8SBjoern A. Zeeb #ifdef COMPAT_FREEBSD32
11366d076ae8SBjoern A. Zeeb 			if (w->w_req->flags & SCTL_MASK32)
11376d076ae8SBjoern A. Zeeb 				len = sizeof(struct ifa_msghdrl32);
11386d076ae8SBjoern A. Zeeb 			else
11396d076ae8SBjoern A. Zeeb #endif
11406d076ae8SBjoern A. Zeeb 				len = sizeof(struct ifa_msghdrl);
11416d076ae8SBjoern A. Zeeb 		} else
1142df8bae1dSRodney W. Grimes 			len = sizeof(struct ifa_msghdr);
1143df8bae1dSRodney W. Grimes 		break;
1144df8bae1dSRodney W. Grimes 
1145df8bae1dSRodney W. Grimes 	case RTM_IFINFO:
1146427a928aSKonstantin Belousov #ifdef COMPAT_FREEBSD32
1147427a928aSKonstantin Belousov 		if (w != NULL && w->w_req->flags & SCTL_MASK32) {
11486d076ae8SBjoern A. Zeeb 			if (w->w_op == NET_RT_IFLISTL)
11496d076ae8SBjoern A. Zeeb 				len = sizeof(struct if_msghdrl32);
11506d076ae8SBjoern A. Zeeb 			else
1151427a928aSKonstantin Belousov 				len = sizeof(struct if_msghdr32);
1152427a928aSKonstantin Belousov 			break;
1153427a928aSKonstantin Belousov 		}
1154427a928aSKonstantin Belousov #endif
11556d076ae8SBjoern A. Zeeb 		if (w != NULL && w->w_op == NET_RT_IFLISTL)
11566d076ae8SBjoern A. Zeeb 			len = sizeof(struct if_msghdrl);
11576d076ae8SBjoern A. Zeeb 		else
1158df8bae1dSRodney W. Grimes 			len = sizeof(struct if_msghdr);
1159df8bae1dSRodney W. Grimes 		break;
1160df8bae1dSRodney W. Grimes 
116105b2efe0SBruce M Simpson 	case RTM_NEWMADDR:
116205b2efe0SBruce M Simpson 		len = sizeof(struct ifma_msghdr);
116305b2efe0SBruce M Simpson 		break;
116405b2efe0SBruce M Simpson 
1165df8bae1dSRodney W. Grimes 	default:
1166df8bae1dSRodney W. Grimes 		len = sizeof(struct rt_msghdr);
1167df8bae1dSRodney W. Grimes 	}
1168df440948SPoul-Henning Kamp 	cp0 = cp;
1169df440948SPoul-Henning Kamp 	if (cp0)
1170df8bae1dSRodney W. Grimes 		cp += len;
1171df8bae1dSRodney W. Grimes 	for (i = 0; i < RTAX_MAX; i++) {
11725dfc91d7SLuigi Rizzo 		struct sockaddr *sa;
1173df8bae1dSRodney W. Grimes 
11745dfc91d7SLuigi Rizzo 		if ((sa = rtinfo->rti_info[i]) == NULL)
1175df8bae1dSRodney W. Grimes 			continue;
1176df8bae1dSRodney W. Grimes 		rtinfo->rti_addrs |= (1 << i);
1177e74642dfSLuigi Rizzo 		dlen = SA_SIZE(sa);
11780bebb544SHiroki Sato 		if (cp) {
11796bbfef90SHiroki Sato #ifdef INET6
11805c9fa630SHiroki Sato 			if (V_deembed_scopeid && sa->sa_family == AF_INET6) {
11816bbfef90SHiroki Sato 				sin6 = (struct sockaddr_in6 *)&ss;
11826bbfef90SHiroki Sato 				bcopy(sa, sin6, sizeof(*sin6));
11836bbfef90SHiroki Sato 				if (sa6_recoverscope(sin6) == 0)
11846bbfef90SHiroki Sato 					sa = (struct sockaddr *)sin6;
11856bbfef90SHiroki Sato 			}
11866bbfef90SHiroki Sato #endif
1187df8bae1dSRodney W. Grimes 			bcopy((caddr_t)sa, cp, (unsigned)dlen);
1188df8bae1dSRodney W. Grimes 			cp += dlen;
1189df8bae1dSRodney W. Grimes 		}
1190df8bae1dSRodney W. Grimes 		len += dlen;
1191df8bae1dSRodney W. Grimes 	}
1192694ff264SAndrew Gallatin 	len = ALIGN(len);
11935dfc91d7SLuigi Rizzo 	if (cp == NULL && w != NULL && !second_time) {
11945dfc91d7SLuigi Rizzo 		struct walkarg *rw = w;
1195df8bae1dSRodney W. Grimes 
119652041295SPoul-Henning Kamp 		if (rw->w_req) {
1197df8bae1dSRodney W. Grimes 			if (rw->w_tmemsize < len) {
1198df8bae1dSRodney W. Grimes 				if (rw->w_tmem)
1199df8bae1dSRodney W. Grimes 					free(rw->w_tmem, M_RTABLE);
1200df440948SPoul-Henning Kamp 				rw->w_tmem = (caddr_t)
1201df440948SPoul-Henning Kamp 					malloc(len, M_RTABLE, M_NOWAIT);
1202df440948SPoul-Henning Kamp 				if (rw->w_tmem)
1203df8bae1dSRodney W. Grimes 					rw->w_tmemsize = len;
1204df8bae1dSRodney W. Grimes 			}
1205df8bae1dSRodney W. Grimes 			if (rw->w_tmem) {
1206df8bae1dSRodney W. Grimes 				cp = rw->w_tmem;
1207df8bae1dSRodney W. Grimes 				second_time = 1;
1208df8bae1dSRodney W. Grimes 				goto again;
120952041295SPoul-Henning Kamp 			}
1210df8bae1dSRodney W. Grimes 		}
1211df8bae1dSRodney W. Grimes 	}
1212df8bae1dSRodney W. Grimes 	if (cp) {
12135dfc91d7SLuigi Rizzo 		struct rt_msghdr *rtm = (struct rt_msghdr *)cp0;
1214df8bae1dSRodney W. Grimes 
1215df8bae1dSRodney W. Grimes 		rtm->rtm_version = RTM_VERSION;
1216df8bae1dSRodney W. Grimes 		rtm->rtm_type = type;
1217df8bae1dSRodney W. Grimes 		rtm->rtm_msglen = len;
1218df8bae1dSRodney W. Grimes 	}
1219df8bae1dSRodney W. Grimes 	return (len);
1220df8bae1dSRodney W. Grimes }
1221df8bae1dSRodney W. Grimes 
1222df8bae1dSRodney W. Grimes /*
1223df8bae1dSRodney W. Grimes  * This routine is called to generate a message from the routing
1224df8bae1dSRodney W. Grimes  * socket indicating that a redirect has occured, a routing lookup
1225df8bae1dSRodney W. Grimes  * has failed, or that a protocol has detected timeouts to a particular
1226df8bae1dSRodney W. Grimes  * destination.
1227df8bae1dSRodney W. Grimes  */
1228df8bae1dSRodney W. Grimes void
1229528737fdSBjoern A. Zeeb rt_missmsg_fib(int type, struct rt_addrinfo *rtinfo, int flags, int error,
1230528737fdSBjoern A. Zeeb     int fibnum)
1231df8bae1dSRodney W. Grimes {
1232becc44d7SSam Leffler 	struct rt_msghdr *rtm;
1233becc44d7SSam Leffler 	struct mbuf *m;
1234df8bae1dSRodney W. Grimes 	struct sockaddr *sa = rtinfo->rti_info[RTAX_DST];
1235df8bae1dSRodney W. Grimes 
1236c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
1237df8bae1dSRodney W. Grimes 		return;
1238df8bae1dSRodney W. Grimes 	m = rt_msg1(type, rtinfo);
12395dfc91d7SLuigi Rizzo 	if (m == NULL)
1240df8bae1dSRodney W. Grimes 		return;
1241528737fdSBjoern A. Zeeb 
12427d9b6df1SAlexander V. Chernikov 	if (fibnum != RT_ALL_FIBS) {
1243528737fdSBjoern A. Zeeb 		KASSERT(fibnum >= 0 && fibnum < rt_numfibs, ("%s: fibnum out "
1244528737fdSBjoern A. Zeeb 		    "of range 0 <= %d < %d", __func__, fibnum, rt_numfibs));
1245528737fdSBjoern A. Zeeb 		M_SETFIB(m, fibnum);
1246528737fdSBjoern A. Zeeb 		m->m_flags |= RTS_FILTER_FIB;
1247528737fdSBjoern A. Zeeb 	}
1248528737fdSBjoern A. Zeeb 
1249df8bae1dSRodney W. Grimes 	rtm = mtod(m, struct rt_msghdr *);
1250df8bae1dSRodney W. Grimes 	rtm->rtm_flags = RTF_DONE | flags;
1251df8bae1dSRodney W. Grimes 	rtm->rtm_errno = error;
1252df8bae1dSRodney W. Grimes 	rtm->rtm_addrs = rtinfo->rti_addrs;
12533ca1a2d6SMax Laier 	rt_dispatch(m, sa ? sa->sa_family : AF_UNSPEC);
1254df8bae1dSRodney W. Grimes }
1255df8bae1dSRodney W. Grimes 
1256528737fdSBjoern A. Zeeb void
1257528737fdSBjoern A. Zeeb rt_missmsg(int type, struct rt_addrinfo *rtinfo, int flags, int error)
1258528737fdSBjoern A. Zeeb {
1259528737fdSBjoern A. Zeeb 
12607d9b6df1SAlexander V. Chernikov 	rt_missmsg_fib(type, rtinfo, flags, error, RT_ALL_FIBS);
1261528737fdSBjoern A. Zeeb }
1262528737fdSBjoern A. Zeeb 
1263df8bae1dSRodney W. Grimes /*
1264df8bae1dSRodney W. Grimes  * This routine is called to generate a message from the routing
1265df8bae1dSRodney W. Grimes  * socket indicating that the status of a network interface has changed.
1266df8bae1dSRodney W. Grimes  */
1267df8bae1dSRodney W. Grimes void
1268becc44d7SSam Leffler rt_ifmsg(struct ifnet *ifp)
1269df8bae1dSRodney W. Grimes {
1270becc44d7SSam Leffler 	struct if_msghdr *ifm;
1271df8bae1dSRodney W. Grimes 	struct mbuf *m;
1272df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
1273df8bae1dSRodney W. Grimes 
1274c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
1275df8bae1dSRodney W. Grimes 		return;
1276df8bae1dSRodney W. Grimes 	bzero((caddr_t)&info, sizeof(info));
1277df8bae1dSRodney W. Grimes 	m = rt_msg1(RTM_IFINFO, &info);
12785dfc91d7SLuigi Rizzo 	if (m == NULL)
1279df8bae1dSRodney W. Grimes 		return;
1280df8bae1dSRodney W. Grimes 	ifm = mtod(m, struct if_msghdr *);
1281df8bae1dSRodney W. Grimes 	ifm->ifm_index = ifp->if_index;
1282292ee7beSRobert Watson 	ifm->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
1283df8bae1dSRodney W. Grimes 	ifm->ifm_data = ifp->if_data;
1284df8bae1dSRodney W. Grimes 	ifm->ifm_addrs = 0;
12853ca1a2d6SMax Laier 	rt_dispatch(m, AF_UNSPEC);
1286df8bae1dSRodney W. Grimes }
1287df8bae1dSRodney W. Grimes 
1288df8bae1dSRodney W. Grimes /*
12894cbac30bSAlexander V. Chernikov  * Announce interface address arrival/withdraw.
12904cbac30bSAlexander V. Chernikov  * Please do not call directly, use rt_addrmsg().
12914cbac30bSAlexander V. Chernikov  * Assume input data to be valid.
12924cbac30bSAlexander V. Chernikov  * Returns 0 on success.
1293df8bae1dSRodney W. Grimes  */
12944cbac30bSAlexander V. Chernikov int
12954cbac30bSAlexander V. Chernikov rtsock_addrmsg(int cmd, struct ifaddr *ifa, int fibnum)
1296df8bae1dSRodney W. Grimes {
1297df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
12984cbac30bSAlexander V. Chernikov 	struct sockaddr *sa;
12994cbac30bSAlexander V. Chernikov 	int ncmd;
13004cbac30bSAlexander V. Chernikov 	struct mbuf *m;
13014cbac30bSAlexander V. Chernikov 	struct ifa_msghdr *ifam;
1302df8bae1dSRodney W. Grimes 	struct ifnet *ifp = ifa->ifa_ifp;
1303df8bae1dSRodney W. Grimes 
1304c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
13054cbac30bSAlexander V. Chernikov 		return (0);
1306df8bae1dSRodney W. Grimes 
13074cbac30bSAlexander V. Chernikov 	ncmd = cmd == RTM_ADD ? RTM_NEWADDR : RTM_DELADDR;
13084cbac30bSAlexander V. Chernikov 
13094cbac30bSAlexander V. Chernikov 	bzero((caddr_t)&info, sizeof(info));
1310becc44d7SSam Leffler 	info.rti_info[RTAX_IFA] = sa = ifa->ifa_addr;
13114a0d6638SRuslan Ermilov 	info.rti_info[RTAX_IFP] = ifp->if_addr->ifa_addr;
1312becc44d7SSam Leffler 	info.rti_info[RTAX_NETMASK] = ifa->ifa_netmask;
1313becc44d7SSam Leffler 	info.rti_info[RTAX_BRD] = ifa->ifa_dstaddr;
1314df8bae1dSRodney W. Grimes 	if ((m = rt_msg1(ncmd, &info)) == NULL)
13154cbac30bSAlexander V. Chernikov 		return (ENOBUFS);
1316df8bae1dSRodney W. Grimes 	ifam = mtod(m, struct ifa_msghdr *);
1317df8bae1dSRodney W. Grimes 	ifam->ifam_index = ifp->if_index;
1318df8bae1dSRodney W. Grimes 	ifam->ifam_metric = ifa->ifa_metric;
1319df8bae1dSRodney W. Grimes 	ifam->ifam_flags = ifa->ifa_flags;
1320df8bae1dSRodney W. Grimes 	ifam->ifam_addrs = info.rti_addrs;
13214cbac30bSAlexander V. Chernikov 
13224cbac30bSAlexander V. Chernikov 	if (fibnum != RT_ALL_FIBS) {
13234cbac30bSAlexander V. Chernikov 		M_SETFIB(m, fibnum);
13244cbac30bSAlexander V. Chernikov 		m->m_flags |= RTS_FILTER_FIB;
1325df8bae1dSRodney W. Grimes 	}
13264cbac30bSAlexander V. Chernikov 
13274cbac30bSAlexander V. Chernikov 	rt_dispatch(m, sa ? sa->sa_family : AF_UNSPEC);
13284cbac30bSAlexander V. Chernikov 
13294cbac30bSAlexander V. Chernikov 	return (0);
13304cbac30bSAlexander V. Chernikov }
13314cbac30bSAlexander V. Chernikov 
13324cbac30bSAlexander V. Chernikov /*
13334cbac30bSAlexander V. Chernikov  * Announce route addition/removal.
13344cbac30bSAlexander V. Chernikov  * Please do not call directly, use rt_routemsg().
13354cbac30bSAlexander V. Chernikov  * Note that @rt data MAY be inconsistent/invalid:
13364cbac30bSAlexander V. Chernikov  * if some userland app sends us "invalid" route message (invalid mask,
13374cbac30bSAlexander V. Chernikov  * no dst, wrong address families, etc...) we need to pass it back
13384cbac30bSAlexander V. Chernikov  * to app (and any other rtsock consumers) with rtm_errno field set to
13394cbac30bSAlexander V. Chernikov  * non-zero value.
13404cbac30bSAlexander V. Chernikov  *
13414cbac30bSAlexander V. Chernikov  * Returns 0 on success.
13424cbac30bSAlexander V. Chernikov  */
13434cbac30bSAlexander V. Chernikov int
13444cbac30bSAlexander V. Chernikov rtsock_routemsg(int cmd, struct ifnet *ifp, int error, struct rtentry *rt,
13454cbac30bSAlexander V. Chernikov     int fibnum)
13464cbac30bSAlexander V. Chernikov {
13474cbac30bSAlexander V. Chernikov 	struct rt_addrinfo info;
13484cbac30bSAlexander V. Chernikov 	struct sockaddr *sa;
13494cbac30bSAlexander V. Chernikov 	struct mbuf *m;
13505dfc91d7SLuigi Rizzo 	struct rt_msghdr *rtm;
1351df8bae1dSRodney W. Grimes 
1352c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
13534cbac30bSAlexander V. Chernikov 		return (0);
13544cbac30bSAlexander V. Chernikov 
13554cbac30bSAlexander V. Chernikov 	bzero((caddr_t)&info, sizeof(info));
1356becc44d7SSam Leffler 	info.rti_info[RTAX_NETMASK] = rt_mask(rt);
1357becc44d7SSam Leffler 	info.rti_info[RTAX_DST] = sa = rt_key(rt);
1358becc44d7SSam Leffler 	info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
1359df8bae1dSRodney W. Grimes 	if ((m = rt_msg1(cmd, &info)) == NULL)
13604cbac30bSAlexander V. Chernikov 		return (ENOBUFS);
1361df8bae1dSRodney W. Grimes 	rtm = mtod(m, struct rt_msghdr *);
1362df8bae1dSRodney W. Grimes 	rtm->rtm_index = ifp->if_index;
1363df8bae1dSRodney W. Grimes 	rtm->rtm_flags |= rt->rt_flags;
1364df8bae1dSRodney W. Grimes 	rtm->rtm_errno = error;
1365df8bae1dSRodney W. Grimes 	rtm->rtm_addrs = info.rti_addrs;
13664cbac30bSAlexander V. Chernikov 
13677d9b6df1SAlexander V. Chernikov 	if (fibnum != RT_ALL_FIBS) {
1368528737fdSBjoern A. Zeeb 		M_SETFIB(m, fibnum);
1369528737fdSBjoern A. Zeeb 		m->m_flags |= RTS_FILTER_FIB;
1370528737fdSBjoern A. Zeeb 	}
13714cbac30bSAlexander V. Chernikov 
13723ca1a2d6SMax Laier 	rt_dispatch(m, sa ? sa->sa_family : AF_UNSPEC);
13734cbac30bSAlexander V. Chernikov 
13744cbac30bSAlexander V. Chernikov 	return (0);
1375df8bae1dSRodney W. Grimes }
1376df8bae1dSRodney W. Grimes 
1377477180fbSGarrett Wollman /*
1378477180fbSGarrett Wollman  * This is the analogue to the rt_newaddrmsg which performs the same
1379477180fbSGarrett Wollman  * function but for multicast group memberhips.  This is easier since
1380477180fbSGarrett Wollman  * there is no route state to worry about.
1381477180fbSGarrett Wollman  */
1382477180fbSGarrett Wollman void
1383becc44d7SSam Leffler rt_newmaddrmsg(int cmd, struct ifmultiaddr *ifma)
1384477180fbSGarrett Wollman {
1385477180fbSGarrett Wollman 	struct rt_addrinfo info;
13865dfc91d7SLuigi Rizzo 	struct mbuf *m = NULL;
1387477180fbSGarrett Wollman 	struct ifnet *ifp = ifma->ifma_ifp;
1388477180fbSGarrett Wollman 	struct ifma_msghdr *ifmam;
1389477180fbSGarrett Wollman 
1390c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
1391477180fbSGarrett Wollman 		return;
1392477180fbSGarrett Wollman 
1393477180fbSGarrett Wollman 	bzero((caddr_t)&info, sizeof(info));
1394becc44d7SSam Leffler 	info.rti_info[RTAX_IFA] = ifma->ifma_addr;
13954a0d6638SRuslan Ermilov 	info.rti_info[RTAX_IFP] = ifp ? ifp->if_addr->ifa_addr : NULL;
1396477180fbSGarrett Wollman 	/*
1397477180fbSGarrett Wollman 	 * If a link-layer address is present, present it as a ``gateway''
1398477180fbSGarrett Wollman 	 * (similarly to how ARP entries, e.g., are presented).
1399477180fbSGarrett Wollman 	 */
1400becc44d7SSam Leffler 	info.rti_info[RTAX_GATEWAY] = ifma->ifma_lladdr;
1401becc44d7SSam Leffler 	m = rt_msg1(cmd, &info);
1402becc44d7SSam Leffler 	if (m == NULL)
1403477180fbSGarrett Wollman 		return;
1404477180fbSGarrett Wollman 	ifmam = mtod(m, struct ifma_msghdr *);
140575ae0c01SBruce M Simpson 	KASSERT(ifp != NULL, ("%s: link-layer multicast address w/o ifp\n",
140675ae0c01SBruce M Simpson 	    __func__));
1407477180fbSGarrett Wollman 	ifmam->ifmam_index = ifp->if_index;
1408477180fbSGarrett Wollman 	ifmam->ifmam_addrs = info.rti_addrs;
14093ca1a2d6SMax Laier 	rt_dispatch(m, ifma->ifma_addr ? ifma->ifma_addr->sa_family : AF_UNSPEC);
1410477180fbSGarrett Wollman }
141152041295SPoul-Henning Kamp 
1412b83a279fSSam Leffler static struct mbuf *
1413b83a279fSSam Leffler rt_makeifannouncemsg(struct ifnet *ifp, int type, int what,
1414b83a279fSSam Leffler 	struct rt_addrinfo *info)
1415b83a279fSSam Leffler {
1416b83a279fSSam Leffler 	struct if_announcemsghdr *ifan;
1417b83a279fSSam Leffler 	struct mbuf *m;
1418b83a279fSSam Leffler 
1419c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
1420b83a279fSSam Leffler 		return NULL;
1421b83a279fSSam Leffler 	bzero((caddr_t)info, sizeof(*info));
1422b83a279fSSam Leffler 	m = rt_msg1(type, info);
1423b83a279fSSam Leffler 	if (m != NULL) {
1424b83a279fSSam Leffler 		ifan = mtod(m, struct if_announcemsghdr *);
1425b83a279fSSam Leffler 		ifan->ifan_index = ifp->if_index;
1426b83a279fSSam Leffler 		strlcpy(ifan->ifan_name, ifp->if_xname,
1427b83a279fSSam Leffler 			sizeof(ifan->ifan_name));
1428b83a279fSSam Leffler 		ifan->ifan_what = what;
1429b83a279fSSam Leffler 	}
1430b83a279fSSam Leffler 	return m;
1431b83a279fSSam Leffler }
1432b83a279fSSam Leffler 
1433b83a279fSSam Leffler /*
1434b83a279fSSam Leffler  * This is called to generate routing socket messages indicating
1435b83a279fSSam Leffler  * IEEE80211 wireless events.
1436b83a279fSSam Leffler  * XXX we piggyback on the RTM_IFANNOUNCE msg format in a clumsy way.
1437b83a279fSSam Leffler  */
1438b83a279fSSam Leffler void
1439b83a279fSSam Leffler rt_ieee80211msg(struct ifnet *ifp, int what, void *data, size_t data_len)
1440b83a279fSSam Leffler {
1441b83a279fSSam Leffler 	struct mbuf *m;
1442b83a279fSSam Leffler 	struct rt_addrinfo info;
1443b83a279fSSam Leffler 
1444b83a279fSSam Leffler 	m = rt_makeifannouncemsg(ifp, RTM_IEEE80211, what, &info);
1445b83a279fSSam Leffler 	if (m != NULL) {
1446b83a279fSSam Leffler 		/*
1447b83a279fSSam Leffler 		 * Append the ieee80211 data.  Try to stick it in the
1448b83a279fSSam Leffler 		 * mbuf containing the ifannounce msg; otherwise allocate
1449b83a279fSSam Leffler 		 * a new mbuf and append.
1450b83a279fSSam Leffler 		 *
1451b83a279fSSam Leffler 		 * NB: we assume m is a single mbuf.
1452b83a279fSSam Leffler 		 */
1453b83a279fSSam Leffler 		if (data_len > M_TRAILINGSPACE(m)) {
1454b83a279fSSam Leffler 			struct mbuf *n = m_get(M_NOWAIT, MT_DATA);
1455b83a279fSSam Leffler 			if (n == NULL) {
1456b83a279fSSam Leffler 				m_freem(m);
1457b83a279fSSam Leffler 				return;
1458b83a279fSSam Leffler 			}
1459b83a279fSSam Leffler 			bcopy(data, mtod(n, void *), data_len);
1460b83a279fSSam Leffler 			n->m_len = data_len;
1461b83a279fSSam Leffler 			m->m_next = n;
1462b83a279fSSam Leffler 		} else if (data_len > 0) {
1463b83a279fSSam Leffler 			bcopy(data, mtod(m, u_int8_t *) + m->m_len, data_len);
1464b83a279fSSam Leffler 			m->m_len += data_len;
1465b83a279fSSam Leffler 		}
1466b83a279fSSam Leffler 		if (m->m_flags & M_PKTHDR)
1467b83a279fSSam Leffler 			m->m_pkthdr.len += data_len;
1468b83a279fSSam Leffler 		mtod(m, struct if_announcemsghdr *)->ifan_msglen += data_len;
14693ca1a2d6SMax Laier 		rt_dispatch(m, AF_UNSPEC);
1470b83a279fSSam Leffler 	}
1471b83a279fSSam Leffler }
1472b83a279fSSam Leffler 
1473df8bae1dSRodney W. Grimes /*
14747b6edd04SRuslan Ermilov  * This is called to generate routing socket messages indicating
14757b6edd04SRuslan Ermilov  * network interface arrival and departure.
14767b6edd04SRuslan Ermilov  */
14777b6edd04SRuslan Ermilov void
1478becc44d7SSam Leffler rt_ifannouncemsg(struct ifnet *ifp, int what)
14797b6edd04SRuslan Ermilov {
14807b6edd04SRuslan Ermilov 	struct mbuf *m;
14817b6edd04SRuslan Ermilov 	struct rt_addrinfo info;
14827b6edd04SRuslan Ermilov 
1483b83a279fSSam Leffler 	m = rt_makeifannouncemsg(ifp, RTM_IFANNOUNCE, what, &info);
1484b83a279fSSam Leffler 	if (m != NULL)
14853ca1a2d6SMax Laier 		rt_dispatch(m, AF_UNSPEC);
1486becc44d7SSam Leffler }
1487becc44d7SSam Leffler 
1488becc44d7SSam Leffler static void
14893ca1a2d6SMax Laier rt_dispatch(struct mbuf *m, sa_family_t saf)
1490becc44d7SSam Leffler {
1491d989c7b3SRobert Watson 	struct m_tag *tag;
1492becc44d7SSam Leffler 
1493d989c7b3SRobert Watson 	/*
1494d989c7b3SRobert Watson 	 * Preserve the family from the sockaddr, if any, in an m_tag for
1495d989c7b3SRobert Watson 	 * use when injecting the mbuf into the routing socket buffer from
1496d989c7b3SRobert Watson 	 * the netisr.
1497d989c7b3SRobert Watson 	 */
14983ca1a2d6SMax Laier 	if (saf != AF_UNSPEC) {
1499d989c7b3SRobert Watson 		tag = m_tag_get(PACKET_TAG_RTSOCKFAM, sizeof(unsigned short),
1500d989c7b3SRobert Watson 		    M_NOWAIT);
1501d989c7b3SRobert Watson 		if (tag == NULL) {
1502d989c7b3SRobert Watson 			m_freem(m);
1503d989c7b3SRobert Watson 			return;
1504d989c7b3SRobert Watson 		}
15053ca1a2d6SMax Laier 		*(unsigned short *)(tag + 1) = saf;
1506d989c7b3SRobert Watson 		m_tag_prepend(m, tag);
1507d989c7b3SRobert Watson 	}
150821ca7b57SMarko Zec #ifdef VIMAGE
150921ca7b57SMarko Zec 	if (V_loif)
151021ca7b57SMarko Zec 		m->m_pkthdr.rcvif = V_loif;
151121ca7b57SMarko Zec 	else {
151221ca7b57SMarko Zec 		m_freem(m);
151321ca7b57SMarko Zec 		return;
151421ca7b57SMarko Zec 	}
151521ca7b57SMarko Zec #endif
15163161f583SAndre Oppermann 	netisr_queue(NETISR_ROUTE, m);	/* mbuf is free'd on failure. */
15177b6edd04SRuslan Ermilov }
15187b6edd04SRuslan Ermilov 
15197b6edd04SRuslan Ermilov /*
1520df8bae1dSRodney W. Grimes  * This is used in dumping the kernel table via sysctl().
1521df8bae1dSRodney W. Grimes  */
152237c84183SPoul-Henning Kamp static int
1523becc44d7SSam Leffler sysctl_dumpentry(struct radix_node *rn, void *vw)
1524df8bae1dSRodney W. Grimes {
1525becc44d7SSam Leffler 	struct walkarg *w = vw;
1526becc44d7SSam Leffler 	struct rtentry *rt = (struct rtentry *)rn;
1527df8bae1dSRodney W. Grimes 	int error = 0, size;
1528df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
1529df8bae1dSRodney W. Grimes 
1530df8bae1dSRodney W. Grimes 	if (w->w_op == NET_RT_FLAGS && !(rt->rt_flags & w->w_arg))
1531df8bae1dSRodney W. Grimes 		return 0;
1532b89e82ddSJamie Gritton 	if ((rt->rt_flags & RTF_HOST) == 0
1533de0bd6f7SBjoern A. Zeeb 	    ? jailed_without_vnet(w->w_req->td->td_ucred)
1534b89e82ddSJamie Gritton 	    : prison_if(w->w_req->td->td_ucred, rt_key(rt)) != 0)
1535813dd6aeSBjoern A. Zeeb 		return (0);
1536df8bae1dSRodney W. Grimes 	bzero((caddr_t)&info, sizeof(info));
1537becc44d7SSam Leffler 	info.rti_info[RTAX_DST] = rt_key(rt);
1538becc44d7SSam Leffler 	info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
1539becc44d7SSam Leffler 	info.rti_info[RTAX_NETMASK] = rt_mask(rt);
15406e6b3f7cSQing Li 	info.rti_info[RTAX_GENMASK] = 0;
154128070a0eSRuslan Ermilov 	if (rt->rt_ifp) {
15424a0d6638SRuslan Ermilov 		info.rti_info[RTAX_IFP] = rt->rt_ifp->if_addr->ifa_addr;
1543becc44d7SSam Leffler 		info.rti_info[RTAX_IFA] = rt->rt_ifa->ifa_addr;
154428070a0eSRuslan Ermilov 		if (rt->rt_ifp->if_flags & IFF_POINTOPOINT)
1545becc44d7SSam Leffler 			info.rti_info[RTAX_BRD] = rt->rt_ifa->ifa_dstaddr;
154628070a0eSRuslan Ermilov 	}
1547913af518SLuigi Rizzo 	size = rt_msg2(RTM_GET, &info, NULL, w);
154852041295SPoul-Henning Kamp 	if (w->w_req && w->w_tmem) {
1549becc44d7SSam Leffler 		struct rt_msghdr *rtm = (struct rt_msghdr *)w->w_tmem;
1550df8bae1dSRodney W. Grimes 
1551f672f56fSQing Li 		if (rt->rt_flags & RTF_GWFLAG_COMPAT)
1552f672f56fSQing Li 			rtm->rtm_flags = RTF_GATEWAY |
1553f672f56fSQing Li 				(rt->rt_flags & ~RTF_GWFLAG_COMPAT);
1554f672f56fSQing Li 		else
1555df8bae1dSRodney W. Grimes 			rtm->rtm_flags = rt->rt_flags;
1556e3a7aa6fSGleb Smirnoff 		rt_getmetrics(rt, &rtm->rtm_rmx);
1557df8bae1dSRodney W. Grimes 		rtm->rtm_index = rt->rt_ifp->if_index;
1558df8bae1dSRodney W. Grimes 		rtm->rtm_errno = rtm->rtm_pid = rtm->rtm_seq = 0;
1559df8bae1dSRodney W. Grimes 		rtm->rtm_addrs = info.rti_addrs;
156052041295SPoul-Henning Kamp 		error = SYSCTL_OUT(w->w_req, (caddr_t)rtm, size);
156152041295SPoul-Henning Kamp 		return (error);
1562df8bae1dSRodney W. Grimes 	}
1563df8bae1dSRodney W. Grimes 	return (error);
1564df8bae1dSRodney W. Grimes }
1565df8bae1dSRodney W. Grimes 
156637c84183SPoul-Henning Kamp static int
15676d076ae8SBjoern A. Zeeb sysctl_iflist_ifml(struct ifnet *ifp, struct rt_addrinfo *info,
15686d076ae8SBjoern A. Zeeb     struct walkarg *w, int len)
15696d076ae8SBjoern A. Zeeb {
15706d076ae8SBjoern A. Zeeb 	struct if_msghdrl *ifm;
1571b245f96cSGleb Smirnoff 	struct if_data *ifd;
1572b245f96cSGleb Smirnoff 
1573b245f96cSGleb Smirnoff 	ifm = (struct if_msghdrl *)w->w_tmem;
15746d076ae8SBjoern A. Zeeb 
15756d076ae8SBjoern A. Zeeb #ifdef COMPAT_FREEBSD32
15766d076ae8SBjoern A. Zeeb 	if (w->w_req->flags & SCTL_MASK32) {
15776d076ae8SBjoern A. Zeeb 		struct if_msghdrl32 *ifm32;
15786d076ae8SBjoern A. Zeeb 
1579b245f96cSGleb Smirnoff 		ifm32 = (struct if_msghdrl32 *)ifm;
15806d076ae8SBjoern A. Zeeb 		ifm32->ifm_addrs = info->rti_addrs;
15816d076ae8SBjoern A. Zeeb 		ifm32->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
15826d076ae8SBjoern A. Zeeb 		ifm32->ifm_index = ifp->if_index;
15836d076ae8SBjoern A. Zeeb 		ifm32->_ifm_spare1 = 0;
15846d076ae8SBjoern A. Zeeb 		ifm32->ifm_len = sizeof(*ifm32);
15856d076ae8SBjoern A. Zeeb 		ifm32->ifm_data_off = offsetof(struct if_msghdrl32, ifm_data);
1586b245f96cSGleb Smirnoff 		ifd = &ifm32->ifm_data;
1587b245f96cSGleb Smirnoff 	} else
15886d076ae8SBjoern A. Zeeb #endif
1589b245f96cSGleb Smirnoff 	{
15906d076ae8SBjoern A. Zeeb 		ifm->ifm_addrs = info->rti_addrs;
15916d076ae8SBjoern A. Zeeb 		ifm->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
15926d076ae8SBjoern A. Zeeb 		ifm->ifm_index = ifp->if_index;
15936d076ae8SBjoern A. Zeeb 		ifm->_ifm_spare1 = 0;
15946d076ae8SBjoern A. Zeeb 		ifm->ifm_len = sizeof(*ifm);
15956d076ae8SBjoern A. Zeeb 		ifm->ifm_data_off = offsetof(struct if_msghdrl, ifm_data);
1596b245f96cSGleb Smirnoff 		ifd = &ifm->ifm_data;
1597b245f96cSGleb Smirnoff 	}
15986d076ae8SBjoern A. Zeeb 
1599b245f96cSGleb Smirnoff 	*ifd = ifp->if_data;
1600b245f96cSGleb Smirnoff 
1601*2d70c0deSGleb Smirnoff 	/* Some drivers still use ifqueue(9), add its stats. */
1602*2d70c0deSGleb Smirnoff 	ifd->ifi_oqdrops += ifp->if_snd.ifq_drops;
16036d076ae8SBjoern A. Zeeb 
16046d076ae8SBjoern A. Zeeb 	return (SYSCTL_OUT(w->w_req, (caddr_t)ifm, len));
16056d076ae8SBjoern A. Zeeb }
16066d076ae8SBjoern A. Zeeb 
16076d076ae8SBjoern A. Zeeb static int
16086d076ae8SBjoern A. Zeeb sysctl_iflist_ifm(struct ifnet *ifp, struct rt_addrinfo *info,
16096d076ae8SBjoern A. Zeeb     struct walkarg *w, int len)
16106d076ae8SBjoern A. Zeeb {
16116d076ae8SBjoern A. Zeeb 	struct if_msghdr *ifm;
1612b245f96cSGleb Smirnoff 	struct if_data *ifd;
1613b245f96cSGleb Smirnoff 
1614b245f96cSGleb Smirnoff 	ifm = (struct if_msghdr *)w->w_tmem;
16156d076ae8SBjoern A. Zeeb 
16166d076ae8SBjoern A. Zeeb #ifdef COMPAT_FREEBSD32
16176d076ae8SBjoern A. Zeeb 	if (w->w_req->flags & SCTL_MASK32) {
16186d076ae8SBjoern A. Zeeb 		struct if_msghdr32 *ifm32;
16196d076ae8SBjoern A. Zeeb 
1620b245f96cSGleb Smirnoff 		ifm32 = (struct if_msghdr32 *)ifm;
16216d076ae8SBjoern A. Zeeb 		ifm32->ifm_addrs = info->rti_addrs;
16226d076ae8SBjoern A. Zeeb 		ifm32->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
16236d076ae8SBjoern A. Zeeb 		ifm32->ifm_index = ifp->if_index;
1624b245f96cSGleb Smirnoff 		ifd = &ifm32->ifm_data;
1625b245f96cSGleb Smirnoff 	} else
16266d076ae8SBjoern A. Zeeb #endif
1627b245f96cSGleb Smirnoff 	{
16286d076ae8SBjoern A. Zeeb 		ifm->ifm_addrs = info->rti_addrs;
16296d076ae8SBjoern A. Zeeb 		ifm->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
16306d076ae8SBjoern A. Zeeb 		ifm->ifm_index = ifp->if_index;
1631b245f96cSGleb Smirnoff 		ifd = &ifm->ifm_data;
1632b245f96cSGleb Smirnoff 	}
16336d076ae8SBjoern A. Zeeb 
1634b245f96cSGleb Smirnoff 	*ifd = ifp->if_data;
1635*2d70c0deSGleb Smirnoff 
1636*2d70c0deSGleb Smirnoff 	/* Some drivers still use ifqueue(9), add its stats. */
1637*2d70c0deSGleb Smirnoff 	ifd->ifi_oqdrops += ifp->if_snd.ifq_drops;
16386d076ae8SBjoern A. Zeeb 
16396d076ae8SBjoern A. Zeeb 	return (SYSCTL_OUT(w->w_req, (caddr_t)ifm, len));
16406d076ae8SBjoern A. Zeeb }
16416d076ae8SBjoern A. Zeeb 
16426d076ae8SBjoern A. Zeeb static int
16436d076ae8SBjoern A. Zeeb sysctl_iflist_ifaml(struct ifaddr *ifa, struct rt_addrinfo *info,
16446d076ae8SBjoern A. Zeeb     struct walkarg *w, int len)
16456d076ae8SBjoern A. Zeeb {
16466d076ae8SBjoern A. Zeeb 	struct ifa_msghdrl *ifam;
1647b245f96cSGleb Smirnoff 	struct if_data *ifd;
1648b245f96cSGleb Smirnoff 
1649b245f96cSGleb Smirnoff 	ifam = (struct ifa_msghdrl *)w->w_tmem;
16506d076ae8SBjoern A. Zeeb 
16516d076ae8SBjoern A. Zeeb #ifdef COMPAT_FREEBSD32
16526d076ae8SBjoern A. Zeeb 	if (w->w_req->flags & SCTL_MASK32) {
16536d076ae8SBjoern A. Zeeb 		struct ifa_msghdrl32 *ifam32;
16546d076ae8SBjoern A. Zeeb 
1655b245f96cSGleb Smirnoff 		ifam32 = (struct ifa_msghdrl32 *)ifam;
16566d076ae8SBjoern A. Zeeb 		ifam32->ifam_addrs = info->rti_addrs;
16576d076ae8SBjoern A. Zeeb 		ifam32->ifam_flags = ifa->ifa_flags;
16586d076ae8SBjoern A. Zeeb 		ifam32->ifam_index = ifa->ifa_ifp->if_index;
16596d076ae8SBjoern A. Zeeb 		ifam32->_ifam_spare1 = 0;
16606d076ae8SBjoern A. Zeeb 		ifam32->ifam_len = sizeof(*ifam32);
16616d076ae8SBjoern A. Zeeb 		ifam32->ifam_data_off =
16626d076ae8SBjoern A. Zeeb 		    offsetof(struct ifa_msghdrl32, ifam_data);
16636d076ae8SBjoern A. Zeeb 		ifam32->ifam_metric = ifa->ifa_metric;
1664b245f96cSGleb Smirnoff 		ifd = &ifam32->ifam_data;
1665b245f96cSGleb Smirnoff 	} else
16666d076ae8SBjoern A. Zeeb #endif
1667b245f96cSGleb Smirnoff 	{
16686d076ae8SBjoern A. Zeeb 		ifam->ifam_addrs = info->rti_addrs;
16696d076ae8SBjoern A. Zeeb 		ifam->ifam_flags = ifa->ifa_flags;
16706d076ae8SBjoern A. Zeeb 		ifam->ifam_index = ifa->ifa_ifp->if_index;
16716d076ae8SBjoern A. Zeeb 		ifam->_ifam_spare1 = 0;
16726d076ae8SBjoern A. Zeeb 		ifam->ifam_len = sizeof(*ifam);
16736d076ae8SBjoern A. Zeeb 		ifam->ifam_data_off = offsetof(struct ifa_msghdrl, ifam_data);
16746d076ae8SBjoern A. Zeeb 		ifam->ifam_metric = ifa->ifa_metric;
1675b245f96cSGleb Smirnoff 		ifd = &ifam->ifam_data;
1676b245f96cSGleb Smirnoff 	}
16776d076ae8SBjoern A. Zeeb 
1678b245f96cSGleb Smirnoff 	bzero(ifd, sizeof(*ifd));
1679b245f96cSGleb Smirnoff 	ifd->ifi_datalen = sizeof(struct if_data);
1680b245f96cSGleb Smirnoff 	ifd->ifi_ipackets = counter_u64_fetch(ifa->ifa_ipackets);
1681b245f96cSGleb Smirnoff 	ifd->ifi_opackets = counter_u64_fetch(ifa->ifa_opackets);
1682b245f96cSGleb Smirnoff 	ifd->ifi_ibytes = counter_u64_fetch(ifa->ifa_ibytes);
1683b245f96cSGleb Smirnoff 	ifd->ifi_obytes = counter_u64_fetch(ifa->ifa_obytes);
16847caf4ab7SGleb Smirnoff 
16856d076ae8SBjoern A. Zeeb 	/* Fixup if_data carp(4) vhid. */
16866d076ae8SBjoern A. Zeeb 	if (carp_get_vhid_p != NULL)
1687b245f96cSGleb Smirnoff 		ifd->ifi_vhid = (*carp_get_vhid_p)(ifa);
16886d076ae8SBjoern A. Zeeb 
16896d076ae8SBjoern A. Zeeb 	return (SYSCTL_OUT(w->w_req, w->w_tmem, len));
16906d076ae8SBjoern A. Zeeb }
16916d076ae8SBjoern A. Zeeb 
16926d076ae8SBjoern A. Zeeb static int
16936d076ae8SBjoern A. Zeeb sysctl_iflist_ifam(struct ifaddr *ifa, struct rt_addrinfo *info,
16946d076ae8SBjoern A. Zeeb     struct walkarg *w, int len)
16956d076ae8SBjoern A. Zeeb {
16966d076ae8SBjoern A. Zeeb 	struct ifa_msghdr *ifam;
16976d076ae8SBjoern A. Zeeb 
16986d076ae8SBjoern A. Zeeb 	ifam = (struct ifa_msghdr *)w->w_tmem;
16996d076ae8SBjoern A. Zeeb 	ifam->ifam_addrs = info->rti_addrs;
17006d076ae8SBjoern A. Zeeb 	ifam->ifam_flags = ifa->ifa_flags;
17016d076ae8SBjoern A. Zeeb 	ifam->ifam_index = ifa->ifa_ifp->if_index;
17026d076ae8SBjoern A. Zeeb 	ifam->ifam_metric = ifa->ifa_metric;
17036d076ae8SBjoern A. Zeeb 
17046d076ae8SBjoern A. Zeeb 	return (SYSCTL_OUT(w->w_req, w->w_tmem, len));
17056d076ae8SBjoern A. Zeeb }
17066d076ae8SBjoern A. Zeeb 
17076d076ae8SBjoern A. Zeeb static int
1708becc44d7SSam Leffler sysctl_iflist(int af, struct walkarg *w)
1709df8bae1dSRodney W. Grimes {
1710becc44d7SSam Leffler 	struct ifnet *ifp;
1711becc44d7SSam Leffler 	struct ifaddr *ifa;
1712df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
1713df8bae1dSRodney W. Grimes 	int len, error = 0;
1714df8bae1dSRodney W. Grimes 
1715df8bae1dSRodney W. Grimes 	bzero((caddr_t)&info, sizeof(info));
17165c9fa630SHiroki Sato 	IFNET_RLOCK_NOSLEEP();
1717603724d3SBjoern A. Zeeb 	TAILQ_FOREACH(ifp, &V_ifnet, if_link) {
1718df8bae1dSRodney W. Grimes 		if (w->w_arg && w->w_arg != ifp->if_index)
1719df8bae1dSRodney W. Grimes 			continue;
1720137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
17214a0d6638SRuslan Ermilov 		ifa = ifp->if_addr;
1722becc44d7SSam Leffler 		info.rti_info[RTAX_IFP] = ifa->ifa_addr;
1723913af518SLuigi Rizzo 		len = rt_msg2(RTM_IFINFO, &info, NULL, w);
17245dfc91d7SLuigi Rizzo 		info.rti_info[RTAX_IFP] = NULL;
172552041295SPoul-Henning Kamp 		if (w->w_req && w->w_tmem) {
17266d076ae8SBjoern A. Zeeb 			if (w->w_op == NET_RT_IFLISTL)
17276d076ae8SBjoern A. Zeeb 				error = sysctl_iflist_ifml(ifp, &info, w, len);
17286d076ae8SBjoern A. Zeeb 			else
17296d076ae8SBjoern A. Zeeb 				error = sysctl_iflist_ifm(ifp, &info, w, len);
1730df440948SPoul-Henning Kamp 			if (error)
1731a35b06c5SJonathan Lemon 				goto done;
1732df8bae1dSRodney W. Grimes 		}
17335dfc91d7SLuigi Rizzo 		while ((ifa = TAILQ_NEXT(ifa, ifa_link)) != NULL) {
1734df8bae1dSRodney W. Grimes 			if (af && af != ifa->ifa_addr->sa_family)
1735df8bae1dSRodney W. Grimes 				continue;
1736b89e82ddSJamie Gritton 			if (prison_if(w->w_req->td->td_ucred,
1737b89e82ddSJamie Gritton 			    ifa->ifa_addr) != 0)
173875c13541SPoul-Henning Kamp 				continue;
1739becc44d7SSam Leffler 			info.rti_info[RTAX_IFA] = ifa->ifa_addr;
1740becc44d7SSam Leffler 			info.rti_info[RTAX_NETMASK] = ifa->ifa_netmask;
1741becc44d7SSam Leffler 			info.rti_info[RTAX_BRD] = ifa->ifa_dstaddr;
1742913af518SLuigi Rizzo 			len = rt_msg2(RTM_NEWADDR, &info, NULL, w);
174352041295SPoul-Henning Kamp 			if (w->w_req && w->w_tmem) {
17446d076ae8SBjoern A. Zeeb 				if (w->w_op == NET_RT_IFLISTL)
17456d076ae8SBjoern A. Zeeb 					error = sysctl_iflist_ifaml(ifa, &info,
17466d076ae8SBjoern A. Zeeb 					    w, len);
17476d076ae8SBjoern A. Zeeb 				else
17486d076ae8SBjoern A. Zeeb 					error = sysctl_iflist_ifam(ifa, &info,
17496d076ae8SBjoern A. Zeeb 					    w, len);
1750df440948SPoul-Henning Kamp 				if (error)
1751a35b06c5SJonathan Lemon 					goto done;
1752df8bae1dSRodney W. Grimes 			}
1753df8bae1dSRodney W. Grimes 		}
1754137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
1755becc44d7SSam Leffler 		info.rti_info[RTAX_IFA] = info.rti_info[RTAX_NETMASK] =
17565dfc91d7SLuigi Rizzo 			info.rti_info[RTAX_BRD] = NULL;
1757df8bae1dSRodney W. Grimes 	}
1758a35b06c5SJonathan Lemon done:
1759ee7c7feeSBjoern A. Zeeb 	if (ifp != NULL)
1760137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
17615c9fa630SHiroki Sato 	IFNET_RUNLOCK_NOSLEEP();
1762a35b06c5SJonathan Lemon 	return (error);
1763df8bae1dSRodney W. Grimes }
1764df8bae1dSRodney W. Grimes 
1765ebda3fc3SBjoern A. Zeeb static int
17669b98ee2cSLuigi Rizzo sysctl_ifmalist(int af, struct walkarg *w)
176705b2efe0SBruce M Simpson {
17689b98ee2cSLuigi Rizzo 	struct ifnet *ifp;
176905b2efe0SBruce M Simpson 	struct ifmultiaddr *ifma;
177005b2efe0SBruce M Simpson 	struct	rt_addrinfo info;
177105b2efe0SBruce M Simpson 	int	len, error = 0;
17729b98ee2cSLuigi Rizzo 	struct ifaddr *ifa;
177305b2efe0SBruce M Simpson 
177405b2efe0SBruce M Simpson 	bzero((caddr_t)&info, sizeof(info));
17755c9fa630SHiroki Sato 	IFNET_RLOCK_NOSLEEP();
1776603724d3SBjoern A. Zeeb 	TAILQ_FOREACH(ifp, &V_ifnet, if_link) {
177705b2efe0SBruce M Simpson 		if (w->w_arg && w->w_arg != ifp->if_index)
177805b2efe0SBruce M Simpson 			continue;
17794a0d6638SRuslan Ermilov 		ifa = ifp->if_addr;
1780913af518SLuigi Rizzo 		info.rti_info[RTAX_IFP] = ifa ? ifa->ifa_addr : NULL;
1781137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
178205b2efe0SBruce M Simpson 		TAILQ_FOREACH(ifma, &ifp->if_multiaddrs, ifma_link) {
178305b2efe0SBruce M Simpson 			if (af && af != ifma->ifma_addr->sa_family)
178405b2efe0SBruce M Simpson 				continue;
1785b89e82ddSJamie Gritton 			if (prison_if(w->w_req->td->td_ucred,
1786b89e82ddSJamie Gritton 			    ifma->ifma_addr) != 0)
178705b2efe0SBruce M Simpson 				continue;
178805b2efe0SBruce M Simpson 			info.rti_info[RTAX_IFA] = ifma->ifma_addr;
1789913af518SLuigi Rizzo 			info.rti_info[RTAX_GATEWAY] =
1790913af518SLuigi Rizzo 			    (ifma->ifma_addr->sa_family != AF_LINK) ?
1791913af518SLuigi Rizzo 			    ifma->ifma_lladdr : NULL;
1792913af518SLuigi Rizzo 			len = rt_msg2(RTM_NEWMADDR, &info, NULL, w);
179305b2efe0SBruce M Simpson 			if (w->w_req && w->w_tmem) {
17949b98ee2cSLuigi Rizzo 				struct ifma_msghdr *ifmam;
179505b2efe0SBruce M Simpson 
179605b2efe0SBruce M Simpson 				ifmam = (struct ifma_msghdr *)w->w_tmem;
179705b2efe0SBruce M Simpson 				ifmam->ifmam_index = ifma->ifma_ifp->if_index;
179805b2efe0SBruce M Simpson 				ifmam->ifmam_flags = 0;
179905b2efe0SBruce M Simpson 				ifmam->ifmam_addrs = info.rti_addrs;
180005b2efe0SBruce M Simpson 				error = SYSCTL_OUT(w->w_req, w->w_tmem, len);
1801fe0fc7efSChristian S.J. Peron 				if (error) {
1802137f91e8SJohn Baldwin 					IF_ADDR_RUNLOCK(ifp);
180305b2efe0SBruce M Simpson 					goto done;
180405b2efe0SBruce M Simpson 				}
180505b2efe0SBruce M Simpson 			}
180605b2efe0SBruce M Simpson 		}
1807137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
1808fe0fc7efSChristian S.J. Peron 	}
180905b2efe0SBruce M Simpson done:
18105c9fa630SHiroki Sato 	IFNET_RUNLOCK_NOSLEEP();
181105b2efe0SBruce M Simpson 	return (error);
181205b2efe0SBruce M Simpson }
181305b2efe0SBruce M Simpson 
181452041295SPoul-Henning Kamp static int
181582d9ae4eSPoul-Henning Kamp sysctl_rtsock(SYSCTL_HANDLER_ARGS)
1816df8bae1dSRodney W. Grimes {
181752041295SPoul-Henning Kamp 	int	*name = (int *)arg1;
181852041295SPoul-Henning Kamp 	u_int	namelen = arg2;
1819c2c2a7c1SBjoern A. Zeeb 	struct radix_node_head *rnh = NULL; /* silence compiler. */
1820fe0fc7efSChristian S.J. Peron 	int	i, lim, error = EINVAL;
18214825b1e0SHiroki Sato 	int	fib = 0;
1822df8bae1dSRodney W. Grimes 	u_char	af;
1823df8bae1dSRodney W. Grimes 	struct	walkarg w;
1824df8bae1dSRodney W. Grimes 
182552041295SPoul-Henning Kamp 	name ++;
182652041295SPoul-Henning Kamp 	namelen--;
182752041295SPoul-Henning Kamp 	if (req->newptr)
1828df8bae1dSRodney W. Grimes 		return (EPERM);
18294825b1e0SHiroki Sato 	if (name[1] == NET_RT_DUMP) {
18304825b1e0SHiroki Sato 		if (namelen == 3)
18314825b1e0SHiroki Sato 			fib = req->td->td_proc->p_fibnum;
18324825b1e0SHiroki Sato 		else if (namelen == 4)
18337d9b6df1SAlexander V. Chernikov 			fib = (name[3] == RT_ALL_FIBS) ?
18344825b1e0SHiroki Sato 			    req->td->td_proc->p_fibnum : name[3];
18354825b1e0SHiroki Sato 		else
18364825b1e0SHiroki Sato 			return ((namelen < 3) ? EISDIR : ENOTDIR);
18374825b1e0SHiroki Sato 		if (fib < 0 || fib >= rt_numfibs)
18384825b1e0SHiroki Sato 			return (EINVAL);
18394825b1e0SHiroki Sato 	} else if (namelen != 3)
1840f7a54d06SCrist J. Clark 		return ((namelen < 3) ? EISDIR : ENOTDIR);
1841df8bae1dSRodney W. Grimes 	af = name[0];
1842b2aaf46eSJeffrey Hsu 	if (af > AF_MAX)
1843b2aaf46eSJeffrey Hsu 		return (EINVAL);
18446b96f1afSLuigi Rizzo 	bzero(&w, sizeof(w));
1845df8bae1dSRodney W. Grimes 	w.w_op = name[1];
1846df8bae1dSRodney W. Grimes 	w.w_arg = name[2];
184752041295SPoul-Henning Kamp 	w.w_req = req;
1848df8bae1dSRodney W. Grimes 
1849fe0fc7efSChristian S.J. Peron 	error = sysctl_wire_old_buffer(req, 0);
1850fe0fc7efSChristian S.J. Peron 	if (error)
1851fe0fc7efSChristian S.J. Peron 		return (error);
1852df8bae1dSRodney W. Grimes 	switch (w.w_op) {
1853df8bae1dSRodney W. Grimes 
1854df8bae1dSRodney W. Grimes 	case NET_RT_DUMP:
1855df8bae1dSRodney W. Grimes 	case NET_RT_FLAGS:
1856a8b76c8fSLuigi Rizzo 		if (af == 0) {			/* dump all tables */
1857a8b76c8fSLuigi Rizzo 			i = 1;
1858a8b76c8fSLuigi Rizzo 			lim = AF_MAX;
1859a8b76c8fSLuigi Rizzo 		} else				/* dump only one table */
1860a8b76c8fSLuigi Rizzo 			i = lim = af;
18618eca593cSQing Li 
18628eca593cSQing Li 		/*
18638eca593cSQing Li 		 * take care of llinfo entries, the caller must
18648eca593cSQing Li 		 * specify an AF
18658eca593cSQing Li 		 */
186614981d80SQing Li 		if (w.w_op == NET_RT_FLAGS &&
186782b334e8SQing Li 		    (w.w_arg == 0 || w.w_arg & RTF_LLINFO)) {
18688eca593cSQing Li 			if (af != 0)
18698eca593cSQing Li 				error = lltable_sysctl_dumparp(af, w.w_req);
18708eca593cSQing Li 			else
18718eca593cSQing Li 				error = EINVAL;
18728eca593cSQing Li 			break;
18738eca593cSQing Li 		}
18748eca593cSQing Li 		/*
18758eca593cSQing Li 		 * take care of routing entries
18768eca593cSQing Li 		 */
187720b0cdb7SBjoern A. Zeeb 		for (error = 0; error == 0 && i <= lim; i++) {
18784825b1e0SHiroki Sato 			rnh = rt_tables_get_rnh(fib, i);
1879c2c2a7c1SBjoern A. Zeeb 			if (rnh != NULL) {
1880c2508034SAlexander V. Chernikov 				RADIX_NODE_HEAD_RLOCK(rnh);
1881956b0b65SJeffrey Hsu 			    	error = rnh->rnh_walktree(rnh,
1882fe0fc7efSChristian S.J. Peron 				    sysctl_dumpentry, &w);
1883c2508034SAlexander V. Chernikov 				RADIX_NODE_HEAD_RUNLOCK(rnh);
1884a8b76c8fSLuigi Rizzo 			} else if (af != 0)
1885956b0b65SJeffrey Hsu 				error = EAFNOSUPPORT;
188620b0cdb7SBjoern A. Zeeb 		}
1887df8bae1dSRodney W. Grimes 		break;
1888df8bae1dSRodney W. Grimes 
1889df8bae1dSRodney W. Grimes 	case NET_RT_IFLIST:
18906d076ae8SBjoern A. Zeeb 	case NET_RT_IFLISTL:
1891df8bae1dSRodney W. Grimes 		error = sysctl_iflist(af, &w);
189205b2efe0SBruce M Simpson 		break;
189305b2efe0SBruce M Simpson 
189405b2efe0SBruce M Simpson 	case NET_RT_IFMALIST:
189505b2efe0SBruce M Simpson 		error = sysctl_ifmalist(af, &w);
189605b2efe0SBruce M Simpson 		break;
1897df8bae1dSRodney W. Grimes 	}
1898df8bae1dSRodney W. Grimes 	if (w.w_tmem)
1899df8bae1dSRodney W. Grimes 		free(w.w_tmem, M_RTABLE);
1900df8bae1dSRodney W. Grimes 	return (error);
1901df8bae1dSRodney W. Grimes }
1902df8bae1dSRodney W. Grimes 
19036472ac3dSEd Schouten static SYSCTL_NODE(_net, PF_ROUTE, routetable, CTLFLAG_RD, sysctl_rtsock, "");
190452041295SPoul-Henning Kamp 
1905df8bae1dSRodney W. Grimes /*
1906df8bae1dSRodney W. Grimes  * Definitions of protocols supported in the ROUTE domain.
1907df8bae1dSRodney W. Grimes  */
1908df8bae1dSRodney W. Grimes 
19095b1c0294SDavid E. O'Brien static struct domain routedomain;		/* or at least forward */
1910df8bae1dSRodney W. Grimes 
191152041295SPoul-Henning Kamp static struct protosw routesw[] = {
1912303989a2SRuslan Ermilov {
1913303989a2SRuslan Ermilov 	.pr_type =		SOCK_RAW,
1914303989a2SRuslan Ermilov 	.pr_domain =		&routedomain,
1915303989a2SRuslan Ermilov 	.pr_flags =		PR_ATOMIC|PR_ADDR,
1916303989a2SRuslan Ermilov 	.pr_output =		route_output,
1917303989a2SRuslan Ermilov 	.pr_ctlinput =		raw_ctlinput,
1918303989a2SRuslan Ermilov 	.pr_init =		raw_init,
1919303989a2SRuslan Ermilov 	.pr_usrreqs =		&route_usrreqs
1920df8bae1dSRodney W. Grimes }
1921df8bae1dSRodney W. Grimes };
1922df8bae1dSRodney W. Grimes 
1923303989a2SRuslan Ermilov static struct domain routedomain = {
1924303989a2SRuslan Ermilov 	.dom_family =		PF_ROUTE,
1925303989a2SRuslan Ermilov 	.dom_name =		 "route",
1926303989a2SRuslan Ermilov 	.dom_protosw =		routesw,
1927303989a2SRuslan Ermilov 	.dom_protoswNPROTOSW =	&routesw[sizeof(routesw)/sizeof(routesw[0])]
1928303989a2SRuslan Ermilov };
192978a82810SGarrett Wollman 
1930d0728d71SRobert Watson VNET_DOMAIN_SET(route);
1931