xref: /freebsd/sys/net/rtsock.c (revision 6db47af467bfd4b4f7a625cf71f2048f3660bd38)
1c398230bSWarner Losh /*-
2df8bae1dSRodney W. Grimes  * Copyright (c) 1988, 1991, 1993
3df8bae1dSRodney W. Grimes  *	The Regents of the University of California.  All rights reserved.
4df8bae1dSRodney W. Grimes  *
5df8bae1dSRodney W. Grimes  * Redistribution and use in source and binary forms, with or without
6df8bae1dSRodney W. Grimes  * modification, are permitted provided that the following conditions
7df8bae1dSRodney W. Grimes  * are met:
8df8bae1dSRodney W. Grimes  * 1. Redistributions of source code must retain the above copyright
9df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer.
10df8bae1dSRodney W. Grimes  * 2. Redistributions in binary form must reproduce the above copyright
11df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer in the
12df8bae1dSRodney W. Grimes  *    documentation and/or other materials provided with the distribution.
13df8bae1dSRodney W. Grimes  * 4. Neither the name of the University nor the names of its contributors
14df8bae1dSRodney W. Grimes  *    may be used to endorse or promote products derived from this software
15df8bae1dSRodney W. Grimes  *    without specific prior written permission.
16df8bae1dSRodney W. Grimes  *
17df8bae1dSRodney W. Grimes  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
18df8bae1dSRodney W. Grimes  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19df8bae1dSRodney W. Grimes  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20df8bae1dSRodney W. Grimes  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
21df8bae1dSRodney W. Grimes  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22df8bae1dSRodney W. Grimes  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23df8bae1dSRodney W. Grimes  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24df8bae1dSRodney W. Grimes  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25df8bae1dSRodney W. Grimes  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26df8bae1dSRodney W. Grimes  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27df8bae1dSRodney W. Grimes  * SUCH DAMAGE.
28df8bae1dSRodney W. Grimes  *
2928070a0eSRuslan Ermilov  *	@(#)rtsock.c	8.7 (Berkeley) 10/12/95
30c3aac50fSPeter Wemm  * $FreeBSD$
31df8bae1dSRodney W. Grimes  */
32427a928aSKonstantin Belousov #include "opt_compat.h"
33e440aed9SQing Li #include "opt_mpath.h"
34413628a7SBjoern A. Zeeb #include "opt_inet.h"
35413628a7SBjoern A. Zeeb #include "opt_inet6.h"
36e440aed9SQing Li 
37df8bae1dSRodney W. Grimes #include <sys/param.h>
38960ed29cSSeigo Tanimura #include <sys/jail.h>
39413628a7SBjoern A. Zeeb #include <sys/kernel.h>
40d0728d71SRobert Watson #include <sys/domain.h>
41609ff41fSWarner Losh #include <sys/lock.h>
424d1d4912SBruce Evans #include <sys/malloc.h>
43df8bae1dSRodney W. Grimes #include <sys/mbuf.h>
44acd3428bSRobert Watson #include <sys/priv.h>
45960ed29cSSeigo Tanimura #include <sys/proc.h>
46960ed29cSSeigo Tanimura #include <sys/protosw.h>
473120b9d4SKip Macy #include <sys/rwlock.h>
48960ed29cSSeigo Tanimura #include <sys/signalvar.h>
49df8bae1dSRodney W. Grimes #include <sys/socket.h>
50df8bae1dSRodney W. Grimes #include <sys/socketvar.h>
51960ed29cSSeigo Tanimura #include <sys/sysctl.h>
52960ed29cSSeigo Tanimura #include <sys/systm.h>
53df8bae1dSRodney W. Grimes 
54df8bae1dSRodney W. Grimes #include <net/if.h>
5576039bc8SGleb Smirnoff #include <net/if_var.h>
568eca593cSQing Li #include <net/if_dl.h>
576e6b3f7cSQing Li #include <net/if_llatbl.h>
580ed6142bSQing Li #include <net/if_types.h>
59d989c7b3SRobert Watson #include <net/netisr.h>
60df8bae1dSRodney W. Grimes #include <net/raw_cb.h>
61960ed29cSSeigo Tanimura #include <net/route.h>
624b79449eSBjoern A. Zeeb #include <net/vnet.h>
63df8bae1dSRodney W. Grimes 
645a59cefcSBosko Milekic #include <netinet/in.h>
65c7ab6602SQing Li #include <netinet/if_ether.h>
6608b68b0eSGleb Smirnoff #include <netinet/ip_carp.h>
67413628a7SBjoern A. Zeeb #ifdef INET6
680bebb544SHiroki Sato #include <netinet6/ip6_var.h>
69413628a7SBjoern A. Zeeb #include <netinet6/scope6_var.h>
70413628a7SBjoern A. Zeeb #endif
715a59cefcSBosko Milekic 
72427a928aSKonstantin Belousov #ifdef COMPAT_FREEBSD32
73427a928aSKonstantin Belousov #include <sys/mount.h>
74427a928aSKonstantin Belousov #include <compat/freebsd32/freebsd32.h>
75427a928aSKonstantin Belousov 
76427a928aSKonstantin Belousov struct if_msghdr32 {
77427a928aSKonstantin Belousov 	uint16_t ifm_msglen;
78427a928aSKonstantin Belousov 	uint8_t	ifm_version;
79427a928aSKonstantin Belousov 	uint8_t	ifm_type;
80427a928aSKonstantin Belousov 	int32_t	ifm_addrs;
81427a928aSKonstantin Belousov 	int32_t	ifm_flags;
82427a928aSKonstantin Belousov 	uint16_t ifm_index;
83b245f96cSGleb Smirnoff 	struct	if_data ifm_data;
84427a928aSKonstantin Belousov };
856d076ae8SBjoern A. Zeeb 
866d076ae8SBjoern A. Zeeb struct if_msghdrl32 {
876d076ae8SBjoern A. Zeeb 	uint16_t ifm_msglen;
886d076ae8SBjoern A. Zeeb 	uint8_t	ifm_version;
896d076ae8SBjoern A. Zeeb 	uint8_t	ifm_type;
906d076ae8SBjoern A. Zeeb 	int32_t	ifm_addrs;
916d076ae8SBjoern A. Zeeb 	int32_t	ifm_flags;
926d076ae8SBjoern A. Zeeb 	uint16_t ifm_index;
936d076ae8SBjoern A. Zeeb 	uint16_t _ifm_spare1;
946d076ae8SBjoern A. Zeeb 	uint16_t ifm_len;
956d076ae8SBjoern A. Zeeb 	uint16_t ifm_data_off;
96b245f96cSGleb Smirnoff 	struct	if_data ifm_data;
976d076ae8SBjoern A. Zeeb };
986d076ae8SBjoern A. Zeeb 
996d076ae8SBjoern A. Zeeb struct ifa_msghdrl32 {
1006d076ae8SBjoern A. Zeeb 	uint16_t ifam_msglen;
1016d076ae8SBjoern A. Zeeb 	uint8_t	ifam_version;
1026d076ae8SBjoern A. Zeeb 	uint8_t	ifam_type;
1036d076ae8SBjoern A. Zeeb 	int32_t	ifam_addrs;
1046d076ae8SBjoern A. Zeeb 	int32_t	ifam_flags;
1056d076ae8SBjoern A. Zeeb 	uint16_t ifam_index;
1066d076ae8SBjoern A. Zeeb 	uint16_t _ifam_spare1;
1076d076ae8SBjoern A. Zeeb 	uint16_t ifam_len;
1086d076ae8SBjoern A. Zeeb 	uint16_t ifam_data_off;
1096d076ae8SBjoern A. Zeeb 	int32_t	ifam_metric;
110b245f96cSGleb Smirnoff 	struct	if_data ifam_data;
1116d076ae8SBjoern A. Zeeb };
1126d076ae8SBjoern A. Zeeb #endif /* COMPAT_FREEBSD32 */
113427a928aSKonstantin Belousov 
114a1c995b6SPoul-Henning Kamp MALLOC_DEFINE(M_RTABLE, "routetbl", "routing tables");
115a1c995b6SPoul-Henning Kamp 
116becc44d7SSam Leffler /* NB: these are not modified */
11752041295SPoul-Henning Kamp static struct	sockaddr route_src = { 2, PF_ROUTE, };
118076d0761SJulian Elischer static struct	sockaddr sa_zero   = { sizeof(sa_zero), AF_INET, };
119becc44d7SSam Leffler 
12008b68b0eSGleb Smirnoff /* These are external hooks for CARP. */
12108b68b0eSGleb Smirnoff int	(*carp_get_vhid_p)(struct ifaddr *);
12208b68b0eSGleb Smirnoff 
/*
 * Mbuf flag consulted by the rtsock raw_input callback: when it is set on
 * an update notification, the callback decides per socket whether the
 * message should be filtered based on the FIB the socket is bound to.
 */
#define	RTS_FILTER_FIB	M_PROTO8
128528737fdSBjoern A. Zeeb 
129c5d4eab6SMarko Zec typedef struct {
13018aee723SPeter Pentchev 	int	ip_count;	/* attached w/ AF_INET */
131becc44d7SSam Leffler 	int	ip6_count;	/* attached w/ AF_INET6 */
132becc44d7SSam Leffler 	int	any_count;	/* total attached */
133c5d4eab6SMarko Zec } route_cb_t;
134c5d4eab6SMarko Zec static VNET_DEFINE(route_cb_t, route_cb);
135c5d4eab6SMarko Zec #define	V_route_cb VNET(route_cb)
136df8bae1dSRodney W. Grimes 
137aea8b30fSSam Leffler struct mtx rtsock_mtx;
138aea8b30fSSam Leffler MTX_SYSINIT(rtsock, &rtsock_mtx, "rtsock route_cb lock", MTX_DEF);
139aea8b30fSSam Leffler 
140aea8b30fSSam Leffler #define	RTSOCK_LOCK()	mtx_lock(&rtsock_mtx)
141aea8b30fSSam Leffler #define	RTSOCK_UNLOCK()	mtx_unlock(&rtsock_mtx)
142aea8b30fSSam Leffler #define	RTSOCK_LOCK_ASSERT()	mtx_assert(&rtsock_mtx, MA_OWNED)
143aea8b30fSSam Leffler 
1446472ac3dSEd Schouten static SYSCTL_NODE(_net, OID_AUTO, route, CTLFLAG_RD, 0, "");
145190a4c94SRobert Watson 
146df8bae1dSRodney W. Grimes struct walkarg {
14752041295SPoul-Henning Kamp 	int	w_tmemsize;
14852041295SPoul-Henning Kamp 	int	w_op, w_arg;
14952041295SPoul-Henning Kamp 	caddr_t	w_tmem;
15052041295SPoul-Henning Kamp 	struct sysctl_req *w_req;
151df8bae1dSRodney W. Grimes };
152df8bae1dSRodney W. Grimes 
153d989c7b3SRobert Watson static void	rts_input(struct mbuf *m);
154*6db47af4SAlexander V. Chernikov static struct mbuf *rtsock_msg_mbuf(int type, struct rt_addrinfo *rtinfo);
155f2e5eb36SAlexander V. Chernikov static int	rtsock_msg_buffer(int type, struct rt_addrinfo *rtinfo,
156f2e5eb36SAlexander V. Chernikov 			struct walkarg *w, int *plen);
1575dfc91d7SLuigi Rizzo static int	rt_xaddrs(caddr_t cp, caddr_t cplim,
1585dfc91d7SLuigi Rizzo 			struct rt_addrinfo *rtinfo);
159929ddbbbSAlfred Perlstein static int	sysctl_dumpentry(struct radix_node *rn, void *vw);
160929ddbbbSAlfred Perlstein static int	sysctl_iflist(int af, struct walkarg *w);
16105b2efe0SBruce M Simpson static int	sysctl_ifmalist(int af, struct walkarg *w);
1625dfc91d7SLuigi Rizzo static int	route_output(struct mbuf *m, struct socket *so);
163e3a7aa6fSGleb Smirnoff static void	rt_getmetrics(const struct rtentry *rt, struct rt_metrics *out);
1643ca1a2d6SMax Laier static void	rt_dispatch(struct mbuf *, sa_family_t);
1653deb3649SAlexander V. Chernikov static struct sockaddr	*rtsock_fix_netmask(struct sockaddr *dst,
1663deb3649SAlexander V. Chernikov 			struct sockaddr *smask, struct sockaddr_storage *dmask);
167df8bae1dSRodney W. Grimes 
168d4b5cae4SRobert Watson static struct netisr_handler rtsock_nh = {
169d4b5cae4SRobert Watson 	.nh_name = "rtsock",
170d4b5cae4SRobert Watson 	.nh_handler = rts_input,
171d4b5cae4SRobert Watson 	.nh_proto = NETISR_ROUTE,
172d4b5cae4SRobert Watson 	.nh_policy = NETISR_POLICY_SOURCE,
173d4b5cae4SRobert Watson };
174d4b5cae4SRobert Watson 
175d4b5cae4SRobert Watson static int
176d4b5cae4SRobert Watson sysctl_route_netisr_maxqlen(SYSCTL_HANDLER_ARGS)
177d4b5cae4SRobert Watson {
178d4b5cae4SRobert Watson 	int error, qlimit;
179d4b5cae4SRobert Watson 
180d4b5cae4SRobert Watson 	netisr_getqlimit(&rtsock_nh, &qlimit);
181d4b5cae4SRobert Watson 	error = sysctl_handle_int(oidp, &qlimit, 0, req);
182d4b5cae4SRobert Watson         if (error || !req->newptr)
183d4b5cae4SRobert Watson                 return (error);
184d4b5cae4SRobert Watson 	if (qlimit < 1)
185d4b5cae4SRobert Watson 		return (EINVAL);
186d4b5cae4SRobert Watson 	return (netisr_setqlimit(&rtsock_nh, qlimit));
187d4b5cae4SRobert Watson }
188d4b5cae4SRobert Watson SYSCTL_PROC(_net_route, OID_AUTO, netisr_maxqlen, CTLTYPE_INT|CTLFLAG_RW,
189d4b5cae4SRobert Watson     0, 0, sysctl_route_netisr_maxqlen, "I",
190d4b5cae4SRobert Watson     "maximum routing socket dispatch queue length");
191d4b5cae4SRobert Watson 
192d989c7b3SRobert Watson static void
193d989c7b3SRobert Watson rts_init(void)
194d989c7b3SRobert Watson {
195b062951aSRobert Watson 	int tmp;
196d989c7b3SRobert Watson 
197b062951aSRobert Watson 	if (TUNABLE_INT_FETCH("net.route.netisr_maxqlen", &tmp))
198d4b5cae4SRobert Watson 		rtsock_nh.nh_qlimit = tmp;
199d4b5cae4SRobert Watson 	netisr_register(&rtsock_nh);
200d989c7b3SRobert Watson }
201237fdd78SRobert Watson SYSINIT(rtsock, SI_SUB_PROTO_DOMAIN, SI_ORDER_THIRD, rts_init, 0);
202d989c7b3SRobert Watson 
203528737fdSBjoern A. Zeeb static int
204528737fdSBjoern A. Zeeb raw_input_rts_cb(struct mbuf *m, struct sockproto *proto, struct sockaddr *src,
205528737fdSBjoern A. Zeeb     struct rawcb *rp)
206528737fdSBjoern A. Zeeb {
207528737fdSBjoern A. Zeeb 	int fibnum;
208528737fdSBjoern A. Zeeb 
209528737fdSBjoern A. Zeeb 	KASSERT(m != NULL, ("%s: m is NULL", __func__));
210528737fdSBjoern A. Zeeb 	KASSERT(proto != NULL, ("%s: proto is NULL", __func__));
211528737fdSBjoern A. Zeeb 	KASSERT(rp != NULL, ("%s: rp is NULL", __func__));
212528737fdSBjoern A. Zeeb 
213528737fdSBjoern A. Zeeb 	/* No filtering requested. */
214528737fdSBjoern A. Zeeb 	if ((m->m_flags & RTS_FILTER_FIB) == 0)
215528737fdSBjoern A. Zeeb 		return (0);
216528737fdSBjoern A. Zeeb 
217528737fdSBjoern A. Zeeb 	/* Check if it is a rts and the fib matches the one of the socket. */
218528737fdSBjoern A. Zeeb 	fibnum = M_GETFIB(m);
219528737fdSBjoern A. Zeeb 	if (proto->sp_family != PF_ROUTE ||
220528737fdSBjoern A. Zeeb 	    rp->rcb_socket == NULL ||
221528737fdSBjoern A. Zeeb 	    rp->rcb_socket->so_fibnum == fibnum)
222528737fdSBjoern A. Zeeb 		return (0);
223528737fdSBjoern A. Zeeb 
224528737fdSBjoern A. Zeeb 	/* Filtering requested and no match, the socket shall be skipped. */
225528737fdSBjoern A. Zeeb 	return (1);
226528737fdSBjoern A. Zeeb }
227528737fdSBjoern A. Zeeb 
228d989c7b3SRobert Watson static void
229d989c7b3SRobert Watson rts_input(struct mbuf *m)
230d989c7b3SRobert Watson {
231d989c7b3SRobert Watson 	struct sockproto route_proto;
232d989c7b3SRobert Watson 	unsigned short *family;
233d989c7b3SRobert Watson 	struct m_tag *tag;
234d989c7b3SRobert Watson 
235d989c7b3SRobert Watson 	route_proto.sp_family = PF_ROUTE;
236d989c7b3SRobert Watson 	tag = m_tag_find(m, PACKET_TAG_RTSOCKFAM, NULL);
237d989c7b3SRobert Watson 	if (tag != NULL) {
238d989c7b3SRobert Watson 		family = (unsigned short *)(tag + 1);
239d989c7b3SRobert Watson 		route_proto.sp_protocol = *family;
240d989c7b3SRobert Watson 		m_tag_delete(m, tag);
241d989c7b3SRobert Watson 	} else
242d989c7b3SRobert Watson 		route_proto.sp_protocol = 0;
243d989c7b3SRobert Watson 
244528737fdSBjoern A. Zeeb 	raw_input_ext(m, &route_proto, &route_src, raw_input_rts_cb);
245d989c7b3SRobert Watson }
246d989c7b3SRobert Watson 
247a29f300eSGarrett Wollman /*
248a29f300eSGarrett Wollman  * It really doesn't make any sense at all for this code to share much
249a29f300eSGarrett Wollman  * with raw_usrreq.c, since its functionality is so restricted.  XXX
250a29f300eSGarrett Wollman  */
251ac45e92fSRobert Watson static void
252a29f300eSGarrett Wollman rts_abort(struct socket *so)
253df8bae1dSRodney W. Grimes {
2547e994955SRobert Watson 
255ac45e92fSRobert Watson 	raw_usrreqs.pru_abort(so);
256df8bae1dSRodney W. Grimes }
257a29f300eSGarrett Wollman 
258a152f8a3SRobert Watson static void
259a152f8a3SRobert Watson rts_close(struct socket *so)
260a152f8a3SRobert Watson {
261a152f8a3SRobert Watson 
262a152f8a3SRobert Watson 	raw_usrreqs.pru_close(so);
263a152f8a3SRobert Watson }
264a152f8a3SRobert Watson 
265a29f300eSGarrett Wollman /* pru_accept is EOPNOTSUPP */
266a29f300eSGarrett Wollman 
267a29f300eSGarrett Wollman static int
268b40ce416SJulian Elischer rts_attach(struct socket *so, int proto, struct thread *td)
269a29f300eSGarrett Wollman {
270a29f300eSGarrett Wollman 	struct rawcb *rp;
271c9b652e3SAndre Oppermann 	int error;
272a29f300eSGarrett Wollman 
273bc725eafSRobert Watson 	KASSERT(so->so_pcb == NULL, ("rts_attach: so_pcb != NULL"));
274bc725eafSRobert Watson 
2757cc0979fSDavid Malone 	/* XXX */
2761ede983cSDag-Erling Smørgrav 	rp = malloc(sizeof *rp, M_PCB, M_WAITOK | M_ZERO);
2775dfc91d7SLuigi Rizzo 	if (rp == NULL)
278a29f300eSGarrett Wollman 		return ENOBUFS;
279a29f300eSGarrett Wollman 
280a29f300eSGarrett Wollman 	so->so_pcb = (caddr_t)rp;
2818b07e49aSJulian Elischer 	so->so_fibnum = td->td_proc->p_fibnum;
282162c0b2eSRuslan Ermilov 	error = raw_attach(so, proto);
283a29f300eSGarrett Wollman 	rp = sotorawcb(so);
284a29f300eSGarrett Wollman 	if (error) {
2857ba271aeSJonathan Chen 		so->so_pcb = NULL;
286a29f300eSGarrett Wollman 		free(rp, M_PCB);
287a29f300eSGarrett Wollman 		return error;
288a29f300eSGarrett Wollman 	}
289aea8b30fSSam Leffler 	RTSOCK_LOCK();
290a29f300eSGarrett Wollman 	switch(rp->rcb_proto.sp_protocol) {
291a29f300eSGarrett Wollman 	case AF_INET:
292c5d4eab6SMarko Zec 		V_route_cb.ip_count++;
293a29f300eSGarrett Wollman 		break;
294899ce4f4SYoshinobu Inoue 	case AF_INET6:
295c5d4eab6SMarko Zec 		V_route_cb.ip6_count++;
296899ce4f4SYoshinobu Inoue 		break;
297a29f300eSGarrett Wollman 	}
298c5d4eab6SMarko Zec 	V_route_cb.any_count++;
299aea8b30fSSam Leffler 	RTSOCK_UNLOCK();
30003e49181SSeigo Tanimura 	soisconnected(so);
301df8bae1dSRodney W. Grimes 	so->so_options |= SO_USELOOPBACK;
302a29f300eSGarrett Wollman 	return 0;
303df8bae1dSRodney W. Grimes }
304df8bae1dSRodney W. Grimes 
305a29f300eSGarrett Wollman static int
306b40ce416SJulian Elischer rts_bind(struct socket *so, struct sockaddr *nam, struct thread *td)
307a29f300eSGarrett Wollman {
3087e994955SRobert Watson 
3097e994955SRobert Watson 	return (raw_usrreqs.pru_bind(so, nam, td)); /* xxx just EINVAL */
310a29f300eSGarrett Wollman }
311a29f300eSGarrett Wollman 
312a29f300eSGarrett Wollman static int
313b40ce416SJulian Elischer rts_connect(struct socket *so, struct sockaddr *nam, struct thread *td)
314a29f300eSGarrett Wollman {
3157e994955SRobert Watson 
3167e994955SRobert Watson 	return (raw_usrreqs.pru_connect(so, nam, td)); /* XXX just EINVAL */
317a29f300eSGarrett Wollman }
318a29f300eSGarrett Wollman 
319a29f300eSGarrett Wollman /* pru_connect2 is EOPNOTSUPP */
320a29f300eSGarrett Wollman /* pru_control is EOPNOTSUPP */
321a29f300eSGarrett Wollman 
322bc725eafSRobert Watson static void
323a29f300eSGarrett Wollman rts_detach(struct socket *so)
324a29f300eSGarrett Wollman {
325a29f300eSGarrett Wollman 	struct rawcb *rp = sotorawcb(so);
326a29f300eSGarrett Wollman 
327bc725eafSRobert Watson 	KASSERT(rp != NULL, ("rts_detach: rp == NULL"));
328bc725eafSRobert Watson 
329aea8b30fSSam Leffler 	RTSOCK_LOCK();
330a29f300eSGarrett Wollman 	switch(rp->rcb_proto.sp_protocol) {
331a29f300eSGarrett Wollman 	case AF_INET:
332c5d4eab6SMarko Zec 		V_route_cb.ip_count--;
333a29f300eSGarrett Wollman 		break;
334899ce4f4SYoshinobu Inoue 	case AF_INET6:
335c5d4eab6SMarko Zec 		V_route_cb.ip6_count--;
336899ce4f4SYoshinobu Inoue 		break;
337a29f300eSGarrett Wollman 	}
338c5d4eab6SMarko Zec 	V_route_cb.any_count--;
339aea8b30fSSam Leffler 	RTSOCK_UNLOCK();
340bc725eafSRobert Watson 	raw_usrreqs.pru_detach(so);
341a29f300eSGarrett Wollman }
342a29f300eSGarrett Wollman 
343a29f300eSGarrett Wollman static int
344a29f300eSGarrett Wollman rts_disconnect(struct socket *so)
345a29f300eSGarrett Wollman {
3467e994955SRobert Watson 
3477e994955SRobert Watson 	return (raw_usrreqs.pru_disconnect(so));
348a29f300eSGarrett Wollman }
349a29f300eSGarrett Wollman 
350a29f300eSGarrett Wollman /* pru_listen is EOPNOTSUPP */
351a29f300eSGarrett Wollman 
352a29f300eSGarrett Wollman static int
35357bf258eSGarrett Wollman rts_peeraddr(struct socket *so, struct sockaddr **nam)
354a29f300eSGarrett Wollman {
3557e994955SRobert Watson 
3567e994955SRobert Watson 	return (raw_usrreqs.pru_peeraddr(so, nam));
357a29f300eSGarrett Wollman }
358a29f300eSGarrett Wollman 
359a29f300eSGarrett Wollman /* pru_rcvd is EOPNOTSUPP */
360a29f300eSGarrett Wollman /* pru_rcvoob is EOPNOTSUPP */
361a29f300eSGarrett Wollman 
362a29f300eSGarrett Wollman static int
36357bf258eSGarrett Wollman rts_send(struct socket *so, int flags, struct mbuf *m, struct sockaddr *nam,
364b40ce416SJulian Elischer 	 struct mbuf *control, struct thread *td)
365a29f300eSGarrett Wollman {
3667e994955SRobert Watson 
3677e994955SRobert Watson 	return (raw_usrreqs.pru_send(so, flags, m, nam, control, td));
368a29f300eSGarrett Wollman }
369a29f300eSGarrett Wollman 
370a29f300eSGarrett Wollman /* pru_sense is null */
371a29f300eSGarrett Wollman 
372a29f300eSGarrett Wollman static int
373a29f300eSGarrett Wollman rts_shutdown(struct socket *so)
374a29f300eSGarrett Wollman {
3757e994955SRobert Watson 
3767e994955SRobert Watson 	return (raw_usrreqs.pru_shutdown(so));
377a29f300eSGarrett Wollman }
378a29f300eSGarrett Wollman 
379a29f300eSGarrett Wollman static int
38057bf258eSGarrett Wollman rts_sockaddr(struct socket *so, struct sockaddr **nam)
381a29f300eSGarrett Wollman {
3827e994955SRobert Watson 
3837e994955SRobert Watson 	return (raw_usrreqs.pru_sockaddr(so, nam));
384a29f300eSGarrett Wollman }
385a29f300eSGarrett Wollman 
386a29f300eSGarrett Wollman static struct pr_usrreqs route_usrreqs = {
387756d52a1SPoul-Henning Kamp 	.pru_abort =		rts_abort,
388756d52a1SPoul-Henning Kamp 	.pru_attach =		rts_attach,
389756d52a1SPoul-Henning Kamp 	.pru_bind =		rts_bind,
390756d52a1SPoul-Henning Kamp 	.pru_connect =		rts_connect,
391756d52a1SPoul-Henning Kamp 	.pru_detach =		rts_detach,
392756d52a1SPoul-Henning Kamp 	.pru_disconnect =	rts_disconnect,
393756d52a1SPoul-Henning Kamp 	.pru_peeraddr =		rts_peeraddr,
394756d52a1SPoul-Henning Kamp 	.pru_send =		rts_send,
395756d52a1SPoul-Henning Kamp 	.pru_shutdown =		rts_shutdown,
396756d52a1SPoul-Henning Kamp 	.pru_sockaddr =		rts_sockaddr,
397a152f8a3SRobert Watson 	.pru_close =		rts_close,
398a29f300eSGarrett Wollman };
399a29f300eSGarrett Wollman 
#ifndef _SOCKADDR_UNION_DEFINED
#define	_SOCKADDR_UNION_DEFINED
/*
 * Storage that can hold any of the address formats handled here: a
 * generic sockaddr, an IPv4 sockaddr_in or an IPv6 sockaddr_in6.  The
 * guard macro keeps the union from being defined twice.
 */
union sockaddr_union {
	struct sockaddr		sa;
	struct sockaddr_in	sin;
	struct sockaddr_in6	sin6;
};
#endif /* _SOCKADDR_UNION_DEFINED */
411413628a7SBjoern A. Zeeb 
412413628a7SBjoern A. Zeeb static int
413413628a7SBjoern A. Zeeb rtm_get_jailed(struct rt_addrinfo *info, struct ifnet *ifp,
414413628a7SBjoern A. Zeeb     struct rtentry *rt, union sockaddr_union *saun, struct ucred *cred)
415413628a7SBjoern A. Zeeb {
416413628a7SBjoern A. Zeeb 
4179c79d243SJamie Gritton 	/* First, see if the returned address is part of the jail. */
4189c79d243SJamie Gritton 	if (prison_if(cred, rt->rt_ifa->ifa_addr) == 0) {
4199c79d243SJamie Gritton 		info->rti_info[RTAX_IFA] = rt->rt_ifa->ifa_addr;
4209c79d243SJamie Gritton 		return (0);
4219c79d243SJamie Gritton 	}
4229c79d243SJamie Gritton 
423413628a7SBjoern A. Zeeb 	switch (info->rti_info[RTAX_DST]->sa_family) {
424413628a7SBjoern A. Zeeb #ifdef INET
425413628a7SBjoern A. Zeeb 	case AF_INET:
426413628a7SBjoern A. Zeeb 	{
427413628a7SBjoern A. Zeeb 		struct in_addr ia;
428413628a7SBjoern A. Zeeb 		struct ifaddr *ifa;
429413628a7SBjoern A. Zeeb 		int found;
430413628a7SBjoern A. Zeeb 
431413628a7SBjoern A. Zeeb 		found = 0;
432413628a7SBjoern A. Zeeb 		/*
4339c79d243SJamie Gritton 		 * Try to find an address on the given outgoing interface
4349c79d243SJamie Gritton 		 * that belongs to the jail.
435413628a7SBjoern A. Zeeb 		 */
436137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
437413628a7SBjoern A. Zeeb 		TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) {
438413628a7SBjoern A. Zeeb 			struct sockaddr *sa;
439413628a7SBjoern A. Zeeb 			sa = ifa->ifa_addr;
440413628a7SBjoern A. Zeeb 			if (sa->sa_family != AF_INET)
441413628a7SBjoern A. Zeeb 				continue;
442413628a7SBjoern A. Zeeb 			ia = ((struct sockaddr_in *)sa)->sin_addr;
443b89e82ddSJamie Gritton 			if (prison_check_ip4(cred, &ia) == 0) {
444413628a7SBjoern A. Zeeb 				found = 1;
445413628a7SBjoern A. Zeeb 				break;
446413628a7SBjoern A. Zeeb 			}
447413628a7SBjoern A. Zeeb 		}
448137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
449413628a7SBjoern A. Zeeb 		if (!found) {
450413628a7SBjoern A. Zeeb 			/*
4519c79d243SJamie Gritton 			 * As a last resort return the 'default' jail address.
452413628a7SBjoern A. Zeeb 			 */
4530304c731SJamie Gritton 			ia = ((struct sockaddr_in *)rt->rt_ifa->ifa_addr)->
4540304c731SJamie Gritton 			    sin_addr;
4551cecba0fSBjoern A. Zeeb 			if (prison_get_ip4(cred, &ia) != 0)
456413628a7SBjoern A. Zeeb 				return (ESRCH);
457413628a7SBjoern A. Zeeb 		}
458413628a7SBjoern A. Zeeb 		bzero(&saun->sin, sizeof(struct sockaddr_in));
459413628a7SBjoern A. Zeeb 		saun->sin.sin_len = sizeof(struct sockaddr_in);
460413628a7SBjoern A. Zeeb 		saun->sin.sin_family = AF_INET;
461413628a7SBjoern A. Zeeb 		saun->sin.sin_addr.s_addr = ia.s_addr;
4629c79d243SJamie Gritton 		info->rti_info[RTAX_IFA] = (struct sockaddr *)&saun->sin;
463413628a7SBjoern A. Zeeb 		break;
464413628a7SBjoern A. Zeeb 	}
465413628a7SBjoern A. Zeeb #endif
466413628a7SBjoern A. Zeeb #ifdef INET6
467413628a7SBjoern A. Zeeb 	case AF_INET6:
468413628a7SBjoern A. Zeeb 	{
469413628a7SBjoern A. Zeeb 		struct in6_addr ia6;
470413628a7SBjoern A. Zeeb 		struct ifaddr *ifa;
471413628a7SBjoern A. Zeeb 		int found;
472413628a7SBjoern A. Zeeb 
473413628a7SBjoern A. Zeeb 		found = 0;
474413628a7SBjoern A. Zeeb 		/*
4759c79d243SJamie Gritton 		 * Try to find an address on the given outgoing interface
4769c79d243SJamie Gritton 		 * that belongs to the jail.
477413628a7SBjoern A. Zeeb 		 */
478137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
479413628a7SBjoern A. Zeeb 		TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) {
480413628a7SBjoern A. Zeeb 			struct sockaddr *sa;
481413628a7SBjoern A. Zeeb 			sa = ifa->ifa_addr;
482413628a7SBjoern A. Zeeb 			if (sa->sa_family != AF_INET6)
483413628a7SBjoern A. Zeeb 				continue;
484413628a7SBjoern A. Zeeb 			bcopy(&((struct sockaddr_in6 *)sa)->sin6_addr,
485413628a7SBjoern A. Zeeb 			    &ia6, sizeof(struct in6_addr));
486b89e82ddSJamie Gritton 			if (prison_check_ip6(cred, &ia6) == 0) {
487413628a7SBjoern A. Zeeb 				found = 1;
488413628a7SBjoern A. Zeeb 				break;
489413628a7SBjoern A. Zeeb 			}
490413628a7SBjoern A. Zeeb 		}
491137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
492413628a7SBjoern A. Zeeb 		if (!found) {
493413628a7SBjoern A. Zeeb 			/*
4949c79d243SJamie Gritton 			 * As a last resort return the 'default' jail address.
495413628a7SBjoern A. Zeeb 			 */
4960304c731SJamie Gritton 			ia6 = ((struct sockaddr_in6 *)rt->rt_ifa->ifa_addr)->
4970304c731SJamie Gritton 			    sin6_addr;
4981cecba0fSBjoern A. Zeeb 			if (prison_get_ip6(cred, &ia6) != 0)
499413628a7SBjoern A. Zeeb 				return (ESRCH);
500413628a7SBjoern A. Zeeb 		}
501413628a7SBjoern A. Zeeb 		bzero(&saun->sin6, sizeof(struct sockaddr_in6));
502413628a7SBjoern A. Zeeb 		saun->sin6.sin6_len = sizeof(struct sockaddr_in6);
503413628a7SBjoern A. Zeeb 		saun->sin6.sin6_family = AF_INET6;
5049c79d243SJamie Gritton 		bcopy(&ia6, &saun->sin6.sin6_addr, sizeof(struct in6_addr));
505413628a7SBjoern A. Zeeb 		if (sa6_recoverscope(&saun->sin6) != 0)
506413628a7SBjoern A. Zeeb 			return (ESRCH);
5079c79d243SJamie Gritton 		info->rti_info[RTAX_IFA] = (struct sockaddr *)&saun->sin6;
508413628a7SBjoern A. Zeeb 		break;
509413628a7SBjoern A. Zeeb 	}
510413628a7SBjoern A. Zeeb #endif
511413628a7SBjoern A. Zeeb 	default:
512413628a7SBjoern A. Zeeb 		return (ESRCH);
513413628a7SBjoern A. Zeeb 	}
514413628a7SBjoern A. Zeeb 	return (0);
515413628a7SBjoern A. Zeeb }
516413628a7SBjoern A. Zeeb 
517df8bae1dSRodney W. Grimes /*ARGSUSED*/
51852041295SPoul-Henning Kamp static int
5195dfc91d7SLuigi Rizzo route_output(struct mbuf *m, struct socket *so)
520df8bae1dSRodney W. Grimes {
5215dfc91d7SLuigi Rizzo 	struct rt_msghdr *rtm = NULL;
5225dfc91d7SLuigi Rizzo 	struct rtentry *rt = NULL;
52378a82810SGarrett Wollman 	struct radix_node_head *rnh;
524df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
5250bebb544SHiroki Sato 	struct sockaddr_storage ss;
5263deb3649SAlexander V. Chernikov #ifdef INET6
5276bbfef90SHiroki Sato 	struct sockaddr_in6 *sin6;
5280bebb544SHiroki Sato 	int i, rti_need_deembed = 0;
5296bbfef90SHiroki Sato #endif
530f2e5eb36SAlexander V. Chernikov 	int alloc_len = 0, len, error = 0, fibnum;
5315dfc91d7SLuigi Rizzo 	struct ifnet *ifp = NULL;
532413628a7SBjoern A. Zeeb 	union sockaddr_union saun;
5333ca1a2d6SMax Laier 	sa_family_t saf = AF_UNSPEC;
53492c227afSAlexander V. Chernikov 	struct rawcb *rp = NULL;
535f2e5eb36SAlexander V. Chernikov 	struct walkarg w;
536df8bae1dSRodney W. Grimes 
537f5d9a696SAlexander V. Chernikov 	fibnum = so->so_fibnum;
538f5d9a696SAlexander V. Chernikov 
539df8bae1dSRodney W. Grimes #define senderr(e) { error = e; goto flush;}
5405dfc91d7SLuigi Rizzo 	if (m == NULL || ((m->m_len < sizeof(long)) &&
5415dfc91d7SLuigi Rizzo 		       (m = m_pullup(m, sizeof(long))) == NULL))
542df8bae1dSRodney W. Grimes 		return (ENOBUFS);
543df8bae1dSRodney W. Grimes 	if ((m->m_flags & M_PKTHDR) == 0)
544df8bae1dSRodney W. Grimes 		panic("route_output");
545df8bae1dSRodney W. Grimes 	len = m->m_pkthdr.len;
546df8bae1dSRodney W. Grimes 	if (len < sizeof(*rtm) ||
547f1fcb552SAlexander V. Chernikov 	    len != mtod(m, struct rt_msghdr *)->rtm_msglen)
548df8bae1dSRodney W. Grimes 		senderr(EINVAL);
549f1fcb552SAlexander V. Chernikov 
550f2e5eb36SAlexander V. Chernikov 	/*
551f2e5eb36SAlexander V. Chernikov 	 * Most of current messages are in range 200-240 bytes,
552d9437c0fSAlexander V. Chernikov 	 * minimize possible re-allocation on reply using larger size
	 * buffer aligned on 1k boundary.
554f2e5eb36SAlexander V. Chernikov 	 */
555f2e5eb36SAlexander V. Chernikov 	alloc_len = roundup2(len, 1024);
556d9437c0fSAlexander V. Chernikov 	if ((rtm = malloc(alloc_len, M_TEMP, M_NOWAIT)) == NULL)
557df8bae1dSRodney W. Grimes 		senderr(ENOBUFS);
558f2e5eb36SAlexander V. Chernikov 
559df8bae1dSRodney W. Grimes 	m_copydata(m, 0, len, (caddr_t)rtm);
560f1fcb552SAlexander V. Chernikov 	bzero(&info, sizeof(info));
561f2e5eb36SAlexander V. Chernikov 	bzero(&w, sizeof(w));
562f1fcb552SAlexander V. Chernikov 
563df8bae1dSRodney W. Grimes 	if (rtm->rtm_version != RTM_VERSION) {
564f1fcb552SAlexander V. Chernikov 		/* Do not touch message since format is unknown */
565f2e5eb36SAlexander V. Chernikov 		free(rtm, M_TEMP);
566f1fcb552SAlexander V. Chernikov 		rtm = NULL;
567df8bae1dSRodney W. Grimes 		senderr(EPROTONOSUPPORT);
568df8bae1dSRodney W. Grimes 	}
569f1fcb552SAlexander V. Chernikov 
570f1fcb552SAlexander V. Chernikov 	/*
571f1fcb552SAlexander V. Chernikov 	 * Starting from here, it is possible
572f1fcb552SAlexander V. Chernikov 	 * to alter original message and insert
573f1fcb552SAlexander V. Chernikov 	 * caller PID and error value.
574f1fcb552SAlexander V. Chernikov 	 */
575f1fcb552SAlexander V. Chernikov 
576df8bae1dSRodney W. Grimes 	rtm->rtm_pid = curproc->p_pid;
577df8bae1dSRodney W. Grimes 	info.rti_addrs = rtm->rtm_addrs;
5780fb9298dSAlexander V. Chernikov 
5790fb9298dSAlexander V. Chernikov 	info.rti_mflags = rtm->rtm_inits;
5800fb9298dSAlexander V. Chernikov 	info.rti_rmx = &rtm->rtm_rmx;
5810fb9298dSAlexander V. Chernikov 
5820bebb544SHiroki Sato 	/*
5830bebb544SHiroki Sato 	 * rt_xaddrs() performs s6_addr[2] := sin6_scope_id for AF_INET6
5840bebb544SHiroki Sato 	 * link-local address because rtrequest requires addresses with
5850bebb544SHiroki Sato 	 * embedded scope id.
5860bebb544SHiroki Sato 	 */
587f1fcb552SAlexander V. Chernikov 	if (rt_xaddrs((caddr_t)(rtm + 1), len + (caddr_t)rtm, &info))
588076d0761SJulian Elischer 		senderr(EINVAL);
589f1fcb552SAlexander V. Chernikov 
5908071913dSRuslan Ermilov 	info.rti_flags = rtm->rtm_flags;
5915dfc91d7SLuigi Rizzo 	if (info.rti_info[RTAX_DST] == NULL ||
592becc44d7SSam Leffler 	    info.rti_info[RTAX_DST]->sa_family >= AF_MAX ||
5935dfc91d7SLuigi Rizzo 	    (info.rti_info[RTAX_GATEWAY] != NULL &&
594becc44d7SSam Leffler 	     info.rti_info[RTAX_GATEWAY]->sa_family >= AF_MAX))
595df8bae1dSRodney W. Grimes 		senderr(EINVAL);
5963ca1a2d6SMax Laier 	saf = info.rti_info[RTAX_DST]->sa_family;
597162c0b2eSRuslan Ermilov 	/*
598162c0b2eSRuslan Ermilov 	 * Verify that the caller has the appropriate privilege; RTM_GET
599162c0b2eSRuslan Ermilov 	 * is the only operation the non-superuser is allowed.
600162c0b2eSRuslan Ermilov 	 */
601acd3428bSRobert Watson 	if (rtm->rtm_type != RTM_GET) {
602acd3428bSRobert Watson 		error = priv_check(curthread, PRIV_NET_ROUTE);
603acd3428bSRobert Watson 		if (error)
604dadb6c3bSRuslan Ermilov 			senderr(error);
605acd3428bSRobert Watson 	}
606162c0b2eSRuslan Ermilov 
6079231d35fSQing Li 	/*
6089231d35fSQing Li 	 * The given gateway address may be an interface address.
6099231d35fSQing Li 	 * For example, issuing a "route change" command on a route
6109231d35fSQing Li 	 * entry that was created from a tunnel, and the gateway
6119231d35fSQing Li 	 * address given is the local end point. In this case the
6129231d35fSQing Li 	 * RTF_GATEWAY flag must be cleared or the destination will
6139231d35fSQing Li 	 * not be reachable even though there is no error message.
6149231d35fSQing Li 	 */
6159231d35fSQing Li 	if (info.rti_info[RTAX_GATEWAY] != NULL &&
6169231d35fSQing Li 	    info.rti_info[RTAX_GATEWAY]->sa_family != AF_LINK) {
6179231d35fSQing Li 		struct route gw_ro;
6189231d35fSQing Li 
6199231d35fSQing Li 		bzero(&gw_ro, sizeof(gw_ro));
6209231d35fSQing Li 		gw_ro.ro_dst = *info.rti_info[RTAX_GATEWAY];
621773aa053SAlexander V. Chernikov 		rtalloc_ign_fib(&gw_ro, 0, fibnum);
6229231d35fSQing Li 		/*
6239231d35fSQing Li 		 * A host route through the loopback interface is
6249231d35fSQing Li 		 * installed for each interface address. In pre 8.0
6259231d35fSQing Li 		 * releases the interface address of a PPP link type
6269231d35fSQing Li 		 * is not reachable locally. This behavior is fixed as
6279231d35fSQing Li 		 * part of the new L2/L3 redesign and rewrite work. The
6289231d35fSQing Li 		 * signature of this interface address route is the
6299231d35fSQing Li 		 * AF_LINK sa_family type of the rt_gateway, and the
6309231d35fSQing Li 		 * rt_ifp has the IFF_LOOPBACK flag set.
6319231d35fSQing Li 		 */
6329231d35fSQing Li 		if (gw_ro.ro_rt != NULL &&
6339231d35fSQing Li 		    gw_ro.ro_rt->rt_gateway->sa_family == AF_LINK &&
634f672f56fSQing Li 		    gw_ro.ro_rt->rt_ifp->if_flags & IFF_LOOPBACK) {
6359231d35fSQing Li 			info.rti_flags &= ~RTF_GATEWAY;
636f672f56fSQing Li 			info.rti_flags |= RTF_GWFLAG_COMPAT;
637f672f56fSQing Li 		}
6389231d35fSQing Li 		if (gw_ro.ro_rt != NULL)
6399231d35fSQing Li 			RTFREE(gw_ro.ro_rt);
6409231d35fSQing Li 	}
6419231d35fSQing Li 
642df8bae1dSRodney W. Grimes 	switch (rtm->rtm_type) {
643becc44d7SSam Leffler 		struct rtentry *saved_nrt;
644df8bae1dSRodney W. Grimes 
645df8bae1dSRodney W. Grimes 	case RTM_ADD:
646c77462ddSAlexander V. Chernikov 	case RTM_CHANGE:
6475dfc91d7SLuigi Rizzo 		if (info.rti_info[RTAX_GATEWAY] == NULL)
648df8bae1dSRodney W. Grimes 			senderr(EINVAL);
6495dfc91d7SLuigi Rizzo 		saved_nrt = NULL;
6508eca593cSQing Li 
6516e6b3f7cSQing Li 		/* support for new ARP code */
6528eca593cSQing Li 		if (info.rti_info[RTAX_GATEWAY]->sa_family == AF_LINK &&
6538eca593cSQing Li 		    (rtm->rtm_flags & RTF_LLDATA) != 0) {
6546e6b3f7cSQing Li 			error = lla_rt_output(rtm, &info);
6550bebb544SHiroki Sato #ifdef INET6
6560bebb544SHiroki Sato 			if (error == 0)
6570bebb544SHiroki Sato 				rti_need_deembed = (V_deembed_scopeid) ? 1 : 0;
6580bebb544SHiroki Sato #endif
6596e6b3f7cSQing Li 			break;
6606e6b3f7cSQing Li 		}
661c77462ddSAlexander V. Chernikov 		error = rtrequest1_fib(rtm->rtm_type, &info, &saved_nrt,
662773aa053SAlexander V. Chernikov 		    fibnum);
663c77462ddSAlexander V. Chernikov 		if (error == 0 && saved_nrt != NULL) {
6640bebb544SHiroki Sato #ifdef INET6
6650bebb544SHiroki Sato 			rti_need_deembed = (V_deembed_scopeid) ? 1 : 0;
6660bebb544SHiroki Sato #endif
667d1dd20beSSam Leffler 			RT_LOCK(saved_nrt);
66822cafcf0SAndre Oppermann 			rtm->rtm_index = saved_nrt->rt_ifp->if_index;
6697138d65cSSam Leffler 			RT_REMREF(saved_nrt);
670d1dd20beSSam Leffler 			RT_UNLOCK(saved_nrt);
671df8bae1dSRodney W. Grimes 		}
672df8bae1dSRodney W. Grimes 		break;
673df8bae1dSRodney W. Grimes 
674df8bae1dSRodney W. Grimes 	case RTM_DELETE:
6755dfc91d7SLuigi Rizzo 		saved_nrt = NULL;
6766e6b3f7cSQing Li 		/* support for new ARP code */
6776e6b3f7cSQing Li 		if (info.rti_info[RTAX_GATEWAY] &&
6788eca593cSQing Li 		    (info.rti_info[RTAX_GATEWAY]->sa_family == AF_LINK) &&
6798eca593cSQing Li 		    (rtm->rtm_flags & RTF_LLDATA) != 0) {
6806e6b3f7cSQing Li 			error = lla_rt_output(rtm, &info);
6810bebb544SHiroki Sato #ifdef INET6
6820bebb544SHiroki Sato 			if (error == 0)
6830bebb544SHiroki Sato 				rti_need_deembed = (V_deembed_scopeid) ? 1 : 0;
6840bebb544SHiroki Sato #endif
6856e6b3f7cSQing Li 			break;
6866e6b3f7cSQing Li 		}
687773aa053SAlexander V. Chernikov 		error = rtrequest1_fib(RTM_DELETE, &info, &saved_nrt, fibnum);
68878a82810SGarrett Wollman 		if (error == 0) {
689d1dd20beSSam Leffler 			RT_LOCK(saved_nrt);
69071eba915SRuslan Ermilov 			rt = saved_nrt;
69178a82810SGarrett Wollman 			goto report;
69278a82810SGarrett Wollman 		}
6930bebb544SHiroki Sato #ifdef INET6
6940bebb544SHiroki Sato 		/* rt_msg2() will not be used when RTM_DELETE fails. */
6950bebb544SHiroki Sato 		rti_need_deembed = (V_deembed_scopeid) ? 1 : 0;
6960bebb544SHiroki Sato #endif
697df8bae1dSRodney W. Grimes 		break;
698df8bae1dSRodney W. Grimes 
699df8bae1dSRodney W. Grimes 	case RTM_GET:
700773aa053SAlexander V. Chernikov 		rnh = rt_tables_get_rnh(fibnum, saf);
7015dfc91d7SLuigi Rizzo 		if (rnh == NULL)
70278a82810SGarrett Wollman 			senderr(EAFNOSUPPORT);
7035a2f4cbdSAlexander V. Chernikov 
7043120b9d4SKip Macy 		RADIX_NODE_HEAD_RLOCK(rnh);
7055a2f4cbdSAlexander V. Chernikov 
7065a2f4cbdSAlexander V. Chernikov 		if (info.rti_info[RTAX_NETMASK] == NULL &&
7075a2f4cbdSAlexander V. Chernikov 		    rtm->rtm_type == RTM_GET) {
7085a2f4cbdSAlexander V. Chernikov 			/*
7095a2f4cbdSAlexander V. Chernikov 			 * Provide longest prefix match for
7105a2f4cbdSAlexander V. Chernikov 			 * address lookup (no mask).
7115a2f4cbdSAlexander V. Chernikov 			 * 'route -n get addr'
7125a2f4cbdSAlexander V. Chernikov 			 */
7135a2f4cbdSAlexander V. Chernikov 			rt = (struct rtentry *) rnh->rnh_matchaddr(
7145a2f4cbdSAlexander V. Chernikov 			    info.rti_info[RTAX_DST], rnh);
7155a2f4cbdSAlexander V. Chernikov 		} else
7165a2f4cbdSAlexander V. Chernikov 			rt = (struct rtentry *) rnh->rnh_lookup(
7175a2f4cbdSAlexander V. Chernikov 			    info.rti_info[RTAX_DST],
718becc44d7SSam Leffler 			    info.rti_info[RTAX_NETMASK], rnh);
7195a2f4cbdSAlexander V. Chernikov 
7205a2f4cbdSAlexander V. Chernikov 		if (rt == NULL) {
7213120b9d4SKip Macy 			RADIX_NODE_HEAD_RUNLOCK(rnh);
722df8bae1dSRodney W. Grimes 			senderr(ESRCH);
72379188861SGleb Smirnoff 		}
724e440aed9SQing Li #ifdef RADIX_MPATH
725e440aed9SQing Li 		/*
726e440aed9SQing Li 		 * for RTM_CHANGE/LOCK, if we got multipath routes,
727e440aed9SQing Li 		 * we require users to specify a matching RTAX_GATEWAY.
728e440aed9SQing Li 		 *
729e440aed9SQing Li 		 * for RTM_GET, gate is optional even with multipath.
730e440aed9SQing Li 		 * if gate == NULL the first match is returned.
731e440aed9SQing Li 		 * (no need to call rt_mpath_matchgate if gate == NULL)
732e440aed9SQing Li 		 */
733e440aed9SQing Li 		if (rn_mpath_capable(rnh) &&
734e440aed9SQing Li 		    (rtm->rtm_type != RTM_GET || info.rti_info[RTAX_GATEWAY])) {
735e440aed9SQing Li 			rt = rt_mpath_matchgate(rt, info.rti_info[RTAX_GATEWAY]);
736e440aed9SQing Li 			if (!rt) {
7373120b9d4SKip Macy 				RADIX_NODE_HEAD_RUNLOCK(rnh);
738e440aed9SQing Li 				senderr(ESRCH);
739e440aed9SQing Li 			}
740e440aed9SQing Li 		}
741e440aed9SQing Li #endif
742c7ab6602SQing Li 		/*
743c7ab6602SQing Li 		 * If performing proxied L2 entry insertion, and
744c7ab6602SQing Li 		 * the actual PPP host entry is found, perform
745c7ab6602SQing Li 		 * another search to retrieve the prefix route of
746c7ab6602SQing Li 		 * the local end point of the PPP link.
747c7ab6602SQing Li 		 */
7480ed6142bSQing Li 		if (rtm->rtm_flags & RTF_ANNOUNCE) {
749c7ab6602SQing Li 			struct sockaddr laddr;
7500ed6142bSQing Li 
7510ed6142bSQing Li 			if (rt->rt_ifp != NULL &&
7520ed6142bSQing Li 			    rt->rt_ifp->if_type == IFT_PROPVIRTUAL) {
7530ed6142bSQing Li 				struct ifaddr *ifa;
7540ed6142bSQing Li 
7550cfee0c2SAlan Somers 				ifa = ifa_ifwithnet(info.rti_info[RTAX_DST], 1,
7560cfee0c2SAlan Somers 				    RT_DEFAULT_FIB);
7570ed6142bSQing Li 				if (ifa != NULL)
7580ed6142bSQing Li 					rt_maskedcopy(ifa->ifa_addr,
7590ed6142bSQing Li 						      &laddr,
7600ed6142bSQing Li 						      ifa->ifa_netmask);
7610ed6142bSQing Li 			} else
762c7ab6602SQing Li 				rt_maskedcopy(rt->rt_ifa->ifa_addr,
763c7ab6602SQing Li 					      &laddr,
764c7ab6602SQing Li 					      rt->rt_ifa->ifa_netmask);
765c7ab6602SQing Li 			/*
766c7ab6602SQing Li 			 * refactor rt and no lock operation necessary
767c7ab6602SQing Li 			 */
768c7ab6602SQing Li 			rt = (struct rtentry *)rnh->rnh_matchaddr(&laddr, rnh);
769c7ab6602SQing Li 			if (rt == NULL) {
770c7ab6602SQing Li 				RADIX_NODE_HEAD_RUNLOCK(rnh);
771c7ab6602SQing Li 				senderr(ESRCH);
772c7ab6602SQing Li 			}
773c7ab6602SQing Li 		}
774d1dd20beSSam Leffler 		RT_LOCK(rt);
7757138d65cSSam Leffler 		RT_ADDREF(rt);
7763120b9d4SKip Macy 		RADIX_NODE_HEAD_RUNLOCK(rnh);
777956b0b65SJeffrey Hsu 
77878a82810SGarrett Wollman report:
779d1dd20beSSam Leffler 		RT_LOCK_ASSERT(rt);
780b89e82ddSJamie Gritton 		if ((rt->rt_flags & RTF_HOST) == 0
781de0bd6f7SBjoern A. Zeeb 		    ? jailed_without_vnet(curthread->td_ucred)
782b89e82ddSJamie Gritton 		    : prison_if(curthread->td_ucred,
783b89e82ddSJamie Gritton 		    rt_key(rt)) != 0) {
784813dd6aeSBjoern A. Zeeb 			RT_UNLOCK(rt);
785813dd6aeSBjoern A. Zeeb 			senderr(ESRCH);
786813dd6aeSBjoern A. Zeeb 		}
787becc44d7SSam Leffler 		info.rti_info[RTAX_DST] = rt_key(rt);
788becc44d7SSam Leffler 		info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
7893deb3649SAlexander V. Chernikov 		info.rti_info[RTAX_NETMASK] = rtsock_fix_netmask(rt_key(rt),
7903deb3649SAlexander V. Chernikov 		    rt_mask(rt), &ss);
7916e6b3f7cSQing Li 		info.rti_info[RTAX_GENMASK] = 0;
792df8bae1dSRodney W. Grimes 		if (rtm->rtm_addrs & (RTA_IFP | RTA_IFA)) {
793df440948SPoul-Henning Kamp 			ifp = rt->rt_ifp;
794df440948SPoul-Henning Kamp 			if (ifp) {
7959b98ee2cSLuigi Rizzo 				info.rti_info[RTAX_IFP] =
7964a0d6638SRuslan Ermilov 				    ifp->if_addr->ifa_addr;
7979c79d243SJamie Gritton 				error = rtm_get_jailed(&info, ifp, rt,
7989c79d243SJamie Gritton 				    &saun, curthread->td_ucred);
799413628a7SBjoern A. Zeeb 				if (error != 0) {
800413628a7SBjoern A. Zeeb 					RT_UNLOCK(rt);
8019c79d243SJamie Gritton 					senderr(error);
802413628a7SBjoern A. Zeeb 				}
80328070a0eSRuslan Ermilov 				if (ifp->if_flags & IFF_POINTOPOINT)
804becc44d7SSam Leffler 					info.rti_info[RTAX_BRD] =
805becc44d7SSam Leffler 					    rt->rt_ifa->ifa_dstaddr;
806df8bae1dSRodney W. Grimes 				rtm->rtm_index = ifp->if_index;
807df8bae1dSRodney W. Grimes 			} else {
8085dfc91d7SLuigi Rizzo 				info.rti_info[RTAX_IFP] = NULL;
8095dfc91d7SLuigi Rizzo 				info.rti_info[RTAX_IFA] = NULL;
810df8bae1dSRodney W. Grimes 			}
81125029d6cSHartmut Brandt 		} else if ((ifp = rt->rt_ifp) != NULL) {
81225029d6cSHartmut Brandt 			rtm->rtm_index = ifp->if_index;
813df8bae1dSRodney W. Grimes 		}
814f2e5eb36SAlexander V. Chernikov 
815f2e5eb36SAlexander V. Chernikov 		/* Check if we need to realloc storage */
816f2e5eb36SAlexander V. Chernikov 		rtsock_msg_buffer(rtm->rtm_type, &info, NULL, &len);
817f2e5eb36SAlexander V. Chernikov 		if (len > alloc_len) {
818df8bae1dSRodney W. Grimes 			struct rt_msghdr *new_rtm;
819f2e5eb36SAlexander V. Chernikov 			new_rtm = malloc(len, M_TEMP, M_NOWAIT);
8205dfc91d7SLuigi Rizzo 			if (new_rtm == NULL) {
821d1dd20beSSam Leffler 				RT_UNLOCK(rt);
822df8bae1dSRodney W. Grimes 				senderr(ENOBUFS);
823becc44d7SSam Leffler 			}
8246b96f1afSLuigi Rizzo 			bcopy(rtm, new_rtm, rtm->rtm_msglen);
825f2e5eb36SAlexander V. Chernikov 			free(rtm, M_TEMP);
826f2e5eb36SAlexander V. Chernikov 			rtm = new_rtm;
827f2e5eb36SAlexander V. Chernikov 			alloc_len = len;
828df8bae1dSRodney W. Grimes 		}
829f2e5eb36SAlexander V. Chernikov 
830f2e5eb36SAlexander V. Chernikov 		w.w_tmem = (caddr_t)rtm;
831f2e5eb36SAlexander V. Chernikov 		w.w_tmemsize = alloc_len;
832f2e5eb36SAlexander V. Chernikov 		rtsock_msg_buffer(rtm->rtm_type, &info, &w, &len);
833f2e5eb36SAlexander V. Chernikov 
834f672f56fSQing Li 		if (rt->rt_flags & RTF_GWFLAG_COMPAT)
835f672f56fSQing Li 			rtm->rtm_flags = RTF_GATEWAY |
836f672f56fSQing Li 				(rt->rt_flags & ~RTF_GWFLAG_COMPAT);
837f672f56fSQing Li 		else
838df8bae1dSRodney W. Grimes 			rtm->rtm_flags = rt->rt_flags;
839e3a7aa6fSGleb Smirnoff 		rt_getmetrics(rt, &rtm->rtm_rmx);
840df8bae1dSRodney W. Grimes 		rtm->rtm_addrs = info.rti_addrs;
841df8bae1dSRodney W. Grimes 
842d1dd20beSSam Leffler 		RT_UNLOCK(rt);
843df8bae1dSRodney W. Grimes 		break;
844df8bae1dSRodney W. Grimes 
845df8bae1dSRodney W. Grimes 	default:
846df8bae1dSRodney W. Grimes 		senderr(EOPNOTSUPP);
847df8bae1dSRodney W. Grimes 	}
848df8bae1dSRodney W. Grimes 
849df8bae1dSRodney W. Grimes flush:
85092c227afSAlexander V. Chernikov 	if (rt != NULL)
851becc44d7SSam Leffler 		RTFREE(rt);
852df8bae1dSRodney W. Grimes 	/*
853df8bae1dSRodney W. Grimes 	 * Check to see if we don't want our own messages.
854df8bae1dSRodney W. Grimes 	 */
855df8bae1dSRodney W. Grimes 	if ((so->so_options & SO_USELOOPBACK) == 0) {
856c5d4eab6SMarko Zec 		if (V_route_cb.any_count <= 1) {
857d9437c0fSAlexander V. Chernikov 			if (rtm != NULL)
858f2e5eb36SAlexander V. Chernikov 				free(rtm, M_TEMP);
859df8bae1dSRodney W. Grimes 			m_freem(m);
860df8bae1dSRodney W. Grimes 			return (error);
861df8bae1dSRodney W. Grimes 		}
862df8bae1dSRodney W. Grimes 		/* There is another listener, so construct message */
863df8bae1dSRodney W. Grimes 		rp = sotorawcb(so);
8644cc20ab1SSeigo Tanimura 	}
86592c227afSAlexander V. Chernikov 
8662277c5e5SAlexander V. Chernikov 	if (rtm != NULL) {
8670bebb544SHiroki Sato #ifdef INET6
8680bebb544SHiroki Sato 		if (rti_need_deembed) {
8690bebb544SHiroki Sato 			/* sin6_scope_id is recovered before sending rtm. */
8700bebb544SHiroki Sato 			sin6 = (struct sockaddr_in6 *)&ss;
87112bdf23aSHiroki Sato 			for (i = 0; i < RTAX_MAX; i++) {
8720bebb544SHiroki Sato 				if (info.rti_info[i] == NULL)
8730bebb544SHiroki Sato 					continue;
8740bebb544SHiroki Sato 				if (info.rti_info[i]->sa_family != AF_INET6)
8750bebb544SHiroki Sato 					continue;
8760bebb544SHiroki Sato 				bcopy(info.rti_info[i], sin6, sizeof(*sin6));
8770bebb544SHiroki Sato 				if (sa6_recoverscope(sin6) == 0)
8780bebb544SHiroki Sato 					bcopy(sin6, info.rti_info[i],
8790bebb544SHiroki Sato 						    sizeof(*sin6));
8800bebb544SHiroki Sato 			}
8810bebb544SHiroki Sato 		}
8820bebb544SHiroki Sato #endif
88392c227afSAlexander V. Chernikov 		if (error != 0)
88492c227afSAlexander V. Chernikov 			rtm->rtm_errno = error;
88592c227afSAlexander V. Chernikov 		else
88692c227afSAlexander V. Chernikov 			rtm->rtm_flags |= RTF_DONE;
88792c227afSAlexander V. Chernikov 
888df8bae1dSRodney W. Grimes 		m_copyback(m, 0, rtm->rtm_msglen, (caddr_t)rtm);
88903311056SHajimu UMEMOTO 		if (m->m_pkthdr.len < rtm->rtm_msglen) {
89003311056SHajimu UMEMOTO 			m_freem(m);
89103311056SHajimu UMEMOTO 			m = NULL;
89203311056SHajimu UMEMOTO 		} else if (m->m_pkthdr.len > rtm->rtm_msglen)
89303311056SHajimu UMEMOTO 			m_adj(m, rtm->rtm_msglen - m->m_pkthdr.len);
894f2e5eb36SAlexander V. Chernikov 
895f2e5eb36SAlexander V. Chernikov 		free(rtm, M_TEMP);
896df8bae1dSRodney W. Grimes 	}
89792c227afSAlexander V. Chernikov 	if (m != NULL) {
898773aa053SAlexander V. Chernikov 		M_SETFIB(m, fibnum);
899528737fdSBjoern A. Zeeb 		m->m_flags |= RTS_FILTER_FIB;
900becc44d7SSam Leffler 		if (rp) {
901becc44d7SSam Leffler 			/*
902becc44d7SSam Leffler 			 * XXX insure we don't get a copy by
903becc44d7SSam Leffler 			 * invalidating our protocol
904becc44d7SSam Leffler 			 */
905becc44d7SSam Leffler 			unsigned short family = rp->rcb_proto.sp_family;
906becc44d7SSam Leffler 			rp->rcb_proto.sp_family = 0;
9073ca1a2d6SMax Laier 			rt_dispatch(m, saf);
908becc44d7SSam Leffler 			rp->rcb_proto.sp_family = family;
909becc44d7SSam Leffler 		} else
9103ca1a2d6SMax Laier 			rt_dispatch(m, saf);
911becc44d7SSam Leffler 	}
91292c227afSAlexander V. Chernikov 
913df8bae1dSRodney W. Grimes 	return (error);
914df8bae1dSRodney W. Grimes }
915df8bae1dSRodney W. Grimes 
91652041295SPoul-Henning Kamp static void
917e3a7aa6fSGleb Smirnoff rt_getmetrics(const struct rtentry *rt, struct rt_metrics *out)
91897d8d152SAndre Oppermann {
919e3a7aa6fSGleb Smirnoff 
92097d8d152SAndre Oppermann 	bzero(out, sizeof(*out));
921e3a7aa6fSGleb Smirnoff 	out->rmx_mtu = rt->rt_mtu;
922e3a7aa6fSGleb Smirnoff 	out->rmx_weight = rt->rt_weight;
923e3a7aa6fSGleb Smirnoff 	out->rmx_pksent = counter_u64_fetch(rt->rt_pksent);
924e27c3f48SOleg Bulyzhin 	/* Kernel -> userland timebase conversion. */
925e3a7aa6fSGleb Smirnoff 	out->rmx_expire = rt->rt_expire ?
926e3a7aa6fSGleb Smirnoff 	    rt->rt_expire - time_uptime + time_second : 0;
92797d8d152SAndre Oppermann }
92897d8d152SAndre Oppermann 
9297f33a738SJulian Elischer /*
9307f33a738SJulian Elischer  * Extract the addresses of the passed sockaddrs.
9317f33a738SJulian Elischer  * Do a little sanity checking so as to avoid bad memory references.
932076d0761SJulian Elischer  * This data is derived straight from userland.
9337f33a738SJulian Elischer  */
934076d0761SJulian Elischer static int
935becc44d7SSam Leffler rt_xaddrs(caddr_t cp, caddr_t cplim, struct rt_addrinfo *rtinfo)
936df8bae1dSRodney W. Grimes {
937e74642dfSLuigi Rizzo 	struct sockaddr *sa;
938e74642dfSLuigi Rizzo 	int i;
939df8bae1dSRodney W. Grimes 
940becc44d7SSam Leffler 	for (i = 0; i < RTAX_MAX && cp < cplim; i++) {
941df8bae1dSRodney W. Grimes 		if ((rtinfo->rti_addrs & (1 << i)) == 0)
942df8bae1dSRodney W. Grimes 			continue;
943ff6d0a59SJulian Elischer 		sa = (struct sockaddr *)cp;
9447f33a738SJulian Elischer 		/*
945076d0761SJulian Elischer 		 * It won't fit.
9467f33a738SJulian Elischer 		 */
947becc44d7SSam Leffler 		if (cp + sa->sa_len > cplim)
948076d0761SJulian Elischer 			return (EINVAL);
9497f33a738SJulian Elischer 		/*
9507f33a738SJulian Elischer 		 * there are no more.. quit now
9517f33a738SJulian Elischer 		 * If there are more bits, they are in error.
9527f33a738SJulian Elischer 		 * I've seen this. route(1) can evidently generate these.
9537f33a738SJulian Elischer 		 * This causes kernel to core dump.
954076d0761SJulian Elischer 		 * for compatibility, If we see this, point to a safe address.
9557f33a738SJulian Elischer 		 */
956076d0761SJulian Elischer 		if (sa->sa_len == 0) {
957076d0761SJulian Elischer 			rtinfo->rti_info[i] = &sa_zero;
958076d0761SJulian Elischer 			return (0); /* should be EINVAL but for compat */
959df8bae1dSRodney W. Grimes 		}
960076d0761SJulian Elischer 		/* accept it */
9610bebb544SHiroki Sato #ifdef INET6
9620bebb544SHiroki Sato 		if (sa->sa_family == AF_INET6)
9630bebb544SHiroki Sato 			sa6_embedscope((struct sockaddr_in6 *)sa,
9640bebb544SHiroki Sato 			    V_ip6_use_defzone);
9650bebb544SHiroki Sato #endif
966076d0761SJulian Elischer 		rtinfo->rti_info[i] = sa;
967e74642dfSLuigi Rizzo 		cp += SA_SIZE(sa);
968076d0761SJulian Elischer 	}
969076d0761SJulian Elischer 	return (0);
970df8bae1dSRodney W. Grimes }
971df8bae1dSRodney W. Grimes 
9726d076ae8SBjoern A. Zeeb /*
9733deb3649SAlexander V. Chernikov  * Fill in @dmask with valid netmask leaving original @smask
9743deb3649SAlexander V. Chernikov  * intact. Mostly used with radix netmasks.
9753deb3649SAlexander V. Chernikov  */
9763deb3649SAlexander V. Chernikov static struct sockaddr *
9773deb3649SAlexander V. Chernikov rtsock_fix_netmask(struct sockaddr *dst, struct sockaddr *smask,
9783deb3649SAlexander V. Chernikov     struct sockaddr_storage *dmask)
9793deb3649SAlexander V. Chernikov {
9803deb3649SAlexander V. Chernikov 	if (dst == NULL || smask == NULL)
9813deb3649SAlexander V. Chernikov 		return (NULL);
9823deb3649SAlexander V. Chernikov 
9833deb3649SAlexander V. Chernikov 	memset(dmask, 0, dst->sa_len);
9843deb3649SAlexander V. Chernikov 	memcpy(dmask, smask, smask->sa_len);
9853deb3649SAlexander V. Chernikov 	dmask->ss_len = dst->sa_len;
9863deb3649SAlexander V. Chernikov 	dmask->ss_family = dst->sa_family;
9873deb3649SAlexander V. Chernikov 
9883deb3649SAlexander V. Chernikov 	return ((struct sockaddr *)dmask);
9893deb3649SAlexander V. Chernikov }
9903deb3649SAlexander V. Chernikov 
9913deb3649SAlexander V. Chernikov /*
992*6db47af4SAlexander V. Chernikov  * Writes information related to @rtinfo object to newly-allocated mbuf.
993*6db47af4SAlexander V. Chernikov  * Assumes MCLBYTES is enough to construct any message.
994*6db47af4SAlexander V. Chernikov  * Used for OS notifications of vaious events (if/ifa announces,etc)
995*6db47af4SAlexander V. Chernikov  *
996*6db47af4SAlexander V. Chernikov  * Returns allocated mbuf or NULL on failure.
9976d076ae8SBjoern A. Zeeb  */
998df8bae1dSRodney W. Grimes static struct mbuf *
999*6db47af4SAlexander V. Chernikov rtsock_msg_mbuf(int type, struct rt_addrinfo *rtinfo)
1000df8bae1dSRodney W. Grimes {
10015dfc91d7SLuigi Rizzo 	struct rt_msghdr *rtm;
10025dfc91d7SLuigi Rizzo 	struct mbuf *m;
10035dfc91d7SLuigi Rizzo 	int i;
10045dfc91d7SLuigi Rizzo 	struct sockaddr *sa;
10056bbfef90SHiroki Sato #ifdef INET6
10066bbfef90SHiroki Sato 	struct sockaddr_storage ss;
10076bbfef90SHiroki Sato 	struct sockaddr_in6 *sin6;
10086bbfef90SHiroki Sato #endif
1009df8bae1dSRodney W. Grimes 	int len, dlen;
1010df8bae1dSRodney W. Grimes 
1011df8bae1dSRodney W. Grimes 	switch (type) {
1012df8bae1dSRodney W. Grimes 
1013df8bae1dSRodney W. Grimes 	case RTM_DELADDR:
1014df8bae1dSRodney W. Grimes 	case RTM_NEWADDR:
1015df8bae1dSRodney W. Grimes 		len = sizeof(struct ifa_msghdr);
1016df8bae1dSRodney W. Grimes 		break;
1017df8bae1dSRodney W. Grimes 
1018477180fbSGarrett Wollman 	case RTM_DELMADDR:
1019477180fbSGarrett Wollman 	case RTM_NEWMADDR:
1020477180fbSGarrett Wollman 		len = sizeof(struct ifma_msghdr);
1021477180fbSGarrett Wollman 		break;
1022477180fbSGarrett Wollman 
1023df8bae1dSRodney W. Grimes 	case RTM_IFINFO:
1024df8bae1dSRodney W. Grimes 		len = sizeof(struct if_msghdr);
1025df8bae1dSRodney W. Grimes 		break;
1026df8bae1dSRodney W. Grimes 
10277b6edd04SRuslan Ermilov 	case RTM_IFANNOUNCE:
1028b83a279fSSam Leffler 	case RTM_IEEE80211:
10297b6edd04SRuslan Ermilov 		len = sizeof(struct if_announcemsghdr);
10307b6edd04SRuslan Ermilov 		break;
10317b6edd04SRuslan Ermilov 
1032df8bae1dSRodney W. Grimes 	default:
1033df8bae1dSRodney W. Grimes 		len = sizeof(struct rt_msghdr);
1034df8bae1dSRodney W. Grimes 	}
1035c69f77c3SGleb Smirnoff 
1036c69f77c3SGleb Smirnoff 	/* XXXGL: can we use MJUMPAGESIZE cluster here? */
1037c69f77c3SGleb Smirnoff 	KASSERT(len <= MCLBYTES, ("%s: message too big", __func__));
1038c69f77c3SGleb Smirnoff 	if (len > MHLEN)
1039c69f77c3SGleb Smirnoff 		m = m_getcl(M_NOWAIT, MT_DATA, M_PKTHDR);
1040c69f77c3SGleb Smirnoff 	else
1041eb1b1807SGleb Smirnoff 		m = m_gethdr(M_NOWAIT, MT_DATA);
10425dfc91d7SLuigi Rizzo 	if (m == NULL)
104333841545SHajimu UMEMOTO 		return (m);
1044c69f77c3SGleb Smirnoff 
1045df8bae1dSRodney W. Grimes 	m->m_pkthdr.len = m->m_len = len;
1046df8bae1dSRodney W. Grimes 	rtm = mtod(m, struct rt_msghdr *);
1047df8bae1dSRodney W. Grimes 	bzero((caddr_t)rtm, len);
1048df8bae1dSRodney W. Grimes 	for (i = 0; i < RTAX_MAX; i++) {
1049df8bae1dSRodney W. Grimes 		if ((sa = rtinfo->rti_info[i]) == NULL)
1050df8bae1dSRodney W. Grimes 			continue;
1051df8bae1dSRodney W. Grimes 		rtinfo->rti_addrs |= (1 << i);
1052e74642dfSLuigi Rizzo 		dlen = SA_SIZE(sa);
10536bbfef90SHiroki Sato #ifdef INET6
10545c9fa630SHiroki Sato 		if (V_deembed_scopeid && sa->sa_family == AF_INET6) {
10556bbfef90SHiroki Sato 			sin6 = (struct sockaddr_in6 *)&ss;
10566bbfef90SHiroki Sato 			bcopy(sa, sin6, sizeof(*sin6));
10576bbfef90SHiroki Sato 			if (sa6_recoverscope(sin6) == 0)
10586bbfef90SHiroki Sato 				sa = (struct sockaddr *)sin6;
10596bbfef90SHiroki Sato 		}
10606bbfef90SHiroki Sato #endif
1061df8bae1dSRodney W. Grimes 		m_copyback(m, len, dlen, (caddr_t)sa);
1062df8bae1dSRodney W. Grimes 		len += dlen;
1063df8bae1dSRodney W. Grimes 	}
1064df8bae1dSRodney W. Grimes 	if (m->m_pkthdr.len != len) {
1065df8bae1dSRodney W. Grimes 		m_freem(m);
1066df8bae1dSRodney W. Grimes 		return (NULL);
1067df8bae1dSRodney W. Grimes 	}
1068df8bae1dSRodney W. Grimes 	rtm->rtm_msglen = len;
1069df8bae1dSRodney W. Grimes 	rtm->rtm_version = RTM_VERSION;
1070df8bae1dSRodney W. Grimes 	rtm->rtm_type = type;
1071df8bae1dSRodney W. Grimes 	return (m);
1072df8bae1dSRodney W. Grimes }
1073df8bae1dSRodney W. Grimes 
10746d076ae8SBjoern A. Zeeb /*
1075f2e5eb36SAlexander V. Chernikov  * Writes information related to @rtinfo object to preallocated buffer.
1076f2e5eb36SAlexander V. Chernikov  * Stores needed size in @plen. If @w is NULL, calculates size without
1077f2e5eb36SAlexander V. Chernikov  * writing.
1078f2e5eb36SAlexander V. Chernikov  * Used for sysctl dumps and rtsock answers (RTM_DEL/RTM_GET) generation.
1079f2e5eb36SAlexander V. Chernikov  *
1080f2e5eb36SAlexander V. Chernikov  * Returns 0 on success.
1081f2e5eb36SAlexander V. Chernikov  *
10826d076ae8SBjoern A. Zeeb  */
1083df8bae1dSRodney W. Grimes static int
1084f2e5eb36SAlexander V. Chernikov rtsock_msg_buffer(int type, struct rt_addrinfo *rtinfo, struct walkarg *w, int *plen)
1085df8bae1dSRodney W. Grimes {
10865dfc91d7SLuigi Rizzo 	int i;
1087f2e5eb36SAlexander V. Chernikov 	int len, buflen = 0, dlen;
1088de46b2c6SAlexander V. Chernikov 	caddr_t cp = NULL;
1089f2e5eb36SAlexander V. Chernikov 	struct rt_msghdr *rtm = NULL;
10906bbfef90SHiroki Sato #ifdef INET6
10916bbfef90SHiroki Sato 	struct sockaddr_storage ss;
10926bbfef90SHiroki Sato 	struct sockaddr_in6 *sin6;
10936bbfef90SHiroki Sato #endif
1094df8bae1dSRodney W. Grimes 
1095df8bae1dSRodney W. Grimes 	switch (type) {
1096df8bae1dSRodney W. Grimes 
1097df8bae1dSRodney W. Grimes 	case RTM_DELADDR:
1098df8bae1dSRodney W. Grimes 	case RTM_NEWADDR:
10996d076ae8SBjoern A. Zeeb 		if (w != NULL && w->w_op == NET_RT_IFLISTL) {
11006d076ae8SBjoern A. Zeeb #ifdef COMPAT_FREEBSD32
11016d076ae8SBjoern A. Zeeb 			if (w->w_req->flags & SCTL_MASK32)
11026d076ae8SBjoern A. Zeeb 				len = sizeof(struct ifa_msghdrl32);
11036d076ae8SBjoern A. Zeeb 			else
11046d076ae8SBjoern A. Zeeb #endif
11056d076ae8SBjoern A. Zeeb 				len = sizeof(struct ifa_msghdrl);
11066d076ae8SBjoern A. Zeeb 		} else
1107df8bae1dSRodney W. Grimes 			len = sizeof(struct ifa_msghdr);
1108df8bae1dSRodney W. Grimes 		break;
1109df8bae1dSRodney W. Grimes 
1110df8bae1dSRodney W. Grimes 	case RTM_IFINFO:
1111427a928aSKonstantin Belousov #ifdef COMPAT_FREEBSD32
1112427a928aSKonstantin Belousov 		if (w != NULL && w->w_req->flags & SCTL_MASK32) {
11136d076ae8SBjoern A. Zeeb 			if (w->w_op == NET_RT_IFLISTL)
11146d076ae8SBjoern A. Zeeb 				len = sizeof(struct if_msghdrl32);
11156d076ae8SBjoern A. Zeeb 			else
1116427a928aSKonstantin Belousov 				len = sizeof(struct if_msghdr32);
1117427a928aSKonstantin Belousov 			break;
1118427a928aSKonstantin Belousov 		}
1119427a928aSKonstantin Belousov #endif
11206d076ae8SBjoern A. Zeeb 		if (w != NULL && w->w_op == NET_RT_IFLISTL)
11216d076ae8SBjoern A. Zeeb 			len = sizeof(struct if_msghdrl);
11226d076ae8SBjoern A. Zeeb 		else
1123df8bae1dSRodney W. Grimes 			len = sizeof(struct if_msghdr);
1124df8bae1dSRodney W. Grimes 		break;
1125df8bae1dSRodney W. Grimes 
112605b2efe0SBruce M Simpson 	case RTM_NEWMADDR:
112705b2efe0SBruce M Simpson 		len = sizeof(struct ifma_msghdr);
112805b2efe0SBruce M Simpson 		break;
112905b2efe0SBruce M Simpson 
1130df8bae1dSRodney W. Grimes 	default:
1131df8bae1dSRodney W. Grimes 		len = sizeof(struct rt_msghdr);
1132df8bae1dSRodney W. Grimes 	}
1133f2e5eb36SAlexander V. Chernikov 
1134f2e5eb36SAlexander V. Chernikov 	if (w != NULL) {
1135f2e5eb36SAlexander V. Chernikov 		rtm = (struct rt_msghdr *)w->w_tmem;
1136f2e5eb36SAlexander V. Chernikov 		buflen = w->w_tmemsize - len;
1137f2e5eb36SAlexander V. Chernikov 		cp = (caddr_t)w->w_tmem + len;
1138f2e5eb36SAlexander V. Chernikov 	}
1139f2e5eb36SAlexander V. Chernikov 
1140f2e5eb36SAlexander V. Chernikov 	rtinfo->rti_addrs = 0;
1141df8bae1dSRodney W. Grimes 	for (i = 0; i < RTAX_MAX; i++) {
11425dfc91d7SLuigi Rizzo 		struct sockaddr *sa;
1143df8bae1dSRodney W. Grimes 
11445dfc91d7SLuigi Rizzo 		if ((sa = rtinfo->rti_info[i]) == NULL)
1145df8bae1dSRodney W. Grimes 			continue;
1146df8bae1dSRodney W. Grimes 		rtinfo->rti_addrs |= (1 << i);
1147e74642dfSLuigi Rizzo 		dlen = SA_SIZE(sa);
1148f2e5eb36SAlexander V. Chernikov 		if (cp != NULL && buflen >= dlen) {
11496bbfef90SHiroki Sato #ifdef INET6
11505c9fa630SHiroki Sato 			if (V_deembed_scopeid && sa->sa_family == AF_INET6) {
11516bbfef90SHiroki Sato 				sin6 = (struct sockaddr_in6 *)&ss;
11526bbfef90SHiroki Sato 				bcopy(sa, sin6, sizeof(*sin6));
11536bbfef90SHiroki Sato 				if (sa6_recoverscope(sin6) == 0)
11546bbfef90SHiroki Sato 					sa = (struct sockaddr *)sin6;
11556bbfef90SHiroki Sato 			}
11566bbfef90SHiroki Sato #endif
1157df8bae1dSRodney W. Grimes 			bcopy((caddr_t)sa, cp, (unsigned)dlen);
1158df8bae1dSRodney W. Grimes 			cp += dlen;
1159f2e5eb36SAlexander V. Chernikov 			buflen -= dlen;
1160f2e5eb36SAlexander V. Chernikov 		} else if (cp != NULL) {
1161f2e5eb36SAlexander V. Chernikov 			/*
1162f2e5eb36SAlexander V. Chernikov 			 * Buffer too small. Count needed size
1163f2e5eb36SAlexander V. Chernikov 			 * and return with error.
1164f2e5eb36SAlexander V. Chernikov 			 */
1165f2e5eb36SAlexander V. Chernikov 			cp = NULL;
1166df8bae1dSRodney W. Grimes 		}
1167f2e5eb36SAlexander V. Chernikov 
1168df8bae1dSRodney W. Grimes 		len += dlen;
1169df8bae1dSRodney W. Grimes 	}
1170f2e5eb36SAlexander V. Chernikov 
1171f2e5eb36SAlexander V. Chernikov 	if (cp != NULL) {
1172f2e5eb36SAlexander V. Chernikov 		dlen = ALIGN(len) - len;
1173f2e5eb36SAlexander V. Chernikov 		if (buflen < dlen)
1174f2e5eb36SAlexander V. Chernikov 			cp = NULL;
1175f2e5eb36SAlexander V. Chernikov 		else
1176f2e5eb36SAlexander V. Chernikov 			buflen -= dlen;
1177f2e5eb36SAlexander V. Chernikov 	}
1178694ff264SAndrew Gallatin 	len = ALIGN(len);
1179df8bae1dSRodney W. Grimes 
1180f2e5eb36SAlexander V. Chernikov 	if (cp != NULL) {
1181f2e5eb36SAlexander V. Chernikov 		/* fill header iff buffer is large enough */
1182df8bae1dSRodney W. Grimes 		rtm->rtm_version = RTM_VERSION;
1183df8bae1dSRodney W. Grimes 		rtm->rtm_type = type;
1184df8bae1dSRodney W. Grimes 		rtm->rtm_msglen = len;
1185df8bae1dSRodney W. Grimes 	}
1186f2e5eb36SAlexander V. Chernikov 
1187f2e5eb36SAlexander V. Chernikov 	*plen = len;
1188f2e5eb36SAlexander V. Chernikov 
1189f2e5eb36SAlexander V. Chernikov 	if (w != NULL && cp == NULL)
1190f2e5eb36SAlexander V. Chernikov 		return (ENOBUFS);
1191f2e5eb36SAlexander V. Chernikov 
1192f2e5eb36SAlexander V. Chernikov 	return (0);
1193df8bae1dSRodney W. Grimes }
1194df8bae1dSRodney W. Grimes 
1195df8bae1dSRodney W. Grimes /*
1196df8bae1dSRodney W. Grimes  * This routine is called to generate a message from the routing
1197df8bae1dSRodney W. Grimes  * socket indicating that a redirect has occured, a routing lookup
1198df8bae1dSRodney W. Grimes  * has failed, or that a protocol has detected timeouts to a particular
1199df8bae1dSRodney W. Grimes  * destination.
1200df8bae1dSRodney W. Grimes  */
1201df8bae1dSRodney W. Grimes void
1202528737fdSBjoern A. Zeeb rt_missmsg_fib(int type, struct rt_addrinfo *rtinfo, int flags, int error,
1203528737fdSBjoern A. Zeeb     int fibnum)
1204df8bae1dSRodney W. Grimes {
1205becc44d7SSam Leffler 	struct rt_msghdr *rtm;
1206becc44d7SSam Leffler 	struct mbuf *m;
1207df8bae1dSRodney W. Grimes 	struct sockaddr *sa = rtinfo->rti_info[RTAX_DST];
1208df8bae1dSRodney W. Grimes 
1209c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
1210df8bae1dSRodney W. Grimes 		return;
1211*6db47af4SAlexander V. Chernikov 	m = rtsock_msg_mbuf(type, rtinfo);
12125dfc91d7SLuigi Rizzo 	if (m == NULL)
1213df8bae1dSRodney W. Grimes 		return;
1214528737fdSBjoern A. Zeeb 
12157d9b6df1SAlexander V. Chernikov 	if (fibnum != RT_ALL_FIBS) {
1216528737fdSBjoern A. Zeeb 		KASSERT(fibnum >= 0 && fibnum < rt_numfibs, ("%s: fibnum out "
1217528737fdSBjoern A. Zeeb 		    "of range 0 <= %d < %d", __func__, fibnum, rt_numfibs));
1218528737fdSBjoern A. Zeeb 		M_SETFIB(m, fibnum);
1219528737fdSBjoern A. Zeeb 		m->m_flags |= RTS_FILTER_FIB;
1220528737fdSBjoern A. Zeeb 	}
1221528737fdSBjoern A. Zeeb 
1222df8bae1dSRodney W. Grimes 	rtm = mtod(m, struct rt_msghdr *);
1223df8bae1dSRodney W. Grimes 	rtm->rtm_flags = RTF_DONE | flags;
1224df8bae1dSRodney W. Grimes 	rtm->rtm_errno = error;
1225df8bae1dSRodney W. Grimes 	rtm->rtm_addrs = rtinfo->rti_addrs;
12263ca1a2d6SMax Laier 	rt_dispatch(m, sa ? sa->sa_family : AF_UNSPEC);
1227df8bae1dSRodney W. Grimes }
1228df8bae1dSRodney W. Grimes 
1229528737fdSBjoern A. Zeeb void
1230528737fdSBjoern A. Zeeb rt_missmsg(int type, struct rt_addrinfo *rtinfo, int flags, int error)
1231528737fdSBjoern A. Zeeb {
1232528737fdSBjoern A. Zeeb 
12337d9b6df1SAlexander V. Chernikov 	rt_missmsg_fib(type, rtinfo, flags, error, RT_ALL_FIBS);
1234528737fdSBjoern A. Zeeb }
1235528737fdSBjoern A. Zeeb 
1236df8bae1dSRodney W. Grimes /*
1237df8bae1dSRodney W. Grimes  * This routine is called to generate a message from the routing
1238df8bae1dSRodney W. Grimes  * socket indicating that the status of a network interface has changed.
1239df8bae1dSRodney W. Grimes  */
1240df8bae1dSRodney W. Grimes void
1241becc44d7SSam Leffler rt_ifmsg(struct ifnet *ifp)
1242df8bae1dSRodney W. Grimes {
1243becc44d7SSam Leffler 	struct if_msghdr *ifm;
1244df8bae1dSRodney W. Grimes 	struct mbuf *m;
1245df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
1246df8bae1dSRodney W. Grimes 
1247c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
1248df8bae1dSRodney W. Grimes 		return;
1249df8bae1dSRodney W. Grimes 	bzero((caddr_t)&info, sizeof(info));
1250*6db47af4SAlexander V. Chernikov 	m = rtsock_msg_mbuf(RTM_IFINFO, &info);
12515dfc91d7SLuigi Rizzo 	if (m == NULL)
1252df8bae1dSRodney W. Grimes 		return;
1253df8bae1dSRodney W. Grimes 	ifm = mtod(m, struct if_msghdr *);
1254df8bae1dSRodney W. Grimes 	ifm->ifm_index = ifp->if_index;
1255292ee7beSRobert Watson 	ifm->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
1256df8bae1dSRodney W. Grimes 	ifm->ifm_data = ifp->if_data;
1257df8bae1dSRodney W. Grimes 	ifm->ifm_addrs = 0;
12583ca1a2d6SMax Laier 	rt_dispatch(m, AF_UNSPEC);
1259df8bae1dSRodney W. Grimes }
1260df8bae1dSRodney W. Grimes 
1261df8bae1dSRodney W. Grimes /*
12624cbac30bSAlexander V. Chernikov  * Announce interface address arrival/withdraw.
12634cbac30bSAlexander V. Chernikov  * Please do not call directly, use rt_addrmsg().
12644cbac30bSAlexander V. Chernikov  * Assume input data to be valid.
12654cbac30bSAlexander V. Chernikov  * Returns 0 on success.
1266df8bae1dSRodney W. Grimes  */
12674cbac30bSAlexander V. Chernikov int
12684cbac30bSAlexander V. Chernikov rtsock_addrmsg(int cmd, struct ifaddr *ifa, int fibnum)
1269df8bae1dSRodney W. Grimes {
1270df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
12714cbac30bSAlexander V. Chernikov 	struct sockaddr *sa;
12724cbac30bSAlexander V. Chernikov 	int ncmd;
12734cbac30bSAlexander V. Chernikov 	struct mbuf *m;
12744cbac30bSAlexander V. Chernikov 	struct ifa_msghdr *ifam;
1275df8bae1dSRodney W. Grimes 	struct ifnet *ifp = ifa->ifa_ifp;
12763deb3649SAlexander V. Chernikov 	struct sockaddr_storage ss;
1277df8bae1dSRodney W. Grimes 
1278c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
12794cbac30bSAlexander V. Chernikov 		return (0);
1280df8bae1dSRodney W. Grimes 
12814cbac30bSAlexander V. Chernikov 	ncmd = cmd == RTM_ADD ? RTM_NEWADDR : RTM_DELADDR;
12824cbac30bSAlexander V. Chernikov 
12834cbac30bSAlexander V. Chernikov 	bzero((caddr_t)&info, sizeof(info));
1284becc44d7SSam Leffler 	info.rti_info[RTAX_IFA] = sa = ifa->ifa_addr;
12854a0d6638SRuslan Ermilov 	info.rti_info[RTAX_IFP] = ifp->if_addr->ifa_addr;
12863deb3649SAlexander V. Chernikov 	info.rti_info[RTAX_NETMASK] = rtsock_fix_netmask(
12873deb3649SAlexander V. Chernikov 	    info.rti_info[RTAX_IFP], ifa->ifa_netmask, &ss);
1288becc44d7SSam Leffler 	info.rti_info[RTAX_BRD] = ifa->ifa_dstaddr;
1289*6db47af4SAlexander V. Chernikov 	if ((m = rtsock_msg_mbuf(ncmd, &info)) == NULL)
12904cbac30bSAlexander V. Chernikov 		return (ENOBUFS);
1291df8bae1dSRodney W. Grimes 	ifam = mtod(m, struct ifa_msghdr *);
1292df8bae1dSRodney W. Grimes 	ifam->ifam_index = ifp->if_index;
1293df8bae1dSRodney W. Grimes 	ifam->ifam_metric = ifa->ifa_metric;
1294df8bae1dSRodney W. Grimes 	ifam->ifam_flags = ifa->ifa_flags;
1295df8bae1dSRodney W. Grimes 	ifam->ifam_addrs = info.rti_addrs;
12964cbac30bSAlexander V. Chernikov 
12974cbac30bSAlexander V. Chernikov 	if (fibnum != RT_ALL_FIBS) {
12984cbac30bSAlexander V. Chernikov 		M_SETFIB(m, fibnum);
12994cbac30bSAlexander V. Chernikov 		m->m_flags |= RTS_FILTER_FIB;
1300df8bae1dSRodney W. Grimes 	}
13014cbac30bSAlexander V. Chernikov 
13024cbac30bSAlexander V. Chernikov 	rt_dispatch(m, sa ? sa->sa_family : AF_UNSPEC);
13034cbac30bSAlexander V. Chernikov 
13044cbac30bSAlexander V. Chernikov 	return (0);
13054cbac30bSAlexander V. Chernikov }
13064cbac30bSAlexander V. Chernikov 
13074cbac30bSAlexander V. Chernikov /*
13084cbac30bSAlexander V. Chernikov  * Announce route addition/removal.
13094cbac30bSAlexander V. Chernikov  * Please do not call directly, use rt_routemsg().
13104cbac30bSAlexander V. Chernikov  * Note that @rt data MAY be inconsistent/invalid:
13114cbac30bSAlexander V. Chernikov  * if some userland app sends us "invalid" route message (invalid mask,
13124cbac30bSAlexander V. Chernikov  * no dst, wrong address families, etc...) we need to pass it back
13134cbac30bSAlexander V. Chernikov  * to app (and any other rtsock consumers) with rtm_errno field set to
13144cbac30bSAlexander V. Chernikov  * non-zero value.
13154cbac30bSAlexander V. Chernikov  *
13164cbac30bSAlexander V. Chernikov  * Returns 0 on success.
13174cbac30bSAlexander V. Chernikov  */
13184cbac30bSAlexander V. Chernikov int
13194cbac30bSAlexander V. Chernikov rtsock_routemsg(int cmd, struct ifnet *ifp, int error, struct rtentry *rt,
13204cbac30bSAlexander V. Chernikov     int fibnum)
13214cbac30bSAlexander V. Chernikov {
13224cbac30bSAlexander V. Chernikov 	struct rt_addrinfo info;
13234cbac30bSAlexander V. Chernikov 	struct sockaddr *sa;
13244cbac30bSAlexander V. Chernikov 	struct mbuf *m;
13255dfc91d7SLuigi Rizzo 	struct rt_msghdr *rtm;
13263deb3649SAlexander V. Chernikov 	struct sockaddr_storage ss;
1327df8bae1dSRodney W. Grimes 
1328c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
13294cbac30bSAlexander V. Chernikov 		return (0);
13304cbac30bSAlexander V. Chernikov 
13314cbac30bSAlexander V. Chernikov 	bzero((caddr_t)&info, sizeof(info));
1332becc44d7SSam Leffler 	info.rti_info[RTAX_DST] = sa = rt_key(rt);
13333deb3649SAlexander V. Chernikov 	info.rti_info[RTAX_NETMASK] = rtsock_fix_netmask(sa, rt_mask(rt), &ss);
1334becc44d7SSam Leffler 	info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
1335*6db47af4SAlexander V. Chernikov 	if ((m = rtsock_msg_mbuf(cmd, &info)) == NULL)
13364cbac30bSAlexander V. Chernikov 		return (ENOBUFS);
1337df8bae1dSRodney W. Grimes 	rtm = mtod(m, struct rt_msghdr *);
1338df8bae1dSRodney W. Grimes 	rtm->rtm_index = ifp->if_index;
1339df8bae1dSRodney W. Grimes 	rtm->rtm_flags |= rt->rt_flags;
1340df8bae1dSRodney W. Grimes 	rtm->rtm_errno = error;
1341df8bae1dSRodney W. Grimes 	rtm->rtm_addrs = info.rti_addrs;
13424cbac30bSAlexander V. Chernikov 
13437d9b6df1SAlexander V. Chernikov 	if (fibnum != RT_ALL_FIBS) {
1344528737fdSBjoern A. Zeeb 		M_SETFIB(m, fibnum);
1345528737fdSBjoern A. Zeeb 		m->m_flags |= RTS_FILTER_FIB;
1346528737fdSBjoern A. Zeeb 	}
13474cbac30bSAlexander V. Chernikov 
13483ca1a2d6SMax Laier 	rt_dispatch(m, sa ? sa->sa_family : AF_UNSPEC);
13494cbac30bSAlexander V. Chernikov 
13504cbac30bSAlexander V. Chernikov 	return (0);
1351df8bae1dSRodney W. Grimes }
1352df8bae1dSRodney W. Grimes 
1353477180fbSGarrett Wollman /*
1354477180fbSGarrett Wollman  * This is the analogue to the rt_newaddrmsg which performs the same
1355477180fbSGarrett Wollman  * function but for multicast group memberhips.  This is easier since
1356477180fbSGarrett Wollman  * there is no route state to worry about.
1357477180fbSGarrett Wollman  */
1358477180fbSGarrett Wollman void
1359becc44d7SSam Leffler rt_newmaddrmsg(int cmd, struct ifmultiaddr *ifma)
1360477180fbSGarrett Wollman {
1361477180fbSGarrett Wollman 	struct rt_addrinfo info;
13625dfc91d7SLuigi Rizzo 	struct mbuf *m = NULL;
1363477180fbSGarrett Wollman 	struct ifnet *ifp = ifma->ifma_ifp;
1364477180fbSGarrett Wollman 	struct ifma_msghdr *ifmam;
1365477180fbSGarrett Wollman 
1366c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
1367477180fbSGarrett Wollman 		return;
1368477180fbSGarrett Wollman 
1369477180fbSGarrett Wollman 	bzero((caddr_t)&info, sizeof(info));
1370becc44d7SSam Leffler 	info.rti_info[RTAX_IFA] = ifma->ifma_addr;
13714a0d6638SRuslan Ermilov 	info.rti_info[RTAX_IFP] = ifp ? ifp->if_addr->ifa_addr : NULL;
1372477180fbSGarrett Wollman 	/*
1373477180fbSGarrett Wollman 	 * If a link-layer address is present, present it as a ``gateway''
1374477180fbSGarrett Wollman 	 * (similarly to how ARP entries, e.g., are presented).
1375477180fbSGarrett Wollman 	 */
1376becc44d7SSam Leffler 	info.rti_info[RTAX_GATEWAY] = ifma->ifma_lladdr;
1377*6db47af4SAlexander V. Chernikov 	m = rtsock_msg_mbuf(cmd, &info);
1378becc44d7SSam Leffler 	if (m == NULL)
1379477180fbSGarrett Wollman 		return;
1380477180fbSGarrett Wollman 	ifmam = mtod(m, struct ifma_msghdr *);
138175ae0c01SBruce M Simpson 	KASSERT(ifp != NULL, ("%s: link-layer multicast address w/o ifp\n",
138275ae0c01SBruce M Simpson 	    __func__));
1383477180fbSGarrett Wollman 	ifmam->ifmam_index = ifp->if_index;
1384477180fbSGarrett Wollman 	ifmam->ifmam_addrs = info.rti_addrs;
13853ca1a2d6SMax Laier 	rt_dispatch(m, ifma->ifma_addr ? ifma->ifma_addr->sa_family : AF_UNSPEC);
1386477180fbSGarrett Wollman }
138752041295SPoul-Henning Kamp 
1388b83a279fSSam Leffler static struct mbuf *
1389b83a279fSSam Leffler rt_makeifannouncemsg(struct ifnet *ifp, int type, int what,
1390b83a279fSSam Leffler 	struct rt_addrinfo *info)
1391b83a279fSSam Leffler {
1392b83a279fSSam Leffler 	struct if_announcemsghdr *ifan;
1393b83a279fSSam Leffler 	struct mbuf *m;
1394b83a279fSSam Leffler 
1395c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
1396b83a279fSSam Leffler 		return NULL;
1397b83a279fSSam Leffler 	bzero((caddr_t)info, sizeof(*info));
1398*6db47af4SAlexander V. Chernikov 	m = rtsock_msg_mbuf(type, info);
1399b83a279fSSam Leffler 	if (m != NULL) {
1400b83a279fSSam Leffler 		ifan = mtod(m, struct if_announcemsghdr *);
1401b83a279fSSam Leffler 		ifan->ifan_index = ifp->if_index;
1402b83a279fSSam Leffler 		strlcpy(ifan->ifan_name, ifp->if_xname,
1403b83a279fSSam Leffler 			sizeof(ifan->ifan_name));
1404b83a279fSSam Leffler 		ifan->ifan_what = what;
1405b83a279fSSam Leffler 	}
1406b83a279fSSam Leffler 	return m;
1407b83a279fSSam Leffler }
1408b83a279fSSam Leffler 
1409b83a279fSSam Leffler /*
1410b83a279fSSam Leffler  * This is called to generate routing socket messages indicating
1411b83a279fSSam Leffler  * IEEE80211 wireless events.
1412b83a279fSSam Leffler  * XXX we piggyback on the RTM_IFANNOUNCE msg format in a clumsy way.
1413b83a279fSSam Leffler  */
1414b83a279fSSam Leffler void
1415b83a279fSSam Leffler rt_ieee80211msg(struct ifnet *ifp, int what, void *data, size_t data_len)
1416b83a279fSSam Leffler {
1417b83a279fSSam Leffler 	struct mbuf *m;
1418b83a279fSSam Leffler 	struct rt_addrinfo info;
1419b83a279fSSam Leffler 
1420b83a279fSSam Leffler 	m = rt_makeifannouncemsg(ifp, RTM_IEEE80211, what, &info);
1421b83a279fSSam Leffler 	if (m != NULL) {
1422b83a279fSSam Leffler 		/*
1423b83a279fSSam Leffler 		 * Append the ieee80211 data.  Try to stick it in the
1424b83a279fSSam Leffler 		 * mbuf containing the ifannounce msg; otherwise allocate
1425b83a279fSSam Leffler 		 * a new mbuf and append.
1426b83a279fSSam Leffler 		 *
1427b83a279fSSam Leffler 		 * NB: we assume m is a single mbuf.
1428b83a279fSSam Leffler 		 */
1429b83a279fSSam Leffler 		if (data_len > M_TRAILINGSPACE(m)) {
1430b83a279fSSam Leffler 			struct mbuf *n = m_get(M_NOWAIT, MT_DATA);
1431b83a279fSSam Leffler 			if (n == NULL) {
1432b83a279fSSam Leffler 				m_freem(m);
1433b83a279fSSam Leffler 				return;
1434b83a279fSSam Leffler 			}
1435b83a279fSSam Leffler 			bcopy(data, mtod(n, void *), data_len);
1436b83a279fSSam Leffler 			n->m_len = data_len;
1437b83a279fSSam Leffler 			m->m_next = n;
1438b83a279fSSam Leffler 		} else if (data_len > 0) {
1439b83a279fSSam Leffler 			bcopy(data, mtod(m, u_int8_t *) + m->m_len, data_len);
1440b83a279fSSam Leffler 			m->m_len += data_len;
1441b83a279fSSam Leffler 		}
1442b83a279fSSam Leffler 		if (m->m_flags & M_PKTHDR)
1443b83a279fSSam Leffler 			m->m_pkthdr.len += data_len;
1444b83a279fSSam Leffler 		mtod(m, struct if_announcemsghdr *)->ifan_msglen += data_len;
14453ca1a2d6SMax Laier 		rt_dispatch(m, AF_UNSPEC);
1446b83a279fSSam Leffler 	}
1447b83a279fSSam Leffler }
1448b83a279fSSam Leffler 
1449df8bae1dSRodney W. Grimes /*
14507b6edd04SRuslan Ermilov  * This is called to generate routing socket messages indicating
14517b6edd04SRuslan Ermilov  * network interface arrival and departure.
14527b6edd04SRuslan Ermilov  */
14537b6edd04SRuslan Ermilov void
1454becc44d7SSam Leffler rt_ifannouncemsg(struct ifnet *ifp, int what)
14557b6edd04SRuslan Ermilov {
14567b6edd04SRuslan Ermilov 	struct mbuf *m;
14577b6edd04SRuslan Ermilov 	struct rt_addrinfo info;
14587b6edd04SRuslan Ermilov 
1459b83a279fSSam Leffler 	m = rt_makeifannouncemsg(ifp, RTM_IFANNOUNCE, what, &info);
1460b83a279fSSam Leffler 	if (m != NULL)
14613ca1a2d6SMax Laier 		rt_dispatch(m, AF_UNSPEC);
1462becc44d7SSam Leffler }
1463becc44d7SSam Leffler 
1464becc44d7SSam Leffler static void
14653ca1a2d6SMax Laier rt_dispatch(struct mbuf *m, sa_family_t saf)
1466becc44d7SSam Leffler {
1467d989c7b3SRobert Watson 	struct m_tag *tag;
1468becc44d7SSam Leffler 
1469d989c7b3SRobert Watson 	/*
1470d989c7b3SRobert Watson 	 * Preserve the family from the sockaddr, if any, in an m_tag for
1471d989c7b3SRobert Watson 	 * use when injecting the mbuf into the routing socket buffer from
1472d989c7b3SRobert Watson 	 * the netisr.
1473d989c7b3SRobert Watson 	 */
14743ca1a2d6SMax Laier 	if (saf != AF_UNSPEC) {
1475d989c7b3SRobert Watson 		tag = m_tag_get(PACKET_TAG_RTSOCKFAM, sizeof(unsigned short),
1476d989c7b3SRobert Watson 		    M_NOWAIT);
1477d989c7b3SRobert Watson 		if (tag == NULL) {
1478d989c7b3SRobert Watson 			m_freem(m);
1479d989c7b3SRobert Watson 			return;
1480d989c7b3SRobert Watson 		}
14813ca1a2d6SMax Laier 		*(unsigned short *)(tag + 1) = saf;
1482d989c7b3SRobert Watson 		m_tag_prepend(m, tag);
1483d989c7b3SRobert Watson 	}
148421ca7b57SMarko Zec #ifdef VIMAGE
148521ca7b57SMarko Zec 	if (V_loif)
148621ca7b57SMarko Zec 		m->m_pkthdr.rcvif = V_loif;
148721ca7b57SMarko Zec 	else {
148821ca7b57SMarko Zec 		m_freem(m);
148921ca7b57SMarko Zec 		return;
149021ca7b57SMarko Zec 	}
149121ca7b57SMarko Zec #endif
14923161f583SAndre Oppermann 	netisr_queue(NETISR_ROUTE, m);	/* mbuf is free'd on failure. */
14937b6edd04SRuslan Ermilov }
14947b6edd04SRuslan Ermilov 
14957b6edd04SRuslan Ermilov /*
1496df8bae1dSRodney W. Grimes  * This is used in dumping the kernel table via sysctl().
1497df8bae1dSRodney W. Grimes  */
149837c84183SPoul-Henning Kamp static int
1499becc44d7SSam Leffler sysctl_dumpentry(struct radix_node *rn, void *vw)
1500df8bae1dSRodney W. Grimes {
1501becc44d7SSam Leffler 	struct walkarg *w = vw;
1502becc44d7SSam Leffler 	struct rtentry *rt = (struct rtentry *)rn;
1503df8bae1dSRodney W. Grimes 	int error = 0, size;
1504df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
15053deb3649SAlexander V. Chernikov 	struct sockaddr_storage ss;
1506df8bae1dSRodney W. Grimes 
1507df8bae1dSRodney W. Grimes 	if (w->w_op == NET_RT_FLAGS && !(rt->rt_flags & w->w_arg))
1508df8bae1dSRodney W. Grimes 		return 0;
1509b89e82ddSJamie Gritton 	if ((rt->rt_flags & RTF_HOST) == 0
1510de0bd6f7SBjoern A. Zeeb 	    ? jailed_without_vnet(w->w_req->td->td_ucred)
1511b89e82ddSJamie Gritton 	    : prison_if(w->w_req->td->td_ucred, rt_key(rt)) != 0)
1512813dd6aeSBjoern A. Zeeb 		return (0);
1513df8bae1dSRodney W. Grimes 	bzero((caddr_t)&info, sizeof(info));
1514becc44d7SSam Leffler 	info.rti_info[RTAX_DST] = rt_key(rt);
1515becc44d7SSam Leffler 	info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
15163deb3649SAlexander V. Chernikov 	info.rti_info[RTAX_NETMASK] = rtsock_fix_netmask(rt_key(rt),
15173deb3649SAlexander V. Chernikov 	    rt_mask(rt), &ss);
15186e6b3f7cSQing Li 	info.rti_info[RTAX_GENMASK] = 0;
151928070a0eSRuslan Ermilov 	if (rt->rt_ifp) {
15204a0d6638SRuslan Ermilov 		info.rti_info[RTAX_IFP] = rt->rt_ifp->if_addr->ifa_addr;
1521becc44d7SSam Leffler 		info.rti_info[RTAX_IFA] = rt->rt_ifa->ifa_addr;
152228070a0eSRuslan Ermilov 		if (rt->rt_ifp->if_flags & IFF_POINTOPOINT)
1523becc44d7SSam Leffler 			info.rti_info[RTAX_BRD] = rt->rt_ifa->ifa_dstaddr;
152428070a0eSRuslan Ermilov 	}
1525f2e5eb36SAlexander V. Chernikov 	if ((error = rtsock_msg_buffer(RTM_GET, &info, w, &size)) != 0)
1526f2e5eb36SAlexander V. Chernikov 		return (error);
152752041295SPoul-Henning Kamp 	if (w->w_req && w->w_tmem) {
1528becc44d7SSam Leffler 		struct rt_msghdr *rtm = (struct rt_msghdr *)w->w_tmem;
1529df8bae1dSRodney W. Grimes 
1530f672f56fSQing Li 		if (rt->rt_flags & RTF_GWFLAG_COMPAT)
1531f672f56fSQing Li 			rtm->rtm_flags = RTF_GATEWAY |
1532f672f56fSQing Li 				(rt->rt_flags & ~RTF_GWFLAG_COMPAT);
1533f672f56fSQing Li 		else
1534df8bae1dSRodney W. Grimes 			rtm->rtm_flags = rt->rt_flags;
1535e3a7aa6fSGleb Smirnoff 		rt_getmetrics(rt, &rtm->rtm_rmx);
1536df8bae1dSRodney W. Grimes 		rtm->rtm_index = rt->rt_ifp->if_index;
1537df8bae1dSRodney W. Grimes 		rtm->rtm_errno = rtm->rtm_pid = rtm->rtm_seq = 0;
1538df8bae1dSRodney W. Grimes 		rtm->rtm_addrs = info.rti_addrs;
153952041295SPoul-Henning Kamp 		error = SYSCTL_OUT(w->w_req, (caddr_t)rtm, size);
154052041295SPoul-Henning Kamp 		return (error);
1541df8bae1dSRodney W. Grimes 	}
1542df8bae1dSRodney W. Grimes 	return (error);
1543df8bae1dSRodney W. Grimes }
1544df8bae1dSRodney W. Grimes 
154537c84183SPoul-Henning Kamp static int
15466d076ae8SBjoern A. Zeeb sysctl_iflist_ifml(struct ifnet *ifp, struct rt_addrinfo *info,
15476d076ae8SBjoern A. Zeeb     struct walkarg *w, int len)
15486d076ae8SBjoern A. Zeeb {
15496d076ae8SBjoern A. Zeeb 	struct if_msghdrl *ifm;
1550b245f96cSGleb Smirnoff 	struct if_data *ifd;
1551b245f96cSGleb Smirnoff 
1552b245f96cSGleb Smirnoff 	ifm = (struct if_msghdrl *)w->w_tmem;
15536d076ae8SBjoern A. Zeeb 
15546d076ae8SBjoern A. Zeeb #ifdef COMPAT_FREEBSD32
15556d076ae8SBjoern A. Zeeb 	if (w->w_req->flags & SCTL_MASK32) {
15566d076ae8SBjoern A. Zeeb 		struct if_msghdrl32 *ifm32;
15576d076ae8SBjoern A. Zeeb 
1558b245f96cSGleb Smirnoff 		ifm32 = (struct if_msghdrl32 *)ifm;
15596d076ae8SBjoern A. Zeeb 		ifm32->ifm_addrs = info->rti_addrs;
15606d076ae8SBjoern A. Zeeb 		ifm32->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
15616d076ae8SBjoern A. Zeeb 		ifm32->ifm_index = ifp->if_index;
15626d076ae8SBjoern A. Zeeb 		ifm32->_ifm_spare1 = 0;
15636d076ae8SBjoern A. Zeeb 		ifm32->ifm_len = sizeof(*ifm32);
15646d076ae8SBjoern A. Zeeb 		ifm32->ifm_data_off = offsetof(struct if_msghdrl32, ifm_data);
1565b245f96cSGleb Smirnoff 		ifd = &ifm32->ifm_data;
1566b245f96cSGleb Smirnoff 	} else
15676d076ae8SBjoern A. Zeeb #endif
1568b245f96cSGleb Smirnoff 	{
15696d076ae8SBjoern A. Zeeb 		ifm->ifm_addrs = info->rti_addrs;
15706d076ae8SBjoern A. Zeeb 		ifm->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
15716d076ae8SBjoern A. Zeeb 		ifm->ifm_index = ifp->if_index;
15726d076ae8SBjoern A. Zeeb 		ifm->_ifm_spare1 = 0;
15736d076ae8SBjoern A. Zeeb 		ifm->ifm_len = sizeof(*ifm);
15746d076ae8SBjoern A. Zeeb 		ifm->ifm_data_off = offsetof(struct if_msghdrl, ifm_data);
1575b245f96cSGleb Smirnoff 		ifd = &ifm->ifm_data;
1576b245f96cSGleb Smirnoff 	}
15776d076ae8SBjoern A. Zeeb 
1578b245f96cSGleb Smirnoff 	*ifd = ifp->if_data;
1579b245f96cSGleb Smirnoff 
15802d70c0deSGleb Smirnoff 	/* Some drivers still use ifqueue(9), add its stats. */
15812d70c0deSGleb Smirnoff 	ifd->ifi_oqdrops += ifp->if_snd.ifq_drops;
15826d076ae8SBjoern A. Zeeb 
15836d076ae8SBjoern A. Zeeb 	return (SYSCTL_OUT(w->w_req, (caddr_t)ifm, len));
15846d076ae8SBjoern A. Zeeb }
15856d076ae8SBjoern A. Zeeb 
15866d076ae8SBjoern A. Zeeb static int
15876d076ae8SBjoern A. Zeeb sysctl_iflist_ifm(struct ifnet *ifp, struct rt_addrinfo *info,
15886d076ae8SBjoern A. Zeeb     struct walkarg *w, int len)
15896d076ae8SBjoern A. Zeeb {
15906d076ae8SBjoern A. Zeeb 	struct if_msghdr *ifm;
1591b245f96cSGleb Smirnoff 	struct if_data *ifd;
1592b245f96cSGleb Smirnoff 
1593b245f96cSGleb Smirnoff 	ifm = (struct if_msghdr *)w->w_tmem;
15946d076ae8SBjoern A. Zeeb 
15956d076ae8SBjoern A. Zeeb #ifdef COMPAT_FREEBSD32
15966d076ae8SBjoern A. Zeeb 	if (w->w_req->flags & SCTL_MASK32) {
15976d076ae8SBjoern A. Zeeb 		struct if_msghdr32 *ifm32;
15986d076ae8SBjoern A. Zeeb 
1599b245f96cSGleb Smirnoff 		ifm32 = (struct if_msghdr32 *)ifm;
16006d076ae8SBjoern A. Zeeb 		ifm32->ifm_addrs = info->rti_addrs;
16016d076ae8SBjoern A. Zeeb 		ifm32->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
16026d076ae8SBjoern A. Zeeb 		ifm32->ifm_index = ifp->if_index;
1603b245f96cSGleb Smirnoff 		ifd = &ifm32->ifm_data;
1604b245f96cSGleb Smirnoff 	} else
16056d076ae8SBjoern A. Zeeb #endif
1606b245f96cSGleb Smirnoff 	{
16076d076ae8SBjoern A. Zeeb 		ifm->ifm_addrs = info->rti_addrs;
16086d076ae8SBjoern A. Zeeb 		ifm->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
16096d076ae8SBjoern A. Zeeb 		ifm->ifm_index = ifp->if_index;
1610b245f96cSGleb Smirnoff 		ifd = &ifm->ifm_data;
1611b245f96cSGleb Smirnoff 	}
16126d076ae8SBjoern A. Zeeb 
1613b245f96cSGleb Smirnoff 	*ifd = ifp->if_data;
16142d70c0deSGleb Smirnoff 
16152d70c0deSGleb Smirnoff 	/* Some drivers still use ifqueue(9), add its stats. */
16162d70c0deSGleb Smirnoff 	ifd->ifi_oqdrops += ifp->if_snd.ifq_drops;
16176d076ae8SBjoern A. Zeeb 
16186d076ae8SBjoern A. Zeeb 	return (SYSCTL_OUT(w->w_req, (caddr_t)ifm, len));
16196d076ae8SBjoern A. Zeeb }
16206d076ae8SBjoern A. Zeeb 
16216d076ae8SBjoern A. Zeeb static int
16226d076ae8SBjoern A. Zeeb sysctl_iflist_ifaml(struct ifaddr *ifa, struct rt_addrinfo *info,
16236d076ae8SBjoern A. Zeeb     struct walkarg *w, int len)
16246d076ae8SBjoern A. Zeeb {
16256d076ae8SBjoern A. Zeeb 	struct ifa_msghdrl *ifam;
1626b245f96cSGleb Smirnoff 	struct if_data *ifd;
1627b245f96cSGleb Smirnoff 
1628b245f96cSGleb Smirnoff 	ifam = (struct ifa_msghdrl *)w->w_tmem;
16296d076ae8SBjoern A. Zeeb 
16306d076ae8SBjoern A. Zeeb #ifdef COMPAT_FREEBSD32
16316d076ae8SBjoern A. Zeeb 	if (w->w_req->flags & SCTL_MASK32) {
16326d076ae8SBjoern A. Zeeb 		struct ifa_msghdrl32 *ifam32;
16336d076ae8SBjoern A. Zeeb 
1634b245f96cSGleb Smirnoff 		ifam32 = (struct ifa_msghdrl32 *)ifam;
16356d076ae8SBjoern A. Zeeb 		ifam32->ifam_addrs = info->rti_addrs;
16366d076ae8SBjoern A. Zeeb 		ifam32->ifam_flags = ifa->ifa_flags;
16376d076ae8SBjoern A. Zeeb 		ifam32->ifam_index = ifa->ifa_ifp->if_index;
16386d076ae8SBjoern A. Zeeb 		ifam32->_ifam_spare1 = 0;
16396d076ae8SBjoern A. Zeeb 		ifam32->ifam_len = sizeof(*ifam32);
16406d076ae8SBjoern A. Zeeb 		ifam32->ifam_data_off =
16416d076ae8SBjoern A. Zeeb 		    offsetof(struct ifa_msghdrl32, ifam_data);
16426d076ae8SBjoern A. Zeeb 		ifam32->ifam_metric = ifa->ifa_metric;
1643b245f96cSGleb Smirnoff 		ifd = &ifam32->ifam_data;
1644b245f96cSGleb Smirnoff 	} else
16456d076ae8SBjoern A. Zeeb #endif
1646b245f96cSGleb Smirnoff 	{
16476d076ae8SBjoern A. Zeeb 		ifam->ifam_addrs = info->rti_addrs;
16486d076ae8SBjoern A. Zeeb 		ifam->ifam_flags = ifa->ifa_flags;
16496d076ae8SBjoern A. Zeeb 		ifam->ifam_index = ifa->ifa_ifp->if_index;
16506d076ae8SBjoern A. Zeeb 		ifam->_ifam_spare1 = 0;
16516d076ae8SBjoern A. Zeeb 		ifam->ifam_len = sizeof(*ifam);
16526d076ae8SBjoern A. Zeeb 		ifam->ifam_data_off = offsetof(struct ifa_msghdrl, ifam_data);
16536d076ae8SBjoern A. Zeeb 		ifam->ifam_metric = ifa->ifa_metric;
1654b245f96cSGleb Smirnoff 		ifd = &ifam->ifam_data;
1655b245f96cSGleb Smirnoff 	}
16566d076ae8SBjoern A. Zeeb 
1657b245f96cSGleb Smirnoff 	bzero(ifd, sizeof(*ifd));
1658b245f96cSGleb Smirnoff 	ifd->ifi_datalen = sizeof(struct if_data);
1659b245f96cSGleb Smirnoff 	ifd->ifi_ipackets = counter_u64_fetch(ifa->ifa_ipackets);
1660b245f96cSGleb Smirnoff 	ifd->ifi_opackets = counter_u64_fetch(ifa->ifa_opackets);
1661b245f96cSGleb Smirnoff 	ifd->ifi_ibytes = counter_u64_fetch(ifa->ifa_ibytes);
1662b245f96cSGleb Smirnoff 	ifd->ifi_obytes = counter_u64_fetch(ifa->ifa_obytes);
16637caf4ab7SGleb Smirnoff 
16646d076ae8SBjoern A. Zeeb 	/* Fixup if_data carp(4) vhid. */
16656d076ae8SBjoern A. Zeeb 	if (carp_get_vhid_p != NULL)
1666b245f96cSGleb Smirnoff 		ifd->ifi_vhid = (*carp_get_vhid_p)(ifa);
16676d076ae8SBjoern A. Zeeb 
16686d076ae8SBjoern A. Zeeb 	return (SYSCTL_OUT(w->w_req, w->w_tmem, len));
16696d076ae8SBjoern A. Zeeb }
16706d076ae8SBjoern A. Zeeb 
16716d076ae8SBjoern A. Zeeb static int
16726d076ae8SBjoern A. Zeeb sysctl_iflist_ifam(struct ifaddr *ifa, struct rt_addrinfo *info,
16736d076ae8SBjoern A. Zeeb     struct walkarg *w, int len)
16746d076ae8SBjoern A. Zeeb {
16756d076ae8SBjoern A. Zeeb 	struct ifa_msghdr *ifam;
16766d076ae8SBjoern A. Zeeb 
16776d076ae8SBjoern A. Zeeb 	ifam = (struct ifa_msghdr *)w->w_tmem;
16786d076ae8SBjoern A. Zeeb 	ifam->ifam_addrs = info->rti_addrs;
16796d076ae8SBjoern A. Zeeb 	ifam->ifam_flags = ifa->ifa_flags;
16806d076ae8SBjoern A. Zeeb 	ifam->ifam_index = ifa->ifa_ifp->if_index;
16816d076ae8SBjoern A. Zeeb 	ifam->ifam_metric = ifa->ifa_metric;
16826d076ae8SBjoern A. Zeeb 
16836d076ae8SBjoern A. Zeeb 	return (SYSCTL_OUT(w->w_req, w->w_tmem, len));
16846d076ae8SBjoern A. Zeeb }
16856d076ae8SBjoern A. Zeeb 
16866d076ae8SBjoern A. Zeeb static int
1687becc44d7SSam Leffler sysctl_iflist(int af, struct walkarg *w)
1688df8bae1dSRodney W. Grimes {
1689becc44d7SSam Leffler 	struct ifnet *ifp;
1690becc44d7SSam Leffler 	struct ifaddr *ifa;
1691df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
1692df8bae1dSRodney W. Grimes 	int len, error = 0;
16933deb3649SAlexander V. Chernikov 	struct sockaddr_storage ss;
1694df8bae1dSRodney W. Grimes 
1695df8bae1dSRodney W. Grimes 	bzero((caddr_t)&info, sizeof(info));
16965c9fa630SHiroki Sato 	IFNET_RLOCK_NOSLEEP();
1697603724d3SBjoern A. Zeeb 	TAILQ_FOREACH(ifp, &V_ifnet, if_link) {
1698df8bae1dSRodney W. Grimes 		if (w->w_arg && w->w_arg != ifp->if_index)
1699df8bae1dSRodney W. Grimes 			continue;
1700137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
17014a0d6638SRuslan Ermilov 		ifa = ifp->if_addr;
1702becc44d7SSam Leffler 		info.rti_info[RTAX_IFP] = ifa->ifa_addr;
1703f2e5eb36SAlexander V. Chernikov 		error = rtsock_msg_buffer(RTM_IFINFO, &info, w, &len);
1704f2e5eb36SAlexander V. Chernikov 		if (error != 0)
1705f2e5eb36SAlexander V. Chernikov 			goto done;
17065dfc91d7SLuigi Rizzo 		info.rti_info[RTAX_IFP] = NULL;
170752041295SPoul-Henning Kamp 		if (w->w_req && w->w_tmem) {
17086d076ae8SBjoern A. Zeeb 			if (w->w_op == NET_RT_IFLISTL)
17096d076ae8SBjoern A. Zeeb 				error = sysctl_iflist_ifml(ifp, &info, w, len);
17106d076ae8SBjoern A. Zeeb 			else
17116d076ae8SBjoern A. Zeeb 				error = sysctl_iflist_ifm(ifp, &info, w, len);
1712df440948SPoul-Henning Kamp 			if (error)
1713a35b06c5SJonathan Lemon 				goto done;
1714df8bae1dSRodney W. Grimes 		}
17155dfc91d7SLuigi Rizzo 		while ((ifa = TAILQ_NEXT(ifa, ifa_link)) != NULL) {
1716df8bae1dSRodney W. Grimes 			if (af && af != ifa->ifa_addr->sa_family)
1717df8bae1dSRodney W. Grimes 				continue;
1718b89e82ddSJamie Gritton 			if (prison_if(w->w_req->td->td_ucred,
1719b89e82ddSJamie Gritton 			    ifa->ifa_addr) != 0)
172075c13541SPoul-Henning Kamp 				continue;
1721becc44d7SSam Leffler 			info.rti_info[RTAX_IFA] = ifa->ifa_addr;
17223deb3649SAlexander V. Chernikov 			info.rti_info[RTAX_NETMASK] = rtsock_fix_netmask(
17233deb3649SAlexander V. Chernikov 			    ifa->ifa_addr, ifa->ifa_netmask, &ss);
1724becc44d7SSam Leffler 			info.rti_info[RTAX_BRD] = ifa->ifa_dstaddr;
1725f2e5eb36SAlexander V. Chernikov 			error = rtsock_msg_buffer(RTM_NEWADDR, &info, w, &len);
1726f2e5eb36SAlexander V. Chernikov 			if (error != 0)
1727f2e5eb36SAlexander V. Chernikov 				goto done;
172852041295SPoul-Henning Kamp 			if (w->w_req && w->w_tmem) {
17296d076ae8SBjoern A. Zeeb 				if (w->w_op == NET_RT_IFLISTL)
17306d076ae8SBjoern A. Zeeb 					error = sysctl_iflist_ifaml(ifa, &info,
17316d076ae8SBjoern A. Zeeb 					    w, len);
17326d076ae8SBjoern A. Zeeb 				else
17336d076ae8SBjoern A. Zeeb 					error = sysctl_iflist_ifam(ifa, &info,
17346d076ae8SBjoern A. Zeeb 					    w, len);
1735df440948SPoul-Henning Kamp 				if (error)
1736a35b06c5SJonathan Lemon 					goto done;
1737df8bae1dSRodney W. Grimes 			}
1738df8bae1dSRodney W. Grimes 		}
1739137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
17403deb3649SAlexander V. Chernikov 		info.rti_info[RTAX_IFA] = NULL;
17413deb3649SAlexander V. Chernikov 		info.rti_info[RTAX_NETMASK] = NULL;
17425dfc91d7SLuigi Rizzo 		info.rti_info[RTAX_BRD] = NULL;
1743df8bae1dSRodney W. Grimes 	}
1744a35b06c5SJonathan Lemon done:
1745ee7c7feeSBjoern A. Zeeb 	if (ifp != NULL)
1746137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
17475c9fa630SHiroki Sato 	IFNET_RUNLOCK_NOSLEEP();
1748a35b06c5SJonathan Lemon 	return (error);
1749df8bae1dSRodney W. Grimes }
1750df8bae1dSRodney W. Grimes 
1751ebda3fc3SBjoern A. Zeeb static int
17529b98ee2cSLuigi Rizzo sysctl_ifmalist(int af, struct walkarg *w)
175305b2efe0SBruce M Simpson {
17549b98ee2cSLuigi Rizzo 	struct ifnet *ifp;
175505b2efe0SBruce M Simpson 	struct ifmultiaddr *ifma;
175605b2efe0SBruce M Simpson 	struct	rt_addrinfo info;
175705b2efe0SBruce M Simpson 	int	len, error = 0;
17589b98ee2cSLuigi Rizzo 	struct ifaddr *ifa;
175905b2efe0SBruce M Simpson 
176005b2efe0SBruce M Simpson 	bzero((caddr_t)&info, sizeof(info));
17615c9fa630SHiroki Sato 	IFNET_RLOCK_NOSLEEP();
1762603724d3SBjoern A. Zeeb 	TAILQ_FOREACH(ifp, &V_ifnet, if_link) {
176305b2efe0SBruce M Simpson 		if (w->w_arg && w->w_arg != ifp->if_index)
176405b2efe0SBruce M Simpson 			continue;
17654a0d6638SRuslan Ermilov 		ifa = ifp->if_addr;
1766913af518SLuigi Rizzo 		info.rti_info[RTAX_IFP] = ifa ? ifa->ifa_addr : NULL;
1767137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
176805b2efe0SBruce M Simpson 		TAILQ_FOREACH(ifma, &ifp->if_multiaddrs, ifma_link) {
176905b2efe0SBruce M Simpson 			if (af && af != ifma->ifma_addr->sa_family)
177005b2efe0SBruce M Simpson 				continue;
1771b89e82ddSJamie Gritton 			if (prison_if(w->w_req->td->td_ucred,
1772b89e82ddSJamie Gritton 			    ifma->ifma_addr) != 0)
177305b2efe0SBruce M Simpson 				continue;
177405b2efe0SBruce M Simpson 			info.rti_info[RTAX_IFA] = ifma->ifma_addr;
1775913af518SLuigi Rizzo 			info.rti_info[RTAX_GATEWAY] =
1776913af518SLuigi Rizzo 			    (ifma->ifma_addr->sa_family != AF_LINK) ?
1777913af518SLuigi Rizzo 			    ifma->ifma_lladdr : NULL;
1778c9f98940SAlexander V. Chernikov 			error = rtsock_msg_buffer(RTM_NEWMADDR, &info, w, &len);
1779f2e5eb36SAlexander V. Chernikov 			if (error != 0)
1780f2e5eb36SAlexander V. Chernikov 				goto done;
178105b2efe0SBruce M Simpson 			if (w->w_req && w->w_tmem) {
17829b98ee2cSLuigi Rizzo 				struct ifma_msghdr *ifmam;
178305b2efe0SBruce M Simpson 
178405b2efe0SBruce M Simpson 				ifmam = (struct ifma_msghdr *)w->w_tmem;
178505b2efe0SBruce M Simpson 				ifmam->ifmam_index = ifma->ifma_ifp->if_index;
178605b2efe0SBruce M Simpson 				ifmam->ifmam_flags = 0;
178705b2efe0SBruce M Simpson 				ifmam->ifmam_addrs = info.rti_addrs;
178805b2efe0SBruce M Simpson 				error = SYSCTL_OUT(w->w_req, w->w_tmem, len);
1789fe0fc7efSChristian S.J. Peron 				if (error) {
1790137f91e8SJohn Baldwin 					IF_ADDR_RUNLOCK(ifp);
179105b2efe0SBruce M Simpson 					goto done;
179205b2efe0SBruce M Simpson 				}
179305b2efe0SBruce M Simpson 			}
179405b2efe0SBruce M Simpson 		}
1795137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
1796fe0fc7efSChristian S.J. Peron 	}
179705b2efe0SBruce M Simpson done:
17985c9fa630SHiroki Sato 	IFNET_RUNLOCK_NOSLEEP();
179905b2efe0SBruce M Simpson 	return (error);
180005b2efe0SBruce M Simpson }
180105b2efe0SBruce M Simpson 
180252041295SPoul-Henning Kamp static int
180382d9ae4eSPoul-Henning Kamp sysctl_rtsock(SYSCTL_HANDLER_ARGS)
1804df8bae1dSRodney W. Grimes {
180552041295SPoul-Henning Kamp 	int	*name = (int *)arg1;
180652041295SPoul-Henning Kamp 	u_int	namelen = arg2;
1807c2c2a7c1SBjoern A. Zeeb 	struct radix_node_head *rnh = NULL; /* silence compiler. */
1808fe0fc7efSChristian S.J. Peron 	int	i, lim, error = EINVAL;
18094825b1e0SHiroki Sato 	int	fib = 0;
1810df8bae1dSRodney W. Grimes 	u_char	af;
1811df8bae1dSRodney W. Grimes 	struct	walkarg w;
1812df8bae1dSRodney W. Grimes 
181352041295SPoul-Henning Kamp 	name ++;
181452041295SPoul-Henning Kamp 	namelen--;
181552041295SPoul-Henning Kamp 	if (req->newptr)
1816df8bae1dSRodney W. Grimes 		return (EPERM);
18174825b1e0SHiroki Sato 	if (name[1] == NET_RT_DUMP) {
18184825b1e0SHiroki Sato 		if (namelen == 3)
18194825b1e0SHiroki Sato 			fib = req->td->td_proc->p_fibnum;
18204825b1e0SHiroki Sato 		else if (namelen == 4)
18217d9b6df1SAlexander V. Chernikov 			fib = (name[3] == RT_ALL_FIBS) ?
18224825b1e0SHiroki Sato 			    req->td->td_proc->p_fibnum : name[3];
18234825b1e0SHiroki Sato 		else
18244825b1e0SHiroki Sato 			return ((namelen < 3) ? EISDIR : ENOTDIR);
18254825b1e0SHiroki Sato 		if (fib < 0 || fib >= rt_numfibs)
18264825b1e0SHiroki Sato 			return (EINVAL);
18274825b1e0SHiroki Sato 	} else if (namelen != 3)
1828f7a54d06SCrist J. Clark 		return ((namelen < 3) ? EISDIR : ENOTDIR);
1829df8bae1dSRodney W. Grimes 	af = name[0];
1830b2aaf46eSJeffrey Hsu 	if (af > AF_MAX)
1831b2aaf46eSJeffrey Hsu 		return (EINVAL);
18326b96f1afSLuigi Rizzo 	bzero(&w, sizeof(w));
1833df8bae1dSRodney W. Grimes 	w.w_op = name[1];
1834df8bae1dSRodney W. Grimes 	w.w_arg = name[2];
183552041295SPoul-Henning Kamp 	w.w_req = req;
1836df8bae1dSRodney W. Grimes 
1837fe0fc7efSChristian S.J. Peron 	error = sysctl_wire_old_buffer(req, 0);
1838fe0fc7efSChristian S.J. Peron 	if (error)
1839fe0fc7efSChristian S.J. Peron 		return (error);
1840f2e5eb36SAlexander V. Chernikov 
1841f2e5eb36SAlexander V. Chernikov 	/*
1842f2e5eb36SAlexander V. Chernikov 	 * Allocate reply buffer in advance.
1843f2e5eb36SAlexander V. Chernikov 	 * All rtsock messages has maximum length of u_short.
1844f2e5eb36SAlexander V. Chernikov 	 */
1845f2e5eb36SAlexander V. Chernikov 	w.w_tmemsize = 65536;
1846f2e5eb36SAlexander V. Chernikov 	w.w_tmem = malloc(w.w_tmemsize, M_TEMP, M_WAITOK);
1847f2e5eb36SAlexander V. Chernikov 
1848df8bae1dSRodney W. Grimes 	switch (w.w_op) {
1849df8bae1dSRodney W. Grimes 
1850df8bae1dSRodney W. Grimes 	case NET_RT_DUMP:
1851df8bae1dSRodney W. Grimes 	case NET_RT_FLAGS:
1852a8b76c8fSLuigi Rizzo 		if (af == 0) {			/* dump all tables */
1853a8b76c8fSLuigi Rizzo 			i = 1;
1854a8b76c8fSLuigi Rizzo 			lim = AF_MAX;
1855a8b76c8fSLuigi Rizzo 		} else				/* dump only one table */
1856a8b76c8fSLuigi Rizzo 			i = lim = af;
18578eca593cSQing Li 
18588eca593cSQing Li 		/*
18598eca593cSQing Li 		 * take care of llinfo entries, the caller must
18608eca593cSQing Li 		 * specify an AF
18618eca593cSQing Li 		 */
186214981d80SQing Li 		if (w.w_op == NET_RT_FLAGS &&
186382b334e8SQing Li 		    (w.w_arg == 0 || w.w_arg & RTF_LLINFO)) {
18648eca593cSQing Li 			if (af != 0)
18658eca593cSQing Li 				error = lltable_sysctl_dumparp(af, w.w_req);
18668eca593cSQing Li 			else
18678eca593cSQing Li 				error = EINVAL;
18688eca593cSQing Li 			break;
18698eca593cSQing Li 		}
18708eca593cSQing Li 		/*
18718eca593cSQing Li 		 * take care of routing entries
18728eca593cSQing Li 		 */
187320b0cdb7SBjoern A. Zeeb 		for (error = 0; error == 0 && i <= lim; i++) {
18744825b1e0SHiroki Sato 			rnh = rt_tables_get_rnh(fib, i);
1875c2c2a7c1SBjoern A. Zeeb 			if (rnh != NULL) {
1876c2508034SAlexander V. Chernikov 				RADIX_NODE_HEAD_RLOCK(rnh);
1877956b0b65SJeffrey Hsu 			    	error = rnh->rnh_walktree(rnh,
1878fe0fc7efSChristian S.J. Peron 				    sysctl_dumpentry, &w);
1879c2508034SAlexander V. Chernikov 				RADIX_NODE_HEAD_RUNLOCK(rnh);
1880a8b76c8fSLuigi Rizzo 			} else if (af != 0)
1881956b0b65SJeffrey Hsu 				error = EAFNOSUPPORT;
188220b0cdb7SBjoern A. Zeeb 		}
1883df8bae1dSRodney W. Grimes 		break;
1884df8bae1dSRodney W. Grimes 
1885df8bae1dSRodney W. Grimes 	case NET_RT_IFLIST:
18866d076ae8SBjoern A. Zeeb 	case NET_RT_IFLISTL:
1887df8bae1dSRodney W. Grimes 		error = sysctl_iflist(af, &w);
188805b2efe0SBruce M Simpson 		break;
188905b2efe0SBruce M Simpson 
189005b2efe0SBruce M Simpson 	case NET_RT_IFMALIST:
189105b2efe0SBruce M Simpson 		error = sysctl_ifmalist(af, &w);
189205b2efe0SBruce M Simpson 		break;
1893df8bae1dSRodney W. Grimes 	}
1894f2e5eb36SAlexander V. Chernikov 
1895f2e5eb36SAlexander V. Chernikov 	free(w.w_tmem, M_TEMP);
1896df8bae1dSRodney W. Grimes 	return (error);
1897df8bae1dSRodney W. Grimes }
1898df8bae1dSRodney W. Grimes 
18996472ac3dSEd Schouten static SYSCTL_NODE(_net, PF_ROUTE, routetable, CTLFLAG_RD, sysctl_rtsock, "");
190052041295SPoul-Henning Kamp 
1901df8bae1dSRodney W. Grimes /*
1902df8bae1dSRodney W. Grimes  * Definitions of protocols supported in the ROUTE domain.
1903df8bae1dSRodney W. Grimes  */
1904df8bae1dSRodney W. Grimes 
19055b1c0294SDavid E. O'Brien static struct domain routedomain;		/* or at least forward */
1906df8bae1dSRodney W. Grimes 
190752041295SPoul-Henning Kamp static struct protosw routesw[] = {
1908303989a2SRuslan Ermilov {
1909303989a2SRuslan Ermilov 	.pr_type =		SOCK_RAW,
1910303989a2SRuslan Ermilov 	.pr_domain =		&routedomain,
1911303989a2SRuslan Ermilov 	.pr_flags =		PR_ATOMIC|PR_ADDR,
1912303989a2SRuslan Ermilov 	.pr_output =		route_output,
1913303989a2SRuslan Ermilov 	.pr_ctlinput =		raw_ctlinput,
1914303989a2SRuslan Ermilov 	.pr_init =		raw_init,
1915303989a2SRuslan Ermilov 	.pr_usrreqs =		&route_usrreqs
1916df8bae1dSRodney W. Grimes }
1917df8bae1dSRodney W. Grimes };
1918df8bae1dSRodney W. Grimes 
1919303989a2SRuslan Ermilov static struct domain routedomain = {
1920303989a2SRuslan Ermilov 	.dom_family =		PF_ROUTE,
1921303989a2SRuslan Ermilov 	.dom_name =		 "route",
1922303989a2SRuslan Ermilov 	.dom_protosw =		routesw,
1923303989a2SRuslan Ermilov 	.dom_protoswNPROTOSW =	&routesw[sizeof(routesw)/sizeof(routesw[0])]
1924303989a2SRuslan Ermilov };
192578a82810SGarrett Wollman 
1926d0728d71SRobert Watson VNET_DOMAIN_SET(route);
1927