xref: /freebsd/sys/net/rtsock.c (revision e6485f73de7d0375c1f64553de05adcae9da62b3)
1c398230bSWarner Losh /*-
2df8bae1dSRodney W. Grimes  * Copyright (c) 1988, 1991, 1993
3df8bae1dSRodney W. Grimes  *	The Regents of the University of California.  All rights reserved.
4df8bae1dSRodney W. Grimes  *
5df8bae1dSRodney W. Grimes  * Redistribution and use in source and binary forms, with or without
6df8bae1dSRodney W. Grimes  * modification, are permitted provided that the following conditions
7df8bae1dSRodney W. Grimes  * are met:
8df8bae1dSRodney W. Grimes  * 1. Redistributions of source code must retain the above copyright
9df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer.
10df8bae1dSRodney W. Grimes  * 2. Redistributions in binary form must reproduce the above copyright
11df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer in the
12df8bae1dSRodney W. Grimes  *    documentation and/or other materials provided with the distribution.
13df8bae1dSRodney W. Grimes  * 4. Neither the name of the University nor the names of its contributors
14df8bae1dSRodney W. Grimes  *    may be used to endorse or promote products derived from this software
15df8bae1dSRodney W. Grimes  *    without specific prior written permission.
16df8bae1dSRodney W. Grimes  *
17df8bae1dSRodney W. Grimes  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
18df8bae1dSRodney W. Grimes  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19df8bae1dSRodney W. Grimes  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20df8bae1dSRodney W. Grimes  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
21df8bae1dSRodney W. Grimes  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22df8bae1dSRodney W. Grimes  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23df8bae1dSRodney W. Grimes  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24df8bae1dSRodney W. Grimes  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25df8bae1dSRodney W. Grimes  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26df8bae1dSRodney W. Grimes  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27df8bae1dSRodney W. Grimes  * SUCH DAMAGE.
28df8bae1dSRodney W. Grimes  *
2928070a0eSRuslan Ermilov  *	@(#)rtsock.c	8.7 (Berkeley) 10/12/95
30c3aac50fSPeter Wemm  * $FreeBSD$
31df8bae1dSRodney W. Grimes  */
32427a928aSKonstantin Belousov #include "opt_compat.h"
33e440aed9SQing Li #include "opt_mpath.h"
34413628a7SBjoern A. Zeeb #include "opt_inet.h"
35413628a7SBjoern A. Zeeb #include "opt_inet6.h"
36e440aed9SQing Li 
37df8bae1dSRodney W. Grimes #include <sys/param.h>
38960ed29cSSeigo Tanimura #include <sys/jail.h>
39413628a7SBjoern A. Zeeb #include <sys/kernel.h>
40d0728d71SRobert Watson #include <sys/domain.h>
41609ff41fSWarner Losh #include <sys/lock.h>
424d1d4912SBruce Evans #include <sys/malloc.h>
43df8bae1dSRodney W. Grimes #include <sys/mbuf.h>
44acd3428bSRobert Watson #include <sys/priv.h>
45960ed29cSSeigo Tanimura #include <sys/proc.h>
46960ed29cSSeigo Tanimura #include <sys/protosw.h>
473120b9d4SKip Macy #include <sys/rwlock.h>
48960ed29cSSeigo Tanimura #include <sys/signalvar.h>
49df8bae1dSRodney W. Grimes #include <sys/socket.h>
50df8bae1dSRodney W. Grimes #include <sys/socketvar.h>
51960ed29cSSeigo Tanimura #include <sys/sysctl.h>
52960ed29cSSeigo Tanimura #include <sys/systm.h>
53df8bae1dSRodney W. Grimes 
54df8bae1dSRodney W. Grimes #include <net/if.h>
5576039bc8SGleb Smirnoff #include <net/if_var.h>
568eca593cSQing Li #include <net/if_dl.h>
576e6b3f7cSQing Li #include <net/if_llatbl.h>
580ed6142bSQing Li #include <net/if_types.h>
59d989c7b3SRobert Watson #include <net/netisr.h>
60df8bae1dSRodney W. Grimes #include <net/raw_cb.h>
61960ed29cSSeigo Tanimura #include <net/route.h>
624b79449eSBjoern A. Zeeb #include <net/vnet.h>
63df8bae1dSRodney W. Grimes 
645a59cefcSBosko Milekic #include <netinet/in.h>
65c7ab6602SQing Li #include <netinet/if_ether.h>
6608b68b0eSGleb Smirnoff #include <netinet/ip_carp.h>
67413628a7SBjoern A. Zeeb #ifdef INET6
680bebb544SHiroki Sato #include <netinet6/ip6_var.h>
69413628a7SBjoern A. Zeeb #include <netinet6/scope6_var.h>
70413628a7SBjoern A. Zeeb #endif
715a59cefcSBosko Milekic 
72427a928aSKonstantin Belousov #ifdef COMPAT_FREEBSD32
73427a928aSKonstantin Belousov #include <sys/mount.h>
74427a928aSKonstantin Belousov #include <compat/freebsd32/freebsd32.h>
75427a928aSKonstantin Belousov 
76427a928aSKonstantin Belousov struct if_msghdr32 {
77427a928aSKonstantin Belousov 	uint16_t ifm_msglen;
78427a928aSKonstantin Belousov 	uint8_t	ifm_version;
79427a928aSKonstantin Belousov 	uint8_t	ifm_type;
80427a928aSKonstantin Belousov 	int32_t	ifm_addrs;
81427a928aSKonstantin Belousov 	int32_t	ifm_flags;
82427a928aSKonstantin Belousov 	uint16_t ifm_index;
83b245f96cSGleb Smirnoff 	struct	if_data ifm_data;
84427a928aSKonstantin Belousov };
856d076ae8SBjoern A. Zeeb 
866d076ae8SBjoern A. Zeeb struct if_msghdrl32 {
876d076ae8SBjoern A. Zeeb 	uint16_t ifm_msglen;
886d076ae8SBjoern A. Zeeb 	uint8_t	ifm_version;
896d076ae8SBjoern A. Zeeb 	uint8_t	ifm_type;
906d076ae8SBjoern A. Zeeb 	int32_t	ifm_addrs;
916d076ae8SBjoern A. Zeeb 	int32_t	ifm_flags;
926d076ae8SBjoern A. Zeeb 	uint16_t ifm_index;
936d076ae8SBjoern A. Zeeb 	uint16_t _ifm_spare1;
946d076ae8SBjoern A. Zeeb 	uint16_t ifm_len;
956d076ae8SBjoern A. Zeeb 	uint16_t ifm_data_off;
96b245f96cSGleb Smirnoff 	struct	if_data ifm_data;
976d076ae8SBjoern A. Zeeb };
986d076ae8SBjoern A. Zeeb 
996d076ae8SBjoern A. Zeeb struct ifa_msghdrl32 {
1006d076ae8SBjoern A. Zeeb 	uint16_t ifam_msglen;
1016d076ae8SBjoern A. Zeeb 	uint8_t	ifam_version;
1026d076ae8SBjoern A. Zeeb 	uint8_t	ifam_type;
1036d076ae8SBjoern A. Zeeb 	int32_t	ifam_addrs;
1046d076ae8SBjoern A. Zeeb 	int32_t	ifam_flags;
1056d076ae8SBjoern A. Zeeb 	uint16_t ifam_index;
1066d076ae8SBjoern A. Zeeb 	uint16_t _ifam_spare1;
1076d076ae8SBjoern A. Zeeb 	uint16_t ifam_len;
1086d076ae8SBjoern A. Zeeb 	uint16_t ifam_data_off;
1096d076ae8SBjoern A. Zeeb 	int32_t	ifam_metric;
110b245f96cSGleb Smirnoff 	struct	if_data ifam_data;
1116d076ae8SBjoern A. Zeeb };
1126d076ae8SBjoern A. Zeeb #endif /* COMPAT_FREEBSD32 */
113427a928aSKonstantin Belousov 
114a1c995b6SPoul-Henning Kamp MALLOC_DEFINE(M_RTABLE, "routetbl", "routing tables");
115a1c995b6SPoul-Henning Kamp 
116becc44d7SSam Leffler /* NB: these are not modified */
11752041295SPoul-Henning Kamp static struct	sockaddr route_src = { 2, PF_ROUTE, };
118076d0761SJulian Elischer static struct	sockaddr sa_zero   = { sizeof(sa_zero), AF_INET, };
119becc44d7SSam Leffler 
12008b68b0eSGleb Smirnoff /* These are external hooks for CARP. */
12108b68b0eSGleb Smirnoff int	(*carp_get_vhid_p)(struct ifaddr *);
12208b68b0eSGleb Smirnoff 
123528737fdSBjoern A. Zeeb /*
124528737fdSBjoern A. Zeeb  * Used by rtsock/raw_input callback code to decide whether to filter the update
125528737fdSBjoern A. Zeeb  * notification to a socket bound to a particular FIB.
126528737fdSBjoern A. Zeeb  */
127528737fdSBjoern A. Zeeb #define	RTS_FILTER_FIB	M_PROTO8
128528737fdSBjoern A. Zeeb 
129c5d4eab6SMarko Zec typedef struct {
13018aee723SPeter Pentchev 	int	ip_count;	/* attached w/ AF_INET */
131becc44d7SSam Leffler 	int	ip6_count;	/* attached w/ AF_INET6 */
132becc44d7SSam Leffler 	int	any_count;	/* total attached */
133c5d4eab6SMarko Zec } route_cb_t;
134c5d4eab6SMarko Zec static VNET_DEFINE(route_cb_t, route_cb);
135c5d4eab6SMarko Zec #define	V_route_cb VNET(route_cb)
136df8bae1dSRodney W. Grimes 
137aea8b30fSSam Leffler struct mtx rtsock_mtx;
138aea8b30fSSam Leffler MTX_SYSINIT(rtsock, &rtsock_mtx, "rtsock route_cb lock", MTX_DEF);
139aea8b30fSSam Leffler 
140aea8b30fSSam Leffler #define	RTSOCK_LOCK()	mtx_lock(&rtsock_mtx)
141aea8b30fSSam Leffler #define	RTSOCK_UNLOCK()	mtx_unlock(&rtsock_mtx)
142aea8b30fSSam Leffler #define	RTSOCK_LOCK_ASSERT()	mtx_assert(&rtsock_mtx, MA_OWNED)
143aea8b30fSSam Leffler 
1446472ac3dSEd Schouten static SYSCTL_NODE(_net, OID_AUTO, route, CTLFLAG_RD, 0, "");
145190a4c94SRobert Watson 
146df8bae1dSRodney W. Grimes struct walkarg {
14752041295SPoul-Henning Kamp 	int	w_tmemsize;
14852041295SPoul-Henning Kamp 	int	w_op, w_arg;
14952041295SPoul-Henning Kamp 	caddr_t	w_tmem;
15052041295SPoul-Henning Kamp 	struct sysctl_req *w_req;
151df8bae1dSRodney W. Grimes };
152df8bae1dSRodney W. Grimes 
153d989c7b3SRobert Watson static void	rts_input(struct mbuf *m);
1546db47af4SAlexander V. Chernikov static struct mbuf *rtsock_msg_mbuf(int type, struct rt_addrinfo *rtinfo);
155f2e5eb36SAlexander V. Chernikov static int	rtsock_msg_buffer(int type, struct rt_addrinfo *rtinfo,
156f2e5eb36SAlexander V. Chernikov 			struct walkarg *w, int *plen);
1575dfc91d7SLuigi Rizzo static int	rt_xaddrs(caddr_t cp, caddr_t cplim,
1585dfc91d7SLuigi Rizzo 			struct rt_addrinfo *rtinfo);
159929ddbbbSAlfred Perlstein static int	sysctl_dumpentry(struct radix_node *rn, void *vw);
160929ddbbbSAlfred Perlstein static int	sysctl_iflist(int af, struct walkarg *w);
16105b2efe0SBruce M Simpson static int	sysctl_ifmalist(int af, struct walkarg *w);
16273d76e77SKevin Lo static int	route_output(struct mbuf *m, struct socket *so, ...);
163e3a7aa6fSGleb Smirnoff static void	rt_getmetrics(const struct rtentry *rt, struct rt_metrics *out);
1643ca1a2d6SMax Laier static void	rt_dispatch(struct mbuf *, sa_family_t);
1653deb3649SAlexander V. Chernikov static struct sockaddr	*rtsock_fix_netmask(struct sockaddr *dst,
1663deb3649SAlexander V. Chernikov 			struct sockaddr *smask, struct sockaddr_storage *dmask);
167df8bae1dSRodney W. Grimes 
168d4b5cae4SRobert Watson static struct netisr_handler rtsock_nh = {
169d4b5cae4SRobert Watson 	.nh_name = "rtsock",
170d4b5cae4SRobert Watson 	.nh_handler = rts_input,
171d4b5cae4SRobert Watson 	.nh_proto = NETISR_ROUTE,
172d4b5cae4SRobert Watson 	.nh_policy = NETISR_POLICY_SOURCE,
173d4b5cae4SRobert Watson };
174d4b5cae4SRobert Watson 
175d4b5cae4SRobert Watson static int
176d4b5cae4SRobert Watson sysctl_route_netisr_maxqlen(SYSCTL_HANDLER_ARGS)
177d4b5cae4SRobert Watson {
178d4b5cae4SRobert Watson 	int error, qlimit;
179d4b5cae4SRobert Watson 
180d4b5cae4SRobert Watson 	netisr_getqlimit(&rtsock_nh, &qlimit);
181d4b5cae4SRobert Watson 	error = sysctl_handle_int(oidp, &qlimit, 0, req);
182d4b5cae4SRobert Watson         if (error || !req->newptr)
183d4b5cae4SRobert Watson                 return (error);
184d4b5cae4SRobert Watson 	if (qlimit < 1)
185d4b5cae4SRobert Watson 		return (EINVAL);
186d4b5cae4SRobert Watson 	return (netisr_setqlimit(&rtsock_nh, qlimit));
187d4b5cae4SRobert Watson }
188d4b5cae4SRobert Watson SYSCTL_PROC(_net_route, OID_AUTO, netisr_maxqlen, CTLTYPE_INT|CTLFLAG_RW,
189d4b5cae4SRobert Watson     0, 0, sysctl_route_netisr_maxqlen, "I",
190d4b5cae4SRobert Watson     "maximum routing socket dispatch queue length");
191d4b5cae4SRobert Watson 
192d989c7b3SRobert Watson static void
193d989c7b3SRobert Watson rts_init(void)
194d989c7b3SRobert Watson {
195b062951aSRobert Watson 	int tmp;
196d989c7b3SRobert Watson 
197b062951aSRobert Watson 	if (TUNABLE_INT_FETCH("net.route.netisr_maxqlen", &tmp))
198d4b5cae4SRobert Watson 		rtsock_nh.nh_qlimit = tmp;
199d4b5cae4SRobert Watson 	netisr_register(&rtsock_nh);
200d989c7b3SRobert Watson }
201237fdd78SRobert Watson SYSINIT(rtsock, SI_SUB_PROTO_DOMAIN, SI_ORDER_THIRD, rts_init, 0);
202d989c7b3SRobert Watson 
203528737fdSBjoern A. Zeeb static int
204528737fdSBjoern A. Zeeb raw_input_rts_cb(struct mbuf *m, struct sockproto *proto, struct sockaddr *src,
205528737fdSBjoern A. Zeeb     struct rawcb *rp)
206528737fdSBjoern A. Zeeb {
207528737fdSBjoern A. Zeeb 	int fibnum;
208528737fdSBjoern A. Zeeb 
209528737fdSBjoern A. Zeeb 	KASSERT(m != NULL, ("%s: m is NULL", __func__));
210528737fdSBjoern A. Zeeb 	KASSERT(proto != NULL, ("%s: proto is NULL", __func__));
211528737fdSBjoern A. Zeeb 	KASSERT(rp != NULL, ("%s: rp is NULL", __func__));
212528737fdSBjoern A. Zeeb 
213528737fdSBjoern A. Zeeb 	/* No filtering requested. */
214528737fdSBjoern A. Zeeb 	if ((m->m_flags & RTS_FILTER_FIB) == 0)
215528737fdSBjoern A. Zeeb 		return (0);
216528737fdSBjoern A. Zeeb 
217528737fdSBjoern A. Zeeb 	/* Check if it is a rts and the fib matches the one of the socket. */
218528737fdSBjoern A. Zeeb 	fibnum = M_GETFIB(m);
219528737fdSBjoern A. Zeeb 	if (proto->sp_family != PF_ROUTE ||
220528737fdSBjoern A. Zeeb 	    rp->rcb_socket == NULL ||
221528737fdSBjoern A. Zeeb 	    rp->rcb_socket->so_fibnum == fibnum)
222528737fdSBjoern A. Zeeb 		return (0);
223528737fdSBjoern A. Zeeb 
224528737fdSBjoern A. Zeeb 	/* Filtering requested and no match, the socket shall be skipped. */
225528737fdSBjoern A. Zeeb 	return (1);
226528737fdSBjoern A. Zeeb }
227528737fdSBjoern A. Zeeb 
228d989c7b3SRobert Watson static void
229d989c7b3SRobert Watson rts_input(struct mbuf *m)
230d989c7b3SRobert Watson {
231d989c7b3SRobert Watson 	struct sockproto route_proto;
232d989c7b3SRobert Watson 	unsigned short *family;
233d989c7b3SRobert Watson 	struct m_tag *tag;
234d989c7b3SRobert Watson 
235d989c7b3SRobert Watson 	route_proto.sp_family = PF_ROUTE;
236d989c7b3SRobert Watson 	tag = m_tag_find(m, PACKET_TAG_RTSOCKFAM, NULL);
237d989c7b3SRobert Watson 	if (tag != NULL) {
238d989c7b3SRobert Watson 		family = (unsigned short *)(tag + 1);
239d989c7b3SRobert Watson 		route_proto.sp_protocol = *family;
240d989c7b3SRobert Watson 		m_tag_delete(m, tag);
241d989c7b3SRobert Watson 	} else
242d989c7b3SRobert Watson 		route_proto.sp_protocol = 0;
243d989c7b3SRobert Watson 
244528737fdSBjoern A. Zeeb 	raw_input_ext(m, &route_proto, &route_src, raw_input_rts_cb);
245d989c7b3SRobert Watson }
246d989c7b3SRobert Watson 
247a29f300eSGarrett Wollman /*
248a29f300eSGarrett Wollman  * It really doesn't make any sense at all for this code to share much
249a29f300eSGarrett Wollman  * with raw_usrreq.c, since its functionality is so restricted.  XXX
250a29f300eSGarrett Wollman  */
251ac45e92fSRobert Watson static void
252a29f300eSGarrett Wollman rts_abort(struct socket *so)
253df8bae1dSRodney W. Grimes {
2547e994955SRobert Watson 
255ac45e92fSRobert Watson 	raw_usrreqs.pru_abort(so);
256df8bae1dSRodney W. Grimes }
257a29f300eSGarrett Wollman 
258a152f8a3SRobert Watson static void
259a152f8a3SRobert Watson rts_close(struct socket *so)
260a152f8a3SRobert Watson {
261a152f8a3SRobert Watson 
262a152f8a3SRobert Watson 	raw_usrreqs.pru_close(so);
263a152f8a3SRobert Watson }
264a152f8a3SRobert Watson 
265a29f300eSGarrett Wollman /* pru_accept is EOPNOTSUPP */
266a29f300eSGarrett Wollman 
267a29f300eSGarrett Wollman static int
268b40ce416SJulian Elischer rts_attach(struct socket *so, int proto, struct thread *td)
269a29f300eSGarrett Wollman {
270a29f300eSGarrett Wollman 	struct rawcb *rp;
271c9b652e3SAndre Oppermann 	int error;
272a29f300eSGarrett Wollman 
273bc725eafSRobert Watson 	KASSERT(so->so_pcb == NULL, ("rts_attach: so_pcb != NULL"));
274bc725eafSRobert Watson 
2757cc0979fSDavid Malone 	/* XXX */
2761ede983cSDag-Erling Smørgrav 	rp = malloc(sizeof *rp, M_PCB, M_WAITOK | M_ZERO);
2775dfc91d7SLuigi Rizzo 	if (rp == NULL)
278a29f300eSGarrett Wollman 		return ENOBUFS;
279a29f300eSGarrett Wollman 
280a29f300eSGarrett Wollman 	so->so_pcb = (caddr_t)rp;
2818b07e49aSJulian Elischer 	so->so_fibnum = td->td_proc->p_fibnum;
282162c0b2eSRuslan Ermilov 	error = raw_attach(so, proto);
283a29f300eSGarrett Wollman 	rp = sotorawcb(so);
284a29f300eSGarrett Wollman 	if (error) {
2857ba271aeSJonathan Chen 		so->so_pcb = NULL;
286a29f300eSGarrett Wollman 		free(rp, M_PCB);
287a29f300eSGarrett Wollman 		return error;
288a29f300eSGarrett Wollman 	}
289aea8b30fSSam Leffler 	RTSOCK_LOCK();
290a29f300eSGarrett Wollman 	switch(rp->rcb_proto.sp_protocol) {
291a29f300eSGarrett Wollman 	case AF_INET:
292c5d4eab6SMarko Zec 		V_route_cb.ip_count++;
293a29f300eSGarrett Wollman 		break;
294899ce4f4SYoshinobu Inoue 	case AF_INET6:
295c5d4eab6SMarko Zec 		V_route_cb.ip6_count++;
296899ce4f4SYoshinobu Inoue 		break;
297a29f300eSGarrett Wollman 	}
298c5d4eab6SMarko Zec 	V_route_cb.any_count++;
299aea8b30fSSam Leffler 	RTSOCK_UNLOCK();
30003e49181SSeigo Tanimura 	soisconnected(so);
301df8bae1dSRodney W. Grimes 	so->so_options |= SO_USELOOPBACK;
302a29f300eSGarrett Wollman 	return 0;
303df8bae1dSRodney W. Grimes }
304df8bae1dSRodney W. Grimes 
305a29f300eSGarrett Wollman static int
306b40ce416SJulian Elischer rts_bind(struct socket *so, struct sockaddr *nam, struct thread *td)
307a29f300eSGarrett Wollman {
3087e994955SRobert Watson 
3097e994955SRobert Watson 	return (raw_usrreqs.pru_bind(so, nam, td)); /* xxx just EINVAL */
310a29f300eSGarrett Wollman }
311a29f300eSGarrett Wollman 
312a29f300eSGarrett Wollman static int
313b40ce416SJulian Elischer rts_connect(struct socket *so, struct sockaddr *nam, struct thread *td)
314a29f300eSGarrett Wollman {
3157e994955SRobert Watson 
3167e994955SRobert Watson 	return (raw_usrreqs.pru_connect(so, nam, td)); /* XXX just EINVAL */
317a29f300eSGarrett Wollman }
318a29f300eSGarrett Wollman 
319a29f300eSGarrett Wollman /* pru_connect2 is EOPNOTSUPP */
320a29f300eSGarrett Wollman /* pru_control is EOPNOTSUPP */
321a29f300eSGarrett Wollman 
322bc725eafSRobert Watson static void
323a29f300eSGarrett Wollman rts_detach(struct socket *so)
324a29f300eSGarrett Wollman {
325a29f300eSGarrett Wollman 	struct rawcb *rp = sotorawcb(so);
326a29f300eSGarrett Wollman 
327bc725eafSRobert Watson 	KASSERT(rp != NULL, ("rts_detach: rp == NULL"));
328bc725eafSRobert Watson 
329aea8b30fSSam Leffler 	RTSOCK_LOCK();
330a29f300eSGarrett Wollman 	switch(rp->rcb_proto.sp_protocol) {
331a29f300eSGarrett Wollman 	case AF_INET:
332c5d4eab6SMarko Zec 		V_route_cb.ip_count--;
333a29f300eSGarrett Wollman 		break;
334899ce4f4SYoshinobu Inoue 	case AF_INET6:
335c5d4eab6SMarko Zec 		V_route_cb.ip6_count--;
336899ce4f4SYoshinobu Inoue 		break;
337a29f300eSGarrett Wollman 	}
338c5d4eab6SMarko Zec 	V_route_cb.any_count--;
339aea8b30fSSam Leffler 	RTSOCK_UNLOCK();
340bc725eafSRobert Watson 	raw_usrreqs.pru_detach(so);
341a29f300eSGarrett Wollman }
342a29f300eSGarrett Wollman 
343a29f300eSGarrett Wollman static int
344a29f300eSGarrett Wollman rts_disconnect(struct socket *so)
345a29f300eSGarrett Wollman {
3467e994955SRobert Watson 
3477e994955SRobert Watson 	return (raw_usrreqs.pru_disconnect(so));
348a29f300eSGarrett Wollman }
349a29f300eSGarrett Wollman 
350a29f300eSGarrett Wollman /* pru_listen is EOPNOTSUPP */
351a29f300eSGarrett Wollman 
352a29f300eSGarrett Wollman static int
35357bf258eSGarrett Wollman rts_peeraddr(struct socket *so, struct sockaddr **nam)
354a29f300eSGarrett Wollman {
3557e994955SRobert Watson 
3567e994955SRobert Watson 	return (raw_usrreqs.pru_peeraddr(so, nam));
357a29f300eSGarrett Wollman }
358a29f300eSGarrett Wollman 
359a29f300eSGarrett Wollman /* pru_rcvd is EOPNOTSUPP */
360a29f300eSGarrett Wollman /* pru_rcvoob is EOPNOTSUPP */
361a29f300eSGarrett Wollman 
362a29f300eSGarrett Wollman static int
36357bf258eSGarrett Wollman rts_send(struct socket *so, int flags, struct mbuf *m, struct sockaddr *nam,
364b40ce416SJulian Elischer 	 struct mbuf *control, struct thread *td)
365a29f300eSGarrett Wollman {
3667e994955SRobert Watson 
3677e994955SRobert Watson 	return (raw_usrreqs.pru_send(so, flags, m, nam, control, td));
368a29f300eSGarrett Wollman }
369a29f300eSGarrett Wollman 
370a29f300eSGarrett Wollman /* pru_sense is null */
371a29f300eSGarrett Wollman 
372a29f300eSGarrett Wollman static int
373a29f300eSGarrett Wollman rts_shutdown(struct socket *so)
374a29f300eSGarrett Wollman {
3757e994955SRobert Watson 
3767e994955SRobert Watson 	return (raw_usrreqs.pru_shutdown(so));
377a29f300eSGarrett Wollman }
378a29f300eSGarrett Wollman 
379a29f300eSGarrett Wollman static int
38057bf258eSGarrett Wollman rts_sockaddr(struct socket *so, struct sockaddr **nam)
381a29f300eSGarrett Wollman {
3827e994955SRobert Watson 
3837e994955SRobert Watson 	return (raw_usrreqs.pru_sockaddr(so, nam));
384a29f300eSGarrett Wollman }
385a29f300eSGarrett Wollman 
386a29f300eSGarrett Wollman static struct pr_usrreqs route_usrreqs = {
387756d52a1SPoul-Henning Kamp 	.pru_abort =		rts_abort,
388756d52a1SPoul-Henning Kamp 	.pru_attach =		rts_attach,
389756d52a1SPoul-Henning Kamp 	.pru_bind =		rts_bind,
390756d52a1SPoul-Henning Kamp 	.pru_connect =		rts_connect,
391756d52a1SPoul-Henning Kamp 	.pru_detach =		rts_detach,
392756d52a1SPoul-Henning Kamp 	.pru_disconnect =	rts_disconnect,
393756d52a1SPoul-Henning Kamp 	.pru_peeraddr =		rts_peeraddr,
394756d52a1SPoul-Henning Kamp 	.pru_send =		rts_send,
395756d52a1SPoul-Henning Kamp 	.pru_shutdown =		rts_shutdown,
396756d52a1SPoul-Henning Kamp 	.pru_sockaddr =		rts_sockaddr,
397a152f8a3SRobert Watson 	.pru_close =		rts_close,
398a29f300eSGarrett Wollman };
399a29f300eSGarrett Wollman 
400413628a7SBjoern A. Zeeb #ifndef _SOCKADDR_UNION_DEFINED
401413628a7SBjoern A. Zeeb #define	_SOCKADDR_UNION_DEFINED
402413628a7SBjoern A. Zeeb /*
403413628a7SBjoern A. Zeeb  * The union of all possible address formats we handle.
404413628a7SBjoern A. Zeeb  */
405413628a7SBjoern A. Zeeb union sockaddr_union {
406413628a7SBjoern A. Zeeb 	struct sockaddr		sa;
407413628a7SBjoern A. Zeeb 	struct sockaddr_in	sin;
408413628a7SBjoern A. Zeeb 	struct sockaddr_in6	sin6;
409413628a7SBjoern A. Zeeb };
410413628a7SBjoern A. Zeeb #endif /* _SOCKADDR_UNION_DEFINED */
411413628a7SBjoern A. Zeeb 
412413628a7SBjoern A. Zeeb static int
413413628a7SBjoern A. Zeeb rtm_get_jailed(struct rt_addrinfo *info, struct ifnet *ifp,
414413628a7SBjoern A. Zeeb     struct rtentry *rt, union sockaddr_union *saun, struct ucred *cred)
415413628a7SBjoern A. Zeeb {
416413628a7SBjoern A. Zeeb 
4179c79d243SJamie Gritton 	/* First, see if the returned address is part of the jail. */
4189c79d243SJamie Gritton 	if (prison_if(cred, rt->rt_ifa->ifa_addr) == 0) {
4199c79d243SJamie Gritton 		info->rti_info[RTAX_IFA] = rt->rt_ifa->ifa_addr;
4209c79d243SJamie Gritton 		return (0);
4219c79d243SJamie Gritton 	}
4229c79d243SJamie Gritton 
423413628a7SBjoern A. Zeeb 	switch (info->rti_info[RTAX_DST]->sa_family) {
424413628a7SBjoern A. Zeeb #ifdef INET
425413628a7SBjoern A. Zeeb 	case AF_INET:
426413628a7SBjoern A. Zeeb 	{
427413628a7SBjoern A. Zeeb 		struct in_addr ia;
428413628a7SBjoern A. Zeeb 		struct ifaddr *ifa;
429413628a7SBjoern A. Zeeb 		int found;
430413628a7SBjoern A. Zeeb 
431413628a7SBjoern A. Zeeb 		found = 0;
432413628a7SBjoern A. Zeeb 		/*
4339c79d243SJamie Gritton 		 * Try to find an address on the given outgoing interface
4349c79d243SJamie Gritton 		 * that belongs to the jail.
435413628a7SBjoern A. Zeeb 		 */
436137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
437413628a7SBjoern A. Zeeb 		TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) {
438413628a7SBjoern A. Zeeb 			struct sockaddr *sa;
439413628a7SBjoern A. Zeeb 			sa = ifa->ifa_addr;
440413628a7SBjoern A. Zeeb 			if (sa->sa_family != AF_INET)
441413628a7SBjoern A. Zeeb 				continue;
442413628a7SBjoern A. Zeeb 			ia = ((struct sockaddr_in *)sa)->sin_addr;
443b89e82ddSJamie Gritton 			if (prison_check_ip4(cred, &ia) == 0) {
444413628a7SBjoern A. Zeeb 				found = 1;
445413628a7SBjoern A. Zeeb 				break;
446413628a7SBjoern A. Zeeb 			}
447413628a7SBjoern A. Zeeb 		}
448137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
449413628a7SBjoern A. Zeeb 		if (!found) {
450413628a7SBjoern A. Zeeb 			/*
4519c79d243SJamie Gritton 			 * As a last resort return the 'default' jail address.
452413628a7SBjoern A. Zeeb 			 */
4530304c731SJamie Gritton 			ia = ((struct sockaddr_in *)rt->rt_ifa->ifa_addr)->
4540304c731SJamie Gritton 			    sin_addr;
4551cecba0fSBjoern A. Zeeb 			if (prison_get_ip4(cred, &ia) != 0)
456413628a7SBjoern A. Zeeb 				return (ESRCH);
457413628a7SBjoern A. Zeeb 		}
458413628a7SBjoern A. Zeeb 		bzero(&saun->sin, sizeof(struct sockaddr_in));
459413628a7SBjoern A. Zeeb 		saun->sin.sin_len = sizeof(struct sockaddr_in);
460413628a7SBjoern A. Zeeb 		saun->sin.sin_family = AF_INET;
461413628a7SBjoern A. Zeeb 		saun->sin.sin_addr.s_addr = ia.s_addr;
4629c79d243SJamie Gritton 		info->rti_info[RTAX_IFA] = (struct sockaddr *)&saun->sin;
463413628a7SBjoern A. Zeeb 		break;
464413628a7SBjoern A. Zeeb 	}
465413628a7SBjoern A. Zeeb #endif
466413628a7SBjoern A. Zeeb #ifdef INET6
467413628a7SBjoern A. Zeeb 	case AF_INET6:
468413628a7SBjoern A. Zeeb 	{
469413628a7SBjoern A. Zeeb 		struct in6_addr ia6;
470413628a7SBjoern A. Zeeb 		struct ifaddr *ifa;
471413628a7SBjoern A. Zeeb 		int found;
472413628a7SBjoern A. Zeeb 
473413628a7SBjoern A. Zeeb 		found = 0;
474413628a7SBjoern A. Zeeb 		/*
4759c79d243SJamie Gritton 		 * Try to find an address on the given outgoing interface
4769c79d243SJamie Gritton 		 * that belongs to the jail.
477413628a7SBjoern A. Zeeb 		 */
478137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
479413628a7SBjoern A. Zeeb 		TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) {
480413628a7SBjoern A. Zeeb 			struct sockaddr *sa;
481413628a7SBjoern A. Zeeb 			sa = ifa->ifa_addr;
482413628a7SBjoern A. Zeeb 			if (sa->sa_family != AF_INET6)
483413628a7SBjoern A. Zeeb 				continue;
484413628a7SBjoern A. Zeeb 			bcopy(&((struct sockaddr_in6 *)sa)->sin6_addr,
485413628a7SBjoern A. Zeeb 			    &ia6, sizeof(struct in6_addr));
486b89e82ddSJamie Gritton 			if (prison_check_ip6(cred, &ia6) == 0) {
487413628a7SBjoern A. Zeeb 				found = 1;
488413628a7SBjoern A. Zeeb 				break;
489413628a7SBjoern A. Zeeb 			}
490413628a7SBjoern A. Zeeb 		}
491137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
492413628a7SBjoern A. Zeeb 		if (!found) {
493413628a7SBjoern A. Zeeb 			/*
4949c79d243SJamie Gritton 			 * As a last resort return the 'default' jail address.
495413628a7SBjoern A. Zeeb 			 */
4960304c731SJamie Gritton 			ia6 = ((struct sockaddr_in6 *)rt->rt_ifa->ifa_addr)->
4970304c731SJamie Gritton 			    sin6_addr;
4981cecba0fSBjoern A. Zeeb 			if (prison_get_ip6(cred, &ia6) != 0)
499413628a7SBjoern A. Zeeb 				return (ESRCH);
500413628a7SBjoern A. Zeeb 		}
501413628a7SBjoern A. Zeeb 		bzero(&saun->sin6, sizeof(struct sockaddr_in6));
502413628a7SBjoern A. Zeeb 		saun->sin6.sin6_len = sizeof(struct sockaddr_in6);
503413628a7SBjoern A. Zeeb 		saun->sin6.sin6_family = AF_INET6;
5049c79d243SJamie Gritton 		bcopy(&ia6, &saun->sin6.sin6_addr, sizeof(struct in6_addr));
505413628a7SBjoern A. Zeeb 		if (sa6_recoverscope(&saun->sin6) != 0)
506413628a7SBjoern A. Zeeb 			return (ESRCH);
5079c79d243SJamie Gritton 		info->rti_info[RTAX_IFA] = (struct sockaddr *)&saun->sin6;
508413628a7SBjoern A. Zeeb 		break;
509413628a7SBjoern A. Zeeb 	}
510413628a7SBjoern A. Zeeb #endif
511413628a7SBjoern A. Zeeb 	default:
512413628a7SBjoern A. Zeeb 		return (ESRCH);
513413628a7SBjoern A. Zeeb 	}
514413628a7SBjoern A. Zeeb 	return (0);
515413628a7SBjoern A. Zeeb }
516413628a7SBjoern A. Zeeb 
517df8bae1dSRodney W. Grimes /*ARGSUSED*/
51852041295SPoul-Henning Kamp static int
51973d76e77SKevin Lo route_output(struct mbuf *m, struct socket *so, ...)
520df8bae1dSRodney W. Grimes {
5215dfc91d7SLuigi Rizzo 	struct rt_msghdr *rtm = NULL;
5225dfc91d7SLuigi Rizzo 	struct rtentry *rt = NULL;
52378a82810SGarrett Wollman 	struct radix_node_head *rnh;
524df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
5250bebb544SHiroki Sato 	struct sockaddr_storage ss;
5263deb3649SAlexander V. Chernikov #ifdef INET6
5276bbfef90SHiroki Sato 	struct sockaddr_in6 *sin6;
5280bebb544SHiroki Sato 	int i, rti_need_deembed = 0;
5296bbfef90SHiroki Sato #endif
530f2e5eb36SAlexander V. Chernikov 	int alloc_len = 0, len, error = 0, fibnum;
5315dfc91d7SLuigi Rizzo 	struct ifnet *ifp = NULL;
532413628a7SBjoern A. Zeeb 	union sockaddr_union saun;
5333ca1a2d6SMax Laier 	sa_family_t saf = AF_UNSPEC;
53492c227afSAlexander V. Chernikov 	struct rawcb *rp = NULL;
535f2e5eb36SAlexander V. Chernikov 	struct walkarg w;
536df8bae1dSRodney W. Grimes 
537f5d9a696SAlexander V. Chernikov 	fibnum = so->so_fibnum;
538f5d9a696SAlexander V. Chernikov 
539df8bae1dSRodney W. Grimes #define senderr(e) { error = e; goto flush;}
5405dfc91d7SLuigi Rizzo 	if (m == NULL || ((m->m_len < sizeof(long)) &&
5415dfc91d7SLuigi Rizzo 		       (m = m_pullup(m, sizeof(long))) == NULL))
542df8bae1dSRodney W. Grimes 		return (ENOBUFS);
543df8bae1dSRodney W. Grimes 	if ((m->m_flags & M_PKTHDR) == 0)
544df8bae1dSRodney W. Grimes 		panic("route_output");
545df8bae1dSRodney W. Grimes 	len = m->m_pkthdr.len;
546df8bae1dSRodney W. Grimes 	if (len < sizeof(*rtm) ||
547f1fcb552SAlexander V. Chernikov 	    len != mtod(m, struct rt_msghdr *)->rtm_msglen)
548df8bae1dSRodney W. Grimes 		senderr(EINVAL);
549f1fcb552SAlexander V. Chernikov 
550f2e5eb36SAlexander V. Chernikov 	/*
551f2e5eb36SAlexander V. Chernikov 	 * Most of current messages are in range 200-240 bytes,
552d9437c0fSAlexander V. Chernikov 	 * minimize possible re-allocation on reply using larger size
553d9437c0fSAlexander V. Chernikov 	 * buffer aligned on 1k boundaty.
554f2e5eb36SAlexander V. Chernikov 	 */
555f2e5eb36SAlexander V. Chernikov 	alloc_len = roundup2(len, 1024);
556d9437c0fSAlexander V. Chernikov 	if ((rtm = malloc(alloc_len, M_TEMP, M_NOWAIT)) == NULL)
557df8bae1dSRodney W. Grimes 		senderr(ENOBUFS);
558f2e5eb36SAlexander V. Chernikov 
559df8bae1dSRodney W. Grimes 	m_copydata(m, 0, len, (caddr_t)rtm);
560f1fcb552SAlexander V. Chernikov 	bzero(&info, sizeof(info));
561f2e5eb36SAlexander V. Chernikov 	bzero(&w, sizeof(w));
562f1fcb552SAlexander V. Chernikov 
563df8bae1dSRodney W. Grimes 	if (rtm->rtm_version != RTM_VERSION) {
564f1fcb552SAlexander V. Chernikov 		/* Do not touch message since format is unknown */
565f2e5eb36SAlexander V. Chernikov 		free(rtm, M_TEMP);
566f1fcb552SAlexander V. Chernikov 		rtm = NULL;
567df8bae1dSRodney W. Grimes 		senderr(EPROTONOSUPPORT);
568df8bae1dSRodney W. Grimes 	}
569f1fcb552SAlexander V. Chernikov 
570f1fcb552SAlexander V. Chernikov 	/*
571f1fcb552SAlexander V. Chernikov 	 * Starting from here, it is possible
572f1fcb552SAlexander V. Chernikov 	 * to alter original message and insert
573f1fcb552SAlexander V. Chernikov 	 * caller PID and error value.
574f1fcb552SAlexander V. Chernikov 	 */
575f1fcb552SAlexander V. Chernikov 
576df8bae1dSRodney W. Grimes 	rtm->rtm_pid = curproc->p_pid;
577df8bae1dSRodney W. Grimes 	info.rti_addrs = rtm->rtm_addrs;
5780fb9298dSAlexander V. Chernikov 
5790fb9298dSAlexander V. Chernikov 	info.rti_mflags = rtm->rtm_inits;
5800fb9298dSAlexander V. Chernikov 	info.rti_rmx = &rtm->rtm_rmx;
5810fb9298dSAlexander V. Chernikov 
5820bebb544SHiroki Sato 	/*
5830bebb544SHiroki Sato 	 * rt_xaddrs() performs s6_addr[2] := sin6_scope_id for AF_INET6
5840bebb544SHiroki Sato 	 * link-local address because rtrequest requires addresses with
5850bebb544SHiroki Sato 	 * embedded scope id.
5860bebb544SHiroki Sato 	 */
587f1fcb552SAlexander V. Chernikov 	if (rt_xaddrs((caddr_t)(rtm + 1), len + (caddr_t)rtm, &info))
588076d0761SJulian Elischer 		senderr(EINVAL);
589f1fcb552SAlexander V. Chernikov 
5908071913dSRuslan Ermilov 	info.rti_flags = rtm->rtm_flags;
5915dfc91d7SLuigi Rizzo 	if (info.rti_info[RTAX_DST] == NULL ||
592becc44d7SSam Leffler 	    info.rti_info[RTAX_DST]->sa_family >= AF_MAX ||
5935dfc91d7SLuigi Rizzo 	    (info.rti_info[RTAX_GATEWAY] != NULL &&
594becc44d7SSam Leffler 	     info.rti_info[RTAX_GATEWAY]->sa_family >= AF_MAX))
595df8bae1dSRodney W. Grimes 		senderr(EINVAL);
5963ca1a2d6SMax Laier 	saf = info.rti_info[RTAX_DST]->sa_family;
597162c0b2eSRuslan Ermilov 	/*
598162c0b2eSRuslan Ermilov 	 * Verify that the caller has the appropriate privilege; RTM_GET
599162c0b2eSRuslan Ermilov 	 * is the only operation the non-superuser is allowed.
600162c0b2eSRuslan Ermilov 	 */
601acd3428bSRobert Watson 	if (rtm->rtm_type != RTM_GET) {
602acd3428bSRobert Watson 		error = priv_check(curthread, PRIV_NET_ROUTE);
603acd3428bSRobert Watson 		if (error)
604dadb6c3bSRuslan Ermilov 			senderr(error);
605acd3428bSRobert Watson 	}
606162c0b2eSRuslan Ermilov 
6079231d35fSQing Li 	/*
6089231d35fSQing Li 	 * The given gateway address may be an interface address.
6099231d35fSQing Li 	 * For example, issuing a "route change" command on a route
6109231d35fSQing Li 	 * entry that was created from a tunnel, and the gateway
6119231d35fSQing Li 	 * address given is the local end point. In this case the
6129231d35fSQing Li 	 * RTF_GATEWAY flag must be cleared or the destination will
6139231d35fSQing Li 	 * not be reachable even though there is no error message.
6149231d35fSQing Li 	 */
6159231d35fSQing Li 	if (info.rti_info[RTAX_GATEWAY] != NULL &&
6169231d35fSQing Li 	    info.rti_info[RTAX_GATEWAY]->sa_family != AF_LINK) {
6179231d35fSQing Li 		struct route gw_ro;
6189231d35fSQing Li 
6199231d35fSQing Li 		bzero(&gw_ro, sizeof(gw_ro));
6209231d35fSQing Li 		gw_ro.ro_dst = *info.rti_info[RTAX_GATEWAY];
621773aa053SAlexander V. Chernikov 		rtalloc_ign_fib(&gw_ro, 0, fibnum);
6229231d35fSQing Li 		/*
6239231d35fSQing Li 		 * A host route through the loopback interface is
6249231d35fSQing Li 		 * installed for each interface adddress. In pre 8.0
6259231d35fSQing Li 		 * releases the interface address of a PPP link type
6269231d35fSQing Li 		 * is not reachable locally. This behavior is fixed as
6279231d35fSQing Li 		 * part of the new L2/L3 redesign and rewrite work. The
6289231d35fSQing Li 		 * signature of this interface address route is the
6299231d35fSQing Li 		 * AF_LINK sa_family type of the rt_gateway, and the
6309231d35fSQing Li 		 * rt_ifp has the IFF_LOOPBACK flag set.
6319231d35fSQing Li 		 */
6329231d35fSQing Li 		if (gw_ro.ro_rt != NULL &&
6339231d35fSQing Li 		    gw_ro.ro_rt->rt_gateway->sa_family == AF_LINK &&
634f672f56fSQing Li 		    gw_ro.ro_rt->rt_ifp->if_flags & IFF_LOOPBACK) {
6359231d35fSQing Li 			info.rti_flags &= ~RTF_GATEWAY;
636f672f56fSQing Li 			info.rti_flags |= RTF_GWFLAG_COMPAT;
637f672f56fSQing Li 		}
6389231d35fSQing Li 		if (gw_ro.ro_rt != NULL)
6399231d35fSQing Li 			RTFREE(gw_ro.ro_rt);
6409231d35fSQing Li 	}
6419231d35fSQing Li 
642df8bae1dSRodney W. Grimes 	switch (rtm->rtm_type) {
643becc44d7SSam Leffler 		struct rtentry *saved_nrt;
644df8bae1dSRodney W. Grimes 
645df8bae1dSRodney W. Grimes 	case RTM_ADD:
646c77462ddSAlexander V. Chernikov 	case RTM_CHANGE:
6475dfc91d7SLuigi Rizzo 		if (info.rti_info[RTAX_GATEWAY] == NULL)
648df8bae1dSRodney W. Grimes 			senderr(EINVAL);
6495dfc91d7SLuigi Rizzo 		saved_nrt = NULL;
6508eca593cSQing Li 
6516e6b3f7cSQing Li 		/* support for new ARP code */
6528eca593cSQing Li 		if (info.rti_info[RTAX_GATEWAY]->sa_family == AF_LINK &&
6538eca593cSQing Li 		    (rtm->rtm_flags & RTF_LLDATA) != 0) {
6546e6b3f7cSQing Li 			error = lla_rt_output(rtm, &info);
6550bebb544SHiroki Sato #ifdef INET6
6560bebb544SHiroki Sato 			if (error == 0)
6570bebb544SHiroki Sato 				rti_need_deembed = (V_deembed_scopeid) ? 1 : 0;
6580bebb544SHiroki Sato #endif
6596e6b3f7cSQing Li 			break;
6606e6b3f7cSQing Li 		}
661c77462ddSAlexander V. Chernikov 		error = rtrequest1_fib(rtm->rtm_type, &info, &saved_nrt,
662773aa053SAlexander V. Chernikov 		    fibnum);
663c77462ddSAlexander V. Chernikov 		if (error == 0 && saved_nrt != NULL) {
6640bebb544SHiroki Sato #ifdef INET6
6650bebb544SHiroki Sato 			rti_need_deembed = (V_deembed_scopeid) ? 1 : 0;
6660bebb544SHiroki Sato #endif
667d1dd20beSSam Leffler 			RT_LOCK(saved_nrt);
66822cafcf0SAndre Oppermann 			rtm->rtm_index = saved_nrt->rt_ifp->if_index;
6697138d65cSSam Leffler 			RT_REMREF(saved_nrt);
670d1dd20beSSam Leffler 			RT_UNLOCK(saved_nrt);
671df8bae1dSRodney W. Grimes 		}
672df8bae1dSRodney W. Grimes 		break;
673df8bae1dSRodney W. Grimes 
674df8bae1dSRodney W. Grimes 	case RTM_DELETE:
6755dfc91d7SLuigi Rizzo 		saved_nrt = NULL;
6766e6b3f7cSQing Li 		/* support for new ARP code */
6776e6b3f7cSQing Li 		if (info.rti_info[RTAX_GATEWAY] &&
6788eca593cSQing Li 		    (info.rti_info[RTAX_GATEWAY]->sa_family == AF_LINK) &&
6798eca593cSQing Li 		    (rtm->rtm_flags & RTF_LLDATA) != 0) {
6806e6b3f7cSQing Li 			error = lla_rt_output(rtm, &info);
6810bebb544SHiroki Sato #ifdef INET6
6820bebb544SHiroki Sato 			if (error == 0)
6830bebb544SHiroki Sato 				rti_need_deembed = (V_deembed_scopeid) ? 1 : 0;
6840bebb544SHiroki Sato #endif
6856e6b3f7cSQing Li 			break;
6866e6b3f7cSQing Li 		}
687773aa053SAlexander V. Chernikov 		error = rtrequest1_fib(RTM_DELETE, &info, &saved_nrt, fibnum);
68878a82810SGarrett Wollman 		if (error == 0) {
689d1dd20beSSam Leffler 			RT_LOCK(saved_nrt);
69071eba915SRuslan Ermilov 			rt = saved_nrt;
69178a82810SGarrett Wollman 			goto report;
69278a82810SGarrett Wollman 		}
6930bebb544SHiroki Sato #ifdef INET6
6940bebb544SHiroki Sato 		/* rt_msg2() will not be used when RTM_DELETE fails. */
6950bebb544SHiroki Sato 		rti_need_deembed = (V_deembed_scopeid) ? 1 : 0;
6960bebb544SHiroki Sato #endif
697df8bae1dSRodney W. Grimes 		break;
698df8bae1dSRodney W. Grimes 
699df8bae1dSRodney W. Grimes 	case RTM_GET:
700773aa053SAlexander V. Chernikov 		rnh = rt_tables_get_rnh(fibnum, saf);
7015dfc91d7SLuigi Rizzo 		if (rnh == NULL)
70278a82810SGarrett Wollman 			senderr(EAFNOSUPPORT);
7035a2f4cbdSAlexander V. Chernikov 
7043120b9d4SKip Macy 		RADIX_NODE_HEAD_RLOCK(rnh);
7055a2f4cbdSAlexander V. Chernikov 
7065a2f4cbdSAlexander V. Chernikov 		if (info.rti_info[RTAX_NETMASK] == NULL &&
7075a2f4cbdSAlexander V. Chernikov 		    rtm->rtm_type == RTM_GET) {
7085a2f4cbdSAlexander V. Chernikov 			/*
7095a2f4cbdSAlexander V. Chernikov 			 * Provide logest prefix match for
7105a2f4cbdSAlexander V. Chernikov 			 * address lookup (no mask).
7115a2f4cbdSAlexander V. Chernikov 			 * 'route -n get addr'
7125a2f4cbdSAlexander V. Chernikov 			 */
7135a2f4cbdSAlexander V. Chernikov 			rt = (struct rtentry *) rnh->rnh_matchaddr(
7145a2f4cbdSAlexander V. Chernikov 			    info.rti_info[RTAX_DST], rnh);
7155a2f4cbdSAlexander V. Chernikov 		} else
7165a2f4cbdSAlexander V. Chernikov 			rt = (struct rtentry *) rnh->rnh_lookup(
7175a2f4cbdSAlexander V. Chernikov 			    info.rti_info[RTAX_DST],
718becc44d7SSam Leffler 			    info.rti_info[RTAX_NETMASK], rnh);
7195a2f4cbdSAlexander V. Chernikov 
7205a2f4cbdSAlexander V. Chernikov 		if (rt == NULL) {
7213120b9d4SKip Macy 			RADIX_NODE_HEAD_RUNLOCK(rnh);
722df8bae1dSRodney W. Grimes 			senderr(ESRCH);
72379188861SGleb Smirnoff 		}
724e440aed9SQing Li #ifdef RADIX_MPATH
725e440aed9SQing Li 		/*
726e440aed9SQing Li 		 * for RTM_CHANGE/LOCK, if we got multipath routes,
727e440aed9SQing Li 		 * we require users to specify a matching RTAX_GATEWAY.
728e440aed9SQing Li 		 *
729e440aed9SQing Li 		 * for RTM_GET, gate is optional even with multipath.
730e440aed9SQing Li 		 * if gate == NULL the first match is returned.
731e440aed9SQing Li 		 * (no need to call rt_mpath_matchgate if gate == NULL)
732e440aed9SQing Li 		 */
733e440aed9SQing Li 		if (rn_mpath_capable(rnh) &&
734e440aed9SQing Li 		    (rtm->rtm_type != RTM_GET || info.rti_info[RTAX_GATEWAY])) {
735e440aed9SQing Li 			rt = rt_mpath_matchgate(rt, info.rti_info[RTAX_GATEWAY]);
736e440aed9SQing Li 			if (!rt) {
7373120b9d4SKip Macy 				RADIX_NODE_HEAD_RUNLOCK(rnh);
738e440aed9SQing Li 				senderr(ESRCH);
739e440aed9SQing Li 			}
740e440aed9SQing Li 		}
741e440aed9SQing Li #endif
742c7ab6602SQing Li 		/*
743c7ab6602SQing Li 		 * If performing proxied L2 entry insertion, and
744c7ab6602SQing Li 		 * the actual PPP host entry is found, perform
745c7ab6602SQing Li 		 * another search to retrieve the prefix route of
746c7ab6602SQing Li 		 * the local end point of the PPP link.
747c7ab6602SQing Li 		 */
7480ed6142bSQing Li 		if (rtm->rtm_flags & RTF_ANNOUNCE) {
749c7ab6602SQing Li 			struct sockaddr laddr;
7500ed6142bSQing Li 
7510ed6142bSQing Li 			if (rt->rt_ifp != NULL &&
7520ed6142bSQing Li 			    rt->rt_ifp->if_type == IFT_PROPVIRTUAL) {
7530ed6142bSQing Li 				struct ifaddr *ifa;
7540ed6142bSQing Li 
7552f308a34SAlan Somers 				ifa = ifa_ifwithnet(info.rti_info[RTAX_DST], 1);
7560ed6142bSQing Li 				if (ifa != NULL)
7570ed6142bSQing Li 					rt_maskedcopy(ifa->ifa_addr,
7580ed6142bSQing Li 						      &laddr,
7590ed6142bSQing Li 						      ifa->ifa_netmask);
7600ed6142bSQing Li 			} else
761c7ab6602SQing Li 				rt_maskedcopy(rt->rt_ifa->ifa_addr,
762c7ab6602SQing Li 					      &laddr,
763c7ab6602SQing Li 					      rt->rt_ifa->ifa_netmask);
764c7ab6602SQing Li 			/*
765c7ab6602SQing Li 			 * refactor rt and no lock operation necessary
766c7ab6602SQing Li 			 */
767c7ab6602SQing Li 			rt = (struct rtentry *)rnh->rnh_matchaddr(&laddr, rnh);
768c7ab6602SQing Li 			if (rt == NULL) {
769c7ab6602SQing Li 				RADIX_NODE_HEAD_RUNLOCK(rnh);
770c7ab6602SQing Li 				senderr(ESRCH);
771c7ab6602SQing Li 			}
772c7ab6602SQing Li 		}
773d1dd20beSSam Leffler 		RT_LOCK(rt);
7747138d65cSSam Leffler 		RT_ADDREF(rt);
7753120b9d4SKip Macy 		RADIX_NODE_HEAD_RUNLOCK(rnh);
776956b0b65SJeffrey Hsu 
77778a82810SGarrett Wollman report:
778d1dd20beSSam Leffler 		RT_LOCK_ASSERT(rt);
779b89e82ddSJamie Gritton 		if ((rt->rt_flags & RTF_HOST) == 0
780de0bd6f7SBjoern A. Zeeb 		    ? jailed_without_vnet(curthread->td_ucred)
781b89e82ddSJamie Gritton 		    : prison_if(curthread->td_ucred,
782b89e82ddSJamie Gritton 		    rt_key(rt)) != 0) {
783813dd6aeSBjoern A. Zeeb 			RT_UNLOCK(rt);
784813dd6aeSBjoern A. Zeeb 			senderr(ESRCH);
785813dd6aeSBjoern A. Zeeb 		}
786becc44d7SSam Leffler 		info.rti_info[RTAX_DST] = rt_key(rt);
787becc44d7SSam Leffler 		info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
7883deb3649SAlexander V. Chernikov 		info.rti_info[RTAX_NETMASK] = rtsock_fix_netmask(rt_key(rt),
7893deb3649SAlexander V. Chernikov 		    rt_mask(rt), &ss);
7906e6b3f7cSQing Li 		info.rti_info[RTAX_GENMASK] = 0;
791df8bae1dSRodney W. Grimes 		if (rtm->rtm_addrs & (RTA_IFP | RTA_IFA)) {
792df440948SPoul-Henning Kamp 			ifp = rt->rt_ifp;
793df440948SPoul-Henning Kamp 			if (ifp) {
7949b98ee2cSLuigi Rizzo 				info.rti_info[RTAX_IFP] =
7954a0d6638SRuslan Ermilov 				    ifp->if_addr->ifa_addr;
7969c79d243SJamie Gritton 				error = rtm_get_jailed(&info, ifp, rt,
7979c79d243SJamie Gritton 				    &saun, curthread->td_ucred);
798413628a7SBjoern A. Zeeb 				if (error != 0) {
799413628a7SBjoern A. Zeeb 					RT_UNLOCK(rt);
8009c79d243SJamie Gritton 					senderr(error);
801413628a7SBjoern A. Zeeb 				}
80228070a0eSRuslan Ermilov 				if (ifp->if_flags & IFF_POINTOPOINT)
803becc44d7SSam Leffler 					info.rti_info[RTAX_BRD] =
804becc44d7SSam Leffler 					    rt->rt_ifa->ifa_dstaddr;
805df8bae1dSRodney W. Grimes 				rtm->rtm_index = ifp->if_index;
806df8bae1dSRodney W. Grimes 			} else {
8075dfc91d7SLuigi Rizzo 				info.rti_info[RTAX_IFP] = NULL;
8085dfc91d7SLuigi Rizzo 				info.rti_info[RTAX_IFA] = NULL;
809df8bae1dSRodney W. Grimes 			}
81025029d6cSHartmut Brandt 		} else if ((ifp = rt->rt_ifp) != NULL) {
81125029d6cSHartmut Brandt 			rtm->rtm_index = ifp->if_index;
812df8bae1dSRodney W. Grimes 		}
813f2e5eb36SAlexander V. Chernikov 
814f2e5eb36SAlexander V. Chernikov 		/* Check if we need to realloc storage */
815f2e5eb36SAlexander V. Chernikov 		rtsock_msg_buffer(rtm->rtm_type, &info, NULL, &len);
816f2e5eb36SAlexander V. Chernikov 		if (len > alloc_len) {
817df8bae1dSRodney W. Grimes 			struct rt_msghdr *new_rtm;
818f2e5eb36SAlexander V. Chernikov 			new_rtm = malloc(len, M_TEMP, M_NOWAIT);
8195dfc91d7SLuigi Rizzo 			if (new_rtm == NULL) {
820d1dd20beSSam Leffler 				RT_UNLOCK(rt);
821df8bae1dSRodney W. Grimes 				senderr(ENOBUFS);
822becc44d7SSam Leffler 			}
8236b96f1afSLuigi Rizzo 			bcopy(rtm, new_rtm, rtm->rtm_msglen);
824f2e5eb36SAlexander V. Chernikov 			free(rtm, M_TEMP);
825f2e5eb36SAlexander V. Chernikov 			rtm = new_rtm;
826f2e5eb36SAlexander V. Chernikov 			alloc_len = len;
827df8bae1dSRodney W. Grimes 		}
828f2e5eb36SAlexander V. Chernikov 
829f2e5eb36SAlexander V. Chernikov 		w.w_tmem = (caddr_t)rtm;
830f2e5eb36SAlexander V. Chernikov 		w.w_tmemsize = alloc_len;
831f2e5eb36SAlexander V. Chernikov 		rtsock_msg_buffer(rtm->rtm_type, &info, &w, &len);
832f2e5eb36SAlexander V. Chernikov 
833f672f56fSQing Li 		if (rt->rt_flags & RTF_GWFLAG_COMPAT)
834f672f56fSQing Li 			rtm->rtm_flags = RTF_GATEWAY |
835f672f56fSQing Li 				(rt->rt_flags & ~RTF_GWFLAG_COMPAT);
836f672f56fSQing Li 		else
837df8bae1dSRodney W. Grimes 			rtm->rtm_flags = rt->rt_flags;
838e3a7aa6fSGleb Smirnoff 		rt_getmetrics(rt, &rtm->rtm_rmx);
839df8bae1dSRodney W. Grimes 		rtm->rtm_addrs = info.rti_addrs;
840df8bae1dSRodney W. Grimes 
841d1dd20beSSam Leffler 		RT_UNLOCK(rt);
842df8bae1dSRodney W. Grimes 		break;
843df8bae1dSRodney W. Grimes 
844df8bae1dSRodney W. Grimes 	default:
845df8bae1dSRodney W. Grimes 		senderr(EOPNOTSUPP);
846df8bae1dSRodney W. Grimes 	}
847df8bae1dSRodney W. Grimes 
848df8bae1dSRodney W. Grimes flush:
84992c227afSAlexander V. Chernikov 	if (rt != NULL)
850becc44d7SSam Leffler 		RTFREE(rt);
851df8bae1dSRodney W. Grimes 	/*
852df8bae1dSRodney W. Grimes 	 * Check to see if we don't want our own messages.
853df8bae1dSRodney W. Grimes 	 */
854df8bae1dSRodney W. Grimes 	if ((so->so_options & SO_USELOOPBACK) == 0) {
855c5d4eab6SMarko Zec 		if (V_route_cb.any_count <= 1) {
856d9437c0fSAlexander V. Chernikov 			if (rtm != NULL)
857f2e5eb36SAlexander V. Chernikov 				free(rtm, M_TEMP);
858df8bae1dSRodney W. Grimes 			m_freem(m);
859df8bae1dSRodney W. Grimes 			return (error);
860df8bae1dSRodney W. Grimes 		}
861df8bae1dSRodney W. Grimes 		/* There is another listener, so construct message */
862df8bae1dSRodney W. Grimes 		rp = sotorawcb(so);
8634cc20ab1SSeigo Tanimura 	}
86492c227afSAlexander V. Chernikov 
8652277c5e5SAlexander V. Chernikov 	if (rtm != NULL) {
8660bebb544SHiroki Sato #ifdef INET6
8670bebb544SHiroki Sato 		if (rti_need_deembed) {
8680bebb544SHiroki Sato 			/* sin6_scope_id is recovered before sending rtm. */
8690bebb544SHiroki Sato 			sin6 = (struct sockaddr_in6 *)&ss;
87012bdf23aSHiroki Sato 			for (i = 0; i < RTAX_MAX; i++) {
8710bebb544SHiroki Sato 				if (info.rti_info[i] == NULL)
8720bebb544SHiroki Sato 					continue;
8730bebb544SHiroki Sato 				if (info.rti_info[i]->sa_family != AF_INET6)
8740bebb544SHiroki Sato 					continue;
8750bebb544SHiroki Sato 				bcopy(info.rti_info[i], sin6, sizeof(*sin6));
8760bebb544SHiroki Sato 				if (sa6_recoverscope(sin6) == 0)
8770bebb544SHiroki Sato 					bcopy(sin6, info.rti_info[i],
8780bebb544SHiroki Sato 						    sizeof(*sin6));
8790bebb544SHiroki Sato 			}
8800bebb544SHiroki Sato 		}
8810bebb544SHiroki Sato #endif
88292c227afSAlexander V. Chernikov 		if (error != 0)
88392c227afSAlexander V. Chernikov 			rtm->rtm_errno = error;
88492c227afSAlexander V. Chernikov 		else
88592c227afSAlexander V. Chernikov 			rtm->rtm_flags |= RTF_DONE;
88692c227afSAlexander V. Chernikov 
887df8bae1dSRodney W. Grimes 		m_copyback(m, 0, rtm->rtm_msglen, (caddr_t)rtm);
88803311056SHajimu UMEMOTO 		if (m->m_pkthdr.len < rtm->rtm_msglen) {
88903311056SHajimu UMEMOTO 			m_freem(m);
89003311056SHajimu UMEMOTO 			m = NULL;
89103311056SHajimu UMEMOTO 		} else if (m->m_pkthdr.len > rtm->rtm_msglen)
89203311056SHajimu UMEMOTO 			m_adj(m, rtm->rtm_msglen - m->m_pkthdr.len);
893f2e5eb36SAlexander V. Chernikov 
894f2e5eb36SAlexander V. Chernikov 		free(rtm, M_TEMP);
895df8bae1dSRodney W. Grimes 	}
89692c227afSAlexander V. Chernikov 	if (m != NULL) {
897773aa053SAlexander V. Chernikov 		M_SETFIB(m, fibnum);
898528737fdSBjoern A. Zeeb 		m->m_flags |= RTS_FILTER_FIB;
899becc44d7SSam Leffler 		if (rp) {
900becc44d7SSam Leffler 			/*
901becc44d7SSam Leffler 			 * XXX insure we don't get a copy by
902becc44d7SSam Leffler 			 * invalidating our protocol
903becc44d7SSam Leffler 			 */
904becc44d7SSam Leffler 			unsigned short family = rp->rcb_proto.sp_family;
905becc44d7SSam Leffler 			rp->rcb_proto.sp_family = 0;
9063ca1a2d6SMax Laier 			rt_dispatch(m, saf);
907becc44d7SSam Leffler 			rp->rcb_proto.sp_family = family;
908becc44d7SSam Leffler 		} else
9093ca1a2d6SMax Laier 			rt_dispatch(m, saf);
910becc44d7SSam Leffler 	}
91192c227afSAlexander V. Chernikov 
912df8bae1dSRodney W. Grimes 	return (error);
913df8bae1dSRodney W. Grimes }
914df8bae1dSRodney W. Grimes 
91552041295SPoul-Henning Kamp static void
916e3a7aa6fSGleb Smirnoff rt_getmetrics(const struct rtentry *rt, struct rt_metrics *out)
91797d8d152SAndre Oppermann {
918e3a7aa6fSGleb Smirnoff 
91997d8d152SAndre Oppermann 	bzero(out, sizeof(*out));
920e3a7aa6fSGleb Smirnoff 	out->rmx_mtu = rt->rt_mtu;
921e3a7aa6fSGleb Smirnoff 	out->rmx_weight = rt->rt_weight;
922e3a7aa6fSGleb Smirnoff 	out->rmx_pksent = counter_u64_fetch(rt->rt_pksent);
923e27c3f48SOleg Bulyzhin 	/* Kernel -> userland timebase conversion. */
924e3a7aa6fSGleb Smirnoff 	out->rmx_expire = rt->rt_expire ?
925e3a7aa6fSGleb Smirnoff 	    rt->rt_expire - time_uptime + time_second : 0;
92697d8d152SAndre Oppermann }
92797d8d152SAndre Oppermann 
9287f33a738SJulian Elischer /*
9297f33a738SJulian Elischer  * Extract the addresses of the passed sockaddrs.
9307f33a738SJulian Elischer  * Do a little sanity checking so as to avoid bad memory references.
931076d0761SJulian Elischer  * This data is derived straight from userland.
9327f33a738SJulian Elischer  */
933076d0761SJulian Elischer static int
934becc44d7SSam Leffler rt_xaddrs(caddr_t cp, caddr_t cplim, struct rt_addrinfo *rtinfo)
935df8bae1dSRodney W. Grimes {
936e74642dfSLuigi Rizzo 	struct sockaddr *sa;
937e74642dfSLuigi Rizzo 	int i;
938df8bae1dSRodney W. Grimes 
939becc44d7SSam Leffler 	for (i = 0; i < RTAX_MAX && cp < cplim; i++) {
940df8bae1dSRodney W. Grimes 		if ((rtinfo->rti_addrs & (1 << i)) == 0)
941df8bae1dSRodney W. Grimes 			continue;
942ff6d0a59SJulian Elischer 		sa = (struct sockaddr *)cp;
9437f33a738SJulian Elischer 		/*
944076d0761SJulian Elischer 		 * It won't fit.
9457f33a738SJulian Elischer 		 */
946becc44d7SSam Leffler 		if (cp + sa->sa_len > cplim)
947076d0761SJulian Elischer 			return (EINVAL);
9487f33a738SJulian Elischer 		/*
9497f33a738SJulian Elischer 		 * there are no more.. quit now
9507f33a738SJulian Elischer 		 * If there are more bits, they are in error.
9517f33a738SJulian Elischer 		 * I've seen this. route(1) can evidently generate these.
9527f33a738SJulian Elischer 		 * This causes kernel to core dump.
953076d0761SJulian Elischer 		 * for compatibility, If we see this, point to a safe address.
9547f33a738SJulian Elischer 		 */
955076d0761SJulian Elischer 		if (sa->sa_len == 0) {
956076d0761SJulian Elischer 			rtinfo->rti_info[i] = &sa_zero;
957076d0761SJulian Elischer 			return (0); /* should be EINVAL but for compat */
958df8bae1dSRodney W. Grimes 		}
959076d0761SJulian Elischer 		/* accept it */
9600bebb544SHiroki Sato #ifdef INET6
9610bebb544SHiroki Sato 		if (sa->sa_family == AF_INET6)
9620bebb544SHiroki Sato 			sa6_embedscope((struct sockaddr_in6 *)sa,
9630bebb544SHiroki Sato 			    V_ip6_use_defzone);
9640bebb544SHiroki Sato #endif
965076d0761SJulian Elischer 		rtinfo->rti_info[i] = sa;
966e74642dfSLuigi Rizzo 		cp += SA_SIZE(sa);
967076d0761SJulian Elischer 	}
968076d0761SJulian Elischer 	return (0);
969df8bae1dSRodney W. Grimes }
970df8bae1dSRodney W. Grimes 
9716d076ae8SBjoern A. Zeeb /*
9723deb3649SAlexander V. Chernikov  * Fill in @dmask with valid netmask leaving original @smask
9733deb3649SAlexander V. Chernikov  * intact. Mostly used with radix netmasks.
9743deb3649SAlexander V. Chernikov  */
9753deb3649SAlexander V. Chernikov static struct sockaddr *
9763deb3649SAlexander V. Chernikov rtsock_fix_netmask(struct sockaddr *dst, struct sockaddr *smask,
9773deb3649SAlexander V. Chernikov     struct sockaddr_storage *dmask)
9783deb3649SAlexander V. Chernikov {
9793deb3649SAlexander V. Chernikov 	if (dst == NULL || smask == NULL)
9803deb3649SAlexander V. Chernikov 		return (NULL);
9813deb3649SAlexander V. Chernikov 
9823deb3649SAlexander V. Chernikov 	memset(dmask, 0, dst->sa_len);
9833deb3649SAlexander V. Chernikov 	memcpy(dmask, smask, smask->sa_len);
9843deb3649SAlexander V. Chernikov 	dmask->ss_len = dst->sa_len;
9853deb3649SAlexander V. Chernikov 	dmask->ss_family = dst->sa_family;
9863deb3649SAlexander V. Chernikov 
9873deb3649SAlexander V. Chernikov 	return ((struct sockaddr *)dmask);
9883deb3649SAlexander V. Chernikov }
9893deb3649SAlexander V. Chernikov 
9903deb3649SAlexander V. Chernikov /*
9916db47af4SAlexander V. Chernikov  * Writes information related to @rtinfo object to newly-allocated mbuf.
9926db47af4SAlexander V. Chernikov  * Assumes MCLBYTES is enough to construct any message.
9936db47af4SAlexander V. Chernikov  * Used for OS notifications of vaious events (if/ifa announces,etc)
9946db47af4SAlexander V. Chernikov  *
9956db47af4SAlexander V. Chernikov  * Returns allocated mbuf or NULL on failure.
9966d076ae8SBjoern A. Zeeb  */
997df8bae1dSRodney W. Grimes static struct mbuf *
9986db47af4SAlexander V. Chernikov rtsock_msg_mbuf(int type, struct rt_addrinfo *rtinfo)
999df8bae1dSRodney W. Grimes {
10005dfc91d7SLuigi Rizzo 	struct rt_msghdr *rtm;
10015dfc91d7SLuigi Rizzo 	struct mbuf *m;
10025dfc91d7SLuigi Rizzo 	int i;
10035dfc91d7SLuigi Rizzo 	struct sockaddr *sa;
10046bbfef90SHiroki Sato #ifdef INET6
10056bbfef90SHiroki Sato 	struct sockaddr_storage ss;
10066bbfef90SHiroki Sato 	struct sockaddr_in6 *sin6;
10076bbfef90SHiroki Sato #endif
1008df8bae1dSRodney W. Grimes 	int len, dlen;
1009df8bae1dSRodney W. Grimes 
1010df8bae1dSRodney W. Grimes 	switch (type) {
1011df8bae1dSRodney W. Grimes 
1012df8bae1dSRodney W. Grimes 	case RTM_DELADDR:
1013df8bae1dSRodney W. Grimes 	case RTM_NEWADDR:
1014df8bae1dSRodney W. Grimes 		len = sizeof(struct ifa_msghdr);
1015df8bae1dSRodney W. Grimes 		break;
1016df8bae1dSRodney W. Grimes 
1017477180fbSGarrett Wollman 	case RTM_DELMADDR:
1018477180fbSGarrett Wollman 	case RTM_NEWMADDR:
1019477180fbSGarrett Wollman 		len = sizeof(struct ifma_msghdr);
1020477180fbSGarrett Wollman 		break;
1021477180fbSGarrett Wollman 
1022df8bae1dSRodney W. Grimes 	case RTM_IFINFO:
1023df8bae1dSRodney W. Grimes 		len = sizeof(struct if_msghdr);
1024df8bae1dSRodney W. Grimes 		break;
1025df8bae1dSRodney W. Grimes 
10267b6edd04SRuslan Ermilov 	case RTM_IFANNOUNCE:
1027b83a279fSSam Leffler 	case RTM_IEEE80211:
10287b6edd04SRuslan Ermilov 		len = sizeof(struct if_announcemsghdr);
10297b6edd04SRuslan Ermilov 		break;
10307b6edd04SRuslan Ermilov 
1031df8bae1dSRodney W. Grimes 	default:
1032df8bae1dSRodney W. Grimes 		len = sizeof(struct rt_msghdr);
1033df8bae1dSRodney W. Grimes 	}
1034c69f77c3SGleb Smirnoff 
1035c69f77c3SGleb Smirnoff 	/* XXXGL: can we use MJUMPAGESIZE cluster here? */
1036c69f77c3SGleb Smirnoff 	KASSERT(len <= MCLBYTES, ("%s: message too big", __func__));
1037c69f77c3SGleb Smirnoff 	if (len > MHLEN)
1038c69f77c3SGleb Smirnoff 		m = m_getcl(M_NOWAIT, MT_DATA, M_PKTHDR);
1039c69f77c3SGleb Smirnoff 	else
1040eb1b1807SGleb Smirnoff 		m = m_gethdr(M_NOWAIT, MT_DATA);
10415dfc91d7SLuigi Rizzo 	if (m == NULL)
104233841545SHajimu UMEMOTO 		return (m);
1043c69f77c3SGleb Smirnoff 
1044df8bae1dSRodney W. Grimes 	m->m_pkthdr.len = m->m_len = len;
1045df8bae1dSRodney W. Grimes 	rtm = mtod(m, struct rt_msghdr *);
1046df8bae1dSRodney W. Grimes 	bzero((caddr_t)rtm, len);
1047df8bae1dSRodney W. Grimes 	for (i = 0; i < RTAX_MAX; i++) {
1048df8bae1dSRodney W. Grimes 		if ((sa = rtinfo->rti_info[i]) == NULL)
1049df8bae1dSRodney W. Grimes 			continue;
1050df8bae1dSRodney W. Grimes 		rtinfo->rti_addrs |= (1 << i);
1051e74642dfSLuigi Rizzo 		dlen = SA_SIZE(sa);
10526bbfef90SHiroki Sato #ifdef INET6
10535c9fa630SHiroki Sato 		if (V_deembed_scopeid && sa->sa_family == AF_INET6) {
10546bbfef90SHiroki Sato 			sin6 = (struct sockaddr_in6 *)&ss;
10556bbfef90SHiroki Sato 			bcopy(sa, sin6, sizeof(*sin6));
10566bbfef90SHiroki Sato 			if (sa6_recoverscope(sin6) == 0)
10576bbfef90SHiroki Sato 				sa = (struct sockaddr *)sin6;
10586bbfef90SHiroki Sato 		}
10596bbfef90SHiroki Sato #endif
1060df8bae1dSRodney W. Grimes 		m_copyback(m, len, dlen, (caddr_t)sa);
1061df8bae1dSRodney W. Grimes 		len += dlen;
1062df8bae1dSRodney W. Grimes 	}
1063df8bae1dSRodney W. Grimes 	if (m->m_pkthdr.len != len) {
1064df8bae1dSRodney W. Grimes 		m_freem(m);
1065df8bae1dSRodney W. Grimes 		return (NULL);
1066df8bae1dSRodney W. Grimes 	}
1067df8bae1dSRodney W. Grimes 	rtm->rtm_msglen = len;
1068df8bae1dSRodney W. Grimes 	rtm->rtm_version = RTM_VERSION;
1069df8bae1dSRodney W. Grimes 	rtm->rtm_type = type;
1070df8bae1dSRodney W. Grimes 	return (m);
1071df8bae1dSRodney W. Grimes }
1072df8bae1dSRodney W. Grimes 
10736d076ae8SBjoern A. Zeeb /*
1074f2e5eb36SAlexander V. Chernikov  * Writes information related to @rtinfo object to preallocated buffer.
1075f2e5eb36SAlexander V. Chernikov  * Stores needed size in @plen. If @w is NULL, calculates size without
1076f2e5eb36SAlexander V. Chernikov  * writing.
1077f2e5eb36SAlexander V. Chernikov  * Used for sysctl dumps and rtsock answers (RTM_DEL/RTM_GET) generation.
1078f2e5eb36SAlexander V. Chernikov  *
1079f2e5eb36SAlexander V. Chernikov  * Returns 0 on success.
1080f2e5eb36SAlexander V. Chernikov  *
10816d076ae8SBjoern A. Zeeb  */
1082df8bae1dSRodney W. Grimes static int
1083f2e5eb36SAlexander V. Chernikov rtsock_msg_buffer(int type, struct rt_addrinfo *rtinfo, struct walkarg *w, int *plen)
1084df8bae1dSRodney W. Grimes {
10855dfc91d7SLuigi Rizzo 	int i;
1086f2e5eb36SAlexander V. Chernikov 	int len, buflen = 0, dlen;
1087de46b2c6SAlexander V. Chernikov 	caddr_t cp = NULL;
1088f2e5eb36SAlexander V. Chernikov 	struct rt_msghdr *rtm = NULL;
10896bbfef90SHiroki Sato #ifdef INET6
10906bbfef90SHiroki Sato 	struct sockaddr_storage ss;
10916bbfef90SHiroki Sato 	struct sockaddr_in6 *sin6;
10926bbfef90SHiroki Sato #endif
1093df8bae1dSRodney W. Grimes 
1094df8bae1dSRodney W. Grimes 	switch (type) {
1095df8bae1dSRodney W. Grimes 
1096df8bae1dSRodney W. Grimes 	case RTM_DELADDR:
1097df8bae1dSRodney W. Grimes 	case RTM_NEWADDR:
10986d076ae8SBjoern A. Zeeb 		if (w != NULL && w->w_op == NET_RT_IFLISTL) {
10996d076ae8SBjoern A. Zeeb #ifdef COMPAT_FREEBSD32
11006d076ae8SBjoern A. Zeeb 			if (w->w_req->flags & SCTL_MASK32)
11016d076ae8SBjoern A. Zeeb 				len = sizeof(struct ifa_msghdrl32);
11026d076ae8SBjoern A. Zeeb 			else
11036d076ae8SBjoern A. Zeeb #endif
11046d076ae8SBjoern A. Zeeb 				len = sizeof(struct ifa_msghdrl);
11056d076ae8SBjoern A. Zeeb 		} else
1106df8bae1dSRodney W. Grimes 			len = sizeof(struct ifa_msghdr);
1107df8bae1dSRodney W. Grimes 		break;
1108df8bae1dSRodney W. Grimes 
1109df8bae1dSRodney W. Grimes 	case RTM_IFINFO:
1110427a928aSKonstantin Belousov #ifdef COMPAT_FREEBSD32
1111427a928aSKonstantin Belousov 		if (w != NULL && w->w_req->flags & SCTL_MASK32) {
11126d076ae8SBjoern A. Zeeb 			if (w->w_op == NET_RT_IFLISTL)
11136d076ae8SBjoern A. Zeeb 				len = sizeof(struct if_msghdrl32);
11146d076ae8SBjoern A. Zeeb 			else
1115427a928aSKonstantin Belousov 				len = sizeof(struct if_msghdr32);
1116427a928aSKonstantin Belousov 			break;
1117427a928aSKonstantin Belousov 		}
1118427a928aSKonstantin Belousov #endif
11196d076ae8SBjoern A. Zeeb 		if (w != NULL && w->w_op == NET_RT_IFLISTL)
11206d076ae8SBjoern A. Zeeb 			len = sizeof(struct if_msghdrl);
11216d076ae8SBjoern A. Zeeb 		else
1122df8bae1dSRodney W. Grimes 			len = sizeof(struct if_msghdr);
1123df8bae1dSRodney W. Grimes 		break;
1124df8bae1dSRodney W. Grimes 
112505b2efe0SBruce M Simpson 	case RTM_NEWMADDR:
112605b2efe0SBruce M Simpson 		len = sizeof(struct ifma_msghdr);
112705b2efe0SBruce M Simpson 		break;
112805b2efe0SBruce M Simpson 
1129df8bae1dSRodney W. Grimes 	default:
1130df8bae1dSRodney W. Grimes 		len = sizeof(struct rt_msghdr);
1131df8bae1dSRodney W. Grimes 	}
1132f2e5eb36SAlexander V. Chernikov 
1133f2e5eb36SAlexander V. Chernikov 	if (w != NULL) {
1134f2e5eb36SAlexander V. Chernikov 		rtm = (struct rt_msghdr *)w->w_tmem;
1135f2e5eb36SAlexander V. Chernikov 		buflen = w->w_tmemsize - len;
1136f2e5eb36SAlexander V. Chernikov 		cp = (caddr_t)w->w_tmem + len;
1137f2e5eb36SAlexander V. Chernikov 	}
1138f2e5eb36SAlexander V. Chernikov 
1139f2e5eb36SAlexander V. Chernikov 	rtinfo->rti_addrs = 0;
1140df8bae1dSRodney W. Grimes 	for (i = 0; i < RTAX_MAX; i++) {
11415dfc91d7SLuigi Rizzo 		struct sockaddr *sa;
1142df8bae1dSRodney W. Grimes 
11435dfc91d7SLuigi Rizzo 		if ((sa = rtinfo->rti_info[i]) == NULL)
1144df8bae1dSRodney W. Grimes 			continue;
1145df8bae1dSRodney W. Grimes 		rtinfo->rti_addrs |= (1 << i);
1146e74642dfSLuigi Rizzo 		dlen = SA_SIZE(sa);
1147f2e5eb36SAlexander V. Chernikov 		if (cp != NULL && buflen >= dlen) {
11486bbfef90SHiroki Sato #ifdef INET6
11495c9fa630SHiroki Sato 			if (V_deembed_scopeid && sa->sa_family == AF_INET6) {
11506bbfef90SHiroki Sato 				sin6 = (struct sockaddr_in6 *)&ss;
11516bbfef90SHiroki Sato 				bcopy(sa, sin6, sizeof(*sin6));
11526bbfef90SHiroki Sato 				if (sa6_recoverscope(sin6) == 0)
11536bbfef90SHiroki Sato 					sa = (struct sockaddr *)sin6;
11546bbfef90SHiroki Sato 			}
11556bbfef90SHiroki Sato #endif
1156df8bae1dSRodney W. Grimes 			bcopy((caddr_t)sa, cp, (unsigned)dlen);
1157df8bae1dSRodney W. Grimes 			cp += dlen;
1158f2e5eb36SAlexander V. Chernikov 			buflen -= dlen;
1159f2e5eb36SAlexander V. Chernikov 		} else if (cp != NULL) {
1160f2e5eb36SAlexander V. Chernikov 			/*
1161f2e5eb36SAlexander V. Chernikov 			 * Buffer too small. Count needed size
1162f2e5eb36SAlexander V. Chernikov 			 * and return with error.
1163f2e5eb36SAlexander V. Chernikov 			 */
1164f2e5eb36SAlexander V. Chernikov 			cp = NULL;
1165df8bae1dSRodney W. Grimes 		}
1166f2e5eb36SAlexander V. Chernikov 
1167df8bae1dSRodney W. Grimes 		len += dlen;
1168df8bae1dSRodney W. Grimes 	}
1169f2e5eb36SAlexander V. Chernikov 
1170f2e5eb36SAlexander V. Chernikov 	if (cp != NULL) {
1171f2e5eb36SAlexander V. Chernikov 		dlen = ALIGN(len) - len;
1172f2e5eb36SAlexander V. Chernikov 		if (buflen < dlen)
1173f2e5eb36SAlexander V. Chernikov 			cp = NULL;
1174f2e5eb36SAlexander V. Chernikov 		else
1175f2e5eb36SAlexander V. Chernikov 			buflen -= dlen;
1176f2e5eb36SAlexander V. Chernikov 	}
1177694ff264SAndrew Gallatin 	len = ALIGN(len);
1178df8bae1dSRodney W. Grimes 
1179f2e5eb36SAlexander V. Chernikov 	if (cp != NULL) {
1180f2e5eb36SAlexander V. Chernikov 		/* fill header iff buffer is large enough */
1181df8bae1dSRodney W. Grimes 		rtm->rtm_version = RTM_VERSION;
1182df8bae1dSRodney W. Grimes 		rtm->rtm_type = type;
1183df8bae1dSRodney W. Grimes 		rtm->rtm_msglen = len;
1184df8bae1dSRodney W. Grimes 	}
1185f2e5eb36SAlexander V. Chernikov 
1186f2e5eb36SAlexander V. Chernikov 	*plen = len;
1187f2e5eb36SAlexander V. Chernikov 
1188f2e5eb36SAlexander V. Chernikov 	if (w != NULL && cp == NULL)
1189f2e5eb36SAlexander V. Chernikov 		return (ENOBUFS);
1190f2e5eb36SAlexander V. Chernikov 
1191f2e5eb36SAlexander V. Chernikov 	return (0);
1192df8bae1dSRodney W. Grimes }
1193df8bae1dSRodney W. Grimes 
1194df8bae1dSRodney W. Grimes /*
1195df8bae1dSRodney W. Grimes  * This routine is called to generate a message from the routing
1196df8bae1dSRodney W. Grimes  * socket indicating that a redirect has occured, a routing lookup
1197df8bae1dSRodney W. Grimes  * has failed, or that a protocol has detected timeouts to a particular
1198df8bae1dSRodney W. Grimes  * destination.
1199df8bae1dSRodney W. Grimes  */
1200df8bae1dSRodney W. Grimes void
1201528737fdSBjoern A. Zeeb rt_missmsg_fib(int type, struct rt_addrinfo *rtinfo, int flags, int error,
1202528737fdSBjoern A. Zeeb     int fibnum)
1203df8bae1dSRodney W. Grimes {
1204becc44d7SSam Leffler 	struct rt_msghdr *rtm;
1205becc44d7SSam Leffler 	struct mbuf *m;
1206df8bae1dSRodney W. Grimes 	struct sockaddr *sa = rtinfo->rti_info[RTAX_DST];
1207df8bae1dSRodney W. Grimes 
1208c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
1209df8bae1dSRodney W. Grimes 		return;
12106db47af4SAlexander V. Chernikov 	m = rtsock_msg_mbuf(type, rtinfo);
12115dfc91d7SLuigi Rizzo 	if (m == NULL)
1212df8bae1dSRodney W. Grimes 		return;
1213528737fdSBjoern A. Zeeb 
12147d9b6df1SAlexander V. Chernikov 	if (fibnum != RT_ALL_FIBS) {
1215528737fdSBjoern A. Zeeb 		KASSERT(fibnum >= 0 && fibnum < rt_numfibs, ("%s: fibnum out "
1216528737fdSBjoern A. Zeeb 		    "of range 0 <= %d < %d", __func__, fibnum, rt_numfibs));
1217528737fdSBjoern A. Zeeb 		M_SETFIB(m, fibnum);
1218528737fdSBjoern A. Zeeb 		m->m_flags |= RTS_FILTER_FIB;
1219528737fdSBjoern A. Zeeb 	}
1220528737fdSBjoern A. Zeeb 
1221df8bae1dSRodney W. Grimes 	rtm = mtod(m, struct rt_msghdr *);
1222df8bae1dSRodney W. Grimes 	rtm->rtm_flags = RTF_DONE | flags;
1223df8bae1dSRodney W. Grimes 	rtm->rtm_errno = error;
1224df8bae1dSRodney W. Grimes 	rtm->rtm_addrs = rtinfo->rti_addrs;
12253ca1a2d6SMax Laier 	rt_dispatch(m, sa ? sa->sa_family : AF_UNSPEC);
1226df8bae1dSRodney W. Grimes }
1227df8bae1dSRodney W. Grimes 
1228528737fdSBjoern A. Zeeb void
1229528737fdSBjoern A. Zeeb rt_missmsg(int type, struct rt_addrinfo *rtinfo, int flags, int error)
1230528737fdSBjoern A. Zeeb {
1231528737fdSBjoern A. Zeeb 
12327d9b6df1SAlexander V. Chernikov 	rt_missmsg_fib(type, rtinfo, flags, error, RT_ALL_FIBS);
1233528737fdSBjoern A. Zeeb }
1234528737fdSBjoern A. Zeeb 
1235df8bae1dSRodney W. Grimes /*
1236df8bae1dSRodney W. Grimes  * This routine is called to generate a message from the routing
1237df8bae1dSRodney W. Grimes  * socket indicating that the status of a network interface has changed.
1238df8bae1dSRodney W. Grimes  */
1239df8bae1dSRodney W. Grimes void
1240becc44d7SSam Leffler rt_ifmsg(struct ifnet *ifp)
1241df8bae1dSRodney W. Grimes {
1242becc44d7SSam Leffler 	struct if_msghdr *ifm;
1243df8bae1dSRodney W. Grimes 	struct mbuf *m;
1244df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
1245df8bae1dSRodney W. Grimes 
1246c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
1247df8bae1dSRodney W. Grimes 		return;
1248df8bae1dSRodney W. Grimes 	bzero((caddr_t)&info, sizeof(info));
12496db47af4SAlexander V. Chernikov 	m = rtsock_msg_mbuf(RTM_IFINFO, &info);
12505dfc91d7SLuigi Rizzo 	if (m == NULL)
1251df8bae1dSRodney W. Grimes 		return;
1252df8bae1dSRodney W. Grimes 	ifm = mtod(m, struct if_msghdr *);
1253df8bae1dSRodney W. Grimes 	ifm->ifm_index = ifp->if_index;
1254292ee7beSRobert Watson 	ifm->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
1255*e6485f73SGleb Smirnoff 	if_data_copy(ifp, &ifm->ifm_data);
1256df8bae1dSRodney W. Grimes 	ifm->ifm_addrs = 0;
12573ca1a2d6SMax Laier 	rt_dispatch(m, AF_UNSPEC);
1258df8bae1dSRodney W. Grimes }
1259df8bae1dSRodney W. Grimes 
1260df8bae1dSRodney W. Grimes /*
12614cbac30bSAlexander V. Chernikov  * Announce interface address arrival/withdraw.
12624cbac30bSAlexander V. Chernikov  * Please do not call directly, use rt_addrmsg().
12634cbac30bSAlexander V. Chernikov  * Assume input data to be valid.
12644cbac30bSAlexander V. Chernikov  * Returns 0 on success.
1265df8bae1dSRodney W. Grimes  */
12664cbac30bSAlexander V. Chernikov int
12674cbac30bSAlexander V. Chernikov rtsock_addrmsg(int cmd, struct ifaddr *ifa, int fibnum)
1268df8bae1dSRodney W. Grimes {
1269df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
12704cbac30bSAlexander V. Chernikov 	struct sockaddr *sa;
12714cbac30bSAlexander V. Chernikov 	int ncmd;
12724cbac30bSAlexander V. Chernikov 	struct mbuf *m;
12734cbac30bSAlexander V. Chernikov 	struct ifa_msghdr *ifam;
1274df8bae1dSRodney W. Grimes 	struct ifnet *ifp = ifa->ifa_ifp;
12753deb3649SAlexander V. Chernikov 	struct sockaddr_storage ss;
1276df8bae1dSRodney W. Grimes 
1277c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
12784cbac30bSAlexander V. Chernikov 		return (0);
1279df8bae1dSRodney W. Grimes 
12804cbac30bSAlexander V. Chernikov 	ncmd = cmd == RTM_ADD ? RTM_NEWADDR : RTM_DELADDR;
12814cbac30bSAlexander V. Chernikov 
12824cbac30bSAlexander V. Chernikov 	bzero((caddr_t)&info, sizeof(info));
1283becc44d7SSam Leffler 	info.rti_info[RTAX_IFA] = sa = ifa->ifa_addr;
12844a0d6638SRuslan Ermilov 	info.rti_info[RTAX_IFP] = ifp->if_addr->ifa_addr;
12853deb3649SAlexander V. Chernikov 	info.rti_info[RTAX_NETMASK] = rtsock_fix_netmask(
12863deb3649SAlexander V. Chernikov 	    info.rti_info[RTAX_IFP], ifa->ifa_netmask, &ss);
1287becc44d7SSam Leffler 	info.rti_info[RTAX_BRD] = ifa->ifa_dstaddr;
12886db47af4SAlexander V. Chernikov 	if ((m = rtsock_msg_mbuf(ncmd, &info)) == NULL)
12894cbac30bSAlexander V. Chernikov 		return (ENOBUFS);
1290df8bae1dSRodney W. Grimes 	ifam = mtod(m, struct ifa_msghdr *);
1291df8bae1dSRodney W. Grimes 	ifam->ifam_index = ifp->if_index;
12929753faf5SGleb Smirnoff 	ifam->ifam_metric = ifa->ifa_ifp->if_metric;
1293df8bae1dSRodney W. Grimes 	ifam->ifam_flags = ifa->ifa_flags;
1294df8bae1dSRodney W. Grimes 	ifam->ifam_addrs = info.rti_addrs;
12954cbac30bSAlexander V. Chernikov 
12964cbac30bSAlexander V. Chernikov 	if (fibnum != RT_ALL_FIBS) {
12974cbac30bSAlexander V. Chernikov 		M_SETFIB(m, fibnum);
12984cbac30bSAlexander V. Chernikov 		m->m_flags |= RTS_FILTER_FIB;
1299df8bae1dSRodney W. Grimes 	}
13004cbac30bSAlexander V. Chernikov 
13014cbac30bSAlexander V. Chernikov 	rt_dispatch(m, sa ? sa->sa_family : AF_UNSPEC);
13024cbac30bSAlexander V. Chernikov 
13034cbac30bSAlexander V. Chernikov 	return (0);
13044cbac30bSAlexander V. Chernikov }
13054cbac30bSAlexander V. Chernikov 
13064cbac30bSAlexander V. Chernikov /*
13074cbac30bSAlexander V. Chernikov  * Announce route addition/removal.
13084cbac30bSAlexander V. Chernikov  * Please do not call directly, use rt_routemsg().
13094cbac30bSAlexander V. Chernikov  * Note that @rt data MAY be inconsistent/invalid:
13104cbac30bSAlexander V. Chernikov  * if some userland app sends us "invalid" route message (invalid mask,
13114cbac30bSAlexander V. Chernikov  * no dst, wrong address families, etc...) we need to pass it back
13124cbac30bSAlexander V. Chernikov  * to app (and any other rtsock consumers) with rtm_errno field set to
13134cbac30bSAlexander V. Chernikov  * non-zero value.
13144cbac30bSAlexander V. Chernikov  *
13154cbac30bSAlexander V. Chernikov  * Returns 0 on success.
13164cbac30bSAlexander V. Chernikov  */
13174cbac30bSAlexander V. Chernikov int
13184cbac30bSAlexander V. Chernikov rtsock_routemsg(int cmd, struct ifnet *ifp, int error, struct rtentry *rt,
13194cbac30bSAlexander V. Chernikov     int fibnum)
13204cbac30bSAlexander V. Chernikov {
13214cbac30bSAlexander V. Chernikov 	struct rt_addrinfo info;
13224cbac30bSAlexander V. Chernikov 	struct sockaddr *sa;
13234cbac30bSAlexander V. Chernikov 	struct mbuf *m;
13245dfc91d7SLuigi Rizzo 	struct rt_msghdr *rtm;
13253deb3649SAlexander V. Chernikov 	struct sockaddr_storage ss;
1326df8bae1dSRodney W. Grimes 
1327c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
13284cbac30bSAlexander V. Chernikov 		return (0);
13294cbac30bSAlexander V. Chernikov 
13304cbac30bSAlexander V. Chernikov 	bzero((caddr_t)&info, sizeof(info));
1331becc44d7SSam Leffler 	info.rti_info[RTAX_DST] = sa = rt_key(rt);
13323deb3649SAlexander V. Chernikov 	info.rti_info[RTAX_NETMASK] = rtsock_fix_netmask(sa, rt_mask(rt), &ss);
1333becc44d7SSam Leffler 	info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
13346db47af4SAlexander V. Chernikov 	if ((m = rtsock_msg_mbuf(cmd, &info)) == NULL)
13354cbac30bSAlexander V. Chernikov 		return (ENOBUFS);
1336df8bae1dSRodney W. Grimes 	rtm = mtod(m, struct rt_msghdr *);
1337df8bae1dSRodney W. Grimes 	rtm->rtm_index = ifp->if_index;
1338df8bae1dSRodney W. Grimes 	rtm->rtm_flags |= rt->rt_flags;
1339df8bae1dSRodney W. Grimes 	rtm->rtm_errno = error;
1340df8bae1dSRodney W. Grimes 	rtm->rtm_addrs = info.rti_addrs;
13414cbac30bSAlexander V. Chernikov 
13427d9b6df1SAlexander V. Chernikov 	if (fibnum != RT_ALL_FIBS) {
1343528737fdSBjoern A. Zeeb 		M_SETFIB(m, fibnum);
1344528737fdSBjoern A. Zeeb 		m->m_flags |= RTS_FILTER_FIB;
1345528737fdSBjoern A. Zeeb 	}
13464cbac30bSAlexander V. Chernikov 
13473ca1a2d6SMax Laier 	rt_dispatch(m, sa ? sa->sa_family : AF_UNSPEC);
13484cbac30bSAlexander V. Chernikov 
13494cbac30bSAlexander V. Chernikov 	return (0);
1350df8bae1dSRodney W. Grimes }
1351df8bae1dSRodney W. Grimes 
1352477180fbSGarrett Wollman /*
1353477180fbSGarrett Wollman  * This is the analogue to the rt_newaddrmsg which performs the same
1354477180fbSGarrett Wollman  * function but for multicast group memberhips.  This is easier since
1355477180fbSGarrett Wollman  * there is no route state to worry about.
1356477180fbSGarrett Wollman  */
1357477180fbSGarrett Wollman void
1358becc44d7SSam Leffler rt_newmaddrmsg(int cmd, struct ifmultiaddr *ifma)
1359477180fbSGarrett Wollman {
1360477180fbSGarrett Wollman 	struct rt_addrinfo info;
13615dfc91d7SLuigi Rizzo 	struct mbuf *m = NULL;
1362477180fbSGarrett Wollman 	struct ifnet *ifp = ifma->ifma_ifp;
1363477180fbSGarrett Wollman 	struct ifma_msghdr *ifmam;
1364477180fbSGarrett Wollman 
1365c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
1366477180fbSGarrett Wollman 		return;
1367477180fbSGarrett Wollman 
1368477180fbSGarrett Wollman 	bzero((caddr_t)&info, sizeof(info));
1369becc44d7SSam Leffler 	info.rti_info[RTAX_IFA] = ifma->ifma_addr;
13704a0d6638SRuslan Ermilov 	info.rti_info[RTAX_IFP] = ifp ? ifp->if_addr->ifa_addr : NULL;
1371477180fbSGarrett Wollman 	/*
1372477180fbSGarrett Wollman 	 * If a link-layer address is present, present it as a ``gateway''
1373477180fbSGarrett Wollman 	 * (similarly to how ARP entries, e.g., are presented).
1374477180fbSGarrett Wollman 	 */
1375becc44d7SSam Leffler 	info.rti_info[RTAX_GATEWAY] = ifma->ifma_lladdr;
13766db47af4SAlexander V. Chernikov 	m = rtsock_msg_mbuf(cmd, &info);
1377becc44d7SSam Leffler 	if (m == NULL)
1378477180fbSGarrett Wollman 		return;
1379477180fbSGarrett Wollman 	ifmam = mtod(m, struct ifma_msghdr *);
138075ae0c01SBruce M Simpson 	KASSERT(ifp != NULL, ("%s: link-layer multicast address w/o ifp\n",
138175ae0c01SBruce M Simpson 	    __func__));
1382477180fbSGarrett Wollman 	ifmam->ifmam_index = ifp->if_index;
1383477180fbSGarrett Wollman 	ifmam->ifmam_addrs = info.rti_addrs;
13843ca1a2d6SMax Laier 	rt_dispatch(m, ifma->ifma_addr ? ifma->ifma_addr->sa_family : AF_UNSPEC);
1385477180fbSGarrett Wollman }
138652041295SPoul-Henning Kamp 
1387b83a279fSSam Leffler static struct mbuf *
1388b83a279fSSam Leffler rt_makeifannouncemsg(struct ifnet *ifp, int type, int what,
1389b83a279fSSam Leffler 	struct rt_addrinfo *info)
1390b83a279fSSam Leffler {
1391b83a279fSSam Leffler 	struct if_announcemsghdr *ifan;
1392b83a279fSSam Leffler 	struct mbuf *m;
1393b83a279fSSam Leffler 
1394c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
1395b83a279fSSam Leffler 		return NULL;
1396b83a279fSSam Leffler 	bzero((caddr_t)info, sizeof(*info));
13976db47af4SAlexander V. Chernikov 	m = rtsock_msg_mbuf(type, info);
1398b83a279fSSam Leffler 	if (m != NULL) {
1399b83a279fSSam Leffler 		ifan = mtod(m, struct if_announcemsghdr *);
1400b83a279fSSam Leffler 		ifan->ifan_index = ifp->if_index;
1401b83a279fSSam Leffler 		strlcpy(ifan->ifan_name, ifp->if_xname,
1402b83a279fSSam Leffler 			sizeof(ifan->ifan_name));
1403b83a279fSSam Leffler 		ifan->ifan_what = what;
1404b83a279fSSam Leffler 	}
1405b83a279fSSam Leffler 	return m;
1406b83a279fSSam Leffler }
1407b83a279fSSam Leffler 
1408b83a279fSSam Leffler /*
1409b83a279fSSam Leffler  * This is called to generate routing socket messages indicating
1410b83a279fSSam Leffler  * IEEE80211 wireless events.
1411b83a279fSSam Leffler  * XXX we piggyback on the RTM_IFANNOUNCE msg format in a clumsy way.
1412b83a279fSSam Leffler  */
1413b83a279fSSam Leffler void
1414b83a279fSSam Leffler rt_ieee80211msg(struct ifnet *ifp, int what, void *data, size_t data_len)
1415b83a279fSSam Leffler {
1416b83a279fSSam Leffler 	struct mbuf *m;
1417b83a279fSSam Leffler 	struct rt_addrinfo info;
1418b83a279fSSam Leffler 
1419b83a279fSSam Leffler 	m = rt_makeifannouncemsg(ifp, RTM_IEEE80211, what, &info);
1420b83a279fSSam Leffler 	if (m != NULL) {
1421b83a279fSSam Leffler 		/*
1422b83a279fSSam Leffler 		 * Append the ieee80211 data.  Try to stick it in the
1423b83a279fSSam Leffler 		 * mbuf containing the ifannounce msg; otherwise allocate
1424b83a279fSSam Leffler 		 * a new mbuf and append.
1425b83a279fSSam Leffler 		 *
1426b83a279fSSam Leffler 		 * NB: we assume m is a single mbuf.
1427b83a279fSSam Leffler 		 */
1428b83a279fSSam Leffler 		if (data_len > M_TRAILINGSPACE(m)) {
1429b83a279fSSam Leffler 			struct mbuf *n = m_get(M_NOWAIT, MT_DATA);
1430b83a279fSSam Leffler 			if (n == NULL) {
1431b83a279fSSam Leffler 				m_freem(m);
1432b83a279fSSam Leffler 				return;
1433b83a279fSSam Leffler 			}
1434b83a279fSSam Leffler 			bcopy(data, mtod(n, void *), data_len);
1435b83a279fSSam Leffler 			n->m_len = data_len;
1436b83a279fSSam Leffler 			m->m_next = n;
1437b83a279fSSam Leffler 		} else if (data_len > 0) {
1438b83a279fSSam Leffler 			bcopy(data, mtod(m, u_int8_t *) + m->m_len, data_len);
1439b83a279fSSam Leffler 			m->m_len += data_len;
1440b83a279fSSam Leffler 		}
1441b83a279fSSam Leffler 		if (m->m_flags & M_PKTHDR)
1442b83a279fSSam Leffler 			m->m_pkthdr.len += data_len;
1443b83a279fSSam Leffler 		mtod(m, struct if_announcemsghdr *)->ifan_msglen += data_len;
14443ca1a2d6SMax Laier 		rt_dispatch(m, AF_UNSPEC);
1445b83a279fSSam Leffler 	}
1446b83a279fSSam Leffler }
1447b83a279fSSam Leffler 
1448df8bae1dSRodney W. Grimes /*
14497b6edd04SRuslan Ermilov  * This is called to generate routing socket messages indicating
14507b6edd04SRuslan Ermilov  * network interface arrival and departure.
14517b6edd04SRuslan Ermilov  */
14527b6edd04SRuslan Ermilov void
1453becc44d7SSam Leffler rt_ifannouncemsg(struct ifnet *ifp, int what)
14547b6edd04SRuslan Ermilov {
14557b6edd04SRuslan Ermilov 	struct mbuf *m;
14567b6edd04SRuslan Ermilov 	struct rt_addrinfo info;
14577b6edd04SRuslan Ermilov 
1458b83a279fSSam Leffler 	m = rt_makeifannouncemsg(ifp, RTM_IFANNOUNCE, what, &info);
1459b83a279fSSam Leffler 	if (m != NULL)
14603ca1a2d6SMax Laier 		rt_dispatch(m, AF_UNSPEC);
1461becc44d7SSam Leffler }
1462becc44d7SSam Leffler 
1463becc44d7SSam Leffler static void
14643ca1a2d6SMax Laier rt_dispatch(struct mbuf *m, sa_family_t saf)
1465becc44d7SSam Leffler {
1466d989c7b3SRobert Watson 	struct m_tag *tag;
1467becc44d7SSam Leffler 
1468d989c7b3SRobert Watson 	/*
1469d989c7b3SRobert Watson 	 * Preserve the family from the sockaddr, if any, in an m_tag for
1470d989c7b3SRobert Watson 	 * use when injecting the mbuf into the routing socket buffer from
1471d989c7b3SRobert Watson 	 * the netisr.
1472d989c7b3SRobert Watson 	 */
14733ca1a2d6SMax Laier 	if (saf != AF_UNSPEC) {
1474d989c7b3SRobert Watson 		tag = m_tag_get(PACKET_TAG_RTSOCKFAM, sizeof(unsigned short),
1475d989c7b3SRobert Watson 		    M_NOWAIT);
1476d989c7b3SRobert Watson 		if (tag == NULL) {
1477d989c7b3SRobert Watson 			m_freem(m);
1478d989c7b3SRobert Watson 			return;
1479d989c7b3SRobert Watson 		}
14803ca1a2d6SMax Laier 		*(unsigned short *)(tag + 1) = saf;
1481d989c7b3SRobert Watson 		m_tag_prepend(m, tag);
1482d989c7b3SRobert Watson 	}
148321ca7b57SMarko Zec #ifdef VIMAGE
148421ca7b57SMarko Zec 	if (V_loif)
148521ca7b57SMarko Zec 		m->m_pkthdr.rcvif = V_loif;
148621ca7b57SMarko Zec 	else {
148721ca7b57SMarko Zec 		m_freem(m);
148821ca7b57SMarko Zec 		return;
148921ca7b57SMarko Zec 	}
149021ca7b57SMarko Zec #endif
14913161f583SAndre Oppermann 	netisr_queue(NETISR_ROUTE, m);	/* mbuf is free'd on failure. */
14927b6edd04SRuslan Ermilov }
14937b6edd04SRuslan Ermilov 
14947b6edd04SRuslan Ermilov /*
1495df8bae1dSRodney W. Grimes  * This is used in dumping the kernel table via sysctl().
1496df8bae1dSRodney W. Grimes  */
149737c84183SPoul-Henning Kamp static int
1498becc44d7SSam Leffler sysctl_dumpentry(struct radix_node *rn, void *vw)
1499df8bae1dSRodney W. Grimes {
1500becc44d7SSam Leffler 	struct walkarg *w = vw;
1501becc44d7SSam Leffler 	struct rtentry *rt = (struct rtentry *)rn;
1502df8bae1dSRodney W. Grimes 	int error = 0, size;
1503df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
15043deb3649SAlexander V. Chernikov 	struct sockaddr_storage ss;
1505df8bae1dSRodney W. Grimes 
1506df8bae1dSRodney W. Grimes 	if (w->w_op == NET_RT_FLAGS && !(rt->rt_flags & w->w_arg))
1507df8bae1dSRodney W. Grimes 		return 0;
1508b89e82ddSJamie Gritton 	if ((rt->rt_flags & RTF_HOST) == 0
1509de0bd6f7SBjoern A. Zeeb 	    ? jailed_without_vnet(w->w_req->td->td_ucred)
1510b89e82ddSJamie Gritton 	    : prison_if(w->w_req->td->td_ucred, rt_key(rt)) != 0)
1511813dd6aeSBjoern A. Zeeb 		return (0);
1512df8bae1dSRodney W. Grimes 	bzero((caddr_t)&info, sizeof(info));
1513becc44d7SSam Leffler 	info.rti_info[RTAX_DST] = rt_key(rt);
1514becc44d7SSam Leffler 	info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
15153deb3649SAlexander V. Chernikov 	info.rti_info[RTAX_NETMASK] = rtsock_fix_netmask(rt_key(rt),
15163deb3649SAlexander V. Chernikov 	    rt_mask(rt), &ss);
15176e6b3f7cSQing Li 	info.rti_info[RTAX_GENMASK] = 0;
151828070a0eSRuslan Ermilov 	if (rt->rt_ifp) {
15194a0d6638SRuslan Ermilov 		info.rti_info[RTAX_IFP] = rt->rt_ifp->if_addr->ifa_addr;
1520becc44d7SSam Leffler 		info.rti_info[RTAX_IFA] = rt->rt_ifa->ifa_addr;
152128070a0eSRuslan Ermilov 		if (rt->rt_ifp->if_flags & IFF_POINTOPOINT)
1522becc44d7SSam Leffler 			info.rti_info[RTAX_BRD] = rt->rt_ifa->ifa_dstaddr;
152328070a0eSRuslan Ermilov 	}
1524f2e5eb36SAlexander V. Chernikov 	if ((error = rtsock_msg_buffer(RTM_GET, &info, w, &size)) != 0)
1525f2e5eb36SAlexander V. Chernikov 		return (error);
152652041295SPoul-Henning Kamp 	if (w->w_req && w->w_tmem) {
1527becc44d7SSam Leffler 		struct rt_msghdr *rtm = (struct rt_msghdr *)w->w_tmem;
1528df8bae1dSRodney W. Grimes 
1529f672f56fSQing Li 		if (rt->rt_flags & RTF_GWFLAG_COMPAT)
1530f672f56fSQing Li 			rtm->rtm_flags = RTF_GATEWAY |
1531f672f56fSQing Li 				(rt->rt_flags & ~RTF_GWFLAG_COMPAT);
1532f672f56fSQing Li 		else
1533df8bae1dSRodney W. Grimes 			rtm->rtm_flags = rt->rt_flags;
1534e3a7aa6fSGleb Smirnoff 		rt_getmetrics(rt, &rtm->rtm_rmx);
1535df8bae1dSRodney W. Grimes 		rtm->rtm_index = rt->rt_ifp->if_index;
1536df8bae1dSRodney W. Grimes 		rtm->rtm_errno = rtm->rtm_pid = rtm->rtm_seq = 0;
1537df8bae1dSRodney W. Grimes 		rtm->rtm_addrs = info.rti_addrs;
153852041295SPoul-Henning Kamp 		error = SYSCTL_OUT(w->w_req, (caddr_t)rtm, size);
153952041295SPoul-Henning Kamp 		return (error);
1540df8bae1dSRodney W. Grimes 	}
1541df8bae1dSRodney W. Grimes 	return (error);
1542df8bae1dSRodney W. Grimes }
1543df8bae1dSRodney W. Grimes 
154437c84183SPoul-Henning Kamp static int
15456d076ae8SBjoern A. Zeeb sysctl_iflist_ifml(struct ifnet *ifp, struct rt_addrinfo *info,
15466d076ae8SBjoern A. Zeeb     struct walkarg *w, int len)
15476d076ae8SBjoern A. Zeeb {
15486d076ae8SBjoern A. Zeeb 	struct if_msghdrl *ifm;
1549b245f96cSGleb Smirnoff 	struct if_data *ifd;
1550b245f96cSGleb Smirnoff 
1551b245f96cSGleb Smirnoff 	ifm = (struct if_msghdrl *)w->w_tmem;
15526d076ae8SBjoern A. Zeeb 
15536d076ae8SBjoern A. Zeeb #ifdef COMPAT_FREEBSD32
15546d076ae8SBjoern A. Zeeb 	if (w->w_req->flags & SCTL_MASK32) {
15556d076ae8SBjoern A. Zeeb 		struct if_msghdrl32 *ifm32;
15566d076ae8SBjoern A. Zeeb 
1557b245f96cSGleb Smirnoff 		ifm32 = (struct if_msghdrl32 *)ifm;
15586d076ae8SBjoern A. Zeeb 		ifm32->ifm_addrs = info->rti_addrs;
15596d076ae8SBjoern A. Zeeb 		ifm32->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
15606d076ae8SBjoern A. Zeeb 		ifm32->ifm_index = ifp->if_index;
15616d076ae8SBjoern A. Zeeb 		ifm32->_ifm_spare1 = 0;
15626d076ae8SBjoern A. Zeeb 		ifm32->ifm_len = sizeof(*ifm32);
15636d076ae8SBjoern A. Zeeb 		ifm32->ifm_data_off = offsetof(struct if_msghdrl32, ifm_data);
1564b245f96cSGleb Smirnoff 		ifd = &ifm32->ifm_data;
1565b245f96cSGleb Smirnoff 	} else
15666d076ae8SBjoern A. Zeeb #endif
1567b245f96cSGleb Smirnoff 	{
15686d076ae8SBjoern A. Zeeb 		ifm->ifm_addrs = info->rti_addrs;
15696d076ae8SBjoern A. Zeeb 		ifm->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
15706d076ae8SBjoern A. Zeeb 		ifm->ifm_index = ifp->if_index;
15716d076ae8SBjoern A. Zeeb 		ifm->_ifm_spare1 = 0;
15726d076ae8SBjoern A. Zeeb 		ifm->ifm_len = sizeof(*ifm);
15736d076ae8SBjoern A. Zeeb 		ifm->ifm_data_off = offsetof(struct if_msghdrl, ifm_data);
1574b245f96cSGleb Smirnoff 		ifd = &ifm->ifm_data;
1575b245f96cSGleb Smirnoff 	}
15766d076ae8SBjoern A. Zeeb 
1577*e6485f73SGleb Smirnoff 	if_data_copy(ifp, ifd);
1578b245f96cSGleb Smirnoff 
15792d70c0deSGleb Smirnoff 	/* Some drivers still use ifqueue(9), add its stats. */
15802d70c0deSGleb Smirnoff 	ifd->ifi_oqdrops += ifp->if_snd.ifq_drops;
15816d076ae8SBjoern A. Zeeb 
15826d076ae8SBjoern A. Zeeb 	return (SYSCTL_OUT(w->w_req, (caddr_t)ifm, len));
15836d076ae8SBjoern A. Zeeb }
15846d076ae8SBjoern A. Zeeb 
15856d076ae8SBjoern A. Zeeb static int
15866d076ae8SBjoern A. Zeeb sysctl_iflist_ifm(struct ifnet *ifp, struct rt_addrinfo *info,
15876d076ae8SBjoern A. Zeeb     struct walkarg *w, int len)
15886d076ae8SBjoern A. Zeeb {
15896d076ae8SBjoern A. Zeeb 	struct if_msghdr *ifm;
1590b245f96cSGleb Smirnoff 	struct if_data *ifd;
1591b245f96cSGleb Smirnoff 
1592b245f96cSGleb Smirnoff 	ifm = (struct if_msghdr *)w->w_tmem;
15936d076ae8SBjoern A. Zeeb 
15946d076ae8SBjoern A. Zeeb #ifdef COMPAT_FREEBSD32
15956d076ae8SBjoern A. Zeeb 	if (w->w_req->flags & SCTL_MASK32) {
15966d076ae8SBjoern A. Zeeb 		struct if_msghdr32 *ifm32;
15976d076ae8SBjoern A. Zeeb 
1598b245f96cSGleb Smirnoff 		ifm32 = (struct if_msghdr32 *)ifm;
15996d076ae8SBjoern A. Zeeb 		ifm32->ifm_addrs = info->rti_addrs;
16006d076ae8SBjoern A. Zeeb 		ifm32->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
16016d076ae8SBjoern A. Zeeb 		ifm32->ifm_index = ifp->if_index;
1602b245f96cSGleb Smirnoff 		ifd = &ifm32->ifm_data;
1603b245f96cSGleb Smirnoff 	} else
16046d076ae8SBjoern A. Zeeb #endif
1605b245f96cSGleb Smirnoff 	{
16066d076ae8SBjoern A. Zeeb 		ifm->ifm_addrs = info->rti_addrs;
16076d076ae8SBjoern A. Zeeb 		ifm->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
16086d076ae8SBjoern A. Zeeb 		ifm->ifm_index = ifp->if_index;
1609b245f96cSGleb Smirnoff 		ifd = &ifm->ifm_data;
1610b245f96cSGleb Smirnoff 	}
16116d076ae8SBjoern A. Zeeb 
1612*e6485f73SGleb Smirnoff 	if_data_copy(ifp, ifd);
16132d70c0deSGleb Smirnoff 
16142d70c0deSGleb Smirnoff 	/* Some drivers still use ifqueue(9), add its stats. */
16152d70c0deSGleb Smirnoff 	ifd->ifi_oqdrops += ifp->if_snd.ifq_drops;
16166d076ae8SBjoern A. Zeeb 
16176d076ae8SBjoern A. Zeeb 	return (SYSCTL_OUT(w->w_req, (caddr_t)ifm, len));
16186d076ae8SBjoern A. Zeeb }
16196d076ae8SBjoern A. Zeeb 
16206d076ae8SBjoern A. Zeeb static int
16216d076ae8SBjoern A. Zeeb sysctl_iflist_ifaml(struct ifaddr *ifa, struct rt_addrinfo *info,
16226d076ae8SBjoern A. Zeeb     struct walkarg *w, int len)
16236d076ae8SBjoern A. Zeeb {
16246d076ae8SBjoern A. Zeeb 	struct ifa_msghdrl *ifam;
1625b245f96cSGleb Smirnoff 	struct if_data *ifd;
1626b245f96cSGleb Smirnoff 
1627b245f96cSGleb Smirnoff 	ifam = (struct ifa_msghdrl *)w->w_tmem;
16286d076ae8SBjoern A. Zeeb 
16296d076ae8SBjoern A. Zeeb #ifdef COMPAT_FREEBSD32
16306d076ae8SBjoern A. Zeeb 	if (w->w_req->flags & SCTL_MASK32) {
16316d076ae8SBjoern A. Zeeb 		struct ifa_msghdrl32 *ifam32;
16326d076ae8SBjoern A. Zeeb 
1633b245f96cSGleb Smirnoff 		ifam32 = (struct ifa_msghdrl32 *)ifam;
16346d076ae8SBjoern A. Zeeb 		ifam32->ifam_addrs = info->rti_addrs;
16356d076ae8SBjoern A. Zeeb 		ifam32->ifam_flags = ifa->ifa_flags;
16366d076ae8SBjoern A. Zeeb 		ifam32->ifam_index = ifa->ifa_ifp->if_index;
16376d076ae8SBjoern A. Zeeb 		ifam32->_ifam_spare1 = 0;
16386d076ae8SBjoern A. Zeeb 		ifam32->ifam_len = sizeof(*ifam32);
16396d076ae8SBjoern A. Zeeb 		ifam32->ifam_data_off =
16406d076ae8SBjoern A. Zeeb 		    offsetof(struct ifa_msghdrl32, ifam_data);
16419753faf5SGleb Smirnoff 		ifam32->ifam_metric = ifa->ifa_ifp->if_metric;
1642b245f96cSGleb Smirnoff 		ifd = &ifam32->ifam_data;
1643b245f96cSGleb Smirnoff 	} else
16446d076ae8SBjoern A. Zeeb #endif
1645b245f96cSGleb Smirnoff 	{
16466d076ae8SBjoern A. Zeeb 		ifam->ifam_addrs = info->rti_addrs;
16476d076ae8SBjoern A. Zeeb 		ifam->ifam_flags = ifa->ifa_flags;
16486d076ae8SBjoern A. Zeeb 		ifam->ifam_index = ifa->ifa_ifp->if_index;
16496d076ae8SBjoern A. Zeeb 		ifam->_ifam_spare1 = 0;
16506d076ae8SBjoern A. Zeeb 		ifam->ifam_len = sizeof(*ifam);
16516d076ae8SBjoern A. Zeeb 		ifam->ifam_data_off = offsetof(struct ifa_msghdrl, ifam_data);
16529753faf5SGleb Smirnoff 		ifam->ifam_metric = ifa->ifa_ifp->if_metric;
1653b245f96cSGleb Smirnoff 		ifd = &ifam->ifam_data;
1654b245f96cSGleb Smirnoff 	}
16556d076ae8SBjoern A. Zeeb 
1656b245f96cSGleb Smirnoff 	bzero(ifd, sizeof(*ifd));
1657b245f96cSGleb Smirnoff 	ifd->ifi_datalen = sizeof(struct if_data);
1658b245f96cSGleb Smirnoff 	ifd->ifi_ipackets = counter_u64_fetch(ifa->ifa_ipackets);
1659b245f96cSGleb Smirnoff 	ifd->ifi_opackets = counter_u64_fetch(ifa->ifa_opackets);
1660b245f96cSGleb Smirnoff 	ifd->ifi_ibytes = counter_u64_fetch(ifa->ifa_ibytes);
1661b245f96cSGleb Smirnoff 	ifd->ifi_obytes = counter_u64_fetch(ifa->ifa_obytes);
16627caf4ab7SGleb Smirnoff 
16636d076ae8SBjoern A. Zeeb 	/* Fixup if_data carp(4) vhid. */
16646d076ae8SBjoern A. Zeeb 	if (carp_get_vhid_p != NULL)
1665b245f96cSGleb Smirnoff 		ifd->ifi_vhid = (*carp_get_vhid_p)(ifa);
16666d076ae8SBjoern A. Zeeb 
16676d076ae8SBjoern A. Zeeb 	return (SYSCTL_OUT(w->w_req, w->w_tmem, len));
16686d076ae8SBjoern A. Zeeb }
16696d076ae8SBjoern A. Zeeb 
16706d076ae8SBjoern A. Zeeb static int
16716d076ae8SBjoern A. Zeeb sysctl_iflist_ifam(struct ifaddr *ifa, struct rt_addrinfo *info,
16726d076ae8SBjoern A. Zeeb     struct walkarg *w, int len)
16736d076ae8SBjoern A. Zeeb {
16746d076ae8SBjoern A. Zeeb 	struct ifa_msghdr *ifam;
16756d076ae8SBjoern A. Zeeb 
16766d076ae8SBjoern A. Zeeb 	ifam = (struct ifa_msghdr *)w->w_tmem;
16776d076ae8SBjoern A. Zeeb 	ifam->ifam_addrs = info->rti_addrs;
16786d076ae8SBjoern A. Zeeb 	ifam->ifam_flags = ifa->ifa_flags;
16796d076ae8SBjoern A. Zeeb 	ifam->ifam_index = ifa->ifa_ifp->if_index;
16809753faf5SGleb Smirnoff 	ifam->ifam_metric = ifa->ifa_ifp->if_metric;
16816d076ae8SBjoern A. Zeeb 
16826d076ae8SBjoern A. Zeeb 	return (SYSCTL_OUT(w->w_req, w->w_tmem, len));
16836d076ae8SBjoern A. Zeeb }
16846d076ae8SBjoern A. Zeeb 
16856d076ae8SBjoern A. Zeeb static int
1686becc44d7SSam Leffler sysctl_iflist(int af, struct walkarg *w)
1687df8bae1dSRodney W. Grimes {
1688becc44d7SSam Leffler 	struct ifnet *ifp;
1689becc44d7SSam Leffler 	struct ifaddr *ifa;
1690df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
1691df8bae1dSRodney W. Grimes 	int len, error = 0;
16923deb3649SAlexander V. Chernikov 	struct sockaddr_storage ss;
1693df8bae1dSRodney W. Grimes 
1694df8bae1dSRodney W. Grimes 	bzero((caddr_t)&info, sizeof(info));
16955c9fa630SHiroki Sato 	IFNET_RLOCK_NOSLEEP();
1696603724d3SBjoern A. Zeeb 	TAILQ_FOREACH(ifp, &V_ifnet, if_link) {
1697df8bae1dSRodney W. Grimes 		if (w->w_arg && w->w_arg != ifp->if_index)
1698df8bae1dSRodney W. Grimes 			continue;
1699137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
17004a0d6638SRuslan Ermilov 		ifa = ifp->if_addr;
1701becc44d7SSam Leffler 		info.rti_info[RTAX_IFP] = ifa->ifa_addr;
1702f2e5eb36SAlexander V. Chernikov 		error = rtsock_msg_buffer(RTM_IFINFO, &info, w, &len);
1703f2e5eb36SAlexander V. Chernikov 		if (error != 0)
1704f2e5eb36SAlexander V. Chernikov 			goto done;
17055dfc91d7SLuigi Rizzo 		info.rti_info[RTAX_IFP] = NULL;
170652041295SPoul-Henning Kamp 		if (w->w_req && w->w_tmem) {
17076d076ae8SBjoern A. Zeeb 			if (w->w_op == NET_RT_IFLISTL)
17086d076ae8SBjoern A. Zeeb 				error = sysctl_iflist_ifml(ifp, &info, w, len);
17096d076ae8SBjoern A. Zeeb 			else
17106d076ae8SBjoern A. Zeeb 				error = sysctl_iflist_ifm(ifp, &info, w, len);
1711df440948SPoul-Henning Kamp 			if (error)
1712a35b06c5SJonathan Lemon 				goto done;
1713df8bae1dSRodney W. Grimes 		}
17145dfc91d7SLuigi Rizzo 		while ((ifa = TAILQ_NEXT(ifa, ifa_link)) != NULL) {
1715df8bae1dSRodney W. Grimes 			if (af && af != ifa->ifa_addr->sa_family)
1716df8bae1dSRodney W. Grimes 				continue;
1717b89e82ddSJamie Gritton 			if (prison_if(w->w_req->td->td_ucred,
1718b89e82ddSJamie Gritton 			    ifa->ifa_addr) != 0)
171975c13541SPoul-Henning Kamp 				continue;
1720becc44d7SSam Leffler 			info.rti_info[RTAX_IFA] = ifa->ifa_addr;
17213deb3649SAlexander V. Chernikov 			info.rti_info[RTAX_NETMASK] = rtsock_fix_netmask(
17223deb3649SAlexander V. Chernikov 			    ifa->ifa_addr, ifa->ifa_netmask, &ss);
1723becc44d7SSam Leffler 			info.rti_info[RTAX_BRD] = ifa->ifa_dstaddr;
1724f2e5eb36SAlexander V. Chernikov 			error = rtsock_msg_buffer(RTM_NEWADDR, &info, w, &len);
1725f2e5eb36SAlexander V. Chernikov 			if (error != 0)
1726f2e5eb36SAlexander V. Chernikov 				goto done;
172752041295SPoul-Henning Kamp 			if (w->w_req && w->w_tmem) {
17286d076ae8SBjoern A. Zeeb 				if (w->w_op == NET_RT_IFLISTL)
17296d076ae8SBjoern A. Zeeb 					error = sysctl_iflist_ifaml(ifa, &info,
17306d076ae8SBjoern A. Zeeb 					    w, len);
17316d076ae8SBjoern A. Zeeb 				else
17326d076ae8SBjoern A. Zeeb 					error = sysctl_iflist_ifam(ifa, &info,
17336d076ae8SBjoern A. Zeeb 					    w, len);
1734df440948SPoul-Henning Kamp 				if (error)
1735a35b06c5SJonathan Lemon 					goto done;
1736df8bae1dSRodney W. Grimes 			}
1737df8bae1dSRodney W. Grimes 		}
1738137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
17393deb3649SAlexander V. Chernikov 		info.rti_info[RTAX_IFA] = NULL;
17403deb3649SAlexander V. Chernikov 		info.rti_info[RTAX_NETMASK] = NULL;
17415dfc91d7SLuigi Rizzo 		info.rti_info[RTAX_BRD] = NULL;
1742df8bae1dSRodney W. Grimes 	}
1743a35b06c5SJonathan Lemon done:
1744ee7c7feeSBjoern A. Zeeb 	if (ifp != NULL)
1745137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
17465c9fa630SHiroki Sato 	IFNET_RUNLOCK_NOSLEEP();
1747a35b06c5SJonathan Lemon 	return (error);
1748df8bae1dSRodney W. Grimes }
1749df8bae1dSRodney W. Grimes 
1750ebda3fc3SBjoern A. Zeeb static int
17519b98ee2cSLuigi Rizzo sysctl_ifmalist(int af, struct walkarg *w)
175205b2efe0SBruce M Simpson {
17539b98ee2cSLuigi Rizzo 	struct ifnet *ifp;
175405b2efe0SBruce M Simpson 	struct ifmultiaddr *ifma;
175505b2efe0SBruce M Simpson 	struct	rt_addrinfo info;
175605b2efe0SBruce M Simpson 	int	len, error = 0;
17579b98ee2cSLuigi Rizzo 	struct ifaddr *ifa;
175805b2efe0SBruce M Simpson 
175905b2efe0SBruce M Simpson 	bzero((caddr_t)&info, sizeof(info));
17605c9fa630SHiroki Sato 	IFNET_RLOCK_NOSLEEP();
1761603724d3SBjoern A. Zeeb 	TAILQ_FOREACH(ifp, &V_ifnet, if_link) {
176205b2efe0SBruce M Simpson 		if (w->w_arg && w->w_arg != ifp->if_index)
176305b2efe0SBruce M Simpson 			continue;
17644a0d6638SRuslan Ermilov 		ifa = ifp->if_addr;
1765913af518SLuigi Rizzo 		info.rti_info[RTAX_IFP] = ifa ? ifa->ifa_addr : NULL;
1766137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
176705b2efe0SBruce M Simpson 		TAILQ_FOREACH(ifma, &ifp->if_multiaddrs, ifma_link) {
176805b2efe0SBruce M Simpson 			if (af && af != ifma->ifma_addr->sa_family)
176905b2efe0SBruce M Simpson 				continue;
1770b89e82ddSJamie Gritton 			if (prison_if(w->w_req->td->td_ucred,
1771b89e82ddSJamie Gritton 			    ifma->ifma_addr) != 0)
177205b2efe0SBruce M Simpson 				continue;
177305b2efe0SBruce M Simpson 			info.rti_info[RTAX_IFA] = ifma->ifma_addr;
1774913af518SLuigi Rizzo 			info.rti_info[RTAX_GATEWAY] =
1775913af518SLuigi Rizzo 			    (ifma->ifma_addr->sa_family != AF_LINK) ?
1776913af518SLuigi Rizzo 			    ifma->ifma_lladdr : NULL;
1777c9f98940SAlexander V. Chernikov 			error = rtsock_msg_buffer(RTM_NEWMADDR, &info, w, &len);
1778f2e5eb36SAlexander V. Chernikov 			if (error != 0)
1779f2e5eb36SAlexander V. Chernikov 				goto done;
178005b2efe0SBruce M Simpson 			if (w->w_req && w->w_tmem) {
17819b98ee2cSLuigi Rizzo 				struct ifma_msghdr *ifmam;
178205b2efe0SBruce M Simpson 
178305b2efe0SBruce M Simpson 				ifmam = (struct ifma_msghdr *)w->w_tmem;
178405b2efe0SBruce M Simpson 				ifmam->ifmam_index = ifma->ifma_ifp->if_index;
178505b2efe0SBruce M Simpson 				ifmam->ifmam_flags = 0;
178605b2efe0SBruce M Simpson 				ifmam->ifmam_addrs = info.rti_addrs;
178705b2efe0SBruce M Simpson 				error = SYSCTL_OUT(w->w_req, w->w_tmem, len);
1788fe0fc7efSChristian S.J. Peron 				if (error) {
1789137f91e8SJohn Baldwin 					IF_ADDR_RUNLOCK(ifp);
179005b2efe0SBruce M Simpson 					goto done;
179105b2efe0SBruce M Simpson 				}
179205b2efe0SBruce M Simpson 			}
179305b2efe0SBruce M Simpson 		}
1794137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
1795fe0fc7efSChristian S.J. Peron 	}
179605b2efe0SBruce M Simpson done:
17975c9fa630SHiroki Sato 	IFNET_RUNLOCK_NOSLEEP();
179805b2efe0SBruce M Simpson 	return (error);
179905b2efe0SBruce M Simpson }
180005b2efe0SBruce M Simpson 
180152041295SPoul-Henning Kamp static int
180282d9ae4eSPoul-Henning Kamp sysctl_rtsock(SYSCTL_HANDLER_ARGS)
1803df8bae1dSRodney W. Grimes {
180452041295SPoul-Henning Kamp 	int	*name = (int *)arg1;
180552041295SPoul-Henning Kamp 	u_int	namelen = arg2;
1806c2c2a7c1SBjoern A. Zeeb 	struct radix_node_head *rnh = NULL; /* silence compiler. */
1807fe0fc7efSChristian S.J. Peron 	int	i, lim, error = EINVAL;
18084825b1e0SHiroki Sato 	int	fib = 0;
1809df8bae1dSRodney W. Grimes 	u_char	af;
1810df8bae1dSRodney W. Grimes 	struct	walkarg w;
1811df8bae1dSRodney W. Grimes 
181252041295SPoul-Henning Kamp 	name ++;
181352041295SPoul-Henning Kamp 	namelen--;
181452041295SPoul-Henning Kamp 	if (req->newptr)
1815df8bae1dSRodney W. Grimes 		return (EPERM);
18164825b1e0SHiroki Sato 	if (name[1] == NET_RT_DUMP) {
18174825b1e0SHiroki Sato 		if (namelen == 3)
18184825b1e0SHiroki Sato 			fib = req->td->td_proc->p_fibnum;
18194825b1e0SHiroki Sato 		else if (namelen == 4)
18207d9b6df1SAlexander V. Chernikov 			fib = (name[3] == RT_ALL_FIBS) ?
18214825b1e0SHiroki Sato 			    req->td->td_proc->p_fibnum : name[3];
18224825b1e0SHiroki Sato 		else
18234825b1e0SHiroki Sato 			return ((namelen < 3) ? EISDIR : ENOTDIR);
18244825b1e0SHiroki Sato 		if (fib < 0 || fib >= rt_numfibs)
18254825b1e0SHiroki Sato 			return (EINVAL);
18264825b1e0SHiroki Sato 	} else if (namelen != 3)
1827f7a54d06SCrist J. Clark 		return ((namelen < 3) ? EISDIR : ENOTDIR);
1828df8bae1dSRodney W. Grimes 	af = name[0];
1829b2aaf46eSJeffrey Hsu 	if (af > AF_MAX)
1830b2aaf46eSJeffrey Hsu 		return (EINVAL);
18316b96f1afSLuigi Rizzo 	bzero(&w, sizeof(w));
1832df8bae1dSRodney W. Grimes 	w.w_op = name[1];
1833df8bae1dSRodney W. Grimes 	w.w_arg = name[2];
183452041295SPoul-Henning Kamp 	w.w_req = req;
1835df8bae1dSRodney W. Grimes 
1836fe0fc7efSChristian S.J. Peron 	error = sysctl_wire_old_buffer(req, 0);
1837fe0fc7efSChristian S.J. Peron 	if (error)
1838fe0fc7efSChristian S.J. Peron 		return (error);
1839f2e5eb36SAlexander V. Chernikov 
1840f2e5eb36SAlexander V. Chernikov 	/*
1841f2e5eb36SAlexander V. Chernikov 	 * Allocate reply buffer in advance.
1842f2e5eb36SAlexander V. Chernikov 	 * All rtsock messages has maximum length of u_short.
1843f2e5eb36SAlexander V. Chernikov 	 */
1844f2e5eb36SAlexander V. Chernikov 	w.w_tmemsize = 65536;
1845f2e5eb36SAlexander V. Chernikov 	w.w_tmem = malloc(w.w_tmemsize, M_TEMP, M_WAITOK);
1846f2e5eb36SAlexander V. Chernikov 
1847df8bae1dSRodney W. Grimes 	switch (w.w_op) {
1848df8bae1dSRodney W. Grimes 
1849df8bae1dSRodney W. Grimes 	case NET_RT_DUMP:
1850df8bae1dSRodney W. Grimes 	case NET_RT_FLAGS:
1851a8b76c8fSLuigi Rizzo 		if (af == 0) {			/* dump all tables */
1852a8b76c8fSLuigi Rizzo 			i = 1;
1853a8b76c8fSLuigi Rizzo 			lim = AF_MAX;
1854a8b76c8fSLuigi Rizzo 		} else				/* dump only one table */
1855a8b76c8fSLuigi Rizzo 			i = lim = af;
18568eca593cSQing Li 
18578eca593cSQing Li 		/*
18588eca593cSQing Li 		 * take care of llinfo entries, the caller must
18598eca593cSQing Li 		 * specify an AF
18608eca593cSQing Li 		 */
186114981d80SQing Li 		if (w.w_op == NET_RT_FLAGS &&
186282b334e8SQing Li 		    (w.w_arg == 0 || w.w_arg & RTF_LLINFO)) {
18638eca593cSQing Li 			if (af != 0)
18648eca593cSQing Li 				error = lltable_sysctl_dumparp(af, w.w_req);
18658eca593cSQing Li 			else
18668eca593cSQing Li 				error = EINVAL;
18678eca593cSQing Li 			break;
18688eca593cSQing Li 		}
18698eca593cSQing Li 		/*
18708eca593cSQing Li 		 * take care of routing entries
18718eca593cSQing Li 		 */
187220b0cdb7SBjoern A. Zeeb 		for (error = 0; error == 0 && i <= lim; i++) {
18734825b1e0SHiroki Sato 			rnh = rt_tables_get_rnh(fib, i);
1874c2c2a7c1SBjoern A. Zeeb 			if (rnh != NULL) {
1875c2508034SAlexander V. Chernikov 				RADIX_NODE_HEAD_RLOCK(rnh);
1876956b0b65SJeffrey Hsu 			    	error = rnh->rnh_walktree(rnh,
1877fe0fc7efSChristian S.J. Peron 				    sysctl_dumpentry, &w);
1878c2508034SAlexander V. Chernikov 				RADIX_NODE_HEAD_RUNLOCK(rnh);
1879a8b76c8fSLuigi Rizzo 			} else if (af != 0)
1880956b0b65SJeffrey Hsu 				error = EAFNOSUPPORT;
188120b0cdb7SBjoern A. Zeeb 		}
1882df8bae1dSRodney W. Grimes 		break;
1883df8bae1dSRodney W. Grimes 
1884df8bae1dSRodney W. Grimes 	case NET_RT_IFLIST:
18856d076ae8SBjoern A. Zeeb 	case NET_RT_IFLISTL:
1886df8bae1dSRodney W. Grimes 		error = sysctl_iflist(af, &w);
188705b2efe0SBruce M Simpson 		break;
188805b2efe0SBruce M Simpson 
188905b2efe0SBruce M Simpson 	case NET_RT_IFMALIST:
189005b2efe0SBruce M Simpson 		error = sysctl_ifmalist(af, &w);
189105b2efe0SBruce M Simpson 		break;
1892df8bae1dSRodney W. Grimes 	}
1893f2e5eb36SAlexander V. Chernikov 
1894f2e5eb36SAlexander V. Chernikov 	free(w.w_tmem, M_TEMP);
1895df8bae1dSRodney W. Grimes 	return (error);
1896df8bae1dSRodney W. Grimes }
1897df8bae1dSRodney W. Grimes 
18986472ac3dSEd Schouten static SYSCTL_NODE(_net, PF_ROUTE, routetable, CTLFLAG_RD, sysctl_rtsock, "");
189952041295SPoul-Henning Kamp 
1900df8bae1dSRodney W. Grimes /*
1901df8bae1dSRodney W. Grimes  * Definitions of protocols supported in the ROUTE domain.
1902df8bae1dSRodney W. Grimes  */
1903df8bae1dSRodney W. Grimes 
19045b1c0294SDavid E. O'Brien static struct domain routedomain;		/* or at least forward */
1905df8bae1dSRodney W. Grimes 
190652041295SPoul-Henning Kamp static struct protosw routesw[] = {
1907303989a2SRuslan Ermilov {
1908303989a2SRuslan Ermilov 	.pr_type =		SOCK_RAW,
1909303989a2SRuslan Ermilov 	.pr_domain =		&routedomain,
1910303989a2SRuslan Ermilov 	.pr_flags =		PR_ATOMIC|PR_ADDR,
1911303989a2SRuslan Ermilov 	.pr_output =		route_output,
1912303989a2SRuslan Ermilov 	.pr_ctlinput =		raw_ctlinput,
1913303989a2SRuslan Ermilov 	.pr_init =		raw_init,
1914303989a2SRuslan Ermilov 	.pr_usrreqs =		&route_usrreqs
1915df8bae1dSRodney W. Grimes }
1916df8bae1dSRodney W. Grimes };
1917df8bae1dSRodney W. Grimes 
1918303989a2SRuslan Ermilov static struct domain routedomain = {
1919303989a2SRuslan Ermilov 	.dom_family =		PF_ROUTE,
1920303989a2SRuslan Ermilov 	.dom_name =		 "route",
1921303989a2SRuslan Ermilov 	.dom_protosw =		routesw,
1922303989a2SRuslan Ermilov 	.dom_protoswNPROTOSW =	&routesw[sizeof(routesw)/sizeof(routesw[0])]
1923303989a2SRuslan Ermilov };
192478a82810SGarrett Wollman 
1925d0728d71SRobert Watson VNET_DOMAIN_SET(route);
1926