xref: /freebsd/sys/net/rtsock.c (revision 61eee0e202c2bda75971193c95d870e6148a6152)
1c398230bSWarner Losh /*-
2df8bae1dSRodney W. Grimes  * Copyright (c) 1988, 1991, 1993
3df8bae1dSRodney W. Grimes  *	The Regents of the University of California.  All rights reserved.
4df8bae1dSRodney W. Grimes  *
5df8bae1dSRodney W. Grimes  * Redistribution and use in source and binary forms, with or without
6df8bae1dSRodney W. Grimes  * modification, are permitted provided that the following conditions
7df8bae1dSRodney W. Grimes  * are met:
8df8bae1dSRodney W. Grimes  * 1. Redistributions of source code must retain the above copyright
9df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer.
10df8bae1dSRodney W. Grimes  * 2. Redistributions in binary form must reproduce the above copyright
11df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer in the
12df8bae1dSRodney W. Grimes  *    documentation and/or other materials provided with the distribution.
13df8bae1dSRodney W. Grimes  * 4. Neither the name of the University nor the names of its contributors
14df8bae1dSRodney W. Grimes  *    may be used to endorse or promote products derived from this software
15df8bae1dSRodney W. Grimes  *    without specific prior written permission.
16df8bae1dSRodney W. Grimes  *
17df8bae1dSRodney W. Grimes  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
18df8bae1dSRodney W. Grimes  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19df8bae1dSRodney W. Grimes  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20df8bae1dSRodney W. Grimes  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
21df8bae1dSRodney W. Grimes  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22df8bae1dSRodney W. Grimes  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23df8bae1dSRodney W. Grimes  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24df8bae1dSRodney W. Grimes  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25df8bae1dSRodney W. Grimes  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26df8bae1dSRodney W. Grimes  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27df8bae1dSRodney W. Grimes  * SUCH DAMAGE.
28df8bae1dSRodney W. Grimes  *
2928070a0eSRuslan Ermilov  *	@(#)rtsock.c	8.7 (Berkeley) 10/12/95
30c3aac50fSPeter Wemm  * $FreeBSD$
31df8bae1dSRodney W. Grimes  */
32427a928aSKonstantin Belousov #include "opt_compat.h"
33e440aed9SQing Li #include "opt_mpath.h"
34413628a7SBjoern A. Zeeb #include "opt_inet.h"
35413628a7SBjoern A. Zeeb #include "opt_inet6.h"
36e440aed9SQing Li 
37df8bae1dSRodney W. Grimes #include <sys/param.h>
38960ed29cSSeigo Tanimura #include <sys/jail.h>
39413628a7SBjoern A. Zeeb #include <sys/kernel.h>
40d0728d71SRobert Watson #include <sys/domain.h>
41609ff41fSWarner Losh #include <sys/lock.h>
424d1d4912SBruce Evans #include <sys/malloc.h>
43df8bae1dSRodney W. Grimes #include <sys/mbuf.h>
44acd3428bSRobert Watson #include <sys/priv.h>
45960ed29cSSeigo Tanimura #include <sys/proc.h>
46960ed29cSSeigo Tanimura #include <sys/protosw.h>
473120b9d4SKip Macy #include <sys/rwlock.h>
48960ed29cSSeigo Tanimura #include <sys/signalvar.h>
49df8bae1dSRodney W. Grimes #include <sys/socket.h>
50df8bae1dSRodney W. Grimes #include <sys/socketvar.h>
51960ed29cSSeigo Tanimura #include <sys/sysctl.h>
52960ed29cSSeigo Tanimura #include <sys/systm.h>
53df8bae1dSRodney W. Grimes 
54df8bae1dSRodney W. Grimes #include <net/if.h>
5576039bc8SGleb Smirnoff #include <net/if_var.h>
568eca593cSQing Li #include <net/if_dl.h>
576e6b3f7cSQing Li #include <net/if_llatbl.h>
580ed6142bSQing Li #include <net/if_types.h>
59d989c7b3SRobert Watson #include <net/netisr.h>
60df8bae1dSRodney W. Grimes #include <net/raw_cb.h>
61960ed29cSSeigo Tanimura #include <net/route.h>
62*61eee0e2SAlexander V. Chernikov #include <net/route_var.h>
634b79449eSBjoern A. Zeeb #include <net/vnet.h>
64df8bae1dSRodney W. Grimes 
655a59cefcSBosko Milekic #include <netinet/in.h>
66c7ab6602SQing Li #include <netinet/if_ether.h>
6708b68b0eSGleb Smirnoff #include <netinet/ip_carp.h>
68413628a7SBjoern A. Zeeb #ifdef INET6
690bebb544SHiroki Sato #include <netinet6/ip6_var.h>
70413628a7SBjoern A. Zeeb #include <netinet6/scope6_var.h>
71413628a7SBjoern A. Zeeb #endif
725a59cefcSBosko Milekic 
73427a928aSKonstantin Belousov #ifdef COMPAT_FREEBSD32
74427a928aSKonstantin Belousov #include <sys/mount.h>
75427a928aSKonstantin Belousov #include <compat/freebsd32/freebsd32.h>
76427a928aSKonstantin Belousov 
77427a928aSKonstantin Belousov struct if_msghdr32 {
78427a928aSKonstantin Belousov 	uint16_t ifm_msglen;
79427a928aSKonstantin Belousov 	uint8_t	ifm_version;
80427a928aSKonstantin Belousov 	uint8_t	ifm_type;
81427a928aSKonstantin Belousov 	int32_t	ifm_addrs;
82427a928aSKonstantin Belousov 	int32_t	ifm_flags;
83427a928aSKonstantin Belousov 	uint16_t ifm_index;
84b245f96cSGleb Smirnoff 	struct	if_data ifm_data;
85427a928aSKonstantin Belousov };
866d076ae8SBjoern A. Zeeb 
876d076ae8SBjoern A. Zeeb struct if_msghdrl32 {
886d076ae8SBjoern A. Zeeb 	uint16_t ifm_msglen;
896d076ae8SBjoern A. Zeeb 	uint8_t	ifm_version;
906d076ae8SBjoern A. Zeeb 	uint8_t	ifm_type;
916d076ae8SBjoern A. Zeeb 	int32_t	ifm_addrs;
926d076ae8SBjoern A. Zeeb 	int32_t	ifm_flags;
936d076ae8SBjoern A. Zeeb 	uint16_t ifm_index;
946d076ae8SBjoern A. Zeeb 	uint16_t _ifm_spare1;
956d076ae8SBjoern A. Zeeb 	uint16_t ifm_len;
966d076ae8SBjoern A. Zeeb 	uint16_t ifm_data_off;
97b245f96cSGleb Smirnoff 	struct	if_data ifm_data;
986d076ae8SBjoern A. Zeeb };
996d076ae8SBjoern A. Zeeb 
1006d076ae8SBjoern A. Zeeb struct ifa_msghdrl32 {
1016d076ae8SBjoern A. Zeeb 	uint16_t ifam_msglen;
1026d076ae8SBjoern A. Zeeb 	uint8_t	ifam_version;
1036d076ae8SBjoern A. Zeeb 	uint8_t	ifam_type;
1046d076ae8SBjoern A. Zeeb 	int32_t	ifam_addrs;
1056d076ae8SBjoern A. Zeeb 	int32_t	ifam_flags;
1066d076ae8SBjoern A. Zeeb 	uint16_t ifam_index;
1076d076ae8SBjoern A. Zeeb 	uint16_t _ifam_spare1;
1086d076ae8SBjoern A. Zeeb 	uint16_t ifam_len;
1096d076ae8SBjoern A. Zeeb 	uint16_t ifam_data_off;
1106d076ae8SBjoern A. Zeeb 	int32_t	ifam_metric;
111b245f96cSGleb Smirnoff 	struct	if_data ifam_data;
1126d076ae8SBjoern A. Zeeb };
1136d076ae8SBjoern A. Zeeb #endif /* COMPAT_FREEBSD32 */
114427a928aSKonstantin Belousov 
115a1c995b6SPoul-Henning Kamp MALLOC_DEFINE(M_RTABLE, "routetbl", "routing tables");
116a1c995b6SPoul-Henning Kamp 
117becc44d7SSam Leffler /* NB: these are not modified */
11852041295SPoul-Henning Kamp static struct	sockaddr route_src = { 2, PF_ROUTE, };
119076d0761SJulian Elischer static struct	sockaddr sa_zero   = { sizeof(sa_zero), AF_INET, };
120becc44d7SSam Leffler 
12108b68b0eSGleb Smirnoff /* These are external hooks for CARP. */
12208b68b0eSGleb Smirnoff int	(*carp_get_vhid_p)(struct ifaddr *);
12308b68b0eSGleb Smirnoff 
124528737fdSBjoern A. Zeeb /*
125528737fdSBjoern A. Zeeb  * Used by rtsock/raw_input callback code to decide whether to filter the update
126528737fdSBjoern A. Zeeb  * notification to a socket bound to a particular FIB.
127528737fdSBjoern A. Zeeb  */
128528737fdSBjoern A. Zeeb #define	RTS_FILTER_FIB	M_PROTO8
129528737fdSBjoern A. Zeeb 
130c5d4eab6SMarko Zec typedef struct {
13118aee723SPeter Pentchev 	int	ip_count;	/* attached w/ AF_INET */
132becc44d7SSam Leffler 	int	ip6_count;	/* attached w/ AF_INET6 */
133becc44d7SSam Leffler 	int	any_count;	/* total attached */
134c5d4eab6SMarko Zec } route_cb_t;
135c5d4eab6SMarko Zec static VNET_DEFINE(route_cb_t, route_cb);
136c5d4eab6SMarko Zec #define	V_route_cb VNET(route_cb)
137df8bae1dSRodney W. Grimes 
138aea8b30fSSam Leffler struct mtx rtsock_mtx;
139aea8b30fSSam Leffler MTX_SYSINIT(rtsock, &rtsock_mtx, "rtsock route_cb lock", MTX_DEF);
140aea8b30fSSam Leffler 
141aea8b30fSSam Leffler #define	RTSOCK_LOCK()	mtx_lock(&rtsock_mtx)
142aea8b30fSSam Leffler #define	RTSOCK_UNLOCK()	mtx_unlock(&rtsock_mtx)
143aea8b30fSSam Leffler #define	RTSOCK_LOCK_ASSERT()	mtx_assert(&rtsock_mtx, MA_OWNED)
144aea8b30fSSam Leffler 
1456472ac3dSEd Schouten static SYSCTL_NODE(_net, OID_AUTO, route, CTLFLAG_RD, 0, "");
146190a4c94SRobert Watson 
147df8bae1dSRodney W. Grimes struct walkarg {
14852041295SPoul-Henning Kamp 	int	w_tmemsize;
14952041295SPoul-Henning Kamp 	int	w_op, w_arg;
15052041295SPoul-Henning Kamp 	caddr_t	w_tmem;
15152041295SPoul-Henning Kamp 	struct sysctl_req *w_req;
152df8bae1dSRodney W. Grimes };
153df8bae1dSRodney W. Grimes 
154d989c7b3SRobert Watson static void	rts_input(struct mbuf *m);
1556db47af4SAlexander V. Chernikov static struct mbuf *rtsock_msg_mbuf(int type, struct rt_addrinfo *rtinfo);
156f2e5eb36SAlexander V. Chernikov static int	rtsock_msg_buffer(int type, struct rt_addrinfo *rtinfo,
157f2e5eb36SAlexander V. Chernikov 			struct walkarg *w, int *plen);
1585dfc91d7SLuigi Rizzo static int	rt_xaddrs(caddr_t cp, caddr_t cplim,
1595dfc91d7SLuigi Rizzo 			struct rt_addrinfo *rtinfo);
160929ddbbbSAlfred Perlstein static int	sysctl_dumpentry(struct radix_node *rn, void *vw);
161929ddbbbSAlfred Perlstein static int	sysctl_iflist(int af, struct walkarg *w);
16205b2efe0SBruce M Simpson static int	sysctl_ifmalist(int af, struct walkarg *w);
16373d76e77SKevin Lo static int	route_output(struct mbuf *m, struct socket *so, ...);
164e3a7aa6fSGleb Smirnoff static void	rt_getmetrics(const struct rtentry *rt, struct rt_metrics *out);
1653ca1a2d6SMax Laier static void	rt_dispatch(struct mbuf *, sa_family_t);
1663deb3649SAlexander V. Chernikov static struct sockaddr	*rtsock_fix_netmask(struct sockaddr *dst,
1673deb3649SAlexander V. Chernikov 			struct sockaddr *smask, struct sockaddr_storage *dmask);
168df8bae1dSRodney W. Grimes 
169d4b5cae4SRobert Watson static struct netisr_handler rtsock_nh = {
170d4b5cae4SRobert Watson 	.nh_name = "rtsock",
171d4b5cae4SRobert Watson 	.nh_handler = rts_input,
172d4b5cae4SRobert Watson 	.nh_proto = NETISR_ROUTE,
173d4b5cae4SRobert Watson 	.nh_policy = NETISR_POLICY_SOURCE,
174d4b5cae4SRobert Watson };
175d4b5cae4SRobert Watson 
176d4b5cae4SRobert Watson static int
177d4b5cae4SRobert Watson sysctl_route_netisr_maxqlen(SYSCTL_HANDLER_ARGS)
178d4b5cae4SRobert Watson {
179d4b5cae4SRobert Watson 	int error, qlimit;
180d4b5cae4SRobert Watson 
181d4b5cae4SRobert Watson 	netisr_getqlimit(&rtsock_nh, &qlimit);
182d4b5cae4SRobert Watson 	error = sysctl_handle_int(oidp, &qlimit, 0, req);
183d4b5cae4SRobert Watson         if (error || !req->newptr)
184d4b5cae4SRobert Watson                 return (error);
185d4b5cae4SRobert Watson 	if (qlimit < 1)
186d4b5cae4SRobert Watson 		return (EINVAL);
187d4b5cae4SRobert Watson 	return (netisr_setqlimit(&rtsock_nh, qlimit));
188d4b5cae4SRobert Watson }
189d4b5cae4SRobert Watson SYSCTL_PROC(_net_route, OID_AUTO, netisr_maxqlen, CTLTYPE_INT|CTLFLAG_RW,
190d4b5cae4SRobert Watson     0, 0, sysctl_route_netisr_maxqlen, "I",
191d4b5cae4SRobert Watson     "maximum routing socket dispatch queue length");
192d4b5cae4SRobert Watson 
193d989c7b3SRobert Watson static void
194d989c7b3SRobert Watson rts_init(void)
195d989c7b3SRobert Watson {
196b062951aSRobert Watson 	int tmp;
197d989c7b3SRobert Watson 
198b062951aSRobert Watson 	if (TUNABLE_INT_FETCH("net.route.netisr_maxqlen", &tmp))
199d4b5cae4SRobert Watson 		rtsock_nh.nh_qlimit = tmp;
200d4b5cae4SRobert Watson 	netisr_register(&rtsock_nh);
201d989c7b3SRobert Watson }
202237fdd78SRobert Watson SYSINIT(rtsock, SI_SUB_PROTO_DOMAIN, SI_ORDER_THIRD, rts_init, 0);
203d989c7b3SRobert Watson 
204528737fdSBjoern A. Zeeb static int
205528737fdSBjoern A. Zeeb raw_input_rts_cb(struct mbuf *m, struct sockproto *proto, struct sockaddr *src,
206528737fdSBjoern A. Zeeb     struct rawcb *rp)
207528737fdSBjoern A. Zeeb {
208528737fdSBjoern A. Zeeb 	int fibnum;
209528737fdSBjoern A. Zeeb 
210528737fdSBjoern A. Zeeb 	KASSERT(m != NULL, ("%s: m is NULL", __func__));
211528737fdSBjoern A. Zeeb 	KASSERT(proto != NULL, ("%s: proto is NULL", __func__));
212528737fdSBjoern A. Zeeb 	KASSERT(rp != NULL, ("%s: rp is NULL", __func__));
213528737fdSBjoern A. Zeeb 
214528737fdSBjoern A. Zeeb 	/* No filtering requested. */
215528737fdSBjoern A. Zeeb 	if ((m->m_flags & RTS_FILTER_FIB) == 0)
216528737fdSBjoern A. Zeeb 		return (0);
217528737fdSBjoern A. Zeeb 
218528737fdSBjoern A. Zeeb 	/* Check if it is a rts and the fib matches the one of the socket. */
219528737fdSBjoern A. Zeeb 	fibnum = M_GETFIB(m);
220528737fdSBjoern A. Zeeb 	if (proto->sp_family != PF_ROUTE ||
221528737fdSBjoern A. Zeeb 	    rp->rcb_socket == NULL ||
222528737fdSBjoern A. Zeeb 	    rp->rcb_socket->so_fibnum == fibnum)
223528737fdSBjoern A. Zeeb 		return (0);
224528737fdSBjoern A. Zeeb 
225528737fdSBjoern A. Zeeb 	/* Filtering requested and no match, the socket shall be skipped. */
226528737fdSBjoern A. Zeeb 	return (1);
227528737fdSBjoern A. Zeeb }
228528737fdSBjoern A. Zeeb 
229d989c7b3SRobert Watson static void
230d989c7b3SRobert Watson rts_input(struct mbuf *m)
231d989c7b3SRobert Watson {
232d989c7b3SRobert Watson 	struct sockproto route_proto;
233d989c7b3SRobert Watson 	unsigned short *family;
234d989c7b3SRobert Watson 	struct m_tag *tag;
235d989c7b3SRobert Watson 
236d989c7b3SRobert Watson 	route_proto.sp_family = PF_ROUTE;
237d989c7b3SRobert Watson 	tag = m_tag_find(m, PACKET_TAG_RTSOCKFAM, NULL);
238d989c7b3SRobert Watson 	if (tag != NULL) {
239d989c7b3SRobert Watson 		family = (unsigned short *)(tag + 1);
240d989c7b3SRobert Watson 		route_proto.sp_protocol = *family;
241d989c7b3SRobert Watson 		m_tag_delete(m, tag);
242d989c7b3SRobert Watson 	} else
243d989c7b3SRobert Watson 		route_proto.sp_protocol = 0;
244d989c7b3SRobert Watson 
245528737fdSBjoern A. Zeeb 	raw_input_ext(m, &route_proto, &route_src, raw_input_rts_cb);
246d989c7b3SRobert Watson }
247d989c7b3SRobert Watson 
248a29f300eSGarrett Wollman /*
249a29f300eSGarrett Wollman  * It really doesn't make any sense at all for this code to share much
250a29f300eSGarrett Wollman  * with raw_usrreq.c, since its functionality is so restricted.  XXX
251a29f300eSGarrett Wollman  */
252ac45e92fSRobert Watson static void
253a29f300eSGarrett Wollman rts_abort(struct socket *so)
254df8bae1dSRodney W. Grimes {
2557e994955SRobert Watson 
256ac45e92fSRobert Watson 	raw_usrreqs.pru_abort(so);
257df8bae1dSRodney W. Grimes }
258a29f300eSGarrett Wollman 
259a152f8a3SRobert Watson static void
260a152f8a3SRobert Watson rts_close(struct socket *so)
261a152f8a3SRobert Watson {
262a152f8a3SRobert Watson 
263a152f8a3SRobert Watson 	raw_usrreqs.pru_close(so);
264a152f8a3SRobert Watson }
265a152f8a3SRobert Watson 
266a29f300eSGarrett Wollman /* pru_accept is EOPNOTSUPP */
267a29f300eSGarrett Wollman 
268a29f300eSGarrett Wollman static int
269b40ce416SJulian Elischer rts_attach(struct socket *so, int proto, struct thread *td)
270a29f300eSGarrett Wollman {
271a29f300eSGarrett Wollman 	struct rawcb *rp;
272c9b652e3SAndre Oppermann 	int error;
273a29f300eSGarrett Wollman 
274bc725eafSRobert Watson 	KASSERT(so->so_pcb == NULL, ("rts_attach: so_pcb != NULL"));
275bc725eafSRobert Watson 
2767cc0979fSDavid Malone 	/* XXX */
2771ede983cSDag-Erling Smørgrav 	rp = malloc(sizeof *rp, M_PCB, M_WAITOK | M_ZERO);
2785dfc91d7SLuigi Rizzo 	if (rp == NULL)
279a29f300eSGarrett Wollman 		return ENOBUFS;
280a29f300eSGarrett Wollman 
281a29f300eSGarrett Wollman 	so->so_pcb = (caddr_t)rp;
2828b07e49aSJulian Elischer 	so->so_fibnum = td->td_proc->p_fibnum;
283162c0b2eSRuslan Ermilov 	error = raw_attach(so, proto);
284a29f300eSGarrett Wollman 	rp = sotorawcb(so);
285a29f300eSGarrett Wollman 	if (error) {
2867ba271aeSJonathan Chen 		so->so_pcb = NULL;
287a29f300eSGarrett Wollman 		free(rp, M_PCB);
288a29f300eSGarrett Wollman 		return error;
289a29f300eSGarrett Wollman 	}
290aea8b30fSSam Leffler 	RTSOCK_LOCK();
291a29f300eSGarrett Wollman 	switch(rp->rcb_proto.sp_protocol) {
292a29f300eSGarrett Wollman 	case AF_INET:
293c5d4eab6SMarko Zec 		V_route_cb.ip_count++;
294a29f300eSGarrett Wollman 		break;
295899ce4f4SYoshinobu Inoue 	case AF_INET6:
296c5d4eab6SMarko Zec 		V_route_cb.ip6_count++;
297899ce4f4SYoshinobu Inoue 		break;
298a29f300eSGarrett Wollman 	}
299c5d4eab6SMarko Zec 	V_route_cb.any_count++;
300aea8b30fSSam Leffler 	RTSOCK_UNLOCK();
30103e49181SSeigo Tanimura 	soisconnected(so);
302df8bae1dSRodney W. Grimes 	so->so_options |= SO_USELOOPBACK;
303a29f300eSGarrett Wollman 	return 0;
304df8bae1dSRodney W. Grimes }
305df8bae1dSRodney W. Grimes 
306a29f300eSGarrett Wollman static int
307b40ce416SJulian Elischer rts_bind(struct socket *so, struct sockaddr *nam, struct thread *td)
308a29f300eSGarrett Wollman {
3097e994955SRobert Watson 
3107e994955SRobert Watson 	return (raw_usrreqs.pru_bind(so, nam, td)); /* xxx just EINVAL */
311a29f300eSGarrett Wollman }
312a29f300eSGarrett Wollman 
313a29f300eSGarrett Wollman static int
314b40ce416SJulian Elischer rts_connect(struct socket *so, struct sockaddr *nam, struct thread *td)
315a29f300eSGarrett Wollman {
3167e994955SRobert Watson 
3177e994955SRobert Watson 	return (raw_usrreqs.pru_connect(so, nam, td)); /* XXX just EINVAL */
318a29f300eSGarrett Wollman }
319a29f300eSGarrett Wollman 
320a29f300eSGarrett Wollman /* pru_connect2 is EOPNOTSUPP */
321a29f300eSGarrett Wollman /* pru_control is EOPNOTSUPP */
322a29f300eSGarrett Wollman 
323bc725eafSRobert Watson static void
324a29f300eSGarrett Wollman rts_detach(struct socket *so)
325a29f300eSGarrett Wollman {
326a29f300eSGarrett Wollman 	struct rawcb *rp = sotorawcb(so);
327a29f300eSGarrett Wollman 
328bc725eafSRobert Watson 	KASSERT(rp != NULL, ("rts_detach: rp == NULL"));
329bc725eafSRobert Watson 
330aea8b30fSSam Leffler 	RTSOCK_LOCK();
331a29f300eSGarrett Wollman 	switch(rp->rcb_proto.sp_protocol) {
332a29f300eSGarrett Wollman 	case AF_INET:
333c5d4eab6SMarko Zec 		V_route_cb.ip_count--;
334a29f300eSGarrett Wollman 		break;
335899ce4f4SYoshinobu Inoue 	case AF_INET6:
336c5d4eab6SMarko Zec 		V_route_cb.ip6_count--;
337899ce4f4SYoshinobu Inoue 		break;
338a29f300eSGarrett Wollman 	}
339c5d4eab6SMarko Zec 	V_route_cb.any_count--;
340aea8b30fSSam Leffler 	RTSOCK_UNLOCK();
341bc725eafSRobert Watson 	raw_usrreqs.pru_detach(so);
342a29f300eSGarrett Wollman }
343a29f300eSGarrett Wollman 
344a29f300eSGarrett Wollman static int
345a29f300eSGarrett Wollman rts_disconnect(struct socket *so)
346a29f300eSGarrett Wollman {
3477e994955SRobert Watson 
3487e994955SRobert Watson 	return (raw_usrreqs.pru_disconnect(so));
349a29f300eSGarrett Wollman }
350a29f300eSGarrett Wollman 
351a29f300eSGarrett Wollman /* pru_listen is EOPNOTSUPP */
352a29f300eSGarrett Wollman 
353a29f300eSGarrett Wollman static int
35457bf258eSGarrett Wollman rts_peeraddr(struct socket *so, struct sockaddr **nam)
355a29f300eSGarrett Wollman {
3567e994955SRobert Watson 
3577e994955SRobert Watson 	return (raw_usrreqs.pru_peeraddr(so, nam));
358a29f300eSGarrett Wollman }
359a29f300eSGarrett Wollman 
360a29f300eSGarrett Wollman /* pru_rcvd is EOPNOTSUPP */
361a29f300eSGarrett Wollman /* pru_rcvoob is EOPNOTSUPP */
362a29f300eSGarrett Wollman 
363a29f300eSGarrett Wollman static int
36457bf258eSGarrett Wollman rts_send(struct socket *so, int flags, struct mbuf *m, struct sockaddr *nam,
365b40ce416SJulian Elischer 	 struct mbuf *control, struct thread *td)
366a29f300eSGarrett Wollman {
3677e994955SRobert Watson 
3687e994955SRobert Watson 	return (raw_usrreqs.pru_send(so, flags, m, nam, control, td));
369a29f300eSGarrett Wollman }
370a29f300eSGarrett Wollman 
371a29f300eSGarrett Wollman /* pru_sense is null */
372a29f300eSGarrett Wollman 
373a29f300eSGarrett Wollman static int
374a29f300eSGarrett Wollman rts_shutdown(struct socket *so)
375a29f300eSGarrett Wollman {
3767e994955SRobert Watson 
3777e994955SRobert Watson 	return (raw_usrreqs.pru_shutdown(so));
378a29f300eSGarrett Wollman }
379a29f300eSGarrett Wollman 
380a29f300eSGarrett Wollman static int
38157bf258eSGarrett Wollman rts_sockaddr(struct socket *so, struct sockaddr **nam)
382a29f300eSGarrett Wollman {
3837e994955SRobert Watson 
3847e994955SRobert Watson 	return (raw_usrreqs.pru_sockaddr(so, nam));
385a29f300eSGarrett Wollman }
386a29f300eSGarrett Wollman 
387a29f300eSGarrett Wollman static struct pr_usrreqs route_usrreqs = {
388756d52a1SPoul-Henning Kamp 	.pru_abort =		rts_abort,
389756d52a1SPoul-Henning Kamp 	.pru_attach =		rts_attach,
390756d52a1SPoul-Henning Kamp 	.pru_bind =		rts_bind,
391756d52a1SPoul-Henning Kamp 	.pru_connect =		rts_connect,
392756d52a1SPoul-Henning Kamp 	.pru_detach =		rts_detach,
393756d52a1SPoul-Henning Kamp 	.pru_disconnect =	rts_disconnect,
394756d52a1SPoul-Henning Kamp 	.pru_peeraddr =		rts_peeraddr,
395756d52a1SPoul-Henning Kamp 	.pru_send =		rts_send,
396756d52a1SPoul-Henning Kamp 	.pru_shutdown =		rts_shutdown,
397756d52a1SPoul-Henning Kamp 	.pru_sockaddr =		rts_sockaddr,
398a152f8a3SRobert Watson 	.pru_close =		rts_close,
399a29f300eSGarrett Wollman };
400a29f300eSGarrett Wollman 
401413628a7SBjoern A. Zeeb #ifndef _SOCKADDR_UNION_DEFINED
402413628a7SBjoern A. Zeeb #define	_SOCKADDR_UNION_DEFINED
403413628a7SBjoern A. Zeeb /*
404413628a7SBjoern A. Zeeb  * The union of all possible address formats we handle.
405413628a7SBjoern A. Zeeb  */
406413628a7SBjoern A. Zeeb union sockaddr_union {
407413628a7SBjoern A. Zeeb 	struct sockaddr		sa;
408413628a7SBjoern A. Zeeb 	struct sockaddr_in	sin;
409413628a7SBjoern A. Zeeb 	struct sockaddr_in6	sin6;
410413628a7SBjoern A. Zeeb };
411413628a7SBjoern A. Zeeb #endif /* _SOCKADDR_UNION_DEFINED */
412413628a7SBjoern A. Zeeb 
413413628a7SBjoern A. Zeeb static int
414413628a7SBjoern A. Zeeb rtm_get_jailed(struct rt_addrinfo *info, struct ifnet *ifp,
415413628a7SBjoern A. Zeeb     struct rtentry *rt, union sockaddr_union *saun, struct ucred *cred)
416413628a7SBjoern A. Zeeb {
417413628a7SBjoern A. Zeeb 
4189c79d243SJamie Gritton 	/* First, see if the returned address is part of the jail. */
4199c79d243SJamie Gritton 	if (prison_if(cred, rt->rt_ifa->ifa_addr) == 0) {
4209c79d243SJamie Gritton 		info->rti_info[RTAX_IFA] = rt->rt_ifa->ifa_addr;
4219c79d243SJamie Gritton 		return (0);
4229c79d243SJamie Gritton 	}
4239c79d243SJamie Gritton 
424413628a7SBjoern A. Zeeb 	switch (info->rti_info[RTAX_DST]->sa_family) {
425413628a7SBjoern A. Zeeb #ifdef INET
426413628a7SBjoern A. Zeeb 	case AF_INET:
427413628a7SBjoern A. Zeeb 	{
428413628a7SBjoern A. Zeeb 		struct in_addr ia;
429413628a7SBjoern A. Zeeb 		struct ifaddr *ifa;
430413628a7SBjoern A. Zeeb 		int found;
431413628a7SBjoern A. Zeeb 
432413628a7SBjoern A. Zeeb 		found = 0;
433413628a7SBjoern A. Zeeb 		/*
4349c79d243SJamie Gritton 		 * Try to find an address on the given outgoing interface
4359c79d243SJamie Gritton 		 * that belongs to the jail.
436413628a7SBjoern A. Zeeb 		 */
437137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
438413628a7SBjoern A. Zeeb 		TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) {
439413628a7SBjoern A. Zeeb 			struct sockaddr *sa;
440413628a7SBjoern A. Zeeb 			sa = ifa->ifa_addr;
441413628a7SBjoern A. Zeeb 			if (sa->sa_family != AF_INET)
442413628a7SBjoern A. Zeeb 				continue;
443413628a7SBjoern A. Zeeb 			ia = ((struct sockaddr_in *)sa)->sin_addr;
444b89e82ddSJamie Gritton 			if (prison_check_ip4(cred, &ia) == 0) {
445413628a7SBjoern A. Zeeb 				found = 1;
446413628a7SBjoern A. Zeeb 				break;
447413628a7SBjoern A. Zeeb 			}
448413628a7SBjoern A. Zeeb 		}
449137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
450413628a7SBjoern A. Zeeb 		if (!found) {
451413628a7SBjoern A. Zeeb 			/*
4529c79d243SJamie Gritton 			 * As a last resort return the 'default' jail address.
453413628a7SBjoern A. Zeeb 			 */
4540304c731SJamie Gritton 			ia = ((struct sockaddr_in *)rt->rt_ifa->ifa_addr)->
4550304c731SJamie Gritton 			    sin_addr;
4561cecba0fSBjoern A. Zeeb 			if (prison_get_ip4(cred, &ia) != 0)
457413628a7SBjoern A. Zeeb 				return (ESRCH);
458413628a7SBjoern A. Zeeb 		}
459413628a7SBjoern A. Zeeb 		bzero(&saun->sin, sizeof(struct sockaddr_in));
460413628a7SBjoern A. Zeeb 		saun->sin.sin_len = sizeof(struct sockaddr_in);
461413628a7SBjoern A. Zeeb 		saun->sin.sin_family = AF_INET;
462413628a7SBjoern A. Zeeb 		saun->sin.sin_addr.s_addr = ia.s_addr;
4639c79d243SJamie Gritton 		info->rti_info[RTAX_IFA] = (struct sockaddr *)&saun->sin;
464413628a7SBjoern A. Zeeb 		break;
465413628a7SBjoern A. Zeeb 	}
466413628a7SBjoern A. Zeeb #endif
467413628a7SBjoern A. Zeeb #ifdef INET6
468413628a7SBjoern A. Zeeb 	case AF_INET6:
469413628a7SBjoern A. Zeeb 	{
470413628a7SBjoern A. Zeeb 		struct in6_addr ia6;
471413628a7SBjoern A. Zeeb 		struct ifaddr *ifa;
472413628a7SBjoern A. Zeeb 		int found;
473413628a7SBjoern A. Zeeb 
474413628a7SBjoern A. Zeeb 		found = 0;
475413628a7SBjoern A. Zeeb 		/*
4769c79d243SJamie Gritton 		 * Try to find an address on the given outgoing interface
4779c79d243SJamie Gritton 		 * that belongs to the jail.
478413628a7SBjoern A. Zeeb 		 */
479137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
480413628a7SBjoern A. Zeeb 		TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) {
481413628a7SBjoern A. Zeeb 			struct sockaddr *sa;
482413628a7SBjoern A. Zeeb 			sa = ifa->ifa_addr;
483413628a7SBjoern A. Zeeb 			if (sa->sa_family != AF_INET6)
484413628a7SBjoern A. Zeeb 				continue;
485413628a7SBjoern A. Zeeb 			bcopy(&((struct sockaddr_in6 *)sa)->sin6_addr,
486413628a7SBjoern A. Zeeb 			    &ia6, sizeof(struct in6_addr));
487b89e82ddSJamie Gritton 			if (prison_check_ip6(cred, &ia6) == 0) {
488413628a7SBjoern A. Zeeb 				found = 1;
489413628a7SBjoern A. Zeeb 				break;
490413628a7SBjoern A. Zeeb 			}
491413628a7SBjoern A. Zeeb 		}
492137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
493413628a7SBjoern A. Zeeb 		if (!found) {
494413628a7SBjoern A. Zeeb 			/*
4959c79d243SJamie Gritton 			 * As a last resort return the 'default' jail address.
496413628a7SBjoern A. Zeeb 			 */
4970304c731SJamie Gritton 			ia6 = ((struct sockaddr_in6 *)rt->rt_ifa->ifa_addr)->
4980304c731SJamie Gritton 			    sin6_addr;
4991cecba0fSBjoern A. Zeeb 			if (prison_get_ip6(cred, &ia6) != 0)
500413628a7SBjoern A. Zeeb 				return (ESRCH);
501413628a7SBjoern A. Zeeb 		}
502413628a7SBjoern A. Zeeb 		bzero(&saun->sin6, sizeof(struct sockaddr_in6));
503413628a7SBjoern A. Zeeb 		saun->sin6.sin6_len = sizeof(struct sockaddr_in6);
504413628a7SBjoern A. Zeeb 		saun->sin6.sin6_family = AF_INET6;
5059c79d243SJamie Gritton 		bcopy(&ia6, &saun->sin6.sin6_addr, sizeof(struct in6_addr));
506413628a7SBjoern A. Zeeb 		if (sa6_recoverscope(&saun->sin6) != 0)
507413628a7SBjoern A. Zeeb 			return (ESRCH);
5089c79d243SJamie Gritton 		info->rti_info[RTAX_IFA] = (struct sockaddr *)&saun->sin6;
509413628a7SBjoern A. Zeeb 		break;
510413628a7SBjoern A. Zeeb 	}
511413628a7SBjoern A. Zeeb #endif
512413628a7SBjoern A. Zeeb 	default:
513413628a7SBjoern A. Zeeb 		return (ESRCH);
514413628a7SBjoern A. Zeeb 	}
515413628a7SBjoern A. Zeeb 	return (0);
516413628a7SBjoern A. Zeeb }
517413628a7SBjoern A. Zeeb 
518df8bae1dSRodney W. Grimes /*ARGSUSED*/
51952041295SPoul-Henning Kamp static int
52073d76e77SKevin Lo route_output(struct mbuf *m, struct socket *so, ...)
521df8bae1dSRodney W. Grimes {
5225dfc91d7SLuigi Rizzo 	struct rt_msghdr *rtm = NULL;
5235dfc91d7SLuigi Rizzo 	struct rtentry *rt = NULL;
524*61eee0e2SAlexander V. Chernikov 	struct rib_head *rnh;
525df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
5260bebb544SHiroki Sato 	struct sockaddr_storage ss;
5273deb3649SAlexander V. Chernikov #ifdef INET6
5286bbfef90SHiroki Sato 	struct sockaddr_in6 *sin6;
5290bebb544SHiroki Sato 	int i, rti_need_deembed = 0;
5306bbfef90SHiroki Sato #endif
531f2e5eb36SAlexander V. Chernikov 	int alloc_len = 0, len, error = 0, fibnum;
5325dfc91d7SLuigi Rizzo 	struct ifnet *ifp = NULL;
533413628a7SBjoern A. Zeeb 	union sockaddr_union saun;
5343ca1a2d6SMax Laier 	sa_family_t saf = AF_UNSPEC;
53592c227afSAlexander V. Chernikov 	struct rawcb *rp = NULL;
536f2e5eb36SAlexander V. Chernikov 	struct walkarg w;
537df8bae1dSRodney W. Grimes 
538f5d9a696SAlexander V. Chernikov 	fibnum = so->so_fibnum;
539f5d9a696SAlexander V. Chernikov 
540df8bae1dSRodney W. Grimes #define senderr(e) { error = e; goto flush;}
5415dfc91d7SLuigi Rizzo 	if (m == NULL || ((m->m_len < sizeof(long)) &&
5425dfc91d7SLuigi Rizzo 		       (m = m_pullup(m, sizeof(long))) == NULL))
543df8bae1dSRodney W. Grimes 		return (ENOBUFS);
544df8bae1dSRodney W. Grimes 	if ((m->m_flags & M_PKTHDR) == 0)
545df8bae1dSRodney W. Grimes 		panic("route_output");
546df8bae1dSRodney W. Grimes 	len = m->m_pkthdr.len;
547df8bae1dSRodney W. Grimes 	if (len < sizeof(*rtm) ||
548f1fcb552SAlexander V. Chernikov 	    len != mtod(m, struct rt_msghdr *)->rtm_msglen)
549df8bae1dSRodney W. Grimes 		senderr(EINVAL);
550f1fcb552SAlexander V. Chernikov 
551f2e5eb36SAlexander V. Chernikov 	/*
552f2e5eb36SAlexander V. Chernikov 	 * Most of current messages are in range 200-240 bytes,
553d9437c0fSAlexander V. Chernikov 	 * minimize possible re-allocation on reply using larger size
554d9437c0fSAlexander V. Chernikov 	 * buffer aligned on 1k boundary.
555f2e5eb36SAlexander V. Chernikov 	 */
556f2e5eb36SAlexander V. Chernikov 	alloc_len = roundup2(len, 1024);
557d9437c0fSAlexander V. Chernikov 	if ((rtm = malloc(alloc_len, M_TEMP, M_NOWAIT)) == NULL)
558df8bae1dSRodney W. Grimes 		senderr(ENOBUFS);
559f2e5eb36SAlexander V. Chernikov 
560df8bae1dSRodney W. Grimes 	m_copydata(m, 0, len, (caddr_t)rtm);
561f1fcb552SAlexander V. Chernikov 	bzero(&info, sizeof(info));
562f2e5eb36SAlexander V. Chernikov 	bzero(&w, sizeof(w));
563f1fcb552SAlexander V. Chernikov 
564df8bae1dSRodney W. Grimes 	if (rtm->rtm_version != RTM_VERSION) {
565f1fcb552SAlexander V. Chernikov 		/* Do not touch message since format is unknown */
566f2e5eb36SAlexander V. Chernikov 		free(rtm, M_TEMP);
567f1fcb552SAlexander V. Chernikov 		rtm = NULL;
568df8bae1dSRodney W. Grimes 		senderr(EPROTONOSUPPORT);
569df8bae1dSRodney W. Grimes 	}
570f1fcb552SAlexander V. Chernikov 
571f1fcb552SAlexander V. Chernikov 	/*
572f1fcb552SAlexander V. Chernikov 	 * Starting from here, it is possible
573f1fcb552SAlexander V. Chernikov 	 * to alter original message and insert
574f1fcb552SAlexander V. Chernikov 	 * caller PID and error value.
575f1fcb552SAlexander V. Chernikov 	 */
576f1fcb552SAlexander V. Chernikov 
577df8bae1dSRodney W. Grimes 	rtm->rtm_pid = curproc->p_pid;
578df8bae1dSRodney W. Grimes 	info.rti_addrs = rtm->rtm_addrs;
5790fb9298dSAlexander V. Chernikov 
5800fb9298dSAlexander V. Chernikov 	info.rti_mflags = rtm->rtm_inits;
5810fb9298dSAlexander V. Chernikov 	info.rti_rmx = &rtm->rtm_rmx;
5820fb9298dSAlexander V. Chernikov 
5830bebb544SHiroki Sato 	/*
5840bebb544SHiroki Sato 	 * rt_xaddrs() performs s6_addr[2] := sin6_scope_id for AF_INET6
5850bebb544SHiroki Sato 	 * link-local address because rtrequest requires addresses with
5860bebb544SHiroki Sato 	 * embedded scope id.
5870bebb544SHiroki Sato 	 */
588f1fcb552SAlexander V. Chernikov 	if (rt_xaddrs((caddr_t)(rtm + 1), len + (caddr_t)rtm, &info))
589076d0761SJulian Elischer 		senderr(EINVAL);
590f1fcb552SAlexander V. Chernikov 
5918071913dSRuslan Ermilov 	info.rti_flags = rtm->rtm_flags;
5925dfc91d7SLuigi Rizzo 	if (info.rti_info[RTAX_DST] == NULL ||
593becc44d7SSam Leffler 	    info.rti_info[RTAX_DST]->sa_family >= AF_MAX ||
5945dfc91d7SLuigi Rizzo 	    (info.rti_info[RTAX_GATEWAY] != NULL &&
595becc44d7SSam Leffler 	     info.rti_info[RTAX_GATEWAY]->sa_family >= AF_MAX))
596df8bae1dSRodney W. Grimes 		senderr(EINVAL);
5973ca1a2d6SMax Laier 	saf = info.rti_info[RTAX_DST]->sa_family;
598162c0b2eSRuslan Ermilov 	/*
599162c0b2eSRuslan Ermilov 	 * Verify that the caller has the appropriate privilege; RTM_GET
600162c0b2eSRuslan Ermilov 	 * is the only operation the non-superuser is allowed.
601162c0b2eSRuslan Ermilov 	 */
602acd3428bSRobert Watson 	if (rtm->rtm_type != RTM_GET) {
603acd3428bSRobert Watson 		error = priv_check(curthread, PRIV_NET_ROUTE);
604acd3428bSRobert Watson 		if (error)
605dadb6c3bSRuslan Ermilov 			senderr(error);
606acd3428bSRobert Watson 	}
607162c0b2eSRuslan Ermilov 
6089231d35fSQing Li 	/*
6099231d35fSQing Li 	 * The given gateway address may be an interface address.
6109231d35fSQing Li 	 * For example, issuing a "route change" command on a route
6119231d35fSQing Li 	 * entry that was created from a tunnel, and the gateway
6129231d35fSQing Li 	 * address given is the local end point. In this case the
6139231d35fSQing Li 	 * RTF_GATEWAY flag must be cleared or the destination will
6149231d35fSQing Li 	 * not be reachable even though there is no error message.
6159231d35fSQing Li 	 */
6169231d35fSQing Li 	if (info.rti_info[RTAX_GATEWAY] != NULL &&
6179231d35fSQing Li 	    info.rti_info[RTAX_GATEWAY]->sa_family != AF_LINK) {
6189a1b64d5SAlexander V. Chernikov 		struct rt_addrinfo ginfo;
6199a1b64d5SAlexander V. Chernikov 		struct sockaddr *gdst;
6209231d35fSQing Li 
6219a1b64d5SAlexander V. Chernikov 		bzero(&ginfo, sizeof(ginfo));
6229a1b64d5SAlexander V. Chernikov 		bzero(&ss, sizeof(ss));
6239a1b64d5SAlexander V. Chernikov 		ss.ss_len = sizeof(ss);
6249a1b64d5SAlexander V. Chernikov 
6259a1b64d5SAlexander V. Chernikov 		ginfo.rti_info[RTAX_GATEWAY] = (struct sockaddr *)&ss;
6269a1b64d5SAlexander V. Chernikov 		gdst = info.rti_info[RTAX_GATEWAY];
6279a1b64d5SAlexander V. Chernikov 
6289231d35fSQing Li 		/*
6299231d35fSQing Li 		 * A host route through the loopback interface is
6309231d35fSQing Li 		 * installed for each interface address. In pre 8.0
6319231d35fSQing Li 		 * releases the interface address of a PPP link type
6329231d35fSQing Li 		 * is not reachable locally. This behavior is fixed as
6339231d35fSQing Li 		 * part of the new L2/L3 redesign and rewrite work. The
6349231d35fSQing Li 		 * signature of this interface address route is the
6359231d35fSQing Li 		 * AF_LINK sa_family type of the rt_gateway, and the
6369231d35fSQing Li 		 * rt_ifp has the IFF_LOOPBACK flag set.
6379231d35fSQing Li 		 */
6389a1b64d5SAlexander V. Chernikov 		if (rib_lookup_info(fibnum, gdst, NHR_REF, 0, &ginfo) == 0) {
6399a1b64d5SAlexander V. Chernikov 			if (ss.ss_family == AF_LINK &&
6409a1b64d5SAlexander V. Chernikov 			    ginfo.rti_ifp->if_flags & IFF_LOOPBACK) {
6419231d35fSQing Li 				info.rti_flags &= ~RTF_GATEWAY;
642f672f56fSQing Li 				info.rti_flags |= RTF_GWFLAG_COMPAT;
643f672f56fSQing Li 			}
6449a1b64d5SAlexander V. Chernikov 			rib_free_info(&ginfo);
6459a1b64d5SAlexander V. Chernikov 		}
6469231d35fSQing Li 	}
6479231d35fSQing Li 
648df8bae1dSRodney W. Grimes 	switch (rtm->rtm_type) {
649becc44d7SSam Leffler 		struct rtentry *saved_nrt;
650df8bae1dSRodney W. Grimes 
651df8bae1dSRodney W. Grimes 	case RTM_ADD:
652c77462ddSAlexander V. Chernikov 	case RTM_CHANGE:
6535dfc91d7SLuigi Rizzo 		if (info.rti_info[RTAX_GATEWAY] == NULL)
654df8bae1dSRodney W. Grimes 			senderr(EINVAL);
6555dfc91d7SLuigi Rizzo 		saved_nrt = NULL;
6568eca593cSQing Li 
6576e6b3f7cSQing Li 		/* support for new ARP code */
6588eca593cSQing Li 		if (info.rti_info[RTAX_GATEWAY]->sa_family == AF_LINK &&
6598eca593cSQing Li 		    (rtm->rtm_flags & RTF_LLDATA) != 0) {
6606e6b3f7cSQing Li 			error = lla_rt_output(rtm, &info);
6610bebb544SHiroki Sato #ifdef INET6
6620bebb544SHiroki Sato 			if (error == 0)
6630bebb544SHiroki Sato 				rti_need_deembed = (V_deembed_scopeid) ? 1 : 0;
6640bebb544SHiroki Sato #endif
6656e6b3f7cSQing Li 			break;
6666e6b3f7cSQing Li 		}
667c77462ddSAlexander V. Chernikov 		error = rtrequest1_fib(rtm->rtm_type, &info, &saved_nrt,
668773aa053SAlexander V. Chernikov 		    fibnum);
669c77462ddSAlexander V. Chernikov 		if (error == 0 && saved_nrt != NULL) {
6700bebb544SHiroki Sato #ifdef INET6
6710bebb544SHiroki Sato 			rti_need_deembed = (V_deembed_scopeid) ? 1 : 0;
6720bebb544SHiroki Sato #endif
673d1dd20beSSam Leffler 			RT_LOCK(saved_nrt);
67422cafcf0SAndre Oppermann 			rtm->rtm_index = saved_nrt->rt_ifp->if_index;
6757138d65cSSam Leffler 			RT_REMREF(saved_nrt);
676d1dd20beSSam Leffler 			RT_UNLOCK(saved_nrt);
677df8bae1dSRodney W. Grimes 		}
678df8bae1dSRodney W. Grimes 		break;
679df8bae1dSRodney W. Grimes 
680df8bae1dSRodney W. Grimes 	case RTM_DELETE:
6815dfc91d7SLuigi Rizzo 		saved_nrt = NULL;
6826e6b3f7cSQing Li 		/* support for new ARP code */
6836e6b3f7cSQing Li 		if (info.rti_info[RTAX_GATEWAY] &&
6848eca593cSQing Li 		    (info.rti_info[RTAX_GATEWAY]->sa_family == AF_LINK) &&
6858eca593cSQing Li 		    (rtm->rtm_flags & RTF_LLDATA) != 0) {
6866e6b3f7cSQing Li 			error = lla_rt_output(rtm, &info);
6870bebb544SHiroki Sato #ifdef INET6
6880bebb544SHiroki Sato 			if (error == 0)
6890bebb544SHiroki Sato 				rti_need_deembed = (V_deembed_scopeid) ? 1 : 0;
6900bebb544SHiroki Sato #endif
6916e6b3f7cSQing Li 			break;
6926e6b3f7cSQing Li 		}
693773aa053SAlexander V. Chernikov 		error = rtrequest1_fib(RTM_DELETE, &info, &saved_nrt, fibnum);
69478a82810SGarrett Wollman 		if (error == 0) {
695d1dd20beSSam Leffler 			RT_LOCK(saved_nrt);
69671eba915SRuslan Ermilov 			rt = saved_nrt;
69778a82810SGarrett Wollman 			goto report;
69878a82810SGarrett Wollman 		}
6990bebb544SHiroki Sato #ifdef INET6
7000bebb544SHiroki Sato 		/* rt_msg2() will not be used when RTM_DELETE fails. */
7010bebb544SHiroki Sato 		rti_need_deembed = (V_deembed_scopeid) ? 1 : 0;
7020bebb544SHiroki Sato #endif
703df8bae1dSRodney W. Grimes 		break;
704df8bae1dSRodney W. Grimes 
705df8bae1dSRodney W. Grimes 	case RTM_GET:
706773aa053SAlexander V. Chernikov 		rnh = rt_tables_get_rnh(fibnum, saf);
7075dfc91d7SLuigi Rizzo 		if (rnh == NULL)
70878a82810SGarrett Wollman 			senderr(EAFNOSUPPORT);
7095a2f4cbdSAlexander V. Chernikov 
710*61eee0e2SAlexander V. Chernikov 		RIB_RLOCK(rnh);
7115a2f4cbdSAlexander V. Chernikov 
7125a2f4cbdSAlexander V. Chernikov 		if (info.rti_info[RTAX_NETMASK] == NULL &&
7135a2f4cbdSAlexander V. Chernikov 		    rtm->rtm_type == RTM_GET) {
7145a2f4cbdSAlexander V. Chernikov 			/*
7155a2f4cbdSAlexander V. Chernikov 			 * Provide longest prefix match for
7165a2f4cbdSAlexander V. Chernikov 			 * address lookup (no mask).
7175a2f4cbdSAlexander V. Chernikov 			 * 'route -n get addr'
7185a2f4cbdSAlexander V. Chernikov 			 */
7195a2f4cbdSAlexander V. Chernikov 			rt = (struct rtentry *) rnh->rnh_matchaddr(
720*61eee0e2SAlexander V. Chernikov 			    info.rti_info[RTAX_DST], &rnh->head);
7215a2f4cbdSAlexander V. Chernikov 		} else
7225a2f4cbdSAlexander V. Chernikov 			rt = (struct rtentry *) rnh->rnh_lookup(
7235a2f4cbdSAlexander V. Chernikov 			    info.rti_info[RTAX_DST],
724*61eee0e2SAlexander V. Chernikov 			    info.rti_info[RTAX_NETMASK], &rnh->head);
7255a2f4cbdSAlexander V. Chernikov 
7265a2f4cbdSAlexander V. Chernikov 		if (rt == NULL) {
727*61eee0e2SAlexander V. Chernikov 			RIB_RUNLOCK(rnh);
728df8bae1dSRodney W. Grimes 			senderr(ESRCH);
72979188861SGleb Smirnoff 		}
730e440aed9SQing Li #ifdef RADIX_MPATH
731e440aed9SQing Li 		/*
732e440aed9SQing Li 		 * for RTM_CHANGE/LOCK, if we got multipath routes,
733e440aed9SQing Li 		 * we require users to specify a matching RTAX_GATEWAY.
734e440aed9SQing Li 		 *
735e440aed9SQing Li 		 * for RTM_GET, gate is optional even with multipath.
736e440aed9SQing Li 		 * if gate == NULL the first match is returned.
737e440aed9SQing Li 		 * (no need to call rt_mpath_matchgate if gate == NULL)
738e440aed9SQing Li 		 */
739*61eee0e2SAlexander V. Chernikov 		if (rt_mpath_capable(rnh) &&
740e440aed9SQing Li 		    (rtm->rtm_type != RTM_GET || info.rti_info[RTAX_GATEWAY])) {
741e440aed9SQing Li 			rt = rt_mpath_matchgate(rt, info.rti_info[RTAX_GATEWAY]);
742e440aed9SQing Li 			if (!rt) {
743*61eee0e2SAlexander V. Chernikov 				RIB_RUNLOCK(rnh);
744e440aed9SQing Li 				senderr(ESRCH);
745e440aed9SQing Li 			}
746e440aed9SQing Li 		}
747e440aed9SQing Li #endif
748c7ab6602SQing Li 		/*
749c7ab6602SQing Li 		 * If performing proxied L2 entry insertion, and
750c7ab6602SQing Li 		 * the actual PPP host entry is found, perform
751c7ab6602SQing Li 		 * another search to retrieve the prefix route of
752c7ab6602SQing Li 		 * the local end point of the PPP link.
753c7ab6602SQing Li 		 */
7540ed6142bSQing Li 		if (rtm->rtm_flags & RTF_ANNOUNCE) {
755c7ab6602SQing Li 			struct sockaddr laddr;
7560ed6142bSQing Li 
7570ed6142bSQing Li 			if (rt->rt_ifp != NULL &&
7580ed6142bSQing Li 			    rt->rt_ifp->if_type == IFT_PROPVIRTUAL) {
7590ed6142bSQing Li 				struct ifaddr *ifa;
7600ed6142bSQing Li 
7614f8585e0SAlan Somers 				ifa = ifa_ifwithnet(info.rti_info[RTAX_DST], 1,
7624f8585e0SAlan Somers 						RT_ALL_FIBS);
7630ed6142bSQing Li 				if (ifa != NULL)
7640ed6142bSQing Li 					rt_maskedcopy(ifa->ifa_addr,
7650ed6142bSQing Li 						      &laddr,
7660ed6142bSQing Li 						      ifa->ifa_netmask);
7670ed6142bSQing Li 			} else
768c7ab6602SQing Li 				rt_maskedcopy(rt->rt_ifa->ifa_addr,
769c7ab6602SQing Li 					      &laddr,
770c7ab6602SQing Li 					      rt->rt_ifa->ifa_netmask);
771c7ab6602SQing Li 			/*
772c7ab6602SQing Li 			 * refactor rt and no lock operation necessary
773c7ab6602SQing Li 			 */
774*61eee0e2SAlexander V. Chernikov 			rt = (struct rtentry *)rnh->rnh_matchaddr(&laddr,
775*61eee0e2SAlexander V. Chernikov 			    &rnh->head);
776c7ab6602SQing Li 			if (rt == NULL) {
777*61eee0e2SAlexander V. Chernikov 				RIB_RUNLOCK(rnh);
778c7ab6602SQing Li 				senderr(ESRCH);
779c7ab6602SQing Li 			}
780c7ab6602SQing Li 		}
781d1dd20beSSam Leffler 		RT_LOCK(rt);
7827138d65cSSam Leffler 		RT_ADDREF(rt);
783*61eee0e2SAlexander V. Chernikov 		RIB_RUNLOCK(rnh);
784956b0b65SJeffrey Hsu 
78578a82810SGarrett Wollman report:
786d1dd20beSSam Leffler 		RT_LOCK_ASSERT(rt);
787b89e82ddSJamie Gritton 		if ((rt->rt_flags & RTF_HOST) == 0
788de0bd6f7SBjoern A. Zeeb 		    ? jailed_without_vnet(curthread->td_ucred)
789b89e82ddSJamie Gritton 		    : prison_if(curthread->td_ucred,
790b89e82ddSJamie Gritton 		    rt_key(rt)) != 0) {
791813dd6aeSBjoern A. Zeeb 			RT_UNLOCK(rt);
792813dd6aeSBjoern A. Zeeb 			senderr(ESRCH);
793813dd6aeSBjoern A. Zeeb 		}
794becc44d7SSam Leffler 		info.rti_info[RTAX_DST] = rt_key(rt);
795becc44d7SSam Leffler 		info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
7963deb3649SAlexander V. Chernikov 		info.rti_info[RTAX_NETMASK] = rtsock_fix_netmask(rt_key(rt),
7973deb3649SAlexander V. Chernikov 		    rt_mask(rt), &ss);
7986e6b3f7cSQing Li 		info.rti_info[RTAX_GENMASK] = 0;
799df8bae1dSRodney W. Grimes 		if (rtm->rtm_addrs & (RTA_IFP | RTA_IFA)) {
800df440948SPoul-Henning Kamp 			ifp = rt->rt_ifp;
801df440948SPoul-Henning Kamp 			if (ifp) {
8029b98ee2cSLuigi Rizzo 				info.rti_info[RTAX_IFP] =
8034a0d6638SRuslan Ermilov 				    ifp->if_addr->ifa_addr;
8049c79d243SJamie Gritton 				error = rtm_get_jailed(&info, ifp, rt,
8059c79d243SJamie Gritton 				    &saun, curthread->td_ucred);
806413628a7SBjoern A. Zeeb 				if (error != 0) {
807413628a7SBjoern A. Zeeb 					RT_UNLOCK(rt);
8089c79d243SJamie Gritton 					senderr(error);
809413628a7SBjoern A. Zeeb 				}
81028070a0eSRuslan Ermilov 				if (ifp->if_flags & IFF_POINTOPOINT)
811becc44d7SSam Leffler 					info.rti_info[RTAX_BRD] =
812becc44d7SSam Leffler 					    rt->rt_ifa->ifa_dstaddr;
813df8bae1dSRodney W. Grimes 				rtm->rtm_index = ifp->if_index;
814df8bae1dSRodney W. Grimes 			} else {
8155dfc91d7SLuigi Rizzo 				info.rti_info[RTAX_IFP] = NULL;
8165dfc91d7SLuigi Rizzo 				info.rti_info[RTAX_IFA] = NULL;
817df8bae1dSRodney W. Grimes 			}
81825029d6cSHartmut Brandt 		} else if ((ifp = rt->rt_ifp) != NULL) {
81925029d6cSHartmut Brandt 			rtm->rtm_index = ifp->if_index;
820df8bae1dSRodney W. Grimes 		}
821f2e5eb36SAlexander V. Chernikov 
822f2e5eb36SAlexander V. Chernikov 		/* Check if we need to realloc storage */
823f2e5eb36SAlexander V. Chernikov 		rtsock_msg_buffer(rtm->rtm_type, &info, NULL, &len);
824f2e5eb36SAlexander V. Chernikov 		if (len > alloc_len) {
825df8bae1dSRodney W. Grimes 			struct rt_msghdr *new_rtm;
826f2e5eb36SAlexander V. Chernikov 			new_rtm = malloc(len, M_TEMP, M_NOWAIT);
8275dfc91d7SLuigi Rizzo 			if (new_rtm == NULL) {
828d1dd20beSSam Leffler 				RT_UNLOCK(rt);
829df8bae1dSRodney W. Grimes 				senderr(ENOBUFS);
830becc44d7SSam Leffler 			}
8316b96f1afSLuigi Rizzo 			bcopy(rtm, new_rtm, rtm->rtm_msglen);
832f2e5eb36SAlexander V. Chernikov 			free(rtm, M_TEMP);
833f2e5eb36SAlexander V. Chernikov 			rtm = new_rtm;
834f2e5eb36SAlexander V. Chernikov 			alloc_len = len;
835df8bae1dSRodney W. Grimes 		}
836f2e5eb36SAlexander V. Chernikov 
837f2e5eb36SAlexander V. Chernikov 		w.w_tmem = (caddr_t)rtm;
838f2e5eb36SAlexander V. Chernikov 		w.w_tmemsize = alloc_len;
839f2e5eb36SAlexander V. Chernikov 		rtsock_msg_buffer(rtm->rtm_type, &info, &w, &len);
840f2e5eb36SAlexander V. Chernikov 
841f672f56fSQing Li 		if (rt->rt_flags & RTF_GWFLAG_COMPAT)
842f672f56fSQing Li 			rtm->rtm_flags = RTF_GATEWAY |
843f672f56fSQing Li 				(rt->rt_flags & ~RTF_GWFLAG_COMPAT);
844f672f56fSQing Li 		else
845df8bae1dSRodney W. Grimes 			rtm->rtm_flags = rt->rt_flags;
846e3a7aa6fSGleb Smirnoff 		rt_getmetrics(rt, &rtm->rtm_rmx);
847df8bae1dSRodney W. Grimes 		rtm->rtm_addrs = info.rti_addrs;
848df8bae1dSRodney W. Grimes 
849d1dd20beSSam Leffler 		RT_UNLOCK(rt);
850df8bae1dSRodney W. Grimes 		break;
851df8bae1dSRodney W. Grimes 
852df8bae1dSRodney W. Grimes 	default:
853df8bae1dSRodney W. Grimes 		senderr(EOPNOTSUPP);
854df8bae1dSRodney W. Grimes 	}
855df8bae1dSRodney W. Grimes 
856df8bae1dSRodney W. Grimes flush:
85792c227afSAlexander V. Chernikov 	if (rt != NULL)
858becc44d7SSam Leffler 		RTFREE(rt);
859df8bae1dSRodney W. Grimes 	/*
860df8bae1dSRodney W. Grimes 	 * Check to see if we don't want our own messages.
861df8bae1dSRodney W. Grimes 	 */
862df8bae1dSRodney W. Grimes 	if ((so->so_options & SO_USELOOPBACK) == 0) {
863c5d4eab6SMarko Zec 		if (V_route_cb.any_count <= 1) {
864d9437c0fSAlexander V. Chernikov 			if (rtm != NULL)
865f2e5eb36SAlexander V. Chernikov 				free(rtm, M_TEMP);
866df8bae1dSRodney W. Grimes 			m_freem(m);
867df8bae1dSRodney W. Grimes 			return (error);
868df8bae1dSRodney W. Grimes 		}
869df8bae1dSRodney W. Grimes 		/* There is another listener, so construct message */
870df8bae1dSRodney W. Grimes 		rp = sotorawcb(so);
8714cc20ab1SSeigo Tanimura 	}
87292c227afSAlexander V. Chernikov 
8732277c5e5SAlexander V. Chernikov 	if (rtm != NULL) {
8740bebb544SHiroki Sato #ifdef INET6
8750bebb544SHiroki Sato 		if (rti_need_deembed) {
8760bebb544SHiroki Sato 			/* sin6_scope_id is recovered before sending rtm. */
8770bebb544SHiroki Sato 			sin6 = (struct sockaddr_in6 *)&ss;
87812bdf23aSHiroki Sato 			for (i = 0; i < RTAX_MAX; i++) {
8790bebb544SHiroki Sato 				if (info.rti_info[i] == NULL)
8800bebb544SHiroki Sato 					continue;
8810bebb544SHiroki Sato 				if (info.rti_info[i]->sa_family != AF_INET6)
8820bebb544SHiroki Sato 					continue;
8830bebb544SHiroki Sato 				bcopy(info.rti_info[i], sin6, sizeof(*sin6));
8840bebb544SHiroki Sato 				if (sa6_recoverscope(sin6) == 0)
8850bebb544SHiroki Sato 					bcopy(sin6, info.rti_info[i],
8860bebb544SHiroki Sato 						    sizeof(*sin6));
8870bebb544SHiroki Sato 			}
8880bebb544SHiroki Sato 		}
8890bebb544SHiroki Sato #endif
89092c227afSAlexander V. Chernikov 		if (error != 0)
89192c227afSAlexander V. Chernikov 			rtm->rtm_errno = error;
89292c227afSAlexander V. Chernikov 		else
89392c227afSAlexander V. Chernikov 			rtm->rtm_flags |= RTF_DONE;
89492c227afSAlexander V. Chernikov 
895df8bae1dSRodney W. Grimes 		m_copyback(m, 0, rtm->rtm_msglen, (caddr_t)rtm);
89603311056SHajimu UMEMOTO 		if (m->m_pkthdr.len < rtm->rtm_msglen) {
89703311056SHajimu UMEMOTO 			m_freem(m);
89803311056SHajimu UMEMOTO 			m = NULL;
89903311056SHajimu UMEMOTO 		} else if (m->m_pkthdr.len > rtm->rtm_msglen)
90003311056SHajimu UMEMOTO 			m_adj(m, rtm->rtm_msglen - m->m_pkthdr.len);
901f2e5eb36SAlexander V. Chernikov 
902f2e5eb36SAlexander V. Chernikov 		free(rtm, M_TEMP);
903df8bae1dSRodney W. Grimes 	}
90492c227afSAlexander V. Chernikov 	if (m != NULL) {
905773aa053SAlexander V. Chernikov 		M_SETFIB(m, fibnum);
906528737fdSBjoern A. Zeeb 		m->m_flags |= RTS_FILTER_FIB;
907becc44d7SSam Leffler 		if (rp) {
908becc44d7SSam Leffler 			/*
909becc44d7SSam Leffler 			 * XXX insure we don't get a copy by
910becc44d7SSam Leffler 			 * invalidating our protocol
911becc44d7SSam Leffler 			 */
912becc44d7SSam Leffler 			unsigned short family = rp->rcb_proto.sp_family;
913becc44d7SSam Leffler 			rp->rcb_proto.sp_family = 0;
9143ca1a2d6SMax Laier 			rt_dispatch(m, saf);
915becc44d7SSam Leffler 			rp->rcb_proto.sp_family = family;
916becc44d7SSam Leffler 		} else
9173ca1a2d6SMax Laier 			rt_dispatch(m, saf);
918becc44d7SSam Leffler 	}
91992c227afSAlexander V. Chernikov 
920df8bae1dSRodney W. Grimes 	return (error);
921df8bae1dSRodney W. Grimes }
922df8bae1dSRodney W. Grimes 
92352041295SPoul-Henning Kamp static void
924e3a7aa6fSGleb Smirnoff rt_getmetrics(const struct rtentry *rt, struct rt_metrics *out)
92597d8d152SAndre Oppermann {
926e3a7aa6fSGleb Smirnoff 
92797d8d152SAndre Oppermann 	bzero(out, sizeof(*out));
928e3a7aa6fSGleb Smirnoff 	out->rmx_mtu = rt->rt_mtu;
929e3a7aa6fSGleb Smirnoff 	out->rmx_weight = rt->rt_weight;
930e3a7aa6fSGleb Smirnoff 	out->rmx_pksent = counter_u64_fetch(rt->rt_pksent);
931e27c3f48SOleg Bulyzhin 	/* Kernel -> userland timebase conversion. */
932e3a7aa6fSGleb Smirnoff 	out->rmx_expire = rt->rt_expire ?
933e3a7aa6fSGleb Smirnoff 	    rt->rt_expire - time_uptime + time_second : 0;
93497d8d152SAndre Oppermann }
93597d8d152SAndre Oppermann 
9367f33a738SJulian Elischer /*
9377f33a738SJulian Elischer  * Extract the addresses of the passed sockaddrs.
9387f33a738SJulian Elischer  * Do a little sanity checking so as to avoid bad memory references.
939076d0761SJulian Elischer  * This data is derived straight from userland.
9407f33a738SJulian Elischer  */
941076d0761SJulian Elischer static int
942becc44d7SSam Leffler rt_xaddrs(caddr_t cp, caddr_t cplim, struct rt_addrinfo *rtinfo)
943df8bae1dSRodney W. Grimes {
944e74642dfSLuigi Rizzo 	struct sockaddr *sa;
945e74642dfSLuigi Rizzo 	int i;
946df8bae1dSRodney W. Grimes 
947becc44d7SSam Leffler 	for (i = 0; i < RTAX_MAX && cp < cplim; i++) {
948df8bae1dSRodney W. Grimes 		if ((rtinfo->rti_addrs & (1 << i)) == 0)
949df8bae1dSRodney W. Grimes 			continue;
950ff6d0a59SJulian Elischer 		sa = (struct sockaddr *)cp;
9517f33a738SJulian Elischer 		/*
952076d0761SJulian Elischer 		 * It won't fit.
9537f33a738SJulian Elischer 		 */
954becc44d7SSam Leffler 		if (cp + sa->sa_len > cplim)
955076d0761SJulian Elischer 			return (EINVAL);
9567f33a738SJulian Elischer 		/*
9577f33a738SJulian Elischer 		 * there are no more.. quit now
9587f33a738SJulian Elischer 		 * If there are more bits, they are in error.
9597f33a738SJulian Elischer 		 * I've seen this. route(1) can evidently generate these.
9607f33a738SJulian Elischer 		 * This causes kernel to core dump.
961076d0761SJulian Elischer 		 * for compatibility, If we see this, point to a safe address.
9627f33a738SJulian Elischer 		 */
963076d0761SJulian Elischer 		if (sa->sa_len == 0) {
964076d0761SJulian Elischer 			rtinfo->rti_info[i] = &sa_zero;
965076d0761SJulian Elischer 			return (0); /* should be EINVAL but for compat */
966df8bae1dSRodney W. Grimes 		}
967076d0761SJulian Elischer 		/* accept it */
9680bebb544SHiroki Sato #ifdef INET6
9690bebb544SHiroki Sato 		if (sa->sa_family == AF_INET6)
9700bebb544SHiroki Sato 			sa6_embedscope((struct sockaddr_in6 *)sa,
9710bebb544SHiroki Sato 			    V_ip6_use_defzone);
9720bebb544SHiroki Sato #endif
973076d0761SJulian Elischer 		rtinfo->rti_info[i] = sa;
974e74642dfSLuigi Rizzo 		cp += SA_SIZE(sa);
975076d0761SJulian Elischer 	}
976076d0761SJulian Elischer 	return (0);
977df8bae1dSRodney W. Grimes }
978df8bae1dSRodney W. Grimes 
9796d076ae8SBjoern A. Zeeb /*
9803deb3649SAlexander V. Chernikov  * Fill in @dmask with valid netmask leaving original @smask
9813deb3649SAlexander V. Chernikov  * intact. Mostly used with radix netmasks.
9823deb3649SAlexander V. Chernikov  */
9833deb3649SAlexander V. Chernikov static struct sockaddr *
9843deb3649SAlexander V. Chernikov rtsock_fix_netmask(struct sockaddr *dst, struct sockaddr *smask,
9853deb3649SAlexander V. Chernikov     struct sockaddr_storage *dmask)
9863deb3649SAlexander V. Chernikov {
9873deb3649SAlexander V. Chernikov 	if (dst == NULL || smask == NULL)
9883deb3649SAlexander V. Chernikov 		return (NULL);
9893deb3649SAlexander V. Chernikov 
9903deb3649SAlexander V. Chernikov 	memset(dmask, 0, dst->sa_len);
9913deb3649SAlexander V. Chernikov 	memcpy(dmask, smask, smask->sa_len);
9923deb3649SAlexander V. Chernikov 	dmask->ss_len = dst->sa_len;
9933deb3649SAlexander V. Chernikov 	dmask->ss_family = dst->sa_family;
9943deb3649SAlexander V. Chernikov 
9953deb3649SAlexander V. Chernikov 	return ((struct sockaddr *)dmask);
9963deb3649SAlexander V. Chernikov }
9973deb3649SAlexander V. Chernikov 
9983deb3649SAlexander V. Chernikov /*
9996db47af4SAlexander V. Chernikov  * Writes information related to @rtinfo object to newly-allocated mbuf.
10006db47af4SAlexander V. Chernikov  * Assumes MCLBYTES is enough to construct any message.
10016db47af4SAlexander V. Chernikov  * Used for OS notifications of vaious events (if/ifa announces,etc)
10026db47af4SAlexander V. Chernikov  *
10036db47af4SAlexander V. Chernikov  * Returns allocated mbuf or NULL on failure.
10046d076ae8SBjoern A. Zeeb  */
1005df8bae1dSRodney W. Grimes static struct mbuf *
10066db47af4SAlexander V. Chernikov rtsock_msg_mbuf(int type, struct rt_addrinfo *rtinfo)
1007df8bae1dSRodney W. Grimes {
10085dfc91d7SLuigi Rizzo 	struct rt_msghdr *rtm;
10095dfc91d7SLuigi Rizzo 	struct mbuf *m;
10105dfc91d7SLuigi Rizzo 	int i;
10115dfc91d7SLuigi Rizzo 	struct sockaddr *sa;
10126bbfef90SHiroki Sato #ifdef INET6
10136bbfef90SHiroki Sato 	struct sockaddr_storage ss;
10146bbfef90SHiroki Sato 	struct sockaddr_in6 *sin6;
10156bbfef90SHiroki Sato #endif
1016df8bae1dSRodney W. Grimes 	int len, dlen;
1017df8bae1dSRodney W. Grimes 
1018df8bae1dSRodney W. Grimes 	switch (type) {
1019df8bae1dSRodney W. Grimes 
1020df8bae1dSRodney W. Grimes 	case RTM_DELADDR:
1021df8bae1dSRodney W. Grimes 	case RTM_NEWADDR:
1022df8bae1dSRodney W. Grimes 		len = sizeof(struct ifa_msghdr);
1023df8bae1dSRodney W. Grimes 		break;
1024df8bae1dSRodney W. Grimes 
1025477180fbSGarrett Wollman 	case RTM_DELMADDR:
1026477180fbSGarrett Wollman 	case RTM_NEWMADDR:
1027477180fbSGarrett Wollman 		len = sizeof(struct ifma_msghdr);
1028477180fbSGarrett Wollman 		break;
1029477180fbSGarrett Wollman 
1030df8bae1dSRodney W. Grimes 	case RTM_IFINFO:
1031df8bae1dSRodney W. Grimes 		len = sizeof(struct if_msghdr);
1032df8bae1dSRodney W. Grimes 		break;
1033df8bae1dSRodney W. Grimes 
10347b6edd04SRuslan Ermilov 	case RTM_IFANNOUNCE:
1035b83a279fSSam Leffler 	case RTM_IEEE80211:
10367b6edd04SRuslan Ermilov 		len = sizeof(struct if_announcemsghdr);
10377b6edd04SRuslan Ermilov 		break;
10387b6edd04SRuslan Ermilov 
1039df8bae1dSRodney W. Grimes 	default:
1040df8bae1dSRodney W. Grimes 		len = sizeof(struct rt_msghdr);
1041df8bae1dSRodney W. Grimes 	}
1042c69f77c3SGleb Smirnoff 
1043c69f77c3SGleb Smirnoff 	/* XXXGL: can we use MJUMPAGESIZE cluster here? */
1044c69f77c3SGleb Smirnoff 	KASSERT(len <= MCLBYTES, ("%s: message too big", __func__));
1045c69f77c3SGleb Smirnoff 	if (len > MHLEN)
1046c69f77c3SGleb Smirnoff 		m = m_getcl(M_NOWAIT, MT_DATA, M_PKTHDR);
1047c69f77c3SGleb Smirnoff 	else
1048eb1b1807SGleb Smirnoff 		m = m_gethdr(M_NOWAIT, MT_DATA);
10495dfc91d7SLuigi Rizzo 	if (m == NULL)
105033841545SHajimu UMEMOTO 		return (m);
1051c69f77c3SGleb Smirnoff 
1052df8bae1dSRodney W. Grimes 	m->m_pkthdr.len = m->m_len = len;
1053df8bae1dSRodney W. Grimes 	rtm = mtod(m, struct rt_msghdr *);
1054df8bae1dSRodney W. Grimes 	bzero((caddr_t)rtm, len);
1055df8bae1dSRodney W. Grimes 	for (i = 0; i < RTAX_MAX; i++) {
1056df8bae1dSRodney W. Grimes 		if ((sa = rtinfo->rti_info[i]) == NULL)
1057df8bae1dSRodney W. Grimes 			continue;
1058df8bae1dSRodney W. Grimes 		rtinfo->rti_addrs |= (1 << i);
1059e74642dfSLuigi Rizzo 		dlen = SA_SIZE(sa);
10606bbfef90SHiroki Sato #ifdef INET6
10615c9fa630SHiroki Sato 		if (V_deembed_scopeid && sa->sa_family == AF_INET6) {
10626bbfef90SHiroki Sato 			sin6 = (struct sockaddr_in6 *)&ss;
10636bbfef90SHiroki Sato 			bcopy(sa, sin6, sizeof(*sin6));
10646bbfef90SHiroki Sato 			if (sa6_recoverscope(sin6) == 0)
10656bbfef90SHiroki Sato 				sa = (struct sockaddr *)sin6;
10666bbfef90SHiroki Sato 		}
10676bbfef90SHiroki Sato #endif
1068df8bae1dSRodney W. Grimes 		m_copyback(m, len, dlen, (caddr_t)sa);
1069df8bae1dSRodney W. Grimes 		len += dlen;
1070df8bae1dSRodney W. Grimes 	}
1071df8bae1dSRodney W. Grimes 	if (m->m_pkthdr.len != len) {
1072df8bae1dSRodney W. Grimes 		m_freem(m);
1073df8bae1dSRodney W. Grimes 		return (NULL);
1074df8bae1dSRodney W. Grimes 	}
1075df8bae1dSRodney W. Grimes 	rtm->rtm_msglen = len;
1076df8bae1dSRodney W. Grimes 	rtm->rtm_version = RTM_VERSION;
1077df8bae1dSRodney W. Grimes 	rtm->rtm_type = type;
1078df8bae1dSRodney W. Grimes 	return (m);
1079df8bae1dSRodney W. Grimes }
1080df8bae1dSRodney W. Grimes 
10816d076ae8SBjoern A. Zeeb /*
1082f2e5eb36SAlexander V. Chernikov  * Writes information related to @rtinfo object to preallocated buffer.
1083f2e5eb36SAlexander V. Chernikov  * Stores needed size in @plen. If @w is NULL, calculates size without
1084f2e5eb36SAlexander V. Chernikov  * writing.
1085f2e5eb36SAlexander V. Chernikov  * Used for sysctl dumps and rtsock answers (RTM_DEL/RTM_GET) generation.
1086f2e5eb36SAlexander V. Chernikov  *
1087f2e5eb36SAlexander V. Chernikov  * Returns 0 on success.
1088f2e5eb36SAlexander V. Chernikov  *
10896d076ae8SBjoern A. Zeeb  */
1090df8bae1dSRodney W. Grimes static int
1091f2e5eb36SAlexander V. Chernikov rtsock_msg_buffer(int type, struct rt_addrinfo *rtinfo, struct walkarg *w, int *plen)
1092df8bae1dSRodney W. Grimes {
10935dfc91d7SLuigi Rizzo 	int i;
1094f2e5eb36SAlexander V. Chernikov 	int len, buflen = 0, dlen;
1095de46b2c6SAlexander V. Chernikov 	caddr_t cp = NULL;
1096f2e5eb36SAlexander V. Chernikov 	struct rt_msghdr *rtm = NULL;
10976bbfef90SHiroki Sato #ifdef INET6
10986bbfef90SHiroki Sato 	struct sockaddr_storage ss;
10996bbfef90SHiroki Sato 	struct sockaddr_in6 *sin6;
11006bbfef90SHiroki Sato #endif
1101df8bae1dSRodney W. Grimes 
1102df8bae1dSRodney W. Grimes 	switch (type) {
1103df8bae1dSRodney W. Grimes 
1104df8bae1dSRodney W. Grimes 	case RTM_DELADDR:
1105df8bae1dSRodney W. Grimes 	case RTM_NEWADDR:
11066d076ae8SBjoern A. Zeeb 		if (w != NULL && w->w_op == NET_RT_IFLISTL) {
11076d076ae8SBjoern A. Zeeb #ifdef COMPAT_FREEBSD32
11086d076ae8SBjoern A. Zeeb 			if (w->w_req->flags & SCTL_MASK32)
11096d076ae8SBjoern A. Zeeb 				len = sizeof(struct ifa_msghdrl32);
11106d076ae8SBjoern A. Zeeb 			else
11116d076ae8SBjoern A. Zeeb #endif
11126d076ae8SBjoern A. Zeeb 				len = sizeof(struct ifa_msghdrl);
11136d076ae8SBjoern A. Zeeb 		} else
1114df8bae1dSRodney W. Grimes 			len = sizeof(struct ifa_msghdr);
1115df8bae1dSRodney W. Grimes 		break;
1116df8bae1dSRodney W. Grimes 
1117df8bae1dSRodney W. Grimes 	case RTM_IFINFO:
1118427a928aSKonstantin Belousov #ifdef COMPAT_FREEBSD32
1119427a928aSKonstantin Belousov 		if (w != NULL && w->w_req->flags & SCTL_MASK32) {
11206d076ae8SBjoern A. Zeeb 			if (w->w_op == NET_RT_IFLISTL)
11216d076ae8SBjoern A. Zeeb 				len = sizeof(struct if_msghdrl32);
11226d076ae8SBjoern A. Zeeb 			else
1123427a928aSKonstantin Belousov 				len = sizeof(struct if_msghdr32);
1124427a928aSKonstantin Belousov 			break;
1125427a928aSKonstantin Belousov 		}
1126427a928aSKonstantin Belousov #endif
11276d076ae8SBjoern A. Zeeb 		if (w != NULL && w->w_op == NET_RT_IFLISTL)
11286d076ae8SBjoern A. Zeeb 			len = sizeof(struct if_msghdrl);
11296d076ae8SBjoern A. Zeeb 		else
1130df8bae1dSRodney W. Grimes 			len = sizeof(struct if_msghdr);
1131df8bae1dSRodney W. Grimes 		break;
1132df8bae1dSRodney W. Grimes 
113305b2efe0SBruce M Simpson 	case RTM_NEWMADDR:
113405b2efe0SBruce M Simpson 		len = sizeof(struct ifma_msghdr);
113505b2efe0SBruce M Simpson 		break;
113605b2efe0SBruce M Simpson 
1137df8bae1dSRodney W. Grimes 	default:
1138df8bae1dSRodney W. Grimes 		len = sizeof(struct rt_msghdr);
1139df8bae1dSRodney W. Grimes 	}
1140f2e5eb36SAlexander V. Chernikov 
1141f2e5eb36SAlexander V. Chernikov 	if (w != NULL) {
1142f2e5eb36SAlexander V. Chernikov 		rtm = (struct rt_msghdr *)w->w_tmem;
1143f2e5eb36SAlexander V. Chernikov 		buflen = w->w_tmemsize - len;
1144f2e5eb36SAlexander V. Chernikov 		cp = (caddr_t)w->w_tmem + len;
1145f2e5eb36SAlexander V. Chernikov 	}
1146f2e5eb36SAlexander V. Chernikov 
1147f2e5eb36SAlexander V. Chernikov 	rtinfo->rti_addrs = 0;
1148df8bae1dSRodney W. Grimes 	for (i = 0; i < RTAX_MAX; i++) {
11495dfc91d7SLuigi Rizzo 		struct sockaddr *sa;
1150df8bae1dSRodney W. Grimes 
11515dfc91d7SLuigi Rizzo 		if ((sa = rtinfo->rti_info[i]) == NULL)
1152df8bae1dSRodney W. Grimes 			continue;
1153df8bae1dSRodney W. Grimes 		rtinfo->rti_addrs |= (1 << i);
1154e74642dfSLuigi Rizzo 		dlen = SA_SIZE(sa);
1155f2e5eb36SAlexander V. Chernikov 		if (cp != NULL && buflen >= dlen) {
11566bbfef90SHiroki Sato #ifdef INET6
11575c9fa630SHiroki Sato 			if (V_deembed_scopeid && sa->sa_family == AF_INET6) {
11586bbfef90SHiroki Sato 				sin6 = (struct sockaddr_in6 *)&ss;
11596bbfef90SHiroki Sato 				bcopy(sa, sin6, sizeof(*sin6));
11606bbfef90SHiroki Sato 				if (sa6_recoverscope(sin6) == 0)
11616bbfef90SHiroki Sato 					sa = (struct sockaddr *)sin6;
11626bbfef90SHiroki Sato 			}
11636bbfef90SHiroki Sato #endif
1164df8bae1dSRodney W. Grimes 			bcopy((caddr_t)sa, cp, (unsigned)dlen);
1165df8bae1dSRodney W. Grimes 			cp += dlen;
1166f2e5eb36SAlexander V. Chernikov 			buflen -= dlen;
1167f2e5eb36SAlexander V. Chernikov 		} else if (cp != NULL) {
1168f2e5eb36SAlexander V. Chernikov 			/*
1169f2e5eb36SAlexander V. Chernikov 			 * Buffer too small. Count needed size
1170f2e5eb36SAlexander V. Chernikov 			 * and return with error.
1171f2e5eb36SAlexander V. Chernikov 			 */
1172f2e5eb36SAlexander V. Chernikov 			cp = NULL;
1173df8bae1dSRodney W. Grimes 		}
1174f2e5eb36SAlexander V. Chernikov 
1175df8bae1dSRodney W. Grimes 		len += dlen;
1176df8bae1dSRodney W. Grimes 	}
1177f2e5eb36SAlexander V. Chernikov 
1178f2e5eb36SAlexander V. Chernikov 	if (cp != NULL) {
1179f2e5eb36SAlexander V. Chernikov 		dlen = ALIGN(len) - len;
1180f2e5eb36SAlexander V. Chernikov 		if (buflen < dlen)
1181f2e5eb36SAlexander V. Chernikov 			cp = NULL;
1182f2e5eb36SAlexander V. Chernikov 		else
1183f2e5eb36SAlexander V. Chernikov 			buflen -= dlen;
1184f2e5eb36SAlexander V. Chernikov 	}
1185694ff264SAndrew Gallatin 	len = ALIGN(len);
1186df8bae1dSRodney W. Grimes 
1187f2e5eb36SAlexander V. Chernikov 	if (cp != NULL) {
1188f2e5eb36SAlexander V. Chernikov 		/* fill header iff buffer is large enough */
1189df8bae1dSRodney W. Grimes 		rtm->rtm_version = RTM_VERSION;
1190df8bae1dSRodney W. Grimes 		rtm->rtm_type = type;
1191df8bae1dSRodney W. Grimes 		rtm->rtm_msglen = len;
1192df8bae1dSRodney W. Grimes 	}
1193f2e5eb36SAlexander V. Chernikov 
1194f2e5eb36SAlexander V. Chernikov 	*plen = len;
1195f2e5eb36SAlexander V. Chernikov 
1196f2e5eb36SAlexander V. Chernikov 	if (w != NULL && cp == NULL)
1197f2e5eb36SAlexander V. Chernikov 		return (ENOBUFS);
1198f2e5eb36SAlexander V. Chernikov 
1199f2e5eb36SAlexander V. Chernikov 	return (0);
1200df8bae1dSRodney W. Grimes }
1201df8bae1dSRodney W. Grimes 
1202df8bae1dSRodney W. Grimes /*
1203df8bae1dSRodney W. Grimes  * This routine is called to generate a message from the routing
1204df8bae1dSRodney W. Grimes  * socket indicating that a redirect has occured, a routing lookup
1205df8bae1dSRodney W. Grimes  * has failed, or that a protocol has detected timeouts to a particular
1206df8bae1dSRodney W. Grimes  * destination.
1207df8bae1dSRodney W. Grimes  */
1208df8bae1dSRodney W. Grimes void
1209528737fdSBjoern A. Zeeb rt_missmsg_fib(int type, struct rt_addrinfo *rtinfo, int flags, int error,
1210528737fdSBjoern A. Zeeb     int fibnum)
1211df8bae1dSRodney W. Grimes {
1212becc44d7SSam Leffler 	struct rt_msghdr *rtm;
1213becc44d7SSam Leffler 	struct mbuf *m;
1214df8bae1dSRodney W. Grimes 	struct sockaddr *sa = rtinfo->rti_info[RTAX_DST];
1215df8bae1dSRodney W. Grimes 
1216c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
1217df8bae1dSRodney W. Grimes 		return;
12186db47af4SAlexander V. Chernikov 	m = rtsock_msg_mbuf(type, rtinfo);
12195dfc91d7SLuigi Rizzo 	if (m == NULL)
1220df8bae1dSRodney W. Grimes 		return;
1221528737fdSBjoern A. Zeeb 
12227d9b6df1SAlexander V. Chernikov 	if (fibnum != RT_ALL_FIBS) {
1223528737fdSBjoern A. Zeeb 		KASSERT(fibnum >= 0 && fibnum < rt_numfibs, ("%s: fibnum out "
1224528737fdSBjoern A. Zeeb 		    "of range 0 <= %d < %d", __func__, fibnum, rt_numfibs));
1225528737fdSBjoern A. Zeeb 		M_SETFIB(m, fibnum);
1226528737fdSBjoern A. Zeeb 		m->m_flags |= RTS_FILTER_FIB;
1227528737fdSBjoern A. Zeeb 	}
1228528737fdSBjoern A. Zeeb 
1229df8bae1dSRodney W. Grimes 	rtm = mtod(m, struct rt_msghdr *);
1230df8bae1dSRodney W. Grimes 	rtm->rtm_flags = RTF_DONE | flags;
1231df8bae1dSRodney W. Grimes 	rtm->rtm_errno = error;
1232df8bae1dSRodney W. Grimes 	rtm->rtm_addrs = rtinfo->rti_addrs;
12333ca1a2d6SMax Laier 	rt_dispatch(m, sa ? sa->sa_family : AF_UNSPEC);
1234df8bae1dSRodney W. Grimes }
1235df8bae1dSRodney W. Grimes 
1236528737fdSBjoern A. Zeeb void
1237528737fdSBjoern A. Zeeb rt_missmsg(int type, struct rt_addrinfo *rtinfo, int flags, int error)
1238528737fdSBjoern A. Zeeb {
1239528737fdSBjoern A. Zeeb 
12407d9b6df1SAlexander V. Chernikov 	rt_missmsg_fib(type, rtinfo, flags, error, RT_ALL_FIBS);
1241528737fdSBjoern A. Zeeb }
1242528737fdSBjoern A. Zeeb 
1243df8bae1dSRodney W. Grimes /*
1244df8bae1dSRodney W. Grimes  * This routine is called to generate a message from the routing
1245df8bae1dSRodney W. Grimes  * socket indicating that the status of a network interface has changed.
1246df8bae1dSRodney W. Grimes  */
1247df8bae1dSRodney W. Grimes void
1248becc44d7SSam Leffler rt_ifmsg(struct ifnet *ifp)
1249df8bae1dSRodney W. Grimes {
1250becc44d7SSam Leffler 	struct if_msghdr *ifm;
1251df8bae1dSRodney W. Grimes 	struct mbuf *m;
1252df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
1253df8bae1dSRodney W. Grimes 
1254c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
1255df8bae1dSRodney W. Grimes 		return;
1256df8bae1dSRodney W. Grimes 	bzero((caddr_t)&info, sizeof(info));
12576db47af4SAlexander V. Chernikov 	m = rtsock_msg_mbuf(RTM_IFINFO, &info);
12585dfc91d7SLuigi Rizzo 	if (m == NULL)
1259df8bae1dSRodney W. Grimes 		return;
1260df8bae1dSRodney W. Grimes 	ifm = mtod(m, struct if_msghdr *);
1261df8bae1dSRodney W. Grimes 	ifm->ifm_index = ifp->if_index;
1262292ee7beSRobert Watson 	ifm->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
1263e6485f73SGleb Smirnoff 	if_data_copy(ifp, &ifm->ifm_data);
1264df8bae1dSRodney W. Grimes 	ifm->ifm_addrs = 0;
12653ca1a2d6SMax Laier 	rt_dispatch(m, AF_UNSPEC);
1266df8bae1dSRodney W. Grimes }
1267df8bae1dSRodney W. Grimes 
1268df8bae1dSRodney W. Grimes /*
12694cbac30bSAlexander V. Chernikov  * Announce interface address arrival/withdraw.
12704cbac30bSAlexander V. Chernikov  * Please do not call directly, use rt_addrmsg().
12714cbac30bSAlexander V. Chernikov  * Assume input data to be valid.
12724cbac30bSAlexander V. Chernikov  * Returns 0 on success.
1273df8bae1dSRodney W. Grimes  */
12744cbac30bSAlexander V. Chernikov int
12754cbac30bSAlexander V. Chernikov rtsock_addrmsg(int cmd, struct ifaddr *ifa, int fibnum)
1276df8bae1dSRodney W. Grimes {
1277df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
12784cbac30bSAlexander V. Chernikov 	struct sockaddr *sa;
12794cbac30bSAlexander V. Chernikov 	int ncmd;
12804cbac30bSAlexander V. Chernikov 	struct mbuf *m;
12814cbac30bSAlexander V. Chernikov 	struct ifa_msghdr *ifam;
1282df8bae1dSRodney W. Grimes 	struct ifnet *ifp = ifa->ifa_ifp;
12833deb3649SAlexander V. Chernikov 	struct sockaddr_storage ss;
1284df8bae1dSRodney W. Grimes 
1285c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
12864cbac30bSAlexander V. Chernikov 		return (0);
1287df8bae1dSRodney W. Grimes 
12884cbac30bSAlexander V. Chernikov 	ncmd = cmd == RTM_ADD ? RTM_NEWADDR : RTM_DELADDR;
12894cbac30bSAlexander V. Chernikov 
12904cbac30bSAlexander V. Chernikov 	bzero((caddr_t)&info, sizeof(info));
1291becc44d7SSam Leffler 	info.rti_info[RTAX_IFA] = sa = ifa->ifa_addr;
12924a0d6638SRuslan Ermilov 	info.rti_info[RTAX_IFP] = ifp->if_addr->ifa_addr;
12933deb3649SAlexander V. Chernikov 	info.rti_info[RTAX_NETMASK] = rtsock_fix_netmask(
12943deb3649SAlexander V. Chernikov 	    info.rti_info[RTAX_IFP], ifa->ifa_netmask, &ss);
1295becc44d7SSam Leffler 	info.rti_info[RTAX_BRD] = ifa->ifa_dstaddr;
12966db47af4SAlexander V. Chernikov 	if ((m = rtsock_msg_mbuf(ncmd, &info)) == NULL)
12974cbac30bSAlexander V. Chernikov 		return (ENOBUFS);
1298df8bae1dSRodney W. Grimes 	ifam = mtod(m, struct ifa_msghdr *);
1299df8bae1dSRodney W. Grimes 	ifam->ifam_index = ifp->if_index;
13009753faf5SGleb Smirnoff 	ifam->ifam_metric = ifa->ifa_ifp->if_metric;
1301df8bae1dSRodney W. Grimes 	ifam->ifam_flags = ifa->ifa_flags;
1302df8bae1dSRodney W. Grimes 	ifam->ifam_addrs = info.rti_addrs;
13034cbac30bSAlexander V. Chernikov 
13044cbac30bSAlexander V. Chernikov 	if (fibnum != RT_ALL_FIBS) {
13054cbac30bSAlexander V. Chernikov 		M_SETFIB(m, fibnum);
13064cbac30bSAlexander V. Chernikov 		m->m_flags |= RTS_FILTER_FIB;
1307df8bae1dSRodney W. Grimes 	}
13084cbac30bSAlexander V. Chernikov 
13094cbac30bSAlexander V. Chernikov 	rt_dispatch(m, sa ? sa->sa_family : AF_UNSPEC);
13104cbac30bSAlexander V. Chernikov 
13114cbac30bSAlexander V. Chernikov 	return (0);
13124cbac30bSAlexander V. Chernikov }
13134cbac30bSAlexander V. Chernikov 
13144cbac30bSAlexander V. Chernikov /*
13154cbac30bSAlexander V. Chernikov  * Announce route addition/removal.
13164cbac30bSAlexander V. Chernikov  * Please do not call directly, use rt_routemsg().
13174cbac30bSAlexander V. Chernikov  * Note that @rt data MAY be inconsistent/invalid:
13184cbac30bSAlexander V. Chernikov  * if some userland app sends us "invalid" route message (invalid mask,
13194cbac30bSAlexander V. Chernikov  * no dst, wrong address families, etc...) we need to pass it back
13204cbac30bSAlexander V. Chernikov  * to app (and any other rtsock consumers) with rtm_errno field set to
13214cbac30bSAlexander V. Chernikov  * non-zero value.
13224cbac30bSAlexander V. Chernikov  *
13234cbac30bSAlexander V. Chernikov  * Returns 0 on success.
13244cbac30bSAlexander V. Chernikov  */
13254cbac30bSAlexander V. Chernikov int
13264cbac30bSAlexander V. Chernikov rtsock_routemsg(int cmd, struct ifnet *ifp, int error, struct rtentry *rt,
13274cbac30bSAlexander V. Chernikov     int fibnum)
13284cbac30bSAlexander V. Chernikov {
13294cbac30bSAlexander V. Chernikov 	struct rt_addrinfo info;
13304cbac30bSAlexander V. Chernikov 	struct sockaddr *sa;
13314cbac30bSAlexander V. Chernikov 	struct mbuf *m;
13325dfc91d7SLuigi Rizzo 	struct rt_msghdr *rtm;
13333deb3649SAlexander V. Chernikov 	struct sockaddr_storage ss;
1334df8bae1dSRodney W. Grimes 
1335c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
13364cbac30bSAlexander V. Chernikov 		return (0);
13374cbac30bSAlexander V. Chernikov 
13384cbac30bSAlexander V. Chernikov 	bzero((caddr_t)&info, sizeof(info));
1339becc44d7SSam Leffler 	info.rti_info[RTAX_DST] = sa = rt_key(rt);
13403deb3649SAlexander V. Chernikov 	info.rti_info[RTAX_NETMASK] = rtsock_fix_netmask(sa, rt_mask(rt), &ss);
1341becc44d7SSam Leffler 	info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
13426db47af4SAlexander V. Chernikov 	if ((m = rtsock_msg_mbuf(cmd, &info)) == NULL)
13434cbac30bSAlexander V. Chernikov 		return (ENOBUFS);
1344df8bae1dSRodney W. Grimes 	rtm = mtod(m, struct rt_msghdr *);
1345df8bae1dSRodney W. Grimes 	rtm->rtm_index = ifp->if_index;
1346df8bae1dSRodney W. Grimes 	rtm->rtm_flags |= rt->rt_flags;
1347df8bae1dSRodney W. Grimes 	rtm->rtm_errno = error;
1348df8bae1dSRodney W. Grimes 	rtm->rtm_addrs = info.rti_addrs;
13494cbac30bSAlexander V. Chernikov 
13507d9b6df1SAlexander V. Chernikov 	if (fibnum != RT_ALL_FIBS) {
1351528737fdSBjoern A. Zeeb 		M_SETFIB(m, fibnum);
1352528737fdSBjoern A. Zeeb 		m->m_flags |= RTS_FILTER_FIB;
1353528737fdSBjoern A. Zeeb 	}
13544cbac30bSAlexander V. Chernikov 
13553ca1a2d6SMax Laier 	rt_dispatch(m, sa ? sa->sa_family : AF_UNSPEC);
13564cbac30bSAlexander V. Chernikov 
13574cbac30bSAlexander V. Chernikov 	return (0);
1358df8bae1dSRodney W. Grimes }
1359df8bae1dSRodney W. Grimes 
1360477180fbSGarrett Wollman /*
1361477180fbSGarrett Wollman  * This is the analogue to the rt_newaddrmsg which performs the same
1362477180fbSGarrett Wollman  * function but for multicast group memberhips.  This is easier since
1363477180fbSGarrett Wollman  * there is no route state to worry about.
1364477180fbSGarrett Wollman  */
1365477180fbSGarrett Wollman void
1366becc44d7SSam Leffler rt_newmaddrmsg(int cmd, struct ifmultiaddr *ifma)
1367477180fbSGarrett Wollman {
1368477180fbSGarrett Wollman 	struct rt_addrinfo info;
13695dfc91d7SLuigi Rizzo 	struct mbuf *m = NULL;
1370477180fbSGarrett Wollman 	struct ifnet *ifp = ifma->ifma_ifp;
1371477180fbSGarrett Wollman 	struct ifma_msghdr *ifmam;
1372477180fbSGarrett Wollman 
1373c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
1374477180fbSGarrett Wollman 		return;
1375477180fbSGarrett Wollman 
1376477180fbSGarrett Wollman 	bzero((caddr_t)&info, sizeof(info));
1377becc44d7SSam Leffler 	info.rti_info[RTAX_IFA] = ifma->ifma_addr;
13784a0d6638SRuslan Ermilov 	info.rti_info[RTAX_IFP] = ifp ? ifp->if_addr->ifa_addr : NULL;
1379477180fbSGarrett Wollman 	/*
1380477180fbSGarrett Wollman 	 * If a link-layer address is present, present it as a ``gateway''
1381477180fbSGarrett Wollman 	 * (similarly to how ARP entries, e.g., are presented).
1382477180fbSGarrett Wollman 	 */
1383becc44d7SSam Leffler 	info.rti_info[RTAX_GATEWAY] = ifma->ifma_lladdr;
13846db47af4SAlexander V. Chernikov 	m = rtsock_msg_mbuf(cmd, &info);
1385becc44d7SSam Leffler 	if (m == NULL)
1386477180fbSGarrett Wollman 		return;
1387477180fbSGarrett Wollman 	ifmam = mtod(m, struct ifma_msghdr *);
138875ae0c01SBruce M Simpson 	KASSERT(ifp != NULL, ("%s: link-layer multicast address w/o ifp\n",
138975ae0c01SBruce M Simpson 	    __func__));
1390477180fbSGarrett Wollman 	ifmam->ifmam_index = ifp->if_index;
1391477180fbSGarrett Wollman 	ifmam->ifmam_addrs = info.rti_addrs;
13923ca1a2d6SMax Laier 	rt_dispatch(m, ifma->ifma_addr ? ifma->ifma_addr->sa_family : AF_UNSPEC);
1393477180fbSGarrett Wollman }
139452041295SPoul-Henning Kamp 
1395b83a279fSSam Leffler static struct mbuf *
1396b83a279fSSam Leffler rt_makeifannouncemsg(struct ifnet *ifp, int type, int what,
1397b83a279fSSam Leffler 	struct rt_addrinfo *info)
1398b83a279fSSam Leffler {
1399b83a279fSSam Leffler 	struct if_announcemsghdr *ifan;
1400b83a279fSSam Leffler 	struct mbuf *m;
1401b83a279fSSam Leffler 
1402c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
1403b83a279fSSam Leffler 		return NULL;
1404b83a279fSSam Leffler 	bzero((caddr_t)info, sizeof(*info));
14056db47af4SAlexander V. Chernikov 	m = rtsock_msg_mbuf(type, info);
1406b83a279fSSam Leffler 	if (m != NULL) {
1407b83a279fSSam Leffler 		ifan = mtod(m, struct if_announcemsghdr *);
1408b83a279fSSam Leffler 		ifan->ifan_index = ifp->if_index;
1409b83a279fSSam Leffler 		strlcpy(ifan->ifan_name, ifp->if_xname,
1410b83a279fSSam Leffler 			sizeof(ifan->ifan_name));
1411b83a279fSSam Leffler 		ifan->ifan_what = what;
1412b83a279fSSam Leffler 	}
1413b83a279fSSam Leffler 	return m;
1414b83a279fSSam Leffler }
1415b83a279fSSam Leffler 
1416b83a279fSSam Leffler /*
1417b83a279fSSam Leffler  * This is called to generate routing socket messages indicating
1418b83a279fSSam Leffler  * IEEE80211 wireless events.
1419b83a279fSSam Leffler  * XXX we piggyback on the RTM_IFANNOUNCE msg format in a clumsy way.
1420b83a279fSSam Leffler  */
1421b83a279fSSam Leffler void
1422b83a279fSSam Leffler rt_ieee80211msg(struct ifnet *ifp, int what, void *data, size_t data_len)
1423b83a279fSSam Leffler {
1424b83a279fSSam Leffler 	struct mbuf *m;
1425b83a279fSSam Leffler 	struct rt_addrinfo info;
1426b83a279fSSam Leffler 
1427b83a279fSSam Leffler 	m = rt_makeifannouncemsg(ifp, RTM_IEEE80211, what, &info);
1428b83a279fSSam Leffler 	if (m != NULL) {
1429b83a279fSSam Leffler 		/*
1430b83a279fSSam Leffler 		 * Append the ieee80211 data.  Try to stick it in the
1431b83a279fSSam Leffler 		 * mbuf containing the ifannounce msg; otherwise allocate
1432b83a279fSSam Leffler 		 * a new mbuf and append.
1433b83a279fSSam Leffler 		 *
1434b83a279fSSam Leffler 		 * NB: we assume m is a single mbuf.
1435b83a279fSSam Leffler 		 */
1436b83a279fSSam Leffler 		if (data_len > M_TRAILINGSPACE(m)) {
1437b83a279fSSam Leffler 			struct mbuf *n = m_get(M_NOWAIT, MT_DATA);
1438b83a279fSSam Leffler 			if (n == NULL) {
1439b83a279fSSam Leffler 				m_freem(m);
1440b83a279fSSam Leffler 				return;
1441b83a279fSSam Leffler 			}
1442b83a279fSSam Leffler 			bcopy(data, mtod(n, void *), data_len);
1443b83a279fSSam Leffler 			n->m_len = data_len;
1444b83a279fSSam Leffler 			m->m_next = n;
1445b83a279fSSam Leffler 		} else if (data_len > 0) {
1446b83a279fSSam Leffler 			bcopy(data, mtod(m, u_int8_t *) + m->m_len, data_len);
1447b83a279fSSam Leffler 			m->m_len += data_len;
1448b83a279fSSam Leffler 		}
1449b83a279fSSam Leffler 		if (m->m_flags & M_PKTHDR)
1450b83a279fSSam Leffler 			m->m_pkthdr.len += data_len;
1451b83a279fSSam Leffler 		mtod(m, struct if_announcemsghdr *)->ifan_msglen += data_len;
14523ca1a2d6SMax Laier 		rt_dispatch(m, AF_UNSPEC);
1453b83a279fSSam Leffler 	}
1454b83a279fSSam Leffler }
1455b83a279fSSam Leffler 
1456df8bae1dSRodney W. Grimes /*
14577b6edd04SRuslan Ermilov  * This is called to generate routing socket messages indicating
14587b6edd04SRuslan Ermilov  * network interface arrival and departure.
14597b6edd04SRuslan Ermilov  */
14607b6edd04SRuslan Ermilov void
1461becc44d7SSam Leffler rt_ifannouncemsg(struct ifnet *ifp, int what)
14627b6edd04SRuslan Ermilov {
14637b6edd04SRuslan Ermilov 	struct mbuf *m;
14647b6edd04SRuslan Ermilov 	struct rt_addrinfo info;
14657b6edd04SRuslan Ermilov 
1466b83a279fSSam Leffler 	m = rt_makeifannouncemsg(ifp, RTM_IFANNOUNCE, what, &info);
1467b83a279fSSam Leffler 	if (m != NULL)
14683ca1a2d6SMax Laier 		rt_dispatch(m, AF_UNSPEC);
1469becc44d7SSam Leffler }
1470becc44d7SSam Leffler 
1471becc44d7SSam Leffler static void
14723ca1a2d6SMax Laier rt_dispatch(struct mbuf *m, sa_family_t saf)
1473becc44d7SSam Leffler {
1474d989c7b3SRobert Watson 	struct m_tag *tag;
1475becc44d7SSam Leffler 
1476d989c7b3SRobert Watson 	/*
1477d989c7b3SRobert Watson 	 * Preserve the family from the sockaddr, if any, in an m_tag for
1478d989c7b3SRobert Watson 	 * use when injecting the mbuf into the routing socket buffer from
1479d989c7b3SRobert Watson 	 * the netisr.
1480d989c7b3SRobert Watson 	 */
14813ca1a2d6SMax Laier 	if (saf != AF_UNSPEC) {
1482d989c7b3SRobert Watson 		tag = m_tag_get(PACKET_TAG_RTSOCKFAM, sizeof(unsigned short),
1483d989c7b3SRobert Watson 		    M_NOWAIT);
1484d989c7b3SRobert Watson 		if (tag == NULL) {
1485d989c7b3SRobert Watson 			m_freem(m);
1486d989c7b3SRobert Watson 			return;
1487d989c7b3SRobert Watson 		}
14883ca1a2d6SMax Laier 		*(unsigned short *)(tag + 1) = saf;
1489d989c7b3SRobert Watson 		m_tag_prepend(m, tag);
1490d989c7b3SRobert Watson 	}
149121ca7b57SMarko Zec #ifdef VIMAGE
149221ca7b57SMarko Zec 	if (V_loif)
149321ca7b57SMarko Zec 		m->m_pkthdr.rcvif = V_loif;
149421ca7b57SMarko Zec 	else {
149521ca7b57SMarko Zec 		m_freem(m);
149621ca7b57SMarko Zec 		return;
149721ca7b57SMarko Zec 	}
149821ca7b57SMarko Zec #endif
14993161f583SAndre Oppermann 	netisr_queue(NETISR_ROUTE, m);	/* mbuf is free'd on failure. */
15007b6edd04SRuslan Ermilov }
15017b6edd04SRuslan Ermilov 
15027b6edd04SRuslan Ermilov /*
1503df8bae1dSRodney W. Grimes  * This is used in dumping the kernel table via sysctl().
1504df8bae1dSRodney W. Grimes  */
150537c84183SPoul-Henning Kamp static int
1506becc44d7SSam Leffler sysctl_dumpentry(struct radix_node *rn, void *vw)
1507df8bae1dSRodney W. Grimes {
1508becc44d7SSam Leffler 	struct walkarg *w = vw;
1509becc44d7SSam Leffler 	struct rtentry *rt = (struct rtentry *)rn;
1510df8bae1dSRodney W. Grimes 	int error = 0, size;
1511df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
15123deb3649SAlexander V. Chernikov 	struct sockaddr_storage ss;
1513df8bae1dSRodney W. Grimes 
1514df8bae1dSRodney W. Grimes 	if (w->w_op == NET_RT_FLAGS && !(rt->rt_flags & w->w_arg))
1515df8bae1dSRodney W. Grimes 		return 0;
1516b89e82ddSJamie Gritton 	if ((rt->rt_flags & RTF_HOST) == 0
1517de0bd6f7SBjoern A. Zeeb 	    ? jailed_without_vnet(w->w_req->td->td_ucred)
1518b89e82ddSJamie Gritton 	    : prison_if(w->w_req->td->td_ucred, rt_key(rt)) != 0)
1519813dd6aeSBjoern A. Zeeb 		return (0);
1520df8bae1dSRodney W. Grimes 	bzero((caddr_t)&info, sizeof(info));
1521becc44d7SSam Leffler 	info.rti_info[RTAX_DST] = rt_key(rt);
1522becc44d7SSam Leffler 	info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
15233deb3649SAlexander V. Chernikov 	info.rti_info[RTAX_NETMASK] = rtsock_fix_netmask(rt_key(rt),
15243deb3649SAlexander V. Chernikov 	    rt_mask(rt), &ss);
15256e6b3f7cSQing Li 	info.rti_info[RTAX_GENMASK] = 0;
152628070a0eSRuslan Ermilov 	if (rt->rt_ifp) {
15274a0d6638SRuslan Ermilov 		info.rti_info[RTAX_IFP] = rt->rt_ifp->if_addr->ifa_addr;
1528becc44d7SSam Leffler 		info.rti_info[RTAX_IFA] = rt->rt_ifa->ifa_addr;
152928070a0eSRuslan Ermilov 		if (rt->rt_ifp->if_flags & IFF_POINTOPOINT)
1530becc44d7SSam Leffler 			info.rti_info[RTAX_BRD] = rt->rt_ifa->ifa_dstaddr;
153128070a0eSRuslan Ermilov 	}
1532f2e5eb36SAlexander V. Chernikov 	if ((error = rtsock_msg_buffer(RTM_GET, &info, w, &size)) != 0)
1533f2e5eb36SAlexander V. Chernikov 		return (error);
153452041295SPoul-Henning Kamp 	if (w->w_req && w->w_tmem) {
1535becc44d7SSam Leffler 		struct rt_msghdr *rtm = (struct rt_msghdr *)w->w_tmem;
1536df8bae1dSRodney W. Grimes 
1537f672f56fSQing Li 		if (rt->rt_flags & RTF_GWFLAG_COMPAT)
1538f672f56fSQing Li 			rtm->rtm_flags = RTF_GATEWAY |
1539f672f56fSQing Li 				(rt->rt_flags & ~RTF_GWFLAG_COMPAT);
1540f672f56fSQing Li 		else
1541df8bae1dSRodney W. Grimes 			rtm->rtm_flags = rt->rt_flags;
1542e3a7aa6fSGleb Smirnoff 		rt_getmetrics(rt, &rtm->rtm_rmx);
1543df8bae1dSRodney W. Grimes 		rtm->rtm_index = rt->rt_ifp->if_index;
1544df8bae1dSRodney W. Grimes 		rtm->rtm_errno = rtm->rtm_pid = rtm->rtm_seq = 0;
1545df8bae1dSRodney W. Grimes 		rtm->rtm_addrs = info.rti_addrs;
154652041295SPoul-Henning Kamp 		error = SYSCTL_OUT(w->w_req, (caddr_t)rtm, size);
154752041295SPoul-Henning Kamp 		return (error);
1548df8bae1dSRodney W. Grimes 	}
1549df8bae1dSRodney W. Grimes 	return (error);
1550df8bae1dSRodney W. Grimes }
1551df8bae1dSRodney W. Grimes 
155237c84183SPoul-Henning Kamp static int
15536d076ae8SBjoern A. Zeeb sysctl_iflist_ifml(struct ifnet *ifp, struct rt_addrinfo *info,
15546d076ae8SBjoern A. Zeeb     struct walkarg *w, int len)
15556d076ae8SBjoern A. Zeeb {
15566d076ae8SBjoern A. Zeeb 	struct if_msghdrl *ifm;
1557b245f96cSGleb Smirnoff 	struct if_data *ifd;
1558b245f96cSGleb Smirnoff 
1559b245f96cSGleb Smirnoff 	ifm = (struct if_msghdrl *)w->w_tmem;
15606d076ae8SBjoern A. Zeeb 
15616d076ae8SBjoern A. Zeeb #ifdef COMPAT_FREEBSD32
15626d076ae8SBjoern A. Zeeb 	if (w->w_req->flags & SCTL_MASK32) {
15636d076ae8SBjoern A. Zeeb 		struct if_msghdrl32 *ifm32;
15646d076ae8SBjoern A. Zeeb 
1565b245f96cSGleb Smirnoff 		ifm32 = (struct if_msghdrl32 *)ifm;
15666d076ae8SBjoern A. Zeeb 		ifm32->ifm_addrs = info->rti_addrs;
15676d076ae8SBjoern A. Zeeb 		ifm32->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
15686d076ae8SBjoern A. Zeeb 		ifm32->ifm_index = ifp->if_index;
15696d076ae8SBjoern A. Zeeb 		ifm32->_ifm_spare1 = 0;
15706d076ae8SBjoern A. Zeeb 		ifm32->ifm_len = sizeof(*ifm32);
15716d076ae8SBjoern A. Zeeb 		ifm32->ifm_data_off = offsetof(struct if_msghdrl32, ifm_data);
1572b245f96cSGleb Smirnoff 		ifd = &ifm32->ifm_data;
1573b245f96cSGleb Smirnoff 	} else
15746d076ae8SBjoern A. Zeeb #endif
1575b245f96cSGleb Smirnoff 	{
15766d076ae8SBjoern A. Zeeb 		ifm->ifm_addrs = info->rti_addrs;
15776d076ae8SBjoern A. Zeeb 		ifm->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
15786d076ae8SBjoern A. Zeeb 		ifm->ifm_index = ifp->if_index;
15796d076ae8SBjoern A. Zeeb 		ifm->_ifm_spare1 = 0;
15806d076ae8SBjoern A. Zeeb 		ifm->ifm_len = sizeof(*ifm);
15816d076ae8SBjoern A. Zeeb 		ifm->ifm_data_off = offsetof(struct if_msghdrl, ifm_data);
1582b245f96cSGleb Smirnoff 		ifd = &ifm->ifm_data;
1583b245f96cSGleb Smirnoff 	}
15846d076ae8SBjoern A. Zeeb 
1585e6485f73SGleb Smirnoff 	if_data_copy(ifp, ifd);
1586b245f96cSGleb Smirnoff 
15876d076ae8SBjoern A. Zeeb 	return (SYSCTL_OUT(w->w_req, (caddr_t)ifm, len));
15886d076ae8SBjoern A. Zeeb }
15896d076ae8SBjoern A. Zeeb 
15906d076ae8SBjoern A. Zeeb static int
15916d076ae8SBjoern A. Zeeb sysctl_iflist_ifm(struct ifnet *ifp, struct rt_addrinfo *info,
15926d076ae8SBjoern A. Zeeb     struct walkarg *w, int len)
15936d076ae8SBjoern A. Zeeb {
15946d076ae8SBjoern A. Zeeb 	struct if_msghdr *ifm;
1595b245f96cSGleb Smirnoff 	struct if_data *ifd;
1596b245f96cSGleb Smirnoff 
1597b245f96cSGleb Smirnoff 	ifm = (struct if_msghdr *)w->w_tmem;
15986d076ae8SBjoern A. Zeeb 
15996d076ae8SBjoern A. Zeeb #ifdef COMPAT_FREEBSD32
16006d076ae8SBjoern A. Zeeb 	if (w->w_req->flags & SCTL_MASK32) {
16016d076ae8SBjoern A. Zeeb 		struct if_msghdr32 *ifm32;
16026d076ae8SBjoern A. Zeeb 
1603b245f96cSGleb Smirnoff 		ifm32 = (struct if_msghdr32 *)ifm;
16046d076ae8SBjoern A. Zeeb 		ifm32->ifm_addrs = info->rti_addrs;
16056d076ae8SBjoern A. Zeeb 		ifm32->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
16066d076ae8SBjoern A. Zeeb 		ifm32->ifm_index = ifp->if_index;
1607b245f96cSGleb Smirnoff 		ifd = &ifm32->ifm_data;
1608b245f96cSGleb Smirnoff 	} else
16096d076ae8SBjoern A. Zeeb #endif
1610b245f96cSGleb Smirnoff 	{
16116d076ae8SBjoern A. Zeeb 		ifm->ifm_addrs = info->rti_addrs;
16126d076ae8SBjoern A. Zeeb 		ifm->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
16136d076ae8SBjoern A. Zeeb 		ifm->ifm_index = ifp->if_index;
1614b245f96cSGleb Smirnoff 		ifd = &ifm->ifm_data;
1615b245f96cSGleb Smirnoff 	}
16166d076ae8SBjoern A. Zeeb 
1617e6485f73SGleb Smirnoff 	if_data_copy(ifp, ifd);
16182d70c0deSGleb Smirnoff 
16196d076ae8SBjoern A. Zeeb 	return (SYSCTL_OUT(w->w_req, (caddr_t)ifm, len));
16206d076ae8SBjoern A. Zeeb }
16216d076ae8SBjoern A. Zeeb 
16226d076ae8SBjoern A. Zeeb static int
16236d076ae8SBjoern A. Zeeb sysctl_iflist_ifaml(struct ifaddr *ifa, struct rt_addrinfo *info,
16246d076ae8SBjoern A. Zeeb     struct walkarg *w, int len)
16256d076ae8SBjoern A. Zeeb {
16266d076ae8SBjoern A. Zeeb 	struct ifa_msghdrl *ifam;
1627b245f96cSGleb Smirnoff 	struct if_data *ifd;
1628b245f96cSGleb Smirnoff 
1629b245f96cSGleb Smirnoff 	ifam = (struct ifa_msghdrl *)w->w_tmem;
16306d076ae8SBjoern A. Zeeb 
16316d076ae8SBjoern A. Zeeb #ifdef COMPAT_FREEBSD32
16326d076ae8SBjoern A. Zeeb 	if (w->w_req->flags & SCTL_MASK32) {
16336d076ae8SBjoern A. Zeeb 		struct ifa_msghdrl32 *ifam32;
16346d076ae8SBjoern A. Zeeb 
1635b245f96cSGleb Smirnoff 		ifam32 = (struct ifa_msghdrl32 *)ifam;
16366d076ae8SBjoern A. Zeeb 		ifam32->ifam_addrs = info->rti_addrs;
16376d076ae8SBjoern A. Zeeb 		ifam32->ifam_flags = ifa->ifa_flags;
16386d076ae8SBjoern A. Zeeb 		ifam32->ifam_index = ifa->ifa_ifp->if_index;
16396d076ae8SBjoern A. Zeeb 		ifam32->_ifam_spare1 = 0;
16406d076ae8SBjoern A. Zeeb 		ifam32->ifam_len = sizeof(*ifam32);
16416d076ae8SBjoern A. Zeeb 		ifam32->ifam_data_off =
16426d076ae8SBjoern A. Zeeb 		    offsetof(struct ifa_msghdrl32, ifam_data);
16439753faf5SGleb Smirnoff 		ifam32->ifam_metric = ifa->ifa_ifp->if_metric;
1644b245f96cSGleb Smirnoff 		ifd = &ifam32->ifam_data;
1645b245f96cSGleb Smirnoff 	} else
16466d076ae8SBjoern A. Zeeb #endif
1647b245f96cSGleb Smirnoff 	{
16486d076ae8SBjoern A. Zeeb 		ifam->ifam_addrs = info->rti_addrs;
16496d076ae8SBjoern A. Zeeb 		ifam->ifam_flags = ifa->ifa_flags;
16506d076ae8SBjoern A. Zeeb 		ifam->ifam_index = ifa->ifa_ifp->if_index;
16516d076ae8SBjoern A. Zeeb 		ifam->_ifam_spare1 = 0;
16526d076ae8SBjoern A. Zeeb 		ifam->ifam_len = sizeof(*ifam);
16536d076ae8SBjoern A. Zeeb 		ifam->ifam_data_off = offsetof(struct ifa_msghdrl, ifam_data);
16549753faf5SGleb Smirnoff 		ifam->ifam_metric = ifa->ifa_ifp->if_metric;
1655b245f96cSGleb Smirnoff 		ifd = &ifam->ifam_data;
1656b245f96cSGleb Smirnoff 	}
16576d076ae8SBjoern A. Zeeb 
1658b245f96cSGleb Smirnoff 	bzero(ifd, sizeof(*ifd));
1659b245f96cSGleb Smirnoff 	ifd->ifi_datalen = sizeof(struct if_data);
1660b245f96cSGleb Smirnoff 	ifd->ifi_ipackets = counter_u64_fetch(ifa->ifa_ipackets);
1661b245f96cSGleb Smirnoff 	ifd->ifi_opackets = counter_u64_fetch(ifa->ifa_opackets);
1662b245f96cSGleb Smirnoff 	ifd->ifi_ibytes = counter_u64_fetch(ifa->ifa_ibytes);
1663b245f96cSGleb Smirnoff 	ifd->ifi_obytes = counter_u64_fetch(ifa->ifa_obytes);
16647caf4ab7SGleb Smirnoff 
16656d076ae8SBjoern A. Zeeb 	/* Fixup if_data carp(4) vhid. */
16666d076ae8SBjoern A. Zeeb 	if (carp_get_vhid_p != NULL)
1667b245f96cSGleb Smirnoff 		ifd->ifi_vhid = (*carp_get_vhid_p)(ifa);
16686d076ae8SBjoern A. Zeeb 
16696d076ae8SBjoern A. Zeeb 	return (SYSCTL_OUT(w->w_req, w->w_tmem, len));
16706d076ae8SBjoern A. Zeeb }
16716d076ae8SBjoern A. Zeeb 
16726d076ae8SBjoern A. Zeeb static int
16736d076ae8SBjoern A. Zeeb sysctl_iflist_ifam(struct ifaddr *ifa, struct rt_addrinfo *info,
16746d076ae8SBjoern A. Zeeb     struct walkarg *w, int len)
16756d076ae8SBjoern A. Zeeb {
16766d076ae8SBjoern A. Zeeb 	struct ifa_msghdr *ifam;
16776d076ae8SBjoern A. Zeeb 
16786d076ae8SBjoern A. Zeeb 	ifam = (struct ifa_msghdr *)w->w_tmem;
16796d076ae8SBjoern A. Zeeb 	ifam->ifam_addrs = info->rti_addrs;
16806d076ae8SBjoern A. Zeeb 	ifam->ifam_flags = ifa->ifa_flags;
16816d076ae8SBjoern A. Zeeb 	ifam->ifam_index = ifa->ifa_ifp->if_index;
16829753faf5SGleb Smirnoff 	ifam->ifam_metric = ifa->ifa_ifp->if_metric;
16836d076ae8SBjoern A. Zeeb 
16846d076ae8SBjoern A. Zeeb 	return (SYSCTL_OUT(w->w_req, w->w_tmem, len));
16856d076ae8SBjoern A. Zeeb }
16866d076ae8SBjoern A. Zeeb 
16876d076ae8SBjoern A. Zeeb static int
1688becc44d7SSam Leffler sysctl_iflist(int af, struct walkarg *w)
1689df8bae1dSRodney W. Grimes {
1690becc44d7SSam Leffler 	struct ifnet *ifp;
1691becc44d7SSam Leffler 	struct ifaddr *ifa;
1692df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
1693df8bae1dSRodney W. Grimes 	int len, error = 0;
16943deb3649SAlexander V. Chernikov 	struct sockaddr_storage ss;
1695df8bae1dSRodney W. Grimes 
1696df8bae1dSRodney W. Grimes 	bzero((caddr_t)&info, sizeof(info));
16975c9fa630SHiroki Sato 	IFNET_RLOCK_NOSLEEP();
1698603724d3SBjoern A. Zeeb 	TAILQ_FOREACH(ifp, &V_ifnet, if_link) {
1699df8bae1dSRodney W. Grimes 		if (w->w_arg && w->w_arg != ifp->if_index)
1700df8bae1dSRodney W. Grimes 			continue;
1701137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
17024a0d6638SRuslan Ermilov 		ifa = ifp->if_addr;
1703becc44d7SSam Leffler 		info.rti_info[RTAX_IFP] = ifa->ifa_addr;
1704f2e5eb36SAlexander V. Chernikov 		error = rtsock_msg_buffer(RTM_IFINFO, &info, w, &len);
1705f2e5eb36SAlexander V. Chernikov 		if (error != 0)
1706f2e5eb36SAlexander V. Chernikov 			goto done;
17075dfc91d7SLuigi Rizzo 		info.rti_info[RTAX_IFP] = NULL;
170852041295SPoul-Henning Kamp 		if (w->w_req && w->w_tmem) {
17096d076ae8SBjoern A. Zeeb 			if (w->w_op == NET_RT_IFLISTL)
17106d076ae8SBjoern A. Zeeb 				error = sysctl_iflist_ifml(ifp, &info, w, len);
17116d076ae8SBjoern A. Zeeb 			else
17126d076ae8SBjoern A. Zeeb 				error = sysctl_iflist_ifm(ifp, &info, w, len);
1713df440948SPoul-Henning Kamp 			if (error)
1714a35b06c5SJonathan Lemon 				goto done;
1715df8bae1dSRodney W. Grimes 		}
17165dfc91d7SLuigi Rizzo 		while ((ifa = TAILQ_NEXT(ifa, ifa_link)) != NULL) {
1717df8bae1dSRodney W. Grimes 			if (af && af != ifa->ifa_addr->sa_family)
1718df8bae1dSRodney W. Grimes 				continue;
1719b89e82ddSJamie Gritton 			if (prison_if(w->w_req->td->td_ucred,
1720b89e82ddSJamie Gritton 			    ifa->ifa_addr) != 0)
172175c13541SPoul-Henning Kamp 				continue;
1722becc44d7SSam Leffler 			info.rti_info[RTAX_IFA] = ifa->ifa_addr;
17233deb3649SAlexander V. Chernikov 			info.rti_info[RTAX_NETMASK] = rtsock_fix_netmask(
17243deb3649SAlexander V. Chernikov 			    ifa->ifa_addr, ifa->ifa_netmask, &ss);
1725becc44d7SSam Leffler 			info.rti_info[RTAX_BRD] = ifa->ifa_dstaddr;
1726f2e5eb36SAlexander V. Chernikov 			error = rtsock_msg_buffer(RTM_NEWADDR, &info, w, &len);
1727f2e5eb36SAlexander V. Chernikov 			if (error != 0)
1728f2e5eb36SAlexander V. Chernikov 				goto done;
172952041295SPoul-Henning Kamp 			if (w->w_req && w->w_tmem) {
17306d076ae8SBjoern A. Zeeb 				if (w->w_op == NET_RT_IFLISTL)
17316d076ae8SBjoern A. Zeeb 					error = sysctl_iflist_ifaml(ifa, &info,
17326d076ae8SBjoern A. Zeeb 					    w, len);
17336d076ae8SBjoern A. Zeeb 				else
17346d076ae8SBjoern A. Zeeb 					error = sysctl_iflist_ifam(ifa, &info,
17356d076ae8SBjoern A. Zeeb 					    w, len);
1736df440948SPoul-Henning Kamp 				if (error)
1737a35b06c5SJonathan Lemon 					goto done;
1738df8bae1dSRodney W. Grimes 			}
1739df8bae1dSRodney W. Grimes 		}
1740137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
17413deb3649SAlexander V. Chernikov 		info.rti_info[RTAX_IFA] = NULL;
17423deb3649SAlexander V. Chernikov 		info.rti_info[RTAX_NETMASK] = NULL;
17435dfc91d7SLuigi Rizzo 		info.rti_info[RTAX_BRD] = NULL;
1744df8bae1dSRodney W. Grimes 	}
1745a35b06c5SJonathan Lemon done:
1746ee7c7feeSBjoern A. Zeeb 	if (ifp != NULL)
1747137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
17485c9fa630SHiroki Sato 	IFNET_RUNLOCK_NOSLEEP();
1749a35b06c5SJonathan Lemon 	return (error);
1750df8bae1dSRodney W. Grimes }
1751df8bae1dSRodney W. Grimes 
1752ebda3fc3SBjoern A. Zeeb static int
17539b98ee2cSLuigi Rizzo sysctl_ifmalist(int af, struct walkarg *w)
175405b2efe0SBruce M Simpson {
17559b98ee2cSLuigi Rizzo 	struct ifnet *ifp;
175605b2efe0SBruce M Simpson 	struct ifmultiaddr *ifma;
175705b2efe0SBruce M Simpson 	struct	rt_addrinfo info;
175805b2efe0SBruce M Simpson 	int	len, error = 0;
17599b98ee2cSLuigi Rizzo 	struct ifaddr *ifa;
176005b2efe0SBruce M Simpson 
176105b2efe0SBruce M Simpson 	bzero((caddr_t)&info, sizeof(info));
17625c9fa630SHiroki Sato 	IFNET_RLOCK_NOSLEEP();
1763603724d3SBjoern A. Zeeb 	TAILQ_FOREACH(ifp, &V_ifnet, if_link) {
176405b2efe0SBruce M Simpson 		if (w->w_arg && w->w_arg != ifp->if_index)
176505b2efe0SBruce M Simpson 			continue;
17664a0d6638SRuslan Ermilov 		ifa = ifp->if_addr;
1767913af518SLuigi Rizzo 		info.rti_info[RTAX_IFP] = ifa ? ifa->ifa_addr : NULL;
1768137f91e8SJohn Baldwin 		IF_ADDR_RLOCK(ifp);
176905b2efe0SBruce M Simpson 		TAILQ_FOREACH(ifma, &ifp->if_multiaddrs, ifma_link) {
177005b2efe0SBruce M Simpson 			if (af && af != ifma->ifma_addr->sa_family)
177105b2efe0SBruce M Simpson 				continue;
1772b89e82ddSJamie Gritton 			if (prison_if(w->w_req->td->td_ucred,
1773b89e82ddSJamie Gritton 			    ifma->ifma_addr) != 0)
177405b2efe0SBruce M Simpson 				continue;
177505b2efe0SBruce M Simpson 			info.rti_info[RTAX_IFA] = ifma->ifma_addr;
1776913af518SLuigi Rizzo 			info.rti_info[RTAX_GATEWAY] =
1777913af518SLuigi Rizzo 			    (ifma->ifma_addr->sa_family != AF_LINK) ?
1778913af518SLuigi Rizzo 			    ifma->ifma_lladdr : NULL;
1779c9f98940SAlexander V. Chernikov 			error = rtsock_msg_buffer(RTM_NEWMADDR, &info, w, &len);
1780f2e5eb36SAlexander V. Chernikov 			if (error != 0)
1781f2e5eb36SAlexander V. Chernikov 				goto done;
178205b2efe0SBruce M Simpson 			if (w->w_req && w->w_tmem) {
17839b98ee2cSLuigi Rizzo 				struct ifma_msghdr *ifmam;
178405b2efe0SBruce M Simpson 
178505b2efe0SBruce M Simpson 				ifmam = (struct ifma_msghdr *)w->w_tmem;
178605b2efe0SBruce M Simpson 				ifmam->ifmam_index = ifma->ifma_ifp->if_index;
178705b2efe0SBruce M Simpson 				ifmam->ifmam_flags = 0;
178805b2efe0SBruce M Simpson 				ifmam->ifmam_addrs = info.rti_addrs;
178905b2efe0SBruce M Simpson 				error = SYSCTL_OUT(w->w_req, w->w_tmem, len);
1790fe0fc7efSChristian S.J. Peron 				if (error) {
1791137f91e8SJohn Baldwin 					IF_ADDR_RUNLOCK(ifp);
179205b2efe0SBruce M Simpson 					goto done;
179305b2efe0SBruce M Simpson 				}
179405b2efe0SBruce M Simpson 			}
179505b2efe0SBruce M Simpson 		}
1796137f91e8SJohn Baldwin 		IF_ADDR_RUNLOCK(ifp);
1797fe0fc7efSChristian S.J. Peron 	}
179805b2efe0SBruce M Simpson done:
17995c9fa630SHiroki Sato 	IFNET_RUNLOCK_NOSLEEP();
180005b2efe0SBruce M Simpson 	return (error);
180105b2efe0SBruce M Simpson }
180205b2efe0SBruce M Simpson 
180352041295SPoul-Henning Kamp static int
180482d9ae4eSPoul-Henning Kamp sysctl_rtsock(SYSCTL_HANDLER_ARGS)
1805df8bae1dSRodney W. Grimes {
180652041295SPoul-Henning Kamp 	int	*name = (int *)arg1;
180752041295SPoul-Henning Kamp 	u_int	namelen = arg2;
1808*61eee0e2SAlexander V. Chernikov 	struct rib_head *rnh = NULL; /* silence compiler. */
1809fe0fc7efSChristian S.J. Peron 	int	i, lim, error = EINVAL;
18104825b1e0SHiroki Sato 	int	fib = 0;
1811df8bae1dSRodney W. Grimes 	u_char	af;
1812df8bae1dSRodney W. Grimes 	struct	walkarg w;
1813df8bae1dSRodney W. Grimes 
181452041295SPoul-Henning Kamp 	name ++;
181552041295SPoul-Henning Kamp 	namelen--;
181652041295SPoul-Henning Kamp 	if (req->newptr)
1817df8bae1dSRodney W. Grimes 		return (EPERM);
18184825b1e0SHiroki Sato 	if (name[1] == NET_RT_DUMP) {
18194825b1e0SHiroki Sato 		if (namelen == 3)
18204825b1e0SHiroki Sato 			fib = req->td->td_proc->p_fibnum;
18214825b1e0SHiroki Sato 		else if (namelen == 4)
18227d9b6df1SAlexander V. Chernikov 			fib = (name[3] == RT_ALL_FIBS) ?
18234825b1e0SHiroki Sato 			    req->td->td_proc->p_fibnum : name[3];
18244825b1e0SHiroki Sato 		else
18254825b1e0SHiroki Sato 			return ((namelen < 3) ? EISDIR : ENOTDIR);
18264825b1e0SHiroki Sato 		if (fib < 0 || fib >= rt_numfibs)
18274825b1e0SHiroki Sato 			return (EINVAL);
18284825b1e0SHiroki Sato 	} else if (namelen != 3)
1829f7a54d06SCrist J. Clark 		return ((namelen < 3) ? EISDIR : ENOTDIR);
1830df8bae1dSRodney W. Grimes 	af = name[0];
1831b2aaf46eSJeffrey Hsu 	if (af > AF_MAX)
1832b2aaf46eSJeffrey Hsu 		return (EINVAL);
18336b96f1afSLuigi Rizzo 	bzero(&w, sizeof(w));
1834df8bae1dSRodney W. Grimes 	w.w_op = name[1];
1835df8bae1dSRodney W. Grimes 	w.w_arg = name[2];
183652041295SPoul-Henning Kamp 	w.w_req = req;
1837df8bae1dSRodney W. Grimes 
1838fe0fc7efSChristian S.J. Peron 	error = sysctl_wire_old_buffer(req, 0);
1839fe0fc7efSChristian S.J. Peron 	if (error)
1840fe0fc7efSChristian S.J. Peron 		return (error);
1841f2e5eb36SAlexander V. Chernikov 
1842f2e5eb36SAlexander V. Chernikov 	/*
1843f2e5eb36SAlexander V. Chernikov 	 * Allocate reply buffer in advance.
1844f2e5eb36SAlexander V. Chernikov 	 * All rtsock messages has maximum length of u_short.
1845f2e5eb36SAlexander V. Chernikov 	 */
1846f2e5eb36SAlexander V. Chernikov 	w.w_tmemsize = 65536;
1847f2e5eb36SAlexander V. Chernikov 	w.w_tmem = malloc(w.w_tmemsize, M_TEMP, M_WAITOK);
1848f2e5eb36SAlexander V. Chernikov 
1849df8bae1dSRodney W. Grimes 	switch (w.w_op) {
1850df8bae1dSRodney W. Grimes 
1851df8bae1dSRodney W. Grimes 	case NET_RT_DUMP:
1852df8bae1dSRodney W. Grimes 	case NET_RT_FLAGS:
1853a8b76c8fSLuigi Rizzo 		if (af == 0) {			/* dump all tables */
1854a8b76c8fSLuigi Rizzo 			i = 1;
1855a8b76c8fSLuigi Rizzo 			lim = AF_MAX;
1856a8b76c8fSLuigi Rizzo 		} else				/* dump only one table */
1857a8b76c8fSLuigi Rizzo 			i = lim = af;
18588eca593cSQing Li 
18598eca593cSQing Li 		/*
18608eca593cSQing Li 		 * take care of llinfo entries, the caller must
18618eca593cSQing Li 		 * specify an AF
18628eca593cSQing Li 		 */
186314981d80SQing Li 		if (w.w_op == NET_RT_FLAGS &&
186482b334e8SQing Li 		    (w.w_arg == 0 || w.w_arg & RTF_LLINFO)) {
18658eca593cSQing Li 			if (af != 0)
18668eca593cSQing Li 				error = lltable_sysctl_dumparp(af, w.w_req);
18678eca593cSQing Li 			else
18688eca593cSQing Li 				error = EINVAL;
18698eca593cSQing Li 			break;
18708eca593cSQing Li 		}
18718eca593cSQing Li 		/*
18728eca593cSQing Li 		 * take care of routing entries
18738eca593cSQing Li 		 */
187420b0cdb7SBjoern A. Zeeb 		for (error = 0; error == 0 && i <= lim; i++) {
18754825b1e0SHiroki Sato 			rnh = rt_tables_get_rnh(fib, i);
1876c2c2a7c1SBjoern A. Zeeb 			if (rnh != NULL) {
1877*61eee0e2SAlexander V. Chernikov 				RIB_RLOCK(rnh);
1878*61eee0e2SAlexander V. Chernikov 			    	error = rnh->rnh_walktree(&rnh->head,
1879fe0fc7efSChristian S.J. Peron 				    sysctl_dumpentry, &w);
1880*61eee0e2SAlexander V. Chernikov 				RIB_RUNLOCK(rnh);
1881a8b76c8fSLuigi Rizzo 			} else if (af != 0)
1882956b0b65SJeffrey Hsu 				error = EAFNOSUPPORT;
188320b0cdb7SBjoern A. Zeeb 		}
1884df8bae1dSRodney W. Grimes 		break;
1885df8bae1dSRodney W. Grimes 
1886df8bae1dSRodney W. Grimes 	case NET_RT_IFLIST:
18876d076ae8SBjoern A. Zeeb 	case NET_RT_IFLISTL:
1888df8bae1dSRodney W. Grimes 		error = sysctl_iflist(af, &w);
188905b2efe0SBruce M Simpson 		break;
189005b2efe0SBruce M Simpson 
189105b2efe0SBruce M Simpson 	case NET_RT_IFMALIST:
189205b2efe0SBruce M Simpson 		error = sysctl_ifmalist(af, &w);
189305b2efe0SBruce M Simpson 		break;
1894df8bae1dSRodney W. Grimes 	}
1895f2e5eb36SAlexander V. Chernikov 
1896f2e5eb36SAlexander V. Chernikov 	free(w.w_tmem, M_TEMP);
1897df8bae1dSRodney W. Grimes 	return (error);
1898df8bae1dSRodney W. Grimes }
1899df8bae1dSRodney W. Grimes 
19006472ac3dSEd Schouten static SYSCTL_NODE(_net, PF_ROUTE, routetable, CTLFLAG_RD, sysctl_rtsock, "");
190152041295SPoul-Henning Kamp 
1902df8bae1dSRodney W. Grimes /*
1903df8bae1dSRodney W. Grimes  * Definitions of protocols supported in the ROUTE domain.
1904df8bae1dSRodney W. Grimes  */
1905df8bae1dSRodney W. Grimes 
19065b1c0294SDavid E. O'Brien static struct domain routedomain;		/* or at least forward */
1907df8bae1dSRodney W. Grimes 
190852041295SPoul-Henning Kamp static struct protosw routesw[] = {
1909303989a2SRuslan Ermilov {
1910303989a2SRuslan Ermilov 	.pr_type =		SOCK_RAW,
1911303989a2SRuslan Ermilov 	.pr_domain =		&routedomain,
1912303989a2SRuslan Ermilov 	.pr_flags =		PR_ATOMIC|PR_ADDR,
1913303989a2SRuslan Ermilov 	.pr_output =		route_output,
1914303989a2SRuslan Ermilov 	.pr_ctlinput =		raw_ctlinput,
1915303989a2SRuslan Ermilov 	.pr_init =		raw_init,
1916303989a2SRuslan Ermilov 	.pr_usrreqs =		&route_usrreqs
1917df8bae1dSRodney W. Grimes }
1918df8bae1dSRodney W. Grimes };
1919df8bae1dSRodney W. Grimes 
1920303989a2SRuslan Ermilov static struct domain routedomain = {
1921303989a2SRuslan Ermilov 	.dom_family =		PF_ROUTE,
1922303989a2SRuslan Ermilov 	.dom_name =		 "route",
1923303989a2SRuslan Ermilov 	.dom_protosw =		routesw,
1924303989a2SRuslan Ermilov 	.dom_protoswNPROTOSW =	&routesw[sizeof(routesw)/sizeof(routesw[0])]
1925303989a2SRuslan Ermilov };
192678a82810SGarrett Wollman 
1927d0728d71SRobert Watson VNET_DOMAIN_SET(route);
1928