xref: /freebsd/sys/net/rtsock.c (revision 33a0803f000fc52a50465a65d3e8b64168557ecf)
1c398230bSWarner Losh /*-
251369649SPedro F. Giffuni  * SPDX-License-Identifier: BSD-3-Clause
351369649SPedro F. Giffuni  *
4df8bae1dSRodney W. Grimes  * Copyright (c) 1988, 1991, 1993
5df8bae1dSRodney W. Grimes  *	The Regents of the University of California.  All rights reserved.
6df8bae1dSRodney W. Grimes  *
7df8bae1dSRodney W. Grimes  * Redistribution and use in source and binary forms, with or without
8df8bae1dSRodney W. Grimes  * modification, are permitted provided that the following conditions
9df8bae1dSRodney W. Grimes  * are met:
10df8bae1dSRodney W. Grimes  * 1. Redistributions of source code must retain the above copyright
11df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer.
12df8bae1dSRodney W. Grimes  * 2. Redistributions in binary form must reproduce the above copyright
13df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer in the
14df8bae1dSRodney W. Grimes  *    documentation and/or other materials provided with the distribution.
15fbbd9655SWarner Losh  * 3. Neither the name of the University nor the names of its contributors
16df8bae1dSRodney W. Grimes  *    may be used to endorse or promote products derived from this software
17df8bae1dSRodney W. Grimes  *    without specific prior written permission.
18df8bae1dSRodney W. Grimes  *
19df8bae1dSRodney W. Grimes  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
20df8bae1dSRodney W. Grimes  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21df8bae1dSRodney W. Grimes  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22df8bae1dSRodney W. Grimes  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
23df8bae1dSRodney W. Grimes  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24df8bae1dSRodney W. Grimes  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25df8bae1dSRodney W. Grimes  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26df8bae1dSRodney W. Grimes  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27df8bae1dSRodney W. Grimes  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28df8bae1dSRodney W. Grimes  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29df8bae1dSRodney W. Grimes  * SUCH DAMAGE.
30df8bae1dSRodney W. Grimes  *
3128070a0eSRuslan Ermilov  *	@(#)rtsock.c	8.7 (Berkeley) 10/12/95
32c3aac50fSPeter Wemm  * $FreeBSD$
33df8bae1dSRodney W. Grimes  */
348b6acd2bSConrad Meyer #include "opt_ddb.h"
35fedeb08bSAlexander V. Chernikov #include "opt_route.h"
36413628a7SBjoern A. Zeeb #include "opt_inet.h"
37413628a7SBjoern A. Zeeb #include "opt_inet6.h"
38e440aed9SQing Li 
39df8bae1dSRodney W. Grimes #include <sys/param.h>
40960ed29cSSeigo Tanimura #include <sys/jail.h>
41413628a7SBjoern A. Zeeb #include <sys/kernel.h>
42d0728d71SRobert Watson #include <sys/domain.h>
43609ff41fSWarner Losh #include <sys/lock.h>
444d1d4912SBruce Evans #include <sys/malloc.h>
45df8bae1dSRodney W. Grimes #include <sys/mbuf.h>
46acd3428bSRobert Watson #include <sys/priv.h>
47960ed29cSSeigo Tanimura #include <sys/proc.h>
48960ed29cSSeigo Tanimura #include <sys/protosw.h>
4920efcfc6SAndrey V. Elsukov #include <sys/rmlock.h>
503120b9d4SKip Macy #include <sys/rwlock.h>
51960ed29cSSeigo Tanimura #include <sys/signalvar.h>
52df8bae1dSRodney W. Grimes #include <sys/socket.h>
53df8bae1dSRodney W. Grimes #include <sys/socketvar.h>
54960ed29cSSeigo Tanimura #include <sys/sysctl.h>
55960ed29cSSeigo Tanimura #include <sys/systm.h>
56df8bae1dSRodney W. Grimes 
57df8bae1dSRodney W. Grimes #include <net/if.h>
5876039bc8SGleb Smirnoff #include <net/if_var.h>
598eca593cSQing Li #include <net/if_dl.h>
606e6b3f7cSQing Li #include <net/if_llatbl.h>
610ed6142bSQing Li #include <net/if_types.h>
62d989c7b3SRobert Watson #include <net/netisr.h>
63df8bae1dSRodney W. Grimes #include <net/raw_cb.h>
64960ed29cSSeigo Tanimura #include <net/route.h>
65a287a973SAlexander V. Chernikov #include <net/route/route_ctl.h>
66e7d8af4fSAlexander V. Chernikov #include <net/route/route_var.h>
674b79449eSBjoern A. Zeeb #include <net/vnet.h>
68df8bae1dSRodney W. Grimes 
695a59cefcSBosko Milekic #include <netinet/in.h>
70c7ab6602SQing Li #include <netinet/if_ether.h>
7108b68b0eSGleb Smirnoff #include <netinet/ip_carp.h>
72413628a7SBjoern A. Zeeb #ifdef INET6
732fe5a794SAlexander V. Chernikov #include <netinet6/in6_var.h>
740bebb544SHiroki Sato #include <netinet6/ip6_var.h>
75413628a7SBjoern A. Zeeb #include <netinet6/scope6_var.h>
76413628a7SBjoern A. Zeeb #endif
77a6663252SAlexander V. Chernikov #include <net/route/nhop.h>
785a59cefcSBosko Milekic 
790e87bab6SAlexander V. Chernikov #define	DEBUG_MOD_NAME	rtsock
800e87bab6SAlexander V. Chernikov #define	DEBUG_MAX_LEVEL	LOG_DEBUG
810e87bab6SAlexander V. Chernikov #include <net/route/route_debug.h>
82*33a0803fSAlexander V. Chernikov _DECLARE_DEBUG(LOG_INFO);
830e87bab6SAlexander V. Chernikov 
84427a928aSKonstantin Belousov #ifdef COMPAT_FREEBSD32
85427a928aSKonstantin Belousov #include <sys/mount.h>
86427a928aSKonstantin Belousov #include <compat/freebsd32/freebsd32.h>
87427a928aSKonstantin Belousov 
88427a928aSKonstantin Belousov struct if_msghdr32 {
89427a928aSKonstantin Belousov 	uint16_t ifm_msglen;
90427a928aSKonstantin Belousov 	uint8_t	ifm_version;
91427a928aSKonstantin Belousov 	uint8_t	ifm_type;
92427a928aSKonstantin Belousov 	int32_t	ifm_addrs;
93427a928aSKonstantin Belousov 	int32_t	ifm_flags;
94427a928aSKonstantin Belousov 	uint16_t ifm_index;
95d25f8522SMark Johnston 	uint16_t _ifm_spare1;
96b245f96cSGleb Smirnoff 	struct	if_data ifm_data;
97427a928aSKonstantin Belousov };
986d076ae8SBjoern A. Zeeb 
996d076ae8SBjoern A. Zeeb struct if_msghdrl32 {
1006d076ae8SBjoern A. Zeeb 	uint16_t ifm_msglen;
1016d076ae8SBjoern A. Zeeb 	uint8_t	ifm_version;
1026d076ae8SBjoern A. Zeeb 	uint8_t	ifm_type;
1036d076ae8SBjoern A. Zeeb 	int32_t	ifm_addrs;
1046d076ae8SBjoern A. Zeeb 	int32_t	ifm_flags;
1056d076ae8SBjoern A. Zeeb 	uint16_t ifm_index;
1066d076ae8SBjoern A. Zeeb 	uint16_t _ifm_spare1;
1076d076ae8SBjoern A. Zeeb 	uint16_t ifm_len;
1086d076ae8SBjoern A. Zeeb 	uint16_t ifm_data_off;
109d25f8522SMark Johnston 	uint32_t _ifm_spare2;
110b245f96cSGleb Smirnoff 	struct	if_data ifm_data;
1116d076ae8SBjoern A. Zeeb };
1126d076ae8SBjoern A. Zeeb 
1136d076ae8SBjoern A. Zeeb struct ifa_msghdrl32 {
1146d076ae8SBjoern A. Zeeb 	uint16_t ifam_msglen;
1156d076ae8SBjoern A. Zeeb 	uint8_t	ifam_version;
1166d076ae8SBjoern A. Zeeb 	uint8_t	ifam_type;
1176d076ae8SBjoern A. Zeeb 	int32_t	ifam_addrs;
1186d076ae8SBjoern A. Zeeb 	int32_t	ifam_flags;
1196d076ae8SBjoern A. Zeeb 	uint16_t ifam_index;
1206d076ae8SBjoern A. Zeeb 	uint16_t _ifam_spare1;
1216d076ae8SBjoern A. Zeeb 	uint16_t ifam_len;
1226d076ae8SBjoern A. Zeeb 	uint16_t ifam_data_off;
1236d076ae8SBjoern A. Zeeb 	int32_t	ifam_metric;
124b245f96cSGleb Smirnoff 	struct	if_data ifam_data;
1256d076ae8SBjoern A. Zeeb };
126279e33d4SKonstantin Belousov 
/*
 * Storage size of sockaddr @sa when padded to a multiple of sizeof(int):
 * a zero sa_len yields sizeof(int), otherwise sa_len is rounded up to the
 * next sizeof(int) boundary.  @sa is evaluated more than once.
 */
#define	SA_SIZE32(sa)							\
	((((struct sockaddr *)(sa))->sa_len == 0) ? sizeof(int) :	\
	    1 + ((((struct sockaddr *)(sa))->sa_len - 1) | (sizeof(int) - 1)))
131279e33d4SKonstantin Belousov 
1326d076ae8SBjoern A. Zeeb #endif /* COMPAT_FREEBSD32 */
133427a928aSKonstantin Belousov 
/*
 * Bookkeeping for a caller-provided chunk of memory: where it starts, how
 * much of it is already in use, and how large it is in total.
 */
struct linear_buffer {
	char		*base;		/* start of the allocated memory */
	uint32_t	 offset;	/* offset currently in use */
	uint32_t	 size;		/* total size of the buffer */
};
#define	SCRATCH_BUFFER_SIZE	1024

/*
 * Log through the RT_LOG_<level> macro selected by @_l, prefixing the
 * message with the pid of curproc (0 when curproc is NULL).
 */
#define	RTS_PID_LOG(_l, _fmt, ...)					\
	RT_LOG_##_l(_l, "PID %d: " _fmt,				\
	    curproc ? curproc->p_pid : 0, ## __VA_ARGS__)
142758c9d54SAlexander V. Chernikov 
143a1c995b6SPoul-Henning Kamp MALLOC_DEFINE(M_RTABLE, "routetbl", "routing tables");
144a1c995b6SPoul-Henning Kamp 
145becc44d7SSam Leffler /* NB: these are not modified */
14652041295SPoul-Henning Kamp static struct	sockaddr route_src = { 2, PF_ROUTE, };
147076d0761SJulian Elischer static struct	sockaddr sa_zero   = { sizeof(sa_zero), AF_INET, };
148becc44d7SSam Leffler 
/*
 * External hook for CARP: a function pointer taking an interface address.
 * NOTE(review): presumably filled in by the CARP code when it is present
 * and NULL otherwise -- confirm against netinet/ip_carp.c.
 */
int	(*carp_get_vhid_p)(struct ifaddr *);
15108b68b0eSGleb Smirnoff 
/*
 * Mbuf flag consulted by the rtsock/raw_input callback: when it is set on a
 * message, delivery of the update notification is restricted to sockets
 * bound to the FIB recorded in the mbuf.
 */
#define	RTS_FILTER_FIB	M_PROTO8
157528737fdSBjoern A. Zeeb 
158c5d4eab6SMarko Zec typedef struct {
15918aee723SPeter Pentchev 	int	ip_count;	/* attached w/ AF_INET */
160becc44d7SSam Leffler 	int	ip6_count;	/* attached w/ AF_INET6 */
161becc44d7SSam Leffler 	int	any_count;	/* total attached */
162c5d4eab6SMarko Zec } route_cb_t;
1635f901c92SAndrew Turner VNET_DEFINE_STATIC(route_cb_t, route_cb);
164c5d4eab6SMarko Zec #define	V_route_cb VNET(route_cb)
165df8bae1dSRodney W. Grimes 
166aea8b30fSSam Leffler struct mtx rtsock_mtx;
167aea8b30fSSam Leffler MTX_SYSINIT(rtsock, &rtsock_mtx, "rtsock route_cb lock", MTX_DEF);
168aea8b30fSSam Leffler 
169aea8b30fSSam Leffler #define	RTSOCK_LOCK()	mtx_lock(&rtsock_mtx)
170aea8b30fSSam Leffler #define	RTSOCK_UNLOCK()	mtx_unlock(&rtsock_mtx)
171aea8b30fSSam Leffler #define	RTSOCK_LOCK_ASSERT()	mtx_assert(&rtsock_mtx, MA_OWNED)
172aea8b30fSSam Leffler 
173fedeb08bSAlexander V. Chernikov SYSCTL_NODE(_net, OID_AUTO, route, CTLFLAG_RD | CTLFLAG_MPSAFE, 0, "");
174190a4c94SRobert Watson 
175df8bae1dSRodney W. Grimes struct walkarg {
176d68fb8d9SAlexander V. Chernikov 	int	family;
17752041295SPoul-Henning Kamp 	int	w_tmemsize;
17852041295SPoul-Henning Kamp 	int	w_op, w_arg;
17952041295SPoul-Henning Kamp 	caddr_t	w_tmem;
18052041295SPoul-Henning Kamp 	struct sysctl_req *w_req;
181d68fb8d9SAlexander V. Chernikov 	struct sockaddr *dst;
182d68fb8d9SAlexander V. Chernikov 	struct sockaddr *mask;
183df8bae1dSRodney W. Grimes };
184df8bae1dSRodney W. Grimes 
185d989c7b3SRobert Watson static void	rts_input(struct mbuf *m);
1866db47af4SAlexander V. Chernikov static struct mbuf *rtsock_msg_mbuf(int type, struct rt_addrinfo *rtinfo);
187f2e5eb36SAlexander V. Chernikov static int	rtsock_msg_buffer(int type, struct rt_addrinfo *rtinfo,
188f2e5eb36SAlexander V. Chernikov 			struct walkarg *w, int *plen);
1895dfc91d7SLuigi Rizzo static int	rt_xaddrs(caddr_t cp, caddr_t cplim,
1905dfc91d7SLuigi Rizzo 			struct rt_addrinfo *rtinfo);
191b31fbebeSAlexander V. Chernikov static int	cleanup_xaddrs(struct rt_addrinfo *info, struct linear_buffer *lb);
192d68fb8d9SAlexander V. Chernikov static int	sysctl_dumpentry(struct rtentry *rt, void *vw);
1932259a030SAlexander V. Chernikov static int	sysctl_dumpnhop(struct rtentry *rt, struct nhop_object *nh,
1942259a030SAlexander V. Chernikov 			uint32_t weight, struct walkarg *w);
195929ddbbbSAlfred Perlstein static int	sysctl_iflist(int af, struct walkarg *w);
19605b2efe0SBruce M Simpson static int	sysctl_ifmalist(int af, struct walkarg *w);
19773d76e77SKevin Lo static int	route_output(struct mbuf *m, struct socket *so, ...);
19893bfd365SAlexander V. Chernikov static void	rt_getmetrics(const struct rtentry *rt,
19993bfd365SAlexander V. Chernikov 			const struct nhop_object *nh, struct rt_metrics *out);
2003ca1a2d6SMax Laier static void	rt_dispatch(struct mbuf *, sa_family_t);
201c83dda36SAlexander V. Chernikov static int	handle_rtm_get(struct rt_addrinfo *info, u_int fibnum,
202a287a973SAlexander V. Chernikov 			struct rt_msghdr *rtm, struct rib_cmd_info *rc);
203592d300eSAlexander V. Chernikov static int	update_rtm_from_rc(struct rt_addrinfo *info,
204c83dda36SAlexander V. Chernikov 			struct rt_msghdr **prtm, int alloc_len,
205592d300eSAlexander V. Chernikov 			struct rib_cmd_info *rc, struct nhop_object *nh);
206c83dda36SAlexander V. Chernikov static void	send_rtm_reply(struct socket *so, struct rt_msghdr *rtm,
207c83dda36SAlexander V. Chernikov 			struct mbuf *m, sa_family_t saf, u_int fibnum,
208c83dda36SAlexander V. Chernikov 			int rtm_errno);
209d68fb8d9SAlexander V. Chernikov static bool	can_export_rte(struct ucred *td_ucred, bool rt_is_host,
210d68fb8d9SAlexander V. Chernikov 			const struct sockaddr *rt_dst);
211df8bae1dSRodney W. Grimes 
212d4b5cae4SRobert Watson static struct netisr_handler rtsock_nh = {
213d4b5cae4SRobert Watson 	.nh_name = "rtsock",
214d4b5cae4SRobert Watson 	.nh_handler = rts_input,
215d4b5cae4SRobert Watson 	.nh_proto = NETISR_ROUTE,
216d4b5cae4SRobert Watson 	.nh_policy = NETISR_POLICY_SOURCE,
217d4b5cae4SRobert Watson };
218d4b5cae4SRobert Watson 
219d4b5cae4SRobert Watson static int
220d4b5cae4SRobert Watson sysctl_route_netisr_maxqlen(SYSCTL_HANDLER_ARGS)
221d4b5cae4SRobert Watson {
222d4b5cae4SRobert Watson 	int error, qlimit;
223d4b5cae4SRobert Watson 
224d4b5cae4SRobert Watson 	netisr_getqlimit(&rtsock_nh, &qlimit);
225d4b5cae4SRobert Watson 	error = sysctl_handle_int(oidp, &qlimit, 0, req);
226d4b5cae4SRobert Watson         if (error || !req->newptr)
227d4b5cae4SRobert Watson                 return (error);
228d4b5cae4SRobert Watson 	if (qlimit < 1)
229d4b5cae4SRobert Watson 		return (EINVAL);
230d4b5cae4SRobert Watson 	return (netisr_setqlimit(&rtsock_nh, qlimit));
231d4b5cae4SRobert Watson }
2327029da5cSPawel Biernacki SYSCTL_PROC(_net_route, OID_AUTO, netisr_maxqlen,
2337029da5cSPawel Biernacki     CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE,
234d4b5cae4SRobert Watson     0, 0, sysctl_route_netisr_maxqlen, "I",
235d4b5cae4SRobert Watson     "maximum routing socket dispatch queue length");
236d4b5cae4SRobert Watson 
237d989c7b3SRobert Watson static void
238484149deSBjoern A. Zeeb vnet_rts_init(void)
239d989c7b3SRobert Watson {
240b062951aSRobert Watson 	int tmp;
241d989c7b3SRobert Watson 
242484149deSBjoern A. Zeeb 	if (IS_DEFAULT_VNET(curvnet)) {
243b062951aSRobert Watson 		if (TUNABLE_INT_FETCH("net.route.netisr_maxqlen", &tmp))
244d4b5cae4SRobert Watson 			rtsock_nh.nh_qlimit = tmp;
245d4b5cae4SRobert Watson 		netisr_register(&rtsock_nh);
246d989c7b3SRobert Watson 	}
247484149deSBjoern A. Zeeb #ifdef VIMAGE
248484149deSBjoern A. Zeeb 	 else
249484149deSBjoern A. Zeeb 		netisr_register_vnet(&rtsock_nh);
250484149deSBjoern A. Zeeb #endif
251484149deSBjoern A. Zeeb }
252484149deSBjoern A. Zeeb VNET_SYSINIT(vnet_rtsock, SI_SUB_PROTO_DOMAIN, SI_ORDER_THIRD,
253484149deSBjoern A. Zeeb     vnet_rts_init, 0);
254484149deSBjoern A. Zeeb 
255484149deSBjoern A. Zeeb #ifdef VIMAGE
256484149deSBjoern A. Zeeb static void
257484149deSBjoern A. Zeeb vnet_rts_uninit(void)
258484149deSBjoern A. Zeeb {
259484149deSBjoern A. Zeeb 
260484149deSBjoern A. Zeeb 	netisr_unregister_vnet(&rtsock_nh);
261484149deSBjoern A. Zeeb }
262484149deSBjoern A. Zeeb VNET_SYSUNINIT(vnet_rts_uninit, SI_SUB_PROTO_DOMAIN, SI_ORDER_THIRD,
263484149deSBjoern A. Zeeb     vnet_rts_uninit, 0);
264484149deSBjoern A. Zeeb #endif
265d989c7b3SRobert Watson 
266528737fdSBjoern A. Zeeb static int
267528737fdSBjoern A. Zeeb raw_input_rts_cb(struct mbuf *m, struct sockproto *proto, struct sockaddr *src,
268528737fdSBjoern A. Zeeb     struct rawcb *rp)
269528737fdSBjoern A. Zeeb {
270528737fdSBjoern A. Zeeb 	int fibnum;
271528737fdSBjoern A. Zeeb 
272528737fdSBjoern A. Zeeb 	KASSERT(m != NULL, ("%s: m is NULL", __func__));
273528737fdSBjoern A. Zeeb 	KASSERT(proto != NULL, ("%s: proto is NULL", __func__));
274528737fdSBjoern A. Zeeb 	KASSERT(rp != NULL, ("%s: rp is NULL", __func__));
275528737fdSBjoern A. Zeeb 
276528737fdSBjoern A. Zeeb 	/* No filtering requested. */
277528737fdSBjoern A. Zeeb 	if ((m->m_flags & RTS_FILTER_FIB) == 0)
278528737fdSBjoern A. Zeeb 		return (0);
279528737fdSBjoern A. Zeeb 
280528737fdSBjoern A. Zeeb 	/* Check if it is a rts and the fib matches the one of the socket. */
281528737fdSBjoern A. Zeeb 	fibnum = M_GETFIB(m);
282528737fdSBjoern A. Zeeb 	if (proto->sp_family != PF_ROUTE ||
283528737fdSBjoern A. Zeeb 	    rp->rcb_socket == NULL ||
284528737fdSBjoern A. Zeeb 	    rp->rcb_socket->so_fibnum == fibnum)
285528737fdSBjoern A. Zeeb 		return (0);
286528737fdSBjoern A. Zeeb 
287528737fdSBjoern A. Zeeb 	/* Filtering requested and no match, the socket shall be skipped. */
288528737fdSBjoern A. Zeeb 	return (1);
289528737fdSBjoern A. Zeeb }
290528737fdSBjoern A. Zeeb 
291d989c7b3SRobert Watson static void
292d989c7b3SRobert Watson rts_input(struct mbuf *m)
293d989c7b3SRobert Watson {
294d989c7b3SRobert Watson 	struct sockproto route_proto;
295d989c7b3SRobert Watson 	unsigned short *family;
296d989c7b3SRobert Watson 	struct m_tag *tag;
297d989c7b3SRobert Watson 
298d989c7b3SRobert Watson 	route_proto.sp_family = PF_ROUTE;
299d989c7b3SRobert Watson 	tag = m_tag_find(m, PACKET_TAG_RTSOCKFAM, NULL);
300d989c7b3SRobert Watson 	if (tag != NULL) {
301d989c7b3SRobert Watson 		family = (unsigned short *)(tag + 1);
302d989c7b3SRobert Watson 		route_proto.sp_protocol = *family;
303d989c7b3SRobert Watson 		m_tag_delete(m, tag);
304d989c7b3SRobert Watson 	} else
305d989c7b3SRobert Watson 		route_proto.sp_protocol = 0;
306d989c7b3SRobert Watson 
307528737fdSBjoern A. Zeeb 	raw_input_ext(m, &route_proto, &route_src, raw_input_rts_cb);
308d989c7b3SRobert Watson }
309d989c7b3SRobert Watson 
310a29f300eSGarrett Wollman /*
311a29f300eSGarrett Wollman  * It really doesn't make any sense at all for this code to share much
312a29f300eSGarrett Wollman  * with raw_usrreq.c, since its functionality is so restricted.  XXX
313a29f300eSGarrett Wollman  */
314ac45e92fSRobert Watson static void
315a29f300eSGarrett Wollman rts_abort(struct socket *so)
316df8bae1dSRodney W. Grimes {
3177e994955SRobert Watson 
318ac45e92fSRobert Watson 	raw_usrreqs.pru_abort(so);
319df8bae1dSRodney W. Grimes }
320a29f300eSGarrett Wollman 
321a152f8a3SRobert Watson static void
322a152f8a3SRobert Watson rts_close(struct socket *so)
323a152f8a3SRobert Watson {
324a152f8a3SRobert Watson 
325a152f8a3SRobert Watson 	raw_usrreqs.pru_close(so);
326a152f8a3SRobert Watson }
327a152f8a3SRobert Watson 
328a29f300eSGarrett Wollman /* pru_accept is EOPNOTSUPP */
329a29f300eSGarrett Wollman 
330a29f300eSGarrett Wollman static int
331b40ce416SJulian Elischer rts_attach(struct socket *so, int proto, struct thread *td)
332a29f300eSGarrett Wollman {
333a29f300eSGarrett Wollman 	struct rawcb *rp;
334c9b652e3SAndre Oppermann 	int error;
335a29f300eSGarrett Wollman 
336bc725eafSRobert Watson 	KASSERT(so->so_pcb == NULL, ("rts_attach: so_pcb != NULL"));
337bc725eafSRobert Watson 
3387cc0979fSDavid Malone 	/* XXX */
3391ede983cSDag-Erling Smørgrav 	rp = malloc(sizeof *rp, M_PCB, M_WAITOK | M_ZERO);
340a29f300eSGarrett Wollman 
341a29f300eSGarrett Wollman 	so->so_pcb = (caddr_t)rp;
3428b07e49aSJulian Elischer 	so->so_fibnum = td->td_proc->p_fibnum;
343162c0b2eSRuslan Ermilov 	error = raw_attach(so, proto);
344a29f300eSGarrett Wollman 	rp = sotorawcb(so);
345a29f300eSGarrett Wollman 	if (error) {
3467ba271aeSJonathan Chen 		so->so_pcb = NULL;
347a29f300eSGarrett Wollman 		free(rp, M_PCB);
348a29f300eSGarrett Wollman 		return error;
349a29f300eSGarrett Wollman 	}
350aea8b30fSSam Leffler 	RTSOCK_LOCK();
351a29f300eSGarrett Wollman 	switch(rp->rcb_proto.sp_protocol) {
352a29f300eSGarrett Wollman 	case AF_INET:
353c5d4eab6SMarko Zec 		V_route_cb.ip_count++;
354a29f300eSGarrett Wollman 		break;
355899ce4f4SYoshinobu Inoue 	case AF_INET6:
356c5d4eab6SMarko Zec 		V_route_cb.ip6_count++;
357899ce4f4SYoshinobu Inoue 		break;
358a29f300eSGarrett Wollman 	}
359c5d4eab6SMarko Zec 	V_route_cb.any_count++;
360aea8b30fSSam Leffler 	RTSOCK_UNLOCK();
36103e49181SSeigo Tanimura 	soisconnected(so);
362df8bae1dSRodney W. Grimes 	so->so_options |= SO_USELOOPBACK;
363a29f300eSGarrett Wollman 	return 0;
364df8bae1dSRodney W. Grimes }
365df8bae1dSRodney W. Grimes 
366a29f300eSGarrett Wollman static int
367b40ce416SJulian Elischer rts_bind(struct socket *so, struct sockaddr *nam, struct thread *td)
368a29f300eSGarrett Wollman {
3697e994955SRobert Watson 
3707e994955SRobert Watson 	return (raw_usrreqs.pru_bind(so, nam, td)); /* xxx just EINVAL */
371a29f300eSGarrett Wollman }
372a29f300eSGarrett Wollman 
373a29f300eSGarrett Wollman static int
374b40ce416SJulian Elischer rts_connect(struct socket *so, struct sockaddr *nam, struct thread *td)
375a29f300eSGarrett Wollman {
3767e994955SRobert Watson 
3777e994955SRobert Watson 	return (raw_usrreqs.pru_connect(so, nam, td)); /* XXX just EINVAL */
378a29f300eSGarrett Wollman }
379a29f300eSGarrett Wollman 
380a29f300eSGarrett Wollman /* pru_connect2 is EOPNOTSUPP */
381a29f300eSGarrett Wollman /* pru_control is EOPNOTSUPP */
382a29f300eSGarrett Wollman 
383bc725eafSRobert Watson static void
384a29f300eSGarrett Wollman rts_detach(struct socket *so)
385a29f300eSGarrett Wollman {
386a29f300eSGarrett Wollman 	struct rawcb *rp = sotorawcb(so);
387a29f300eSGarrett Wollman 
388bc725eafSRobert Watson 	KASSERT(rp != NULL, ("rts_detach: rp == NULL"));
389bc725eafSRobert Watson 
390aea8b30fSSam Leffler 	RTSOCK_LOCK();
391a29f300eSGarrett Wollman 	switch(rp->rcb_proto.sp_protocol) {
392a29f300eSGarrett Wollman 	case AF_INET:
393c5d4eab6SMarko Zec 		V_route_cb.ip_count--;
394a29f300eSGarrett Wollman 		break;
395899ce4f4SYoshinobu Inoue 	case AF_INET6:
396c5d4eab6SMarko Zec 		V_route_cb.ip6_count--;
397899ce4f4SYoshinobu Inoue 		break;
398a29f300eSGarrett Wollman 	}
399c5d4eab6SMarko Zec 	V_route_cb.any_count--;
400aea8b30fSSam Leffler 	RTSOCK_UNLOCK();
401bc725eafSRobert Watson 	raw_usrreqs.pru_detach(so);
402a29f300eSGarrett Wollman }
403a29f300eSGarrett Wollman 
404a29f300eSGarrett Wollman static int
405a29f300eSGarrett Wollman rts_disconnect(struct socket *so)
406a29f300eSGarrett Wollman {
4077e994955SRobert Watson 
4087e994955SRobert Watson 	return (raw_usrreqs.pru_disconnect(so));
409a29f300eSGarrett Wollman }
410a29f300eSGarrett Wollman 
411a29f300eSGarrett Wollman /* pru_listen is EOPNOTSUPP */
412a29f300eSGarrett Wollman 
413a29f300eSGarrett Wollman static int
41457bf258eSGarrett Wollman rts_peeraddr(struct socket *so, struct sockaddr **nam)
415a29f300eSGarrett Wollman {
4167e994955SRobert Watson 
4177e994955SRobert Watson 	return (raw_usrreqs.pru_peeraddr(so, nam));
418a29f300eSGarrett Wollman }
419a29f300eSGarrett Wollman 
420a29f300eSGarrett Wollman /* pru_rcvd is EOPNOTSUPP */
421a29f300eSGarrett Wollman /* pru_rcvoob is EOPNOTSUPP */
422a29f300eSGarrett Wollman 
423a29f300eSGarrett Wollman static int
42457bf258eSGarrett Wollman rts_send(struct socket *so, int flags, struct mbuf *m, struct sockaddr *nam,
425b40ce416SJulian Elischer 	 struct mbuf *control, struct thread *td)
426a29f300eSGarrett Wollman {
4277e994955SRobert Watson 
4287e994955SRobert Watson 	return (raw_usrreqs.pru_send(so, flags, m, nam, control, td));
429a29f300eSGarrett Wollman }
430a29f300eSGarrett Wollman 
431a29f300eSGarrett Wollman /* pru_sense is null */
432a29f300eSGarrett Wollman 
433a29f300eSGarrett Wollman static int
434a29f300eSGarrett Wollman rts_shutdown(struct socket *so)
435a29f300eSGarrett Wollman {
4367e994955SRobert Watson 
4377e994955SRobert Watson 	return (raw_usrreqs.pru_shutdown(so));
438a29f300eSGarrett Wollman }
439a29f300eSGarrett Wollman 
440a29f300eSGarrett Wollman static int
44157bf258eSGarrett Wollman rts_sockaddr(struct socket *so, struct sockaddr **nam)
442a29f300eSGarrett Wollman {
4437e994955SRobert Watson 
4447e994955SRobert Watson 	return (raw_usrreqs.pru_sockaddr(so, nam));
445a29f300eSGarrett Wollman }
446a29f300eSGarrett Wollman 
447a29f300eSGarrett Wollman static struct pr_usrreqs route_usrreqs = {
448756d52a1SPoul-Henning Kamp 	.pru_abort =		rts_abort,
449756d52a1SPoul-Henning Kamp 	.pru_attach =		rts_attach,
450756d52a1SPoul-Henning Kamp 	.pru_bind =		rts_bind,
451756d52a1SPoul-Henning Kamp 	.pru_connect =		rts_connect,
452756d52a1SPoul-Henning Kamp 	.pru_detach =		rts_detach,
453756d52a1SPoul-Henning Kamp 	.pru_disconnect =	rts_disconnect,
454756d52a1SPoul-Henning Kamp 	.pru_peeraddr =		rts_peeraddr,
455756d52a1SPoul-Henning Kamp 	.pru_send =		rts_send,
456756d52a1SPoul-Henning Kamp 	.pru_shutdown =		rts_shutdown,
457756d52a1SPoul-Henning Kamp 	.pru_sockaddr =		rts_sockaddr,
458a152f8a3SRobert Watson 	.pru_close =		rts_close,
459a29f300eSGarrett Wollman };
460a29f300eSGarrett Wollman 
461413628a7SBjoern A. Zeeb #ifndef _SOCKADDR_UNION_DEFINED
462413628a7SBjoern A. Zeeb #define	_SOCKADDR_UNION_DEFINED
/*
 * Storage able to hold any of the address formats handled here: the
 * generic sockaddr, an IPv4 sockaddr_in or an IPv6 sockaddr_in6.
 */
union sockaddr_union {
	struct sockaddr		sa;	/* generic view */
	struct sockaddr_in	sin;	/* AF_INET */
	struct sockaddr_in6	sin6;	/* AF_INET6 */
};
471413628a7SBjoern A. Zeeb #endif /* _SOCKADDR_UNION_DEFINED */
472413628a7SBjoern A. Zeeb 
473413628a7SBjoern A. Zeeb static int
474413628a7SBjoern A. Zeeb rtm_get_jailed(struct rt_addrinfo *info, struct ifnet *ifp,
475aaad3c4fSAlexander V. Chernikov     struct nhop_object *nh, union sockaddr_union *saun, struct ucred *cred)
476413628a7SBjoern A. Zeeb {
477a68cc388SGleb Smirnoff #if defined(INET) || defined(INET6)
478a68cc388SGleb Smirnoff 	struct epoch_tracker et;
479a68cc388SGleb Smirnoff #endif
480413628a7SBjoern A. Zeeb 
4819c79d243SJamie Gritton 	/* First, see if the returned address is part of the jail. */
482aaad3c4fSAlexander V. Chernikov 	if (prison_if(cred, nh->nh_ifa->ifa_addr) == 0) {
483aaad3c4fSAlexander V. Chernikov 		info->rti_info[RTAX_IFA] = nh->nh_ifa->ifa_addr;
4849c79d243SJamie Gritton 		return (0);
4859c79d243SJamie Gritton 	}
4869c79d243SJamie Gritton 
487413628a7SBjoern A. Zeeb 	switch (info->rti_info[RTAX_DST]->sa_family) {
488413628a7SBjoern A. Zeeb #ifdef INET
489413628a7SBjoern A. Zeeb 	case AF_INET:
490413628a7SBjoern A. Zeeb 	{
491413628a7SBjoern A. Zeeb 		struct in_addr ia;
492413628a7SBjoern A. Zeeb 		struct ifaddr *ifa;
493413628a7SBjoern A. Zeeb 		int found;
494413628a7SBjoern A. Zeeb 
495413628a7SBjoern A. Zeeb 		found = 0;
496413628a7SBjoern A. Zeeb 		/*
4979c79d243SJamie Gritton 		 * Try to find an address on the given outgoing interface
4989c79d243SJamie Gritton 		 * that belongs to the jail.
499413628a7SBjoern A. Zeeb 		 */
500a68cc388SGleb Smirnoff 		NET_EPOCH_ENTER(et);
501d7c5a620SMatt Macy 		CK_STAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) {
502413628a7SBjoern A. Zeeb 			struct sockaddr *sa;
503413628a7SBjoern A. Zeeb 			sa = ifa->ifa_addr;
504413628a7SBjoern A. Zeeb 			if (sa->sa_family != AF_INET)
505413628a7SBjoern A. Zeeb 				continue;
506413628a7SBjoern A. Zeeb 			ia = ((struct sockaddr_in *)sa)->sin_addr;
507b89e82ddSJamie Gritton 			if (prison_check_ip4(cred, &ia) == 0) {
508413628a7SBjoern A. Zeeb 				found = 1;
509413628a7SBjoern A. Zeeb 				break;
510413628a7SBjoern A. Zeeb 			}
511413628a7SBjoern A. Zeeb 		}
512a68cc388SGleb Smirnoff 		NET_EPOCH_EXIT(et);
513413628a7SBjoern A. Zeeb 		if (!found) {
514413628a7SBjoern A. Zeeb 			/*
5159c79d243SJamie Gritton 			 * As a last resort return the 'default' jail address.
516413628a7SBjoern A. Zeeb 			 */
517aaad3c4fSAlexander V. Chernikov 			ia = ((struct sockaddr_in *)nh->nh_ifa->ifa_addr)->
5180304c731SJamie Gritton 			    sin_addr;
5191cecba0fSBjoern A. Zeeb 			if (prison_get_ip4(cred, &ia) != 0)
520413628a7SBjoern A. Zeeb 				return (ESRCH);
521413628a7SBjoern A. Zeeb 		}
522413628a7SBjoern A. Zeeb 		bzero(&saun->sin, sizeof(struct sockaddr_in));
523413628a7SBjoern A. Zeeb 		saun->sin.sin_len = sizeof(struct sockaddr_in);
524413628a7SBjoern A. Zeeb 		saun->sin.sin_family = AF_INET;
525413628a7SBjoern A. Zeeb 		saun->sin.sin_addr.s_addr = ia.s_addr;
5269c79d243SJamie Gritton 		info->rti_info[RTAX_IFA] = (struct sockaddr *)&saun->sin;
527413628a7SBjoern A. Zeeb 		break;
528413628a7SBjoern A. Zeeb 	}
529413628a7SBjoern A. Zeeb #endif
530413628a7SBjoern A. Zeeb #ifdef INET6
531413628a7SBjoern A. Zeeb 	case AF_INET6:
532413628a7SBjoern A. Zeeb 	{
533413628a7SBjoern A. Zeeb 		struct in6_addr ia6;
534413628a7SBjoern A. Zeeb 		struct ifaddr *ifa;
535413628a7SBjoern A. Zeeb 		int found;
536413628a7SBjoern A. Zeeb 
537413628a7SBjoern A. Zeeb 		found = 0;
538413628a7SBjoern A. Zeeb 		/*
5399c79d243SJamie Gritton 		 * Try to find an address on the given outgoing interface
5409c79d243SJamie Gritton 		 * that belongs to the jail.
541413628a7SBjoern A. Zeeb 		 */
542a68cc388SGleb Smirnoff 		NET_EPOCH_ENTER(et);
543d7c5a620SMatt Macy 		CK_STAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) {
544413628a7SBjoern A. Zeeb 			struct sockaddr *sa;
545413628a7SBjoern A. Zeeb 			sa = ifa->ifa_addr;
546413628a7SBjoern A. Zeeb 			if (sa->sa_family != AF_INET6)
547413628a7SBjoern A. Zeeb 				continue;
548413628a7SBjoern A. Zeeb 			bcopy(&((struct sockaddr_in6 *)sa)->sin6_addr,
549413628a7SBjoern A. Zeeb 			    &ia6, sizeof(struct in6_addr));
550b89e82ddSJamie Gritton 			if (prison_check_ip6(cred, &ia6) == 0) {
551413628a7SBjoern A. Zeeb 				found = 1;
552413628a7SBjoern A. Zeeb 				break;
553413628a7SBjoern A. Zeeb 			}
554413628a7SBjoern A. Zeeb 		}
555a68cc388SGleb Smirnoff 		NET_EPOCH_EXIT(et);
556413628a7SBjoern A. Zeeb 		if (!found) {
557413628a7SBjoern A. Zeeb 			/*
5589c79d243SJamie Gritton 			 * As a last resort return the 'default' jail address.
559413628a7SBjoern A. Zeeb 			 */
560aaad3c4fSAlexander V. Chernikov 			ia6 = ((struct sockaddr_in6 *)nh->nh_ifa->ifa_addr)->
5610304c731SJamie Gritton 			    sin6_addr;
5621cecba0fSBjoern A. Zeeb 			if (prison_get_ip6(cred, &ia6) != 0)
563413628a7SBjoern A. Zeeb 				return (ESRCH);
564413628a7SBjoern A. Zeeb 		}
565413628a7SBjoern A. Zeeb 		bzero(&saun->sin6, sizeof(struct sockaddr_in6));
566413628a7SBjoern A. Zeeb 		saun->sin6.sin6_len = sizeof(struct sockaddr_in6);
567413628a7SBjoern A. Zeeb 		saun->sin6.sin6_family = AF_INET6;
5689c79d243SJamie Gritton 		bcopy(&ia6, &saun->sin6.sin6_addr, sizeof(struct in6_addr));
569413628a7SBjoern A. Zeeb 		if (sa6_recoverscope(&saun->sin6) != 0)
570413628a7SBjoern A. Zeeb 			return (ESRCH);
5719c79d243SJamie Gritton 		info->rti_info[RTAX_IFA] = (struct sockaddr *)&saun->sin6;
572413628a7SBjoern A. Zeeb 		break;
573413628a7SBjoern A. Zeeb 	}
574413628a7SBjoern A. Zeeb #endif
575413628a7SBjoern A. Zeeb 	default:
576413628a7SBjoern A. Zeeb 		return (ESRCH);
577413628a7SBjoern A. Zeeb 	}
578413628a7SBjoern A. Zeeb 	return (0);
579413628a7SBjoern A. Zeeb }
580413628a7SBjoern A. Zeeb 
581145bf6c0SAlexander V. Chernikov static int
582145bf6c0SAlexander V. Chernikov fill_blackholeinfo(struct rt_addrinfo *info, union sockaddr_union *saun)
583145bf6c0SAlexander V. Chernikov {
584145bf6c0SAlexander V. Chernikov 	struct ifaddr *ifa;
585145bf6c0SAlexander V. Chernikov 	sa_family_t saf;
586145bf6c0SAlexander V. Chernikov 
587145bf6c0SAlexander V. Chernikov 	if (V_loif == NULL) {
5886fa8ed43SAlexander V. Chernikov 		RTS_PID_LOG(LOG_INFO, "Unable to add blackhole/reject nhop without loopback");
589145bf6c0SAlexander V. Chernikov 		return (ENOTSUP);
590145bf6c0SAlexander V. Chernikov 	}
591145bf6c0SAlexander V. Chernikov 	info->rti_ifp = V_loif;
592145bf6c0SAlexander V. Chernikov 
593145bf6c0SAlexander V. Chernikov 	saf = info->rti_info[RTAX_DST]->sa_family;
594145bf6c0SAlexander V. Chernikov 
595145bf6c0SAlexander V. Chernikov 	CK_STAILQ_FOREACH(ifa, &info->rti_ifp->if_addrhead, ifa_link) {
596145bf6c0SAlexander V. Chernikov 		if (ifa->ifa_addr->sa_family == saf) {
597145bf6c0SAlexander V. Chernikov 			info->rti_ifa = ifa;
598145bf6c0SAlexander V. Chernikov 			break;
599145bf6c0SAlexander V. Chernikov 		}
600145bf6c0SAlexander V. Chernikov 	}
6016fa8ed43SAlexander V. Chernikov 	if (info->rti_ifa == NULL) {
6026fa8ed43SAlexander V. Chernikov 		RTS_PID_LOG(LOG_INFO, "Unable to find ifa for blackhole/reject nhop");
603145bf6c0SAlexander V. Chernikov 		return (ENOTSUP);
6046fa8ed43SAlexander V. Chernikov 	}
605145bf6c0SAlexander V. Chernikov 
606145bf6c0SAlexander V. Chernikov 	bzero(saun, sizeof(union sockaddr_union));
607145bf6c0SAlexander V. Chernikov 	switch (saf) {
6088ca99aecSAlexander V. Chernikov #ifdef INET
609145bf6c0SAlexander V. Chernikov 	case AF_INET:
610145bf6c0SAlexander V. Chernikov 		saun->sin.sin_family = AF_INET;
611145bf6c0SAlexander V. Chernikov 		saun->sin.sin_len = sizeof(struct sockaddr_in);
612145bf6c0SAlexander V. Chernikov 		saun->sin.sin_addr.s_addr = htonl(INADDR_LOOPBACK);
613145bf6c0SAlexander V. Chernikov 		break;
6148ca99aecSAlexander V. Chernikov #endif
6158ca99aecSAlexander V. Chernikov #ifdef INET6
616145bf6c0SAlexander V. Chernikov 	case AF_INET6:
617145bf6c0SAlexander V. Chernikov 		saun->sin6.sin6_family = AF_INET6;
618145bf6c0SAlexander V. Chernikov 		saun->sin6.sin6_len = sizeof(struct sockaddr_in6);
619145bf6c0SAlexander V. Chernikov 		saun->sin6.sin6_addr = in6addr_loopback;
620145bf6c0SAlexander V. Chernikov 		break;
6218ca99aecSAlexander V. Chernikov #endif
622145bf6c0SAlexander V. Chernikov 	default:
6236fa8ed43SAlexander V. Chernikov 		RTS_PID_LOG(LOG_INFO, "unsupported family: %d", saf);
624145bf6c0SAlexander V. Chernikov 		return (ENOTSUP);
625145bf6c0SAlexander V. Chernikov 	}
626145bf6c0SAlexander V. Chernikov 	info->rti_info[RTAX_GATEWAY] = &saun->sa;
627145bf6c0SAlexander V. Chernikov 	info->rti_flags |= RTF_GATEWAY;
628145bf6c0SAlexander V. Chernikov 
629145bf6c0SAlexander V. Chernikov 	return (0);
630145bf6c0SAlexander V. Chernikov }
631145bf6c0SAlexander V. Chernikov 
632c83dda36SAlexander V. Chernikov /*
633c83dda36SAlexander V. Chernikov  * Fills in @info based on userland-provided @rtm message.
634c83dda36SAlexander V. Chernikov  *
635c83dda36SAlexander V. Chernikov  * Returns 0 on success.
636c83dda36SAlexander V. Chernikov  */
637c83dda36SAlexander V. Chernikov static int
638b31fbebeSAlexander V. Chernikov fill_addrinfo(struct rt_msghdr *rtm, int len, struct linear_buffer *lb, u_int fibnum,
639b31fbebeSAlexander V. Chernikov     struct rt_addrinfo *info)
640c83dda36SAlexander V. Chernikov {
641c83dda36SAlexander V. Chernikov 	int error;
642c83dda36SAlexander V. Chernikov 
643c83dda36SAlexander V. Chernikov 	rtm->rtm_pid = curproc->p_pid;
644c83dda36SAlexander V. Chernikov 	info->rti_addrs = rtm->rtm_addrs;
645c83dda36SAlexander V. Chernikov 
646c83dda36SAlexander V. Chernikov 	info->rti_mflags = rtm->rtm_inits;
647c83dda36SAlexander V. Chernikov 	info->rti_rmx = &rtm->rtm_rmx;
648c83dda36SAlexander V. Chernikov 
649c83dda36SAlexander V. Chernikov 	/*
650c83dda36SAlexander V. Chernikov 	 * rt_xaddrs() performs s6_addr[2] := sin6_scope_id for AF_INET6
651c83dda36SAlexander V. Chernikov 	 * link-local address because rtrequest requires addresses with
652c83dda36SAlexander V. Chernikov 	 * embedded scope id.
653c83dda36SAlexander V. Chernikov 	 */
654c83dda36SAlexander V. Chernikov 	if (rt_xaddrs((caddr_t)(rtm + 1), len + (caddr_t)rtm, info))
655c83dda36SAlexander V. Chernikov 		return (EINVAL);
656c83dda36SAlexander V. Chernikov 
657c83dda36SAlexander V. Chernikov 	info->rti_flags = rtm->rtm_flags;
658b31fbebeSAlexander V. Chernikov 	error = cleanup_xaddrs(info, lb);
6592fe5a794SAlexander V. Chernikov 	if (error != 0)
6602fe5a794SAlexander V. Chernikov 		return (error);
661c83dda36SAlexander V. Chernikov 	/*
662c83dda36SAlexander V. Chernikov 	 * Verify that the caller has the appropriate privilege; RTM_GET
663c83dda36SAlexander V. Chernikov 	 * is the only operation the non-superuser is allowed.
664c83dda36SAlexander V. Chernikov 	 */
665c83dda36SAlexander V. Chernikov 	if (rtm->rtm_type != RTM_GET) {
666c83dda36SAlexander V. Chernikov 		error = priv_check(curthread, PRIV_NET_ROUTE);
667c83dda36SAlexander V. Chernikov 		if (error != 0)
668c83dda36SAlexander V. Chernikov 			return (error);
669c83dda36SAlexander V. Chernikov 	}
670c83dda36SAlexander V. Chernikov 
671c83dda36SAlexander V. Chernikov 	/*
672c83dda36SAlexander V. Chernikov 	 * The given gateway address may be an interface address.
673c83dda36SAlexander V. Chernikov 	 * For example, issuing a "route change" command on a route
674c83dda36SAlexander V. Chernikov 	 * entry that was created from a tunnel, and the gateway
675c83dda36SAlexander V. Chernikov 	 * address given is the local end point. In this case the
676c83dda36SAlexander V. Chernikov 	 * RTF_GATEWAY flag must be cleared or the destination will
677c83dda36SAlexander V. Chernikov 	 * not be reachable even though there is no error message.
678c83dda36SAlexander V. Chernikov 	 */
679c83dda36SAlexander V. Chernikov 	if (info->rti_info[RTAX_GATEWAY] != NULL &&
680c83dda36SAlexander V. Chernikov 	    info->rti_info[RTAX_GATEWAY]->sa_family != AF_LINK) {
681c83dda36SAlexander V. Chernikov 		struct rt_addrinfo ginfo;
682c83dda36SAlexander V. Chernikov 		struct sockaddr *gdst;
683c83dda36SAlexander V. Chernikov 		struct sockaddr_storage ss;
684c83dda36SAlexander V. Chernikov 
685c83dda36SAlexander V. Chernikov 		bzero(&ginfo, sizeof(ginfo));
686c83dda36SAlexander V. Chernikov 		bzero(&ss, sizeof(ss));
687c83dda36SAlexander V. Chernikov 		ss.ss_len = sizeof(ss);
688c83dda36SAlexander V. Chernikov 
689c83dda36SAlexander V. Chernikov 		ginfo.rti_info[RTAX_GATEWAY] = (struct sockaddr *)&ss;
690c83dda36SAlexander V. Chernikov 		gdst = info->rti_info[RTAX_GATEWAY];
691c83dda36SAlexander V. Chernikov 
692c83dda36SAlexander V. Chernikov 		/*
693c83dda36SAlexander V. Chernikov 		 * A host route through the loopback interface is
694c83dda36SAlexander V. Chernikov 		 * installed for each interface adddress. In pre 8.0
695c83dda36SAlexander V. Chernikov 		 * releases the interface address of a PPP link type
696c83dda36SAlexander V. Chernikov 		 * is not reachable locally. This behavior is fixed as
697c83dda36SAlexander V. Chernikov 		 * part of the new L2/L3 redesign and rewrite work. The
698c83dda36SAlexander V. Chernikov 		 * signature of this interface address route is the
699aaad3c4fSAlexander V. Chernikov 		 * AF_LINK sa_family type of the gateway, and the
700c83dda36SAlexander V. Chernikov 		 * rt_ifp has the IFF_LOOPBACK flag set.
701c83dda36SAlexander V. Chernikov 		 */
702c83dda36SAlexander V. Chernikov 		if (rib_lookup_info(fibnum, gdst, NHR_REF, 0, &ginfo) == 0) {
703c83dda36SAlexander V. Chernikov 			if (ss.ss_family == AF_LINK &&
704c83dda36SAlexander V. Chernikov 			    ginfo.rti_ifp->if_flags & IFF_LOOPBACK) {
705c83dda36SAlexander V. Chernikov 				info->rti_flags &= ~RTF_GATEWAY;
706c83dda36SAlexander V. Chernikov 				info->rti_flags |= RTF_GWFLAG_COMPAT;
707c83dda36SAlexander V. Chernikov 			}
708c83dda36SAlexander V. Chernikov 			rib_free_info(&ginfo);
709c83dda36SAlexander V. Chernikov 		}
710c83dda36SAlexander V. Chernikov 	}
711c83dda36SAlexander V. Chernikov 
712c83dda36SAlexander V. Chernikov 	return (0);
713c83dda36SAlexander V. Chernikov }
714c83dda36SAlexander V. Chernikov 
715fedeb08bSAlexander V. Chernikov static struct nhop_object *
716fedeb08bSAlexander V. Chernikov select_nhop(struct nhop_object *nh, const struct sockaddr *gw)
717fedeb08bSAlexander V. Chernikov {
718fedeb08bSAlexander V. Chernikov 	if (!NH_IS_NHGRP(nh))
719fedeb08bSAlexander V. Chernikov 		return (nh);
720fedeb08bSAlexander V. Chernikov #ifdef ROUTE_MPATH
721fedeb08bSAlexander V. Chernikov 	struct weightened_nhop *wn;
722fedeb08bSAlexander V. Chernikov 	uint32_t num_nhops;
723fedeb08bSAlexander V. Chernikov 	wn = nhgrp_get_nhops((struct nhgrp_object *)nh, &num_nhops);
724fedeb08bSAlexander V. Chernikov 	if (gw == NULL)
725fedeb08bSAlexander V. Chernikov 		return (wn[0].nh);
726fedeb08bSAlexander V. Chernikov 	for (int i = 0; i < num_nhops; i++) {
727fedeb08bSAlexander V. Chernikov 		if (match_nhop_gw(wn[i].nh, gw))
728fedeb08bSAlexander V. Chernikov 			return (wn[i].nh);
729fedeb08bSAlexander V. Chernikov 	}
730fedeb08bSAlexander V. Chernikov #endif
731fedeb08bSAlexander V. Chernikov 	return (NULL);
732fedeb08bSAlexander V. Chernikov }
733fedeb08bSAlexander V. Chernikov 
734c83dda36SAlexander V. Chernikov /*
735c83dda36SAlexander V. Chernikov  * Handles RTM_GET message from routing socket, returning matching rt.
736c83dda36SAlexander V. Chernikov  *
737c83dda36SAlexander V. Chernikov  * Returns:
738c83dda36SAlexander V. Chernikov  * 0 on success, with locked and referenced matching rt in @rt_nrt
739c83dda36SAlexander V. Chernikov  * errno of failure
740c83dda36SAlexander V. Chernikov  */
741c83dda36SAlexander V. Chernikov static int
742c83dda36SAlexander V. Chernikov handle_rtm_get(struct rt_addrinfo *info, u_int fibnum,
743a287a973SAlexander V. Chernikov     struct rt_msghdr *rtm, struct rib_cmd_info *rc)
744c83dda36SAlexander V. Chernikov {
745c83dda36SAlexander V. Chernikov 	RIB_RLOCK_TRACKER;
746c83dda36SAlexander V. Chernikov 	struct rib_head *rnh;
747fedeb08bSAlexander V. Chernikov 	struct nhop_object *nh;
748c83dda36SAlexander V. Chernikov 	sa_family_t saf;
749c83dda36SAlexander V. Chernikov 
750c83dda36SAlexander V. Chernikov 	saf = info->rti_info[RTAX_DST]->sa_family;
751c83dda36SAlexander V. Chernikov 
752c83dda36SAlexander V. Chernikov 	rnh = rt_tables_get_rnh(fibnum, saf);
753c83dda36SAlexander V. Chernikov 	if (rnh == NULL)
754c83dda36SAlexander V. Chernikov 		return (EAFNOSUPPORT);
755c83dda36SAlexander V. Chernikov 
756c83dda36SAlexander V. Chernikov 	RIB_RLOCK(rnh);
757c83dda36SAlexander V. Chernikov 
7582fe5a794SAlexander V. Chernikov 	/*
7592fe5a794SAlexander V. Chernikov 	 * By (implicit) convention host route (one without netmask)
7602fe5a794SAlexander V. Chernikov 	 * means longest-prefix-match request and the route with netmask
7612fe5a794SAlexander V. Chernikov 	 * means exact-match lookup.
7622fe5a794SAlexander V. Chernikov 	 * As cleanup_xaddrs() cleans up info flags&addrs for the /32,/128
7632fe5a794SAlexander V. Chernikov 	 * prefixes, use original data to check for the netmask presence.
7642fe5a794SAlexander V. Chernikov 	 */
7652fe5a794SAlexander V. Chernikov 	if ((rtm->rtm_addrs & RTA_NETMASK) == 0) {
766c83dda36SAlexander V. Chernikov 		/*
767c83dda36SAlexander V. Chernikov 		 * Provide longest prefix match for
768c83dda36SAlexander V. Chernikov 		 * address lookup (no mask).
769c83dda36SAlexander V. Chernikov 		 * 'route -n get addr'
770c83dda36SAlexander V. Chernikov 		 */
771a287a973SAlexander V. Chernikov 		rc->rc_rt = (struct rtentry *) rnh->rnh_matchaddr(
772c83dda36SAlexander V. Chernikov 		    info->rti_info[RTAX_DST], &rnh->head);
773c83dda36SAlexander V. Chernikov 	} else
774a287a973SAlexander V. Chernikov 		rc->rc_rt = (struct rtentry *) rnh->rnh_lookup(
775c83dda36SAlexander V. Chernikov 		    info->rti_info[RTAX_DST],
776c83dda36SAlexander V. Chernikov 		    info->rti_info[RTAX_NETMASK], &rnh->head);
777c83dda36SAlexander V. Chernikov 
778a287a973SAlexander V. Chernikov 	if (rc->rc_rt == NULL) {
779c83dda36SAlexander V. Chernikov 		RIB_RUNLOCK(rnh);
780c83dda36SAlexander V. Chernikov 		return (ESRCH);
781c83dda36SAlexander V. Chernikov 	}
782fedeb08bSAlexander V. Chernikov 
783d68fb8d9SAlexander V. Chernikov 	nh = select_nhop(rt_get_raw_nhop(rc->rc_rt), info->rti_info[RTAX_GATEWAY]);
784fedeb08bSAlexander V. Chernikov 	if (nh == NULL) {
785c83dda36SAlexander V. Chernikov 		RIB_RUNLOCK(rnh);
786c83dda36SAlexander V. Chernikov 		return (ESRCH);
787c83dda36SAlexander V. Chernikov 	}
788c83dda36SAlexander V. Chernikov 	/*
789c83dda36SAlexander V. Chernikov 	 * If performing proxied L2 entry insertion, and
790c83dda36SAlexander V. Chernikov 	 * the actual PPP host entry is found, perform
791c83dda36SAlexander V. Chernikov 	 * another search to retrieve the prefix route of
792c83dda36SAlexander V. Chernikov 	 * the local end point of the PPP link.
793aaad3c4fSAlexander V. Chernikov 	 * TODO: move this logic to userland.
794c83dda36SAlexander V. Chernikov 	 */
795c83dda36SAlexander V. Chernikov 	if (rtm->rtm_flags & RTF_ANNOUNCE) {
7969573cc35SKurosawa Takahiro 		struct sockaddr_storage laddr;
797c83dda36SAlexander V. Chernikov 
798aaad3c4fSAlexander V. Chernikov 		if (nh->nh_ifp != NULL &&
799aaad3c4fSAlexander V. Chernikov 		    nh->nh_ifp->if_type == IFT_PROPVIRTUAL) {
800c83dda36SAlexander V. Chernikov 			struct ifaddr *ifa;
801c83dda36SAlexander V. Chernikov 
802c83dda36SAlexander V. Chernikov 			ifa = ifa_ifwithnet(info->rti_info[RTAX_DST], 1,
803c83dda36SAlexander V. Chernikov 					RT_ALL_FIBS);
804c83dda36SAlexander V. Chernikov 			if (ifa != NULL)
805c83dda36SAlexander V. Chernikov 				rt_maskedcopy(ifa->ifa_addr,
8069573cc35SKurosawa Takahiro 					      (struct sockaddr *)&laddr,
807c83dda36SAlexander V. Chernikov 					      ifa->ifa_netmask);
808c83dda36SAlexander V. Chernikov 		} else
809aaad3c4fSAlexander V. Chernikov 			rt_maskedcopy(nh->nh_ifa->ifa_addr,
8109573cc35SKurosawa Takahiro 				      (struct sockaddr *)&laddr,
811aaad3c4fSAlexander V. Chernikov 				      nh->nh_ifa->ifa_netmask);
812c83dda36SAlexander V. Chernikov 		/*
813c83dda36SAlexander V. Chernikov 		 * refactor rt and no lock operation necessary
814c83dda36SAlexander V. Chernikov 		 */
8159573cc35SKurosawa Takahiro 		rc->rc_rt = (struct rtentry *)rnh->rnh_matchaddr(
8169573cc35SKurosawa Takahiro 		    (struct sockaddr *)&laddr, &rnh->head);
817a287a973SAlexander V. Chernikov 		if (rc->rc_rt == NULL) {
818c83dda36SAlexander V. Chernikov 			RIB_RUNLOCK(rnh);
819c83dda36SAlexander V. Chernikov 			return (ESRCH);
820c83dda36SAlexander V. Chernikov 		}
821d68fb8d9SAlexander V. Chernikov 		nh = select_nhop(rt_get_raw_nhop(rc->rc_rt), info->rti_info[RTAX_GATEWAY]);
822fedeb08bSAlexander V. Chernikov 		if (nh == NULL) {
823fedeb08bSAlexander V. Chernikov 			RIB_RUNLOCK(rnh);
824fedeb08bSAlexander V. Chernikov 			return (ESRCH);
825c83dda36SAlexander V. Chernikov 		}
826fedeb08bSAlexander V. Chernikov 	}
827fedeb08bSAlexander V. Chernikov 	rc->rc_nh_new = nh;
8282259a030SAlexander V. Chernikov 	rc->rc_nh_weight = rc->rc_rt->rt_weight;
829c83dda36SAlexander V. Chernikov 	RIB_RUNLOCK(rnh);
830c83dda36SAlexander V. Chernikov 
831c83dda36SAlexander V. Chernikov 	return (0);
832c83dda36SAlexander V. Chernikov }
833c83dda36SAlexander V. Chernikov 
/*
 * Zeroes @dst and @mask and stamps both with the length and family of
 * the sockaddr type that corresponds to @family (sockaddr_in for
 * AF_INET, sockaddr_in6 for AF_INET6).  Any other family leaves both
 * buffers untouched.
 */
static void
init_sockaddrs_family(int family, struct sockaddr *dst, struct sockaddr *mask)
{
	switch (family) {
#ifdef INET
	case AF_INET: {
		struct sockaddr_in *sin_dst = (struct sockaddr_in *)dst;
		struct sockaddr_in *sin_mask = (struct sockaddr_in *)mask;

		bzero(sin_dst, sizeof(*sin_dst));
		bzero(sin_mask, sizeof(*sin_mask));

		sin_dst->sin_family = AF_INET;
		sin_dst->sin_len = sizeof(*sin_dst);
		sin_mask->sin_family = AF_INET;
		sin_mask->sin_len = sizeof(*sin_mask);
		break;
	}
#endif
#ifdef INET6
	case AF_INET6: {
		struct sockaddr_in6 *sin6_dst = (struct sockaddr_in6 *)dst;
		struct sockaddr_in6 *sin6_mask = (struct sockaddr_in6 *)mask;

		bzero(sin6_dst, sizeof(*sin6_dst));
		bzero(sin6_mask, sizeof(*sin6_mask));

		sin6_dst->sin6_family = AF_INET6;
		sin6_dst->sin6_len = sizeof(*sin6_dst);
		sin6_mask->sin6_family = AF_INET6;
		sin6_mask->sin6_len = sizeof(*sin6_mask);
		break;
	}
#endif
	default:
		break;
	}
}
866d68fb8d9SAlexander V. Chernikov 
867d68fb8d9SAlexander V. Chernikov static void
868d68fb8d9SAlexander V. Chernikov export_rtaddrs(const struct rtentry *rt, struct sockaddr *dst,
869d68fb8d9SAlexander V. Chernikov     struct sockaddr *mask)
870d68fb8d9SAlexander V. Chernikov {
871d68fb8d9SAlexander V. Chernikov #ifdef INET
872d68fb8d9SAlexander V. Chernikov 	if (dst->sa_family == AF_INET) {
873d68fb8d9SAlexander V. Chernikov 		struct sockaddr_in *dst4 = (struct sockaddr_in *)dst;
874d68fb8d9SAlexander V. Chernikov 		struct sockaddr_in *mask4 = (struct sockaddr_in *)mask;
8752fb4a03dSRyan Libby 		uint32_t scopeid = 0;
876d68fb8d9SAlexander V. Chernikov 		rt_get_inet_prefix_pmask(rt, &dst4->sin_addr, &mask4->sin_addr,
877d68fb8d9SAlexander V. Chernikov 		    &scopeid);
878d68fb8d9SAlexander V. Chernikov 		return;
879d68fb8d9SAlexander V. Chernikov 	}
880d68fb8d9SAlexander V. Chernikov #endif
881d68fb8d9SAlexander V. Chernikov #ifdef INET6
882d68fb8d9SAlexander V. Chernikov 	if (dst->sa_family == AF_INET6) {
883d68fb8d9SAlexander V. Chernikov 		struct sockaddr_in6 *dst6 = (struct sockaddr_in6 *)dst;
884d68fb8d9SAlexander V. Chernikov 		struct sockaddr_in6 *mask6 = (struct sockaddr_in6 *)mask;
8852fb4a03dSRyan Libby 		uint32_t scopeid = 0;
8862fb4a03dSRyan Libby 		rt_get_inet6_prefix_pmask(rt, &dst6->sin6_addr,
8872fb4a03dSRyan Libby 		    &mask6->sin6_addr, &scopeid);
888d68fb8d9SAlexander V. Chernikov 		dst6->sin6_scope_id = scopeid;
889d68fb8d9SAlexander V. Chernikov 		return;
890d68fb8d9SAlexander V. Chernikov 	}
891d68fb8d9SAlexander V. Chernikov #endif
892d68fb8d9SAlexander V. Chernikov }
893d68fb8d9SAlexander V. Chernikov 
894b31fbebeSAlexander V. Chernikov static int
895b31fbebeSAlexander V. Chernikov update_rtm_from_info(struct rt_addrinfo *info, struct rt_msghdr **prtm,
896b31fbebeSAlexander V. Chernikov     int alloc_len)
897b31fbebeSAlexander V. Chernikov {
898b31fbebeSAlexander V. Chernikov 	struct rt_msghdr *rtm, *orig_rtm = NULL;
899b31fbebeSAlexander V. Chernikov 	struct walkarg w;
900b31fbebeSAlexander V. Chernikov 	int len;
901b31fbebeSAlexander V. Chernikov 
902b31fbebeSAlexander V. Chernikov 	rtm = *prtm;
903b31fbebeSAlexander V. Chernikov 	/* Check if we need to realloc storage */
904b31fbebeSAlexander V. Chernikov 	rtsock_msg_buffer(rtm->rtm_type, info, NULL, &len);
905b31fbebeSAlexander V. Chernikov 	if (len > alloc_len) {
906b31fbebeSAlexander V. Chernikov 		struct rt_msghdr *tmp_rtm;
907b31fbebeSAlexander V. Chernikov 
908b31fbebeSAlexander V. Chernikov 		tmp_rtm = malloc(len, M_TEMP, M_NOWAIT);
909b31fbebeSAlexander V. Chernikov 		if (tmp_rtm == NULL)
910b31fbebeSAlexander V. Chernikov 			return (ENOBUFS);
911b31fbebeSAlexander V. Chernikov 		bcopy(rtm, tmp_rtm, rtm->rtm_msglen);
912b31fbebeSAlexander V. Chernikov 		orig_rtm = rtm;
913b31fbebeSAlexander V. Chernikov 		rtm = tmp_rtm;
914b31fbebeSAlexander V. Chernikov 		alloc_len = len;
915b31fbebeSAlexander V. Chernikov 
916b31fbebeSAlexander V. Chernikov 		/*
917b31fbebeSAlexander V. Chernikov 		 * Delay freeing original rtm as info contains
918b31fbebeSAlexander V. Chernikov 		 * data referencing it.
919b31fbebeSAlexander V. Chernikov 		 */
920b31fbebeSAlexander V. Chernikov 	}
921b31fbebeSAlexander V. Chernikov 
922b31fbebeSAlexander V. Chernikov 	w.w_tmem = (caddr_t)rtm;
923b31fbebeSAlexander V. Chernikov 	w.w_tmemsize = alloc_len;
924b31fbebeSAlexander V. Chernikov 	rtsock_msg_buffer(rtm->rtm_type, info, &w, &len);
925b31fbebeSAlexander V. Chernikov 	rtm->rtm_addrs = info->rti_addrs;
926b31fbebeSAlexander V. Chernikov 
927b31fbebeSAlexander V. Chernikov 	if (orig_rtm != NULL)
928b31fbebeSAlexander V. Chernikov 		free(orig_rtm, M_TEMP);
929b31fbebeSAlexander V. Chernikov 	*prtm = rtm;
930b31fbebeSAlexander V. Chernikov 	return (0);
931b31fbebeSAlexander V. Chernikov }
932b31fbebeSAlexander V. Chernikov 
933d68fb8d9SAlexander V. Chernikov 
934c83dda36SAlexander V. Chernikov /*
935592d300eSAlexander V. Chernikov  * Update sockaddrs, flags, etc in @prtm based on @rc data.
936c83dda36SAlexander V. Chernikov  * rtm can be reallocated.
937c83dda36SAlexander V. Chernikov  *
938c83dda36SAlexander V. Chernikov  * Returns 0 on success, along with pointer to (potentially reallocated)
939c83dda36SAlexander V. Chernikov  *  rtm.
940c83dda36SAlexander V. Chernikov  *
941c83dda36SAlexander V. Chernikov  */
942c83dda36SAlexander V. Chernikov static int
943592d300eSAlexander V. Chernikov update_rtm_from_rc(struct rt_addrinfo *info, struct rt_msghdr **prtm,
944592d300eSAlexander V. Chernikov     int alloc_len, struct rib_cmd_info *rc, struct nhop_object *nh)
945c83dda36SAlexander V. Chernikov {
946c83dda36SAlexander V. Chernikov 	union sockaddr_union saun;
947b31fbebeSAlexander V. Chernikov 	struct rt_msghdr *rtm;
948c83dda36SAlexander V. Chernikov 	struct ifnet *ifp;
949b31fbebeSAlexander V. Chernikov 	int error;
950c83dda36SAlexander V. Chernikov 
951c83dda36SAlexander V. Chernikov 	rtm = *prtm;
952d68fb8d9SAlexander V. Chernikov 	union sockaddr_union sa_dst, sa_mask;
953d68fb8d9SAlexander V. Chernikov 	int family = info->rti_info[RTAX_DST]->sa_family;
954d68fb8d9SAlexander V. Chernikov 	init_sockaddrs_family(family, &sa_dst.sa, &sa_mask.sa);
955d68fb8d9SAlexander V. Chernikov 	export_rtaddrs(rc->rc_rt, &sa_dst.sa, &sa_mask.sa);
956c83dda36SAlexander V. Chernikov 
957d68fb8d9SAlexander V. Chernikov 	info->rti_info[RTAX_DST] = &sa_dst.sa;
958d68fb8d9SAlexander V. Chernikov 	info->rti_info[RTAX_NETMASK] = rt_is_host(rc->rc_rt) ? NULL : &sa_mask.sa;
959aaad3c4fSAlexander V. Chernikov 	info->rti_info[RTAX_GATEWAY] = &nh->gw_sa;
960c83dda36SAlexander V. Chernikov 	info->rti_info[RTAX_GENMASK] = 0;
961aaad3c4fSAlexander V. Chernikov 	ifp = nh->nh_ifp;
962c83dda36SAlexander V. Chernikov 	if (rtm->rtm_addrs & (RTA_IFP | RTA_IFA)) {
963c83dda36SAlexander V. Chernikov 		if (ifp) {
964c83dda36SAlexander V. Chernikov 			info->rti_info[RTAX_IFP] =
965c83dda36SAlexander V. Chernikov 			    ifp->if_addr->ifa_addr;
966aaad3c4fSAlexander V. Chernikov 			error = rtm_get_jailed(info, ifp, nh,
967c83dda36SAlexander V. Chernikov 			    &saun, curthread->td_ucred);
968c83dda36SAlexander V. Chernikov 			if (error != 0)
969c83dda36SAlexander V. Chernikov 				return (error);
970c83dda36SAlexander V. Chernikov 			if (ifp->if_flags & IFF_POINTOPOINT)
971c83dda36SAlexander V. Chernikov 				info->rti_info[RTAX_BRD] =
972aaad3c4fSAlexander V. Chernikov 				    nh->nh_ifa->ifa_dstaddr;
973c83dda36SAlexander V. Chernikov 			rtm->rtm_index = ifp->if_index;
974c83dda36SAlexander V. Chernikov 		} else {
975c83dda36SAlexander V. Chernikov 			info->rti_info[RTAX_IFP] = NULL;
976c83dda36SAlexander V. Chernikov 			info->rti_info[RTAX_IFA] = NULL;
977c83dda36SAlexander V. Chernikov 		}
978c83dda36SAlexander V. Chernikov 	} else if (ifp != NULL)
979c83dda36SAlexander V. Chernikov 		rtm->rtm_index = ifp->if_index;
980c83dda36SAlexander V. Chernikov 
981b31fbebeSAlexander V. Chernikov 	if ((error = update_rtm_from_info(info, prtm, alloc_len)) != 0)
982b31fbebeSAlexander V. Chernikov 		return (error);
983c83dda36SAlexander V. Chernikov 
98476cfc6faSAlexander V. Chernikov 	rtm = *prtm;
985592d300eSAlexander V. Chernikov 	rtm->rtm_flags = rc->rc_rt->rte_flags | nhop_get_rtflags(nh);
986592d300eSAlexander V. Chernikov 	if (rtm->rtm_flags & RTF_GWFLAG_COMPAT)
987c83dda36SAlexander V. Chernikov 		rtm->rtm_flags = RTF_GATEWAY |
988592d300eSAlexander V. Chernikov 			(rtm->rtm_flags & ~RTF_GWFLAG_COMPAT);
989592d300eSAlexander V. Chernikov 	rt_getmetrics(rc->rc_rt, nh, &rtm->rtm_rmx);
990592d300eSAlexander V. Chernikov 	rtm->rtm_rmx.rmx_weight = rc->rc_nh_weight;
991c83dda36SAlexander V. Chernikov 
992c83dda36SAlexander V. Chernikov 	return (0);
993c83dda36SAlexander V. Chernikov }
994c83dda36SAlexander V. Chernikov 
9959c584fa4SAlexander V. Chernikov #ifdef ROUTE_MPATH
996fedeb08bSAlexander V. Chernikov static void
997fedeb08bSAlexander V. Chernikov save_del_notification(struct rib_cmd_info *rc, void *_cbdata)
998fedeb08bSAlexander V. Chernikov {
999fedeb08bSAlexander V. Chernikov 	struct rib_cmd_info *rc_new = (struct rib_cmd_info *)_cbdata;
1000fedeb08bSAlexander V. Chernikov 
1001fedeb08bSAlexander V. Chernikov 	if (rc->rc_cmd == RTM_DELETE)
1002fedeb08bSAlexander V. Chernikov 		*rc_new = *rc;
1003fedeb08bSAlexander V. Chernikov }
1004fedeb08bSAlexander V. Chernikov 
1005fedeb08bSAlexander V. Chernikov static void
1006fedeb08bSAlexander V. Chernikov save_add_notification(struct rib_cmd_info *rc, void *_cbdata)
1007fedeb08bSAlexander V. Chernikov {
1008fedeb08bSAlexander V. Chernikov 	struct rib_cmd_info *rc_new = (struct rib_cmd_info *)_cbdata;
1009fedeb08bSAlexander V. Chernikov 
1010fedeb08bSAlexander V. Chernikov 	if (rc->rc_cmd == RTM_ADD)
1011fedeb08bSAlexander V. Chernikov 		*rc_new = *rc;
1012fedeb08bSAlexander V. Chernikov }
10139c584fa4SAlexander V. Chernikov #endif
1014fedeb08bSAlexander V. Chernikov 
1015a3c2c06bSBjoern A. Zeeb #if defined(INET6) || defined(INET)
1016b31fbebeSAlexander V. Chernikov static struct sockaddr *
1017b31fbebeSAlexander V. Chernikov alloc_sockaddr_aligned(struct linear_buffer *lb, int len)
1018b31fbebeSAlexander V. Chernikov {
101925682e6aSAlexander V. Chernikov 	len = roundup2(len, sizeof(uint64_t));
1020b31fbebeSAlexander V. Chernikov 	if (lb->offset + len > lb->size)
1021b31fbebeSAlexander V. Chernikov 		return (NULL);
1022b31fbebeSAlexander V. Chernikov 	struct sockaddr *sa = (struct sockaddr *)(lb->base + lb->offset);
1023b31fbebeSAlexander V. Chernikov 	lb->offset += len;
1024b31fbebeSAlexander V. Chernikov 	return (sa);
1025b31fbebeSAlexander V. Chernikov }
1026a3c2c06bSBjoern A. Zeeb #endif
1027b31fbebeSAlexander V. Chernikov 
1028df8bae1dSRodney W. Grimes /*ARGSUSED*/
102952041295SPoul-Henning Kamp static int
103073d76e77SKevin Lo route_output(struct mbuf *m, struct socket *so, ...)
1031df8bae1dSRodney W. Grimes {
10325dfc91d7SLuigi Rizzo 	struct rt_msghdr *rtm = NULL;
1033df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
1034b8a6e03fSGleb Smirnoff 	struct epoch_tracker et;
10353deb3649SAlexander V. Chernikov #ifdef INET6
1036d9302031SAlexander V. Chernikov 	struct sockaddr_storage ss;
10376bbfef90SHiroki Sato 	struct sockaddr_in6 *sin6;
10380bebb544SHiroki Sato 	int i, rti_need_deembed = 0;
10396bbfef90SHiroki Sato #endif
1040f2e5eb36SAlexander V. Chernikov 	int alloc_len = 0, len, error = 0, fibnum;
10413ca1a2d6SMax Laier 	sa_family_t saf = AF_UNSPEC;
1042a287a973SAlexander V. Chernikov 	struct rib_cmd_info rc;
1043a287a973SAlexander V. Chernikov 	struct nhop_object *nh;
1044df8bae1dSRodney W. Grimes 
1045f5d9a696SAlexander V. Chernikov 	fibnum = so->so_fibnum;
1046df8bae1dSRodney W. Grimes #define senderr(e) { error = e; goto flush;}
10475dfc91d7SLuigi Rizzo 	if (m == NULL || ((m->m_len < sizeof(long)) &&
10485dfc91d7SLuigi Rizzo 		       (m = m_pullup(m, sizeof(long))) == NULL))
1049df8bae1dSRodney W. Grimes 		return (ENOBUFS);
1050df8bae1dSRodney W. Grimes 	if ((m->m_flags & M_PKTHDR) == 0)
1051df8bae1dSRodney W. Grimes 		panic("route_output");
1052b8a6e03fSGleb Smirnoff 	NET_EPOCH_ENTER(et);
1053df8bae1dSRodney W. Grimes 	len = m->m_pkthdr.len;
1054df8bae1dSRodney W. Grimes 	if (len < sizeof(*rtm) ||
1055f1fcb552SAlexander V. Chernikov 	    len != mtod(m, struct rt_msghdr *)->rtm_msglen)
1056df8bae1dSRodney W. Grimes 		senderr(EINVAL);
1057f1fcb552SAlexander V. Chernikov 
1058f2e5eb36SAlexander V. Chernikov 	/*
1059f2e5eb36SAlexander V. Chernikov 	 * Most of current messages are in range 200-240 bytes,
1060d9437c0fSAlexander V. Chernikov 	 * minimize possible re-allocation on reply using larger size
1061d9437c0fSAlexander V. Chernikov 	 * buffer aligned on 1k boundary.
1062f2e5eb36SAlexander V. Chernikov 	 */
1063f2e5eb36SAlexander V. Chernikov 	alloc_len = roundup2(len, 1024);
1064b31fbebeSAlexander V. Chernikov 	int total_len = alloc_len + SCRATCH_BUFFER_SIZE;
1065b31fbebeSAlexander V. Chernikov 	if ((rtm = malloc(total_len, M_TEMP, M_NOWAIT)) == NULL)
1066df8bae1dSRodney W. Grimes 		senderr(ENOBUFS);
1067f2e5eb36SAlexander V. Chernikov 
1068df8bae1dSRodney W. Grimes 	m_copydata(m, 0, len, (caddr_t)rtm);
1069f1fcb552SAlexander V. Chernikov 	bzero(&info, sizeof(info));
1070a287a973SAlexander V. Chernikov 	nh = NULL;
1071b31fbebeSAlexander V. Chernikov 	struct linear_buffer lb = {
1072b31fbebeSAlexander V. Chernikov 		.base = (char *)rtm + alloc_len,
1073b31fbebeSAlexander V. Chernikov 		.size = SCRATCH_BUFFER_SIZE,
1074b31fbebeSAlexander V. Chernikov 	};
1075f1fcb552SAlexander V. Chernikov 
1076df8bae1dSRodney W. Grimes 	if (rtm->rtm_version != RTM_VERSION) {
1077f1fcb552SAlexander V. Chernikov 		/* Do not touch message since format is unknown */
1078f2e5eb36SAlexander V. Chernikov 		free(rtm, M_TEMP);
1079f1fcb552SAlexander V. Chernikov 		rtm = NULL;
1080df8bae1dSRodney W. Grimes 		senderr(EPROTONOSUPPORT);
1081df8bae1dSRodney W. Grimes 	}
1082f1fcb552SAlexander V. Chernikov 
1083f1fcb552SAlexander V. Chernikov 	/*
1084f1fcb552SAlexander V. Chernikov 	 * Starting from here, it is possible
1085f1fcb552SAlexander V. Chernikov 	 * to alter original message and insert
1086f1fcb552SAlexander V. Chernikov 	 * caller PID and error value.
1087f1fcb552SAlexander V. Chernikov 	 */
1088f1fcb552SAlexander V. Chernikov 
1089b31fbebeSAlexander V. Chernikov 	if ((error = fill_addrinfo(rtm, len, &lb, fibnum, &info)) != 0) {
1090dadb6c3bSRuslan Ermilov 		senderr(error);
1091acd3428bSRobert Watson 	}
1092b31fbebeSAlexander V. Chernikov 	/* fill_addrinfo() embeds scope into IPv6 addresses */
1093b31fbebeSAlexander V. Chernikov #ifdef INET6
1094b31fbebeSAlexander V. Chernikov 	rti_need_deembed = 1;
1095b31fbebeSAlexander V. Chernikov #endif
1096162c0b2eSRuslan Ermilov 
1097c83dda36SAlexander V. Chernikov 	saf = info.rti_info[RTAX_DST]->sa_family;
10989231d35fSQing Li 
1099c83dda36SAlexander V. Chernikov 	/* support for new ARP code */
1100c83dda36SAlexander V. Chernikov 	if (rtm->rtm_flags & RTF_LLDATA) {
1101c83dda36SAlexander V. Chernikov 		error = lla_rt_output(rtm, &info);
1102c83dda36SAlexander V. Chernikov 		goto flush;
11039231d35fSQing Li 	}
11049231d35fSQing Li 
1105145bf6c0SAlexander V. Chernikov 	union sockaddr_union gw_saun;
1106145bf6c0SAlexander V. Chernikov 	int blackhole_flags = rtm->rtm_flags & (RTF_BLACKHOLE|RTF_REJECT);
1107145bf6c0SAlexander V. Chernikov 	if (blackhole_flags != 0) {
1108145bf6c0SAlexander V. Chernikov 		if (blackhole_flags != (RTF_BLACKHOLE | RTF_REJECT))
1109145bf6c0SAlexander V. Chernikov 			error = fill_blackholeinfo(&info, &gw_saun);
11106fa8ed43SAlexander V. Chernikov 		else {
11116fa8ed43SAlexander V. Chernikov 			RTS_PID_LOG(LOG_DEBUG, "both BLACKHOLE and REJECT flags specifiied");
1112145bf6c0SAlexander V. Chernikov 			error = EINVAL;
11136fa8ed43SAlexander V. Chernikov 		}
1114145bf6c0SAlexander V. Chernikov 		if (error != 0)
1115145bf6c0SAlexander V. Chernikov 			senderr(error);
1116145bf6c0SAlexander V. Chernikov 	}
1117145bf6c0SAlexander V. Chernikov 
1118df8bae1dSRodney W. Grimes 	switch (rtm->rtm_type) {
1119df8bae1dSRodney W. Grimes 	case RTM_ADD:
1120c77462ddSAlexander V. Chernikov 	case RTM_CHANGE:
1121b3b6ff23SRyan Stone 		if (rtm->rtm_type == RTM_ADD) {
11226fa8ed43SAlexander V. Chernikov 			if (info.rti_info[RTAX_GATEWAY] == NULL) {
11236fa8ed43SAlexander V. Chernikov 				RTS_PID_LOG(LOG_DEBUG, "RTM_ADD w/o gateway");
1124df8bae1dSRodney W. Grimes 				senderr(EINVAL);
1125b3b6ff23SRyan Stone 			}
11266fa8ed43SAlexander V. Chernikov 		}
1127a287a973SAlexander V. Chernikov 		error = rib_action(fibnum, rtm->rtm_type, &info, &rc);
1128a287a973SAlexander V. Chernikov 		if (error == 0) {
1129fedeb08bSAlexander V. Chernikov #ifdef ROUTE_MPATH
1130fedeb08bSAlexander V. Chernikov 			if (NH_IS_NHGRP(rc.rc_nh_new) ||
1131fedeb08bSAlexander V. Chernikov 			    (rc.rc_nh_old && NH_IS_NHGRP(rc.rc_nh_old))) {
1132fedeb08bSAlexander V. Chernikov 				struct rib_cmd_info rc_simple = {};
1133fedeb08bSAlexander V. Chernikov 				rib_decompose_notification(&rc,
1134fedeb08bSAlexander V. Chernikov 				    save_add_notification, (void *)&rc_simple);
1135fedeb08bSAlexander V. Chernikov 				rc = rc_simple;
1136fedeb08bSAlexander V. Chernikov 			}
1137fedeb08bSAlexander V. Chernikov #endif
1138c260d5cdSAlexander V. Chernikov 			/* nh MAY be empty if RTM_CHANGE request is no-op */
1139a287a973SAlexander V. Chernikov 			nh = rc.rc_nh_new;
1140c260d5cdSAlexander V. Chernikov 			if (nh != NULL) {
1141592d300eSAlexander V. Chernikov 				rtm->rtm_index = nh->nh_ifp->if_index;
11421b95005eSAlexander V. Chernikov 				rtm->rtm_flags = rc.rc_rt->rte_flags | nhop_get_rtflags(nh);
1143df8bae1dSRodney W. Grimes 			}
1144c260d5cdSAlexander V. Chernikov 		}
1145df8bae1dSRodney W. Grimes 		break;
1146df8bae1dSRodney W. Grimes 
1147df8bae1dSRodney W. Grimes 	case RTM_DELETE:
1148a287a973SAlexander V. Chernikov 		error = rib_action(fibnum, RTM_DELETE, &info, &rc);
114978a82810SGarrett Wollman 		if (error == 0) {
1150fedeb08bSAlexander V. Chernikov #ifdef ROUTE_MPATH
1151fedeb08bSAlexander V. Chernikov 			if (NH_IS_NHGRP(rc.rc_nh_old) ||
1152fedeb08bSAlexander V. Chernikov 			    (rc.rc_nh_new && NH_IS_NHGRP(rc.rc_nh_new))) {
1153fedeb08bSAlexander V. Chernikov 				struct rib_cmd_info rc_simple = {};
1154fedeb08bSAlexander V. Chernikov 				rib_decompose_notification(&rc,
1155fedeb08bSAlexander V. Chernikov 				    save_del_notification, (void *)&rc_simple);
1156fedeb08bSAlexander V. Chernikov 				rc = rc_simple;
1157fedeb08bSAlexander V. Chernikov 			}
1158fedeb08bSAlexander V. Chernikov #endif
1159a287a973SAlexander V. Chernikov 			nh = rc.rc_nh_old;
116078a82810SGarrett Wollman 		}
1161df8bae1dSRodney W. Grimes 		break;
1162df8bae1dSRodney W. Grimes 
1163df8bae1dSRodney W. Grimes 	case RTM_GET:
1164a287a973SAlexander V. Chernikov 		error = handle_rtm_get(&info, fibnum, rtm, &rc);
1165c83dda36SAlexander V. Chernikov 		if (error != 0)
1166c83dda36SAlexander V. Chernikov 			senderr(error);
1167a287a973SAlexander V. Chernikov 		nh = rc.rc_nh_new;
1168956b0b65SJeffrey Hsu 
1169d68fb8d9SAlexander V. Chernikov 		if (!can_export_rte(curthread->td_ucred,
1170d68fb8d9SAlexander V. Chernikov 		    info.rti_info[RTAX_NETMASK] == NULL,
1171d68fb8d9SAlexander V. Chernikov 		    info.rti_info[RTAX_DST])) {
1172813dd6aeSBjoern A. Zeeb 			senderr(ESRCH);
1173813dd6aeSBjoern A. Zeeb 		}
1174b31fbebeSAlexander V. Chernikov 		break;
1175a287a973SAlexander V. Chernikov 
1176b31fbebeSAlexander V. Chernikov 	default:
1177b31fbebeSAlexander V. Chernikov 		senderr(EOPNOTSUPP);
1178b31fbebeSAlexander V. Chernikov 	}
1179b31fbebeSAlexander V. Chernikov 
1180c260d5cdSAlexander V. Chernikov 	if (error == 0 && nh != NULL) {
1181592d300eSAlexander V. Chernikov 		error = update_rtm_from_rc(&info, &rtm, alloc_len, &rc, nh);
1182c83dda36SAlexander V. Chernikov 		/*
1183c83dda36SAlexander V. Chernikov 		 * Note that some sockaddr pointers may have changed to
1184c83dda36SAlexander V. Chernikov 		 * point to memory outsize @rtm. Some may be pointing
1185c83dda36SAlexander V. Chernikov 		 * to the on-stack variables.
1186c83dda36SAlexander V. Chernikov 		 * Given that, any pointer in @info CANNOT BE USED.
1187c83dda36SAlexander V. Chernikov 		 */
1188c83dda36SAlexander V. Chernikov 
1189c83dda36SAlexander V. Chernikov 		/*
1190c83dda36SAlexander V. Chernikov 		 * scopeid deembedding has been performed while
1191c83dda36SAlexander V. Chernikov 		 * writing updated rtm in rtsock_msg_buffer().
1192c83dda36SAlexander V. Chernikov 		 * With that in mind, skip deembedding procedure below.
1193c83dda36SAlexander V. Chernikov 		 */
1194d9302031SAlexander V. Chernikov #ifdef INET6
1195c83dda36SAlexander V. Chernikov 		rti_need_deembed = 0;
1196d9302031SAlexander V. Chernikov #endif
1197df8bae1dSRodney W. Grimes 	}
1198df8bae1dSRodney W. Grimes 
1199df8bae1dSRodney W. Grimes flush:
1200b8a6e03fSGleb Smirnoff 	NET_EPOCH_EXIT(et);
120192c227afSAlexander V. Chernikov 
12020bebb544SHiroki Sato #ifdef INET6
1203c83dda36SAlexander V. Chernikov 	if (rtm != NULL) {
12040bebb544SHiroki Sato 		if (rti_need_deembed) {
12050bebb544SHiroki Sato 			/* sin6_scope_id is recovered before sending rtm. */
12060bebb544SHiroki Sato 			sin6 = (struct sockaddr_in6 *)&ss;
120712bdf23aSHiroki Sato 			for (i = 0; i < RTAX_MAX; i++) {
12080bebb544SHiroki Sato 				if (info.rti_info[i] == NULL)
12090bebb544SHiroki Sato 					continue;
12100bebb544SHiroki Sato 				if (info.rti_info[i]->sa_family != AF_INET6)
12110bebb544SHiroki Sato 					continue;
12120bebb544SHiroki Sato 				bcopy(info.rti_info[i], sin6, sizeof(*sin6));
12130bebb544SHiroki Sato 				if (sa6_recoverscope(sin6) == 0)
12140bebb544SHiroki Sato 					bcopy(sin6, info.rti_info[i],
12150bebb544SHiroki Sato 						    sizeof(*sin6));
12160bebb544SHiroki Sato 			}
1217b31fbebeSAlexander V. Chernikov 			if (update_rtm_from_info(&info, &rtm, alloc_len) != 0) {
1218b31fbebeSAlexander V. Chernikov 				if (error != 0)
1219b31fbebeSAlexander V. Chernikov 					error = ENOBUFS;
1220b31fbebeSAlexander V. Chernikov 			}
12210bebb544SHiroki Sato 		}
1222c83dda36SAlexander V. Chernikov 	}
12230bebb544SHiroki Sato #endif
1224c83dda36SAlexander V. Chernikov 	send_rtm_reply(so, rtm, m, saf, fibnum, error);
1225c83dda36SAlexander V. Chernikov 
1226c83dda36SAlexander V. Chernikov 	return (error);
1227c83dda36SAlexander V. Chernikov }
1228c83dda36SAlexander V. Chernikov 
1229c83dda36SAlexander V. Chernikov /*
1230c83dda36SAlexander V. Chernikov  * Sends the prepared reply message in @rtm to all rtsock clients.
1231c83dda36SAlexander V. Chernikov  * Frees @m and @rtm.
1232c83dda36SAlexander V. Chernikov  *
1233c83dda36SAlexander V. Chernikov  */
1234c83dda36SAlexander V. Chernikov static void
1235c83dda36SAlexander V. Chernikov send_rtm_reply(struct socket *so, struct rt_msghdr *rtm, struct mbuf *m,
1236c83dda36SAlexander V. Chernikov     sa_family_t saf, u_int fibnum, int rtm_errno)
1237c83dda36SAlexander V. Chernikov {
1238c83dda36SAlexander V. Chernikov 	struct rawcb *rp = NULL;
1239c83dda36SAlexander V. Chernikov 
1240c83dda36SAlexander V. Chernikov 	/*
1241c83dda36SAlexander V. Chernikov 	 * Check to see if we don't want our own messages.
1242c83dda36SAlexander V. Chernikov 	 */
1243c83dda36SAlexander V. Chernikov 	if ((so->so_options & SO_USELOOPBACK) == 0) {
1244c83dda36SAlexander V. Chernikov 		if (V_route_cb.any_count <= 1) {
1245c83dda36SAlexander V. Chernikov 			if (rtm != NULL)
1246c83dda36SAlexander V. Chernikov 				free(rtm, M_TEMP);
1247c83dda36SAlexander V. Chernikov 			m_freem(m);
1248c83dda36SAlexander V. Chernikov 			return;
1249c83dda36SAlexander V. Chernikov 		}
1250c83dda36SAlexander V. Chernikov 		/* There is another listener, so construct message */
1251c83dda36SAlexander V. Chernikov 		rp = sotorawcb(so);
1252c83dda36SAlexander V. Chernikov 	}
1253c83dda36SAlexander V. Chernikov 
1254c83dda36SAlexander V. Chernikov 	if (rtm != NULL) {
1255c83dda36SAlexander V. Chernikov 		if (rtm_errno!= 0)
1256c83dda36SAlexander V. Chernikov 			rtm->rtm_errno = rtm_errno;
125792c227afSAlexander V. Chernikov 		else
125892c227afSAlexander V. Chernikov 			rtm->rtm_flags |= RTF_DONE;
125992c227afSAlexander V. Chernikov 
1260df8bae1dSRodney W. Grimes 		m_copyback(m, 0, rtm->rtm_msglen, (caddr_t)rtm);
126103311056SHajimu UMEMOTO 		if (m->m_pkthdr.len < rtm->rtm_msglen) {
126203311056SHajimu UMEMOTO 			m_freem(m);
126303311056SHajimu UMEMOTO 			m = NULL;
126403311056SHajimu UMEMOTO 		} else if (m->m_pkthdr.len > rtm->rtm_msglen)
126503311056SHajimu UMEMOTO 			m_adj(m, rtm->rtm_msglen - m->m_pkthdr.len);
1266f2e5eb36SAlexander V. Chernikov 
1267f2e5eb36SAlexander V. Chernikov 		free(rtm, M_TEMP);
1268df8bae1dSRodney W. Grimes 	}
126992c227afSAlexander V. Chernikov 	if (m != NULL) {
1270773aa053SAlexander V. Chernikov 		M_SETFIB(m, fibnum);
1271528737fdSBjoern A. Zeeb 		m->m_flags |= RTS_FILTER_FIB;
1272becc44d7SSam Leffler 		if (rp) {
1273becc44d7SSam Leffler 			/*
1274becc44d7SSam Leffler 			 * XXX insure we don't get a copy by
1275becc44d7SSam Leffler 			 * invalidating our protocol
1276becc44d7SSam Leffler 			 */
1277becc44d7SSam Leffler 			unsigned short family = rp->rcb_proto.sp_family;
1278becc44d7SSam Leffler 			rp->rcb_proto.sp_family = 0;
12793ca1a2d6SMax Laier 			rt_dispatch(m, saf);
1280becc44d7SSam Leffler 			rp->rcb_proto.sp_family = family;
1281becc44d7SSam Leffler 		} else
12823ca1a2d6SMax Laier 			rt_dispatch(m, saf);
1283becc44d7SSam Leffler 	}
1284df8bae1dSRodney W. Grimes }
1285df8bae1dSRodney W. Grimes 
128652041295SPoul-Henning Kamp static void
128793bfd365SAlexander V. Chernikov rt_getmetrics(const struct rtentry *rt, const struct nhop_object *nh,
128893bfd365SAlexander V. Chernikov     struct rt_metrics *out)
128997d8d152SAndre Oppermann {
1290e3a7aa6fSGleb Smirnoff 
129197d8d152SAndre Oppermann 	bzero(out, sizeof(*out));
129293bfd365SAlexander V. Chernikov 	out->rmx_mtu = nh->nh_mtu;
1293e3a7aa6fSGleb Smirnoff 	out->rmx_weight = rt->rt_weight;
129493bfd365SAlexander V. Chernikov 	out->rmx_nhidx = nhop_get_idx(nh);
1295e27c3f48SOleg Bulyzhin 	/* Kernel -> userland timebase conversion. */
1296e3a7aa6fSGleb Smirnoff 	out->rmx_expire = rt->rt_expire ?
1297e3a7aa6fSGleb Smirnoff 	    rt->rt_expire - time_uptime + time_second : 0;
129897d8d152SAndre Oppermann }
129997d8d152SAndre Oppermann 
13007f33a738SJulian Elischer /*
13017f33a738SJulian Elischer  * Extract the addresses of the passed sockaddrs.
13027f33a738SJulian Elischer  * Do a little sanity checking so as to avoid bad memory references.
1303076d0761SJulian Elischer  * This data is derived straight from userland.
13047f33a738SJulian Elischer  */
1305076d0761SJulian Elischer static int
1306becc44d7SSam Leffler rt_xaddrs(caddr_t cp, caddr_t cplim, struct rt_addrinfo *rtinfo)
1307df8bae1dSRodney W. Grimes {
1308e74642dfSLuigi Rizzo 	struct sockaddr *sa;
1309e74642dfSLuigi Rizzo 	int i;
1310df8bae1dSRodney W. Grimes 
1311becc44d7SSam Leffler 	for (i = 0; i < RTAX_MAX && cp < cplim; i++) {
1312df8bae1dSRodney W. Grimes 		if ((rtinfo->rti_addrs & (1 << i)) == 0)
1313df8bae1dSRodney W. Grimes 			continue;
1314ff6d0a59SJulian Elischer 		sa = (struct sockaddr *)cp;
13157f33a738SJulian Elischer 		/*
1316076d0761SJulian Elischer 		 * It won't fit.
13177f33a738SJulian Elischer 		 */
13186fa8ed43SAlexander V. Chernikov 		if (cp + sa->sa_len > cplim) {
13196fa8ed43SAlexander V. Chernikov 			RTS_PID_LOG(LOG_DEBUG, "sa_len too big for sa type %d", i);
1320076d0761SJulian Elischer 			return (EINVAL);
13216fa8ed43SAlexander V. Chernikov 		}
13227f33a738SJulian Elischer 		/*
13237f33a738SJulian Elischer 		 * there are no more.. quit now
13247f33a738SJulian Elischer 		 * If there are more bits, they are in error.
13257f33a738SJulian Elischer 		 * I've seen this. route(1) can evidently generate these.
13267f33a738SJulian Elischer 		 * This causes kernel to core dump.
1327076d0761SJulian Elischer 		 * for compatibility, If we see this, point to a safe address.
13287f33a738SJulian Elischer 		 */
1329076d0761SJulian Elischer 		if (sa->sa_len == 0) {
1330076d0761SJulian Elischer 			rtinfo->rti_info[i] = &sa_zero;
1331076d0761SJulian Elischer 			return (0); /* should be EINVAL but for compat */
1332df8bae1dSRodney W. Grimes 		}
1333076d0761SJulian Elischer 		/* accept it */
13340bebb544SHiroki Sato #ifdef INET6
13350bebb544SHiroki Sato 		if (sa->sa_family == AF_INET6)
13360bebb544SHiroki Sato 			sa6_embedscope((struct sockaddr_in6 *)sa,
13370bebb544SHiroki Sato 			    V_ip6_use_defzone);
13380bebb544SHiroki Sato #endif
1339076d0761SJulian Elischer 		rtinfo->rti_info[i] = sa;
1340e74642dfSLuigi Rizzo 		cp += SA_SIZE(sa);
1341076d0761SJulian Elischer 	}
1342076d0761SJulian Elischer 	return (0);
1343df8bae1dSRodney W. Grimes }
1344df8bae1dSRodney W. Grimes 
1345a4513bacSAlexander V. Chernikov #ifdef INET
13462fe5a794SAlexander V. Chernikov static inline void
13472fe5a794SAlexander V. Chernikov fill_sockaddr_inet(struct sockaddr_in *sin, struct in_addr addr)
13482fe5a794SAlexander V. Chernikov {
13492fe5a794SAlexander V. Chernikov 
13502fe5a794SAlexander V. Chernikov 	const struct sockaddr_in nsin = {
13512fe5a794SAlexander V. Chernikov 		.sin_family = AF_INET,
13522fe5a794SAlexander V. Chernikov 		.sin_len = sizeof(struct sockaddr_in),
13532fe5a794SAlexander V. Chernikov 		.sin_addr = addr,
13542fe5a794SAlexander V. Chernikov 	};
13552fe5a794SAlexander V. Chernikov 	*sin = nsin;
13562fe5a794SAlexander V. Chernikov }
1357a4513bacSAlexander V. Chernikov #endif
13582fe5a794SAlexander V. Chernikov 
1359a4513bacSAlexander V. Chernikov #ifdef INET6
13602fe5a794SAlexander V. Chernikov static inline void
13612fe5a794SAlexander V. Chernikov fill_sockaddr_inet6(struct sockaddr_in6 *sin6, const struct in6_addr *addr6,
13622fe5a794SAlexander V. Chernikov     uint32_t scopeid)
13632fe5a794SAlexander V. Chernikov {
13642fe5a794SAlexander V. Chernikov 
13652fe5a794SAlexander V. Chernikov 	const struct sockaddr_in6 nsin6 = {
13662fe5a794SAlexander V. Chernikov 		.sin6_family = AF_INET6,
13672fe5a794SAlexander V. Chernikov 		.sin6_len = sizeof(struct sockaddr_in6),
13682fe5a794SAlexander V. Chernikov 		.sin6_addr = *addr6,
13692fe5a794SAlexander V. Chernikov 		.sin6_scope_id = scopeid,
13702fe5a794SAlexander V. Chernikov 	};
13712fe5a794SAlexander V. Chernikov 	*sin6 = nsin6;
13722fe5a794SAlexander V. Chernikov }
1373a4513bacSAlexander V. Chernikov #endif
13742fe5a794SAlexander V. Chernikov 
1375a3c2c06bSBjoern A. Zeeb #if defined(INET6) || defined(INET)
1376e5b394f2SAlexander V. Chernikov /*
1377e5b394f2SAlexander V. Chernikov  * Checks if gateway is suitable for lltable operations.
1378e5b394f2SAlexander V. Chernikov  * Lltable code requires AF_LINK gateway with ifindex
1379e5b394f2SAlexander V. Chernikov  *  and mac address specified.
1380e5b394f2SAlexander V. Chernikov  * Returns 0 on success.
1381e5b394f2SAlexander V. Chernikov  */
1382e5b394f2SAlexander V. Chernikov static int
1383e5b394f2SAlexander V. Chernikov cleanup_xaddrs_lladdr(struct rt_addrinfo *info)
1384e5b394f2SAlexander V. Chernikov {
1385e5b394f2SAlexander V. Chernikov 	struct sockaddr_dl *sdl = (struct sockaddr_dl *)info->rti_info[RTAX_GATEWAY];
1386e5b394f2SAlexander V. Chernikov 
1387e5b394f2SAlexander V. Chernikov 	if (sdl->sdl_family != AF_LINK)
1388e5b394f2SAlexander V. Chernikov 		return (EINVAL);
1389e5b394f2SAlexander V. Chernikov 
13906fa8ed43SAlexander V. Chernikov 	if (sdl->sdl_index == 0) {
13916fa8ed43SAlexander V. Chernikov 		RTS_PID_LOG(LOG_DEBUG, "AF_LINK gateway w/o ifindex");
1392e5b394f2SAlexander V. Chernikov 		return (EINVAL);
13936fa8ed43SAlexander V. Chernikov 	}
1394e5b394f2SAlexander V. Chernikov 
13956fa8ed43SAlexander V. Chernikov 	if (offsetof(struct sockaddr_dl, sdl_data) + sdl->sdl_nlen + sdl->sdl_alen > sdl->sdl_len) {
13966fa8ed43SAlexander V. Chernikov 		RTS_PID_LOG(LOG_DEBUG, "AF_LINK gw: sdl_nlen/sdl_alen too large");
1397e5b394f2SAlexander V. Chernikov 		return (EINVAL);
13986fa8ed43SAlexander V. Chernikov 	}
1399e5b394f2SAlexander V. Chernikov 
1400e5b394f2SAlexander V. Chernikov 	return (0);
1401e5b394f2SAlexander V. Chernikov }
1402e5b394f2SAlexander V. Chernikov 
14032fe5a794SAlexander V. Chernikov static int
1404b31fbebeSAlexander V. Chernikov cleanup_xaddrs_gateway(struct rt_addrinfo *info, struct linear_buffer *lb)
14052fe5a794SAlexander V. Chernikov {
14062fe5a794SAlexander V. Chernikov 	struct sockaddr *gw = info->rti_info[RTAX_GATEWAY];
1407b31fbebeSAlexander V. Chernikov 	struct sockaddr *sa;
14082fe5a794SAlexander V. Chernikov 
1409e5b394f2SAlexander V. Chernikov 	if (info->rti_flags & RTF_LLDATA)
1410e5b394f2SAlexander V. Chernikov 		return (cleanup_xaddrs_lladdr(info));
1411e5b394f2SAlexander V. Chernikov 
14122fe5a794SAlexander V. Chernikov 	switch (gw->sa_family) {
14132fe5a794SAlexander V. Chernikov #ifdef INET
14142fe5a794SAlexander V. Chernikov 	case AF_INET:
14152fe5a794SAlexander V. Chernikov 		{
14162fe5a794SAlexander V. Chernikov 			struct sockaddr_in *gw_sin = (struct sockaddr_in *)gw;
1417b31fbebeSAlexander V. Chernikov 
1418b31fbebeSAlexander V. Chernikov 			/* Ensure reads do not go beyoud SA boundary */
1419b31fbebeSAlexander V. Chernikov 			if (SA_SIZE(gw) < offsetof(struct sockaddr_in, sin_zero)) {
14206fa8ed43SAlexander V. Chernikov 				RTS_PID_LOG(LOG_DEBUG, "gateway sin_len too small: %d",
14216fa8ed43SAlexander V. Chernikov 				    gw->sa_len);
14222fe5a794SAlexander V. Chernikov 				return (EINVAL);
14232fe5a794SAlexander V. Chernikov 			}
1424b31fbebeSAlexander V. Chernikov 			sa = alloc_sockaddr_aligned(lb, sizeof(struct sockaddr_in));
1425b31fbebeSAlexander V. Chernikov 			if (sa == NULL)
1426b31fbebeSAlexander V. Chernikov 				return (ENOBUFS);
1427b31fbebeSAlexander V. Chernikov 			fill_sockaddr_inet((struct sockaddr_in *)sa, gw_sin->sin_addr);
1428b31fbebeSAlexander V. Chernikov 			info->rti_info[RTAX_GATEWAY] = sa;
14292fe5a794SAlexander V. Chernikov 		}
14302fe5a794SAlexander V. Chernikov 		break;
14312fe5a794SAlexander V. Chernikov #endif
14322fe5a794SAlexander V. Chernikov #ifdef INET6
14332fe5a794SAlexander V. Chernikov 	case AF_INET6:
14342fe5a794SAlexander V. Chernikov 		{
14352fe5a794SAlexander V. Chernikov 			struct sockaddr_in6 *gw_sin6 = (struct sockaddr_in6 *)gw;
14362fe5a794SAlexander V. Chernikov 			if (gw_sin6->sin6_len < sizeof(struct sockaddr_in6)) {
14376fa8ed43SAlexander V. Chernikov 				RTS_PID_LOG(LOG_DEBUG, "gateway sin6_len too small: %d",
14386fa8ed43SAlexander V. Chernikov 				    gw->sa_len);
14392fe5a794SAlexander V. Chernikov 				return (EINVAL);
14402fe5a794SAlexander V. Chernikov 			}
14412fe5a794SAlexander V. Chernikov 			fill_sockaddr_inet6(gw_sin6, &gw_sin6->sin6_addr, 0);
14422fe5a794SAlexander V. Chernikov 			break;
14432fe5a794SAlexander V. Chernikov 		}
14442fe5a794SAlexander V. Chernikov #endif
14452fe5a794SAlexander V. Chernikov 	case AF_LINK:
14462fe5a794SAlexander V. Chernikov 		{
14477f5f3fccSAlexander V. Chernikov 			struct sockaddr_dl *gw_sdl;
14482fe5a794SAlexander V. Chernikov 
14497f5f3fccSAlexander V. Chernikov 			size_t sdl_min_len = offsetof(struct sockaddr_dl, sdl_data);
14507f5f3fccSAlexander V. Chernikov 			gw_sdl = (struct sockaddr_dl *)gw;
14517f5f3fccSAlexander V. Chernikov 			if (gw_sdl->sdl_len < sdl_min_len) {
14526fa8ed43SAlexander V. Chernikov 				RTS_PID_LOG(LOG_DEBUG, "gateway sdl_len too small: %d",
14536fa8ed43SAlexander V. Chernikov 				    gw_sdl->sdl_len);
14542fe5a794SAlexander V. Chernikov 				return (EINVAL);
14552fe5a794SAlexander V. Chernikov 			}
1456b31fbebeSAlexander V. Chernikov 			sa = alloc_sockaddr_aligned(lb, sizeof(struct sockaddr_dl_short));
1457b31fbebeSAlexander V. Chernikov 			if (sa == NULL)
1458b31fbebeSAlexander V. Chernikov 				return (ENOBUFS);
14592fe5a794SAlexander V. Chernikov 
14602fe5a794SAlexander V. Chernikov 			const struct sockaddr_dl_short sdl = {
14612fe5a794SAlexander V. Chernikov 				.sdl_family = AF_LINK,
1462b31fbebeSAlexander V. Chernikov 				.sdl_len = sizeof(struct sockaddr_dl_short),
14632fe5a794SAlexander V. Chernikov 				.sdl_index = gw_sdl->sdl_index,
14642fe5a794SAlexander V. Chernikov 			};
1465b31fbebeSAlexander V. Chernikov 			*((struct sockaddr_dl_short *)sa) = sdl;
1466b31fbebeSAlexander V. Chernikov 			info->rti_info[RTAX_GATEWAY] = sa;
14672fe5a794SAlexander V. Chernikov 			break;
14682fe5a794SAlexander V. Chernikov 		}
14692fe5a794SAlexander V. Chernikov 	}
14702fe5a794SAlexander V. Chernikov 
14712fe5a794SAlexander V. Chernikov 	return (0);
14722fe5a794SAlexander V. Chernikov }
1473a3c2c06bSBjoern A. Zeeb #endif
14742fe5a794SAlexander V. Chernikov 
1475f9e1cd6cSAlexander V. Chernikov static void
1476f9e1cd6cSAlexander V. Chernikov remove_netmask(struct rt_addrinfo *info)
1477f9e1cd6cSAlexander V. Chernikov {
1478f9e1cd6cSAlexander V. Chernikov 	info->rti_info[RTAX_NETMASK] = NULL;
1479f9e1cd6cSAlexander V. Chernikov 	info->rti_flags |= RTF_HOST;
1480f9e1cd6cSAlexander V. Chernikov 	info->rti_addrs &= ~RTA_NETMASK;
1481f9e1cd6cSAlexander V. Chernikov }
1482f9e1cd6cSAlexander V. Chernikov 
1483a4513bacSAlexander V. Chernikov #ifdef INET
14842fe5a794SAlexander V. Chernikov static int
1485b31fbebeSAlexander V. Chernikov cleanup_xaddrs_inet(struct rt_addrinfo *info, struct linear_buffer *lb)
14862fe5a794SAlexander V. Chernikov {
14872fe5a794SAlexander V. Chernikov 	struct sockaddr_in *dst_sa, *mask_sa;
1488b31fbebeSAlexander V. Chernikov 	const int sa_len = sizeof(struct sockaddr_in);
1489b31fbebeSAlexander V. Chernikov 	struct in_addr dst, mask;
14902fe5a794SAlexander V. Chernikov 
14912fe5a794SAlexander V. Chernikov 	/* Check & fixup dst/netmask combination first */
14922fe5a794SAlexander V. Chernikov 	dst_sa = (struct sockaddr_in *)info->rti_info[RTAX_DST];
14932fe5a794SAlexander V. Chernikov 	mask_sa = (struct sockaddr_in *)info->rti_info[RTAX_NETMASK];
14942fe5a794SAlexander V. Chernikov 
1495b31fbebeSAlexander V. Chernikov 	/* Ensure reads do not go beyound the buffer size */
14966fa8ed43SAlexander V. Chernikov 	if (SA_SIZE(dst_sa) < offsetof(struct sockaddr_in, sin_zero)) {
14976fa8ed43SAlexander V. Chernikov 		RTS_PID_LOG(LOG_DEBUG, "prefix dst sin_len too small: %d",
14986fa8ed43SAlexander V. Chernikov 		    dst_sa->sin_len);
14992fe5a794SAlexander V. Chernikov 		return (EINVAL);
15006fa8ed43SAlexander V. Chernikov 	}
1501b31fbebeSAlexander V. Chernikov 
1502b31fbebeSAlexander V. Chernikov 	if ((mask_sa != NULL) && mask_sa->sin_len < sizeof(struct sockaddr_in)) {
1503b31fbebeSAlexander V. Chernikov 		/*
1504b31fbebeSAlexander V. Chernikov 		 * Some older routing software encode mask length into the
1505b31fbebeSAlexander V. Chernikov 		 * sin_len, thus resulting in "truncated" sockaddr.
1506b31fbebeSAlexander V. Chernikov 		 */
1507b31fbebeSAlexander V. Chernikov 		int len = mask_sa->sin_len - offsetof(struct sockaddr_in, sin_addr);
1508b31fbebeSAlexander V. Chernikov 		if (len >= 0) {
1509b31fbebeSAlexander V. Chernikov 			mask.s_addr = 0;
1510b31fbebeSAlexander V. Chernikov 			if (len > sizeof(struct in_addr))
1511b31fbebeSAlexander V. Chernikov 				len = sizeof(struct in_addr);
1512b31fbebeSAlexander V. Chernikov 			memcpy(&mask, &mask_sa->sin_addr, len);
1513b31fbebeSAlexander V. Chernikov 		} else {
15146fa8ed43SAlexander V. Chernikov 			RTS_PID_LOG(LOG_DEBUG, "prefix mask sin_len too small: %d",
15156fa8ed43SAlexander V. Chernikov 			    mask_sa->sin_len);
15162fe5a794SAlexander V. Chernikov 			return (EINVAL);
15172fe5a794SAlexander V. Chernikov 		}
1518b31fbebeSAlexander V. Chernikov 	} else
1519b31fbebeSAlexander V. Chernikov 		mask.s_addr = mask_sa ? mask_sa->sin_addr.s_addr : INADDR_BROADCAST;
15202fe5a794SAlexander V. Chernikov 
1521b31fbebeSAlexander V. Chernikov 	dst.s_addr = htonl(ntohl(dst_sa->sin_addr.s_addr) & ntohl(mask.s_addr));
1522b31fbebeSAlexander V. Chernikov 
1523b31fbebeSAlexander V. Chernikov 	/* Construct new "clean" dst/mask sockaddresses */
1524b31fbebeSAlexander V. Chernikov 	if ((dst_sa = (struct sockaddr_in *)alloc_sockaddr_aligned(lb, sa_len)) == NULL)
1525b31fbebeSAlexander V. Chernikov 		return (ENOBUFS);
1526b31fbebeSAlexander V. Chernikov 	fill_sockaddr_inet(dst_sa, dst);
1527b31fbebeSAlexander V. Chernikov 	info->rti_info[RTAX_DST] = (struct sockaddr *)dst_sa;
1528b31fbebeSAlexander V. Chernikov 
1529b31fbebeSAlexander V. Chernikov 	if (mask.s_addr != INADDR_BROADCAST) {
1530b31fbebeSAlexander V. Chernikov 		if ((mask_sa = (struct sockaddr_in *)alloc_sockaddr_aligned(lb, sa_len)) == NULL)
1531b31fbebeSAlexander V. Chernikov 			return (ENOBUFS);
15322fe5a794SAlexander V. Chernikov 		fill_sockaddr_inet(mask_sa, mask);
1533b31fbebeSAlexander V. Chernikov 		info->rti_info[RTAX_NETMASK] = (struct sockaddr *)mask_sa;
15345d1403a7SAlexander V. Chernikov 		info->rti_flags &= ~RTF_HOST;
1535b31fbebeSAlexander V. Chernikov 	} else
1536f9e1cd6cSAlexander V. Chernikov 		remove_netmask(info);
15372fe5a794SAlexander V. Chernikov 
15382fe5a794SAlexander V. Chernikov 	/* Check gateway */
15392fe5a794SAlexander V. Chernikov 	if (info->rti_info[RTAX_GATEWAY] != NULL)
1540b31fbebeSAlexander V. Chernikov 		return (cleanup_xaddrs_gateway(info, lb));
15412fe5a794SAlexander V. Chernikov 
15422fe5a794SAlexander V. Chernikov 	return (0);
15432fe5a794SAlexander V. Chernikov }
1544a4513bacSAlexander V. Chernikov #endif
15452fe5a794SAlexander V. Chernikov 
1546a4513bacSAlexander V. Chernikov #ifdef INET6
15472fe5a794SAlexander V. Chernikov static int
1548b31fbebeSAlexander V. Chernikov cleanup_xaddrs_inet6(struct rt_addrinfo *info, struct linear_buffer *lb)
15492fe5a794SAlexander V. Chernikov {
1550b31fbebeSAlexander V. Chernikov 	struct sockaddr *sa;
15512fe5a794SAlexander V. Chernikov 	struct sockaddr_in6 *dst_sa, *mask_sa;
1552b31fbebeSAlexander V. Chernikov 	struct in6_addr mask, *dst;
1553b31fbebeSAlexander V. Chernikov 	const int sa_len = sizeof(struct sockaddr_in6);
15542fe5a794SAlexander V. Chernikov 
15552fe5a794SAlexander V. Chernikov 	/* Check & fixup dst/netmask combination first */
15562fe5a794SAlexander V. Chernikov 	dst_sa = (struct sockaddr_in6 *)info->rti_info[RTAX_DST];
15572fe5a794SAlexander V. Chernikov 	mask_sa = (struct sockaddr_in6 *)info->rti_info[RTAX_NETMASK];
15582fe5a794SAlexander V. Chernikov 
15592fe5a794SAlexander V. Chernikov 	if (dst_sa->sin6_len < sizeof(struct sockaddr_in6)) {
15606fa8ed43SAlexander V. Chernikov 		RTS_PID_LOG(LOG_DEBUG, "prefix dst sin6_len too small: %d",
15616fa8ed43SAlexander V. Chernikov 		    dst_sa->sin6_len);
15622fe5a794SAlexander V. Chernikov 		return (EINVAL);
15632fe5a794SAlexander V. Chernikov 	}
1564b31fbebeSAlexander V. Chernikov 
15652fe5a794SAlexander V. Chernikov 	if (mask_sa && mask_sa->sin6_len < sizeof(struct sockaddr_in6)) {
1566b31fbebeSAlexander V. Chernikov 		/*
1567b31fbebeSAlexander V. Chernikov 		 * Some older routing software encode mask length into the
1568b31fbebeSAlexander V. Chernikov 		 * sin6_len, thus resulting in "truncated" sockaddr.
1569b31fbebeSAlexander V. Chernikov 		 */
1570b31fbebeSAlexander V. Chernikov 		int len = mask_sa->sin6_len - offsetof(struct sockaddr_in6, sin6_addr);
1571b31fbebeSAlexander V. Chernikov 		if (len >= 0) {
1572b31fbebeSAlexander V. Chernikov 			bzero(&mask, sizeof(mask));
1573b31fbebeSAlexander V. Chernikov 			if (len > sizeof(struct in6_addr))
1574b31fbebeSAlexander V. Chernikov 				len = sizeof(struct in6_addr);
1575b31fbebeSAlexander V. Chernikov 			memcpy(&mask, &mask_sa->sin6_addr, len);
1576b31fbebeSAlexander V. Chernikov 		} else {
15776fa8ed43SAlexander V. Chernikov 			RTS_PID_LOG(LOG_DEBUG, "rtsock: prefix mask sin6_len too small: %d",
15786fa8ed43SAlexander V. Chernikov 			    mask_sa->sin6_len);
15792fe5a794SAlexander V. Chernikov 			return (EINVAL);
15802fe5a794SAlexander V. Chernikov 		}
1581b31fbebeSAlexander V. Chernikov 	} else
1582b31fbebeSAlexander V. Chernikov 		mask = mask_sa ? mask_sa->sin6_addr : in6mask128;
15832fe5a794SAlexander V. Chernikov 
1584b31fbebeSAlexander V. Chernikov 	dst = &dst_sa->sin6_addr;
1585b31fbebeSAlexander V. Chernikov 	IN6_MASK_ADDR(dst, &mask);
1586b31fbebeSAlexander V. Chernikov 
1587b31fbebeSAlexander V. Chernikov 	if ((sa = alloc_sockaddr_aligned(lb, sa_len)) == NULL)
1588b31fbebeSAlexander V. Chernikov 		return (ENOBUFS);
1589b31fbebeSAlexander V. Chernikov 	fill_sockaddr_inet6((struct sockaddr_in6 *)sa, dst, 0);
1590b31fbebeSAlexander V. Chernikov 	info->rti_info[RTAX_DST] = sa;
1591b31fbebeSAlexander V. Chernikov 
1592b31fbebeSAlexander V. Chernikov 	if (!IN6_ARE_ADDR_EQUAL(&mask, &in6mask128)) {
1593b31fbebeSAlexander V. Chernikov 		if ((sa = alloc_sockaddr_aligned(lb, sa_len)) == NULL)
1594b31fbebeSAlexander V. Chernikov 			return (ENOBUFS);
1595b31fbebeSAlexander V. Chernikov 		fill_sockaddr_inet6((struct sockaddr_in6 *)sa, &mask, 0);
1596b31fbebeSAlexander V. Chernikov 		info->rti_info[RTAX_NETMASK] = sa;
15975d1403a7SAlexander V. Chernikov 		info->rti_flags &= ~RTF_HOST;
1598b31fbebeSAlexander V. Chernikov 	} else
1599f9e1cd6cSAlexander V. Chernikov 		remove_netmask(info);
16002fe5a794SAlexander V. Chernikov 
16012fe5a794SAlexander V. Chernikov 	/* Check gateway */
16022fe5a794SAlexander V. Chernikov 	if (info->rti_info[RTAX_GATEWAY] != NULL)
1603b31fbebeSAlexander V. Chernikov 		return (cleanup_xaddrs_gateway(info, lb));
16042fe5a794SAlexander V. Chernikov 
16052fe5a794SAlexander V. Chernikov 	return (0);
16062fe5a794SAlexander V. Chernikov }
1607a4513bacSAlexander V. Chernikov #endif
16082fe5a794SAlexander V. Chernikov 
16092fe5a794SAlexander V. Chernikov static int
1610b31fbebeSAlexander V. Chernikov cleanup_xaddrs(struct rt_addrinfo *info, struct linear_buffer *lb)
16112fe5a794SAlexander V. Chernikov {
16122fe5a794SAlexander V. Chernikov 	int error = EAFNOSUPPORT;
16132fe5a794SAlexander V. Chernikov 
16146fa8ed43SAlexander V. Chernikov 	if (info->rti_info[RTAX_DST] == NULL) {
16156fa8ed43SAlexander V. Chernikov 		RTS_PID_LOG(LOG_DEBUG, "prefix dst is not set");
16162fe5a794SAlexander V. Chernikov 		return (EINVAL);
16176fa8ed43SAlexander V. Chernikov 	}
16182fe5a794SAlexander V. Chernikov 
1619f9e1cd6cSAlexander V. Chernikov 	if (info->rti_flags & RTF_LLDATA) {
1620f9e1cd6cSAlexander V. Chernikov 		/*
1621f9e1cd6cSAlexander V. Chernikov 		 * arp(8)/ndp(8) sends RTA_NETMASK for the associated
1622f9e1cd6cSAlexander V. Chernikov 		 * prefix along with the actual address in RTA_DST.
1623f9e1cd6cSAlexander V. Chernikov 		 * Remove netmask to avoid unnecessary address masking.
1624f9e1cd6cSAlexander V. Chernikov 		 */
1625f9e1cd6cSAlexander V. Chernikov 		remove_netmask(info);
1626f9e1cd6cSAlexander V. Chernikov 	}
1627f9e1cd6cSAlexander V. Chernikov 
16282fe5a794SAlexander V. Chernikov 	switch (info->rti_info[RTAX_DST]->sa_family) {
16292fe5a794SAlexander V. Chernikov #ifdef INET
16302fe5a794SAlexander V. Chernikov 	case AF_INET:
1631b31fbebeSAlexander V. Chernikov 		error = cleanup_xaddrs_inet(info, lb);
16322fe5a794SAlexander V. Chernikov 		break;
16332fe5a794SAlexander V. Chernikov #endif
16342fe5a794SAlexander V. Chernikov #ifdef INET6
16352fe5a794SAlexander V. Chernikov 	case AF_INET6:
1636b31fbebeSAlexander V. Chernikov 		error = cleanup_xaddrs_inet6(info, lb);
16372fe5a794SAlexander V. Chernikov 		break;
16382fe5a794SAlexander V. Chernikov #endif
16392fe5a794SAlexander V. Chernikov 	}
16402fe5a794SAlexander V. Chernikov 
16412fe5a794SAlexander V. Chernikov 	return (error);
16422fe5a794SAlexander V. Chernikov }
16432fe5a794SAlexander V. Chernikov 
16446d076ae8SBjoern A. Zeeb /*
16453deb3649SAlexander V. Chernikov  * Fill in @dmask with valid netmask leaving original @smask
16463deb3649SAlexander V. Chernikov  * intact. Mostly used with radix netmasks.
16473deb3649SAlexander V. Chernikov  */
1648fc88ecd3SAlexander V. Chernikov struct sockaddr *
1649fc88ecd3SAlexander V. Chernikov rtsock_fix_netmask(const struct sockaddr *dst, const struct sockaddr *smask,
16503deb3649SAlexander V. Chernikov     struct sockaddr_storage *dmask)
16513deb3649SAlexander V. Chernikov {
16523deb3649SAlexander V. Chernikov 	if (dst == NULL || smask == NULL)
16533deb3649SAlexander V. Chernikov 		return (NULL);
16543deb3649SAlexander V. Chernikov 
16553deb3649SAlexander V. Chernikov 	memset(dmask, 0, dst->sa_len);
16563deb3649SAlexander V. Chernikov 	memcpy(dmask, smask, smask->sa_len);
16573deb3649SAlexander V. Chernikov 	dmask->ss_len = dst->sa_len;
16583deb3649SAlexander V. Chernikov 	dmask->ss_family = dst->sa_family;
16593deb3649SAlexander V. Chernikov 
16603deb3649SAlexander V. Chernikov 	return ((struct sockaddr *)dmask);
16613deb3649SAlexander V. Chernikov }
16623deb3649SAlexander V. Chernikov 
/*
 * Writes information related to @rtinfo object to newly-allocated mbuf.
 * Assumes MCLBYTES is enough to construct any message.
 * Used for OS notifications of various events (if/ifa announces, etc.)
 *
 * Returns allocated mbuf or NULL on failure.
 */
1670df8bae1dSRodney W. Grimes static struct mbuf *
16716db47af4SAlexander V. Chernikov rtsock_msg_mbuf(int type, struct rt_addrinfo *rtinfo)
1672df8bae1dSRodney W. Grimes {
167392be2847SMark Johnston 	struct sockaddr_storage ss;
16745dfc91d7SLuigi Rizzo 	struct rt_msghdr *rtm;
16755dfc91d7SLuigi Rizzo 	struct mbuf *m;
16765dfc91d7SLuigi Rizzo 	int i;
16775dfc91d7SLuigi Rizzo 	struct sockaddr *sa;
16786bbfef90SHiroki Sato #ifdef INET6
16796bbfef90SHiroki Sato 	struct sockaddr_in6 *sin6;
16806bbfef90SHiroki Sato #endif
1681df8bae1dSRodney W. Grimes 	int len, dlen;
1682df8bae1dSRodney W. Grimes 
1683df8bae1dSRodney W. Grimes 	switch (type) {
1684df8bae1dSRodney W. Grimes 	case RTM_DELADDR:
1685df8bae1dSRodney W. Grimes 	case RTM_NEWADDR:
1686df8bae1dSRodney W. Grimes 		len = sizeof(struct ifa_msghdr);
1687df8bae1dSRodney W. Grimes 		break;
1688df8bae1dSRodney W. Grimes 
1689477180fbSGarrett Wollman 	case RTM_DELMADDR:
1690477180fbSGarrett Wollman 	case RTM_NEWMADDR:
1691477180fbSGarrett Wollman 		len = sizeof(struct ifma_msghdr);
1692477180fbSGarrett Wollman 		break;
1693477180fbSGarrett Wollman 
1694df8bae1dSRodney W. Grimes 	case RTM_IFINFO:
1695df8bae1dSRodney W. Grimes 		len = sizeof(struct if_msghdr);
1696df8bae1dSRodney W. Grimes 		break;
1697df8bae1dSRodney W. Grimes 
16987b6edd04SRuslan Ermilov 	case RTM_IFANNOUNCE:
1699b83a279fSSam Leffler 	case RTM_IEEE80211:
17007b6edd04SRuslan Ermilov 		len = sizeof(struct if_announcemsghdr);
17017b6edd04SRuslan Ermilov 		break;
17027b6edd04SRuslan Ermilov 
1703df8bae1dSRodney W. Grimes 	default:
1704df8bae1dSRodney W. Grimes 		len = sizeof(struct rt_msghdr);
1705df8bae1dSRodney W. Grimes 	}
1706c69f77c3SGleb Smirnoff 
1707c69f77c3SGleb Smirnoff 	/* XXXGL: can we use MJUMPAGESIZE cluster here? */
1708c69f77c3SGleb Smirnoff 	KASSERT(len <= MCLBYTES, ("%s: message too big", __func__));
1709c69f77c3SGleb Smirnoff 	if (len > MHLEN)
1710c69f77c3SGleb Smirnoff 		m = m_getcl(M_NOWAIT, MT_DATA, M_PKTHDR);
1711c69f77c3SGleb Smirnoff 	else
1712eb1b1807SGleb Smirnoff 		m = m_gethdr(M_NOWAIT, MT_DATA);
17135dfc91d7SLuigi Rizzo 	if (m == NULL)
171433841545SHajimu UMEMOTO 		return (m);
1715c69f77c3SGleb Smirnoff 
1716df8bae1dSRodney W. Grimes 	m->m_pkthdr.len = m->m_len = len;
1717df8bae1dSRodney W. Grimes 	rtm = mtod(m, struct rt_msghdr *);
1718df8bae1dSRodney W. Grimes 	bzero((caddr_t)rtm, len);
1719df8bae1dSRodney W. Grimes 	for (i = 0; i < RTAX_MAX; i++) {
1720df8bae1dSRodney W. Grimes 		if ((sa = rtinfo->rti_info[i]) == NULL)
1721df8bae1dSRodney W. Grimes 			continue;
1722df8bae1dSRodney W. Grimes 		rtinfo->rti_addrs |= (1 << i);
172392be2847SMark Johnston 
1724e74642dfSLuigi Rizzo 		dlen = SA_SIZE(sa);
172592be2847SMark Johnston 		KASSERT(dlen <= sizeof(ss),
172692be2847SMark Johnston 		    ("%s: sockaddr size overflow", __func__));
172792be2847SMark Johnston 		bzero(&ss, sizeof(ss));
172892be2847SMark Johnston 		bcopy(sa, &ss, sa->sa_len);
172992be2847SMark Johnston 		sa = (struct sockaddr *)&ss;
17306bbfef90SHiroki Sato #ifdef INET6
1731bec053ffSAlexander V. Chernikov 		if (sa->sa_family == AF_INET6) {
173292be2847SMark Johnston 			sin6 = (struct sockaddr_in6 *)sa;
173392be2847SMark Johnston 			(void)sa6_recoverscope(sin6);
17346bbfef90SHiroki Sato 		}
17356bbfef90SHiroki Sato #endif
1736df8bae1dSRodney W. Grimes 		m_copyback(m, len, dlen, (caddr_t)sa);
1737df8bae1dSRodney W. Grimes 		len += dlen;
1738df8bae1dSRodney W. Grimes 	}
1739df8bae1dSRodney W. Grimes 	if (m->m_pkthdr.len != len) {
1740df8bae1dSRodney W. Grimes 		m_freem(m);
1741df8bae1dSRodney W. Grimes 		return (NULL);
1742df8bae1dSRodney W. Grimes 	}
1743df8bae1dSRodney W. Grimes 	rtm->rtm_msglen = len;
1744df8bae1dSRodney W. Grimes 	rtm->rtm_version = RTM_VERSION;
1745df8bae1dSRodney W. Grimes 	rtm->rtm_type = type;
1746df8bae1dSRodney W. Grimes 	return (m);
1747df8bae1dSRodney W. Grimes }
1748df8bae1dSRodney W. Grimes 
17496d076ae8SBjoern A. Zeeb /*
1750f2e5eb36SAlexander V. Chernikov  * Writes information related to @rtinfo object to preallocated buffer.
1751f2e5eb36SAlexander V. Chernikov  * Stores needed size in @plen. If @w is NULL, calculates size without
1752f2e5eb36SAlexander V. Chernikov  * writing.
1753f2e5eb36SAlexander V. Chernikov  * Used for sysctl dumps and rtsock answers (RTM_DEL/RTM_GET) generation.
1754f2e5eb36SAlexander V. Chernikov  *
1755f2e5eb36SAlexander V. Chernikov  * Returns 0 on success.
1756f2e5eb36SAlexander V. Chernikov  *
17576d076ae8SBjoern A. Zeeb  */
1758df8bae1dSRodney W. Grimes static int
1759f2e5eb36SAlexander V. Chernikov rtsock_msg_buffer(int type, struct rt_addrinfo *rtinfo, struct walkarg *w, int *plen)
1760df8bae1dSRodney W. Grimes {
176192be2847SMark Johnston 	struct sockaddr_storage ss;
176292be2847SMark Johnston 	int len, buflen = 0, dlen, i;
1763de46b2c6SAlexander V. Chernikov 	caddr_t cp = NULL;
1764f2e5eb36SAlexander V. Chernikov 	struct rt_msghdr *rtm = NULL;
17656bbfef90SHiroki Sato #ifdef INET6
17666bbfef90SHiroki Sato 	struct sockaddr_in6 *sin6;
17676bbfef90SHiroki Sato #endif
1768279e33d4SKonstantin Belousov #ifdef COMPAT_FREEBSD32
1769279e33d4SKonstantin Belousov 	bool compat32 = false;
1770279e33d4SKonstantin Belousov #endif
1771df8bae1dSRodney W. Grimes 
1772df8bae1dSRodney W. Grimes 	switch (type) {
1773df8bae1dSRodney W. Grimes 	case RTM_DELADDR:
1774df8bae1dSRodney W. Grimes 	case RTM_NEWADDR:
17756d076ae8SBjoern A. Zeeb 		if (w != NULL && w->w_op == NET_RT_IFLISTL) {
17766d076ae8SBjoern A. Zeeb #ifdef COMPAT_FREEBSD32
1777279e33d4SKonstantin Belousov 			if (w->w_req->flags & SCTL_MASK32) {
17786d076ae8SBjoern A. Zeeb 				len = sizeof(struct ifa_msghdrl32);
1779279e33d4SKonstantin Belousov 				compat32 = true;
1780279e33d4SKonstantin Belousov 			} else
17816d076ae8SBjoern A. Zeeb #endif
17826d076ae8SBjoern A. Zeeb 				len = sizeof(struct ifa_msghdrl);
17836d076ae8SBjoern A. Zeeb 		} else
1784df8bae1dSRodney W. Grimes 			len = sizeof(struct ifa_msghdr);
1785df8bae1dSRodney W. Grimes 		break;
1786df8bae1dSRodney W. Grimes 
1787df8bae1dSRodney W. Grimes 	case RTM_IFINFO:
1788427a928aSKonstantin Belousov #ifdef COMPAT_FREEBSD32
1789427a928aSKonstantin Belousov 		if (w != NULL && w->w_req->flags & SCTL_MASK32) {
17906d076ae8SBjoern A. Zeeb 			if (w->w_op == NET_RT_IFLISTL)
17916d076ae8SBjoern A. Zeeb 				len = sizeof(struct if_msghdrl32);
17926d076ae8SBjoern A. Zeeb 			else
1793427a928aSKonstantin Belousov 				len = sizeof(struct if_msghdr32);
1794279e33d4SKonstantin Belousov 			compat32 = true;
1795427a928aSKonstantin Belousov 			break;
1796427a928aSKonstantin Belousov 		}
1797427a928aSKonstantin Belousov #endif
17986d076ae8SBjoern A. Zeeb 		if (w != NULL && w->w_op == NET_RT_IFLISTL)
17996d076ae8SBjoern A. Zeeb 			len = sizeof(struct if_msghdrl);
18006d076ae8SBjoern A. Zeeb 		else
1801df8bae1dSRodney W. Grimes 			len = sizeof(struct if_msghdr);
1802df8bae1dSRodney W. Grimes 		break;
1803df8bae1dSRodney W. Grimes 
180405b2efe0SBruce M Simpson 	case RTM_NEWMADDR:
180505b2efe0SBruce M Simpson 		len = sizeof(struct ifma_msghdr);
180605b2efe0SBruce M Simpson 		break;
180705b2efe0SBruce M Simpson 
1808df8bae1dSRodney W. Grimes 	default:
1809df8bae1dSRodney W. Grimes 		len = sizeof(struct rt_msghdr);
1810df8bae1dSRodney W. Grimes 	}
1811f2e5eb36SAlexander V. Chernikov 
1812f2e5eb36SAlexander V. Chernikov 	if (w != NULL) {
1813f2e5eb36SAlexander V. Chernikov 		rtm = (struct rt_msghdr *)w->w_tmem;
1814f2e5eb36SAlexander V. Chernikov 		buflen = w->w_tmemsize - len;
1815f2e5eb36SAlexander V. Chernikov 		cp = (caddr_t)w->w_tmem + len;
1816f2e5eb36SAlexander V. Chernikov 	}
1817f2e5eb36SAlexander V. Chernikov 
1818f2e5eb36SAlexander V. Chernikov 	rtinfo->rti_addrs = 0;
1819df8bae1dSRodney W. Grimes 	for (i = 0; i < RTAX_MAX; i++) {
18205dfc91d7SLuigi Rizzo 		struct sockaddr *sa;
1821df8bae1dSRodney W. Grimes 
18225dfc91d7SLuigi Rizzo 		if ((sa = rtinfo->rti_info[i]) == NULL)
1823df8bae1dSRodney W. Grimes 			continue;
1824df8bae1dSRodney W. Grimes 		rtinfo->rti_addrs |= (1 << i);
1825279e33d4SKonstantin Belousov #ifdef COMPAT_FREEBSD32
1826279e33d4SKonstantin Belousov 		if (compat32)
1827279e33d4SKonstantin Belousov 			dlen = SA_SIZE32(sa);
1828279e33d4SKonstantin Belousov 		else
1829279e33d4SKonstantin Belousov #endif
1830e74642dfSLuigi Rizzo 			dlen = SA_SIZE(sa);
1831f2e5eb36SAlexander V. Chernikov 		if (cp != NULL && buflen >= dlen) {
183292be2847SMark Johnston 			KASSERT(dlen <= sizeof(ss),
183392be2847SMark Johnston 			    ("%s: sockaddr size overflow", __func__));
183492be2847SMark Johnston 			bzero(&ss, sizeof(ss));
183592be2847SMark Johnston 			bcopy(sa, &ss, sa->sa_len);
183692be2847SMark Johnston 			sa = (struct sockaddr *)&ss;
18376bbfef90SHiroki Sato #ifdef INET6
1838bec053ffSAlexander V. Chernikov 			if (sa->sa_family == AF_INET6) {
183992be2847SMark Johnston 				sin6 = (struct sockaddr_in6 *)sa;
184092be2847SMark Johnston 				(void)sa6_recoverscope(sin6);
18416bbfef90SHiroki Sato 			}
18426bbfef90SHiroki Sato #endif
1843df8bae1dSRodney W. Grimes 			bcopy((caddr_t)sa, cp, (unsigned)dlen);
1844df8bae1dSRodney W. Grimes 			cp += dlen;
1845f2e5eb36SAlexander V. Chernikov 			buflen -= dlen;
1846f2e5eb36SAlexander V. Chernikov 		} else if (cp != NULL) {
1847f2e5eb36SAlexander V. Chernikov 			/*
1848f2e5eb36SAlexander V. Chernikov 			 * Buffer too small. Count needed size
1849f2e5eb36SAlexander V. Chernikov 			 * and return with error.
1850f2e5eb36SAlexander V. Chernikov 			 */
1851f2e5eb36SAlexander V. Chernikov 			cp = NULL;
1852df8bae1dSRodney W. Grimes 		}
1853f2e5eb36SAlexander V. Chernikov 
1854df8bae1dSRodney W. Grimes 		len += dlen;
1855df8bae1dSRodney W. Grimes 	}
1856f2e5eb36SAlexander V. Chernikov 
1857f2e5eb36SAlexander V. Chernikov 	if (cp != NULL) {
1858f2e5eb36SAlexander V. Chernikov 		dlen = ALIGN(len) - len;
1859f2e5eb36SAlexander V. Chernikov 		if (buflen < dlen)
1860f2e5eb36SAlexander V. Chernikov 			cp = NULL;
1861d25f8522SMark Johnston 		else {
1862d25f8522SMark Johnston 			bzero(cp, dlen);
1863d25f8522SMark Johnston 			cp += dlen;
1864f2e5eb36SAlexander V. Chernikov 			buflen -= dlen;
1865f2e5eb36SAlexander V. Chernikov 		}
1866d25f8522SMark Johnston 	}
1867694ff264SAndrew Gallatin 	len = ALIGN(len);
1868df8bae1dSRodney W. Grimes 
1869f2e5eb36SAlexander V. Chernikov 	if (cp != NULL) {
1870f2e5eb36SAlexander V. Chernikov 		/* fill header iff buffer is large enough */
1871df8bae1dSRodney W. Grimes 		rtm->rtm_version = RTM_VERSION;
1872df8bae1dSRodney W. Grimes 		rtm->rtm_type = type;
1873df8bae1dSRodney W. Grimes 		rtm->rtm_msglen = len;
1874df8bae1dSRodney W. Grimes 	}
1875f2e5eb36SAlexander V. Chernikov 
1876f2e5eb36SAlexander V. Chernikov 	*plen = len;
1877f2e5eb36SAlexander V. Chernikov 
1878f2e5eb36SAlexander V. Chernikov 	if (w != NULL && cp == NULL)
1879f2e5eb36SAlexander V. Chernikov 		return (ENOBUFS);
1880f2e5eb36SAlexander V. Chernikov 
1881f2e5eb36SAlexander V. Chernikov 	return (0);
1882df8bae1dSRodney W. Grimes }
1883df8bae1dSRodney W. Grimes 
1884df8bae1dSRodney W. Grimes /*
1885df8bae1dSRodney W. Grimes  * This routine is called to generate a message from the routing
1886a4641f4eSPedro F. Giffuni  * socket indicating that a redirect has occurred, a routing lookup
1887df8bae1dSRodney W. Grimes  * has failed, or that a protocol has detected timeouts to a particular
1888df8bae1dSRodney W. Grimes  * destination.
1889df8bae1dSRodney W. Grimes  */
1890df8bae1dSRodney W. Grimes void
1891528737fdSBjoern A. Zeeb rt_missmsg_fib(int type, struct rt_addrinfo *rtinfo, int flags, int error,
1892528737fdSBjoern A. Zeeb     int fibnum)
1893df8bae1dSRodney W. Grimes {
1894becc44d7SSam Leffler 	struct rt_msghdr *rtm;
1895becc44d7SSam Leffler 	struct mbuf *m;
1896df8bae1dSRodney W. Grimes 	struct sockaddr *sa = rtinfo->rti_info[RTAX_DST];
1897df8bae1dSRodney W. Grimes 
1898c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
1899df8bae1dSRodney W. Grimes 		return;
19006db47af4SAlexander V. Chernikov 	m = rtsock_msg_mbuf(type, rtinfo);
19015dfc91d7SLuigi Rizzo 	if (m == NULL)
1902df8bae1dSRodney W. Grimes 		return;
1903528737fdSBjoern A. Zeeb 
19047d9b6df1SAlexander V. Chernikov 	if (fibnum != RT_ALL_FIBS) {
1905528737fdSBjoern A. Zeeb 		KASSERT(fibnum >= 0 && fibnum < rt_numfibs, ("%s: fibnum out "
1906528737fdSBjoern A. Zeeb 		    "of range 0 <= %d < %d", __func__, fibnum, rt_numfibs));
1907528737fdSBjoern A. Zeeb 		M_SETFIB(m, fibnum);
1908528737fdSBjoern A. Zeeb 		m->m_flags |= RTS_FILTER_FIB;
1909528737fdSBjoern A. Zeeb 	}
1910528737fdSBjoern A. Zeeb 
1911df8bae1dSRodney W. Grimes 	rtm = mtod(m, struct rt_msghdr *);
1912df8bae1dSRodney W. Grimes 	rtm->rtm_flags = RTF_DONE | flags;
1913df8bae1dSRodney W. Grimes 	rtm->rtm_errno = error;
1914df8bae1dSRodney W. Grimes 	rtm->rtm_addrs = rtinfo->rti_addrs;
19153ca1a2d6SMax Laier 	rt_dispatch(m, sa ? sa->sa_family : AF_UNSPEC);
1916df8bae1dSRodney W. Grimes }
1917df8bae1dSRodney W. Grimes 
1918528737fdSBjoern A. Zeeb void
1919528737fdSBjoern A. Zeeb rt_missmsg(int type, struct rt_addrinfo *rtinfo, int flags, int error)
1920528737fdSBjoern A. Zeeb {
1921528737fdSBjoern A. Zeeb 
19227d9b6df1SAlexander V. Chernikov 	rt_missmsg_fib(type, rtinfo, flags, error, RT_ALL_FIBS);
1923528737fdSBjoern A. Zeeb }
1924528737fdSBjoern A. Zeeb 
1925df8bae1dSRodney W. Grimes /*
1926df8bae1dSRodney W. Grimes  * This routine is called to generate a message from the routing
1927df8bae1dSRodney W. Grimes  * socket indicating that the status of a network interface has changed.
1928df8bae1dSRodney W. Grimes  */
1929df8bae1dSRodney W. Grimes void
1930becc44d7SSam Leffler rt_ifmsg(struct ifnet *ifp)
1931df8bae1dSRodney W. Grimes {
1932becc44d7SSam Leffler 	struct if_msghdr *ifm;
1933df8bae1dSRodney W. Grimes 	struct mbuf *m;
1934df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
1935df8bae1dSRodney W. Grimes 
1936c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
1937df8bae1dSRodney W. Grimes 		return;
1938df8bae1dSRodney W. Grimes 	bzero((caddr_t)&info, sizeof(info));
19396db47af4SAlexander V. Chernikov 	m = rtsock_msg_mbuf(RTM_IFINFO, &info);
19405dfc91d7SLuigi Rizzo 	if (m == NULL)
1941df8bae1dSRodney W. Grimes 		return;
1942df8bae1dSRodney W. Grimes 	ifm = mtod(m, struct if_msghdr *);
1943df8bae1dSRodney W. Grimes 	ifm->ifm_index = ifp->if_index;
1944292ee7beSRobert Watson 	ifm->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
1945e6485f73SGleb Smirnoff 	if_data_copy(ifp, &ifm->ifm_data);
1946df8bae1dSRodney W. Grimes 	ifm->ifm_addrs = 0;
19473ca1a2d6SMax Laier 	rt_dispatch(m, AF_UNSPEC);
1948df8bae1dSRodney W. Grimes }
1949df8bae1dSRodney W. Grimes 
1950df8bae1dSRodney W. Grimes /*
19514cbac30bSAlexander V. Chernikov  * Announce interface address arrival/withdraw.
19524cbac30bSAlexander V. Chernikov  * Please do not call directly, use rt_addrmsg().
19534cbac30bSAlexander V. Chernikov  * Assume input data to be valid.
19544cbac30bSAlexander V. Chernikov  * Returns 0 on success.
1955df8bae1dSRodney W. Grimes  */
19564cbac30bSAlexander V. Chernikov int
19574cbac30bSAlexander V. Chernikov rtsock_addrmsg(int cmd, struct ifaddr *ifa, int fibnum)
1958df8bae1dSRodney W. Grimes {
1959df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
19604cbac30bSAlexander V. Chernikov 	struct sockaddr *sa;
19614cbac30bSAlexander V. Chernikov 	int ncmd;
19624cbac30bSAlexander V. Chernikov 	struct mbuf *m;
19634cbac30bSAlexander V. Chernikov 	struct ifa_msghdr *ifam;
1964df8bae1dSRodney W. Grimes 	struct ifnet *ifp = ifa->ifa_ifp;
19653deb3649SAlexander V. Chernikov 	struct sockaddr_storage ss;
1966df8bae1dSRodney W. Grimes 
1967c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
19684cbac30bSAlexander V. Chernikov 		return (0);
1969df8bae1dSRodney W. Grimes 
19704cbac30bSAlexander V. Chernikov 	ncmd = cmd == RTM_ADD ? RTM_NEWADDR : RTM_DELADDR;
19714cbac30bSAlexander V. Chernikov 
19724cbac30bSAlexander V. Chernikov 	bzero((caddr_t)&info, sizeof(info));
1973becc44d7SSam Leffler 	info.rti_info[RTAX_IFA] = sa = ifa->ifa_addr;
19744a0d6638SRuslan Ermilov 	info.rti_info[RTAX_IFP] = ifp->if_addr->ifa_addr;
19753deb3649SAlexander V. Chernikov 	info.rti_info[RTAX_NETMASK] = rtsock_fix_netmask(
1976e02d3fe7SAlexander V. Chernikov 	    info.rti_info[RTAX_IFA], ifa->ifa_netmask, &ss);
1977becc44d7SSam Leffler 	info.rti_info[RTAX_BRD] = ifa->ifa_dstaddr;
19786db47af4SAlexander V. Chernikov 	if ((m = rtsock_msg_mbuf(ncmd, &info)) == NULL)
19794cbac30bSAlexander V. Chernikov 		return (ENOBUFS);
1980df8bae1dSRodney W. Grimes 	ifam = mtod(m, struct ifa_msghdr *);
1981df8bae1dSRodney W. Grimes 	ifam->ifam_index = ifp->if_index;
19829753faf5SGleb Smirnoff 	ifam->ifam_metric = ifa->ifa_ifp->if_metric;
1983df8bae1dSRodney W. Grimes 	ifam->ifam_flags = ifa->ifa_flags;
1984df8bae1dSRodney W. Grimes 	ifam->ifam_addrs = info.rti_addrs;
19854cbac30bSAlexander V. Chernikov 
19864cbac30bSAlexander V. Chernikov 	if (fibnum != RT_ALL_FIBS) {
19874cbac30bSAlexander V. Chernikov 		M_SETFIB(m, fibnum);
19884cbac30bSAlexander V. Chernikov 		m->m_flags |= RTS_FILTER_FIB;
1989df8bae1dSRodney W. Grimes 	}
19904cbac30bSAlexander V. Chernikov 
19914cbac30bSAlexander V. Chernikov 	rt_dispatch(m, sa ? sa->sa_family : AF_UNSPEC);
19924cbac30bSAlexander V. Chernikov 
19934cbac30bSAlexander V. Chernikov 	return (0);
19944cbac30bSAlexander V. Chernikov }
19954cbac30bSAlexander V. Chernikov 
19964cbac30bSAlexander V. Chernikov /*
1997e02d3fe7SAlexander V. Chernikov  * Announce route addition/removal to rtsock based on @rt data.
1998e02d3fe7SAlexander V. Chernikov  * Callers are advives to use rt_routemsg() instead of using this
1999e02d3fe7SAlexander V. Chernikov  *  function directly.
2000e02d3fe7SAlexander V. Chernikov  * Assume @rt data is consistent.
20014cbac30bSAlexander V. Chernikov  *
20024cbac30bSAlexander V. Chernikov  * Returns 0 on success.
20034cbac30bSAlexander V. Chernikov  */
20044cbac30bSAlexander V. Chernikov int
2005d68cf57bSAlexander V. Chernikov rtsock_routemsg(int cmd, struct rtentry *rt, struct nhop_object *nh,
20064cbac30bSAlexander V. Chernikov     int fibnum)
20074cbac30bSAlexander V. Chernikov {
2008d68cf57bSAlexander V. Chernikov 	union sockaddr_union dst, mask;
2009e02d3fe7SAlexander V. Chernikov 	struct rt_addrinfo info;
2010df8bae1dSRodney W. Grimes 
2011c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
20124cbac30bSAlexander V. Chernikov 		return (0);
20134cbac30bSAlexander V. Chernikov 
2014d68cf57bSAlexander V. Chernikov 	int family = rt_get_family(rt);
2015d68cf57bSAlexander V. Chernikov 	init_sockaddrs_family(family, &dst.sa, &mask.sa);
2016d68cf57bSAlexander V. Chernikov 	export_rtaddrs(rt, &dst.sa, &mask.sa);
2017d68cf57bSAlexander V. Chernikov 
20184cbac30bSAlexander V. Chernikov 	bzero((caddr_t)&info, sizeof(info));
2019d68cf57bSAlexander V. Chernikov 	info.rti_info[RTAX_DST] = &dst.sa;
2020d68cf57bSAlexander V. Chernikov 	info.rti_info[RTAX_NETMASK] = &mask.sa;
202193bfd365SAlexander V. Chernikov 	info.rti_info[RTAX_GATEWAY] = &nh->gw_sa;
202293bfd365SAlexander V. Chernikov 	info.rti_flags = rt->rte_flags | nhop_get_rtflags(nh);
2023d68cf57bSAlexander V. Chernikov 	info.rti_ifp = nh->nh_ifp;
2024e02d3fe7SAlexander V. Chernikov 
2025e02d3fe7SAlexander V. Chernikov 	return (rtsock_routemsg_info(cmd, &info, fibnum));
2026e02d3fe7SAlexander V. Chernikov }
2027e02d3fe7SAlexander V. Chernikov 
2028e02d3fe7SAlexander V. Chernikov int
2029e02d3fe7SAlexander V. Chernikov rtsock_routemsg_info(int cmd, struct rt_addrinfo *info, int fibnum)
2030e02d3fe7SAlexander V. Chernikov {
2031e02d3fe7SAlexander V. Chernikov 	struct rt_msghdr *rtm;
2032e02d3fe7SAlexander V. Chernikov 	struct sockaddr *sa;
2033e02d3fe7SAlexander V. Chernikov 	struct mbuf *m;
2034e02d3fe7SAlexander V. Chernikov 
2035e02d3fe7SAlexander V. Chernikov 	if (V_route_cb.any_count == 0)
2036e02d3fe7SAlexander V. Chernikov 		return (0);
2037e02d3fe7SAlexander V. Chernikov 
2038e02d3fe7SAlexander V. Chernikov 	if (info->rti_flags & RTF_HOST)
2039e02d3fe7SAlexander V. Chernikov 		info->rti_info[RTAX_NETMASK] = NULL;
2040e02d3fe7SAlexander V. Chernikov 
2041e02d3fe7SAlexander V. Chernikov 	m = rtsock_msg_mbuf(cmd, info);
2042e02d3fe7SAlexander V. Chernikov 	if (m == NULL)
20434cbac30bSAlexander V. Chernikov 		return (ENOBUFS);
20444cbac30bSAlexander V. Chernikov 
20457d9b6df1SAlexander V. Chernikov 	if (fibnum != RT_ALL_FIBS) {
2046e02d3fe7SAlexander V. Chernikov 		KASSERT(fibnum >= 0 && fibnum < rt_numfibs, ("%s: fibnum out "
2047e02d3fe7SAlexander V. Chernikov 		    "of range 0 <= %d < %d", __func__, fibnum, rt_numfibs));
2048528737fdSBjoern A. Zeeb 		M_SETFIB(m, fibnum);
2049528737fdSBjoern A. Zeeb 		m->m_flags |= RTS_FILTER_FIB;
2050528737fdSBjoern A. Zeeb 	}
20514cbac30bSAlexander V. Chernikov 
2052e02d3fe7SAlexander V. Chernikov 	rtm = mtod(m, struct rt_msghdr *);
2053e02d3fe7SAlexander V. Chernikov 	rtm->rtm_addrs = info->rti_addrs;
2054e02d3fe7SAlexander V. Chernikov 	if (info->rti_ifp != NULL)
2055e02d3fe7SAlexander V. Chernikov 		rtm->rtm_index = info->rti_ifp->if_index;
2056e02d3fe7SAlexander V. Chernikov 	/* Add RTF_DONE to indicate command 'completion' required by API */
2057e02d3fe7SAlexander V. Chernikov 	info->rti_flags |= RTF_DONE;
2058e02d3fe7SAlexander V. Chernikov 	/* Reported routes has to be up */
2059e02d3fe7SAlexander V. Chernikov 	if (cmd == RTM_ADD || cmd == RTM_CHANGE)
2060e02d3fe7SAlexander V. Chernikov 		info->rti_flags |= RTF_UP;
2061e02d3fe7SAlexander V. Chernikov 	rtm->rtm_flags = info->rti_flags;
2062e02d3fe7SAlexander V. Chernikov 
2063e02d3fe7SAlexander V. Chernikov 	sa = info->rti_info[RTAX_DST];
20643ca1a2d6SMax Laier 	rt_dispatch(m, sa ? sa->sa_family : AF_UNSPEC);
20654cbac30bSAlexander V. Chernikov 
20664cbac30bSAlexander V. Chernikov 	return (0);
2067df8bae1dSRodney W. Grimes }
2068df8bae1dSRodney W. Grimes 
2069477180fbSGarrett Wollman /*
2070477180fbSGarrett Wollman  * This is the analogue to the rt_newaddrmsg which performs the same
2071477180fbSGarrett Wollman  * function but for multicast group memberhips.  This is easier since
2072477180fbSGarrett Wollman  * there is no route state to worry about.
2073477180fbSGarrett Wollman  */
2074477180fbSGarrett Wollman void
2075becc44d7SSam Leffler rt_newmaddrmsg(int cmd, struct ifmultiaddr *ifma)
2076477180fbSGarrett Wollman {
2077477180fbSGarrett Wollman 	struct rt_addrinfo info;
20785dfc91d7SLuigi Rizzo 	struct mbuf *m = NULL;
2079477180fbSGarrett Wollman 	struct ifnet *ifp = ifma->ifma_ifp;
2080477180fbSGarrett Wollman 	struct ifma_msghdr *ifmam;
2081477180fbSGarrett Wollman 
2082c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
2083477180fbSGarrett Wollman 		return;
2084477180fbSGarrett Wollman 
2085477180fbSGarrett Wollman 	bzero((caddr_t)&info, sizeof(info));
2086becc44d7SSam Leffler 	info.rti_info[RTAX_IFA] = ifma->ifma_addr;
20877edd877aSMatt Macy 	if (ifp && ifp->if_addr)
20887edd877aSMatt Macy 		info.rti_info[RTAX_IFP] = ifp->if_addr->ifa_addr;
20897edd877aSMatt Macy 	else
20907edd877aSMatt Macy 		info.rti_info[RTAX_IFP] = NULL;
2091477180fbSGarrett Wollman 	/*
2092477180fbSGarrett Wollman 	 * If a link-layer address is present, present it as a ``gateway''
2093477180fbSGarrett Wollman 	 * (similarly to how ARP entries, e.g., are presented).
2094477180fbSGarrett Wollman 	 */
2095becc44d7SSam Leffler 	info.rti_info[RTAX_GATEWAY] = ifma->ifma_lladdr;
20966db47af4SAlexander V. Chernikov 	m = rtsock_msg_mbuf(cmd, &info);
2097becc44d7SSam Leffler 	if (m == NULL)
2098477180fbSGarrett Wollman 		return;
2099477180fbSGarrett Wollman 	ifmam = mtod(m, struct ifma_msghdr *);
210075ae0c01SBruce M Simpson 	KASSERT(ifp != NULL, ("%s: link-layer multicast address w/o ifp\n",
210175ae0c01SBruce M Simpson 	    __func__));
2102477180fbSGarrett Wollman 	ifmam->ifmam_index = ifp->if_index;
2103477180fbSGarrett Wollman 	ifmam->ifmam_addrs = info.rti_addrs;
21043ca1a2d6SMax Laier 	rt_dispatch(m, ifma->ifma_addr ? ifma->ifma_addr->sa_family : AF_UNSPEC);
2105477180fbSGarrett Wollman }
210652041295SPoul-Henning Kamp 
2107b83a279fSSam Leffler static struct mbuf *
2108b83a279fSSam Leffler rt_makeifannouncemsg(struct ifnet *ifp, int type, int what,
2109b83a279fSSam Leffler 	struct rt_addrinfo *info)
2110b83a279fSSam Leffler {
2111b83a279fSSam Leffler 	struct if_announcemsghdr *ifan;
2112b83a279fSSam Leffler 	struct mbuf *m;
2113b83a279fSSam Leffler 
2114c5d4eab6SMarko Zec 	if (V_route_cb.any_count == 0)
2115b83a279fSSam Leffler 		return NULL;
2116b83a279fSSam Leffler 	bzero((caddr_t)info, sizeof(*info));
21176db47af4SAlexander V. Chernikov 	m = rtsock_msg_mbuf(type, info);
2118b83a279fSSam Leffler 	if (m != NULL) {
2119b83a279fSSam Leffler 		ifan = mtod(m, struct if_announcemsghdr *);
2120b83a279fSSam Leffler 		ifan->ifan_index = ifp->if_index;
2121b83a279fSSam Leffler 		strlcpy(ifan->ifan_name, ifp->if_xname,
2122b83a279fSSam Leffler 			sizeof(ifan->ifan_name));
2123b83a279fSSam Leffler 		ifan->ifan_what = what;
2124b83a279fSSam Leffler 	}
2125b83a279fSSam Leffler 	return m;
2126b83a279fSSam Leffler }
2127b83a279fSSam Leffler 
2128b83a279fSSam Leffler /*
2129b83a279fSSam Leffler  * This is called to generate routing socket messages indicating
2130b83a279fSSam Leffler  * IEEE80211 wireless events.
2131b83a279fSSam Leffler  * XXX we piggyback on the RTM_IFANNOUNCE msg format in a clumsy way.
2132b83a279fSSam Leffler  */
2133b83a279fSSam Leffler void
2134b83a279fSSam Leffler rt_ieee80211msg(struct ifnet *ifp, int what, void *data, size_t data_len)
2135b83a279fSSam Leffler {
2136b83a279fSSam Leffler 	struct mbuf *m;
2137b83a279fSSam Leffler 	struct rt_addrinfo info;
2138b83a279fSSam Leffler 
2139b83a279fSSam Leffler 	m = rt_makeifannouncemsg(ifp, RTM_IEEE80211, what, &info);
2140b83a279fSSam Leffler 	if (m != NULL) {
2141b83a279fSSam Leffler 		/*
2142b83a279fSSam Leffler 		 * Append the ieee80211 data.  Try to stick it in the
2143b83a279fSSam Leffler 		 * mbuf containing the ifannounce msg; otherwise allocate
2144b83a279fSSam Leffler 		 * a new mbuf and append.
2145b83a279fSSam Leffler 		 *
2146b83a279fSSam Leffler 		 * NB: we assume m is a single mbuf.
2147b83a279fSSam Leffler 		 */
2148b83a279fSSam Leffler 		if (data_len > M_TRAILINGSPACE(m)) {
2149b83a279fSSam Leffler 			struct mbuf *n = m_get(M_NOWAIT, MT_DATA);
2150b83a279fSSam Leffler 			if (n == NULL) {
2151b83a279fSSam Leffler 				m_freem(m);
2152b83a279fSSam Leffler 				return;
2153b83a279fSSam Leffler 			}
2154b83a279fSSam Leffler 			bcopy(data, mtod(n, void *), data_len);
2155b83a279fSSam Leffler 			n->m_len = data_len;
2156b83a279fSSam Leffler 			m->m_next = n;
2157b83a279fSSam Leffler 		} else if (data_len > 0) {
2158b83a279fSSam Leffler 			bcopy(data, mtod(m, u_int8_t *) + m->m_len, data_len);
2159b83a279fSSam Leffler 			m->m_len += data_len;
2160b83a279fSSam Leffler 		}
2161b83a279fSSam Leffler 		if (m->m_flags & M_PKTHDR)
2162b83a279fSSam Leffler 			m->m_pkthdr.len += data_len;
2163b83a279fSSam Leffler 		mtod(m, struct if_announcemsghdr *)->ifan_msglen += data_len;
21643ca1a2d6SMax Laier 		rt_dispatch(m, AF_UNSPEC);
2165b83a279fSSam Leffler 	}
2166b83a279fSSam Leffler }
2167b83a279fSSam Leffler 
2168df8bae1dSRodney W. Grimes /*
21697b6edd04SRuslan Ermilov  * This is called to generate routing socket messages indicating
21707b6edd04SRuslan Ermilov  * network interface arrival and departure.
21717b6edd04SRuslan Ermilov  */
21727b6edd04SRuslan Ermilov void
2173becc44d7SSam Leffler rt_ifannouncemsg(struct ifnet *ifp, int what)
21747b6edd04SRuslan Ermilov {
21757b6edd04SRuslan Ermilov 	struct mbuf *m;
21767b6edd04SRuslan Ermilov 	struct rt_addrinfo info;
21777b6edd04SRuslan Ermilov 
2178b83a279fSSam Leffler 	m = rt_makeifannouncemsg(ifp, RTM_IFANNOUNCE, what, &info);
2179b83a279fSSam Leffler 	if (m != NULL)
21803ca1a2d6SMax Laier 		rt_dispatch(m, AF_UNSPEC);
2181becc44d7SSam Leffler }
2182becc44d7SSam Leffler 
2183becc44d7SSam Leffler static void
21843ca1a2d6SMax Laier rt_dispatch(struct mbuf *m, sa_family_t saf)
2185becc44d7SSam Leffler {
2186d989c7b3SRobert Watson 	struct m_tag *tag;
2187becc44d7SSam Leffler 
2188d989c7b3SRobert Watson 	/*
2189d989c7b3SRobert Watson 	 * Preserve the family from the sockaddr, if any, in an m_tag for
2190d989c7b3SRobert Watson 	 * use when injecting the mbuf into the routing socket buffer from
2191d989c7b3SRobert Watson 	 * the netisr.
2192d989c7b3SRobert Watson 	 */
21933ca1a2d6SMax Laier 	if (saf != AF_UNSPEC) {
2194d989c7b3SRobert Watson 		tag = m_tag_get(PACKET_TAG_RTSOCKFAM, sizeof(unsigned short),
2195d989c7b3SRobert Watson 		    M_NOWAIT);
2196d989c7b3SRobert Watson 		if (tag == NULL) {
2197d989c7b3SRobert Watson 			m_freem(m);
2198d989c7b3SRobert Watson 			return;
2199d989c7b3SRobert Watson 		}
22003ca1a2d6SMax Laier 		*(unsigned short *)(tag + 1) = saf;
2201d989c7b3SRobert Watson 		m_tag_prepend(m, tag);
2202d989c7b3SRobert Watson 	}
220321ca7b57SMarko Zec 	if (V_loif)
220421ca7b57SMarko Zec 		m->m_pkthdr.rcvif = V_loif;
220521ca7b57SMarko Zec 	else {
220621ca7b57SMarko Zec 		m_freem(m);
220721ca7b57SMarko Zec 		return;
220821ca7b57SMarko Zec 	}
22093161f583SAndre Oppermann 	netisr_queue(NETISR_ROUTE, m);	/* mbuf is free'd on failure. */
22107b6edd04SRuslan Ermilov }
22117b6edd04SRuslan Ermilov 
22127b6edd04SRuslan Ermilov /*
2213758c9d54SAlexander V. Chernikov  * Checks if rte can be exported w.r.t jails/vnets.
2214c83dda36SAlexander V. Chernikov  *
2215758c9d54SAlexander V. Chernikov  * Returns true if it can, false otherwise.
2216c83dda36SAlexander V. Chernikov  */
2217d68fb8d9SAlexander V. Chernikov static bool
2218d68fb8d9SAlexander V. Chernikov can_export_rte(struct ucred *td_ucred, bool rt_is_host,
2219d68fb8d9SAlexander V. Chernikov     const struct sockaddr *rt_dst)
2220c83dda36SAlexander V. Chernikov {
2221c83dda36SAlexander V. Chernikov 
2222d68fb8d9SAlexander V. Chernikov 	if ((!rt_is_host) ? jailed_without_vnet(td_ucred)
2223d68fb8d9SAlexander V. Chernikov 	    : prison_if(td_ucred, rt_dst) != 0)
2224d68fb8d9SAlexander V. Chernikov 		return (false);
2225d68fb8d9SAlexander V. Chernikov 	return (true);
2226c83dda36SAlexander V. Chernikov }
2227c83dda36SAlexander V. Chernikov 
2228d68fb8d9SAlexander V. Chernikov 
2229c83dda36SAlexander V. Chernikov /*
2230df8bae1dSRodney W. Grimes  * This is used in dumping the kernel table via sysctl().
2231df8bae1dSRodney W. Grimes  */
223237c84183SPoul-Henning Kamp static int
2233d68fb8d9SAlexander V. Chernikov sysctl_dumpentry(struct rtentry *rt, void *vw)
2234df8bae1dSRodney W. Grimes {
2235becc44d7SSam Leffler 	struct walkarg *w = vw;
22368c61eb21SAlexander V. Chernikov 	struct nhop_object *nh;
2237df8bae1dSRodney W. Grimes 
2238a68cc388SGleb Smirnoff 	NET_EPOCH_ASSERT();
2239a716ad4aSAndrey V. Elsukov 
2240d68fb8d9SAlexander V. Chernikov 	export_rtaddrs(rt, w->dst, w->mask);
2241d68fb8d9SAlexander V. Chernikov 	if (!can_export_rte(w->w_req->td->td_ucred, rt_is_host(rt), w->dst))
2242813dd6aeSBjoern A. Zeeb 		return (0);
2243d68fb8d9SAlexander V. Chernikov 	nh = rt_get_raw_nhop(rt);
2244fedeb08bSAlexander V. Chernikov #ifdef ROUTE_MPATH
2245fedeb08bSAlexander V. Chernikov 	if (NH_IS_NHGRP(nh)) {
2246fedeb08bSAlexander V. Chernikov 		struct weightened_nhop *wn;
2247fedeb08bSAlexander V. Chernikov 		uint32_t num_nhops;
2248e606e5d1SWarner Losh 		int error;
2249fedeb08bSAlexander V. Chernikov 		wn = nhgrp_get_nhops((struct nhgrp_object *)nh, &num_nhops);
2250fedeb08bSAlexander V. Chernikov 		for (int i = 0; i < num_nhops; i++) {
2251fedeb08bSAlexander V. Chernikov 			error = sysctl_dumpnhop(rt, wn[i].nh, wn[i].weight, w);
2252fedeb08bSAlexander V. Chernikov 			if (error != 0)
2253fedeb08bSAlexander V. Chernikov 				return (error);
2254fedeb08bSAlexander V. Chernikov 		}
2255fedeb08bSAlexander V. Chernikov 	} else
2256fedeb08bSAlexander V. Chernikov #endif
2257e606e5d1SWarner Losh 		sysctl_dumpnhop(rt, nh, rt->rt_weight, w);
22582259a030SAlexander V. Chernikov 
22592259a030SAlexander V. Chernikov 	return (0);
22602259a030SAlexander V. Chernikov }
22612259a030SAlexander V. Chernikov 
22622259a030SAlexander V. Chernikov 
22632259a030SAlexander V. Chernikov static int
22642259a030SAlexander V. Chernikov sysctl_dumpnhop(struct rtentry *rt, struct nhop_object *nh, uint32_t weight,
22652259a030SAlexander V. Chernikov     struct walkarg *w)
22662259a030SAlexander V. Chernikov {
22672259a030SAlexander V. Chernikov 	struct rt_addrinfo info;
22682259a030SAlexander V. Chernikov 	int error = 0, size;
2269d68fb8d9SAlexander V. Chernikov 	uint32_t rtflags;
2270d68fb8d9SAlexander V. Chernikov 
2271d68fb8d9SAlexander V. Chernikov 	rtflags = nhop_get_rtflags(nh);
2272d68fb8d9SAlexander V. Chernikov 
2273d68fb8d9SAlexander V. Chernikov 	if (w->w_op == NET_RT_FLAGS && !(rtflags & w->w_arg))
2274d68fb8d9SAlexander V. Chernikov 		return (0);
22752259a030SAlexander V. Chernikov 
2276df8bae1dSRodney W. Grimes 	bzero((caddr_t)&info, sizeof(info));
2277d68fb8d9SAlexander V. Chernikov 	info.rti_info[RTAX_DST] = w->dst;
227893bfd365SAlexander V. Chernikov 	info.rti_info[RTAX_GATEWAY] = &nh->gw_sa;
2279d68fb8d9SAlexander V. Chernikov 	info.rti_info[RTAX_NETMASK] = (rtflags & RTF_HOST) ? NULL : w->mask;
22806e6b3f7cSQing Li 	info.rti_info[RTAX_GENMASK] = 0;
22818c61eb21SAlexander V. Chernikov 	if (nh->nh_ifp && !(nh->nh_ifp->if_flags & IFF_DYING)) {
22828c61eb21SAlexander V. Chernikov 		info.rti_info[RTAX_IFP] = nh->nh_ifp->if_addr->ifa_addr;
22838c61eb21SAlexander V. Chernikov 		info.rti_info[RTAX_IFA] = nh->nh_ifa->ifa_addr;
22848c61eb21SAlexander V. Chernikov 		if (nh->nh_ifp->if_flags & IFF_POINTOPOINT)
22858c61eb21SAlexander V. Chernikov 			info.rti_info[RTAX_BRD] = nh->nh_ifa->ifa_dstaddr;
228628070a0eSRuslan Ermilov 	}
2287f2e5eb36SAlexander V. Chernikov 	if ((error = rtsock_msg_buffer(RTM_GET, &info, w, &size)) != 0)
2288f2e5eb36SAlexander V. Chernikov 		return (error);
228952041295SPoul-Henning Kamp 	if (w->w_req && w->w_tmem) {
2290becc44d7SSam Leffler 		struct rt_msghdr *rtm = (struct rt_msghdr *)w->w_tmem;
2291df8bae1dSRodney W. Grimes 
2292d25f8522SMark Johnston 		bzero(&rtm->rtm_index,
2293d25f8522SMark Johnston 		    sizeof(*rtm) - offsetof(struct rt_msghdr, rtm_index));
2294d68fb8d9SAlexander V. Chernikov 
2295d68fb8d9SAlexander V. Chernikov 		/*
2296d68fb8d9SAlexander V. Chernikov 		 * rte flags may consist of RTF_HOST (duplicated in nhop rtflags)
2297d68fb8d9SAlexander V. Chernikov 		 * and RTF_UP (if entry is linked, which is always true here).
2298d68fb8d9SAlexander V. Chernikov 		 * Given that, use nhop rtflags & add RTF_UP.
2299d68fb8d9SAlexander V. Chernikov 		 */
2300d68fb8d9SAlexander V. Chernikov 		rtm->rtm_flags = rtflags | RTF_UP;
2301d68fb8d9SAlexander V. Chernikov 		if (rtm->rtm_flags & RTF_GWFLAG_COMPAT)
2302f672f56fSQing Li 			rtm->rtm_flags = RTF_GATEWAY |
2303d68fb8d9SAlexander V. Chernikov 				(rtm->rtm_flags & ~RTF_GWFLAG_COMPAT);
230493bfd365SAlexander V. Chernikov 		rt_getmetrics(rt, nh, &rtm->rtm_rmx);
2305fedeb08bSAlexander V. Chernikov 		rtm->rtm_rmx.rmx_weight = weight;
23068c61eb21SAlexander V. Chernikov 		rtm->rtm_index = nh->nh_ifp->if_index;
2307df8bae1dSRodney W. Grimes 		rtm->rtm_addrs = info.rti_addrs;
230852041295SPoul-Henning Kamp 		error = SYSCTL_OUT(w->w_req, (caddr_t)rtm, size);
230952041295SPoul-Henning Kamp 		return (error);
2310df8bae1dSRodney W. Grimes 	}
2311df8bae1dSRodney W. Grimes 	return (error);
2312df8bae1dSRodney W. Grimes }
2313df8bae1dSRodney W. Grimes 
231437c84183SPoul-Henning Kamp static int
2315ab607f28SRyan Stone sysctl_iflist_ifml(struct ifnet *ifp, const struct if_data *src_ifd,
2316ab607f28SRyan Stone     struct rt_addrinfo *info, struct walkarg *w, int len)
23176d076ae8SBjoern A. Zeeb {
23186d076ae8SBjoern A. Zeeb 	struct if_msghdrl *ifm;
2319b245f96cSGleb Smirnoff 	struct if_data *ifd;
2320b245f96cSGleb Smirnoff 
2321b245f96cSGleb Smirnoff 	ifm = (struct if_msghdrl *)w->w_tmem;
23226d076ae8SBjoern A. Zeeb 
23236d076ae8SBjoern A. Zeeb #ifdef COMPAT_FREEBSD32
23246d076ae8SBjoern A. Zeeb 	if (w->w_req->flags & SCTL_MASK32) {
23256d076ae8SBjoern A. Zeeb 		struct if_msghdrl32 *ifm32;
23266d076ae8SBjoern A. Zeeb 
2327b245f96cSGleb Smirnoff 		ifm32 = (struct if_msghdrl32 *)ifm;
23286d076ae8SBjoern A. Zeeb 		ifm32->ifm_addrs = info->rti_addrs;
23296d076ae8SBjoern A. Zeeb 		ifm32->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
23306d076ae8SBjoern A. Zeeb 		ifm32->ifm_index = ifp->if_index;
23316d076ae8SBjoern A. Zeeb 		ifm32->_ifm_spare1 = 0;
23326d076ae8SBjoern A. Zeeb 		ifm32->ifm_len = sizeof(*ifm32);
23336d076ae8SBjoern A. Zeeb 		ifm32->ifm_data_off = offsetof(struct if_msghdrl32, ifm_data);
2334d25f8522SMark Johnston 		ifm32->_ifm_spare2 = 0;
2335b245f96cSGleb Smirnoff 		ifd = &ifm32->ifm_data;
2336b245f96cSGleb Smirnoff 	} else
23376d076ae8SBjoern A. Zeeb #endif
2338b245f96cSGleb Smirnoff 	{
23396d076ae8SBjoern A. Zeeb 		ifm->ifm_addrs = info->rti_addrs;
23406d076ae8SBjoern A. Zeeb 		ifm->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
23416d076ae8SBjoern A. Zeeb 		ifm->ifm_index = ifp->if_index;
23426d076ae8SBjoern A. Zeeb 		ifm->_ifm_spare1 = 0;
23436d076ae8SBjoern A. Zeeb 		ifm->ifm_len = sizeof(*ifm);
23446d076ae8SBjoern A. Zeeb 		ifm->ifm_data_off = offsetof(struct if_msghdrl, ifm_data);
2345d25f8522SMark Johnston 		ifm->_ifm_spare2 = 0;
2346b245f96cSGleb Smirnoff 		ifd = &ifm->ifm_data;
2347b245f96cSGleb Smirnoff 	}
23486d076ae8SBjoern A. Zeeb 
2349ab607f28SRyan Stone 	memcpy(ifd, src_ifd, sizeof(*ifd));
2350b245f96cSGleb Smirnoff 
23516d076ae8SBjoern A. Zeeb 	return (SYSCTL_OUT(w->w_req, (caddr_t)ifm, len));
23526d076ae8SBjoern A. Zeeb }
23536d076ae8SBjoern A. Zeeb 
23546d076ae8SBjoern A. Zeeb static int
2355ab607f28SRyan Stone sysctl_iflist_ifm(struct ifnet *ifp, const struct if_data *src_ifd,
2356ab607f28SRyan Stone     struct rt_addrinfo *info, struct walkarg *w, int len)
23576d076ae8SBjoern A. Zeeb {
23586d076ae8SBjoern A. Zeeb 	struct if_msghdr *ifm;
2359b245f96cSGleb Smirnoff 	struct if_data *ifd;
2360b245f96cSGleb Smirnoff 
2361b245f96cSGleb Smirnoff 	ifm = (struct if_msghdr *)w->w_tmem;
23626d076ae8SBjoern A. Zeeb 
23636d076ae8SBjoern A. Zeeb #ifdef COMPAT_FREEBSD32
23646d076ae8SBjoern A. Zeeb 	if (w->w_req->flags & SCTL_MASK32) {
23656d076ae8SBjoern A. Zeeb 		struct if_msghdr32 *ifm32;
23666d076ae8SBjoern A. Zeeb 
2367b245f96cSGleb Smirnoff 		ifm32 = (struct if_msghdr32 *)ifm;
23686d076ae8SBjoern A. Zeeb 		ifm32->ifm_addrs = info->rti_addrs;
23696d076ae8SBjoern A. Zeeb 		ifm32->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
23706d076ae8SBjoern A. Zeeb 		ifm32->ifm_index = ifp->if_index;
2371d25f8522SMark Johnston 		ifm32->_ifm_spare1 = 0;
2372b245f96cSGleb Smirnoff 		ifd = &ifm32->ifm_data;
2373b245f96cSGleb Smirnoff 	} else
23746d076ae8SBjoern A. Zeeb #endif
2375b245f96cSGleb Smirnoff 	{
23766d076ae8SBjoern A. Zeeb 		ifm->ifm_addrs = info->rti_addrs;
23776d076ae8SBjoern A. Zeeb 		ifm->ifm_flags = ifp->if_flags | ifp->if_drv_flags;
23786d076ae8SBjoern A. Zeeb 		ifm->ifm_index = ifp->if_index;
2379d25f8522SMark Johnston 		ifm->_ifm_spare1 = 0;
2380b245f96cSGleb Smirnoff 		ifd = &ifm->ifm_data;
2381b245f96cSGleb Smirnoff 	}
23826d076ae8SBjoern A. Zeeb 
2383ab607f28SRyan Stone 	memcpy(ifd, src_ifd, sizeof(*ifd));
23842d70c0deSGleb Smirnoff 
23856d076ae8SBjoern A. Zeeb 	return (SYSCTL_OUT(w->w_req, (caddr_t)ifm, len));
23866d076ae8SBjoern A. Zeeb }
23876d076ae8SBjoern A. Zeeb 
23886d076ae8SBjoern A. Zeeb static int
23896d076ae8SBjoern A. Zeeb sysctl_iflist_ifaml(struct ifaddr *ifa, struct rt_addrinfo *info,
23906d076ae8SBjoern A. Zeeb     struct walkarg *w, int len)
23916d076ae8SBjoern A. Zeeb {
23926d076ae8SBjoern A. Zeeb 	struct ifa_msghdrl *ifam;
2393b245f96cSGleb Smirnoff 	struct if_data *ifd;
2394b245f96cSGleb Smirnoff 
2395b245f96cSGleb Smirnoff 	ifam = (struct ifa_msghdrl *)w->w_tmem;
23966d076ae8SBjoern A. Zeeb 
23976d076ae8SBjoern A. Zeeb #ifdef COMPAT_FREEBSD32
23986d076ae8SBjoern A. Zeeb 	if (w->w_req->flags & SCTL_MASK32) {
23996d076ae8SBjoern A. Zeeb 		struct ifa_msghdrl32 *ifam32;
24006d076ae8SBjoern A. Zeeb 
2401b245f96cSGleb Smirnoff 		ifam32 = (struct ifa_msghdrl32 *)ifam;
24026d076ae8SBjoern A. Zeeb 		ifam32->ifam_addrs = info->rti_addrs;
24036d076ae8SBjoern A. Zeeb 		ifam32->ifam_flags = ifa->ifa_flags;
24046d076ae8SBjoern A. Zeeb 		ifam32->ifam_index = ifa->ifa_ifp->if_index;
24056d076ae8SBjoern A. Zeeb 		ifam32->_ifam_spare1 = 0;
24066d076ae8SBjoern A. Zeeb 		ifam32->ifam_len = sizeof(*ifam32);
24076d076ae8SBjoern A. Zeeb 		ifam32->ifam_data_off =
24086d076ae8SBjoern A. Zeeb 		    offsetof(struct ifa_msghdrl32, ifam_data);
24099753faf5SGleb Smirnoff 		ifam32->ifam_metric = ifa->ifa_ifp->if_metric;
2410b245f96cSGleb Smirnoff 		ifd = &ifam32->ifam_data;
2411b245f96cSGleb Smirnoff 	} else
24126d076ae8SBjoern A. Zeeb #endif
2413b245f96cSGleb Smirnoff 	{
24146d076ae8SBjoern A. Zeeb 		ifam->ifam_addrs = info->rti_addrs;
24156d076ae8SBjoern A. Zeeb 		ifam->ifam_flags = ifa->ifa_flags;
24166d076ae8SBjoern A. Zeeb 		ifam->ifam_index = ifa->ifa_ifp->if_index;
24176d076ae8SBjoern A. Zeeb 		ifam->_ifam_spare1 = 0;
24186d076ae8SBjoern A. Zeeb 		ifam->ifam_len = sizeof(*ifam);
24196d076ae8SBjoern A. Zeeb 		ifam->ifam_data_off = offsetof(struct ifa_msghdrl, ifam_data);
24209753faf5SGleb Smirnoff 		ifam->ifam_metric = ifa->ifa_ifp->if_metric;
2421b245f96cSGleb Smirnoff 		ifd = &ifam->ifam_data;
2422b245f96cSGleb Smirnoff 	}
24236d076ae8SBjoern A. Zeeb 
2424b245f96cSGleb Smirnoff 	bzero(ifd, sizeof(*ifd));
2425b245f96cSGleb Smirnoff 	ifd->ifi_datalen = sizeof(struct if_data);
2426b245f96cSGleb Smirnoff 	ifd->ifi_ipackets = counter_u64_fetch(ifa->ifa_ipackets);
2427b245f96cSGleb Smirnoff 	ifd->ifi_opackets = counter_u64_fetch(ifa->ifa_opackets);
2428b245f96cSGleb Smirnoff 	ifd->ifi_ibytes = counter_u64_fetch(ifa->ifa_ibytes);
2429b245f96cSGleb Smirnoff 	ifd->ifi_obytes = counter_u64_fetch(ifa->ifa_obytes);
24307caf4ab7SGleb Smirnoff 
24316d076ae8SBjoern A. Zeeb 	/* Fixup if_data carp(4) vhid. */
24326d076ae8SBjoern A. Zeeb 	if (carp_get_vhid_p != NULL)
2433b245f96cSGleb Smirnoff 		ifd->ifi_vhid = (*carp_get_vhid_p)(ifa);
24346d076ae8SBjoern A. Zeeb 
24356d076ae8SBjoern A. Zeeb 	return (SYSCTL_OUT(w->w_req, w->w_tmem, len));
24366d076ae8SBjoern A. Zeeb }
24376d076ae8SBjoern A. Zeeb 
24386d076ae8SBjoern A. Zeeb static int
24396d076ae8SBjoern A. Zeeb sysctl_iflist_ifam(struct ifaddr *ifa, struct rt_addrinfo *info,
24406d076ae8SBjoern A. Zeeb     struct walkarg *w, int len)
24416d076ae8SBjoern A. Zeeb {
24426d076ae8SBjoern A. Zeeb 	struct ifa_msghdr *ifam;
24436d076ae8SBjoern A. Zeeb 
24446d076ae8SBjoern A. Zeeb 	ifam = (struct ifa_msghdr *)w->w_tmem;
24456d076ae8SBjoern A. Zeeb 	ifam->ifam_addrs = info->rti_addrs;
24466d076ae8SBjoern A. Zeeb 	ifam->ifam_flags = ifa->ifa_flags;
24476d076ae8SBjoern A. Zeeb 	ifam->ifam_index = ifa->ifa_ifp->if_index;
2448d25f8522SMark Johnston 	ifam->_ifam_spare1 = 0;
24499753faf5SGleb Smirnoff 	ifam->ifam_metric = ifa->ifa_ifp->if_metric;
24506d076ae8SBjoern A. Zeeb 
24516d076ae8SBjoern A. Zeeb 	return (SYSCTL_OUT(w->w_req, w->w_tmem, len));
24526d076ae8SBjoern A. Zeeb }
24536d076ae8SBjoern A. Zeeb 
24546d076ae8SBjoern A. Zeeb static int
2455becc44d7SSam Leffler sysctl_iflist(int af, struct walkarg *w)
2456df8bae1dSRodney W. Grimes {
2457becc44d7SSam Leffler 	struct ifnet *ifp;
2458becc44d7SSam Leffler 	struct ifaddr *ifa;
2459ab607f28SRyan Stone 	struct if_data ifd;
2460df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
2461df8bae1dSRodney W. Grimes 	int len, error = 0;
24623deb3649SAlexander V. Chernikov 	struct sockaddr_storage ss;
2463df8bae1dSRodney W. Grimes 
2464df8bae1dSRodney W. Grimes 	bzero((caddr_t)&info, sizeof(info));
2465ab607f28SRyan Stone 	bzero(&ifd, sizeof(ifd));
24664f6c66ccSMatt Macy 	CK_STAILQ_FOREACH(ifp, &V_ifnet, if_link) {
2467df8bae1dSRodney W. Grimes 		if (w->w_arg && w->w_arg != ifp->if_index)
2468df8bae1dSRodney W. Grimes 			continue;
2469ab607f28SRyan Stone 		if_data_copy(ifp, &ifd);
24704a0d6638SRuslan Ermilov 		ifa = ifp->if_addr;
2471becc44d7SSam Leffler 		info.rti_info[RTAX_IFP] = ifa->ifa_addr;
2472f2e5eb36SAlexander V. Chernikov 		error = rtsock_msg_buffer(RTM_IFINFO, &info, w, &len);
2473f2e5eb36SAlexander V. Chernikov 		if (error != 0)
2474f2e5eb36SAlexander V. Chernikov 			goto done;
24755dfc91d7SLuigi Rizzo 		info.rti_info[RTAX_IFP] = NULL;
247652041295SPoul-Henning Kamp 		if (w->w_req && w->w_tmem) {
24776d076ae8SBjoern A. Zeeb 			if (w->w_op == NET_RT_IFLISTL)
2478ab607f28SRyan Stone 				error = sysctl_iflist_ifml(ifp, &ifd, &info, w,
2479ab607f28SRyan Stone 				    len);
24806d076ae8SBjoern A. Zeeb 			else
2481ab607f28SRyan Stone 				error = sysctl_iflist_ifm(ifp, &ifd, &info, w,
2482ab607f28SRyan Stone 				    len);
2483df440948SPoul-Henning Kamp 			if (error)
2484a35b06c5SJonathan Lemon 				goto done;
2485df8bae1dSRodney W. Grimes 		}
2486d7c5a620SMatt Macy 		while ((ifa = CK_STAILQ_NEXT(ifa, ifa_link)) != NULL) {
2487df8bae1dSRodney W. Grimes 			if (af && af != ifa->ifa_addr->sa_family)
2488df8bae1dSRodney W. Grimes 				continue;
2489b89e82ddSJamie Gritton 			if (prison_if(w->w_req->td->td_ucred,
2490b89e82ddSJamie Gritton 			    ifa->ifa_addr) != 0)
249175c13541SPoul-Henning Kamp 				continue;
2492becc44d7SSam Leffler 			info.rti_info[RTAX_IFA] = ifa->ifa_addr;
24933deb3649SAlexander V. Chernikov 			info.rti_info[RTAX_NETMASK] = rtsock_fix_netmask(
24943deb3649SAlexander V. Chernikov 			    ifa->ifa_addr, ifa->ifa_netmask, &ss);
2495becc44d7SSam Leffler 			info.rti_info[RTAX_BRD] = ifa->ifa_dstaddr;
2496f2e5eb36SAlexander V. Chernikov 			error = rtsock_msg_buffer(RTM_NEWADDR, &info, w, &len);
2497f2e5eb36SAlexander V. Chernikov 			if (error != 0)
2498f2e5eb36SAlexander V. Chernikov 				goto done;
249952041295SPoul-Henning Kamp 			if (w->w_req && w->w_tmem) {
25006d076ae8SBjoern A. Zeeb 				if (w->w_op == NET_RT_IFLISTL)
25016d076ae8SBjoern A. Zeeb 					error = sysctl_iflist_ifaml(ifa, &info,
25026d076ae8SBjoern A. Zeeb 					    w, len);
25036d076ae8SBjoern A. Zeeb 				else
25046d076ae8SBjoern A. Zeeb 					error = sysctl_iflist_ifam(ifa, &info,
25056d076ae8SBjoern A. Zeeb 					    w, len);
2506df440948SPoul-Henning Kamp 				if (error)
2507a35b06c5SJonathan Lemon 					goto done;
2508df8bae1dSRodney W. Grimes 			}
2509df8bae1dSRodney W. Grimes 		}
25103deb3649SAlexander V. Chernikov 		info.rti_info[RTAX_IFA] = NULL;
25113deb3649SAlexander V. Chernikov 		info.rti_info[RTAX_NETMASK] = NULL;
25125dfc91d7SLuigi Rizzo 		info.rti_info[RTAX_BRD] = NULL;
2513df8bae1dSRodney W. Grimes 	}
2514a35b06c5SJonathan Lemon done:
2515a35b06c5SJonathan Lemon 	return (error);
2516df8bae1dSRodney W. Grimes }
2517df8bae1dSRodney W. Grimes 
2518ebda3fc3SBjoern A. Zeeb static int
25199b98ee2cSLuigi Rizzo sysctl_ifmalist(int af, struct walkarg *w)
252005b2efe0SBruce M Simpson {
252105b2efe0SBruce M Simpson 	struct rt_addrinfo info;
25229b98ee2cSLuigi Rizzo 	struct ifaddr *ifa;
252355dfce58SMark Johnston 	struct ifmultiaddr *ifma;
252455dfce58SMark Johnston 	struct ifnet *ifp;
252555dfce58SMark Johnston 	int error, len;
252605b2efe0SBruce M Simpson 
2527b8a6e03fSGleb Smirnoff 	NET_EPOCH_ASSERT();
2528b8a6e03fSGleb Smirnoff 
252955dfce58SMark Johnston 	error = 0;
253005b2efe0SBruce M Simpson 	bzero((caddr_t)&info, sizeof(info));
253155dfce58SMark Johnston 
25324f6c66ccSMatt Macy 	CK_STAILQ_FOREACH(ifp, &V_ifnet, if_link) {
253305b2efe0SBruce M Simpson 		if (w->w_arg && w->w_arg != ifp->if_index)
253405b2efe0SBruce M Simpson 			continue;
25354a0d6638SRuslan Ermilov 		ifa = ifp->if_addr;
2536913af518SLuigi Rizzo 		info.rti_info[RTAX_IFP] = ifa ? ifa->ifa_addr : NULL;
2537d7c5a620SMatt Macy 		CK_STAILQ_FOREACH(ifma, &ifp->if_multiaddrs, ifma_link) {
253805b2efe0SBruce M Simpson 			if (af && af != ifma->ifma_addr->sa_family)
253905b2efe0SBruce M Simpson 				continue;
2540b89e82ddSJamie Gritton 			if (prison_if(w->w_req->td->td_ucred,
2541b89e82ddSJamie Gritton 			    ifma->ifma_addr) != 0)
254205b2efe0SBruce M Simpson 				continue;
254305b2efe0SBruce M Simpson 			info.rti_info[RTAX_IFA] = ifma->ifma_addr;
2544913af518SLuigi Rizzo 			info.rti_info[RTAX_GATEWAY] =
2545913af518SLuigi Rizzo 			    (ifma->ifma_addr->sa_family != AF_LINK) ?
2546913af518SLuigi Rizzo 			    ifma->ifma_lladdr : NULL;
2547c9f98940SAlexander V. Chernikov 			error = rtsock_msg_buffer(RTM_NEWMADDR, &info, w, &len);
2548f2e5eb36SAlexander V. Chernikov 			if (error != 0)
254955dfce58SMark Johnston 				break;
255005b2efe0SBruce M Simpson 			if (w->w_req && w->w_tmem) {
25519b98ee2cSLuigi Rizzo 				struct ifma_msghdr *ifmam;
255205b2efe0SBruce M Simpson 
255305b2efe0SBruce M Simpson 				ifmam = (struct ifma_msghdr *)w->w_tmem;
255405b2efe0SBruce M Simpson 				ifmam->ifmam_index = ifma->ifma_ifp->if_index;
255505b2efe0SBruce M Simpson 				ifmam->ifmam_flags = 0;
255605b2efe0SBruce M Simpson 				ifmam->ifmam_addrs = info.rti_addrs;
2557d25f8522SMark Johnston 				ifmam->_ifmam_spare1 = 0;
255805b2efe0SBruce M Simpson 				error = SYSCTL_OUT(w->w_req, w->w_tmem, len);
255955dfce58SMark Johnston 				if (error != 0)
256055dfce58SMark Johnston 					break;
256105b2efe0SBruce M Simpson 			}
256205b2efe0SBruce M Simpson 		}
256355dfce58SMark Johnston 		if (error != 0)
256455dfce58SMark Johnston 			break;
2565fe0fc7efSChristian S.J. Peron 	}
256605b2efe0SBruce M Simpson 	return (error);
256705b2efe0SBruce M Simpson }
256805b2efe0SBruce M Simpson 
2569d68fb8d9SAlexander V. Chernikov static void
2570d68fb8d9SAlexander V. Chernikov rtable_sysctl_dump(uint32_t fibnum, int family, struct walkarg *w)
2571d68fb8d9SAlexander V. Chernikov {
2572d68fb8d9SAlexander V. Chernikov 	union sockaddr_union sa_dst, sa_mask;
2573d68fb8d9SAlexander V. Chernikov 
2574d68fb8d9SAlexander V. Chernikov 	w->family = family;
2575d68fb8d9SAlexander V. Chernikov 	w->dst = (struct sockaddr *)&sa_dst;
2576d68fb8d9SAlexander V. Chernikov 	w->mask = (struct sockaddr *)&sa_mask;
2577d68fb8d9SAlexander V. Chernikov 
2578d68fb8d9SAlexander V. Chernikov 	init_sockaddrs_family(family, w->dst, w->mask);
2579d68fb8d9SAlexander V. Chernikov 
2580d68fb8d9SAlexander V. Chernikov 	rib_walk(fibnum, family, false, sysctl_dumpentry, w);
2581d68fb8d9SAlexander V. Chernikov }
2582d68fb8d9SAlexander V. Chernikov 
258352041295SPoul-Henning Kamp static int
258482d9ae4eSPoul-Henning Kamp sysctl_rtsock(SYSCTL_HANDLER_ARGS)
2585df8bae1dSRodney W. Grimes {
2586b8a6e03fSGleb Smirnoff 	struct epoch_tracker et;
258752041295SPoul-Henning Kamp 	int	*name = (int *)arg1;
258852041295SPoul-Henning Kamp 	u_int	namelen = arg2;
258961eee0e2SAlexander V. Chernikov 	struct rib_head *rnh = NULL; /* silence compiler. */
2590fe0fc7efSChristian S.J. Peron 	int	i, lim, error = EINVAL;
25914825b1e0SHiroki Sato 	int	fib = 0;
2592df8bae1dSRodney W. Grimes 	u_char	af;
2593df8bae1dSRodney W. Grimes 	struct	walkarg w;
2594df8bae1dSRodney W. Grimes 
25950dcef81dSMark Johnston 	if (namelen < 3)
25960dcef81dSMark Johnston 		return (EINVAL);
25970dcef81dSMark Johnston 
259852041295SPoul-Henning Kamp 	name++;
259952041295SPoul-Henning Kamp 	namelen--;
260052041295SPoul-Henning Kamp 	if (req->newptr)
2601df8bae1dSRodney W. Grimes 		return (EPERM);
2602fedeb08bSAlexander V. Chernikov 	if (name[1] == NET_RT_DUMP || name[1] == NET_RT_NHOP || name[1] == NET_RT_NHGRP) {
26034825b1e0SHiroki Sato 		if (namelen == 3)
26044825b1e0SHiroki Sato 			fib = req->td->td_proc->p_fibnum;
26054825b1e0SHiroki Sato 		else if (namelen == 4)
26067d9b6df1SAlexander V. Chernikov 			fib = (name[3] == RT_ALL_FIBS) ?
26074825b1e0SHiroki Sato 			    req->td->td_proc->p_fibnum : name[3];
26084825b1e0SHiroki Sato 		else
26094825b1e0SHiroki Sato 			return ((namelen < 3) ? EISDIR : ENOTDIR);
26104825b1e0SHiroki Sato 		if (fib < 0 || fib >= rt_numfibs)
26114825b1e0SHiroki Sato 			return (EINVAL);
26124825b1e0SHiroki Sato 	} else if (namelen != 3)
2613f7a54d06SCrist J. Clark 		return ((namelen < 3) ? EISDIR : ENOTDIR);
2614df8bae1dSRodney W. Grimes 	af = name[0];
2615b2aaf46eSJeffrey Hsu 	if (af > AF_MAX)
2616b2aaf46eSJeffrey Hsu 		return (EINVAL);
26176b96f1afSLuigi Rizzo 	bzero(&w, sizeof(w));
2618df8bae1dSRodney W. Grimes 	w.w_op = name[1];
2619df8bae1dSRodney W. Grimes 	w.w_arg = name[2];
262052041295SPoul-Henning Kamp 	w.w_req = req;
2621df8bae1dSRodney W. Grimes 
2622fe0fc7efSChristian S.J. Peron 	error = sysctl_wire_old_buffer(req, 0);
2623fe0fc7efSChristian S.J. Peron 	if (error)
2624fe0fc7efSChristian S.J. Peron 		return (error);
2625f2e5eb36SAlexander V. Chernikov 
2626f2e5eb36SAlexander V. Chernikov 	/*
2627f2e5eb36SAlexander V. Chernikov 	 * Allocate reply buffer in advance.
2628f2e5eb36SAlexander V. Chernikov 	 * All rtsock messages has maximum length of u_short.
2629f2e5eb36SAlexander V. Chernikov 	 */
2630f2e5eb36SAlexander V. Chernikov 	w.w_tmemsize = 65536;
2631f2e5eb36SAlexander V. Chernikov 	w.w_tmem = malloc(w.w_tmemsize, M_TEMP, M_WAITOK);
2632f2e5eb36SAlexander V. Chernikov 
2633b8a6e03fSGleb Smirnoff 	NET_EPOCH_ENTER(et);
2634df8bae1dSRodney W. Grimes 	switch (w.w_op) {
2635df8bae1dSRodney W. Grimes 	case NET_RT_DUMP:
2636df8bae1dSRodney W. Grimes 	case NET_RT_FLAGS:
2637a8b76c8fSLuigi Rizzo 		if (af == 0) {			/* dump all tables */
2638a8b76c8fSLuigi Rizzo 			i = 1;
2639a8b76c8fSLuigi Rizzo 			lim = AF_MAX;
2640a8b76c8fSLuigi Rizzo 		} else				/* dump only one table */
2641a8b76c8fSLuigi Rizzo 			i = lim = af;
26428eca593cSQing Li 
26438eca593cSQing Li 		/*
26448eca593cSQing Li 		 * take care of llinfo entries, the caller must
26458eca593cSQing Li 		 * specify an AF
26468eca593cSQing Li 		 */
264714981d80SQing Li 		if (w.w_op == NET_RT_FLAGS &&
264882b334e8SQing Li 		    (w.w_arg == 0 || w.w_arg & RTF_LLINFO)) {
26498eca593cSQing Li 			if (af != 0)
26508eca593cSQing Li 				error = lltable_sysctl_dumparp(af, w.w_req);
26518eca593cSQing Li 			else
26528eca593cSQing Li 				error = EINVAL;
26538eca593cSQing Li 			break;
26548eca593cSQing Li 		}
26558eca593cSQing Li 		/*
26568eca593cSQing Li 		 * take care of routing entries
26578eca593cSQing Li 		 */
265820b0cdb7SBjoern A. Zeeb 		for (error = 0; error == 0 && i <= lim; i++) {
26594825b1e0SHiroki Sato 			rnh = rt_tables_get_rnh(fib, i);
2660c2c2a7c1SBjoern A. Zeeb 			if (rnh != NULL) {
2661d68fb8d9SAlexander V. Chernikov 				rtable_sysctl_dump(fib, i, &w);
2662a8b76c8fSLuigi Rizzo 			} else if (af != 0)
2663956b0b65SJeffrey Hsu 				error = EAFNOSUPPORT;
266420b0cdb7SBjoern A. Zeeb 		}
2665df8bae1dSRodney W. Grimes 		break;
2666a6663252SAlexander V. Chernikov 	case NET_RT_NHOP:
2667fedeb08bSAlexander V. Chernikov 	case NET_RT_NHGRP:
2668a6663252SAlexander V. Chernikov 		/* Allow dumping one specific af/fib at a time */
2669a6663252SAlexander V. Chernikov 		if (namelen < 4) {
2670a6663252SAlexander V. Chernikov 			error = EINVAL;
2671a6663252SAlexander V. Chernikov 			break;
2672a6663252SAlexander V. Chernikov 		}
2673a6663252SAlexander V. Chernikov 		fib = name[3];
2674a6663252SAlexander V. Chernikov 		if (fib < 0 || fib > rt_numfibs) {
2675a6663252SAlexander V. Chernikov 			error = EINVAL;
2676a6663252SAlexander V. Chernikov 			break;
2677a6663252SAlexander V. Chernikov 		}
2678a6663252SAlexander V. Chernikov 		rnh = rt_tables_get_rnh(fib, af);
2679a6663252SAlexander V. Chernikov 		if (rnh == NULL) {
2680a6663252SAlexander V. Chernikov 			error = EAFNOSUPPORT;
2681a6663252SAlexander V. Chernikov 			break;
2682a6663252SAlexander V. Chernikov 		}
2683a6663252SAlexander V. Chernikov 		if (w.w_op == NET_RT_NHOP)
2684a6663252SAlexander V. Chernikov 			error = nhops_dump_sysctl(rnh, w.w_req);
2685fedeb08bSAlexander V. Chernikov 		else
2686fedeb08bSAlexander V. Chernikov #ifdef ROUTE_MPATH
2687fedeb08bSAlexander V. Chernikov 			error = nhgrp_dump_sysctl(rnh, w.w_req);
2688fedeb08bSAlexander V. Chernikov #else
2689fedeb08bSAlexander V. Chernikov 			error = ENOTSUP;
2690fedeb08bSAlexander V. Chernikov #endif
2691a6663252SAlexander V. Chernikov 		break;
2692df8bae1dSRodney W. Grimes 	case NET_RT_IFLIST:
26936d076ae8SBjoern A. Zeeb 	case NET_RT_IFLISTL:
2694df8bae1dSRodney W. Grimes 		error = sysctl_iflist(af, &w);
269505b2efe0SBruce M Simpson 		break;
269605b2efe0SBruce M Simpson 
269705b2efe0SBruce M Simpson 	case NET_RT_IFMALIST:
269805b2efe0SBruce M Simpson 		error = sysctl_ifmalist(af, &w);
269905b2efe0SBruce M Simpson 		break;
2700df8bae1dSRodney W. Grimes 	}
2701b8a6e03fSGleb Smirnoff 	NET_EPOCH_EXIT(et);
2702f2e5eb36SAlexander V. Chernikov 
2703f2e5eb36SAlexander V. Chernikov 	free(w.w_tmem, M_TEMP);
2704df8bae1dSRodney W. Grimes 	return (error);
2705df8bae1dSRodney W. Grimes }
2706df8bae1dSRodney W. Grimes 
27078a9a28c4SGleb Smirnoff static SYSCTL_NODE(_net, PF_ROUTE, routetable, CTLFLAG_RD | CTLFLAG_MPSAFE,
27088a9a28c4SGleb Smirnoff     sysctl_rtsock, "Return route tables and interface/address lists");
270952041295SPoul-Henning Kamp 
2710df8bae1dSRodney W. Grimes /*
2711df8bae1dSRodney W. Grimes  * Definitions of protocols supported in the ROUTE domain.
2712df8bae1dSRodney W. Grimes  */
2713df8bae1dSRodney W. Grimes 
27145b1c0294SDavid E. O'Brien static struct domain routedomain;		/* or at least forward */
2715df8bae1dSRodney W. Grimes 
271652041295SPoul-Henning Kamp static struct protosw routesw[] = {
2717303989a2SRuslan Ermilov {
2718303989a2SRuslan Ermilov 	.pr_type =		SOCK_RAW,
2719303989a2SRuslan Ermilov 	.pr_domain =		&routedomain,
2720303989a2SRuslan Ermilov 	.pr_flags =		PR_ATOMIC|PR_ADDR,
2721303989a2SRuslan Ermilov 	.pr_output =		route_output,
2722303989a2SRuslan Ermilov 	.pr_ctlinput =		raw_ctlinput,
2723303989a2SRuslan Ermilov 	.pr_usrreqs =		&route_usrreqs
2724df8bae1dSRodney W. Grimes }
2725df8bae1dSRodney W. Grimes };
2726df8bae1dSRodney W. Grimes 
2727303989a2SRuslan Ermilov static struct domain routedomain = {
2728303989a2SRuslan Ermilov 	.dom_family =		PF_ROUTE,
2729303989a2SRuslan Ermilov 	.dom_name =		"route",
2730303989a2SRuslan Ermilov 	.dom_protosw =		routesw,
273102abd400SPedro F. Giffuni 	.dom_protoswNPROTOSW =	&routesw[nitems(routesw)]
2732303989a2SRuslan Ermilov };
273378a82810SGarrett Wollman 
2734644ca084SGleb Smirnoff DOMAIN_SET(route);
2735