xref: /freebsd/sys/net/route.c (revision edc37a66e34396fb480bab54650436095b9ac678)
1c398230bSWarner Losh /*-
251369649SPedro F. Giffuni  * SPDX-License-Identifier: BSD-3-Clause
351369649SPedro F. Giffuni  *
4df8bae1dSRodney W. Grimes  * Copyright (c) 1980, 1986, 1991, 1993
5df8bae1dSRodney W. Grimes  *	The Regents of the University of California.  All rights reserved.
6df8bae1dSRodney W. Grimes  *
7df8bae1dSRodney W. Grimes  * Redistribution and use in source and binary forms, with or without
8df8bae1dSRodney W. Grimes  * modification, are permitted provided that the following conditions
9df8bae1dSRodney W. Grimes  * are met:
10df8bae1dSRodney W. Grimes  * 1. Redistributions of source code must retain the above copyright
11df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer.
12df8bae1dSRodney W. Grimes  * 2. Redistributions in binary form must reproduce the above copyright
13df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer in the
14df8bae1dSRodney W. Grimes  *    documentation and/or other materials provided with the distribution.
15fbbd9655SWarner Losh  * 3. Neither the name of the University nor the names of its contributors
16df8bae1dSRodney W. Grimes  *    may be used to endorse or promote products derived from this software
17df8bae1dSRodney W. Grimes  *    without specific prior written permission.
18df8bae1dSRodney W. Grimes  *
19df8bae1dSRodney W. Grimes  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
20df8bae1dSRodney W. Grimes  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21df8bae1dSRodney W. Grimes  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22df8bae1dSRodney W. Grimes  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
23df8bae1dSRodney W. Grimes  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24df8bae1dSRodney W. Grimes  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25df8bae1dSRodney W. Grimes  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26df8bae1dSRodney W. Grimes  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27df8bae1dSRodney W. Grimes  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28df8bae1dSRodney W. Grimes  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29df8bae1dSRodney W. Grimes  * SUCH DAMAGE.
30df8bae1dSRodney W. Grimes  *
3142e9e16dSRuslan Ermilov  *	@(#)route.c	8.3.1.1 (Berkeley) 2/23/95
32c3aac50fSPeter Wemm  * $FreeBSD$
33df8bae1dSRodney W. Grimes  */
/*
 * Note: in this file a 'fib' is a "forwarding information base", which is
 * the newer name for an in-kernel routing (next hop) table.
 */
38df8bae1dSRodney W. Grimes 
391d5e9e22SEivind Eklund #include "opt_inet.h"
40096f2786SBjoern A. Zeeb #include "opt_inet6.h"
414bd49128SPeter Wemm #include "opt_mrouting.h"
42e440aed9SQing Li #include "opt_mpath.h"
43d6e23cf0SMichael Tuexen #include "opt_route.h"
444bd49128SPeter Wemm 
45df8bae1dSRodney W. Grimes #include <sys/param.h>
46df8bae1dSRodney W. Grimes #include <sys/systm.h>
474d1d4912SBruce Evans #include <sys/malloc.h>
48df8bae1dSRodney W. Grimes #include <sys/mbuf.h>
49df8bae1dSRodney W. Grimes #include <sys/socket.h>
508b07e49aSJulian Elischer #include <sys/sysctl.h>
513120b9d4SKip Macy #include <sys/syslog.h>
528b07e49aSJulian Elischer #include <sys/sysproto.h>
538b07e49aSJulian Elischer #include <sys/proc.h>
54df8bae1dSRodney W. Grimes #include <sys/domain.h>
5569104ebeSMichael Tuexen #include <sys/eventhandler.h>
56cb64988fSLuoqi Chen #include <sys/kernel.h>
5720efcfc6SAndrey V. Elsukov #include <sys/lock.h>
5820efcfc6SAndrey V. Elsukov #include <sys/rmlock.h>
59df8bae1dSRodney W. Grimes 
60df8bae1dSRodney W. Grimes #include <net/if.h>
6176039bc8SGleb Smirnoff #include <net/if_var.h>
626e6b3f7cSQing Li #include <net/if_dl.h>
63df8bae1dSRodney W. Grimes #include <net/route.h>
64da187ddbSAlexander V. Chernikov #include <net/route/route_ctl.h>
65e7d8af4fSAlexander V. Chernikov #include <net/route/route_var.h>
66a6663252SAlexander V. Chernikov #include <net/route/nhop.h>
67a6663252SAlexander V. Chernikov #include <net/route/shared.h>
68530c0060SRobert Watson #include <net/vnet.h>
69df8bae1dSRodney W. Grimes 
70e440aed9SQing Li #ifdef RADIX_MPATH
71e440aed9SQing Li #include <net/radix_mpath.h>
72e440aed9SQing Li #endif
73e440aed9SQing Li 
74df8bae1dSRodney W. Grimes #include <netinet/in.h>
75b5e8ce9fSBruce Evans #include <netinet/ip_mroute.h>
76df8bae1dSRodney W. Grimes 
772dc1d581SAndre Oppermann #include <vm/uma.h>
782dc1d581SAndre Oppermann 
/* Upper bound on the number of FIBs. */
#define	RT_MAXFIBS	UINT16_MAX

/*
 * Compile-time FIB count.  The kernel config option ROUTETABLES, when
 * present, is range-checked against (0, RT_MAXFIBS] and becomes
 * RT_NUMFIBS; if RT_NUMFIBS is still undefined afterwards it falls back
 * to a single table.
 */
#if defined(ROUTETABLES)
#if ROUTETABLES <= 0
#error "ROUTETABLES defined too low"
#elif ROUTETABLES > RT_MAXFIBS
#error "ROUTETABLES defined too big"
#endif
#define	RT_NUMFIBS	ROUTETABLES
#endif /* ROUTETABLES */

#if !defined(RT_NUMFIBS)
#define	RT_NUMFIBS	1
#endif
95bfca216eSBjoern A. Zeeb 
964871fc4aSJulian Elischer /* This is read-only.. */
978b07e49aSJulian Elischer u_int rt_numfibs = RT_NUMFIBS;
98af3b2549SHans Petter Selasky SYSCTL_UINT(_net, OID_AUTO, fibs, CTLFLAG_RDTUN, &rt_numfibs, 0, "");
998b07e49aSJulian Elischer 
10066e8505fSJulian Elischer /*
10166e8505fSJulian Elischer  * By default add routes to all fibs for new interfaces.
10266e8505fSJulian Elischer  * Once this is set to 0 then only allocate routes on interface
10366e8505fSJulian Elischer  * changes for the FIB of the caller when adding a new set of addresses
10466e8505fSJulian Elischer  * to an interface.  XXX this is a shotgun aproach to a problem that needs
10566e8505fSJulian Elischer  * a more fine grained solution.. that will come.
106a8498625SBjoern A. Zeeb  * XXX also has the problems getting the FIB from curthread which will not
107a8498625SBjoern A. Zeeb  * always work given the fib can be overridden and prefixes can be added
108a8498625SBjoern A. Zeeb  * from the network stack context.
10966e8505fSJulian Elischer  */
110ee0bd4b9SHiroki Sato VNET_DEFINE(u_int, rt_add_addr_allfibs) = 1;
111ee0bd4b9SHiroki Sato SYSCTL_UINT(_net, OID_AUTO, add_addr_allfibs, CTLFLAG_RWTUN | CTLFLAG_VNET,
112ee0bd4b9SHiroki Sato     &VNET_NAME(rt_add_addr_allfibs), 0, "");
11366e8505fSJulian Elischer 
114a6663252SAlexander V. Chernikov VNET_PCPUSTAT_DEFINE(struct rtstat, rtstat);
115185c3d2bSGleb Smirnoff 
116185c3d2bSGleb Smirnoff VNET_PCPUSTAT_SYSINIT(rtstat);
117185c3d2bSGleb Smirnoff #ifdef VIMAGE
118185c3d2bSGleb Smirnoff VNET_PCPUSTAT_SYSUNINIT(rtstat);
119185c3d2bSGleb Smirnoff #endif
120b58ea5f3SBjoern A. Zeeb 
12161eee0e2SAlexander V. Chernikov VNET_DEFINE(struct rib_head *, rt_tables);
12282cea7e6SBjoern A. Zeeb #define	V_rt_tables	VNET(rt_tables)
12382cea7e6SBjoern A. Zeeb 
124bfe1aba4SMarko Zec 
1254d2c2509SAlexander V. Chernikov VNET_DEFINE(uma_zone_t, rtzone);		/* Routing table UMA zone. */
12682cea7e6SBjoern A. Zeeb #define	V_rtzone	VNET(rtzone)
12782cea7e6SBjoern A. Zeeb 
128d6e23cf0SMichael Tuexen EVENTHANDLER_LIST_DEFINE(rt_addrmsg);
129d6e23cf0SMichael Tuexen 
130539642a2SAlexander V. Chernikov static int rt_ifdelroute(const struct rtentry *rt, const struct nhop_object *,
131539642a2SAlexander V. Chernikov     void *arg);
1322bbab0afSAlexander V. Chernikov static void destroy_rtentry_epoch(epoch_context_t ctx);
1339a1b64d5SAlexander V. Chernikov static int rt_exportinfo(struct rtentry *rt, struct rt_addrinfo *info,
1349a1b64d5SAlexander V. Chernikov     int flags);
135c77462ddSAlexander V. Chernikov 
1368b07e49aSJulian Elischer /*
1378b07e49aSJulian Elischer  * handler for net.my_fibnum
1388b07e49aSJulian Elischer  */
1398b07e49aSJulian Elischer static int
1408b07e49aSJulian Elischer sysctl_my_fibnum(SYSCTL_HANDLER_ARGS)
141df8bae1dSRodney W. Grimes {
1428b07e49aSJulian Elischer         int fibnum;
1438b07e49aSJulian Elischer         int error;
1448b07e49aSJulian Elischer 
1458b07e49aSJulian Elischer         fibnum = curthread->td_proc->p_fibnum;
1468b07e49aSJulian Elischer         error = sysctl_handle_int(oidp, &fibnum, 0, req);
1478b07e49aSJulian Elischer         return (error);
148df8bae1dSRodney W. Grimes }
149df8bae1dSRodney W. Grimes 
1507029da5cSPawel Biernacki SYSCTL_PROC(_net, OID_AUTO, my_fibnum,
1517029da5cSPawel Biernacki     CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_MPSAFE, NULL, 0,
1527029da5cSPawel Biernacki     &sysctl_my_fibnum, "I",
1537029da5cSPawel Biernacki     "default FIB of caller");
1542dc1d581SAndre Oppermann 
15561eee0e2SAlexander V. Chernikov static __inline struct rib_head **
156c2c2a7c1SBjoern A. Zeeb rt_tables_get_rnh_ptr(int table, int fam)
157c2c2a7c1SBjoern A. Zeeb {
15861eee0e2SAlexander V. Chernikov 	struct rib_head **rnh;
159c2c2a7c1SBjoern A. Zeeb 
16034a5582cSAlexander V. Chernikov 	KASSERT(table >= 0 && table < rt_numfibs,
16134a5582cSAlexander V. Chernikov 	    ("%s: table out of bounds (0 <= %d < %d)", __func__, table,
16234a5582cSAlexander V. Chernikov 	     rt_numfibs));
16334a5582cSAlexander V. Chernikov 	KASSERT(fam >= 0 && fam < (AF_MAX + 1),
16434a5582cSAlexander V. Chernikov 	    ("%s: fam out of bounds (0 <= %d < %d)", __func__, fam, AF_MAX+1));
165c2c2a7c1SBjoern A. Zeeb 
166c2c2a7c1SBjoern A. Zeeb 	/* rnh is [fib=0][af=0]. */
16761eee0e2SAlexander V. Chernikov 	rnh = (struct rib_head **)V_rt_tables;
168c2c2a7c1SBjoern A. Zeeb 	/* Get the offset to the requested table and fam. */
169c2c2a7c1SBjoern A. Zeeb 	rnh += table * (AF_MAX+1) + fam;
170c2c2a7c1SBjoern A. Zeeb 
171c2c2a7c1SBjoern A. Zeeb 	return (rnh);
172c2c2a7c1SBjoern A. Zeeb }
173c2c2a7c1SBjoern A. Zeeb 
/*
 * Return the rib_head pointer stored for (table, fam); this is whatever
 * the slot located by rt_tables_get_rnh_ptr() currently holds.
 */
struct rib_head *
rt_tables_get_rnh(int table, int fam)
{
	struct rib_head **slot;

	slot = rt_tables_get_rnh_ptr(table, fam);
	return (*slot);
}
180c2c2a7c1SBjoern A. Zeeb 
1814f321dbdSBjoern A. Zeeb u_int
18284cc0778SGeorge V. Neville-Neil rt_tables_get_gen(int table, int fam)
18384cc0778SGeorge V. Neville-Neil {
18484cc0778SGeorge V. Neville-Neil 	struct rib_head *rnh;
18584cc0778SGeorge V. Neville-Neil 
18684cc0778SGeorge V. Neville-Neil 	rnh = *rt_tables_get_rnh_ptr(table, fam);
1876d768226SGeorge V. Neville-Neil 	KASSERT(rnh != NULL, ("%s: NULL rib_head pointer table %d fam %d",
1886d768226SGeorge V. Neville-Neil 	    __func__, table, fam));
18984cc0778SGeorge V. Neville-Neil 	return (rnh->rnh_gen);
19084cc0778SGeorge V. Neville-Neil }
19184cc0778SGeorge V. Neville-Neil 
19284cc0778SGeorge V. Neville-Neil 
193d0728d71SRobert Watson /*
194d0728d71SRobert Watson  * route initialization must occur before ip6_init2(), which happenas at
195d0728d71SRobert Watson  * SI_ORDER_MIDDLE.
196d0728d71SRobert Watson  */
1972eb5613fSLuigi Rizzo static void
1982eb5613fSLuigi Rizzo route_init(void)
199df8bae1dSRodney W. Grimes {
2008b07e49aSJulian Elischer 
2016f95a5ebSJulian Elischer 	/* whack the tunable ints into  line. */
2028b07e49aSJulian Elischer 	if (rt_numfibs > RT_MAXFIBS)
2038b07e49aSJulian Elischer 		rt_numfibs = RT_MAXFIBS;
2048b07e49aSJulian Elischer 	if (rt_numfibs == 0)
2058b07e49aSJulian Elischer 		rt_numfibs = 1;
206a6663252SAlexander V. Chernikov 	nhops_init();
2071ed81b73SMarko Zec }
208891cf3edSEd Maste SYSINIT(route_init, SI_SUB_PROTO_DOMAIN, SI_ORDER_THIRD, route_init, NULL);
2091ed81b73SMarko Zec 
/*
 * Init callback handed to uma_zcreate() for the rtentry zone:
 * initializes the entry's lock.  Always reports success.
 */
static int
rtentry_zinit(void *mem, int size, int how)
{
	struct rtentry *entry;

	entry = mem;
	RT_LOCK_INIT(entry);

	return (0);
}
219e3a7aa6fSGleb Smirnoff 
/*
 * Fini callback handed to uma_zcreate() for the rtentry zone:
 * destroys the entry's lock.
 */
static void
rtentry_zfini(void *mem, int size)
{
	struct rtentry *entry;

	entry = mem;
	RT_LOCK_DESTROY(entry);
}
227e3a7aa6fSGleb Smirnoff 
228e3a7aa6fSGleb Smirnoff static int
229e3a7aa6fSGleb Smirnoff rtentry_ctor(void *mem, int size, void *arg, int how)
230e3a7aa6fSGleb Smirnoff {
231e3a7aa6fSGleb Smirnoff 	struct rtentry *rt = mem;
232e3a7aa6fSGleb Smirnoff 
233e3a7aa6fSGleb Smirnoff 	bzero(rt, offsetof(struct rtentry, rt_endzero));
234e8b0643eSAlexander V. Chernikov 	rt->rt_chain = NULL;
235e3a7aa6fSGleb Smirnoff 
236e3a7aa6fSGleb Smirnoff 	return (0);
237e3a7aa6fSGleb Smirnoff }
238e3a7aa6fSGleb Smirnoff 
/*
 * Destructor callback for the rtentry zone.
 * NOTE(review): RT_UNLOCK_COND presumably drops the entry lock only when
 * it is held -- confirm against the macro definition.
 */
static void
rtentry_dtor(void *mem, int size, void *arg)
{
	struct rtentry *entry;

	entry = mem;
	RT_UNLOCK_COND(entry);
}
246256ea2abSGleb Smirnoff 
247256ea2abSGleb Smirnoff static void
248d0728d71SRobert Watson vnet_route_init(const void *unused __unused)
2491ed81b73SMarko Zec {
2501ed81b73SMarko Zec 	struct domain *dom;
25161eee0e2SAlexander V. Chernikov 	struct rib_head **rnh;
252c2c2a7c1SBjoern A. Zeeb 	int table;
2531ed81b73SMarko Zec 	int fam;
2541ed81b73SMarko Zec 
255c2c2a7c1SBjoern A. Zeeb 	V_rt_tables = malloc(rt_numfibs * (AF_MAX+1) *
25661eee0e2SAlexander V. Chernikov 	    sizeof(struct rib_head *), M_RTABLE, M_WAITOK|M_ZERO);
257c2c2a7c1SBjoern A. Zeeb 
258e3a7aa6fSGleb Smirnoff 	V_rtzone = uma_zcreate("rtentry", sizeof(struct rtentry),
259256ea2abSGleb Smirnoff 	    rtentry_ctor, rtentry_dtor,
260e3a7aa6fSGleb Smirnoff 	    rtentry_zinit, rtentry_zfini, UMA_ALIGN_PTR, 0);
2618b07e49aSJulian Elischer 	for (dom = domains; dom; dom = dom->dom_next) {
262b680a383SBjoern A. Zeeb 		if (dom->dom_rtattach == NULL)
263b680a383SBjoern A. Zeeb 			continue;
264b680a383SBjoern A. Zeeb 
2658b07e49aSJulian Elischer 		for  (table = 0; table < rt_numfibs; table++) {
266b680a383SBjoern A. Zeeb 			fam = dom->dom_family;
267b680a383SBjoern A. Zeeb 			if (table != 0 && fam != AF_INET6 && fam != AF_INET)
268b680a383SBjoern A. Zeeb 				break;
269b680a383SBjoern A. Zeeb 
270c2c2a7c1SBjoern A. Zeeb 			rnh = rt_tables_get_rnh_ptr(table, fam);
271c2c2a7c1SBjoern A. Zeeb 			if (rnh == NULL)
272c2c2a7c1SBjoern A. Zeeb 				panic("%s: rnh NULL", __func__);
273ead85fe4SAlexander V. Chernikov 			dom->dom_rtattach((void **)rnh, 0, table);
2748b07e49aSJulian Elischer 		}
2758b07e49aSJulian Elischer 	}
2768b07e49aSJulian Elischer }
277d0728d71SRobert Watson VNET_SYSINIT(vnet_route_init, SI_SUB_PROTO_DOMAIN, SI_ORDER_FOURTH,
278d0728d71SRobert Watson     vnet_route_init, 0);
2798b07e49aSJulian Elischer 
#ifdef VIMAGE
/*
 * Per-VNET routing teardown: detach every table through the owning
 * domain's dom_rtdetach, wait for pending epoch callbacks, then release
 * the table array and the rtentry zone.
 */
static void
vnet_route_uninit(const void *unused __unused)
{
	struct rib_head **slot;
	struct domain *dp;
	int af;
	int fib;

	for (dp = domains; dp != NULL; dp = dp->dom_next) {
		if (dp->dom_rtdetach == NULL)
			continue;

		af = dp->dom_family;
		for (fib = 0; fib < rt_numfibs; fib++) {
			/* Only INET and INET6 have tables beyond FIB 0. */
			if (fib != 0 && !(af == AF_INET6 || af == AF_INET))
				break;

			slot = rt_tables_get_rnh_ptr(fib, af);
			if (slot == NULL)
				panic("%s: rnh NULL", __func__);
			dp->dom_rtdetach((void **)slot, 0);
		}
	}

	/*
	 * dom_rtdetach calls rt_table_destroy(), which schedules deletion
	 * for all rtentries, nexthops and control structures.  Wait for
	 * the destruction callbacks to fire.
	 * Note that this should result in freeing all rtentries, but
	 * nexthop deletions will be scheduled for the next epoch run and
	 * will be completed after vnet teardown.
	 */
	epoch_drain_callbacks(net_epoch_preempt);

	free(V_rt_tables, M_RTABLE);
	uma_zdestroy(V_rtzone);
}
VNET_SYSUNINIT(vnet_route_uninit, SI_SUB_PROTO_DOMAIN, SI_ORDER_FIRST,
    vnet_route_uninit, 0);
#endif
322bc29160dSMarko Zec 
32361eee0e2SAlexander V. Chernikov struct rib_head *
324ead85fe4SAlexander V. Chernikov rt_table_init(int offset, int family, u_int fibnum)
32561eee0e2SAlexander V. Chernikov {
32661eee0e2SAlexander V. Chernikov 	struct rib_head *rh;
32761eee0e2SAlexander V. Chernikov 
32861eee0e2SAlexander V. Chernikov 	rh = malloc(sizeof(struct rib_head), M_RTABLE, M_WAITOK | M_ZERO);
32961eee0e2SAlexander V. Chernikov 
33061eee0e2SAlexander V. Chernikov 	/* TODO: These details should be hidded inside radix.c */
33161eee0e2SAlexander V. Chernikov 	/* Init masks tree */
33261eee0e2SAlexander V. Chernikov 	rn_inithead_internal(&rh->head, rh->rnh_nodes, offset);
33361eee0e2SAlexander V. Chernikov 	rn_inithead_internal(&rh->rmhead.head, rh->rmhead.mask_nodes, 0);
33461eee0e2SAlexander V. Chernikov 	rh->head.rnh_masks = &rh->rmhead;
33561eee0e2SAlexander V. Chernikov 
336ead85fe4SAlexander V. Chernikov 	/* Save metadata associated with this routing table. */
337ead85fe4SAlexander V. Chernikov 	rh->rib_family = family;
338ead85fe4SAlexander V. Chernikov 	rh->rib_fibnum = fibnum;
339ead85fe4SAlexander V. Chernikov #ifdef VIMAGE
340ead85fe4SAlexander V. Chernikov 	rh->rib_vnet = curvnet;
341ead85fe4SAlexander V. Chernikov #endif
342ead85fe4SAlexander V. Chernikov 
34334a5582cSAlexander V. Chernikov 	tmproutes_init(rh);
34434a5582cSAlexander V. Chernikov 
34561eee0e2SAlexander V. Chernikov 	/* Init locks */
346abe95d87SAndrey V. Elsukov 	RIB_LOCK_INIT(rh);
34761eee0e2SAlexander V. Chernikov 
348a6663252SAlexander V. Chernikov 	nhops_init_rib(rh);
349a6663252SAlexander V. Chernikov 
350da187ddbSAlexander V. Chernikov 	/* Init subscription system */
351*edc37a66SAlexander V. Chernikov 	rib_init_subscriptions(rh);
352da187ddbSAlexander V. Chernikov 
35361eee0e2SAlexander V. Chernikov 	/* Finally, set base callbacks */
35461eee0e2SAlexander V. Chernikov 	rh->rnh_addaddr = rn_addroute;
35561eee0e2SAlexander V. Chernikov 	rh->rnh_deladdr = rn_delete;
35661eee0e2SAlexander V. Chernikov 	rh->rnh_matchaddr = rn_match;
35761eee0e2SAlexander V. Chernikov 	rh->rnh_lookup = rn_lookup;
35861eee0e2SAlexander V. Chernikov 	rh->rnh_walktree = rn_walktree;
35961eee0e2SAlexander V. Chernikov 	rh->rnh_walktree_from = rn_walktree_from;
36061eee0e2SAlexander V. Chernikov 
36161eee0e2SAlexander V. Chernikov 	return (rh);
36261eee0e2SAlexander V. Chernikov }
36361eee0e2SAlexander V. Chernikov 
364a5243af2SBjoern A. Zeeb static int
365a5243af2SBjoern A. Zeeb rt_freeentry(struct radix_node *rn, void *arg)
366a5243af2SBjoern A. Zeeb {
367a5243af2SBjoern A. Zeeb 	struct radix_head * const rnh = arg;
368a5243af2SBjoern A. Zeeb 	struct radix_node *x;
369a5243af2SBjoern A. Zeeb 
370a5243af2SBjoern A. Zeeb 	x = (struct radix_node *)rn_delete(rn + 2, NULL, rnh);
371a5243af2SBjoern A. Zeeb 	if (x != NULL)
372a5243af2SBjoern A. Zeeb 		R_Free(x);
373a5243af2SBjoern A. Zeeb 	return (0);
374a5243af2SBjoern A. Zeeb }
375a5243af2SBjoern A. Zeeb 
37661eee0e2SAlexander V. Chernikov void
37761eee0e2SAlexander V. Chernikov rt_table_destroy(struct rib_head *rh)
37861eee0e2SAlexander V. Chernikov {
37961eee0e2SAlexander V. Chernikov 
38034a5582cSAlexander V. Chernikov 	tmproutes_destroy(rh);
38134a5582cSAlexander V. Chernikov 
382a5243af2SBjoern A. Zeeb 	rn_walktree(&rh->rmhead.head, rt_freeentry, &rh->rmhead.head);
383a5243af2SBjoern A. Zeeb 
384a6663252SAlexander V. Chernikov 	nhops_destroy_rib(rh);
385a6663252SAlexander V. Chernikov 
386*edc37a66SAlexander V. Chernikov 	rib_destroy_subscriptions(rh);
387*edc37a66SAlexander V. Chernikov 
38861eee0e2SAlexander V. Chernikov 	/* Assume table is already empty */
389abe95d87SAndrey V. Elsukov 	RIB_LOCK_DESTROY(rh);
39061eee0e2SAlexander V. Chernikov 	free(rh, M_RTABLE);
39161eee0e2SAlexander V. Chernikov }
39261eee0e2SAlexander V. Chernikov 
39361eee0e2SAlexander V. Chernikov 
3948b07e49aSJulian Elischer #ifndef _SYS_SYSPROTO_H_
3958b07e49aSJulian Elischer struct setfib_args {
3968b07e49aSJulian Elischer 	int     fibnum;
3978b07e49aSJulian Elischer };
3988b07e49aSJulian Elischer #endif
3998b07e49aSJulian Elischer int
4008451d0ddSKip Macy sys_setfib(struct thread *td, struct setfib_args *uap)
4018b07e49aSJulian Elischer {
4028b07e49aSJulian Elischer 	if (uap->fibnum < 0 || uap->fibnum >= rt_numfibs)
4038b07e49aSJulian Elischer 		return EINVAL;
4048b07e49aSJulian Elischer 	td->td_proc->p_fibnum = uap->fibnum;
4058b07e49aSJulian Elischer 	return (0);
406df8bae1dSRodney W. Grimes }
407df8bae1dSRodney W. Grimes 
408df8bae1dSRodney W. Grimes /*
409499676dfSJulian Elischer  * Remove a reference count from an rtentry.
410499676dfSJulian Elischer  * If the count gets low enough, take it out of the routing table
411499676dfSJulian Elischer  */
412df8bae1dSRodney W. Grimes void
413d1dd20beSSam Leffler rtfree(struct rtentry *rt)
414df8bae1dSRodney W. Grimes {
415df8bae1dSRodney W. Grimes 
416a0c0e34bSGleb Smirnoff 	KASSERT(rt != NULL,("%s: NULL rt", __func__));
417499676dfSJulian Elischer 
418d1dd20beSSam Leffler 	RT_LOCK_ASSERT(rt);
419d1dd20beSSam Leffler 
420cb86ca48SAlexander V. Chernikov 	RT_UNLOCK(rt);
4212bbab0afSAlexander V. Chernikov 	epoch_call(net_epoch_preempt, destroy_rtentry_epoch,
4222bbab0afSAlexander V. Chernikov 	    &rt->rt_epoch_ctx);
423df8bae1dSRodney W. Grimes }
424df8bae1dSRodney W. Grimes 
4252bbab0afSAlexander V. Chernikov static void
4262bbab0afSAlexander V. Chernikov destroy_rtentry(struct rtentry *rt)
427dd4776f0SAlexander V. Chernikov {
428dd4776f0SAlexander V. Chernikov 
4292bbab0afSAlexander V. Chernikov 	/*
4302bbab0afSAlexander V. Chernikov 	 * At this moment rnh, nh_control may be already freed.
4312bbab0afSAlexander V. Chernikov 	 * nhop interface may have been migrated to a different vnet.
4322bbab0afSAlexander V. Chernikov 	 * Use vnet stored in the nexthop to delete the entry.
4332bbab0afSAlexander V. Chernikov 	 */
4342bbab0afSAlexander V. Chernikov 	CURVNET_SET(nhop_get_vnet(rt->rt_nhop));
4352bbab0afSAlexander V. Chernikov 
4362bbab0afSAlexander V. Chernikov 	/* Unreference nexthop */
4372bbab0afSAlexander V. Chernikov 	nhop_free(rt->rt_nhop);
4382bbab0afSAlexander V. Chernikov 
4392bbab0afSAlexander V. Chernikov 	uma_zfree(V_rtzone, rt);
4402bbab0afSAlexander V. Chernikov 
4412bbab0afSAlexander V. Chernikov 	CURVNET_RESTORE();
4422bbab0afSAlexander V. Chernikov }
4432bbab0afSAlexander V. Chernikov 
4442bbab0afSAlexander V. Chernikov /*
4452bbab0afSAlexander V. Chernikov  * Epoch callback indicating rtentry is safe to destroy
4462bbab0afSAlexander V. Chernikov  */
4472bbab0afSAlexander V. Chernikov static void
4482bbab0afSAlexander V. Chernikov destroy_rtentry_epoch(epoch_context_t ctx)
4492bbab0afSAlexander V. Chernikov {
4502bbab0afSAlexander V. Chernikov 	struct rtentry *rt;
4512bbab0afSAlexander V. Chernikov 
4522bbab0afSAlexander V. Chernikov 	rt = __containerof(ctx, struct rtentry, rt_epoch_ctx);
4532bbab0afSAlexander V. Chernikov 
4542bbab0afSAlexander V. Chernikov 	destroy_rtentry(rt);
455dd4776f0SAlexander V. Chernikov }
456dd4776f0SAlexander V. Chernikov 
457dd4776f0SAlexander V. Chernikov /*
45834a5582cSAlexander V. Chernikov  * Adds a temporal redirect entry to the routing table.
45934a5582cSAlexander V. Chernikov  * @fibnum: fib number
46034a5582cSAlexander V. Chernikov  * @dst: destination to install redirect to
46134a5582cSAlexander V. Chernikov  * @gateway: gateway to go via
46234a5582cSAlexander V. Chernikov  * @author: sockaddr of originating router, can be NULL
46334a5582cSAlexander V. Chernikov  * @ifp: interface to use for the redirected route
46434a5582cSAlexander V. Chernikov  * @flags: set of flags to add. Allowed: RTF_GATEWAY
46534a5582cSAlexander V. Chernikov  * @lifetime_sec: time in seconds to expire this redirect.
46634a5582cSAlexander V. Chernikov  *
46734a5582cSAlexander V. Chernikov  * Retuns 0 on success, errno otherwise.
468df8bae1dSRodney W. Grimes  */
46934a5582cSAlexander V. Chernikov int
47034a5582cSAlexander V. Chernikov rib_add_redirect(u_int fibnum, struct sockaddr *dst, struct sockaddr *gateway,
47134a5582cSAlexander V. Chernikov     struct sockaddr *author, struct ifnet *ifp, int flags, int lifetime_sec)
4728b07e49aSJulian Elischer {
473f2b2e77aSAlexander V. Chernikov 	struct rtentry *rt;
47434a5582cSAlexander V. Chernikov 	int error;
475df8bae1dSRodney W. Grimes 	struct rt_addrinfo info;
47634a5582cSAlexander V. Chernikov 	struct rt_metrics rti_rmx;
477df8bae1dSRodney W. Grimes 	struct ifaddr *ifa;
478c2c2a7c1SBjoern A. Zeeb 
479b8a6e03fSGleb Smirnoff 	NET_EPOCH_ASSERT();
480b8a6e03fSGleb Smirnoff 
48134a5582cSAlexander V. Chernikov 	if (rt_tables_get_rnh(fibnum, dst->sa_family) == NULL)
48234a5582cSAlexander V. Chernikov 		return (EAFNOSUPPORT);
4838e7e854cSKip Macy 
48434a5582cSAlexander V. Chernikov 	/* Verify the allowed flag mask. */
48534a5582cSAlexander V. Chernikov 	KASSERT(((flags & ~(RTF_GATEWAY)) == 0),
48634a5582cSAlexander V. Chernikov 	    ("invalid redirect flags: %x", flags));
48734a5582cSAlexander V. Chernikov 
48834a5582cSAlexander V. Chernikov 	/* Get the best ifa for the given interface and gateway. */
48934a5582cSAlexander V. Chernikov 	if ((ifa = ifaof_ifpforaddr(gateway, ifp)) == NULL)
49034a5582cSAlexander V. Chernikov 		return (ENETUNREACH);
49134a5582cSAlexander V. Chernikov 	ifa_ref(ifa);
49234a5582cSAlexander V. Chernikov 
49334a5582cSAlexander V. Chernikov 	bzero(&info, sizeof(info));
4948071913dSRuslan Ermilov 	info.rti_info[RTAX_DST] = dst;
4958071913dSRuslan Ermilov 	info.rti_info[RTAX_GATEWAY] = gateway;
4968071913dSRuslan Ermilov 	info.rti_ifa = ifa;
49734a5582cSAlexander V. Chernikov 	info.rti_ifp = ifp;
498ea277332SAlexander V. Chernikov 	info.rti_flags = flags | RTF_HOST | RTF_DYNAMIC;
49934a5582cSAlexander V. Chernikov 
50034a5582cSAlexander V. Chernikov 	/* Setup route metrics to define expire time. */
50134a5582cSAlexander V. Chernikov 	bzero(&rti_rmx, sizeof(rti_rmx));
50234a5582cSAlexander V. Chernikov 	/* Set expire time as absolute. */
50334a5582cSAlexander V. Chernikov 	rti_rmx.rmx_expire = lifetime_sec + time_second;
50434a5582cSAlexander V. Chernikov 	info.rti_mflags |= RTV_EXPIRE;
50534a5582cSAlexander V. Chernikov 	info.rti_rmx = &rti_rmx;
50634a5582cSAlexander V. Chernikov 
5078b07e49aSJulian Elischer 	error = rtrequest1_fib(RTM_ADD, &info, &rt, fibnum);
50834a5582cSAlexander V. Chernikov 	ifa_free(ifa);
50934a5582cSAlexander V. Chernikov 
51034a5582cSAlexander V. Chernikov 	if (error != 0) {
51134a5582cSAlexander V. Chernikov 		/* TODO: add per-fib redirect stats. */
51234a5582cSAlexander V. Chernikov 		return (error);
51334a5582cSAlexander V. Chernikov 	}
51434a5582cSAlexander V. Chernikov 
5154de5d90cSSam Leffler 	RT_LOCK(rt);
5168071913dSRuslan Ermilov 	flags = rt->rt_flags;
5172bbab0afSAlexander V. Chernikov 	RT_UNLOCK(rt);
51834a5582cSAlexander V. Chernikov 
51934a5582cSAlexander V. Chernikov 	RTSTAT_INC(rts_dynamic);
52034a5582cSAlexander V. Chernikov 
52134a5582cSAlexander V. Chernikov 	/* Send notification of a route addition to userland. */
52234a5582cSAlexander V. Chernikov 	bzero(&info, sizeof(info));
523df8bae1dSRodney W. Grimes 	info.rti_info[RTAX_DST] = dst;
524df8bae1dSRodney W. Grimes 	info.rti_info[RTAX_GATEWAY] = gateway;
52534a5582cSAlexander V. Chernikov 	info.rti_info[RTAX_AUTHOR] = author;
526528737fdSBjoern A. Zeeb 	rt_missmsg_fib(RTM_REDIRECT, &info, flags, error, fibnum);
52734a5582cSAlexander V. Chernikov 
52834a5582cSAlexander V. Chernikov 	return (0);
529df8bae1dSRodney W. Grimes }
530df8bae1dSRodney W. Grimes 
531df8bae1dSRodney W. Grimes /*
532df8bae1dSRodney W. Grimes  * Routing table ioctl interface.
533df8bae1dSRodney W. Grimes  */
534df8bae1dSRodney W. Grimes int
5358b07e49aSJulian Elischer rtioctl_fib(u_long req, caddr_t data, u_int fibnum)
536df8bae1dSRodney W. Grimes {
5375090559bSChristian S.J. Peron 
5385090559bSChristian S.J. Peron 	/*
5395090559bSChristian S.J. Peron 	 * If more ioctl commands are added here, make sure the proper
5405090559bSChristian S.J. Peron 	 * super-user checks are being performed because it is possible for
5415090559bSChristian S.J. Peron 	 * prison-root to make it this far if raw sockets have been enabled
5425090559bSChristian S.J. Peron 	 * in jails.
5435090559bSChristian S.J. Peron 	 */
544623ae52eSPoul-Henning Kamp #ifdef INET
545f0068c4aSGarrett Wollman 	/* Multicast goop, grrr... */
5468b07e49aSJulian Elischer 	return mrt_ioctl ? mrt_ioctl(req, data, fibnum) : EOPNOTSUPP;
547623ae52eSPoul-Henning Kamp #else /* INET */
548623ae52eSPoul-Henning Kamp 	return ENXIO;
549623ae52eSPoul-Henning Kamp #endif /* INET */
550df8bae1dSRodney W. Grimes }
551df8bae1dSRodney W. Grimes 
552df8bae1dSRodney W. Grimes struct ifaddr *
5534d2c2509SAlexander V. Chernikov ifa_ifwithroute(int flags, const struct sockaddr *dst,
5544d2c2509SAlexander V. Chernikov     const struct sockaddr *gateway, u_int fibnum)
5558b07e49aSJulian Elischer {
556f59c6cb0SAlexander V. Chernikov 	struct ifaddr *ifa;
557d1dd20beSSam Leffler 
55897168be8SGleb Smirnoff 	NET_EPOCH_ASSERT();
559df8bae1dSRodney W. Grimes 	if ((flags & RTF_GATEWAY) == 0) {
560df8bae1dSRodney W. Grimes 		/*
561df8bae1dSRodney W. Grimes 		 * If we are adding a route to an interface,
562df8bae1dSRodney W. Grimes 		 * and the interface is a pt to pt link
563df8bae1dSRodney W. Grimes 		 * we should search for the destination
564df8bae1dSRodney W. Grimes 		 * as our clue to the interface.  Otherwise
565df8bae1dSRodney W. Grimes 		 * we can use the local address.
566df8bae1dSRodney W. Grimes 		 */
56785911824SLuigi Rizzo 		ifa = NULL;
56885911824SLuigi Rizzo 		if (flags & RTF_HOST)
5694f8585e0SAlan Somers 			ifa = ifa_ifwithdstaddr(dst, fibnum);
57085911824SLuigi Rizzo 		if (ifa == NULL)
571df8bae1dSRodney W. Grimes 			ifa = ifa_ifwithaddr(gateway);
572df8bae1dSRodney W. Grimes 	} else {
573df8bae1dSRodney W. Grimes 		/*
574df8bae1dSRodney W. Grimes 		 * If we are adding a route to a remote net
575df8bae1dSRodney W. Grimes 		 * or host, the gateway may still be on the
576df8bae1dSRodney W. Grimes 		 * other end of a pt to pt link.
577df8bae1dSRodney W. Grimes 		 */
5784f8585e0SAlan Somers 		ifa = ifa_ifwithdstaddr(gateway, fibnum);
579df8bae1dSRodney W. Grimes 	}
58085911824SLuigi Rizzo 	if (ifa == NULL)
5814f8585e0SAlan Somers 		ifa = ifa_ifwithnet(gateway, 0, fibnum);
58285911824SLuigi Rizzo 	if (ifa == NULL) {
583682b902dSAlexander V. Chernikov 		struct nhop_object *nh;
584b83aa367SAndrey V. Elsukov 
585682b902dSAlexander V. Chernikov 		nh = rib_lookup(fibnum, gateway, NHR_NONE, 0);
586682b902dSAlexander V. Chernikov 
587e034e82cSQing Li 		/*
588e034e82cSQing Li 		 * dismiss a gateway that is reachable only
589e034e82cSQing Li 		 * through the default router
590e034e82cSQing Li 		 */
591682b902dSAlexander V. Chernikov 		if ((nh == NULL) || (nh->nh_flags & NHF_DEFAULT))
592682b902dSAlexander V. Chernikov 			return (NULL);
593682b902dSAlexander V. Chernikov 		ifa = nh->nh_ifa;
594df8bae1dSRodney W. Grimes 	}
595df8bae1dSRodney W. Grimes 	if (ifa->ifa_addr->sa_family != dst->sa_family) {
596df8bae1dSRodney W. Grimes 		struct ifaddr *oifa = ifa;
597df8bae1dSRodney W. Grimes 		ifa = ifaof_ifpforaddr(dst, ifa->ifa_ifp);
59885911824SLuigi Rizzo 		if (ifa == NULL)
599df8bae1dSRodney W. Grimes 			ifa = oifa;
600df8bae1dSRodney W. Grimes 	}
601682b902dSAlexander V. Chernikov 
602df8bae1dSRodney W. Grimes 	return (ifa);
603df8bae1dSRodney W. Grimes }
604df8bae1dSRodney W. Grimes 
605b0a76b88SJulian Elischer /*
606b0a76b88SJulian Elischer  * Do appropriate manipulations of a routing tree given
607b0a76b88SJulian Elischer  * all the bits of info needed
608b0a76b88SJulian Elischer  */
609df8bae1dSRodney W. Grimes int
6108b07e49aSJulian Elischer rtrequest_fib(int req,
6118b07e49aSJulian Elischer 	struct sockaddr *dst,
6128b07e49aSJulian Elischer 	struct sockaddr *gateway,
6138b07e49aSJulian Elischer 	struct sockaddr *netmask,
6148b07e49aSJulian Elischer 	int flags,
6158b07e49aSJulian Elischer 	struct rtentry **ret_nrt,
6168b07e49aSJulian Elischer 	u_int fibnum)
6178b07e49aSJulian Elischer {
6188071913dSRuslan Ermilov 	struct rt_addrinfo info;
6198071913dSRuslan Ermilov 
620ac4a76ebSBjoern A. Zeeb 	if (dst->sa_len == 0)
621ac4a76ebSBjoern A. Zeeb 		return(EINVAL);
622ac4a76ebSBjoern A. Zeeb 
6238071913dSRuslan Ermilov 	bzero((caddr_t)&info, sizeof(info));
6248071913dSRuslan Ermilov 	info.rti_flags = flags;
6258071913dSRuslan Ermilov 	info.rti_info[RTAX_DST] = dst;
6268071913dSRuslan Ermilov 	info.rti_info[RTAX_GATEWAY] = gateway;
6278071913dSRuslan Ermilov 	info.rti_info[RTAX_NETMASK] = netmask;
6288b07e49aSJulian Elischer 	return rtrequest1_fib(req, &info, ret_nrt, fibnum);
6298071913dSRuslan Ermilov }
6308071913dSRuslan Ermilov 
6314bdf0b6aSAlexander V. Chernikov 
6322caee4beSAlexander V. Chernikov /*
6339a1b64d5SAlexander V. Chernikov  * Copy most of @rt data into @info.
6349a1b64d5SAlexander V. Chernikov  *
6359a1b64d5SAlexander V. Chernikov  * If @flags contains NHR_COPY, copies dst,netmask and gw to the
6369a1b64d5SAlexander V. Chernikov  * pointers specified by @info structure. Assume such pointers
6379a1b64d5SAlexander V. Chernikov  * are zeroed sockaddr-like structures with sa_len field initialized
6389a1b64d5SAlexander V. Chernikov  * to reflect size of the provided buffer. if no NHR_COPY is specified,
6399a1b64d5SAlexander V. Chernikov  * point dst,netmask and gw @info fields to appropriate @rt values.
6409a1b64d5SAlexander V. Chernikov  *
6416b5d8e30SMark Johnston  * if @flags contains NHR_REF, do refcouting on rt_ifp and rt_ifa.
6429a1b64d5SAlexander V. Chernikov  *
6439a1b64d5SAlexander V. Chernikov  * Returns 0 on success.
6449a1b64d5SAlexander V. Chernikov  */
6459a1b64d5SAlexander V. Chernikov int
6469a1b64d5SAlexander V. Chernikov rt_exportinfo(struct rtentry *rt, struct rt_addrinfo *info, int flags)
6479a1b64d5SAlexander V. Chernikov {
6489a1b64d5SAlexander V. Chernikov 	struct rt_metrics *rmx;
6499a1b64d5SAlexander V. Chernikov 	struct sockaddr *src, *dst;
650aaad3c4fSAlexander V. Chernikov 	struct nhop_object *nh;
6519a1b64d5SAlexander V. Chernikov 	int sa_len;
6529a1b64d5SAlexander V. Chernikov 
6539a1b64d5SAlexander V. Chernikov 	if (flags & NHR_COPY) {
6549a1b64d5SAlexander V. Chernikov 		/* Copy destination if dst is non-zero */
6559a1b64d5SAlexander V. Chernikov 		src = rt_key(rt);
6569a1b64d5SAlexander V. Chernikov 		dst = info->rti_info[RTAX_DST];
6579a1b64d5SAlexander V. Chernikov 		sa_len = src->sa_len;
65816703ea8SAlexander V. Chernikov 		if (dst != NULL) {
6599a1b64d5SAlexander V. Chernikov 			if (src->sa_len > dst->sa_len)
6609a1b64d5SAlexander V. Chernikov 				return (ENOMEM);
6619a1b64d5SAlexander V. Chernikov 			memcpy(dst, src, src->sa_len);
6629a1b64d5SAlexander V. Chernikov 			info->rti_addrs |= RTA_DST;
6639a1b64d5SAlexander V. Chernikov 		}
6649a1b64d5SAlexander V. Chernikov 
6659a1b64d5SAlexander V. Chernikov 		/* Copy mask if set && dst is non-zero */
6669a1b64d5SAlexander V. Chernikov 		src = rt_mask(rt);
6679a1b64d5SAlexander V. Chernikov 		dst = info->rti_info[RTAX_NETMASK];
6689a1b64d5SAlexander V. Chernikov 		if (src != NULL && dst != NULL) {
6699a1b64d5SAlexander V. Chernikov 
6709a1b64d5SAlexander V. Chernikov 			/*
6719a1b64d5SAlexander V. Chernikov 			 * Radix stores different value in sa_len,
6729a1b64d5SAlexander V. Chernikov 			 * assume rt_mask() to have the same length
6739a1b64d5SAlexander V. Chernikov 			 * as rt_key()
6749a1b64d5SAlexander V. Chernikov 			 */
6759a1b64d5SAlexander V. Chernikov 			if (sa_len > dst->sa_len)
6769a1b64d5SAlexander V. Chernikov 				return (ENOMEM);
6779a1b64d5SAlexander V. Chernikov 			memcpy(dst, src, src->sa_len);
6789a1b64d5SAlexander V. Chernikov 			info->rti_addrs |= RTA_NETMASK;
6799a1b64d5SAlexander V. Chernikov 		}
6809a1b64d5SAlexander V. Chernikov 
6819a1b64d5SAlexander V. Chernikov 		/* Copy gateway is set && dst is non-zero */
682aaad3c4fSAlexander V. Chernikov 		src = &rt->rt_nhop->gw_sa;
6839a1b64d5SAlexander V. Chernikov 		dst = info->rti_info[RTAX_GATEWAY];
6849a1b64d5SAlexander V. Chernikov 		if ((rt->rt_flags & RTF_GATEWAY) && src != NULL && dst != NULL){
6859a1b64d5SAlexander V. Chernikov 			if (src->sa_len > dst->sa_len)
6869a1b64d5SAlexander V. Chernikov 				return (ENOMEM);
6879a1b64d5SAlexander V. Chernikov 			memcpy(dst, src, src->sa_len);
6889a1b64d5SAlexander V. Chernikov 			info->rti_addrs |= RTA_GATEWAY;
6899a1b64d5SAlexander V. Chernikov 		}
6909a1b64d5SAlexander V. Chernikov 	} else {
6919a1b64d5SAlexander V. Chernikov 		info->rti_info[RTAX_DST] = rt_key(rt);
6929a1b64d5SAlexander V. Chernikov 		info->rti_addrs |= RTA_DST;
6939a1b64d5SAlexander V. Chernikov 		if (rt_mask(rt) != NULL) {
6949a1b64d5SAlexander V. Chernikov 			info->rti_info[RTAX_NETMASK] = rt_mask(rt);
6959a1b64d5SAlexander V. Chernikov 			info->rti_addrs |= RTA_NETMASK;
6969a1b64d5SAlexander V. Chernikov 		}
6979a1b64d5SAlexander V. Chernikov 		if (rt->rt_flags & RTF_GATEWAY) {
698aaad3c4fSAlexander V. Chernikov 			info->rti_info[RTAX_GATEWAY] = &rt->rt_nhop->gw_sa;
6999a1b64d5SAlexander V. Chernikov 			info->rti_addrs |= RTA_GATEWAY;
7009a1b64d5SAlexander V. Chernikov 		}
7019a1b64d5SAlexander V. Chernikov 	}
7029a1b64d5SAlexander V. Chernikov 
703aaad3c4fSAlexander V. Chernikov 	nh = rt->rt_nhop;
7049a1b64d5SAlexander V. Chernikov 	rmx = info->rti_rmx;
7059a1b64d5SAlexander V. Chernikov 	if (rmx != NULL) {
7069a1b64d5SAlexander V. Chernikov 		info->rti_mflags |= RTV_MTU;
707aaad3c4fSAlexander V. Chernikov 		rmx->rmx_mtu = nh->nh_mtu;
7089a1b64d5SAlexander V. Chernikov 	}
7099a1b64d5SAlexander V. Chernikov 
710aaad3c4fSAlexander V. Chernikov 	info->rti_flags = rt->rt_flags | nhop_get_rtflags(nh);
711aaad3c4fSAlexander V. Chernikov 	info->rti_ifp = nh->nh_ifp;
712aaad3c4fSAlexander V. Chernikov 	info->rti_ifa = nh->nh_ifa;
7139a1b64d5SAlexander V. Chernikov 	if (flags & NHR_REF) {
7149a1b64d5SAlexander V. Chernikov 		if_ref(info->rti_ifp);
7156b5d8e30SMark Johnston 		ifa_ref(info->rti_ifa);
7169a1b64d5SAlexander V. Chernikov 	}
7179a1b64d5SAlexander V. Chernikov 
7189a1b64d5SAlexander V. Chernikov 	return (0);
7199a1b64d5SAlexander V. Chernikov }
7209a1b64d5SAlexander V. Chernikov 
7219a1b64d5SAlexander V. Chernikov /*
7229a1b64d5SAlexander V. Chernikov  * Lookups up route entry for @dst in RIB database for fib @fibnum.
7239a1b64d5SAlexander V. Chernikov  * Exports entry data to @info using rt_exportinfo().
7249a1b64d5SAlexander V. Chernikov  *
7256b5d8e30SMark Johnston  * If @flags contains NHR_REF, refcouting is performed on rt_ifp and rt_ifa.
7266b5d8e30SMark Johnston  * All references can be released later by calling rib_free_info().
7279a1b64d5SAlexander V. Chernikov  *
7289a1b64d5SAlexander V. Chernikov  * Returns 0 on success.
7299a1b64d5SAlexander V. Chernikov  * Returns ENOENT for lookup failure, ENOMEM for export failure.
7309a1b64d5SAlexander V. Chernikov  */
7319a1b64d5SAlexander V. Chernikov int
7329a1b64d5SAlexander V. Chernikov rib_lookup_info(uint32_t fibnum, const struct sockaddr *dst, uint32_t flags,
7339a1b64d5SAlexander V. Chernikov     uint32_t flowid, struct rt_addrinfo *info)
7349a1b64d5SAlexander V. Chernikov {
73520efcfc6SAndrey V. Elsukov 	RIB_RLOCK_TRACKER;
73661eee0e2SAlexander V. Chernikov 	struct rib_head *rh;
7379a1b64d5SAlexander V. Chernikov 	struct radix_node *rn;
7389a1b64d5SAlexander V. Chernikov 	struct rtentry *rt;
7399a1b64d5SAlexander V. Chernikov 	int error;
7409a1b64d5SAlexander V. Chernikov 
7419a1b64d5SAlexander V. Chernikov 	KASSERT((fibnum < rt_numfibs), ("rib_lookup_rte: bad fibnum"));
7429a1b64d5SAlexander V. Chernikov 	rh = rt_tables_get_rnh(fibnum, dst->sa_family);
7439a1b64d5SAlexander V. Chernikov 	if (rh == NULL)
7449a1b64d5SAlexander V. Chernikov 		return (ENOENT);
7459a1b64d5SAlexander V. Chernikov 
74661eee0e2SAlexander V. Chernikov 	RIB_RLOCK(rh);
74761eee0e2SAlexander V. Chernikov 	rn = rh->rnh_matchaddr(__DECONST(void *, dst), &rh->head);
7489a1b64d5SAlexander V. Chernikov 	if (rn != NULL && ((rn->rn_flags & RNF_ROOT) == 0)) {
7499a1b64d5SAlexander V. Chernikov 		rt = RNTORT(rn);
7509a1b64d5SAlexander V. Chernikov 		/* Ensure route & ifp is UP */
7518c61eb21SAlexander V. Chernikov 		if (RT_LINK_IS_UP(rt->rt_nhop->nh_ifp)) {
7529a1b64d5SAlexander V. Chernikov 			flags = (flags & NHR_REF) | NHR_COPY;
7539a1b64d5SAlexander V. Chernikov 			error = rt_exportinfo(rt, info, flags);
75461eee0e2SAlexander V. Chernikov 			RIB_RUNLOCK(rh);
7559a1b64d5SAlexander V. Chernikov 
7569a1b64d5SAlexander V. Chernikov 			return (error);
7579a1b64d5SAlexander V. Chernikov 		}
7589a1b64d5SAlexander V. Chernikov 	}
75961eee0e2SAlexander V. Chernikov 	RIB_RUNLOCK(rh);
7609a1b64d5SAlexander V. Chernikov 
7619a1b64d5SAlexander V. Chernikov 	return (ENOENT);
7629a1b64d5SAlexander V. Chernikov }
7639a1b64d5SAlexander V. Chernikov 
7649a1b64d5SAlexander V. Chernikov /*
7659a1b64d5SAlexander V. Chernikov  * Releases all references acquired by rib_lookup_info() when
7669a1b64d5SAlexander V. Chernikov  * called with NHR_REF flags.
7679a1b64d5SAlexander V. Chernikov  */
7689a1b64d5SAlexander V. Chernikov void
7699a1b64d5SAlexander V. Chernikov rib_free_info(struct rt_addrinfo *info)
7709a1b64d5SAlexander V. Chernikov {
7719a1b64d5SAlexander V. Chernikov 
7726b5d8e30SMark Johnston 	ifa_free(info->rti_ifa);
7739a1b64d5SAlexander V. Chernikov 	if_rele(info->rti_ifp);
7749a1b64d5SAlexander V. Chernikov }
7759a1b64d5SAlexander V. Chernikov 
7769a1b64d5SAlexander V. Chernikov /*
7772caee4beSAlexander V. Chernikov  * Iterates over all existing fibs in system calling
7782caee4beSAlexander V. Chernikov  *  @setwa_f function prior to traversing each fib.
7792caee4beSAlexander V. Chernikov  *  Calls @wa_f function for each element in current fib.
7802caee4beSAlexander V. Chernikov  * If af is not AF_UNSPEC, iterates over fibs in particular
7812caee4beSAlexander V. Chernikov  * address family.
7822caee4beSAlexander V. Chernikov  */
7834bdf0b6aSAlexander V. Chernikov void
7842caee4beSAlexander V. Chernikov rt_foreach_fib_walk(int af, rt_setwarg_t *setwa_f, rt_walktree_f_t *wa_f,
7852caee4beSAlexander V. Chernikov     void *arg)
7864bdf0b6aSAlexander V. Chernikov {
78761eee0e2SAlexander V. Chernikov 	struct rib_head *rnh;
7884bdf0b6aSAlexander V. Chernikov 	uint32_t fibnum;
7894bdf0b6aSAlexander V. Chernikov 	int i;
7904bdf0b6aSAlexander V. Chernikov 
7914bdf0b6aSAlexander V. Chernikov 	for (fibnum = 0; fibnum < rt_numfibs; fibnum++) {
7924bdf0b6aSAlexander V. Chernikov 		/* Do we want some specific family? */
7934bdf0b6aSAlexander V. Chernikov 		if (af != AF_UNSPEC) {
7944bdf0b6aSAlexander V. Chernikov 			rnh = rt_tables_get_rnh(fibnum, af);
7954bdf0b6aSAlexander V. Chernikov 			if (rnh == NULL)
7964bdf0b6aSAlexander V. Chernikov 				continue;
7974bdf0b6aSAlexander V. Chernikov 			if (setwa_f != NULL)
798e4790abfSAlexander V. Chernikov 				setwa_f(rnh, fibnum, af, arg);
7994bdf0b6aSAlexander V. Chernikov 
80061eee0e2SAlexander V. Chernikov 			RIB_WLOCK(rnh);
80161eee0e2SAlexander V. Chernikov 			rnh->rnh_walktree(&rnh->head, (walktree_f_t *)wa_f,arg);
80261eee0e2SAlexander V. Chernikov 			RIB_WUNLOCK(rnh);
8034bdf0b6aSAlexander V. Chernikov 			continue;
8044bdf0b6aSAlexander V. Chernikov 		}
8054bdf0b6aSAlexander V. Chernikov 
8064bdf0b6aSAlexander V. Chernikov 		for (i = 1; i <= AF_MAX; i++) {
8074bdf0b6aSAlexander V. Chernikov 			rnh = rt_tables_get_rnh(fibnum, i);
8084bdf0b6aSAlexander V. Chernikov 			if (rnh == NULL)
8094bdf0b6aSAlexander V. Chernikov 				continue;
8104bdf0b6aSAlexander V. Chernikov 			if (setwa_f != NULL)
8114bdf0b6aSAlexander V. Chernikov 				setwa_f(rnh, fibnum, i, arg);
8124bdf0b6aSAlexander V. Chernikov 
81361eee0e2SAlexander V. Chernikov 			RIB_WLOCK(rnh);
81461eee0e2SAlexander V. Chernikov 			rnh->rnh_walktree(&rnh->head, (walktree_f_t *)wa_f,arg);
81561eee0e2SAlexander V. Chernikov 			RIB_WUNLOCK(rnh);
8164bdf0b6aSAlexander V. Chernikov 		}
8174bdf0b6aSAlexander V. Chernikov 	}
8184bdf0b6aSAlexander V. Chernikov }
8194bdf0b6aSAlexander V. Chernikov 
82034a5582cSAlexander V. Chernikov /*
82134a5582cSAlexander V. Chernikov  * Iterates over all existing fibs in system and deletes each element
82234a5582cSAlexander V. Chernikov  *  for which @filter_f function returns non-zero value.
82334a5582cSAlexander V. Chernikov  * If @family is not AF_UNSPEC, iterates over fibs in particular
82434a5582cSAlexander V. Chernikov  * address family.
82534a5582cSAlexander V. Chernikov  */
82634a5582cSAlexander V. Chernikov void
82734a5582cSAlexander V. Chernikov rt_foreach_fib_walk_del(int family, rt_filter_f_t *filter_f, void *arg)
82834a5582cSAlexander V. Chernikov {
82934a5582cSAlexander V. Chernikov 	u_int fibnum;
83034a5582cSAlexander V. Chernikov 	int i, start, end;
83134a5582cSAlexander V. Chernikov 
83234a5582cSAlexander V. Chernikov 	for (fibnum = 0; fibnum < rt_numfibs; fibnum++) {
83334a5582cSAlexander V. Chernikov 		/* Do we want some specific family? */
83434a5582cSAlexander V. Chernikov 		if (family != AF_UNSPEC) {
83534a5582cSAlexander V. Chernikov 			start = family;
83634a5582cSAlexander V. Chernikov 			end = family;
83734a5582cSAlexander V. Chernikov 		} else {
83834a5582cSAlexander V. Chernikov 			start = 1;
83934a5582cSAlexander V. Chernikov 			end = AF_MAX;
84034a5582cSAlexander V. Chernikov 		}
84134a5582cSAlexander V. Chernikov 
84234a5582cSAlexander V. Chernikov 		for (i = start; i <= end; i++) {
84334a5582cSAlexander V. Chernikov 			if (rt_tables_get_rnh(fibnum, i) == NULL)
84434a5582cSAlexander V. Chernikov 				continue;
84534a5582cSAlexander V. Chernikov 
84634a5582cSAlexander V. Chernikov 			rib_walk_del(fibnum, i, filter_f, arg, 0);
847e8b0643eSAlexander V. Chernikov 		}
848e8b0643eSAlexander V. Chernikov 	}
849e8b0643eSAlexander V. Chernikov }
850e8b0643eSAlexander V. Chernikov 
8514bdf0b6aSAlexander V. Chernikov /*
8524bdf0b6aSAlexander V. Chernikov  * Delete Routes for a Network Interface
8534bdf0b6aSAlexander V. Chernikov  *
8544bdf0b6aSAlexander V. Chernikov  * Called for each routing entry via the rnh->rnh_walktree() call above
8554bdf0b6aSAlexander V. Chernikov  * to delete all route entries referencing a detaching network interface.
8564bdf0b6aSAlexander V. Chernikov  *
8574bdf0b6aSAlexander V. Chernikov  * Arguments:
8584bdf0b6aSAlexander V. Chernikov  *	rt	pointer to rtentry
859539642a2SAlexander V. Chernikov  *	nh	pointer to nhop
8604bdf0b6aSAlexander V. Chernikov  *	arg	argument passed to rnh->rnh_walktree() - detaching interface
8614bdf0b6aSAlexander V. Chernikov  *
8624bdf0b6aSAlexander V. Chernikov  * Returns:
8634bdf0b6aSAlexander V. Chernikov  *	0	successful
8644bdf0b6aSAlexander V. Chernikov  *	errno	failed - reason indicated
8654bdf0b6aSAlexander V. Chernikov  */
8664bdf0b6aSAlexander V. Chernikov static int
867539642a2SAlexander V. Chernikov rt_ifdelroute(const struct rtentry *rt, const struct nhop_object *nh, void *arg)
8684bdf0b6aSAlexander V. Chernikov {
8694bdf0b6aSAlexander V. Chernikov 	struct ifnet	*ifp = arg;
8704bdf0b6aSAlexander V. Chernikov 
871539642a2SAlexander V. Chernikov 	if (nh->nh_ifp != ifp)
8724bdf0b6aSAlexander V. Chernikov 		return (0);
8734bdf0b6aSAlexander V. Chernikov 
8744bdf0b6aSAlexander V. Chernikov 	/*
8754bdf0b6aSAlexander V. Chernikov 	 * Protect (sorta) against walktree recursion problems
8764bdf0b6aSAlexander V. Chernikov 	 * with cloned routes
8774bdf0b6aSAlexander V. Chernikov 	 */
8784bdf0b6aSAlexander V. Chernikov 	if ((rt->rt_flags & RTF_UP) == 0)
8794bdf0b6aSAlexander V. Chernikov 		return (0);
8804bdf0b6aSAlexander V. Chernikov 
881e8b0643eSAlexander V. Chernikov 	return (1);
8824bdf0b6aSAlexander V. Chernikov }
8834bdf0b6aSAlexander V. Chernikov 
8844bdf0b6aSAlexander V. Chernikov /*
8854bdf0b6aSAlexander V. Chernikov  * Delete all remaining routes using this interface
8864bdf0b6aSAlexander V. Chernikov  * Unfortuneatly the only way to do this is to slog through
8874bdf0b6aSAlexander V. Chernikov  * the entire routing table looking for routes which point
8884bdf0b6aSAlexander V. Chernikov  * to this interface...oh well...
8894bdf0b6aSAlexander V. Chernikov  */
8904bdf0b6aSAlexander V. Chernikov void
89180ae8d60SBjoern A. Zeeb rt_flushifroutes_af(struct ifnet *ifp, int af)
89280ae8d60SBjoern A. Zeeb {
89380ae8d60SBjoern A. Zeeb 	KASSERT((af >= 1 && af <= AF_MAX), ("%s: af %d not >= 1 and <= %d",
89480ae8d60SBjoern A. Zeeb 	    __func__, af, AF_MAX));
89580ae8d60SBjoern A. Zeeb 
89680ae8d60SBjoern A. Zeeb 	rt_foreach_fib_walk_del(af, rt_ifdelroute, ifp);
89780ae8d60SBjoern A. Zeeb }
89880ae8d60SBjoern A. Zeeb 
89980ae8d60SBjoern A. Zeeb void
9004bdf0b6aSAlexander V. Chernikov rt_flushifroutes(struct ifnet *ifp)
9014bdf0b6aSAlexander V. Chernikov {
9024bdf0b6aSAlexander V. Chernikov 
903e8b0643eSAlexander V. Chernikov 	rt_foreach_fib_walk_del(AF_UNSPEC, rt_ifdelroute, ifp);
9044bdf0b6aSAlexander V. Chernikov }
9054bdf0b6aSAlexander V. Chernikov 
9068071913dSRuslan Ermilov /*
9078c0fec80SRobert Watson  * Look up rt_addrinfo for a specific fib.  Note that if rti_ifa is defined,
9088c0fec80SRobert Watson  * it will be referenced so the caller must free it.
9092ad7ed6eSAlexander V. Chernikov  *
9102ad7ed6eSAlexander V. Chernikov  * Assume basic consistency checks are executed by callers:
9112ad7ed6eSAlexander V. Chernikov  * RTAX_DST exists, if RTF_GATEWAY is set, RTAX_GATEWAY exists as well.
9128c0fec80SRobert Watson  */
9138b07e49aSJulian Elischer int
9148b07e49aSJulian Elischer rt_getifa_fib(struct rt_addrinfo *info, u_int fibnum)
9158b07e49aSJulian Elischer {
9164d2c2509SAlexander V. Chernikov 	const struct sockaddr *dst, *gateway, *ifpaddr, *ifaaddr;
917a68cc388SGleb Smirnoff 	struct epoch_tracker et;
9184d2c2509SAlexander V. Chernikov 	int needref, error, flags;
9194d2c2509SAlexander V. Chernikov 
9204d2c2509SAlexander V. Chernikov 	dst = info->rti_info[RTAX_DST];
9214d2c2509SAlexander V. Chernikov 	gateway = info->rti_info[RTAX_GATEWAY];
9224d2c2509SAlexander V. Chernikov 	ifpaddr = info->rti_info[RTAX_IFP];
9234d2c2509SAlexander V. Chernikov 	ifaaddr = info->rti_info[RTAX_IFA];
9244d2c2509SAlexander V. Chernikov 	flags = info->rti_flags;
9258071913dSRuslan Ermilov 
9268071913dSRuslan Ermilov 	/*
9278071913dSRuslan Ermilov 	 * ifp may be specified by sockaddr_dl
9288071913dSRuslan Ermilov 	 * when protocol address is ambiguous.
9298071913dSRuslan Ermilov 	 */
9301ebec5faSMatt Macy 	error = 0;
9311ebec5faSMatt Macy 	needref = (info->rti_ifa == NULL);
932a68cc388SGleb Smirnoff 	NET_EPOCH_ENTER(et);
9332ad7ed6eSAlexander V. Chernikov 
9342ad7ed6eSAlexander V. Chernikov 	/* If we have interface specified by the ifindex in the address, use it */
9358071913dSRuslan Ermilov 	if (info->rti_ifp == NULL && ifpaddr != NULL &&
9362ad7ed6eSAlexander V. Chernikov 	    ifpaddr->sa_family == AF_LINK) {
9372ad7ed6eSAlexander V. Chernikov 	    const struct sockaddr_dl *sdl = (const struct sockaddr_dl *)ifpaddr;
9382ad7ed6eSAlexander V. Chernikov 	    if (sdl->sdl_index != 0)
939270b83b9SHans Petter Selasky 		    info->rti_ifp = ifnet_byindex(sdl->sdl_index);
9408c0fec80SRobert Watson 	}
9412ad7ed6eSAlexander V. Chernikov 	/*
9422ad7ed6eSAlexander V. Chernikov 	 * If we have source address specified, try to find it
9432ad7ed6eSAlexander V. Chernikov 	 * TODO: avoid enumerating all ifas on all interfaces.
9442ad7ed6eSAlexander V. Chernikov 	 */
9458071913dSRuslan Ermilov 	if (info->rti_ifa == NULL && ifaaddr != NULL)
9468071913dSRuslan Ermilov 		info->rti_ifa = ifa_ifwithaddr(ifaaddr);
9478071913dSRuslan Ermilov 	if (info->rti_ifa == NULL) {
9484d2c2509SAlexander V. Chernikov 		const struct sockaddr *sa;
9498071913dSRuslan Ermilov 
9502ad7ed6eSAlexander V. Chernikov 		/*
9512ad7ed6eSAlexander V. Chernikov 		 * Most common use case for the userland-supplied routes.
9522ad7ed6eSAlexander V. Chernikov 		 *
9532ad7ed6eSAlexander V. Chernikov 		 * Choose sockaddr to select ifa.
9542ad7ed6eSAlexander V. Chernikov 		 * -- if ifp is set --
9552ad7ed6eSAlexander V. Chernikov 		 * Order of preference:
9562ad7ed6eSAlexander V. Chernikov 		 * 1) IFA address
9572ad7ed6eSAlexander V. Chernikov 		 * 2) gateway address
9582ad7ed6eSAlexander V. Chernikov 		 *   Note: for interface routes link-level gateway address
9592ad7ed6eSAlexander V. Chernikov 		 *     is specified to indicate the interface index without
9602ad7ed6eSAlexander V. Chernikov 		 *     specifying RTF_GATEWAY. In this case, ignore gateway
9612ad7ed6eSAlexander V. Chernikov 		 *   Note: gateway AF may be different from dst AF. In this case,
9622ad7ed6eSAlexander V. Chernikov 		 *   ignore gateway
9632ad7ed6eSAlexander V. Chernikov 		 * 3) final destination.
9642ad7ed6eSAlexander V. Chernikov 		 * 4) if all of these fails, try to get at least link-level ifa.
9652ad7ed6eSAlexander V. Chernikov 		 * -- else --
9662ad7ed6eSAlexander V. Chernikov 		 * try to lookup gateway or dst in the routing table to get ifa
9672ad7ed6eSAlexander V. Chernikov 		 */
9682ad7ed6eSAlexander V. Chernikov 		if (info->rti_info[RTAX_IFA] != NULL)
9692ad7ed6eSAlexander V. Chernikov 			sa = info->rti_info[RTAX_IFA];
9702ad7ed6eSAlexander V. Chernikov 		else if ((info->rti_flags & RTF_GATEWAY) != 0 &&
9712ad7ed6eSAlexander V. Chernikov 		    gateway->sa_family == dst->sa_family)
9722ad7ed6eSAlexander V. Chernikov 			sa = gateway;
9732ad7ed6eSAlexander V. Chernikov 		else
9742ad7ed6eSAlexander V. Chernikov 			sa = dst;
9752ad7ed6eSAlexander V. Chernikov 		if (info->rti_ifp != NULL) {
9768071913dSRuslan Ermilov 			info->rti_ifa = ifaof_ifpforaddr(sa, info->rti_ifp);
9772ad7ed6eSAlexander V. Chernikov 			/* Case 4 */
9782ad7ed6eSAlexander V. Chernikov 			if (info->rti_ifa == NULL && gateway != NULL)
9792ad7ed6eSAlexander V. Chernikov 				info->rti_ifa = ifaof_ifpforaddr(gateway, info->rti_ifp);
9802ad7ed6eSAlexander V. Chernikov 		} else if (dst != NULL && gateway != NULL)
9814f8585e0SAlan Somers 			info->rti_ifa = ifa_ifwithroute(flags, dst, gateway,
9828b07e49aSJulian Elischer 							fibnum);
9838071913dSRuslan Ermilov 		else if (sa != NULL)
9844f8585e0SAlan Somers 			info->rti_ifa = ifa_ifwithroute(flags, sa, sa,
9858b07e49aSJulian Elischer 							fibnum);
9868071913dSRuslan Ermilov 	}
9871ebec5faSMatt Macy 	if (needref && info->rti_ifa != NULL) {
9888071913dSRuslan Ermilov 		if (info->rti_ifp == NULL)
989134804c8SMatt Macy 			info->rti_ifp = info->rti_ifa->ifa_ifp;
9904f6c66ccSMatt Macy 		ifa_ref(info->rti_ifa);
9918071913dSRuslan Ermilov 	} else
9928071913dSRuslan Ermilov 		error = ENETUNREACH;
993a68cc388SGleb Smirnoff 	NET_EPOCH_EXIT(et);
9948071913dSRuslan Ermilov 	return (error);
9958071913dSRuslan Ermilov }
9968071913dSRuslan Ermilov 
9977f948f12SAlexander V. Chernikov void
9987f948f12SAlexander V. Chernikov rt_updatemtu(struct ifnet *ifp)
9997f948f12SAlexander V. Chernikov {
100061eee0e2SAlexander V. Chernikov 	struct rib_head *rnh;
10019e022295SAlexander V. Chernikov 	int mtu;
10027f948f12SAlexander V. Chernikov 	int i, j;
10037f948f12SAlexander V. Chernikov 
10047f948f12SAlexander V. Chernikov 	/*
10057f948f12SAlexander V. Chernikov 	 * Try to update rt_mtu for all routes using this interface
10067f948f12SAlexander V. Chernikov 	 * Unfortunately the only way to do this is to traverse all
10077f948f12SAlexander V. Chernikov 	 * routing tables in all fibs/domains.
10087f948f12SAlexander V. Chernikov 	 */
10097f948f12SAlexander V. Chernikov 	for (i = 1; i <= AF_MAX; i++) {
10109e022295SAlexander V. Chernikov 		mtu = if_getmtu_family(ifp, i);
10117f948f12SAlexander V. Chernikov 		for (j = 0; j < rt_numfibs; j++) {
10127f948f12SAlexander V. Chernikov 			rnh = rt_tables_get_rnh(j, i);
10137f948f12SAlexander V. Chernikov 			if (rnh == NULL)
10147f948f12SAlexander V. Chernikov 				continue;
10159e022295SAlexander V. Chernikov 			nhops_update_ifmtu(rnh, ifp, mtu);
10167f948f12SAlexander V. Chernikov 		}
10177f948f12SAlexander V. Chernikov 	}
10187f948f12SAlexander V. Chernikov }
10197f948f12SAlexander V. Chernikov 
10207f948f12SAlexander V. Chernikov 
10215a2f4cbdSAlexander V. Chernikov #if 0
10225a2f4cbdSAlexander V. Chernikov int p_sockaddr(char *buf, int buflen, struct sockaddr *s);
10235a2f4cbdSAlexander V. Chernikov int rt_print(char *buf, int buflen, struct rtentry *rt);
10245a2f4cbdSAlexander V. Chernikov 
/*
 * Formats the AF_INET or AF_INET6 address stored in @s into @buf
 * (of size @buflen) using inet_ntop().
 *
 * Returns the length of the resulting string, or 0 if the address
 * family is not handled or the conversion fails.
 */
int
p_sockaddr(char *buf, int buflen, struct sockaddr *s)
{
	void *paddr;

	if (s->sa_family == AF_INET)
		paddr = &((struct sockaddr_in *)s)->sin_addr;
	else if (s->sa_family == AF_INET6)
		paddr = &((struct sockaddr_in6 *)s)->sin6_addr;
	else
		return (0);

	if (inet_ntop(s->sa_family, paddr, buf, buflen) == NULL)
		return (0);

	return (strlen(buf));
}
10475a2f4cbdSAlexander V. Chernikov 
10485a2f4cbdSAlexander V. Chernikov int
10495a2f4cbdSAlexander V. Chernikov rt_print(char *buf, int buflen, struct rtentry *rt)
10505a2f4cbdSAlexander V. Chernikov {
10515a2f4cbdSAlexander V. Chernikov 	struct sockaddr *addr, *mask;
10525a2f4cbdSAlexander V. Chernikov 	int i = 0;
10535a2f4cbdSAlexander V. Chernikov 
10545a2f4cbdSAlexander V. Chernikov 	addr = rt_key(rt);
10555a2f4cbdSAlexander V. Chernikov 	mask = rt_mask(rt);
10565a2f4cbdSAlexander V. Chernikov 
10575a2f4cbdSAlexander V. Chernikov 	i = p_sockaddr(buf, buflen, addr);
10585a2f4cbdSAlexander V. Chernikov 	if (!(rt->rt_flags & RTF_HOST)) {
10595a2f4cbdSAlexander V. Chernikov 		buf[i++] = '/';
10605a2f4cbdSAlexander V. Chernikov 		i += p_sockaddr(buf + i, buflen - i, mask);
10615a2f4cbdSAlexander V. Chernikov 	}
10625a2f4cbdSAlexander V. Chernikov 
10635a2f4cbdSAlexander V. Chernikov 	if (rt->rt_flags & RTF_GATEWAY) {
10645a2f4cbdSAlexander V. Chernikov 		buf[i++] = '>';
1065aaad3c4fSAlexander V. Chernikov 		i += p_sockaddr(buf + i, buflen - i, &rt->rt_nhop->gw_sa);
10665a2f4cbdSAlexander V. Chernikov 	}
10675a2f4cbdSAlexander V. Chernikov 
10685a2f4cbdSAlexander V. Chernikov 	return (i);
10695a2f4cbdSAlexander V. Chernikov }
10705a2f4cbdSAlexander V. Chernikov #endif
10715a2f4cbdSAlexander V. Chernikov 
1072427ac07fSKip Macy #ifdef RADIX_MPATH
1073e8b0643eSAlexander V. Chernikov /*
1074e8b0643eSAlexander V. Chernikov  * Deletes key for single-path routes, unlinks rtentry with
1075e8b0643eSAlexander V. Chernikov  * gateway specified in @info from multi-path routes.
1076e8b0643eSAlexander V. Chernikov  *
1077e8b0643eSAlexander V. Chernikov  * Returnes unlinked entry. In case of failure, returns NULL
1078e8b0643eSAlexander V. Chernikov  * and sets @perror to ESRCH.
1079e8b0643eSAlexander V. Chernikov  */
10804d2c2509SAlexander V. Chernikov struct radix_node *
108161eee0e2SAlexander V. Chernikov rt_mpath_unlink(struct rib_head *rnh, struct rt_addrinfo *info,
1082e8b0643eSAlexander V. Chernikov     struct rtentry *rto, int *perror)
1083427ac07fSKip Macy {
1084427ac07fSKip Macy 	/*
1085427ac07fSKip Macy 	 * if we got multipath routes, we require users to specify
1086427ac07fSKip Macy 	 * a matching RTAX_GATEWAY.
1087427ac07fSKip Macy 	 */
1088e8b0643eSAlexander V. Chernikov 	struct rtentry *rt; // *rto = NULL;
1089f59c6cb0SAlexander V. Chernikov 	struct radix_node *rn;
1090e8b0643eSAlexander V. Chernikov 	struct sockaddr *gw;
1091427ac07fSKip Macy 
1092e8b0643eSAlexander V. Chernikov 	gw = info->rti_info[RTAX_GATEWAY];
1093e8b0643eSAlexander V. Chernikov 	rt = rt_mpath_matchgate(rto, gw);
1094e8b0643eSAlexander V. Chernikov 	if (rt == NULL) {
1095e8b0643eSAlexander V. Chernikov 		*perror = ESRCH;
1096e8b0643eSAlexander V. Chernikov 		return (NULL);
1097e8b0643eSAlexander V. Chernikov 	}
10985a2f4cbdSAlexander V. Chernikov 
1099427ac07fSKip Macy 	/*
1100427ac07fSKip Macy 	 * this is the first entry in the chain
1101427ac07fSKip Macy 	 */
1102427ac07fSKip Macy 	if (rto == rt) {
1103427ac07fSKip Macy 		rn = rn_mpath_next((struct radix_node *)rt);
1104427ac07fSKip Macy 		/*
1105427ac07fSKip Macy 		 * there is another entry, now it's active
1106427ac07fSKip Macy 		 */
1107427ac07fSKip Macy 		if (rn) {
1108427ac07fSKip Macy 			rto = RNTORT(rn);
1109427ac07fSKip Macy 			RT_LOCK(rto);
1110427ac07fSKip Macy 			rto->rt_flags |= RTF_UP;
1111427ac07fSKip Macy 			RT_UNLOCK(rto);
1112427ac07fSKip Macy 		} else if (rt->rt_flags & RTF_GATEWAY) {
1113427ac07fSKip Macy 			/*
1114427ac07fSKip Macy 			 * For gateway routes, we need to
1115427ac07fSKip Macy 			 * make sure that we we are deleting
1116427ac07fSKip Macy 			 * the correct gateway.
1117427ac07fSKip Macy 			 * rt_mpath_matchgate() does not
1118427ac07fSKip Macy 			 * check the case when there is only
1119427ac07fSKip Macy 			 * one route in the chain.
1120427ac07fSKip Macy 			 */
1121e8b0643eSAlexander V. Chernikov 			if (gw &&
1122aaad3c4fSAlexander V. Chernikov 			    (rt->rt_nhop->gw_sa.sa_len != gw->sa_len ||
1123aaad3c4fSAlexander V. Chernikov 				memcmp(&rt->rt_nhop->gw_sa, gw, gw->sa_len))) {
1124e8b0643eSAlexander V. Chernikov 				*perror = ESRCH;
1125e8b0643eSAlexander V. Chernikov 				return (NULL);
1126e8b0643eSAlexander V. Chernikov 			}
11276a7bff2cSKip Macy 		}
11286a7bff2cSKip Macy 
1129427ac07fSKip Macy 		/*
1130427ac07fSKip Macy 		 * use the normal delete code to remove
1131427ac07fSKip Macy 		 * the first entry
1132427ac07fSKip Macy 		 */
11334d2c2509SAlexander V. Chernikov 		rn = rnh->rnh_deladdr(info->rti_info[RTAX_DST],
11344d2c2509SAlexander V. Chernikov 					info->rti_info[RTAX_NETMASK],
11354d2c2509SAlexander V. Chernikov 					&rnh->head);
1136e8b0643eSAlexander V. Chernikov 		*perror = 0;
1137e8b0643eSAlexander V. Chernikov 		return (rn);
1138427ac07fSKip Macy 	}
1139427ac07fSKip Macy 
1140427ac07fSKip Macy 	/*
1141427ac07fSKip Macy 	 * if the entry is 2nd and on up
1142427ac07fSKip Macy 	 */
1143e8b0643eSAlexander V. Chernikov 	if (rt_mpath_deldup(rto, rt) == 0)
1144427ac07fSKip Macy 		panic ("rtrequest1: rt_mpath_deldup");
1145e8b0643eSAlexander V. Chernikov 	*perror = 0;
1146e8b0643eSAlexander V. Chernikov 	rn = (struct radix_node *)rt;
1147e8b0643eSAlexander V. Chernikov 	return (rn);
1148427ac07fSKip Macy }
1149427ac07fSKip Macy #endif
1150427ac07fSKip Macy 
11518071913dSRuslan Ermilov int
11528b07e49aSJulian Elischer rtrequest1_fib(int req, struct rt_addrinfo *info, struct rtentry **ret_nrt,
11538b07e49aSJulian Elischer 				u_int fibnum)
11548b07e49aSJulian Elischer {
1155aef2d5fbSAlexander V. Chernikov 	const struct sockaddr *dst;
115661eee0e2SAlexander V. Chernikov 	struct rib_head *rnh;
1157da187ddbSAlexander V. Chernikov 	struct rib_cmd_info rc;
1158aef2d5fbSAlexander V. Chernikov 	int error;
1159df8bae1dSRodney W. Grimes 
11608b07e49aSJulian Elischer 	KASSERT((fibnum < rt_numfibs), ("rtrequest1_fib: bad fibnum"));
1161aef2d5fbSAlexander V. Chernikov 	KASSERT((info->rti_flags & RTF_RNH_LOCKED) == 0, ("rtrequest1_fib: locked"));
11622bbab0afSAlexander V. Chernikov 	NET_EPOCH_ASSERT();
1163aef2d5fbSAlexander V. Chernikov 
1164aef2d5fbSAlexander V. Chernikov 	dst = info->rti_info[RTAX_DST];
1165aef2d5fbSAlexander V. Chernikov 
1166b680a383SBjoern A. Zeeb 	switch (dst->sa_family) {
1167b680a383SBjoern A. Zeeb 	case AF_INET6:
1168b680a383SBjoern A. Zeeb 	case AF_INET:
1169b680a383SBjoern A. Zeeb 		/* We support multiple FIBs. */
1170b680a383SBjoern A. Zeeb 		break;
1171b680a383SBjoern A. Zeeb 	default:
1172b680a383SBjoern A. Zeeb 		fibnum = RT_DEFAULT_FIB;
1173b680a383SBjoern A. Zeeb 		break;
1174b680a383SBjoern A. Zeeb 	}
1175b680a383SBjoern A. Zeeb 
1176b0a76b88SJulian Elischer 	/*
1177b0a76b88SJulian Elischer 	 * Find the correct routing tree to use for this Address Family
1178b0a76b88SJulian Elischer 	 */
1179c2c2a7c1SBjoern A. Zeeb 	rnh = rt_tables_get_rnh(fibnum, dst->sa_family);
118085911824SLuigi Rizzo 	if (rnh == NULL)
1181983985c1SJeffrey Hsu 		return (EAFNOSUPPORT);
1182048738b5SAlexander V. Chernikov 
1183b0a76b88SJulian Elischer 	/*
1184b0a76b88SJulian Elischer 	 * If we are adding a host route then we don't want to put
118566953138SRuslan Ermilov 	 * a netmask in the tree, nor do we want to clone it.
1186b0a76b88SJulian Elischer 	 */
1187aef2d5fbSAlexander V. Chernikov 	if (info->rti_flags & RTF_HOST)
1188aef2d5fbSAlexander V. Chernikov 		info->rti_info[RTAX_NETMASK] = NULL;
11896e6b3f7cSQing Li 
1190da187ddbSAlexander V. Chernikov 	bzero(&rc, sizeof(struct rib_cmd_info));
1191aef2d5fbSAlexander V. Chernikov 	error = 0;
1192df8bae1dSRodney W. Grimes 	switch (req) {
1193df8bae1dSRodney W. Grimes 	case RTM_DELETE:
1194da187ddbSAlexander V. Chernikov 		error = del_route(rnh, info, &rc);
1195df8bae1dSRodney W. Grimes 		break;
1196df8bae1dSRodney W. Grimes 	case RTM_RESOLVE:
11976e6b3f7cSQing Li 		/*
11986e6b3f7cSQing Li 		 * resolve was only used for route cloning
11996e6b3f7cSQing Li 		 * here for compat
12006e6b3f7cSQing Li 		 */
12016e6b3f7cSQing Li 		break;
1202df8bae1dSRodney W. Grimes 	case RTM_ADD:
1203da187ddbSAlexander V. Chernikov 		error = add_route(rnh, info, &rc);
1204aef2d5fbSAlexander V. Chernikov 		break;
1205aef2d5fbSAlexander V. Chernikov 	case RTM_CHANGE:
1206da187ddbSAlexander V. Chernikov 		error = change_route(rnh, info, &rc);
1207aef2d5fbSAlexander V. Chernikov 		break;
1208aef2d5fbSAlexander V. Chernikov 	default:
1209aef2d5fbSAlexander V. Chernikov 		error = EOPNOTSUPP;
1210aef2d5fbSAlexander V. Chernikov 	}
1211aef2d5fbSAlexander V. Chernikov 
1212da187ddbSAlexander V. Chernikov 	if (ret_nrt != NULL)
1213da187ddbSAlexander V. Chernikov 		*ret_nrt = rc.rc_rt;
1214da187ddbSAlexander V. Chernikov 
1215aef2d5fbSAlexander V. Chernikov 	return (error);
1216aef2d5fbSAlexander V. Chernikov }
1217aef2d5fbSAlexander V. Chernikov 
12184d2c2509SAlexander V. Chernikov void
12190fb9298dSAlexander V. Chernikov rt_setmetrics(const struct rt_addrinfo *info, struct rtentry *rt)
12200fb9298dSAlexander V. Chernikov {
12210fb9298dSAlexander V. Chernikov 
12220fb9298dSAlexander V. Chernikov 	if (info->rti_mflags & RTV_WEIGHT)
12230fb9298dSAlexander V. Chernikov 		rt->rt_weight = info->rti_rmx->rmx_weight;
12240fb9298dSAlexander V. Chernikov 	/* Kernel -> userland timebase conversion. */
12250fb9298dSAlexander V. Chernikov 	if (info->rti_mflags & RTV_EXPIRE)
12260fb9298dSAlexander V. Chernikov 		rt->rt_expire = info->rti_rmx->rmx_expire ?
12270fb9298dSAlexander V. Chernikov 		    info->rti_rmx->rmx_expire - time_second + time_uptime : 0;
12280fb9298dSAlexander V. Chernikov }
12290fb9298dSAlexander V. Chernikov 
/*
 * Copy sockaddr @src into @dst, AND-ing the payload with @netmask.
 *
 * The first byte of @src and of @netmask is taken as that sockaddr's length.
 * The two leading bytes (sa_len and sa_family) are always copied from @src
 * unmasked.  Bytes from offset 2 up to the shorter of the two lengths are
 * copied as (src & netmask); whatever remains up to the length of @src is
 * zero-filled.  @dst must therefore have room for max(2, src length) bytes.
 */
void
rt_maskedcopy(struct sockaddr *src, struct sockaddr *dst, struct sockaddr *netmask)
{
	unsigned char *from = (unsigned char *)src;
	unsigned char *to = (unsigned char *)dst;
	unsigned char *mask = (unsigned char *)netmask;
	/* Both lengths are sampled before anything is written to dst. */
	unsigned int masklen = mask[0];
	unsigned int total = from[0];
	unsigned int covered = (masklen < total) ? masklen : total;
	unsigned int i;

	/* sa_len and sa_family are never masked. */
	to[0] = from[0];
	to[1] = from[1];

	for (i = 2; i < covered; i++)
		to[i] = from[i] & mask[i];

	/* The mask ran out before the address did: clear the tail. */
	if (i < total)
		bzero(to + i, total - i);
}
1248df8bae1dSRodney W. Grimes 
1249df8bae1dSRodney W. Grimes /*
1250df8bae1dSRodney W. Grimes  * Set up a routing table entry, normally
1251df8bae1dSRodney W. Grimes  * for an interface.
1252df8bae1dSRodney W. Grimes  */
12538b07e49aSJulian Elischer #define _SOCKADDR_TMPSIZE 128 /* Not too big.. kernel stack size is limited */
12548b07e49aSJulian Elischer static inline  int
12558b07e49aSJulian Elischer rtinit1(struct ifaddr *ifa, int cmd, int flags, int fibnum)
1256df8bae1dSRodney W. Grimes {
125720efcfc6SAndrey V. Elsukov 	RIB_RLOCK_TRACKER;
12582bbab0afSAlexander V. Chernikov 	struct epoch_tracker et;
12595aca0b30SLuigi Rizzo 	struct sockaddr *dst;
12608071913dSRuslan Ermilov 	struct sockaddr *netmask;
126185911824SLuigi Rizzo 	struct rtentry *rt = NULL;
12628071913dSRuslan Ermilov 	struct rt_addrinfo info;
1263e440aed9SQing Li 	int error = 0;
12648b07e49aSJulian Elischer 	int startfib, endfib;
12658b07e49aSJulian Elischer 	char tempbuf[_SOCKADDR_TMPSIZE];
12668b07e49aSJulian Elischer 	int didwork = 0;
12678b07e49aSJulian Elischer 	int a_failure = 0;
1268aaad3c4fSAlexander V. Chernikov 	struct sockaddr_dl_short *sdl = NULL;
126961eee0e2SAlexander V. Chernikov 	struct rib_head *rnh;
1270df8bae1dSRodney W. Grimes 
12718071913dSRuslan Ermilov 	if (flags & RTF_HOST) {
12728071913dSRuslan Ermilov 		dst = ifa->ifa_dstaddr;
12738071913dSRuslan Ermilov 		netmask = NULL;
12748071913dSRuslan Ermilov 	} else {
12758071913dSRuslan Ermilov 		dst = ifa->ifa_addr;
12768071913dSRuslan Ermilov 		netmask = ifa->ifa_netmask;
12778071913dSRuslan Ermilov 	}
1278b3dd0771SBjoern A. Zeeb 	if (dst->sa_len == 0)
1279b3dd0771SBjoern A. Zeeb 		return(EINVAL);
1280b680a383SBjoern A. Zeeb 	switch (dst->sa_family) {
1281b680a383SBjoern A. Zeeb 	case AF_INET6:
1282b680a383SBjoern A. Zeeb 	case AF_INET:
1283b680a383SBjoern A. Zeeb 		/* We support multiple FIBs. */
1284b680a383SBjoern A. Zeeb 		break;
1285b680a383SBjoern A. Zeeb 	default:
1286b680a383SBjoern A. Zeeb 		fibnum = RT_DEFAULT_FIB;
1287b680a383SBjoern A. Zeeb 		break;
1288b680a383SBjoern A. Zeeb 	}
12897d9b6df1SAlexander V. Chernikov 	if (fibnum == RT_ALL_FIBS) {
1290ee0bd4b9SHiroki Sato 		if (V_rt_add_addr_allfibs == 0 && cmd == (int)RTM_ADD)
12910489b891SAlan Somers 			startfib = endfib = ifa->ifa_ifp->if_fib;
1292ee0bd4b9SHiroki Sato 		else {
12938b07e49aSJulian Elischer 			startfib = 0;
12948b07e49aSJulian Elischer 			endfib = rt_numfibs - 1;
129566e8505fSJulian Elischer 		}
12968b07e49aSJulian Elischer 	} else {
12978b07e49aSJulian Elischer 		KASSERT((fibnum < rt_numfibs), ("rtinit1: bad fibnum"));
12988b07e49aSJulian Elischer 		startfib = fibnum;
12998b07e49aSJulian Elischer 		endfib = fibnum;
13008b07e49aSJulian Elischer 	}
1301ac4a76ebSBjoern A. Zeeb 
1302b0a76b88SJulian Elischer 	/*
13038b07e49aSJulian Elischer 	 * If it's a delete, check that if it exists,
13048b07e49aSJulian Elischer 	 * it's on the correct interface or we might scrub
13058b07e49aSJulian Elischer 	 * a route to another ifa which would
1306b0a76b88SJulian Elischer 	 * be confusing at best and possibly worse.
1307b0a76b88SJulian Elischer 	 */
1308df8bae1dSRodney W. Grimes 	if (cmd == RTM_DELETE) {
1309b0a76b88SJulian Elischer 		/*
1310b0a76b88SJulian Elischer 		 * It's a delete, so it should already exist..
1311b0a76b88SJulian Elischer 		 * If it's a net, mask off the host bits
1312b0a76b88SJulian Elischer 		 * (Assuming we have a mask)
13138b07e49aSJulian Elischer 		 * XXX this is kinda inet specific..
1314b0a76b88SJulian Elischer 		 */
13158071913dSRuslan Ermilov 		if (netmask != NULL) {
13168b07e49aSJulian Elischer 			rt_maskedcopy(dst, (struct sockaddr *)tempbuf, netmask);
13178b07e49aSJulian Elischer 			dst = (struct sockaddr *)tempbuf;
1318df8bae1dSRodney W. Grimes 		}
1319563ab4e4SAlexander V. Chernikov 	} else if (cmd == RTM_ADD) {
1320aaad3c4fSAlexander V. Chernikov 		sdl = (struct sockaddr_dl_short *)tempbuf;
1321aaad3c4fSAlexander V. Chernikov 		bzero(sdl, sizeof(struct sockaddr_dl_short));
1322563ab4e4SAlexander V. Chernikov 		sdl->sdl_family = AF_LINK;
1323aaad3c4fSAlexander V. Chernikov 		sdl->sdl_len = sizeof(struct sockaddr_dl_short);
1324563ab4e4SAlexander V. Chernikov 		sdl->sdl_type = ifa->ifa_ifp->if_type;
1325563ab4e4SAlexander V. Chernikov 		sdl->sdl_index = ifa->ifa_ifp->if_index;
13268b07e49aSJulian Elischer         }
13278b07e49aSJulian Elischer 	/*
13288b07e49aSJulian Elischer 	 * Now go through all the requested tables (fibs) and do the
13298b07e49aSJulian Elischer 	 * requested action. Realistically, this will either be fib 0
13308b07e49aSJulian Elischer 	 * for protocols that don't do multiple tables or all the
1331a8498625SBjoern A. Zeeb 	 * tables for those that do.
13328b07e49aSJulian Elischer 	 */
13338b07e49aSJulian Elischer 	for ( fibnum = startfib; fibnum <= endfib; fibnum++) {
13348b07e49aSJulian Elischer 		if (cmd == RTM_DELETE) {
13358b07e49aSJulian Elischer 			struct radix_node *rn;
1336b0a76b88SJulian Elischer 			/*
13378071913dSRuslan Ermilov 			 * Look up an rtentry that is in the routing tree and
13388071913dSRuslan Ermilov 			 * contains the correct info.
1339b0a76b88SJulian Elischer 			 */
1340c2c2a7c1SBjoern A. Zeeb 			rnh = rt_tables_get_rnh(fibnum, dst->sa_family);
1341c2c2a7c1SBjoern A. Zeeb 			if (rnh == NULL)
13428b07e49aSJulian Elischer 				/* this table doesn't exist but others might */
13438b07e49aSJulian Elischer 				continue;
134461eee0e2SAlexander V. Chernikov 			RIB_RLOCK(rnh);
134561eee0e2SAlexander V. Chernikov 			rn = rnh->rnh_lookup(dst, netmask, &rnh->head);
1346e440aed9SQing Li #ifdef RADIX_MPATH
134761eee0e2SAlexander V. Chernikov 			if (rt_mpath_capable(rnh)) {
1348e440aed9SQing Li 
1349e440aed9SQing Li 				if (rn == NULL)
1350e440aed9SQing Li 					error = ESRCH;
1351e440aed9SQing Li 				else {
1352e440aed9SQing Li 					rt = RNTORT(rn);
1353e440aed9SQing Li 					/*
13549e022295SAlexander V. Chernikov 					 * for interface route the gateway
13559e022295SAlexander V. Chernikov 					 * gateway is sockaddr_dl, so
13568b07e49aSJulian Elischer 					 * rt_mpath_matchgate must use the
13578b07e49aSJulian Elischer 					 * interface address
1358e440aed9SQing Li 					 */
13598b07e49aSJulian Elischer 					rt = rt_mpath_matchgate(rt,
13608b07e49aSJulian Elischer 					    ifa->ifa_addr);
1361034c09ffSAlexander V. Chernikov 					if (rt == NULL)
1362e440aed9SQing Li 						error = ESRCH;
1363e440aed9SQing Li 				}
1364e440aed9SQing Li 			}
1365e440aed9SQing Li #endif
13668b07e49aSJulian Elischer 			error = (rn == NULL ||
13678071913dSRuslan Ermilov 			    (rn->rn_flags & RNF_ROOT) ||
13688c61eb21SAlexander V. Chernikov 			    RNTORT(rn)->rt_nhop->nh_ifa != ifa);
136961eee0e2SAlexander V. Chernikov 			RIB_RUNLOCK(rnh);
1370956b0b65SJeffrey Hsu 			if (error) {
13718b07e49aSJulian Elischer 				/* this is only an error if bad on ALL tables */
13728b07e49aSJulian Elischer 				continue;
1373df8bae1dSRodney W. Grimes 			}
1374b0a76b88SJulian Elischer 		}
1375b0a76b88SJulian Elischer 		/*
1376b0a76b88SJulian Elischer 		 * Do the actual request
1377b0a76b88SJulian Elischer 		 */
13788071913dSRuslan Ermilov 		bzero((caddr_t)&info, sizeof(info));
13798071913dSRuslan Ermilov 		info.rti_ifa = ifa;
13803034f43fSAlexander V. Chernikov 		info.rti_flags = flags |
13813034f43fSAlexander V. Chernikov 		    (ifa->ifa_flags & ~IFA_RTSELF) | RTF_PINNED;
13828071913dSRuslan Ermilov 		info.rti_info[RTAX_DST] = dst;
13836e6b3f7cSQing Li 		/*
13846e6b3f7cSQing Li 		 * doing this for compatibility reasons
13856e6b3f7cSQing Li 		 */
13866e6b3f7cSQing Li 		if (cmd == RTM_ADD)
1387563ab4e4SAlexander V. Chernikov 			info.rti_info[RTAX_GATEWAY] = (struct sockaddr *)sdl;
13886e6b3f7cSQing Li 		else
13898071913dSRuslan Ermilov 			info.rti_info[RTAX_GATEWAY] = ifa->ifa_addr;
13908071913dSRuslan Ermilov 		info.rti_info[RTAX_NETMASK] = netmask;
13912bbab0afSAlexander V. Chernikov 		NET_EPOCH_ENTER(et);
13928b07e49aSJulian Elischer 		error = rtrequest1_fib(cmd, &info, &rt, fibnum);
13935aca0b30SLuigi Rizzo 		if (error == 0 && rt != NULL) {
13948071913dSRuslan Ermilov 			/*
13956f99b44cSBrian Somers 			 * notify any listening routing agents of the change
13968071913dSRuslan Ermilov 			 */
13979e022295SAlexander V. Chernikov 
13989e022295SAlexander V. Chernikov 			/* TODO: interface routes/aliases */
1399e02d3fe7SAlexander V. Chernikov 			rt_newaddrmsg_fib(cmd, ifa, rt, fibnum);
14008b07e49aSJulian Elischer 			didwork = 1;
1401df8bae1dSRodney W. Grimes 		}
14022bbab0afSAlexander V. Chernikov 		NET_EPOCH_EXIT(et);
14038b07e49aSJulian Elischer 		if (error)
14048b07e49aSJulian Elischer 			a_failure = error;
14058b07e49aSJulian Elischer 	}
14068b07e49aSJulian Elischer 	if (cmd == RTM_DELETE) {
14078b07e49aSJulian Elischer 		if (didwork) {
14088b07e49aSJulian Elischer 			error = 0;
14098b07e49aSJulian Elischer 		} else {
14108b07e49aSJulian Elischer 			/* we only give an error if it wasn't in any table */
14118b07e49aSJulian Elischer 			error = ((flags & RTF_HOST) ?
14128b07e49aSJulian Elischer 			    EHOSTUNREACH : ENETUNREACH);
14138b07e49aSJulian Elischer 		}
14148b07e49aSJulian Elischer 	} else {
14158b07e49aSJulian Elischer 		if (a_failure) {
14168b07e49aSJulian Elischer 			/* return an error if any of them failed */
14178b07e49aSJulian Elischer 			error = a_failure;
14188b07e49aSJulian Elischer 		}
14198b07e49aSJulian Elischer 	}
14203ec66d6cSDavid Greenman 	return (error);
14213ec66d6cSDavid Greenman }
1422cb64988fSLuoqi Chen 
14238b07e49aSJulian Elischer /*
14248b07e49aSJulian Elischer  * Set up a routing table entry, normally
14258b07e49aSJulian Elischer  * for an interface.
14268b07e49aSJulian Elischer  */
14278b07e49aSJulian Elischer int
14288b07e49aSJulian Elischer rtinit(struct ifaddr *ifa, int cmd, int flags)
14298b07e49aSJulian Elischer {
14308b07e49aSJulian Elischer 	struct sockaddr *dst;
1431a8498625SBjoern A. Zeeb 	int fib = RT_DEFAULT_FIB;
14328b07e49aSJulian Elischer 
14338b07e49aSJulian Elischer 	if (flags & RTF_HOST) {
14348b07e49aSJulian Elischer 		dst = ifa->ifa_dstaddr;
14358b07e49aSJulian Elischer 	} else {
14368b07e49aSJulian Elischer 		dst = ifa->ifa_addr;
14378b07e49aSJulian Elischer 	}
14388b07e49aSJulian Elischer 
1439b680a383SBjoern A. Zeeb 	switch (dst->sa_family) {
1440b680a383SBjoern A. Zeeb 	case AF_INET6:
1441b680a383SBjoern A. Zeeb 	case AF_INET:
1442b680a383SBjoern A. Zeeb 		/* We do support multiple FIBs. */
14437d9b6df1SAlexander V. Chernikov 		fib = RT_ALL_FIBS;
1444b680a383SBjoern A. Zeeb 		break;
1445b680a383SBjoern A. Zeeb 	}
14468b07e49aSJulian Elischer 	return (rtinit1(ifa, cmd, flags, fib));
14478b07e49aSJulian Elischer }
14484cbac30bSAlexander V. Chernikov 
14494cbac30bSAlexander V. Chernikov /*
14504cbac30bSAlexander V. Chernikov  * Announce interface address arrival/withdraw
14514cbac30bSAlexander V. Chernikov  * Returns 0 on success.
14524cbac30bSAlexander V. Chernikov  */
14534cbac30bSAlexander V. Chernikov int
14544cbac30bSAlexander V. Chernikov rt_addrmsg(int cmd, struct ifaddr *ifa, int fibnum)
14554cbac30bSAlexander V. Chernikov {
14564cbac30bSAlexander V. Chernikov 
14574cbac30bSAlexander V. Chernikov 	KASSERT(cmd == RTM_ADD || cmd == RTM_DELETE,
1458d375edc9SAlexander V. Chernikov 	    ("unexpected cmd %d", cmd));
1459d375edc9SAlexander V. Chernikov 	KASSERT(fibnum == RT_ALL_FIBS || (fibnum >= 0 && fibnum < rt_numfibs),
1460d375edc9SAlexander V. Chernikov 	    ("%s: fib out of range 0 <=%d<%d", __func__, fibnum, rt_numfibs));
14614cbac30bSAlexander V. Chernikov 
1462d6e23cf0SMichael Tuexen 	EVENTHANDLER_DIRECT_INVOKE(rt_addrmsg, ifa, cmd);
14634cbac30bSAlexander V. Chernikov 	return (rtsock_addrmsg(cmd, ifa, fibnum));
14644cbac30bSAlexander V. Chernikov }
14654cbac30bSAlexander V. Chernikov 
14664cbac30bSAlexander V. Chernikov /*
1467e02d3fe7SAlexander V. Chernikov  * Announce kernel-originated route addition/removal to rtsock based on @rt data.
1468e02d3fe7SAlexander V. Chernikov  * cmd: RTM_ cmd
1469e02d3fe7SAlexander V. Chernikov  * @rt: valid rtentry
1470e02d3fe7SAlexander V. Chernikov  * @ifp: target route interface
1471e02d3fe7SAlexander V. Chernikov  * @fibnum: fib id or RT_ALL_FIBS
1472e02d3fe7SAlexander V. Chernikov  *
14734cbac30bSAlexander V. Chernikov  * Returns 0 on success.
14744cbac30bSAlexander V. Chernikov  */
14754cbac30bSAlexander V. Chernikov int
1476e02d3fe7SAlexander V. Chernikov rt_routemsg(int cmd, struct rtentry *rt, struct ifnet *ifp, int rti_addrs,
14774cbac30bSAlexander V. Chernikov     int fibnum)
14784cbac30bSAlexander V. Chernikov {
14794cbac30bSAlexander V. Chernikov 
14804cbac30bSAlexander V. Chernikov 	KASSERT(cmd == RTM_ADD || cmd == RTM_DELETE,
1481d375edc9SAlexander V. Chernikov 	    ("unexpected cmd %d", cmd));
14824cbac30bSAlexander V. Chernikov 
1483d375edc9SAlexander V. Chernikov 	KASSERT(fibnum == RT_ALL_FIBS || (fibnum >= 0 && fibnum < rt_numfibs),
1484d375edc9SAlexander V. Chernikov 	    ("%s: fib out of range 0 <=%d<%d", __func__, fibnum, rt_numfibs));
14854cbac30bSAlexander V. Chernikov 
14864cbac30bSAlexander V. Chernikov 	KASSERT(rt_key(rt) != NULL, (":%s: rt_key must be supplied", __func__));
14874cbac30bSAlexander V. Chernikov 
1488e02d3fe7SAlexander V. Chernikov 	return (rtsock_routemsg(cmd, rt, ifp, 0, fibnum));
14894cbac30bSAlexander V. Chernikov }
14904cbac30bSAlexander V. Chernikov 
1491e02d3fe7SAlexander V. Chernikov /*
1492e02d3fe7SAlexander V. Chernikov  * Announce kernel-originated route addition/removal to rtsock based on @rt data.
1493e02d3fe7SAlexander V. Chernikov  * cmd: RTM_ cmd
1494e02d3fe7SAlexander V. Chernikov  * @info: addrinfo structure with valid data.
1495e02d3fe7SAlexander V. Chernikov  * @fibnum: fib id or RT_ALL_FIBS
1496e02d3fe7SAlexander V. Chernikov  *
1497e02d3fe7SAlexander V. Chernikov  * Returns 0 on success.
1498e02d3fe7SAlexander V. Chernikov  */
1499e02d3fe7SAlexander V. Chernikov int
1500e02d3fe7SAlexander V. Chernikov rt_routemsg_info(int cmd, struct rt_addrinfo *info, int fibnum)
15014cbac30bSAlexander V. Chernikov {
15024cbac30bSAlexander V. Chernikov 
1503e02d3fe7SAlexander V. Chernikov 	KASSERT(cmd == RTM_ADD || cmd == RTM_DELETE || cmd == RTM_CHANGE,
1504e02d3fe7SAlexander V. Chernikov 	    ("unexpected cmd %d", cmd));
1505e02d3fe7SAlexander V. Chernikov 
1506e02d3fe7SAlexander V. Chernikov 	KASSERT(fibnum == RT_ALL_FIBS || (fibnum >= 0 && fibnum < rt_numfibs),
1507e02d3fe7SAlexander V. Chernikov 	    ("%s: fib out of range 0 <=%d<%d", __func__, fibnum, rt_numfibs));
1508e02d3fe7SAlexander V. Chernikov 
1509e02d3fe7SAlexander V. Chernikov 	KASSERT(info->rti_info[RTAX_DST] != NULL, (":%s: RTAX_DST must be supplied", __func__));
1510e02d3fe7SAlexander V. Chernikov 
1511e02d3fe7SAlexander V. Chernikov 	return (rtsock_routemsg_info(cmd, info, fibnum));
15124cbac30bSAlexander V. Chernikov }
15134cbac30bSAlexander V. Chernikov 
1514e02d3fe7SAlexander V. Chernikov 
15154cbac30bSAlexander V. Chernikov /*
15164cbac30bSAlexander V. Chernikov  * This is called to generate messages from the routing socket
15174cbac30bSAlexander V. Chernikov  * indicating a network interface has had addresses associated with it.
15184cbac30bSAlexander V. Chernikov  */
15194cbac30bSAlexander V. Chernikov void
1520e02d3fe7SAlexander V. Chernikov rt_newaddrmsg_fib(int cmd, struct ifaddr *ifa, struct rtentry *rt, int fibnum)
15214cbac30bSAlexander V. Chernikov {
15224cbac30bSAlexander V. Chernikov 
15234cbac30bSAlexander V. Chernikov 	KASSERT(cmd == RTM_ADD || cmd == RTM_DELETE,
15244cbac30bSAlexander V. Chernikov 		("unexpected cmd %u", cmd));
1525d375edc9SAlexander V. Chernikov 	KASSERT(fibnum == RT_ALL_FIBS || (fibnum >= 0 && fibnum < rt_numfibs),
1526d375edc9SAlexander V. Chernikov 	    ("%s: fib out of range 0 <=%d<%d", __func__, fibnum, rt_numfibs));
15274cbac30bSAlexander V. Chernikov 
15284cbac30bSAlexander V. Chernikov 	if (cmd == RTM_ADD) {
15294cbac30bSAlexander V. Chernikov 		rt_addrmsg(cmd, ifa, fibnum);
15304cbac30bSAlexander V. Chernikov 		if (rt != NULL)
1531e02d3fe7SAlexander V. Chernikov 			rt_routemsg(cmd, rt, ifa->ifa_ifp, 0, fibnum);
15324cbac30bSAlexander V. Chernikov 	} else {
15334cbac30bSAlexander V. Chernikov 		if (rt != NULL)
1534e02d3fe7SAlexander V. Chernikov 			rt_routemsg(cmd, rt, ifa->ifa_ifp, 0, fibnum);
15354cbac30bSAlexander V. Chernikov 		rt_addrmsg(cmd, ifa, fibnum);
15364cbac30bSAlexander V. Chernikov 	}
15374cbac30bSAlexander V. Chernikov }
15384cbac30bSAlexander V. Chernikov 
1539