xref: /freebsd/sys/net/route/route_helpers.c (revision f9668e42b44f22c9ab213eb9a4792d5acfcf6903)
1a6663252SAlexander V. Chernikov /*-
2a6663252SAlexander V. Chernikov  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
3a6663252SAlexander V. Chernikov  *
4a6663252SAlexander V. Chernikov  * Copyright (c) 2020 Alexander V. Chernikov
5a6663252SAlexander V. Chernikov  *
6a6663252SAlexander V. Chernikov  * Redistribution and use in source and binary forms, with or without
7a6663252SAlexander V. Chernikov  * modification, are permitted provided that the following conditions
8a6663252SAlexander V. Chernikov  * are met:
9a6663252SAlexander V. Chernikov  * 1. Redistributions of source code must retain the above copyright
10a6663252SAlexander V. Chernikov  *    notice, this list of conditions and the following disclaimer.
11a6663252SAlexander V. Chernikov  * 2. Redistributions in binary form must reproduce the above copyright
12a6663252SAlexander V. Chernikov  *    notice, this list of conditions and the following disclaimer in the
13a6663252SAlexander V. Chernikov  *    documentation and/or other materials provided with the distribution.
14a6663252SAlexander V. Chernikov  *
15a6663252SAlexander V. Chernikov  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
16a6663252SAlexander V. Chernikov  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17a6663252SAlexander V. Chernikov  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
18a6663252SAlexander V. Chernikov  * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
19a6663252SAlexander V. Chernikov  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20a6663252SAlexander V. Chernikov  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
21a6663252SAlexander V. Chernikov  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22a6663252SAlexander V. Chernikov  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23a6663252SAlexander V. Chernikov  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24a6663252SAlexander V. Chernikov  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25a6663252SAlexander V. Chernikov  * SUCH DAMAGE.
26a6663252SAlexander V. Chernikov  */
27a6663252SAlexander V. Chernikov 
28a6663252SAlexander V. Chernikov #include <sys/cdefs.h>
29a6663252SAlexander V. Chernikov __FBSDID("$FreeBSD$");
30a6663252SAlexander V. Chernikov #include "opt_inet.h"
31a6663252SAlexander V. Chernikov #include "opt_inet6.h"
32a6663252SAlexander V. Chernikov #include "opt_route.h"
33a6663252SAlexander V. Chernikov 
34a6663252SAlexander V. Chernikov #include <sys/param.h>
35a6663252SAlexander V. Chernikov #include <sys/jail.h>
36a6663252SAlexander V. Chernikov #include <sys/systm.h>
37a6663252SAlexander V. Chernikov #include <sys/malloc.h>
38a6663252SAlexander V. Chernikov #include <sys/mbuf.h>
39a6663252SAlexander V. Chernikov #include <sys/socket.h>
40a6663252SAlexander V. Chernikov #include <sys/sysctl.h>
41a6663252SAlexander V. Chernikov #include <sys/syslog.h>
42a6663252SAlexander V. Chernikov #include <sys/sysproto.h>
43a6663252SAlexander V. Chernikov #include <sys/proc.h>
44a6663252SAlexander V. Chernikov #include <sys/domain.h>
45a6663252SAlexander V. Chernikov #include <sys/kernel.h>
46a6663252SAlexander V. Chernikov #include <sys/lock.h>
47a6663252SAlexander V. Chernikov #include <sys/rmlock.h>
48a6663252SAlexander V. Chernikov 
49a6663252SAlexander V. Chernikov #include <net/if.h>
50a6663252SAlexander V. Chernikov #include <net/if_var.h>
51a6663252SAlexander V. Chernikov #include <net/if_dl.h>
52a6663252SAlexander V. Chernikov #include <net/route.h>
53da187ddbSAlexander V. Chernikov #include <net/route/route_ctl.h>
54e7d8af4fSAlexander V. Chernikov #include <net/route/route_var.h>
55a6663252SAlexander V. Chernikov #include <net/route/nhop_utils.h>
56a6663252SAlexander V. Chernikov #include <net/route/nhop.h>
57a6663252SAlexander V. Chernikov #include <net/route/nhop_var.h>
58682b902dSAlexander V. Chernikov #ifdef INET
59682b902dSAlexander V. Chernikov #include <netinet/in_fib.h>
60682b902dSAlexander V. Chernikov #endif
61682b902dSAlexander V. Chernikov #ifdef INET6
62682b902dSAlexander V. Chernikov #include <netinet6/in6_fib.h>
63682b902dSAlexander V. Chernikov #endif
64a6663252SAlexander V. Chernikov #include <net/vnet.h>
65a6663252SAlexander V. Chernikov 
66a6663252SAlexander V. Chernikov /*
67a6663252SAlexander V. Chernikov  * RIB helper functions.
68a6663252SAlexander V. Chernikov  */
69a6663252SAlexander V. Chernikov 
70151ec796SAlexander V. Chernikov void
71151ec796SAlexander V. Chernikov rib_walk_ext_locked(struct rib_head *rnh, rib_walktree_f_t *wa_f,
72151ec796SAlexander V. Chernikov     rib_walk_hook_f_t *hook_f, void *arg)
73151ec796SAlexander V. Chernikov {
74151ec796SAlexander V. Chernikov 	if (hook_f != NULL)
75151ec796SAlexander V. Chernikov 		hook_f(rnh, RIB_WALK_HOOK_PRE, arg);
76151ec796SAlexander V. Chernikov 	rnh->rnh_walktree(&rnh->head, (walktree_f_t *)wa_f, arg);
77151ec796SAlexander V. Chernikov 	if (hook_f != NULL)
78151ec796SAlexander V. Chernikov 		hook_f(rnh, RIB_WALK_HOOK_POST, arg);
79151ec796SAlexander V. Chernikov }
80151ec796SAlexander V. Chernikov 
81a6663252SAlexander V. Chernikov /*
82a6663252SAlexander V. Chernikov  * Calls @wa_f with @arg for each entry in the table specified by
83a6663252SAlexander V. Chernikov  * @af and @fibnum.
84a6663252SAlexander V. Chernikov  *
857511a638SAlexander V. Chernikov  * @ss_t callback is called before and after the tree traversal
867511a638SAlexander V. Chernikov  *  while holding table lock.
877511a638SAlexander V. Chernikov  *
887511a638SAlexander V. Chernikov  * Table is traversed under read lock unless @wlock is set.
89a6663252SAlexander V. Chernikov  */
90a6663252SAlexander V. Chernikov void
913b1654cbSAlexander V. Chernikov rib_walk_ext_internal(struct rib_head *rnh, bool wlock, rib_walktree_f_t *wa_f,
927511a638SAlexander V. Chernikov     rib_walk_hook_f_t *hook_f, void *arg)
93a6663252SAlexander V. Chernikov {
94a6663252SAlexander V. Chernikov 	RIB_RLOCK_TRACKER;
95a6663252SAlexander V. Chernikov 
967511a638SAlexander V. Chernikov 	if (wlock)
977511a638SAlexander V. Chernikov 		RIB_WLOCK(rnh);
987511a638SAlexander V. Chernikov 	else
99a6663252SAlexander V. Chernikov 		RIB_RLOCK(rnh);
100151ec796SAlexander V. Chernikov 	rib_walk_ext_locked(rnh, wa_f, hook_f, arg);
1017511a638SAlexander V. Chernikov 	if (wlock)
1027511a638SAlexander V. Chernikov 		RIB_WUNLOCK(rnh);
1037511a638SAlexander V. Chernikov 	else
104a6663252SAlexander V. Chernikov 		RIB_RUNLOCK(rnh);
105a6663252SAlexander V. Chernikov }
106a6663252SAlexander V. Chernikov 
1073b1654cbSAlexander V. Chernikov void
1083b1654cbSAlexander V. Chernikov rib_walk_ext(uint32_t fibnum, int family, bool wlock, rib_walktree_f_t *wa_f,
1093b1654cbSAlexander V. Chernikov     rib_walk_hook_f_t *hook_f, void *arg)
1103b1654cbSAlexander V. Chernikov {
1113b1654cbSAlexander V. Chernikov 	struct rib_head *rnh;
1123b1654cbSAlexander V. Chernikov 
1133b1654cbSAlexander V. Chernikov 	if ((rnh = rt_tables_get_rnh(fibnum, family)) != NULL)
1143b1654cbSAlexander V. Chernikov 		rib_walk_ext_internal(rnh, wlock, wa_f, hook_f, arg);
1153b1654cbSAlexander V. Chernikov }
1163b1654cbSAlexander V. Chernikov 
117682b902dSAlexander V. Chernikov /*
1187511a638SAlexander V. Chernikov  * Calls @wa_f with @arg for each entry in the table specified by
1197511a638SAlexander V. Chernikov  * @af and @fibnum.
1207511a638SAlexander V. Chernikov  *
1217511a638SAlexander V. Chernikov  * Table is traversed under read lock unless @wlock is set.
1227511a638SAlexander V. Chernikov  */
1237511a638SAlexander V. Chernikov void
1247511a638SAlexander V. Chernikov rib_walk(uint32_t fibnum, int family, bool wlock, rib_walktree_f_t *wa_f,
1257511a638SAlexander V. Chernikov     void *arg)
1267511a638SAlexander V. Chernikov {
1277511a638SAlexander V. Chernikov 
1287511a638SAlexander V. Chernikov 	rib_walk_ext(fibnum, family, wlock, wa_f, NULL, arg);
1297511a638SAlexander V. Chernikov }
1307511a638SAlexander V. Chernikov 
1317511a638SAlexander V. Chernikov /*
132*f9668e42SAlexander V. Chernikov  * Calls @wa_f with @arg for each entry in the table matching @prefix/@mask.
133*f9668e42SAlexander V. Chernikov  *
134*f9668e42SAlexander V. Chernikov  * The following flags are supported:
135*f9668e42SAlexander V. Chernikov  *  RIB_FLAG_WLOCK: acquire exclusive lock
136*f9668e42SAlexander V. Chernikov  *  RIB_FLAG_LOCKED: Assumes the table is already locked & skip locking
137*f9668e42SAlexander V. Chernikov  *
138*f9668e42SAlexander V. Chernikov  * By default, table is traversed under read lock.
139*f9668e42SAlexander V. Chernikov  */
140*f9668e42SAlexander V. Chernikov void
141*f9668e42SAlexander V. Chernikov rib_walk_from(uint32_t fibnum, int family, uint32_t flags, struct sockaddr *prefix,
142*f9668e42SAlexander V. Chernikov     struct sockaddr *mask, rib_walktree_f_t *wa_f, void *arg)
143*f9668e42SAlexander V. Chernikov {
144*f9668e42SAlexander V. Chernikov 	RIB_RLOCK_TRACKER;
145*f9668e42SAlexander V. Chernikov 	struct rib_head *rnh = rt_tables_get_rnh(fibnum, family);
146*f9668e42SAlexander V. Chernikov 
147*f9668e42SAlexander V. Chernikov 	if (rnh == NULL)
148*f9668e42SAlexander V. Chernikov 		return;
149*f9668e42SAlexander V. Chernikov 
150*f9668e42SAlexander V. Chernikov 	if (flags & RIB_FLAG_WLOCK)
151*f9668e42SAlexander V. Chernikov 		RIB_WLOCK(rnh);
152*f9668e42SAlexander V. Chernikov 	else if (!(flags & RIB_FLAG_LOCKED))
153*f9668e42SAlexander V. Chernikov 		RIB_RLOCK(rnh);
154*f9668e42SAlexander V. Chernikov 
155*f9668e42SAlexander V. Chernikov 	rnh->rnh_walktree_from(&rnh->head, prefix, mask, (walktree_f_t *)wa_f, arg);
156*f9668e42SAlexander V. Chernikov 
157*f9668e42SAlexander V. Chernikov 	if (flags & RIB_FLAG_WLOCK)
158*f9668e42SAlexander V. Chernikov 		RIB_WUNLOCK(rnh);
159*f9668e42SAlexander V. Chernikov 	else if (!(flags & RIB_FLAG_LOCKED))
160*f9668e42SAlexander V. Chernikov 		RIB_RUNLOCK(rnh);
161*f9668e42SAlexander V. Chernikov }
162*f9668e42SAlexander V. Chernikov 
163*f9668e42SAlexander V. Chernikov /*
1647511a638SAlexander V. Chernikov  * Iterates over all existing fibs in system calling
1657511a638SAlexander V. Chernikov  *  @hook_f function before/after traversing each fib.
1667511a638SAlexander V. Chernikov  *  Calls @wa_f function for each element in current fib.
1677511a638SAlexander V. Chernikov  * If af is not AF_UNSPEC, iterates over fibs in particular
1687511a638SAlexander V. Chernikov  * address family.
1697511a638SAlexander V. Chernikov  */
1707511a638SAlexander V. Chernikov void
1717511a638SAlexander V. Chernikov rib_foreach_table_walk(int family, bool wlock, rib_walktree_f_t *wa_f,
1727511a638SAlexander V. Chernikov     rib_walk_hook_f_t *hook_f, void *arg)
1737511a638SAlexander V. Chernikov {
1747511a638SAlexander V. Chernikov 
1757511a638SAlexander V. Chernikov 	for (uint32_t fibnum = 0; fibnum < rt_numfibs; fibnum++) {
1767511a638SAlexander V. Chernikov 		/* Do we want some specific family? */
1777511a638SAlexander V. Chernikov 		if (family != AF_UNSPEC) {
1787511a638SAlexander V. Chernikov 			rib_walk_ext(fibnum, family, wlock, wa_f, hook_f, arg);
1797511a638SAlexander V. Chernikov 			continue;
1807511a638SAlexander V. Chernikov 		}
1817511a638SAlexander V. Chernikov 
1827511a638SAlexander V. Chernikov 		for (int i = 1; i <= AF_MAX; i++)
1837511a638SAlexander V. Chernikov 			rib_walk_ext(fibnum, i, wlock, wa_f, hook_f, arg);
1847511a638SAlexander V. Chernikov 	}
1857511a638SAlexander V. Chernikov }
1867511a638SAlexander V. Chernikov 
1877511a638SAlexander V. Chernikov /*
1887511a638SAlexander V. Chernikov  * Iterates over all existing fibs in system and deletes each element
1897511a638SAlexander V. Chernikov  *  for which @filter_f function returns non-zero value.
1907511a638SAlexander V. Chernikov  * If @family is not AF_UNSPEC, iterates over fibs in particular
1917511a638SAlexander V. Chernikov  * address family.
1927511a638SAlexander V. Chernikov  */
1937511a638SAlexander V. Chernikov void
1947511a638SAlexander V. Chernikov rib_foreach_table_walk_del(int family, rib_filter_f_t *filter_f, void *arg)
1957511a638SAlexander V. Chernikov {
1967511a638SAlexander V. Chernikov 
1977511a638SAlexander V. Chernikov 	for (uint32_t fibnum = 0; fibnum < rt_numfibs; fibnum++) {
1987511a638SAlexander V. Chernikov 		/* Do we want some specific family? */
1997511a638SAlexander V. Chernikov 		if (family != AF_UNSPEC) {
2007511a638SAlexander V. Chernikov 			rib_walk_del(fibnum, family, filter_f, arg, 0);
2017511a638SAlexander V. Chernikov 			continue;
2027511a638SAlexander V. Chernikov 		}
2037511a638SAlexander V. Chernikov 
2047511a638SAlexander V. Chernikov 		for (int i = 1; i <= AF_MAX; i++)
2057511a638SAlexander V. Chernikov 			rib_walk_del(fibnum, i, filter_f, arg, 0);
2067511a638SAlexander V. Chernikov 	}
2077511a638SAlexander V. Chernikov }
2087511a638SAlexander V. Chernikov 
2097511a638SAlexander V. Chernikov 
/*
 * Wrapper for the control plane functions for performing af-agnostic
 *  lookups.
 * @fibnum: fib to perform the lookup in.
 * @dst: sockaddr with family and address filled in. IPv6 addresses need to
 *  be in de-embedded form.
 * @flags: fib(9) flags.
 * @flowid: flow id for path selection in multipath use case.
 *
 * Dispatches to fib4_lookup() for AF_INET and to fib6_lookup() for AF_INET6
 * when the corresponding option (INET / INET6) is compiled in.
 *
 * Returns nhop_object or NULL. NULL is also returned when @dst has an
 * address family that is not handled here.
 *
 * Requires NET_EPOCH.
 */
struct nhop_object *
rib_lookup(uint32_t fibnum, const struct sockaddr *dst, uint32_t flags,
    uint32_t flowid)
{

	switch (dst->sa_family) {
#ifdef INET
	case AF_INET:
	{
		const struct sockaddr_in *sin4;

		sin4 = (const struct sockaddr_in *)dst;
		return (fib4_lookup(fibnum, sin4->sin_addr, 0, flags, flowid));
	}
#endif
#ifdef INET6
	case AF_INET6:
	{
		const struct sockaddr_in6 *sin6;

		sin6 = (const struct sockaddr_in6 *)dst;
		return (fib6_lookup(fibnum, &sin6->sin6_addr,
		    sin6->sin6_scope_id, flags, flowid));
	}
#endif
	default:
		break;
	}

	return (NULL);
}
254fedeb08bSAlexander V. Chernikov 
255fedeb08bSAlexander V. Chernikov #ifdef ROUTE_MPATH
256fedeb08bSAlexander V. Chernikov static void
257fedeb08bSAlexander V. Chernikov decompose_change_notification(struct rib_cmd_info *rc, route_notification_t *cb,
258fedeb08bSAlexander V. Chernikov     void *cbdata)
259fedeb08bSAlexander V. Chernikov {
260fedeb08bSAlexander V. Chernikov 	uint32_t num_old, num_new;
261fedeb08bSAlexander V. Chernikov 	uint32_t nh_idx_old, nh_idx_new;
262fedeb08bSAlexander V. Chernikov 	struct weightened_nhop *wn_old, *wn_new;
263fedeb08bSAlexander V. Chernikov 	struct weightened_nhop tmp = { NULL, 0 };
264fedeb08bSAlexander V. Chernikov 	uint32_t idx_old = 0, idx_new = 0;
265fedeb08bSAlexander V. Chernikov 
266fedeb08bSAlexander V. Chernikov 	struct rib_cmd_info rc_del = { .rc_cmd = RTM_DELETE, .rc_rt = rc->rc_rt };
267fedeb08bSAlexander V. Chernikov 	struct rib_cmd_info rc_add = { .rc_cmd = RTM_ADD, .rc_rt = rc->rc_rt };
268fedeb08bSAlexander V. Chernikov 
269fedeb08bSAlexander V. Chernikov 	if (NH_IS_NHGRP(rc->rc_nh_old)) {
270fedeb08bSAlexander V. Chernikov 		wn_old = nhgrp_get_nhops((struct nhgrp_object *)rc->rc_nh_old, &num_old);
271fedeb08bSAlexander V. Chernikov 	} else {
272fedeb08bSAlexander V. Chernikov 		tmp.nh = rc->rc_nh_old;
273fedeb08bSAlexander V. Chernikov 		tmp.weight = rc->rc_nh_weight;
274fedeb08bSAlexander V. Chernikov 		wn_old = &tmp;
275fedeb08bSAlexander V. Chernikov 		num_old = 1;
276fedeb08bSAlexander V. Chernikov 	}
277fedeb08bSAlexander V. Chernikov 	if (NH_IS_NHGRP(rc->rc_nh_new)) {
278fedeb08bSAlexander V. Chernikov 		wn_new = nhgrp_get_nhops((struct nhgrp_object *)rc->rc_nh_new, &num_new);
279fedeb08bSAlexander V. Chernikov 	} else {
280fedeb08bSAlexander V. Chernikov 		tmp.nh = rc->rc_nh_new;
281fedeb08bSAlexander V. Chernikov 		tmp.weight = rc->rc_nh_weight;
282fedeb08bSAlexander V. Chernikov 		wn_new = &tmp;
283fedeb08bSAlexander V. Chernikov 		num_new = 1;
284fedeb08bSAlexander V. Chernikov 	}
285fedeb08bSAlexander V. Chernikov 
286fedeb08bSAlexander V. Chernikov 	/* Use the fact that each @wn array is sorted */
287fedeb08bSAlexander V. Chernikov 	/*
288fedeb08bSAlexander V. Chernikov 	 * Want to convert into set of add and delete operations
289fedeb08bSAlexander V. Chernikov 	 * [1] -> [1, 2] = A{2}
290fedeb08bSAlexander V. Chernikov 	 * [2] -> [1, 2] = A{1}
291fedeb08bSAlexander V. Chernikov 	 * [1, 2, 4]->[1, 3, 4] = A{2}, D{3}
292fedeb08bSAlexander V. Chernikov 	 * [1, 2, 4]->[1, 4] = D{2}
293fedeb08bSAlexander V. Chernikov 	 * [1, 2, 4] -> [3, 4] = D{1}, C{2,3} OR C{1,3}, D{2} OR D{1},D{2},A{3}
294fedeb08bSAlexander V. Chernikov 	 * [1, 2] -> [3, 4] =
295fedeb08bSAlexander V. Chernikov 	 *
296fedeb08bSAlexander V. Chernikov 	 */
297fedeb08bSAlexander V. Chernikov 	idx_old = 0;
298fedeb08bSAlexander V. Chernikov 	while ((idx_old < num_old) && (idx_new < num_new)) {
299fedeb08bSAlexander V. Chernikov 		nh_idx_old = wn_old[idx_old].nh->nh_priv->nh_idx;
300fedeb08bSAlexander V. Chernikov 		nh_idx_new = wn_new[idx_new].nh->nh_priv->nh_idx;
301fedeb08bSAlexander V. Chernikov 
302fedeb08bSAlexander V. Chernikov 		if (nh_idx_old == nh_idx_new) {
303fedeb08bSAlexander V. Chernikov 			if (wn_old[idx_old].weight != wn_new[idx_new].weight) {
304fedeb08bSAlexander V. Chernikov 				/* Update weight by providing del/add notifications */
305fedeb08bSAlexander V. Chernikov 				rc_del.rc_nh_old = wn_old[idx_old].nh;
306fedeb08bSAlexander V. Chernikov 				rc_del.rc_nh_weight = wn_old[idx_old].weight;
307fedeb08bSAlexander V. Chernikov 				cb(&rc_del, cbdata);
308fedeb08bSAlexander V. Chernikov 
309fedeb08bSAlexander V. Chernikov 				rc_add.rc_nh_new = wn_new[idx_new].nh;
310fedeb08bSAlexander V. Chernikov 				rc_add.rc_nh_weight = wn_new[idx_new].weight;
311fedeb08bSAlexander V. Chernikov 				cb(&rc_add, cbdata);
312fedeb08bSAlexander V. Chernikov 			}
313fedeb08bSAlexander V. Chernikov 			idx_old++;
314fedeb08bSAlexander V. Chernikov 			idx_new++;
315fedeb08bSAlexander V. Chernikov 		} else if (nh_idx_old < nh_idx_new) {
316fedeb08bSAlexander V. Chernikov 			/*
317fedeb08bSAlexander V. Chernikov 			 * [1, ~2~, 4], [1, ~3~, 4]
318fedeb08bSAlexander V. Chernikov 			 * [1, ~2~, 5], [1, ~3~, 4]
319fedeb08bSAlexander V. Chernikov 			 * [1, ~2~], [1, ~3~, 4]
320fedeb08bSAlexander V. Chernikov 			 */
321fedeb08bSAlexander V. Chernikov 			if ((idx_old + 1 >= num_old) ||
322fedeb08bSAlexander V. Chernikov 			    (wn_old[idx_old + 1].nh->nh_priv->nh_idx > nh_idx_new)) {
323fedeb08bSAlexander V. Chernikov 				/* Add new unless the next old item is still <= new */
324fedeb08bSAlexander V. Chernikov 				rc_add.rc_nh_new = wn_new[idx_new].nh;
325fedeb08bSAlexander V. Chernikov 				rc_add.rc_nh_weight = wn_new[idx_new].weight;
326fedeb08bSAlexander V. Chernikov 				cb(&rc_add, cbdata);
327fedeb08bSAlexander V. Chernikov 				idx_new++;
328fedeb08bSAlexander V. Chernikov 			}
329fedeb08bSAlexander V. Chernikov 			/* In any case, delete current old */
330fedeb08bSAlexander V. Chernikov 			rc_del.rc_nh_old = wn_old[idx_old].nh;
331fedeb08bSAlexander V. Chernikov 			rc_del.rc_nh_weight = wn_old[idx_old].weight;
332fedeb08bSAlexander V. Chernikov 			cb(&rc_del, cbdata);
333fedeb08bSAlexander V. Chernikov 			idx_old++;
334fedeb08bSAlexander V. Chernikov 		} else {
335fedeb08bSAlexander V. Chernikov 			/*
336fedeb08bSAlexander V. Chernikov 			 * nh_idx_old > nh_idx_new
337fedeb08bSAlexander V. Chernikov 			 *
338fedeb08bSAlexander V. Chernikov 			 * [1, ~3~, 4], [1, ~2~, 4]
339fedeb08bSAlexander V. Chernikov 			 * [1, ~3~, 5], [1, ~2~, 4]
340fedeb08bSAlexander V. Chernikov 			 * [1, ~3~, 4], [1, ~2~]
341fedeb08bSAlexander V. Chernikov 			 */
342fedeb08bSAlexander V. Chernikov 			if ((idx_new + 1 >= num_new) ||
343fedeb08bSAlexander V. Chernikov 			    (wn_new[idx_new + 1].nh->nh_priv->nh_idx > nh_idx_old)) {
344fedeb08bSAlexander V. Chernikov 				/* No next item or next item is > current one */
345fedeb08bSAlexander V. Chernikov 				rc_add.rc_nh_new = wn_new[idx_new].nh;
346fedeb08bSAlexander V. Chernikov 				rc_add.rc_nh_weight = wn_new[idx_new].weight;
347fedeb08bSAlexander V. Chernikov 				cb(&rc_add, cbdata);
348fedeb08bSAlexander V. Chernikov 				idx_new++;
349fedeb08bSAlexander V. Chernikov 			}
350fedeb08bSAlexander V. Chernikov 			/* In any case, delete current old */
351fedeb08bSAlexander V. Chernikov 			rc_del.rc_nh_old = wn_old[idx_old].nh;
352fedeb08bSAlexander V. Chernikov 			rc_del.rc_nh_weight = wn_old[idx_old].weight;
353fedeb08bSAlexander V. Chernikov 			cb(&rc_del, cbdata);
354fedeb08bSAlexander V. Chernikov 			idx_old++;
355fedeb08bSAlexander V. Chernikov 		}
356fedeb08bSAlexander V. Chernikov 	}
357fedeb08bSAlexander V. Chernikov 
358fedeb08bSAlexander V. Chernikov 	while (idx_old < num_old) {
359fedeb08bSAlexander V. Chernikov 		rc_del.rc_nh_old = wn_old[idx_old].nh;
360fedeb08bSAlexander V. Chernikov 		rc_del.rc_nh_weight = wn_old[idx_old].weight;
361fedeb08bSAlexander V. Chernikov 		cb(&rc_del, cbdata);
362fedeb08bSAlexander V. Chernikov 		idx_old++;
363fedeb08bSAlexander V. Chernikov 	}
364fedeb08bSAlexander V. Chernikov 
365fedeb08bSAlexander V. Chernikov 	while (idx_new < num_new) {
366fedeb08bSAlexander V. Chernikov 		rc_add.rc_nh_new = wn_new[idx_new].nh;
367fedeb08bSAlexander V. Chernikov 		rc_add.rc_nh_weight = wn_new[idx_new].weight;
368fedeb08bSAlexander V. Chernikov 		cb(&rc_add, cbdata);
369fedeb08bSAlexander V. Chernikov 		idx_new++;
370fedeb08bSAlexander V. Chernikov 	}
371fedeb08bSAlexander V. Chernikov }
372fedeb08bSAlexander V. Chernikov 
373fedeb08bSAlexander V. Chernikov /*
374fedeb08bSAlexander V. Chernikov  * Decompose multipath cmd info @rc into a list of add/del/change
375fedeb08bSAlexander V. Chernikov  *  single-path operations, calling @cb callback for each operation.
376fedeb08bSAlexander V. Chernikov  * Assumes at least one of the nexthops in @rc is multipath.
377fedeb08bSAlexander V. Chernikov  */
378fedeb08bSAlexander V. Chernikov void
379fedeb08bSAlexander V. Chernikov rib_decompose_notification(struct rib_cmd_info *rc, route_notification_t *cb,
380fedeb08bSAlexander V. Chernikov     void *cbdata)
381fedeb08bSAlexander V. Chernikov {
382fedeb08bSAlexander V. Chernikov 	struct weightened_nhop *wn;
383fedeb08bSAlexander V. Chernikov 	uint32_t num_nhops;
384fedeb08bSAlexander V. Chernikov 	struct rib_cmd_info rc_new;
385fedeb08bSAlexander V. Chernikov 
386fedeb08bSAlexander V. Chernikov 	rc_new = *rc;
387fedeb08bSAlexander V. Chernikov 	DPRINTF("cb=%p cmd=%d nh_old=%p nh_new=%p",
388fedeb08bSAlexander V. Chernikov 	    cb, rc->cmd, rc->nh_old, rc->nh_new);
389fedeb08bSAlexander V. Chernikov 	switch (rc->rc_cmd) {
390fedeb08bSAlexander V. Chernikov 	case RTM_ADD:
391fedeb08bSAlexander V. Chernikov 		if (!NH_IS_NHGRP(rc->rc_nh_new))
392fedeb08bSAlexander V. Chernikov 			return;
393fedeb08bSAlexander V. Chernikov 		wn = nhgrp_get_nhops((struct nhgrp_object *)rc->rc_nh_new, &num_nhops);
394fedeb08bSAlexander V. Chernikov 		for (uint32_t i = 0; i < num_nhops; i++) {
395fedeb08bSAlexander V. Chernikov 			rc_new.rc_nh_new = wn[i].nh;
396fedeb08bSAlexander V. Chernikov 			rc_new.rc_nh_weight = wn[i].weight;
397fedeb08bSAlexander V. Chernikov 			cb(&rc_new, cbdata);
398fedeb08bSAlexander V. Chernikov 		}
399fedeb08bSAlexander V. Chernikov 		break;
400fedeb08bSAlexander V. Chernikov 	case RTM_DELETE:
401fedeb08bSAlexander V. Chernikov 		if (!NH_IS_NHGRP(rc->rc_nh_old))
402fedeb08bSAlexander V. Chernikov 			return;
403fedeb08bSAlexander V. Chernikov 		wn = nhgrp_get_nhops((struct nhgrp_object *)rc->rc_nh_old, &num_nhops);
404fedeb08bSAlexander V. Chernikov 		for (uint32_t i = 0; i < num_nhops; i++) {
405fedeb08bSAlexander V. Chernikov 			rc_new.rc_nh_old = wn[i].nh;
406fedeb08bSAlexander V. Chernikov 			rc_new.rc_nh_weight = wn[i].weight;
407fedeb08bSAlexander V. Chernikov 			cb(&rc_new, cbdata);
408fedeb08bSAlexander V. Chernikov 		}
409fedeb08bSAlexander V. Chernikov 		break;
410fedeb08bSAlexander V. Chernikov 	case RTM_CHANGE:
411fedeb08bSAlexander V. Chernikov 		if (!NH_IS_NHGRP(rc->rc_nh_old) && !NH_IS_NHGRP(rc->rc_nh_new))
412fedeb08bSAlexander V. Chernikov 			return;
413fedeb08bSAlexander V. Chernikov 		decompose_change_notification(rc, cb, cbdata);
414fedeb08bSAlexander V. Chernikov 		break;
415fedeb08bSAlexander V. Chernikov 	}
416fedeb08bSAlexander V. Chernikov }
417fedeb08bSAlexander V. Chernikov #endif
418