/* * Copyright 2005 Sun Microsystems, Inc. All rights reserved. * Use is subject to license terms. * * Copyright (c) 1995 * The Regents of the University of California. All rights reserved. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * 1. Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * 2. Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution. * 3. All advertising materials mentioning features or use of this software * must display the following acknowledgment: * This product includes software developed by the University of * California, Berkeley and its contributors. * 4. Neither the name of the University nor the names of its contributors * may be used to endorse or promote products derived from this software * without specific prior written permission. * * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF * SUCH DAMAGE. * * $FreeBSD: src/sbin/routed/rdisc.c,v 1.8 2000/08/11 08:24:38 sheldonh Exp $ */ #pragma ident "%Z%%M% %I% %E% SMI" #include "defs.h" #include #include #include /* * The size of the control buffer passed to recvmsg() used to receive * ancillary data. */ #define CONTROL_BUFSIZE 1024 /* router advertisement ICMP packet */ struct icmp_ad { uint8_t icmp_type; /* type of message */ uint8_t icmp_code; /* type sub code */ uint16_t icmp_cksum; /* ones complement cksum of struct */ uint8_t icmp_ad_num; /* # of following router addresses */ uint8_t icmp_ad_asize; /* 2--words in each advertisement */ uint16_t icmp_ad_life; /* seconds of validity */ struct icmp_ad_info { in_addr_t icmp_ad_addr; uint32_t icmp_ad_pref; } icmp_ad_info[1]; }; /* router solicitation ICMP packet */ struct icmp_so { uint8_t icmp_type; /* type of message */ uint8_t icmp_code; /* type sub code */ uint16_t icmp_cksum; /* ones complement cksum of struct */ uint32_t icmp_so_rsvd; }; union ad_u { struct icmp icmp; struct icmp_ad ad; struct icmp_so so; }; int rdisc_sock = -1; /* router-discovery raw socket */ static struct interface *rdisc_sock_interface; /* current rdisc interface */ struct timeval rdisc_timer; boolean_t rdisc_ok; /* using solicited route */ #define MAX_ADS 16 int max_ads; /* at least one per interface */ /* accumulated advertisements */ static struct dr *cur_drp, *drs; /* * adjust unsigned preference by interface metric, * without driving it to infinity */ #define PREF(p, ifp) ((p) <= (uint32_t)(ifp)->int_metric ? ((p) != 0 ? 1 : 0) \ : (p) - ((ifp)->int_metric)) static void rdisc_sort(void); typedef enum { unicast, bcast, mcast } dstaddr_t; /* dump an ICMP Router Discovery Advertisement Message */ static void trace_rdisc(const char *act, uint32_t from, uint32_t to, struct interface *ifp, union ad_u *p, uint_t len) { int i; n_long *wp, *lim; if (!TRACEPACKETS || ftrace == 0) return; lastlog(); if (p->icmp.icmp_type == ICMP_ROUTERADVERT) { (void) fprintf(ftrace, "%s Router Ad" " from %s to %s via %s life=%d\n", act, naddr_ntoa(from), naddr_ntoa(to), ifp ? ifp->int_name : "?", ntohs(p->ad.icmp_ad_life)); if (!TRACECONTENTS) return; wp = &p->ad.icmp_ad_info[0].icmp_ad_addr; lim = &wp[(len - sizeof (p->ad)) / sizeof (*wp)]; for (i = 0; i < p->ad.icmp_ad_num && wp <= lim; i++) { (void) fprintf(ftrace, "\t%s preference=%ld", naddr_ntoa(wp[0]), (long)ntohl(wp[1])); wp += p->ad.icmp_ad_asize; } (void) fputc('\n', ftrace); } else { trace_act("%s Router Solic. from %s to %s via %s rsvd=%#x", act, naddr_ntoa(from), naddr_ntoa(to), ifp ? ifp->int_name : "?", ntohl(p->so.icmp_so_rsvd)); } } /* * Prepare Router Discovery socket. */ static void get_rdisc_sock(void) { int on = 1; unsigned char ttl = 1; if (rdisc_sock < 0) { max_ads = MAX_ADS; drs = rtmalloc(max_ads * sizeof (struct dr), "get_rdisc_sock"); (void) memset(drs, 0, max_ads * sizeof (struct dr)); rdisc_sock = socket(PF_INET, SOCK_RAW, IPPROTO_ICMP); if (rdisc_sock < 0) BADERR(_B_TRUE, "rdisc_sock = socket()"); fix_sock(rdisc_sock, "rdisc_sock"); if (setsockopt(rdisc_sock, IPPROTO_IP, IP_RECVIF, &on, sizeof (on))) BADERR(_B_FALSE, "setsockopt(IP_RECVIF)"); if (setsockopt(rdisc_sock, IPPROTO_IP, IP_MULTICAST_TTL, &ttl, sizeof (ttl)) < 0) DBGERR(_B_TRUE, "rdisc_sock setsockopt(IP_MULTICAST_TTL)"); fix_select(); } } /* * Pick multicast group for router-discovery socket */ void set_rdisc_mg(struct interface *ifp, int on) /* 0=turn it off */ { struct ip_mreq m; boolean_t dosupply; if (rdisc_sock < 0) { /* * Create the raw socket so that we can hear at least * broadcast router discovery packets. */ if ((ifp->int_state & IS_NO_RDISC) == IS_NO_RDISC || !on) return; get_rdisc_sock(); } if (!(ifp->int_if_flags & IFF_MULTICAST)) { /* Can't multicast, so no groups could have been joined. */ ifp->int_state &= ~(IS_ALL_HOSTS | IS_ALL_ROUTERS); return; } dosupply = should_supply(ifp); (void) memset(&m, 0, sizeof (m)); m.imr_interface.s_addr = ((ifp->int_if_flags & IFF_POINTOPOINT) && (ifp->int_dstaddr != 0) ? ifp->int_dstaddr : ifp->int_addr); if (dosupply || (ifp->int_state & IS_NO_ADV_IN) || !on) { /* stop listening to advertisements */ if (ifp->int_state & IS_ALL_HOSTS) { m.imr_multiaddr.s_addr = htonl(INADDR_ALLHOSTS_GROUP); if (setsockopt(rdisc_sock, IPPROTO_IP, IP_DROP_MEMBERSHIP, &m, sizeof (m)) < 0 && errno != EADDRNOTAVAIL && errno != ENOENT) LOGERR("IP_DROP_MEMBERSHIP ALLHOSTS"); ifp->int_state &= ~IS_ALL_HOSTS; } } else if (!(ifp->int_state & IS_ALL_HOSTS)) { /* start listening to advertisements */ m.imr_multiaddr.s_addr = htonl(INADDR_ALLHOSTS_GROUP); if (setsockopt(rdisc_sock, IPPROTO_IP, IP_ADD_MEMBERSHIP, &m, sizeof (m)) < 0) { LOGERR("IP_ADD_MEMBERSHIP ALLHOSTS"); } else { ifp->int_state |= IS_ALL_HOSTS; } } if (!dosupply || (ifp->int_state & IS_NO_ADV_OUT) || !IS_IFF_ROUTING(ifp->int_if_flags) || !on) { /* stop listening to solicitations */ if (ifp->int_state & IS_ALL_ROUTERS) { m.imr_multiaddr.s_addr = htonl(INADDR_ALLRTRS_GROUP); if (setsockopt(rdisc_sock, IPPROTO_IP, IP_DROP_MEMBERSHIP, &m, sizeof (m)) < 0 && errno != EADDRNOTAVAIL && errno != ENOENT) LOGERR("IP_DROP_MEMBERSHIP ALLROUTERS"); ifp->int_state &= ~IS_ALL_ROUTERS; } } else if (!(ifp->int_state & IS_ALL_ROUTERS)) { /* start hearing solicitations */ m.imr_multiaddr.s_addr = htonl(INADDR_ALLRTRS_GROUP); if (setsockopt(rdisc_sock, IPPROTO_IP, IP_ADD_MEMBERSHIP, &m, sizeof (m)) < 0) { LOGERR("IP_ADD_MEMBERSHIP ALLROUTERS"); } else { ifp->int_state |= IS_ALL_ROUTERS; } } } /* * start or stop supplying routes to other systems. */ void set_supplier(void) { struct interface *ifp; struct dr *drp; static boolean_t supplystate = _B_FALSE; if (supplystate == (fwd_interfaces > 1)) return; supplystate = fwd_interfaces > 1; trace_act("%d forwarding interfaces present; becoming %ssupplier", fwd_interfaces, supplystate ? "" : "non-"); if (supplystate) { /* Forget discovered routes. */ for (drp = drs; drp < &drs[max_ads]; drp++) { drp->dr_recv_pref = DEF_PREFERENCELEVEL; drp->dr_life = 0; } rdisc_age(0); /* * Do not start advertising until we have heard some * RIP routes. */ LIM_SEC(rdisc_timer, now.tv_sec+MIN_WAITTIME); /* get rid of any redirects */ del_redirects(0, 0); } else { /* * Flush out all those advertisements we had sent by sending * one with lifetime=0. */ rdisc_adv(_B_TRUE); } /* * Switch router discovery multicast groups from soliciting * to advertising or back. */ for (ifp = ifnet; ifp; ifp = ifp->int_next) { if (ifp->int_state & IS_BROKE) continue; ifp->int_rdisc_cnt = 0; ifp->int_rdisc_timer.tv_usec = rdisc_timer.tv_usec; ifp->int_rdisc_timer.tv_sec = now.tv_sec+MIN_WAITTIME; set_rdisc_mg(ifp, 1); } } /* * Age discovered routes and find the best one */ void rdisc_age(in_addr_t bad_gate) { time_t sec; struct dr *drp; struct rt_spare new; struct rt_entry *rt; /* * If we are being told about a bad router, * then age the discovered default route, and if there is * no alternative, solicit a replacement. */ if (bad_gate != 0) { /* * Look for the bad discovered default route. * Age it and note its interface. */ for (drp = drs; drp < &drs[max_ads]; drp++) { if (drp->dr_ts == 0) continue; /* * When we find the bad router, age the route * to at most SUPPLY_INTERVAL. * This is contrary to RFC 1256, but defends against * black holes. */ if (drp->dr_gate == bad_gate) { sec = (now.tv_sec - drp->dr_life + SUPPLY_INTERVAL); if (drp->dr_ts > sec) { trace_act("age 0.0.0.0 --> %s via %s", naddr_ntoa(drp->dr_gate), drp->dr_ifp->int_name); drp->dr_ts = sec; } break; } } } else if (should_supply(NULL)) { /* * If switching from client to server, get rid of old * default routes. */ if (cur_drp != NULL) { rt = rtget(RIP_DEFAULT, 0); /* * If there is a current default router, and the * there is no rt_spare entry, create one * for cur_drp to prevent segmentation fault * at rdisc_sort. */ if (rt == NULL) { (void) memset(&new, 0, sizeof (new)); new.rts_ifp = cur_drp->dr_ifp; new.rts_gate = cur_drp->dr_gate; new.rts_router = cur_drp->dr_gate; new.rts_metric = HOPCNT_INFINITY-1; new.rts_time = now.tv_sec; new.rts_origin = RO_RDISC; rtadd(RIP_DEFAULT, 0, RS_NOPROPAGATE, &new); } rdisc_sort(); } rdisc_adv(_B_FALSE); } rdisc_sol(); if (cur_drp != NULL) { rt = rtget(RIP_DEFAULT, 0); if (rt == NULL) { (void) memset(&new, 0, sizeof (new)); new.rts_ifp = cur_drp->dr_ifp; new.rts_gate = cur_drp->dr_gate; new.rts_router = cur_drp->dr_gate; new.rts_metric = HOPCNT_INFINITY-1; new.rts_time = now.tv_sec; new.rts_origin = RO_RDISC; rtadd(RIP_DEFAULT, 0, RS_NOPROPAGATE, &new); } } rdisc_sort(); /* * Delete old redirected routes to keep the kernel table small, * and to prevent black holes. Check that the kernel table * matches the daemon table (i.e. has the default route). * But only if RIP is not running and we are not dealing with * a bad gateway, since otherwise age() will be called. */ if (rip_sock < 0 && bad_gate == 0) age(0); } /* * Zap all routes discovered via an interface that has gone bad * This should only be called when !(ifp->int_state & IS_DUP) * This is called by if_del and if_bad, and the interface pointer * might not be valid after this. */ void if_bad_rdisc(struct interface *ifp) { struct dr *drp; for (drp = drs; drp < &drs[max_ads]; drp++) { if (drp->dr_ifp != ifp) continue; (void) memset(drp, 0, sizeof (*drp)); } /* make a note to re-solicit, turn RIP on or off, etc. */ rdisc_timer.tv_sec = 0; } /* * Rewire all routes discovered via an interface that has gone bad * This is only called by if_del. */ void if_rewire_rdisc(struct interface *oldifp, struct interface *newifp) { struct dr *drp; for (drp = drs; drp < &drs[max_ads]; drp++) { if (drp->dr_ifp != oldifp) continue; drp->dr_ifp = newifp; drp->dr_pref += (newifp->int_metric - oldifp->int_metric); drp->dr_flags |= DR_CHANGED; } /* make a note to re-solicit, turn RIP on or off, etc. */ rdisc_timer.tv_sec = 0; } /* * Mark an interface ok for router discovering. * This is called by if_ok and ifinit. */ void if_ok_rdisc(struct interface *ifp) { set_rdisc_mg(ifp, 1); ifp->int_rdisc_cnt = 0; ifp->int_rdisc_timer.tv_sec = now.tv_sec + ((ifp->int_state & IS_NO_ADV_OUT) ? MAX_SOLICITATION_DELAY : MIN_WAITTIME); if (timercmp(&rdisc_timer, &ifp->int_rdisc_timer, > /* cstyle */)) rdisc_timer = ifp->int_rdisc_timer; } /* * Get rid of a dead discovered router */ static void del_rdisc(struct dr *drp) { struct interface *ifp; uint32_t gate; int i; struct rt_entry *rt; struct rt_spare *rts = NULL; del_redirects(gate = drp->dr_gate, 0); drp->dr_ts = 0; drp->dr_life = 0; rt = rtget(RIP_DEFAULT, 0); if (rt == NULL) { trace_act("could not find default route in table"); } else { for (i = 0; i < rt->rt_num_spares; i++) { if ((rt->rt_spares[i].rts_gate == drp->dr_gate) && (rt->rt_spares[i].rts_origin == RO_RDISC)) { rts = &rt->rt_spares[i]; break; } } if (rts != NULL) rts_delete(rt, rts); else trace_act("could not find default route " "through %s in table", naddr_ntoa(drp->dr_gate)); } /* Count the other discovered routers on the interface. */ i = 0; ifp = drp->dr_ifp; for (drp = drs; drp < &drs[max_ads]; drp++) { if (drp->dr_ts != 0 && drp->dr_ifp == ifp) i++; } /* * If that was the last good discovered router on the interface, * then solicit a new one. * This is contrary to RFC 1256, but defends against black holes. */ if (i != 0) { trace_act("discovered router %s via %s" " is bad--have %d remaining", naddr_ntoa(gate), ifp->int_name, i); } else if (ifp->int_rdisc_cnt >= MAX_SOLICITATIONS) { trace_act("last discovered router %s via %s" " is bad--re-solicit", naddr_ntoa(gate), ifp->int_name); ifp->int_rdisc_cnt = 0; ifp->int_rdisc_timer.tv_sec = 0; rdisc_sol(); } else { trace_act("last discovered router %s via %s" " is bad--wait to solicit", naddr_ntoa(gate), ifp->int_name); } } /* Find the best discovered route, and discard stale routers. */ static void rdisc_sort(void) { struct dr *drp, *new_drp; struct rt_entry *rt; struct rt_spare new, *rts; struct interface *ifp; uint_t new_st = 0; uint32_t new_pref = DEF_PREFERENCELEVEL; int first_rdisc_slot = 0; int j; boolean_t spares_avail; void *ptr; size_t ptrsize; rt = rtget(RIP_DEFAULT, 0); /* * If all the rt_spare entries are taken up with with default routes * learnt from RIP (ie rts_origin = RO_RIP), bail out. * NOTE: * We *always* prefer default routes learned via RIP * (ie RO_RIP) over those learnt via RDISC (ie RO_RDISC). * The rdisc machinery should not modify, replace or * remove any existing default routes with RO_RIP set. */ if (rt != NULL) { spares_avail = _B_FALSE; for (j = 0; j < rt->rt_num_spares; j++) { rts = &rt->rt_spares[j]; if (rts->rts_gate == 0 || rts->rts_origin != RO_RIP || rts->rts_ifp == &dummy_ifp) { spares_avail = _B_TRUE; break; } } if (!spares_avail) { ptrsize = (rt->rt_num_spares + SPARE_INC) * sizeof (struct rt_spare); ptr = realloc(rt->rt_spares, ptrsize); if (ptr != NULL) { struct rt_spare *tmprts; rt->rt_spares = ptr; rts = &rt->rt_spares[rt->rt_num_spares]; (void) memset(rts, 0, (SPARE_INC * sizeof (struct rt_spare))); rt->rt_num_spares += SPARE_INC; for (tmprts = rts, j = SPARE_INC; j != 0; j--, tmprts++) tmprts->rts_metric = HOPCNT_INFINITY; spares_avail = _B_TRUE; } else { return; } } } /* Find the best RDISC advertiser */ rt = NULL; new_drp = NULL; for (drp = drs; drp < &drs[max_ads]; drp++) { if (drp->dr_ts == 0) continue; ifp = drp->dr_ifp; /* Get rid of expired discovered routers. */ if (drp->dr_ts + drp->dr_life <= now.tv_sec) { del_rdisc(drp); continue; } LIM_SEC(rdisc_timer, drp->dr_ts+drp->dr_life); /* * Update preference with possibly changed interface * metric. */ drp->dr_pref = PREF(drp->dr_recv_pref, ifp); /* * Prefer the current route to prevent thrashing. * Prefer shorter lifetimes to speed the detection of * bad routers. * Avoid sick interfaces. */ if (new_drp == NULL || (!((new_st ^ drp->dr_ifp->int_state) & IS_SICK) && (new_pref < drp->dr_pref || (new_pref == drp->dr_pref && (drp == cur_drp || (new_drp != cur_drp && new_drp->dr_life > drp->dr_life))))) || ((new_st & IS_SICK) && !(drp->dr_ifp->int_state & IS_SICK))) { new_drp = drp; new_st = drp->dr_ifp->int_state; new_pref = drp->dr_pref; } } /* * switch to a better RDISC advertiser */ if ((new_drp != cur_drp) || (rt == NULL)) { rt = rtget(RIP_DEFAULT, 0); /* * Purge the table of all the default routes that were * learnt via RDISC, while keeping an eye the first available * slot for the spare entry of new_drp */ if (rt != NULL) { int i; for (i = 0; i < rt->rt_num_spares; i++) { rts = &rt->rt_spares[i]; if ((rts->rts_gate == 0 || rts->rts_ifp == &dummy_ifp) && first_rdisc_slot == 0) first_rdisc_slot = i; if (rts->rts_origin == RO_RDISC) { rts_delete(rt, rts); if (first_rdisc_slot == 0) { first_rdisc_slot = i; } } } } /* Stop using RDISC routes if they are all bad */ if (new_drp == NULL) { trace_act("turn off Router Discovery client"); rdisc_ok = _B_FALSE; } else { if (cur_drp == NULL) { trace_act("turn on Router Discovery client" " using %s via %s", naddr_ntoa(new_drp->dr_gate), new_drp->dr_ifp->int_name); rdisc_ok = _B_TRUE; } /* Prepare a spare entry for the new_drp */ (void) memset(&new, 0, sizeof (new)); new.rts_ifp = new_drp->dr_ifp; new.rts_gate = new_drp->dr_gate; new.rts_router = new_drp->dr_gate; new.rts_metric = HOPCNT_INFINITY-1; new.rts_time = now.tv_sec; new.rts_origin = RO_RDISC; /* * If there is no existing default route, add it * to rts_spare[0]. */ if (rt == NULL) { rtadd(RIP_DEFAULT, 0, RS_NOPROPAGATE, &new); } else { /* * Add the spare entry for the new_drp in * the first available slot */ trace_act("Switching to " "default router with better " "preference %s via %s ", naddr_ntoa(new_drp->dr_gate), new_drp->dr_ifp->int_name); rt->rt_spares[first_rdisc_slot] = new; rt = NULL; /* redo rt_spares */ } } /* * Get ready to redo the entire table. The table should * only include : * a. empty rt_spare slots * b. default routes learnt via RIP * c. default route for the latest best RDISC advertiser * d. default routes of other RDISC advertisers whose * dr_pref == best RDISC advertiser->dr_pref */ cur_drp = new_drp; } /* Redo the entire spare table (without touching RO_RIP entries) */ if (rdisc_ok && rt == NULL) { int i; /* * We've either just turned on router discovery, * or switched to a router with better preference. * Find all other default routers whose * pref == cur_drp->dr_pref and add them as spares */ rt = rtget(RIP_DEFAULT, 0); for (drp = drs; drp < &drs[max_ads]; drp++) { boolean_t dr_done = _B_FALSE; int slot = -1; if (drp->dr_ts == 0) continue; if (drp->dr_pref != cur_drp->dr_pref && ((drp->dr_flags & DR_CHANGED) == 0)) continue; /* * Either pref matches cur_drp->dr_pref, * or something has changed in this drp. * In the former case, we may need to add * this to rt_spares. In the latter case, * if the pref has changed, need to take it * out of rt_spares and the kernel. * * First, find an empty slot in rt_spares * in case we have to add this drp to kernel. * Also check if it is already there. */ for (i = 0; i < rt->rt_num_spares; i++) { if (rt->rt_spares[i].rts_gate == 0) { if (slot < 0) slot = i; continue; } if ((rt->rt_spares[i].rts_gate == drp->dr_gate) && (rt->rt_spares[i].rts_origin == RO_RDISC)) { /* * a spare entry for this RDISC * advertiser already exists. We need * to check if this entry still belongs * in the table */ dr_done = _B_TRUE; break; } } drp->dr_flags &= ~DR_CHANGED; if (drp->dr_pref != cur_drp->dr_pref) { if (dr_done) { /* * The rt_spare of this RDISC advertiser * needs to be removed as it no longer * belongs in the table because its * dr_pref is different than the latest * RDISC advertiser's->dr_pref */ rts_delete(rt, &rt->rt_spares[i]); } continue; } if (slot < 0 && !dr_done) { ptrsize = (rt->rt_num_spares + SPARE_INC) * sizeof (struct rt_spare); ptr = realloc(rt->rt_spares, ptrsize); if (ptr != NULL) { struct rt_spare *tmprts; rt->rt_spares = ptr; slot = rt->rt_num_spares; rts = &rt->rt_spares[rt->rt_num_spares]; (void) memset(rts, 0, (SPARE_INC * sizeof (struct rt_spare))); rt->rt_num_spares += SPARE_INC; for (tmprts = rts, i = SPARE_INC; i != 0; i--, tmprts++) tmprts->rts_metric = HOPCNT_INFINITY; } } if (slot >= 0 && (dr_done != _B_TRUE)) { (void) memset(&new, 0, sizeof (new)); new.rts_ifp = drp->dr_ifp; new.rts_gate = drp->dr_gate; new.rts_router = drp->dr_gate; new.rts_metric = HOPCNT_INFINITY-1; new.rts_time = now.tv_sec; new.rts_origin = RO_RDISC; rt->rt_spares[slot] = new; trace_act("spare default %s via %s", naddr_ntoa(drp->dr_gate), drp->dr_ifp->int_name); } } } /* turn RIP on or off */ if (!rdisc_ok || rip_interfaces > 1) { rip_on(0); } else { rip_off(); } } /* Handle a single address in an advertisement */ static void parse_ad(uint32_t from, in_addr_t gate, uint32_t pref, /* signed and in network order */ ushort_t life, /* in host byte order */ struct interface *ifp) { static struct msg_limit bad_gate; struct dr *drp, *new_drp; void *ptr; size_t ptrsize; if (gate == RIP_DEFAULT || !check_dst(gate)) { msglim(&bad_gate, from, "router %s advertising bad gateway %s", naddr_ntoa(from), naddr_ntoa(gate)); return; } /* * ignore pointers to ourself and routes via unreachable networks */ if (ifwithaddr(gate, _B_TRUE, _B_FALSE) != 0) { trace_pkt(" discard Router Discovery Ad pointing at us"); return; } if (!on_net(gate, ifp->int_net, ifp->int_mask)) { trace_pkt(" discard Router Discovery Ad" " toward unreachable net"); return; } /* * Convert preference to an unsigned value * and later bias it by the metric of the interface. */ pref = UNSIGN_PREF(ntohl(pref)); if (pref == DEF_PREFERENCELEVEL || life < MIN_MAXADVERTISEINTERVAL) { pref = DEF_PREFERENCELEVEL; life = 0; } for (new_drp = NULL, drp = drs; drp < &drs[max_ads]; drp++) { /* accept new info for a familiar entry */ if ((drp->dr_gate == gate) && (drp->dr_ifp == ifp)) { new_drp = drp; drp->dr_flags |= DR_CHANGED; break; } if (life == 0) continue; /* do not worry about dead ads */ if (drp->dr_ts == 0) { new_drp = drp; /* use unused entry */ } else if (new_drp == NULL) { /* look for an entry worse than the new one to reuse. */ if ((!(ifp->int_state & IS_SICK) && (drp->dr_ifp->int_state & IS_SICK)) || (pref > drp->dr_pref && !((ifp->int_state ^ drp->dr_ifp->int_state) & IS_SICK))) new_drp = drp; } else if (new_drp->dr_ts != 0) { /* look for the least valuable entry to reuse */ if ((!(new_drp->dr_ifp->int_state & IS_SICK) && (drp->dr_ifp->int_state & IS_SICK)) || (new_drp->dr_pref > drp->dr_pref && !((new_drp->dr_ifp->int_state ^ drp->dr_ifp->int_state) & IS_SICK))) new_drp = drp; } } /* if all of the current entries are better, add more drs[] */ if (new_drp == NULL) { ptrsize = (max_ads + MAX_ADS) * sizeof (struct dr); ptr = realloc(drs, ptrsize); if (ptr == NULL) return; drs = ptr; (void) memset(&drs[max_ads], 0, MAX_ADS * sizeof (struct dr)); new_drp = &drs[max_ads]; max_ads += MAX_ADS; } /* * Pointer copy is safe here because if_del * calls if_bad_rdisc first, so a non-NULL df_ifp * is always a valid pointer. */ new_drp->dr_ifp = ifp; new_drp->dr_gate = gate; new_drp->dr_ts = now.tv_sec; new_drp->dr_life = life; new_drp->dr_recv_pref = pref; /* bias functional preference by metric of the interface */ new_drp->dr_pref = PREF(pref, ifp); /* after hearing a good advertisement, stop asking */ if (!(ifp->int_state & IS_SICK)) ifp->int_rdisc_cnt = MAX_SOLICITATIONS; } /* * Compute the IP checksum. This assumes the packet is less than 32K long. */ static uint16_t in_cksum(uint16_t *p, uint_t len) { uint32_t sum = 0; int nwords = len >> 1; while (nwords-- != 0) sum += *p++; if (len & 1) sum += *(uchar_t *)p; /* end-around-carry */ sum = (sum >> 16) + (sum & 0xffff); sum += (sum >> 16); return (~sum); } /* Send a router discovery advertisement or solicitation ICMP packet. */ static void send_rdisc(union ad_u *p, uint_t p_size, struct interface *ifp, in_addr_t dst, /* 0 or unicast destination */ dstaddr_t type) { struct sockaddr_in sin; int flags = 0; const char *msg; int ifindex; struct in_addr addr; /* * Don't send Rdisc packets on duplicate interfaces, we * don't want to generate duplicate packets. */ if (ifp->int_state & IS_DUP) return; (void) memset(&sin, 0, sizeof (sin)); sin.sin_addr.s_addr = dst; sin.sin_family = AF_INET; switch (type) { case unicast: /* unicast */ default: flags = MSG_DONTROUTE; msg = "Send"; break; case bcast: /* broadcast */ if (ifp->int_if_flags & IFF_POINTOPOINT) { msg = "Send pt-to-pt"; if (ifp->int_dstaddr == 0) sin.sin_addr.s_addr = htonl(INADDR_BROADCAST); else sin.sin_addr.s_addr = ifp->int_dstaddr; } else { msg = "Send broadcast"; sin.sin_addr.s_addr = ifp->int_brdaddr; } break; case mcast: /* multicast */ msg = "Send multicast"; break; } if (rdisc_sock < 0) get_rdisc_sock(); if (rdisc_sock_interface != ifp) { /* select the right interface. */ ifindex = (type != mcast && ifp->int_phys != NULL) ? ifp->int_phys->phyi_index : 0; if (setsockopt(rdisc_sock, IPPROTO_IP, IP_XMIT_IF, &ifindex, sizeof (ifindex)) == -1) { LOGERR("setsockopt(rdisc_sock, IP_XMIT_IF)"); return; } /* * For multicast, we have to choose the source * address. This is either the local address * (non-point-to-point) or the remote address. */ addr.s_addr = (ifp->int_if_flags & IFF_POINTOPOINT) ? ifp->int_dstaddr : ifp->int_addr; if (type == mcast && setsockopt(rdisc_sock, IPPROTO_IP, IP_MULTICAST_IF, &addr, sizeof (addr)) == -1) { LOGERR("setsockopt(rdisc_sock, IP_MULTICAST_IF)"); return; } rdisc_sock_interface = ifp; } trace_rdisc(msg, ifp->int_addr, sin.sin_addr.s_addr, ifp, p, p_size); if (0 > sendto(rdisc_sock, p, p_size, flags, (struct sockaddr *)&sin, sizeof (sin))) { if (!(ifp->int_state & IS_BROKE)) writelog(LOG_WARNING, "sendto(%s%s%s): %s", ifp->int_name, ", ", inet_ntoa(sin.sin_addr), rip_strerror(errno)); if (ifp != NULL) if_sick(ifp, _B_FALSE); } } /* Send an advertisement */ static void send_adv(struct interface *ifp, in_addr_t dst, dstaddr_t type) { union ad_u u; if ((ifp->int_state & (IS_SUPPRESS_RDISC|IS_FLUSH_RDISC)) == IS_SUPPRESS_RDISC) return; (void) memset(&u, 0, sizeof (u.ad)); u.ad.icmp_type = ICMP_ROUTERADVERT; u.ad.icmp_code = ICMP_ROUTERADVERT_COMMON; u.ad.icmp_ad_num = 1; u.ad.icmp_ad_asize = sizeof (u.ad.icmp_ad_info[0])/4; u.ad.icmp_ad_life = (stopint || !should_supply(ifp) || (ifp->int_state & IS_SUPPRESS_RDISC)) ? 0 : htons(ifp->int_rdisc_int*3); /* Send the configured preference as a network byte order value */ u.ad.icmp_ad_info[0].icmp_ad_pref = htonl(ifp->int_rdisc_pref); u.ad.icmp_ad_info[0].icmp_ad_addr = ifp->int_addr; u.ad.icmp_cksum = in_cksum((uint16_t *)&u.ad, sizeof (u.ad)); send_rdisc(&u, sizeof (u.ad), ifp, dst, type); if (ifp->int_state & IS_SUPPRESS_RDISC) ifp->int_state &= ~IS_FLUSH_RDISC; } /* Advertise as a default router by way of router discovery. */ void rdisc_adv(boolean_t forceadv) { struct interface *ifp; if (!forceadv && !should_supply(NULL)) return; rdisc_timer.tv_sec = now.tv_sec + NEVER; for (ifp = ifnet; ifp; ifp = ifp->int_next) { if ((ifp->int_state & (IS_NO_ADV_OUT | IS_BROKE)) || (!forceadv && !IS_IFF_ROUTING(ifp->int_if_flags))) continue; /* skip interfaces we shouldn't use */ if (IS_IFF_QUIET(ifp->int_if_flags)) continue; if (!timercmp(&ifp->int_rdisc_timer, &now, > /* cstyle */) || stopint != 0 || forceadv) { send_adv(ifp, htonl(INADDR_ALLHOSTS_GROUP), (ifp->int_state & IS_BCAST_RDISC) ? 1 : 2); ifp->int_rdisc_cnt++; intvl_random(&ifp->int_rdisc_timer, (ifp->int_rdisc_int*3)/4, ifp->int_rdisc_int); if (ifp->int_rdisc_cnt < MAX_INITIAL_ADVERTS && (ifp->int_rdisc_timer.tv_sec > MAX_INITIAL_ADVERT_INTERVAL)) { ifp->int_rdisc_timer.tv_sec = MAX_INITIAL_ADVERT_INTERVAL; } timevaladd(&ifp->int_rdisc_timer, &now); } if (timercmp(&rdisc_timer, &ifp->int_rdisc_timer, > /* cstyle */)) rdisc_timer = ifp->int_rdisc_timer; } } /* Solicit for Router Discovery */ void rdisc_sol(void) { struct interface *ifp; union ad_u u; if (should_supply(NULL)) return; rdisc_timer.tv_sec = now.tv_sec + NEVER; for (ifp = ifnet; ifp; ifp = ifp->int_next) { if (0 != (ifp->int_state & (IS_NO_SOL_OUT | IS_BROKE)) || ifp->int_rdisc_cnt >= MAX_SOLICITATIONS) continue; /* skip interfaces we shouldn't use */ if (IS_IFF_QUIET(ifp->int_if_flags)) continue; if (!timercmp(&ifp->int_rdisc_timer, &now, > /* cstyle */)) { (void) memset(&u, 0, sizeof (u.so)); u.so.icmp_type = ICMP_ROUTERSOLICIT; u.so.icmp_cksum = in_cksum((uint16_t *)&u.so, sizeof (u.so)); send_rdisc(&u, sizeof (u.so), ifp, htonl(INADDR_ALLRTRS_GROUP), ((ifp->int_state&IS_BCAST_RDISC) ? bcast : mcast)); if (++ifp->int_rdisc_cnt >= MAX_SOLICITATIONS) continue; ifp->int_rdisc_timer.tv_sec = SOLICITATION_INTERVAL; ifp->int_rdisc_timer.tv_usec = 0; timevaladd(&ifp->int_rdisc_timer, &now); } if (timercmp(&rdisc_timer, &ifp->int_rdisc_timer, > /* cstyle */)) rdisc_timer = ifp->int_rdisc_timer; } } /* * check the IP header of a possible Router Discovery ICMP packet * Returns 0 if bad */ static struct interface * ck_icmp(const char *act, in_addr_t from, struct interface *ifp, in_addr_t to, union ad_u *p, uint_t len) { const char *type; if (p->icmp.icmp_type == ICMP_ROUTERADVERT) { type = "advertisement"; if (p->icmp.icmp_code == ICMP_ROUTERADVERT_NOCOMMON) return (NULL); /* Mobile IP */ } else if (p->icmp.icmp_type == ICMP_ROUTERSOLICIT) { type = "solicitation"; } else { return (NULL); } if (p->icmp.icmp_code != ICMP_ROUTERADVERT_COMMON) { trace_pkt("unrecognized ICMP Router %s code=%d from %s to %s", type, p->icmp.icmp_code, naddr_ntoa(from), naddr_ntoa(to)); return (NULL); } trace_rdisc(act, from, to, ifp, p, len); if (ifp == NULL) trace_pkt("unknown interface for router-discovery %s from %s " "to %s", type, naddr_ntoa(from), naddr_ntoa(to)); return (ifp); } /* Read packets from the router discovery socket */ void read_d(void) { #define PKTLEN 512 static struct msg_limit bad_asize, bad_len; struct sockaddr_in from; int n, cc, hlen; struct { union { struct ip ip; uint16_t s[PKTLEN/sizeof (uint16_t)]; uint8_t b[PKTLEN/sizeof (uint8_t)]; } pkt; } buf; union ad_u *p; n_long *wp; struct interface *ifp; boolean_t needsort = _B_FALSE; struct msghdr msg; struct iovec iov; uint8_t ancillary_data[CONTROL_BUFSIZE]; iov.iov_base = &buf; iov.iov_len = sizeof (buf); msg.msg_iov = &iov; msg.msg_iovlen = 1; msg.msg_name = &from; msg.msg_control = &ancillary_data; for (;;) { msg.msg_namelen = sizeof (from); msg.msg_controllen = sizeof (ancillary_data); cc = recvmsg(rdisc_sock, &msg, 0); if (cc <= 0) { if (cc < 0 && errno != EWOULDBLOCK) LOGERR("recvmsg(rdisc_sock)"); break; } hlen = buf.pkt.ip.ip_hl << 2; if (cc < hlen + ICMP_MINLEN) continue; /* LINTED [alignment will be lw aligned] */ p = (union ad_u *)&buf.pkt.b[hlen]; cc -= hlen; /* * If we could tell the interface on which a packet from * address 0 arrived, we could deal with such solicitations. */ ifp = receiving_interface(&msg, _B_FALSE); ifp = ck_icmp("Recv", from.sin_addr.s_addr, ifp, buf.pkt.ip.ip_dst.s_addr, p, cc); if (ifp == NULL) continue; if (IS_IFF_QUIET(ifp->int_if_flags)) { trace_misc("discard RDISC packet received over %s, %X", ifp->int_name, ifp->int_if_flags); continue; } if (from.sin_addr.s_addr != 0 && ifwithaddr(from.sin_addr.s_addr, _B_FALSE, _B_FALSE)) { trace_pkt(" " "discard our own Router Discovery message"); continue; } /* The remote address *must* be directly connected. */ if (!remote_address_ok(ifp, from.sin_addr.s_addr)) { trace_misc("discard rdisc message; source %s not on " "interface %s", naddr_ntoa(from.sin_addr.s_addr), ifp->int_name); continue; } switch (p->icmp.icmp_type) { case ICMP_ROUTERADVERT: if (ifp->int_state & IS_NO_ADV_IN) continue; if (p->ad.icmp_ad_asize*2*sizeof (wp[0]) < sizeof (p->ad.icmp_ad_info[0])) { msglim(&bad_asize, from.sin_addr.s_addr, "intolerable rdisc address size=%d", p->ad.icmp_ad_asize); continue; } if (p->ad.icmp_ad_num == 0) { trace_pkt(" empty?"); continue; } if (cc < (sizeof (p->ad) - sizeof (p->ad.icmp_ad_info) + (p->ad.icmp_ad_num * sizeof (p->ad.icmp_ad_info[0])))) { msglim(&bad_len, from.sin_addr.s_addr, "rdisc length %d does not match ad_num" " %d", cc, p->ad.icmp_ad_num); continue; } needsort = _B_TRUE; wp = &p->ad.icmp_ad_info[0].icmp_ad_addr; for (n = 0; n < p->ad.icmp_ad_num; n++) { parse_ad(from.sin_addr.s_addr, wp[0], wp[1], ntohs(p->ad.icmp_ad_life), ifp); wp += p->ad.icmp_ad_asize; } break; case ICMP_ROUTERSOLICIT: if (!should_supply(ifp)) continue; if ((ifp->int_state & IS_NO_ADV_OUT) || !IS_IFF_ROUTING(ifp->int_if_flags)) continue; if (stopint != 0) continue; /* * We should handle messages from address 0, * but cannot due to kernel limitations. */ /* Respond with a point-to-point advertisement */ send_adv(ifp, from.sin_addr.s_addr, 0); break; } } if (needsort) rdisc_sort(); } void rdisc_dump(void) { struct dr *drp; for (drp = drs; drp < &drs[max_ads]; drp++) if (drp->dr_ts != 0) trace_dr(drp); } void rdisc_suppress(struct interface *ifp) { if (ifp->int_state & IS_ADV_OUT) { msglog("%s \"rdisc_adv\" specified, will not " "suppress rdisc adv", ifp->int_name); } else { if (ifp->int_state & IS_SUPPRESS_RDISC) return; ifp->int_state |= (IS_SUPPRESS_RDISC|IS_FLUSH_RDISC); trace_misc("suppress rdisc adv on %s", ifp->int_name); rdisc_timer.tv_sec = 0; } } void rdisc_restore(struct interface *ifp) { if ((ifp->int_state & IS_SUPPRESS_RDISC) == 0) return; ifp->int_state &= ~(IS_SUPPRESS_RDISC|IS_FLUSH_RDISC); trace_misc("restoring rdisc adv on %s", ifp->int_name); rdisc_timer.tv_sec = 0; }