xref: /illumos-gate/usr/src/cmd/cmd-inet/usr.lib/in.ndpd/main.c (revision bcd524b5c10222cf2a1ef37ac7ea8bf1baa3a2ee)
1 /*
2  * CDDL HEADER START
3  *
4  * The contents of this file are subject to the terms of the
5  * Common Development and Distribution License (the "License").
6  * You may not use this file except in compliance with the License.
7  *
8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9  * or http://www.opensolaris.org/os/licensing.
10  * See the License for the specific language governing permissions
11  * and limitations under the License.
12  *
13  * When distributing Covered Code, include this CDDL HEADER in each
14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15  * If applicable, add the following below this CDDL HEADER, with the
16  * fields enclosed by brackets "[]" replaced with your own identifying
17  * information: Portions Copyright [yyyy] [name of copyright owner]
18  *
19  * CDDL HEADER END
20  */
21 /*
22  * Copyright 2007 Sun Microsystems, Inc.  All rights reserved.
23  * Use is subject to license terms.
24  */
25 
26 #pragma ident	"%Z%%M%	%I%	%E% SMI"
27 
28 #include "defs.h"
29 #include "tables.h"
30 #include <fcntl.h>
31 #include <sys/un.h>
32 
33 static void	initlog(void);
34 static void	run_timeouts(void);
35 
36 static void	advertise(struct sockaddr_in6 *sin6, struct phyint *pi,
37 		    boolean_t no_prefixes);
38 static void	solicit(struct sockaddr_in6 *sin6, struct phyint *pi);
39 static void	initifs(boolean_t first);
40 static void	check_if_removed(struct phyint *pi);
41 static void	loopback_ra_enqueue(struct phyint *pi,
42 		    struct nd_router_advert *ra, int len);
43 static void	loopback_ra_dequeue(void);
44 static void	check_daemonize(void);
45 
46 struct in6_addr all_nodes_mcast = { { 0xff, 0x2, 0x0, 0x0,
47 				    0x0, 0x0, 0x0, 0x0,
48 				    0x0, 0x0, 0x0, 0x0,
49 				    0x0, 0x0, 0x0, 0x1 } };
50 
51 struct in6_addr all_routers_mcast = { { 0xff, 0x2, 0x0, 0x0,
52 				    0x0, 0x0, 0x0, 0x0,
53 				    0x0, 0x0, 0x0, 0x0,
54 				    0x0, 0x0, 0x0, 0x2 } };
55 
56 static struct sockaddr_in6 v6allnodes = { AF_INET6, 0, 0,
57 				    { 0xff, 0x2, 0x0, 0x0,
58 				    0x0, 0x0, 0x0, 0x0,
59 				    0x0, 0x0, 0x0, 0x0,
60 				    0x0, 0x0, 0x0, 0x1 } };
61 
62 static struct sockaddr_in6 v6allrouters = { AF_INET6, 0, 0,
63 				    { 0xff, 0x2, 0x0, 0x0,
64 				    0x0, 0x0, 0x0, 0x0,
65 				    0x0, 0x0, 0x0, 0x0,
66 				    0x0, 0x0, 0x0, 0x2 } };
67 
68 static char **argv0;		/* Saved for re-exec on SIGHUP */
69 
70 static uint64_t packet[(IP_MAXPACKET + 1)/8];
71 
72 static int	show_ifs = 0;
73 static boolean_t	already_daemonized = _B_FALSE;
74 int		debug = 0;
75 int		no_loopback = 0; /* Do not send RA packets to ourselves */
76 
77 /*
78  * Size of routing socket message used by in.ndpd which includes the header,
79  * space for the RTA_DST, RTA_GATEWAY and RTA_NETMASK (each a sockaddr_in6)
80  * plus space for the RTA_IFP (a sockaddr_dl).
81  */
82 #define	NDP_RTM_MSGLEN	sizeof (struct rt_msghdr) +	\
83 			sizeof (struct sockaddr_in6) +	\
84 			sizeof (struct sockaddr_in6) +	\
85 			sizeof (struct sockaddr_in6) +	\
86 			sizeof (struct sockaddr_dl)
87 
88 /*
89  * These are referenced externally in tables.c in order to fill in the
90  * dynamic portions of the routing socket message and then to send the message
91  * itself.
92  */
93 int	rtsock = -1;			/* Routing socket */
94 struct	rt_msghdr	*rt_msg;	/* Routing socket message */
95 struct	sockaddr_in6	*rta_gateway;	/* RTA_GATEWAY sockaddr */
96 struct	sockaddr_dl	*rta_ifp;	/* RTA_IFP sockaddr */
97 int	mibsock = -1;			/* mib request socket */
98 
99 /*
100  * Return the current time in milliseconds truncated to
101  * fit in an integer.
102  */
103 uint_t
104 getcurrenttime(void)
105 {
106 	struct timeval tp;
107 
108 	if (gettimeofday(&tp, NULL) < 0) {
109 		logperror("getcurrenttime: gettimeofday failed");
110 		exit(1);
111 	}
112 	return (tp.tv_sec * 1000 + tp.tv_usec / 1000);
113 }
114 
115 /*
116  * Output a preformated packet from the packet[] buffer.
117  */
118 static void
119 sendpacket(struct sockaddr_in6 *sin6, int sock, int size, int flags)
120 {
121 	int cc;
122 	char abuf[INET6_ADDRSTRLEN];
123 
124 	cc = sendto(sock, (char *)packet, size, flags,
125 		(struct sockaddr *)sin6, sizeof (*sin6));
126 	if (cc < 0 || cc != size) {
127 		if (cc < 0) {
128 			logperror("sendpacket: sendto");
129 		}
130 		logmsg(LOG_ERR, "sendpacket: wrote %s %d chars, ret=%d\n",
131 		    inet_ntop(sin6->sin6_family,
132 		    (void *)&sin6->sin6_addr,
133 		    abuf, sizeof (abuf)),
134 		    size, cc);
135 	}
136 }
137 
138 /* Send a Router Solicitation */
139 static void
140 solicit(struct sockaddr_in6 *sin6, struct phyint *pi)
141 {
142 	int packetlen = 0;
143 	struct	nd_router_solicit *rs = (struct nd_router_solicit *)packet;
144 	char *pptr = (char *)packet;
145 
146 	rs->nd_rs_type = ND_ROUTER_SOLICIT;
147 	rs->nd_rs_code = 0;
148 	rs->nd_rs_cksum = htons(0);
149 	rs->nd_rs_reserved = htonl(0);
150 
151 	packetlen += sizeof (*rs);
152 	pptr += sizeof (*rs);
153 
154 	/* Attach any options */
155 	if (pi->pi_hdw_addr_len != 0) {
156 		struct nd_opt_lla *lo = (struct nd_opt_lla *)pptr;
157 		int optlen;
158 
159 		/* roundup to multiple of 8 and make padding zero */
160 		optlen = ((sizeof (struct nd_opt_hdr) +
161 		    pi->pi_hdw_addr_len + 7) / 8) * 8;
162 		bzero(pptr, optlen);
163 
164 		lo->nd_opt_lla_type = ND_OPT_SOURCE_LINKADDR;
165 		lo->nd_opt_lla_len = optlen / 8;
166 		bcopy((char *)pi->pi_hdw_addr,
167 		    (char *)lo->nd_opt_lla_hdw_addr,
168 		    pi->pi_hdw_addr_len);
169 		packetlen += optlen;
170 		pptr += optlen;
171 	}
172 
173 	if (debug & D_PKTOUT) {
174 		print_route_sol("Sending solicitation to ", pi, rs, packetlen,
175 		    sin6);
176 	}
177 	sendpacket(sin6, pi->pi_sock, packetlen, 0);
178 }
179 
180 /*
181  * Send a (set of) Router Advertisements and feed them back to ourselves
182  * for processing. Unless no_prefixes is set all prefixes are included.
183  * If there are too many prefix options to fit in one packet multiple
184  * packets will be sent - each containing a subset of the prefix options.
185  */
186 static void
187 advertise(struct sockaddr_in6 *sin6, struct phyint *pi, boolean_t no_prefixes)
188 {
189 	struct	nd_opt_prefix_info *po;
190 	char *pptr = (char *)packet;
191 	struct nd_router_advert *ra;
192 	struct adv_prefix *adv_pr;
193 	int packetlen = 0;
194 
195 	ra = (struct nd_router_advert *)pptr;
196 	ra->nd_ra_type = ND_ROUTER_ADVERT;
197 	ra->nd_ra_code = 0;
198 	ra->nd_ra_cksum = htons(0);
199 	ra->nd_ra_curhoplimit = pi->pi_AdvCurHopLimit;
200 	ra->nd_ra_flags_reserved = 0;
201 	if (pi->pi_AdvManagedFlag)
202 		ra->nd_ra_flags_reserved |= ND_RA_FLAG_MANAGED;
203 	if (pi->pi_AdvOtherConfigFlag)
204 		ra->nd_ra_flags_reserved |= ND_RA_FLAG_OTHER;
205 
206 	if (pi->pi_adv_state == FINAL_ADV)
207 		ra->nd_ra_router_lifetime = htons(0);
208 	else
209 		ra->nd_ra_router_lifetime = htons(pi->pi_AdvDefaultLifetime);
210 	ra->nd_ra_reachable = htonl(pi->pi_AdvReachableTime);
211 	ra->nd_ra_retransmit = htonl(pi->pi_AdvRetransTimer);
212 
213 	packetlen = sizeof (*ra);
214 	pptr += sizeof (*ra);
215 
216 	if (pi->pi_adv_state == FINAL_ADV) {
217 		if (debug & D_PKTOUT) {
218 			print_route_adv("Sending advert (FINAL) to ", pi,
219 			    ra, packetlen, sin6);
220 		}
221 		sendpacket(sin6, pi->pi_sock, packetlen, 0);
222 		/* Feed packet back in for router operation */
223 		loopback_ra_enqueue(pi, ra, packetlen);
224 		return;
225 	}
226 
227 	/* Attach any options */
228 	if (pi->pi_hdw_addr_len != 0) {
229 		struct nd_opt_lla *lo = (struct nd_opt_lla *)pptr;
230 		int optlen;
231 
232 		/* roundup to multiple of 8 and make padding zero */
233 		optlen = ((sizeof (struct nd_opt_hdr) +
234 		    pi->pi_hdw_addr_len + 7) / 8) * 8;
235 		bzero(pptr, optlen);
236 
237 		lo->nd_opt_lla_type = ND_OPT_SOURCE_LINKADDR;
238 		lo->nd_opt_lla_len = optlen / 8;
239 		bcopy((char *)pi->pi_hdw_addr,
240 		    (char *)lo->nd_opt_lla_hdw_addr,
241 		    pi->pi_hdw_addr_len);
242 		packetlen += optlen;
243 		pptr += optlen;
244 	}
245 
246 	if (pi->pi_AdvLinkMTU != 0) {
247 		struct nd_opt_mtu *mo = (struct nd_opt_mtu *)pptr;
248 
249 		mo->nd_opt_mtu_type = ND_OPT_MTU;
250 		mo->nd_opt_mtu_len = sizeof (struct nd_opt_mtu) / 8;
251 		mo->nd_opt_mtu_reserved = 0;
252 		mo->nd_opt_mtu_mtu = htonl(pi->pi_AdvLinkMTU);
253 
254 		packetlen += sizeof (struct nd_opt_mtu);
255 		pptr += sizeof (struct nd_opt_mtu);
256 	}
257 
258 	if (no_prefixes) {
259 		if (debug & D_PKTOUT) {
260 			print_route_adv("Sending advert to ", pi,
261 			    ra, packetlen, sin6);
262 		}
263 		sendpacket(sin6, pi->pi_sock, packetlen, 0);
264 		/* Feed packet back in for router operation */
265 		loopback_ra_enqueue(pi, ra, packetlen);
266 		return;
267 	}
268 
269 	po = (struct nd_opt_prefix_info *)pptr;
270 	for (adv_pr = pi->pi_adv_prefix_list; adv_pr != NULL;
271 	    adv_pr = adv_pr->adv_pr_next) {
272 		if (!adv_pr->adv_pr_AdvOnLinkFlag &&
273 		    !adv_pr->adv_pr_AdvAutonomousFlag) {
274 			continue;
275 		}
276 
277 		/*
278 		 * If the prefix doesn't fit in packet send
279 		 * what we have so far and start with new packet.
280 		 */
281 		if (packetlen + sizeof (*po) >
282 		    pi->pi_LinkMTU - sizeof (struct ip6_hdr)) {
283 			if (debug & D_PKTOUT) {
284 				print_route_adv("Sending advert "
285 				    "(FRAG) to ",
286 				    pi, ra, packetlen, sin6);
287 			}
288 			sendpacket(sin6, pi->pi_sock, packetlen, 0);
289 			/* Feed packet back in for router operation */
290 			loopback_ra_enqueue(pi, ra, packetlen);
291 			packetlen = sizeof (*ra);
292 			pptr = (char *)packet + sizeof (*ra);
293 			po = (struct nd_opt_prefix_info *)pptr;
294 		}
295 		po->nd_opt_pi_type = ND_OPT_PREFIX_INFORMATION;
296 		po->nd_opt_pi_len = sizeof (*po)/8;
297 		po->nd_opt_pi_flags_reserved = 0;
298 		if (adv_pr->adv_pr_AdvOnLinkFlag) {
299 			po->nd_opt_pi_flags_reserved |=
300 			    ND_OPT_PI_FLAG_ONLINK;
301 		}
302 		if (adv_pr->adv_pr_AdvAutonomousFlag) {
303 			po->nd_opt_pi_flags_reserved |=
304 			    ND_OPT_PI_FLAG_AUTO;
305 		}
306 		po->nd_opt_pi_prefix_len = adv_pr->adv_pr_prefix_len;
307 		/*
308 		 * If both Adv*Expiration and Adv*Lifetime are
309 		 * set we prefer the former and make the lifetime
310 		 * decrement in real time.
311 		 */
312 		if (adv_pr->adv_pr_AdvValidRealTime) {
313 			po->nd_opt_pi_valid_time =
314 			    htonl(adv_pr->adv_pr_AdvValidExpiration);
315 		} else {
316 			po->nd_opt_pi_valid_time =
317 			    htonl(adv_pr->adv_pr_AdvValidLifetime);
318 		}
319 		if (adv_pr->adv_pr_AdvPreferredRealTime) {
320 			po->nd_opt_pi_preferred_time =
321 			    htonl(adv_pr->adv_pr_AdvPreferredExpiration);
322 		} else {
323 			po->nd_opt_pi_preferred_time =
324 			    htonl(adv_pr->adv_pr_AdvPreferredLifetime);
325 		}
326 		po->nd_opt_pi_reserved2 = htonl(0);
327 		po->nd_opt_pi_prefix = adv_pr->adv_pr_prefix;
328 
329 		po++;
330 		packetlen += sizeof (*po);
331 	}
332 	if (debug & D_PKTOUT) {
333 		print_route_adv("Sending advert to ", pi,
334 		    ra, packetlen, sin6);
335 	}
336 	sendpacket(sin6, pi->pi_sock, packetlen, 0);
337 	/* Feed packet back in for router operation */
338 	loopback_ra_enqueue(pi, ra, packetlen);
339 }
340 
341 /* Poll support */
342 static int		pollfd_num = 0;	/* Allocated and initialized */
343 static struct pollfd	*pollfds = NULL;
344 
345 /*
346  * Add fd to the set being polled. Returns 0 if ok; -1 if failed.
347  */
348 int
349 poll_add(int fd)
350 {
351 	int i;
352 	int new_num;
353 	struct pollfd *newfds;
354 
355 	/* Check if already present */
356 	for (i = 0; i < pollfd_num; i++) {
357 		if (pollfds[i].fd == fd)
358 			return (0);
359 	}
360 	/* Check for empty spot already present */
361 	for (i = 0; i < pollfd_num; i++) {
362 		if (pollfds[i].fd == -1) {
363 			pollfds[i].fd = fd;
364 			return (0);
365 		}
366 	}
367 
368 	/* Allocate space for 32 more fds and initialize to -1 */
369 	new_num = pollfd_num + 32;
370 	newfds = realloc(pollfds, new_num * sizeof (struct pollfd));
371 	if (newfds == NULL) {
372 		logperror("poll_add: realloc");
373 		return (-1);
374 	}
375 
376 	newfds[pollfd_num].fd = fd;
377 	newfds[pollfd_num++].events = POLLIN;
378 
379 	for (i = pollfd_num; i < new_num; i++) {
380 		newfds[i].fd = -1;
381 		newfds[i].events = POLLIN;
382 	}
383 	pollfd_num = new_num;
384 	pollfds = newfds;
385 	return (0);
386 }
387 
388 /*
389  * Remove fd from the set being polled. Returns 0 if ok; -1 if failed.
390  */
391 int
392 poll_remove(int fd)
393 {
394 	int i;
395 
396 	/* Check if already present */
397 	for (i = 0; i < pollfd_num; i++) {
398 		if (pollfds[i].fd == fd) {
399 			pollfds[i].fd = -1;
400 			return (0);
401 		}
402 	}
403 	return (-1);
404 }
405 
406 /*
407  * Extract information about the ifname (either a physical interface and
408  * the ":0" logical interface or just a logical interface).
409  * If the interface (still) exists in kernel set pr_in_use
410  * for caller to be able to detect interfaces that are removed.
411  * Starts sending advertisements/solicitations when new physical interfaces
412  * are detected.
413  */
414 static void
415 if_process(int s, char *ifname, boolean_t first)
416 {
417 	struct lifreq lifr;
418 	struct phyint *pi;
419 	struct prefix *pr;
420 	char *cp;
421 	char phyintname[LIFNAMSIZ + 1];
422 
423 	if (debug & D_IFSCAN)
424 		logmsg(LOG_DEBUG, "if_process(%s)\n", ifname);
425 
426 	(void) strncpy(lifr.lifr_name, ifname, sizeof (lifr.lifr_name));
427 	lifr.lifr_name[sizeof (lifr.lifr_name) - 1] = '\0';
428 	if (ioctl(s, SIOCGLIFFLAGS, (char *)&lifr) < 0) {
429 		if (errno == ENXIO) {
430 			/*
431 			 * Interface has disappeared
432 			 */
433 			return;
434 		}
435 		logperror("if_process: ioctl (get interface flags)");
436 		return;
437 	}
438 
439 	/*
440 	 * Ignore loopback and point-to-multipoint interfaces.
441 	 * Point-to-point interfaces always have IFF_MULTICAST set.
442 	 */
443 	if (!(lifr.lifr_flags & IFF_MULTICAST) ||
444 	    (lifr.lifr_flags & IFF_LOOPBACK)) {
445 		return;
446 	}
447 
448 	if (!(lifr.lifr_flags & IFF_IPV6))
449 		return;
450 
451 	(void) strncpy(phyintname, ifname, sizeof (phyintname));
452 	phyintname[sizeof (phyintname) - 1] = '\0';
453 	if ((cp = strchr(phyintname, IF_SEPARATOR)) != NULL) {
454 		*cp = '\0';
455 	}
456 
457 	pi = phyint_lookup(phyintname);
458 	if (pi == NULL) {
459 		/*
460 		 * Do not add anything for new interfaces until they are UP.
461 		 * For existing interfaces we track the up flag.
462 		 */
463 		if (!(lifr.lifr_flags & IFF_UP))
464 			return;
465 
466 		pi = phyint_create(phyintname);
467 		if (pi == NULL) {
468 			logmsg(LOG_ERR, "if_process: out of memory\n");
469 			return;
470 		}
471 	}
472 	(void) phyint_init_from_k(pi);
473 	if (pi->pi_sock == -1 && !(pi->pi_kernel_state & PI_PRESENT)) {
474 		/* Interface is not yet present */
475 		if (debug & D_PHYINT) {
476 			logmsg(LOG_DEBUG, "if_process: interface not yet "
477 			    "present %s\n", pi->pi_name);
478 		}
479 		return;
480 	}
481 
482 	if (pi->pi_sock != -1) {
483 		if (poll_add(pi->pi_sock) == -1) {
484 			/*
485 			 * reset state.
486 			 */
487 			phyint_cleanup(pi);
488 		}
489 	}
490 
491 	/*
492 	 * Check if IFF_ROUTER has been turned off in kernel in which
493 	 * case we have to turn off AdvSendAdvertisements.
494 	 * The kernel will automatically turn off IFF_ROUTER if
495 	 * ip6_forwarding is turned off.
496 	 * Note that we do not switch back should IFF_ROUTER be turned on.
497 	 */
498 	if (!first &&
499 	    pi->pi_AdvSendAdvertisements && !(pi->pi_flags & IFF_ROUTER)) {
500 		logmsg(LOG_INFO, "No longer a router on %s\n", pi->pi_name);
501 		check_to_advertise(pi, START_FINAL_ADV);
502 
503 		pi->pi_AdvSendAdvertisements = 0;
504 		pi->pi_sol_state = NO_SOLICIT;
505 	}
506 
507 	/*
508 	 * Send advertisments and solicitation only if the interface is
509 	 * present in the kernel.
510 	 */
511 	if (pi->pi_kernel_state & PI_PRESENT) {
512 
513 		if (pi->pi_AdvSendAdvertisements) {
514 			if (pi->pi_adv_state == NO_ADV)
515 				check_to_advertise(pi, START_INIT_ADV);
516 		} else {
517 			if (pi->pi_sol_state == NO_SOLICIT)
518 				check_to_solicit(pi, START_INIT_SOLICIT);
519 		}
520 	}
521 
522 	/*
523 	 * Track static kernel prefixes to prevent in.ndpd from clobbering
524 	 * them by creating a struct prefix for each prefix detected in the
525 	 * kernel.
526 	 */
527 	pr = prefix_lookup_name(pi, ifname);
528 	if (pr == NULL) {
529 		pr = prefix_create_name(pi, ifname);
530 		if (pr == NULL) {
531 			logmsg(LOG_ERR, "if_process: out of memory\n");
532 			return;
533 		}
534 		if (prefix_init_from_k(pr) == -1) {
535 			prefix_delete(pr);
536 			return;
537 		}
538 	}
539 	/* Detect prefixes which are removed */
540 	if (pr->pr_kernel_state != 0)
541 		pr->pr_in_use = _B_TRUE;
542 
543 	if ((lifr.lifr_flags & IFF_DUPLICATE) &&
544 	    !(lifr.lifr_flags & IFF_DHCPRUNNING) &&
545 	    (pr->pr_flags & IFF_TEMPORARY)) {
546 		in6_addr_t *token;
547 		int i;
548 		char abuf[INET6_ADDRSTRLEN];
549 
550 		if (++pr->pr_attempts >= MAX_DAD_FAILURES) {
551 			logmsg(LOG_ERR, "%s: token %s is duplicate after %d "
552 			    "attempts; disabling temporary addresses on %s",
553 			    pr->pr_name, inet_ntop(AF_INET6,
554 			    (void *)&pi->pi_tmp_token, abuf, sizeof (abuf)),
555 			    pr->pr_attempts, pi->pi_name);
556 			pi->pi_TmpAddrsEnabled = 0;
557 			tmptoken_delete(pi);
558 			prefix_delete(pr);
559 			return;
560 		}
561 		logmsg(LOG_WARNING, "%s: token %s is duplicate; trying again",
562 		    pr->pr_name, inet_ntop(AF_INET6, (void *)&pi->pi_tmp_token,
563 		    abuf, sizeof (abuf)));
564 		if (!tmptoken_create(pi)) {
565 			prefix_delete(pr);
566 			return;
567 		}
568 		token = &pi->pi_tmp_token;
569 		for (i = 0; i < 16; i++) {
570 			/*
571 			 * prefix_create ensures that pr_prefix has all-zero
572 			 * bits after prefixlen.
573 			 */
574 			pr->pr_address.s6_addr[i] = pr->pr_prefix.s6_addr[i] |
575 			    token->s6_addr[i];
576 		}
577 		if (prefix_lookup_addr_match(pr) != NULL) {
578 			prefix_delete(pr);
579 			return;
580 		}
581 		pr->pr_CreateTime = getcurrenttime() / MILLISEC;
582 		/*
583 		 * We've got a new token.  Clearing PR_AUTO causes
584 		 * prefix_update_k to bring the interface up and set the
585 		 * address.
586 		 */
587 		pr->pr_kernel_state &= ~PR_AUTO;
588 		prefix_update_k(pr);
589 	}
590 }
591 
592 static int ifsock = -1;
593 
594 /*
595  * Scan all interfaces to detect changes as well as new and deleted intefaces
596  * 'first' is set for the initial call only. Do not effect anything.
597  */
598 static void
599 initifs(boolean_t first)
600 {
601 	char *buf;
602 	int bufsize;
603 	int numifs;
604 	int n;
605 	struct lifnum lifn;
606 	struct lifconf lifc;
607 	struct lifreq *lifr;
608 	struct phyint *pi;
609 	struct phyint *next_pi;
610 	struct prefix *pr;
611 
612 	if (debug & D_IFSCAN)
613 		logmsg(LOG_DEBUG, "Reading interface configuration\n");
614 	if (ifsock < 0) {
615 		ifsock = socket(AF_INET6, SOCK_DGRAM, 0);
616 		if (ifsock < 0) {
617 			logperror("initifs: socket");
618 			return;
619 		}
620 	}
621 	lifn.lifn_family = AF_INET6;
622 	lifn.lifn_flags = LIFC_NOXMIT | LIFC_TEMPORARY;
623 	if (ioctl(ifsock, SIOCGLIFNUM, (char *)&lifn) < 0) {
624 		logperror("initifs: ioctl (get interface numbers)");
625 		return;
626 	}
627 	numifs = lifn.lifn_count;
628 	bufsize = numifs * sizeof (struct lifreq);
629 
630 	buf = (char *)malloc(bufsize);
631 	if (buf == NULL) {
632 		logmsg(LOG_ERR, "initifs: out of memory\n");
633 		return;
634 	}
635 
636 	/*
637 	 * Mark the interfaces so that we can find phyints and prefixes
638 	 * which have disappeared from the kernel.
639 	 * if_process will set pr_in_use when it finds the interface
640 	 * in the kernel.
641 	 */
642 	for (pi = phyints; pi != NULL; pi = pi->pi_next) {
643 		/*
644 		 * Before re-examining the state of the interfaces,
645 		 * PI_PRESENT should be cleared from pi_kernel_state.
646 		 */
647 		pi->pi_kernel_state &= ~PI_PRESENT;
648 		for (pr = pi->pi_prefix_list; pr != NULL; pr = pr->pr_next) {
649 			pr->pr_in_use = _B_FALSE;
650 		}
651 	}
652 
653 	lifc.lifc_family = AF_INET6;
654 	lifc.lifc_flags = LIFC_NOXMIT | LIFC_TEMPORARY;
655 	lifc.lifc_len = bufsize;
656 	lifc.lifc_buf = buf;
657 
658 	if (ioctl(ifsock, SIOCGLIFCONF, (char *)&lifc) < 0) {
659 		logperror("initifs: ioctl (get interface configuration)");
660 		free(buf);
661 		return;
662 	}
663 
664 	lifr = (struct lifreq *)lifc.lifc_req;
665 	for (n = lifc.lifc_len / sizeof (struct lifreq); n > 0; n--, lifr++)
666 		if_process(ifsock, lifr->lifr_name, first);
667 	free(buf);
668 
669 	/*
670 	 * Detect phyints that have been removed from the kernel.
671 	 * Since we can't recreate it here (would require ifconfig plumb
672 	 * logic) we just terminate use of that phyint.
673 	 */
674 	for (pi = phyints; pi != NULL; pi = next_pi) {
675 		next_pi = pi->pi_next;
676 		/*
677 		 * If interface (still) exists in kernel, set
678 		 * pi_state to indicate that.
679 		 */
680 		if (pi->pi_kernel_state & PI_PRESENT) {
681 			pi->pi_state |= PI_PRESENT;
682 		}
683 
684 		check_if_removed(pi);
685 	}
686 	if (show_ifs)
687 		phyint_print_all();
688 }
689 
690 
691 /*
692  * Router advertisement state machine. Used for everything but timer
693  * events which use advertise_event directly.
694  */
695 void
696 check_to_advertise(struct phyint *pi, enum adv_events event)
697 {
698 	uint_t delay;
699 	enum adv_states old_state = pi->pi_adv_state;
700 
701 	if (debug & D_STATE) {
702 		logmsg(LOG_DEBUG, "check_to_advertise(%s, %d) state %d\n",
703 		    pi->pi_name, (int)event, (int)old_state);
704 	}
705 	delay = advertise_event(pi, event, 0);
706 	if (delay != TIMER_INFINITY) {
707 		/* Make sure the global next event is updated */
708 		timer_schedule(delay);
709 	}
710 
711 	if (debug & D_STATE) {
712 		logmsg(LOG_DEBUG, "check_to_advertise(%s, %d) state %d -> %d\n",
713 		    pi->pi_name, (int)event, (int)old_state,
714 		    (int)pi->pi_adv_state);
715 	}
716 }
717 
718 /*
719  * Router advertisement state machine.
720  * Return the number of milliseconds until next timeout (TIMER_INFINITY
721  * if never).
722  * For the ADV_TIMER event the caller passes in the number of milliseconds
723  * since the last timer event in the 'elapsed' parameter.
724  */
725 uint_t
726 advertise_event(struct phyint *pi, enum adv_events event, uint_t elapsed)
727 {
728 	uint_t delay;
729 
730 	if (debug & D_STATE) {
731 		logmsg(LOG_DEBUG, "advertise_event(%s, %d, %d) state %d\n",
732 		    pi->pi_name, (int)event, elapsed, (int)pi->pi_adv_state);
733 	}
734 	check_daemonize();
735 	if (!pi->pi_AdvSendAdvertisements)
736 		return (TIMER_INFINITY);
737 	if (pi->pi_flags & IFF_NORTEXCH) {
738 		if (debug & D_PKTOUT) {
739 			logmsg(LOG_DEBUG, "Suppress sending RA packet on %s "
740 			    "(no route exchange on interface)\n",
741 			    pi->pi_name);
742 		}
743 		return (TIMER_INFINITY);
744 	}
745 
746 	switch (event) {
747 	case ADV_OFF:
748 		pi->pi_adv_state = NO_ADV;
749 		return (TIMER_INFINITY);
750 
751 	case START_INIT_ADV:
752 		if (pi->pi_adv_state == INIT_ADV)
753 			return (pi->pi_adv_time_left);
754 		pi->pi_adv_count = ND_MAX_INITIAL_RTR_ADVERTISEMENTS;
755 		pi->pi_adv_time_left = 0;
756 		pi->pi_adv_state = INIT_ADV;
757 		break;	/* send advertisement */
758 
759 	case START_FINAL_ADV:
760 		if (pi->pi_adv_state == NO_ADV)
761 			return (TIMER_INFINITY);
762 		if (pi->pi_adv_state == FINAL_ADV)
763 			return (pi->pi_adv_time_left);
764 		pi->pi_adv_count = ND_MAX_FINAL_RTR_ADVERTISEMENTS;
765 		pi->pi_adv_time_left = 0;
766 		pi->pi_adv_state = FINAL_ADV;
767 		break;	/* send advertisement */
768 
769 	case RECEIVED_SOLICIT:
770 		if (pi->pi_adv_state == NO_ADV)
771 			return (TIMER_INFINITY);
772 		if (pi->pi_adv_state == SOLICIT_ADV) {
773 			if (pi->pi_adv_time_left != 0)
774 				return (pi->pi_adv_time_left);
775 			break;
776 		}
777 		delay = GET_RANDOM(0, ND_MAX_RA_DELAY_TIME);
778 		if (delay < pi->pi_adv_time_left)
779 			pi->pi_adv_time_left = delay;
780 		if (pi->pi_adv_time_since_sent < ND_MIN_DELAY_BETWEEN_RAS) {
781 			/*
782 			 * Send an advertisement (ND_MIN_DELAY_BETWEEN_RAS
783 			 * plus random delay) after the previous
784 			 * advertisement was sent.
785 			 */
786 			pi->pi_adv_time_left = delay +
787 			    ND_MIN_DELAY_BETWEEN_RAS -
788 			    pi->pi_adv_time_since_sent;
789 		}
790 		pi->pi_adv_state = SOLICIT_ADV;
791 		break;
792 
793 	case ADV_TIMER:
794 		if (pi->pi_adv_state == NO_ADV)
795 			return (TIMER_INFINITY);
796 		/* Decrease time left */
797 		if (pi->pi_adv_time_left >= elapsed)
798 			pi->pi_adv_time_left -= elapsed;
799 		else
800 			pi->pi_adv_time_left = 0;
801 
802 		/* Increase time since last advertisement was sent */
803 		pi->pi_adv_time_since_sent += elapsed;
804 		break;
805 	default:
806 		logmsg(LOG_ERR, "advertise_event: Unknown event %d\n",
807 		    (int)event);
808 		return (TIMER_INFINITY);
809 	}
810 
811 	if (pi->pi_adv_time_left != 0)
812 		return (pi->pi_adv_time_left);
813 
814 	/* Send advertisement and calculate next time to send */
815 	if (pi->pi_adv_state == FINAL_ADV) {
816 		/* Omit the prefixes */
817 		advertise(&v6allnodes, pi, _B_TRUE);
818 	} else {
819 		advertise(&v6allnodes, pi, _B_FALSE);
820 	}
821 	pi->pi_adv_time_since_sent = 0;
822 
823 	switch (pi->pi_adv_state) {
824 	case SOLICIT_ADV:
825 		/*
826 		 * The solicited advertisement has been sent.
827 		 * Revert to periodic advertisements.
828 		 */
829 		pi->pi_adv_state = REG_ADV;
830 		/* FALLTHRU */
831 	case REG_ADV:
832 		pi->pi_adv_time_left =
833 		    GET_RANDOM(1000 * pi->pi_MinRtrAdvInterval,
834 		    1000 * pi->pi_MaxRtrAdvInterval);
835 		break;
836 
837 	case INIT_ADV:
838 		if (--pi->pi_adv_count > 0) {
839 			delay = GET_RANDOM(1000 * pi->pi_MinRtrAdvInterval,
840 			    1000 * pi->pi_MaxRtrAdvInterval);
841 			if (delay > ND_MAX_INITIAL_RTR_ADVERT_INTERVAL)
842 				delay = ND_MAX_INITIAL_RTR_ADVERT_INTERVAL;
843 			pi->pi_adv_time_left = delay;
844 		} else {
845 			pi->pi_adv_time_left =
846 			    GET_RANDOM(1000 * pi->pi_MinRtrAdvInterval,
847 			    1000 * pi->pi_MaxRtrAdvInterval);
848 			pi->pi_adv_state = REG_ADV;
849 		}
850 		break;
851 
852 	case FINAL_ADV:
853 		if (--pi->pi_adv_count > 0) {
854 			pi->pi_adv_time_left =
855 			    ND_MAX_INITIAL_RTR_ADVERT_INTERVAL;
856 		} else {
857 			pi->pi_adv_state = NO_ADV;
858 		}
859 		break;
860 	}
861 	if (pi->pi_adv_state != NO_ADV)
862 		return (pi->pi_adv_time_left);
863 	else
864 		return (TIMER_INFINITY);
865 }
866 
867 /*
868  * Router solicitation state machine. Used for everything but timer
869  * events which use solicit_event directly.
870  */
871 void
872 check_to_solicit(struct phyint *pi, enum solicit_events event)
873 {
874 	uint_t delay;
875 	enum solicit_states old_state = pi->pi_sol_state;
876 
877 	if (debug & D_STATE) {
878 		logmsg(LOG_DEBUG, "check_to_solicit(%s, %d) state %d\n",
879 		    pi->pi_name, (int)event, (int)old_state);
880 	}
881 	delay = solicit_event(pi, event, 0);
882 	if (delay != TIMER_INFINITY) {
883 		/* Make sure the global next event is updated */
884 		timer_schedule(delay);
885 	}
886 
887 	if (debug & D_STATE) {
888 		logmsg(LOG_DEBUG, "check_to_solicit(%s, %d) state %d -> %d\n",
889 		    pi->pi_name, (int)event, (int)old_state,
890 		    (int)pi->pi_sol_state);
891 	}
892 }
893 
894 static void
895 daemonize_ndpd(void)
896 {
897 	FILE *pidfp;
898 	mode_t pidmode = (S_IRUSR | S_IWUSR | S_IRGRP | S_IROTH); /* 0644 */
899 	struct itimerval it;
900 	boolean_t timerval = _B_TRUE;
901 
902 	/*
903 	 * Need to get current timer settings so they can be restored
904 	 * after the fork(), as the it_value and it_interval values for
905 	 * the ITIMER_REAL timer are reset to 0 in the child process.
906 	 */
907 	if (getitimer(ITIMER_REAL, &it) < 0) {
908 		if (debug & D_TIMER)
909 			logmsg(LOG_DEBUG,
910 			    "daemonize_ndpd: failed to get itimerval\n");
911 		timerval = _B_FALSE;
912 	}
913 
914 	/* Daemonize. */
915 	switch (fork()) {
916 	case 0:
917 		/* Child */
918 		break;
919 	case -1:
920 		logperror("fork");
921 		exit(1);
922 	default:
923 		/* Parent */
924 		_exit(0);
925 	}
926 
927 	/* Store our process id, blow away any existing file if it exists. */
928 	if ((pidfp = fopen(PATH_PID, "w")) == NULL) {
929 		(void) fprintf(stderr, "%s: unable to open " PATH_PID ": %s\n",
930 		    argv0[0], strerror(errno));
931 	} else {
932 		(void) fprintf(pidfp, "%ld\n", getpid());
933 		(void) fclose(pidfp);
934 		(void) chmod(PATH_PID, pidmode);
935 	}
936 
937 	(void) close(0);
938 	(void) close(1);
939 	(void) close(2);
940 
941 	(void) chdir("/");
942 	(void) open("/dev/null", O_RDWR);
943 	(void) dup2(0, 1);
944 	(void) dup2(0, 2);
945 	(void) setsid();
946 
947 	already_daemonized = _B_TRUE;
948 
949 	/*
950 	 * Restore timer values, if we were able to save them; if not,
951 	 * check and set the right value by calling run_timeouts().
952 	 */
953 	if (timerval) {
954 		if (setitimer(ITIMER_REAL, &it, NULL) < 0) {
955 			logperror("daemonize_ndpd: setitimer");
956 			exit(2);
957 		}
958 	} else {
959 		run_timeouts();
960 	}
961 }
962 
963 /*
964  * Check to see if the time is right to daemonize.  The right time is when:
965  *
966  * 1.  We haven't already daemonized.
967  * 2.  We are not in debug mode.
968  * 3.  All interfaces are marked IFF_NOXMIT.
969  * 4.  All non-router interfaces have their prefixes set up and we're
970  *     done sending router solicitations on those interfaces without
971  *     prefixes.
972  */
973 static void
974 check_daemonize(void)
975 {
976 	struct phyint		*pi;
977 
978 	if (already_daemonized || debug != 0)
979 		return;
980 
981 	for (pi = phyints; pi != NULL; pi = pi->pi_next) {
982 		if (!(pi->pi_flags & IFF_NOXMIT))
983 			break;
984 	}
985 
986 	/*
987 	 * If we can't transmit on any of the interfaces there is no reason
988 	 * to hold up progress.
989 	 */
990 	if (pi == NULL) {
991 		daemonize_ndpd();
992 		return;
993 	}
994 
995 	/* Check all interfaces.  If any are still soliciting, just return. */
996 	for (pi = phyints; pi != NULL; pi = pi->pi_next) {
997 		if (pi->pi_AdvSendAdvertisements ||
998 		    !(pi->pi_kernel_state & PI_PRESENT))
999 			continue;
1000 
1001 		if (pi->pi_sol_state == INIT_SOLICIT)
1002 			return;
1003 	}
1004 
1005 	daemonize_ndpd();
1006 }
1007 
1008 /*
1009  * Router solicitation state machine.
1010  * Return the number of milliseconds until next timeout (TIMER_INFINITY
1011  * if never).
1012  * For the SOL_TIMER event the caller passes in the number of milliseconds
1013  * since the last timer event in the 'elapsed' parameter.
1014  */
1015 uint_t
1016 solicit_event(struct phyint *pi, enum solicit_events event, uint_t elapsed)
1017 {
1018 	if (debug & D_STATE) {
1019 		logmsg(LOG_DEBUG, "solicit_event(%s, %d, %d) state %d\n",
1020 		    pi->pi_name, (int)event, elapsed, (int)pi->pi_sol_state);
1021 	}
1022 
1023 	if (pi->pi_AdvSendAdvertisements)
1024 		return (TIMER_INFINITY);
1025 	if (pi->pi_flags & IFF_NORTEXCH) {
1026 		if (debug & D_PKTOUT) {
1027 			logmsg(LOG_DEBUG, "Suppress sending RS packet on %s "
1028 			    "(no route exchange on interface)\n",
1029 			    pi->pi_name);
1030 		}
1031 		return (TIMER_INFINITY);
1032 	}
1033 
1034 	switch (event) {
1035 	case SOLICIT_OFF:
1036 		pi->pi_sol_state = NO_SOLICIT;
1037 		check_daemonize();
1038 		return (TIMER_INFINITY);
1039 
1040 	case SOLICIT_DONE:
1041 		pi->pi_sol_state = DONE_SOLICIT;
1042 		check_daemonize();
1043 		return (TIMER_INFINITY);
1044 
1045 	case RESTART_INIT_SOLICIT:
1046 		/*
1047 		 * This event allows us to start solicitation over again
1048 		 * without losing the RA flags.  We start solicitation over
1049 		 * when we are missing an interface prefix for a newly-
1050 		 * encountered DHCP interface.
1051 		 */
1052 		if (pi->pi_sol_state == INIT_SOLICIT)
1053 			return (pi->pi_sol_time_left);
1054 		pi->pi_sol_count = ND_MAX_RTR_SOLICITATIONS;
1055 		pi->pi_sol_time_left =
1056 		    GET_RANDOM(0, ND_MAX_RTR_SOLICITATION_DELAY);
1057 		pi->pi_sol_state = INIT_SOLICIT;
1058 		break;
1059 
1060 	case START_INIT_SOLICIT:
1061 		if (pi->pi_sol_state == INIT_SOLICIT)
1062 			return (pi->pi_sol_time_left);
1063 		pi->pi_ra_flags = 0;
1064 		pi->pi_sol_count = ND_MAX_RTR_SOLICITATIONS;
1065 		pi->pi_sol_time_left =
1066 		    GET_RANDOM(0, ND_MAX_RTR_SOLICITATION_DELAY);
1067 		pi->pi_sol_state = INIT_SOLICIT;
1068 		break;
1069 
1070 	case SOL_TIMER:
1071 		if (pi->pi_sol_state == NO_SOLICIT)
1072 			return (TIMER_INFINITY);
1073 		/* Decrease time left */
1074 		if (pi->pi_sol_time_left >= elapsed)
1075 			pi->pi_sol_time_left -= elapsed;
1076 		else
1077 			pi->pi_sol_time_left = 0;
1078 		break;
1079 	default:
1080 		logmsg(LOG_ERR, "solicit_event: Unknown event %d\n",
1081 		    (int)event);
1082 		return (TIMER_INFINITY);
1083 	}
1084 
1085 	if (pi->pi_sol_time_left != 0)
1086 		return (pi->pi_sol_time_left);
1087 
1088 	/* Send solicitation and calculate next time */
1089 	switch (pi->pi_sol_state) {
1090 	case INIT_SOLICIT:
1091 		solicit(&v6allrouters, pi);
1092 		if (--pi->pi_sol_count == 0) {
1093 			logmsg(LOG_DEBUG, "solicit_event: giving up on %s\n",
1094 			    pi->pi_name);
1095 			if (pi->pi_StatefulAddrConf) {
1096 				pi->pi_ra_flags |= ND_RA_FLAG_MANAGED |
1097 				    ND_RA_FLAG_OTHER;
1098 				start_dhcp(pi);
1099 			}
1100 			pi->pi_sol_state = DONE_SOLICIT;
1101 			check_daemonize();
1102 			return (TIMER_INFINITY);
1103 		}
1104 		pi->pi_sol_time_left = ND_RTR_SOLICITATION_INTERVAL;
1105 		return (pi->pi_sol_time_left);
1106 	case NO_SOLICIT:
1107 	case DONE_SOLICIT:
1108 		return (TIMER_INFINITY);
1109 	default:
1110 		return (pi->pi_sol_time_left);
1111 	}
1112 }
1113 
1114 /*
1115  * Timer mechanism using relative time (in milliseconds) from the
1116  * previous timer event. Timers exceeding TIMER_INFINITY milliseconds
1117  * will fire after TIMER_INFINITY milliseconds.
1118  */
1119 static uint_t timer_previous;	/* When last SIGALRM occurred */
1120 static uint_t timer_next;	/* Currently scheduled timeout */
1121 
1122 static void
1123 timer_init(void)
1124 {
1125 	timer_previous = getcurrenttime();
1126 	timer_next = TIMER_INFINITY;
1127 	run_timeouts();
1128 }
1129 
1130 /*
1131  * Make sure the next SIGALRM occurs delay milliseconds from the current
1132  * time if not earlier.
1133  * Handles getcurrenttime (32 bit integer holding milliseconds) wraparound
1134  * by treating differences greater than 0x80000000 as negative.
1135  */
1136 void
1137 timer_schedule(uint_t delay)
1138 {
1139 	uint_t now;
1140 	struct itimerval itimerval;
1141 
1142 	now = getcurrenttime();
1143 	if (debug & D_TIMER) {
1144 		logmsg(LOG_DEBUG, "timer_schedule(%u): now %u next %u\n",
1145 		    delay, now, timer_next);
1146 	}
1147 	/* Will this timer occur before the currently scheduled SIGALRM? */
1148 	if (delay >= timer_next - now) {
1149 		if (debug & D_TIMER) {
1150 			logmsg(LOG_DEBUG, "timer_schedule(%u): no action - "
1151 			    "next in %u ms\n",
1152 			    delay, timer_next - now);
1153 		}
1154 		return;
1155 	}
1156 	if (delay == 0) {
1157 		/* Minimum allowed delay */
1158 		delay = 1;
1159 	}
1160 	timer_next = now + delay;
1161 
1162 	itimerval.it_value.tv_sec = delay / 1000;
1163 	itimerval.it_value.tv_usec = (delay % 1000) * 1000;
1164 	itimerval.it_interval.tv_sec = 0;
1165 	itimerval.it_interval.tv_usec = 0;
1166 	if (debug & D_TIMER) {
1167 		logmsg(LOG_DEBUG, "timer_schedule(%u): sec %lu usec %lu\n",
1168 		    delay,
1169 		    itimerval.it_value.tv_sec, itimerval.it_value.tv_usec);
1170 	}
1171 	if (setitimer(ITIMER_REAL, &itimerval, NULL) < 0) {
1172 		logperror("timer_schedule: setitimer");
1173 		exit(2);
1174 	}
1175 }
1176 
1177 /*
1178  * Conditional running of timer. If more than 'minimal_time' millseconds
1179  * since the timer routines were last run we run them.
1180  * Used when packets arrive.
1181  */
1182 static void
1183 conditional_run_timeouts(uint_t minimal_time)
1184 {
1185 	uint_t now;
1186 	uint_t elapsed;
1187 
1188 	now = getcurrenttime();
1189 	elapsed = now - timer_previous;
1190 	if (elapsed > minimal_time) {
1191 		if (debug & D_TIMER) {
1192 			logmsg(LOG_DEBUG, "conditional_run_timeouts: "
1193 			    "elapsed %d\n", elapsed);
1194 		}
1195 		run_timeouts();
1196 	}
1197 }
1198 
1199 /*
1200  * Timer has fired.
1201  * Determine when the next timer event will occur by asking all
1202  * the timer routines.
1203  * Should not be called from a timer routine but in some cases this is
1204  * done because the code doesn't know that e.g. it was called from
1205  * ifconfig_timer(). In this case the nested run_timeouts will just return but
1206  * the running run_timeouts will ensure to call all the timer functions by
1207  * looping once more.
1208  */
1209 static void
1210 run_timeouts(void)
1211 {
1212 	uint_t now;
1213 	uint_t elapsed;
1214 	uint_t next;
1215 	uint_t nexti;
1216 	struct phyint *pi;
1217 	struct phyint *next_pi;
1218 	struct prefix *pr;
1219 	struct prefix *next_pr;
1220 	struct adv_prefix *adv_pr;
1221 	struct adv_prefix *next_adv_pr;
1222 	struct router *dr;
1223 	struct router *next_dr;
1224 	static boolean_t timeout_running;
1225 	static boolean_t do_retry;
1226 
1227 	if (timeout_running) {
1228 		if (debug & D_TIMER)
1229 			logmsg(LOG_DEBUG, "run_timeouts: nested call\n");
1230 		do_retry = _B_TRUE;
1231 		return;
1232 	}
1233 	timeout_running = _B_TRUE;
1234 retry:
1235 	/* How much time since the last time we were called? */
1236 	now = getcurrenttime();
1237 	elapsed = now - timer_previous;
1238 	timer_previous = now;
1239 
1240 	if (debug & D_TIMER)
1241 		logmsg(LOG_DEBUG, "run_timeouts: elapsed %d\n", elapsed);
1242 
1243 	next = TIMER_INFINITY;
1244 	for (pi = phyints; pi != NULL; pi = next_pi) {
1245 		next_pi = pi->pi_next;
1246 		nexti = phyint_timer(pi, elapsed);
1247 		if (nexti != TIMER_INFINITY && nexti < next)
1248 			next = nexti;
1249 		if (debug & D_TIMER) {
1250 			logmsg(LOG_DEBUG, "run_timeouts (pi %s): %d -> %u ms\n",
1251 			    pi->pi_name, nexti, next);
1252 		}
1253 		for (pr = pi->pi_prefix_list; pr != NULL; pr = next_pr) {
1254 			next_pr = pr->pr_next;
1255 			nexti = prefix_timer(pr, elapsed);
1256 			if (nexti != TIMER_INFINITY && nexti < next)
1257 				next = nexti;
1258 			if (debug & D_TIMER) {
1259 				logmsg(LOG_DEBUG, "run_timeouts (pr %s): "
1260 				    "%d -> %u ms\n", pr->pr_name, nexti, next);
1261 			}
1262 		}
1263 		for (adv_pr = pi->pi_adv_prefix_list; adv_pr != NULL;
1264 		    adv_pr = next_adv_pr) {
1265 			next_adv_pr = adv_pr->adv_pr_next;
1266 			nexti = adv_prefix_timer(adv_pr, elapsed);
1267 			if (nexti != TIMER_INFINITY && nexti < next)
1268 				next = nexti;
1269 			if (debug & D_TIMER) {
1270 				logmsg(LOG_DEBUG, "run_timeouts "
1271 				    "(adv pr on %s): %d -> %u ms\n",
1272 				    adv_pr->adv_pr_physical->pi_name,
1273 				    nexti, next);
1274 			}
1275 		}
1276 		for (dr = pi->pi_router_list; dr != NULL; dr = next_dr) {
1277 			next_dr = dr->dr_next;
1278 			nexti = router_timer(dr, elapsed);
1279 			if (nexti != TIMER_INFINITY && nexti < next)
1280 				next = nexti;
1281 			if (debug & D_TIMER) {
1282 				logmsg(LOG_DEBUG, "run_timeouts (dr): "
1283 				    "%d -> %u ms\n", nexti, next);
1284 			}
1285 		}
1286 		if (pi->pi_TmpAddrsEnabled) {
1287 			nexti = tmptoken_timer(pi, elapsed);
1288 			if (nexti != TIMER_INFINITY && nexti < next)
1289 				next = nexti;
1290 			if (debug & D_TIMER) {
1291 				logmsg(LOG_DEBUG, "run_timeouts (tmp on %s): "
1292 				    "%d -> %u ms\n", pi->pi_name, nexti, next);
1293 			}
1294 		}
1295 	}
1296 	/*
1297 	 * Make sure the timer functions are run at least once
1298 	 * an hour.
1299 	 */
1300 	if (next == TIMER_INFINITY)
1301 		next = 3600 * 1000;	/* 1 hour */
1302 
1303 	if (debug & D_TIMER)
1304 		logmsg(LOG_DEBUG, "run_timeouts: %u ms\n", next);
1305 	timer_schedule(next);
1306 	if (do_retry) {
1307 		if (debug & D_TIMER)
1308 			logmsg(LOG_DEBUG, "run_timeouts: retry\n");
1309 		do_retry = _B_FALSE;
1310 		goto retry;
1311 	}
1312 	timeout_running = _B_FALSE;
1313 }
1314 
1315 static int eventpipe_read = -1;	/* Used for synchronous signal delivery */
1316 static int eventpipe_write = -1;
1317 
1318 /*
1319  * Ensure that signals are processed synchronously with the rest of
1320  * the code by just writing a one character signal number on the pipe.
1321  * The poll loop will pick this up and process the signal event.
1322  */
1323 static void
1324 sig_handler(int signo)
1325 {
1326 	uchar_t buf = (uchar_t)signo;
1327 
1328 	if (eventpipe_write == -1) {
1329 		logmsg(LOG_ERR, "sig_handler: no pipe\n");
1330 		return;
1331 	}
1332 	if (write(eventpipe_write, &buf, sizeof (buf)) < 0)
1333 		logperror("sig_handler: write");
1334 }
1335 
1336 /*
1337  * Pick up a signal "byte" from the pipe and process it.
1338  */
1339 static void
1340 in_signal(int fd)
1341 {
1342 	uchar_t buf;
1343 	struct phyint *pi;
1344 	struct phyint *next_pi;
1345 
1346 	switch (read(fd, &buf, sizeof (buf))) {
1347 	case -1:
1348 		logperror("in_signal: read");
1349 		exit(1);
1350 		/* NOTREACHED */
1351 	case 1:
1352 		break;
1353 	case 0:
1354 		logmsg(LOG_ERR, "in_signal: read eof\n");
1355 		exit(1);
1356 		/* NOTREACHED */
1357 	default:
1358 		logmsg(LOG_ERR, "in_signal: read > 1\n");
1359 		exit(1);
1360 	}
1361 
1362 	if (debug & D_TIMER)
1363 		logmsg(LOG_DEBUG, "in_signal() got %d\n", buf);
1364 
1365 	switch (buf) {
1366 	case SIGALRM:
1367 		if (debug & D_TIMER) {
1368 			uint_t now = getcurrenttime();
1369 
1370 			logmsg(LOG_DEBUG, "in_signal(SIGALRM) delta %u\n",
1371 			    now - timer_next);
1372 		}
1373 		timer_next = TIMER_INFINITY;
1374 		run_timeouts();
1375 		break;
1376 	case SIGHUP:
1377 		/* Re-read config file by exec'ing ourselves */
1378 		for (pi = phyints; pi != NULL; pi = next_pi) {
1379 			next_pi = pi->pi_next;
1380 			if (pi->pi_AdvSendAdvertisements)
1381 				check_to_advertise(pi, START_FINAL_ADV);
1382 
1383 			phyint_delete(pi);
1384 		}
1385 
1386 		/*
1387 		 * Prevent fd leaks.  Everything gets re-opened at start-up
1388 		 * time.  0, 1, and 2 are closed and re-opened as
1389 		 * /dev/null, so we'll leave those open.
1390 		 */
1391 		closefrom(3);
1392 
1393 		logmsg(LOG_ERR, "SIGHUP: restart and reread config file\n");
1394 		(void) execv(argv0[0], argv0);
1395 		(void) unlink(PATH_PID);
1396 		_exit(0177);
1397 		/* NOTREACHED */
1398 	case SIGUSR1:
1399 		logmsg(LOG_DEBUG, "Printing configuration:\n");
1400 		phyint_print_all();
1401 		break;
1402 	case SIGINT:
1403 	case SIGTERM:
1404 	case SIGQUIT:
1405 		for (pi = phyints; pi != NULL; pi = next_pi) {
1406 			next_pi = pi->pi_next;
1407 			if (pi->pi_AdvSendAdvertisements)
1408 				check_to_advertise(pi, START_FINAL_ADV);
1409 
1410 			phyint_delete(pi);
1411 		}
1412 		(void) unlink(NDPD_SNMP_SOCKET);
1413 		(void) unlink(PATH_PID);
1414 		exit(0);
1415 		/* NOTREACHED */
1416 	case 255:
1417 		/*
1418 		 * Special "signal" from looback_ra_enqueue.
1419 		 * Handle any queued loopback router advertisements.
1420 		 */
1421 		loopback_ra_dequeue();
1422 		break;
1423 	default:
1424 		logmsg(LOG_ERR, "in_signal: unknown signal: %d\n", buf);
1425 	}
1426 }
1427 
1428 /*
1429  * Create pipe for signal delivery and set up signal handlers.
1430  */
1431 static void
1432 setup_eventpipe(void)
1433 {
1434 	int fds[2];
1435 	struct sigaction act;
1436 
1437 	if ((pipe(fds)) < 0) {
1438 		logperror("setup_eventpipe: pipe");
1439 		exit(1);
1440 	}
1441 	eventpipe_read = fds[0];
1442 	eventpipe_write = fds[1];
1443 	if (poll_add(eventpipe_read) == -1) {
1444 		exit(1);
1445 	}
1446 	act.sa_handler = sig_handler;
1447 	act.sa_flags = SA_RESTART;
1448 	(void) sigaction(SIGALRM, &act, NULL);
1449 
1450 	(void) sigset(SIGHUP, sig_handler);
1451 	(void) sigset(SIGUSR1, sig_handler);
1452 	(void) sigset(SIGTERM, sig_handler);
1453 	(void) sigset(SIGINT, sig_handler);
1454 	(void) sigset(SIGQUIT, sig_handler);
1455 }
1456 
1457 /*
1458  * Create a routing socket for receiving RTM_IFINFO messages and initialize
1459  * the routing socket message header and as much of the sockaddrs as possible.
1460  */
1461 static int
1462 setup_rtsock(void)
1463 {
1464 	int s;
1465 	int ret;
1466 	char *cp;
1467 	struct sockaddr_in6 *sin6;
1468 
1469 	s = socket(PF_ROUTE, SOCK_RAW, AF_INET6);
1470 	if (s == -1) {
1471 		logperror("socket(PF_ROUTE)");
1472 		exit(1);
1473 	}
1474 	ret = fcntl(s, F_SETFL, O_NDELAY|O_NONBLOCK);
1475 	if (ret < 0) {
1476 		logperror("fcntl(O_NDELAY)");
1477 		exit(1);
1478 	}
1479 	if (poll_add(s) == -1) {
1480 		exit(1);
1481 	}
1482 
1483 	/*
1484 	 * Allocate storage for the routing socket message.
1485 	 */
1486 	rt_msg = (struct rt_msghdr *)malloc(NDP_RTM_MSGLEN);
1487 	if (rt_msg == NULL) {
1488 		logperror("malloc");
1489 		exit(1);
1490 	}
1491 
1492 	/*
1493 	 * Initialize the routing socket message by zero-filling it and then
1494 	 * setting the fields where are constant through the lifetime of the
1495 	 * process.
1496 	 */
1497 	bzero(rt_msg, NDP_RTM_MSGLEN);
1498 	rt_msg->rtm_msglen = NDP_RTM_MSGLEN;
1499 	rt_msg->rtm_version = RTM_VERSION;
1500 	rt_msg->rtm_addrs = RTA_DST | RTA_GATEWAY | RTA_NETMASK | RTA_IFP;
1501 	rt_msg->rtm_pid = getpid();
1502 	if (rt_msg->rtm_pid < 0) {
1503 		logperror("getpid");
1504 		exit(1);
1505 	}
1506 
1507 	/*
1508 	 * The RTA_DST sockaddr does not change during the lifetime of the
1509 	 * process so it can be completely initialized at this time.
1510 	 */
1511 	cp = (char *)rt_msg + sizeof (struct rt_msghdr);
1512 	sin6 = (struct sockaddr_in6 *)cp;
1513 	sin6->sin6_family = AF_INET6;
1514 	sin6->sin6_addr = in6addr_any;
1515 
1516 	/*
1517 	 * Initialize the constant portion of the RTA_GATEWAY sockaddr.
1518 	 */
1519 	cp += sizeof (struct sockaddr_in6);
1520 	rta_gateway = (struct sockaddr_in6 *)cp;
1521 	rta_gateway->sin6_family = AF_INET6;
1522 
1523 	/*
1524 	 * The RTA_NETMASK sockaddr does not change during the lifetime of the
1525 	 * process so it can be completely initialized at this time.
1526 	 */
1527 	cp += sizeof (struct sockaddr_in6);
1528 	sin6 = (struct sockaddr_in6 *)cp;
1529 	sin6->sin6_family = AF_INET6;
1530 	sin6->sin6_addr = in6addr_any;
1531 
1532 	/*
1533 	 * Initialize the constant portion of the RTA_IFP sockaddr.
1534 	 */
1535 	cp += sizeof (struct sockaddr_in6);
1536 	rta_ifp = (struct sockaddr_dl *)cp;
1537 	rta_ifp->sdl_family = AF_LINK;
1538 
1539 	return (s);
1540 }
1541 
1542 static int
1543 setup_mibsock(void)
1544 {
1545 	int sock;
1546 	int ret;
1547 	int len;
1548 	struct sockaddr_un laddr;
1549 
1550 	sock = socket(AF_UNIX, SOCK_DGRAM, 0);
1551 	if (sock == -1) {
1552 		logperror("setup_mibsock: socket(AF_UNIX)");
1553 		exit(1);
1554 	}
1555 
1556 	bzero(&laddr, sizeof (laddr));
1557 	laddr.sun_family = AF_UNIX;
1558 
1559 	(void) strncpy(laddr.sun_path, NDPD_SNMP_SOCKET,
1560 	    sizeof (laddr.sun_path));
1561 	len = sizeof (struct sockaddr_un);
1562 
1563 	(void) unlink(NDPD_SNMP_SOCKET);
1564 	ret = bind(sock, (struct sockaddr *)&laddr, len);
1565 	if (ret < 0) {
1566 		logperror("setup_mibsock: bind\n");
1567 		exit(1);
1568 	}
1569 
1570 	ret = fcntl(sock, F_SETFL, O_NONBLOCK);
1571 	if (ret < 0) {
1572 		logperror("fcntl(O_NONBLOCK)");
1573 		exit(1);
1574 	}
1575 	if (poll_add(sock) == -1) {
1576 		exit(1);
1577 	}
1578 	return (sock);
1579 }
1580 
1581 /*
1582  * Retrieve one routing socket message. If RTM_IFINFO indicates
1583  * new phyint do a full scan of the interfaces. If RTM_IFINFO
1584  * indicates an existing phyint, only scan that phyint and associated
1585  * prefixes.
1586  */
1587 static void
1588 process_rtsock(int rtsock)
1589 {
1590 	int n;
1591 #define	MSG_SIZE	2048/8
1592 	int64_t msg[MSG_SIZE];
1593 	struct rt_msghdr *rtm;
1594 	struct if_msghdr *ifm;
1595 	struct phyint *pi;
1596 	struct prefix *pr;
1597 	boolean_t need_initifs = _B_FALSE;
1598 	boolean_t need_ifscan = _B_FALSE;
1599 	int64_t	ifscan_msg[10][MSG_SIZE];
1600 	int ifscan_index = 0;
1601 	int i;
1602 
1603 	/* Empty the rtsock and coealesce all the work that we have */
1604 	while (ifscan_index < 10) {
1605 		n = read(rtsock, msg, sizeof (msg));
1606 		if (n <= 0) {
1607 			/* No more messages */
1608 			break;
1609 		}
1610 		rtm = (struct rt_msghdr *)msg;
1611 		if (rtm->rtm_version != RTM_VERSION) {
1612 			logmsg(LOG_ERR,
1613 			    "process_rtsock: version %d not understood\n",
1614 			    rtm->rtm_version);
1615 			return;
1616 		}
1617 		switch (rtm->rtm_type) {
1618 		case RTM_NEWADDR:
1619 		case RTM_DELADDR:
1620 			/*
1621 			 * Some logical interface has changed - have to scan
1622 			 * everything to determine what actually changed.
1623 			 */
1624 			if (debug & D_IFSCAN) {
1625 				logmsg(LOG_DEBUG, "process_rtsock: "
1626 				    "message %d\n", rtm->rtm_type);
1627 			}
1628 			need_initifs = _B_TRUE;
1629 			break;
1630 		case RTM_IFINFO:
1631 			need_ifscan = _B_TRUE;
1632 			(void) memcpy(ifscan_msg[ifscan_index], rtm,
1633 			    sizeof (msg));
1634 			ifscan_index++;
1635 			/* Handled below */
1636 			break;
1637 		default:
1638 			/* Not interesting */
1639 			break;
1640 		}
1641 	}
1642 	/*
1643 	 * If we do full scan i.e initifs, we don't need to
1644 	 * scan a particular interface as we should have
1645 	 * done that as part of initifs.
1646 	 */
1647 	if (need_initifs) {
1648 		initifs(_B_FALSE);
1649 		return;
1650 	}
1651 
1652 	if (!need_ifscan)
1653 		return;
1654 
1655 	for (i = 0; i < ifscan_index; i++) {
1656 		ifm = (struct if_msghdr *)ifscan_msg[i];
1657 		if (debug & D_IFSCAN)
1658 			logmsg(LOG_DEBUG, "process_rtsock: index %d\n",
1659 			    ifm->ifm_index);
1660 
1661 		pi = phyint_lookup_on_index(ifm->ifm_index);
1662 		if (pi == NULL) {
1663 			/*
1664 			 * A new physical interface. Do a full scan of the
1665 			 * to catch any new logical interfaces.
1666 			 */
1667 			initifs(_B_FALSE);
1668 			return;
1669 		}
1670 
1671 		if (ifm->ifm_flags != pi->pi_flags) {
1672 			if (debug & D_IFSCAN) {
1673 				logmsg(LOG_DEBUG, "process_rtsock: clr for "
1674 				    "%s old flags 0x%x new flags 0x%x\n",
1675 				    pi->pi_name, pi->pi_flags, ifm->ifm_flags);
1676 			}
1677 		}
1678 
1679 
1680 		/*
1681 		 * Mark the interfaces so that we can find phyints and prefixes
1682 		 * which have disappeared from the kernel.
1683 		 * if_process will set pr_in_use when it finds the
1684 		 * interface in the kernel.
1685 		 * Before re-examining the state of the interfaces,
1686 		 * PI_PRESENT should be cleared from pi_kernel_state.
1687 		 */
1688 		pi->pi_kernel_state &= ~PI_PRESENT;
1689 		for (pr = pi->pi_prefix_list; pr != NULL; pr = pr->pr_next) {
1690 			pr->pr_in_use = _B_FALSE;
1691 		}
1692 
1693 		if (ifsock < 0) {
1694 			ifsock = socket(AF_INET6, SOCK_DGRAM, 0);
1695 			if (ifsock < 0) {
1696 				logperror("process_rtsock: socket");
1697 				return;
1698 			}
1699 		}
1700 		if_process(ifsock, pi->pi_name, _B_FALSE);
1701 		for (pr = pi->pi_prefix_list; pr != NULL; pr = pr->pr_next) {
1702 			if_process(ifsock, pr->pr_name, _B_FALSE);
1703 		}
1704 		/*
1705 		 * If interface (still) exists in kernel, set
1706 		 * pi_state to indicate that.
1707 		 */
1708 		if (pi->pi_kernel_state & PI_PRESENT) {
1709 			pi->pi_state |= PI_PRESENT;
1710 		}
1711 		check_if_removed(pi);
1712 		if (show_ifs)
1713 			phyint_print_all();
1714 	}
1715 }
1716 
1717 static void
1718 process_mibsock(int mibsock)
1719 {
1720 	struct phyint *pi;
1721 	socklen_t fromlen;
1722 	struct sockaddr_un from;
1723 	ndpd_info_t ndpd_info;
1724 	ssize_t len;
1725 	int command;
1726 
1727 	fromlen = (socklen_t)sizeof (from);
1728 	len = recvfrom(mibsock, &command, sizeof (int), 0,
1729 	    (struct sockaddr *)&from, &fromlen);
1730 
1731 	if (len < sizeof (int) || command != NDPD_SNMP_INFO_REQ) {
1732 		logperror("process_mibsock: bad command \n");
1733 		return;
1734 	}
1735 
1736 	ndpd_info.info_type = NDPD_SNMP_INFO_RESPONSE;
1737 	ndpd_info.info_version = NDPD_SNMP_INFO_VER;
1738 	ndpd_info.info_num_of_phyints = num_of_phyints;
1739 
1740 	(void) sendto(mibsock, &ndpd_info, sizeof (ndpd_info_t), 0,
1741 	    (struct sockaddr *)&from, fromlen);
1742 
1743 	for (pi = phyints; pi != NULL; pi = pi->pi_next) {
1744 		int prefixes;
1745 		int routers;
1746 		struct prefix   *prefix_list;
1747 		struct router   *router_list;
1748 		ndpd_phyint_info_t phyint;
1749 		ndpd_prefix_info_t prefix;
1750 		ndpd_router_info_t router;
1751 		/*
1752 		 * get number of prefixes
1753 		 */
1754 		routers = 0;
1755 		prefixes = 0;
1756 		prefix_list = pi->pi_prefix_list;
1757 		while (prefix_list != NULL) {
1758 			prefixes++;
1759 			prefix_list = prefix_list->pr_next;
1760 		}
1761 
1762 		/*
1763 		 * get number of routers
1764 		 */
1765 		router_list = pi->pi_router_list;
1766 		while (router_list != NULL) {
1767 			routers++;
1768 			router_list = router_list->dr_next;
1769 		}
1770 
1771 		phyint.phyint_info_type = NDPD_PHYINT_INFO;
1772 		phyint.phyint_info_version = NDPD_PHYINT_INFO_VER;
1773 		phyint.phyint_index = pi->pi_index;
1774 		bcopy(pi->pi_config,
1775 		    phyint.phyint_config, I_IFSIZE);
1776 		phyint.phyint_num_of_prefixes = prefixes;
1777 		phyint.phyint_num_of_routers = routers;
1778 		(void) sendto(mibsock, &phyint, sizeof (phyint), 0,
1779 		    (struct sockaddr *)&from, fromlen);
1780 
1781 		/*
1782 		 * Copy prefix information
1783 		 */
1784 
1785 		prefix_list = pi->pi_prefix_list;
1786 		while (prefix_list != NULL) {
1787 			prefix.prefix_info_type = NDPD_PREFIX_INFO;
1788 			prefix.prefix_info_version = NDPD_PREFIX_INFO_VER;
1789 			prefix.prefix_prefix = prefix_list->pr_prefix;
1790 			prefix.prefix_len = prefix_list->pr_prefix_len;
1791 			prefix.prefix_flags = prefix_list->pr_flags;
1792 			prefix.prefix_phyint_index = pi->pi_index;
1793 			prefix.prefix_ValidLifetime =
1794 			    prefix_list->pr_ValidLifetime;
1795 			prefix.prefix_PreferredLifetime =
1796 			    prefix_list->pr_PreferredLifetime;
1797 			prefix.prefix_OnLinkLifetime =
1798 			    prefix_list->pr_OnLinkLifetime;
1799 			prefix.prefix_OnLinkFlag =
1800 			    prefix_list->pr_OnLinkFlag;
1801 			prefix.prefix_AutonomousFlag =
1802 			    prefix_list->pr_AutonomousFlag;
1803 			(void) sendto(mibsock, &prefix, sizeof (prefix), 0,
1804 			    (struct sockaddr *)&from, fromlen);
1805 			prefix_list = prefix_list->pr_next;
1806 		}
1807 		/*
1808 		 * Copy router information
1809 		 */
1810 		router_list = pi->pi_router_list;
1811 		while (router_list != NULL) {
1812 			router.router_info_type = NDPD_ROUTER_INFO;
1813 			router.router_info_version = NDPD_ROUTER_INFO_VER;
1814 			router.router_address = router_list->dr_address;
1815 			router.router_lifetime = router_list->dr_lifetime;
1816 			router.router_phyint_index = pi->pi_index;
1817 			(void) sendto(mibsock, &router, sizeof (router), 0,
1818 			    (struct sockaddr *)&from, fromlen);
1819 			router_list = router_list->dr_next;
1820 		}
1821 	}
1822 }
1823 
1824 /*
1825  * Check whether the address formed by pr->pr_prefix and pi_token
1826  * exists in the kernel. Cannot call SIOCTMYADDR/ONLINK as it
1827  * does not check for down addresses. This function should not
1828  * be called for onlink prefixes.
1829  */
1830 static boolean_t
1831 is_address_present(struct phyint *pi, struct prefix *pr, uint64_t flags)
1832 {
1833 	int s;
1834 	in6_addr_t addr, *token;
1835 	int i;
1836 	int ret;
1837 	struct sockaddr_in6 sin6;
1838 
1839 	s = socket(AF_INET6, SOCK_DGRAM, 0);
1840 	if (s < 0) {
1841 		logperror("is_address_present: socket");
1842 		/*
1843 		 * By returning B_TRUE, we make the caller delete
1844 		 * the prefix from the internal table. In the worst
1845 		 * case the next RA will create the prefix.
1846 		 */
1847 		return (_B_TRUE);
1848 	}
1849 	if (flags & IFF_TEMPORARY)
1850 		token = &pi->pi_tmp_token;
1851 	else
1852 		token = &pi->pi_token;
1853 	for (i = 0; i < 16; i++) {
1854 		/*
1855 		 * prefix_create ensures that pr_prefix has all-zero
1856 		 * bits after prefixlen.
1857 		 */
1858 		addr.s6_addr[i] = pr->pr_prefix.s6_addr[i] | token->s6_addr[i];
1859 	}
1860 	(void) memset(&sin6, 0, sizeof (struct sockaddr_in6));
1861 	sin6.sin6_family = AF_INET6;
1862 	sin6.sin6_addr = addr;
1863 	ret = bind(s, (struct sockaddr *)&sin6, sizeof (struct sockaddr_in6));
1864 	(void) close(s);
1865 	if (ret < 0 && errno == EADDRNOTAVAIL)
1866 		return (_B_FALSE);
1867 	else
1868 		return (_B_TRUE);
1869 }
1870 
1871 /*
1872  * Look if the phyint or one of its prefixes have been removed from
1873  * the kernel and take appropriate action.
1874  * Uses {pi,pr}_in_use.
1875  */
1876 static void
1877 check_if_removed(struct phyint *pi)
1878 {
1879 	struct prefix *pr;
1880 	struct prefix *next_pr;
1881 
1882 	/*
1883 	 * Detect phyints that have been removed from the kernel.
1884 	 * Since we can't recreate it here (would require ifconfig plumb
1885 	 * logic) we just terminate use of that phyint.
1886 	 */
1887 	if (!(pi->pi_kernel_state & PI_PRESENT) &&
1888 	    (pi->pi_state & PI_PRESENT)) {
1889 		logmsg(LOG_ERR, "Interface %s has been removed from kernel. "
1890 		    "in.ndpd will no longer use it\n", pi->pi_name);
1891 		/*
1892 		 * Clear state so that should the phyint reappear
1893 		 * we will start with initial advertisements or
1894 		 * solicitations.
1895 		 */
1896 		phyint_cleanup(pi);
1897 	}
1898 	/*
1899 	 * Detect prefixes which are removed.
1900 	 *
1901 	 * We remove the prefix in all of the following cases :
1902 	 *
1903 	 * 1) Static prefixes are not the ones we create. So,
1904 	 *    just remove it from our tables.
1905 	 *
1906 	 * 2) On-link prefixes potentially move to a different
1907 	 *    phyint during failover. As it does not have
1908 	 *    an address, we can't use the logic in is_address_present
1909 	 *    to detect whether it is present in the kernel or not.
1910 	 *    Thus when it is manually removed we don't recreate it.
1911 	 *
1912 	 * 3) If there is a token mis-match and this prefix is not
1913 	 *    in the kernel, it means we don't need this prefix on
1914 	 *    this interface anymore. It must have been moved to a
1915 	 *    different interface by in.mpathd. This normally
1916 	 *    happens after a failover followed by a failback (or
1917 	 *    another failover) and we re-read the network
1918 	 *    configuration. For the failover from A to B, we would
1919 	 *    have created state on B about A's address, which will
1920 	 *    not be in use after the subsequent failback. So, we
1921 	 *    remove that prefix here.
1922 	 *
1923 	 * 4) If the physical interface is not present, then remove
1924 	 *    the prefix. In the cases where we are advertising
1925 	 *    prefixes, the state is kept in advertisement prefix and
1926 	 *    hence we can delete the prefix.
1927 	 *
1928 	 * 5) Similar to case (3), when we failover from A to B, the
1929 	 *    prefix in A will not be in use as it has been moved to B.
1930 	 *    We will delete it from our tables and recreate it when
1931 	 *    it fails back. is_address_present makes sure that the
1932 	 *    address is still valid in kernel.
1933 	 *
1934 	 * If none of the above is true, we recreate the prefix as it
1935 	 * has been manually removed. We do it only when the interface
1936 	 * is not FAILED or INACTIVE or OFFLINE.
1937 	 */
1938 	for (pr = pi->pi_prefix_list; pr != NULL; pr = next_pr) {
1939 		next_pr = pr->pr_next;
1940 		if (!pr->pr_in_use) {
1941 			/* Clear PR_AUTO and PR_ONLINK */
1942 			pr->pr_kernel_state &= PR_STATIC;
1943 			if ((pr->pr_state & PR_STATIC) ||
1944 			    !(pr->pr_state & PR_AUTO) ||
1945 			    !(prefix_token_match(pi, pr, pr->pr_flags)) ||
1946 			    (!(pi->pi_kernel_state & PI_PRESENT)) ||
1947 			    (is_address_present(pi, pr, pr->pr_flags))) {
1948 				prefix_delete(pr);
1949 			} else if (!(pi->pi_flags &
1950 			    (IFF_FAILED|IFF_INACTIVE|IFF_OFFLINE)) &&
1951 			    pr->pr_state != pr->pr_kernel_state) {
1952 				pr->pr_name[0] = '\0';
1953 				logmsg(LOG_INFO, "Prefix manually removed "
1954 				    "on %s - recreating it!\n",
1955 				    pi->pi_name);
1956 				prefix_update_k(pr);
1957 			}
1958 		}
1959 	}
1960 }
1961 
1962 
1963 /*
1964  * Queuing mechanism for router advertisements that are sent by in.ndpd
1965  * and that also need to be processed by in.ndpd.
1966  * Uses "signal number" 255 to indicate to the main poll loop
1967  * that there is something to dequeue and send to incomining_ra().
1968  */
1969 struct raq {
1970 	struct raq	*raq_next;
1971 	struct phyint	*raq_pi;
1972 	int		raq_packetlen;
1973 	uchar_t		*raq_packet;
1974 };
1975 static struct raq *raq_head = NULL;
1976 
1977 /*
1978  * Allocate a struct raq and memory for the packet.
1979  * Send signal 255 to have poll dequeue.
1980  */
1981 static void
1982 loopback_ra_enqueue(struct phyint *pi, struct nd_router_advert *ra, int len)
1983 {
1984 	struct raq *raq;
1985 	struct raq **raqp;
1986 
1987 	if (no_loopback)
1988 		return;
1989 
1990 	if (debug & D_PKTOUT)
1991 		logmsg(LOG_DEBUG, "loopback_ra_enqueue for %s\n", pi->pi_name);
1992 
1993 	raq = calloc(sizeof (struct raq), 1);
1994 	if (raq == NULL) {
1995 		logmsg(LOG_ERR, "loopback_ra_enqueue: out of memory\n");
1996 		return;
1997 	}
1998 	raq->raq_packet = malloc(len);
1999 	if (raq->raq_packet == NULL) {
2000 		free(raq);
2001 		logmsg(LOG_ERR, "loopback_ra_enqueue: out of memory\n");
2002 		return;
2003 	}
2004 	bcopy(ra, raq->raq_packet, len);
2005 	raq->raq_packetlen = len;
2006 	raq->raq_pi = pi;
2007 
2008 	/* Tail insert */
2009 	raqp = &raq_head;
2010 	while (*raqp != NULL)
2011 		raqp = &((*raqp)->raq_next);
2012 	*raqp = raq;
2013 
2014 	/* Signal for poll loop */
2015 	sig_handler(255);
2016 }
2017 
2018 /*
2019  * Dequeue and process all queued advertisements.
2020  */
2021 static void
2022 loopback_ra_dequeue(void)
2023 {
2024 	struct sockaddr_in6 from = IN6ADDR_LOOPBACK_INIT;
2025 	struct raq *raq;
2026 
2027 	if (debug & D_PKTIN)
2028 		logmsg(LOG_DEBUG, "loopback_ra_dequeue()\n");
2029 
2030 	while ((raq = raq_head) != NULL) {
2031 		raq_head = raq->raq_next;
2032 		raq->raq_next = NULL;
2033 
2034 		if (debug & D_PKTIN) {
2035 			logmsg(LOG_DEBUG, "loopback_ra_dequeue for %s\n",
2036 			    raq->raq_pi->pi_name);
2037 		}
2038 
2039 		incoming_ra(raq->raq_pi,
2040 		    (struct nd_router_advert *)raq->raq_packet,
2041 		    raq->raq_packetlen, &from, _B_TRUE);
2042 		free(raq->raq_packet);
2043 		free(raq);
2044 	}
2045 }
2046 
2047 
2048 static void
2049 usage(char *cmd)
2050 {
2051 	(void) fprintf(stderr,
2052 	    "usage: %s [ -adt ] [-f <config file>]\n", cmd);
2053 }
2054 
2055 int
2056 main(int argc, char *argv[])
2057 {
2058 	int i;
2059 	struct phyint *pi;
2060 	int c;
2061 	char *config_file = PATH_NDPD_CONF;
2062 	boolean_t file_required = _B_FALSE;
2063 
2064 	argv0 = argv;
2065 	srandom(gethostid());
2066 	(void) umask(0022);
2067 
2068 	while ((c = getopt(argc, argv, "adD:ntIf:")) != EOF) {
2069 		switch (c) {
2070 		case 'a':
2071 			/*
2072 			 * The StatelessAddrConf variable in ndpd.conf, if
2073 			 * present, will override this setting.
2074 			 */
2075 			ifdefaults[I_StatelessAddrConf].cf_value = 0;
2076 			break;
2077 		case 'd':
2078 			debug = D_ALL;
2079 			break;
2080 		case 'D':
2081 			i = strtol((char *)optarg, NULL, 0);
2082 			if (i == 0) {
2083 				(void) fprintf(stderr, "Bad debug flags: %s\n",
2084 				    (char *)optarg);
2085 				exit(1);
2086 			}
2087 			debug |= i;
2088 			break;
2089 		case 'n':
2090 			no_loopback = 1;
2091 			break;
2092 		case 'I':
2093 			show_ifs = 1;
2094 			break;
2095 		case 't':
2096 			debug |= D_PKTIN | D_PKTOUT | D_PKTBAD;
2097 			break;
2098 		case 'f':
2099 			config_file = (char *)optarg;
2100 			file_required = _B_TRUE;
2101 			break;
2102 		case '?':
2103 			usage(argv[0]);
2104 			exit(1);
2105 		}
2106 	}
2107 
2108 	if (parse_config(config_file, file_required) == -1)
2109 		exit(2);
2110 
2111 	if (show_ifs)
2112 		phyint_print_all();
2113 
2114 	if (debug == 0) {
2115 		initlog();
2116 	}
2117 
2118 	setup_eventpipe();
2119 	rtsock = setup_rtsock();
2120 	mibsock = setup_mibsock();
2121 	timer_init();
2122 	initifs(_B_TRUE);
2123 
2124 	check_daemonize();
2125 
2126 	for (;;) {
2127 		if (poll(pollfds, pollfd_num, -1) < 0) {
2128 			if (errno == EINTR)
2129 				continue;
2130 			logperror("main: poll");
2131 			exit(1);
2132 		}
2133 		for (i = 0; i < pollfd_num; i++) {
2134 			if (!(pollfds[i].revents & POLLIN))
2135 				continue;
2136 			if (pollfds[i].fd == eventpipe_read) {
2137 				in_signal(eventpipe_read);
2138 				break;
2139 			}
2140 			if (pollfds[i].fd == rtsock) {
2141 				process_rtsock(rtsock);
2142 				break;
2143 			}
2144 			if (pollfds[i].fd == mibsock) {
2145 				process_mibsock(mibsock);
2146 				break;
2147 			}
2148 			/*
2149 			 * Run timer routine to advance clock if more than
2150 			 * half a second since the clock was advanced.
2151 			 * This limits CPU usage under severe packet
2152 			 * arrival rates but it creates a slight inaccuracy
2153 			 * in the timer mechanism.
2154 			 */
2155 			conditional_run_timeouts(500U);
2156 			for (pi = phyints; pi != NULL; pi = pi->pi_next) {
2157 				if (pollfds[i].fd == pi->pi_sock) {
2158 					in_data(pi);
2159 					break;
2160 				}
2161 			}
2162 		}
2163 	}
2164 	/* NOTREACHED */
2165 	return (0);
2166 }
2167 
2168 /*
2169  * LOGGER
2170  */
2171 
2172 static boolean_t logging = _B_FALSE;
2173 
2174 static void
2175 initlog(void)
2176 {
2177 	logging = _B_TRUE;
2178 	openlog("in.ndpd", LOG_PID | LOG_CONS, LOG_DAEMON);
2179 }
2180 
2181 /* Print the date/time without a trailing carridge return */
2182 static void
2183 fprintdate(FILE *file)
2184 {
2185 	char buf[BUFSIZ];
2186 	struct tm tms;
2187 	time_t now;
2188 
2189 	now = time(NULL);
2190 	(void) localtime_r(&now, &tms);
2191 	(void) strftime(buf, sizeof (buf), "%h %d %X", &tms);
2192 	(void) fprintf(file, "%s ", buf);
2193 }
2194 
2195 /* PRINTFLIKE2 */
2196 void
2197 logmsg(int level, const char *fmt, ...)
2198 {
2199 	va_list ap;
2200 	va_start(ap, fmt);
2201 
2202 	if (logging) {
2203 		vsyslog(level, fmt, ap);
2204 	} else {
2205 		fprintdate(stderr);
2206 		(void) vfprintf(stderr, fmt, ap);
2207 	}
2208 	va_end(ap);
2209 }
2210 
2211 void
2212 logperror(const char *str)
2213 {
2214 	if (logging) {
2215 		syslog(LOG_ERR, "%s: %m\n", str);
2216 	} else {
2217 		fprintdate(stderr);
2218 		(void) fprintf(stderr, "%s: %s\n", str, strerror(errno));
2219 	}
2220 }
2221 
2222 void
2223 logperror_pi(const struct phyint *pi, const char *str)
2224 {
2225 	if (logging) {
2226 		syslog(LOG_ERR, "%s (interface %s): %m\n",
2227 		    str, pi->pi_name);
2228 	} else {
2229 		fprintdate(stderr);
2230 		(void) fprintf(stderr, "%s (interface %s): %s\n",
2231 		    str, pi->pi_name, strerror(errno));
2232 	}
2233 }
2234 
2235 void
2236 logperror_pr(const struct prefix *pr, const char *str)
2237 {
2238 	if (logging) {
2239 		syslog(LOG_ERR, "%s (prefix %s if %s): %m\n",
2240 		    str, pr->pr_name, pr->pr_physical->pi_name);
2241 	} else {
2242 		fprintdate(stderr);
2243 		(void) fprintf(stderr, "%s (prefix %s if %s): %s\n",
2244 		    str, pr->pr_name, pr->pr_physical->pi_name,
2245 		    strerror(errno));
2246 	}
2247 }
2248