1 /* $KAME: name6.c,v 1.25 2000/06/26 16:44:40 itojun Exp $ */ 2 3 /* 4 * Copyright (C) 1995, 1996, 1997, 1998, and 1999 WIDE Project. 5 * All rights reserved. 6 * 7 * Redistribution and use in source and binary forms, with or without 8 * modification, are permitted provided that the following conditions 9 * are met: 10 * 1. Redistributions of source code must retain the above copyright 11 * notice, this list of conditions and the following disclaimer. 12 * 2. Redistributions in binary form must reproduce the above copyright 13 * notice, this list of conditions and the following disclaimer in the 14 * documentation and/or other materials provided with the distribution. 15 * 3. Neither the name of the project nor the names of its contributors 16 * may be used to endorse or promote products derived from this software 17 * without specific prior written permission. 18 * 19 * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND 20 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22 * ARE DISCLAIMED. IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE 23 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29 * SUCH DAMAGE. 30 */ 31 /* 32 * ++Copyright++ 1985, 1988, 1993 33 * - 34 * Copyright (c) 1985, 1988, 1993 35 * The Regents of the University of California. All rights reserved. 36 * 37 * Redistribution and use in source and binary forms, with or without 38 * modification, are permitted provided that the following conditions 39 * are met: 40 * 1. Redistributions of source code must retain the above copyright 41 * notice, this list of conditions and the following disclaimer. 42 * 2. Redistributions in binary form must reproduce the above copyright 43 * notice, this list of conditions and the following disclaimer in the 44 * documentation and/or other materials provided with the distribution. 45 * 3. All advertising materials mentioning features or use of this software 46 * must display the following acknowledgement: 47 * This product includes software developed by the University of 48 * California, Berkeley and its contributors. 49 * 4. Neither the name of the University nor the names of its contributors 50 * may be used to endorse or promote products derived from this software 51 * without specific prior written permission. 52 * 53 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 54 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 55 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 56 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 57 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 58 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 59 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 60 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 61 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 62 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 63 * SUCH DAMAGE. 64 * - 65 * Portions Copyright (c) 1993 by Digital Equipment Corporation. 66 * 67 * Permission to use, copy, modify, and distribute this software for any 68 * purpose with or without fee is hereby granted, provided that the above 69 * copyright notice and this permission notice appear in all copies, and that 70 * the name of Digital Equipment Corporation not be used in advertising or 71 * publicity pertaining to distribution of the document or software without 72 * specific, written prior permission. 73 * 74 * THE SOFTWARE IS PROVIDED "AS IS" AND DIGITAL EQUIPMENT CORP. DISCLAIMS ALL 75 * WARRANTIES WITH REGARD TO THIS SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES 76 * OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL DIGITAL EQUIPMENT 77 * CORPORATION BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL 78 * DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR 79 * PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS 80 * ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS 81 * SOFTWARE. 82 * - 83 * --Copyright-- 84 */ 85 86 /* 87 * Atsushi Onoe <onoe@sm.sony.co.jp> 88 */ 89 90 #include <sys/cdefs.h> 91 __FBSDID("$FreeBSD$"); 92 93 #include "namespace.h" 94 #include <sys/param.h> 95 #include <sys/socket.h> 96 #include <sys/time.h> 97 #include <sys/queue.h> 98 #include <netinet/in.h> 99 #ifdef INET6 100 #include <net/if.h> 101 #include <net/if_var.h> 102 #include <sys/sysctl.h> 103 #include <sys/ioctl.h> 104 #include <netinet6/in6_var.h> /* XXX */ 105 #endif 106 107 #include <arpa/inet.h> 108 #include <arpa/nameser.h> 109 110 #include <errno.h> 111 #include <netdb.h> 112 #include <resolv.h> 113 #include <stdio.h> 114 #include <stdlib.h> 115 #include <string.h> 116 #include <stdarg.h> 117 #include <nsswitch.h> 118 #include <unistd.h> 119 #include "un-namespace.h" 120 #include "netdb_private.h" 121 #include "res_private.h" 122 123 #ifndef MAXALIASES 124 #define MAXALIASES 10 125 #endif 126 #ifndef MAXADDRS 127 #define MAXADDRS 20 128 #endif 129 #ifndef MAXDNAME 130 #define MAXDNAME 1025 131 #endif 132 133 #ifdef INET6 134 #define ADDRLEN(af) ((af) == AF_INET6 ? sizeof(struct in6_addr) : \ 135 sizeof(struct in_addr)) 136 #else 137 #define ADDRLEN(af) sizeof(struct in_addr) 138 #endif 139 140 #define MAPADDR(ab, ina) \ 141 do { \ 142 memcpy(&(ab)->map_inaddr, ina, sizeof(struct in_addr)); \ 143 memset((ab)->map_zero, 0, sizeof((ab)->map_zero)); \ 144 memset((ab)->map_one, 0xff, sizeof((ab)->map_one)); \ 145 } while (0) 146 #define MAPADDRENABLED(flags) \ 147 (((flags) & AI_V4MAPPED) || \ 148 (((flags) & AI_V4MAPPED_CFG))) 149 150 union inx_addr { 151 struct in_addr in_addr; 152 #ifdef INET6 153 struct in6_addr in6_addr; 154 #endif 155 struct { 156 u_char mau_zero[10]; 157 u_char mau_one[2]; 158 struct in_addr mau_inaddr; 159 } map_addr_un; 160 #define map_zero map_addr_un.mau_zero 161 #define map_one map_addr_un.mau_one 162 #define map_inaddr map_addr_un.mau_inaddr 163 }; 164 165 struct policyqueue { 166 TAILQ_ENTRY(policyqueue) pc_entry; 167 #ifdef INET6 168 struct in6_addrpolicy pc_policy; 169 #endif 170 }; 171 TAILQ_HEAD(policyhead, policyqueue); 172 173 #define AIO_SRCFLAG_DEPRECATED 0x1 174 175 struct hp_order { 176 union { 177 struct sockaddr_storage aiou_ss; 178 struct sockaddr aiou_sa; 179 } aio_src_un; 180 #define aio_srcsa aio_src_un.aiou_sa 181 u_int32_t aio_srcflag; 182 int aio_srcscope; 183 int aio_dstscope; 184 struct policyqueue *aio_srcpolicy; 185 struct policyqueue *aio_dstpolicy; 186 union { 187 struct sockaddr_storage aiou_ss; 188 struct sockaddr aiou_sa; 189 } aio_un; 190 #define aio_sa aio_un.aiou_sa 191 int aio_matchlen; 192 char *aio_h_addr; 193 }; 194 195 static struct hostent *_hpcopy(struct hostent *, int *); 196 static struct hostent *_hpaddr(int, const char *, void *, int *); 197 #ifdef INET6 198 static struct hostent *_hpmerge(struct hostent *, struct hostent *, int *); 199 static struct hostent *_hpmapv6(struct hostent *, int *); 200 #endif 201 static struct hostent *_hpsort(struct hostent *, res_state); 202 203 static struct hostent *_hpreorder(struct hostent *); 204 static int get_addrselectpolicy(struct policyhead *); 205 static void free_addrselectpolicy(struct policyhead *); 206 static struct policyqueue *match_addrselectpolicy(struct sockaddr *, 207 struct policyhead *); 208 static void set_source(struct hp_order *, struct policyhead *); 209 static int matchlen(struct sockaddr *, struct sockaddr *); 210 static int comp_dst(const void *, const void *); 211 static int gai_addr2scopetype(struct sockaddr *); 212 213 /* 214 * Functions defined in RFC2553 215 * getipnodebyname, getipnodebyaddr, freehostent 216 */ 217 218 struct hostent * 219 getipnodebyname(const char *name, int af, int flags, int *errp) 220 { 221 struct hostent *hp; 222 union inx_addr addrbuf; 223 res_state statp; 224 u_long options; 225 226 switch (af) { 227 case AF_INET: 228 #ifdef INET6 229 case AF_INET6: 230 #endif 231 break; 232 default: 233 *errp = NO_RECOVERY; 234 return NULL; 235 } 236 237 if (flags & AI_ADDRCONFIG) { 238 int s; 239 240 if ((s = _socket(af, SOCK_DGRAM, 0)) < 0) 241 return NULL; 242 /* 243 * TODO: 244 * Note that implementation dependent test for address 245 * configuration should be done everytime called 246 * (or apropriate interval), 247 * because addresses will be dynamically assigned or deleted. 248 */ 249 _close(s); 250 } 251 252 #ifdef INET6 253 /* special case for literal address */ 254 if (inet_pton(AF_INET6, name, &addrbuf) == 1) { 255 if (af != AF_INET6) { 256 *errp = HOST_NOT_FOUND; 257 return NULL; 258 } 259 return _hpaddr(af, name, &addrbuf, errp); 260 } 261 #endif 262 if (inet_aton(name, (struct in_addr *)&addrbuf) == 1) { 263 if (af != AF_INET) { 264 if (MAPADDRENABLED(flags)) { 265 MAPADDR(&addrbuf, &addrbuf.in_addr); 266 } else { 267 *errp = HOST_NOT_FOUND; 268 return NULL; 269 } 270 } 271 return _hpaddr(af, name, &addrbuf, errp); 272 } 273 274 275 statp = __res_state(); 276 if ((statp->options & RES_INIT) == 0) { 277 if (res_ninit(statp) < 0) { 278 *errp = NETDB_INTERNAL; 279 return NULL; 280 } 281 } 282 283 options = statp->options; 284 statp->options &= ~RES_USE_INET6; 285 286 hp = gethostbyname2(name, af); 287 hp = _hpcopy(hp, errp); 288 289 #ifdef INET6 290 if (af == AF_INET6 && ((flags & AI_ALL) || hp == NULL) && 291 MAPADDRENABLED(flags)) { 292 struct hostent *hp2 = gethostbyname2(name, AF_INET); 293 if (hp == NULL) 294 if (hp2 == NULL) 295 *errp = statp->res_h_errno; 296 else 297 hp = _hpmapv6(hp2, errp); 298 else { 299 if (hp2 && strcmp(hp->h_name, hp2->h_name) == 0) { 300 struct hostent *hpb = hp; 301 hp = _hpmerge(hpb, hp2, errp); 302 freehostent(hpb); 303 } 304 } 305 } 306 #endif 307 308 if (hp == NULL) 309 *errp = statp->res_h_errno; 310 311 statp->options = options; 312 return _hpreorder(_hpsort(hp, statp)); 313 } 314 315 struct hostent * 316 getipnodebyaddr(const void *src, size_t len, int af, int *errp) 317 { 318 struct hostent *hp; 319 res_state statp; 320 u_long options; 321 322 #ifdef INET6 323 struct in6_addr addrbuf; 324 #else 325 struct in_addr addrbuf; 326 #endif 327 328 switch (af) { 329 case AF_INET: 330 if (len != sizeof(struct in_addr)) { 331 *errp = NO_RECOVERY; 332 return NULL; 333 } 334 if ((long)src & ~(sizeof(struct in_addr) - 1)) { 335 memcpy(&addrbuf, src, len); 336 src = &addrbuf; 337 } 338 if (((struct in_addr *)src)->s_addr == 0) 339 return NULL; 340 break; 341 #ifdef INET6 342 case AF_INET6: 343 if (len != sizeof(struct in6_addr)) { 344 *errp = NO_RECOVERY; 345 return NULL; 346 } 347 if ((long)src & ~(sizeof(struct in6_addr) / 2 - 1)) { /*XXX*/ 348 memcpy(&addrbuf, src, len); 349 src = &addrbuf; 350 } 351 if (IN6_IS_ADDR_UNSPECIFIED((struct in6_addr *)src)) 352 return NULL; 353 if (IN6_IS_ADDR_V4MAPPED((struct in6_addr *)src) 354 || IN6_IS_ADDR_V4COMPAT((struct in6_addr *)src)) { 355 src = (char *)src + 356 (sizeof(struct in6_addr) - sizeof(struct in_addr)); 357 af = AF_INET; 358 len = sizeof(struct in_addr); 359 } 360 break; 361 #endif 362 default: 363 *errp = NO_RECOVERY; 364 return NULL; 365 } 366 367 statp = __res_state(); 368 if ((statp->options & RES_INIT) == 0) { 369 if (res_ninit(statp) < 0) { 370 RES_SET_H_ERRNO(statp, NETDB_INTERNAL); 371 return NULL; 372 } 373 } 374 375 options = statp->options; 376 statp->options &= ~RES_USE_INET6; 377 378 hp = gethostbyaddr(src, len, af); 379 if (hp == NULL) 380 *errp = statp->res_h_errno; 381 382 statp->options = options; 383 return (_hpcopy(hp, errp)); 384 } 385 386 void 387 freehostent(struct hostent *ptr) 388 { 389 free(ptr); 390 } 391 392 /* 393 * Private utility functions 394 */ 395 396 /* 397 * _hpcopy: allocate and copy hostent structure 398 */ 399 static struct hostent * 400 _hpcopy(struct hostent *hp, int *errp) 401 { 402 struct hostent *nhp; 403 char *cp, **pp; 404 int size, addrsize; 405 int nalias = 0, naddr = 0; 406 int al_off; 407 int i; 408 409 if (hp == NULL) 410 return hp; 411 412 /* count size to be allocated */ 413 size = sizeof(struct hostent); 414 if (hp->h_name != NULL) 415 size += strlen(hp->h_name) + 1; 416 if ((pp = hp->h_aliases) != NULL) { 417 for (i = 0; *pp != NULL; i++, pp++) { 418 if (**pp != '\0') { 419 size += strlen(*pp) + 1; 420 nalias++; 421 } 422 } 423 } 424 /* adjust alignment */ 425 size = ALIGN(size); 426 al_off = size; 427 size += sizeof(char *) * (nalias + 1); 428 addrsize = ALIGN(hp->h_length); 429 if ((pp = hp->h_addr_list) != NULL) { 430 while (*pp++ != NULL) 431 naddr++; 432 } 433 size += addrsize * naddr; 434 size += sizeof(char *) * (naddr + 1); 435 436 /* copy */ 437 if ((nhp = (struct hostent *)malloc(size)) == NULL) { 438 *errp = TRY_AGAIN; 439 return NULL; 440 } 441 cp = (char *)&nhp[1]; 442 if (hp->h_name != NULL) { 443 nhp->h_name = cp; 444 strcpy(cp, hp->h_name); 445 cp += strlen(cp) + 1; 446 } else 447 nhp->h_name = NULL; 448 nhp->h_aliases = (char **)((char *)nhp + al_off); 449 if ((pp = hp->h_aliases) != NULL) { 450 for (i = 0; *pp != NULL; pp++) { 451 if (**pp != '\0') { 452 nhp->h_aliases[i++] = cp; 453 strcpy(cp, *pp); 454 cp += strlen(cp) + 1; 455 } 456 } 457 } 458 nhp->h_aliases[nalias] = NULL; 459 cp = (char *)&nhp->h_aliases[nalias + 1]; 460 nhp->h_addrtype = hp->h_addrtype; 461 nhp->h_length = hp->h_length; 462 nhp->h_addr_list = (char **)cp; 463 if ((pp = hp->h_addr_list) != NULL) { 464 cp = (char *)&nhp->h_addr_list[naddr + 1]; 465 for (i = 0; *pp != NULL; pp++) { 466 nhp->h_addr_list[i++] = cp; 467 memcpy(cp, *pp, hp->h_length); 468 cp += addrsize; 469 } 470 } 471 nhp->h_addr_list[naddr] = NULL; 472 return nhp; 473 } 474 475 /* 476 * _hpaddr: construct hostent structure with one address 477 */ 478 static struct hostent * 479 _hpaddr(int af, const char *name, void *addr, int *errp) 480 { 481 struct hostent *hp, hpbuf; 482 char *addrs[2]; 483 484 hp = &hpbuf; 485 hp->h_name = (char *)name; 486 hp->h_aliases = NULL; 487 hp->h_addrtype = af; 488 hp->h_length = ADDRLEN(af); 489 hp->h_addr_list = addrs; 490 addrs[0] = (char *)addr; 491 addrs[1] = NULL; 492 return (_hpcopy(hp, errp)); 493 } 494 495 #ifdef INET6 496 /* 497 * _hpmerge: merge 2 hostent structure, arguments will be freed 498 */ 499 static struct hostent * 500 _hpmerge(struct hostent *hp1, struct hostent *hp2, int *errp) 501 { 502 int i, j; 503 int naddr, nalias; 504 char **pp; 505 struct hostent *hp, hpbuf; 506 char *aliases[MAXALIASES + 1], *addrs[MAXADDRS + 1]; 507 union inx_addr addrbuf[MAXADDRS]; 508 509 if (hp1 == NULL) 510 return _hpcopy(hp2, errp); 511 if (hp2 == NULL) 512 return _hpcopy(hp1, errp); 513 514 #define HP(i) (i == 1 ? hp1 : hp2) 515 hp = &hpbuf; 516 hp->h_name = (hp1->h_name != NULL ? hp1->h_name : hp2->h_name); 517 hp->h_aliases = aliases; 518 nalias = 0; 519 for (i = 1; i <= 2; i++) { 520 if ((pp = HP(i)->h_aliases) == NULL) 521 continue; 522 for (; nalias < MAXALIASES && *pp != NULL; pp++) { 523 /* check duplicates */ 524 for (j = 0; j < nalias; j++) 525 if (strcasecmp(*pp, aliases[j]) == 0) 526 break; 527 if (j == nalias) 528 aliases[nalias++] = *pp; 529 } 530 } 531 aliases[nalias] = NULL; 532 if (hp1->h_length != hp2->h_length) { 533 hp->h_addrtype = AF_INET6; 534 hp->h_length = sizeof(struct in6_addr); 535 } else { 536 hp->h_addrtype = hp1->h_addrtype; 537 hp->h_length = hp1->h_length; 538 } 539 540 hp->h_addr_list = addrs; 541 naddr = 0; 542 for (i = 1; i <= 2; i++) { 543 if ((pp = HP(i)->h_addr_list) == NULL) 544 continue; 545 if (HP(i)->h_length == hp->h_length) { 546 while (naddr < MAXADDRS && *pp != NULL) 547 addrs[naddr++] = *pp++; 548 } else { 549 /* copy IPv4 addr as mapped IPv6 addr */ 550 while (naddr < MAXADDRS && *pp != NULL) { 551 MAPADDR(&addrbuf[naddr], *pp++); 552 addrs[naddr] = (char *)&addrbuf[naddr]; 553 naddr++; 554 } 555 } 556 } 557 addrs[naddr] = NULL; 558 return (_hpcopy(hp, errp)); 559 } 560 #endif 561 562 /* 563 * _hpmapv6: convert IPv4 hostent into IPv4-mapped IPv6 addresses 564 */ 565 #ifdef INET6 566 static struct hostent * 567 _hpmapv6(struct hostent *hp, int *errp) 568 { 569 struct hostent hp6; 570 571 if (hp == NULL) 572 return NULL; 573 if (hp->h_addrtype == AF_INET6) 574 return _hpcopy(hp, errp); 575 576 memset(&hp6, 0, sizeof(struct hostent)); 577 hp6.h_addrtype = AF_INET6; 578 hp6.h_length = sizeof(struct in6_addr); 579 return _hpmerge(&hp6, hp, errp); 580 } 581 #endif 582 583 /* 584 * _hpsort: sort address by sortlist 585 */ 586 static struct hostent * 587 _hpsort(struct hostent *hp, res_state statp) 588 { 589 int i, j, n; 590 u_char *ap, *sp, *mp, **pp; 591 char t; 592 char order[MAXADDRS]; 593 int nsort = statp->nsort; 594 595 if (hp == NULL || hp->h_addr_list[1] == NULL || nsort == 0) 596 return hp; 597 for (i = 0; (ap = (u_char *)hp->h_addr_list[i]); i++) { 598 for (j = 0; j < nsort; j++) { 599 #ifdef INET6 600 if (statp->_u._ext.ext->sort_list[j].af != 601 hp->h_addrtype) 602 continue; 603 sp = (u_char *)&statp->_u._ext.ext->sort_list[j].addr; 604 mp = (u_char *)&statp->_u._ext.ext->sort_list[j].mask; 605 #else 606 sp = (u_char *)&statp->sort_list[j].addr; 607 mp = (u_char *)&statp->sort_list[j].mask; 608 #endif 609 for (n = 0; n < hp->h_length; n++) { 610 if ((ap[n] & mp[n]) != sp[n]) 611 break; 612 } 613 if (n == hp->h_length) 614 break; 615 } 616 order[i] = j; 617 } 618 n = i; 619 pp = (u_char **)hp->h_addr_list; 620 for (i = 0; i < n - 1; i++) { 621 for (j = i + 1; j < n; j++) { 622 if (order[i] > order[j]) { 623 ap = pp[i]; 624 pp[i] = pp[j]; 625 pp[j] = ap; 626 t = order[i]; 627 order[i] = order[j]; 628 order[j] = t; 629 } 630 } 631 } 632 return hp; 633 } 634 635 /* 636 * _hpreorder: sort address by default address selection 637 */ 638 static struct hostent * 639 _hpreorder(struct hostent *hp) 640 { 641 struct hp_order *aio; 642 int i, n; 643 char *ap; 644 struct sockaddr *sa; 645 struct policyhead policyhead; 646 647 if (hp == NULL) 648 return hp; 649 650 switch (hp->h_addrtype) { 651 case AF_INET: 652 #ifdef INET6 653 case AF_INET6: 654 #endif 655 break; 656 default: 657 free_addrselectpolicy(&policyhead); 658 return hp; 659 } 660 661 /* count the number of addrinfo elements for sorting. */ 662 for (n = 0; hp->h_addr_list[n] != NULL; n++) 663 ; 664 665 /* 666 * If the number is small enough, we can skip the reordering process. 667 */ 668 if (n <= 1) 669 return hp; 670 671 /* allocate a temporary array for sort and initialization of it. */ 672 if ((aio = malloc(sizeof(*aio) * n)) == NULL) 673 return hp; /* give up reordering */ 674 memset(aio, 0, sizeof(*aio) * n); 675 676 /* retrieve address selection policy from the kernel */ 677 TAILQ_INIT(&policyhead); 678 if (!get_addrselectpolicy(&policyhead)) { 679 /* no policy is installed into kernel, we don't sort. */ 680 free(aio); 681 return hp; 682 } 683 684 for (i = 0; i < n; i++) { 685 ap = hp->h_addr_list[i]; 686 aio[i].aio_h_addr = ap; 687 sa = &aio[i].aio_sa; 688 switch (hp->h_addrtype) { 689 case AF_INET: 690 sa->sa_family = AF_INET; 691 sa->sa_len = sizeof(struct sockaddr_in); 692 memcpy(&((struct sockaddr_in *)sa)->sin_addr, ap, 693 sizeof(struct in_addr)); 694 break; 695 #ifdef INET6 696 case AF_INET6: 697 if (IN6_IS_ADDR_V4MAPPED((struct in6_addr *)ap)) { 698 sa->sa_family = AF_INET; 699 sa->sa_len = sizeof(struct sockaddr_in); 700 memcpy(&((struct sockaddr_in *)sa)->sin_addr, 701 &ap[12], sizeof(struct in_addr)); 702 } else { 703 sa->sa_family = AF_INET6; 704 sa->sa_len = sizeof(struct sockaddr_in6); 705 memcpy(&((struct sockaddr_in6 *)sa)->sin6_addr, 706 ap, sizeof(struct in6_addr)); 707 } 708 break; 709 #endif 710 } 711 aio[i].aio_dstscope = gai_addr2scopetype(sa); 712 aio[i].aio_dstpolicy = match_addrselectpolicy(sa, &policyhead); 713 set_source(&aio[i], &policyhead); 714 } 715 716 /* perform sorting. */ 717 qsort(aio, n, sizeof(*aio), comp_dst); 718 719 /* reorder the h_addr_list. */ 720 for (i = 0; i < n; i++) 721 hp->h_addr_list[i] = aio[i].aio_h_addr; 722 723 /* cleanup and return */ 724 free(aio); 725 free_addrselectpolicy(&policyhead); 726 return hp; 727 } 728 729 static int 730 get_addrselectpolicy(struct policyhead *head) 731 { 732 #ifdef INET6 733 int mib[] = { CTL_NET, PF_INET6, IPPROTO_IPV6, IPV6CTL_ADDRCTLPOLICY }; 734 size_t l; 735 char *buf; 736 struct in6_addrpolicy *pol, *ep; 737 738 if (sysctl(mib, sizeof(mib) / sizeof(mib[0]), NULL, &l, NULL, 0) < 0) 739 return (0); 740 if ((buf = malloc(l)) == NULL) 741 return (0); 742 if (sysctl(mib, sizeof(mib) / sizeof(mib[0]), buf, &l, NULL, 0) < 0) { 743 free(buf); 744 return (0); 745 } 746 747 ep = (struct in6_addrpolicy *)(buf + l); 748 for (pol = (struct in6_addrpolicy *)buf; pol + 1 <= ep; pol++) { 749 struct policyqueue *new; 750 751 if ((new = malloc(sizeof(*new))) == NULL) { 752 free_addrselectpolicy(head); /* make the list empty */ 753 break; 754 } 755 new->pc_policy = *pol; 756 TAILQ_INSERT_TAIL(head, new, pc_entry); 757 } 758 759 free(buf); 760 return (1); 761 #else 762 return (0); 763 #endif 764 } 765 766 static void 767 free_addrselectpolicy(struct policyhead *head) 768 { 769 struct policyqueue *ent, *nent; 770 771 for (ent = TAILQ_FIRST(head); ent; ent = nent) { 772 nent = TAILQ_NEXT(ent, pc_entry); 773 TAILQ_REMOVE(head, ent, pc_entry); 774 free(ent); 775 } 776 } 777 778 static struct policyqueue * 779 match_addrselectpolicy(struct sockaddr *addr, struct policyhead *head) 780 { 781 #ifdef INET6 782 struct policyqueue *ent, *bestent = NULL; 783 struct in6_addrpolicy *pol; 784 int matchlen, bestmatchlen = -1; 785 u_char *mp, *ep, *k, *p, m; 786 struct sockaddr_in6 key; 787 788 switch(addr->sa_family) { 789 case AF_INET6: 790 key = *(struct sockaddr_in6 *)addr; 791 break; 792 case AF_INET: 793 /* convert the address into IPv4-mapped IPv6 address. */ 794 memset(&key, 0, sizeof(key)); 795 key.sin6_family = AF_INET6; 796 key.sin6_len = sizeof(key); 797 key.sin6_addr.s6_addr[10] = 0xff; 798 key.sin6_addr.s6_addr[11] = 0xff; 799 memcpy(&key.sin6_addr.s6_addr[12], 800 &((struct sockaddr_in *)addr)->sin_addr, 4); 801 break; 802 default: 803 return(NULL); 804 } 805 806 for (ent = TAILQ_FIRST(head); ent; ent = TAILQ_NEXT(ent, pc_entry)) { 807 pol = &ent->pc_policy; 808 matchlen = 0; 809 810 mp = (u_char *)&pol->addrmask.sin6_addr; 811 ep = mp + 16; /* XXX: scope field? */ 812 k = (u_char *)&key.sin6_addr; 813 p = (u_char *)&pol->addr.sin6_addr; 814 for (; mp < ep && *mp; mp++, k++, p++) { 815 m = *mp; 816 if ((*k & m) != *p) 817 goto next; /* not match */ 818 if (m == 0xff) /* short cut for a typical case */ 819 matchlen += 8; 820 else { 821 while (m >= 0x80) { 822 matchlen++; 823 m <<= 1; 824 } 825 } 826 } 827 828 /* matched. check if this is better than the current best. */ 829 if (matchlen > bestmatchlen) { 830 bestent = ent; 831 bestmatchlen = matchlen; 832 } 833 834 next: 835 continue; 836 } 837 838 return(bestent); 839 #else 840 return(NULL); 841 #endif 842 843 } 844 845 static void 846 set_source(struct hp_order *aio, struct policyhead *ph) 847 { 848 struct sockaddr_storage ss = aio->aio_un.aiou_ss; 849 socklen_t srclen; 850 int s; 851 852 /* set unspec ("no source is available"), just in case */ 853 aio->aio_srcsa.sa_family = AF_UNSPEC; 854 aio->aio_srcscope = -1; 855 856 switch(ss.ss_family) { 857 case AF_INET: 858 ((struct sockaddr_in *)&ss)->sin_port = htons(1); 859 break; 860 #ifdef INET6 861 case AF_INET6: 862 ((struct sockaddr_in6 *)&ss)->sin6_port = htons(1); 863 break; 864 #endif 865 default: /* ignore unsupported AFs explicitly */ 866 return; 867 } 868 869 /* open a socket to get the source address for the given dst */ 870 if ((s = _socket(ss.ss_family, SOCK_DGRAM, IPPROTO_UDP)) < 0) 871 return; /* give up */ 872 if (_connect(s, (struct sockaddr *)&ss, ss.ss_len) < 0) 873 goto cleanup; 874 srclen = ss.ss_len; 875 if (_getsockname(s, &aio->aio_srcsa, &srclen) < 0) { 876 aio->aio_srcsa.sa_family = AF_UNSPEC; 877 goto cleanup; 878 } 879 aio->aio_srcscope = gai_addr2scopetype(&aio->aio_srcsa); 880 aio->aio_srcpolicy = match_addrselectpolicy(&aio->aio_srcsa, ph); 881 aio->aio_matchlen = matchlen(&aio->aio_srcsa, (struct sockaddr *)&ss); 882 #ifdef INET6 883 if (ss.ss_family == AF_INET6) { 884 struct in6_ifreq ifr6; 885 u_int32_t flags6; 886 887 /* XXX: interface name should not be hardcoded */ 888 strncpy(ifr6.ifr_name, "lo0", sizeof(ifr6.ifr_name)); 889 memset(&ifr6, 0, sizeof(ifr6)); 890 memcpy(&ifr6.ifr_addr, &ss, ss.ss_len); 891 if (_ioctl(s, SIOCGIFAFLAG_IN6, &ifr6) == 0) { 892 flags6 = ifr6.ifr_ifru.ifru_flags6; 893 if ((flags6 & IN6_IFF_DEPRECATED)) 894 aio->aio_srcflag |= AIO_SRCFLAG_DEPRECATED; 895 } 896 } 897 #endif 898 899 cleanup: 900 _close(s); 901 return; 902 } 903 904 static int 905 matchlen(struct sockaddr *src, struct sockaddr *dst) 906 { 907 int match = 0; 908 u_char *s, *d; 909 u_char *lim, r; 910 int addrlen; 911 912 switch (src->sa_family) { 913 #ifdef INET6 914 case AF_INET6: 915 s = (u_char *)&((struct sockaddr_in6 *)src)->sin6_addr; 916 d = (u_char *)&((struct sockaddr_in6 *)dst)->sin6_addr; 917 addrlen = sizeof(struct in6_addr); 918 lim = s + addrlen; 919 break; 920 #endif 921 case AF_INET: 922 s = (u_char *)&((struct sockaddr_in *)src)->sin_addr; 923 d = (u_char *)&((struct sockaddr_in *)dst)->sin_addr; 924 addrlen = sizeof(struct in_addr); 925 lim = s + addrlen; 926 break; 927 default: 928 return(0); 929 } 930 931 while (s < lim) 932 if ((r = (*d++ ^ *s++)) != 0) { 933 while (r < addrlen * 8) { 934 match++; 935 r <<= 1; 936 } 937 break; 938 } else 939 match += 8; 940 return(match); 941 } 942 943 static int 944 comp_dst(const void *arg1, const void *arg2) 945 { 946 const struct hp_order *dst1 = arg1, *dst2 = arg2; 947 948 /* 949 * Rule 1: Avoid unusable destinations. 950 * XXX: we currently do not consider if an appropriate route exists. 951 */ 952 if (dst1->aio_srcsa.sa_family != AF_UNSPEC && 953 dst2->aio_srcsa.sa_family == AF_UNSPEC) { 954 return(-1); 955 } 956 if (dst1->aio_srcsa.sa_family == AF_UNSPEC && 957 dst2->aio_srcsa.sa_family != AF_UNSPEC) { 958 return(1); 959 } 960 961 /* Rule 2: Prefer matching scope. */ 962 if (dst1->aio_dstscope == dst1->aio_srcscope && 963 dst2->aio_dstscope != dst2->aio_srcscope) { 964 return(-1); 965 } 966 if (dst1->aio_dstscope != dst1->aio_srcscope && 967 dst2->aio_dstscope == dst2->aio_srcscope) { 968 return(1); 969 } 970 971 /* Rule 3: Avoid deprecated addresses. */ 972 if (dst1->aio_srcsa.sa_family != AF_UNSPEC && 973 dst2->aio_srcsa.sa_family != AF_UNSPEC) { 974 if (!(dst1->aio_srcflag & AIO_SRCFLAG_DEPRECATED) && 975 (dst2->aio_srcflag & AIO_SRCFLAG_DEPRECATED)) { 976 return(-1); 977 } 978 if ((dst1->aio_srcflag & AIO_SRCFLAG_DEPRECATED) && 979 !(dst2->aio_srcflag & AIO_SRCFLAG_DEPRECATED)) { 980 return(1); 981 } 982 } 983 984 /* Rule 4: Prefer home addresses. */ 985 /* XXX: not implemented yet */ 986 987 /* Rule 5: Prefer matching label. */ 988 #ifdef INET6 989 if (dst1->aio_srcpolicy && dst1->aio_dstpolicy && 990 dst1->aio_srcpolicy->pc_policy.label == 991 dst1->aio_dstpolicy->pc_policy.label && 992 (dst2->aio_srcpolicy == NULL || dst2->aio_dstpolicy == NULL || 993 dst2->aio_srcpolicy->pc_policy.label != 994 dst2->aio_dstpolicy->pc_policy.label)) { 995 return(-1); 996 } 997 if (dst2->aio_srcpolicy && dst2->aio_dstpolicy && 998 dst2->aio_srcpolicy->pc_policy.label == 999 dst2->aio_dstpolicy->pc_policy.label && 1000 (dst1->aio_srcpolicy == NULL || dst1->aio_dstpolicy == NULL || 1001 dst1->aio_srcpolicy->pc_policy.label != 1002 dst1->aio_dstpolicy->pc_policy.label)) { 1003 return(1); 1004 } 1005 #endif 1006 1007 /* Rule 6: Prefer higher precedence. */ 1008 #ifdef INET6 1009 if (dst1->aio_dstpolicy && 1010 (dst2->aio_dstpolicy == NULL || 1011 dst1->aio_dstpolicy->pc_policy.preced > 1012 dst2->aio_dstpolicy->pc_policy.preced)) { 1013 return(-1); 1014 } 1015 if (dst2->aio_dstpolicy && 1016 (dst1->aio_dstpolicy == NULL || 1017 dst2->aio_dstpolicy->pc_policy.preced > 1018 dst1->aio_dstpolicy->pc_policy.preced)) { 1019 return(1); 1020 } 1021 #endif 1022 1023 /* Rule 7: Prefer native transport. */ 1024 /* XXX: not implemented yet */ 1025 1026 /* Rule 8: Prefer smaller scope. */ 1027 if (dst1->aio_dstscope >= 0 && 1028 dst1->aio_dstscope < dst2->aio_dstscope) { 1029 return(-1); 1030 } 1031 if (dst2->aio_dstscope >= 0 && 1032 dst2->aio_dstscope < dst1->aio_dstscope) { 1033 return(1); 1034 } 1035 1036 /* 1037 * Rule 9: Use longest matching prefix. 1038 * We compare the match length in a same AF only. 1039 */ 1040 if (dst1->aio_sa.sa_family == dst2->aio_sa.sa_family) { 1041 if (dst1->aio_matchlen > dst2->aio_matchlen) { 1042 return(-1); 1043 } 1044 if (dst1->aio_matchlen < dst2->aio_matchlen) { 1045 return(1); 1046 } 1047 } 1048 1049 /* Rule 10: Otherwise, leave the order unchanged. */ 1050 return(-1); 1051 } 1052 1053 /* 1054 * Copy from scope.c. 1055 * XXX: we should standardize the functions and link them as standard 1056 * library. 1057 */ 1058 static int 1059 gai_addr2scopetype(struct sockaddr *sa) 1060 { 1061 #ifdef INET6 1062 struct sockaddr_in6 *sa6; 1063 #endif 1064 struct sockaddr_in *sa4; 1065 1066 switch(sa->sa_family) { 1067 #ifdef INET6 1068 case AF_INET6: 1069 sa6 = (struct sockaddr_in6 *)sa; 1070 if (IN6_IS_ADDR_MULTICAST(&sa6->sin6_addr)) { 1071 /* just use the scope field of the multicast address */ 1072 return(sa6->sin6_addr.s6_addr[2] & 0x0f); 1073 } 1074 /* 1075 * Unicast addresses: map scope type to corresponding scope 1076 * value defined for multcast addresses. 1077 * XXX: hardcoded scope type values are bad... 1078 */ 1079 if (IN6_IS_ADDR_LOOPBACK(&sa6->sin6_addr)) 1080 return(1); /* node local scope */ 1081 if (IN6_IS_ADDR_LINKLOCAL(&sa6->sin6_addr)) 1082 return(2); /* link-local scope */ 1083 if (IN6_IS_ADDR_SITELOCAL(&sa6->sin6_addr)) 1084 return(5); /* site-local scope */ 1085 return(14); /* global scope */ 1086 break; 1087 #endif 1088 case AF_INET: 1089 /* 1090 * IPv4 pseudo scoping according to RFC 3484. 1091 */ 1092 sa4 = (struct sockaddr_in *)sa; 1093 /* IPv4 autoconfiguration addresses have link-local scope. */ 1094 if (((u_char *)&sa4->sin_addr)[0] == 169 && 1095 ((u_char *)&sa4->sin_addr)[1] == 254) 1096 return(2); 1097 /* Private addresses have site-local scope. */ 1098 if (((u_char *)&sa4->sin_addr)[0] == 10 || 1099 (((u_char *)&sa4->sin_addr)[0] == 172 && 1100 (((u_char *)&sa4->sin_addr)[1] & 0xf0) == 16) || 1101 (((u_char *)&sa4->sin_addr)[0] == 192 && 1102 ((u_char *)&sa4->sin_addr)[1] == 168)) 1103 return(14); /* XXX: It should be 5 unless NAT */ 1104 /* Loopback addresses have link-local scope. */ 1105 if (((u_char *)&sa4->sin_addr)[0] == 127) 1106 return(2); 1107 return(14); 1108 break; 1109 default: 1110 errno = EAFNOSUPPORT; /* is this a good error? */ 1111 return(-1); 1112 } 1113 } 1114