1 /* 2 * CDDL HEADER START 3 * 4 * The contents of this file are subject to the terms of the 5 * Common Development and Distribution License (the "License"). 6 * You may not use this file except in compliance with the License. 7 * 8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 9 * or http://www.opensolaris.org/os/licensing. 10 * See the License for the specific language governing permissions 11 * and limitations under the License. 12 * 13 * When distributing Covered Code, include this CDDL HEADER in each 14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 15 * If applicable, add the following below this CDDL HEADER, with the 16 * fields enclosed by brackets "[]" replaced with your own identifying 17 * information: Portions Copyright [yyyy] [name of copyright owner] 18 * 19 * CDDL HEADER END 20 */ 21 /* 22 * Copyright 2009 Sun Microsystems, Inc. All rights reserved. 23 * Use is subject to license terms. 24 */ 25 26 #include <sys/types.h> 27 #include <sys/stream.h> 28 #include <sys/stropts.h> 29 #include <sys/errno.h> 30 #include <sys/strlog.h> 31 #include <sys/tihdr.h> 32 #include <sys/socket.h> 33 #include <sys/ddi.h> 34 #include <sys/sunddi.h> 35 #include <sys/mkdev.h> 36 #include <sys/kmem.h> 37 #include <sys/zone.h> 38 #include <sys/sysmacros.h> 39 #include <sys/cmn_err.h> 40 #include <sys/vtrace.h> 41 #include <sys/debug.h> 42 #include <sys/atomic.h> 43 #include <sys/strsun.h> 44 #include <sys/random.h> 45 #include <netinet/in.h> 46 #include <net/if.h> 47 #include <netinet/ip6.h> 48 #include <netinet/icmp6.h> 49 #include <net/pfkeyv2.h> 50 #include <net/pfpolicy.h> 51 52 #include <inet/common.h> 53 #include <inet/mi.h> 54 #include <inet/ip.h> 55 #include <inet/ip6.h> 56 #include <inet/nd.h> 57 #include <inet/ipsec_info.h> 58 #include <inet/ipsec_impl.h> 59 #include <inet/sadb.h> 60 #include <inet/ipsecah.h> 61 #include <inet/ipsec_impl.h> 62 #include <inet/ipdrop.h> 63 #include <sys/taskq.h> 64 #include <sys/policy.h> 65 #include <sys/iphada.h> 66 #include <sys/strsun.h> 67 68 #include <sys/crypto/common.h> 69 #include <sys/crypto/api.h> 70 #include <sys/kstat.h> 71 #include <sys/strsubr.h> 72 73 /* 74 * Table of ND variables supported by ipsecah. These are loaded into 75 * ipsecah_g_nd in ipsecah_init_nd. 76 * All of these are alterable, within the min/max values given, at run time. 77 */ 78 static ipsecahparam_t lcl_param_arr[] = { 79 /* min max value name */ 80 { 0, 3, 0, "ipsecah_debug"}, 81 { 125, 32000, SADB_AGE_INTERVAL_DEFAULT, "ipsecah_age_interval"}, 82 { 1, 10, 1, "ipsecah_reap_delay"}, 83 { 1, SADB_MAX_REPLAY, 64, "ipsecah_replay_size"}, 84 { 1, 300, 15, "ipsecah_acquire_timeout"}, 85 { 1, 1800, 90, "ipsecah_larval_timeout"}, 86 /* Default lifetime values for ACQUIRE messages. */ 87 { 0, 0xffffffffU, 0, "ipsecah_default_soft_bytes"}, 88 { 0, 0xffffffffU, 0, "ipsecah_default_hard_bytes"}, 89 { 0, 0xffffffffU, 24000, "ipsecah_default_soft_addtime"}, 90 { 0, 0xffffffffU, 28800, "ipsecah_default_hard_addtime"}, 91 { 0, 0xffffffffU, 0, "ipsecah_default_soft_usetime"}, 92 { 0, 0xffffffffU, 0, "ipsecah_default_hard_usetime"}, 93 { 0, 1, 0, "ipsecah_log_unknown_spi"}, 94 }; 95 #define ipsecah_debug ipsecah_params[0].ipsecah_param_value 96 #define ipsecah_age_interval ipsecah_params[1].ipsecah_param_value 97 #define ipsecah_age_int_max ipsecah_params[1].ipsecah_param_max 98 #define ipsecah_reap_delay ipsecah_params[2].ipsecah_param_value 99 #define ipsecah_replay_size ipsecah_params[3].ipsecah_param_value 100 #define ipsecah_acquire_timeout ipsecah_params[4].ipsecah_param_value 101 #define ipsecah_larval_timeout ipsecah_params[5].ipsecah_param_value 102 #define ipsecah_default_soft_bytes ipsecah_params[6].ipsecah_param_value 103 #define ipsecah_default_hard_bytes ipsecah_params[7].ipsecah_param_value 104 #define ipsecah_default_soft_addtime ipsecah_params[8].ipsecah_param_value 105 #define ipsecah_default_hard_addtime ipsecah_params[9].ipsecah_param_value 106 #define ipsecah_default_soft_usetime ipsecah_params[10].ipsecah_param_value 107 #define ipsecah_default_hard_usetime ipsecah_params[11].ipsecah_param_value 108 #define ipsecah_log_unknown_spi ipsecah_params[12].ipsecah_param_value 109 110 #define ah0dbg(a) printf a 111 /* NOTE: != 0 instead of > 0 so lint doesn't complain. */ 112 #define ah1dbg(ahstack, a) if (ahstack->ipsecah_debug != 0) printf a 113 #define ah2dbg(ahstack, a) if (ahstack->ipsecah_debug > 1) printf a 114 #define ah3dbg(ahstack, a) if (ahstack->ipsecah_debug > 2) printf a 115 116 /* 117 * XXX This is broken. Padding should be determined dynamically 118 * depending on the ICV size and IP version number so that the 119 * total AH header size is a multiple of 32 bits or 64 bits 120 * for V4 and V6 respectively. For 96bit ICVs we have no problems. 121 * Anything different from that, we need to fix our code. 122 */ 123 #define IPV4_PADDING_ALIGN 0x04 /* Multiple of 32 bits */ 124 #define IPV6_PADDING_ALIGN 0x04 /* Multiple of 32 bits */ 125 126 /* 127 * Helper macro. Avoids a call to msgdsize if there is only one 128 * mblk in the chain. 129 */ 130 #define AH_MSGSIZE(mp) ((mp)->b_cont != NULL ? msgdsize(mp) : MBLKL(mp)) 131 132 133 static ipsec_status_t ah_auth_out_done(mblk_t *); 134 static ipsec_status_t ah_auth_in_done(mblk_t *); 135 static mblk_t *ah_process_ip_options_v4(mblk_t *, ipsa_t *, int *, uint_t, 136 boolean_t, ipsecah_stack_t *); 137 static mblk_t *ah_process_ip_options_v6(mblk_t *, ipsa_t *, int *, uint_t, 138 boolean_t, ipsecah_stack_t *); 139 static void ah_getspi(mblk_t *, keysock_in_t *, ipsecah_stack_t *); 140 static ipsec_status_t ah_inbound_accelerated(mblk_t *, boolean_t, ipsa_t *, 141 uint32_t); 142 static ipsec_status_t ah_outbound_accelerated_v4(mblk_t *, ipsa_t *); 143 static ipsec_status_t ah_outbound_accelerated_v6(mblk_t *, ipsa_t *); 144 static ipsec_status_t ah_outbound(mblk_t *); 145 146 static int ipsecah_open(queue_t *, dev_t *, int, int, cred_t *); 147 static int ipsecah_close(queue_t *); 148 static void ipsecah_rput(queue_t *, mblk_t *); 149 static void ipsecah_wput(queue_t *, mblk_t *); 150 static void ah_send_acquire(ipsacq_t *, mblk_t *, netstack_t *); 151 static boolean_t ah_register_out(uint32_t, uint32_t, uint_t, ipsecah_stack_t *); 152 static void *ipsecah_stack_init(netstackid_t stackid, netstack_t *ns); 153 static void ipsecah_stack_fini(netstackid_t stackid, void *arg); 154 155 extern void (*cl_inet_getspi)(netstackid_t, uint8_t, uint8_t *, size_t, 156 void *); 157 158 /* Setable in /etc/system */ 159 uint32_t ah_hash_size = IPSEC_DEFAULT_HASH_SIZE; 160 161 static taskq_t *ah_taskq; 162 163 static struct module_info info = { 164 5136, "ipsecah", 0, INFPSZ, 65536, 1024 165 }; 166 167 static struct qinit rinit = { 168 (pfi_t)ipsecah_rput, NULL, ipsecah_open, ipsecah_close, NULL, &info, 169 NULL 170 }; 171 172 static struct qinit winit = { 173 (pfi_t)ipsecah_wput, NULL, ipsecah_open, ipsecah_close, NULL, &info, 174 NULL 175 }; 176 177 struct streamtab ipsecahinfo = { 178 &rinit, &winit, NULL, NULL 179 }; 180 181 static int ah_kstat_update(kstat_t *, int); 182 183 uint64_t ipsacq_maxpackets = IPSACQ_MAXPACKETS; 184 185 static boolean_t 186 ah_kstat_init(ipsecah_stack_t *ahstack, netstackid_t stackid) 187 { 188 ipsec_stack_t *ipss = ahstack->ipsecah_netstack->netstack_ipsec; 189 190 ahstack->ah_ksp = kstat_create_netstack("ipsecah", 0, "ah_stat", "net", 191 KSTAT_TYPE_NAMED, sizeof (ah_kstats_t) / sizeof (kstat_named_t), 192 KSTAT_FLAG_PERSISTENT, stackid); 193 194 if (ahstack->ah_ksp == NULL || ahstack->ah_ksp->ks_data == NULL) 195 return (B_FALSE); 196 197 ahstack->ah_kstats = ahstack->ah_ksp->ks_data; 198 199 ahstack->ah_ksp->ks_update = ah_kstat_update; 200 ahstack->ah_ksp->ks_private = (void *)(uintptr_t)stackid; 201 202 #define K64 KSTAT_DATA_UINT64 203 #define KI(x) kstat_named_init(&(ahstack->ah_kstats->ah_stat_##x), #x, K64) 204 205 KI(num_aalgs); 206 KI(good_auth); 207 KI(bad_auth); 208 KI(replay_failures); 209 KI(replay_early_failures); 210 KI(keysock_in); 211 KI(out_requests); 212 KI(acquire_requests); 213 KI(bytes_expired); 214 KI(out_discards); 215 KI(in_accelerated); 216 KI(out_accelerated); 217 KI(noaccel); 218 KI(crypto_sync); 219 KI(crypto_async); 220 KI(crypto_failures); 221 222 #undef KI 223 #undef K64 224 225 kstat_install(ahstack->ah_ksp); 226 IP_ACQUIRE_STAT(ipss, maxpackets, ipsacq_maxpackets); 227 return (B_TRUE); 228 } 229 230 static int 231 ah_kstat_update(kstat_t *kp, int rw) 232 { 233 ah_kstats_t *ekp; 234 netstackid_t stackid = (netstackid_t)(uintptr_t)kp->ks_private; 235 netstack_t *ns; 236 ipsec_stack_t *ipss; 237 238 if ((kp == NULL) || (kp->ks_data == NULL)) 239 return (EIO); 240 241 if (rw == KSTAT_WRITE) 242 return (EACCES); 243 244 ns = netstack_find_by_stackid(stackid); 245 if (ns == NULL) 246 return (-1); 247 ipss = ns->netstack_ipsec; 248 if (ipss == NULL) { 249 netstack_rele(ns); 250 return (-1); 251 } 252 ekp = (ah_kstats_t *)kp->ks_data; 253 254 mutex_enter(&ipss->ipsec_alg_lock); 255 ekp->ah_stat_num_aalgs.value.ui64 = ipss->ipsec_nalgs[IPSEC_ALG_AUTH]; 256 mutex_exit(&ipss->ipsec_alg_lock); 257 258 netstack_rele(ns); 259 return (0); 260 } 261 262 /* 263 * Don't have to lock ipsec_age_interval, as only one thread will access it at 264 * a time, because I control the one function that does a qtimeout() on 265 * ah_pfkey_q. 266 */ 267 static void 268 ah_ager(void *arg) 269 { 270 ipsecah_stack_t *ahstack = (ipsecah_stack_t *)arg; 271 netstack_t *ns = ahstack->ipsecah_netstack; 272 hrtime_t begin = gethrtime(); 273 274 sadb_ager(&ahstack->ah_sadb.s_v4, ahstack->ah_pfkey_q, 275 ahstack->ah_sadb.s_ip_q, ahstack->ipsecah_reap_delay, ns); 276 sadb_ager(&ahstack->ah_sadb.s_v6, ahstack->ah_pfkey_q, 277 ahstack->ah_sadb.s_ip_q, ahstack->ipsecah_reap_delay, ns); 278 279 ahstack->ah_event = sadb_retimeout(begin, ahstack->ah_pfkey_q, 280 ah_ager, ahstack, 281 &ahstack->ipsecah_age_interval, ahstack->ipsecah_age_int_max, 282 info.mi_idnum); 283 } 284 285 /* 286 * Get an AH NDD parameter. 287 */ 288 /* ARGSUSED */ 289 static int 290 ipsecah_param_get(q, mp, cp, cr) 291 queue_t *q; 292 mblk_t *mp; 293 caddr_t cp; 294 cred_t *cr; 295 { 296 ipsecahparam_t *ipsecahpa = (ipsecahparam_t *)cp; 297 uint_t value; 298 ipsecah_stack_t *ahstack = (ipsecah_stack_t *)q->q_ptr; 299 300 mutex_enter(&ahstack->ipsecah_param_lock); 301 value = ipsecahpa->ipsecah_param_value; 302 mutex_exit(&ahstack->ipsecah_param_lock); 303 304 (void) mi_mpprintf(mp, "%u", value); 305 return (0); 306 } 307 308 /* 309 * This routine sets an NDD variable in a ipsecahparam_t structure. 310 */ 311 /* ARGSUSED */ 312 static int 313 ipsecah_param_set(q, mp, value, cp, cr) 314 queue_t *q; 315 mblk_t *mp; 316 char *value; 317 caddr_t cp; 318 cred_t *cr; 319 { 320 ulong_t new_value; 321 ipsecahparam_t *ipsecahpa = (ipsecahparam_t *)cp; 322 ipsecah_stack_t *ahstack = (ipsecah_stack_t *)q->q_ptr; 323 324 /* 325 * Fail the request if the new value does not lie within the 326 * required bounds. 327 */ 328 if (ddi_strtoul(value, NULL, 10, &new_value) != 0 || 329 new_value < ipsecahpa->ipsecah_param_min || 330 new_value > ipsecahpa->ipsecah_param_max) { 331 return (EINVAL); 332 } 333 334 /* Set the new value */ 335 mutex_enter(&ahstack->ipsecah_param_lock); 336 ipsecahpa->ipsecah_param_value = new_value; 337 mutex_exit(&ahstack->ipsecah_param_lock); 338 return (0); 339 } 340 341 /* 342 * Using lifetime NDD variables, fill in an extended combination's 343 * lifetime information. 344 */ 345 void 346 ipsecah_fill_defs(sadb_x_ecomb_t *ecomb, netstack_t *ns) 347 { 348 ipsecah_stack_t *ahstack = ns->netstack_ipsecah; 349 350 ecomb->sadb_x_ecomb_soft_bytes = ahstack->ipsecah_default_soft_bytes; 351 ecomb->sadb_x_ecomb_hard_bytes = ahstack->ipsecah_default_hard_bytes; 352 ecomb->sadb_x_ecomb_soft_addtime = 353 ahstack->ipsecah_default_soft_addtime; 354 ecomb->sadb_x_ecomb_hard_addtime = 355 ahstack->ipsecah_default_hard_addtime; 356 ecomb->sadb_x_ecomb_soft_usetime = 357 ahstack->ipsecah_default_soft_usetime; 358 ecomb->sadb_x_ecomb_hard_usetime = 359 ahstack->ipsecah_default_hard_usetime; 360 } 361 362 /* 363 * Initialize things for AH at module load time. 364 */ 365 boolean_t 366 ipsecah_ddi_init(void) 367 { 368 ah_taskq = taskq_create("ah_taskq", 1, minclsyspri, 369 IPSEC_TASKQ_MIN, IPSEC_TASKQ_MAX, 0); 370 371 /* 372 * We want to be informed each time a stack is created or 373 * destroyed in the kernel, so we can maintain the 374 * set of ipsecah_stack_t's. 375 */ 376 netstack_register(NS_IPSECAH, ipsecah_stack_init, NULL, 377 ipsecah_stack_fini); 378 379 return (B_TRUE); 380 } 381 382 /* 383 * Walk through the param array specified registering each element with the 384 * named dispatch handler. 385 */ 386 static boolean_t 387 ipsecah_param_register(IDP *ndp, ipsecahparam_t *ahp, int cnt) 388 { 389 for (; cnt-- > 0; ahp++) { 390 if (ahp->ipsecah_param_name != NULL && 391 ahp->ipsecah_param_name[0]) { 392 if (!nd_load(ndp, 393 ahp->ipsecah_param_name, 394 ipsecah_param_get, ipsecah_param_set, 395 (caddr_t)ahp)) { 396 nd_free(ndp); 397 return (B_FALSE); 398 } 399 } 400 } 401 return (B_TRUE); 402 } 403 404 /* 405 * Initialize things for AH for each stack instance 406 */ 407 static void * 408 ipsecah_stack_init(netstackid_t stackid, netstack_t *ns) 409 { 410 ipsecah_stack_t *ahstack; 411 ipsecahparam_t *ahp; 412 413 ahstack = (ipsecah_stack_t *)kmem_zalloc(sizeof (*ahstack), KM_SLEEP); 414 ahstack->ipsecah_netstack = ns; 415 416 ahp = (ipsecahparam_t *)kmem_alloc(sizeof (lcl_param_arr), KM_SLEEP); 417 ahstack->ipsecah_params = ahp; 418 bcopy(lcl_param_arr, ahp, sizeof (lcl_param_arr)); 419 420 (void) ipsecah_param_register(&ahstack->ipsecah_g_nd, ahp, 421 A_CNT(lcl_param_arr)); 422 423 (void) ah_kstat_init(ahstack, stackid); 424 425 ahstack->ah_sadb.s_acquire_timeout = &ahstack->ipsecah_acquire_timeout; 426 ahstack->ah_sadb.s_acqfn = ah_send_acquire; 427 sadbp_init("AH", &ahstack->ah_sadb, SADB_SATYPE_AH, ah_hash_size, 428 ahstack->ipsecah_netstack); 429 430 mutex_init(&ahstack->ipsecah_param_lock, NULL, MUTEX_DEFAULT, 0); 431 432 ip_drop_register(&ahstack->ah_dropper, "IPsec AH"); 433 return (ahstack); 434 } 435 436 /* 437 * Destroy things for AH at module unload time. 438 */ 439 void 440 ipsecah_ddi_destroy(void) 441 { 442 netstack_unregister(NS_IPSECAH); 443 taskq_destroy(ah_taskq); 444 } 445 446 /* 447 * Destroy things for AH for one stack... Never called? 448 */ 449 static void 450 ipsecah_stack_fini(netstackid_t stackid, void *arg) 451 { 452 ipsecah_stack_t *ahstack = (ipsecah_stack_t *)arg; 453 454 if (ahstack->ah_pfkey_q != NULL) { 455 (void) quntimeout(ahstack->ah_pfkey_q, ahstack->ah_event); 456 } 457 ahstack->ah_sadb.s_acqfn = NULL; 458 ahstack->ah_sadb.s_acquire_timeout = NULL; 459 sadbp_destroy(&ahstack->ah_sadb, ahstack->ipsecah_netstack); 460 ip_drop_unregister(&ahstack->ah_dropper); 461 mutex_destroy(&ahstack->ipsecah_param_lock); 462 nd_free(&ahstack->ipsecah_g_nd); 463 464 kmem_free(ahstack->ipsecah_params, sizeof (lcl_param_arr)); 465 ahstack->ipsecah_params = NULL; 466 kstat_delete_netstack(ahstack->ah_ksp, stackid); 467 ahstack->ah_ksp = NULL; 468 ahstack->ah_kstats = NULL; 469 470 kmem_free(ahstack, sizeof (*ahstack)); 471 } 472 473 /* 474 * AH module open routine. The module should be opened by keysock. 475 */ 476 /* ARGSUSED */ 477 static int 478 ipsecah_open(queue_t *q, dev_t *devp, int flag, int sflag, cred_t *credp) 479 { 480 netstack_t *ns; 481 ipsecah_stack_t *ahstack; 482 483 if (secpolicy_ip_config(credp, B_FALSE) != 0) 484 return (EPERM); 485 486 if (q->q_ptr != NULL) 487 return (0); /* Re-open of an already open instance. */ 488 489 if (sflag != MODOPEN) 490 return (EINVAL); 491 492 ns = netstack_find_by_cred(credp); 493 ASSERT(ns != NULL); 494 ahstack = ns->netstack_ipsecah; 495 ASSERT(ahstack != NULL); 496 497 /* 498 * ASSUMPTIONS (because I'm MT_OCEXCL): 499 * 500 * * I'm being pushed on top of IP for all my opens (incl. #1). 501 * * Only ipsecah_open() can write into ah_sadb.s_ip_q. 502 * * Because of this, I can check lazily for ah_sadb.s_ip_q. 503 * 504 * If these assumptions are wrong, I'm in BIG trouble... 505 */ 506 507 q->q_ptr = ahstack; 508 WR(q)->q_ptr = q->q_ptr; 509 510 if (ahstack->ah_sadb.s_ip_q == NULL) { 511 struct T_unbind_req *tur; 512 513 ahstack->ah_sadb.s_ip_q = WR(q); 514 /* Allocate an unbind... */ 515 ahstack->ah_ip_unbind = allocb(sizeof (struct T_unbind_req), 516 BPRI_HI); 517 518 /* 519 * Send down T_BIND_REQ to bind IPPROTO_AH. 520 * Handle the ACK here in AH. 521 */ 522 qprocson(q); 523 if (ahstack->ah_ip_unbind == NULL || 524 !sadb_t_bind_req(ahstack->ah_sadb.s_ip_q, IPPROTO_AH)) { 525 if (ahstack->ah_ip_unbind != NULL) { 526 freeb(ahstack->ah_ip_unbind); 527 ahstack->ah_ip_unbind = NULL; 528 } 529 q->q_ptr = NULL; 530 qprocsoff(q); 531 netstack_rele(ahstack->ipsecah_netstack); 532 return (ENOMEM); 533 } 534 535 ahstack->ah_ip_unbind->b_datap->db_type = M_PROTO; 536 tur = (struct T_unbind_req *)ahstack->ah_ip_unbind->b_rptr; 537 tur->PRIM_type = T_UNBIND_REQ; 538 } else { 539 qprocson(q); 540 } 541 542 /* 543 * For now, there's not much I can do. I'll be getting a message 544 * passed down to me from keysock (in my wput), and a T_BIND_ACK 545 * up from IP (in my rput). 546 */ 547 548 return (0); 549 } 550 551 /* 552 * AH module close routine. 553 */ 554 static int 555 ipsecah_close(queue_t *q) 556 { 557 ipsecah_stack_t *ahstack = (ipsecah_stack_t *)q->q_ptr; 558 559 /* 560 * If ah_sadb.s_ip_q is attached to this instance, send a 561 * T_UNBIND_REQ to IP for the instance before doing 562 * a qprocsoff(). 563 */ 564 if (WR(q) == ahstack->ah_sadb.s_ip_q && 565 ahstack->ah_ip_unbind != NULL) { 566 putnext(WR(q), ahstack->ah_ip_unbind); 567 ahstack->ah_ip_unbind = NULL; 568 } 569 570 /* 571 * Clean up q_ptr, if needed. 572 */ 573 qprocsoff(q); 574 575 /* Keysock queue check is safe, because of OCEXCL perimeter. */ 576 577 if (q == ahstack->ah_pfkey_q) { 578 ah1dbg(ahstack, 579 ("ipsecah_close: Ummm... keysock is closing AH.\n")); 580 ahstack->ah_pfkey_q = NULL; 581 /* Detach qtimeouts. */ 582 (void) quntimeout(q, ahstack->ah_event); 583 } 584 585 if (WR(q) == ahstack->ah_sadb.s_ip_q) { 586 /* 587 * If the ah_sadb.s_ip_q is attached to this instance, find 588 * another. The OCEXCL outer perimeter helps us here. 589 */ 590 591 ahstack->ah_sadb.s_ip_q = NULL; 592 593 /* 594 * Find a replacement queue for ah_sadb.s_ip_q. 595 */ 596 if (ahstack->ah_pfkey_q != NULL && 597 ahstack->ah_pfkey_q != RD(q)) { 598 /* 599 * See if we can use the pfkey_q. 600 */ 601 ahstack->ah_sadb.s_ip_q = WR(ahstack->ah_pfkey_q); 602 } 603 604 if (ahstack->ah_sadb.s_ip_q == NULL || 605 !sadb_t_bind_req(ahstack->ah_sadb.s_ip_q, IPPROTO_AH)) { 606 ah1dbg(ahstack, 607 ("ipsecah: Can't reassign ah_sadb.s_ip_q.\n")); 608 ahstack->ah_sadb.s_ip_q = NULL; 609 } else { 610 ahstack->ah_ip_unbind = 611 allocb(sizeof (struct T_unbind_req), BPRI_HI); 612 613 if (ahstack->ah_ip_unbind != NULL) { 614 struct T_unbind_req *tur; 615 616 ahstack->ah_ip_unbind->b_datap->db_type = 617 M_PROTO; 618 tur = (struct T_unbind_req *) 619 ahstack->ah_ip_unbind->b_rptr; 620 tur->PRIM_type = T_UNBIND_REQ; 621 } 622 /* If it's NULL, I can't do much here. */ 623 } 624 } 625 626 netstack_rele(ahstack->ipsecah_netstack); 627 return (0); 628 } 629 630 /* 631 * AH module read put routine. 632 */ 633 /* ARGSUSED */ 634 static void 635 ipsecah_rput(queue_t *q, mblk_t *mp) 636 { 637 ipsecah_stack_t *ahstack = (ipsecah_stack_t *)q->q_ptr; 638 639 ASSERT(mp->b_datap->db_type != M_CTL); /* No more IRE_DB_REQ. */ 640 641 switch (mp->b_datap->db_type) { 642 case M_PROTO: 643 case M_PCPROTO: 644 /* TPI message of some sort. */ 645 switch (*((t_scalar_t *)mp->b_rptr)) { 646 case T_BIND_ACK: 647 /* We expect this. */ 648 ah3dbg(ahstack, 649 ("Thank you IP from AH for T_BIND_ACK\n")); 650 break; 651 case T_ERROR_ACK: 652 cmn_err(CE_WARN, 653 "ipsecah: AH received T_ERROR_ACK from IP."); 654 break; 655 case T_OK_ACK: 656 /* Probably from a (rarely sent) T_UNBIND_REQ. */ 657 break; 658 default: 659 ah1dbg(ahstack, ("Unknown M_{,PC}PROTO message.\n")); 660 } 661 freemsg(mp); 662 break; 663 default: 664 /* For now, passthru message. */ 665 ah2dbg(ahstack, ("AH got unknown mblk type %d.\n", 666 mp->b_datap->db_type)); 667 putnext(q, mp); 668 } 669 } 670 671 /* 672 * Construct an SADB_REGISTER message with the current algorithms. 673 */ 674 static boolean_t 675 ah_register_out(uint32_t sequence, uint32_t pid, uint_t serial, 676 ipsecah_stack_t *ahstack) 677 { 678 mblk_t *mp; 679 boolean_t rc = B_TRUE; 680 sadb_msg_t *samsg; 681 sadb_supported_t *sasupp; 682 sadb_alg_t *saalg; 683 uint_t allocsize = sizeof (*samsg); 684 uint_t i, numalgs_snap; 685 ipsec_alginfo_t **authalgs; 686 uint_t num_aalgs; 687 ipsec_stack_t *ipss = ahstack->ipsecah_netstack->netstack_ipsec; 688 689 /* Allocate the KEYSOCK_OUT. */ 690 mp = sadb_keysock_out(serial); 691 if (mp == NULL) { 692 ah0dbg(("ah_register_out: couldn't allocate mblk.\n")); 693 return (B_FALSE); 694 } 695 696 /* 697 * Allocate the PF_KEY message that follows KEYSOCK_OUT. 698 * The alg reader lock needs to be held while allocating 699 * the variable part (i.e. the algorithms) of the message. 700 */ 701 702 mutex_enter(&ipss->ipsec_alg_lock); 703 704 /* 705 * Return only valid algorithms, so the number of algorithms 706 * to send up may be less than the number of algorithm entries 707 * in the table. 708 */ 709 authalgs = ipss->ipsec_alglists[IPSEC_ALG_AUTH]; 710 for (num_aalgs = 0, i = 0; i < IPSEC_MAX_ALGS; i++) 711 if (authalgs[i] != NULL && ALG_VALID(authalgs[i])) 712 num_aalgs++; 713 714 /* 715 * Fill SADB_REGISTER message's algorithm descriptors. Hold 716 * down the lock while filling it. 717 */ 718 if (num_aalgs != 0) { 719 allocsize += (num_aalgs * sizeof (*saalg)); 720 allocsize += sizeof (*sasupp); 721 } 722 mp->b_cont = allocb(allocsize, BPRI_HI); 723 if (mp->b_cont == NULL) { 724 mutex_exit(&ipss->ipsec_alg_lock); 725 freemsg(mp); 726 return (B_FALSE); 727 } 728 729 mp->b_cont->b_wptr += allocsize; 730 if (num_aalgs != 0) { 731 732 saalg = (sadb_alg_t *)(mp->b_cont->b_rptr + sizeof (*samsg) + 733 sizeof (*sasupp)); 734 ASSERT(((ulong_t)saalg & 0x7) == 0); 735 736 numalgs_snap = 0; 737 for (i = 0; 738 ((i < IPSEC_MAX_ALGS) && (numalgs_snap < num_aalgs)); 739 i++) { 740 if (authalgs[i] == NULL || !ALG_VALID(authalgs[i])) 741 continue; 742 743 saalg->sadb_alg_id = authalgs[i]->alg_id; 744 saalg->sadb_alg_ivlen = 0; 745 saalg->sadb_alg_minbits = authalgs[i]->alg_ef_minbits; 746 saalg->sadb_alg_maxbits = authalgs[i]->alg_ef_maxbits; 747 saalg->sadb_x_alg_increment = 748 authalgs[i]->alg_increment; 749 /* For now, salt is meaningless in AH. */ 750 ASSERT(authalgs[i]->alg_saltlen == 0); 751 saalg->sadb_x_alg_saltbits = 752 SADB_8TO1(authalgs[i]->alg_saltlen); 753 numalgs_snap++; 754 saalg++; 755 } 756 ASSERT(numalgs_snap == num_aalgs); 757 #ifdef DEBUG 758 /* 759 * Reality check to make sure I snagged all of the 760 * algorithms. 761 */ 762 for (; i < IPSEC_MAX_ALGS; i++) 763 if (authalgs[i] != NULL && ALG_VALID(authalgs[i])) 764 cmn_err(CE_PANIC, 765 "ah_register_out()! Missed #%d.\n", i); 766 #endif /* DEBUG */ 767 } 768 769 mutex_exit(&ipss->ipsec_alg_lock); 770 771 /* Now fill the restof the SADB_REGISTER message. */ 772 773 samsg = (sadb_msg_t *)mp->b_cont->b_rptr; 774 samsg->sadb_msg_version = PF_KEY_V2; 775 samsg->sadb_msg_type = SADB_REGISTER; 776 samsg->sadb_msg_errno = 0; 777 samsg->sadb_msg_satype = SADB_SATYPE_AH; 778 samsg->sadb_msg_len = SADB_8TO64(allocsize); 779 samsg->sadb_msg_reserved = 0; 780 /* 781 * Assume caller has sufficient sequence/pid number info. If it's one 782 * from me over a new alg., I could give two hoots about sequence. 783 */ 784 samsg->sadb_msg_seq = sequence; 785 samsg->sadb_msg_pid = pid; 786 787 if (allocsize > sizeof (*samsg)) { 788 sasupp = (sadb_supported_t *)(samsg + 1); 789 sasupp->sadb_supported_len = 790 SADB_8TO64(allocsize - sizeof (sadb_msg_t)); 791 sasupp->sadb_supported_exttype = SADB_EXT_SUPPORTED_AUTH; 792 sasupp->sadb_supported_reserved = 0; 793 } 794 795 if (ahstack->ah_pfkey_q != NULL) 796 putnext(ahstack->ah_pfkey_q, mp); 797 else { 798 rc = B_FALSE; 799 freemsg(mp); 800 } 801 802 return (rc); 803 } 804 805 /* 806 * Invoked when the algorithm table changes. Causes SADB_REGISTER 807 * messages continaining the current list of algorithms to be 808 * sent up to the AH listeners. 809 */ 810 void 811 ipsecah_algs_changed(netstack_t *ns) 812 { 813 ipsecah_stack_t *ahstack = ns->netstack_ipsecah; 814 815 /* 816 * Time to send a PF_KEY SADB_REGISTER message to AH listeners 817 * everywhere. (The function itself checks for NULL ah_pfkey_q.) 818 */ 819 (void) ah_register_out(0, 0, 0, ahstack); 820 } 821 822 /* 823 * Stub function that taskq_dispatch() invokes to take the mblk (in arg) 824 * and put() it into AH and STREAMS again. 825 */ 826 static void 827 inbound_task(void *arg) 828 { 829 ah_t *ah; 830 mblk_t *mp = (mblk_t *)arg; 831 ipsec_in_t *ii = (ipsec_in_t *)mp->b_rptr; 832 int ipsec_rc; 833 netstack_t *ns; 834 ipsecah_stack_t *ahstack; 835 836 ns = netstack_find_by_stackid(ii->ipsec_in_stackid); 837 if (ns == NULL || ns != ii->ipsec_in_ns) { 838 /* Just freemsg(). */ 839 if (ns != NULL) 840 netstack_rele(ns); 841 freemsg(mp); 842 return; 843 } 844 845 ahstack = ns->netstack_ipsecah; 846 847 ah2dbg(ahstack, ("in AH inbound_task")); 848 849 ASSERT(ahstack != NULL); 850 ah = ipsec_inbound_ah_sa(mp, ns); 851 if (ah != NULL) { 852 ASSERT(ii->ipsec_in_ah_sa != NULL); 853 ipsec_rc = ii->ipsec_in_ah_sa->ipsa_input_func(mp, ah); 854 if (ipsec_rc == IPSEC_STATUS_SUCCESS) 855 ip_fanout_proto_again(mp, NULL, NULL, NULL); 856 } 857 netstack_rele(ns); 858 } 859 860 /* 861 * Now that weak-key passed, actually ADD the security association, and 862 * send back a reply ADD message. 863 */ 864 static int 865 ah_add_sa_finish(mblk_t *mp, sadb_msg_t *samsg, keysock_in_t *ksi, 866 int *diagnostic, ipsecah_stack_t *ahstack) 867 { 868 isaf_t *primary = NULL, *secondary, *inbound, *outbound; 869 sadb_sa_t *assoc = (sadb_sa_t *)ksi->ks_in_extv[SADB_EXT_SA]; 870 sadb_address_t *dstext = 871 (sadb_address_t *)ksi->ks_in_extv[SADB_EXT_ADDRESS_DST]; 872 struct sockaddr_in *dst; 873 struct sockaddr_in6 *dst6; 874 boolean_t is_ipv4, clone = B_FALSE, is_inbound = B_FALSE; 875 uint32_t *dstaddr; 876 ipsa_t *larval; 877 ipsacq_t *acqrec; 878 iacqf_t *acq_bucket; 879 mblk_t *acq_msgs = NULL; 880 mblk_t *lpkt; 881 int rc; 882 sadb_t *sp; 883 int outhash; 884 netstack_t *ns = ahstack->ipsecah_netstack; 885 ipsec_stack_t *ipss = ns->netstack_ipsec; 886 887 /* 888 * Locate the appropriate table(s). 889 */ 890 891 dst = (struct sockaddr_in *)(dstext + 1); 892 dst6 = (struct sockaddr_in6 *)dst; 893 is_ipv4 = (dst->sin_family == AF_INET); 894 if (is_ipv4) { 895 sp = &ahstack->ah_sadb.s_v4; 896 dstaddr = (uint32_t *)(&dst->sin_addr); 897 outhash = OUTBOUND_HASH_V4(sp, *(ipaddr_t *)dstaddr); 898 } else { 899 ASSERT(dst->sin_family == AF_INET6); 900 sp = &ahstack->ah_sadb.s_v6; 901 dstaddr = (uint32_t *)(&dst6->sin6_addr); 902 outhash = OUTBOUND_HASH_V6(sp, *(in6_addr_t *)dstaddr); 903 } 904 905 inbound = INBOUND_BUCKET(sp, assoc->sadb_sa_spi); 906 outbound = &sp->sdb_of[outhash]; 907 /* 908 * Use the direction flags provided by the KMD to determine 909 * if the inbound or outbound table should be the primary 910 * for this SA. If these flags were absent then make this 911 * decision based on the addresses. 912 */ 913 if (assoc->sadb_sa_flags & IPSA_F_INBOUND) { 914 primary = inbound; 915 secondary = outbound; 916 is_inbound = B_TRUE; 917 if (assoc->sadb_sa_flags & IPSA_F_OUTBOUND) 918 clone = B_TRUE; 919 } else { 920 if (assoc->sadb_sa_flags & IPSA_F_OUTBOUND) { 921 primary = outbound; 922 secondary = inbound; 923 } 924 } 925 926 if (primary == NULL) { 927 /* 928 * The KMD did not set a direction flag, determine which 929 * table to insert the SA into based on addresses. 930 */ 931 switch (ksi->ks_in_dsttype) { 932 case KS_IN_ADDR_MBCAST: 933 clone = B_TRUE; /* All mcast SAs can be bidirectional */ 934 assoc->sadb_sa_flags |= IPSA_F_OUTBOUND; 935 /* FALLTHRU */ 936 /* 937 * If the source address is either one of mine, or unspecified 938 * (which is best summed up by saying "not 'not mine'"), 939 * then the association is potentially bi-directional, 940 * in that it can be used for inbound traffic and outbound 941 * traffic. The best example of such and SA is a multicast 942 * SA (which allows me to receive the outbound traffic). 943 */ 944 case KS_IN_ADDR_ME: 945 assoc->sadb_sa_flags |= IPSA_F_INBOUND; 946 primary = inbound; 947 secondary = outbound; 948 if (ksi->ks_in_srctype != KS_IN_ADDR_NOTME) 949 clone = B_TRUE; 950 is_inbound = B_TRUE; 951 break; 952 /* 953 * If the source address literally not mine (either 954 * unspecified or not mine), then this SA may have an 955 * address that WILL be mine after some configuration. 956 * We pay the price for this by making it a bi-directional 957 * SA. 958 */ 959 case KS_IN_ADDR_NOTME: 960 assoc->sadb_sa_flags |= IPSA_F_OUTBOUND; 961 primary = outbound; 962 secondary = inbound; 963 if (ksi->ks_in_srctype != KS_IN_ADDR_ME) { 964 assoc->sadb_sa_flags |= IPSA_F_INBOUND; 965 clone = B_TRUE; 966 } 967 break; 968 default: 969 *diagnostic = SADB_X_DIAGNOSTIC_BAD_DST; 970 return (EINVAL); 971 } 972 } 973 974 /* 975 * Find a ACQUIRE list entry if possible. If we've added an SA that 976 * suits the needs of an ACQUIRE list entry, we can eliminate the 977 * ACQUIRE list entry and transmit the enqueued packets. Use the 978 * high-bit of the sequence number to queue it. Key off destination 979 * addr, and change acqrec's state. 980 */ 981 982 if (samsg->sadb_msg_seq & IACQF_LOWEST_SEQ) { 983 acq_bucket = &sp->sdb_acq[outhash]; 984 mutex_enter(&acq_bucket->iacqf_lock); 985 for (acqrec = acq_bucket->iacqf_ipsacq; acqrec != NULL; 986 acqrec = acqrec->ipsacq_next) { 987 mutex_enter(&acqrec->ipsacq_lock); 988 /* 989 * Q: I only check sequence. Should I check dst? 990 * A: Yes, check dest because those are the packets 991 * that are queued up. 992 */ 993 if (acqrec->ipsacq_seq == samsg->sadb_msg_seq && 994 IPSA_ARE_ADDR_EQUAL(dstaddr, 995 acqrec->ipsacq_dstaddr, acqrec->ipsacq_addrfam)) 996 break; 997 mutex_exit(&acqrec->ipsacq_lock); 998 } 999 if (acqrec != NULL) { 1000 /* 1001 * AHA! I found an ACQUIRE record for this SA. 1002 * Grab the msg list, and free the acquire record. 1003 * I already am holding the lock for this record, 1004 * so all I have to do is free it. 1005 */ 1006 acq_msgs = acqrec->ipsacq_mp; 1007 acqrec->ipsacq_mp = NULL; 1008 mutex_exit(&acqrec->ipsacq_lock); 1009 sadb_destroy_acquire(acqrec, ns); 1010 } 1011 mutex_exit(&acq_bucket->iacqf_lock); 1012 } 1013 1014 /* 1015 * Find PF_KEY message, and see if I'm an update. If so, find entry 1016 * in larval list (if there). 1017 */ 1018 1019 larval = NULL; 1020 1021 if (samsg->sadb_msg_type == SADB_UPDATE) { 1022 mutex_enter(&inbound->isaf_lock); 1023 larval = ipsec_getassocbyspi(inbound, assoc->sadb_sa_spi, 1024 ALL_ZEROES_PTR, dstaddr, dst->sin_family); 1025 mutex_exit(&inbound->isaf_lock); 1026 1027 if ((larval == NULL) || 1028 (larval->ipsa_state != IPSA_STATE_LARVAL)) { 1029 *diagnostic = SADB_X_DIAGNOSTIC_SA_NOTFOUND; 1030 if (larval != NULL) { 1031 IPSA_REFRELE(larval); 1032 } 1033 ah0dbg(("Larval update, but larval disappeared.\n")); 1034 return (ESRCH); 1035 } /* Else sadb_common_add unlinks it for me! */ 1036 } 1037 1038 lpkt = NULL; 1039 if (larval != NULL) 1040 lpkt = sadb_clear_lpkt(larval); 1041 1042 rc = sadb_common_add(ahstack->ah_sadb.s_ip_q, ahstack->ah_pfkey_q, mp, 1043 samsg, ksi, primary, secondary, larval, clone, is_inbound, 1044 diagnostic, ns, &ahstack->ah_sadb); 1045 1046 /* 1047 * How much more stack will I create with all of these 1048 * ah_inbound_* and ah_outbound_*() calls? 1049 */ 1050 1051 if (rc == 0 && lpkt != NULL) 1052 rc = !taskq_dispatch(ah_taskq, inbound_task, lpkt, TQ_NOSLEEP); 1053 1054 if (rc != 0) { 1055 ip_drop_packet(lpkt, B_TRUE, NULL, NULL, 1056 DROPPER(ipss, ipds_sadb_inlarval_timeout), 1057 &ahstack->ah_dropper); 1058 } 1059 1060 while (acq_msgs != NULL) { 1061 mblk_t *mp = acq_msgs; 1062 1063 acq_msgs = acq_msgs->b_next; 1064 mp->b_next = NULL; 1065 if (rc == 0) { 1066 ipsec_out_t *io = (ipsec_out_t *)mp->b_rptr; 1067 1068 ASSERT(ahstack->ah_sadb.s_ip_q != NULL); 1069 if (ipsec_outbound_sa(mp, IPPROTO_AH)) { 1070 io->ipsec_out_ah_done = B_TRUE; 1071 if (ah_outbound(mp) == IPSEC_STATUS_SUCCESS) { 1072 ipha_t *ipha = (ipha_t *) 1073 mp->b_cont->b_rptr; 1074 if (is_ipv4) { 1075 ip_wput_ipsec_out(NULL, mp, 1076 ipha, NULL, NULL); 1077 } else { 1078 ip6_t *ip6h = (ip6_t *)ipha; 1079 ip_wput_ipsec_out_v6(NULL, 1080 mp, ip6h, NULL, NULL); 1081 } 1082 } 1083 continue; 1084 } 1085 } 1086 AH_BUMP_STAT(ahstack, out_discards); 1087 ip_drop_packet(mp, B_FALSE, NULL, NULL, 1088 DROPPER(ipss, ipds_sadb_acquire_timeout), 1089 &ahstack->ah_dropper); 1090 } 1091 1092 return (rc); 1093 } 1094 1095 /* 1096 * Add new AH security association. This may become a generic AH/ESP 1097 * routine eventually. 1098 */ 1099 static int 1100 ah_add_sa(mblk_t *mp, keysock_in_t *ksi, int *diagnostic, netstack_t *ns) 1101 { 1102 sadb_sa_t *assoc = (sadb_sa_t *)ksi->ks_in_extv[SADB_EXT_SA]; 1103 sadb_address_t *srcext = 1104 (sadb_address_t *)ksi->ks_in_extv[SADB_EXT_ADDRESS_SRC]; 1105 sadb_address_t *dstext = 1106 (sadb_address_t *)ksi->ks_in_extv[SADB_EXT_ADDRESS_DST]; 1107 sadb_address_t *isrcext = 1108 (sadb_address_t *)ksi->ks_in_extv[SADB_X_EXT_ADDRESS_INNER_SRC]; 1109 sadb_address_t *idstext = 1110 (sadb_address_t *)ksi->ks_in_extv[SADB_X_EXT_ADDRESS_INNER_DST]; 1111 sadb_key_t *key = (sadb_key_t *)ksi->ks_in_extv[SADB_EXT_KEY_AUTH]; 1112 struct sockaddr_in *src, *dst; 1113 /* We don't need sockaddr_in6 for now. */ 1114 sadb_lifetime_t *soft = 1115 (sadb_lifetime_t *)ksi->ks_in_extv[SADB_EXT_LIFETIME_SOFT]; 1116 sadb_lifetime_t *hard = 1117 (sadb_lifetime_t *)ksi->ks_in_extv[SADB_EXT_LIFETIME_HARD]; 1118 sadb_lifetime_t *idle = 1119 (sadb_lifetime_t *)ksi->ks_in_extv[SADB_X_EXT_LIFETIME_IDLE]; 1120 ipsec_alginfo_t *aalg; 1121 ipsecah_stack_t *ahstack = ns->netstack_ipsecah; 1122 ipsec_stack_t *ipss = ns->netstack_ipsec; 1123 1124 /* I need certain extensions present for an ADD message. */ 1125 if (srcext == NULL) { 1126 *diagnostic = SADB_X_DIAGNOSTIC_MISSING_SRC; 1127 return (EINVAL); 1128 } 1129 if (dstext == NULL) { 1130 *diagnostic = SADB_X_DIAGNOSTIC_MISSING_DST; 1131 return (EINVAL); 1132 } 1133 if (isrcext == NULL && idstext != NULL) { 1134 *diagnostic = SADB_X_DIAGNOSTIC_MISSING_INNER_SRC; 1135 return (EINVAL); 1136 } 1137 if (isrcext != NULL && idstext == NULL) { 1138 *diagnostic = SADB_X_DIAGNOSTIC_MISSING_INNER_DST; 1139 return (EINVAL); 1140 } 1141 if (assoc == NULL) { 1142 *diagnostic = SADB_X_DIAGNOSTIC_MISSING_SA; 1143 return (EINVAL); 1144 } 1145 if (key == NULL) { 1146 *diagnostic = SADB_X_DIAGNOSTIC_MISSING_AKEY; 1147 return (EINVAL); 1148 } 1149 1150 src = (struct sockaddr_in *)(srcext + 1); 1151 dst = (struct sockaddr_in *)(dstext + 1); 1152 1153 /* Sundry ADD-specific reality checks. */ 1154 /* XXX STATS : Logging/stats here? */ 1155 1156 if ((assoc->sadb_sa_state != SADB_SASTATE_MATURE) && 1157 (assoc->sadb_sa_state != SADB_X_SASTATE_ACTIVE_ELSEWHERE)) { 1158 *diagnostic = SADB_X_DIAGNOSTIC_BAD_SASTATE; 1159 return (EINVAL); 1160 } 1161 if (assoc->sadb_sa_encrypt != SADB_EALG_NONE) { 1162 *diagnostic = SADB_X_DIAGNOSTIC_ENCR_NOTSUPP; 1163 return (EINVAL); 1164 } 1165 if (assoc->sadb_sa_flags & ~ahstack->ah_sadb.s_addflags) { 1166 *diagnostic = SADB_X_DIAGNOSTIC_BAD_SAFLAGS; 1167 return (EINVAL); 1168 } 1169 if ((*diagnostic = sadb_hardsoftchk(hard, soft, idle)) != 0) 1170 return (EINVAL); 1171 1172 ASSERT(src->sin_family == dst->sin_family); 1173 1174 /* Stuff I don't support, for now. XXX Diagnostic? */ 1175 if (ksi->ks_in_extv[SADB_EXT_LIFETIME_CURRENT] != NULL || 1176 ksi->ks_in_extv[SADB_EXT_SENSITIVITY] != NULL) 1177 return (EOPNOTSUPP); 1178 1179 /* 1180 * XXX Policy : I'm not checking identities or sensitivity 1181 * labels at this time, but if I did, I'd do them here, before I sent 1182 * the weak key check up to the algorithm. 1183 */ 1184 1185 /* verify that there is a mapping for the specified algorithm */ 1186 mutex_enter(&ipss->ipsec_alg_lock); 1187 aalg = ipss->ipsec_alglists[IPSEC_ALG_AUTH][assoc->sadb_sa_auth]; 1188 if (aalg == NULL || !ALG_VALID(aalg)) { 1189 mutex_exit(&ipss->ipsec_alg_lock); 1190 ah1dbg(ahstack, ("Couldn't find auth alg #%d.\n", 1191 assoc->sadb_sa_auth)); 1192 *diagnostic = SADB_X_DIAGNOSTIC_BAD_AALG; 1193 return (EINVAL); 1194 } 1195 ASSERT(aalg->alg_mech_type != CRYPTO_MECHANISM_INVALID); 1196 1197 /* sanity check key sizes */ 1198 if (!ipsec_valid_key_size(key->sadb_key_bits, aalg)) { 1199 mutex_exit(&ipss->ipsec_alg_lock); 1200 *diagnostic = SADB_X_DIAGNOSTIC_BAD_AKEYBITS; 1201 return (EINVAL); 1202 } 1203 1204 /* check key and fix parity if needed */ 1205 if (ipsec_check_key(aalg->alg_mech_type, key, B_TRUE, 1206 diagnostic) != 0) { 1207 mutex_exit(&ipss->ipsec_alg_lock); 1208 return (EINVAL); 1209 } 1210 1211 mutex_exit(&ipss->ipsec_alg_lock); 1212 1213 return (ah_add_sa_finish(mp, (sadb_msg_t *)mp->b_cont->b_rptr, ksi, 1214 diagnostic, ahstack)); 1215 } 1216 1217 /* 1218 * Update a security association. Updates come in two varieties. The first 1219 * is an update of lifetimes on a non-larval SA. The second is an update of 1220 * a larval SA, which ends up looking a lot more like an add. 1221 */ 1222 static int 1223 ah_update_sa(mblk_t *mp, keysock_in_t *ksi, int *diagnostic, 1224 ipsecah_stack_t *ahstack, uint8_t sadb_msg_type) 1225 { 1226 sadb_sa_t *assoc = (sadb_sa_t *)ksi->ks_in_extv[SADB_EXT_SA]; 1227 sadb_address_t *dstext = 1228 (sadb_address_t *)ksi->ks_in_extv[SADB_EXT_ADDRESS_DST]; 1229 mblk_t *buf_pkt; 1230 int rcode; 1231 1232 if (dstext == NULL) { 1233 *diagnostic = SADB_X_DIAGNOSTIC_MISSING_DST; 1234 return (EINVAL); 1235 } 1236 1237 rcode = sadb_update_sa(mp, ksi, &buf_pkt, &ahstack->ah_sadb, 1238 diagnostic, ahstack->ah_pfkey_q, ah_add_sa, 1239 ahstack->ipsecah_netstack, sadb_msg_type); 1240 1241 if ((assoc->sadb_sa_state != SADB_X_SASTATE_ACTIVE) || 1242 (rcode != 0)) { 1243 return (rcode); 1244 } 1245 1246 HANDLE_BUF_PKT(ah_taskq, ahstack->ipsecah_netstack->netstack_ipsec, 1247 ahstack->ah_dropper, buf_pkt); 1248 1249 return (rcode); 1250 } 1251 1252 /* 1253 * Delete a security association. This is REALLY likely to be code common to 1254 * both AH and ESP. Find the association, then unlink it. 1255 */ 1256 static int 1257 ah_del_sa(mblk_t *mp, keysock_in_t *ksi, int *diagnostic, 1258 ipsecah_stack_t *ahstack, uint8_t sadb_msg_type) 1259 { 1260 sadb_sa_t *assoc = (sadb_sa_t *)ksi->ks_in_extv[SADB_EXT_SA]; 1261 sadb_address_t *dstext = 1262 (sadb_address_t *)ksi->ks_in_extv[SADB_EXT_ADDRESS_DST]; 1263 sadb_address_t *srcext = 1264 (sadb_address_t *)ksi->ks_in_extv[SADB_EXT_ADDRESS_SRC]; 1265 struct sockaddr_in *sin; 1266 1267 if (assoc == NULL) { 1268 if (dstext != NULL) 1269 sin = (struct sockaddr_in *)(dstext + 1); 1270 else if (srcext != NULL) 1271 sin = (struct sockaddr_in *)(srcext + 1); 1272 else { 1273 *diagnostic = SADB_X_DIAGNOSTIC_MISSING_SA; 1274 return (EINVAL); 1275 } 1276 return (sadb_purge_sa(mp, ksi, 1277 (sin->sin_family == AF_INET6) ? &ahstack->ah_sadb.s_v6 : 1278 &ahstack->ah_sadb.s_v4, 1279 ahstack->ah_pfkey_q, ahstack->ah_sadb.s_ip_q)); 1280 } 1281 1282 return (sadb_delget_sa(mp, ksi, &ahstack->ah_sadb, diagnostic, 1283 ahstack->ah_pfkey_q, sadb_msg_type)); 1284 } 1285 1286 /* 1287 * Convert the entire contents of all of AH's SA tables into PF_KEY SADB_DUMP 1288 * messages. 1289 */ 1290 static void 1291 ah_dump(mblk_t *mp, keysock_in_t *ksi, ipsecah_stack_t *ahstack) 1292 { 1293 int error; 1294 sadb_msg_t *samsg; 1295 1296 /* 1297 * Dump each fanout, bailing if error is non-zero. 1298 */ 1299 1300 error = sadb_dump(ahstack->ah_pfkey_q, mp, ksi, &ahstack->ah_sadb.s_v4); 1301 if (error != 0) 1302 goto bail; 1303 1304 error = sadb_dump(ahstack->ah_pfkey_q, mp, ksi, &ahstack->ah_sadb.s_v6); 1305 bail: 1306 ASSERT(mp->b_cont != NULL); 1307 samsg = (sadb_msg_t *)mp->b_cont->b_rptr; 1308 samsg->sadb_msg_errno = (uint8_t)error; 1309 sadb_pfkey_echo(ahstack->ah_pfkey_q, mp, 1310 (sadb_msg_t *)mp->b_cont->b_rptr, ksi, NULL); 1311 } 1312 1313 /* 1314 * First-cut reality check for an inbound PF_KEY message. 1315 */ 1316 static boolean_t 1317 ah_pfkey_reality_failures(mblk_t *mp, keysock_in_t *ksi, 1318 ipsecah_stack_t *ahstack) 1319 { 1320 int diagnostic; 1321 1322 if (mp->b_cont == NULL) { 1323 freemsg(mp); 1324 return (B_TRUE); 1325 } 1326 1327 if (ksi->ks_in_extv[SADB_EXT_KEY_ENCRYPT] != NULL) { 1328 diagnostic = SADB_X_DIAGNOSTIC_EKEY_PRESENT; 1329 goto badmsg; 1330 } 1331 if (ksi->ks_in_extv[SADB_EXT_PROPOSAL] != NULL) { 1332 diagnostic = SADB_X_DIAGNOSTIC_PROP_PRESENT; 1333 goto badmsg; 1334 } 1335 if (ksi->ks_in_extv[SADB_EXT_SUPPORTED_AUTH] != NULL || 1336 ksi->ks_in_extv[SADB_EXT_SUPPORTED_ENCRYPT] != NULL) { 1337 diagnostic = SADB_X_DIAGNOSTIC_SUPP_PRESENT; 1338 goto badmsg; 1339 } 1340 return (B_FALSE); /* False ==> no failures */ 1341 1342 badmsg: 1343 sadb_pfkey_error(ahstack->ah_pfkey_q, mp, EINVAL, 1344 diagnostic, ksi->ks_in_serial); 1345 return (B_TRUE); /* True ==> failures */ 1346 } 1347 1348 /* 1349 * AH parsing of PF_KEY messages. Keysock did most of the really silly 1350 * error cases. What I receive is a fully-formed, syntactically legal 1351 * PF_KEY message. I then need to check semantics... 1352 * 1353 * This code may become common to AH and ESP. Stay tuned. 1354 * 1355 * I also make the assumption that db_ref's are cool. If this assumption 1356 * is wrong, this means that someone other than keysock or me has been 1357 * mucking with PF_KEY messages. 1358 */ 1359 static void 1360 ah_parse_pfkey(mblk_t *mp, ipsecah_stack_t *ahstack) 1361 { 1362 mblk_t *msg = mp->b_cont; 1363 sadb_msg_t *samsg; 1364 keysock_in_t *ksi; 1365 int error; 1366 int diagnostic = SADB_X_DIAGNOSTIC_NONE; 1367 1368 ASSERT(msg != NULL); 1369 1370 samsg = (sadb_msg_t *)msg->b_rptr; 1371 ksi = (keysock_in_t *)mp->b_rptr; 1372 1373 /* 1374 * If applicable, convert unspecified AF_INET6 to unspecified 1375 * AF_INET. 1376 */ 1377 if (!sadb_addrfix(ksi, ahstack->ah_pfkey_q, mp, 1378 ahstack->ipsecah_netstack) || 1379 ah_pfkey_reality_failures(mp, ksi, ahstack)) { 1380 return; 1381 } 1382 1383 switch (samsg->sadb_msg_type) { 1384 case SADB_ADD: 1385 error = ah_add_sa(mp, ksi, &diagnostic, 1386 ahstack->ipsecah_netstack); 1387 if (error != 0) { 1388 sadb_pfkey_error(ahstack->ah_pfkey_q, mp, error, 1389 diagnostic, ksi->ks_in_serial); 1390 } 1391 /* else ah_add_sa() took care of things. */ 1392 break; 1393 case SADB_DELETE: 1394 case SADB_X_DELPAIR: 1395 case SADB_X_DELPAIR_STATE: 1396 error = ah_del_sa(mp, ksi, &diagnostic, ahstack, 1397 samsg->sadb_msg_type); 1398 if (error != 0) { 1399 sadb_pfkey_error(ahstack->ah_pfkey_q, mp, error, 1400 diagnostic, ksi->ks_in_serial); 1401 } 1402 /* Else ah_del_sa() took care of things. */ 1403 break; 1404 case SADB_GET: 1405 error = sadb_delget_sa(mp, ksi, &ahstack->ah_sadb, &diagnostic, 1406 ahstack->ah_pfkey_q, samsg->sadb_msg_type); 1407 if (error != 0) { 1408 sadb_pfkey_error(ahstack->ah_pfkey_q, mp, error, 1409 diagnostic, ksi->ks_in_serial); 1410 } 1411 /* Else sadb_get_sa() took care of things. */ 1412 break; 1413 case SADB_FLUSH: 1414 sadbp_flush(&ahstack->ah_sadb, ahstack->ipsecah_netstack); 1415 sadb_pfkey_echo(ahstack->ah_pfkey_q, mp, samsg, ksi, NULL); 1416 break; 1417 case SADB_REGISTER: 1418 /* 1419 * Hmmm, let's do it! Check for extensions (there should 1420 * be none), extract the fields, call ah_register_out(), 1421 * then either free or report an error. 1422 * 1423 * Keysock takes care of the PF_KEY bookkeeping for this. 1424 */ 1425 if (ah_register_out(samsg->sadb_msg_seq, samsg->sadb_msg_pid, 1426 ksi->ks_in_serial, ahstack)) { 1427 freemsg(mp); 1428 } else { 1429 /* 1430 * Only way this path hits is if there is a memory 1431 * failure. It will not return B_FALSE because of 1432 * lack of ah_pfkey_q if I am in wput(). 1433 */ 1434 sadb_pfkey_error(ahstack->ah_pfkey_q, mp, ENOMEM, 1435 diagnostic, ksi->ks_in_serial); 1436 } 1437 break; 1438 case SADB_UPDATE: 1439 case SADB_X_UPDATEPAIR: 1440 /* 1441 * Find a larval, if not there, find a full one and get 1442 * strict. 1443 */ 1444 error = ah_update_sa(mp, ksi, &diagnostic, ahstack, 1445 samsg->sadb_msg_type); 1446 if (error != 0) { 1447 sadb_pfkey_error(ahstack->ah_pfkey_q, mp, error, 1448 diagnostic, ksi->ks_in_serial); 1449 } 1450 /* else ah_update_sa() took care of things. */ 1451 break; 1452 case SADB_GETSPI: 1453 /* 1454 * Reserve a new larval entry. 1455 */ 1456 ah_getspi(mp, ksi, ahstack); 1457 break; 1458 case SADB_ACQUIRE: 1459 /* 1460 * Find larval and/or ACQUIRE record and kill it (them), I'm 1461 * most likely an error. Inbound ACQUIRE messages should only 1462 * have the base header. 1463 */ 1464 sadb_in_acquire(samsg, &ahstack->ah_sadb, ahstack->ah_pfkey_q, 1465 ahstack->ipsecah_netstack); 1466 freemsg(mp); 1467 break; 1468 case SADB_DUMP: 1469 /* 1470 * Dump all entries. 1471 */ 1472 ah_dump(mp, ksi, ahstack); 1473 /* ah_dump will take care of the return message, etc. */ 1474 break; 1475 case SADB_EXPIRE: 1476 /* Should never reach me. */ 1477 sadb_pfkey_error(ahstack->ah_pfkey_q, mp, EOPNOTSUPP, 1478 diagnostic, ksi->ks_in_serial); 1479 break; 1480 default: 1481 sadb_pfkey_error(ahstack->ah_pfkey_q, mp, EINVAL, 1482 SADB_X_DIAGNOSTIC_UNKNOWN_MSG, ksi->ks_in_serial); 1483 break; 1484 } 1485 } 1486 1487 /* 1488 * Handle case where PF_KEY says it can't find a keysock for one of my 1489 * ACQUIRE messages. 1490 */ 1491 static void 1492 ah_keysock_no_socket(mblk_t *mp, ipsecah_stack_t *ahstack) 1493 { 1494 sadb_msg_t *samsg; 1495 keysock_out_err_t *kse = (keysock_out_err_t *)mp->b_rptr; 1496 1497 if (mp->b_cont == NULL) { 1498 freemsg(mp); 1499 return; 1500 } 1501 samsg = (sadb_msg_t *)mp->b_cont->b_rptr; 1502 1503 /* 1504 * If keysock can't find any registered, delete the acquire record 1505 * immediately, and handle errors. 1506 */ 1507 if (samsg->sadb_msg_type == SADB_ACQUIRE) { 1508 samsg->sadb_msg_errno = kse->ks_err_errno; 1509 samsg->sadb_msg_len = SADB_8TO64(sizeof (*samsg)); 1510 /* 1511 * Use the write-side of the ah_pfkey_q, in case there is 1512 * no ahstack->ah_sadb.s_ip_q. 1513 */ 1514 sadb_in_acquire(samsg, &ahstack->ah_sadb, 1515 WR(ahstack->ah_pfkey_q), ahstack->ipsecah_netstack); 1516 } 1517 1518 freemsg(mp); 1519 } 1520 1521 /* 1522 * AH module write put routine. 1523 */ 1524 static void 1525 ipsecah_wput(queue_t *q, mblk_t *mp) 1526 { 1527 ipsec_info_t *ii; 1528 struct iocblk *iocp; 1529 ipsecah_stack_t *ahstack = (ipsecah_stack_t *)q->q_ptr; 1530 1531 ah3dbg(ahstack, ("In ah_wput().\n")); 1532 1533 /* NOTE: Each case must take care of freeing or passing mp. */ 1534 switch (mp->b_datap->db_type) { 1535 case M_CTL: 1536 if ((mp->b_wptr - mp->b_rptr) < sizeof (ipsec_info_t)) { 1537 /* Not big enough message. */ 1538 freemsg(mp); 1539 break; 1540 } 1541 ii = (ipsec_info_t *)mp->b_rptr; 1542 1543 switch (ii->ipsec_info_type) { 1544 case KEYSOCK_OUT_ERR: 1545 ah1dbg(ahstack, ("Got KEYSOCK_OUT_ERR message.\n")); 1546 ah_keysock_no_socket(mp, ahstack); 1547 break; 1548 case KEYSOCK_IN: 1549 AH_BUMP_STAT(ahstack, keysock_in); 1550 ah3dbg(ahstack, ("Got KEYSOCK_IN message.\n")); 1551 1552 /* Parse the message. */ 1553 ah_parse_pfkey(mp, ahstack); 1554 break; 1555 case KEYSOCK_HELLO: 1556 sadb_keysock_hello(&ahstack->ah_pfkey_q, q, mp, 1557 ah_ager, (void *)ahstack, &ahstack->ah_event, 1558 SADB_SATYPE_AH); 1559 break; 1560 default: 1561 ah1dbg(ahstack, ("Got M_CTL from above of 0x%x.\n", 1562 ii->ipsec_info_type)); 1563 freemsg(mp); 1564 break; 1565 } 1566 break; 1567 case M_IOCTL: 1568 iocp = (struct iocblk *)mp->b_rptr; 1569 switch (iocp->ioc_cmd) { 1570 case ND_SET: 1571 case ND_GET: 1572 if (nd_getset(q, ahstack->ipsecah_g_nd, mp)) { 1573 qreply(q, mp); 1574 return; 1575 } else { 1576 iocp->ioc_error = ENOENT; 1577 } 1578 /* FALLTHRU */ 1579 default: 1580 /* We really don't support any other ioctls, do we? */ 1581 1582 /* Return EINVAL */ 1583 if (iocp->ioc_error != ENOENT) 1584 iocp->ioc_error = EINVAL; 1585 iocp->ioc_count = 0; 1586 mp->b_datap->db_type = M_IOCACK; 1587 qreply(q, mp); 1588 return; 1589 } 1590 default: 1591 ah3dbg(ahstack, 1592 ("Got default message, type %d, passing to IP.\n", 1593 mp->b_datap->db_type)); 1594 putnext(q, mp); 1595 } 1596 } 1597 1598 /* 1599 * Updating use times can be tricky business if the ipsa_haspeer flag is 1600 * set. This function is called once in an SA's lifetime. 1601 * 1602 * Caller has to REFRELE "assoc" which is passed in. This function has 1603 * to REFRELE any peer SA that is obtained. 1604 */ 1605 static void 1606 ah_set_usetime(ipsa_t *assoc, boolean_t inbound) 1607 { 1608 ipsa_t *inassoc, *outassoc; 1609 isaf_t *bucket; 1610 sadb_t *sp; 1611 int outhash; 1612 boolean_t isv6; 1613 netstack_t *ns = assoc->ipsa_netstack; 1614 ipsecah_stack_t *ahstack = ns->netstack_ipsecah; 1615 1616 /* No peer? No problem! */ 1617 if (!assoc->ipsa_haspeer) { 1618 sadb_set_usetime(assoc); 1619 return; 1620 } 1621 1622 /* 1623 * Otherwise, we want to grab both the original assoc and its peer. 1624 * There might be a race for this, but if it's a real race, the times 1625 * will be out-of-synch by at most a second, and since our time 1626 * granularity is a second, this won't be a problem. 1627 * 1628 * If we need tight synchronization on the peer SA, then we need to 1629 * reconsider. 1630 */ 1631 1632 /* Use address family to select IPv6/IPv4 */ 1633 isv6 = (assoc->ipsa_addrfam == AF_INET6); 1634 if (isv6) { 1635 sp = &ahstack->ah_sadb.s_v6; 1636 } else { 1637 sp = &ahstack->ah_sadb.s_v4; 1638 ASSERT(assoc->ipsa_addrfam == AF_INET); 1639 } 1640 if (inbound) { 1641 inassoc = assoc; 1642 if (isv6) 1643 outhash = OUTBOUND_HASH_V6(sp, 1644 *((in6_addr_t *)&inassoc->ipsa_dstaddr)); 1645 else 1646 outhash = OUTBOUND_HASH_V4(sp, 1647 *((ipaddr_t *)&inassoc->ipsa_dstaddr)); 1648 bucket = &sp->sdb_of[outhash]; 1649 1650 mutex_enter(&bucket->isaf_lock); 1651 outassoc = ipsec_getassocbyspi(bucket, inassoc->ipsa_spi, 1652 inassoc->ipsa_srcaddr, inassoc->ipsa_dstaddr, 1653 inassoc->ipsa_addrfam); 1654 mutex_exit(&bucket->isaf_lock); 1655 if (outassoc == NULL) { 1656 /* Q: Do we wish to set haspeer == B_FALSE? */ 1657 ah0dbg(("ah_set_usetime: " 1658 "can't find peer for inbound.\n")); 1659 sadb_set_usetime(inassoc); 1660 return; 1661 } 1662 } else { 1663 outassoc = assoc; 1664 bucket = INBOUND_BUCKET(sp, outassoc->ipsa_spi); 1665 mutex_enter(&bucket->isaf_lock); 1666 inassoc = ipsec_getassocbyspi(bucket, outassoc->ipsa_spi, 1667 outassoc->ipsa_srcaddr, outassoc->ipsa_dstaddr, 1668 outassoc->ipsa_addrfam); 1669 mutex_exit(&bucket->isaf_lock); 1670 if (inassoc == NULL) { 1671 /* Q: Do we wish to set haspeer == B_FALSE? */ 1672 ah0dbg(("ah_set_usetime: " 1673 "can't find peer for outbound.\n")); 1674 sadb_set_usetime(outassoc); 1675 return; 1676 } 1677 } 1678 1679 /* Update usetime on both. */ 1680 sadb_set_usetime(inassoc); 1681 sadb_set_usetime(outassoc); 1682 1683 /* 1684 * REFRELE any peer SA. 1685 * 1686 * Because of the multi-line macro nature of IPSA_REFRELE, keep 1687 * them in { }. 1688 */ 1689 if (inbound) { 1690 IPSA_REFRELE(outassoc); 1691 } else { 1692 IPSA_REFRELE(inassoc); 1693 } 1694 } 1695 1696 /* 1697 * Add a number of bytes to what the SA has protected so far. Return 1698 * B_TRUE if the SA can still protect that many bytes. 1699 * 1700 * Caller must REFRELE the passed-in assoc. This function must REFRELE 1701 * any obtained peer SA. 1702 */ 1703 static boolean_t 1704 ah_age_bytes(ipsa_t *assoc, uint64_t bytes, boolean_t inbound) 1705 { 1706 ipsa_t *inassoc, *outassoc; 1707 isaf_t *bucket; 1708 boolean_t inrc, outrc, isv6; 1709 sadb_t *sp; 1710 int outhash; 1711 netstack_t *ns = assoc->ipsa_netstack; 1712 ipsecah_stack_t *ahstack = ns->netstack_ipsecah; 1713 1714 /* No peer? No problem! */ 1715 if (!assoc->ipsa_haspeer) { 1716 return (sadb_age_bytes(ahstack->ah_pfkey_q, assoc, bytes, 1717 B_TRUE)); 1718 } 1719 1720 /* 1721 * Otherwise, we want to grab both the original assoc and its peer. 1722 * There might be a race for this, but if it's a real race, two 1723 * expire messages may occur. We limit this by only sending the 1724 * expire message on one of the peers, we'll pick the inbound 1725 * arbitrarily. 1726 * 1727 * If we need tight synchronization on the peer SA, then we need to 1728 * reconsider. 1729 */ 1730 1731 /* Pick v4/v6 bucket based on addrfam. */ 1732 isv6 = (assoc->ipsa_addrfam == AF_INET6); 1733 if (isv6) { 1734 sp = &ahstack->ah_sadb.s_v6; 1735 } else { 1736 sp = &ahstack->ah_sadb.s_v4; 1737 ASSERT(assoc->ipsa_addrfam == AF_INET); 1738 } 1739 if (inbound) { 1740 inassoc = assoc; 1741 if (isv6) 1742 outhash = OUTBOUND_HASH_V6(sp, 1743 *((in6_addr_t *)&inassoc->ipsa_dstaddr)); 1744 else 1745 outhash = OUTBOUND_HASH_V4(sp, 1746 *((ipaddr_t *)&inassoc->ipsa_dstaddr)); 1747 bucket = &sp->sdb_of[outhash]; 1748 mutex_enter(&bucket->isaf_lock); 1749 outassoc = ipsec_getassocbyspi(bucket, inassoc->ipsa_spi, 1750 inassoc->ipsa_srcaddr, inassoc->ipsa_dstaddr, 1751 inassoc->ipsa_addrfam); 1752 mutex_exit(&bucket->isaf_lock); 1753 if (outassoc == NULL) { 1754 /* Q: Do we wish to set haspeer == B_FALSE? */ 1755 ah0dbg(("ah_age_bytes: " 1756 "can't find peer for inbound.\n")); 1757 return (sadb_age_bytes(ahstack->ah_pfkey_q, inassoc, 1758 bytes, B_TRUE)); 1759 } 1760 } else { 1761 outassoc = assoc; 1762 bucket = INBOUND_BUCKET(sp, outassoc->ipsa_spi); 1763 mutex_enter(&bucket->isaf_lock); 1764 inassoc = ipsec_getassocbyspi(bucket, outassoc->ipsa_spi, 1765 outassoc->ipsa_srcaddr, outassoc->ipsa_dstaddr, 1766 outassoc->ipsa_addrfam); 1767 mutex_exit(&bucket->isaf_lock); 1768 if (inassoc == NULL) { 1769 /* Q: Do we wish to set haspeer == B_FALSE? */ 1770 ah0dbg(("ah_age_bytes: " 1771 "can't find peer for outbound.\n")); 1772 return (sadb_age_bytes(ahstack->ah_pfkey_q, outassoc, 1773 bytes, B_TRUE)); 1774 } 1775 } 1776 1777 inrc = sadb_age_bytes(ahstack->ah_pfkey_q, inassoc, bytes, B_TRUE); 1778 outrc = sadb_age_bytes(ahstack->ah_pfkey_q, outassoc, bytes, B_FALSE); 1779 1780 /* 1781 * REFRELE any peer SA. 1782 * 1783 * Because of the multi-line macro nature of IPSA_REFRELE, keep 1784 * them in { }. 1785 */ 1786 if (inbound) { 1787 IPSA_REFRELE(outassoc); 1788 } else { 1789 IPSA_REFRELE(inassoc); 1790 } 1791 1792 return (inrc && outrc); 1793 } 1794 1795 /* 1796 * Perform the really difficult work of inserting the proposed situation. 1797 * Called while holding the algorithm lock. 1798 */ 1799 static void 1800 ah_insert_prop(sadb_prop_t *prop, ipsacq_t *acqrec, uint_t combs) 1801 { 1802 sadb_comb_t *comb = (sadb_comb_t *)(prop + 1); 1803 ipsec_out_t *io; 1804 ipsec_action_t *ap; 1805 ipsec_prot_t *prot; 1806 ipsecah_stack_t *ahstack; 1807 netstack_t *ns; 1808 ipsec_stack_t *ipss; 1809 1810 io = (ipsec_out_t *)acqrec->ipsacq_mp->b_rptr; 1811 ASSERT(io->ipsec_out_type == IPSEC_OUT); 1812 1813 ns = io->ipsec_out_ns; 1814 ipss = ns->netstack_ipsec; 1815 ahstack = ns->netstack_ipsecah; 1816 ASSERT(MUTEX_HELD(&ipss->ipsec_alg_lock)); 1817 1818 prop->sadb_prop_exttype = SADB_EXT_PROPOSAL; 1819 prop->sadb_prop_len = SADB_8TO64(sizeof (sadb_prop_t)); 1820 *(uint32_t *)(&prop->sadb_prop_replay) = 0; /* Quick zero-out! */ 1821 1822 prop->sadb_prop_replay = ahstack->ipsecah_replay_size; 1823 1824 /* 1825 * Based upon algorithm properties, and what-not, prioritize a 1826 * proposal, based on the ordering of the ah algorithms in the 1827 * alternatives presented in the policy rule passed down 1828 * through the ipsec_out_t and attached to the acquire record. 1829 */ 1830 1831 for (ap = acqrec->ipsacq_act; ap != NULL; 1832 ap = ap->ipa_next) { 1833 ipsec_alginfo_t *aalg; 1834 1835 if ((ap->ipa_act.ipa_type != IPSEC_POLICY_APPLY) || 1836 (!ap->ipa_act.ipa_apply.ipp_use_ah)) 1837 continue; 1838 1839 prot = &ap->ipa_act.ipa_apply; 1840 1841 ASSERT(prot->ipp_auth_alg > 0); 1842 1843 aalg = ipss->ipsec_alglists[IPSEC_ALG_AUTH] 1844 [prot->ipp_auth_alg]; 1845 if (aalg == NULL || !ALG_VALID(aalg)) 1846 continue; 1847 1848 /* XXX check aalg for duplicates??.. */ 1849 1850 comb->sadb_comb_flags = 0; 1851 comb->sadb_comb_reserved = 0; 1852 comb->sadb_comb_encrypt = 0; 1853 comb->sadb_comb_encrypt_minbits = 0; 1854 comb->sadb_comb_encrypt_maxbits = 0; 1855 1856 comb->sadb_comb_auth = aalg->alg_id; 1857 comb->sadb_comb_auth_minbits = 1858 MAX(prot->ipp_ah_minbits, aalg->alg_ef_minbits); 1859 comb->sadb_comb_auth_maxbits = 1860 MIN(prot->ipp_ah_maxbits, aalg->alg_ef_maxbits); 1861 1862 /* 1863 * The following may be based on algorithm 1864 * properties, but in the meantime, we just pick 1865 * some good, sensible numbers. Key mgmt. can 1866 * (and perhaps should) be the place to finalize 1867 * such decisions. 1868 */ 1869 1870 /* 1871 * No limits on allocations, since we really don't 1872 * support that concept currently. 1873 */ 1874 comb->sadb_comb_soft_allocations = 0; 1875 comb->sadb_comb_hard_allocations = 0; 1876 1877 /* 1878 * These may want to come from policy rule.. 1879 */ 1880 comb->sadb_comb_soft_bytes = 1881 ahstack->ipsecah_default_soft_bytes; 1882 comb->sadb_comb_hard_bytes = 1883 ahstack->ipsecah_default_hard_bytes; 1884 comb->sadb_comb_soft_addtime = 1885 ahstack->ipsecah_default_soft_addtime; 1886 comb->sadb_comb_hard_addtime = 1887 ahstack->ipsecah_default_hard_addtime; 1888 comb->sadb_comb_soft_usetime = 1889 ahstack->ipsecah_default_soft_usetime; 1890 comb->sadb_comb_hard_usetime = 1891 ahstack->ipsecah_default_hard_usetime; 1892 1893 prop->sadb_prop_len += SADB_8TO64(sizeof (*comb)); 1894 if (--combs == 0) 1895 return; /* out of space.. */ 1896 comb++; 1897 } 1898 } 1899 1900 /* 1901 * Prepare and actually send the SADB_ACQUIRE message to PF_KEY. 1902 */ 1903 static void 1904 ah_send_acquire(ipsacq_t *acqrec, mblk_t *extended, netstack_t *ns) 1905 { 1906 uint_t combs; 1907 sadb_msg_t *samsg; 1908 sadb_prop_t *prop; 1909 mblk_t *pfkeymp, *msgmp; 1910 ipsecah_stack_t *ahstack = ns->netstack_ipsecah; 1911 ipsec_stack_t *ipss = ns->netstack_ipsec; 1912 1913 AH_BUMP_STAT(ahstack, acquire_requests); 1914 1915 if (ahstack->ah_pfkey_q == NULL) { 1916 mutex_exit(&acqrec->ipsacq_lock); 1917 return; 1918 } 1919 1920 /* Set up ACQUIRE. */ 1921 pfkeymp = sadb_setup_acquire(acqrec, SADB_SATYPE_AH, 1922 ns->netstack_ipsec); 1923 if (pfkeymp == NULL) { 1924 ah0dbg(("sadb_setup_acquire failed.\n")); 1925 mutex_exit(&acqrec->ipsacq_lock); 1926 return; 1927 } 1928 ASSERT(MUTEX_HELD(&ipss->ipsec_alg_lock)); 1929 combs = ipss->ipsec_nalgs[IPSEC_ALG_AUTH]; 1930 msgmp = pfkeymp->b_cont; 1931 samsg = (sadb_msg_t *)(msgmp->b_rptr); 1932 1933 /* Insert proposal here. */ 1934 1935 prop = (sadb_prop_t *)(((uint64_t *)samsg) + samsg->sadb_msg_len); 1936 ah_insert_prop(prop, acqrec, combs); 1937 samsg->sadb_msg_len += prop->sadb_prop_len; 1938 msgmp->b_wptr += SADB_64TO8(samsg->sadb_msg_len); 1939 1940 mutex_exit(&ipss->ipsec_alg_lock); 1941 1942 /* 1943 * Must mutex_exit() before sending PF_KEY message up, in 1944 * order to avoid recursive mutex_enter() if there are no registered 1945 * listeners. 1946 * 1947 * Once I've sent the message, I'm cool anyway. 1948 */ 1949 mutex_exit(&acqrec->ipsacq_lock); 1950 if (extended != NULL) { 1951 putnext(ahstack->ah_pfkey_q, extended); 1952 } 1953 putnext(ahstack->ah_pfkey_q, pfkeymp); 1954 } 1955 1956 /* 1957 * Handle the SADB_GETSPI message. Create a larval SA. 1958 */ 1959 static void 1960 ah_getspi(mblk_t *mp, keysock_in_t *ksi, ipsecah_stack_t *ahstack) 1961 { 1962 ipsa_t *newbie, *target; 1963 isaf_t *outbound, *inbound; 1964 int rc, diagnostic; 1965 sadb_sa_t *assoc; 1966 keysock_out_t *kso; 1967 uint32_t newspi; 1968 1969 /* 1970 * Randomly generate a proposed SPI value. 1971 */ 1972 if (cl_inet_getspi != NULL) { 1973 cl_inet_getspi(ahstack->ipsecah_netstack->netstack_stackid, 1974 IPPROTO_AH, (uint8_t *)&newspi, sizeof (uint32_t), NULL); 1975 } else { 1976 (void) random_get_pseudo_bytes((uint8_t *)&newspi, 1977 sizeof (uint32_t)); 1978 } 1979 newbie = sadb_getspi(ksi, newspi, &diagnostic, 1980 ahstack->ipsecah_netstack, IPPROTO_AH); 1981 1982 if (newbie == NULL) { 1983 sadb_pfkey_error(ahstack->ah_pfkey_q, mp, ENOMEM, diagnostic, 1984 ksi->ks_in_serial); 1985 return; 1986 } else if (newbie == (ipsa_t *)-1) { 1987 sadb_pfkey_error(ahstack->ah_pfkey_q, mp, EINVAL, diagnostic, 1988 ksi->ks_in_serial); 1989 return; 1990 } 1991 1992 /* 1993 * XXX - We may randomly collide. We really should recover from this. 1994 * Unfortunately, that could require spending way-too-much-time 1995 * in here. For now, let the user retry. 1996 */ 1997 1998 if (newbie->ipsa_addrfam == AF_INET6) { 1999 outbound = OUTBOUND_BUCKET_V6(&ahstack->ah_sadb.s_v6, 2000 *(uint32_t *)(newbie->ipsa_dstaddr)); 2001 inbound = INBOUND_BUCKET(&ahstack->ah_sadb.s_v6, 2002 newbie->ipsa_spi); 2003 } else { 2004 outbound = OUTBOUND_BUCKET_V4(&ahstack->ah_sadb.s_v4, 2005 *(uint32_t *)(newbie->ipsa_dstaddr)); 2006 inbound = INBOUND_BUCKET(&ahstack->ah_sadb.s_v4, 2007 newbie->ipsa_spi); 2008 } 2009 2010 mutex_enter(&outbound->isaf_lock); 2011 mutex_enter(&inbound->isaf_lock); 2012 2013 /* 2014 * Check for collisions (i.e. did sadb_getspi() return with something 2015 * that already exists?). 2016 * 2017 * Try outbound first. Even though SADB_GETSPI is traditionally 2018 * for inbound SAs, you never know what a user might do. 2019 */ 2020 target = ipsec_getassocbyspi(outbound, newbie->ipsa_spi, 2021 newbie->ipsa_srcaddr, newbie->ipsa_dstaddr, newbie->ipsa_addrfam); 2022 if (target == NULL) { 2023 target = ipsec_getassocbyspi(inbound, newbie->ipsa_spi, 2024 newbie->ipsa_srcaddr, newbie->ipsa_dstaddr, 2025 newbie->ipsa_addrfam); 2026 } 2027 2028 /* 2029 * I don't have collisions elsewhere! 2030 * (Nor will I because I'm still holding inbound/outbound locks.) 2031 */ 2032 2033 if (target != NULL) { 2034 rc = EEXIST; 2035 IPSA_REFRELE(target); 2036 } else { 2037 /* 2038 * sadb_insertassoc() also checks for collisions, so 2039 * if there's a colliding larval entry, rc will be set 2040 * to EEXIST. 2041 */ 2042 rc = sadb_insertassoc(newbie, inbound); 2043 newbie->ipsa_hardexpiretime = gethrestime_sec(); 2044 newbie->ipsa_hardexpiretime += ahstack->ipsecah_larval_timeout; 2045 } 2046 2047 /* 2048 * Can exit outbound mutex. Hold inbound until we're done with 2049 * newbie. 2050 */ 2051 mutex_exit(&outbound->isaf_lock); 2052 2053 if (rc != 0) { 2054 mutex_exit(&inbound->isaf_lock); 2055 IPSA_REFRELE(newbie); 2056 sadb_pfkey_error(ahstack->ah_pfkey_q, mp, rc, 2057 SADB_X_DIAGNOSTIC_NONE, ksi->ks_in_serial); 2058 return; 2059 } 2060 2061 /* Can write here because I'm still holding the bucket lock. */ 2062 newbie->ipsa_type = SADB_SATYPE_AH; 2063 2064 /* 2065 * Construct successful return message. We have one thing going 2066 * for us in PF_KEY v2. That's the fact that 2067 * sizeof (sadb_spirange_t) == sizeof (sadb_sa_t) 2068 */ 2069 assoc = (sadb_sa_t *)ksi->ks_in_extv[SADB_EXT_SPIRANGE]; 2070 assoc->sadb_sa_exttype = SADB_EXT_SA; 2071 assoc->sadb_sa_spi = newbie->ipsa_spi; 2072 *((uint64_t *)(&assoc->sadb_sa_replay)) = 0; 2073 mutex_exit(&inbound->isaf_lock); 2074 2075 /* Convert KEYSOCK_IN to KEYSOCK_OUT. */ 2076 kso = (keysock_out_t *)ksi; 2077 kso->ks_out_len = sizeof (*kso); 2078 kso->ks_out_serial = ksi->ks_in_serial; 2079 kso->ks_out_type = KEYSOCK_OUT; 2080 2081 /* 2082 * Can safely putnext() to ah_pfkey_q, because this is a turnaround 2083 * from the ah_pfkey_q. 2084 */ 2085 putnext(ahstack->ah_pfkey_q, mp); 2086 } 2087 2088 /* 2089 * IPv6 sends up the ICMP errors for validation and the removal of the AH 2090 * header. 2091 */ 2092 static ipsec_status_t 2093 ah_icmp_error_v6(mblk_t *ipsec_mp, ipsecah_stack_t *ahstack) 2094 { 2095 mblk_t *mp; 2096 ip6_t *ip6h, *oip6h; 2097 uint16_t hdr_length, ah_length; 2098 uint8_t *nexthdrp; 2099 ah_t *ah; 2100 icmp6_t *icmp6; 2101 isaf_t *isaf; 2102 ipsa_t *assoc; 2103 uint8_t *post_ah_ptr; 2104 ipsec_stack_t *ipss = ahstack->ipsecah_netstack->netstack_ipsec; 2105 2106 mp = ipsec_mp->b_cont; 2107 ASSERT(mp->b_datap->db_type == M_CTL); 2108 2109 /* 2110 * Change the type to M_DATA till we finish pullups. 2111 */ 2112 mp->b_datap->db_type = M_DATA; 2113 2114 /* 2115 * Eat the cost of a pullupmsg() for now. It makes the rest of this 2116 * code far less convoluted. 2117 */ 2118 if (!pullupmsg(mp, -1) || 2119 !ip_hdr_length_nexthdr_v6(mp, (ip6_t *)mp->b_rptr, &hdr_length, 2120 &nexthdrp) || 2121 mp->b_rptr + hdr_length + sizeof (icmp6_t) + sizeof (ip6_t) + 2122 sizeof (ah_t) > mp->b_wptr) { 2123 IP_AH_BUMP_STAT(ipss, in_discards); 2124 ip_drop_packet(ipsec_mp, B_TRUE, NULL, NULL, 2125 DROPPER(ipss, ipds_ah_nomem), 2126 &ahstack->ah_dropper); 2127 return (IPSEC_STATUS_FAILED); 2128 } 2129 2130 oip6h = (ip6_t *)mp->b_rptr; 2131 icmp6 = (icmp6_t *)((uint8_t *)oip6h + hdr_length); 2132 ip6h = (ip6_t *)(icmp6 + 1); 2133 if (!ip_hdr_length_nexthdr_v6(mp, ip6h, &hdr_length, &nexthdrp)) { 2134 IP_AH_BUMP_STAT(ipss, in_discards); 2135 ip_drop_packet(ipsec_mp, B_TRUE, NULL, NULL, 2136 DROPPER(ipss, ipds_ah_bad_v6_hdrs), 2137 &ahstack->ah_dropper); 2138 return (IPSEC_STATUS_FAILED); 2139 } 2140 ah = (ah_t *)((uint8_t *)ip6h + hdr_length); 2141 2142 isaf = OUTBOUND_BUCKET_V6(&ahstack->ah_sadb.s_v6, ip6h->ip6_dst); 2143 mutex_enter(&isaf->isaf_lock); 2144 assoc = ipsec_getassocbyspi(isaf, ah->ah_spi, 2145 (uint32_t *)&ip6h->ip6_src, (uint32_t *)&ip6h->ip6_dst, AF_INET6); 2146 mutex_exit(&isaf->isaf_lock); 2147 2148 if (assoc == NULL) { 2149 IP_AH_BUMP_STAT(ipss, lookup_failure); 2150 IP_AH_BUMP_STAT(ipss, in_discards); 2151 if (ahstack->ipsecah_log_unknown_spi) { 2152 ipsec_assocfailure(info.mi_idnum, 0, 0, 2153 SL_CONSOLE | SL_WARN | SL_ERROR, 2154 "Bad ICMP message - No association for the " 2155 "attached AH header whose spi is 0x%x, " 2156 "sender is 0x%x\n", 2157 ah->ah_spi, &oip6h->ip6_src, AF_INET6, 2158 ahstack->ipsecah_netstack); 2159 } 2160 ip_drop_packet(ipsec_mp, B_TRUE, NULL, NULL, 2161 DROPPER(ipss, ipds_ah_no_sa), 2162 &ahstack->ah_dropper); 2163 return (IPSEC_STATUS_FAILED); 2164 } 2165 2166 IPSA_REFRELE(assoc); 2167 2168 /* 2169 * There seems to be a valid association. If there is enough of AH 2170 * header remove it, otherwise bail. One could check whether it has 2171 * complete AH header plus 8 bytes but it does not make sense if an 2172 * icmp error is returned for ICMP messages e.g ICMP time exceeded, 2173 * that are being sent up. Let the caller figure out. 2174 * 2175 * NOTE: ah_length is the number of 32 bit words minus 2. 2176 */ 2177 ah_length = (ah->ah_length << 2) + 8; 2178 post_ah_ptr = (uint8_t *)ah + ah_length; 2179 2180 if (post_ah_ptr > mp->b_wptr) { 2181 IP_AH_BUMP_STAT(ipss, in_discards); 2182 ip_drop_packet(ipsec_mp, B_TRUE, NULL, NULL, 2183 DROPPER(ipss, ipds_ah_bad_length), 2184 &ahstack->ah_dropper); 2185 return (IPSEC_STATUS_FAILED); 2186 } 2187 2188 ip6h->ip6_plen = htons(ntohs(ip6h->ip6_plen) - ah_length); 2189 *nexthdrp = ah->ah_nexthdr; 2190 ovbcopy(post_ah_ptr, ah, 2191 (size_t)((uintptr_t)mp->b_wptr - (uintptr_t)post_ah_ptr)); 2192 mp->b_wptr -= ah_length; 2193 /* Rewhack to be an ICMP error. */ 2194 mp->b_datap->db_type = M_CTL; 2195 2196 return (IPSEC_STATUS_SUCCESS); 2197 } 2198 2199 /* 2200 * IP sends up the ICMP errors for validation and the removal of 2201 * the AH header. 2202 */ 2203 static ipsec_status_t 2204 ah_icmp_error_v4(mblk_t *ipsec_mp, ipsecah_stack_t *ahstack) 2205 { 2206 mblk_t *mp; 2207 mblk_t *mp1; 2208 icmph_t *icmph; 2209 int iph_hdr_length; 2210 int hdr_length; 2211 isaf_t *hptr; 2212 ipsa_t *assoc; 2213 int ah_length; 2214 ipha_t *ipha; 2215 ipha_t *oipha; 2216 ah_t *ah; 2217 uint32_t length; 2218 int alloc_size; 2219 uint8_t nexthdr; 2220 ipsec_stack_t *ipss = ahstack->ipsecah_netstack->netstack_ipsec; 2221 2222 mp = ipsec_mp->b_cont; 2223 ASSERT(mp->b_datap->db_type == M_CTL); 2224 2225 /* 2226 * Change the type to M_DATA till we finish pullups. 2227 */ 2228 mp->b_datap->db_type = M_DATA; 2229 2230 oipha = ipha = (ipha_t *)mp->b_rptr; 2231 iph_hdr_length = IPH_HDR_LENGTH(ipha); 2232 icmph = (icmph_t *)&mp->b_rptr[iph_hdr_length]; 2233 2234 ipha = (ipha_t *)&icmph[1]; 2235 hdr_length = IPH_HDR_LENGTH(ipha); 2236 2237 /* 2238 * See if we have enough to locate the SPI 2239 */ 2240 if ((uchar_t *)ipha + hdr_length + 8 > mp->b_wptr) { 2241 if (!pullupmsg(mp, (uchar_t *)ipha + hdr_length + 8 - 2242 mp->b_rptr)) { 2243 ipsec_rl_strlog(ahstack->ipsecah_netstack, 2244 info.mi_idnum, 0, 0, 2245 SL_WARN | SL_ERROR, 2246 "ICMP error: Small AH header\n"); 2247 IP_AH_BUMP_STAT(ipss, in_discards); 2248 ip_drop_packet(ipsec_mp, B_TRUE, NULL, NULL, 2249 DROPPER(ipss, ipds_ah_bad_length), 2250 &ahstack->ah_dropper); 2251 return (IPSEC_STATUS_FAILED); 2252 } 2253 icmph = (icmph_t *)&mp->b_rptr[iph_hdr_length]; 2254 ipha = (ipha_t *)&icmph[1]; 2255 } 2256 2257 ah = (ah_t *)((uint8_t *)ipha + hdr_length); 2258 nexthdr = ah->ah_nexthdr; 2259 2260 hptr = OUTBOUND_BUCKET_V4(&ahstack->ah_sadb.s_v4, ipha->ipha_dst); 2261 mutex_enter(&hptr->isaf_lock); 2262 assoc = ipsec_getassocbyspi(hptr, ah->ah_spi, 2263 (uint32_t *)&ipha->ipha_src, (uint32_t *)&ipha->ipha_dst, AF_INET); 2264 mutex_exit(&hptr->isaf_lock); 2265 2266 if (assoc == NULL) { 2267 IP_AH_BUMP_STAT(ipss, lookup_failure); 2268 IP_AH_BUMP_STAT(ipss, in_discards); 2269 if (ahstack->ipsecah_log_unknown_spi) { 2270 ipsec_assocfailure(info.mi_idnum, 0, 0, 2271 SL_CONSOLE | SL_WARN | SL_ERROR, 2272 "Bad ICMP message - No association for the " 2273 "attached AH header whose spi is 0x%x, " 2274 "sender is 0x%x\n", 2275 ah->ah_spi, &oipha->ipha_src, AF_INET, 2276 ahstack->ipsecah_netstack); 2277 } 2278 ip_drop_packet(ipsec_mp, B_TRUE, NULL, NULL, 2279 DROPPER(ipss, ipds_ah_no_sa), 2280 &ahstack->ah_dropper); 2281 return (IPSEC_STATUS_FAILED); 2282 } 2283 2284 IPSA_REFRELE(assoc); 2285 /* 2286 * There seems to be a valid association. If there 2287 * is enough of AH header remove it, otherwise remove 2288 * as much as possible and send it back. One could check 2289 * whether it has complete AH header plus 8 bytes but it 2290 * does not make sense if an icmp error is returned for 2291 * ICMP messages e.g ICMP time exceeded, that are being 2292 * sent up. Let the caller figure out. 2293 * 2294 * NOTE: ah_length is the number of 32 bit words minus 2. 2295 */ 2296 ah_length = (ah->ah_length << 2) + 8; 2297 2298 if ((uchar_t *)ipha + hdr_length + ah_length > mp->b_wptr) { 2299 if (mp->b_cont == NULL) { 2300 /* 2301 * There is nothing to pullup. Just remove as 2302 * much as possible. This is a common case for 2303 * IPV4. 2304 */ 2305 ah_length = (mp->b_wptr - ((uchar_t *)ipha + 2306 hdr_length)); 2307 goto done; 2308 } 2309 /* Pullup the full ah header */ 2310 if (!pullupmsg(mp, (uchar_t *)ah + ah_length - mp->b_rptr)) { 2311 /* 2312 * pullupmsg could have failed if there was not 2313 * enough to pullup or memory allocation failed. 2314 * We tried hard, give up now. 2315 */ 2316 IP_AH_BUMP_STAT(ipss, in_discards); 2317 ip_drop_packet(ipsec_mp, B_TRUE, NULL, NULL, 2318 DROPPER(ipss, ipds_ah_nomem), 2319 &ahstack->ah_dropper); 2320 return (IPSEC_STATUS_FAILED); 2321 } 2322 icmph = (icmph_t *)&mp->b_rptr[iph_hdr_length]; 2323 ipha = (ipha_t *)&icmph[1]; 2324 } 2325 done: 2326 /* 2327 * Remove the AH header and change the protocol. 2328 * Don't update the spi fields in the ipsec_in 2329 * message as we are called just to validate the 2330 * message attached to the ICMP message. 2331 * 2332 * If we never pulled up since all of the message 2333 * is in one single mblk, we can't remove the AH header 2334 * by just setting the b_wptr to the beginning of the 2335 * AH header. We need to allocate a mblk that can hold 2336 * up until the inner IP header and copy them. 2337 */ 2338 alloc_size = iph_hdr_length + sizeof (icmph_t) + hdr_length; 2339 2340 if ((mp1 = allocb(alloc_size, BPRI_LO)) == NULL) { 2341 IP_AH_BUMP_STAT(ipss, in_discards); 2342 ip_drop_packet(ipsec_mp, B_TRUE, NULL, NULL, 2343 DROPPER(ipss, ipds_ah_nomem), 2344 &ahstack->ah_dropper); 2345 return (IPSEC_STATUS_FAILED); 2346 } 2347 /* ICMP errors are M_CTL messages */ 2348 mp1->b_datap->db_type = M_CTL; 2349 ipsec_mp->b_cont = mp1; 2350 bcopy(mp->b_rptr, mp1->b_rptr, alloc_size); 2351 mp1->b_wptr += alloc_size; 2352 2353 /* 2354 * Skip whatever we have copied and as much of AH header 2355 * possible. If we still have something left in the original 2356 * message, tag on. 2357 */ 2358 mp->b_rptr = (uchar_t *)ipha + hdr_length + ah_length; 2359 2360 if (mp->b_rptr != mp->b_wptr) { 2361 mp1->b_cont = mp; 2362 } else { 2363 if (mp->b_cont != NULL) 2364 mp1->b_cont = mp->b_cont; 2365 freeb(mp); 2366 } 2367 2368 ipha = (ipha_t *)(mp1->b_rptr + iph_hdr_length + sizeof (icmph_t)); 2369 ipha->ipha_protocol = nexthdr; 2370 length = ntohs(ipha->ipha_length); 2371 length -= ah_length; 2372 ipha->ipha_length = htons((uint16_t)length); 2373 ipha->ipha_hdr_checksum = 0; 2374 ipha->ipha_hdr_checksum = (uint16_t)ip_csum_hdr(ipha); 2375 2376 return (IPSEC_STATUS_SUCCESS); 2377 } 2378 2379 /* 2380 * IP calls this to validate the ICMP errors that 2381 * we got from the network. 2382 */ 2383 ipsec_status_t 2384 ipsecah_icmp_error(mblk_t *mp) 2385 { 2386 ipsec_in_t *ii = (ipsec_in_t *)mp->b_rptr; 2387 netstack_t *ns = ii->ipsec_in_ns; 2388 ipsecah_stack_t *ahstack = ns->netstack_ipsecah; 2389 2390 if (ii->ipsec_in_v4) 2391 return (ah_icmp_error_v4(mp, ahstack)); 2392 else 2393 return (ah_icmp_error_v6(mp, ahstack)); 2394 } 2395 2396 static int 2397 ah_fix_tlv_options_v6(uint8_t *oi_opt, uint8_t *pi_opt, uint_t ehdrlen, 2398 uint8_t hdr_type, boolean_t copy_always) 2399 { 2400 uint8_t opt_type; 2401 uint_t optlen; 2402 2403 ASSERT(hdr_type == IPPROTO_DSTOPTS || hdr_type == IPPROTO_HOPOPTS); 2404 2405 /* 2406 * Copy the next header and hdr ext. len of the HOP-by-HOP 2407 * and Destination option. 2408 */ 2409 *pi_opt++ = *oi_opt++; 2410 *pi_opt++ = *oi_opt++; 2411 ehdrlen -= 2; 2412 2413 /* 2414 * Now handle all the TLV encoded options. 2415 */ 2416 while (ehdrlen != 0) { 2417 opt_type = *oi_opt; 2418 2419 if (opt_type == IP6OPT_PAD1) { 2420 optlen = 1; 2421 } else { 2422 if (ehdrlen < 2) 2423 goto bad_opt; 2424 optlen = 2 + oi_opt[1]; 2425 if (optlen > ehdrlen) 2426 goto bad_opt; 2427 } 2428 if (copy_always || !(opt_type & IP6OPT_MUTABLE)) { 2429 bcopy(oi_opt, pi_opt, optlen); 2430 } else { 2431 if (optlen == 1) { 2432 *pi_opt = 0; 2433 } else { 2434 /* 2435 * Copy the type and data length fields. 2436 * Zero the option data by skipping 2437 * option type and option data len 2438 * fields. 2439 */ 2440 *pi_opt = *oi_opt; 2441 *(pi_opt + 1) = *(oi_opt + 1); 2442 bzero(pi_opt + 2, optlen - 2); 2443 } 2444 } 2445 ehdrlen -= optlen; 2446 oi_opt += optlen; 2447 pi_opt += optlen; 2448 } 2449 return (0); 2450 bad_opt: 2451 return (-1); 2452 } 2453 2454 /* 2455 * Construct a pseudo header for AH, processing all the options. 2456 * 2457 * oip6h is the IPv6 header of the incoming or outgoing packet. 2458 * ip6h is the pointer to the pseudo headers IPV6 header. All 2459 * the space needed for the options have been allocated including 2460 * the AH header. 2461 * 2462 * If copy_always is set, all the options that appear before AH are copied 2463 * blindly without checking for IP6OPT_MUTABLE. This is used by 2464 * ah_auth_out_done(). Please refer to that function for details. 2465 * 2466 * NOTE : 2467 * 2468 * * AH header is never copied in this function even if copy_always 2469 * is set. It just returns the ah_offset - offset of the AH header 2470 * and the caller needs to do the copying. This is done so that we 2471 * don't have pass extra arguments e.g. SA etc. and also, 2472 * it is not needed when ah_auth_out_done is calling this function. 2473 */ 2474 static uint_t 2475 ah_fix_phdr_v6(ip6_t *ip6h, ip6_t *oip6h, boolean_t outbound, 2476 boolean_t copy_always) 2477 { 2478 uint8_t *oi_opt; 2479 uint8_t *pi_opt; 2480 uint8_t nexthdr; 2481 uint8_t *prev_nexthdr; 2482 ip6_hbh_t *hbhhdr; 2483 ip6_dest_t *dsthdr = NULL; 2484 ip6_rthdr0_t *rthdr; 2485 int ehdrlen; 2486 ah_t *ah; 2487 int ret; 2488 2489 /* 2490 * In the outbound case for source route, ULP has already moved 2491 * the first hop, which is now in ip6_dst. We need to re-arrange 2492 * the header to make it look like how it would appear in the 2493 * receiver i.e 2494 * 2495 * Because of ip_massage_options_v6 the header looks like 2496 * this : 2497 * 2498 * ip6_src = S, ip6_dst = I1. followed by I2,I3,D. 2499 * 2500 * When it reaches the receiver, it would look like 2501 * 2502 * ip6_src = S, ip6_dst = D. followed by I1,I2,I3. 2503 * 2504 * NOTE : We assume that there are no problems with the options 2505 * as IP should have already checked this. 2506 */ 2507 2508 oi_opt = (uchar_t *)&oip6h[1]; 2509 pi_opt = (uchar_t *)&ip6h[1]; 2510 2511 /* 2512 * We set the prev_nexthdr properly in the pseudo header. 2513 * After we finish authentication and come back from the 2514 * algorithm module, pseudo header will become the real 2515 * IP header. 2516 */ 2517 prev_nexthdr = (uint8_t *)&ip6h->ip6_nxt; 2518 nexthdr = oip6h->ip6_nxt; 2519 /* Assume IP has already stripped it */ 2520 ASSERT(nexthdr != IPPROTO_FRAGMENT && nexthdr != IPPROTO_RAW); 2521 ah = NULL; 2522 dsthdr = NULL; 2523 for (;;) { 2524 switch (nexthdr) { 2525 case IPPROTO_HOPOPTS: 2526 hbhhdr = (ip6_hbh_t *)oi_opt; 2527 nexthdr = hbhhdr->ip6h_nxt; 2528 ehdrlen = 8 * (hbhhdr->ip6h_len + 1); 2529 ret = ah_fix_tlv_options_v6(oi_opt, pi_opt, ehdrlen, 2530 IPPROTO_HOPOPTS, copy_always); 2531 /* 2532 * Return a zero offset indicating error if there 2533 * was error. 2534 */ 2535 if (ret == -1) 2536 return (0); 2537 hbhhdr = (ip6_hbh_t *)pi_opt; 2538 prev_nexthdr = (uint8_t *)&hbhhdr->ip6h_nxt; 2539 break; 2540 case IPPROTO_ROUTING: 2541 rthdr = (ip6_rthdr0_t *)oi_opt; 2542 nexthdr = rthdr->ip6r0_nxt; 2543 ehdrlen = 8 * (rthdr->ip6r0_len + 1); 2544 if (!copy_always && outbound) { 2545 int i, left; 2546 ip6_rthdr0_t *prthdr; 2547 in6_addr_t *ap, *pap; 2548 2549 left = rthdr->ip6r0_segleft; 2550 prthdr = (ip6_rthdr0_t *)pi_opt; 2551 pap = (in6_addr_t *)(prthdr + 1); 2552 ap = (in6_addr_t *)(rthdr + 1); 2553 /* 2554 * First eight bytes except seg_left 2555 * does not change en route. 2556 */ 2557 bcopy(oi_opt, pi_opt, 8); 2558 prthdr->ip6r0_segleft = 0; 2559 /* 2560 * First address has been moved to 2561 * the destination address of the 2562 * ip header by ip_massage_options_v6. 2563 * And the real destination address is 2564 * in the last address part of the 2565 * option. 2566 */ 2567 *pap = oip6h->ip6_dst; 2568 for (i = 1; i < left - 1; i++) 2569 pap[i] = ap[i - 1]; 2570 ip6h->ip6_dst = *(ap + left - 1); 2571 } else { 2572 bcopy(oi_opt, pi_opt, ehdrlen); 2573 } 2574 rthdr = (ip6_rthdr0_t *)pi_opt; 2575 prev_nexthdr = (uint8_t *)&rthdr->ip6r0_nxt; 2576 break; 2577 case IPPROTO_DSTOPTS: 2578 /* 2579 * Destination options are tricky. If there is 2580 * a terminal (e.g. non-IPv6-extension) header 2581 * following the destination options, don't 2582 * reset prev_nexthdr or advance the AH insertion 2583 * point and just treat this as a terminal header. 2584 * 2585 * If this is an inbound packet, just deal with 2586 * it as is. 2587 */ 2588 dsthdr = (ip6_dest_t *)oi_opt; 2589 /* 2590 * XXX I hope common-subexpression elimination 2591 * saves us the double-evaluate. 2592 */ 2593 if (outbound && dsthdr->ip6d_nxt != IPPROTO_ROUTING && 2594 dsthdr->ip6d_nxt != IPPROTO_HOPOPTS) 2595 goto terminal_hdr; 2596 nexthdr = dsthdr->ip6d_nxt; 2597 ehdrlen = 8 * (dsthdr->ip6d_len + 1); 2598 ret = ah_fix_tlv_options_v6(oi_opt, pi_opt, ehdrlen, 2599 IPPROTO_DSTOPTS, copy_always); 2600 /* 2601 * Return a zero offset indicating error if there 2602 * was error. 2603 */ 2604 if (ret == -1) 2605 return (0); 2606 break; 2607 case IPPROTO_AH: 2608 /* 2609 * Be conservative in what you send. We shouldn't 2610 * see two same-scoped AH's in one packet. 2611 * (Inner-IP-scoped AH will be hit by terminal 2612 * header of IP or IPv6.) 2613 */ 2614 ASSERT(!outbound); 2615 return ((uint_t)(pi_opt - (uint8_t *)ip6h)); 2616 default: 2617 ASSERT(outbound); 2618 terminal_hdr: 2619 *prev_nexthdr = IPPROTO_AH; 2620 ah = (ah_t *)pi_opt; 2621 ah->ah_nexthdr = nexthdr; 2622 return ((uint_t)(pi_opt - (uint8_t *)ip6h)); 2623 } 2624 pi_opt += ehdrlen; 2625 oi_opt += ehdrlen; 2626 } 2627 /* NOTREACHED */ 2628 } 2629 2630 static boolean_t 2631 ah_finish_up(ah_t *phdr_ah, ah_t *inbound_ah, ipsa_t *assoc, 2632 int ah_data_sz, int ah_align_sz, ipsecah_stack_t *ahstack) 2633 { 2634 int i; 2635 2636 /* 2637 * Padding : 2638 * 2639 * 1) Authentication data may have to be padded 2640 * before ICV calculation if ICV is not a multiple 2641 * of 64 bits. This padding is arbitrary and transmitted 2642 * with the packet at the end of the authentication data. 2643 * Payload length should include the padding bytes. 2644 * 2645 * 2) Explicit padding of the whole datagram may be 2646 * required by the algorithm which need not be 2647 * transmitted. It is assumed that this will be taken 2648 * care by the algorithm module. 2649 */ 2650 bzero(phdr_ah + 1, ah_data_sz); /* Zero out ICV for pseudo-hdr. */ 2651 2652 if (inbound_ah == NULL) { 2653 /* Outbound AH datagram. */ 2654 2655 phdr_ah->ah_length = (ah_align_sz >> 2) + 1; 2656 phdr_ah->ah_reserved = 0; 2657 phdr_ah->ah_spi = assoc->ipsa_spi; 2658 2659 phdr_ah->ah_replay = 2660 htonl(atomic_add_32_nv(&assoc->ipsa_replay, 1)); 2661 if (phdr_ah->ah_replay == 0 && assoc->ipsa_replay_wsize != 0) { 2662 /* 2663 * XXX We have replay counter wrapping. We probably 2664 * want to nuke this SA (and its peer). 2665 */ 2666 ipsec_assocfailure(info.mi_idnum, 0, 0, 2667 SL_ERROR | SL_CONSOLE | SL_WARN, 2668 "Outbound AH SA (0x%x), dst %s has wrapped " 2669 "sequence.\n", phdr_ah->ah_spi, 2670 assoc->ipsa_dstaddr, assoc->ipsa_addrfam, 2671 ahstack->ipsecah_netstack); 2672 2673 sadb_replay_delete(assoc); 2674 /* Caller will free phdr_mp and return NULL. */ 2675 return (B_FALSE); 2676 } 2677 2678 if (ah_data_sz != ah_align_sz) { 2679 uchar_t *pad = ((uchar_t *)phdr_ah + sizeof (ah_t) + 2680 ah_data_sz); 2681 2682 for (i = 0; i < (ah_align_sz - ah_data_sz); i++) { 2683 pad[i] = (uchar_t)i; /* Fill the padding */ 2684 } 2685 } 2686 } else { 2687 /* Inbound AH datagram. */ 2688 phdr_ah->ah_nexthdr = inbound_ah->ah_nexthdr; 2689 phdr_ah->ah_length = inbound_ah->ah_length; 2690 phdr_ah->ah_reserved = 0; 2691 ASSERT(inbound_ah->ah_spi == assoc->ipsa_spi); 2692 phdr_ah->ah_spi = inbound_ah->ah_spi; 2693 phdr_ah->ah_replay = inbound_ah->ah_replay; 2694 2695 if (ah_data_sz != ah_align_sz) { 2696 uchar_t *opad = ((uchar_t *)inbound_ah + 2697 sizeof (ah_t) + ah_data_sz); 2698 uchar_t *pad = ((uchar_t *)phdr_ah + sizeof (ah_t) + 2699 ah_data_sz); 2700 2701 for (i = 0; i < (ah_align_sz - ah_data_sz); i++) { 2702 pad[i] = opad[i]; /* Copy the padding */ 2703 } 2704 } 2705 } 2706 2707 return (B_TRUE); 2708 } 2709 2710 /* 2711 * Called upon failing the inbound ICV check. The message passed as 2712 * argument is freed. 2713 */ 2714 static void 2715 ah_log_bad_auth(mblk_t *ipsec_in) 2716 { 2717 mblk_t *mp = ipsec_in->b_cont->b_cont; 2718 ipsec_in_t *ii = (ipsec_in_t *)ipsec_in->b_rptr; 2719 boolean_t isv4 = ii->ipsec_in_v4; 2720 ipsa_t *assoc = ii->ipsec_in_ah_sa; 2721 int af; 2722 void *addr; 2723 netstack_t *ns = ii->ipsec_in_ns; 2724 ipsecah_stack_t *ahstack = ns->netstack_ipsecah; 2725 ipsec_stack_t *ipss = ns->netstack_ipsec; 2726 2727 mp->b_rptr -= ii->ipsec_in_skip_len; 2728 2729 if (isv4) { 2730 ipha_t *ipha = (ipha_t *)mp->b_rptr; 2731 addr = &ipha->ipha_dst; 2732 af = AF_INET; 2733 } else { 2734 ip6_t *ip6h = (ip6_t *)mp->b_rptr; 2735 addr = &ip6h->ip6_dst; 2736 af = AF_INET6; 2737 } 2738 2739 /* 2740 * Log the event. Don't print to the console, block 2741 * potential denial-of-service attack. 2742 */ 2743 AH_BUMP_STAT(ahstack, bad_auth); 2744 2745 ipsec_assocfailure(info.mi_idnum, 0, 0, SL_ERROR | SL_WARN, 2746 "AH Authentication failed spi %x, dst_addr %s", 2747 assoc->ipsa_spi, addr, af, ahstack->ipsecah_netstack); 2748 2749 IP_AH_BUMP_STAT(ipss, in_discards); 2750 ip_drop_packet(ipsec_in, B_TRUE, NULL, NULL, 2751 DROPPER(ipss, ipds_ah_bad_auth), 2752 &ahstack->ah_dropper); 2753 } 2754 2755 /* 2756 * Kernel crypto framework callback invoked after completion of async 2757 * crypto requests. 2758 */ 2759 static void 2760 ah_kcf_callback(void *arg, int status) 2761 { 2762 mblk_t *ipsec_mp = (mblk_t *)arg; 2763 ipsec_in_t *ii = (ipsec_in_t *)ipsec_mp->b_rptr; 2764 boolean_t is_inbound = (ii->ipsec_in_type == IPSEC_IN); 2765 netstackid_t stackid; 2766 netstack_t *ns, *ns_arg; 2767 ipsec_stack_t *ipss; 2768 ipsecah_stack_t *ahstack; 2769 ipsec_out_t *io = (ipsec_out_t *)ii; 2770 2771 ASSERT(ipsec_mp->b_cont != NULL); 2772 2773 if (is_inbound) { 2774 stackid = ii->ipsec_in_stackid; 2775 ns_arg = ii->ipsec_in_ns; 2776 } else { 2777 stackid = io->ipsec_out_stackid; 2778 ns_arg = io->ipsec_out_ns; 2779 } 2780 /* 2781 * Verify that the netstack is still around; could have vanished 2782 * while kEf was doing its work. 2783 */ 2784 ns = netstack_find_by_stackid(stackid); 2785 if (ns == NULL || ns != ns_arg) { 2786 /* Disappeared on us */ 2787 if (ns != NULL) 2788 netstack_rele(ns); 2789 freemsg(ipsec_mp); 2790 return; 2791 } 2792 2793 ahstack = ns->netstack_ipsecah; 2794 ipss = ns->netstack_ipsec; 2795 2796 if (status == CRYPTO_SUCCESS) { 2797 if (is_inbound) { 2798 if (ah_auth_in_done(ipsec_mp) != IPSEC_STATUS_SUCCESS) { 2799 netstack_rele(ns); 2800 return; 2801 } 2802 /* finish IPsec processing */ 2803 ip_fanout_proto_again(ipsec_mp, NULL, NULL, NULL); 2804 } else { 2805 ipha_t *ipha; 2806 2807 if (ah_auth_out_done(ipsec_mp) != 2808 IPSEC_STATUS_SUCCESS) { 2809 netstack_rele(ns); 2810 return; 2811 } 2812 2813 /* finish IPsec processing */ 2814 ipha = (ipha_t *)ipsec_mp->b_cont->b_rptr; 2815 if (IPH_HDR_VERSION(ipha) == IP_VERSION) { 2816 ip_wput_ipsec_out(NULL, ipsec_mp, ipha, NULL, 2817 NULL); 2818 } else { 2819 ip6_t *ip6h = (ip6_t *)ipha; 2820 ip_wput_ipsec_out_v6(NULL, ipsec_mp, ip6h, 2821 NULL, NULL); 2822 } 2823 } 2824 2825 } else if (status == CRYPTO_INVALID_MAC) { 2826 ah_log_bad_auth(ipsec_mp); 2827 } else { 2828 ah1dbg(ahstack, ("ah_kcf_callback: crypto failed with 0x%x\n", 2829 status)); 2830 AH_BUMP_STAT(ahstack, crypto_failures); 2831 if (is_inbound) 2832 IP_AH_BUMP_STAT(ipss, in_discards); 2833 else 2834 AH_BUMP_STAT(ahstack, out_discards); 2835 ip_drop_packet(ipsec_mp, is_inbound, NULL, NULL, 2836 DROPPER(ipss, ipds_ah_crypto_failed), 2837 &ahstack->ah_dropper); 2838 } 2839 netstack_rele(ns); 2840 } 2841 2842 /* 2843 * Invoked on kernel crypto failure during inbound and outbound processing. 2844 */ 2845 static void 2846 ah_crypto_failed(mblk_t *mp, boolean_t is_inbound, int kef_rc, 2847 ipsecah_stack_t *ahstack) 2848 { 2849 ipsec_stack_t *ipss = ahstack->ipsecah_netstack->netstack_ipsec; 2850 2851 ah1dbg(ahstack, ("crypto failed for %s AH with 0x%x\n", 2852 is_inbound ? "inbound" : "outbound", kef_rc)); 2853 ip_drop_packet(mp, is_inbound, NULL, NULL, 2854 DROPPER(ipss, ipds_ah_crypto_failed), 2855 &ahstack->ah_dropper); 2856 AH_BUMP_STAT(ahstack, crypto_failures); 2857 if (is_inbound) 2858 IP_AH_BUMP_STAT(ipss, in_discards); 2859 else 2860 AH_BUMP_STAT(ahstack, out_discards); 2861 } 2862 2863 /* 2864 * Helper macros for the ah_submit_req_{inbound,outbound}() functions. 2865 */ 2866 2867 #define AH_INIT_CALLREQ(_cr, _ipss) { \ 2868 (_cr)->cr_flag = CRYPTO_SKIP_REQID|CRYPTO_RESTRICTED; \ 2869 if ((_ipss)->ipsec_algs_exec_mode[IPSEC_ALG_AUTH] == \ 2870 IPSEC_ALGS_EXEC_ASYNC) \ 2871 (_cr)->cr_flag |= CRYPTO_ALWAYS_QUEUE; \ 2872 (_cr)->cr_callback_arg = ipsec_mp; \ 2873 (_cr)->cr_callback_func = ah_kcf_callback; \ 2874 } 2875 2876 #define AH_INIT_CRYPTO_DATA(data, msglen, mblk) { \ 2877 (data)->cd_format = CRYPTO_DATA_MBLK; \ 2878 (data)->cd_mp = mblk; \ 2879 (data)->cd_offset = 0; \ 2880 (data)->cd_length = msglen; \ 2881 } 2882 2883 #define AH_INIT_CRYPTO_MAC(mac, icvlen, icvbuf) { \ 2884 (mac)->cd_format = CRYPTO_DATA_RAW; \ 2885 (mac)->cd_offset = 0; \ 2886 (mac)->cd_length = icvlen; \ 2887 (mac)->cd_raw.iov_base = icvbuf; \ 2888 (mac)->cd_raw.iov_len = icvlen; \ 2889 } 2890 2891 /* 2892 * Submit an inbound packet for processing by the crypto framework. 2893 */ 2894 static ipsec_status_t 2895 ah_submit_req_inbound(mblk_t *ipsec_mp, size_t skip_len, uint32_t ah_offset, 2896 ipsa_t *assoc) 2897 { 2898 int kef_rc; 2899 mblk_t *phdr_mp; 2900 crypto_call_req_t call_req; 2901 ipsec_in_t *ii = (ipsec_in_t *)ipsec_mp->b_rptr; 2902 uint_t icv_len = assoc->ipsa_mac_len; 2903 crypto_ctx_template_t ctx_tmpl; 2904 netstack_t *ns = ii->ipsec_in_ns; 2905 ipsecah_stack_t *ahstack = ns->netstack_ipsecah; 2906 ipsec_stack_t *ipss = ns->netstack_ipsec; 2907 2908 phdr_mp = ipsec_mp->b_cont; 2909 ASSERT(phdr_mp != NULL); 2910 ASSERT(ii->ipsec_in_type == IPSEC_IN); 2911 2912 /* 2913 * In case kEF queues and calls back, make sure we have the 2914 * netstackid_t for verification that the IP instance is still around 2915 * in esp_kcf_callback(). 2916 */ 2917 ASSERT(ii->ipsec_in_stackid == ns->netstack_stackid); 2918 2919 /* init arguments for the crypto framework */ 2920 AH_INIT_CRYPTO_DATA(&ii->ipsec_in_crypto_data, AH_MSGSIZE(phdr_mp), 2921 phdr_mp); 2922 2923 AH_INIT_CRYPTO_MAC(&ii->ipsec_in_crypto_mac, icv_len, 2924 (char *)phdr_mp->b_cont->b_rptr - skip_len + ah_offset + 2925 sizeof (ah_t)); 2926 2927 AH_INIT_CALLREQ(&call_req, ipss); 2928 2929 ii->ipsec_in_skip_len = skip_len; 2930 2931 IPSEC_CTX_TMPL(assoc, ipsa_authtmpl, IPSEC_ALG_AUTH, ctx_tmpl); 2932 2933 /* call KEF to do the MAC operation */ 2934 kef_rc = crypto_mac_verify(&assoc->ipsa_amech, 2935 &ii->ipsec_in_crypto_data, &assoc->ipsa_kcfauthkey, ctx_tmpl, 2936 &ii->ipsec_in_crypto_mac, &call_req); 2937 2938 switch (kef_rc) { 2939 case CRYPTO_SUCCESS: 2940 AH_BUMP_STAT(ahstack, crypto_sync); 2941 return (ah_auth_in_done(ipsec_mp)); 2942 case CRYPTO_QUEUED: 2943 /* ah_kcf_callback() will be invoked on completion */ 2944 AH_BUMP_STAT(ahstack, crypto_async); 2945 return (IPSEC_STATUS_PENDING); 2946 case CRYPTO_INVALID_MAC: 2947 AH_BUMP_STAT(ahstack, crypto_sync); 2948 ah_log_bad_auth(ipsec_mp); 2949 return (IPSEC_STATUS_FAILED); 2950 } 2951 2952 ah_crypto_failed(ipsec_mp, B_TRUE, kef_rc, ahstack); 2953 return (IPSEC_STATUS_FAILED); 2954 } 2955 2956 /* 2957 * Submit an outbound packet for processing by the crypto framework. 2958 */ 2959 static ipsec_status_t 2960 ah_submit_req_outbound(mblk_t *ipsec_mp, size_t skip_len, ipsa_t *assoc) 2961 { 2962 int kef_rc; 2963 mblk_t *phdr_mp; 2964 crypto_call_req_t call_req; 2965 ipsec_out_t *io = (ipsec_out_t *)ipsec_mp->b_rptr; 2966 uint_t icv_len = assoc->ipsa_mac_len; 2967 netstack_t *ns = io->ipsec_out_ns; 2968 ipsecah_stack_t *ahstack = ns->netstack_ipsecah; 2969 ipsec_stack_t *ipss = ns->netstack_ipsec; 2970 2971 phdr_mp = ipsec_mp->b_cont; 2972 ASSERT(phdr_mp != NULL); 2973 ASSERT(io->ipsec_out_type == IPSEC_OUT); 2974 2975 /* 2976 * In case kEF queues and calls back, keep netstackid_t for 2977 * verification that the IP instance is still around in 2978 * ah_kcf_callback(). 2979 */ 2980 io->ipsec_out_stackid = ns->netstack_stackid; 2981 2982 /* init arguments for the crypto framework */ 2983 AH_INIT_CRYPTO_DATA(&io->ipsec_out_crypto_data, AH_MSGSIZE(phdr_mp), 2984 phdr_mp); 2985 2986 AH_INIT_CRYPTO_MAC(&io->ipsec_out_crypto_mac, icv_len, 2987 (char *)phdr_mp->b_wptr); 2988 2989 AH_INIT_CALLREQ(&call_req, ipss); 2990 2991 io->ipsec_out_skip_len = skip_len; 2992 2993 ASSERT(io->ipsec_out_ah_sa != NULL); 2994 2995 /* call KEF to do the MAC operation */ 2996 kef_rc = crypto_mac(&assoc->ipsa_amech, &io->ipsec_out_crypto_data, 2997 &assoc->ipsa_kcfauthkey, assoc->ipsa_authtmpl, 2998 &io->ipsec_out_crypto_mac, &call_req); 2999 3000 switch (kef_rc) { 3001 case CRYPTO_SUCCESS: 3002 AH_BUMP_STAT(ahstack, crypto_sync); 3003 return (ah_auth_out_done(ipsec_mp)); 3004 case CRYPTO_QUEUED: 3005 /* ah_kcf_callback() will be invoked on completion */ 3006 AH_BUMP_STAT(ahstack, crypto_async); 3007 return (IPSEC_STATUS_PENDING); 3008 } 3009 3010 ah_crypto_failed(ipsec_mp, B_FALSE, kef_rc, ahstack); 3011 return (IPSEC_STATUS_FAILED); 3012 } 3013 3014 /* 3015 * This function constructs a pseudo header by looking at the IP header 3016 * and options if any. This is called for both outbound and inbound, 3017 * before computing the ICV. 3018 */ 3019 static mblk_t * 3020 ah_process_ip_options_v6(mblk_t *mp, ipsa_t *assoc, int *length_to_skip, 3021 uint_t ah_data_sz, boolean_t outbound, ipsecah_stack_t *ahstack) 3022 { 3023 ip6_t *ip6h; 3024 ip6_t *oip6h; 3025 mblk_t *phdr_mp; 3026 int option_length; 3027 uint_t ah_align_sz; 3028 uint_t ah_offset; 3029 int hdr_size; 3030 ipsec_stack_t *ipss = ahstack->ipsecah_netstack->netstack_ipsec; 3031 3032 /* 3033 * Allocate space for the authentication data also. It is 3034 * useful both during the ICV calculation where we need to 3035 * feed in zeroes and while sending the datagram back to IP 3036 * where we will be using the same space. 3037 * 3038 * We need to allocate space for padding bytes if it is not 3039 * a multiple of IPV6_PADDING_ALIGN. 3040 * 3041 * In addition, we allocate space for the ICV computed by 3042 * the kernel crypto framework, saving us a separate kmem 3043 * allocation down the road. 3044 */ 3045 3046 ah_align_sz = P2ALIGN(ah_data_sz + IPV6_PADDING_ALIGN - 1, 3047 IPV6_PADDING_ALIGN); 3048 3049 ASSERT(ah_align_sz >= ah_data_sz); 3050 3051 hdr_size = ipsec_ah_get_hdr_size_v6(mp, B_FALSE); 3052 option_length = hdr_size - IPV6_HDR_LEN; 3053 3054 /* This was not included in ipsec_ah_get_hdr_size_v6() */ 3055 hdr_size += (sizeof (ah_t) + ah_align_sz); 3056 3057 if (!outbound && (MBLKL(mp) < hdr_size)) { 3058 /* 3059 * We have post-AH header options in a separate mblk, 3060 * a pullup is required. 3061 */ 3062 if (!pullupmsg(mp, hdr_size)) 3063 return (NULL); 3064 } 3065 3066 if ((phdr_mp = allocb_tmpl(hdr_size + ah_data_sz, mp)) == NULL) { 3067 return (NULL); 3068 } 3069 3070 oip6h = (ip6_t *)mp->b_rptr; 3071 3072 /* 3073 * Form the basic IP header first. Zero out the header 3074 * so that the mutable fields are zeroed out. 3075 */ 3076 ip6h = (ip6_t *)phdr_mp->b_rptr; 3077 bzero(ip6h, sizeof (ip6_t)); 3078 ip6h->ip6_vcf = IPV6_DEFAULT_VERS_AND_FLOW; 3079 3080 if (outbound) { 3081 /* 3082 * Include the size of AH and authentication data. 3083 * This is how our recipient would compute the 3084 * authentication data. Look at what we do in the 3085 * inbound case below. 3086 */ 3087 ip6h->ip6_plen = htons(ntohs(oip6h->ip6_plen) + 3088 sizeof (ah_t) + ah_align_sz); 3089 } else { 3090 ip6h->ip6_plen = oip6h->ip6_plen; 3091 } 3092 3093 ip6h->ip6_src = oip6h->ip6_src; 3094 ip6h->ip6_dst = oip6h->ip6_dst; 3095 3096 *length_to_skip = IPV6_HDR_LEN; 3097 if (option_length == 0) { 3098 /* Form the AH header */ 3099 ip6h->ip6_nxt = IPPROTO_AH; 3100 ((ah_t *)(ip6h + 1))->ah_nexthdr = oip6h->ip6_nxt; 3101 ah_offset = *length_to_skip; 3102 } else { 3103 ip6h->ip6_nxt = oip6h->ip6_nxt; 3104 /* option_length does not include the AH header's size */ 3105 *length_to_skip += option_length; 3106 3107 ah_offset = ah_fix_phdr_v6(ip6h, oip6h, outbound, B_FALSE); 3108 if (ah_offset == 0) { 3109 ip_drop_packet(phdr_mp, !outbound, NULL, NULL, 3110 DROPPER(ipss, ipds_ah_bad_v6_hdrs), 3111 &ahstack->ah_dropper); 3112 return (NULL); 3113 } 3114 } 3115 3116 if (!ah_finish_up(((ah_t *)((uint8_t *)ip6h + ah_offset)), 3117 (outbound ? NULL : ((ah_t *)((uint8_t *)oip6h + ah_offset))), 3118 assoc, ah_data_sz, ah_align_sz, ahstack)) { 3119 freeb(phdr_mp); 3120 /* 3121 * Returning NULL will tell the caller to 3122 * IPSA_REFELE(), free the memory, etc. 3123 */ 3124 return (NULL); 3125 } 3126 3127 phdr_mp->b_wptr = ((uint8_t *)ip6h + ah_offset + sizeof (ah_t) + 3128 ah_align_sz); 3129 if (!outbound) 3130 *length_to_skip += sizeof (ah_t) + ah_align_sz; 3131 return (phdr_mp); 3132 } 3133 3134 /* 3135 * This function constructs a pseudo header by looking at the IP header 3136 * and options if any. This is called for both outbound and inbound, 3137 * before computing the ICV. 3138 */ 3139 static mblk_t * 3140 ah_process_ip_options_v4(mblk_t *mp, ipsa_t *assoc, int *length_to_skip, 3141 uint_t ah_data_sz, boolean_t outbound, ipsecah_stack_t *ahstack) 3142 { 3143 ipoptp_t opts; 3144 uint32_t option_length; 3145 ipha_t *ipha; 3146 ipha_t *oipha; 3147 mblk_t *phdr_mp; 3148 int size; 3149 uchar_t *optptr; 3150 uint8_t optval; 3151 uint8_t optlen; 3152 ipaddr_t dst; 3153 uint32_t v_hlen_tos_len; 3154 int ip_hdr_length; 3155 uint_t ah_align_sz; 3156 uint32_t off; 3157 3158 #ifdef _BIG_ENDIAN 3159 #define V_HLEN (v_hlen_tos_len >> 24) 3160 #else 3161 #define V_HLEN (v_hlen_tos_len & 0xFF) 3162 #endif 3163 3164 oipha = (ipha_t *)mp->b_rptr; 3165 v_hlen_tos_len = ((uint32_t *)oipha)[0]; 3166 3167 /* 3168 * Allocate space for the authentication data also. It is 3169 * useful both during the ICV calculation where we need to 3170 * feed in zeroes and while sending the datagram back to IP 3171 * where we will be using the same space. 3172 * 3173 * We need to allocate space for padding bytes if it is not 3174 * a multiple of IPV4_PADDING_ALIGN. 3175 * 3176 * In addition, we allocate space for the ICV computed by 3177 * the kernel crypto framework, saving us a separate kmem 3178 * allocation down the road. 3179 */ 3180 3181 ah_align_sz = P2ALIGN(ah_data_sz + IPV4_PADDING_ALIGN - 1, 3182 IPV4_PADDING_ALIGN); 3183 3184 ASSERT(ah_align_sz >= ah_data_sz); 3185 3186 size = IP_SIMPLE_HDR_LENGTH + sizeof (ah_t) + ah_align_sz + 3187 ah_data_sz; 3188 3189 if (V_HLEN != IP_SIMPLE_HDR_VERSION) { 3190 option_length = oipha->ipha_version_and_hdr_length - 3191 (uint8_t)((IP_VERSION << 4) + 3192 IP_SIMPLE_HDR_LENGTH_IN_WORDS); 3193 option_length <<= 2; 3194 size += option_length; 3195 } 3196 3197 if ((phdr_mp = allocb_tmpl(size, mp)) == NULL) { 3198 return (NULL); 3199 } 3200 3201 /* 3202 * Form the basic IP header first. 3203 */ 3204 ipha = (ipha_t *)phdr_mp->b_rptr; 3205 ipha->ipha_version_and_hdr_length = oipha->ipha_version_and_hdr_length; 3206 ipha->ipha_type_of_service = 0; 3207 3208 if (outbound) { 3209 /* 3210 * Include the size of AH and authentication data. 3211 * This is how our recipient would compute the 3212 * authentication data. Look at what we do in the 3213 * inbound case below. 3214 */ 3215 ipha->ipha_length = ntohs(htons(oipha->ipha_length) + 3216 sizeof (ah_t) + ah_align_sz); 3217 } else { 3218 ipha->ipha_length = oipha->ipha_length; 3219 } 3220 3221 ipha->ipha_ident = oipha->ipha_ident; 3222 ipha->ipha_fragment_offset_and_flags = 0; 3223 ipha->ipha_ttl = 0; 3224 ipha->ipha_protocol = IPPROTO_AH; 3225 ipha->ipha_hdr_checksum = 0; 3226 ipha->ipha_src = oipha->ipha_src; 3227 ipha->ipha_dst = dst = oipha->ipha_dst; 3228 3229 /* 3230 * If there is no option to process return now. 3231 */ 3232 ip_hdr_length = IP_SIMPLE_HDR_LENGTH; 3233 3234 if (V_HLEN == IP_SIMPLE_HDR_VERSION) { 3235 /* Form the AH header */ 3236 goto ah_hdr; 3237 } 3238 3239 ip_hdr_length += option_length; 3240 3241 /* 3242 * We have options. In the outbound case for source route, 3243 * ULP has already moved the first hop, which is now in 3244 * ipha_dst. We need the final destination for the calculation 3245 * of authentication data. And also make sure that mutable 3246 * and experimental fields are zeroed out in the IP options. 3247 */ 3248 3249 bcopy(&oipha[1], &ipha[1], option_length); 3250 3251 for (optval = ipoptp_first(&opts, ipha); 3252 optval != IPOPT_EOL; 3253 optval = ipoptp_next(&opts)) { 3254 optptr = opts.ipoptp_cur; 3255 optlen = opts.ipoptp_len; 3256 switch (optval) { 3257 case IPOPT_EXTSEC: 3258 case IPOPT_COMSEC: 3259 case IPOPT_RA: 3260 case IPOPT_SDMDD: 3261 case IPOPT_SECURITY: 3262 /* 3263 * These options are Immutable, leave them as-is. 3264 * Note that IPOPT_NOP is also Immutable, but it 3265 * was skipped by ipoptp_next() and thus remains 3266 * intact in the header. 3267 */ 3268 break; 3269 case IPOPT_SSRR: 3270 case IPOPT_LSRR: 3271 if ((opts.ipoptp_flags & IPOPTP_ERROR) != 0) 3272 goto bad_ipv4opt; 3273 /* 3274 * These two are mutable and will be zeroed, but 3275 * first get the final destination. 3276 */ 3277 off = optptr[IPOPT_OFFSET]; 3278 /* 3279 * If one of the conditions is true, it means 3280 * end of options and dst already has the right 3281 * value. So, just fall through. 3282 */ 3283 if (!(optlen < IP_ADDR_LEN || off > optlen - 3)) { 3284 off = optlen - IP_ADDR_LEN; 3285 bcopy(&optptr[off], &dst, IP_ADDR_LEN); 3286 } 3287 /* FALLTHRU */ 3288 case IPOPT_RR: 3289 case IPOPT_TS: 3290 case IPOPT_SATID: 3291 default: 3292 /* 3293 * optlen should include from the beginning of an 3294 * option. 3295 * NOTE : Stream Identifier Option (SID): RFC 791 3296 * shows the bit pattern of optlen as 2 and documents 3297 * the length as 4. We assume it to be 2 here. 3298 */ 3299 bzero(optptr, optlen); 3300 break; 3301 } 3302 } 3303 3304 if ((opts.ipoptp_flags & IPOPTP_ERROR) != 0) { 3305 bad_ipv4opt: 3306 ah1dbg(ahstack, ("AH : bad IPv4 option")); 3307 freeb(phdr_mp); 3308 return (NULL); 3309 } 3310 3311 /* 3312 * Don't change ipha_dst for an inbound datagram as it points 3313 * to the right value. Only for the outbound with LSRR/SSRR, 3314 * because of ip_massage_options called by the ULP, ipha_dst 3315 * points to the first hop and we need to use the final 3316 * destination for computing the ICV. 3317 */ 3318 3319 if (outbound) 3320 ipha->ipha_dst = dst; 3321 ah_hdr: 3322 ((ah_t *)((uint8_t *)ipha + ip_hdr_length))->ah_nexthdr = 3323 oipha->ipha_protocol; 3324 if (!ah_finish_up(((ah_t *)((uint8_t *)ipha + ip_hdr_length)), 3325 (outbound ? NULL : ((ah_t *)((uint8_t *)oipha + ip_hdr_length))), 3326 assoc, ah_data_sz, ah_align_sz, ahstack)) { 3327 freeb(phdr_mp); 3328 /* 3329 * Returning NULL will tell the caller to IPSA_REFELE(), free 3330 * the memory, etc. 3331 */ 3332 return (NULL); 3333 } 3334 3335 phdr_mp->b_wptr = ((uchar_t *)ipha + ip_hdr_length + 3336 sizeof (ah_t) + ah_align_sz); 3337 3338 ASSERT(phdr_mp->b_wptr <= phdr_mp->b_datap->db_lim); 3339 if (outbound) 3340 *length_to_skip = ip_hdr_length; 3341 else 3342 *length_to_skip = ip_hdr_length + sizeof (ah_t) + ah_align_sz; 3343 return (phdr_mp); 3344 } 3345 3346 /* 3347 * Authenticate an outbound datagram. This function is called 3348 * whenever IP sends an outbound datagram that needs authentication. 3349 */ 3350 static ipsec_status_t 3351 ah_outbound(mblk_t *ipsec_out) 3352 { 3353 mblk_t *mp; 3354 mblk_t *phdr_mp; 3355 ipsec_out_t *oi; 3356 ipsa_t *assoc; 3357 int length_to_skip; 3358 uint_t ah_align_sz; 3359 uint_t age_bytes; 3360 netstack_t *ns; 3361 ipsec_stack_t *ipss; 3362 ipsecah_stack_t *ahstack; 3363 3364 /* 3365 * Construct the chain of mblks 3366 * 3367 * IPSEC_OUT->PSEUDO_HDR->DATA 3368 * 3369 * one by one. 3370 */ 3371 3372 ASSERT(ipsec_out->b_datap->db_type == M_CTL); 3373 3374 ASSERT(MBLKL(ipsec_out) >= sizeof (ipsec_info_t)); 3375 3376 mp = ipsec_out->b_cont; 3377 oi = (ipsec_out_t *)ipsec_out->b_rptr; 3378 ns = oi->ipsec_out_ns; 3379 ipss = ns->netstack_ipsec; 3380 ahstack = ns->netstack_ipsecah; 3381 3382 AH_BUMP_STAT(ahstack, out_requests); 3383 3384 ASSERT(mp->b_datap->db_type == M_DATA); 3385 3386 assoc = oi->ipsec_out_ah_sa; 3387 ASSERT(assoc != NULL); 3388 3389 /* 3390 * Age SA according to number of bytes that will be sent after 3391 * adding the AH header, ICV, and padding to the packet. 3392 */ 3393 3394 if (oi->ipsec_out_v4) { 3395 ipha_t *ipha = (ipha_t *)mp->b_rptr; 3396 ah_align_sz = P2ALIGN(assoc->ipsa_mac_len + 3397 IPV4_PADDING_ALIGN - 1, IPV4_PADDING_ALIGN); 3398 age_bytes = ntohs(ipha->ipha_length) + sizeof (ah_t) + 3399 ah_align_sz; 3400 } else { 3401 ip6_t *ip6h = (ip6_t *)mp->b_rptr; 3402 ah_align_sz = P2ALIGN(assoc->ipsa_mac_len + 3403 IPV6_PADDING_ALIGN - 1, IPV6_PADDING_ALIGN); 3404 age_bytes = sizeof (ip6_t) + ntohs(ip6h->ip6_plen) + 3405 sizeof (ah_t) + ah_align_sz; 3406 } 3407 3408 if (!ah_age_bytes(assoc, age_bytes, B_FALSE)) { 3409 /* rig things as if ipsec_getassocbyconn() failed */ 3410 ipsec_assocfailure(info.mi_idnum, 0, 0, SL_ERROR | SL_WARN, 3411 "AH association 0x%x, dst %s had bytes expire.\n", 3412 ntohl(assoc->ipsa_spi), assoc->ipsa_dstaddr, AF_INET, 3413 ahstack->ipsecah_netstack); 3414 freemsg(ipsec_out); 3415 return (IPSEC_STATUS_FAILED); 3416 } 3417 3418 if (oi->ipsec_out_is_capab_ill) { 3419 ah3dbg(ahstack, ("ah_outbound: pkt can be accelerated\n")); 3420 if (oi->ipsec_out_v4) 3421 return (ah_outbound_accelerated_v4(ipsec_out, assoc)); 3422 else 3423 return (ah_outbound_accelerated_v6(ipsec_out, assoc)); 3424 } 3425 AH_BUMP_STAT(ahstack, noaccel); 3426 3427 /* 3428 * Insert pseudo header: 3429 * IPSEC_INFO -> [IP, ULP] => IPSEC_INFO -> [IP, AH, ICV] -> ULP 3430 */ 3431 3432 if (oi->ipsec_out_v4) { 3433 phdr_mp = ah_process_ip_options_v4(mp, assoc, &length_to_skip, 3434 assoc->ipsa_mac_len, B_TRUE, ahstack); 3435 } else { 3436 phdr_mp = ah_process_ip_options_v6(mp, assoc, &length_to_skip, 3437 assoc->ipsa_mac_len, B_TRUE, ahstack); 3438 } 3439 3440 if (phdr_mp == NULL) { 3441 AH_BUMP_STAT(ahstack, out_discards); 3442 ip_drop_packet(ipsec_out, B_FALSE, NULL, NULL, 3443 DROPPER(ipss, ipds_ah_bad_v4_opts), 3444 &ahstack->ah_dropper); 3445 return (IPSEC_STATUS_FAILED); 3446 } 3447 3448 ipsec_out->b_cont = phdr_mp; 3449 phdr_mp->b_cont = mp; 3450 mp->b_rptr += length_to_skip; 3451 3452 /* 3453 * At this point ipsec_out points to the IPSEC_OUT, new_mp 3454 * points to an mblk containing the pseudo header (IP header, 3455 * AH header, and ICV with mutable fields zero'ed out). 3456 * mp points to the mblk containing the ULP data. The original 3457 * IP header is kept before the ULP data in mp. 3458 */ 3459 3460 /* submit MAC request to KCF */ 3461 return (ah_submit_req_outbound(ipsec_out, length_to_skip, assoc)); 3462 } 3463 3464 static ipsec_status_t 3465 ah_inbound(mblk_t *ipsec_in_mp, void *arg) 3466 { 3467 mblk_t *data_mp = ipsec_in_mp->b_cont; 3468 ipsec_in_t *ii = (ipsec_in_t *)ipsec_in_mp->b_rptr; 3469 ah_t *ah = (ah_t *)arg; 3470 ipsa_t *assoc = ii->ipsec_in_ah_sa; 3471 int length_to_skip; 3472 int ah_length; 3473 mblk_t *phdr_mp; 3474 uint32_t ah_offset; 3475 netstack_t *ns = ii->ipsec_in_ns; 3476 ipsecah_stack_t *ahstack = ns->netstack_ipsecah; 3477 ipsec_stack_t *ipss = ns->netstack_ipsec; 3478 3479 ASSERT(assoc != NULL); 3480 3481 /* 3482 * We may wish to check replay in-range-only here as an optimization. 3483 * Include the reality check of ipsa->ipsa_replay > 3484 * ipsa->ipsa_replay_wsize for times when it's the first N packets, 3485 * where N == ipsa->ipsa_replay_wsize. 3486 * 3487 * Another check that may come here later is the "collision" check. 3488 * If legitimate packets flow quickly enough, this won't be a problem, 3489 * but collisions may cause authentication algorithm crunching to 3490 * take place when it doesn't need to. 3491 */ 3492 if (!sadb_replay_peek(assoc, ah->ah_replay)) { 3493 AH_BUMP_STAT(ahstack, replay_early_failures); 3494 IP_AH_BUMP_STAT(ipss, in_discards); 3495 ip_drop_packet(ipsec_in_mp, B_TRUE, NULL, NULL, 3496 DROPPER(ipss, ipds_ah_early_replay), 3497 &ahstack->ah_dropper); 3498 return (IPSEC_STATUS_FAILED); 3499 } 3500 3501 /* 3502 * The offset of the AH header can be computed from its pointer 3503 * within the data mblk, which was pulled up until the AH header 3504 * by ipsec_inbound_ah_sa() during SA selection. 3505 */ 3506 ah_offset = (uchar_t *)ah - data_mp->b_rptr; 3507 3508 /* 3509 * Has this packet already been processed by a hardware 3510 * IPsec accelerator? 3511 */ 3512 if (ii->ipsec_in_accelerated) { 3513 ah3dbg(ahstack, 3514 ("ah_inbound_v6: pkt processed by ill=%d isv6=%d\n", 3515 ii->ipsec_in_ill_index, !ii->ipsec_in_v4)); 3516 return (ah_inbound_accelerated(ipsec_in_mp, ii->ipsec_in_v4, 3517 assoc, ah_offset)); 3518 } 3519 AH_BUMP_STAT(ahstack, noaccel); 3520 3521 /* 3522 * We need to pullup until the ICV before we call 3523 * ah_process_ip_options_v6. 3524 */ 3525 ah_length = (ah->ah_length << 2) + 8; 3526 3527 /* 3528 * NOTE : If we want to use any field of IP/AH header, you need 3529 * to re-assign following the pullup. 3530 */ 3531 if (((uchar_t *)ah + ah_length) > data_mp->b_wptr) { 3532 if (!pullupmsg(data_mp, (uchar_t *)ah + ah_length - 3533 data_mp->b_rptr)) { 3534 (void) ipsec_rl_strlog(ns, info.mi_idnum, 0, 0, 3535 SL_WARN | SL_ERROR, 3536 "ah_inbound: Small AH header\n"); 3537 IP_AH_BUMP_STAT(ipss, in_discards); 3538 ip_drop_packet(ipsec_in_mp, B_TRUE, NULL, NULL, 3539 DROPPER(ipss, ipds_ah_nomem), 3540 &ahstack->ah_dropper); 3541 return (IPSEC_STATUS_FAILED); 3542 } 3543 } 3544 3545 /* 3546 * Insert pseudo header: 3547 * IPSEC_INFO -> [IP, ULP] => IPSEC_INFO -> [IP, AH, ICV] -> ULP 3548 */ 3549 if (ii->ipsec_in_v4) { 3550 phdr_mp = ah_process_ip_options_v4(data_mp, assoc, 3551 &length_to_skip, assoc->ipsa_mac_len, B_FALSE, ahstack); 3552 } else { 3553 phdr_mp = ah_process_ip_options_v6(data_mp, assoc, 3554 &length_to_skip, assoc->ipsa_mac_len, B_FALSE, ahstack); 3555 } 3556 3557 if (phdr_mp == NULL) { 3558 IP_AH_BUMP_STAT(ipss, in_discards); 3559 ip_drop_packet(ipsec_in_mp, B_TRUE, NULL, NULL, 3560 (ii->ipsec_in_v4 ? 3561 DROPPER(ipss, ipds_ah_bad_v4_opts) : 3562 DROPPER(ipss, ipds_ah_bad_v6_hdrs)), 3563 &ahstack->ah_dropper); 3564 return (IPSEC_STATUS_FAILED); 3565 } 3566 3567 ipsec_in_mp->b_cont = phdr_mp; 3568 phdr_mp->b_cont = data_mp; 3569 data_mp->b_rptr += length_to_skip; 3570 3571 /* submit request to KCF */ 3572 return (ah_submit_req_inbound(ipsec_in_mp, length_to_skip, ah_offset, 3573 assoc)); 3574 } 3575 3576 /* 3577 * ah_inbound_accelerated: 3578 * Called from ah_inbound() to process IPsec packets that have been 3579 * accelerated by hardware. 3580 * 3581 * Basically does what ah_auth_in_done() with some changes since 3582 * no pseudo-headers are involved, i.e. the passed message is a 3583 * IPSEC_INFO->DATA. 3584 * 3585 * It is assumed that only packets that have been successfully 3586 * processed by the adapter come here. 3587 * 3588 * 1. get algorithm structure corresponding to association 3589 * 2. calculate pointers to authentication header and ICV 3590 * 3. compare ICV in AH header with ICV in data attributes 3591 * 3.1 if different: 3592 * 3.1.1 generate error 3593 * 3.1.2 discard message 3594 * 3.2 if ICV matches: 3595 * 3.2.1 check replay 3596 * 3.2.2 remove AH header 3597 * 3.2.3 age SA byte 3598 * 3.2.4 send to IP 3599 */ 3600 ipsec_status_t 3601 ah_inbound_accelerated(mblk_t *ipsec_in, boolean_t isv4, ipsa_t *assoc, 3602 uint32_t ah_offset) 3603 { 3604 mblk_t *mp; 3605 ipha_t *ipha; 3606 ah_t *ah; 3607 ipsec_in_t *ii; 3608 uint32_t icv_len; 3609 uint32_t align_len; 3610 uint32_t age_bytes; 3611 ip6_t *ip6h; 3612 uint8_t *in_icv; 3613 mblk_t *hada_mp; 3614 uint32_t next_hdr; 3615 da_ipsec_t *hada; 3616 kstat_named_t *counter; 3617 ipsecah_stack_t *ahstack; 3618 netstack_t *ns; 3619 ipsec_stack_t *ipss; 3620 3621 ii = (ipsec_in_t *)ipsec_in->b_rptr; 3622 ns = ii->ipsec_in_ns; 3623 ahstack = ns->netstack_ipsecah; 3624 ipss = ns->netstack_ipsec; 3625 3626 mp = ipsec_in->b_cont; 3627 hada_mp = ii->ipsec_in_da; 3628 ASSERT(hada_mp != NULL); 3629 hada = (da_ipsec_t *)hada_mp->b_rptr; 3630 3631 AH_BUMP_STAT(ahstack, in_accelerated); 3632 3633 /* 3634 * We only support one level of decapsulation in hardware, so 3635 * nuke the pointer. 3636 */ 3637 ii->ipsec_in_da = NULL; 3638 ii->ipsec_in_accelerated = B_FALSE; 3639 3640 /* 3641 * Extract ICV length from attributes M_CTL and sanity check 3642 * its value. We allow the mblk to be smaller than da_ipsec_t 3643 * for a small ICV, as long as the entire ICV fits within the mblk. 3644 * Also ensures that the ICV length computed by Provider 3645 * corresponds to the ICV length of the algorithm specified by the SA. 3646 */ 3647 icv_len = hada->da_icv_len; 3648 if ((icv_len != assoc->ipsa_mac_len) || 3649 (icv_len > DA_ICV_MAX_LEN) || (MBLKL(hada_mp) < 3650 (sizeof (da_ipsec_t) - DA_ICV_MAX_LEN + icv_len))) { 3651 ah0dbg(("ah_inbound_accelerated: " 3652 "ICV len (%u) incorrect or mblk too small (%u)\n", 3653 icv_len, (uint32_t)(MBLKL(hada_mp)))); 3654 counter = DROPPER(ipss, ipds_ah_bad_length); 3655 goto ah_in_discard; 3656 } 3657 ASSERT(icv_len != 0); 3658 3659 /* compute the padded AH ICV len */ 3660 if (isv4) { 3661 ipha = (ipha_t *)mp->b_rptr; 3662 align_len = (icv_len + IPV4_PADDING_ALIGN - 1) & 3663 -IPV4_PADDING_ALIGN; 3664 } else { 3665 ip6h = (ip6_t *)mp->b_rptr; 3666 align_len = (icv_len + IPV6_PADDING_ALIGN - 1) & 3667 -IPV6_PADDING_ALIGN; 3668 } 3669 3670 ah = (ah_t *)(mp->b_rptr + ah_offset); 3671 in_icv = (uint8_t *)ah + sizeof (ah_t); 3672 3673 /* compare ICV in AH header vs ICV computed by adapter */ 3674 if (bcmp(hada->da_icv, in_icv, icv_len)) { 3675 int af; 3676 void *addr; 3677 3678 if (isv4) { 3679 addr = &ipha->ipha_dst; 3680 af = AF_INET; 3681 } else { 3682 addr = &ip6h->ip6_dst; 3683 af = AF_INET6; 3684 } 3685 3686 /* 3687 * Log the event. Don't print to the console, block 3688 * potential denial-of-service attack. 3689 */ 3690 AH_BUMP_STAT(ahstack, bad_auth); 3691 ipsec_assocfailure(info.mi_idnum, 0, 0, SL_ERROR | SL_WARN, 3692 "AH Authentication failed spi %x, dst_addr %s", 3693 assoc->ipsa_spi, addr, af, ahstack->ipsecah_netstack); 3694 counter = DROPPER(ipss, ipds_ah_bad_auth); 3695 goto ah_in_discard; 3696 } 3697 3698 ah3dbg(ahstack, ("AH succeeded, checking replay\n")); 3699 AH_BUMP_STAT(ahstack, good_auth); 3700 3701 if (!sadb_replay_check(assoc, ah->ah_replay)) { 3702 int af; 3703 void *addr; 3704 3705 if (isv4) { 3706 addr = &ipha->ipha_dst; 3707 af = AF_INET; 3708 } else { 3709 addr = &ip6h->ip6_dst; 3710 af = AF_INET6; 3711 } 3712 3713 /* 3714 * Log the event. As of now we print out an event. 3715 * Do not print the replay failure number, or else 3716 * syslog cannot collate the error messages. Printing 3717 * the replay number that failed (or printing to the 3718 * console) opens a denial-of-service attack. 3719 */ 3720 AH_BUMP_STAT(ahstack, replay_failures); 3721 ipsec_assocfailure(info.mi_idnum, 0, 0, 3722 SL_ERROR | SL_WARN, 3723 "Replay failed for AH spi %x, dst_addr %s", 3724 assoc->ipsa_spi, addr, af, ahstack->ipsecah_netstack); 3725 counter = DROPPER(ipss, ipds_ah_replay); 3726 goto ah_in_discard; 3727 } 3728 3729 /* 3730 * Remove AH header. We do this by copying everything before 3731 * the AH header onto the AH header+ICV. 3732 */ 3733 /* overwrite AH with what was preceeding it (IP header) */ 3734 next_hdr = ah->ah_nexthdr; 3735 ovbcopy(mp->b_rptr, mp->b_rptr + sizeof (ah_t) + align_len, 3736 ah_offset); 3737 mp->b_rptr += sizeof (ah_t) + align_len; 3738 if (isv4) { 3739 /* adjust IP header next protocol */ 3740 ipha = (ipha_t *)mp->b_rptr; 3741 ipha->ipha_protocol = next_hdr; 3742 3743 age_bytes = ipha->ipha_length; 3744 3745 /* adjust length in IP header */ 3746 ipha->ipha_length -= (sizeof (ah_t) + align_len); 3747 3748 /* recalculate checksum */ 3749 ipha->ipha_hdr_checksum = 0; 3750 ipha->ipha_hdr_checksum = (uint16_t)ip_csum_hdr(ipha); 3751 } else { 3752 /* adjust IP header next protocol */ 3753 ip6h = (ip6_t *)mp->b_rptr; 3754 ip6h->ip6_nxt = next_hdr; 3755 3756 age_bytes = sizeof (ip6_t) + ntohs(ip6h->ip6_plen) + 3757 sizeof (ah_t); 3758 3759 /* adjust length in IP header */ 3760 ip6h->ip6_plen = htons(ntohs(ip6h->ip6_plen) - 3761 (sizeof (ah_t) + align_len)); 3762 } 3763 3764 /* age SA */ 3765 if (!ah_age_bytes(assoc, age_bytes, B_TRUE)) { 3766 /* The ipsa has hit hard expiration, LOG and AUDIT. */ 3767 ipsec_assocfailure(info.mi_idnum, 0, 0, 3768 SL_ERROR | SL_WARN, 3769 "AH Association 0x%x, dst %s had bytes expire.\n", 3770 assoc->ipsa_spi, assoc->ipsa_dstaddr, 3771 AF_INET, ahstack->ipsecah_netstack); 3772 AH_BUMP_STAT(ahstack, bytes_expired); 3773 counter = DROPPER(ipss, ipds_ah_bytes_expire); 3774 goto ah_in_discard; 3775 } 3776 3777 freeb(hada_mp); 3778 return (IPSEC_STATUS_SUCCESS); 3779 3780 ah_in_discard: 3781 IP_AH_BUMP_STAT(ipss, in_discards); 3782 freeb(hada_mp); 3783 ip_drop_packet(ipsec_in, B_TRUE, NULL, NULL, counter, 3784 &ahstack->ah_dropper); 3785 return (IPSEC_STATUS_FAILED); 3786 } 3787 3788 /* 3789 * ah_outbound_accelerated_v4: 3790 * Called from ah_outbound_v4() and once it is determined that the 3791 * packet is elligible for hardware acceleration. 3792 * 3793 * We proceed as follows: 3794 * 1. allocate and initialize attributes mblk 3795 * 2. mark IPSEC_OUT to indicate that pkt is accelerated 3796 * 3. insert AH header 3797 */ 3798 static ipsec_status_t 3799 ah_outbound_accelerated_v4(mblk_t *ipsec_mp, ipsa_t *assoc) 3800 { 3801 mblk_t *mp, *new_mp; 3802 ipsec_out_t *oi; 3803 uint_t ah_data_sz; /* ICV length, algorithm dependent */ 3804 uint_t ah_align_sz; /* ICV length + padding */ 3805 uint32_t v_hlen_tos_len; /* from original IP header */ 3806 ipha_t *oipha; /* original IP header */ 3807 ipha_t *nipha; /* new IP header */ 3808 uint_t option_length = 0; 3809 uint_t new_hdr_len; /* new header length */ 3810 uint_t iphdr_length; 3811 ah_t *ah_hdr; /* ptr to AH header */ 3812 netstack_t *ns; 3813 ipsec_stack_t *ipss; 3814 ipsecah_stack_t *ahstack; 3815 3816 oi = (ipsec_out_t *)ipsec_mp->b_rptr; 3817 ns = oi->ipsec_out_ns; 3818 ipss = ns->netstack_ipsec; 3819 ahstack = ns->netstack_ipsecah; 3820 3821 mp = ipsec_mp->b_cont; 3822 3823 AH_BUMP_STAT(ahstack, out_accelerated); 3824 3825 oipha = (ipha_t *)mp->b_rptr; 3826 v_hlen_tos_len = ((uint32_t *)oipha)[0]; 3827 3828 /* mark packet as being accelerated in IPSEC_OUT */ 3829 ASSERT(oi->ipsec_out_accelerated == B_FALSE); 3830 oi->ipsec_out_accelerated = B_TRUE; 3831 3832 /* calculate authentication data length, i.e. ICV + padding */ 3833 ah_data_sz = assoc->ipsa_mac_len; 3834 ah_align_sz = (ah_data_sz + IPV4_PADDING_ALIGN - 1) & 3835 -IPV4_PADDING_ALIGN; 3836 3837 /* 3838 * Insert pseudo header: 3839 * IPSEC_INFO -> [IP, ULP] => IPSEC_INFO -> [IP, AH, ICV] -> ULP 3840 */ 3841 3842 /* IP + AH + authentication + padding data length */ 3843 new_hdr_len = IP_SIMPLE_HDR_LENGTH + sizeof (ah_t) + ah_align_sz; 3844 if (V_HLEN != IP_SIMPLE_HDR_VERSION) { 3845 option_length = oipha->ipha_version_and_hdr_length - 3846 (uint8_t)((IP_VERSION << 4) + 3847 IP_SIMPLE_HDR_LENGTH_IN_WORDS); 3848 option_length <<= 2; 3849 new_hdr_len += option_length; 3850 } 3851 3852 /* allocate pseudo-header mblk */ 3853 if ((new_mp = allocb(new_hdr_len, BPRI_HI)) == NULL) { 3854 /* IPsec kstats: bump bean counter here */ 3855 ip_drop_packet(ipsec_mp, B_FALSE, NULL, NULL, 3856 DROPPER(ipss, ipds_ah_nomem), 3857 &ahstack->ah_dropper); 3858 return (IPSEC_STATUS_FAILED); 3859 } 3860 3861 new_mp->b_cont = mp; 3862 ipsec_mp->b_cont = new_mp; 3863 new_mp->b_wptr += new_hdr_len; 3864 3865 /* copy original IP header to new header */ 3866 bcopy(mp->b_rptr, new_mp->b_rptr, IP_SIMPLE_HDR_LENGTH + 3867 option_length); 3868 3869 /* update IP header */ 3870 nipha = (ipha_t *)new_mp->b_rptr; 3871 nipha->ipha_protocol = IPPROTO_AH; 3872 iphdr_length = ntohs(nipha->ipha_length); 3873 iphdr_length += sizeof (ah_t) + ah_align_sz; 3874 nipha->ipha_length = htons(iphdr_length); 3875 nipha->ipha_hdr_checksum = 0; 3876 nipha->ipha_hdr_checksum = (uint16_t)ip_csum_hdr(nipha); 3877 3878 /* skip original IP header in mp */ 3879 mp->b_rptr += IP_SIMPLE_HDR_LENGTH + option_length; 3880 3881 /* initialize AH header */ 3882 ah_hdr = (ah_t *)(new_mp->b_rptr + IP_SIMPLE_HDR_LENGTH + 3883 option_length); 3884 ah_hdr->ah_nexthdr = oipha->ipha_protocol; 3885 if (!ah_finish_up(ah_hdr, NULL, assoc, ah_data_sz, ah_align_sz, 3886 ahstack)) { 3887 /* Only way this fails is if outbound replay counter wraps. */ 3888 ip_drop_packet(ipsec_mp, B_FALSE, NULL, NULL, 3889 DROPPER(ipss, ipds_ah_replay), 3890 &ahstack->ah_dropper); 3891 return (IPSEC_STATUS_FAILED); 3892 } 3893 3894 return (IPSEC_STATUS_SUCCESS); 3895 } 3896 3897 /* 3898 * ah_outbound_accelerated_v6: 3899 * 3900 * Called from ah_outbound_v6() once it is determined that the packet 3901 * is eligible for hardware acceleration. 3902 * 3903 * We proceed as follows: 3904 * 1. allocate and initialize attributes mblk 3905 * 2. mark IPSEC_OUT to indicate that pkt is accelerated 3906 * 3. insert AH header 3907 */ 3908 static ipsec_status_t 3909 ah_outbound_accelerated_v6(mblk_t *ipsec_mp, ipsa_t *assoc) 3910 { 3911 mblk_t *mp, *phdr_mp; 3912 ipsec_out_t *oi; 3913 uint_t ah_data_sz; /* ICV length, algorithm dependent */ 3914 uint_t ah_align_sz; /* ICV length + padding */ 3915 ip6_t *oip6h; /* original IP header */ 3916 ip6_t *ip6h; /* new IP header */ 3917 uint_t option_length = 0; 3918 uint_t hdr_size; 3919 uint_t ah_offset; 3920 ah_t *ah_hdr; /* ptr to AH header */ 3921 netstack_t *ns; 3922 ipsec_stack_t *ipss; 3923 ipsecah_stack_t *ahstack; 3924 3925 oi = (ipsec_out_t *)ipsec_mp->b_rptr; 3926 ns = oi->ipsec_out_ns; 3927 ipss = ns->netstack_ipsec; 3928 ahstack = ns->netstack_ipsecah; 3929 3930 mp = ipsec_mp->b_cont; 3931 3932 AH_BUMP_STAT(ahstack, out_accelerated); 3933 3934 oip6h = (ip6_t *)mp->b_rptr; 3935 3936 /* mark packet as being accelerated in IPSEC_OUT */ 3937 ASSERT(oi->ipsec_out_accelerated == B_FALSE); 3938 oi->ipsec_out_accelerated = B_TRUE; 3939 3940 /* calculate authentication data length, i.e. ICV + padding */ 3941 ah_data_sz = assoc->ipsa_mac_len; 3942 ah_align_sz = (ah_data_sz + IPV4_PADDING_ALIGN - 1) & 3943 -IPV4_PADDING_ALIGN; 3944 3945 ASSERT(ah_align_sz >= ah_data_sz); 3946 3947 hdr_size = ipsec_ah_get_hdr_size_v6(mp, B_FALSE); 3948 option_length = hdr_size - IPV6_HDR_LEN; 3949 3950 /* This was not included in ipsec_ah_get_hdr_size_v6() */ 3951 hdr_size += (sizeof (ah_t) + ah_align_sz); 3952 3953 if ((phdr_mp = allocb(hdr_size, BPRI_HI)) == NULL) { 3954 ip_drop_packet(ipsec_mp, B_FALSE, NULL, NULL, 3955 DROPPER(ipss, ipds_ah_nomem), 3956 &ahstack->ah_dropper); 3957 return (IPSEC_STATUS_FAILED); 3958 } 3959 phdr_mp->b_wptr += hdr_size; 3960 3961 /* 3962 * Form the basic IP header first. We always assign every bit 3963 * of the v6 basic header, so a separate bzero is unneeded. 3964 */ 3965 ip6h = (ip6_t *)phdr_mp->b_rptr; 3966 ip6h->ip6_vcf = oip6h->ip6_vcf; 3967 ip6h->ip6_hlim = oip6h->ip6_hlim; 3968 ip6h->ip6_src = oip6h->ip6_src; 3969 ip6h->ip6_dst = oip6h->ip6_dst; 3970 /* 3971 * Include the size of AH and authentication data. 3972 * This is how our recipient would compute the 3973 * authentication data. Look at what we do in the 3974 * inbound case below. 3975 */ 3976 ip6h->ip6_plen = htons(ntohs(oip6h->ip6_plen) + sizeof (ah_t) + 3977 ah_align_sz); 3978 3979 /* 3980 * Insert pseudo header: 3981 * IPSEC_INFO -> [IP6, LLH, ULP] => 3982 * IPSEC_INFO -> [IP, LLH, AH, ICV] -> ULP 3983 */ 3984 3985 if (option_length == 0) { 3986 /* Form the AH header */ 3987 ip6h->ip6_nxt = IPPROTO_AH; 3988 ((ah_t *)(ip6h + 1))->ah_nexthdr = oip6h->ip6_nxt; 3989 ah_offset = IPV6_HDR_LEN; 3990 } else { 3991 ip6h->ip6_nxt = oip6h->ip6_nxt; 3992 /* option_length does not include the AH header's size */ 3993 ah_offset = ah_fix_phdr_v6(ip6h, oip6h, B_TRUE, B_FALSE); 3994 if (ah_offset == 0) { 3995 freemsg(phdr_mp); 3996 ip_drop_packet(ipsec_mp, B_FALSE, NULL, NULL, 3997 DROPPER(ipss, ipds_ah_bad_v6_hdrs), 3998 &ahstack->ah_dropper); 3999 return (IPSEC_STATUS_FAILED); 4000 } 4001 } 4002 4003 phdr_mp->b_cont = mp; 4004 ipsec_mp->b_cont = phdr_mp; 4005 4006 /* skip original IP header in mp */ 4007 mp->b_rptr += IPV6_HDR_LEN + option_length; 4008 4009 /* initialize AH header */ 4010 ah_hdr = (ah_t *)(phdr_mp->b_rptr + IPV6_HDR_LEN + option_length); 4011 ah_hdr->ah_nexthdr = oip6h->ip6_nxt; 4012 4013 if (!ah_finish_up(((ah_t *)((uint8_t *)ip6h + ah_offset)), NULL, 4014 assoc, ah_data_sz, ah_align_sz, ahstack)) { 4015 /* Only way this fails is if outbound replay counter wraps. */ 4016 ip_drop_packet(ipsec_mp, B_FALSE, NULL, NULL, 4017 DROPPER(ipss, ipds_ah_replay), 4018 &ahstack->ah_dropper); 4019 return (IPSEC_STATUS_FAILED); 4020 } 4021 4022 return (IPSEC_STATUS_SUCCESS); 4023 } 4024 4025 /* 4026 * Invoked after processing of an inbound packet by the 4027 * kernel crypto framework. Called by ah_submit_req() for a sync request, 4028 * or by the kcf callback for an async request. 4029 * Returns IPSEC_STATUS_SUCCESS on success, IPSEC_STATUS_FAILED on failure. 4030 * On failure, the mblk chain ipsec_in is freed by this function. 4031 */ 4032 static ipsec_status_t 4033 ah_auth_in_done(mblk_t *ipsec_in) 4034 { 4035 mblk_t *phdr_mp; 4036 ipha_t *ipha; 4037 uint_t ah_offset = 0; 4038 mblk_t *mp; 4039 int align_len, newpos; 4040 ah_t *ah; 4041 uint32_t length; 4042 uint32_t *dest32; 4043 uint8_t *dest; 4044 ipsec_in_t *ii; 4045 boolean_t isv4; 4046 ip6_t *ip6h; 4047 uint_t icv_len; 4048 ipsa_t *assoc; 4049 kstat_named_t *counter; 4050 netstack_t *ns; 4051 ipsecah_stack_t *ahstack; 4052 ipsec_stack_t *ipss; 4053 4054 ii = (ipsec_in_t *)ipsec_in->b_rptr; 4055 ns = ii->ipsec_in_ns; 4056 ahstack = ns->netstack_ipsecah; 4057 ipss = ns->netstack_ipsec; 4058 4059 isv4 = ii->ipsec_in_v4; 4060 assoc = ii->ipsec_in_ah_sa; 4061 icv_len = (uint_t)ii->ipsec_in_crypto_mac.cd_raw.iov_len; 4062 4063 phdr_mp = ipsec_in->b_cont; 4064 if (phdr_mp == NULL) { 4065 ip_drop_packet(ipsec_in, B_TRUE, NULL, NULL, 4066 DROPPER(ipss, ipds_ah_nomem), 4067 &ahstack->ah_dropper); 4068 return (IPSEC_STATUS_FAILED); 4069 } 4070 4071 mp = phdr_mp->b_cont; 4072 if (mp == NULL) { 4073 ip_drop_packet(ipsec_in, B_TRUE, NULL, NULL, 4074 DROPPER(ipss, ipds_ah_nomem), 4075 &ahstack->ah_dropper); 4076 return (IPSEC_STATUS_FAILED); 4077 } 4078 mp->b_rptr -= ii->ipsec_in_skip_len; 4079 4080 ah_set_usetime(assoc, B_TRUE); 4081 4082 if (isv4) { 4083 ipha = (ipha_t *)mp->b_rptr; 4084 ah_offset = ipha->ipha_version_and_hdr_length - 4085 (uint8_t)((IP_VERSION << 4)); 4086 ah_offset <<= 2; 4087 align_len = P2ALIGN(icv_len + IPV4_PADDING_ALIGN - 1, 4088 IPV4_PADDING_ALIGN); 4089 } else { 4090 ip6h = (ip6_t *)mp->b_rptr; 4091 ah_offset = ipsec_ah_get_hdr_size_v6(mp, B_TRUE); 4092 ASSERT((mp->b_wptr - mp->b_rptr) >= ah_offset); 4093 align_len = P2ALIGN(icv_len + IPV6_PADDING_ALIGN - 1, 4094 IPV6_PADDING_ALIGN); 4095 } 4096 4097 ah = (ah_t *)(mp->b_rptr + ah_offset); 4098 newpos = sizeof (ah_t) + align_len; 4099 4100 /* 4101 * We get here only when authentication passed. 4102 */ 4103 4104 ah3dbg(ahstack, ("AH succeeded, checking replay\n")); 4105 AH_BUMP_STAT(ahstack, good_auth); 4106 4107 if (!sadb_replay_check(assoc, ah->ah_replay)) { 4108 int af; 4109 void *addr; 4110 4111 if (isv4) { 4112 addr = &ipha->ipha_dst; 4113 af = AF_INET; 4114 } else { 4115 addr = &ip6h->ip6_dst; 4116 af = AF_INET6; 4117 } 4118 4119 /* 4120 * Log the event. As of now we print out an event. 4121 * Do not print the replay failure number, or else 4122 * syslog cannot collate the error messages. Printing 4123 * the replay number that failed (or printing to the 4124 * console) opens a denial-of-service attack. 4125 */ 4126 AH_BUMP_STAT(ahstack, replay_failures); 4127 ipsec_assocfailure(info.mi_idnum, 0, 0, 4128 SL_ERROR | SL_WARN, 4129 "Replay failed for AH spi %x, dst_addr %s", 4130 assoc->ipsa_spi, addr, af, ahstack->ipsecah_netstack); 4131 counter = DROPPER(ipss, ipds_ah_replay); 4132 goto ah_in_discard; 4133 } 4134 4135 /* 4136 * We need to remove the AH header from the original 4137 * datagram. Best way to do this is to move the pre-AH headers 4138 * forward in the (relatively simple) IPv4 case. In IPv6, it's 4139 * a bit more complicated because of IPv6's next-header chaining, 4140 * but it's doable. 4141 */ 4142 if (isv4) { 4143 /* 4144 * Assign the right protocol, adjust the length as we 4145 * are removing the AH header and adjust the checksum to 4146 * account for the protocol and length. 4147 */ 4148 length = ntohs(ipha->ipha_length); 4149 if (!ah_age_bytes(assoc, length, B_TRUE)) { 4150 /* The ipsa has hit hard expiration, LOG and AUDIT. */ 4151 ipsec_assocfailure(info.mi_idnum, 0, 0, 4152 SL_ERROR | SL_WARN, 4153 "AH Association 0x%x, dst %s had bytes expire.\n", 4154 assoc->ipsa_spi, assoc->ipsa_dstaddr, 4155 AF_INET, ahstack->ipsecah_netstack); 4156 AH_BUMP_STAT(ahstack, bytes_expired); 4157 counter = DROPPER(ipss, ipds_ah_bytes_expire); 4158 goto ah_in_discard; 4159 } 4160 ipha->ipha_protocol = ah->ah_nexthdr; 4161 length -= newpos; 4162 4163 ipha->ipha_length = htons((uint16_t)length); 4164 ipha->ipha_hdr_checksum = 0; 4165 ipha->ipha_hdr_checksum = (uint16_t)ip_csum_hdr(ipha); 4166 } else { 4167 uchar_t *whereptr; 4168 int hdrlen; 4169 uint8_t *nexthdr; 4170 ip6_hbh_t *hbhhdr; 4171 ip6_dest_t *dsthdr; 4172 ip6_rthdr0_t *rthdr; 4173 4174 /* 4175 * Make phdr_mp hold until the AH header and make 4176 * mp hold everything past AH header. 4177 */ 4178 length = ntohs(ip6h->ip6_plen); 4179 if (!ah_age_bytes(assoc, length + sizeof (ip6_t), B_TRUE)) { 4180 /* The ipsa has hit hard expiration, LOG and AUDIT. */ 4181 ipsec_assocfailure(info.mi_idnum, 0, 0, 4182 SL_ERROR | SL_WARN, 4183 "AH Association 0x%x, dst %s had bytes " 4184 "expire.\n", assoc->ipsa_spi, &ip6h->ip6_dst, 4185 AF_INET6, ahstack->ipsecah_netstack); 4186 AH_BUMP_STAT(ahstack, bytes_expired); 4187 counter = DROPPER(ipss, ipds_ah_bytes_expire); 4188 goto ah_in_discard; 4189 } 4190 4191 /* 4192 * Update the next header field of the header preceding 4193 * AH with the next header field of AH. Start with the 4194 * IPv6 header and proceed with the extension headers 4195 * until we find what we're looking for. 4196 */ 4197 nexthdr = &ip6h->ip6_nxt; 4198 whereptr = (uchar_t *)ip6h; 4199 hdrlen = sizeof (ip6_t); 4200 4201 while (*nexthdr != IPPROTO_AH) { 4202 whereptr += hdrlen; 4203 /* Assume IP has already stripped it */ 4204 ASSERT(*nexthdr != IPPROTO_FRAGMENT && 4205 *nexthdr != IPPROTO_RAW); 4206 switch (*nexthdr) { 4207 case IPPROTO_HOPOPTS: 4208 hbhhdr = (ip6_hbh_t *)whereptr; 4209 nexthdr = &hbhhdr->ip6h_nxt; 4210 hdrlen = 8 * (hbhhdr->ip6h_len + 1); 4211 break; 4212 case IPPROTO_DSTOPTS: 4213 dsthdr = (ip6_dest_t *)whereptr; 4214 nexthdr = &dsthdr->ip6d_nxt; 4215 hdrlen = 8 * (dsthdr->ip6d_len + 1); 4216 break; 4217 case IPPROTO_ROUTING: 4218 rthdr = (ip6_rthdr0_t *)whereptr; 4219 nexthdr = &rthdr->ip6r0_nxt; 4220 hdrlen = 8 * (rthdr->ip6r0_len + 1); 4221 break; 4222 } 4223 } 4224 *nexthdr = ah->ah_nexthdr; 4225 length -= newpos; 4226 ip6h->ip6_plen = htons((uint16_t)length); 4227 } 4228 4229 /* Now that we've fixed the IP header, move it forward. */ 4230 mp->b_rptr += newpos; 4231 if (IS_P2ALIGNED(mp->b_rptr, sizeof (uint32_t))) { 4232 dest32 = (uint32_t *)(mp->b_rptr + ah_offset); 4233 while (--dest32 >= (uint32_t *)mp->b_rptr) 4234 *dest32 = *(dest32 - (newpos >> 2)); 4235 } else { 4236 dest = mp->b_rptr + ah_offset; 4237 while (--dest >= mp->b_rptr) 4238 *dest = *(dest - newpos); 4239 } 4240 /* 4241 * If a db_credp exists in phdr_mp, it must also exist in mp. 4242 */ 4243 ASSERT(DB_CRED(phdr_mp) == NULL || 4244 msg_getcred(mp, NULL) != NULL); 4245 4246 freeb(phdr_mp); 4247 ipsec_in->b_cont = mp; 4248 if (assoc->ipsa_state == IPSA_STATE_IDLE) { 4249 /* 4250 * Cluster buffering case. Tell caller that we're 4251 * handling the packet. 4252 */ 4253 sadb_buf_pkt(assoc, ipsec_in, ns); 4254 return (IPSEC_STATUS_PENDING); 4255 } 4256 return (IPSEC_STATUS_SUCCESS); 4257 4258 ah_in_discard: 4259 IP_AH_BUMP_STAT(ipss, in_discards); 4260 ip_drop_packet(ipsec_in, B_TRUE, NULL, NULL, counter, 4261 &ahstack->ah_dropper); 4262 return (IPSEC_STATUS_FAILED); 4263 } 4264 4265 /* 4266 * Invoked after processing of an outbound packet by the 4267 * kernel crypto framework, either by ah_submit_req() for a request 4268 * executed syncrhonously, or by the KEF callback for a request 4269 * executed asynchronously. 4270 */ 4271 static ipsec_status_t 4272 ah_auth_out_done(mblk_t *ipsec_out) 4273 { 4274 mblk_t *phdr_mp; 4275 mblk_t *mp; 4276 int align_len; 4277 uint32_t hdrs_length; 4278 uchar_t *ptr; 4279 uint32_t length; 4280 boolean_t isv4; 4281 ipsec_out_t *io; 4282 size_t icv_len; 4283 netstack_t *ns; 4284 ipsec_stack_t *ipss; 4285 ipsecah_stack_t *ahstack; 4286 4287 io = (ipsec_out_t *)ipsec_out->b_rptr; 4288 ns = io->ipsec_out_ns; 4289 ipss = ns->netstack_ipsec; 4290 ahstack = ns->netstack_ipsecah; 4291 4292 isv4 = io->ipsec_out_v4; 4293 icv_len = io->ipsec_out_crypto_mac.cd_raw.iov_len; 4294 4295 phdr_mp = ipsec_out->b_cont; 4296 if (phdr_mp == NULL) { 4297 ip_drop_packet(ipsec_out, B_FALSE, NULL, NULL, 4298 DROPPER(ipss, ipds_ah_nomem), 4299 &ahstack->ah_dropper); 4300 return (IPSEC_STATUS_FAILED); 4301 } 4302 4303 mp = phdr_mp->b_cont; 4304 if (mp == NULL) { 4305 ip_drop_packet(ipsec_out, B_FALSE, NULL, NULL, 4306 DROPPER(ipss, ipds_ah_nomem), 4307 &ahstack->ah_dropper); 4308 return (IPSEC_STATUS_FAILED); 4309 } 4310 mp->b_rptr -= io->ipsec_out_skip_len; 4311 4312 ASSERT(io->ipsec_out_ah_sa != NULL); 4313 ah_set_usetime(io->ipsec_out_ah_sa, B_FALSE); 4314 4315 if (isv4) { 4316 ipha_t *ipha; 4317 ipha_t *nipha; 4318 4319 ipha = (ipha_t *)mp->b_rptr; 4320 hdrs_length = ipha->ipha_version_and_hdr_length - 4321 (uint8_t)((IP_VERSION << 4)); 4322 hdrs_length <<= 2; 4323 align_len = P2ALIGN(icv_len + IPV4_PADDING_ALIGN - 1, 4324 IPV4_PADDING_ALIGN); 4325 /* 4326 * phdr_mp must have the right amount of space for the 4327 * combined IP and AH header. Copy the IP header and 4328 * the ack_data onto AH. Note that the AH header was 4329 * already formed before the ICV calculation and hence 4330 * you don't have to copy it here. 4331 */ 4332 bcopy(mp->b_rptr, phdr_mp->b_rptr, hdrs_length); 4333 4334 ptr = phdr_mp->b_rptr + hdrs_length + sizeof (ah_t); 4335 bcopy(phdr_mp->b_wptr, ptr, icv_len); 4336 4337 /* 4338 * Compute the new header checksum as we are assigning 4339 * IPPROTO_AH and adjusting the length here. 4340 */ 4341 nipha = (ipha_t *)phdr_mp->b_rptr; 4342 4343 nipha->ipha_protocol = IPPROTO_AH; 4344 length = ntohs(nipha->ipha_length); 4345 length += (sizeof (ah_t) + align_len); 4346 nipha->ipha_length = htons((uint16_t)length); 4347 nipha->ipha_hdr_checksum = 0; 4348 nipha->ipha_hdr_checksum = (uint16_t)ip_csum_hdr(nipha); 4349 } else { 4350 ip6_t *ip6h; 4351 ip6_t *nip6h; 4352 uint_t ah_offset; 4353 4354 ip6h = (ip6_t *)mp->b_rptr; 4355 nip6h = (ip6_t *)phdr_mp->b_rptr; 4356 align_len = P2ALIGN(icv_len + IPV6_PADDING_ALIGN - 1, 4357 IPV6_PADDING_ALIGN); 4358 /* 4359 * phdr_mp must have the right amount of space for the 4360 * combined IP and AH header. Copy the IP header with 4361 * options into the pseudo header. When we constructed 4362 * a pseudo header, we did not copy some of the mutable 4363 * fields. We do it now by calling ah_fix_phdr_v6() 4364 * with the last argument B_TRUE. It returns the 4365 * ah_offset into the pseudo header. 4366 */ 4367 4368 bcopy(ip6h, nip6h, IPV6_HDR_LEN); 4369 ah_offset = ah_fix_phdr_v6(nip6h, ip6h, B_TRUE, B_TRUE); 4370 ASSERT(ah_offset != 0); 4371 /* 4372 * phdr_mp can hold exactly the whole IP header with options 4373 * plus the AH header also. Thus subtracting the AH header's 4374 * size should give exactly how much of the original header 4375 * should be skipped. 4376 */ 4377 hdrs_length = (phdr_mp->b_wptr - phdr_mp->b_rptr) - 4378 sizeof (ah_t) - icv_len; 4379 bcopy(phdr_mp->b_wptr, ((uint8_t *)nip6h + ah_offset + 4380 sizeof (ah_t)), icv_len); 4381 length = ntohs(nip6h->ip6_plen); 4382 length += (sizeof (ah_t) + align_len); 4383 nip6h->ip6_plen = htons((uint16_t)length); 4384 } 4385 4386 /* Skip the original IP header */ 4387 mp->b_rptr += hdrs_length; 4388 if (mp->b_rptr == mp->b_wptr) { 4389 phdr_mp->b_cont = mp->b_cont; 4390 freeb(mp); 4391 } 4392 4393 return (IPSEC_STATUS_SUCCESS); 4394 } 4395 4396 /* 4397 * Wrapper to allow IP to trigger an AH association failure message 4398 * during SA inbound selection. 4399 */ 4400 void 4401 ipsecah_in_assocfailure(mblk_t *mp, char level, ushort_t sl, char *fmt, 4402 uint32_t spi, void *addr, int af, ipsecah_stack_t *ahstack) 4403 { 4404 ipsec_stack_t *ipss = ahstack->ipsecah_netstack->netstack_ipsec; 4405 4406 if (ahstack->ipsecah_log_unknown_spi) { 4407 ipsec_assocfailure(info.mi_idnum, 0, level, sl, fmt, spi, 4408 addr, af, ahstack->ipsecah_netstack); 4409 } 4410 4411 ip_drop_packet(mp, B_TRUE, NULL, NULL, 4412 DROPPER(ipss, ipds_ah_no_sa), 4413 &ahstack->ah_dropper); 4414 } 4415 4416 /* 4417 * Initialize the AH input and output processing functions. 4418 */ 4419 void 4420 ipsecah_init_funcs(ipsa_t *sa) 4421 { 4422 if (sa->ipsa_output_func == NULL) 4423 sa->ipsa_output_func = ah_outbound; 4424 if (sa->ipsa_input_func == NULL) 4425 sa->ipsa_input_func = ah_inbound; 4426 } 4427