17c478bd9Sstevel@tonic-gate /*
27c478bd9Sstevel@tonic-gate * CDDL HEADER START
37c478bd9Sstevel@tonic-gate *
47c478bd9Sstevel@tonic-gate * The contents of this file are subject to the terms of the
55dddb8baSkcpoon * Common Development and Distribution License (the "License").
65dddb8baSkcpoon * You may not use this file except in compliance with the License.
77c478bd9Sstevel@tonic-gate *
87c478bd9Sstevel@tonic-gate * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
97c478bd9Sstevel@tonic-gate * or http://www.opensolaris.org/os/licensing.
107c478bd9Sstevel@tonic-gate * See the License for the specific language governing permissions
117c478bd9Sstevel@tonic-gate * and limitations under the License.
127c478bd9Sstevel@tonic-gate *
137c478bd9Sstevel@tonic-gate * When distributing Covered Code, include this CDDL HEADER in each
147c478bd9Sstevel@tonic-gate * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
157c478bd9Sstevel@tonic-gate * If applicable, add the following below this CDDL HEADER, with the
167c478bd9Sstevel@tonic-gate * fields enclosed by brackets "[]" replaced with your own identifying
177c478bd9Sstevel@tonic-gate * information: Portions Copyright [yyyy] [name of copyright owner]
187c478bd9Sstevel@tonic-gate *
197c478bd9Sstevel@tonic-gate * CDDL HEADER END
207c478bd9Sstevel@tonic-gate */
215dddb8baSkcpoon
227c478bd9Sstevel@tonic-gate /*
23fd7b5aedSGeorge Shepherd * Copyright (c) 2004, 2010, Oracle and/or its affiliates. All rights reserved.
247c478bd9Sstevel@tonic-gate */
257c478bd9Sstevel@tonic-gate
267c478bd9Sstevel@tonic-gate #include <sys/types.h>
277c478bd9Sstevel@tonic-gate #include <sys/stream.h>
287c478bd9Sstevel@tonic-gate #include <sys/strsubr.h>
297c478bd9Sstevel@tonic-gate #include <sys/stropts.h>
307c478bd9Sstevel@tonic-gate #include <sys/strsun.h>
317c478bd9Sstevel@tonic-gate #define _SUN_TPI_VERSION 2
327c478bd9Sstevel@tonic-gate #include <sys/tihdr.h>
337c478bd9Sstevel@tonic-gate #include <sys/ddi.h>
347c478bd9Sstevel@tonic-gate #include <sys/sunddi.h>
357c478bd9Sstevel@tonic-gate #include <sys/xti_inet.h>
367c478bd9Sstevel@tonic-gate #include <sys/cmn_err.h>
377c478bd9Sstevel@tonic-gate #include <sys/debug.h>
387c478bd9Sstevel@tonic-gate #include <sys/vtrace.h>
397c478bd9Sstevel@tonic-gate #include <sys/kmem.h>
407c478bd9Sstevel@tonic-gate #include <sys/cpuvar.h>
417c478bd9Sstevel@tonic-gate #include <sys/random.h>
4245916cd2Sjpk #include <sys/priv.h>
43f4b3ec61Sdh155122 #include <sys/sunldi.h>
447c478bd9Sstevel@tonic-gate
457c478bd9Sstevel@tonic-gate #include <sys/errno.h>
467c478bd9Sstevel@tonic-gate #include <sys/signal.h>
477c478bd9Sstevel@tonic-gate #include <sys/socket.h>
487c478bd9Sstevel@tonic-gate #include <sys/isa_defs.h>
497c478bd9Sstevel@tonic-gate #include <netinet/in.h>
507c478bd9Sstevel@tonic-gate #include <netinet/tcp.h>
517c478bd9Sstevel@tonic-gate #include <netinet/ip6.h>
527c478bd9Sstevel@tonic-gate #include <netinet/icmp6.h>
537c478bd9Sstevel@tonic-gate #include <netinet/sctp.h>
547c478bd9Sstevel@tonic-gate #include <net/if.h>
557c478bd9Sstevel@tonic-gate
567c478bd9Sstevel@tonic-gate #include <inet/common.h>
577c478bd9Sstevel@tonic-gate #include <inet/ip.h>
58bd670b35SErik Nordmark #include <inet/ip_if.h>
59bd670b35SErik Nordmark #include <inet/ip_ire.h>
607c478bd9Sstevel@tonic-gate #include <inet/ip6.h>
617c478bd9Sstevel@tonic-gate #include <inet/mi.h>
627c478bd9Sstevel@tonic-gate #include <inet/mib2.h>
63f4b3ec61Sdh155122 #include <inet/kstatcom.h>
647c478bd9Sstevel@tonic-gate #include <inet/optcom.h>
657c478bd9Sstevel@tonic-gate #include <inet/ipclassifier.h>
667c478bd9Sstevel@tonic-gate #include <inet/ipsec_impl.h>
677c478bd9Sstevel@tonic-gate #include <inet/sctp_ip.h>
687c478bd9Sstevel@tonic-gate #include <inet/sctp_crc32.h>
697c478bd9Sstevel@tonic-gate
707c478bd9Sstevel@tonic-gate #include "sctp_impl.h"
717c478bd9Sstevel@tonic-gate #include "sctp_addr.h"
721d8c4025Svi117747 #include "sctp_asconf.h"
737c478bd9Sstevel@tonic-gate
747c478bd9Sstevel@tonic-gate int sctpdebug;
757c478bd9Sstevel@tonic-gate sin6_t sctp_sin6_null; /* Zero address for quick clears */
767c478bd9Sstevel@tonic-gate
777c478bd9Sstevel@tonic-gate static void sctp_closei_local(sctp_t *sctp);
787c478bd9Sstevel@tonic-gate static int sctp_init_values(sctp_t *, sctp_t *, int);
797c478bd9Sstevel@tonic-gate static void sctp_icmp_error_ipv6(sctp_t *sctp, mblk_t *mp);
807c478bd9Sstevel@tonic-gate static void sctp_process_recvq(void *);
81f4b3ec61Sdh155122 static void sctp_rq_tq_init(sctp_stack_t *);
82f4b3ec61Sdh155122 static void sctp_rq_tq_fini(sctp_stack_t *);
837c478bd9Sstevel@tonic-gate static void sctp_conn_cache_init();
847c478bd9Sstevel@tonic-gate static void sctp_conn_cache_fini();
857c478bd9Sstevel@tonic-gate static int sctp_conn_cache_constructor();
867c478bd9Sstevel@tonic-gate static void sctp_conn_cache_destructor();
87121e5416Skcpoon static void sctp_conn_clear(conn_t *);
88bd670b35SErik Nordmark static void sctp_notify(void *, ip_xmit_attr_t *, ixa_notify_type_t,
89bd670b35SErik Nordmark ixa_notify_arg_t);
90f4b3ec61Sdh155122
91f4b3ec61Sdh155122 static void *sctp_stack_init(netstackid_t stackid, netstack_t *ns);
92f4b3ec61Sdh155122 static void sctp_stack_fini(netstackid_t stackid, void *arg);
937c478bd9Sstevel@tonic-gate
947c478bd9Sstevel@tonic-gate /*
957c478bd9Sstevel@tonic-gate * SCTP receive queue taskq
967c478bd9Sstevel@tonic-gate *
977c478bd9Sstevel@tonic-gate * At SCTP initialization time, a default taskq is created for
987c478bd9Sstevel@tonic-gate * servicing packets received when the interrupt thread cannot
997c478bd9Sstevel@tonic-gate * get a hold on the sctp_t. The number of taskq can be increased in
1007c478bd9Sstevel@tonic-gate * sctp_find_next_tq() when an existing taskq cannot be dispatched.
1017c478bd9Sstevel@tonic-gate * The taskqs are never removed. But the max number of taskq which
1027c478bd9Sstevel@tonic-gate * can be created is controlled by sctp_recvq_tq_list_max_sz. Note
1037c478bd9Sstevel@tonic-gate * that SCTP recvq taskq is not tied to any specific CPU or ill.
1047c478bd9Sstevel@tonic-gate *
1057c478bd9Sstevel@tonic-gate * Those taskqs are stored in an array recvq_tq_list. And they are
1067c478bd9Sstevel@tonic-gate * used in a round robin fashion. The current taskq being used is
1077c478bd9Sstevel@tonic-gate * determined by recvq_tq_list_cur.
1087c478bd9Sstevel@tonic-gate */
1097c478bd9Sstevel@tonic-gate
110f4b3ec61Sdh155122 /* /etc/system variables */
1117c478bd9Sstevel@tonic-gate /* The minimum number of threads for each taskq. */
1127c478bd9Sstevel@tonic-gate int sctp_recvq_tq_thr_min = 4;
1137c478bd9Sstevel@tonic-gate /* The maximum number of threads for each taskq. */
1145dd46ab5SKacheong Poon int sctp_recvq_tq_thr_max = 48;
/* The minimum number of tasks for each taskq. */
1165dd46ab5SKacheong Poon int sctp_recvq_tq_task_min = 8;
1175dd46ab5SKacheong Poon /* Default value of sctp_recvq_tq_list_max_sz. */
1185dd46ab5SKacheong Poon int sctp_recvq_tq_list_max = 16;
1197c478bd9Sstevel@tonic-gate
1206e91bba0SGirish Moodalbail /*
1216e91bba0SGirish Moodalbail * SCTP tunables related declarations. Definitions are in sctp_tunables.c
1226e91bba0SGirish Moodalbail */
1236e91bba0SGirish Moodalbail extern mod_prop_info_t sctp_propinfo_tbl[];
1246e91bba0SGirish Moodalbail extern int sctp_propinfo_count;
1256e91bba0SGirish Moodalbail
1267c478bd9Sstevel@tonic-gate /* sctp_t/conn_t kmem cache */
1277c478bd9Sstevel@tonic-gate struct kmem_cache *sctp_conn_cache;
1287c478bd9Sstevel@tonic-gate
/*
 * Set sctp_condemned on the given sctp_t while holding its sctp_reflock.
 *
 * The body is wrapped in do { } while (0) so that the macro expands to
 * exactly one statement and therefore remains correct when used as the
 * body of an unbraced if/else.  Invoke it with a trailing semicolon.
 */
#define	SCTP_CONDEMNED(sctp)					\
	do {							\
		mutex_enter(&(sctp)->sctp_reflock);		\
		(sctp)->sctp_condemned = B_TRUE;		\
		mutex_exit(&(sctp)->sctp_reflock);		\
	} while (0)
1337c478bd9Sstevel@tonic-gate
/*
 * Link/unlink a sctp_t to/from the global list of a SCTP stack instance.
 *
 * Both macros perform the list operation while holding sctps_g_lock.
 * SCTP_UNLINK additionally asserts that the sctp_t has already been
 * marked condemned.
 *
 * Every macro argument is parenthesized and each body is wrapped in
 * do { } while (0), so the macros accept arbitrary pointer expressions
 * and expand to a single statement.  Invoke them with a trailing
 * semicolon.
 */
#define	SCTP_LINK(sctp, sctps)						\
	do {								\
		mutex_enter(&(sctps)->sctps_g_lock);			\
		list_insert_tail(&(sctps)->sctps_g_list, (sctp));	\
		mutex_exit(&(sctps)->sctps_g_lock);			\
	} while (0)

#define	SCTP_UNLINK(sctp, sctps)					\
	do {								\
		mutex_enter(&(sctps)->sctps_g_lock);			\
		ASSERT((sctp)->sctp_condemned);				\
		list_remove(&(sctps)->sctps_g_list, (sctp));		\
		mutex_exit(&(sctps)->sctps_g_lock);			\
	} while (0)
1457c478bd9Sstevel@tonic-gate
1467c478bd9Sstevel@tonic-gate /*
1471d8c4025Svi117747 * Hooks for Sun Cluster. On non-clustered nodes these will remain NULL.
1481d8c4025Svi117747 * PSARC/2005/602.
1491d8c4025Svi117747 */
1501d8c4025Svi117747 void (*cl_sctp_listen)(sa_family_t, uchar_t *, uint_t, in_port_t) = NULL;
1511d8c4025Svi117747 void (*cl_sctp_unlisten)(sa_family_t, uchar_t *, uint_t, in_port_t) = NULL;
1521d8c4025Svi117747 void (*cl_sctp_connect)(sa_family_t, uchar_t *, uint_t, in_port_t,
1531d8c4025Svi117747 uchar_t *, uint_t, in_port_t, boolean_t, cl_sctp_handle_t) = NULL;
1541d8c4025Svi117747 void (*cl_sctp_disconnect)(sa_family_t, cl_sctp_handle_t) = NULL;
1551d8c4025Svi117747 void (*cl_sctp_assoc_change)(sa_family_t, uchar_t *, size_t, uint_t,
1561d8c4025Svi117747 uchar_t *, size_t, uint_t, int, cl_sctp_handle_t) = NULL;
1571d8c4025Svi117747 void (*cl_sctp_check_addrs)(sa_family_t, in_port_t, uchar_t **, size_t,
1581d8c4025Svi117747 uint_t *, boolean_t) = NULL;
1591d8c4025Svi117747 /*
1607c478bd9Sstevel@tonic-gate * Return the version number of the SCTP kernel interface.
1617c478bd9Sstevel@tonic-gate */
1627c478bd9Sstevel@tonic-gate int
sctp_itf_ver(int cl_ver)1637c478bd9Sstevel@tonic-gate sctp_itf_ver(int cl_ver)
1647c478bd9Sstevel@tonic-gate {
1657c478bd9Sstevel@tonic-gate if (cl_ver != SCTP_ITF_VER)
1667c478bd9Sstevel@tonic-gate return (-1);
1677c478bd9Sstevel@tonic-gate return (SCTP_ITF_VER);
1687c478bd9Sstevel@tonic-gate }
1697c478bd9Sstevel@tonic-gate
1707c478bd9Sstevel@tonic-gate /*
1717c478bd9Sstevel@tonic-gate * Called when we need a new sctp instantiation but don't really have a
1727c478bd9Sstevel@tonic-gate * new q to hang it off of. Copy the priv flag from the passed in structure.
1737c478bd9Sstevel@tonic-gate */
1747c478bd9Sstevel@tonic-gate sctp_t *
sctp_create_eager(sctp_t * psctp)1757c478bd9Sstevel@tonic-gate sctp_create_eager(sctp_t *psctp)
1767c478bd9Sstevel@tonic-gate {
1777c478bd9Sstevel@tonic-gate sctp_t *sctp;
1787c478bd9Sstevel@tonic-gate mblk_t *ack_mp, *hb_mp;
179bd670b35SErik Nordmark conn_t *connp;
18045916cd2Sjpk cred_t *credp;
181f4b3ec61Sdh155122 sctp_stack_t *sctps = psctp->sctp_sctps;
1827c478bd9Sstevel@tonic-gate
183f4b3ec61Sdh155122 if ((connp = ipcl_conn_create(IPCL_SCTPCONN, KM_NOSLEEP,
184f4b3ec61Sdh155122 sctps->sctps_netstack)) == NULL) {
1857c478bd9Sstevel@tonic-gate return (NULL);
186f4b3ec61Sdh155122 }
18745916cd2Sjpk
1887c478bd9Sstevel@tonic-gate sctp = CONN2SCTP(connp);
189f4b3ec61Sdh155122 sctp->sctp_sctps = sctps;
1907c478bd9Sstevel@tonic-gate
191121e5416Skcpoon if ((ack_mp = sctp_timer_alloc(sctp, sctp_ack_timer,
192121e5416Skcpoon KM_NOSLEEP)) == NULL ||
193121e5416Skcpoon (hb_mp = sctp_timer_alloc(sctp, sctp_heartbeat_timer,
194121e5416Skcpoon KM_NOSLEEP)) == NULL) {
1957c478bd9Sstevel@tonic-gate if (ack_mp != NULL)
1967c478bd9Sstevel@tonic-gate freeb(ack_mp);
197121e5416Skcpoon sctp_conn_clear(connp);
198f4b3ec61Sdh155122 sctp->sctp_sctps = NULL;
1997c478bd9Sstevel@tonic-gate kmem_cache_free(sctp_conn_cache, connp);
2007c478bd9Sstevel@tonic-gate return (NULL);
2017c478bd9Sstevel@tonic-gate }
2027c478bd9Sstevel@tonic-gate
2037c478bd9Sstevel@tonic-gate sctp->sctp_ack_mp = ack_mp;
2047c478bd9Sstevel@tonic-gate sctp->sctp_heartbeat_mp = hb_mp;
2057c478bd9Sstevel@tonic-gate
2067c478bd9Sstevel@tonic-gate if (sctp_init_values(sctp, psctp, KM_NOSLEEP) != 0) {
2077c478bd9Sstevel@tonic-gate freeb(ack_mp);
2087c478bd9Sstevel@tonic-gate freeb(hb_mp);
209121e5416Skcpoon sctp_conn_clear(connp);
210f4b3ec61Sdh155122 sctp->sctp_sctps = NULL;
2117c478bd9Sstevel@tonic-gate kmem_cache_free(sctp_conn_cache, connp);
2127c478bd9Sstevel@tonic-gate return (NULL);
2137c478bd9Sstevel@tonic-gate }
21445916cd2Sjpk
215bd670b35SErik Nordmark if ((credp = psctp->sctp_connp->conn_cred) != NULL) {
21645916cd2Sjpk connp->conn_cred = credp;
21745916cd2Sjpk crhold(credp);
2187c478bd9Sstevel@tonic-gate }
2195d0bc3edSsommerfe
2207c478bd9Sstevel@tonic-gate sctp->sctp_mss = psctp->sctp_mss;
2217c478bd9Sstevel@tonic-gate sctp->sctp_detached = B_TRUE;
2227c478bd9Sstevel@tonic-gate /*
2237c478bd9Sstevel@tonic-gate * Link to the global as soon as possible so that this sctp_t
2247c478bd9Sstevel@tonic-gate * can be found.
2257c478bd9Sstevel@tonic-gate */
226f4b3ec61Sdh155122 SCTP_LINK(sctp, sctps);
2277c478bd9Sstevel@tonic-gate
2285dd46ab5SKacheong Poon /* If the listener has a limit, inherit the counter info. */
2295dd46ab5SKacheong Poon sctp->sctp_listen_cnt = psctp->sctp_listen_cnt;
2305dd46ab5SKacheong Poon
2317c478bd9Sstevel@tonic-gate return (sctp);
2327c478bd9Sstevel@tonic-gate }
2337c478bd9Sstevel@tonic-gate
2347c478bd9Sstevel@tonic-gate /*
2357c478bd9Sstevel@tonic-gate * We are dying for some reason. Try to do it gracefully.
2367c478bd9Sstevel@tonic-gate */
2377c478bd9Sstevel@tonic-gate void
sctp_clean_death(sctp_t * sctp,int err)2387c478bd9Sstevel@tonic-gate sctp_clean_death(sctp_t *sctp, int err)
2397c478bd9Sstevel@tonic-gate {
2407c478bd9Sstevel@tonic-gate ASSERT(sctp != NULL);
2417c478bd9Sstevel@tonic-gate
24245916cd2Sjpk dprint(3, ("sctp_clean_death %p, state %d\n", (void *)sctp,
24345916cd2Sjpk sctp->sctp_state));
2447c478bd9Sstevel@tonic-gate
2457c478bd9Sstevel@tonic-gate sctp->sctp_client_errno = err;
2467c478bd9Sstevel@tonic-gate /*
2477c478bd9Sstevel@tonic-gate * Check to see if we need to notify upper layer.
2487c478bd9Sstevel@tonic-gate */
2497c478bd9Sstevel@tonic-gate if ((sctp->sctp_state >= SCTPS_COOKIE_WAIT) &&
2507c478bd9Sstevel@tonic-gate !SCTP_IS_DETACHED(sctp)) {
2517c478bd9Sstevel@tonic-gate if (sctp->sctp_xmit_head || sctp->sctp_xmit_unsent) {
2527c478bd9Sstevel@tonic-gate sctp_regift_xmitlist(sctp);
2537c478bd9Sstevel@tonic-gate }
2540f1702c5SYu Xiangning if (sctp->sctp_ulp_disconnected(sctp->sctp_ulpd, 0, err)) {
2557c478bd9Sstevel@tonic-gate /*
2567c478bd9Sstevel@tonic-gate * Socket is gone, detach.
2577c478bd9Sstevel@tonic-gate */
2587c478bd9Sstevel@tonic-gate sctp->sctp_detached = B_TRUE;
2597c478bd9Sstevel@tonic-gate sctp->sctp_ulpd = NULL;
2600f1702c5SYu Xiangning sctp->sctp_upcalls = NULL;
2617c478bd9Sstevel@tonic-gate }
2627c478bd9Sstevel@tonic-gate }
2637c478bd9Sstevel@tonic-gate
2647c478bd9Sstevel@tonic-gate /* Remove this sctp from all hashes. */
2657c478bd9Sstevel@tonic-gate sctp_closei_local(sctp);
2667c478bd9Sstevel@tonic-gate
2677c478bd9Sstevel@tonic-gate /*
2687c478bd9Sstevel@tonic-gate * If the sctp_t is detached, we need to finish freeing up
2697c478bd9Sstevel@tonic-gate * the resources. At this point, ip_fanout_sctp() should have
2707c478bd9Sstevel@tonic-gate * a hold on this sctp_t. Some thread doing snmp stuff can
2717c478bd9Sstevel@tonic-gate * have a hold. And a taskq can also have a hold waiting to
2727c478bd9Sstevel@tonic-gate * work. sctp_unlink() the sctp_t from the global list so
2737c478bd9Sstevel@tonic-gate * that no new thread can find it. Then do a SCTP_REFRELE().
2747c478bd9Sstevel@tonic-gate * The sctp_t will be freed after all those threads are done.
2757c478bd9Sstevel@tonic-gate */
2767c478bd9Sstevel@tonic-gate if (SCTP_IS_DETACHED(sctp)) {
2777c478bd9Sstevel@tonic-gate SCTP_CONDEMNED(sctp);
2787c478bd9Sstevel@tonic-gate SCTP_REFRELE(sctp);
2797c478bd9Sstevel@tonic-gate }
2807c478bd9Sstevel@tonic-gate }
2817c478bd9Sstevel@tonic-gate
2827c478bd9Sstevel@tonic-gate /*
2837c478bd9Sstevel@tonic-gate * Called by upper layer when it wants to close this association.
2847c478bd9Sstevel@tonic-gate * Depending on the state of this assoication, we need to do
2857c478bd9Sstevel@tonic-gate * different things.
2867c478bd9Sstevel@tonic-gate *
2877c478bd9Sstevel@tonic-gate * If the state is below COOKIE_ECHOED or it is COOKIE_ECHOED but with
2887c478bd9Sstevel@tonic-gate * no sent data, just remove this sctp from all the hashes. This
2897c478bd9Sstevel@tonic-gate * makes sure that all packets from the other end will go to the default
2907c478bd9Sstevel@tonic-gate * sctp handling. The upper layer will then do a sctp_close() to clean
2917c478bd9Sstevel@tonic-gate * up.
2927c478bd9Sstevel@tonic-gate *
2937c478bd9Sstevel@tonic-gate * Otherwise, check and see if SO_LINGER is set. If it is set, check
2947c478bd9Sstevel@tonic-gate * the value. If the value is 0, consider this an abortive close. Send
2957c478bd9Sstevel@tonic-gate * an ABORT message and kill the associatiion.
2967c478bd9Sstevel@tonic-gate *
2977c478bd9Sstevel@tonic-gate */
2987c478bd9Sstevel@tonic-gate int
sctp_disconnect(sctp_t * sctp)2997c478bd9Sstevel@tonic-gate sctp_disconnect(sctp_t *sctp)
3007c478bd9Sstevel@tonic-gate {
3017c478bd9Sstevel@tonic-gate int error = 0;
302bd670b35SErik Nordmark conn_t *connp = sctp->sctp_connp;
3037c478bd9Sstevel@tonic-gate
30445916cd2Sjpk dprint(3, ("sctp_disconnect %p, state %d\n", (void *)sctp,
30545916cd2Sjpk sctp->sctp_state));
3067c478bd9Sstevel@tonic-gate
3077c478bd9Sstevel@tonic-gate RUN_SCTP(sctp);
3087c478bd9Sstevel@tonic-gate
3097c478bd9Sstevel@tonic-gate switch (sctp->sctp_state) {
3107c478bd9Sstevel@tonic-gate case SCTPS_IDLE:
3117c478bd9Sstevel@tonic-gate case SCTPS_BOUND:
3127c478bd9Sstevel@tonic-gate case SCTPS_LISTEN:
3137c478bd9Sstevel@tonic-gate break;
3147c478bd9Sstevel@tonic-gate case SCTPS_COOKIE_WAIT:
3157c478bd9Sstevel@tonic-gate case SCTPS_COOKIE_ECHOED:
3167c478bd9Sstevel@tonic-gate /*
3177c478bd9Sstevel@tonic-gate * Close during the connect 3-way handshake
3187c478bd9Sstevel@tonic-gate * but here there may or may not be pending data
3197c478bd9Sstevel@tonic-gate * already on queue. Process almost same as in
3207c478bd9Sstevel@tonic-gate * the ESTABLISHED state.
3217c478bd9Sstevel@tonic-gate */
3227c478bd9Sstevel@tonic-gate if (sctp->sctp_xmit_head == NULL &&
3237c478bd9Sstevel@tonic-gate sctp->sctp_xmit_unsent == NULL) {
3247c478bd9Sstevel@tonic-gate break;
3257c478bd9Sstevel@tonic-gate }
3267c478bd9Sstevel@tonic-gate /* FALLTHRU */
3277c478bd9Sstevel@tonic-gate default:
3287c478bd9Sstevel@tonic-gate /*
329e6f13f86SKacheong Poon * If SO_LINGER has set a zero linger time, terminate the
330e6f13f86SKacheong Poon * association and send an ABORT.
3317c478bd9Sstevel@tonic-gate */
332bd670b35SErik Nordmark if (connp->conn_linger && connp->conn_lingertime == 0) {
333e6f13f86SKacheong Poon sctp_user_abort(sctp, NULL);
334e6f13f86SKacheong Poon WAKE_SCTP(sctp);
335e6f13f86SKacheong Poon return (error);
3367c478bd9Sstevel@tonic-gate }
3377c478bd9Sstevel@tonic-gate
3387c478bd9Sstevel@tonic-gate /*
339a215d4ebSKacheong Poon * If there is unread data, send an ABORT and terminate the
340e6f13f86SKacheong Poon * association.
3411d8c4025Svi117747 */
342a215d4ebSKacheong Poon if (sctp->sctp_rxqueued > 0 || sctp->sctp_ulp_rxqueued > 0) {
343e6f13f86SKacheong Poon sctp_user_abort(sctp, NULL);
344e6f13f86SKacheong Poon WAKE_SCTP(sctp);
345e6f13f86SKacheong Poon return (error);
3461d8c4025Svi117747 }
3471d8c4025Svi117747 /*
3487c478bd9Sstevel@tonic-gate * Transmit the shutdown before detaching the sctp_t.
3497c478bd9Sstevel@tonic-gate * After sctp_detach returns this queue/perimeter
3507c478bd9Sstevel@tonic-gate * no longer owns the sctp_t thus others can modify it.
3517c478bd9Sstevel@tonic-gate */
3527c478bd9Sstevel@tonic-gate sctp_send_shutdown(sctp, 0);
3537c478bd9Sstevel@tonic-gate
3547c478bd9Sstevel@tonic-gate /* Pass gathered wisdom to IP for keeping */
355bd670b35SErik Nordmark sctp_update_dce(sctp);
3567c478bd9Sstevel@tonic-gate
3577c478bd9Sstevel@tonic-gate /*
3587c478bd9Sstevel@tonic-gate * If lingering on close then wait until the shutdown
3597c478bd9Sstevel@tonic-gate * is complete, or the SO_LINGER time passes, or an
3607c478bd9Sstevel@tonic-gate * ABORT is sent/received. Note that sctp_disconnect()
3617c478bd9Sstevel@tonic-gate * can be called more than once. Make sure that only
3627c478bd9Sstevel@tonic-gate * one thread waits.
3637c478bd9Sstevel@tonic-gate */
364bd670b35SErik Nordmark if (connp->conn_linger && connp->conn_lingertime > 0 &&
3657c478bd9Sstevel@tonic-gate sctp->sctp_state >= SCTPS_ESTABLISHED &&
3667c478bd9Sstevel@tonic-gate !sctp->sctp_lingering) {
3677c478bd9Sstevel@tonic-gate clock_t stoptime; /* in ticks */
3687c478bd9Sstevel@tonic-gate clock_t ret;
3697c478bd9Sstevel@tonic-gate
3707c478bd9Sstevel@tonic-gate sctp->sctp_lingering = 1;
3717c478bd9Sstevel@tonic-gate sctp->sctp_client_errno = 0;
372d3d50737SRafael Vanoni stoptime = ddi_get_lbolt() +
373d3d50737SRafael Vanoni connp->conn_lingertime * hz;
3747c478bd9Sstevel@tonic-gate
3757c478bd9Sstevel@tonic-gate mutex_enter(&sctp->sctp_lock);
3767c478bd9Sstevel@tonic-gate sctp->sctp_running = B_FALSE;
3777c478bd9Sstevel@tonic-gate while (sctp->sctp_state >= SCTPS_ESTABLISHED &&
3787c478bd9Sstevel@tonic-gate sctp->sctp_client_errno == 0) {
3795dd46ab5SKacheong Poon cv_signal(&sctp->sctp_cv);
3807c478bd9Sstevel@tonic-gate ret = cv_timedwait_sig(&sctp->sctp_cv,
3817c478bd9Sstevel@tonic-gate &sctp->sctp_lock, stoptime);
3827c478bd9Sstevel@tonic-gate if (ret < 0) {
3837c478bd9Sstevel@tonic-gate /* Stoptime has reached. */
3847c478bd9Sstevel@tonic-gate sctp->sctp_client_errno = EWOULDBLOCK;
3857c478bd9Sstevel@tonic-gate break;
3867c478bd9Sstevel@tonic-gate } else if (ret == 0) {
3877c478bd9Sstevel@tonic-gate /* Got a signal. */
3887c478bd9Sstevel@tonic-gate break;
3897c478bd9Sstevel@tonic-gate }
3907c478bd9Sstevel@tonic-gate }
3917c478bd9Sstevel@tonic-gate error = sctp->sctp_client_errno;
3927c478bd9Sstevel@tonic-gate sctp->sctp_client_errno = 0;
3937c478bd9Sstevel@tonic-gate mutex_exit(&sctp->sctp_lock);
3947c478bd9Sstevel@tonic-gate }
3957c478bd9Sstevel@tonic-gate
3967c478bd9Sstevel@tonic-gate WAKE_SCTP(sctp);
3977c478bd9Sstevel@tonic-gate return (error);
3987c478bd9Sstevel@tonic-gate }
3997c478bd9Sstevel@tonic-gate
4007c478bd9Sstevel@tonic-gate
4017c478bd9Sstevel@tonic-gate /* Remove this sctp from all hashes so nobody can find it. */
4027c478bd9Sstevel@tonic-gate sctp_closei_local(sctp);
4037c478bd9Sstevel@tonic-gate WAKE_SCTP(sctp);
4047c478bd9Sstevel@tonic-gate return (error);
4057c478bd9Sstevel@tonic-gate }
4067c478bd9Sstevel@tonic-gate
4077c478bd9Sstevel@tonic-gate void
sctp_close(sctp_t * sctp)4087c478bd9Sstevel@tonic-gate sctp_close(sctp_t *sctp)
4097c478bd9Sstevel@tonic-gate {
41045916cd2Sjpk dprint(3, ("sctp_close %p, state %d\n", (void *)sctp,
41145916cd2Sjpk sctp->sctp_state));
4127c478bd9Sstevel@tonic-gate
4137c478bd9Sstevel@tonic-gate RUN_SCTP(sctp);
4147c478bd9Sstevel@tonic-gate sctp->sctp_detached = 1;
4157c478bd9Sstevel@tonic-gate sctp->sctp_ulpd = NULL;
4160f1702c5SYu Xiangning sctp->sctp_upcalls = NULL;
4177c478bd9Sstevel@tonic-gate bzero(&sctp->sctp_events, sizeof (sctp->sctp_events));
4187c478bd9Sstevel@tonic-gate
4197c478bd9Sstevel@tonic-gate /* If the graceful shutdown has not been completed, just return. */
4207c478bd9Sstevel@tonic-gate if (sctp->sctp_state != SCTPS_IDLE) {
4217c478bd9Sstevel@tonic-gate WAKE_SCTP(sctp);
4227c478bd9Sstevel@tonic-gate return;
4237c478bd9Sstevel@tonic-gate }
4247c478bd9Sstevel@tonic-gate
4257c478bd9Sstevel@tonic-gate /*
4267c478bd9Sstevel@tonic-gate * Since sctp_t is in SCTPS_IDLE state, so the only thread which
4277c478bd9Sstevel@tonic-gate * can have a hold on the sctp_t is doing snmp stuff. Just do
4287c478bd9Sstevel@tonic-gate * a SCTP_REFRELE() here after the SCTP_UNLINK(). It will
4297c478bd9Sstevel@tonic-gate * be freed when the other thread is done.
4307c478bd9Sstevel@tonic-gate */
4317c478bd9Sstevel@tonic-gate SCTP_CONDEMNED(sctp);
4327c478bd9Sstevel@tonic-gate WAKE_SCTP(sctp);
4337c478bd9Sstevel@tonic-gate SCTP_REFRELE(sctp);
4347c478bd9Sstevel@tonic-gate }
4357c478bd9Sstevel@tonic-gate
4367c478bd9Sstevel@tonic-gate /*
4377c478bd9Sstevel@tonic-gate * Unlink from global list and do the eager close.
4387c478bd9Sstevel@tonic-gate * Remove the refhold implicit in being on the global list.
4397c478bd9Sstevel@tonic-gate */
4407c478bd9Sstevel@tonic-gate void
sctp_close_eager(sctp_t * sctp)4417c478bd9Sstevel@tonic-gate sctp_close_eager(sctp_t *sctp)
4427c478bd9Sstevel@tonic-gate {
4437c478bd9Sstevel@tonic-gate SCTP_CONDEMNED(sctp);
4447c478bd9Sstevel@tonic-gate sctp_closei_local(sctp);
4457c478bd9Sstevel@tonic-gate SCTP_REFRELE(sctp);
4467c478bd9Sstevel@tonic-gate }
4477c478bd9Sstevel@tonic-gate
4487c478bd9Sstevel@tonic-gate /*
4497c478bd9Sstevel@tonic-gate * The sctp_t is going away. Remove it from all lists and set it
4507c478bd9Sstevel@tonic-gate * to SCTPS_IDLE. The caller has to remove it from the
4517c478bd9Sstevel@tonic-gate * global list. The freeing up of memory is deferred until
4527c478bd9Sstevel@tonic-gate * sctp_free(). This is needed since a thread in sctp_input() might have
4537c478bd9Sstevel@tonic-gate * done a SCTP_REFHOLD on this structure before it was removed from the
4547c478bd9Sstevel@tonic-gate * hashes.
4557c478bd9Sstevel@tonic-gate */
4567c478bd9Sstevel@tonic-gate static void
sctp_closei_local(sctp_t * sctp)4577c478bd9Sstevel@tonic-gate sctp_closei_local(sctp_t *sctp)
4587c478bd9Sstevel@tonic-gate {
4597c478bd9Sstevel@tonic-gate mblk_t *mp;
4607c478bd9Sstevel@tonic-gate conn_t *connp = sctp->sctp_connp;
4617c478bd9Sstevel@tonic-gate
4625dd46ab5SKacheong Poon /* The counter is incremented only for established associations. */
4635dd46ab5SKacheong Poon if (sctp->sctp_state >= SCTPS_ESTABLISHED)
4645dd46ab5SKacheong Poon SCTPS_ASSOC_DEC(sctp->sctp_sctps);
4655dd46ab5SKacheong Poon
4665dd46ab5SKacheong Poon if (sctp->sctp_listen_cnt != NULL)
4675dd46ab5SKacheong Poon SCTP_DECR_LISTEN_CNT(sctp);
4685dd46ab5SKacheong Poon
469b34b8d1aSkcpoon /* Sanity check, don't do the same thing twice. */
470b34b8d1aSkcpoon if (connp->conn_state_flags & CONN_CLOSING) {
471b34b8d1aSkcpoon ASSERT(sctp->sctp_state == SCTPS_IDLE);
472b34b8d1aSkcpoon return;
473b34b8d1aSkcpoon }
474b34b8d1aSkcpoon
4757c478bd9Sstevel@tonic-gate /* Stop and free the timers */
4767c478bd9Sstevel@tonic-gate sctp_free_faddr_timers(sctp);
4777c478bd9Sstevel@tonic-gate if ((mp = sctp->sctp_heartbeat_mp) != NULL) {
4787c478bd9Sstevel@tonic-gate sctp_timer_free(mp);
4797c478bd9Sstevel@tonic-gate sctp->sctp_heartbeat_mp = NULL;
4807c478bd9Sstevel@tonic-gate }
4817c478bd9Sstevel@tonic-gate if ((mp = sctp->sctp_ack_mp) != NULL) {
4827c478bd9Sstevel@tonic-gate sctp_timer_free(mp);
4837c478bd9Sstevel@tonic-gate sctp->sctp_ack_mp = NULL;
4847c478bd9Sstevel@tonic-gate }
4857c478bd9Sstevel@tonic-gate
4867c478bd9Sstevel@tonic-gate /* Set the CONN_CLOSING flag so that IP will not cache IRE again. */
4877c478bd9Sstevel@tonic-gate mutex_enter(&connp->conn_lock);
4887c478bd9Sstevel@tonic-gate connp->conn_state_flags |= CONN_CLOSING;
4897c478bd9Sstevel@tonic-gate mutex_exit(&connp->conn_lock);
4907c478bd9Sstevel@tonic-gate
4917c478bd9Sstevel@tonic-gate /* Remove from all hashes. */
4927c478bd9Sstevel@tonic-gate sctp_bind_hash_remove(sctp);
4937c478bd9Sstevel@tonic-gate sctp_conn_hash_remove(sctp);
4947c478bd9Sstevel@tonic-gate sctp_listen_hash_remove(sctp);
4957c478bd9Sstevel@tonic-gate sctp->sctp_state = SCTPS_IDLE;
4967c478bd9Sstevel@tonic-gate
4977c478bd9Sstevel@tonic-gate /*
4987c478bd9Sstevel@tonic-gate * Clean up the recvq as much as possible. All those packets
4997c478bd9Sstevel@tonic-gate * will be silently dropped as this sctp_t is now in idle state.
5007c478bd9Sstevel@tonic-gate */
5017c478bd9Sstevel@tonic-gate mutex_enter(&sctp->sctp_recvq_lock);
5027c478bd9Sstevel@tonic-gate while ((mp = sctp->sctp_recvq) != NULL) {
5037c478bd9Sstevel@tonic-gate sctp->sctp_recvq = mp->b_next;
5047c478bd9Sstevel@tonic-gate mp->b_next = NULL;
505bd670b35SErik Nordmark
506bd670b35SErik Nordmark if (ip_recv_attr_is_mblk(mp))
507bd670b35SErik Nordmark mp = ip_recv_attr_free_mblk(mp);
508bd670b35SErik Nordmark
5097c478bd9Sstevel@tonic-gate freemsg(mp);
5107c478bd9Sstevel@tonic-gate }
5117c478bd9Sstevel@tonic-gate mutex_exit(&sctp->sctp_recvq_lock);
5127c478bd9Sstevel@tonic-gate }
5137c478bd9Sstevel@tonic-gate
5147c478bd9Sstevel@tonic-gate /*
5157c478bd9Sstevel@tonic-gate * Free memory associated with the sctp/ip header template.
5167c478bd9Sstevel@tonic-gate */
5177c478bd9Sstevel@tonic-gate static void
sctp_headers_free(sctp_t * sctp)5187c478bd9Sstevel@tonic-gate sctp_headers_free(sctp_t *sctp)
5197c478bd9Sstevel@tonic-gate {
5207c478bd9Sstevel@tonic-gate if (sctp->sctp_iphc != NULL) {
5217c478bd9Sstevel@tonic-gate kmem_free(sctp->sctp_iphc, sctp->sctp_iphc_len);
5227c478bd9Sstevel@tonic-gate sctp->sctp_iphc = NULL;
5237c478bd9Sstevel@tonic-gate sctp->sctp_ipha = NULL;
5247c478bd9Sstevel@tonic-gate sctp->sctp_hdr_len = 0;
5257c478bd9Sstevel@tonic-gate sctp->sctp_ip_hdr_len = 0;
5267c478bd9Sstevel@tonic-gate sctp->sctp_iphc_len = 0;
5277c478bd9Sstevel@tonic-gate sctp->sctp_sctph = NULL;
5287c478bd9Sstevel@tonic-gate sctp->sctp_hdr_len = 0;
5297c478bd9Sstevel@tonic-gate }
5307c478bd9Sstevel@tonic-gate if (sctp->sctp_iphc6 != NULL) {
5317c478bd9Sstevel@tonic-gate kmem_free(sctp->sctp_iphc6, sctp->sctp_iphc6_len);
5327c478bd9Sstevel@tonic-gate sctp->sctp_iphc6 = NULL;
5337c478bd9Sstevel@tonic-gate sctp->sctp_ip6h = NULL;
5347c478bd9Sstevel@tonic-gate sctp->sctp_hdr6_len = 0;
5357c478bd9Sstevel@tonic-gate sctp->sctp_ip_hdr6_len = 0;
5367c478bd9Sstevel@tonic-gate sctp->sctp_iphc6_len = 0;
5377c478bd9Sstevel@tonic-gate sctp->sctp_sctph6 = NULL;
5387c478bd9Sstevel@tonic-gate sctp->sctp_hdr6_len = 0;
5397c478bd9Sstevel@tonic-gate }
5407c478bd9Sstevel@tonic-gate }
5417c478bd9Sstevel@tonic-gate
5427c478bd9Sstevel@tonic-gate static void
sctp_free_xmit_data(sctp_t * sctp)5437c478bd9Sstevel@tonic-gate sctp_free_xmit_data(sctp_t *sctp)
5447c478bd9Sstevel@tonic-gate {
5457c478bd9Sstevel@tonic-gate mblk_t *ump = NULL;
5467c478bd9Sstevel@tonic-gate mblk_t *nump;
5477c478bd9Sstevel@tonic-gate mblk_t *mp;
5487c478bd9Sstevel@tonic-gate mblk_t *nmp;
5497c478bd9Sstevel@tonic-gate
5507c478bd9Sstevel@tonic-gate sctp->sctp_xmit_unacked = NULL;
5517c478bd9Sstevel@tonic-gate ump = sctp->sctp_xmit_head;
5527c478bd9Sstevel@tonic-gate sctp->sctp_xmit_tail = sctp->sctp_xmit_head = NULL;
5537c478bd9Sstevel@tonic-gate free_unsent:
5547c478bd9Sstevel@tonic-gate for (; ump != NULL; ump = nump) {
5557c478bd9Sstevel@tonic-gate for (mp = ump->b_cont; mp != NULL; mp = nmp) {
5567c478bd9Sstevel@tonic-gate nmp = mp->b_next;
5577c478bd9Sstevel@tonic-gate mp->b_next = NULL;
5587c478bd9Sstevel@tonic-gate mp->b_prev = NULL;
5597c478bd9Sstevel@tonic-gate freemsg(mp);
5607c478bd9Sstevel@tonic-gate }
5617c478bd9Sstevel@tonic-gate ASSERT(DB_REF(ump) == 1);
5627c478bd9Sstevel@tonic-gate nump = ump->b_next;
5637c478bd9Sstevel@tonic-gate ump->b_next = NULL;
5647c478bd9Sstevel@tonic-gate ump->b_prev = NULL;
5657c478bd9Sstevel@tonic-gate ump->b_cont = NULL;
5667c478bd9Sstevel@tonic-gate freeb(ump);
5677c478bd9Sstevel@tonic-gate }
5687c478bd9Sstevel@tonic-gate if ((ump = sctp->sctp_xmit_unsent) == NULL) {
5697c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_xmit_unsent_tail == NULL);
5707c478bd9Sstevel@tonic-gate return;
5717c478bd9Sstevel@tonic-gate }
5727c478bd9Sstevel@tonic-gate sctp->sctp_xmit_unsent = sctp->sctp_xmit_unsent_tail = NULL;
5737c478bd9Sstevel@tonic-gate goto free_unsent;
5747c478bd9Sstevel@tonic-gate }
5757c478bd9Sstevel@tonic-gate
5767c478bd9Sstevel@tonic-gate /*
5777c478bd9Sstevel@tonic-gate * Cleanup all the messages in the stream queue and the reassembly lists.
5787c478bd9Sstevel@tonic-gate * If 'free' is true, then delete the streams as well.
5797c478bd9Sstevel@tonic-gate */
5807c478bd9Sstevel@tonic-gate void
sctp_instream_cleanup(sctp_t * sctp,boolean_t free)5817c478bd9Sstevel@tonic-gate sctp_instream_cleanup(sctp_t *sctp, boolean_t free)
5827c478bd9Sstevel@tonic-gate {
5837c478bd9Sstevel@tonic-gate int i;
5847c478bd9Sstevel@tonic-gate mblk_t *mp;
5857c478bd9Sstevel@tonic-gate mblk_t *mp1;
5867c478bd9Sstevel@tonic-gate
5877c478bd9Sstevel@tonic-gate if (sctp->sctp_instr != NULL) {
5887c478bd9Sstevel@tonic-gate /* walk thru and flush out anything remaining in the Q */
5897c478bd9Sstevel@tonic-gate for (i = 0; i < sctp->sctp_num_istr; i++) {
5907c478bd9Sstevel@tonic-gate mp = sctp->sctp_instr[i].istr_msgs;
5917c478bd9Sstevel@tonic-gate while (mp != NULL) {
5927c478bd9Sstevel@tonic-gate mp1 = mp->b_next;
5937c478bd9Sstevel@tonic-gate mp->b_next = mp->b_prev = NULL;
5947c478bd9Sstevel@tonic-gate freemsg(mp);
5957c478bd9Sstevel@tonic-gate mp = mp1;
5967c478bd9Sstevel@tonic-gate }
5977c478bd9Sstevel@tonic-gate sctp->sctp_instr[i].istr_msgs = NULL;
598a0263d1cSnh145002 sctp->sctp_instr[i].istr_nmsgs = 0;
5997c478bd9Sstevel@tonic-gate sctp_free_reass((sctp->sctp_instr) + i);
6007c478bd9Sstevel@tonic-gate sctp->sctp_instr[i].nextseq = 0;
6017c478bd9Sstevel@tonic-gate }
6027c478bd9Sstevel@tonic-gate if (free) {
6037c478bd9Sstevel@tonic-gate kmem_free(sctp->sctp_instr,
6047c478bd9Sstevel@tonic-gate sizeof (*sctp->sctp_instr) * sctp->sctp_num_istr);
6057c478bd9Sstevel@tonic-gate sctp->sctp_instr = NULL;
6067c478bd9Sstevel@tonic-gate sctp->sctp_num_istr = 0;
6077c478bd9Sstevel@tonic-gate }
6087c478bd9Sstevel@tonic-gate }
6097c478bd9Sstevel@tonic-gate /* un-ordered fragments */
6107c478bd9Sstevel@tonic-gate if (sctp->sctp_uo_frags != NULL) {
6117c478bd9Sstevel@tonic-gate for (mp = sctp->sctp_uo_frags; mp != NULL; mp = mp1) {
6127c478bd9Sstevel@tonic-gate mp1 = mp->b_next;
6137c478bd9Sstevel@tonic-gate mp->b_next = mp->b_prev = NULL;
6147c478bd9Sstevel@tonic-gate freemsg(mp);
6157c478bd9Sstevel@tonic-gate }
61692baa190SGeorge Shepherd sctp->sctp_uo_frags = NULL;
6177c478bd9Sstevel@tonic-gate }
6187c478bd9Sstevel@tonic-gate }
6197c478bd9Sstevel@tonic-gate
6207c478bd9Sstevel@tonic-gate /*
6217c478bd9Sstevel@tonic-gate * Last reference to the sctp_t is gone. Free all memory associated with it.
6227c478bd9Sstevel@tonic-gate * Called from SCTP_REFRELE. Called inline in sctp_close()
6237c478bd9Sstevel@tonic-gate */
6247c478bd9Sstevel@tonic-gate void
sctp_free(conn_t * connp)6257c478bd9Sstevel@tonic-gate sctp_free(conn_t *connp)
6267c478bd9Sstevel@tonic-gate {
6277c478bd9Sstevel@tonic-gate sctp_t *sctp = CONN2SCTP(connp);
6287c478bd9Sstevel@tonic-gate int cnt;
629f4b3ec61Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps;
6307c478bd9Sstevel@tonic-gate
631f4b3ec61Sdh155122 ASSERT(sctps != NULL);
6327c478bd9Sstevel@tonic-gate /* Unlink it from the global list */
633f4b3ec61Sdh155122 SCTP_UNLINK(sctp, sctps);
6347c478bd9Sstevel@tonic-gate
6357c478bd9Sstevel@tonic-gate ASSERT(connp->conn_ref == 0);
636bd670b35SErik Nordmark ASSERT(connp->conn_proto == IPPROTO_SCTP);
6377c478bd9Sstevel@tonic-gate ASSERT(!MUTEX_HELD(&sctp->sctp_reflock));
6387c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_refcnt == 0);
6397c478bd9Sstevel@tonic-gate
6407c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_ptpbhn == NULL && sctp->sctp_bind_hash == NULL);
6417c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_conn_hash_next == NULL &&
6427c478bd9Sstevel@tonic-gate sctp->sctp_conn_hash_prev == NULL);
6437c478bd9Sstevel@tonic-gate
6447c478bd9Sstevel@tonic-gate
6457c478bd9Sstevel@tonic-gate /* Free up all the resources. */
6467c478bd9Sstevel@tonic-gate
6477c478bd9Sstevel@tonic-gate /* blow away sctp stream management */
6487c478bd9Sstevel@tonic-gate if (sctp->sctp_ostrcntrs != NULL) {
6497c478bd9Sstevel@tonic-gate kmem_free(sctp->sctp_ostrcntrs,
6507c478bd9Sstevel@tonic-gate sizeof (uint16_t) * sctp->sctp_num_ostr);
6517c478bd9Sstevel@tonic-gate sctp->sctp_ostrcntrs = NULL;
6527c478bd9Sstevel@tonic-gate }
6537c478bd9Sstevel@tonic-gate sctp_instream_cleanup(sctp, B_TRUE);
6547c478bd9Sstevel@tonic-gate
6557c478bd9Sstevel@tonic-gate /* Remove all data transfer resources. */
6567c478bd9Sstevel@tonic-gate sctp->sctp_istr_nmsgs = 0;
6577c478bd9Sstevel@tonic-gate sctp->sctp_rxqueued = 0;
6587c478bd9Sstevel@tonic-gate sctp_free_xmit_data(sctp);
6597c478bd9Sstevel@tonic-gate sctp->sctp_unacked = 0;
6607c478bd9Sstevel@tonic-gate sctp->sctp_unsent = 0;
6611d8c4025Svi117747 if (sctp->sctp_cxmit_list != NULL)
6621d8c4025Svi117747 sctp_asconf_free_cxmit(sctp, NULL);
6631d8c4025Svi117747
6647c478bd9Sstevel@tonic-gate sctp->sctp_lastdata = NULL;
6657c478bd9Sstevel@tonic-gate
6667c478bd9Sstevel@tonic-gate /* Clear out default xmit settings */
6677c478bd9Sstevel@tonic-gate sctp->sctp_def_stream = 0;
6687c478bd9Sstevel@tonic-gate sctp->sctp_def_flags = 0;
6697c478bd9Sstevel@tonic-gate sctp->sctp_def_ppid = 0;
6707c478bd9Sstevel@tonic-gate sctp->sctp_def_context = 0;
6717c478bd9Sstevel@tonic-gate sctp->sctp_def_timetolive = 0;
6727c478bd9Sstevel@tonic-gate
6737c478bd9Sstevel@tonic-gate if (sctp->sctp_sack_info != NULL) {
6747c478bd9Sstevel@tonic-gate sctp_free_set(sctp->sctp_sack_info);
6757c478bd9Sstevel@tonic-gate sctp->sctp_sack_info = NULL;
6767c478bd9Sstevel@tonic-gate }
6777c478bd9Sstevel@tonic-gate sctp->sctp_sack_gaps = 0;
6787c478bd9Sstevel@tonic-gate
6797c478bd9Sstevel@tonic-gate if (sctp->sctp_cookie_mp != NULL) {
6807c478bd9Sstevel@tonic-gate freemsg(sctp->sctp_cookie_mp);
6817c478bd9Sstevel@tonic-gate sctp->sctp_cookie_mp = NULL;
6827c478bd9Sstevel@tonic-gate }
6837c478bd9Sstevel@tonic-gate
6847c478bd9Sstevel@tonic-gate /* Remove all the address resources. */
6857c478bd9Sstevel@tonic-gate sctp_zap_addrs(sctp);
6867c478bd9Sstevel@tonic-gate for (cnt = 0; cnt < SCTP_IPIF_HASH; cnt++) {
6877c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_saddrs[cnt].ipif_count == 0);
6887c478bd9Sstevel@tonic-gate list_destroy(&sctp->sctp_saddrs[cnt].sctp_ipif_list);
6897c478bd9Sstevel@tonic-gate }
6907c478bd9Sstevel@tonic-gate
6917c478bd9Sstevel@tonic-gate if (sctp->sctp_hopopts != NULL) {
6927c478bd9Sstevel@tonic-gate mi_free(sctp->sctp_hopopts);
6937c478bd9Sstevel@tonic-gate sctp->sctp_hopopts = NULL;
6947c478bd9Sstevel@tonic-gate sctp->sctp_hopoptslen = 0;
6957c478bd9Sstevel@tonic-gate }
6967c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_hopoptslen == 0);
6977c478bd9Sstevel@tonic-gate if (sctp->sctp_dstopts != NULL) {
6987c478bd9Sstevel@tonic-gate mi_free(sctp->sctp_dstopts);
6997c478bd9Sstevel@tonic-gate sctp->sctp_dstopts = NULL;
7007c478bd9Sstevel@tonic-gate sctp->sctp_dstoptslen = 0;
7017c478bd9Sstevel@tonic-gate }
7027c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_dstoptslen == 0);
703bd670b35SErik Nordmark if (sctp->sctp_rthdrdstopts != NULL) {
704bd670b35SErik Nordmark mi_free(sctp->sctp_rthdrdstopts);
705bd670b35SErik Nordmark sctp->sctp_rthdrdstopts = NULL;
706bd670b35SErik Nordmark sctp->sctp_rthdrdstoptslen = 0;
7077c478bd9Sstevel@tonic-gate }
708bd670b35SErik Nordmark ASSERT(sctp->sctp_rthdrdstoptslen == 0);
7097c478bd9Sstevel@tonic-gate if (sctp->sctp_rthdr != NULL) {
7107c478bd9Sstevel@tonic-gate mi_free(sctp->sctp_rthdr);
7117c478bd9Sstevel@tonic-gate sctp->sctp_rthdr = NULL;
7127c478bd9Sstevel@tonic-gate sctp->sctp_rthdrlen = 0;
7137c478bd9Sstevel@tonic-gate }
7147c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_rthdrlen == 0);
7157c478bd9Sstevel@tonic-gate sctp_headers_free(sctp);
7167c478bd9Sstevel@tonic-gate
7177c478bd9Sstevel@tonic-gate sctp->sctp_shutdown_faddr = NULL;
7187c478bd9Sstevel@tonic-gate
7197f093707Skcpoon if (sctp->sctp_err_chunks != NULL) {
7207f093707Skcpoon freemsg(sctp->sctp_err_chunks);
7217f093707Skcpoon sctp->sctp_err_chunks = NULL;
7227f093707Skcpoon sctp->sctp_err_len = 0;
7237f093707Skcpoon }
7247f093707Skcpoon
7257c478bd9Sstevel@tonic-gate /* Clear all the bitfields. */
7267c478bd9Sstevel@tonic-gate bzero(&sctp->sctp_bits, sizeof (sctp->sctp_bits));
7277c478bd9Sstevel@tonic-gate
7287c478bd9Sstevel@tonic-gate /* It is time to update the global statistics. */
7295dd46ab5SKacheong Poon SCTPS_UPDATE_MIB(sctps, sctpOutSCTPPkts, sctp->sctp_opkts);
7305dd46ab5SKacheong Poon SCTPS_UPDATE_MIB(sctps, sctpOutCtrlChunks, sctp->sctp_obchunks);
7315dd46ab5SKacheong Poon SCTPS_UPDATE_MIB(sctps, sctpOutOrderChunks, sctp->sctp_odchunks);
7325dd46ab5SKacheong Poon SCTPS_UPDATE_MIB(sctps, sctpOutUnorderChunks, sctp->sctp_oudchunks);
7335dd46ab5SKacheong Poon SCTPS_UPDATE_MIB(sctps, sctpRetransChunks, sctp->sctp_rxtchunks);
7345dd46ab5SKacheong Poon SCTPS_UPDATE_MIB(sctps, sctpInSCTPPkts, sctp->sctp_ipkts);
7355dd46ab5SKacheong Poon SCTPS_UPDATE_MIB(sctps, sctpInCtrlChunks, sctp->sctp_ibchunks);
7365dd46ab5SKacheong Poon SCTPS_UPDATE_MIB(sctps, sctpInOrderChunks, sctp->sctp_idchunks);
7375dd46ab5SKacheong Poon SCTPS_UPDATE_MIB(sctps, sctpInUnorderChunks, sctp->sctp_iudchunks);
7385dd46ab5SKacheong Poon SCTPS_UPDATE_MIB(sctps, sctpFragUsrMsgs, sctp->sctp_fragdmsgs);
7395dd46ab5SKacheong Poon SCTPS_UPDATE_MIB(sctps, sctpReasmUsrMsgs, sctp->sctp_reassmsgs);
7407c478bd9Sstevel@tonic-gate sctp->sctp_opkts = 0;
7417c478bd9Sstevel@tonic-gate sctp->sctp_obchunks = 0;
7427c478bd9Sstevel@tonic-gate sctp->sctp_odchunks = 0;
7437c478bd9Sstevel@tonic-gate sctp->sctp_oudchunks = 0;
7447c478bd9Sstevel@tonic-gate sctp->sctp_rxtchunks = 0;
7457c478bd9Sstevel@tonic-gate sctp->sctp_ipkts = 0;
7467c478bd9Sstevel@tonic-gate sctp->sctp_ibchunks = 0;
7477c478bd9Sstevel@tonic-gate sctp->sctp_idchunks = 0;
7487c478bd9Sstevel@tonic-gate sctp->sctp_iudchunks = 0;
7497c478bd9Sstevel@tonic-gate sctp->sctp_fragdmsgs = 0;
7507c478bd9Sstevel@tonic-gate sctp->sctp_reassmsgs = 0;
75135e12f9cSGeorge Shepherd sctp->sctp_outseqtsns = 0;
75235e12f9cSGeorge Shepherd sctp->sctp_osacks = 0;
75335e12f9cSGeorge Shepherd sctp->sctp_isacks = 0;
75435e12f9cSGeorge Shepherd sctp->sctp_idupchunks = 0;
75535e12f9cSGeorge Shepherd sctp->sctp_gapcnt = 0;
75635e12f9cSGeorge Shepherd sctp->sctp_cum_obchunks = 0;
75735e12f9cSGeorge Shepherd sctp->sctp_cum_odchunks = 0;
75835e12f9cSGeorge Shepherd sctp->sctp_cum_oudchunks = 0;
75935e12f9cSGeorge Shepherd sctp->sctp_cum_rxtchunks = 0;
76035e12f9cSGeorge Shepherd sctp->sctp_cum_ibchunks = 0;
76135e12f9cSGeorge Shepherd sctp->sctp_cum_idchunks = 0;
76235e12f9cSGeorge Shepherd sctp->sctp_cum_iudchunks = 0;
7637c478bd9Sstevel@tonic-gate
7647c478bd9Sstevel@tonic-gate sctp->sctp_autoclose = 0;
765558fbd03Skcpoon sctp->sctp_tx_adaptation_code = 0;
7667c478bd9Sstevel@tonic-gate
7677f99e6fcSkp158701 sctp->sctp_v6label_len = 0;
7687f99e6fcSkp158701 sctp->sctp_v4label_len = 0;
7697f99e6fcSkp158701
770f4b3ec61Sdh155122 sctp->sctp_sctps = NULL;
771f4b3ec61Sdh155122
772121e5416Skcpoon sctp_conn_clear(connp);
7737c478bd9Sstevel@tonic-gate kmem_cache_free(sctp_conn_cache, connp);
7747c478bd9Sstevel@tonic-gate }
7757c478bd9Sstevel@tonic-gate
7767c478bd9Sstevel@tonic-gate /*
7777c478bd9Sstevel@tonic-gate * Initialize protocol control block. If a parent exists, inherit
7787c478bd9Sstevel@tonic-gate * all values set through setsockopt().
7797c478bd9Sstevel@tonic-gate */
7807c478bd9Sstevel@tonic-gate static int
sctp_init_values(sctp_t * sctp,sctp_t * psctp,int sleep)7817c478bd9Sstevel@tonic-gate sctp_init_values(sctp_t *sctp, sctp_t *psctp, int sleep)
7827c478bd9Sstevel@tonic-gate {
7837c478bd9Sstevel@tonic-gate int err;
7847c478bd9Sstevel@tonic-gate int cnt;
785f4b3ec61Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps;
786bd670b35SErik Nordmark conn_t *connp;
7877c478bd9Sstevel@tonic-gate
788bd670b35SErik Nordmark connp = sctp->sctp_connp;
7897c478bd9Sstevel@tonic-gate
7907c478bd9Sstevel@tonic-gate sctp->sctp_nsaddrs = 0;
7917c478bd9Sstevel@tonic-gate for (cnt = 0; cnt < SCTP_IPIF_HASH; cnt++) {
7927c478bd9Sstevel@tonic-gate sctp->sctp_saddrs[cnt].ipif_count = 0;
7937c478bd9Sstevel@tonic-gate list_create(&sctp->sctp_saddrs[cnt].sctp_ipif_list,
7947c478bd9Sstevel@tonic-gate sizeof (sctp_saddr_ipif_t), offsetof(sctp_saddr_ipif_t,
7957c478bd9Sstevel@tonic-gate saddr_ipif));
7967c478bd9Sstevel@tonic-gate }
797bd670b35SErik Nordmark connp->conn_ports = 0;
7987c478bd9Sstevel@tonic-gate sctp->sctp_running = B_FALSE;
7997c478bd9Sstevel@tonic-gate sctp->sctp_state = SCTPS_IDLE;
8007c478bd9Sstevel@tonic-gate
8017c478bd9Sstevel@tonic-gate sctp->sctp_refcnt = 1;
8027c478bd9Sstevel@tonic-gate
8037c478bd9Sstevel@tonic-gate sctp->sctp_strikes = 0;
8047c478bd9Sstevel@tonic-gate
805d3d50737SRafael Vanoni sctp->sctp_last_mtu_probe = ddi_get_lbolt64();
806f4b3ec61Sdh155122 sctp->sctp_mtu_probe_intvl = sctps->sctps_mtu_probe_interval;
8077c478bd9Sstevel@tonic-gate
8087c478bd9Sstevel@tonic-gate sctp->sctp_sack_gaps = 0;
809a215d4ebSKacheong Poon /* So we will not delay sending the first SACK. */
810a215d4ebSKacheong Poon sctp->sctp_sack_toggle = sctps->sctps_deferred_acks_max;
8117c478bd9Sstevel@tonic-gate
812121e5416Skcpoon /* Only need to do the allocation if there is no "cached" one. */
813121e5416Skcpoon if (sctp->sctp_pad_mp == NULL) {
814121e5416Skcpoon if (sleep == KM_SLEEP) {
815121e5416Skcpoon sctp->sctp_pad_mp = allocb_wait(SCTP_ALIGN, BPRI_MED,
816121e5416Skcpoon STR_NOSIG, NULL);
817121e5416Skcpoon } else {
818121e5416Skcpoon sctp->sctp_pad_mp = allocb(SCTP_ALIGN, BPRI_MED);
819121e5416Skcpoon if (sctp->sctp_pad_mp == NULL)
820121e5416Skcpoon return (ENOMEM);
821121e5416Skcpoon }
822121e5416Skcpoon bzero(sctp->sctp_pad_mp->b_rptr, SCTP_ALIGN);
823121e5416Skcpoon }
824121e5416Skcpoon
8257c478bd9Sstevel@tonic-gate if (psctp != NULL) {
8267c478bd9Sstevel@tonic-gate /*
8277c478bd9Sstevel@tonic-gate * Inherit from parent
828bd670b35SErik Nordmark *
829bd670b35SErik Nordmark * Start by inheriting from the conn_t, including conn_ixa and
830bd670b35SErik Nordmark * conn_xmit_ipp.
8317c478bd9Sstevel@tonic-gate */
832bd670b35SErik Nordmark err = conn_inherit_parent(psctp->sctp_connp, connp);
833bd670b35SErik Nordmark if (err != 0)
834121e5416Skcpoon goto failure;
8357c478bd9Sstevel@tonic-gate
836a215d4ebSKacheong Poon sctp->sctp_upcalls = psctp->sctp_upcalls;
837a215d4ebSKacheong Poon
8387c478bd9Sstevel@tonic-gate sctp->sctp_cookie_lifetime = psctp->sctp_cookie_lifetime;
839bd670b35SErik Nordmark
8407c478bd9Sstevel@tonic-gate sctp->sctp_cwnd_max = psctp->sctp_cwnd_max;
8417c478bd9Sstevel@tonic-gate sctp->sctp_rwnd = psctp->sctp_rwnd;
842a215d4ebSKacheong Poon sctp->sctp_arwnd = psctp->sctp_arwnd;
8437d546a59Svi117747 sctp->sctp_pd_point = psctp->sctp_pd_point;
8447c478bd9Sstevel@tonic-gate sctp->sctp_rto_max = psctp->sctp_rto_max;
845fd7b5aedSGeorge Shepherd sctp->sctp_rto_max_init = psctp->sctp_rto_max_init;
8467c478bd9Sstevel@tonic-gate sctp->sctp_rto_min = psctp->sctp_rto_min;
8477c478bd9Sstevel@tonic-gate sctp->sctp_rto_initial = psctp->sctp_rto_initial;
8487c478bd9Sstevel@tonic-gate sctp->sctp_pa_max_rxt = psctp->sctp_pa_max_rxt;
8497c478bd9Sstevel@tonic-gate sctp->sctp_pp_max_rxt = psctp->sctp_pp_max_rxt;
8507c478bd9Sstevel@tonic-gate sctp->sctp_max_init_rxt = psctp->sctp_max_init_rxt;
8517c478bd9Sstevel@tonic-gate
8527c478bd9Sstevel@tonic-gate sctp->sctp_def_stream = psctp->sctp_def_stream;
8537c478bd9Sstevel@tonic-gate sctp->sctp_def_flags = psctp->sctp_def_flags;
8547c478bd9Sstevel@tonic-gate sctp->sctp_def_ppid = psctp->sctp_def_ppid;
8557c478bd9Sstevel@tonic-gate sctp->sctp_def_context = psctp->sctp_def_context;
8567c478bd9Sstevel@tonic-gate sctp->sctp_def_timetolive = psctp->sctp_def_timetolive;
8577c478bd9Sstevel@tonic-gate
8587c478bd9Sstevel@tonic-gate sctp->sctp_num_istr = psctp->sctp_num_istr;
8597c478bd9Sstevel@tonic-gate sctp->sctp_num_ostr = psctp->sctp_num_ostr;
8607c478bd9Sstevel@tonic-gate
8617c478bd9Sstevel@tonic-gate sctp->sctp_hb_interval = psctp->sctp_hb_interval;
8627c478bd9Sstevel@tonic-gate sctp->sctp_autoclose = psctp->sctp_autoclose;
863558fbd03Skcpoon sctp->sctp_tx_adaptation_code = psctp->sctp_tx_adaptation_code;
8647c478bd9Sstevel@tonic-gate
8657c478bd9Sstevel@tonic-gate /* xxx should be a better way to copy these flags xxx */
8667c478bd9Sstevel@tonic-gate sctp->sctp_bound_to_all = psctp->sctp_bound_to_all;
8677c478bd9Sstevel@tonic-gate sctp->sctp_cansleep = psctp->sctp_cansleep;
868558fbd03Skcpoon sctp->sctp_send_adaptation = psctp->sctp_send_adaptation;
8697c478bd9Sstevel@tonic-gate sctp->sctp_ndelay = psctp->sctp_ndelay;
8707c478bd9Sstevel@tonic-gate sctp->sctp_events = psctp->sctp_events;
8717c478bd9Sstevel@tonic-gate } else {
8727c478bd9Sstevel@tonic-gate /*
8737c478bd9Sstevel@tonic-gate * Set to system defaults
8747c478bd9Sstevel@tonic-gate */
875f4b3ec61Sdh155122 sctp->sctp_cookie_lifetime =
876f4b3ec61Sdh155122 MSEC_TO_TICK(sctps->sctps_cookie_life);
877bd670b35SErik Nordmark connp->conn_sndlowat = sctps->sctps_xmit_lowat;
878bd670b35SErik Nordmark connp->conn_sndbuf = sctps->sctps_xmit_hiwat;
879bd670b35SErik Nordmark connp->conn_rcvbuf = sctps->sctps_recv_hiwat;
880bd670b35SErik Nordmark
881f4b3ec61Sdh155122 sctp->sctp_cwnd_max = sctps->sctps_cwnd_max_;
882bd670b35SErik Nordmark sctp->sctp_rwnd = connp->conn_rcvbuf;
883a215d4ebSKacheong Poon sctp->sctp_arwnd = connp->conn_rcvbuf;
8847d546a59Svi117747 sctp->sctp_pd_point = sctp->sctp_rwnd;
885f4b3ec61Sdh155122 sctp->sctp_rto_max = MSEC_TO_TICK(sctps->sctps_rto_maxg);
886fd7b5aedSGeorge Shepherd sctp->sctp_rto_max_init = sctp->sctp_rto_max;
887f4b3ec61Sdh155122 sctp->sctp_rto_min = MSEC_TO_TICK(sctps->sctps_rto_ming);
888f4b3ec61Sdh155122 sctp->sctp_rto_initial = MSEC_TO_TICK(
889f4b3ec61Sdh155122 sctps->sctps_rto_initialg);
890f4b3ec61Sdh155122 sctp->sctp_pa_max_rxt = sctps->sctps_pa_max_retr;
891f4b3ec61Sdh155122 sctp->sctp_pp_max_rxt = sctps->sctps_pp_max_retr;
892f4b3ec61Sdh155122 sctp->sctp_max_init_rxt = sctps->sctps_max_init_retr;
8937c478bd9Sstevel@tonic-gate
894f4b3ec61Sdh155122 sctp->sctp_num_istr = sctps->sctps_max_in_streams;
895f4b3ec61Sdh155122 sctp->sctp_num_ostr = sctps->sctps_initial_out_streams;
8967c478bd9Sstevel@tonic-gate
897f4b3ec61Sdh155122 sctp->sctp_hb_interval =
898f4b3ec61Sdh155122 MSEC_TO_TICK(sctps->sctps_heartbeat_interval);
899bd670b35SErik Nordmark
900bd670b35SErik Nordmark if (connp->conn_family == AF_INET)
901bd670b35SErik Nordmark connp->conn_default_ttl = sctps->sctps_ipv4_ttl;
902bd670b35SErik Nordmark else
903bd670b35SErik Nordmark connp->conn_default_ttl = sctps->sctps_ipv6_hoplimit;
904bd670b35SErik Nordmark
905bd670b35SErik Nordmark connp->conn_xmit_ipp.ipp_unicast_hops =
906bd670b35SErik Nordmark connp->conn_default_ttl;
907bd670b35SErik Nordmark
908bd670b35SErik Nordmark /*
909bd670b35SErik Nordmark * Initialize the header template
910bd670b35SErik Nordmark */
911bd670b35SErik Nordmark if ((err = sctp_build_hdrs(sctp, sleep)) != 0) {
912bd670b35SErik Nordmark goto failure;
9137c478bd9Sstevel@tonic-gate }
914bd670b35SErik Nordmark }
915bd670b35SErik Nordmark
9167c478bd9Sstevel@tonic-gate sctp->sctp_understands_asconf = B_TRUE;
9177c478bd9Sstevel@tonic-gate sctp->sctp_understands_addip = B_TRUE;
9187c478bd9Sstevel@tonic-gate sctp->sctp_prsctp_aware = B_FALSE;
9197c478bd9Sstevel@tonic-gate
9207c478bd9Sstevel@tonic-gate sctp->sctp_connp->conn_ref = 1;
9217c478bd9Sstevel@tonic-gate
9227c478bd9Sstevel@tonic-gate sctp->sctp_prsctpdrop = 0;
9237c478bd9Sstevel@tonic-gate sctp->sctp_msgcount = 0;
9247c478bd9Sstevel@tonic-gate
9257c478bd9Sstevel@tonic-gate return (0);
926121e5416Skcpoon
927121e5416Skcpoon failure:
928bd670b35SErik Nordmark sctp_headers_free(sctp);
929121e5416Skcpoon return (err);
9307c478bd9Sstevel@tonic-gate }
9317c478bd9Sstevel@tonic-gate
9327c478bd9Sstevel@tonic-gate /*
9337c478bd9Sstevel@tonic-gate * Extracts the init tag from an INIT chunk and checks if it matches
9347c478bd9Sstevel@tonic-gate * the sctp's verification tag. Returns 0 if it doesn't match, 1 if
9357c478bd9Sstevel@tonic-gate * it does.
9367c478bd9Sstevel@tonic-gate */
9377c478bd9Sstevel@tonic-gate static boolean_t
sctp_icmp_verf(sctp_t * sctp,sctp_hdr_t * sh,mblk_t * mp)9387c478bd9Sstevel@tonic-gate sctp_icmp_verf(sctp_t *sctp, sctp_hdr_t *sh, mblk_t *mp)
9397c478bd9Sstevel@tonic-gate {
9407c478bd9Sstevel@tonic-gate sctp_chunk_hdr_t *sch;
9417c478bd9Sstevel@tonic-gate uint32_t verf, *vp;
9427c478bd9Sstevel@tonic-gate
9437c478bd9Sstevel@tonic-gate sch = (sctp_chunk_hdr_t *)(sh + 1);
9447c478bd9Sstevel@tonic-gate vp = (uint32_t *)(sch + 1);
9457c478bd9Sstevel@tonic-gate
9467c478bd9Sstevel@tonic-gate /* Need at least the data chunk hdr and the first 4 bytes of INIT */
9477c478bd9Sstevel@tonic-gate if ((unsigned char *)(vp + 1) > mp->b_wptr) {
9487c478bd9Sstevel@tonic-gate return (B_FALSE);
9497c478bd9Sstevel@tonic-gate }
9507c478bd9Sstevel@tonic-gate
9517c478bd9Sstevel@tonic-gate bcopy(vp, &verf, sizeof (verf));
9527c478bd9Sstevel@tonic-gate
9537c478bd9Sstevel@tonic-gate if (verf == sctp->sctp_lvtag) {
9547c478bd9Sstevel@tonic-gate return (B_TRUE);
9557c478bd9Sstevel@tonic-gate }
9567c478bd9Sstevel@tonic-gate return (B_FALSE);
9577c478bd9Sstevel@tonic-gate }
9587c478bd9Sstevel@tonic-gate
9597c478bd9Sstevel@tonic-gate /*
960bd670b35SErik Nordmark * Update the SCTP state according to change of PMTU.
961bd670b35SErik Nordmark *
962bd670b35SErik Nordmark * Path MTU might have changed by either increase or decrease, so need to
963bd670b35SErik Nordmark * adjust the MSS based on the value of ixa_pmtu.
964bd670b35SErik Nordmark */
965bd670b35SErik Nordmark static void
sctp_update_pmtu(sctp_t * sctp,sctp_faddr_t * fp,boolean_t decrease_only)966bd670b35SErik Nordmark sctp_update_pmtu(sctp_t *sctp, sctp_faddr_t *fp, boolean_t decrease_only)
967bd670b35SErik Nordmark {
968bd670b35SErik Nordmark uint32_t pmtu;
969bd670b35SErik Nordmark int32_t mss;
9706be61d4eSchandrasekar marimuthu - Sun Microsystems - Bangalore India ip_xmit_attr_t *ixa = fp->sf_ixa;
971bd670b35SErik Nordmark
972bd670b35SErik Nordmark if (sctp->sctp_state < SCTPS_ESTABLISHED)
973bd670b35SErik Nordmark return;
974bd670b35SErik Nordmark
975bd670b35SErik Nordmark /*
976bd670b35SErik Nordmark * Always call ip_get_pmtu() to make sure that IP has updated
977bd670b35SErik Nordmark * ixa_flags properly.
978bd670b35SErik Nordmark */
979bd670b35SErik Nordmark pmtu = ip_get_pmtu(ixa);
980bd670b35SErik Nordmark
981bd670b35SErik Nordmark /*
982bd670b35SErik Nordmark * Calculate the MSS by decreasing the PMTU by sctp_hdr_len and
983bd670b35SErik Nordmark * IPsec overhead if applied. Make sure to use the most recent
984bd670b35SErik Nordmark * IPsec information.
985bd670b35SErik Nordmark */
986bd670b35SErik Nordmark mss = pmtu - conn_ipsec_length(sctp->sctp_connp);
987bd670b35SErik Nordmark if (ixa->ixa_flags & IXAF_IS_IPV4)
988bd670b35SErik Nordmark mss -= sctp->sctp_hdr_len;
989bd670b35SErik Nordmark else
990bd670b35SErik Nordmark mss -= sctp->sctp_hdr6_len;
991bd670b35SErik Nordmark
992bd670b35SErik Nordmark /*
993bd670b35SErik Nordmark * Nothing to change, so just return.
994bd670b35SErik Nordmark */
9956be61d4eSchandrasekar marimuthu - Sun Microsystems - Bangalore India if (mss == fp->sf_pmss)
996bd670b35SErik Nordmark return;
997bd670b35SErik Nordmark
998bd670b35SErik Nordmark /*
999bd670b35SErik Nordmark * Currently, for ICMP errors, only PMTU decrease is handled.
1000bd670b35SErik Nordmark */
10016be61d4eSchandrasekar marimuthu - Sun Microsystems - Bangalore India if (mss > fp->sf_pmss && decrease_only)
1002bd670b35SErik Nordmark return;
1003bd670b35SErik Nordmark
1004bd670b35SErik Nordmark #ifdef DEBUG
1005bd670b35SErik Nordmark (void) printf("sctp_update_pmtu mss from %d to %d\n",
10066be61d4eSchandrasekar marimuthu - Sun Microsystems - Bangalore India fp->sf_pmss, mss);
1007bd670b35SErik Nordmark #endif
10086be61d4eSchandrasekar marimuthu - Sun Microsystems - Bangalore India DTRACE_PROBE2(sctp_update_pmtu, int32_t, fp->sf_pmss, uint32_t, mss);
1009bd670b35SErik Nordmark
1010bd670b35SErik Nordmark /*
1011bd670b35SErik Nordmark * Update ixa_fragsize and ixa_pmtu.
1012bd670b35SErik Nordmark */
1013bd670b35SErik Nordmark ixa->ixa_fragsize = ixa->ixa_pmtu = pmtu;
1014bd670b35SErik Nordmark
1015bd670b35SErik Nordmark /*
1016bd670b35SErik Nordmark * Make sure that sfa_pmss is a multiple of
1017bd670b35SErik Nordmark * SCTP_ALIGN.
1018bd670b35SErik Nordmark */
10196be61d4eSchandrasekar marimuthu - Sun Microsystems - Bangalore India fp->sf_pmss = mss & ~(SCTP_ALIGN - 1);
10206be61d4eSchandrasekar marimuthu - Sun Microsystems - Bangalore India fp->sf_pmtu_discovered = 1;
1021bd670b35SErik Nordmark
1022bd670b35SErik Nordmark #ifdef notyet
1023bd670b35SErik Nordmark if (mss < sctp->sctp_sctps->sctps_mss_min)
1024bd670b35SErik Nordmark ixa->ixa_flags |= IXAF_PMTU_TOO_SMALL;
1025bd670b35SErik Nordmark #endif
1026bd670b35SErik Nordmark if (ixa->ixa_flags & IXAF_PMTU_TOO_SMALL)
1027bd670b35SErik Nordmark ixa->ixa_flags &= ~(IXAF_DONTFRAG | IXAF_PMTU_IPV4_DF);
1028bd670b35SErik Nordmark
1029bd670b35SErik Nordmark /*
1030bd670b35SErik Nordmark * If below the min size then ip_get_pmtu cleared IXAF_PMTU_IPV4_DF.
1031bd670b35SErik Nordmark * Make sure to clear IXAF_DONTFRAG, which is used by IP to decide
1032bd670b35SErik Nordmark * whether to fragment the packet.
1033bd670b35SErik Nordmark */
1034bd670b35SErik Nordmark if (ixa->ixa_flags & IXAF_IS_IPV4) {
1035bd670b35SErik Nordmark if (!(ixa->ixa_flags & IXAF_PMTU_IPV4_DF)) {
10366be61d4eSchandrasekar marimuthu - Sun Microsystems - Bangalore India fp->sf_df = B_FALSE;
1037bd670b35SErik Nordmark if (fp == sctp->sctp_current) {
1038bd670b35SErik Nordmark sctp->sctp_ipha->
1039bd670b35SErik Nordmark ipha_fragment_offset_and_flags = 0;
1040bd670b35SErik Nordmark }
1041bd670b35SErik Nordmark }
1042bd670b35SErik Nordmark }
1043bd670b35SErik Nordmark }
1044bd670b35SErik Nordmark
1045bd670b35SErik Nordmark /*
1046bd670b35SErik Nordmark * Notify function registered with ip_xmit_attr_t. It's called in the context
1047bd670b35SErik Nordmark * of conn_ip_output so it's safe to update the SCTP state.
1048bd670b35SErik Nordmark * Currently only used for pmtu changes.
1049bd670b35SErik Nordmark */
1050bd670b35SErik Nordmark /* ARGSUSED1 */
1051bd670b35SErik Nordmark static void
sctp_notify(void * arg,ip_xmit_attr_t * ixa,ixa_notify_type_t ntype,ixa_notify_arg_t narg)1052bd670b35SErik Nordmark sctp_notify(void *arg, ip_xmit_attr_t *ixa, ixa_notify_type_t ntype,
1053bd670b35SErik Nordmark ixa_notify_arg_t narg)
1054bd670b35SErik Nordmark {
1055bd670b35SErik Nordmark sctp_t *sctp = (sctp_t *)arg;
1056bd670b35SErik Nordmark sctp_faddr_t *fp;
1057bd670b35SErik Nordmark
1058bd670b35SErik Nordmark switch (ntype) {
1059bd670b35SErik Nordmark case IXAN_PMTU:
1060bd670b35SErik Nordmark /* Find the faddr based on the ip_xmit_attr_t pointer */
10616be61d4eSchandrasekar marimuthu - Sun Microsystems - Bangalore India for (fp = sctp->sctp_faddrs; fp != NULL; fp = fp->sf_next) {
10626be61d4eSchandrasekar marimuthu - Sun Microsystems - Bangalore India if (fp->sf_ixa == ixa)
1063bd670b35SErik Nordmark break;
1064bd670b35SErik Nordmark }
1065bd670b35SErik Nordmark if (fp != NULL)
1066bd670b35SErik Nordmark sctp_update_pmtu(sctp, fp, B_FALSE);
1067bd670b35SErik Nordmark break;
1068bd670b35SErik Nordmark default:
1069bd670b35SErik Nordmark break;
1070bd670b35SErik Nordmark }
1071bd670b35SErik Nordmark }
1072bd670b35SErik Nordmark
1073bd670b35SErik Nordmark /*
10747c478bd9Sstevel@tonic-gate * sctp_icmp_error is called by sctp_input() to process ICMP error messages
1075bd670b35SErik Nordmark * passed up by IP. We need to find a sctp_t
10767c478bd9Sstevel@tonic-gate * that corresponds to the returned datagram. Passes the message back in on
10777c478bd9Sstevel@tonic-gate * the correct queue once it has located the connection.
10787c478bd9Sstevel@tonic-gate * Assumes that IP has pulled up everything up to and including
10797c478bd9Sstevel@tonic-gate * the ICMP header.
10807c478bd9Sstevel@tonic-gate */
10817c478bd9Sstevel@tonic-gate void
sctp_icmp_error(sctp_t * sctp,mblk_t * mp)10827c478bd9Sstevel@tonic-gate sctp_icmp_error(sctp_t *sctp, mblk_t *mp)
10837c478bd9Sstevel@tonic-gate {
10847c478bd9Sstevel@tonic-gate icmph_t *icmph;
10857c478bd9Sstevel@tonic-gate ipha_t *ipha;
10867c478bd9Sstevel@tonic-gate int iph_hdr_length;
10877c478bd9Sstevel@tonic-gate sctp_hdr_t *sctph;
10887c478bd9Sstevel@tonic-gate in6_addr_t dst;
10897c478bd9Sstevel@tonic-gate sctp_faddr_t *fp;
1090f4b3ec61Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps;
10917c478bd9Sstevel@tonic-gate
109245916cd2Sjpk dprint(1, ("sctp_icmp_error: sctp=%p, mp=%p\n", (void *)sctp,
109345916cd2Sjpk (void *)mp));
10947c478bd9Sstevel@tonic-gate
10957c478bd9Sstevel@tonic-gate ipha = (ipha_t *)mp->b_rptr;
10967c478bd9Sstevel@tonic-gate if (IPH_HDR_VERSION(ipha) != IPV4_VERSION) {
10977c478bd9Sstevel@tonic-gate ASSERT(IPH_HDR_VERSION(ipha) == IPV6_VERSION);
1098bd670b35SErik Nordmark sctp_icmp_error_ipv6(sctp, mp);
10997c478bd9Sstevel@tonic-gate return;
11007c478bd9Sstevel@tonic-gate }
11017c478bd9Sstevel@tonic-gate
1102f0c3911fSGeorge Shepherd /* account for the ip hdr from the icmp message */
11037c478bd9Sstevel@tonic-gate iph_hdr_length = IPH_HDR_LENGTH(ipha);
11047c478bd9Sstevel@tonic-gate icmph = (icmph_t *)&mp->b_rptr[iph_hdr_length];
1105f0c3911fSGeorge Shepherd /* now the ip hdr of message resulting in this icmp */
11067c478bd9Sstevel@tonic-gate ipha = (ipha_t *)&icmph[1];
11077c478bd9Sstevel@tonic-gate iph_hdr_length = IPH_HDR_LENGTH(ipha);
11087c478bd9Sstevel@tonic-gate sctph = (sctp_hdr_t *)((char *)ipha + iph_hdr_length);
1109f0c3911fSGeorge Shepherd /* first_mp must expose the full sctp header. */
11107c478bd9Sstevel@tonic-gate if ((uchar_t *)(sctph + 1) >= mp->b_wptr) {
11117c478bd9Sstevel@tonic-gate /* not enough data for SCTP header */
1112bd670b35SErik Nordmark freemsg(mp);
11137c478bd9Sstevel@tonic-gate return;
11147c478bd9Sstevel@tonic-gate }
11157c478bd9Sstevel@tonic-gate
11167c478bd9Sstevel@tonic-gate switch (icmph->icmph_type) {
11177c478bd9Sstevel@tonic-gate case ICMP_DEST_UNREACHABLE:
11187c478bd9Sstevel@tonic-gate switch (icmph->icmph_code) {
11197c478bd9Sstevel@tonic-gate case ICMP_FRAGMENTATION_NEEDED:
11207c478bd9Sstevel@tonic-gate /*
11217c478bd9Sstevel@tonic-gate * Reduce the MSS based on the new MTU. This will
11227c478bd9Sstevel@tonic-gate * eliminate any fragmentation locally.
11237c478bd9Sstevel@tonic-gate * N.B. There may well be some funny side-effects on
11247c478bd9Sstevel@tonic-gate * the local send policy and the remote receive policy.
11257c478bd9Sstevel@tonic-gate * Pending further research, we provide
11267c478bd9Sstevel@tonic-gate * sctp_ignore_path_mtu just in case this proves
11277c478bd9Sstevel@tonic-gate * disastrous somewhere.
11287c478bd9Sstevel@tonic-gate *
11297c478bd9Sstevel@tonic-gate * After updating the MSS, retransmit part of the
11307c478bd9Sstevel@tonic-gate * dropped segment using the new mss by calling
11317c478bd9Sstevel@tonic-gate * sctp_wput_slow(). Need to adjust all those
11327c478bd9Sstevel@tonic-gate * params to make sure sctp_wput_slow() work properly.
11337c478bd9Sstevel@tonic-gate */
1134f4b3ec61Sdh155122 if (sctps->sctps_ignore_path_mtu)
11357c478bd9Sstevel@tonic-gate break;
11367c478bd9Sstevel@tonic-gate
11377c478bd9Sstevel@tonic-gate /* find the offending faddr */
11387c478bd9Sstevel@tonic-gate IN6_IPADDR_TO_V4MAPPED(ipha->ipha_dst, &dst);
11397c478bd9Sstevel@tonic-gate fp = sctp_lookup_faddr(sctp, &dst);
11407c478bd9Sstevel@tonic-gate if (fp == NULL) {
11417c478bd9Sstevel@tonic-gate break;
11427c478bd9Sstevel@tonic-gate }
1143bd670b35SErik Nordmark sctp_update_pmtu(sctp, fp, B_TRUE);
1144f0c3911fSGeorge Shepherd /*
1145f0c3911fSGeorge Shepherd * It is possible, even likely that a fast retransmit
1146f0c3911fSGeorge Shepherd * attempt has been dropped by ip as a result of this
1147f0c3911fSGeorge Shepherd * error, retransmission bundles as much as possible.
1148f0c3911fSGeorge Shepherd * A retransmit here prevents significant delays waiting
1149f0c3911fSGeorge Shepherd * on the timer. Analogous to behaviour of TCP after
1150f0c3911fSGeorge Shepherd * ICMP too big.
1151f0c3911fSGeorge Shepherd */
1152f0c3911fSGeorge Shepherd sctp_rexmit(sctp, fp);
11537c478bd9Sstevel@tonic-gate break;
11547c478bd9Sstevel@tonic-gate case ICMP_PORT_UNREACHABLE:
11557c478bd9Sstevel@tonic-gate case ICMP_PROTOCOL_UNREACHABLE:
11567c478bd9Sstevel@tonic-gate switch (sctp->sctp_state) {
11577c478bd9Sstevel@tonic-gate case SCTPS_COOKIE_WAIT:
11587c478bd9Sstevel@tonic-gate case SCTPS_COOKIE_ECHOED:
11597c478bd9Sstevel@tonic-gate /* make sure the verification tag matches */
11607c478bd9Sstevel@tonic-gate if (!sctp_icmp_verf(sctp, sctph, mp)) {
11617c478bd9Sstevel@tonic-gate break;
11627c478bd9Sstevel@tonic-gate }
11635dd46ab5SKacheong Poon SCTPS_BUMP_MIB(sctps, sctpAborted);
1164c9da23f8Skcpoon sctp_assoc_event(sctp, SCTP_CANT_STR_ASSOC, 0,
1165c9da23f8Skcpoon NULL);
11667c478bd9Sstevel@tonic-gate sctp_clean_death(sctp, ECONNREFUSED);
11677c478bd9Sstevel@tonic-gate break;
11687c478bd9Sstevel@tonic-gate }
11697c478bd9Sstevel@tonic-gate break;
11707c478bd9Sstevel@tonic-gate case ICMP_HOST_UNREACHABLE:
11717c478bd9Sstevel@tonic-gate case ICMP_NET_UNREACHABLE:
11727c478bd9Sstevel@tonic-gate /* Record the error in case we finally time out. */
11737c478bd9Sstevel@tonic-gate sctp->sctp_client_errno = (icmph->icmph_code ==
11747c478bd9Sstevel@tonic-gate ICMP_HOST_UNREACHABLE) ? EHOSTUNREACH : ENETUNREACH;
11757c478bd9Sstevel@tonic-gate break;
11767c478bd9Sstevel@tonic-gate default:
11777c478bd9Sstevel@tonic-gate break;
11787c478bd9Sstevel@tonic-gate }
11797c478bd9Sstevel@tonic-gate break;
11807c478bd9Sstevel@tonic-gate case ICMP_SOURCE_QUENCH: {
11817c478bd9Sstevel@tonic-gate /* Reduce the sending rate as if we got a retransmit timeout */
11827c478bd9Sstevel@tonic-gate break;
11837c478bd9Sstevel@tonic-gate }
11847c478bd9Sstevel@tonic-gate }
1185bd670b35SErik Nordmark freemsg(mp);
11867c478bd9Sstevel@tonic-gate }
11877c478bd9Sstevel@tonic-gate
11887c478bd9Sstevel@tonic-gate /*
11897c478bd9Sstevel@tonic-gate * sctp_icmp_error_ipv6() is called by sctp_icmp_error() to process ICMPv6
11907c478bd9Sstevel@tonic-gate * error messages passed up by IP.
11917c478bd9Sstevel@tonic-gate * Assumes that IP has pulled up all the extension headers as well
11927c478bd9Sstevel@tonic-gate * as the ICMPv6 header.
11937c478bd9Sstevel@tonic-gate */
11947c478bd9Sstevel@tonic-gate static void
sctp_icmp_error_ipv6(sctp_t * sctp,mblk_t * mp)11957c478bd9Sstevel@tonic-gate sctp_icmp_error_ipv6(sctp_t *sctp, mblk_t *mp)
11967c478bd9Sstevel@tonic-gate {
11977c478bd9Sstevel@tonic-gate icmp6_t *icmp6;
11987c478bd9Sstevel@tonic-gate ip6_t *ip6h;
11997c478bd9Sstevel@tonic-gate uint16_t iph_hdr_length;
12007c478bd9Sstevel@tonic-gate sctp_hdr_t *sctpha;
12017c478bd9Sstevel@tonic-gate uint8_t *nexthdrp;
12027c478bd9Sstevel@tonic-gate sctp_faddr_t *fp;
1203f4b3ec61Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps;
12047c478bd9Sstevel@tonic-gate
12057c478bd9Sstevel@tonic-gate ip6h = (ip6_t *)mp->b_rptr;
12067c478bd9Sstevel@tonic-gate iph_hdr_length = (ip6h->ip6_nxt != IPPROTO_SCTP) ?
12077c478bd9Sstevel@tonic-gate ip_hdr_length_v6(mp, ip6h) : IPV6_HDR_LEN;
12087c478bd9Sstevel@tonic-gate
12097c478bd9Sstevel@tonic-gate icmp6 = (icmp6_t *)&mp->b_rptr[iph_hdr_length];
12107c478bd9Sstevel@tonic-gate ip6h = (ip6_t *)&icmp6[1];
12117c478bd9Sstevel@tonic-gate if (!ip_hdr_length_nexthdr_v6(mp, ip6h, &iph_hdr_length, &nexthdrp)) {
12127c478bd9Sstevel@tonic-gate freemsg(mp);
12137c478bd9Sstevel@tonic-gate return;
12147c478bd9Sstevel@tonic-gate }
12157c478bd9Sstevel@tonic-gate ASSERT(*nexthdrp == IPPROTO_SCTP);
12167c478bd9Sstevel@tonic-gate
12177c478bd9Sstevel@tonic-gate /* XXX need ifindex to find connection */
12187c478bd9Sstevel@tonic-gate sctpha = (sctp_hdr_t *)((char *)ip6h + iph_hdr_length);
12197c478bd9Sstevel@tonic-gate if ((uchar_t *)sctpha >= mp->b_wptr) {
12207c478bd9Sstevel@tonic-gate /* not enough data for SCTP header */
12217c478bd9Sstevel@tonic-gate freemsg(mp);
12227c478bd9Sstevel@tonic-gate return;
12237c478bd9Sstevel@tonic-gate }
12247c478bd9Sstevel@tonic-gate switch (icmp6->icmp6_type) {
12257c478bd9Sstevel@tonic-gate case ICMP6_PACKET_TOO_BIG:
12267c478bd9Sstevel@tonic-gate /*
12277c478bd9Sstevel@tonic-gate * Reduce the MSS based on the new MTU. This will
12287c478bd9Sstevel@tonic-gate * eliminate any fragmentation locally.
12297c478bd9Sstevel@tonic-gate * N.B. There may well be some funny side-effects on
12307c478bd9Sstevel@tonic-gate * the local send policy and the remote receive policy.
12317c478bd9Sstevel@tonic-gate * Pending further research, we provide
12327c478bd9Sstevel@tonic-gate * sctp_ignore_path_mtu just in case this proves
12337c478bd9Sstevel@tonic-gate * disastrous somewhere.
12347c478bd9Sstevel@tonic-gate *
12357c478bd9Sstevel@tonic-gate * After updating the MSS, retransmit part of the
12367c478bd9Sstevel@tonic-gate * dropped segment using the new mss by calling
12377c478bd9Sstevel@tonic-gate * sctp_wput_slow(). Need to adjust all those
12387c478bd9Sstevel@tonic-gate * params to make sure sctp_wput_slow() work properly.
12397c478bd9Sstevel@tonic-gate */
1240f4b3ec61Sdh155122 if (sctps->sctps_ignore_path_mtu)
12417c478bd9Sstevel@tonic-gate break;
12427c478bd9Sstevel@tonic-gate
12437c478bd9Sstevel@tonic-gate /* find the offending faddr */
12447c478bd9Sstevel@tonic-gate fp = sctp_lookup_faddr(sctp, &ip6h->ip6_dst);
12457c478bd9Sstevel@tonic-gate if (fp == NULL) {
12467c478bd9Sstevel@tonic-gate break;
12477c478bd9Sstevel@tonic-gate }
12487c478bd9Sstevel@tonic-gate
1249bd670b35SErik Nordmark sctp_update_pmtu(sctp, fp, B_TRUE);
1250bd670b35SErik Nordmark /*
1251bd670b35SErik Nordmark * It is possible, even likely that a fast retransmit
1252bd670b35SErik Nordmark * attempt has been dropped by ip as a result of this
1253bd670b35SErik Nordmark * error, retransmission bundles as much as possible.
1254bd670b35SErik Nordmark * A retransmit here prevents significant delays waiting
1255bd670b35SErik Nordmark * on the timer. Analogous to behaviour of TCP after
1256bd670b35SErik Nordmark * ICMP too big.
1257bd670b35SErik Nordmark */
1258bd670b35SErik Nordmark sctp_rexmit(sctp, fp);
12597c478bd9Sstevel@tonic-gate break;
12607c478bd9Sstevel@tonic-gate
12617c478bd9Sstevel@tonic-gate case ICMP6_DST_UNREACH:
12627c478bd9Sstevel@tonic-gate switch (icmp6->icmp6_code) {
12637c478bd9Sstevel@tonic-gate case ICMP6_DST_UNREACH_NOPORT:
12647c478bd9Sstevel@tonic-gate /* make sure the verification tag matches */
12657c478bd9Sstevel@tonic-gate if (!sctp_icmp_verf(sctp, sctpha, mp)) {
12667c478bd9Sstevel@tonic-gate break;
12677c478bd9Sstevel@tonic-gate }
12687c478bd9Sstevel@tonic-gate if (sctp->sctp_state == SCTPS_COOKIE_WAIT ||
12697c478bd9Sstevel@tonic-gate sctp->sctp_state == SCTPS_COOKIE_ECHOED) {
12705dd46ab5SKacheong Poon SCTPS_BUMP_MIB(sctps, sctpAborted);
1271c9da23f8Skcpoon sctp_assoc_event(sctp, SCTP_CANT_STR_ASSOC, 0,
1272c9da23f8Skcpoon NULL);
12737c478bd9Sstevel@tonic-gate sctp_clean_death(sctp, ECONNREFUSED);
12747c478bd9Sstevel@tonic-gate }
12757c478bd9Sstevel@tonic-gate break;
12767c478bd9Sstevel@tonic-gate
12777c478bd9Sstevel@tonic-gate case ICMP6_DST_UNREACH_ADMIN:
12787c478bd9Sstevel@tonic-gate case ICMP6_DST_UNREACH_NOROUTE:
12797c478bd9Sstevel@tonic-gate case ICMP6_DST_UNREACH_NOTNEIGHBOR:
12807c478bd9Sstevel@tonic-gate case ICMP6_DST_UNREACH_ADDR:
12817c478bd9Sstevel@tonic-gate /* Record the error in case we finally time out. */
12827c478bd9Sstevel@tonic-gate sctp->sctp_client_errno = EHOSTUNREACH;
12837c478bd9Sstevel@tonic-gate break;
12847c478bd9Sstevel@tonic-gate default:
12857c478bd9Sstevel@tonic-gate break;
12867c478bd9Sstevel@tonic-gate }
12877c478bd9Sstevel@tonic-gate break;
12887c478bd9Sstevel@tonic-gate
12897c478bd9Sstevel@tonic-gate case ICMP6_PARAM_PROB:
12907c478bd9Sstevel@tonic-gate /* If this corresponds to an ICMP_PROTOCOL_UNREACHABLE */
12917c478bd9Sstevel@tonic-gate if (icmp6->icmp6_code == ICMP6_PARAMPROB_NEXTHEADER &&
12927c478bd9Sstevel@tonic-gate (uchar_t *)ip6h + icmp6->icmp6_pptr ==
12937c478bd9Sstevel@tonic-gate (uchar_t *)nexthdrp) {
12947c478bd9Sstevel@tonic-gate /* make sure the verification tag matches */
12957c478bd9Sstevel@tonic-gate if (!sctp_icmp_verf(sctp, sctpha, mp)) {
12967c478bd9Sstevel@tonic-gate break;
12977c478bd9Sstevel@tonic-gate }
12987c478bd9Sstevel@tonic-gate if (sctp->sctp_state == SCTPS_COOKIE_WAIT) {
12995dd46ab5SKacheong Poon SCTPS_BUMP_MIB(sctps, sctpAborted);
1300c9da23f8Skcpoon sctp_assoc_event(sctp, SCTP_CANT_STR_ASSOC, 0,
1301c9da23f8Skcpoon NULL);
13027c478bd9Sstevel@tonic-gate sctp_clean_death(sctp, ECONNREFUSED);
13037c478bd9Sstevel@tonic-gate }
13047c478bd9Sstevel@tonic-gate break;
13057c478bd9Sstevel@tonic-gate }
13067c478bd9Sstevel@tonic-gate break;
13077c478bd9Sstevel@tonic-gate
13087c478bd9Sstevel@tonic-gate case ICMP6_TIME_EXCEEDED:
13097c478bd9Sstevel@tonic-gate default:
13107c478bd9Sstevel@tonic-gate break;
13117c478bd9Sstevel@tonic-gate }
13127c478bd9Sstevel@tonic-gate freemsg(mp);
13137c478bd9Sstevel@tonic-gate }
13147c478bd9Sstevel@tonic-gate
13157c478bd9Sstevel@tonic-gate /*
13167c478bd9Sstevel@tonic-gate * Called by sockfs to create a new sctp instance.
13177c478bd9Sstevel@tonic-gate *
13187c478bd9Sstevel@tonic-gate * If parent pointer is passed in, inherit settings from it.
13197c478bd9Sstevel@tonic-gate */
13207c478bd9Sstevel@tonic-gate sctp_t *
sctp_create(void * ulpd,sctp_t * parent,int family,int type,int flags,sock_upcalls_t * upcalls,sctp_sockbuf_limits_t * sbl,cred_t * credp)1321bd670b35SErik Nordmark sctp_create(void *ulpd, sctp_t *parent, int family, int type, int flags,
13220f1702c5SYu Xiangning sock_upcalls_t *upcalls, sctp_sockbuf_limits_t *sbl,
13237c478bd9Sstevel@tonic-gate cred_t *credp)
13247c478bd9Sstevel@tonic-gate {
13257c478bd9Sstevel@tonic-gate sctp_t *sctp, *psctp;
1326bd670b35SErik Nordmark conn_t *connp;
13277c478bd9Sstevel@tonic-gate mblk_t *ack_mp, *hb_mp;
13287c478bd9Sstevel@tonic-gate int sleep = flags & SCTP_CAN_BLOCK ? KM_SLEEP : KM_NOSLEEP;
1329f4b3ec61Sdh155122 zoneid_t zoneid;
1330f4b3ec61Sdh155122 sctp_stack_t *sctps;
13317c478bd9Sstevel@tonic-gate
13327c478bd9Sstevel@tonic-gate /* User must supply a credential. */
13337c478bd9Sstevel@tonic-gate if (credp == NULL)
13347c478bd9Sstevel@tonic-gate return (NULL);
13357c478bd9Sstevel@tonic-gate
1336f4b3ec61Sdh155122 psctp = (sctp_t *)parent;
1337f4b3ec61Sdh155122 if (psctp != NULL) {
1338f4b3ec61Sdh155122 sctps = psctp->sctp_sctps;
1339f4b3ec61Sdh155122 /* Increase here to have common decrease at end */
1340f4b3ec61Sdh155122 netstack_hold(sctps->sctps_netstack);
13415dd46ab5SKacheong Poon ASSERT(sctps->sctps_recvq_tq_list_cur_sz > 0);
1342f4b3ec61Sdh155122 } else {
1343f4b3ec61Sdh155122 netstack_t *ns;
1344f4b3ec61Sdh155122
1345f4b3ec61Sdh155122 ns = netstack_find_by_cred(credp);
1346f4b3ec61Sdh155122 sctps = ns->netstack_sctp;
13475dd46ab5SKacheong Poon /*
13485dd46ab5SKacheong Poon * Check if the receive queue taskq for this sctp_stack_t has
13495dd46ab5SKacheong Poon * been set up.
13505dd46ab5SKacheong Poon */
13515dd46ab5SKacheong Poon if (sctps->sctps_recvq_tq_list_cur_sz == 0)
13525dd46ab5SKacheong Poon sctp_rq_tq_init(sctps);
1353f4b3ec61Sdh155122
1354f4b3ec61Sdh155122 /*
1355f4b3ec61Sdh155122 * For exclusive stacks we set the zoneid to zero
1356f4b3ec61Sdh155122 * to make SCTP operate as if in the global zone.
1357f4b3ec61Sdh155122 */
1358f4b3ec61Sdh155122 if (sctps->sctps_netstack->netstack_stackid !=
1359f4b3ec61Sdh155122 GLOBAL_NETSTACKID)
1360f4b3ec61Sdh155122 zoneid = GLOBAL_ZONEID;
1361f4b3ec61Sdh155122 else
1362f4b3ec61Sdh155122 zoneid = crgetzoneid(credp);
1363f4b3ec61Sdh155122 }
1364bd670b35SErik Nordmark if ((connp = ipcl_conn_create(IPCL_SCTPCONN, sleep,
1365f4b3ec61Sdh155122 sctps->sctps_netstack)) == NULL) {
1366f4b3ec61Sdh155122 netstack_rele(sctps->sctps_netstack);
1367f4b3ec61Sdh155122 SCTP_KSTAT(sctps, sctp_conn_create);
13687c478bd9Sstevel@tonic-gate return (NULL);
136977c67f2fSkcpoon }
1370f4b3ec61Sdh155122 /*
1371f4b3ec61Sdh155122 * ipcl_conn_create did a netstack_hold. Undo the hold that was
1372f4b3ec61Sdh155122 * done at top of sctp_create.
1373f4b3ec61Sdh155122 */
1374f4b3ec61Sdh155122 netstack_rele(sctps->sctps_netstack);
1375bd670b35SErik Nordmark sctp = CONN2SCTP(connp);
1376f4b3ec61Sdh155122 sctp->sctp_sctps = sctps;
13777c478bd9Sstevel@tonic-gate
1378121e5416Skcpoon if ((ack_mp = sctp_timer_alloc(sctp, sctp_ack_timer, sleep)) == NULL ||
1379121e5416Skcpoon (hb_mp = sctp_timer_alloc(sctp, sctp_heartbeat_timer,
1380121e5416Skcpoon sleep)) == NULL) {
13817c478bd9Sstevel@tonic-gate if (ack_mp != NULL)
13827c478bd9Sstevel@tonic-gate freeb(ack_mp);
1383bd670b35SErik Nordmark sctp_conn_clear(connp);
1384f4b3ec61Sdh155122 sctp->sctp_sctps = NULL;
1385bd670b35SErik Nordmark kmem_cache_free(sctp_conn_cache, connp);
13867c478bd9Sstevel@tonic-gate return (NULL);
13877c478bd9Sstevel@tonic-gate }
13887c478bd9Sstevel@tonic-gate
13897c478bd9Sstevel@tonic-gate sctp->sctp_ack_mp = ack_mp;
13907c478bd9Sstevel@tonic-gate sctp->sctp_heartbeat_mp = hb_mp;
13917c478bd9Sstevel@tonic-gate
1392bd670b35SErik Nordmark /*
1393bd670b35SErik Nordmark * Have conn_ip_output drop packets should our outer source
1394bd670b35SErik Nordmark * go invalid, and tell us about mtu changes.
1395bd670b35SErik Nordmark */
1396bd670b35SErik Nordmark connp->conn_ixa->ixa_flags |= IXAF_SET_ULP_CKSUM | IXAF_VERIFY_SOURCE |
1397bd670b35SErik Nordmark IXAF_VERIFY_PMTU;
1398bd670b35SErik Nordmark connp->conn_family = family;
1399bd670b35SErik Nordmark connp->conn_so_type = type;
14007c478bd9Sstevel@tonic-gate
14017c478bd9Sstevel@tonic-gate if (sctp_init_values(sctp, psctp, sleep) != 0) {
14027c478bd9Sstevel@tonic-gate freeb(ack_mp);
14037c478bd9Sstevel@tonic-gate freeb(hb_mp);
1404bd670b35SErik Nordmark sctp_conn_clear(connp);
1405f4b3ec61Sdh155122 sctp->sctp_sctps = NULL;
1406bd670b35SErik Nordmark kmem_cache_free(sctp_conn_cache, connp);
14077c478bd9Sstevel@tonic-gate return (NULL);
14087c478bd9Sstevel@tonic-gate }
14097c478bd9Sstevel@tonic-gate sctp->sctp_cansleep = ((flags & SCTP_CAN_BLOCK) == SCTP_CAN_BLOCK);
14107c478bd9Sstevel@tonic-gate
1411f4b3ec61Sdh155122 sctp->sctp_mss = sctps->sctps_initial_mtu - ((family == AF_INET6) ?
14127c478bd9Sstevel@tonic-gate sctp->sctp_hdr6_len : sctp->sctp_hdr_len);
14137c478bd9Sstevel@tonic-gate
14147c478bd9Sstevel@tonic-gate if (psctp != NULL) {
1415bd670b35SErik Nordmark conn_t *pconnp = psctp->sctp_connp;
1416bd670b35SErik Nordmark
14177c478bd9Sstevel@tonic-gate RUN_SCTP(psctp);
14187c478bd9Sstevel@tonic-gate /*
14197c478bd9Sstevel@tonic-gate * Inherit local address list, local port. Parent is either
14207c478bd9Sstevel@tonic-gate * in SCTPS_BOUND, or SCTPS_LISTEN state.
14217c478bd9Sstevel@tonic-gate */
14227c478bd9Sstevel@tonic-gate ASSERT((psctp->sctp_state == SCTPS_BOUND) ||
14237c478bd9Sstevel@tonic-gate (psctp->sctp_state == SCTPS_LISTEN));
14247c478bd9Sstevel@tonic-gate if (sctp_dup_saddrs(psctp, sctp, sleep)) {
14257c478bd9Sstevel@tonic-gate WAKE_SCTP(psctp);
14267c478bd9Sstevel@tonic-gate freeb(ack_mp);
14277c478bd9Sstevel@tonic-gate freeb(hb_mp);
14287c478bd9Sstevel@tonic-gate sctp_headers_free(sctp);
1429bd670b35SErik Nordmark sctp_conn_clear(connp);
1430f4b3ec61Sdh155122 sctp->sctp_sctps = NULL;
1431bd670b35SErik Nordmark kmem_cache_free(sctp_conn_cache, connp);
14327c478bd9Sstevel@tonic-gate return (NULL);
14337c478bd9Sstevel@tonic-gate }
14347c478bd9Sstevel@tonic-gate
14357c478bd9Sstevel@tonic-gate /*
14367c478bd9Sstevel@tonic-gate * If the parent is specified, it'll be immediatelly
14377c478bd9Sstevel@tonic-gate * followed by sctp_connect(). So don't add this guy to
14387c478bd9Sstevel@tonic-gate * bind hash.
14397c478bd9Sstevel@tonic-gate */
1440bd670b35SErik Nordmark connp->conn_lport = pconnp->conn_lport;
14417c478bd9Sstevel@tonic-gate sctp->sctp_state = SCTPS_BOUND;
14427c478bd9Sstevel@tonic-gate WAKE_SCTP(psctp);
14437c478bd9Sstevel@tonic-gate } else {
1444bd670b35SErik Nordmark ASSERT(connp->conn_cred == NULL);
1445bd670b35SErik Nordmark connp->conn_zoneid = zoneid;
1446bd670b35SErik Nordmark /*
1447bd670b35SErik Nordmark * conn_allzones can not be set this early, hence
1448bd670b35SErik Nordmark * no IPCL_ZONEID
1449bd670b35SErik Nordmark */
1450bd670b35SErik Nordmark connp->conn_ixa->ixa_zoneid = zoneid;
1451d3d50737SRafael Vanoni connp->conn_open_time = ddi_get_lbolt64();
1452bd670b35SErik Nordmark connp->conn_cred = credp;
14537c478bd9Sstevel@tonic-gate crhold(credp);
1454bd670b35SErik Nordmark connp->conn_cpid = curproc->p_pid;
14557c478bd9Sstevel@tonic-gate
145645916cd2Sjpk /*
1457bd670b35SErik Nordmark * If the caller has the process-wide flag set, then default to
1458bd670b35SErik Nordmark * MAC exempt mode. This allows read-down to unlabeled hosts.
145945916cd2Sjpk */
146045916cd2Sjpk if (getpflags(NET_MAC_AWARE, credp) != 0)
1461bd670b35SErik Nordmark connp->conn_mac_mode = CONN_MAC_AWARE;
1462bd670b35SErik Nordmark
1463bd670b35SErik Nordmark connp->conn_zone_is_global =
1464bd670b35SErik Nordmark (crgetzoneid(credp) == GLOBAL_ZONEID);
1465bd670b35SErik Nordmark }
146645916cd2Sjpk
14677c478bd9Sstevel@tonic-gate /* Initialize SCTP instance values, our verf tag must never be 0 */
14687c478bd9Sstevel@tonic-gate (void) random_get_pseudo_bytes((uint8_t *)&sctp->sctp_lvtag,
14697c478bd9Sstevel@tonic-gate sizeof (sctp->sctp_lvtag));
14707c478bd9Sstevel@tonic-gate if (sctp->sctp_lvtag == 0)
14717c478bd9Sstevel@tonic-gate sctp->sctp_lvtag = (uint32_t)gethrtime();
14727c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_lvtag != 0);
14737c478bd9Sstevel@tonic-gate
14747c478bd9Sstevel@tonic-gate sctp->sctp_ltsn = sctp->sctp_lvtag + 1;
14757c478bd9Sstevel@tonic-gate sctp->sctp_lcsn = sctp->sctp_ltsn;
14767c478bd9Sstevel@tonic-gate sctp->sctp_recovery_tsn = sctp->sctp_lastack_rxd = sctp->sctp_ltsn - 1;
14777c478bd9Sstevel@tonic-gate sctp->sctp_adv_pap = sctp->sctp_lastack_rxd;
14787c478bd9Sstevel@tonic-gate
14797c478bd9Sstevel@tonic-gate /* Information required by upper layer */
1480bd670b35SErik Nordmark ASSERT(ulpd != NULL);
14810f1702c5SYu Xiangning sctp->sctp_ulpd = ulpd;
14827c478bd9Sstevel@tonic-gate
14830f1702c5SYu Xiangning ASSERT(upcalls != NULL);
14840f1702c5SYu Xiangning sctp->sctp_upcalls = upcalls;
14857c478bd9Sstevel@tonic-gate ASSERT(sbl != NULL);
14867c478bd9Sstevel@tonic-gate /* Fill in the socket buffer limits for sctpsockfs */
1487bd670b35SErik Nordmark sbl->sbl_txlowat = connp->conn_sndlowat;
1488bd670b35SErik Nordmark sbl->sbl_txbuf = connp->conn_sndbuf;
14897c478bd9Sstevel@tonic-gate sbl->sbl_rxbuf = sctp->sctp_rwnd;
14907c478bd9Sstevel@tonic-gate sbl->sbl_rxlowat = SCTP_RECV_LOWATER;
14917c478bd9Sstevel@tonic-gate
14927c478bd9Sstevel@tonic-gate /* Insert this in the global list. */
1493f4b3ec61Sdh155122 SCTP_LINK(sctp, sctps);
14947c478bd9Sstevel@tonic-gate
14957c478bd9Sstevel@tonic-gate return (sctp);
14967c478bd9Sstevel@tonic-gate }
14977c478bd9Sstevel@tonic-gate
1498f4b3ec61Sdh155122 /* Run at module load time */
1499f4b3ec61Sdh155122 void
sctp_ddi_g_init(void)1500f4b3ec61Sdh155122 sctp_ddi_g_init(void)
1501f4b3ec61Sdh155122 {
15027c478bd9Sstevel@tonic-gate /* Create sctp_t/conn_t cache */
15037c478bd9Sstevel@tonic-gate sctp_conn_cache_init();
15047c478bd9Sstevel@tonic-gate
15057c478bd9Sstevel@tonic-gate /* Create the faddr cache */
15067c478bd9Sstevel@tonic-gate sctp_faddr_init();
15077c478bd9Sstevel@tonic-gate
15087c478bd9Sstevel@tonic-gate /* Create the sets cache */
15097c478bd9Sstevel@tonic-gate sctp_sets_init();
15107c478bd9Sstevel@tonic-gate
15117c478bd9Sstevel@tonic-gate /* Create the PR-SCTP sets cache */
15127c478bd9Sstevel@tonic-gate sctp_ftsn_sets_init();
15137c478bd9Sstevel@tonic-gate
15147c478bd9Sstevel@tonic-gate /* Initialize tables used for CRC calculation */
15157c478bd9Sstevel@tonic-gate sctp_crc32_init();
15167c478bd9Sstevel@tonic-gate
1517f4b3ec61Sdh155122 /*
1518f4b3ec61Sdh155122 * We want to be informed each time a stack is created or
1519f4b3ec61Sdh155122 * destroyed in the kernel, so we can maintain the
1520f4b3ec61Sdh155122 * set of sctp_stack_t's.
1521f4b3ec61Sdh155122 */
1522bd670b35SErik Nordmark netstack_register(NS_SCTP, sctp_stack_init, NULL, sctp_stack_fini);
15237c478bd9Sstevel@tonic-gate }
15247c478bd9Sstevel@tonic-gate
1525f4b3ec61Sdh155122 static void *
sctp_stack_init(netstackid_t stackid,netstack_t * ns)1526f4b3ec61Sdh155122 sctp_stack_init(netstackid_t stackid, netstack_t *ns)
15277c478bd9Sstevel@tonic-gate {
1528f4b3ec61Sdh155122 sctp_stack_t *sctps;
15296e91bba0SGirish Moodalbail size_t arrsz;
15305dd46ab5SKacheong Poon int i;
15317c478bd9Sstevel@tonic-gate
1532f4b3ec61Sdh155122 sctps = kmem_zalloc(sizeof (*sctps), KM_SLEEP);
1533f4b3ec61Sdh155122 sctps->sctps_netstack = ns;
1534f4b3ec61Sdh155122
1535f4b3ec61Sdh155122 /* Initialize locks */
1536f4b3ec61Sdh155122 mutex_init(&sctps->sctps_g_lock, NULL, MUTEX_DEFAULT, NULL);
1537f4b3ec61Sdh155122 mutex_init(&sctps->sctps_epriv_port_lock, NULL, MUTEX_DEFAULT, NULL);
1538f4b3ec61Sdh155122 sctps->sctps_g_num_epriv_ports = SCTP_NUM_EPRIV_PORTS;
15396e91bba0SGirish Moodalbail sctps->sctps_g_epriv_ports[0] = ULP_DEF_EPRIV_PORT1;
15406e91bba0SGirish Moodalbail sctps->sctps_g_epriv_ports[1] = ULP_DEF_EPRIV_PORT2;
1541f4b3ec61Sdh155122
1542f4b3ec61Sdh155122 /* Initialize SCTP hash arrays. */
1543f4b3ec61Sdh155122 sctp_hash_init(sctps);
1544f4b3ec61Sdh155122
15456e91bba0SGirish Moodalbail arrsz = sctp_propinfo_count * sizeof (mod_prop_info_t);
15466e91bba0SGirish Moodalbail sctps->sctps_propinfo_tbl = (mod_prop_info_t *)kmem_alloc(arrsz,
15476e91bba0SGirish Moodalbail KM_SLEEP);
15486e91bba0SGirish Moodalbail bcopy(sctp_propinfo_tbl, sctps->sctps_propinfo_tbl, arrsz);
1549f4b3ec61Sdh155122
1550f4b3ec61Sdh155122 /* saddr init */
1551f4b3ec61Sdh155122 sctp_saddr_init(sctps);
1552f4b3ec61Sdh155122
1553f4b3ec61Sdh155122 /* Global SCTP PCB list. */
1554f4b3ec61Sdh155122 list_create(&sctps->sctps_g_list, sizeof (sctp_t),
1555f4b3ec61Sdh155122 offsetof(sctp_t, sctp_list));
1556f4b3ec61Sdh155122
15575dd46ab5SKacheong Poon /* Initialize SCTP kstats. */
1558f4b3ec61Sdh155122 sctps->sctps_mibkp = sctp_kstat_init(stackid);
15595dd46ab5SKacheong Poon sctps->sctps_kstat = sctp_kstat2_init(stackid);
15605dd46ab5SKacheong Poon
15615dd46ab5SKacheong Poon mutex_init(&sctps->sctps_reclaim_lock, NULL, MUTEX_DEFAULT, NULL);
15625dd46ab5SKacheong Poon sctps->sctps_reclaim = B_FALSE;
15635dd46ab5SKacheong Poon sctps->sctps_reclaim_tid = 0;
15645dd46ab5SKacheong Poon sctps->sctps_reclaim_period = sctps->sctps_rto_maxg;
15655dd46ab5SKacheong Poon
15665dd46ab5SKacheong Poon /* Allocate the per netstack stats */
15675dd46ab5SKacheong Poon mutex_enter(&cpu_lock);
15685dd46ab5SKacheong Poon sctps->sctps_sc_cnt = MAX(ncpus, boot_ncpus);
15695dd46ab5SKacheong Poon mutex_exit(&cpu_lock);
15705dd46ab5SKacheong Poon sctps->sctps_sc = kmem_zalloc(max_ncpus * sizeof (sctp_stats_cpu_t *),
15715dd46ab5SKacheong Poon KM_SLEEP);
15725dd46ab5SKacheong Poon for (i = 0; i < sctps->sctps_sc_cnt; i++) {
15735dd46ab5SKacheong Poon sctps->sctps_sc[i] = kmem_zalloc(sizeof (sctp_stats_cpu_t),
15745dd46ab5SKacheong Poon KM_SLEEP);
15755dd46ab5SKacheong Poon }
15765dd46ab5SKacheong Poon
15775dd46ab5SKacheong Poon mutex_init(&sctps->sctps_listener_conf_lock, NULL, MUTEX_DEFAULT, NULL);
15785dd46ab5SKacheong Poon list_create(&sctps->sctps_listener_conf, sizeof (sctp_listener_t),
15795dd46ab5SKacheong Poon offsetof(sctp_listener_t, sl_link));
1580f4b3ec61Sdh155122
1581f4b3ec61Sdh155122 return (sctps);
1582f4b3ec61Sdh155122 }
1583f4b3ec61Sdh155122
1584f4b3ec61Sdh155122 /*
1585f4b3ec61Sdh155122 * Called when the module is about to be unloaded.
1586f4b3ec61Sdh155122 */
1587f4b3ec61Sdh155122 void
sctp_ddi_g_destroy(void)1588f4b3ec61Sdh155122 sctp_ddi_g_destroy(void)
1589f4b3ec61Sdh155122 {
15907c478bd9Sstevel@tonic-gate /* Destroy sctp_t/conn_t caches */
15917c478bd9Sstevel@tonic-gate sctp_conn_cache_fini();
15927c478bd9Sstevel@tonic-gate
15937c478bd9Sstevel@tonic-gate /* Destroy the faddr cache */
15947c478bd9Sstevel@tonic-gate sctp_faddr_fini();
15957c478bd9Sstevel@tonic-gate
15967c478bd9Sstevel@tonic-gate /* Destroy the sets cache */
15977c478bd9Sstevel@tonic-gate sctp_sets_fini();
15987c478bd9Sstevel@tonic-gate
15997c478bd9Sstevel@tonic-gate /* Destroy the PR-SCTP sets cache */
16007c478bd9Sstevel@tonic-gate sctp_ftsn_sets_fini();
16017c478bd9Sstevel@tonic-gate
1602f4b3ec61Sdh155122 netstack_unregister(NS_SCTP);
1603f4b3ec61Sdh155122 }
1604f4b3ec61Sdh155122
1605f4b3ec61Sdh155122 /*
1606f4b3ec61Sdh155122 * Free the SCTP stack instance.
1607f4b3ec61Sdh155122 */
1608f4b3ec61Sdh155122 static void
sctp_stack_fini(netstackid_t stackid,void * arg)1609f4b3ec61Sdh155122 sctp_stack_fini(netstackid_t stackid, void *arg)
1610f4b3ec61Sdh155122 {
1611f4b3ec61Sdh155122 sctp_stack_t *sctps = (sctp_stack_t *)arg;
16125dd46ab5SKacheong Poon int i;
16135dd46ab5SKacheong Poon
16145dd46ab5SKacheong Poon /*
16155dd46ab5SKacheong Poon * Set sctps_reclaim to false tells sctp_reclaim_timer() not to restart
16165dd46ab5SKacheong Poon * the timer.
16175dd46ab5SKacheong Poon */
16185dd46ab5SKacheong Poon mutex_enter(&sctps->sctps_reclaim_lock);
16195dd46ab5SKacheong Poon sctps->sctps_reclaim = B_FALSE;
16205dd46ab5SKacheong Poon mutex_exit(&sctps->sctps_reclaim_lock);
16215dd46ab5SKacheong Poon if (sctps->sctps_reclaim_tid != 0)
16225dd46ab5SKacheong Poon (void) untimeout(sctps->sctps_reclaim_tid);
16235dd46ab5SKacheong Poon mutex_destroy(&sctps->sctps_reclaim_lock);
16245dd46ab5SKacheong Poon
16255dd46ab5SKacheong Poon sctp_listener_conf_cleanup(sctps);
1626f4b3ec61Sdh155122
16276e91bba0SGirish Moodalbail kmem_free(sctps->sctps_propinfo_tbl,
16286e91bba0SGirish Moodalbail sctp_propinfo_count * sizeof (mod_prop_info_t));
16296e91bba0SGirish Moodalbail sctps->sctps_propinfo_tbl = NULL;
1630f4b3ec61Sdh155122
16317c478bd9Sstevel@tonic-gate /* Destroy the recvq taskqs. */
1632f4b3ec61Sdh155122 sctp_rq_tq_fini(sctps);
16337c478bd9Sstevel@tonic-gate
16347c478bd9Sstevel@tonic-gate /* Destroy saddr */
1635f4b3ec61Sdh155122 sctp_saddr_fini(sctps);
16367c478bd9Sstevel@tonic-gate
16377c478bd9Sstevel@tonic-gate /* Global SCTP PCB list. */
1638f4b3ec61Sdh155122 list_destroy(&sctps->sctps_g_list);
16397c478bd9Sstevel@tonic-gate
16407c478bd9Sstevel@tonic-gate /* Destroy SCTP hash arrays. */
1641f4b3ec61Sdh155122 sctp_hash_destroy(sctps);
16427c478bd9Sstevel@tonic-gate
1643f4b3ec61Sdh155122 /* Destroy SCTP kernel stats. */
16445dd46ab5SKacheong Poon for (i = 0; i < sctps->sctps_sc_cnt; i++)
16455dd46ab5SKacheong Poon kmem_free(sctps->sctps_sc[i], sizeof (sctp_stats_cpu_t));
16465dd46ab5SKacheong Poon kmem_free(sctps->sctps_sc, max_ncpus * sizeof (sctp_stats_cpu_t *));
16477c478bd9Sstevel@tonic-gate
1648f4b3ec61Sdh155122 sctp_kstat_fini(stackid, sctps->sctps_mibkp);
1649f4b3ec61Sdh155122 sctps->sctps_mibkp = NULL;
16505dd46ab5SKacheong Poon sctp_kstat2_fini(stackid, sctps->sctps_kstat);
16515dd46ab5SKacheong Poon sctps->sctps_kstat = NULL;
1652f4b3ec61Sdh155122
1653f4b3ec61Sdh155122 mutex_destroy(&sctps->sctps_g_lock);
1654f4b3ec61Sdh155122 mutex_destroy(&sctps->sctps_epriv_port_lock);
1655f4b3ec61Sdh155122
1656f4b3ec61Sdh155122 kmem_free(sctps, sizeof (*sctps));
16577c478bd9Sstevel@tonic-gate }
16587c478bd9Sstevel@tonic-gate
16597c478bd9Sstevel@tonic-gate static void
sctp_rq_tq_init(sctp_stack_t * sctps)1660f4b3ec61Sdh155122 sctp_rq_tq_init(sctp_stack_t *sctps)
16617c478bd9Sstevel@tonic-gate {
16625dd46ab5SKacheong Poon char tq_name[TASKQ_NAMELEN];
16635dd46ab5SKacheong Poon int thrs;
16645dd46ab5SKacheong Poon int max_tasks;
16655dd46ab5SKacheong Poon
1666a215d4ebSKacheong Poon mutex_enter(&sctps->sctps_g_lock);
1667a215d4ebSKacheong Poon /* Someone may have beaten us in creating the taskqs. */
1668a215d4ebSKacheong Poon if (sctps->sctps_recvq_tq_list_cur_sz > 0) {
1669a215d4ebSKacheong Poon mutex_exit(&sctps->sctps_g_lock);
1670a215d4ebSKacheong Poon return;
1671a215d4ebSKacheong Poon }
1672a215d4ebSKacheong Poon
16735dd46ab5SKacheong Poon thrs = MIN(sctp_recvq_tq_thr_max, MAX(sctp_recvq_tq_thr_min,
16745dd46ab5SKacheong Poon MAX(ncpus, boot_ncpus)));
16755dd46ab5SKacheong Poon /*
16765dd46ab5SKacheong Poon * Make sure that the maximum number of tasks is at least thrice as
16775dd46ab5SKacheong Poon * large as the number of threads.
16785dd46ab5SKacheong Poon */
16795dd46ab5SKacheong Poon max_tasks = MAX(sctp_recvq_tq_task_min, thrs) * 3;
16805dd46ab5SKacheong Poon
16815dd46ab5SKacheong Poon /*
16825dd46ab5SKacheong Poon * This helps differentiate the default taskqs in different IP stacks.
16835dd46ab5SKacheong Poon */
16845dd46ab5SKacheong Poon (void) snprintf(tq_name, sizeof (tq_name), "sctp_def_rq_taskq_%d",
16855dd46ab5SKacheong Poon sctps->sctps_netstack->netstack_stackid);
16865dd46ab5SKacheong Poon
16875dd46ab5SKacheong Poon sctps->sctps_recvq_tq_list_max_sz = sctp_recvq_tq_list_max;
1688f4b3ec61Sdh155122 sctps->sctps_recvq_tq_list_cur_sz = 1;
16895dd46ab5SKacheong Poon
16907c478bd9Sstevel@tonic-gate /*
16917c478bd9Sstevel@tonic-gate * Initialize the recvq_tq_list and create the first recvq taskq.
16927c478bd9Sstevel@tonic-gate * What to do if it fails?
16937c478bd9Sstevel@tonic-gate */
1694f4b3ec61Sdh155122 sctps->sctps_recvq_tq_list =
1695f4b3ec61Sdh155122 kmem_zalloc(sctps->sctps_recvq_tq_list_max_sz * sizeof (taskq_t *),
1696f4b3ec61Sdh155122 KM_SLEEP);
16975dd46ab5SKacheong Poon sctps->sctps_recvq_tq_list[0] = taskq_create(tq_name, thrs,
16985dd46ab5SKacheong Poon minclsyspri, sctp_recvq_tq_task_min, max_tasks, TASKQ_PREPOPULATE);
1699f4b3ec61Sdh155122 mutex_init(&sctps->sctps_rq_tq_lock, NULL, MUTEX_DEFAULT, NULL);
1700a215d4ebSKacheong Poon
1701a215d4ebSKacheong Poon mutex_exit(&sctps->sctps_g_lock);
17027c478bd9Sstevel@tonic-gate }
17037c478bd9Sstevel@tonic-gate
17047c478bd9Sstevel@tonic-gate static void
sctp_rq_tq_fini(sctp_stack_t * sctps)1705f4b3ec61Sdh155122 sctp_rq_tq_fini(sctp_stack_t *sctps)
17067c478bd9Sstevel@tonic-gate {
17077c478bd9Sstevel@tonic-gate int i;
17087c478bd9Sstevel@tonic-gate
17095dd46ab5SKacheong Poon if (sctps->sctps_recvq_tq_list_cur_sz == 0)
17105dd46ab5SKacheong Poon return;
17115dd46ab5SKacheong Poon
1712f4b3ec61Sdh155122 for (i = 0; i < sctps->sctps_recvq_tq_list_cur_sz; i++) {
1713f4b3ec61Sdh155122 ASSERT(sctps->sctps_recvq_tq_list[i] != NULL);
1714f4b3ec61Sdh155122 taskq_destroy(sctps->sctps_recvq_tq_list[i]);
17157c478bd9Sstevel@tonic-gate }
1716f4b3ec61Sdh155122 kmem_free(sctps->sctps_recvq_tq_list,
1717f4b3ec61Sdh155122 sctps->sctps_recvq_tq_list_max_sz * sizeof (taskq_t *));
1718f4b3ec61Sdh155122 sctps->sctps_recvq_tq_list = NULL;
17197c478bd9Sstevel@tonic-gate }
17207c478bd9Sstevel@tonic-gate
17217c478bd9Sstevel@tonic-gate /* Add another taskq for a new ill. */
17227c478bd9Sstevel@tonic-gate void
sctp_inc_taskq(sctp_stack_t * sctps)1723f4b3ec61Sdh155122 sctp_inc_taskq(sctp_stack_t *sctps)
17247c478bd9Sstevel@tonic-gate {
17257c478bd9Sstevel@tonic-gate taskq_t *tq;
17267c478bd9Sstevel@tonic-gate char tq_name[TASKQ_NAMELEN];
17275dd46ab5SKacheong Poon int thrs;
17285dd46ab5SKacheong Poon int max_tasks;
17295dd46ab5SKacheong Poon
17305dd46ab5SKacheong Poon thrs = MIN(sctp_recvq_tq_thr_max, MAX(sctp_recvq_tq_thr_min,
17315dd46ab5SKacheong Poon MAX(ncpus, boot_ncpus)));
17325dd46ab5SKacheong Poon /*
17335dd46ab5SKacheong Poon * Make sure that the maximum number of tasks is at least thrice as
17345dd46ab5SKacheong Poon * large as the number of threads.
17355dd46ab5SKacheong Poon */
17365dd46ab5SKacheong Poon max_tasks = MAX(sctp_recvq_tq_task_min, thrs) * 3;
17377c478bd9Sstevel@tonic-gate
1738f4b3ec61Sdh155122 mutex_enter(&sctps->sctps_rq_tq_lock);
1739f4b3ec61Sdh155122 if (sctps->sctps_recvq_tq_list_cur_sz + 1 >
1740f4b3ec61Sdh155122 sctps->sctps_recvq_tq_list_max_sz) {
1741f4b3ec61Sdh155122 mutex_exit(&sctps->sctps_rq_tq_lock);
17427c478bd9Sstevel@tonic-gate cmn_err(CE_NOTE, "Cannot create more SCTP recvq taskq");
17437c478bd9Sstevel@tonic-gate return;
17447c478bd9Sstevel@tonic-gate }
17457c478bd9Sstevel@tonic-gate
17465dd46ab5SKacheong Poon (void) snprintf(tq_name, sizeof (tq_name), "sctp_rq_taskq_%d_%u",
17475dd46ab5SKacheong Poon sctps->sctps_netstack->netstack_stackid,
1748f4b3ec61Sdh155122 sctps->sctps_recvq_tq_list_cur_sz);
17495dd46ab5SKacheong Poon tq = taskq_create(tq_name, thrs, minclsyspri, sctp_recvq_tq_task_min,
17505dd46ab5SKacheong Poon max_tasks, TASKQ_PREPOPULATE);
17517c478bd9Sstevel@tonic-gate if (tq == NULL) {
1752f4b3ec61Sdh155122 mutex_exit(&sctps->sctps_rq_tq_lock);
17537c478bd9Sstevel@tonic-gate cmn_err(CE_NOTE, "SCTP recvq taskq creation failed");
17547c478bd9Sstevel@tonic-gate return;
17557c478bd9Sstevel@tonic-gate }
1756f4b3ec61Sdh155122 ASSERT(sctps->sctps_recvq_tq_list[
1757f4b3ec61Sdh155122 sctps->sctps_recvq_tq_list_cur_sz] == NULL);
1758f4b3ec61Sdh155122 sctps->sctps_recvq_tq_list[sctps->sctps_recvq_tq_list_cur_sz] = tq;
1759*1a5e258fSJosef 'Jeff' Sipek atomic_inc_32(&sctps->sctps_recvq_tq_list_cur_sz);
1760f4b3ec61Sdh155122 mutex_exit(&sctps->sctps_rq_tq_lock);
17617c478bd9Sstevel@tonic-gate }
17627c478bd9Sstevel@tonic-gate
#ifdef DEBUG
/*
 * Debug-only statistics maintained by sctp_process_recvq():
 *
 *	recvq_call	number of times sctp_process_recvq() has run.
 *	recvq_loop_cnt	largest number of messages a single run has
 *			pulled off a receive queue.
 *
 * No dedicated lock protects these counters, so treat the values as
 * approximate.
 */
uint32_t recvq_call = 0;
uint32_t recvq_loop_cnt = 0;
#endif
17677c478bd9Sstevel@tonic-gate
17687c478bd9Sstevel@tonic-gate /*
17697c478bd9Sstevel@tonic-gate * Find the next recvq_tq to use. This routine will go thru all the
17707c478bd9Sstevel@tonic-gate * taskqs until it can dispatch a job for the sctp. If this fails,
17717c478bd9Sstevel@tonic-gate * it will create a new taskq and try it.
17727c478bd9Sstevel@tonic-gate */
17737c478bd9Sstevel@tonic-gate static boolean_t
sctp_find_next_tq(sctp_t * sctp)17747c478bd9Sstevel@tonic-gate sctp_find_next_tq(sctp_t *sctp)
17757c478bd9Sstevel@tonic-gate {
17767c478bd9Sstevel@tonic-gate int next_tq, try;
17777c478bd9Sstevel@tonic-gate taskq_t *tq;
1778f4b3ec61Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps;
17797c478bd9Sstevel@tonic-gate
17807c478bd9Sstevel@tonic-gate /*
17817c478bd9Sstevel@tonic-gate * Note that since we don't hold a lock on sctp_rq_tq_lock for
17827c478bd9Sstevel@tonic-gate * performance reason, recvq_ta_list_cur_sz can be changed during
17837c478bd9Sstevel@tonic-gate * this loop. The problem this will create is that the loop may
17847c478bd9Sstevel@tonic-gate * not have tried all the recvq_tq. This should be OK.
17857c478bd9Sstevel@tonic-gate */
1786*1a5e258fSJosef 'Jeff' Sipek next_tq = atomic_inc_32_nv(&sctps->sctps_recvq_tq_list_cur) %
1787f4b3ec61Sdh155122 sctps->sctps_recvq_tq_list_cur_sz;
1788f4b3ec61Sdh155122 for (try = 0; try < sctps->sctps_recvq_tq_list_cur_sz; try++) {
1789f4b3ec61Sdh155122 tq = sctps->sctps_recvq_tq_list[next_tq];
17907c478bd9Sstevel@tonic-gate if (taskq_dispatch(tq, sctp_process_recvq, sctp,
17917c478bd9Sstevel@tonic-gate TQ_NOSLEEP) != NULL) {
17927c478bd9Sstevel@tonic-gate sctp->sctp_recvq_tq = tq;
17937c478bd9Sstevel@tonic-gate return (B_TRUE);
17947c478bd9Sstevel@tonic-gate }
1795f4b3ec61Sdh155122 next_tq = (next_tq + 1) % sctps->sctps_recvq_tq_list_cur_sz;
17967c478bd9Sstevel@tonic-gate }
17977c478bd9Sstevel@tonic-gate
17987c478bd9Sstevel@tonic-gate /*
17997c478bd9Sstevel@tonic-gate * Create one more taskq and try it. Note that sctp_inc_taskq()
18007c478bd9Sstevel@tonic-gate * may not have created another taskq if the number of recvq
18017c478bd9Sstevel@tonic-gate * taskqs is at the maximum. We are probably in a pretty bad
18027c478bd9Sstevel@tonic-gate * shape if this actually happens...
18037c478bd9Sstevel@tonic-gate */
1804f4b3ec61Sdh155122 sctp_inc_taskq(sctps);
1805f4b3ec61Sdh155122 tq = sctps->sctps_recvq_tq_list[sctps->sctps_recvq_tq_list_cur_sz - 1];
18067c478bd9Sstevel@tonic-gate if (taskq_dispatch(tq, sctp_process_recvq, sctp, TQ_NOSLEEP) != NULL) {
18077c478bd9Sstevel@tonic-gate sctp->sctp_recvq_tq = tq;
18087c478bd9Sstevel@tonic-gate return (B_TRUE);
18097c478bd9Sstevel@tonic-gate }
1810f4b3ec61Sdh155122 SCTP_KSTAT(sctps, sctp_find_next_tq);
18117c478bd9Sstevel@tonic-gate return (B_FALSE);
18127c478bd9Sstevel@tonic-gate }
18137c478bd9Sstevel@tonic-gate
18147c478bd9Sstevel@tonic-gate /*
18157c478bd9Sstevel@tonic-gate * To add a message to the recvq. Note that the sctp_timer_fire()
18167c478bd9Sstevel@tonic-gate * routine also uses this function to add the timer message to the
18177c478bd9Sstevel@tonic-gate * receive queue for later processing. And it should be the only
18187c478bd9Sstevel@tonic-gate * caller of sctp_add_recvq() which sets the try_harder argument
18197c478bd9Sstevel@tonic-gate * to B_TRUE.
18207c478bd9Sstevel@tonic-gate *
18217c478bd9Sstevel@tonic-gate * If the try_harder argument is B_TRUE, this routine sctp_find_next_tq()
18227c478bd9Sstevel@tonic-gate * will try very hard to dispatch the task. Refer to the comment
18237c478bd9Sstevel@tonic-gate * for that routine on how it does that.
1824bd670b35SErik Nordmark *
1825bd670b35SErik Nordmark * On failure the message has been freed i.e., this routine always consumes the
1826bd670b35SErik Nordmark * message. It bumps ipIfStatsInDiscards and and uses ip_drop_input to drop.
18277c478bd9Sstevel@tonic-gate */
1828bd670b35SErik Nordmark void
sctp_add_recvq(sctp_t * sctp,mblk_t * mp,boolean_t caller_hold_lock,ip_recv_attr_t * ira)1829bd670b35SErik Nordmark sctp_add_recvq(sctp_t *sctp, mblk_t *mp, boolean_t caller_hold_lock,
1830bd670b35SErik Nordmark ip_recv_attr_t *ira)
18317c478bd9Sstevel@tonic-gate {
1832bd670b35SErik Nordmark mblk_t *attrmp;
1833bd670b35SErik Nordmark ip_stack_t *ipst = sctp->sctp_sctps->sctps_netstack->netstack_ip;
1834bd670b35SErik Nordmark
1835bd670b35SErik Nordmark ASSERT(ira->ira_ill == NULL);
1836bd670b35SErik Nordmark
18377c478bd9Sstevel@tonic-gate if (!caller_hold_lock)
18387c478bd9Sstevel@tonic-gate mutex_enter(&sctp->sctp_recvq_lock);
18397c478bd9Sstevel@tonic-gate
18407c478bd9Sstevel@tonic-gate /* If the taskq dispatch has not been scheduled, do it now. */
18417c478bd9Sstevel@tonic-gate if (sctp->sctp_recvq_tq == NULL) {
18427c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_recvq == NULL);
18437c478bd9Sstevel@tonic-gate if (!sctp_find_next_tq(sctp)) {
18447c478bd9Sstevel@tonic-gate if (!caller_hold_lock)
18457c478bd9Sstevel@tonic-gate mutex_exit(&sctp->sctp_recvq_lock);
1846bd670b35SErik Nordmark BUMP_MIB(&ipst->ips_ip_mib, ipIfStatsInDiscards);
1847bd670b35SErik Nordmark ip_drop_input("ipIfStatsInDiscards", mp, NULL);
1848bd670b35SErik Nordmark freemsg(mp);
1849bd670b35SErik Nordmark return;
18507c478bd9Sstevel@tonic-gate }
18517c478bd9Sstevel@tonic-gate /* Make sure the sctp_t will not go away. */
18527c478bd9Sstevel@tonic-gate SCTP_REFHOLD(sctp);
18537c478bd9Sstevel@tonic-gate }
18547c478bd9Sstevel@tonic-gate
1855bd670b35SErik Nordmark attrmp = ip_recv_attr_to_mblk(ira);
1856bd670b35SErik Nordmark if (attrmp == NULL) {
1857bd670b35SErik Nordmark if (!caller_hold_lock)
1858bd670b35SErik Nordmark mutex_exit(&sctp->sctp_recvq_lock);
1859bd670b35SErik Nordmark BUMP_MIB(&ipst->ips_ip_mib, ipIfStatsInDiscards);
1860bd670b35SErik Nordmark ip_drop_input("ipIfStatsInDiscards", mp, NULL);
1861bd670b35SErik Nordmark freemsg(mp);
1862bd670b35SErik Nordmark return;
1863bd670b35SErik Nordmark }
1864bd670b35SErik Nordmark ASSERT(attrmp->b_cont == NULL);
1865bd670b35SErik Nordmark attrmp->b_cont = mp;
1866bd670b35SErik Nordmark mp = attrmp;
1867bd670b35SErik Nordmark
18687c478bd9Sstevel@tonic-gate if (sctp->sctp_recvq == NULL) {
18697c478bd9Sstevel@tonic-gate sctp->sctp_recvq = mp;
18707c478bd9Sstevel@tonic-gate sctp->sctp_recvq_tail = mp;
18717c478bd9Sstevel@tonic-gate } else {
18727c478bd9Sstevel@tonic-gate sctp->sctp_recvq_tail->b_next = mp;
18737c478bd9Sstevel@tonic-gate sctp->sctp_recvq_tail = mp;
18747c478bd9Sstevel@tonic-gate }
18757c478bd9Sstevel@tonic-gate
18767c478bd9Sstevel@tonic-gate if (!caller_hold_lock)
18777c478bd9Sstevel@tonic-gate mutex_exit(&sctp->sctp_recvq_lock);
18787c478bd9Sstevel@tonic-gate }
18797c478bd9Sstevel@tonic-gate
18807c478bd9Sstevel@tonic-gate static void
sctp_process_recvq(void * arg)18817c478bd9Sstevel@tonic-gate sctp_process_recvq(void *arg)
18827c478bd9Sstevel@tonic-gate {
18837c478bd9Sstevel@tonic-gate sctp_t *sctp = (sctp_t *)arg;
18847c478bd9Sstevel@tonic-gate mblk_t *mp;
18857c478bd9Sstevel@tonic-gate #ifdef DEBUG
18867c478bd9Sstevel@tonic-gate uint32_t loop_cnt = 0;
18877c478bd9Sstevel@tonic-gate #endif
1888bd670b35SErik Nordmark ip_recv_attr_t iras;
18897c478bd9Sstevel@tonic-gate
18907c478bd9Sstevel@tonic-gate #ifdef _BIG_ENDIAN
18917c478bd9Sstevel@tonic-gate #define IPVER(ip6h) ((((uint32_t *)ip6h)[0] >> 28) & 0x7)
18927c478bd9Sstevel@tonic-gate #else
18937c478bd9Sstevel@tonic-gate #define IPVER(ip6h) ((((uint32_t *)ip6h)[0] >> 4) & 0x7)
18947c478bd9Sstevel@tonic-gate #endif
18957c478bd9Sstevel@tonic-gate
18967c478bd9Sstevel@tonic-gate RUN_SCTP(sctp);
18977c478bd9Sstevel@tonic-gate mutex_enter(&sctp->sctp_recvq_lock);
18987c478bd9Sstevel@tonic-gate
18997c478bd9Sstevel@tonic-gate #ifdef DEBUG
19007c478bd9Sstevel@tonic-gate recvq_call++;
19017c478bd9Sstevel@tonic-gate #endif
19027c478bd9Sstevel@tonic-gate /*
19037c478bd9Sstevel@tonic-gate * Note that while we are in this loop, other thread can put
19047c478bd9Sstevel@tonic-gate * new packets in the receive queue. We may be looping for
19057c478bd9Sstevel@tonic-gate * quite a while.
19067c478bd9Sstevel@tonic-gate */
19077c478bd9Sstevel@tonic-gate while ((mp = sctp->sctp_recvq) != NULL) {
1908bd670b35SErik Nordmark mblk_t *data_mp;
1909bd670b35SErik Nordmark
19107c478bd9Sstevel@tonic-gate sctp->sctp_recvq = mp->b_next;
19117c478bd9Sstevel@tonic-gate mutex_exit(&sctp->sctp_recvq_lock);
19127c478bd9Sstevel@tonic-gate mp->b_next = NULL;
19137c478bd9Sstevel@tonic-gate #ifdef DEBUG
19147c478bd9Sstevel@tonic-gate loop_cnt++;
19157c478bd9Sstevel@tonic-gate #endif
19167c478bd9Sstevel@tonic-gate mp->b_prev = NULL;
19177c478bd9Sstevel@tonic-gate
1918bd670b35SErik Nordmark data_mp = mp->b_cont;
1919bd670b35SErik Nordmark mp->b_cont = NULL;
1920bd670b35SErik Nordmark if (!ip_recv_attr_from_mblk(mp, &iras)) {
1921bd670b35SErik Nordmark ip_drop_input("ip_recv_attr_from_mblk", mp, NULL);
1922bd670b35SErik Nordmark freemsg(mp);
1923bd670b35SErik Nordmark ira_cleanup(&iras, B_TRUE);
1924bd670b35SErik Nordmark continue;
1925bd670b35SErik Nordmark }
1926bd670b35SErik Nordmark
1927bd670b35SErik Nordmark if (iras.ira_flags & IRAF_ICMP_ERROR)
1928bd670b35SErik Nordmark sctp_icmp_error(sctp, data_mp);
1929bd670b35SErik Nordmark else
1930bd670b35SErik Nordmark sctp_input_data(sctp, data_mp, &iras);
1931bd670b35SErik Nordmark
1932bd670b35SErik Nordmark ira_cleanup(&iras, B_TRUE);
19337c478bd9Sstevel@tonic-gate mutex_enter(&sctp->sctp_recvq_lock);
19347c478bd9Sstevel@tonic-gate }
19357c478bd9Sstevel@tonic-gate
19367c478bd9Sstevel@tonic-gate sctp->sctp_recvq_tail = NULL;
19377c478bd9Sstevel@tonic-gate sctp->sctp_recvq_tq = NULL;
19387c478bd9Sstevel@tonic-gate
19397c478bd9Sstevel@tonic-gate mutex_exit(&sctp->sctp_recvq_lock);
19407c478bd9Sstevel@tonic-gate
19417c478bd9Sstevel@tonic-gate WAKE_SCTP(sctp);
19427c478bd9Sstevel@tonic-gate
19437c478bd9Sstevel@tonic-gate #ifdef DEBUG
19447c478bd9Sstevel@tonic-gate if (loop_cnt > recvq_loop_cnt)
19457c478bd9Sstevel@tonic-gate recvq_loop_cnt = loop_cnt;
19467c478bd9Sstevel@tonic-gate #endif
19477c478bd9Sstevel@tonic-gate /* Now it can go away. */
19487c478bd9Sstevel@tonic-gate SCTP_REFRELE(sctp);
19497c478bd9Sstevel@tonic-gate }
19507c478bd9Sstevel@tonic-gate
19517c478bd9Sstevel@tonic-gate /* ARGSUSED */
19527c478bd9Sstevel@tonic-gate static int
sctp_conn_cache_constructor(void * buf,void * cdrarg,int kmflags)19537c478bd9Sstevel@tonic-gate sctp_conn_cache_constructor(void *buf, void *cdrarg, int kmflags)
19547c478bd9Sstevel@tonic-gate {
1955bd670b35SErik Nordmark conn_t *connp = (conn_t *)buf;
1956bd670b35SErik Nordmark sctp_t *sctp = (sctp_t *)&connp[1];
195792baa190SGeorge Shepherd int cnt;
19587c478bd9Sstevel@tonic-gate
1959bd670b35SErik Nordmark bzero(connp, sizeof (conn_t));
19607c478bd9Sstevel@tonic-gate bzero(buf, (char *)&sctp[1] - (char *)buf);
19617c478bd9Sstevel@tonic-gate
19627c478bd9Sstevel@tonic-gate mutex_init(&sctp->sctp_reflock, NULL, MUTEX_DEFAULT, NULL);
19637c478bd9Sstevel@tonic-gate mutex_init(&sctp->sctp_lock, NULL, MUTEX_DEFAULT, NULL);
19647c478bd9Sstevel@tonic-gate mutex_init(&sctp->sctp_recvq_lock, NULL, MUTEX_DEFAULT, NULL);
19657c478bd9Sstevel@tonic-gate cv_init(&sctp->sctp_cv, NULL, CV_DEFAULT, NULL);
196692baa190SGeorge Shepherd for (cnt = 0; cnt < SCTP_IPIF_HASH; cnt++) {
196792baa190SGeorge Shepherd rw_init(&sctp->sctp_saddrs[cnt].ipif_hash_lock, NULL,
196892baa190SGeorge Shepherd RW_DEFAULT, NULL);
196992baa190SGeorge Shepherd }
19707c478bd9Sstevel@tonic-gate
1971bd670b35SErik Nordmark mutex_init(&connp->conn_lock, NULL, MUTEX_DEFAULT, NULL);
1972bd670b35SErik Nordmark cv_init(&connp->conn_cv, NULL, CV_DEFAULT, NULL);
1973bd670b35SErik Nordmark connp->conn_flags = IPCL_SCTPCONN;
1974bd670b35SErik Nordmark connp->conn_proto = IPPROTO_SCTP;
1975bd670b35SErik Nordmark connp->conn_sctp = sctp;
1976bd670b35SErik Nordmark sctp->sctp_connp = connp;
1977bd670b35SErik Nordmark rw_init(&connp->conn_ilg_lock, NULL, RW_DEFAULT, NULL);
1978bd670b35SErik Nordmark
1979bd670b35SErik Nordmark connp->conn_ixa = kmem_zalloc(sizeof (ip_xmit_attr_t), kmflags);
1980bd670b35SErik Nordmark if (connp->conn_ixa == NULL) {
1981bd670b35SErik Nordmark return (ENOMEM);
1982bd670b35SErik Nordmark }
1983bd670b35SErik Nordmark connp->conn_ixa->ixa_refcnt = 1;
1984bd670b35SErik Nordmark connp->conn_ixa->ixa_protocol = connp->conn_proto;
1985bd670b35SErik Nordmark connp->conn_ixa->ixa_xmit_hint = CONN_TO_XMIT_HINT(connp);
19867c478bd9Sstevel@tonic-gate return (0);
19877c478bd9Sstevel@tonic-gate }
19887c478bd9Sstevel@tonic-gate
19897c478bd9Sstevel@tonic-gate /* ARGSUSED */
19907c478bd9Sstevel@tonic-gate static void
sctp_conn_cache_destructor(void * buf,void * cdrarg)19917c478bd9Sstevel@tonic-gate sctp_conn_cache_destructor(void *buf, void *cdrarg)
19927c478bd9Sstevel@tonic-gate {
1993bd670b35SErik Nordmark conn_t *connp = (conn_t *)buf;
1994bd670b35SErik Nordmark sctp_t *sctp = (sctp_t *)&connp[1];
199592baa190SGeorge Shepherd int cnt;
19967c478bd9Sstevel@tonic-gate
1997bd670b35SErik Nordmark ASSERT(sctp->sctp_connp == connp);
19987c478bd9Sstevel@tonic-gate ASSERT(!MUTEX_HELD(&sctp->sctp_lock));
19997c478bd9Sstevel@tonic-gate ASSERT(!MUTEX_HELD(&sctp->sctp_reflock));
20007c478bd9Sstevel@tonic-gate ASSERT(!MUTEX_HELD(&sctp->sctp_recvq_lock));
20017c478bd9Sstevel@tonic-gate
20027c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_conn_hash_next == NULL);
20037c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_conn_hash_prev == NULL);
20047c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_listen_hash_next == NULL);
20057c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_listen_hash_prev == NULL);
20067c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_listen_tfp == NULL);
20077c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_conn_tfp == NULL);
20087c478bd9Sstevel@tonic-gate
20097c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_faddrs == NULL);
20107c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_nsaddrs == 0);
20117c478bd9Sstevel@tonic-gate
20127c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_ulpd == NULL);
20137c478bd9Sstevel@tonic-gate
20147c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_lastfaddr == NULL);
20157c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_primary == NULL);
20167c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_current == NULL);
20177c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_lastdata == NULL);
20187c478bd9Sstevel@tonic-gate
20197c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_xmit_head == NULL);
20207c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_xmit_tail == NULL);
20217c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_xmit_unsent == NULL);
20227c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_xmit_unsent_tail == NULL);
20237c478bd9Sstevel@tonic-gate
20247c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_ostrcntrs == NULL);
20257c478bd9Sstevel@tonic-gate
20267c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_sack_info == NULL);
20277c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_ack_mp == NULL);
20287c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_instr == NULL);
20297c478bd9Sstevel@tonic-gate
20307c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_iphc == NULL);
20317c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_iphc6 == NULL);
20327c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_ipha == NULL);
20337c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_ip6h == NULL);
20347c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_sctph == NULL);
20357c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_sctph6 == NULL);
20367c478bd9Sstevel@tonic-gate
20377c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_cookie_mp == NULL);
20387c478bd9Sstevel@tonic-gate
20397c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_refcnt == 0);
20407c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_timer_mp == NULL);
20417c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_connp->conn_ref == 0);
20427c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_heartbeat_mp == NULL);
20437c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_ptpbhn == NULL && sctp->sctp_bind_hash == NULL);
20447c478bd9Sstevel@tonic-gate
20457c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_shutdown_faddr == NULL);
20467c478bd9Sstevel@tonic-gate
20477c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_cxmit_list == NULL);
20487c478bd9Sstevel@tonic-gate
20497c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_recvq == NULL);
20507c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_recvq_tail == NULL);
20517c478bd9Sstevel@tonic-gate ASSERT(sctp->sctp_recvq_tq == NULL);
20527c478bd9Sstevel@tonic-gate
2053121e5416Skcpoon /*
2054121e5416Skcpoon * sctp_pad_mp can be NULL if the memory allocation fails
2055121e5416Skcpoon * in sctp_init_values() and the conn_t is freed.
2056121e5416Skcpoon */
2057121e5416Skcpoon if (sctp->sctp_pad_mp != NULL) {
2058121e5416Skcpoon freeb(sctp->sctp_pad_mp);
2059121e5416Skcpoon sctp->sctp_pad_mp = NULL;
2060121e5416Skcpoon }
2061121e5416Skcpoon
20627c478bd9Sstevel@tonic-gate mutex_destroy(&sctp->sctp_reflock);
20637c478bd9Sstevel@tonic-gate mutex_destroy(&sctp->sctp_lock);
20647c478bd9Sstevel@tonic-gate mutex_destroy(&sctp->sctp_recvq_lock);
20657c478bd9Sstevel@tonic-gate cv_destroy(&sctp->sctp_cv);
206692baa190SGeorge Shepherd for (cnt = 0; cnt < SCTP_IPIF_HASH; cnt++) {
206792baa190SGeorge Shepherd rw_destroy(&sctp->sctp_saddrs[cnt].ipif_hash_lock);
206892baa190SGeorge Shepherd }
20697c478bd9Sstevel@tonic-gate
2070bd670b35SErik Nordmark mutex_destroy(&connp->conn_lock);
2071bd670b35SErik Nordmark cv_destroy(&connp->conn_cv);
2072bd670b35SErik Nordmark rw_destroy(&connp->conn_ilg_lock);
2073bd670b35SErik Nordmark
2074bd670b35SErik Nordmark /* Can be NULL if constructor failed */
2075bd670b35SErik Nordmark if (connp->conn_ixa != NULL) {
2076bd670b35SErik Nordmark ASSERT(connp->conn_ixa->ixa_refcnt == 1);
2077bd670b35SErik Nordmark ASSERT(connp->conn_ixa->ixa_ire == NULL);
2078bd670b35SErik Nordmark ASSERT(connp->conn_ixa->ixa_nce == NULL);
2079bd670b35SErik Nordmark ixa_refrele(connp->conn_ixa);
2080bd670b35SErik Nordmark }
20817c478bd9Sstevel@tonic-gate }
20827c478bd9Sstevel@tonic-gate
20837c478bd9Sstevel@tonic-gate static void
sctp_conn_cache_init()20847c478bd9Sstevel@tonic-gate sctp_conn_cache_init()
20857c478bd9Sstevel@tonic-gate {
20867c478bd9Sstevel@tonic-gate sctp_conn_cache = kmem_cache_create("sctp_conn_cache",
20877c478bd9Sstevel@tonic-gate sizeof (sctp_t) + sizeof (conn_t), 0, sctp_conn_cache_constructor,
20885dd46ab5SKacheong Poon sctp_conn_cache_destructor, sctp_conn_reclaim, NULL, NULL, 0);
20897c478bd9Sstevel@tonic-gate }
20907c478bd9Sstevel@tonic-gate
20917c478bd9Sstevel@tonic-gate static void
sctp_conn_cache_fini()20927c478bd9Sstevel@tonic-gate sctp_conn_cache_fini()
20937c478bd9Sstevel@tonic-gate {
20947c478bd9Sstevel@tonic-gate kmem_cache_destroy(sctp_conn_cache);
20957c478bd9Sstevel@tonic-gate }
2096121e5416Skcpoon
2097121e5416Skcpoon void
sctp_conn_init(conn_t * connp)2098121e5416Skcpoon sctp_conn_init(conn_t *connp)
2099121e5416Skcpoon {
2100bd670b35SErik Nordmark ASSERT(connp->conn_flags == IPCL_SCTPCONN);
2101121e5416Skcpoon connp->conn_rq = connp->conn_wq = NULL;
2102bd670b35SErik Nordmark connp->conn_ixa->ixa_flags |= IXAF_SET_ULP_CKSUM | IXAF_VERIFY_SOURCE |
2103bd670b35SErik Nordmark IXAF_VERIFY_PMTU;
2104bd670b35SErik Nordmark
2105bd670b35SErik Nordmark ASSERT(connp->conn_proto == IPPROTO_SCTP);
2106bd670b35SErik Nordmark ASSERT(connp->conn_ixa->ixa_protocol == connp->conn_proto);
2107121e5416Skcpoon connp->conn_state_flags |= CONN_INCIPIENT;
2108bd670b35SErik Nordmark
2109bd670b35SErik Nordmark ASSERT(connp->conn_sctp != NULL);
2110bd670b35SErik Nordmark
2111bd670b35SErik Nordmark /*
2112bd670b35SErik Nordmark * Register sctp_notify to listen to capability changes detected by IP.
2113bd670b35SErik Nordmark * This upcall is made in the context of the call to conn_ip_output
2114bd670b35SErik Nordmark * thus it holds whatever locks sctp holds across conn_ip_output.
2115bd670b35SErik Nordmark */
2116bd670b35SErik Nordmark connp->conn_ixa->ixa_notify = sctp_notify;
2117bd670b35SErik Nordmark connp->conn_ixa->ixa_notify_cookie = connp->conn_sctp;
2118121e5416Skcpoon }
2119121e5416Skcpoon
2120121e5416Skcpoon static void
sctp_conn_clear(conn_t * connp)2121121e5416Skcpoon sctp_conn_clear(conn_t *connp)
2122121e5416Skcpoon {
2123121e5416Skcpoon /* Clean up conn_t stuff */
2124bd670b35SErik Nordmark if (connp->conn_latch != NULL) {
2125bd670b35SErik Nordmark IPLATCH_REFRELE(connp->conn_latch);
2126bd670b35SErik Nordmark connp->conn_latch = NULL;
2127bd670b35SErik Nordmark }
2128bd670b35SErik Nordmark if (connp->conn_latch_in_policy != NULL) {
2129bd670b35SErik Nordmark IPPOL_REFRELE(connp->conn_latch_in_policy);
2130bd670b35SErik Nordmark connp->conn_latch_in_policy = NULL;
2131bd670b35SErik Nordmark }
2132bd670b35SErik Nordmark if (connp->conn_latch_in_action != NULL) {
2133bd670b35SErik Nordmark IPACT_REFRELE(connp->conn_latch_in_action);
2134bd670b35SErik Nordmark connp->conn_latch_in_action = NULL;
2135bd670b35SErik Nordmark }
2136bd670b35SErik Nordmark if (connp->conn_policy != NULL) {
2137121e5416Skcpoon IPPH_REFRELE(connp->conn_policy, connp->conn_netstack);
2138bd670b35SErik Nordmark connp->conn_policy = NULL;
2139bd670b35SErik Nordmark }
2140bd670b35SErik Nordmark if (connp->conn_ipsec_opt_mp != NULL) {
2141121e5416Skcpoon freemsg(connp->conn_ipsec_opt_mp);
2142bd670b35SErik Nordmark connp->conn_ipsec_opt_mp = NULL;
2143bd670b35SErik Nordmark }
2144121e5416Skcpoon netstack_rele(connp->conn_netstack);
2145bd670b35SErik Nordmark connp->conn_netstack = NULL;
2146bd670b35SErik Nordmark
2147bd670b35SErik Nordmark /* Leave conn_ixa and other constructed fields in place */
2148bd670b35SErik Nordmark ipcl_conn_cleanup(connp);
2149121e5416Skcpoon }
2150