xref: /freebsd/sys/netinet/sctp_timer.c (revision 1f4bcc459a76b7aa664f3fd557684cd0ba6da352)
1 /*-
2  * Copyright (c) 2001-2007, by Cisco Systems, Inc. All rights reserved.
3  * Copyright (c) 2008-2012, by Randall Stewart. All rights reserved.
4  * Copyright (c) 2008-2012, by Michael Tuexen. All rights reserved.
5  *
6  * Redistribution and use in source and binary forms, with or without
7  * modification, are permitted provided that the following conditions are met:
8  *
9  * a) Redistributions of source code must retain the above copyright notice,
10  *    this list of conditions and the following disclaimer.
11  *
12  * b) Redistributions in binary form must reproduce the above copyright
13  *    notice, this list of conditions and the following disclaimer in
14  *    the documentation and/or other materials provided with the distribution.
15  *
16  * c) Neither the name of Cisco Systems, Inc. nor the names of its
17  *    contributors may be used to endorse or promote products derived
18  *    from this software without specific prior written permission.
19  *
20  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
21  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
22  * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
23  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
24  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
25  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
26  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
27  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
28  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
29  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
30  * THE POSSIBILITY OF SUCH DAMAGE.
31  */
32 
33 #include <sys/cdefs.h>
34 __FBSDID("$FreeBSD$");
35 
36 #define _IP_VHL
37 #include <netinet/sctp_os.h>
38 #include <netinet/sctp_pcb.h>
39 #ifdef INET6
40 #endif
41 #include <netinet/sctp_var.h>
42 #include <netinet/sctp_sysctl.h>
43 #include <netinet/sctp_timer.h>
44 #include <netinet/sctputil.h>
45 #include <netinet/sctp_output.h>
46 #include <netinet/sctp_header.h>
47 #include <netinet/sctp_indata.h>
48 #include <netinet/sctp_asconf.h>
49 #include <netinet/sctp_input.h>
50 #include <netinet/sctp.h>
51 #include <netinet/sctp_uio.h>
52 #if defined(INET) || defined(INET6)
53 #include <netinet/udp.h>
54 #endif
55 
56 
57 void
58 sctp_audit_retranmission_queue(struct sctp_association *asoc)
59 {
60 	struct sctp_tmit_chunk *chk;
61 
62 	SCTPDBG(SCTP_DEBUG_TIMER4, "Audit invoked on send queue cnt:%d onqueue:%d\n",
63 	    asoc->sent_queue_retran_cnt,
64 	    asoc->sent_queue_cnt);
65 	asoc->sent_queue_retran_cnt = 0;
66 	asoc->sent_queue_cnt = 0;
67 	TAILQ_FOREACH(chk, &asoc->sent_queue, sctp_next) {
68 		if (chk->sent == SCTP_DATAGRAM_RESEND) {
69 			sctp_ucount_incr(asoc->sent_queue_retran_cnt);
70 		}
71 		asoc->sent_queue_cnt++;
72 	}
73 	TAILQ_FOREACH(chk, &asoc->control_send_queue, sctp_next) {
74 		if (chk->sent == SCTP_DATAGRAM_RESEND) {
75 			sctp_ucount_incr(asoc->sent_queue_retran_cnt);
76 		}
77 	}
78 	TAILQ_FOREACH(chk, &asoc->asconf_send_queue, sctp_next) {
79 		if (chk->sent == SCTP_DATAGRAM_RESEND) {
80 			sctp_ucount_incr(asoc->sent_queue_retran_cnt);
81 		}
82 	}
83 	SCTPDBG(SCTP_DEBUG_TIMER4, "Audit completes retran:%d onqueue:%d\n",
84 	    asoc->sent_queue_retran_cnt,
85 	    asoc->sent_queue_cnt);
86 }
87 
88 int
89 sctp_threshold_management(struct sctp_inpcb *inp, struct sctp_tcb *stcb,
90     struct sctp_nets *net, uint16_t threshold)
91 {
92 	if (net) {
93 		net->error_count++;
94 		SCTPDBG(SCTP_DEBUG_TIMER4, "Error count for %p now %d thresh:%d\n",
95 		    (void *)net, net->error_count,
96 		    net->failure_threshold);
97 		if (net->error_count > net->failure_threshold) {
98 			/* We had a threshold failure */
99 			if (net->dest_state & SCTP_ADDR_REACHABLE) {
100 				net->dest_state &= ~SCTP_ADDR_REACHABLE;
101 				net->dest_state &= ~SCTP_ADDR_REQ_PRIMARY;
102 				net->dest_state &= ~SCTP_ADDR_PF;
103 				sctp_ulp_notify(SCTP_NOTIFY_INTERFACE_DOWN,
104 				    stcb, 0,
105 				    (void *)net, SCTP_SO_NOT_LOCKED);
106 			}
107 		} else if ((net->pf_threshold < net->failure_threshold) &&
108 		    (net->error_count > net->pf_threshold)) {
109 			if (!(net->dest_state & SCTP_ADDR_PF)) {
110 				net->dest_state |= SCTP_ADDR_PF;
111 				net->last_active = sctp_get_tick_count();
112 				sctp_send_hb(stcb, net, SCTP_SO_NOT_LOCKED);
113 				sctp_timer_stop(SCTP_TIMER_TYPE_HEARTBEAT,
114 				    stcb->sctp_ep, stcb, net,
115 				    SCTP_FROM_SCTP_TIMER + SCTP_LOC_1);
116 				sctp_timer_start(SCTP_TIMER_TYPE_HEARTBEAT, stcb->sctp_ep, stcb, net);
117 			}
118 		}
119 	}
120 	if (stcb == NULL)
121 		return (0);
122 
123 	if (net) {
124 		if ((net->dest_state & SCTP_ADDR_UNCONFIRMED) == 0) {
125 			if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_THRESHOLD_LOGGING) {
126 				sctp_misc_ints(SCTP_THRESHOLD_INCR,
127 				    stcb->asoc.overall_error_count,
128 				    (stcb->asoc.overall_error_count + 1),
129 				    SCTP_FROM_SCTP_TIMER,
130 				    __LINE__);
131 			}
132 			stcb->asoc.overall_error_count++;
133 		}
134 	} else {
135 		if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_THRESHOLD_LOGGING) {
136 			sctp_misc_ints(SCTP_THRESHOLD_INCR,
137 			    stcb->asoc.overall_error_count,
138 			    (stcb->asoc.overall_error_count + 1),
139 			    SCTP_FROM_SCTP_TIMER,
140 			    __LINE__);
141 		}
142 		stcb->asoc.overall_error_count++;
143 	}
144 	SCTPDBG(SCTP_DEBUG_TIMER4, "Overall error count for %p now %d thresh:%u state:%x\n",
145 	    (void *)&stcb->asoc, stcb->asoc.overall_error_count,
146 	    (uint32_t) threshold,
147 	    ((net == NULL) ? (uint32_t) 0 : (uint32_t) net->dest_state));
148 	/*
149 	 * We specifically do not do >= to give the assoc one more change
150 	 * before we fail it.
151 	 */
152 	if (stcb->asoc.overall_error_count > threshold) {
153 		/* Abort notification sends a ULP notify */
154 		struct mbuf *op_err;
155 
156 		op_err = sctp_generate_cause(SCTP_BASE_SYSCTL(sctp_diag_info_code),
157 		    "Association error counter exceeded");
158 		inp->last_abort_code = SCTP_FROM_SCTP_TIMER + SCTP_LOC_2;
159 		sctp_abort_an_association(inp, stcb, op_err, SCTP_SO_NOT_LOCKED);
160 		return (1);
161 	}
162 	return (0);
163 }
164 
165 /*
166  * sctp_find_alternate_net() returns a non-NULL pointer as long
167  * the argument net is non-NULL.
168  */
169 struct sctp_nets *
170 sctp_find_alternate_net(struct sctp_tcb *stcb,
171     struct sctp_nets *net,
172     int mode)
173 {
174 	/* Find and return an alternate network if possible */
175 	struct sctp_nets *alt, *mnet, *min_errors_net = NULL, *max_cwnd_net = NULL;
176 	int once;
177 
178 	/* JRS 5/14/07 - Initialize min_errors to an impossible value. */
179 	int min_errors = -1;
180 	uint32_t max_cwnd = 0;
181 
182 	if (stcb->asoc.numnets == 1) {
183 		/* No others but net */
184 		return (TAILQ_FIRST(&stcb->asoc.nets));
185 	}
186 	/*
187 	 * JRS 5/14/07 - If mode is set to 2, use the CMT PF find alternate
188 	 * net algorithm. This algorithm chooses the active destination (not
189 	 * in PF state) with the largest cwnd value. If all destinations are
190 	 * in PF state, unreachable, or unconfirmed, choose the desination
191 	 * that is in PF state with the lowest error count. In case of a
192 	 * tie, choose the destination that was most recently active.
193 	 */
194 	if (mode == 2) {
195 		TAILQ_FOREACH(mnet, &stcb->asoc.nets, sctp_next) {
196 			/*
197 			 * JRS 5/14/07 - If the destination is unreachable
198 			 * or unconfirmed, skip it.
199 			 */
200 			if (((mnet->dest_state & SCTP_ADDR_REACHABLE) != SCTP_ADDR_REACHABLE) ||
201 			    (mnet->dest_state & SCTP_ADDR_UNCONFIRMED)) {
202 				continue;
203 			}
204 			/*
205 			 * JRS 5/14/07 -  If the destination is reachable
206 			 * but in PF state, compare the error count of the
207 			 * destination to the minimum error count seen thus
208 			 * far. Store the destination with the lower error
209 			 * count.  If the error counts are equal, store the
210 			 * destination that was most recently active.
211 			 */
212 			if (mnet->dest_state & SCTP_ADDR_PF) {
213 				/*
214 				 * JRS 5/14/07 - If the destination under
215 				 * consideration is the current destination,
216 				 * work as if the error count is one higher.
217 				 * The actual error count will not be
218 				 * incremented until later in the t3
219 				 * handler.
220 				 */
221 				if (mnet == net) {
222 					if (min_errors == -1) {
223 						min_errors = mnet->error_count + 1;
224 						min_errors_net = mnet;
225 					} else if (mnet->error_count + 1 < min_errors) {
226 						min_errors = mnet->error_count + 1;
227 						min_errors_net = mnet;
228 					} else if (mnet->error_count + 1 == min_errors
229 					    && mnet->last_active > min_errors_net->last_active) {
230 						min_errors_net = mnet;
231 						min_errors = mnet->error_count + 1;
232 					}
233 					continue;
234 				} else {
235 					if (min_errors == -1) {
236 						min_errors = mnet->error_count;
237 						min_errors_net = mnet;
238 					} else if (mnet->error_count < min_errors) {
239 						min_errors = mnet->error_count;
240 						min_errors_net = mnet;
241 					} else if (mnet->error_count == min_errors
242 					    && mnet->last_active > min_errors_net->last_active) {
243 						min_errors_net = mnet;
244 						min_errors = mnet->error_count;
245 					}
246 					continue;
247 				}
248 			}
249 			/*
250 			 * JRS 5/14/07 - If the destination is reachable and
251 			 * not in PF state, compare the cwnd of the
252 			 * destination to the highest cwnd seen thus far.
253 			 * Store the destination with the higher cwnd value.
254 			 * If the cwnd values are equal, randomly choose one
255 			 * of the two destinations.
256 			 */
257 			if (max_cwnd < mnet->cwnd) {
258 				max_cwnd_net = mnet;
259 				max_cwnd = mnet->cwnd;
260 			} else if (max_cwnd == mnet->cwnd) {
261 				uint32_t rndval;
262 				uint8_t this_random;
263 
264 				if (stcb->asoc.hb_random_idx > 3) {
265 					rndval = sctp_select_initial_TSN(&stcb->sctp_ep->sctp_ep);
266 					memcpy(stcb->asoc.hb_random_values, &rndval, sizeof(stcb->asoc.hb_random_values));
267 					this_random = stcb->asoc.hb_random_values[0];
268 					stcb->asoc.hb_random_idx++;
269 					stcb->asoc.hb_ect_randombit = 0;
270 				} else {
271 					this_random = stcb->asoc.hb_random_values[stcb->asoc.hb_random_idx];
272 					stcb->asoc.hb_random_idx++;
273 					stcb->asoc.hb_ect_randombit = 0;
274 				}
275 				if (this_random % 2 == 1) {
276 					max_cwnd_net = mnet;
277 					max_cwnd = mnet->cwnd;	/* Useless? */
278 				}
279 			}
280 		}
281 		if (max_cwnd_net == NULL) {
282 			if (min_errors_net == NULL) {
283 				return (net);
284 			}
285 			return (min_errors_net);
286 		} else {
287 			return (max_cwnd_net);
288 		}
289 	}
290 	/*
291 	 * JRS 5/14/07 - If mode is set to 1, use the CMT policy for
292 	 * choosing an alternate net.
293 	 */
294 	else if (mode == 1) {
295 		TAILQ_FOREACH(mnet, &stcb->asoc.nets, sctp_next) {
296 			if (((mnet->dest_state & SCTP_ADDR_REACHABLE) != SCTP_ADDR_REACHABLE) ||
297 			    (mnet->dest_state & SCTP_ADDR_UNCONFIRMED)) {
298 				/*
299 				 * will skip ones that are not-reachable or
300 				 * unconfirmed
301 				 */
302 				continue;
303 			}
304 			if (max_cwnd < mnet->cwnd) {
305 				max_cwnd_net = mnet;
306 				max_cwnd = mnet->cwnd;
307 			} else if (max_cwnd == mnet->cwnd) {
308 				uint32_t rndval;
309 				uint8_t this_random;
310 
311 				if (stcb->asoc.hb_random_idx > 3) {
312 					rndval = sctp_select_initial_TSN(&stcb->sctp_ep->sctp_ep);
313 					memcpy(stcb->asoc.hb_random_values, &rndval,
314 					    sizeof(stcb->asoc.hb_random_values));
315 					this_random = stcb->asoc.hb_random_values[0];
316 					stcb->asoc.hb_random_idx = 0;
317 					stcb->asoc.hb_ect_randombit = 0;
318 				} else {
319 					this_random = stcb->asoc.hb_random_values[stcb->asoc.hb_random_idx];
320 					stcb->asoc.hb_random_idx++;
321 					stcb->asoc.hb_ect_randombit = 0;
322 				}
323 				if (this_random % 2) {
324 					max_cwnd_net = mnet;
325 					max_cwnd = mnet->cwnd;
326 				}
327 			}
328 		}
329 		if (max_cwnd_net) {
330 			return (max_cwnd_net);
331 		}
332 	}
333 	mnet = net;
334 	once = 0;
335 
336 	if (mnet == NULL) {
337 		mnet = TAILQ_FIRST(&stcb->asoc.nets);
338 		if (mnet == NULL) {
339 			return (NULL);
340 		}
341 	}
342 	for (;;) {
343 		alt = TAILQ_NEXT(mnet, sctp_next);
344 		if (alt == NULL) {
345 			once++;
346 			if (once > 1) {
347 				break;
348 			}
349 			alt = TAILQ_FIRST(&stcb->asoc.nets);
350 			if (alt == NULL) {
351 				return (NULL);
352 			}
353 		}
354 		if (alt->ro.ro_rt == NULL) {
355 			if (alt->ro._s_addr) {
356 				sctp_free_ifa(alt->ro._s_addr);
357 				alt->ro._s_addr = NULL;
358 			}
359 			alt->src_addr_selected = 0;
360 		}
361 		if (((alt->dest_state & SCTP_ADDR_REACHABLE) == SCTP_ADDR_REACHABLE) &&
362 		    (alt->ro.ro_rt != NULL) &&
363 		    (!(alt->dest_state & SCTP_ADDR_UNCONFIRMED))) {
364 			/* Found a reachable address */
365 			break;
366 		}
367 		mnet = alt;
368 	}
369 
370 	if (alt == NULL) {
371 		/* Case where NO insv network exists (dormant state) */
372 		/* we rotate destinations */
373 		once = 0;
374 		mnet = net;
375 		for (;;) {
376 			if (mnet == NULL) {
377 				return (TAILQ_FIRST(&stcb->asoc.nets));
378 			}
379 			alt = TAILQ_NEXT(mnet, sctp_next);
380 			if (alt == NULL) {
381 				once++;
382 				if (once > 1) {
383 					break;
384 				}
385 				alt = TAILQ_FIRST(&stcb->asoc.nets);
386 				if (alt == NULL) {
387 					break;
388 				}
389 			}
390 			if ((!(alt->dest_state & SCTP_ADDR_UNCONFIRMED)) &&
391 			    (alt != net)) {
392 				/* Found an alternate address */
393 				break;
394 			}
395 			mnet = alt;
396 		}
397 	}
398 	if (alt == NULL) {
399 		return (net);
400 	}
401 	return (alt);
402 }
403 
404 static void
405 sctp_backoff_on_timeout(struct sctp_tcb *stcb,
406     struct sctp_nets *net,
407     int win_probe,
408     int num_marked, int num_abandoned)
409 {
410 	if (net->RTO == 0) {
411 		if (net->RTO_measured) {
412 			net->RTO = stcb->asoc.minrto;
413 		} else {
414 			net->RTO = stcb->asoc.initial_rto;
415 		}
416 	}
417 	net->RTO <<= 1;
418 	if (net->RTO > stcb->asoc.maxrto) {
419 		net->RTO = stcb->asoc.maxrto;
420 	}
421 	if ((win_probe == 0) && (num_marked || num_abandoned)) {
422 		/* We don't apply penalty to window probe scenarios */
423 		/* JRS - Use the congestion control given in the CC module */
424 		stcb->asoc.cc_functions.sctp_cwnd_update_after_timeout(stcb, net);
425 	}
426 }
427 
428 #ifndef INVARIANTS
429 static void
430 sctp_recover_sent_list(struct sctp_tcb *stcb)
431 {
432 	struct sctp_tmit_chunk *chk, *nchk;
433 	struct sctp_association *asoc;
434 
435 	asoc = &stcb->asoc;
436 	TAILQ_FOREACH_SAFE(chk, &asoc->sent_queue, sctp_next, nchk) {
437 		if (SCTP_TSN_GE(asoc->last_acked_seq, chk->rec.data.TSN_seq)) {
438 			SCTP_PRINTF("Found chk:%p tsn:%x <= last_acked_seq:%x\n",
439 			    (void *)chk, chk->rec.data.TSN_seq, asoc->last_acked_seq);
440 			if (chk->sent != SCTP_DATAGRAM_NR_ACKED) {
441 				if (asoc->strmout[chk->rec.data.stream_number].chunks_on_queues > 0) {
442 					asoc->strmout[chk->rec.data.stream_number].chunks_on_queues--;
443 				}
444 			}
445 			if ((asoc->strmout[chk->rec.data.stream_number].chunks_on_queues == 0) &&
446 			    (asoc->strmout[chk->rec.data.stream_number].state == SCTP_STREAM_RESET_PENDING) &&
447 			    TAILQ_EMPTY(&asoc->strmout[chk->rec.data.stream_number].outqueue)) {
448 				asoc->trigger_reset = 1;
449 			}
450 			TAILQ_REMOVE(&asoc->sent_queue, chk, sctp_next);
451 			if (PR_SCTP_ENABLED(chk->flags)) {
452 				if (asoc->pr_sctp_cnt != 0)
453 					asoc->pr_sctp_cnt--;
454 			}
455 			if (chk->data) {
456 				/* sa_ignore NO_NULL_CHK */
457 				sctp_free_bufspace(stcb, asoc, chk, 1);
458 				sctp_m_freem(chk->data);
459 				chk->data = NULL;
460 				if (asoc->prsctp_supported && PR_SCTP_BUF_ENABLED(chk->flags)) {
461 					asoc->sent_queue_cnt_removeable--;
462 				}
463 			}
464 			asoc->sent_queue_cnt--;
465 			sctp_free_a_chunk(stcb, chk, SCTP_SO_NOT_LOCKED);
466 		}
467 	}
468 	SCTP_PRINTF("after recover order is as follows\n");
469 	TAILQ_FOREACH(chk, &asoc->sent_queue, sctp_next) {
470 		SCTP_PRINTF("chk:%p TSN:%x\n", (void *)chk, chk->rec.data.TSN_seq);
471 	}
472 }
473 
474 #endif
475 
476 static int
477 sctp_mark_all_for_resend(struct sctp_tcb *stcb,
478     struct sctp_nets *net,
479     struct sctp_nets *alt,
480     int window_probe,
481     int *num_marked,
482     int *num_abandoned)
483 {
484 
485 	/*
486 	 * Mark all chunks (well not all) that were sent to *net for
487 	 * retransmission. Move them to alt for there destination as well...
488 	 * We only mark chunks that have been outstanding long enough to
489 	 * have received feed-back.
490 	 */
491 	struct sctp_tmit_chunk *chk, *nchk;
492 	struct sctp_nets *lnets;
493 	struct timeval now, min_wait, tv;
494 	int cur_rto;
495 	int cnt_abandoned;
496 	int audit_tf, num_mk, fir;
497 	unsigned int cnt_mk;
498 	uint32_t orig_flight, orig_tf;
499 	uint32_t tsnlast, tsnfirst;
500 	int recovery_cnt = 0;
501 
502 
503 	/* none in flight now */
504 	audit_tf = 0;
505 	fir = 0;
506 	/*
507 	 * figure out how long a data chunk must be pending before we can
508 	 * mark it ..
509 	 */
510 	(void)SCTP_GETTIME_TIMEVAL(&now);
511 	/* get cur rto in micro-seconds */
512 	cur_rto = (net->lastsa >> SCTP_RTT_SHIFT) + net->lastsv;
513 	cur_rto *= 1000;
514 	if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_FR_LOGGING_ENABLE) {
515 		sctp_log_fr(cur_rto,
516 		    stcb->asoc.peers_rwnd,
517 		    window_probe,
518 		    SCTP_FR_T3_MARK_TIME);
519 		sctp_log_fr(net->flight_size, 0, 0, SCTP_FR_CWND_REPORT);
520 		sctp_log_fr(net->flight_size, net->cwnd, stcb->asoc.total_flight, SCTP_FR_CWND_REPORT);
521 	}
522 	tv.tv_sec = cur_rto / 1000000;
523 	tv.tv_usec = cur_rto % 1000000;
524 	min_wait = now;
525 	timevalsub(&min_wait, &tv);
526 	if (min_wait.tv_sec < 0 || min_wait.tv_usec < 0) {
527 		/*
528 		 * if we hit here, we don't have enough seconds on the clock
529 		 * to account for the RTO. We just let the lower seconds be
530 		 * the bounds and don't worry about it. This may mean we
531 		 * will mark a lot more than we should.
532 		 */
533 		min_wait.tv_sec = min_wait.tv_usec = 0;
534 	}
535 	if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_FR_LOGGING_ENABLE) {
536 		sctp_log_fr(cur_rto, now.tv_sec, now.tv_usec, SCTP_FR_T3_MARK_TIME);
537 		sctp_log_fr(0, min_wait.tv_sec, min_wait.tv_usec, SCTP_FR_T3_MARK_TIME);
538 	}
539 	/*
540 	 * Our rwnd will be incorrect here since we are not adding back the
541 	 * cnt * mbuf but we will fix that down below.
542 	 */
543 	orig_flight = net->flight_size;
544 	orig_tf = stcb->asoc.total_flight;
545 
546 	net->fast_retran_ip = 0;
547 	/* Now on to each chunk */
548 	cnt_abandoned = 0;
549 	num_mk = cnt_mk = 0;
550 	tsnfirst = tsnlast = 0;
551 #ifndef INVARIANTS
552 start_again:
553 #endif
554 	TAILQ_FOREACH_SAFE(chk, &stcb->asoc.sent_queue, sctp_next, nchk) {
555 		if (SCTP_TSN_GE(stcb->asoc.last_acked_seq, chk->rec.data.TSN_seq)) {
556 			/* Strange case our list got out of order? */
557 			SCTP_PRINTF("Our list is out of order? last_acked:%x chk:%x\n",
558 			    (unsigned int)stcb->asoc.last_acked_seq, (unsigned int)chk->rec.data.TSN_seq);
559 			recovery_cnt++;
560 #ifdef INVARIANTS
561 			panic("last acked >= chk on sent-Q");
562 #else
563 			SCTP_PRINTF("Recover attempts a restart cnt:%d\n", recovery_cnt);
564 			sctp_recover_sent_list(stcb);
565 			if (recovery_cnt < 10) {
566 				goto start_again;
567 			} else {
568 				SCTP_PRINTF("Recovery fails %d times??\n", recovery_cnt);
569 			}
570 #endif
571 		}
572 		if ((chk->whoTo == net) && (chk->sent < SCTP_DATAGRAM_ACKED)) {
573 			/*
574 			 * found one to mark: If it is less than
575 			 * DATAGRAM_ACKED it MUST not be a skipped or marked
576 			 * TSN but instead one that is either already set
577 			 * for retransmission OR one that needs
578 			 * retransmission.
579 			 */
580 
581 			/* validate its been outstanding long enough */
582 			if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_FR_LOGGING_ENABLE) {
583 				sctp_log_fr(chk->rec.data.TSN_seq,
584 				    chk->sent_rcv_time.tv_sec,
585 				    chk->sent_rcv_time.tv_usec,
586 				    SCTP_FR_T3_MARK_TIME);
587 			}
588 			if ((chk->sent_rcv_time.tv_sec > min_wait.tv_sec) && (window_probe == 0)) {
589 				/*
590 				 * we have reached a chunk that was sent
591 				 * some seconds past our min.. forget it we
592 				 * will find no more to send.
593 				 */
594 				if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_FR_LOGGING_ENABLE) {
595 					sctp_log_fr(0,
596 					    chk->sent_rcv_time.tv_sec,
597 					    chk->sent_rcv_time.tv_usec,
598 					    SCTP_FR_T3_STOPPED);
599 				}
600 				continue;
601 			} else if ((chk->sent_rcv_time.tv_sec == min_wait.tv_sec) &&
602 			    (window_probe == 0)) {
603 				/*
604 				 * we must look at the micro seconds to
605 				 * know.
606 				 */
607 				if (chk->sent_rcv_time.tv_usec >= min_wait.tv_usec) {
608 					/*
609 					 * ok it was sent after our boundary
610 					 * time.
611 					 */
612 					continue;
613 				}
614 			}
615 			if (stcb->asoc.prsctp_supported && PR_SCTP_TTL_ENABLED(chk->flags)) {
616 				/* Is it expired? */
617 				if (timevalcmp(&now, &chk->rec.data.timetodrop, >)) {
618 					/* Yes so drop it */
619 					if (chk->data) {
620 						(void)sctp_release_pr_sctp_chunk(stcb,
621 						    chk,
622 						    1,
623 						    SCTP_SO_NOT_LOCKED);
624 						cnt_abandoned++;
625 					}
626 					continue;
627 				}
628 			}
629 			if (stcb->asoc.prsctp_supported && PR_SCTP_RTX_ENABLED(chk->flags)) {
630 				/* Has it been retransmitted tv_sec times? */
631 				if (chk->snd_count > chk->rec.data.timetodrop.tv_sec) {
632 					if (chk->data) {
633 						(void)sctp_release_pr_sctp_chunk(stcb,
634 						    chk,
635 						    1,
636 						    SCTP_SO_NOT_LOCKED);
637 						cnt_abandoned++;
638 					}
639 					continue;
640 				}
641 			}
642 			if (chk->sent < SCTP_DATAGRAM_RESEND) {
643 				sctp_ucount_incr(stcb->asoc.sent_queue_retran_cnt);
644 				num_mk++;
645 				if (fir == 0) {
646 					fir = 1;
647 					tsnfirst = chk->rec.data.TSN_seq;
648 				}
649 				tsnlast = chk->rec.data.TSN_seq;
650 				if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_FR_LOGGING_ENABLE) {
651 					sctp_log_fr(chk->rec.data.TSN_seq, chk->snd_count,
652 					    0, SCTP_FR_T3_MARKED);
653 				}
654 				if (chk->rec.data.chunk_was_revoked) {
655 					/* deflate the cwnd */
656 					chk->whoTo->cwnd -= chk->book_size;
657 					chk->rec.data.chunk_was_revoked = 0;
658 				}
659 				net->marked_retrans++;
660 				stcb->asoc.marked_retrans++;
661 				if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_FLIGHT_LOGGING_ENABLE) {
662 					sctp_misc_ints(SCTP_FLIGHT_LOG_DOWN_RSND_TO,
663 					    chk->whoTo->flight_size,
664 					    chk->book_size,
665 					    (uintptr_t) chk->whoTo,
666 					    chk->rec.data.TSN_seq);
667 				}
668 				sctp_flight_size_decrease(chk);
669 				sctp_total_flight_decrease(stcb, chk);
670 				stcb->asoc.peers_rwnd += chk->send_size;
671 				stcb->asoc.peers_rwnd += SCTP_BASE_SYSCTL(sctp_peer_chunk_oh);
672 			}
673 			chk->sent = SCTP_DATAGRAM_RESEND;
674 			SCTP_STAT_INCR(sctps_markedretrans);
675 
676 			/* reset the TSN for striking and other FR stuff */
677 			chk->rec.data.doing_fast_retransmit = 0;
678 			/* Clear any time so NO RTT is being done */
679 
680 			if (chk->do_rtt) {
681 				if (chk->whoTo->rto_needed == 0) {
682 					chk->whoTo->rto_needed = 1;
683 				}
684 			}
685 			chk->do_rtt = 0;
686 			if (alt != net) {
687 				sctp_free_remote_addr(chk->whoTo);
688 				chk->no_fr_allowed = 1;
689 				chk->whoTo = alt;
690 				atomic_add_int(&alt->ref_count, 1);
691 			} else {
692 				chk->no_fr_allowed = 0;
693 				if (TAILQ_EMPTY(&stcb->asoc.send_queue)) {
694 					chk->rec.data.fast_retran_tsn = stcb->asoc.sending_seq;
695 				} else {
696 					chk->rec.data.fast_retran_tsn = (TAILQ_FIRST(&stcb->asoc.send_queue))->rec.data.TSN_seq;
697 				}
698 			}
699 			/*
700 			 * CMT: Do not allow FRs on retransmitted TSNs.
701 			 */
702 			if (stcb->asoc.sctp_cmt_on_off > 0) {
703 				chk->no_fr_allowed = 1;
704 			}
705 #ifdef THIS_SHOULD_NOT_BE_DONE
706 		} else if (chk->sent == SCTP_DATAGRAM_ACKED) {
707 			/* remember highest acked one */
708 			could_be_sent = chk;
709 #endif
710 		}
711 		if (chk->sent == SCTP_DATAGRAM_RESEND) {
712 			cnt_mk++;
713 		}
714 	}
715 	if ((orig_flight - net->flight_size) != (orig_tf - stcb->asoc.total_flight)) {
716 		/* we did not subtract the same things? */
717 		audit_tf = 1;
718 	}
719 	if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_FR_LOGGING_ENABLE) {
720 		sctp_log_fr(tsnfirst, tsnlast, num_mk, SCTP_FR_T3_TIMEOUT);
721 	}
722 #ifdef SCTP_DEBUG
723 	if (num_mk) {
724 		SCTPDBG(SCTP_DEBUG_TIMER1, "LAST TSN marked was %x\n",
725 		    tsnlast);
726 		SCTPDBG(SCTP_DEBUG_TIMER1, "Num marked for retransmission was %d peer-rwd:%ld\n",
727 		    num_mk, (u_long)stcb->asoc.peers_rwnd);
728 		SCTPDBG(SCTP_DEBUG_TIMER1, "LAST TSN marked was %x\n",
729 		    tsnlast);
730 		SCTPDBG(SCTP_DEBUG_TIMER1, "Num marked for retransmission was %d peer-rwd:%d\n",
731 		    num_mk,
732 		    (int)stcb->asoc.peers_rwnd);
733 	}
734 #endif
735 	*num_marked = num_mk;
736 	*num_abandoned = cnt_abandoned;
737 	/*
738 	 * Now check for a ECN Echo that may be stranded And include the
739 	 * cnt_mk'd to have all resends in the control queue.
740 	 */
741 	TAILQ_FOREACH(chk, &stcb->asoc.control_send_queue, sctp_next) {
742 		if (chk->sent == SCTP_DATAGRAM_RESEND) {
743 			cnt_mk++;
744 		}
745 		if ((chk->whoTo == net) &&
746 		    (chk->rec.chunk_id.id == SCTP_ECN_ECHO)) {
747 			sctp_free_remote_addr(chk->whoTo);
748 			chk->whoTo = alt;
749 			if (chk->sent != SCTP_DATAGRAM_RESEND) {
750 				chk->sent = SCTP_DATAGRAM_RESEND;
751 				sctp_ucount_incr(stcb->asoc.sent_queue_retran_cnt);
752 				cnt_mk++;
753 			}
754 			atomic_add_int(&alt->ref_count, 1);
755 		}
756 	}
757 #ifdef THIS_SHOULD_NOT_BE_DONE
758 	if ((stcb->asoc.sent_queue_retran_cnt == 0) && (could_be_sent)) {
759 		/* fix it so we retransmit the highest acked anyway */
760 		sctp_ucount_incr(stcb->asoc.sent_queue_retran_cnt);
761 		cnt_mk++;
762 		could_be_sent->sent = SCTP_DATAGRAM_RESEND;
763 	}
764 #endif
765 	if (stcb->asoc.sent_queue_retran_cnt != cnt_mk) {
766 #ifdef INVARIANTS
767 		SCTP_PRINTF("Local Audit says there are %d for retran asoc cnt:%d we marked:%d this time\n",
768 		    cnt_mk, stcb->asoc.sent_queue_retran_cnt, num_mk);
769 #endif
770 #ifndef SCTP_AUDITING_ENABLED
771 		stcb->asoc.sent_queue_retran_cnt = cnt_mk;
772 #endif
773 	}
774 	if (audit_tf) {
775 		SCTPDBG(SCTP_DEBUG_TIMER4,
776 		    "Audit total flight due to negative value net:%p\n",
777 		    (void *)net);
778 		stcb->asoc.total_flight = 0;
779 		stcb->asoc.total_flight_count = 0;
780 		/* Clear all networks flight size */
781 		TAILQ_FOREACH(lnets, &stcb->asoc.nets, sctp_next) {
782 			lnets->flight_size = 0;
783 			SCTPDBG(SCTP_DEBUG_TIMER4,
784 			    "Net:%p c-f cwnd:%d ssthresh:%d\n",
785 			    (void *)lnets, lnets->cwnd, lnets->ssthresh);
786 		}
787 		TAILQ_FOREACH(chk, &stcb->asoc.sent_queue, sctp_next) {
788 			if (chk->sent < SCTP_DATAGRAM_RESEND) {
789 				if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_FLIGHT_LOGGING_ENABLE) {
790 					sctp_misc_ints(SCTP_FLIGHT_LOG_UP,
791 					    chk->whoTo->flight_size,
792 					    chk->book_size,
793 					    (uintptr_t) chk->whoTo,
794 					    chk->rec.data.TSN_seq);
795 				}
796 				sctp_flight_size_increase(chk);
797 				sctp_total_flight_increase(stcb, chk);
798 			}
799 		}
800 	}
801 	/* We return 1 if we only have a window probe outstanding */
802 	return (0);
803 }
804 
805 
806 int
807 sctp_t3rxt_timer(struct sctp_inpcb *inp,
808     struct sctp_tcb *stcb,
809     struct sctp_nets *net)
810 {
811 	struct sctp_nets *alt;
812 	int win_probe, num_mk, num_abandoned;
813 
814 	if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_FR_LOGGING_ENABLE) {
815 		sctp_log_fr(0, 0, 0, SCTP_FR_T3_TIMEOUT);
816 	}
817 	if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_CWND_LOGGING_ENABLE) {
818 		struct sctp_nets *lnet;
819 
820 		TAILQ_FOREACH(lnet, &stcb->asoc.nets, sctp_next) {
821 			if (net == lnet) {
822 				sctp_log_cwnd(stcb, lnet, 1, SCTP_CWND_LOG_FROM_T3);
823 			} else {
824 				sctp_log_cwnd(stcb, lnet, 0, SCTP_CWND_LOG_FROM_T3);
825 			}
826 		}
827 	}
828 	/* Find an alternate and mark those for retransmission */
829 	if ((stcb->asoc.peers_rwnd == 0) &&
830 	    (stcb->asoc.total_flight < net->mtu)) {
831 		SCTP_STAT_INCR(sctps_timowindowprobe);
832 		win_probe = 1;
833 	} else {
834 		win_probe = 0;
835 	}
836 
837 	if (win_probe == 0) {
838 		/* We don't do normal threshold management on window probes */
839 		if (sctp_threshold_management(inp, stcb, net,
840 		    stcb->asoc.max_send_times)) {
841 			/* Association was destroyed */
842 			return (1);
843 		} else {
844 			if (net != stcb->asoc.primary_destination) {
845 				/* send a immediate HB if our RTO is stale */
846 				struct timeval now;
847 				unsigned int ms_goneby;
848 
849 				(void)SCTP_GETTIME_TIMEVAL(&now);
850 				if (net->last_sent_time.tv_sec) {
851 					ms_goneby = (now.tv_sec - net->last_sent_time.tv_sec) * 1000;
852 				} else {
853 					ms_goneby = 0;
854 				}
855 				if ((net->dest_state & SCTP_ADDR_PF) == 0) {
856 					if ((ms_goneby > net->RTO) || (net->RTO == 0)) {
857 						/*
858 						 * no recent feed back in an
859 						 * RTO or more, request a
860 						 * RTT update
861 						 */
862 						sctp_send_hb(stcb, net, SCTP_SO_NOT_LOCKED);
863 					}
864 				}
865 			}
866 		}
867 	} else {
868 		/*
869 		 * For a window probe we don't penalize the net's but only
870 		 * the association. This may fail it if SACKs are not coming
871 		 * back. If sack's are coming with rwnd locked at 0, we will
872 		 * continue to hold things waiting for rwnd to raise
873 		 */
874 		if (sctp_threshold_management(inp, stcb, NULL,
875 		    stcb->asoc.max_send_times)) {
876 			/* Association was destroyed */
877 			return (1);
878 		}
879 	}
880 	if (stcb->asoc.sctp_cmt_on_off > 0) {
881 		if (net->pf_threshold < net->failure_threshold) {
882 			alt = sctp_find_alternate_net(stcb, net, 2);
883 		} else {
884 			/*
885 			 * CMT: Using RTX_SSTHRESH policy for CMT. If CMT is
886 			 * being used, then pick dest with largest ssthresh
887 			 * for any retransmission.
888 			 */
889 			alt = sctp_find_alternate_net(stcb, net, 1);
890 			/*
891 			 * CUCv2: If a different dest is picked for the
892 			 * retransmission, then new (rtx-)pseudo_cumack
893 			 * needs to be tracked for orig dest. Let CUCv2
894 			 * track new (rtx-) pseudo-cumack always.
895 			 */
896 			net->find_pseudo_cumack = 1;
897 			net->find_rtx_pseudo_cumack = 1;
898 		}
899 	} else {
900 		alt = sctp_find_alternate_net(stcb, net, 0);
901 	}
902 
903 	num_mk = 0;
904 	num_abandoned = 0;
905 	(void)sctp_mark_all_for_resend(stcb, net, alt, win_probe,
906 	    &num_mk, &num_abandoned);
907 	/* FR Loss recovery just ended with the T3. */
908 	stcb->asoc.fast_retran_loss_recovery = 0;
909 
910 	/* CMT FR loss recovery ended with the T3 */
911 	net->fast_retran_loss_recovery = 0;
912 	if ((stcb->asoc.cc_functions.sctp_cwnd_new_transmission_begins) &&
913 	    (net->flight_size == 0)) {
914 		(*stcb->asoc.cc_functions.sctp_cwnd_new_transmission_begins) (stcb, net);
915 	}
916 	/*
917 	 * setup the sat loss recovery that prevents satellite cwnd advance.
918 	 */
919 	stcb->asoc.sat_t3_loss_recovery = 1;
920 	stcb->asoc.sat_t3_recovery_tsn = stcb->asoc.sending_seq;
921 
922 	/* Backoff the timer and cwnd */
923 	sctp_backoff_on_timeout(stcb, net, win_probe, num_mk, num_abandoned);
924 	if ((!(net->dest_state & SCTP_ADDR_REACHABLE)) ||
925 	    (net->dest_state & SCTP_ADDR_PF)) {
926 		/* Move all pending over too */
927 		sctp_move_chunks_from_net(stcb, net);
928 
929 		/*
930 		 * Get the address that failed, to force a new src address
931 		 * selecton and a route allocation.
932 		 */
933 		if (net->ro._s_addr) {
934 			sctp_free_ifa(net->ro._s_addr);
935 			net->ro._s_addr = NULL;
936 		}
937 		net->src_addr_selected = 0;
938 
939 		/* Force a route allocation too */
940 		if (net->ro.ro_rt) {
941 			RTFREE(net->ro.ro_rt);
942 			net->ro.ro_rt = NULL;
943 		}
944 		/* Was it our primary? */
945 		if ((stcb->asoc.primary_destination == net) && (alt != net)) {
946 			/*
947 			 * Yes, note it as such and find an alternate note:
948 			 * this means HB code must use this to resent the
949 			 * primary if it goes active AND if someone does a
950 			 * change-primary then this flag must be cleared
951 			 * from any net structures.
952 			 */
953 			if (stcb->asoc.alternate) {
954 				sctp_free_remote_addr(stcb->asoc.alternate);
955 			}
956 			stcb->asoc.alternate = alt;
957 			atomic_add_int(&stcb->asoc.alternate->ref_count, 1);
958 		}
959 	}
960 	/*
961 	 * Special case for cookie-echo'ed case, we don't do output but must
962 	 * await the COOKIE-ACK before retransmission
963 	 */
964 	if (SCTP_GET_STATE(&stcb->asoc) == SCTP_STATE_COOKIE_ECHOED) {
965 		/*
966 		 * Here we just reset the timer and start again since we
967 		 * have not established the asoc
968 		 */
969 		sctp_timer_start(SCTP_TIMER_TYPE_SEND, inp, stcb, net);
970 		return (0);
971 	}
972 	if (stcb->asoc.prsctp_supported) {
973 		struct sctp_tmit_chunk *lchk;
974 
975 		lchk = sctp_try_advance_peer_ack_point(stcb, &stcb->asoc);
976 		/* C3. See if we need to send a Fwd-TSN */
977 		if (SCTP_TSN_GT(stcb->asoc.advanced_peer_ack_point, stcb->asoc.last_acked_seq)) {
978 			send_forward_tsn(stcb, &stcb->asoc);
979 			if (lchk) {
980 				/* Assure a timer is up */
981 				sctp_timer_start(SCTP_TIMER_TYPE_SEND, stcb->sctp_ep, stcb, lchk->whoTo);
982 			}
983 		}
984 	}
985 	if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_CWND_MONITOR_ENABLE) {
986 		sctp_log_cwnd(stcb, net, net->cwnd, SCTP_CWND_LOG_FROM_RTX);
987 	}
988 	return (0);
989 }
990 
991 int
992 sctp_t1init_timer(struct sctp_inpcb *inp,
993     struct sctp_tcb *stcb,
994     struct sctp_nets *net)
995 {
996 	/* bump the thresholds */
997 	if (stcb->asoc.delayed_connection) {
998 		/*
999 		 * special hook for delayed connection. The library did NOT
1000 		 * complete the rest of its sends.
1001 		 */
1002 		stcb->asoc.delayed_connection = 0;
1003 		sctp_send_initiate(inp, stcb, SCTP_SO_NOT_LOCKED);
1004 		return (0);
1005 	}
1006 	if (SCTP_GET_STATE((&stcb->asoc)) != SCTP_STATE_COOKIE_WAIT) {
1007 		return (0);
1008 	}
1009 	if (sctp_threshold_management(inp, stcb, net,
1010 	    stcb->asoc.max_init_times)) {
1011 		/* Association was destroyed */
1012 		return (1);
1013 	}
1014 	stcb->asoc.dropped_special_cnt = 0;
1015 	sctp_backoff_on_timeout(stcb, stcb->asoc.primary_destination, 1, 0, 0);
1016 	if (stcb->asoc.initial_init_rto_max < net->RTO) {
1017 		net->RTO = stcb->asoc.initial_init_rto_max;
1018 	}
1019 	if (stcb->asoc.numnets > 1) {
1020 		/* If we have more than one addr use it */
1021 		struct sctp_nets *alt;
1022 
1023 		alt = sctp_find_alternate_net(stcb, stcb->asoc.primary_destination, 0);
1024 		if (alt != stcb->asoc.primary_destination) {
1025 			sctp_move_chunks_from_net(stcb, stcb->asoc.primary_destination);
1026 			stcb->asoc.primary_destination = alt;
1027 		}
1028 	}
1029 	/* Send out a new init */
1030 	sctp_send_initiate(inp, stcb, SCTP_SO_NOT_LOCKED);
1031 	return (0);
1032 }
1033 
1034 /*
1035  * For cookie and asconf we actually need to find and mark for resend, then
1036  * increment the resend counter (after all the threshold management stuff of
1037  * course).
1038  */
1039 int
1040 sctp_cookie_timer(struct sctp_inpcb *inp,
1041     struct sctp_tcb *stcb,
1042     struct sctp_nets *net SCTP_UNUSED)
1043 {
1044 	struct sctp_nets *alt;
1045 	struct sctp_tmit_chunk *cookie;
1046 
1047 	/* first before all else we must find the cookie */
1048 	TAILQ_FOREACH(cookie, &stcb->asoc.control_send_queue, sctp_next) {
1049 		if (cookie->rec.chunk_id.id == SCTP_COOKIE_ECHO) {
1050 			break;
1051 		}
1052 	}
1053 	if (cookie == NULL) {
1054 		if (SCTP_GET_STATE(&stcb->asoc) == SCTP_STATE_COOKIE_ECHOED) {
1055 			/* FOOBAR! */
1056 			struct mbuf *op_err;
1057 
1058 			op_err = sctp_generate_cause(SCTP_BASE_SYSCTL(sctp_diag_info_code),
1059 			    "Cookie timer expired, but no cookie");
1060 			inp->last_abort_code = SCTP_FROM_SCTP_TIMER + SCTP_LOC_3;
1061 			sctp_abort_an_association(inp, stcb, op_err, SCTP_SO_NOT_LOCKED);
1062 		} else {
1063 #ifdef INVARIANTS
1064 			panic("Cookie timer expires in wrong state?");
1065 #else
1066 			SCTP_PRINTF("Strange in state %d not cookie-echoed yet c-e timer expires?\n", SCTP_GET_STATE(&stcb->asoc));
1067 			return (0);
1068 #endif
1069 		}
1070 		return (0);
1071 	}
1072 	/* Ok we found the cookie, threshold management next */
1073 	if (sctp_threshold_management(inp, stcb, cookie->whoTo,
1074 	    stcb->asoc.max_init_times)) {
1075 		/* Assoc is over */
1076 		return (1);
1077 	}
1078 	/*
1079 	 * cleared theshold management now lets backoff the address & select
1080 	 * an alternate
1081 	 */
1082 	stcb->asoc.dropped_special_cnt = 0;
1083 	sctp_backoff_on_timeout(stcb, cookie->whoTo, 1, 0, 0);
1084 	alt = sctp_find_alternate_net(stcb, cookie->whoTo, 0);
1085 	if (alt != cookie->whoTo) {
1086 		sctp_free_remote_addr(cookie->whoTo);
1087 		cookie->whoTo = alt;
1088 		atomic_add_int(&alt->ref_count, 1);
1089 	}
1090 	/* Now mark the retran info */
1091 	if (cookie->sent != SCTP_DATAGRAM_RESEND) {
1092 		sctp_ucount_incr(stcb->asoc.sent_queue_retran_cnt);
1093 	}
1094 	cookie->sent = SCTP_DATAGRAM_RESEND;
1095 	/*
1096 	 * Now call the output routine to kick out the cookie again, Note we
1097 	 * don't mark any chunks for retran so that FR will need to kick in
1098 	 * to move these (or a send timer).
1099 	 */
1100 	return (0);
1101 }
1102 
1103 int
1104 sctp_strreset_timer(struct sctp_inpcb *inp, struct sctp_tcb *stcb,
1105     struct sctp_nets *net)
1106 {
1107 	struct sctp_nets *alt;
1108 	struct sctp_tmit_chunk *strrst = NULL, *chk = NULL;
1109 
1110 	if (stcb->asoc.stream_reset_outstanding == 0) {
1111 		return (0);
1112 	}
1113 	/* find the existing STRRESET, we use the seq number we sent out on */
1114 	(void)sctp_find_stream_reset(stcb, stcb->asoc.str_reset_seq_out, &strrst);
1115 	if (strrst == NULL) {
1116 		return (0);
1117 	}
1118 	/* do threshold management */
1119 	if (sctp_threshold_management(inp, stcb, strrst->whoTo,
1120 	    stcb->asoc.max_send_times)) {
1121 		/* Assoc is over */
1122 		return (1);
1123 	}
1124 	/*
1125 	 * cleared theshold management now lets backoff the address & select
1126 	 * an alternate
1127 	 */
1128 	sctp_backoff_on_timeout(stcb, strrst->whoTo, 1, 0, 0);
1129 	alt = sctp_find_alternate_net(stcb, strrst->whoTo, 0);
1130 	sctp_free_remote_addr(strrst->whoTo);
1131 	strrst->whoTo = alt;
1132 	atomic_add_int(&alt->ref_count, 1);
1133 
1134 	/* See if a ECN Echo is also stranded */
1135 	TAILQ_FOREACH(chk, &stcb->asoc.control_send_queue, sctp_next) {
1136 		if ((chk->whoTo == net) &&
1137 		    (chk->rec.chunk_id.id == SCTP_ECN_ECHO)) {
1138 			sctp_free_remote_addr(chk->whoTo);
1139 			if (chk->sent != SCTP_DATAGRAM_RESEND) {
1140 				chk->sent = SCTP_DATAGRAM_RESEND;
1141 				sctp_ucount_incr(stcb->asoc.sent_queue_retran_cnt);
1142 			}
1143 			chk->whoTo = alt;
1144 			atomic_add_int(&alt->ref_count, 1);
1145 		}
1146 	}
1147 	if (!(net->dest_state & SCTP_ADDR_REACHABLE)) {
1148 		/*
1149 		 * If the address went un-reachable, we need to move to
1150 		 * alternates for ALL chk's in queue
1151 		 */
1152 		sctp_move_chunks_from_net(stcb, net);
1153 	}
1154 	/* mark the retran info */
1155 	if (strrst->sent != SCTP_DATAGRAM_RESEND)
1156 		sctp_ucount_incr(stcb->asoc.sent_queue_retran_cnt);
1157 	strrst->sent = SCTP_DATAGRAM_RESEND;
1158 
1159 	/* restart the timer */
1160 	sctp_timer_start(SCTP_TIMER_TYPE_STRRESET, inp, stcb, strrst->whoTo);
1161 	return (0);
1162 }
1163 
1164 int
1165 sctp_asconf_timer(struct sctp_inpcb *inp, struct sctp_tcb *stcb,
1166     struct sctp_nets *net)
1167 {
1168 	struct sctp_nets *alt;
1169 	struct sctp_tmit_chunk *asconf, *chk;
1170 
1171 	/* is this a first send, or a retransmission? */
1172 	if (TAILQ_EMPTY(&stcb->asoc.asconf_send_queue)) {
1173 		/* compose a new ASCONF chunk and send it */
1174 		sctp_send_asconf(stcb, net, SCTP_ADDR_NOT_LOCKED);
1175 	} else {
1176 		/*
1177 		 * Retransmission of the existing ASCONF is needed
1178 		 */
1179 
1180 		/* find the existing ASCONF */
1181 		asconf = TAILQ_FIRST(&stcb->asoc.asconf_send_queue);
1182 		if (asconf == NULL) {
1183 			return (0);
1184 		}
1185 		/* do threshold management */
1186 		if (sctp_threshold_management(inp, stcb, asconf->whoTo,
1187 		    stcb->asoc.max_send_times)) {
1188 			/* Assoc is over */
1189 			return (1);
1190 		}
1191 		if (asconf->snd_count > stcb->asoc.max_send_times) {
1192 			/*
1193 			 * Something is rotten: our peer is not responding
1194 			 * to ASCONFs but apparently is to other chunks.
1195 			 * i.e. it is not properly handling the chunk type
1196 			 * upper bits. Mark this peer as ASCONF incapable
1197 			 * and cleanup.
1198 			 */
1199 			SCTPDBG(SCTP_DEBUG_TIMER1, "asconf_timer: Peer has not responded to our repeated ASCONFs\n");
1200 			sctp_asconf_cleanup(stcb, net);
1201 			return (0);
1202 		}
1203 		/*
1204 		 * cleared threshold management, so now backoff the net and
1205 		 * select an alternate
1206 		 */
1207 		sctp_backoff_on_timeout(stcb, asconf->whoTo, 1, 0, 0);
1208 		alt = sctp_find_alternate_net(stcb, asconf->whoTo, 0);
1209 		if (asconf->whoTo != alt) {
1210 			sctp_free_remote_addr(asconf->whoTo);
1211 			asconf->whoTo = alt;
1212 			atomic_add_int(&alt->ref_count, 1);
1213 		}
1214 		/* See if an ECN Echo is also stranded */
1215 		TAILQ_FOREACH(chk, &stcb->asoc.control_send_queue, sctp_next) {
1216 			if ((chk->whoTo == net) &&
1217 			    (chk->rec.chunk_id.id == SCTP_ECN_ECHO)) {
1218 				sctp_free_remote_addr(chk->whoTo);
1219 				chk->whoTo = alt;
1220 				if (chk->sent != SCTP_DATAGRAM_RESEND) {
1221 					chk->sent = SCTP_DATAGRAM_RESEND;
1222 					sctp_ucount_incr(stcb->asoc.sent_queue_retran_cnt);
1223 				}
1224 				atomic_add_int(&alt->ref_count, 1);
1225 			}
1226 		}
1227 		TAILQ_FOREACH(chk, &stcb->asoc.asconf_send_queue, sctp_next) {
1228 			if (chk->whoTo != alt) {
1229 				sctp_free_remote_addr(chk->whoTo);
1230 				chk->whoTo = alt;
1231 				atomic_add_int(&alt->ref_count, 1);
1232 			}
1233 			if (asconf->sent != SCTP_DATAGRAM_RESEND && chk->sent != SCTP_DATAGRAM_UNSENT)
1234 				sctp_ucount_incr(stcb->asoc.sent_queue_retran_cnt);
1235 			chk->sent = SCTP_DATAGRAM_RESEND;
1236 		}
1237 		if (!(net->dest_state & SCTP_ADDR_REACHABLE)) {
1238 			/*
1239 			 * If the address went un-reachable, we need to move
1240 			 * to the alternate for ALL chunks in queue
1241 			 */
1242 			sctp_move_chunks_from_net(stcb, net);
1243 		}
1244 		/* mark the retran info */
1245 		if (asconf->sent != SCTP_DATAGRAM_RESEND)
1246 			sctp_ucount_incr(stcb->asoc.sent_queue_retran_cnt);
1247 		asconf->sent = SCTP_DATAGRAM_RESEND;
1248 
1249 		/* send another ASCONF if any and we can do */
1250 		sctp_send_asconf(stcb, alt, SCTP_ADDR_NOT_LOCKED);
1251 	}
1252 	return (0);
1253 }
1254 
1255 /* Mobility adaptation */
1256 void
1257 sctp_delete_prim_timer(struct sctp_inpcb *inp, struct sctp_tcb *stcb,
1258     struct sctp_nets *net SCTP_UNUSED)
1259 {
1260 	if (stcb->asoc.deleted_primary == NULL) {
1261 		SCTPDBG(SCTP_DEBUG_ASCONF1, "delete_prim_timer: deleted_primary is not stored...\n");
1262 		sctp_mobility_feature_off(inp, SCTP_MOBILITY_PRIM_DELETED);
1263 		return;
1264 	}
1265 	SCTPDBG(SCTP_DEBUG_ASCONF1, "delete_prim_timer: finished to keep deleted primary ");
1266 	SCTPDBG_ADDR(SCTP_DEBUG_ASCONF1, &stcb->asoc.deleted_primary->ro._l_addr.sa);
1267 	sctp_free_remote_addr(stcb->asoc.deleted_primary);
1268 	stcb->asoc.deleted_primary = NULL;
1269 	sctp_mobility_feature_off(inp, SCTP_MOBILITY_PRIM_DELETED);
1270 	return;
1271 }
1272 
1273 /*
1274  * For the shutdown and shutdown-ack, we do not keep one around on the
1275  * control queue. This means we must generate a new one and call the general
1276  * chunk output routine, AFTER having done threshold management.
1277  * It is assumed that net is non-NULL.
1278  */
1279 int
1280 sctp_shutdown_timer(struct sctp_inpcb *inp, struct sctp_tcb *stcb,
1281     struct sctp_nets *net)
1282 {
1283 	struct sctp_nets *alt;
1284 
1285 	/* first threshold managment */
1286 	if (sctp_threshold_management(inp, stcb, net, stcb->asoc.max_send_times)) {
1287 		/* Assoc is over */
1288 		return (1);
1289 	}
1290 	sctp_backoff_on_timeout(stcb, net, 1, 0, 0);
1291 	/* second select an alternative */
1292 	alt = sctp_find_alternate_net(stcb, net, 0);
1293 
1294 	/* third generate a shutdown into the queue for out net */
1295 	sctp_send_shutdown(stcb, alt);
1296 
1297 	/* fourth restart timer */
1298 	sctp_timer_start(SCTP_TIMER_TYPE_SHUTDOWN, inp, stcb, alt);
1299 	return (0);
1300 }
1301 
1302 int
1303 sctp_shutdownack_timer(struct sctp_inpcb *inp, struct sctp_tcb *stcb,
1304     struct sctp_nets *net)
1305 {
1306 	struct sctp_nets *alt;
1307 
1308 	/* first threshold managment */
1309 	if (sctp_threshold_management(inp, stcb, net, stcb->asoc.max_send_times)) {
1310 		/* Assoc is over */
1311 		return (1);
1312 	}
1313 	sctp_backoff_on_timeout(stcb, net, 1, 0, 0);
1314 	/* second select an alternative */
1315 	alt = sctp_find_alternate_net(stcb, net, 0);
1316 
1317 	/* third generate a shutdown into the queue for out net */
1318 	sctp_send_shutdown_ack(stcb, alt);
1319 
1320 	/* fourth restart timer */
1321 	sctp_timer_start(SCTP_TIMER_TYPE_SHUTDOWNACK, inp, stcb, alt);
1322 	return (0);
1323 }
1324 
1325 static void
1326 sctp_audit_stream_queues_for_size(struct sctp_inpcb *inp,
1327     struct sctp_tcb *stcb)
1328 {
1329 	struct sctp_stream_queue_pending *sp;
1330 	unsigned int i, chks_in_queue = 0;
1331 	int being_filled = 0;
1332 
1333 	/*
1334 	 * This function is ONLY called when the send/sent queues are empty.
1335 	 */
1336 	if ((stcb == NULL) || (inp == NULL))
1337 		return;
1338 
1339 	if (stcb->asoc.sent_queue_retran_cnt) {
1340 		SCTP_PRINTF("Hmm, sent_queue_retran_cnt is non-zero %d\n",
1341 		    stcb->asoc.sent_queue_retran_cnt);
1342 		stcb->asoc.sent_queue_retran_cnt = 0;
1343 	}
1344 	if (stcb->asoc.ss_functions.sctp_ss_is_empty(stcb, &stcb->asoc)) {
1345 		/* No stream scheduler information, initialize scheduler */
1346 		stcb->asoc.ss_functions.sctp_ss_init(stcb, &stcb->asoc, 0);
1347 		if (!stcb->asoc.ss_functions.sctp_ss_is_empty(stcb, &stcb->asoc)) {
1348 			/* yep, we lost a stream or two */
1349 			SCTP_PRINTF("Found additional streams NOT managed by scheduler, corrected\n");
1350 		} else {
1351 			/* no streams lost */
1352 			stcb->asoc.total_output_queue_size = 0;
1353 		}
1354 	}
1355 	/* Check to see if some data queued, if so report it */
1356 	for (i = 0; i < stcb->asoc.streamoutcnt; i++) {
1357 		if (!TAILQ_EMPTY(&stcb->asoc.strmout[i].outqueue)) {
1358 			TAILQ_FOREACH(sp, &stcb->asoc.strmout[i].outqueue, next) {
1359 				if (sp->msg_is_complete)
1360 					being_filled++;
1361 				chks_in_queue++;
1362 			}
1363 		}
1364 	}
1365 	if (chks_in_queue != stcb->asoc.stream_queue_cnt) {
1366 		SCTP_PRINTF("Hmm, stream queue cnt at %d I counted %d in stream out wheel\n",
1367 		    stcb->asoc.stream_queue_cnt, chks_in_queue);
1368 	}
1369 	if (chks_in_queue) {
1370 		/* call the output queue function */
1371 		sctp_chunk_output(inp, stcb, SCTP_OUTPUT_FROM_T3, SCTP_SO_NOT_LOCKED);
1372 		if ((TAILQ_EMPTY(&stcb->asoc.send_queue)) &&
1373 		    (TAILQ_EMPTY(&stcb->asoc.sent_queue))) {
1374 			/*
1375 			 * Probably should go in and make it go back through
1376 			 * and add fragments allowed
1377 			 */
1378 			if (being_filled == 0) {
1379 				SCTP_PRINTF("Still nothing moved %d chunks are stuck\n",
1380 				    chks_in_queue);
1381 			}
1382 		}
1383 	} else {
1384 		SCTP_PRINTF("Found no chunks on any queue tot:%lu\n",
1385 		    (u_long)stcb->asoc.total_output_queue_size);
1386 		stcb->asoc.total_output_queue_size = 0;
1387 	}
1388 }
1389 
1390 int
1391 sctp_heartbeat_timer(struct sctp_inpcb *inp, struct sctp_tcb *stcb,
1392     struct sctp_nets *net)
1393 {
1394 	uint8_t net_was_pf;
1395 
1396 	if (net->dest_state & SCTP_ADDR_PF) {
1397 		net_was_pf = 1;
1398 	} else {
1399 		net_was_pf = 0;
1400 	}
1401 	if (net->hb_responded == 0) {
1402 		if (net->ro._s_addr) {
1403 			/*
1404 			 * Invalidate the src address if we did not get a
1405 			 * response last time.
1406 			 */
1407 			sctp_free_ifa(net->ro._s_addr);
1408 			net->ro._s_addr = NULL;
1409 			net->src_addr_selected = 0;
1410 		}
1411 		sctp_backoff_on_timeout(stcb, net, 1, 0, 0);
1412 		if (sctp_threshold_management(inp, stcb, net, stcb->asoc.max_send_times)) {
1413 			/* Assoc is over */
1414 			return (1);
1415 		}
1416 	}
1417 	/* Zero PBA, if it needs it */
1418 	if (net->partial_bytes_acked) {
1419 		net->partial_bytes_acked = 0;
1420 	}
1421 	if ((stcb->asoc.total_output_queue_size > 0) &&
1422 	    (TAILQ_EMPTY(&stcb->asoc.send_queue)) &&
1423 	    (TAILQ_EMPTY(&stcb->asoc.sent_queue))) {
1424 		sctp_audit_stream_queues_for_size(inp, stcb);
1425 	}
1426 	if (!(net->dest_state & SCTP_ADDR_NOHB) &&
1427 	    !((net_was_pf == 0) && (net->dest_state & SCTP_ADDR_PF))) {
1428 		/*
1429 		 * when move to PF during threshold mangement, a HB has been
1430 		 * queued in that routine
1431 		 */
1432 		uint32_t ms_gone_by;
1433 
1434 		if ((net->last_sent_time.tv_sec > 0) ||
1435 		    (net->last_sent_time.tv_usec > 0)) {
1436 			struct timeval diff;
1437 
1438 			SCTP_GETTIME_TIMEVAL(&diff);
1439 			timevalsub(&diff, &net->last_sent_time);
1440 			ms_gone_by = (uint32_t) (diff.tv_sec * 1000) +
1441 			    (uint32_t) (diff.tv_usec / 1000);
1442 		} else {
1443 			ms_gone_by = 0xffffffff;
1444 		}
1445 		if ((ms_gone_by >= net->heart_beat_delay) ||
1446 		    (net->dest_state & SCTP_ADDR_PF)) {
1447 			sctp_send_hb(stcb, net, SCTP_SO_NOT_LOCKED);
1448 		}
1449 	}
1450 	return (0);
1451 }
1452 
1453 void
1454 sctp_pathmtu_timer(struct sctp_inpcb *inp,
1455     struct sctp_tcb *stcb,
1456     struct sctp_nets *net)
1457 {
1458 	uint32_t next_mtu, mtu;
1459 
1460 	next_mtu = sctp_get_next_mtu(net->mtu);
1461 
1462 	if ((next_mtu > net->mtu) && (net->port == 0)) {
1463 		if ((net->src_addr_selected == 0) ||
1464 		    (net->ro._s_addr == NULL) ||
1465 		    (net->ro._s_addr->localifa_flags & SCTP_BEING_DELETED)) {
1466 			if ((net->ro._s_addr != NULL) && (net->ro._s_addr->localifa_flags & SCTP_BEING_DELETED)) {
1467 				sctp_free_ifa(net->ro._s_addr);
1468 				net->ro._s_addr = NULL;
1469 				net->src_addr_selected = 0;
1470 			} else if (net->ro._s_addr == NULL) {
1471 #if defined(INET6) && defined(SCTP_EMBEDDED_V6_SCOPE)
1472 				if (net->ro._l_addr.sa.sa_family == AF_INET6) {
1473 					struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)&net->ro._l_addr;
1474 
1475 					/* KAME hack: embed scopeid */
1476 					(void)sa6_embedscope(sin6, MODULE_GLOBAL(ip6_use_defzone));
1477 				}
1478 #endif
1479 
1480 				net->ro._s_addr = sctp_source_address_selection(inp,
1481 				    stcb,
1482 				    (sctp_route_t *) & net->ro,
1483 				    net, 0, stcb->asoc.vrf_id);
1484 #if defined(INET6) && defined(SCTP_EMBEDDED_V6_SCOPE)
1485 				if (net->ro._l_addr.sa.sa_family == AF_INET6) {
1486 					struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)&net->ro._l_addr;
1487 
1488 					(void)sa6_recoverscope(sin6);
1489 				}
1490 #endif				/* INET6 */
1491 			}
1492 			if (net->ro._s_addr)
1493 				net->src_addr_selected = 1;
1494 		}
1495 		if (net->ro._s_addr) {
1496 			mtu = SCTP_GATHER_MTU_FROM_ROUTE(net->ro._s_addr, &net->ro._s_addr.sa, net->ro.ro_rt);
1497 #if defined(INET) || defined(INET6)
1498 			if (net->port) {
1499 				mtu -= sizeof(struct udphdr);
1500 			}
1501 #endif
1502 			if (mtu > next_mtu) {
1503 				net->mtu = next_mtu;
1504 			} else {
1505 				net->mtu = mtu;
1506 			}
1507 		}
1508 	}
1509 	/* restart the timer */
1510 	sctp_timer_start(SCTP_TIMER_TYPE_PATHMTURAISE, inp, stcb, net);
1511 }
1512 
1513 void
1514 sctp_autoclose_timer(struct sctp_inpcb *inp,
1515     struct sctp_tcb *stcb,
1516     struct sctp_nets *net)
1517 {
1518 	struct timeval tn, *tim_touse;
1519 	struct sctp_association *asoc;
1520 	int ticks_gone_by;
1521 
1522 	(void)SCTP_GETTIME_TIMEVAL(&tn);
1523 	if (stcb->asoc.sctp_autoclose_ticks &&
1524 	    sctp_is_feature_on(inp, SCTP_PCB_FLAGS_AUTOCLOSE)) {
1525 		/* Auto close is on */
1526 		asoc = &stcb->asoc;
1527 		/* pick the time to use */
1528 		if (asoc->time_last_rcvd.tv_sec >
1529 		    asoc->time_last_sent.tv_sec) {
1530 			tim_touse = &asoc->time_last_rcvd;
1531 		} else {
1532 			tim_touse = &asoc->time_last_sent;
1533 		}
1534 		/* Now has long enough transpired to autoclose? */
1535 		ticks_gone_by = SEC_TO_TICKS(tn.tv_sec - tim_touse->tv_sec);
1536 		if ((ticks_gone_by > 0) &&
1537 		    (ticks_gone_by >= (int)asoc->sctp_autoclose_ticks)) {
1538 			/*
1539 			 * autoclose time has hit, call the output routine,
1540 			 * which should do nothing just to be SURE we don't
1541 			 * have hanging data. We can then safely check the
1542 			 * queues and know that we are clear to send
1543 			 * shutdown
1544 			 */
1545 			sctp_chunk_output(inp, stcb, SCTP_OUTPUT_FROM_AUTOCLOSE_TMR, SCTP_SO_NOT_LOCKED);
1546 			/* Are we clean? */
1547 			if (TAILQ_EMPTY(&asoc->send_queue) &&
1548 			    TAILQ_EMPTY(&asoc->sent_queue)) {
1549 				/*
1550 				 * there is nothing queued to send, so I'm
1551 				 * done...
1552 				 */
1553 				if (SCTP_GET_STATE(asoc) != SCTP_STATE_SHUTDOWN_SENT) {
1554 					/* only send SHUTDOWN 1st time thru */
1555 					struct sctp_nets *netp;
1556 
1557 					if ((SCTP_GET_STATE(asoc) == SCTP_STATE_OPEN) ||
1558 					    (SCTP_GET_STATE(asoc) == SCTP_STATE_SHUTDOWN_RECEIVED)) {
1559 						SCTP_STAT_DECR_GAUGE32(sctps_currestab);
1560 					}
1561 					SCTP_SET_STATE(asoc, SCTP_STATE_SHUTDOWN_SENT);
1562 					SCTP_CLEAR_SUBSTATE(asoc, SCTP_STATE_SHUTDOWN_PENDING);
1563 					sctp_stop_timers_for_shutdown(stcb);
1564 					if (stcb->asoc.alternate) {
1565 						netp = stcb->asoc.alternate;
1566 					} else {
1567 						netp = stcb->asoc.primary_destination;
1568 					}
1569 					sctp_send_shutdown(stcb, netp);
1570 					sctp_timer_start(SCTP_TIMER_TYPE_SHUTDOWN,
1571 					    stcb->sctp_ep, stcb,
1572 					    netp);
1573 					sctp_timer_start(SCTP_TIMER_TYPE_SHUTDOWNGUARD,
1574 					    stcb->sctp_ep, stcb,
1575 					    netp);
1576 				}
1577 			}
1578 		} else {
1579 			/*
1580 			 * No auto close at this time, reset t-o to check
1581 			 * later
1582 			 */
1583 			int tmp;
1584 
1585 			/* fool the timer startup to use the time left */
1586 			tmp = asoc->sctp_autoclose_ticks;
1587 			asoc->sctp_autoclose_ticks -= ticks_gone_by;
1588 			sctp_timer_start(SCTP_TIMER_TYPE_AUTOCLOSE, inp, stcb,
1589 			    net);
1590 			/* restore the real tick value */
1591 			asoc->sctp_autoclose_ticks = tmp;
1592 		}
1593 	}
1594 }
1595