xref: /freebsd/sys/dev/cxgbe/tom/t4_tls.c (revision 6829dae12bb055451fa467da4589c43bd03b1e64)
1 /*-
2  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
3  *
4  * Copyright (c) 2017-2018 Chelsio Communications, Inc.
5  * All rights reserved.
6  * Written by: John Baldwin <jhb@FreeBSD.org>
7  *
8  * Redistribution and use in source and binary forms, with or without
9  * modification, are permitted provided that the following conditions
10  * are met:
11  * 1. Redistributions of source code must retain the above copyright
12  *    notice, this list of conditions and the following disclaimer.
13  * 2. Redistributions in binary form must reproduce the above copyright
14  *    notice, this list of conditions and the following disclaimer in the
15  *    documentation and/or other materials provided with the distribution.
16  *
17  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
18  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
21  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27  * SUCH DAMAGE.
28  */
29 
30 #include "opt_inet.h"
31 
32 #include <sys/cdefs.h>
33 __FBSDID("$FreeBSD$");
34 
35 #include <sys/param.h>
36 #include <sys/sglist.h>
37 #include <sys/socket.h>
38 #include <sys/socketvar.h>
39 #include <sys/systm.h>
40 #include <netinet/in.h>
41 #include <netinet/in_pcb.h>
42 #include <netinet/tcp_var.h>
43 #include <netinet/toecore.h>
44 
45 #ifdef TCP_OFFLOAD
46 #include "common/common.h"
47 #include "common/t4_tcb.h"
48 #include "crypto/t4_crypto.h"
49 #include "tom/t4_tom_l2t.h"
50 #include "tom/t4_tom.h"
51 
52 /*
53  * The TCP sequence number of a CPL_TLS_DATA mbuf is saved here while
54  * the mbuf is in the ulp_pdu_reclaimq.
55  */
56 #define	tls_tcp_seq	PH_loc.thirtytwo[0]
57 
58 /*
59  * Handshake lock used for the handshake timer.  Having a global lock
60  * is perhaps not ideal, but it avoids having to use callout_drain()
61  * in tls_uninit_toep() which can't block.  Also, the timer shouldn't
62  * actually fire for most connections.
63  */
64 static struct mtx tls_handshake_lock;
65 
66 static void
67 t4_set_tls_tcb_field(struct toepcb *toep, uint16_t word, uint64_t mask,
68     uint64_t val)
69 {
70 	struct adapter *sc = td_adapter(toep->td);
71 
72 	t4_set_tcb_field(sc, toep->ofld_txq, toep, word, mask, val, 0, 0);
73 }
74 
75 /* TLS and DTLS common routines */
76 bool
77 can_tls_offload(struct adapter *sc)
78 {
79 
80 	return (sc->tt.tls && sc->cryptocaps & FW_CAPS_CONFIG_TLSKEYS);
81 }
82 
83 int
84 tls_tx_key(struct toepcb *toep)
85 {
86 	struct tls_ofld_info *tls_ofld = &toep->tls;
87 
88 	return (tls_ofld->tx_key_addr >= 0);
89 }
90 
91 int
92 tls_rx_key(struct toepcb *toep)
93 {
94 	struct tls_ofld_info *tls_ofld = &toep->tls;
95 
96 	return (tls_ofld->rx_key_addr >= 0);
97 }
98 
99 static int
100 key_size(struct toepcb *toep)
101 {
102 	struct tls_ofld_info *tls_ofld = &toep->tls;
103 
104 	return ((tls_ofld->key_location == TLS_SFO_WR_CONTEXTLOC_IMMEDIATE) ?
105 		tls_ofld->k_ctx.tx_key_info_size : KEY_IN_DDR_SIZE);
106 }
107 
108 /* Set TLS Key-Id in TCB */
109 static void
110 t4_set_tls_keyid(struct toepcb *toep, unsigned int key_id)
111 {
112 
113 	t4_set_tls_tcb_field(toep, W_TCB_RX_TLS_KEY_TAG,
114 			 V_TCB_RX_TLS_KEY_TAG(M_TCB_RX_TLS_BUF_TAG),
115 			 V_TCB_RX_TLS_KEY_TAG(key_id));
116 }
117 
118 /* Clear TF_RX_QUIESCE to re-enable receive. */
119 static void
120 t4_clear_rx_quiesce(struct toepcb *toep)
121 {
122 
123 	t4_set_tls_tcb_field(toep, W_TCB_T_FLAGS, V_TF_RX_QUIESCE(1), 0);
124 }
125 
126 static void
127 tls_clr_ofld_mode(struct toepcb *toep)
128 {
129 
130 	tls_stop_handshake_timer(toep);
131 
132 	/* Operate in PDU extraction mode only. */
133 	t4_set_tls_tcb_field(toep, W_TCB_ULP_RAW,
134 	    V_TCB_ULP_RAW(M_TCB_ULP_RAW),
135 	    V_TCB_ULP_RAW(V_TF_TLS_ENABLE(1)));
136 	t4_clear_rx_quiesce(toep);
137 }
138 
139 static void
140 tls_clr_quiesce(struct toepcb *toep)
141 {
142 
143 	tls_stop_handshake_timer(toep);
144 	t4_clear_rx_quiesce(toep);
145 }
146 
147 /*
148  * Calculate the TLS data expansion size
149  */
150 static int
151 tls_expansion_size(struct toepcb *toep, int data_len, int full_pdus_only,
152     unsigned short *pdus_per_ulp)
153 {
154 	struct tls_ofld_info *tls_ofld = &toep->tls;
155 	struct tls_scmd *scmd = &tls_ofld->scmd0;
156 	int expn_size = 0, frag_count = 0, pad_per_pdu = 0,
157 	    pad_last_pdu = 0, last_frag_size = 0, max_frag_size = 0;
158 	int exp_per_pdu = 0;
159 	int hdr_len = TLS_HEADER_LENGTH;
160 
161 	do {
162 		max_frag_size = tls_ofld->k_ctx.frag_size;
163 		if (G_SCMD_CIPH_MODE(scmd->seqno_numivs) ==
164 		   SCMD_CIPH_MODE_AES_GCM) {
165 			frag_count = (data_len / max_frag_size);
166 			exp_per_pdu = GCM_TAG_SIZE + AEAD_EXPLICIT_DATA_SIZE +
167 				hdr_len;
168 			expn_size =  frag_count * exp_per_pdu;
169 			if (full_pdus_only) {
170 				*pdus_per_ulp = data_len / (exp_per_pdu +
171 					max_frag_size);
172 				if (*pdus_per_ulp > 32)
173 					*pdus_per_ulp = 32;
174 				else if(!*pdus_per_ulp)
175 					*pdus_per_ulp = 1;
176 				expn_size = (*pdus_per_ulp) * exp_per_pdu;
177 				break;
178 			}
179 			if ((last_frag_size = data_len % max_frag_size) > 0) {
180 				frag_count += 1;
181 				expn_size += exp_per_pdu;
182 			}
183 			break;
184 		} else if (G_SCMD_CIPH_MODE(scmd->seqno_numivs) !=
185 			   SCMD_CIPH_MODE_NOP) {
186 			/* Calculate the number of fragments we can make */
187 			frag_count  = (data_len / max_frag_size);
188 			if (frag_count > 0) {
189 				pad_per_pdu = (((howmany((max_frag_size +
190 						       tls_ofld->mac_length),
191 						      CIPHER_BLOCK_SIZE)) *
192 						CIPHER_BLOCK_SIZE) -
193 					       (max_frag_size +
194 						tls_ofld->mac_length));
195 				if (!pad_per_pdu)
196 					pad_per_pdu = CIPHER_BLOCK_SIZE;
197 				exp_per_pdu = pad_per_pdu +
198 				       	tls_ofld->mac_length +
199 					hdr_len + CIPHER_BLOCK_SIZE;
200 				expn_size = frag_count * exp_per_pdu;
201 			}
202 			if (full_pdus_only) {
203 				*pdus_per_ulp = data_len / (exp_per_pdu +
204 					max_frag_size);
205 				if (*pdus_per_ulp > 32)
206 					*pdus_per_ulp = 32;
207 				else if (!*pdus_per_ulp)
208 					*pdus_per_ulp = 1;
209 				expn_size = (*pdus_per_ulp) * exp_per_pdu;
210 				break;
211 			}
212 			/* Consider the last fragment */
213 			if ((last_frag_size = data_len % max_frag_size) > 0) {
214 				pad_last_pdu = (((howmany((last_frag_size +
215 							tls_ofld->mac_length),
216 						       CIPHER_BLOCK_SIZE)) *
217 						 CIPHER_BLOCK_SIZE) -
218 						(last_frag_size +
219 						 tls_ofld->mac_length));
220 				if (!pad_last_pdu)
221 					pad_last_pdu = CIPHER_BLOCK_SIZE;
222 				expn_size += (pad_last_pdu +
223 					      tls_ofld->mac_length + hdr_len +
224 					      CIPHER_BLOCK_SIZE);
225 			}
226 		}
227 	} while (0);
228 
229 	return (expn_size);
230 }
231 
232 /* Copy Key to WR */
233 static void
234 tls_copy_tx_key(struct toepcb *toep, void *dst)
235 {
236 	struct tls_ofld_info *tls_ofld = &toep->tls;
237 	struct ulptx_sc_memrd *sc_memrd;
238 	struct ulptx_idata *sc;
239 
240 	if (tls_ofld->k_ctx.tx_key_info_size <= 0)
241 		return;
242 
243 	if (tls_ofld->key_location == TLS_SFO_WR_CONTEXTLOC_DDR) {
244 		sc = dst;
245 		sc->cmd_more = htobe32(V_ULPTX_CMD(ULP_TX_SC_NOOP));
246 		sc->len = htobe32(0);
247 		sc_memrd = (struct ulptx_sc_memrd *)(sc + 1);
248 		sc_memrd->cmd_to_len = htobe32(V_ULPTX_CMD(ULP_TX_SC_MEMRD) |
249 		    V_ULP_TX_SC_MORE(1) |
250 		    V_ULPTX_LEN16(tls_ofld->k_ctx.tx_key_info_size >> 4));
251 		sc_memrd->addr = htobe32(tls_ofld->tx_key_addr >> 5);
252 	} else if (tls_ofld->key_location == TLS_SFO_WR_CONTEXTLOC_IMMEDIATE) {
253 		memcpy(dst, &tls_ofld->k_ctx.tx,
254 		    tls_ofld->k_ctx.tx_key_info_size);
255 	}
256 }
257 
258 /* TLS/DTLS content type  for CPL SFO */
259 static inline unsigned char
260 tls_content_type(unsigned char content_type)
261 {
262 	/*
263 	 * XXX: Shouldn't this map CONTENT_TYPE_APP_DATA to DATA and
264 	 * default to "CUSTOM" for all other types including
265 	 * heartbeat?
266 	 */
267 	switch (content_type) {
268 	case CONTENT_TYPE_CCS:
269 		return CPL_TX_TLS_SFO_TYPE_CCS;
270 	case CONTENT_TYPE_ALERT:
271 		return CPL_TX_TLS_SFO_TYPE_ALERT;
272 	case CONTENT_TYPE_HANDSHAKE:
273 		return CPL_TX_TLS_SFO_TYPE_HANDSHAKE;
274 	case CONTENT_TYPE_HEARTBEAT:
275 		return CPL_TX_TLS_SFO_TYPE_HEARTBEAT;
276 	}
277 	return CPL_TX_TLS_SFO_TYPE_DATA;
278 }
279 
280 static unsigned char
281 get_cipher_key_size(unsigned int ck_size)
282 {
283 	switch (ck_size) {
284 	case AES_NOP: /* NOP */
285 		return 15;
286 	case AES_128: /* AES128 */
287 		return CH_CK_SIZE_128;
288 	case AES_192: /* AES192 */
289 		return CH_CK_SIZE_192;
290 	case AES_256: /* AES256 */
291 		return CH_CK_SIZE_256;
292 	default:
293 		return CH_CK_SIZE_256;
294 	}
295 }
296 
297 static unsigned char
298 get_mac_key_size(unsigned int mk_size)
299 {
300 	switch (mk_size) {
301 	case SHA_NOP: /* NOP */
302 		return CH_MK_SIZE_128;
303 	case SHA_GHASH: /* GHASH */
304 	case SHA_512: /* SHA512 */
305 		return CH_MK_SIZE_512;
306 	case SHA_224: /* SHA2-224 */
307 		return CH_MK_SIZE_192;
308 	case SHA_256: /* SHA2-256*/
309 		return CH_MK_SIZE_256;
310 	case SHA_384: /* SHA384 */
311 		return CH_MK_SIZE_512;
312 	case SHA1: /* SHA1 */
313 	default:
314 		return CH_MK_SIZE_160;
315 	}
316 }
317 
318 static unsigned int
319 get_proto_ver(int proto_ver)
320 {
321 	switch (proto_ver) {
322 	case TLS1_2_VERSION:
323 		return TLS_1_2_VERSION;
324 	case TLS1_1_VERSION:
325 		return TLS_1_1_VERSION;
326 	case DTLS1_2_VERSION:
327 		return DTLS_1_2_VERSION;
328 	default:
329 		return TLS_VERSION_MAX;
330 	}
331 }
332 
333 static void
334 tls_rxkey_flit1(struct tls_keyctx *kwr, struct tls_key_context *kctx)
335 {
336 
337 	if (kctx->state.enc_mode == CH_EVP_CIPH_GCM_MODE) {
338 		kwr->u.rxhdr.ivinsert_to_authinsrt =
339 		    htobe64(V_TLS_KEYCTX_TX_WR_IVINSERT(6ULL) |
340 			V_TLS_KEYCTX_TX_WR_AADSTRTOFST(1ULL) |
341 			V_TLS_KEYCTX_TX_WR_AADSTOPOFST(5ULL) |
342 			V_TLS_KEYCTX_TX_WR_AUTHSRTOFST(14ULL) |
343 			V_TLS_KEYCTX_TX_WR_AUTHSTOPOFST(16ULL) |
344 			V_TLS_KEYCTX_TX_WR_CIPHERSRTOFST(14ULL) |
345 			V_TLS_KEYCTX_TX_WR_CIPHERSTOPOFST(0ULL) |
346 			V_TLS_KEYCTX_TX_WR_AUTHINSRT(16ULL));
347 		kwr->u.rxhdr.ivpresent_to_rxmk_size &=
348 			~(V_TLS_KEYCTX_TX_WR_RXOPAD_PRESENT(1));
349 		kwr->u.rxhdr.authmode_to_rxvalid &=
350 			~(V_TLS_KEYCTX_TX_WR_CIPHAUTHSEQCTRL(1));
351 	} else {
352 		kwr->u.rxhdr.ivinsert_to_authinsrt =
353 		    htobe64(V_TLS_KEYCTX_TX_WR_IVINSERT(6ULL) |
354 			V_TLS_KEYCTX_TX_WR_AADSTRTOFST(1ULL) |
355 			V_TLS_KEYCTX_TX_WR_AADSTOPOFST(5ULL) |
356 			V_TLS_KEYCTX_TX_WR_AUTHSRTOFST(22ULL) |
357 			V_TLS_KEYCTX_TX_WR_AUTHSTOPOFST(0ULL) |
358 			V_TLS_KEYCTX_TX_WR_CIPHERSRTOFST(22ULL) |
359 			V_TLS_KEYCTX_TX_WR_CIPHERSTOPOFST(0ULL) |
360 			V_TLS_KEYCTX_TX_WR_AUTHINSRT(0ULL));
361 	}
362 }
363 
364 /* Rx key */
365 static void
366 prepare_rxkey_wr(struct tls_keyctx *kwr, struct tls_key_context *kctx)
367 {
368 	unsigned int ck_size = kctx->cipher_secret_size;
369 	unsigned int mk_size = kctx->mac_secret_size;
370 	int proto_ver = kctx->proto_ver;
371 
372 	kwr->u.rxhdr.flitcnt_hmacctrl =
373 		((kctx->tx_key_info_size >> 4) << 3) | kctx->hmac_ctrl;
374 
375 	kwr->u.rxhdr.protover_ciphmode =
376 		V_TLS_KEYCTX_TX_WR_PROTOVER(get_proto_ver(proto_ver)) |
377 		V_TLS_KEYCTX_TX_WR_CIPHMODE(kctx->state.enc_mode);
378 
379 	kwr->u.rxhdr.authmode_to_rxvalid =
380 		V_TLS_KEYCTX_TX_WR_AUTHMODE(kctx->state.auth_mode) |
381 		V_TLS_KEYCTX_TX_WR_CIPHAUTHSEQCTRL(1) |
382 		V_TLS_KEYCTX_TX_WR_SEQNUMCTRL(3) |
383 		V_TLS_KEYCTX_TX_WR_RXVALID(1);
384 
385 	kwr->u.rxhdr.ivpresent_to_rxmk_size =
386 		V_TLS_KEYCTX_TX_WR_IVPRESENT(0) |
387 		V_TLS_KEYCTX_TX_WR_RXOPAD_PRESENT(1) |
388 		V_TLS_KEYCTX_TX_WR_RXCK_SIZE(get_cipher_key_size(ck_size)) |
389 		V_TLS_KEYCTX_TX_WR_RXMK_SIZE(get_mac_key_size(mk_size));
390 
391 	tls_rxkey_flit1(kwr, kctx);
392 
393 	/* No key reversal for GCM */
394 	if (kctx->state.enc_mode != CH_EVP_CIPH_GCM_MODE) {
395 		t4_aes_getdeckey(kwr->keys.edkey, kctx->rx.key,
396 				 (kctx->cipher_secret_size << 3));
397 		memcpy(kwr->keys.edkey + kctx->cipher_secret_size,
398 		       kctx->rx.key + kctx->cipher_secret_size,
399 		       (IPAD_SIZE + OPAD_SIZE));
400 	} else {
401 		memcpy(kwr->keys.edkey, kctx->rx.key,
402 		       (kctx->tx_key_info_size - SALT_SIZE));
403 		memcpy(kwr->u.rxhdr.rxsalt, kctx->rx.salt, SALT_SIZE);
404 	}
405 }
406 
407 /* Tx key */
408 static void
409 prepare_txkey_wr(struct tls_keyctx *kwr, struct tls_key_context *kctx)
410 {
411 	unsigned int ck_size = kctx->cipher_secret_size;
412 	unsigned int mk_size = kctx->mac_secret_size;
413 
414 	kwr->u.txhdr.ctxlen =
415 		(kctx->tx_key_info_size >> 4);
416 	kwr->u.txhdr.dualck_to_txvalid =
417 		V_TLS_KEYCTX_TX_WR_TXOPAD_PRESENT(1) |
418 		V_TLS_KEYCTX_TX_WR_SALT_PRESENT(1) |
419 		V_TLS_KEYCTX_TX_WR_TXCK_SIZE(get_cipher_key_size(ck_size)) |
420 		V_TLS_KEYCTX_TX_WR_TXMK_SIZE(get_mac_key_size(mk_size)) |
421 		V_TLS_KEYCTX_TX_WR_TXVALID(1);
422 
423 	memcpy(kwr->keys.edkey, kctx->tx.key, HDR_KCTX_SIZE);
424 	if (kctx->state.enc_mode == CH_EVP_CIPH_GCM_MODE) {
425 		memcpy(kwr->u.txhdr.txsalt, kctx->tx.salt, SALT_SIZE);
426 		kwr->u.txhdr.dualck_to_txvalid &=
427 			~(V_TLS_KEYCTX_TX_WR_TXOPAD_PRESENT(1));
428 	}
429 	kwr->u.txhdr.dualck_to_txvalid = htons(kwr->u.txhdr.dualck_to_txvalid);
430 }
431 
432 /* TLS Key memory management */
433 static int
434 get_new_keyid(struct toepcb *toep, struct tls_key_context *k_ctx)
435 {
436 	struct adapter *sc = td_adapter(toep->td);
437 	vmem_addr_t addr;
438 
439 	if (vmem_alloc(sc->key_map, TLS_KEY_CONTEXT_SZ, M_NOWAIT | M_FIRSTFIT,
440 	    &addr) != 0)
441 		return (-1);
442 
443 	return (addr);
444 }
445 
446 static void
447 free_keyid(struct toepcb *toep, int keyid)
448 {
449 	struct adapter *sc = td_adapter(toep->td);
450 
451 	vmem_free(sc->key_map, keyid, TLS_KEY_CONTEXT_SZ);
452 }
453 
454 static void
455 clear_tls_keyid(struct toepcb *toep)
456 {
457 	struct tls_ofld_info *tls_ofld = &toep->tls;
458 
459 	if (tls_ofld->rx_key_addr >= 0) {
460 		free_keyid(toep, tls_ofld->rx_key_addr);
461 		tls_ofld->rx_key_addr = -1;
462 	}
463 	if (tls_ofld->tx_key_addr >= 0) {
464 		free_keyid(toep, tls_ofld->tx_key_addr);
465 		tls_ofld->tx_key_addr = -1;
466 	}
467 }
468 
469 static int
470 get_keyid(struct tls_ofld_info *tls_ofld, unsigned int ops)
471 {
472 	return (ops & KEY_WRITE_RX ? tls_ofld->rx_key_addr :
473 		((ops & KEY_WRITE_TX) ? tls_ofld->tx_key_addr : -1));
474 }
475 
476 static int
477 get_tp_plen_max(struct tls_ofld_info *tls_ofld)
478 {
479 	int plen = ((min(3*4096, TP_TX_PG_SZ))/1448) * 1448;
480 
481 	return (tls_ofld->k_ctx.frag_size <= 8192 ? plen : FC_TP_PLEN_MAX);
482 }
483 
484 /* Send request to get the key-id */
485 static int
486 tls_program_key_id(struct toepcb *toep, struct tls_key_context *k_ctx)
487 {
488 	struct tls_ofld_info *tls_ofld = &toep->tls;
489 	struct adapter *sc = td_adapter(toep->td);
490 	struct ofld_tx_sdesc *txsd;
491 	int kwrlen, kctxlen, keyid, len;
492 	struct wrqe *wr;
493 	struct tls_key_req *kwr;
494 	struct tls_keyctx *kctx;
495 
496 	kwrlen = sizeof(*kwr);
497 	kctxlen = roundup2(sizeof(*kctx), 32);
498 	len = roundup2(kwrlen + kctxlen, 16);
499 
500 	if (toep->txsd_avail == 0)
501 		return (EAGAIN);
502 
503 	/* Dont initialize key for re-neg */
504 	if (!G_KEY_CLR_LOC(k_ctx->l_p_key)) {
505 		if ((keyid = get_new_keyid(toep, k_ctx)) < 0) {
506 			return (ENOSPC);
507 		}
508 	} else {
509 		keyid = get_keyid(tls_ofld, k_ctx->l_p_key);
510 	}
511 
512 	wr = alloc_wrqe(len, toep->ofld_txq);
513 	if (wr == NULL) {
514 		free_keyid(toep, keyid);
515 		return (ENOMEM);
516 	}
517 	kwr = wrtod(wr);
518 	memset(kwr, 0, kwrlen);
519 
520 	kwr->wr_hi = htobe32(V_FW_WR_OP(FW_ULPTX_WR) | F_FW_WR_COMPL |
521 	    F_FW_WR_ATOMIC);
522 	kwr->wr_mid = htobe32(V_FW_WR_LEN16(DIV_ROUND_UP(len, 16)) |
523 	    V_FW_WR_FLOWID(toep->tid));
524 	kwr->protocol = get_proto_ver(k_ctx->proto_ver);
525 	kwr->mfs = htons(k_ctx->frag_size);
526 	kwr->reneg_to_write_rx = k_ctx->l_p_key;
527 
528 	/* master command */
529 	kwr->cmd = htobe32(V_ULPTX_CMD(ULP_TX_MEM_WRITE) |
530 	    V_T5_ULP_MEMIO_ORDER(1) | V_T5_ULP_MEMIO_IMM(1));
531 	kwr->dlen = htobe32(V_ULP_MEMIO_DATA_LEN(kctxlen >> 5));
532 	kwr->len16 = htobe32((toep->tid << 8) |
533 	    DIV_ROUND_UP(len - sizeof(struct work_request_hdr), 16));
534 	kwr->kaddr = htobe32(V_ULP_MEMIO_ADDR(keyid >> 5));
535 
536 	/* sub command */
537 	kwr->sc_more = htobe32(V_ULPTX_CMD(ULP_TX_SC_IMM));
538 	kwr->sc_len = htobe32(kctxlen);
539 
540 	kctx = (struct tls_keyctx *)(kwr + 1);
541 	memset(kctx, 0, kctxlen);
542 
543 	if (G_KEY_GET_LOC(k_ctx->l_p_key) == KEY_WRITE_TX) {
544 		tls_ofld->tx_key_addr = keyid;
545 		prepare_txkey_wr(kctx, k_ctx);
546 	} else if (G_KEY_GET_LOC(k_ctx->l_p_key) == KEY_WRITE_RX) {
547 		tls_ofld->rx_key_addr = keyid;
548 		prepare_rxkey_wr(kctx, k_ctx);
549 	}
550 
551 	txsd = &toep->txsd[toep->txsd_pidx];
552 	txsd->tx_credits = DIV_ROUND_UP(len, 16);
553 	txsd->plen = 0;
554 	toep->tx_credits -= txsd->tx_credits;
555 	if (__predict_false(++toep->txsd_pidx == toep->txsd_total))
556 		toep->txsd_pidx = 0;
557 	toep->txsd_avail--;
558 
559 	t4_wrq_tx(sc, wr);
560 
561 	return (0);
562 }
563 
564 /* Store a key received from SSL in DDR. */
565 static int
566 program_key_context(struct tcpcb *tp, struct toepcb *toep,
567     struct tls_key_context *uk_ctx)
568 {
569 	struct adapter *sc = td_adapter(toep->td);
570 	struct tls_ofld_info *tls_ofld = &toep->tls;
571 	struct tls_key_context *k_ctx;
572 	int error, key_offset;
573 
574 	if (tp->t_state != TCPS_ESTABLISHED) {
575 		/*
576 		 * XXX: Matches Linux driver, but not sure this is a
577 		 * very appropriate error.
578 		 */
579 		return (ENOENT);
580 	}
581 
582 	/* Stop timer on handshake completion */
583 	tls_stop_handshake_timer(toep);
584 
585 	toep->flags &= ~TPF_FORCE_CREDITS;
586 
587 	CTR4(KTR_CXGBE, "%s: tid %d %s proto_ver %#x", __func__, toep->tid,
588 	    G_KEY_GET_LOC(uk_ctx->l_p_key) == KEY_WRITE_RX ? "KEY_WRITE_RX" :
589 	    "KEY_WRITE_TX", uk_ctx->proto_ver);
590 
591 	if (G_KEY_GET_LOC(uk_ctx->l_p_key) == KEY_WRITE_RX &&
592 	    toep->ulp_mode != ULP_MODE_TLS)
593 		return (EOPNOTSUPP);
594 
595 	/* Don't copy the 'tx' and 'rx' fields. */
596 	k_ctx = &tls_ofld->k_ctx;
597 	memcpy(&k_ctx->l_p_key, &uk_ctx->l_p_key,
598 	    sizeof(*k_ctx) - offsetof(struct tls_key_context, l_p_key));
599 
600 	/* TLS version != 1.1 and !1.2 OR DTLS != 1.2 */
601 	if (get_proto_ver(k_ctx->proto_ver) > DTLS_1_2_VERSION) {
602 		if (G_KEY_GET_LOC(k_ctx->l_p_key) == KEY_WRITE_RX) {
603 			tls_ofld->rx_key_addr = -1;
604 			t4_clear_rx_quiesce(toep);
605 		} else {
606 			tls_ofld->tx_key_addr = -1;
607 		}
608 		return (0);
609 	}
610 
611 	if (k_ctx->state.enc_mode == CH_EVP_CIPH_GCM_MODE) {
612 		k_ctx->iv_size = 4;
613 		k_ctx->mac_first = 0;
614 		k_ctx->hmac_ctrl = 0;
615 	} else {
616 		k_ctx->iv_size = 8; /* for CBC, iv is 16B, unit of 2B */
617 		k_ctx->mac_first = 1;
618 	}
619 
620 	tls_ofld->scmd0.seqno_numivs =
621 		(V_SCMD_SEQ_NO_CTRL(3) |
622 		 V_SCMD_PROTO_VERSION(get_proto_ver(k_ctx->proto_ver)) |
623 		 V_SCMD_ENC_DEC_CTRL(SCMD_ENCDECCTRL_ENCRYPT) |
624 		 V_SCMD_CIPH_AUTH_SEQ_CTRL((k_ctx->mac_first == 0)) |
625 		 V_SCMD_CIPH_MODE(k_ctx->state.enc_mode) |
626 		 V_SCMD_AUTH_MODE(k_ctx->state.auth_mode) |
627 		 V_SCMD_HMAC_CTRL(k_ctx->hmac_ctrl) |
628 		 V_SCMD_IV_SIZE(k_ctx->iv_size));
629 
630 	tls_ofld->scmd0.ivgen_hdrlen =
631 		(V_SCMD_IV_GEN_CTRL(k_ctx->iv_ctrl) |
632 		 V_SCMD_KEY_CTX_INLINE(0) |
633 		 V_SCMD_TLS_FRAG_ENABLE(1));
634 
635 	tls_ofld->mac_length = k_ctx->mac_secret_size;
636 
637 	if (G_KEY_GET_LOC(k_ctx->l_p_key) == KEY_WRITE_RX) {
638 		k_ctx->rx = uk_ctx->rx;
639 		/* Dont initialize key for re-neg */
640 		if (!G_KEY_CLR_LOC(k_ctx->l_p_key))
641 			tls_ofld->rx_key_addr = -1;
642 	} else {
643 		k_ctx->tx = uk_ctx->tx;
644 		/* Dont initialize key for re-neg */
645 		if (!G_KEY_CLR_LOC(k_ctx->l_p_key))
646 			tls_ofld->tx_key_addr = -1;
647 	}
648 
649 	/* Flush pending data before new Tx key becomes active */
650 	if (G_KEY_GET_LOC(k_ctx->l_p_key) == KEY_WRITE_TX) {
651 		struct sockbuf *sb;
652 
653 		/* XXX: This might not drain everything. */
654 		t4_push_frames(sc, toep, 0);
655 		sb = &toep->inp->inp_socket->so_snd;
656 		SOCKBUF_LOCK(sb);
657 
658 		/* XXX: This asserts that everything has been pushed. */
659 		MPASS(sb->sb_sndptr == NULL || sb->sb_sndptr->m_next == NULL);
660 		sb->sb_sndptr = NULL;
661 		tls_ofld->sb_off = sbavail(sb);
662 		SOCKBUF_UNLOCK(sb);
663 		tls_ofld->tx_seq_no = 0;
664 	}
665 
666 	if ((G_KEY_GET_LOC(k_ctx->l_p_key) == KEY_WRITE_RX) ||
667 	    (tls_ofld->key_location == TLS_SFO_WR_CONTEXTLOC_DDR)) {
668 		error = tls_program_key_id(toep, k_ctx);
669 		if (error) {
670 			/* XXX: Only clear quiesce for KEY_WRITE_RX? */
671 			t4_clear_rx_quiesce(toep);
672 			return (error);
673 		}
674 	}
675 
676 	if (G_KEY_GET_LOC(k_ctx->l_p_key) == KEY_WRITE_RX) {
677 		/*
678 		 * RX key tags are an index into the key portion of MA
679 		 * memory stored as an offset from the base address in
680 		 * units of 64 bytes.
681 		 */
682 		key_offset = tls_ofld->rx_key_addr - sc->vres.key.start;
683 		t4_set_tls_keyid(toep, key_offset / 64);
684 		t4_set_tls_tcb_field(toep, W_TCB_ULP_RAW,
685 				 V_TCB_ULP_RAW(M_TCB_ULP_RAW),
686 				 V_TCB_ULP_RAW((V_TF_TLS_KEY_SIZE(3) |
687 						V_TF_TLS_CONTROL(1) |
688 						V_TF_TLS_ACTIVE(1) |
689 						V_TF_TLS_ENABLE(1))));
690 		t4_set_tls_tcb_field(toep, W_TCB_TLS_SEQ,
691 				 V_TCB_TLS_SEQ(M_TCB_TLS_SEQ),
692 				 V_TCB_TLS_SEQ(0));
693 		t4_clear_rx_quiesce(toep);
694 	} else {
695 		unsigned short pdus_per_ulp;
696 
697 		if (tls_ofld->key_location == TLS_SFO_WR_CONTEXTLOC_IMMEDIATE)
698 			tls_ofld->tx_key_addr = 1;
699 
700 		tls_ofld->fcplenmax = get_tp_plen_max(tls_ofld);
701 		tls_ofld->expn_per_ulp = tls_expansion_size(toep,
702 				tls_ofld->fcplenmax, 1, &pdus_per_ulp);
703 		tls_ofld->pdus_per_ulp = pdus_per_ulp;
704 		tls_ofld->adjusted_plen = tls_ofld->pdus_per_ulp *
705 			((tls_ofld->expn_per_ulp/tls_ofld->pdus_per_ulp) +
706 			 tls_ofld->k_ctx.frag_size);
707 	}
708 
709 	return (0);
710 }
711 
712 /*
713  * In some cases a client connection can hang without sending the
714  * ServerHelloDone message from the NIC to the host.  Send a dummy
715  * RX_DATA_ACK with RX_MODULATE to unstick the connection.
716  */
717 static void
718 tls_send_handshake_ack(void *arg)
719 {
720 	struct toepcb *toep = arg;
721 	struct tls_ofld_info *tls_ofld = &toep->tls;
722 	struct adapter *sc = td_adapter(toep->td);
723 
724 	/*
725 	 * XXX: Does not have the t4_get_tcb() checks to refine the
726 	 * workaround.
727 	 */
728 	callout_schedule(&tls_ofld->handshake_timer, TLS_SRV_HELLO_RD_TM * hz);
729 
730 	CTR2(KTR_CXGBE, "%s: tid %d sending RX_DATA_ACK", __func__, toep->tid);
731 	send_rx_modulate(sc, toep);
732 }
733 
734 static void
735 tls_start_handshake_timer(struct toepcb *toep)
736 {
737 	struct tls_ofld_info *tls_ofld = &toep->tls;
738 
739 	mtx_lock(&tls_handshake_lock);
740 	callout_reset(&tls_ofld->handshake_timer, TLS_SRV_HELLO_BKOFF_TM * hz,
741 	    tls_send_handshake_ack, toep);
742 	mtx_unlock(&tls_handshake_lock);
743 }
744 
745 void
746 tls_stop_handshake_timer(struct toepcb *toep)
747 {
748 	struct tls_ofld_info *tls_ofld = &toep->tls;
749 
750 	mtx_lock(&tls_handshake_lock);
751 	callout_stop(&tls_ofld->handshake_timer);
752 	mtx_unlock(&tls_handshake_lock);
753 }
754 
755 int
756 t4_ctloutput_tls(struct socket *so, struct sockopt *sopt)
757 {
758 	struct tls_key_context uk_ctx;
759 	struct inpcb *inp;
760 	struct tcpcb *tp;
761 	struct toepcb *toep;
762 	int error, optval;
763 
764 	error = 0;
765 	if (sopt->sopt_dir == SOPT_SET &&
766 	    sopt->sopt_name == TCP_TLSOM_SET_TLS_CONTEXT) {
767 		error = sooptcopyin(sopt, &uk_ctx, sizeof(uk_ctx),
768 		    sizeof(uk_ctx));
769 		if (error)
770 			return (error);
771 	}
772 
773 	inp = sotoinpcb(so);
774 	KASSERT(inp != NULL, ("tcp_ctloutput: inp == NULL"));
775 	INP_WLOCK(inp);
776 	if (inp->inp_flags & (INP_TIMEWAIT | INP_DROPPED)) {
777 		INP_WUNLOCK(inp);
778 		return (ECONNRESET);
779 	}
780 	tp = intotcpcb(inp);
781 	toep = tp->t_toe;
782 	switch (sopt->sopt_dir) {
783 	case SOPT_SET:
784 		switch (sopt->sopt_name) {
785 		case TCP_TLSOM_SET_TLS_CONTEXT:
786 			error = program_key_context(tp, toep, &uk_ctx);
787 			INP_WUNLOCK(inp);
788 			break;
789 		case TCP_TLSOM_CLR_TLS_TOM:
790 			if (toep->ulp_mode == ULP_MODE_TLS) {
791 				CTR2(KTR_CXGBE, "%s: tid %d CLR_TLS_TOM",
792 				    __func__, toep->tid);
793 				tls_clr_ofld_mode(toep);
794 			} else
795 				error = EOPNOTSUPP;
796 			INP_WUNLOCK(inp);
797 			break;
798 		case TCP_TLSOM_CLR_QUIES:
799 			if (toep->ulp_mode == ULP_MODE_TLS) {
800 				CTR2(KTR_CXGBE, "%s: tid %d CLR_QUIES",
801 				    __func__, toep->tid);
802 				tls_clr_quiesce(toep);
803 			} else
804 				error = EOPNOTSUPP;
805 			INP_WUNLOCK(inp);
806 			break;
807 		default:
808 			INP_WUNLOCK(inp);
809 			error = EOPNOTSUPP;
810 			break;
811 		}
812 		break;
813 	case SOPT_GET:
814 		switch (sopt->sopt_name) {
815 		case TCP_TLSOM_GET_TLS_TOM:
816 			/*
817 			 * TLS TX is permitted on any TOE socket, but
818 			 * TLS RX requires a TLS ULP mode.
819 			 */
820 			optval = TLS_TOM_NONE;
821 			if (can_tls_offload(td_adapter(toep->td))) {
822 				switch (toep->ulp_mode) {
823 				case ULP_MODE_NONE:
824 				case ULP_MODE_TCPDDP:
825 					optval = TLS_TOM_TXONLY;
826 					break;
827 				case ULP_MODE_TLS:
828 					optval = TLS_TOM_BOTH;
829 					break;
830 				}
831 			}
832 			CTR3(KTR_CXGBE, "%s: tid %d GET_TLS_TOM = %d",
833 			    __func__, toep->tid, optval);
834 			INP_WUNLOCK(inp);
835 			error = sooptcopyout(sopt, &optval, sizeof(optval));
836 			break;
837 		default:
838 			INP_WUNLOCK(inp);
839 			error = EOPNOTSUPP;
840 			break;
841 		}
842 		break;
843 	}
844 	return (error);
845 }
846 
847 void
848 tls_init_toep(struct toepcb *toep)
849 {
850 	struct tls_ofld_info *tls_ofld = &toep->tls;
851 
852 	tls_ofld->key_location = TLS_SFO_WR_CONTEXTLOC_DDR;
853 	tls_ofld->rx_key_addr = -1;
854 	tls_ofld->tx_key_addr = -1;
855 	if (toep->ulp_mode == ULP_MODE_TLS)
856 		callout_init_mtx(&tls_ofld->handshake_timer,
857 		    &tls_handshake_lock, 0);
858 }
859 
860 void
861 tls_establish(struct toepcb *toep)
862 {
863 
864 	/*
865 	 * Enable PDU extraction.
866 	 *
867 	 * XXX: Supposedly this should be done by the firmware when
868 	 * the ULP_MODE FLOWC parameter is set in send_flowc_wr(), but
869 	 * in practice this seems to be required.
870 	 */
871 	CTR2(KTR_CXGBE, "%s: tid %d setting TLS_ENABLE", __func__, toep->tid);
872 	t4_set_tls_tcb_field(toep, W_TCB_ULP_RAW, V_TCB_ULP_RAW(M_TCB_ULP_RAW),
873 	    V_TCB_ULP_RAW(V_TF_TLS_ENABLE(1)));
874 
875 	toep->flags |= TPF_FORCE_CREDITS;
876 
877 	tls_start_handshake_timer(toep);
878 }
879 
880 void
881 tls_uninit_toep(struct toepcb *toep)
882 {
883 
884 	if (toep->ulp_mode == ULP_MODE_TLS)
885 		tls_stop_handshake_timer(toep);
886 	clear_tls_keyid(toep);
887 }
888 
889 #define MAX_OFLD_TX_CREDITS (SGE_MAX_WR_LEN / 16)
890 #define	MIN_OFLD_TLSTX_CREDITS(toep)					\
891 	(howmany(sizeof(struct fw_tlstx_data_wr) +			\
892 	    sizeof(struct cpl_tx_tls_sfo) + key_size((toep)) +		\
893 	    CIPHER_BLOCK_SIZE + 1, 16))
894 
895 static inline u_int
896 max_imm_tls_space(int tx_credits)
897 {
898 	const int n = 2;	/* Use only up to 2 desc for imm. data WR */
899 	int space;
900 
901 	KASSERT(tx_credits >= 0 &&
902 		tx_credits <= MAX_OFLD_TX_CREDITS,
903 		("%s: %d credits", __func__, tx_credits));
904 
905 	if (tx_credits >= (n * EQ_ESIZE) / 16)
906 		space = (n * EQ_ESIZE);
907 	else
908 		space = tx_credits * 16;
909 	return (space);
910 }
911 
912 static int
913 count_mbuf_segs(struct mbuf *m, int skip, int len, int *max_nsegs_1mbufp)
914 {
915 	int max_nsegs_1mbuf, n, nsegs;
916 
917 	while (skip >= m->m_len) {
918 		skip -= m->m_len;
919 		m = m->m_next;
920 	}
921 
922 	nsegs = 0;
923 	max_nsegs_1mbuf = 0;
924 	while (len > 0) {
925 		n = sglist_count(mtod(m, char *) + skip, m->m_len - skip);
926 		if (n > max_nsegs_1mbuf)
927 			max_nsegs_1mbuf = n;
928 		nsegs += n;
929 		len -= m->m_len - skip;
930 		skip = 0;
931 		m = m->m_next;
932 	}
933 	*max_nsegs_1mbufp = max_nsegs_1mbuf;
934 	return (nsegs);
935 }
936 
937 static void
938 write_tlstx_wr(struct fw_tlstx_data_wr *txwr, struct toepcb *toep,
939     unsigned int immdlen, unsigned int plen, unsigned int expn,
940     unsigned int pdus, uint8_t credits, int shove, int imm_ivs)
941 {
942 	struct tls_ofld_info *tls_ofld = &toep->tls;
943 	unsigned int len = plen + expn;
944 
945 	txwr->op_to_immdlen = htobe32(V_WR_OP(FW_TLSTX_DATA_WR) |
946 	    V_FW_TLSTX_DATA_WR_COMPL(1) |
947 	    V_FW_TLSTX_DATA_WR_IMMDLEN(immdlen));
948 	txwr->flowid_len16 = htobe32(V_FW_TLSTX_DATA_WR_FLOWID(toep->tid) |
949 	    V_FW_TLSTX_DATA_WR_LEN16(credits));
950 	txwr->plen = htobe32(len);
951 	txwr->lsodisable_to_flags = htobe32(V_TX_ULP_MODE(ULP_MODE_TLS) |
952 	    V_TX_URG(0) | /* F_T6_TX_FORCE | */ V_TX_SHOVE(shove));
953 	txwr->ctxloc_to_exp = htobe32(V_FW_TLSTX_DATA_WR_NUMIVS(pdus) |
954 	    V_FW_TLSTX_DATA_WR_EXP(expn) |
955 	    V_FW_TLSTX_DATA_WR_CTXLOC(tls_ofld->key_location) |
956 	    V_FW_TLSTX_DATA_WR_IVDSGL(!imm_ivs) |
957 	    V_FW_TLSTX_DATA_WR_KEYSIZE(tls_ofld->k_ctx.tx_key_info_size >> 4));
958 	txwr->mfs = htobe16(tls_ofld->k_ctx.frag_size);
959 	txwr->adjustedplen_pkd = htobe16(
960 	    V_FW_TLSTX_DATA_WR_ADJUSTEDPLEN(tls_ofld->adjusted_plen));
961 	txwr->expinplenmax_pkd = htobe16(
962 	    V_FW_TLSTX_DATA_WR_EXPINPLENMAX(tls_ofld->expn_per_ulp));
963 	txwr->pdusinplenmax_pkd = htobe16(
964 	    V_FW_TLSTX_DATA_WR_PDUSINPLENMAX(tls_ofld->pdus_per_ulp));
965 }
966 
967 static void
968 write_tlstx_cpl(struct cpl_tx_tls_sfo *cpl, struct toepcb *toep,
969     struct tls_hdr *tls_hdr, unsigned int plen, unsigned int pdus)
970 {
971 	struct tls_ofld_info *tls_ofld = &toep->tls;
972 	int data_type, seglen;
973 
974 	if (plen < tls_ofld->k_ctx.frag_size)
975 		seglen = plen;
976 	else
977 		seglen = tls_ofld->k_ctx.frag_size;
978 	data_type = tls_content_type(tls_hdr->type);
979 	cpl->op_to_seg_len = htobe32(V_CPL_TX_TLS_SFO_OPCODE(CPL_TX_TLS_SFO) |
980 	    V_CPL_TX_TLS_SFO_DATA_TYPE(data_type) |
981 	    V_CPL_TX_TLS_SFO_CPL_LEN(2) | V_CPL_TX_TLS_SFO_SEG_LEN(seglen));
982 	cpl->pld_len = htobe32(plen);
983 	if (data_type == CPL_TX_TLS_SFO_TYPE_HEARTBEAT)
984 		cpl->type_protover = htobe32(
985 		    V_CPL_TX_TLS_SFO_TYPE(tls_hdr->type));
986 	cpl->seqno_numivs = htobe32(tls_ofld->scmd0.seqno_numivs |
987 	    V_SCMD_NUM_IVS(pdus));
988 	cpl->ivgen_hdrlen = htobe32(tls_ofld->scmd0.ivgen_hdrlen);
989 	cpl->scmd1 = htobe64(tls_ofld->tx_seq_no);
990 	tls_ofld->tx_seq_no += pdus;
991 }
992 
993 /*
994  * Similar to write_tx_sgl() except that it accepts an optional
995  * trailer buffer for IVs.
996  */
997 static void
998 write_tlstx_sgl(void *dst, struct mbuf *start, int skip, int plen,
999     void *iv_buffer, int iv_len, int nsegs, int n)
1000 {
1001 	struct mbuf *m;
1002 	struct ulptx_sgl *usgl = dst;
1003 	int i, j, rc;
1004 	struct sglist sg;
1005 	struct sglist_seg segs[n];
1006 
1007 	KASSERT(nsegs > 0, ("%s: nsegs 0", __func__));
1008 
1009 	sglist_init(&sg, n, segs);
1010 	usgl->cmd_nsge = htobe32(V_ULPTX_CMD(ULP_TX_SC_DSGL) |
1011 	    V_ULPTX_NSGE(nsegs));
1012 
1013 	for (m = start; skip >= m->m_len; m = m->m_next)
1014 		skip -= m->m_len;
1015 
1016 	i = -1;
1017 	for (m = start; plen > 0; m = m->m_next) {
1018 		rc = sglist_append(&sg, mtod(m, char *) + skip,
1019 		    m->m_len - skip);
1020 		if (__predict_false(rc != 0))
1021 			panic("%s: sglist_append %d", __func__, rc);
1022 		plen -= m->m_len - skip;
1023 		skip = 0;
1024 
1025 		for (j = 0; j < sg.sg_nseg; i++, j++) {
1026 			if (i < 0) {
1027 				usgl->len0 = htobe32(segs[j].ss_len);
1028 				usgl->addr0 = htobe64(segs[j].ss_paddr);
1029 			} else {
1030 				usgl->sge[i / 2].len[i & 1] =
1031 				    htobe32(segs[j].ss_len);
1032 				usgl->sge[i / 2].addr[i & 1] =
1033 				    htobe64(segs[j].ss_paddr);
1034 			}
1035 #ifdef INVARIANTS
1036 			nsegs--;
1037 #endif
1038 		}
1039 		sglist_reset(&sg);
1040 	}
1041 	if (iv_buffer != NULL) {
1042 		rc = sglist_append(&sg, iv_buffer, iv_len);
1043 		if (__predict_false(rc != 0))
1044 			panic("%s: sglist_append %d", __func__, rc);
1045 
1046 		for (j = 0; j < sg.sg_nseg; i++, j++) {
1047 			if (i < 0) {
1048 				usgl->len0 = htobe32(segs[j].ss_len);
1049 				usgl->addr0 = htobe64(segs[j].ss_paddr);
1050 			} else {
1051 				usgl->sge[i / 2].len[i & 1] =
1052 				    htobe32(segs[j].ss_len);
1053 				usgl->sge[i / 2].addr[i & 1] =
1054 				    htobe64(segs[j].ss_paddr);
1055 			}
1056 #ifdef INVARIANTS
1057 			nsegs--;
1058 #endif
1059 		}
1060 	}
1061 	if (i & 1)
1062 		usgl->sge[i / 2].len[1] = htobe32(0);
1063 	KASSERT(nsegs == 0, ("%s: nsegs %d, start %p, iv_buffer %p",
1064 	    __func__, nsegs, start, iv_buffer));
1065 }
1066 
1067 /*
1068  * Similar to t4_push_frames() but handles TLS sockets when TLS offload
1069  * is enabled.  Rather than transmitting bulk data, the socket buffer
1070  * contains TLS records.  The work request requires a full TLS record,
1071  * so batch mbufs up until a full TLS record is seen.  This requires
1072  * reading the TLS header out of the start of each record to determine
1073  * its length.
1074  */
1075 void
1076 t4_push_tls_records(struct adapter *sc, struct toepcb *toep, int drop)
1077 {
1078 	struct tls_hdr thdr;
1079 	struct mbuf *sndptr;
1080 	struct fw_tlstx_data_wr *txwr;
1081 	struct cpl_tx_tls_sfo *cpl;
1082 	struct wrqe *wr;
1083 	u_int plen, nsegs, credits, space, max_nsegs_1mbuf, wr_len;
1084 	u_int expn_size, iv_len, pdus, sndptroff;
1085 	struct tls_ofld_info *tls_ofld = &toep->tls;
1086 	struct inpcb *inp = toep->inp;
1087 	struct tcpcb *tp = intotcpcb(inp);
1088 	struct socket *so = inp->inp_socket;
1089 	struct sockbuf *sb = &so->so_snd;
1090 	int tls_size, tx_credits, shove, /* compl,*/ sowwakeup;
1091 	struct ofld_tx_sdesc *txsd;
1092 	bool imm_ivs, imm_payload;
1093 	void *iv_buffer, *iv_dst, *buf;
1094 
1095 	INP_WLOCK_ASSERT(inp);
1096 	KASSERT(toep->flags & TPF_FLOWC_WR_SENT,
1097 	    ("%s: flowc_wr not sent for tid %u.", __func__, toep->tid));
1098 
1099 	KASSERT(toep->ulp_mode == ULP_MODE_NONE ||
1100 	    toep->ulp_mode == ULP_MODE_TCPDDP || toep->ulp_mode == ULP_MODE_TLS,
1101 	    ("%s: ulp_mode %u for toep %p", __func__, toep->ulp_mode, toep));
1102 	KASSERT(tls_tx_key(toep),
1103 	    ("%s: TX key not set for toep %p", __func__, toep));
1104 
1105 #ifdef VERBOSE_TRACES
1106 	CTR4(KTR_CXGBE, "%s: tid %d toep flags %#x tp flags %#x drop %d",
1107 	    __func__, toep->tid, toep->flags, tp->t_flags);
1108 #endif
1109 	if (__predict_false(toep->flags & TPF_ABORT_SHUTDOWN))
1110 		return;
1111 
1112 #ifdef RATELIMIT
1113 	if (__predict_false(inp->inp_flags2 & INP_RATE_LIMIT_CHANGED) &&
1114 	    (update_tx_rate_limit(sc, toep, so->so_max_pacing_rate) == 0)) {
1115 		inp->inp_flags2 &= ~INP_RATE_LIMIT_CHANGED;
1116 	}
1117 #endif
1118 
1119 	/*
1120 	 * This function doesn't resume by itself.  Someone else must clear the
1121 	 * flag and call this function.
1122 	 */
1123 	if (__predict_false(toep->flags & TPF_TX_SUSPENDED)) {
1124 		KASSERT(drop == 0,
1125 		    ("%s: drop (%d) != 0 but tx is suspended", __func__, drop));
1126 		return;
1127 	}
1128 
1129 	txsd = &toep->txsd[toep->txsd_pidx];
1130 	for (;;) {
1131 		tx_credits = min(toep->tx_credits, MAX_OFLD_TX_CREDITS);
1132 		space = max_imm_tls_space(tx_credits);
1133 		wr_len = sizeof(struct fw_tlstx_data_wr) +
1134 		    sizeof(struct cpl_tx_tls_sfo) + key_size(toep);
1135 		if (wr_len + CIPHER_BLOCK_SIZE + 1 > space) {
1136 #ifdef VERBOSE_TRACES
1137 			CTR5(KTR_CXGBE,
1138 			    "%s: tid %d tx_credits %d min_wr %d space %d",
1139 			    __func__, toep->tid, tx_credits, wr_len +
1140 			    CIPHER_BLOCK_SIZE + 1, space);
1141 #endif
1142 			return;
1143 		}
1144 
1145 		SOCKBUF_LOCK(sb);
1146 		sowwakeup = drop;
1147 		if (drop) {
1148 			sbdrop_locked(sb, drop);
1149 			MPASS(tls_ofld->sb_off >= drop);
1150 			tls_ofld->sb_off -= drop;
1151 			drop = 0;
1152 		}
1153 
1154 		/*
1155 		 * Send a FIN if requested, but only if there's no
1156 		 * more data to send.
1157 		 */
1158 		if (sbavail(sb) == tls_ofld->sb_off &&
1159 		    toep->flags & TPF_SEND_FIN) {
1160 			if (sowwakeup)
1161 				sowwakeup_locked(so);
1162 			else
1163 				SOCKBUF_UNLOCK(sb);
1164 			SOCKBUF_UNLOCK_ASSERT(sb);
1165 			t4_close_conn(sc, toep);
1166 			return;
1167 		}
1168 
1169 		if (sbavail(sb) < tls_ofld->sb_off + TLS_HEADER_LENGTH) {
1170 			/*
1171 			 * A full TLS header is not yet queued, stop
1172 			 * for now until more data is added to the
1173 			 * socket buffer.  However, if the connection
1174 			 * has been closed, we will never get the rest
1175 			 * of the header so just discard the partial
1176 			 * header and close the connection.
1177 			 */
1178 #ifdef VERBOSE_TRACES
1179 			CTR5(KTR_CXGBE, "%s: tid %d sbavail %d sb_off %d%s",
1180 			    __func__, toep->tid, sbavail(sb), tls_ofld->sb_off,
1181 			    toep->flags & TPF_SEND_FIN ? "" : " SEND_FIN");
1182 #endif
1183 			if (sowwakeup)
1184 				sowwakeup_locked(so);
1185 			else
1186 				SOCKBUF_UNLOCK(sb);
1187 			SOCKBUF_UNLOCK_ASSERT(sb);
1188 			if (toep->flags & TPF_SEND_FIN)
1189 				t4_close_conn(sc, toep);
1190 			return;
1191 		}
1192 
1193 		/* Read the header of the next TLS record. */
1194 		sndptr = sbsndmbuf(sb, tls_ofld->sb_off, &sndptroff);
1195 		MPASS(!IS_AIOTX_MBUF(sndptr));
1196 		m_copydata(sndptr, sndptroff, sizeof(thdr), (caddr_t)&thdr);
1197 		tls_size = htons(thdr.length);
1198 		plen = TLS_HEADER_LENGTH + tls_size;
1199 		pdus = howmany(tls_size, tls_ofld->k_ctx.frag_size);
1200 		iv_len = pdus * CIPHER_BLOCK_SIZE;
1201 
1202 		if (sbavail(sb) < tls_ofld->sb_off + plen) {
1203 			/*
1204 			 * The full TLS record is not yet queued, stop
1205 			 * for now until more data is added to the
1206 			 * socket buffer.  However, if the connection
1207 			 * has been closed, we will never get the rest
1208 			 * of the record so just discard the partial
1209 			 * record and close the connection.
1210 			 */
1211 #ifdef VERBOSE_TRACES
1212 			CTR6(KTR_CXGBE,
1213 			    "%s: tid %d sbavail %d sb_off %d plen %d%s",
1214 			    __func__, toep->tid, sbavail(sb), tls_ofld->sb_off,
1215 			    plen, toep->flags & TPF_SEND_FIN ? "" :
1216 			    " SEND_FIN");
1217 #endif
1218 			if (sowwakeup)
1219 				sowwakeup_locked(so);
1220 			else
1221 				SOCKBUF_UNLOCK(sb);
1222 			SOCKBUF_UNLOCK_ASSERT(sb);
1223 			if (toep->flags & TPF_SEND_FIN)
1224 				t4_close_conn(sc, toep);
1225 			return;
1226 		}
1227 
1228 		/* Shove if there is no additional data pending. */
1229 		shove = (sbavail(sb) == tls_ofld->sb_off + plen) &&
1230 		    !(tp->t_flags & TF_MORETOCOME);
1231 
1232 		if (sb->sb_flags & SB_AUTOSIZE &&
1233 		    V_tcp_do_autosndbuf &&
1234 		    sb->sb_hiwat < V_tcp_autosndbuf_max &&
1235 		    sbused(sb) >= sb->sb_hiwat * 7 / 8) {
1236 			int newsize = min(sb->sb_hiwat + V_tcp_autosndbuf_inc,
1237 			    V_tcp_autosndbuf_max);
1238 
1239 			if (!sbreserve_locked(sb, newsize, so, NULL))
1240 				sb->sb_flags &= ~SB_AUTOSIZE;
1241 			else
1242 				sowwakeup = 1;	/* room available */
1243 		}
1244 		if (sowwakeup)
1245 			sowwakeup_locked(so);
1246 		else
1247 			SOCKBUF_UNLOCK(sb);
1248 		SOCKBUF_UNLOCK_ASSERT(sb);
1249 
1250 		if (__predict_false(toep->flags & TPF_FIN_SENT))
1251 			panic("%s: excess tx.", __func__);
1252 
1253 		/* Determine whether to use immediate vs SGL. */
1254 		imm_payload = false;
1255 		imm_ivs = false;
1256 		if (wr_len + iv_len <= space) {
1257 			imm_ivs = true;
1258 			wr_len += iv_len;
1259 			if (wr_len + tls_size <= space) {
1260 				wr_len += tls_size;
1261 				imm_payload = true;
1262 			}
1263 		}
1264 
1265 		/* Allocate space for IVs if needed. */
1266 		if (!imm_ivs) {
1267 			iv_buffer = malloc(iv_len, M_CXGBE, M_NOWAIT);
1268 			if (iv_buffer == NULL) {
1269 				/*
1270 				 * XXX: How to restart this?
1271 				 */
1272 				if (sowwakeup)
1273 					sowwakeup_locked(so);
1274 				else
1275 					SOCKBUF_UNLOCK(sb);
1276 				SOCKBUF_UNLOCK_ASSERT(sb);
1277 				CTR3(KTR_CXGBE,
1278 			    "%s: tid %d failed to alloc IV space len %d",
1279 				    __func__, toep->tid, iv_len);
1280 				return;
1281 			}
1282 		} else
1283 			iv_buffer = NULL;
1284 
1285 		/* Determine size of SGL. */
1286 		nsegs = 0;
1287 		max_nsegs_1mbuf = 0; /* max # of SGL segments in any one mbuf */
1288 		if (!imm_payload) {
1289 			nsegs = count_mbuf_segs(sndptr, sndptroff +
1290 			    TLS_HEADER_LENGTH, tls_size, &max_nsegs_1mbuf);
1291 			if (!imm_ivs) {
1292 				int n = sglist_count(iv_buffer, iv_len);
1293 				nsegs += n;
1294 				if (n > max_nsegs_1mbuf)
1295 					max_nsegs_1mbuf = n;
1296 			}
1297 
1298 			/* Account for SGL in work request length. */
1299 			wr_len += sizeof(struct ulptx_sgl) +
1300 			    ((3 * (nsegs - 1)) / 2 + ((nsegs - 1) & 1)) * 8;
1301 		}
1302 
1303 		wr = alloc_wrqe(roundup2(wr_len, 16), toep->ofld_txq);
1304 		if (wr == NULL) {
1305 			/* XXX: how will we recover from this? */
1306 			toep->flags |= TPF_TX_SUSPENDED;
1307 			return;
1308 		}
1309 
1310 #ifdef VERBOSE_TRACES
1311 		CTR5(KTR_CXGBE, "%s: tid %d TLS record %d len %#x pdus %d",
1312 		    __func__, toep->tid, thdr.type, tls_size, pdus);
1313 #endif
1314 		txwr = wrtod(wr);
1315 		cpl = (struct cpl_tx_tls_sfo *)(txwr + 1);
1316 		memset(txwr, 0, roundup2(wr_len, 16));
1317 		credits = howmany(wr_len, 16);
1318 		expn_size = tls_expansion_size(toep, tls_size, 0, NULL);
1319 		write_tlstx_wr(txwr, toep, imm_payload ? tls_size : 0,
1320 		    tls_size, expn_size, pdus, credits, shove, imm_ivs ? 1 : 0);
1321 		write_tlstx_cpl(cpl, toep, &thdr, tls_size, pdus);
1322 		tls_copy_tx_key(toep, cpl + 1);
1323 
1324 		/* Generate random IVs */
1325 		buf = (char *)(cpl + 1) + key_size(toep);
1326 		if (imm_ivs) {
1327 			MPASS(iv_buffer == NULL);
1328 			iv_dst = buf;
1329 			buf = (char *)iv_dst + iv_len;
1330 		} else
1331 			iv_dst = iv_buffer;
1332 		arc4rand(iv_dst, iv_len, 0);
1333 
1334 		if (imm_payload) {
1335 			m_copydata(sndptr, sndptroff + TLS_HEADER_LENGTH,
1336 			    tls_size, buf);
1337 		} else {
1338 			write_tlstx_sgl(buf, sndptr,
1339 			    sndptroff + TLS_HEADER_LENGTH, tls_size, iv_buffer,
1340 			    iv_len, nsegs, max_nsegs_1mbuf);
1341 		}
1342 
1343 		KASSERT(toep->tx_credits >= credits,
1344 			("%s: not enough credits", __func__));
1345 
1346 		toep->tx_credits -= credits;
1347 
1348 		tp->snd_nxt += plen;
1349 		tp->snd_max += plen;
1350 
1351 		SOCKBUF_LOCK(sb);
1352 		sbsndptr_adv(sb, sb->sb_sndptr, plen);
1353 		tls_ofld->sb_off += plen;
1354 		SOCKBUF_UNLOCK(sb);
1355 
1356 		toep->flags |= TPF_TX_DATA_SENT;
1357 		if (toep->tx_credits < MIN_OFLD_TLSTX_CREDITS(toep))
1358 			toep->flags |= TPF_TX_SUSPENDED;
1359 
1360 		KASSERT(toep->txsd_avail > 0, ("%s: no txsd", __func__));
1361 		txsd->plen = plen;
1362 		txsd->tx_credits = credits;
1363 		txsd->iv_buffer = iv_buffer;
1364 		txsd++;
1365 		if (__predict_false(++toep->txsd_pidx == toep->txsd_total)) {
1366 			toep->txsd_pidx = 0;
1367 			txsd = &toep->txsd[0];
1368 		}
1369 		toep->txsd_avail--;
1370 
1371 		atomic_add_long(&toep->vi->pi->tx_tls_records, 1);
1372 		atomic_add_long(&toep->vi->pi->tx_tls_octets, plen);
1373 
1374 		t4_l2t_send(sc, wr, toep->l2te);
1375 	}
1376 }
1377 
1378 /*
1379  * For TLS data we place received mbufs received via CPL_TLS_DATA into
1380  * an mbufq in the TLS offload state.  When CPL_RX_TLS_CMP is
1381  * received, the completed PDUs are placed into the socket receive
1382  * buffer.
1383  *
1384  * The TLS code reuses the ulp_pdu_reclaimq to hold the pending mbufs.
1385  */
1386 static int
1387 do_tls_data(struct sge_iq *iq, const struct rss_header *rss, struct mbuf *m)
1388 {
1389 	struct adapter *sc = iq->adapter;
1390 	const struct cpl_tls_data *cpl = mtod(m, const void *);
1391 	unsigned int tid = GET_TID(cpl);
1392 	struct toepcb *toep = lookup_tid(sc, tid);
1393 	struct inpcb *inp = toep->inp;
1394 	struct tcpcb *tp;
1395 	int len;
1396 
1397 	/* XXX: Should this match do_rx_data instead? */
1398 	KASSERT(!(toep->flags & TPF_SYNQE),
1399 	    ("%s: toep %p claims to be a synq entry", __func__, toep));
1400 
1401 	KASSERT(toep->tid == tid, ("%s: toep tid/atid mismatch", __func__));
1402 
1403 	/* strip off CPL header */
1404 	m_adj(m, sizeof(*cpl));
1405 	len = m->m_pkthdr.len;
1406 
1407 	atomic_add_long(&toep->vi->pi->rx_tls_octets, len);
1408 
1409 	KASSERT(len == G_CPL_TLS_DATA_LENGTH(be32toh(cpl->length_pkd)),
1410 	    ("%s: payload length mismatch", __func__));
1411 
1412 	INP_WLOCK(inp);
1413 	if (inp->inp_flags & (INP_DROPPED | INP_TIMEWAIT)) {
1414 		CTR4(KTR_CXGBE, "%s: tid %u, rx (%d bytes), inp_flags 0x%x",
1415 		    __func__, tid, len, inp->inp_flags);
1416 		INP_WUNLOCK(inp);
1417 		m_freem(m);
1418 		return (0);
1419 	}
1420 
1421 	/* Save TCP sequence number. */
1422 	m->m_pkthdr.tls_tcp_seq = be32toh(cpl->seq);
1423 
1424 	if (mbufq_enqueue(&toep->ulp_pdu_reclaimq, m)) {
1425 #ifdef INVARIANTS
1426 		panic("Failed to queue TLS data packet");
1427 #else
1428 		printf("%s: Failed to queue TLS data packet\n", __func__);
1429 		INP_WUNLOCK(inp);
1430 		m_freem(m);
1431 		return (0);
1432 #endif
1433 	}
1434 
1435 	tp = intotcpcb(inp);
1436 	tp->t_rcvtime = ticks;
1437 
1438 #ifdef VERBOSE_TRACES
1439 	CTR4(KTR_CXGBE, "%s: tid %u len %d seq %u", __func__, tid, len,
1440 	    be32toh(cpl->seq));
1441 #endif
1442 
1443 	INP_WUNLOCK(inp);
1444 	return (0);
1445 }
1446 
1447 static int
1448 do_rx_tls_cmp(struct sge_iq *iq, const struct rss_header *rss, struct mbuf *m)
1449 {
1450 	struct adapter *sc = iq->adapter;
1451 	const struct cpl_rx_tls_cmp *cpl = mtod(m, const void *);
1452 	struct tlsrx_hdr_pkt *tls_hdr_pkt;
1453 	unsigned int tid = GET_TID(cpl);
1454 	struct toepcb *toep = lookup_tid(sc, tid);
1455 	struct inpcb *inp = toep->inp;
1456 	struct tcpcb *tp;
1457 	struct socket *so;
1458 	struct sockbuf *sb;
1459 	struct mbuf *tls_data;
1460 	int len, pdu_length, pdu_overhead, sb_length;
1461 
1462 	KASSERT(toep->tid == tid, ("%s: toep tid/atid mismatch", __func__));
1463 	KASSERT(!(toep->flags & TPF_SYNQE),
1464 	    ("%s: toep %p claims to be a synq entry", __func__, toep));
1465 
1466 	/* strip off CPL header */
1467 	m_adj(m, sizeof(*cpl));
1468 	len = m->m_pkthdr.len;
1469 
1470 	atomic_add_long(&toep->vi->pi->rx_tls_records, 1);
1471 
1472 	KASSERT(len == G_CPL_RX_TLS_CMP_LENGTH(be32toh(cpl->pdulength_length)),
1473 	    ("%s: payload length mismatch", __func__));
1474 
1475 	INP_WLOCK(inp);
1476 	if (inp->inp_flags & (INP_DROPPED | INP_TIMEWAIT)) {
1477 		CTR4(KTR_CXGBE, "%s: tid %u, rx (%d bytes), inp_flags 0x%x",
1478 		    __func__, tid, len, inp->inp_flags);
1479 		INP_WUNLOCK(inp);
1480 		m_freem(m);
1481 		return (0);
1482 	}
1483 
1484 	pdu_length = G_CPL_RX_TLS_CMP_PDULENGTH(be32toh(cpl->pdulength_length));
1485 
1486 	tp = intotcpcb(inp);
1487 
1488 #ifdef VERBOSE_TRACES
1489 	CTR6(KTR_CXGBE, "%s: tid %u PDU len %d len %d seq %u, rcv_nxt %u",
1490 	    __func__, tid, pdu_length, len, be32toh(cpl->seq), tp->rcv_nxt);
1491 #endif
1492 
1493 	tp->rcv_nxt += pdu_length;
1494 	if (tp->rcv_wnd < pdu_length) {
1495 		toep->tls.rcv_over += pdu_length - tp->rcv_wnd;
1496 		tp->rcv_wnd = 0;
1497 	} else
1498 		tp->rcv_wnd -= pdu_length;
1499 
1500 	/* XXX: Not sure what to do about urgent data. */
1501 
1502 	/*
1503 	 * The payload of this CPL is the TLS header followed by
1504 	 * additional fields.
1505 	 */
1506 	KASSERT(m->m_len >= sizeof(*tls_hdr_pkt),
1507 	    ("%s: payload too small", __func__));
1508 	tls_hdr_pkt = mtod(m, void *);
1509 
1510 	/*
1511 	 * Only the TLS header is sent to OpenSSL, so report errors by
1512 	 * altering the record type.
1513 	 */
1514 	if ((tls_hdr_pkt->res_to_mac_error & M_TLSRX_HDR_PKT_ERROR) != 0)
1515 		tls_hdr_pkt->type = CONTENT_TYPE_ERROR;
1516 
1517 	/* Trim this CPL's mbuf to only include the TLS header. */
1518 	KASSERT(m->m_len == len && m->m_next == NULL,
1519 	    ("%s: CPL spans multiple mbufs", __func__));
1520 	m->m_len = TLS_HEADER_LENGTH;
1521 	m->m_pkthdr.len = TLS_HEADER_LENGTH;
1522 
1523 	tls_data = mbufq_dequeue(&toep->ulp_pdu_reclaimq);
1524 	if (tls_data != NULL) {
1525 		KASSERT(be32toh(cpl->seq) == tls_data->m_pkthdr.tls_tcp_seq,
1526 		    ("%s: sequence mismatch", __func__));
1527 
1528 		/*
1529 		 * Update the TLS header length to be the length of
1530 		 * the payload data.
1531 		 */
1532 		tls_hdr_pkt->length = htobe16(tls_data->m_pkthdr.len);
1533 
1534 		m->m_next = tls_data;
1535 		m->m_pkthdr.len += tls_data->m_len;
1536 	}
1537 
1538 	so = inp_inpcbtosocket(inp);
1539 	sb = &so->so_rcv;
1540 	SOCKBUF_LOCK(sb);
1541 
1542 	if (__predict_false(sb->sb_state & SBS_CANTRCVMORE)) {
1543 		struct epoch_tracker et;
1544 
1545 		CTR3(KTR_CXGBE, "%s: tid %u, excess rx (%d bytes)",
1546 		    __func__, tid, pdu_length);
1547 		m_freem(m);
1548 		SOCKBUF_UNLOCK(sb);
1549 		INP_WUNLOCK(inp);
1550 
1551 		CURVNET_SET(toep->vnet);
1552 		INP_INFO_RLOCK_ET(&V_tcbinfo, et);
1553 		INP_WLOCK(inp);
1554 		tp = tcp_drop(tp, ECONNRESET);
1555 		if (tp)
1556 			INP_WUNLOCK(inp);
1557 		INP_INFO_RUNLOCK_ET(&V_tcbinfo, et);
1558 		CURVNET_RESTORE();
1559 
1560 		return (0);
1561 	}
1562 
1563 	/*
1564 	 * Not all of the bytes on the wire are included in the socket
1565 	 * buffer (e.g. the MAC of the TLS record).  However, those
1566 	 * bytes are included in the TCP sequence space.  To handle
1567 	 * this, compute the delta for this TLS record in
1568 	 * 'pdu_overhead' and treat those bytes as having already been
1569 	 * "read" by the application for the purposes of expanding the
1570 	 * window.  The meat of the TLS record passed to the
1571 	 * application ('sb_length') will still not be counted as
1572 	 * "read" until userland actually reads the bytes.
1573 	 *
1574 	 * XXX: Some of the calculations below are probably still not
1575 	 * really correct.
1576 	 */
1577 	sb_length = m->m_pkthdr.len;
1578 	pdu_overhead = pdu_length - sb_length;
1579 	toep->rx_credits += pdu_overhead;
1580 	tp->rcv_wnd += pdu_overhead;
1581 	tp->rcv_adv += pdu_overhead;
1582 
1583 	/* receive buffer autosize */
1584 	MPASS(toep->vnet == so->so_vnet);
1585 	CURVNET_SET(toep->vnet);
1586 	if (sb->sb_flags & SB_AUTOSIZE &&
1587 	    V_tcp_do_autorcvbuf &&
1588 	    sb->sb_hiwat < V_tcp_autorcvbuf_max &&
1589 	    sb_length > (sbspace(sb) / 8 * 7)) {
1590 		unsigned int hiwat = sb->sb_hiwat;
1591 		unsigned int newsize = min(hiwat + V_tcp_autorcvbuf_inc,
1592 		    V_tcp_autorcvbuf_max);
1593 
1594 		if (!sbreserve_locked(sb, newsize, so, NULL))
1595 			sb->sb_flags &= ~SB_AUTOSIZE;
1596 		else
1597 			toep->rx_credits += newsize - hiwat;
1598 	}
1599 
1600 	KASSERT(toep->sb_cc >= sbused(sb),
1601 	    ("%s: sb %p has more data (%d) than last time (%d).",
1602 	    __func__, sb, sbused(sb), toep->sb_cc));
1603 	toep->rx_credits += toep->sb_cc - sbused(sb);
1604 	sbappendstream_locked(sb, m, 0);
1605 	toep->sb_cc = sbused(sb);
1606 #ifdef VERBOSE_TRACES
1607 	CTR5(KTR_CXGBE, "%s: tid %u PDU overhead %d rx_credits %u rcv_wnd %u",
1608 	    __func__, tid, pdu_overhead, toep->rx_credits, tp->rcv_wnd);
1609 #endif
1610 	if (toep->rx_credits > 0 && toep->sb_cc + tp->rcv_wnd < sb->sb_lowat) {
1611 		int credits;
1612 
1613 		credits = send_rx_credits(sc, toep, toep->rx_credits);
1614 		toep->rx_credits -= credits;
1615 		tp->rcv_wnd += credits;
1616 		tp->rcv_adv += credits;
1617 	}
1618 
1619 	sorwakeup_locked(so);
1620 	SOCKBUF_UNLOCK_ASSERT(sb);
1621 
1622 	INP_WUNLOCK(inp);
1623 	CURVNET_RESTORE();
1624 	return (0);
1625 }
1626 
1627 void
1628 t4_tls_mod_load(void)
1629 {
1630 
1631 	mtx_init(&tls_handshake_lock, "t4tls handshake", NULL, MTX_DEF);
1632 	t4_register_cpl_handler(CPL_TLS_DATA, do_tls_data);
1633 	t4_register_cpl_handler(CPL_RX_TLS_CMP, do_rx_tls_cmp);
1634 }
1635 
1636 void
1637 t4_tls_mod_unload(void)
1638 {
1639 
1640 	t4_register_cpl_handler(CPL_TLS_DATA, NULL);
1641 	t4_register_cpl_handler(CPL_RX_TLS_CMP, NULL);
1642 	mtx_destroy(&tls_handshake_lock);
1643 }
1644 #endif	/* TCP_OFFLOAD */
1645