xref: /freebsd/sys/dev/iscsi/icl_soft.c (revision 872d2d9276daf0ce92e66a0ab8826a0d472fb3c1)
1321b17ecSEdward Tomasz Napierala /*-
2321b17ecSEdward Tomasz Napierala  * Copyright (c) 2012 The FreeBSD Foundation
3321b17ecSEdward Tomasz Napierala  * All rights reserved.
4321b17ecSEdward Tomasz Napierala  *
5321b17ecSEdward Tomasz Napierala  * This software was developed by Edward Tomasz Napierala under sponsorship
6321b17ecSEdward Tomasz Napierala  * from the FreeBSD Foundation.
7321b17ecSEdward Tomasz Napierala  *
8321b17ecSEdward Tomasz Napierala  * Redistribution and use in source and binary forms, with or without
9321b17ecSEdward Tomasz Napierala  * modification, are permitted provided that the following conditions
10321b17ecSEdward Tomasz Napierala  * are met:
11321b17ecSEdward Tomasz Napierala  * 1. Redistributions of source code must retain the above copyright
12321b17ecSEdward Tomasz Napierala  *    notice, this list of conditions and the following disclaimer.
13321b17ecSEdward Tomasz Napierala  * 2. Redistributions in binary form must reproduce the above copyright
14321b17ecSEdward Tomasz Napierala  *    notice, this list of conditions and the following disclaimer in the
15321b17ecSEdward Tomasz Napierala  *    documentation and/or other materials provided with the distribution.
16321b17ecSEdward Tomasz Napierala  *
17321b17ecSEdward Tomasz Napierala  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
18321b17ecSEdward Tomasz Napierala  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19321b17ecSEdward Tomasz Napierala  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20321b17ecSEdward Tomasz Napierala  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
21321b17ecSEdward Tomasz Napierala  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22321b17ecSEdward Tomasz Napierala  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23321b17ecSEdward Tomasz Napierala  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24321b17ecSEdward Tomasz Napierala  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25321b17ecSEdward Tomasz Napierala  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26321b17ecSEdward Tomasz Napierala  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27321b17ecSEdward Tomasz Napierala  * SUCH DAMAGE.
28321b17ecSEdward Tomasz Napierala  *
29321b17ecSEdward Tomasz Napierala  */
30321b17ecSEdward Tomasz Napierala 
31321b17ecSEdward Tomasz Napierala /*
32321b17ecSEdward Tomasz Napierala  * iSCSI Common Layer.  It's used by both the initiator and target to send
33321b17ecSEdward Tomasz Napierala  * and receive iSCSI PDUs.
34321b17ecSEdward Tomasz Napierala  */
35321b17ecSEdward Tomasz Napierala 
36321b17ecSEdward Tomasz Napierala #include <sys/cdefs.h>
37321b17ecSEdward Tomasz Napierala __FBSDID("$FreeBSD$");
38321b17ecSEdward Tomasz Napierala 
39321b17ecSEdward Tomasz Napierala #include <sys/param.h>
40321b17ecSEdward Tomasz Napierala #include <sys/capsicum.h>
41321b17ecSEdward Tomasz Napierala #include <sys/condvar.h>
42321b17ecSEdward Tomasz Napierala #include <sys/conf.h>
43321b17ecSEdward Tomasz Napierala #include <sys/file.h>
44321b17ecSEdward Tomasz Napierala #include <sys/kernel.h>
45321b17ecSEdward Tomasz Napierala #include <sys/kthread.h>
46321b17ecSEdward Tomasz Napierala #include <sys/lock.h>
47321b17ecSEdward Tomasz Napierala #include <sys/mbuf.h>
48321b17ecSEdward Tomasz Napierala #include <sys/mutex.h>
49321b17ecSEdward Tomasz Napierala #include <sys/module.h>
50321b17ecSEdward Tomasz Napierala #include <sys/protosw.h>
51321b17ecSEdward Tomasz Napierala #include <sys/socket.h>
52321b17ecSEdward Tomasz Napierala #include <sys/socketvar.h>
53321b17ecSEdward Tomasz Napierala #include <sys/sysctl.h>
54321b17ecSEdward Tomasz Napierala #include <sys/systm.h>
55321b17ecSEdward Tomasz Napierala #include <sys/sx.h>
56321b17ecSEdward Tomasz Napierala #include <sys/uio.h>
57321b17ecSEdward Tomasz Napierala #include <vm/uma.h>
58321b17ecSEdward Tomasz Napierala #include <netinet/in.h>
59321b17ecSEdward Tomasz Napierala #include <netinet/tcp.h>
60321b17ecSEdward Tomasz Napierala 
61321b17ecSEdward Tomasz Napierala #include <dev/iscsi/icl.h>
62321b17ecSEdward Tomasz Napierala #include <dev/iscsi/iscsi_proto.h>
63321b17ecSEdward Tomasz Napierala #include <icl_conn_if.h>
64321b17ecSEdward Tomasz Napierala 
/*
 * Tunables, each registered with SYSCTL_INT under the _kern_icl node using
 * CTLFLAG_RWTUN.
 */
/* PDU coalescing switch (see the sysctl description); initially 1. */
65321b17ecSEdward Tomasz Napierala static int coalesce = 1;
66321b17ecSEdward Tomasz Napierala SYSCTL_INT(_kern_icl, OID_AUTO, coalesce, CTLFLAG_RWTUN,
67321b17ecSEdward Tomasz Napierala     &coalesce, 0, "Try to coalesce PDUs before sending");
/*
 * Cap applied by icl_pdu_data_segment_receive_len() to the number of data
 * segment bytes it asks for at once; initially 128 KiB.
 */
68321b17ecSEdward Tomasz Napierala static int partial_receive_len = 128 * 1024;
69321b17ecSEdward Tomasz Napierala SYSCTL_INT(_kern_icl, OID_AUTO, partial_receive_len, CTLFLAG_RWTUN,
70321b17ecSEdward Tomasz Napierala     &partial_receive_len, 0, "Minimum read size for partially received "
71321b17ecSEdward Tomasz Napierala     "data segment");
/* Default send socket buffer size; initially 1 MiB. */
72321b17ecSEdward Tomasz Napierala static int sendspace = 1048576;
73321b17ecSEdward Tomasz Napierala SYSCTL_INT(_kern_icl, OID_AUTO, sendspace, CTLFLAG_RWTUN,
74321b17ecSEdward Tomasz Napierala     &sendspace, 0, "Default send socket buffer size");
/* Default receive socket buffer size; initially 1 MiB. */
75321b17ecSEdward Tomasz Napierala static int recvspace = 1048576;
76321b17ecSEdward Tomasz Napierala SYSCTL_INT(_kern_icl, OID_AUTO, recvspace, CTLFLAG_RWTUN,
77321b17ecSEdward Tomasz Napierala     &recvspace, 0, "Default receive socket buffer size");
78321b17ecSEdward Tomasz Napierala 
/* malloc(9) type for this backend and the UMA zone that struct icl_pdu comes from. */
79321b17ecSEdward Tomasz Napierala static MALLOC_DEFINE(M_ICL_SOFT, "icl_soft", "iSCSI software backend");
80321b17ecSEdward Tomasz Napierala static uma_zone_t icl_pdu_zone;
81321b17ecSEdward Tomasz Napierala 
/* NOTE(review): presumably the number of live connections -- not used in this part of the file; confirm. */
82321b17ecSEdward Tomasz Napierala static volatile u_int	icl_ncons;
83321b17ecSEdward Tomasz Napierala 
/*
 * Helpers for the mutex a connection points to through ic_lock: acquire,
 * release, and assert that it is / is not held by the current thread.
 *
 * X is the connection pointer.  It is parenthesized in the expansion so
 * that any pointer-valued expression (e.g. "&conns[i]" or "ip->ip_conn")
 * binds correctly to "->", not only a plain identifier.
 */
#define ICL_CONN_LOCK(X)		mtx_lock((X)->ic_lock)
#define ICL_CONN_UNLOCK(X)		mtx_unlock((X)->ic_lock)
#define ICL_CONN_LOCK_ASSERT(X)		mtx_assert((X)->ic_lock, MA_OWNED)
#define ICL_CONN_LOCK_ASSERT_NOT(X)	mtx_assert((X)->ic_lock, MA_NOTOWNED)
88321b17ecSEdward Tomasz Napierala 
/* Declares struct icl_pdu_stailq, a tail-queue head for struct icl_pdu entries. */
89321b17ecSEdward Tomasz Napierala STAILQ_HEAD(icl_pdu_stailq, icl_pdu);
90321b17ecSEdward Tomasz Napierala 
/*
 * Prototypes for this backend's implementations of the icl_conn interface
 * methods, declared through the interface's function typedefs.
 */
91321b17ecSEdward Tomasz Napierala static icl_conn_new_pdu_t	icl_soft_conn_new_pdu;
92321b17ecSEdward Tomasz Napierala static icl_conn_pdu_free_t	icl_soft_conn_pdu_free;
93321b17ecSEdward Tomasz Napierala static icl_conn_pdu_data_segment_length_t
94321b17ecSEdward Tomasz Napierala 				    icl_soft_conn_pdu_data_segment_length;
95321b17ecSEdward Tomasz Napierala static icl_conn_pdu_append_data_t	icl_soft_conn_pdu_append_data;
96321b17ecSEdward Tomasz Napierala static icl_conn_pdu_get_data_t	icl_soft_conn_pdu_get_data;
97321b17ecSEdward Tomasz Napierala static icl_conn_pdu_queue_t	icl_soft_conn_pdu_queue;
98321b17ecSEdward Tomasz Napierala static icl_conn_handoff_t	icl_soft_conn_handoff;
99321b17ecSEdward Tomasz Napierala static icl_conn_free_t		icl_soft_conn_free;
100321b17ecSEdward Tomasz Napierala static icl_conn_close_t		icl_soft_conn_close;
101321b17ecSEdward Tomasz Napierala static icl_conn_connected_t	icl_soft_conn_connected;
102321b17ecSEdward Tomasz Napierala 
/* Method table binding each icl_conn interface method to its icl_soft_* implementation. */
103321b17ecSEdward Tomasz Napierala static kobj_method_t icl_soft_methods[] = {
104321b17ecSEdward Tomasz Napierala 	KOBJMETHOD(icl_conn_new_pdu, icl_soft_conn_new_pdu),
105321b17ecSEdward Tomasz Napierala 	KOBJMETHOD(icl_conn_pdu_free, icl_soft_conn_pdu_free),
106321b17ecSEdward Tomasz Napierala 	KOBJMETHOD(icl_conn_pdu_data_segment_length,
107321b17ecSEdward Tomasz Napierala 	    icl_soft_conn_pdu_data_segment_length),
108321b17ecSEdward Tomasz Napierala 	KOBJMETHOD(icl_conn_pdu_append_data, icl_soft_conn_pdu_append_data),
109321b17ecSEdward Tomasz Napierala 	KOBJMETHOD(icl_conn_pdu_get_data, icl_soft_conn_pdu_get_data),
110321b17ecSEdward Tomasz Napierala 	KOBJMETHOD(icl_conn_pdu_queue, icl_soft_conn_pdu_queue),
111321b17ecSEdward Tomasz Napierala 	KOBJMETHOD(icl_conn_handoff, icl_soft_conn_handoff),
112321b17ecSEdward Tomasz Napierala 	KOBJMETHOD(icl_conn_free, icl_soft_conn_free),
113321b17ecSEdward Tomasz Napierala 	KOBJMETHOD(icl_conn_close, icl_soft_conn_close),
114321b17ecSEdward Tomasz Napierala 	KOBJMETHOD(icl_conn_connected, icl_soft_conn_connected),
	/* Zeroed entry terminates the table. */
115321b17ecSEdward Tomasz Napierala 	{ 0, 0 }
116321b17ecSEdward Tomasz Napierala };
117321b17ecSEdward Tomasz Napierala 
/* The icl_soft class: the method table above, with instances sized as struct icl_conn. */
118321b17ecSEdward Tomasz Napierala DEFINE_CLASS(icl_soft, icl_soft_methods, sizeof(struct icl_conn));
119321b17ecSEdward Tomasz Napierala 
/* Forward declaration; the definition is not in this part of the file. */
120321b17ecSEdward Tomasz Napierala static void	icl_conn_close(struct icl_conn *ic);
121321b17ecSEdward Tomasz Napierala 
122321b17ecSEdward Tomasz Napierala static void
123321b17ecSEdward Tomasz Napierala icl_conn_fail(struct icl_conn *ic)
124321b17ecSEdward Tomasz Napierala {
125321b17ecSEdward Tomasz Napierala 	if (ic->ic_socket == NULL)
126321b17ecSEdward Tomasz Napierala 		return;
127321b17ecSEdward Tomasz Napierala 
128321b17ecSEdward Tomasz Napierala 	/*
129321b17ecSEdward Tomasz Napierala 	 * XXX
130321b17ecSEdward Tomasz Napierala 	 */
131321b17ecSEdward Tomasz Napierala 	ic->ic_socket->so_error = EDOOFUS;
132321b17ecSEdward Tomasz Napierala 	(ic->ic_error)(ic);
133321b17ecSEdward Tomasz Napierala }
134321b17ecSEdward Tomasz Napierala 
135321b17ecSEdward Tomasz Napierala static struct mbuf *
136321b17ecSEdward Tomasz Napierala icl_conn_receive(struct icl_conn *ic, size_t len)
137321b17ecSEdward Tomasz Napierala {
138321b17ecSEdward Tomasz Napierala 	struct uio uio;
139321b17ecSEdward Tomasz Napierala 	struct socket *so;
140321b17ecSEdward Tomasz Napierala 	struct mbuf *m;
141321b17ecSEdward Tomasz Napierala 	int error, flags;
142321b17ecSEdward Tomasz Napierala 
143321b17ecSEdward Tomasz Napierala 	so = ic->ic_socket;
144321b17ecSEdward Tomasz Napierala 
145321b17ecSEdward Tomasz Napierala 	memset(&uio, 0, sizeof(uio));
146321b17ecSEdward Tomasz Napierala 	uio.uio_resid = len;
147321b17ecSEdward Tomasz Napierala 
148321b17ecSEdward Tomasz Napierala 	flags = MSG_DONTWAIT;
149321b17ecSEdward Tomasz Napierala 	error = soreceive(so, NULL, &uio, &m, NULL, &flags);
150321b17ecSEdward Tomasz Napierala 	if (error != 0) {
151321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("soreceive error %d", error);
152321b17ecSEdward Tomasz Napierala 		return (NULL);
153321b17ecSEdward Tomasz Napierala 	}
154321b17ecSEdward Tomasz Napierala 	if (uio.uio_resid != 0) {
155321b17ecSEdward Tomasz Napierala 		m_freem(m);
156321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("short read");
157321b17ecSEdward Tomasz Napierala 		return (NULL);
158321b17ecSEdward Tomasz Napierala 	}
159321b17ecSEdward Tomasz Napierala 
160321b17ecSEdward Tomasz Napierala 	return (m);
161321b17ecSEdward Tomasz Napierala }
162321b17ecSEdward Tomasz Napierala 
163321b17ecSEdward Tomasz Napierala static struct icl_pdu *
164321b17ecSEdward Tomasz Napierala icl_pdu_new_empty(struct icl_conn *ic, int flags)
165321b17ecSEdward Tomasz Napierala {
166321b17ecSEdward Tomasz Napierala 	struct icl_pdu *ip;
167321b17ecSEdward Tomasz Napierala 
168321b17ecSEdward Tomasz Napierala #ifdef DIAGNOSTIC
169321b17ecSEdward Tomasz Napierala 	refcount_acquire(&ic->ic_outstanding_pdus);
170321b17ecSEdward Tomasz Napierala #endif
171321b17ecSEdward Tomasz Napierala 	ip = uma_zalloc(icl_pdu_zone, flags | M_ZERO);
172321b17ecSEdward Tomasz Napierala 	if (ip == NULL) {
173321b17ecSEdward Tomasz Napierala 		ICL_WARN("failed to allocate %zd bytes", sizeof(*ip));
174321b17ecSEdward Tomasz Napierala #ifdef DIAGNOSTIC
175321b17ecSEdward Tomasz Napierala 		refcount_release(&ic->ic_outstanding_pdus);
176321b17ecSEdward Tomasz Napierala #endif
177321b17ecSEdward Tomasz Napierala 		return (NULL);
178321b17ecSEdward Tomasz Napierala 	}
179321b17ecSEdward Tomasz Napierala 
180321b17ecSEdward Tomasz Napierala 	ip->ip_conn = ic;
181321b17ecSEdward Tomasz Napierala 
182321b17ecSEdward Tomasz Napierala 	return (ip);
183321b17ecSEdward Tomasz Napierala }
184321b17ecSEdward Tomasz Napierala 
185321b17ecSEdward Tomasz Napierala static void
186321b17ecSEdward Tomasz Napierala icl_pdu_free(struct icl_pdu *ip)
187321b17ecSEdward Tomasz Napierala {
188321b17ecSEdward Tomasz Napierala 	struct icl_conn *ic;
189321b17ecSEdward Tomasz Napierala 
190321b17ecSEdward Tomasz Napierala 	ic = ip->ip_conn;
191321b17ecSEdward Tomasz Napierala 
192321b17ecSEdward Tomasz Napierala 	m_freem(ip->ip_bhs_mbuf);
193321b17ecSEdward Tomasz Napierala 	m_freem(ip->ip_ahs_mbuf);
194321b17ecSEdward Tomasz Napierala 	m_freem(ip->ip_data_mbuf);
195321b17ecSEdward Tomasz Napierala 	uma_zfree(icl_pdu_zone, ip);
196321b17ecSEdward Tomasz Napierala #ifdef DIAGNOSTIC
197321b17ecSEdward Tomasz Napierala 	refcount_release(&ic->ic_outstanding_pdus);
198321b17ecSEdward Tomasz Napierala #endif
199321b17ecSEdward Tomasz Napierala }
200321b17ecSEdward Tomasz Napierala 
/*
 * icl_conn_pdu_free method: release ip through icl_pdu_free().
 */
void
icl_soft_conn_pdu_free(struct icl_conn *ic, struct icl_pdu *ip)
{

	/* The PDU carries its own ip_conn pointer, so ic is not consulted. */
	icl_pdu_free(ip);
}
206321b17ecSEdward Tomasz Napierala 
207321b17ecSEdward Tomasz Napierala /*
208321b17ecSEdward Tomasz Napierala  * Allocate icl_pdu with empty BHS to fill up by the caller.
209321b17ecSEdward Tomasz Napierala  */
210321b17ecSEdward Tomasz Napierala struct icl_pdu *
211321b17ecSEdward Tomasz Napierala icl_soft_conn_new_pdu(struct icl_conn *ic, int flags)
212321b17ecSEdward Tomasz Napierala {
213321b17ecSEdward Tomasz Napierala 	struct icl_pdu *ip;
214321b17ecSEdward Tomasz Napierala 
215321b17ecSEdward Tomasz Napierala 	ip = icl_pdu_new_empty(ic, flags);
216321b17ecSEdward Tomasz Napierala 	if (ip == NULL)
217321b17ecSEdward Tomasz Napierala 		return (NULL);
218321b17ecSEdward Tomasz Napierala 
219321b17ecSEdward Tomasz Napierala 	ip->ip_bhs_mbuf = m_getm2(NULL, sizeof(struct iscsi_bhs),
220321b17ecSEdward Tomasz Napierala 	    flags, MT_DATA, M_PKTHDR);
221321b17ecSEdward Tomasz Napierala 	if (ip->ip_bhs_mbuf == NULL) {
222321b17ecSEdward Tomasz Napierala 		ICL_WARN("failed to allocate %zd bytes", sizeof(*ip));
223321b17ecSEdward Tomasz Napierala 		icl_pdu_free(ip);
224321b17ecSEdward Tomasz Napierala 		return (NULL);
225321b17ecSEdward Tomasz Napierala 	}
226321b17ecSEdward Tomasz Napierala 	ip->ip_bhs = mtod(ip->ip_bhs_mbuf, struct iscsi_bhs *);
227321b17ecSEdward Tomasz Napierala 	memset(ip->ip_bhs, 0, sizeof(struct iscsi_bhs));
228321b17ecSEdward Tomasz Napierala 	ip->ip_bhs_mbuf->m_len = sizeof(struct iscsi_bhs);
229321b17ecSEdward Tomasz Napierala 
230321b17ecSEdward Tomasz Napierala 	return (ip);
231321b17ecSEdward Tomasz Napierala }
232321b17ecSEdward Tomasz Napierala 
233321b17ecSEdward Tomasz Napierala static int
234321b17ecSEdward Tomasz Napierala icl_pdu_ahs_length(const struct icl_pdu *request)
235321b17ecSEdward Tomasz Napierala {
236321b17ecSEdward Tomasz Napierala 
237321b17ecSEdward Tomasz Napierala 	return (request->ip_bhs->bhs_total_ahs_len * 4);
238321b17ecSEdward Tomasz Napierala }
239321b17ecSEdward Tomasz Napierala 
240321b17ecSEdward Tomasz Napierala static size_t
241321b17ecSEdward Tomasz Napierala icl_pdu_data_segment_length(const struct icl_pdu *request)
242321b17ecSEdward Tomasz Napierala {
243321b17ecSEdward Tomasz Napierala 	uint32_t len = 0;
244321b17ecSEdward Tomasz Napierala 
245321b17ecSEdward Tomasz Napierala 	len += request->ip_bhs->bhs_data_segment_len[0];
246321b17ecSEdward Tomasz Napierala 	len <<= 8;
247321b17ecSEdward Tomasz Napierala 	len += request->ip_bhs->bhs_data_segment_len[1];
248321b17ecSEdward Tomasz Napierala 	len <<= 8;
249321b17ecSEdward Tomasz Napierala 	len += request->ip_bhs->bhs_data_segment_len[2];
250321b17ecSEdward Tomasz Napierala 
251321b17ecSEdward Tomasz Napierala 	return (len);
252321b17ecSEdward Tomasz Napierala }
253321b17ecSEdward Tomasz Napierala 
/*
 * icl_conn_pdu_data_segment_length method: report the data segment length
 * encoded in the PDU's BHS.  The connection argument is not consulted.
 */
size_t
icl_soft_conn_pdu_data_segment_length(struct icl_conn *ic,
    const struct icl_pdu *request)
{
	size_t dsl;

	dsl = icl_pdu_data_segment_length(request);
	return (dsl);
}
261321b17ecSEdward Tomasz Napierala 
262321b17ecSEdward Tomasz Napierala static void
263321b17ecSEdward Tomasz Napierala icl_pdu_set_data_segment_length(struct icl_pdu *response, uint32_t len)
264321b17ecSEdward Tomasz Napierala {
265321b17ecSEdward Tomasz Napierala 
266321b17ecSEdward Tomasz Napierala 	response->ip_bhs->bhs_data_segment_len[2] = len;
267321b17ecSEdward Tomasz Napierala 	response->ip_bhs->bhs_data_segment_len[1] = len >> 8;
268321b17ecSEdward Tomasz Napierala 	response->ip_bhs->bhs_data_segment_len[0] = len >> 16;
269321b17ecSEdward Tomasz Napierala }
270321b17ecSEdward Tomasz Napierala 
271321b17ecSEdward Tomasz Napierala static size_t
272321b17ecSEdward Tomasz Napierala icl_pdu_padding(const struct icl_pdu *ip)
273321b17ecSEdward Tomasz Napierala {
274321b17ecSEdward Tomasz Napierala 
275321b17ecSEdward Tomasz Napierala 	if ((ip->ip_data_len % 4) != 0)
276321b17ecSEdward Tomasz Napierala 		return (4 - (ip->ip_data_len % 4));
277321b17ecSEdward Tomasz Napierala 
278321b17ecSEdward Tomasz Napierala 	return (0);
279321b17ecSEdward Tomasz Napierala }
280321b17ecSEdward Tomasz Napierala 
281321b17ecSEdward Tomasz Napierala static size_t
282321b17ecSEdward Tomasz Napierala icl_pdu_size(const struct icl_pdu *response)
283321b17ecSEdward Tomasz Napierala {
284321b17ecSEdward Tomasz Napierala 	size_t len;
285321b17ecSEdward Tomasz Napierala 
286321b17ecSEdward Tomasz Napierala 	KASSERT(response->ip_ahs_len == 0, ("responding with AHS"));
287321b17ecSEdward Tomasz Napierala 
288321b17ecSEdward Tomasz Napierala 	len = sizeof(struct iscsi_bhs) + response->ip_data_len +
289321b17ecSEdward Tomasz Napierala 	    icl_pdu_padding(response);
290321b17ecSEdward Tomasz Napierala 	if (response->ip_conn->ic_header_crc32c)
291321b17ecSEdward Tomasz Napierala 		len += ISCSI_HEADER_DIGEST_SIZE;
292321b17ecSEdward Tomasz Napierala 	if (response->ip_data_len != 0 && response->ip_conn->ic_data_crc32c)
293321b17ecSEdward Tomasz Napierala 		len += ISCSI_DATA_DIGEST_SIZE;
294321b17ecSEdward Tomasz Napierala 
295321b17ecSEdward Tomasz Napierala 	return (len);
296321b17ecSEdward Tomasz Napierala }
297321b17ecSEdward Tomasz Napierala 
298321b17ecSEdward Tomasz Napierala static int
299321b17ecSEdward Tomasz Napierala icl_pdu_receive_bhs(struct icl_pdu *request, size_t *availablep)
300321b17ecSEdward Tomasz Napierala {
301321b17ecSEdward Tomasz Napierala 	struct mbuf *m;
302321b17ecSEdward Tomasz Napierala 
303321b17ecSEdward Tomasz Napierala 	m = icl_conn_receive(request->ip_conn, sizeof(struct iscsi_bhs));
304321b17ecSEdward Tomasz Napierala 	if (m == NULL) {
305321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("failed to receive BHS");
306321b17ecSEdward Tomasz Napierala 		return (-1);
307321b17ecSEdward Tomasz Napierala 	}
308321b17ecSEdward Tomasz Napierala 
309321b17ecSEdward Tomasz Napierala 	request->ip_bhs_mbuf = m_pullup(m, sizeof(struct iscsi_bhs));
310321b17ecSEdward Tomasz Napierala 	if (request->ip_bhs_mbuf == NULL) {
311321b17ecSEdward Tomasz Napierala 		ICL_WARN("m_pullup failed");
312321b17ecSEdward Tomasz Napierala 		return (-1);
313321b17ecSEdward Tomasz Napierala 	}
314321b17ecSEdward Tomasz Napierala 	request->ip_bhs = mtod(request->ip_bhs_mbuf, struct iscsi_bhs *);
315321b17ecSEdward Tomasz Napierala 
316321b17ecSEdward Tomasz Napierala 	/*
317321b17ecSEdward Tomasz Napierala 	 * XXX: For architectures with strict alignment requirements
318321b17ecSEdward Tomasz Napierala 	 * 	we may need to allocate ip_bhs and copy the data into it.
319321b17ecSEdward Tomasz Napierala 	 * 	For some reason, though, not doing this doesn't seem
320321b17ecSEdward Tomasz Napierala 	 * 	to cause problems; tested on sparc64.
321321b17ecSEdward Tomasz Napierala 	 */
322321b17ecSEdward Tomasz Napierala 
323321b17ecSEdward Tomasz Napierala 	*availablep -= sizeof(struct iscsi_bhs);
324321b17ecSEdward Tomasz Napierala 	return (0);
325321b17ecSEdward Tomasz Napierala }
326321b17ecSEdward Tomasz Napierala 
327321b17ecSEdward Tomasz Napierala static int
328321b17ecSEdward Tomasz Napierala icl_pdu_receive_ahs(struct icl_pdu *request, size_t *availablep)
329321b17ecSEdward Tomasz Napierala {
330321b17ecSEdward Tomasz Napierala 
331321b17ecSEdward Tomasz Napierala 	request->ip_ahs_len = icl_pdu_ahs_length(request);
332321b17ecSEdward Tomasz Napierala 	if (request->ip_ahs_len == 0)
333321b17ecSEdward Tomasz Napierala 		return (0);
334321b17ecSEdward Tomasz Napierala 
335321b17ecSEdward Tomasz Napierala 	request->ip_ahs_mbuf = icl_conn_receive(request->ip_conn,
336321b17ecSEdward Tomasz Napierala 	    request->ip_ahs_len);
337321b17ecSEdward Tomasz Napierala 	if (request->ip_ahs_mbuf == NULL) {
338321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("failed to receive AHS");
339321b17ecSEdward Tomasz Napierala 		return (-1);
340321b17ecSEdward Tomasz Napierala 	}
341321b17ecSEdward Tomasz Napierala 
342321b17ecSEdward Tomasz Napierala 	*availablep -= request->ip_ahs_len;
343321b17ecSEdward Tomasz Napierala 	return (0);
344321b17ecSEdward Tomasz Napierala }
345321b17ecSEdward Tomasz Napierala 
346321b17ecSEdward Tomasz Napierala static uint32_t
347321b17ecSEdward Tomasz Napierala icl_mbuf_to_crc32c(const struct mbuf *m0)
348321b17ecSEdward Tomasz Napierala {
349321b17ecSEdward Tomasz Napierala 	uint32_t digest = 0xffffffff;
350321b17ecSEdward Tomasz Napierala 	const struct mbuf *m;
351321b17ecSEdward Tomasz Napierala 
352321b17ecSEdward Tomasz Napierala 	for (m = m0; m != NULL; m = m->m_next)
353321b17ecSEdward Tomasz Napierala 		digest = calculate_crc32c(digest,
354321b17ecSEdward Tomasz Napierala 		    mtod(m, const void *), m->m_len);
355321b17ecSEdward Tomasz Napierala 
356321b17ecSEdward Tomasz Napierala 	digest = digest ^ 0xffffffff;
357321b17ecSEdward Tomasz Napierala 
358321b17ecSEdward Tomasz Napierala 	return (digest);
359321b17ecSEdward Tomasz Napierala }
360321b17ecSEdward Tomasz Napierala 
361321b17ecSEdward Tomasz Napierala static int
362321b17ecSEdward Tomasz Napierala icl_pdu_check_header_digest(struct icl_pdu *request, size_t *availablep)
363321b17ecSEdward Tomasz Napierala {
364321b17ecSEdward Tomasz Napierala 	struct mbuf *m;
365321b17ecSEdward Tomasz Napierala 	uint32_t received_digest, valid_digest;
366321b17ecSEdward Tomasz Napierala 
367321b17ecSEdward Tomasz Napierala 	if (request->ip_conn->ic_header_crc32c == false)
368321b17ecSEdward Tomasz Napierala 		return (0);
369321b17ecSEdward Tomasz Napierala 
370321b17ecSEdward Tomasz Napierala 	m = icl_conn_receive(request->ip_conn, ISCSI_HEADER_DIGEST_SIZE);
371321b17ecSEdward Tomasz Napierala 	if (m == NULL) {
372321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("failed to receive header digest");
373321b17ecSEdward Tomasz Napierala 		return (-1);
374321b17ecSEdward Tomasz Napierala 	}
375321b17ecSEdward Tomasz Napierala 
376321b17ecSEdward Tomasz Napierala 	CTASSERT(sizeof(received_digest) == ISCSI_HEADER_DIGEST_SIZE);
377321b17ecSEdward Tomasz Napierala 	m_copydata(m, 0, ISCSI_HEADER_DIGEST_SIZE, (void *)&received_digest);
378321b17ecSEdward Tomasz Napierala 	m_freem(m);
379321b17ecSEdward Tomasz Napierala 
380321b17ecSEdward Tomasz Napierala 	*availablep -= ISCSI_HEADER_DIGEST_SIZE;
381321b17ecSEdward Tomasz Napierala 
382321b17ecSEdward Tomasz Napierala 	/*
383321b17ecSEdward Tomasz Napierala 	 * XXX: Handle AHS.
384321b17ecSEdward Tomasz Napierala 	 */
385321b17ecSEdward Tomasz Napierala 	valid_digest = icl_mbuf_to_crc32c(request->ip_bhs_mbuf);
386321b17ecSEdward Tomasz Napierala 	if (received_digest != valid_digest) {
387321b17ecSEdward Tomasz Napierala 		ICL_WARN("header digest check failed; got 0x%x, "
388321b17ecSEdward Tomasz Napierala 		    "should be 0x%x", received_digest, valid_digest);
389321b17ecSEdward Tomasz Napierala 		return (-1);
390321b17ecSEdward Tomasz Napierala 	}
391321b17ecSEdward Tomasz Napierala 
392321b17ecSEdward Tomasz Napierala 	return (0);
393321b17ecSEdward Tomasz Napierala }
394321b17ecSEdward Tomasz Napierala 
395321b17ecSEdward Tomasz Napierala /*
396321b17ecSEdward Tomasz Napierala  * Return the number of bytes that should be waiting in the receive socket
397321b17ecSEdward Tomasz Napierala  * before icl_pdu_receive_data_segment() gets called.
398321b17ecSEdward Tomasz Napierala  */
399321b17ecSEdward Tomasz Napierala static size_t
400321b17ecSEdward Tomasz Napierala icl_pdu_data_segment_receive_len(const struct icl_pdu *request)
401321b17ecSEdward Tomasz Napierala {
402321b17ecSEdward Tomasz Napierala 	size_t len;
403321b17ecSEdward Tomasz Napierala 
404321b17ecSEdward Tomasz Napierala 	len = icl_pdu_data_segment_length(request);
405321b17ecSEdward Tomasz Napierala 	if (len == 0)
406321b17ecSEdward Tomasz Napierala 		return (0);
407321b17ecSEdward Tomasz Napierala 
408321b17ecSEdward Tomasz Napierala 	/*
409321b17ecSEdward Tomasz Napierala 	 * Account for the parts of data segment already read from
410321b17ecSEdward Tomasz Napierala 	 * the socket buffer.
411321b17ecSEdward Tomasz Napierala 	 */
412321b17ecSEdward Tomasz Napierala 	KASSERT(len > request->ip_data_len, ("len <= request->ip_data_len"));
413321b17ecSEdward Tomasz Napierala 	len -= request->ip_data_len;
414321b17ecSEdward Tomasz Napierala 
415321b17ecSEdward Tomasz Napierala 	/*
416321b17ecSEdward Tomasz Napierala 	 * Don't always wait for the full data segment to be delivered
417321b17ecSEdward Tomasz Napierala 	 * to the socket; this might badly affect performance due to
418321b17ecSEdward Tomasz Napierala 	 * TCP window scaling.
419321b17ecSEdward Tomasz Napierala 	 */
420321b17ecSEdward Tomasz Napierala 	if (len > partial_receive_len) {
421321b17ecSEdward Tomasz Napierala #if 0
422321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("need %zd bytes of data, limiting to %zd",
423321b17ecSEdward Tomasz Napierala 		    len, partial_receive_len));
424321b17ecSEdward Tomasz Napierala #endif
425321b17ecSEdward Tomasz Napierala 		len = partial_receive_len;
426321b17ecSEdward Tomasz Napierala 
427321b17ecSEdward Tomasz Napierala 		return (len);
428321b17ecSEdward Tomasz Napierala 	}
429321b17ecSEdward Tomasz Napierala 
430321b17ecSEdward Tomasz Napierala 	/*
431321b17ecSEdward Tomasz Napierala 	 * Account for padding.  Note that due to the way code is written,
432321b17ecSEdward Tomasz Napierala 	 * the icl_pdu_receive_data_segment() must always receive padding
433321b17ecSEdward Tomasz Napierala 	 * along with the last part of data segment, because it would be
434321b17ecSEdward Tomasz Napierala 	 * impossible to tell whether we've already received the full data
435321b17ecSEdward Tomasz Napierala 	 * segment including padding, or without it.
436321b17ecSEdward Tomasz Napierala 	 */
437321b17ecSEdward Tomasz Napierala 	if ((len % 4) != 0)
438321b17ecSEdward Tomasz Napierala 		len += 4 - (len % 4);
439321b17ecSEdward Tomasz Napierala 
440321b17ecSEdward Tomasz Napierala #if 0
441321b17ecSEdward Tomasz Napierala 	ICL_DEBUG("need %zd bytes of data", len));
442321b17ecSEdward Tomasz Napierala #endif
443321b17ecSEdward Tomasz Napierala 
444321b17ecSEdward Tomasz Napierala 	return (len);
445321b17ecSEdward Tomasz Napierala }
446321b17ecSEdward Tomasz Napierala 
447321b17ecSEdward Tomasz Napierala static int
448321b17ecSEdward Tomasz Napierala icl_pdu_receive_data_segment(struct icl_pdu *request,
449321b17ecSEdward Tomasz Napierala     size_t *availablep, bool *more_neededp)
450321b17ecSEdward Tomasz Napierala {
451321b17ecSEdward Tomasz Napierala 	struct icl_conn *ic;
452321b17ecSEdward Tomasz Napierala 	size_t len, padding = 0;
453321b17ecSEdward Tomasz Napierala 	struct mbuf *m;
454321b17ecSEdward Tomasz Napierala 
455321b17ecSEdward Tomasz Napierala 	ic = request->ip_conn;
456321b17ecSEdward Tomasz Napierala 
457321b17ecSEdward Tomasz Napierala 	*more_neededp = false;
458321b17ecSEdward Tomasz Napierala 	ic->ic_receive_len = 0;
459321b17ecSEdward Tomasz Napierala 
460321b17ecSEdward Tomasz Napierala 	len = icl_pdu_data_segment_length(request);
461321b17ecSEdward Tomasz Napierala 	if (len == 0)
462321b17ecSEdward Tomasz Napierala 		return (0);
463321b17ecSEdward Tomasz Napierala 
464321b17ecSEdward Tomasz Napierala 	if ((len % 4) != 0)
465321b17ecSEdward Tomasz Napierala 		padding = 4 - (len % 4);
466321b17ecSEdward Tomasz Napierala 
467321b17ecSEdward Tomasz Napierala 	/*
468321b17ecSEdward Tomasz Napierala 	 * Account for already received parts of data segment.
469321b17ecSEdward Tomasz Napierala 	 */
470321b17ecSEdward Tomasz Napierala 	KASSERT(len > request->ip_data_len, ("len <= request->ip_data_len"));
471321b17ecSEdward Tomasz Napierala 	len -= request->ip_data_len;
472321b17ecSEdward Tomasz Napierala 
473321b17ecSEdward Tomasz Napierala 	if (len + padding > *availablep) {
474321b17ecSEdward Tomasz Napierala 		/*
475321b17ecSEdward Tomasz Napierala 		 * Not enough data in the socket buffer.  Receive as much
476321b17ecSEdward Tomasz Napierala 		 * as we can.  Don't receive padding, since, obviously, it's
477321b17ecSEdward Tomasz Napierala 		 * not the end of data segment yet.
478321b17ecSEdward Tomasz Napierala 		 */
479321b17ecSEdward Tomasz Napierala #if 0
480321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("limited from %zd to %zd",
481321b17ecSEdward Tomasz Napierala 		    len + padding, *availablep - padding));
482321b17ecSEdward Tomasz Napierala #endif
483321b17ecSEdward Tomasz Napierala 		len = *availablep - padding;
484321b17ecSEdward Tomasz Napierala 		*more_neededp = true;
485321b17ecSEdward Tomasz Napierala 		padding = 0;
486321b17ecSEdward Tomasz Napierala 	}
487321b17ecSEdward Tomasz Napierala 
488321b17ecSEdward Tomasz Napierala 	/*
489321b17ecSEdward Tomasz Napierala 	 * Must not try to receive padding without at least one byte
490321b17ecSEdward Tomasz Napierala 	 * of actual data segment.
491321b17ecSEdward Tomasz Napierala 	 */
492321b17ecSEdward Tomasz Napierala 	if (len > 0) {
493321b17ecSEdward Tomasz Napierala 		m = icl_conn_receive(request->ip_conn, len + padding);
494321b17ecSEdward Tomasz Napierala 		if (m == NULL) {
495321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("failed to receive data segment");
496321b17ecSEdward Tomasz Napierala 			return (-1);
497321b17ecSEdward Tomasz Napierala 		}
498321b17ecSEdward Tomasz Napierala 
499321b17ecSEdward Tomasz Napierala 		if (request->ip_data_mbuf == NULL)
500321b17ecSEdward Tomasz Napierala 			request->ip_data_mbuf = m;
501321b17ecSEdward Tomasz Napierala 		else
502321b17ecSEdward Tomasz Napierala 			m_cat(request->ip_data_mbuf, m);
503321b17ecSEdward Tomasz Napierala 
504321b17ecSEdward Tomasz Napierala 		request->ip_data_len += len;
505321b17ecSEdward Tomasz Napierala 		*availablep -= len + padding;
506321b17ecSEdward Tomasz Napierala 	} else
507321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("len 0");
508321b17ecSEdward Tomasz Napierala 
509321b17ecSEdward Tomasz Napierala 	if (*more_neededp)
510321b17ecSEdward Tomasz Napierala 		ic->ic_receive_len =
511321b17ecSEdward Tomasz Napierala 		    icl_pdu_data_segment_receive_len(request);
512321b17ecSEdward Tomasz Napierala 
513321b17ecSEdward Tomasz Napierala 	return (0);
514321b17ecSEdward Tomasz Napierala }
515321b17ecSEdward Tomasz Napierala 
516321b17ecSEdward Tomasz Napierala static int
517321b17ecSEdward Tomasz Napierala icl_pdu_check_data_digest(struct icl_pdu *request, size_t *availablep)
518321b17ecSEdward Tomasz Napierala {
519321b17ecSEdward Tomasz Napierala 	struct mbuf *m;
520321b17ecSEdward Tomasz Napierala 	uint32_t received_digest, valid_digest;
521321b17ecSEdward Tomasz Napierala 
522321b17ecSEdward Tomasz Napierala 	if (request->ip_conn->ic_data_crc32c == false)
523321b17ecSEdward Tomasz Napierala 		return (0);
524321b17ecSEdward Tomasz Napierala 
525321b17ecSEdward Tomasz Napierala 	if (request->ip_data_len == 0)
526321b17ecSEdward Tomasz Napierala 		return (0);
527321b17ecSEdward Tomasz Napierala 
528321b17ecSEdward Tomasz Napierala 	m = icl_conn_receive(request->ip_conn, ISCSI_DATA_DIGEST_SIZE);
529321b17ecSEdward Tomasz Napierala 	if (m == NULL) {
530321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("failed to receive data digest");
531321b17ecSEdward Tomasz Napierala 		return (-1);
532321b17ecSEdward Tomasz Napierala 	}
533321b17ecSEdward Tomasz Napierala 
534321b17ecSEdward Tomasz Napierala 	CTASSERT(sizeof(received_digest) == ISCSI_DATA_DIGEST_SIZE);
535321b17ecSEdward Tomasz Napierala 	m_copydata(m, 0, ISCSI_DATA_DIGEST_SIZE, (void *)&received_digest);
536321b17ecSEdward Tomasz Napierala 	m_freem(m);
537321b17ecSEdward Tomasz Napierala 
538321b17ecSEdward Tomasz Napierala 	*availablep -= ISCSI_DATA_DIGEST_SIZE;
539321b17ecSEdward Tomasz Napierala 
540321b17ecSEdward Tomasz Napierala 	/*
541321b17ecSEdward Tomasz Napierala 	 * Note that ip_data_mbuf also contains padding; since digest
542321b17ecSEdward Tomasz Napierala 	 * calculation is supposed to include that, we iterate over
543321b17ecSEdward Tomasz Napierala 	 * the entire ip_data_mbuf chain, not just ip_data_len bytes of it.
544321b17ecSEdward Tomasz Napierala 	 */
545321b17ecSEdward Tomasz Napierala 	valid_digest = icl_mbuf_to_crc32c(request->ip_data_mbuf);
546321b17ecSEdward Tomasz Napierala 	if (received_digest != valid_digest) {
547321b17ecSEdward Tomasz Napierala 		ICL_WARN("data digest check failed; got 0x%x, "
548321b17ecSEdward Tomasz Napierala 		    "should be 0x%x", received_digest, valid_digest);
549321b17ecSEdward Tomasz Napierala 		return (-1);
550321b17ecSEdward Tomasz Napierala 	}
551321b17ecSEdward Tomasz Napierala 
552321b17ecSEdward Tomasz Napierala 	return (0);
553321b17ecSEdward Tomasz Napierala }
554321b17ecSEdward Tomasz Napierala 
555321b17ecSEdward Tomasz Napierala /*
556321b17ecSEdward Tomasz Napierala  * Somewhat contrary to the name, this attempts to receive only one
557321b17ecSEdward Tomasz Napierala  * "part" of PDU at a time; call it repeatedly until it returns non-NULL.
558321b17ecSEdward Tomasz Napierala  */
559321b17ecSEdward Tomasz Napierala static struct icl_pdu *
560321b17ecSEdward Tomasz Napierala icl_conn_receive_pdu(struct icl_conn *ic, size_t *availablep)
561321b17ecSEdward Tomasz Napierala {
562321b17ecSEdward Tomasz Napierala 	struct icl_pdu *request;
563321b17ecSEdward Tomasz Napierala 	struct socket *so;
564321b17ecSEdward Tomasz Napierala 	size_t len;
565321b17ecSEdward Tomasz Napierala 	int error;
566321b17ecSEdward Tomasz Napierala 	bool more_needed;
567321b17ecSEdward Tomasz Napierala 
568321b17ecSEdward Tomasz Napierala 	so = ic->ic_socket;
569321b17ecSEdward Tomasz Napierala 
570321b17ecSEdward Tomasz Napierala 	if (ic->ic_receive_state == ICL_CONN_STATE_BHS) {
571321b17ecSEdward Tomasz Napierala 		KASSERT(ic->ic_receive_pdu == NULL,
572321b17ecSEdward Tomasz Napierala 		    ("ic->ic_receive_pdu != NULL"));
573321b17ecSEdward Tomasz Napierala 		request = icl_pdu_new_empty(ic, M_NOWAIT);
574321b17ecSEdward Tomasz Napierala 		if (request == NULL) {
575321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("failed to allocate PDU; "
576321b17ecSEdward Tomasz Napierala 			    "dropping connection");
577321b17ecSEdward Tomasz Napierala 			icl_conn_fail(ic);
578321b17ecSEdward Tomasz Napierala 			return (NULL);
579321b17ecSEdward Tomasz Napierala 		}
580321b17ecSEdward Tomasz Napierala 		ic->ic_receive_pdu = request;
581321b17ecSEdward Tomasz Napierala 	} else {
582321b17ecSEdward Tomasz Napierala 		KASSERT(ic->ic_receive_pdu != NULL,
583321b17ecSEdward Tomasz Napierala 		    ("ic->ic_receive_pdu == NULL"));
584321b17ecSEdward Tomasz Napierala 		request = ic->ic_receive_pdu;
585321b17ecSEdward Tomasz Napierala 	}
586321b17ecSEdward Tomasz Napierala 
587321b17ecSEdward Tomasz Napierala 	if (*availablep < ic->ic_receive_len) {
588321b17ecSEdward Tomasz Napierala #if 0
589321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("not enough data; need %zd, "
590321b17ecSEdward Tomasz Napierala 		    "have %zd", ic->ic_receive_len, *availablep);
591321b17ecSEdward Tomasz Napierala #endif
592321b17ecSEdward Tomasz Napierala 		return (NULL);
593321b17ecSEdward Tomasz Napierala 	}
594321b17ecSEdward Tomasz Napierala 
595321b17ecSEdward Tomasz Napierala 	switch (ic->ic_receive_state) {
596321b17ecSEdward Tomasz Napierala 	case ICL_CONN_STATE_BHS:
597321b17ecSEdward Tomasz Napierala 		//ICL_DEBUG("receiving BHS");
598321b17ecSEdward Tomasz Napierala 		error = icl_pdu_receive_bhs(request, availablep);
599321b17ecSEdward Tomasz Napierala 		if (error != 0) {
600321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("failed to receive BHS; "
601321b17ecSEdward Tomasz Napierala 			    "dropping connection");
602321b17ecSEdward Tomasz Napierala 			break;
603321b17ecSEdward Tomasz Napierala 		}
604321b17ecSEdward Tomasz Napierala 
605321b17ecSEdward Tomasz Napierala 		/*
606321b17ecSEdward Tomasz Napierala 		 * We don't enforce any limit for AHS length;
607321b17ecSEdward Tomasz Napierala 		 * its length is stored in 8 bit field.
608321b17ecSEdward Tomasz Napierala 		 */
609321b17ecSEdward Tomasz Napierala 
610321b17ecSEdward Tomasz Napierala 		len = icl_pdu_data_segment_length(request);
611321b17ecSEdward Tomasz Napierala 		if (len > ic->ic_max_data_segment_length) {
612321b17ecSEdward Tomasz Napierala 			ICL_WARN("received data segment "
613321b17ecSEdward Tomasz Napierala 			    "length %zd is larger than negotiated "
614321b17ecSEdward Tomasz Napierala 			    "MaxDataSegmentLength %zd; "
615321b17ecSEdward Tomasz Napierala 			    "dropping connection",
616321b17ecSEdward Tomasz Napierala 			    len, ic->ic_max_data_segment_length);
617321b17ecSEdward Tomasz Napierala 			error = EINVAL;
618321b17ecSEdward Tomasz Napierala 			break;
619321b17ecSEdward Tomasz Napierala 		}
620321b17ecSEdward Tomasz Napierala 
621321b17ecSEdward Tomasz Napierala 		ic->ic_receive_state = ICL_CONN_STATE_AHS;
622321b17ecSEdward Tomasz Napierala 		ic->ic_receive_len = icl_pdu_ahs_length(request);
623321b17ecSEdward Tomasz Napierala 		break;
624321b17ecSEdward Tomasz Napierala 
625321b17ecSEdward Tomasz Napierala 	case ICL_CONN_STATE_AHS:
626321b17ecSEdward Tomasz Napierala 		//ICL_DEBUG("receiving AHS");
627321b17ecSEdward Tomasz Napierala 		error = icl_pdu_receive_ahs(request, availablep);
628321b17ecSEdward Tomasz Napierala 		if (error != 0) {
629321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("failed to receive AHS; "
630321b17ecSEdward Tomasz Napierala 			    "dropping connection");
631321b17ecSEdward Tomasz Napierala 			break;
632321b17ecSEdward Tomasz Napierala 		}
633321b17ecSEdward Tomasz Napierala 		ic->ic_receive_state = ICL_CONN_STATE_HEADER_DIGEST;
634321b17ecSEdward Tomasz Napierala 		if (ic->ic_header_crc32c == false)
635321b17ecSEdward Tomasz Napierala 			ic->ic_receive_len = 0;
636321b17ecSEdward Tomasz Napierala 		else
637321b17ecSEdward Tomasz Napierala 			ic->ic_receive_len = ISCSI_HEADER_DIGEST_SIZE;
638321b17ecSEdward Tomasz Napierala 		break;
639321b17ecSEdward Tomasz Napierala 
640321b17ecSEdward Tomasz Napierala 	case ICL_CONN_STATE_HEADER_DIGEST:
641321b17ecSEdward Tomasz Napierala 		//ICL_DEBUG("receiving header digest");
642321b17ecSEdward Tomasz Napierala 		error = icl_pdu_check_header_digest(request, availablep);
643321b17ecSEdward Tomasz Napierala 		if (error != 0) {
644321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("header digest failed; "
645321b17ecSEdward Tomasz Napierala 			    "dropping connection");
646321b17ecSEdward Tomasz Napierala 			break;
647321b17ecSEdward Tomasz Napierala 		}
648321b17ecSEdward Tomasz Napierala 
649321b17ecSEdward Tomasz Napierala 		ic->ic_receive_state = ICL_CONN_STATE_DATA;
650321b17ecSEdward Tomasz Napierala 		ic->ic_receive_len =
651321b17ecSEdward Tomasz Napierala 		    icl_pdu_data_segment_receive_len(request);
652321b17ecSEdward Tomasz Napierala 		break;
653321b17ecSEdward Tomasz Napierala 
654321b17ecSEdward Tomasz Napierala 	case ICL_CONN_STATE_DATA:
655321b17ecSEdward Tomasz Napierala 		//ICL_DEBUG("receiving data segment");
656321b17ecSEdward Tomasz Napierala 		error = icl_pdu_receive_data_segment(request, availablep,
657321b17ecSEdward Tomasz Napierala 		    &more_needed);
658321b17ecSEdward Tomasz Napierala 		if (error != 0) {
659321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("failed to receive data segment;"
660321b17ecSEdward Tomasz Napierala 			    "dropping connection");
661321b17ecSEdward Tomasz Napierala 			break;
662321b17ecSEdward Tomasz Napierala 		}
663321b17ecSEdward Tomasz Napierala 
664321b17ecSEdward Tomasz Napierala 		if (more_needed)
665321b17ecSEdward Tomasz Napierala 			break;
666321b17ecSEdward Tomasz Napierala 
667321b17ecSEdward Tomasz Napierala 		ic->ic_receive_state = ICL_CONN_STATE_DATA_DIGEST;
668321b17ecSEdward Tomasz Napierala 		if (request->ip_data_len == 0 || ic->ic_data_crc32c == false)
669321b17ecSEdward Tomasz Napierala 			ic->ic_receive_len = 0;
670321b17ecSEdward Tomasz Napierala 		else
671321b17ecSEdward Tomasz Napierala 			ic->ic_receive_len = ISCSI_DATA_DIGEST_SIZE;
672321b17ecSEdward Tomasz Napierala 		break;
673321b17ecSEdward Tomasz Napierala 
674321b17ecSEdward Tomasz Napierala 	case ICL_CONN_STATE_DATA_DIGEST:
675321b17ecSEdward Tomasz Napierala 		//ICL_DEBUG("receiving data digest");
676321b17ecSEdward Tomasz Napierala 		error = icl_pdu_check_data_digest(request, availablep);
677321b17ecSEdward Tomasz Napierala 		if (error != 0) {
678321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("data digest failed; "
679321b17ecSEdward Tomasz Napierala 			    "dropping connection");
680321b17ecSEdward Tomasz Napierala 			break;
681321b17ecSEdward Tomasz Napierala 		}
682321b17ecSEdward Tomasz Napierala 
683321b17ecSEdward Tomasz Napierala 		/*
684321b17ecSEdward Tomasz Napierala 		 * We've received complete PDU; reset the receive state machine
685321b17ecSEdward Tomasz Napierala 		 * and return the PDU.
686321b17ecSEdward Tomasz Napierala 		 */
687321b17ecSEdward Tomasz Napierala 		ic->ic_receive_state = ICL_CONN_STATE_BHS;
688321b17ecSEdward Tomasz Napierala 		ic->ic_receive_len = sizeof(struct iscsi_bhs);
689321b17ecSEdward Tomasz Napierala 		ic->ic_receive_pdu = NULL;
690321b17ecSEdward Tomasz Napierala 		return (request);
691321b17ecSEdward Tomasz Napierala 
692321b17ecSEdward Tomasz Napierala 	default:
693321b17ecSEdward Tomasz Napierala 		panic("invalid ic_receive_state %d\n", ic->ic_receive_state);
694321b17ecSEdward Tomasz Napierala 	}
695321b17ecSEdward Tomasz Napierala 
696321b17ecSEdward Tomasz Napierala 	if (error != 0) {
697321b17ecSEdward Tomasz Napierala 		/*
698321b17ecSEdward Tomasz Napierala 		 * Don't free the PDU; it's pointed to by ic->ic_receive_pdu
699321b17ecSEdward Tomasz Napierala 		 * and will get freed in icl_conn_close().
700321b17ecSEdward Tomasz Napierala 		 */
701321b17ecSEdward Tomasz Napierala 		icl_conn_fail(ic);
702321b17ecSEdward Tomasz Napierala 	}
703321b17ecSEdward Tomasz Napierala 
704321b17ecSEdward Tomasz Napierala 	return (NULL);
705321b17ecSEdward Tomasz Napierala }
706321b17ecSEdward Tomasz Napierala 
707321b17ecSEdward Tomasz Napierala static void
708321b17ecSEdward Tomasz Napierala icl_conn_receive_pdus(struct icl_conn *ic, size_t available)
709321b17ecSEdward Tomasz Napierala {
710321b17ecSEdward Tomasz Napierala 	struct icl_pdu *response;
711321b17ecSEdward Tomasz Napierala 	struct socket *so;
712321b17ecSEdward Tomasz Napierala 
713321b17ecSEdward Tomasz Napierala 	so = ic->ic_socket;
714321b17ecSEdward Tomasz Napierala 
715321b17ecSEdward Tomasz Napierala 	/*
716321b17ecSEdward Tomasz Napierala 	 * This can never happen; we're careful to only mess with ic->ic_socket
717321b17ecSEdward Tomasz Napierala 	 * pointer when the send/receive threads are not running.
718321b17ecSEdward Tomasz Napierala 	 */
719321b17ecSEdward Tomasz Napierala 	KASSERT(so != NULL, ("NULL socket"));
720321b17ecSEdward Tomasz Napierala 
721321b17ecSEdward Tomasz Napierala 	for (;;) {
722321b17ecSEdward Tomasz Napierala 		if (ic->ic_disconnecting)
723321b17ecSEdward Tomasz Napierala 			return;
724321b17ecSEdward Tomasz Napierala 
725321b17ecSEdward Tomasz Napierala 		if (so->so_error != 0) {
726321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("connection error %d; "
727321b17ecSEdward Tomasz Napierala 			    "dropping connection", so->so_error);
728321b17ecSEdward Tomasz Napierala 			icl_conn_fail(ic);
729321b17ecSEdward Tomasz Napierala 			return;
730321b17ecSEdward Tomasz Napierala 		}
731321b17ecSEdward Tomasz Napierala 
732321b17ecSEdward Tomasz Napierala 		/*
733321b17ecSEdward Tomasz Napierala 		 * Loop until we have a complete PDU or there is not enough
734321b17ecSEdward Tomasz Napierala 		 * data in the socket buffer.
735321b17ecSEdward Tomasz Napierala 		 */
736321b17ecSEdward Tomasz Napierala 		if (available < ic->ic_receive_len) {
737321b17ecSEdward Tomasz Napierala #if 0
738321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("not enough data; have %zd, "
739321b17ecSEdward Tomasz Napierala 			    "need %zd", available,
740321b17ecSEdward Tomasz Napierala 			    ic->ic_receive_len);
741321b17ecSEdward Tomasz Napierala #endif
742321b17ecSEdward Tomasz Napierala 			return;
743321b17ecSEdward Tomasz Napierala 		}
744321b17ecSEdward Tomasz Napierala 
745321b17ecSEdward Tomasz Napierala 		response = icl_conn_receive_pdu(ic, &available);
746321b17ecSEdward Tomasz Napierala 		if (response == NULL)
747321b17ecSEdward Tomasz Napierala 			continue;
748321b17ecSEdward Tomasz Napierala 
749321b17ecSEdward Tomasz Napierala 		if (response->ip_ahs_len > 0) {
750321b17ecSEdward Tomasz Napierala 			ICL_WARN("received PDU with unsupported "
751321b17ecSEdward Tomasz Napierala 			    "AHS; opcode 0x%x; dropping connection",
752321b17ecSEdward Tomasz Napierala 			    response->ip_bhs->bhs_opcode);
753321b17ecSEdward Tomasz Napierala 			icl_pdu_free(response);
754321b17ecSEdward Tomasz Napierala 			icl_conn_fail(ic);
755321b17ecSEdward Tomasz Napierala 			return;
756321b17ecSEdward Tomasz Napierala 		}
757321b17ecSEdward Tomasz Napierala 
758321b17ecSEdward Tomasz Napierala 		(ic->ic_receive)(response);
759321b17ecSEdward Tomasz Napierala 	}
760321b17ecSEdward Tomasz Napierala }
761321b17ecSEdward Tomasz Napierala 
762321b17ecSEdward Tomasz Napierala static void
763321b17ecSEdward Tomasz Napierala icl_receive_thread(void *arg)
764321b17ecSEdward Tomasz Napierala {
765321b17ecSEdward Tomasz Napierala 	struct icl_conn *ic;
766321b17ecSEdward Tomasz Napierala 	size_t available;
767321b17ecSEdward Tomasz Napierala 	struct socket *so;
768321b17ecSEdward Tomasz Napierala 
769321b17ecSEdward Tomasz Napierala 	ic = arg;
770321b17ecSEdward Tomasz Napierala 	so = ic->ic_socket;
771321b17ecSEdward Tomasz Napierala 
772321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK(ic);
773321b17ecSEdward Tomasz Napierala 	ic->ic_receive_running = true;
774321b17ecSEdward Tomasz Napierala 	ICL_CONN_UNLOCK(ic);
775321b17ecSEdward Tomasz Napierala 
776321b17ecSEdward Tomasz Napierala 	for (;;) {
777321b17ecSEdward Tomasz Napierala 		if (ic->ic_disconnecting) {
778321b17ecSEdward Tomasz Napierala 			//ICL_DEBUG("terminating");
779321b17ecSEdward Tomasz Napierala 			break;
780321b17ecSEdward Tomasz Napierala 		}
781321b17ecSEdward Tomasz Napierala 
782321b17ecSEdward Tomasz Napierala 		/*
783321b17ecSEdward Tomasz Napierala 		 * Set the low watermark, to be checked by
784321b17ecSEdward Tomasz Napierala 		 * soreadable() in icl_soupcall_receive()
785321b17ecSEdward Tomasz Napierala 		 * to avoid unneccessary wakeups until there
786321b17ecSEdward Tomasz Napierala 		 * is enough data received to read the PDU.
787321b17ecSEdward Tomasz Napierala 		 */
788321b17ecSEdward Tomasz Napierala 		SOCKBUF_LOCK(&so->so_rcv);
789321b17ecSEdward Tomasz Napierala 		available = sbavail(&so->so_rcv);
790321b17ecSEdward Tomasz Napierala 		if (available < ic->ic_receive_len) {
791321b17ecSEdward Tomasz Napierala 			so->so_rcv.sb_lowat = ic->ic_receive_len;
792321b17ecSEdward Tomasz Napierala 			cv_wait(&ic->ic_receive_cv, &so->so_rcv.sb_mtx);
793321b17ecSEdward Tomasz Napierala 		} else
794321b17ecSEdward Tomasz Napierala 			so->so_rcv.sb_lowat = so->so_rcv.sb_hiwat + 1;
795321b17ecSEdward Tomasz Napierala 		SOCKBUF_UNLOCK(&so->so_rcv);
796321b17ecSEdward Tomasz Napierala 
797321b17ecSEdward Tomasz Napierala 		icl_conn_receive_pdus(ic, available);
798321b17ecSEdward Tomasz Napierala 	}
799321b17ecSEdward Tomasz Napierala 
800321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK(ic);
801321b17ecSEdward Tomasz Napierala 	ic->ic_receive_running = false;
802321b17ecSEdward Tomasz Napierala 	cv_signal(&ic->ic_send_cv);
803321b17ecSEdward Tomasz Napierala 	ICL_CONN_UNLOCK(ic);
804321b17ecSEdward Tomasz Napierala 	kthread_exit();
805321b17ecSEdward Tomasz Napierala }
806321b17ecSEdward Tomasz Napierala 
807321b17ecSEdward Tomasz Napierala static int
808321b17ecSEdward Tomasz Napierala icl_soupcall_receive(struct socket *so, void *arg, int waitflag)
809321b17ecSEdward Tomasz Napierala {
810321b17ecSEdward Tomasz Napierala 	struct icl_conn *ic;
811321b17ecSEdward Tomasz Napierala 
812321b17ecSEdward Tomasz Napierala 	if (!soreadable(so))
813321b17ecSEdward Tomasz Napierala 		return (SU_OK);
814321b17ecSEdward Tomasz Napierala 
815321b17ecSEdward Tomasz Napierala 	ic = arg;
816321b17ecSEdward Tomasz Napierala 	cv_signal(&ic->ic_receive_cv);
817321b17ecSEdward Tomasz Napierala 	return (SU_OK);
818321b17ecSEdward Tomasz Napierala }
819321b17ecSEdward Tomasz Napierala 
820321b17ecSEdward Tomasz Napierala static int
821321b17ecSEdward Tomasz Napierala icl_pdu_finalize(struct icl_pdu *request)
822321b17ecSEdward Tomasz Napierala {
823321b17ecSEdward Tomasz Napierala 	size_t padding, pdu_len;
824321b17ecSEdward Tomasz Napierala 	uint32_t digest, zero = 0;
825321b17ecSEdward Tomasz Napierala 	int ok;
826321b17ecSEdward Tomasz Napierala 	struct icl_conn *ic;
827321b17ecSEdward Tomasz Napierala 
828321b17ecSEdward Tomasz Napierala 	ic = request->ip_conn;
829321b17ecSEdward Tomasz Napierala 
830321b17ecSEdward Tomasz Napierala 	icl_pdu_set_data_segment_length(request, request->ip_data_len);
831321b17ecSEdward Tomasz Napierala 
832321b17ecSEdward Tomasz Napierala 	pdu_len = icl_pdu_size(request);
833321b17ecSEdward Tomasz Napierala 
834321b17ecSEdward Tomasz Napierala 	if (ic->ic_header_crc32c) {
835321b17ecSEdward Tomasz Napierala 		digest = icl_mbuf_to_crc32c(request->ip_bhs_mbuf);
836321b17ecSEdward Tomasz Napierala 		ok = m_append(request->ip_bhs_mbuf, sizeof(digest),
837321b17ecSEdward Tomasz Napierala 		    (void *)&digest);
838321b17ecSEdward Tomasz Napierala 		if (ok != 1) {
839321b17ecSEdward Tomasz Napierala 			ICL_WARN("failed to append header digest");
840321b17ecSEdward Tomasz Napierala 			return (1);
841321b17ecSEdward Tomasz Napierala 		}
842321b17ecSEdward Tomasz Napierala 	}
843321b17ecSEdward Tomasz Napierala 
844321b17ecSEdward Tomasz Napierala 	if (request->ip_data_len != 0) {
845321b17ecSEdward Tomasz Napierala 		padding = icl_pdu_padding(request);
846321b17ecSEdward Tomasz Napierala 		if (padding > 0) {
847321b17ecSEdward Tomasz Napierala 			ok = m_append(request->ip_data_mbuf, padding,
848321b17ecSEdward Tomasz Napierala 			    (void *)&zero);
849321b17ecSEdward Tomasz Napierala 			if (ok != 1) {
850321b17ecSEdward Tomasz Napierala 				ICL_WARN("failed to append padding");
851321b17ecSEdward Tomasz Napierala 				return (1);
852321b17ecSEdward Tomasz Napierala 			}
853321b17ecSEdward Tomasz Napierala 		}
854321b17ecSEdward Tomasz Napierala 
855321b17ecSEdward Tomasz Napierala 		if (ic->ic_data_crc32c) {
856321b17ecSEdward Tomasz Napierala 			digest = icl_mbuf_to_crc32c(request->ip_data_mbuf);
857321b17ecSEdward Tomasz Napierala 
858321b17ecSEdward Tomasz Napierala 			ok = m_append(request->ip_data_mbuf, sizeof(digest),
859321b17ecSEdward Tomasz Napierala 			    (void *)&digest);
860321b17ecSEdward Tomasz Napierala 			if (ok != 1) {
861321b17ecSEdward Tomasz Napierala 				ICL_WARN("failed to append data digest");
862321b17ecSEdward Tomasz Napierala 				return (1);
863321b17ecSEdward Tomasz Napierala 			}
864321b17ecSEdward Tomasz Napierala 		}
865321b17ecSEdward Tomasz Napierala 
866321b17ecSEdward Tomasz Napierala 		m_cat(request->ip_bhs_mbuf, request->ip_data_mbuf);
867321b17ecSEdward Tomasz Napierala 		request->ip_data_mbuf = NULL;
868321b17ecSEdward Tomasz Napierala 	}
869321b17ecSEdward Tomasz Napierala 
870321b17ecSEdward Tomasz Napierala 	request->ip_bhs_mbuf->m_pkthdr.len = pdu_len;
871321b17ecSEdward Tomasz Napierala 
872321b17ecSEdward Tomasz Napierala 	return (0);
873321b17ecSEdward Tomasz Napierala }
874321b17ecSEdward Tomasz Napierala 
875321b17ecSEdward Tomasz Napierala static void
876321b17ecSEdward Tomasz Napierala icl_conn_send_pdus(struct icl_conn *ic, struct icl_pdu_stailq *queue)
877321b17ecSEdward Tomasz Napierala {
878321b17ecSEdward Tomasz Napierala 	struct icl_pdu *request, *request2;
879321b17ecSEdward Tomasz Napierala 	struct socket *so;
880321b17ecSEdward Tomasz Napierala 	size_t available, size, size2;
881321b17ecSEdward Tomasz Napierala 	int coalesced, error;
882321b17ecSEdward Tomasz Napierala 
883321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK_ASSERT_NOT(ic);
884321b17ecSEdward Tomasz Napierala 
885321b17ecSEdward Tomasz Napierala 	so = ic->ic_socket;
886321b17ecSEdward Tomasz Napierala 
887321b17ecSEdward Tomasz Napierala 	SOCKBUF_LOCK(&so->so_snd);
888321b17ecSEdward Tomasz Napierala 	/*
889321b17ecSEdward Tomasz Napierala 	 * Check how much space do we have for transmit.  We can't just
890321b17ecSEdward Tomasz Napierala 	 * call sosend() and retry when we get EWOULDBLOCK or EMSGSIZE,
891321b17ecSEdward Tomasz Napierala 	 * as it always frees the mbuf chain passed to it, even in case
892321b17ecSEdward Tomasz Napierala 	 * of error.
893321b17ecSEdward Tomasz Napierala 	 */
894321b17ecSEdward Tomasz Napierala 	available = sbspace(&so->so_snd);
895321b17ecSEdward Tomasz Napierala 
896321b17ecSEdward Tomasz Napierala 	/*
897321b17ecSEdward Tomasz Napierala 	 * Notify the socket upcall that we don't need wakeups
898321b17ecSEdward Tomasz Napierala 	 * for the time being.
899321b17ecSEdward Tomasz Napierala 	 */
900321b17ecSEdward Tomasz Napierala 	so->so_snd.sb_lowat = so->so_snd.sb_hiwat + 1;
901321b17ecSEdward Tomasz Napierala 	SOCKBUF_UNLOCK(&so->so_snd);
902321b17ecSEdward Tomasz Napierala 
903321b17ecSEdward Tomasz Napierala 	while (!STAILQ_EMPTY(queue)) {
904321b17ecSEdward Tomasz Napierala 		request = STAILQ_FIRST(queue);
905321b17ecSEdward Tomasz Napierala 		size = icl_pdu_size(request);
906321b17ecSEdward Tomasz Napierala 		if (available < size) {
907321b17ecSEdward Tomasz Napierala 
908321b17ecSEdward Tomasz Napierala 			/*
909321b17ecSEdward Tomasz Napierala 			 * Set the low watermark, to be checked by
910321b17ecSEdward Tomasz Napierala 			 * sowriteable() in icl_soupcall_send()
911321b17ecSEdward Tomasz Napierala 			 * to avoid unneccessary wakeups until there
912321b17ecSEdward Tomasz Napierala 			 * is enough space for the PDU to fit.
913321b17ecSEdward Tomasz Napierala 			 */
914321b17ecSEdward Tomasz Napierala 			SOCKBUF_LOCK(&so->so_snd);
915321b17ecSEdward Tomasz Napierala 			available = sbspace(&so->so_snd);
916321b17ecSEdward Tomasz Napierala 			if (available < size) {
917321b17ecSEdward Tomasz Napierala #if 1
918321b17ecSEdward Tomasz Napierala 				ICL_DEBUG("no space to send; "
919321b17ecSEdward Tomasz Napierala 				    "have %zd, need %zd",
920321b17ecSEdward Tomasz Napierala 				    available, size);
921321b17ecSEdward Tomasz Napierala #endif
922321b17ecSEdward Tomasz Napierala 				so->so_snd.sb_lowat = size;
923321b17ecSEdward Tomasz Napierala 				SOCKBUF_UNLOCK(&so->so_snd);
924321b17ecSEdward Tomasz Napierala 				return;
925321b17ecSEdward Tomasz Napierala 			}
926321b17ecSEdward Tomasz Napierala 			SOCKBUF_UNLOCK(&so->so_snd);
927321b17ecSEdward Tomasz Napierala 		}
928321b17ecSEdward Tomasz Napierala 		STAILQ_REMOVE_HEAD(queue, ip_next);
929321b17ecSEdward Tomasz Napierala 		error = icl_pdu_finalize(request);
930321b17ecSEdward Tomasz Napierala 		if (error != 0) {
931321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("failed to finalize PDU; "
932321b17ecSEdward Tomasz Napierala 			    "dropping connection");
933321b17ecSEdward Tomasz Napierala 			icl_conn_fail(ic);
934321b17ecSEdward Tomasz Napierala 			icl_pdu_free(request);
935321b17ecSEdward Tomasz Napierala 			return;
936321b17ecSEdward Tomasz Napierala 		}
937321b17ecSEdward Tomasz Napierala 		if (coalesce) {
938321b17ecSEdward Tomasz Napierala 			coalesced = 1;
939321b17ecSEdward Tomasz Napierala 			for (;;) {
940321b17ecSEdward Tomasz Napierala 				request2 = STAILQ_FIRST(queue);
941321b17ecSEdward Tomasz Napierala 				if (request2 == NULL)
942321b17ecSEdward Tomasz Napierala 					break;
943321b17ecSEdward Tomasz Napierala 				size2 = icl_pdu_size(request2);
944321b17ecSEdward Tomasz Napierala 				if (available < size + size2)
945321b17ecSEdward Tomasz Napierala 					break;
946321b17ecSEdward Tomasz Napierala 				STAILQ_REMOVE_HEAD(queue, ip_next);
947321b17ecSEdward Tomasz Napierala 				error = icl_pdu_finalize(request2);
948321b17ecSEdward Tomasz Napierala 				if (error != 0) {
949321b17ecSEdward Tomasz Napierala 					ICL_DEBUG("failed to finalize PDU; "
950321b17ecSEdward Tomasz Napierala 					    "dropping connection");
951321b17ecSEdward Tomasz Napierala 					icl_conn_fail(ic);
952321b17ecSEdward Tomasz Napierala 					icl_pdu_free(request);
953321b17ecSEdward Tomasz Napierala 					icl_pdu_free(request2);
954321b17ecSEdward Tomasz Napierala 					return;
955321b17ecSEdward Tomasz Napierala 				}
956321b17ecSEdward Tomasz Napierala 				m_cat(request->ip_bhs_mbuf, request2->ip_bhs_mbuf);
957321b17ecSEdward Tomasz Napierala 				request2->ip_bhs_mbuf = NULL;
958321b17ecSEdward Tomasz Napierala 				request->ip_bhs_mbuf->m_pkthdr.len += size2;
959321b17ecSEdward Tomasz Napierala 				size += size2;
960321b17ecSEdward Tomasz Napierala 				STAILQ_REMOVE_AFTER(queue, request, ip_next);
961321b17ecSEdward Tomasz Napierala 				icl_pdu_free(request2);
962321b17ecSEdward Tomasz Napierala 				coalesced++;
963321b17ecSEdward Tomasz Napierala 			}
964321b17ecSEdward Tomasz Napierala #if 0
965321b17ecSEdward Tomasz Napierala 			if (coalesced > 1) {
966321b17ecSEdward Tomasz Napierala 				ICL_DEBUG("coalesced %d PDUs into %zd bytes",
967321b17ecSEdward Tomasz Napierala 				    coalesced, size);
968321b17ecSEdward Tomasz Napierala 			}
969321b17ecSEdward Tomasz Napierala #endif
970321b17ecSEdward Tomasz Napierala 		}
971321b17ecSEdward Tomasz Napierala 		available -= size;
972321b17ecSEdward Tomasz Napierala 		error = sosend(so, NULL, NULL, request->ip_bhs_mbuf,
973321b17ecSEdward Tomasz Napierala 		    NULL, MSG_DONTWAIT, curthread);
974321b17ecSEdward Tomasz Napierala 		request->ip_bhs_mbuf = NULL; /* Sosend consumes the mbuf. */
975321b17ecSEdward Tomasz Napierala 		if (error != 0) {
976321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("failed to send PDU, error %d; "
977321b17ecSEdward Tomasz Napierala 			    "dropping connection", error);
978321b17ecSEdward Tomasz Napierala 			icl_conn_fail(ic);
979321b17ecSEdward Tomasz Napierala 			icl_pdu_free(request);
980321b17ecSEdward Tomasz Napierala 			return;
981321b17ecSEdward Tomasz Napierala 		}
982321b17ecSEdward Tomasz Napierala 		icl_pdu_free(request);
983321b17ecSEdward Tomasz Napierala 	}
984321b17ecSEdward Tomasz Napierala }
985321b17ecSEdward Tomasz Napierala 
986321b17ecSEdward Tomasz Napierala static void
987321b17ecSEdward Tomasz Napierala icl_send_thread(void *arg)
988321b17ecSEdward Tomasz Napierala {
989321b17ecSEdward Tomasz Napierala 	struct icl_conn *ic;
990321b17ecSEdward Tomasz Napierala 	struct icl_pdu_stailq queue;
991321b17ecSEdward Tomasz Napierala 
992321b17ecSEdward Tomasz Napierala 	ic = arg;
993321b17ecSEdward Tomasz Napierala 
994321b17ecSEdward Tomasz Napierala 	STAILQ_INIT(&queue);
995321b17ecSEdward Tomasz Napierala 
996321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK(ic);
997321b17ecSEdward Tomasz Napierala 	ic->ic_send_running = true;
998321b17ecSEdward Tomasz Napierala 
999321b17ecSEdward Tomasz Napierala 	for (;;) {
1000321b17ecSEdward Tomasz Napierala 		for (;;) {
1001321b17ecSEdward Tomasz Napierala 			/*
1002321b17ecSEdward Tomasz Napierala 			 * If the local queue is empty, populate it from
1003321b17ecSEdward Tomasz Napierala 			 * the main one.  This way the icl_conn_send_pdus()
1004321b17ecSEdward Tomasz Napierala 			 * can go through all the queued PDUs without holding
1005321b17ecSEdward Tomasz Napierala 			 * any locks.
1006321b17ecSEdward Tomasz Napierala 			 */
1007321b17ecSEdward Tomasz Napierala 			if (STAILQ_EMPTY(&queue))
1008321b17ecSEdward Tomasz Napierala 				STAILQ_SWAP(&ic->ic_to_send, &queue, icl_pdu);
1009321b17ecSEdward Tomasz Napierala 
1010321b17ecSEdward Tomasz Napierala 			ic->ic_check_send_space = false;
1011321b17ecSEdward Tomasz Napierala 			ICL_CONN_UNLOCK(ic);
1012321b17ecSEdward Tomasz Napierala 			icl_conn_send_pdus(ic, &queue);
1013321b17ecSEdward Tomasz Napierala 			ICL_CONN_LOCK(ic);
1014321b17ecSEdward Tomasz Napierala 
1015321b17ecSEdward Tomasz Napierala 			/*
1016321b17ecSEdward Tomasz Napierala 			 * The icl_soupcall_send() was called since the last
1017321b17ecSEdward Tomasz Napierala 			 * call to sbspace(); go around;
1018321b17ecSEdward Tomasz Napierala 			 */
1019321b17ecSEdward Tomasz Napierala 			if (ic->ic_check_send_space)
1020321b17ecSEdward Tomasz Napierala 				continue;
1021321b17ecSEdward Tomasz Napierala 
1022321b17ecSEdward Tomasz Napierala 			/*
1023321b17ecSEdward Tomasz Napierala 			 * Local queue is empty, but we still have PDUs
1024321b17ecSEdward Tomasz Napierala 			 * in the main one; go around.
1025321b17ecSEdward Tomasz Napierala 			 */
1026321b17ecSEdward Tomasz Napierala 			if (STAILQ_EMPTY(&queue) &&
1027321b17ecSEdward Tomasz Napierala 			    !STAILQ_EMPTY(&ic->ic_to_send))
1028321b17ecSEdward Tomasz Napierala 				continue;
1029321b17ecSEdward Tomasz Napierala 
1030321b17ecSEdward Tomasz Napierala 			/*
1031321b17ecSEdward Tomasz Napierala 			 * There might be some stuff in the local queue,
1032321b17ecSEdward Tomasz Napierala 			 * which didn't get sent due to not having enough send
1033321b17ecSEdward Tomasz Napierala 			 * space.  Wait for socket upcall.
1034321b17ecSEdward Tomasz Napierala 			 */
1035321b17ecSEdward Tomasz Napierala 			break;
1036321b17ecSEdward Tomasz Napierala 		}
1037321b17ecSEdward Tomasz Napierala 
1038321b17ecSEdward Tomasz Napierala 		if (ic->ic_disconnecting) {
1039321b17ecSEdward Tomasz Napierala 			//ICL_DEBUG("terminating");
1040321b17ecSEdward Tomasz Napierala 			break;
1041321b17ecSEdward Tomasz Napierala 		}
1042321b17ecSEdward Tomasz Napierala 
1043321b17ecSEdward Tomasz Napierala 		cv_wait(&ic->ic_send_cv, ic->ic_lock);
1044321b17ecSEdward Tomasz Napierala 	}
1045321b17ecSEdward Tomasz Napierala 
1046321b17ecSEdward Tomasz Napierala 	/*
1047321b17ecSEdward Tomasz Napierala 	 * We're exiting; move PDUs back to the main queue, so they can
1048321b17ecSEdward Tomasz Napierala 	 * get freed properly.  At this point ordering doesn't matter.
1049321b17ecSEdward Tomasz Napierala 	 */
1050321b17ecSEdward Tomasz Napierala 	STAILQ_CONCAT(&ic->ic_to_send, &queue);
1051321b17ecSEdward Tomasz Napierala 
1052321b17ecSEdward Tomasz Napierala 	ic->ic_send_running = false;
1053321b17ecSEdward Tomasz Napierala 	cv_signal(&ic->ic_send_cv);
1054321b17ecSEdward Tomasz Napierala 	ICL_CONN_UNLOCK(ic);
1055321b17ecSEdward Tomasz Napierala 	kthread_exit();
1056321b17ecSEdward Tomasz Napierala }
1057321b17ecSEdward Tomasz Napierala 
1058321b17ecSEdward Tomasz Napierala static int
1059321b17ecSEdward Tomasz Napierala icl_soupcall_send(struct socket *so, void *arg, int waitflag)
1060321b17ecSEdward Tomasz Napierala {
1061321b17ecSEdward Tomasz Napierala 	struct icl_conn *ic;
1062321b17ecSEdward Tomasz Napierala 
1063321b17ecSEdward Tomasz Napierala 	if (!sowriteable(so))
1064321b17ecSEdward Tomasz Napierala 		return (SU_OK);
1065321b17ecSEdward Tomasz Napierala 
1066321b17ecSEdward Tomasz Napierala 	ic = arg;
1067321b17ecSEdward Tomasz Napierala 
1068321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK(ic);
1069321b17ecSEdward Tomasz Napierala 	ic->ic_check_send_space = true;
1070321b17ecSEdward Tomasz Napierala 	ICL_CONN_UNLOCK(ic);
1071321b17ecSEdward Tomasz Napierala 
1072321b17ecSEdward Tomasz Napierala 	cv_signal(&ic->ic_send_cv);
1073321b17ecSEdward Tomasz Napierala 
1074321b17ecSEdward Tomasz Napierala 	return (SU_OK);
1075321b17ecSEdward Tomasz Napierala }
1076321b17ecSEdward Tomasz Napierala 
1077321b17ecSEdward Tomasz Napierala static int
1078321b17ecSEdward Tomasz Napierala icl_pdu_append_data(struct icl_pdu *request, const void *addr, size_t len,
1079321b17ecSEdward Tomasz Napierala     int flags)
1080321b17ecSEdward Tomasz Napierala {
1081321b17ecSEdward Tomasz Napierala 	struct mbuf *mb, *newmb;
1082321b17ecSEdward Tomasz Napierala 	size_t copylen, off = 0;
1083321b17ecSEdward Tomasz Napierala 
1084321b17ecSEdward Tomasz Napierala 	KASSERT(len > 0, ("len == 0"));
1085321b17ecSEdward Tomasz Napierala 
1086321b17ecSEdward Tomasz Napierala 	newmb = m_getm2(NULL, len, flags, MT_DATA, M_PKTHDR);
1087321b17ecSEdward Tomasz Napierala 	if (newmb == NULL) {
1088321b17ecSEdward Tomasz Napierala 		ICL_WARN("failed to allocate mbuf for %zd bytes", len);
1089321b17ecSEdward Tomasz Napierala 		return (ENOMEM);
1090321b17ecSEdward Tomasz Napierala 	}
1091321b17ecSEdward Tomasz Napierala 
1092321b17ecSEdward Tomasz Napierala 	for (mb = newmb; mb != NULL; mb = mb->m_next) {
1093321b17ecSEdward Tomasz Napierala 		copylen = min(M_TRAILINGSPACE(mb), len - off);
1094321b17ecSEdward Tomasz Napierala 		memcpy(mtod(mb, char *), (const char *)addr + off, copylen);
1095321b17ecSEdward Tomasz Napierala 		mb->m_len = copylen;
1096321b17ecSEdward Tomasz Napierala 		off += copylen;
1097321b17ecSEdward Tomasz Napierala 	}
1098321b17ecSEdward Tomasz Napierala 	KASSERT(off == len, ("%s: off != len", __func__));
1099321b17ecSEdward Tomasz Napierala 
1100321b17ecSEdward Tomasz Napierala 	if (request->ip_data_mbuf == NULL) {
1101321b17ecSEdward Tomasz Napierala 		request->ip_data_mbuf = newmb;
1102321b17ecSEdward Tomasz Napierala 		request->ip_data_len = len;
1103321b17ecSEdward Tomasz Napierala 	} else {
1104321b17ecSEdward Tomasz Napierala 		m_cat(request->ip_data_mbuf, newmb);
1105321b17ecSEdward Tomasz Napierala 		request->ip_data_len += len;
1106321b17ecSEdward Tomasz Napierala 	}
1107321b17ecSEdward Tomasz Napierala 
1108321b17ecSEdward Tomasz Napierala 	return (0);
1109321b17ecSEdward Tomasz Napierala }
1110321b17ecSEdward Tomasz Napierala 
/*
 * Connection-level entry point for appending data to a PDU.  "ic" is not
 * used; the work is done by icl_pdu_append_data(), whose return value is
 * passed back to the caller.
 */
int
icl_soft_conn_pdu_append_data(struct icl_conn *ic, struct icl_pdu *request,
    const void *addr, size_t len, int flags)
{
	int error;

	error = icl_pdu_append_data(request, addr, len, flags);
	return (error);
}
1118321b17ecSEdward Tomasz Napierala 
1119321b17ecSEdward Tomasz Napierala static void
1120321b17ecSEdward Tomasz Napierala icl_pdu_get_data(struct icl_pdu *ip, size_t off, void *addr, size_t len)
1121321b17ecSEdward Tomasz Napierala {
1122321b17ecSEdward Tomasz Napierala 
1123321b17ecSEdward Tomasz Napierala 	m_copydata(ip->ip_data_mbuf, off, len, addr);
1124321b17ecSEdward Tomasz Napierala }
1125321b17ecSEdward Tomasz Napierala 
/*
 * Connection-level entry point for reading data out of a PDU.  "ic" is not
 * used; the copy is performed by icl_pdu_get_data().
 */
void
icl_soft_conn_pdu_get_data(struct icl_conn *ic, struct icl_pdu *ip,
    size_t off, void *addr, size_t len)
{

	/*
	 * This function returns void, so it must not use "return" with an
	 * expression (ISO C forbids that even when the expression is void).
	 */
	icl_pdu_get_data(ip, off, addr, len);
}
1133321b17ecSEdward Tomasz Napierala 
1134321b17ecSEdward Tomasz Napierala static void
1135321b17ecSEdward Tomasz Napierala icl_pdu_queue(struct icl_pdu *ip)
1136321b17ecSEdward Tomasz Napierala {
1137321b17ecSEdward Tomasz Napierala 	struct icl_conn *ic;
1138321b17ecSEdward Tomasz Napierala 
1139321b17ecSEdward Tomasz Napierala 	ic = ip->ip_conn;
1140321b17ecSEdward Tomasz Napierala 
1141321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK_ASSERT(ic);
1142321b17ecSEdward Tomasz Napierala 
1143321b17ecSEdward Tomasz Napierala 	if (ic->ic_disconnecting || ic->ic_socket == NULL) {
1144321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("icl_pdu_queue on closed connection");
1145321b17ecSEdward Tomasz Napierala 		icl_pdu_free(ip);
1146321b17ecSEdward Tomasz Napierala 		return;
1147321b17ecSEdward Tomasz Napierala 	}
1148321b17ecSEdward Tomasz Napierala 
1149321b17ecSEdward Tomasz Napierala 	if (!STAILQ_EMPTY(&ic->ic_to_send)) {
1150321b17ecSEdward Tomasz Napierala 		STAILQ_INSERT_TAIL(&ic->ic_to_send, ip, ip_next);
1151321b17ecSEdward Tomasz Napierala 		/*
1152321b17ecSEdward Tomasz Napierala 		 * If the queue is not empty, someone else had already
1153321b17ecSEdward Tomasz Napierala 		 * signaled the send thread; no need to do that again,
1154321b17ecSEdward Tomasz Napierala 		 * just return.
1155321b17ecSEdward Tomasz Napierala 		 */
1156321b17ecSEdward Tomasz Napierala 		return;
1157321b17ecSEdward Tomasz Napierala 	}
1158321b17ecSEdward Tomasz Napierala 
1159321b17ecSEdward Tomasz Napierala 	STAILQ_INSERT_TAIL(&ic->ic_to_send, ip, ip_next);
1160321b17ecSEdward Tomasz Napierala 	cv_signal(&ic->ic_send_cv);
1161321b17ecSEdward Tomasz Napierala }
1162321b17ecSEdward Tomasz Napierala 
/*
 * Connection-level entry point for queueing a PDU for transmission.  "ic"
 * is not used; icl_pdu_queue() takes the connection from the PDU itself.
 */
void
icl_soft_conn_pdu_queue(struct icl_conn *ic, struct icl_pdu *ip)
{

	icl_pdu_queue(ip);
}
1169321b17ecSEdward Tomasz Napierala 
1170321b17ecSEdward Tomasz Napierala static struct icl_conn *
1171321b17ecSEdward Tomasz Napierala icl_soft_new_conn(const char *name, struct mtx *lock)
1172321b17ecSEdward Tomasz Napierala {
1173321b17ecSEdward Tomasz Napierala 	struct icl_conn *ic;
1174321b17ecSEdward Tomasz Napierala 
1175321b17ecSEdward Tomasz Napierala 	refcount_acquire(&icl_ncons);
1176321b17ecSEdward Tomasz Napierala 
1177321b17ecSEdward Tomasz Napierala 	ic = (struct icl_conn *)kobj_create(&icl_soft_class, M_ICL_SOFT, M_WAITOK | M_ZERO);
1178321b17ecSEdward Tomasz Napierala 
1179321b17ecSEdward Tomasz Napierala 	STAILQ_INIT(&ic->ic_to_send);
1180321b17ecSEdward Tomasz Napierala 	ic->ic_lock = lock;
1181321b17ecSEdward Tomasz Napierala 	cv_init(&ic->ic_send_cv, "icl_tx");
1182321b17ecSEdward Tomasz Napierala 	cv_init(&ic->ic_receive_cv, "icl_rx");
1183321b17ecSEdward Tomasz Napierala #ifdef DIAGNOSTIC
1184321b17ecSEdward Tomasz Napierala 	refcount_init(&ic->ic_outstanding_pdus, 0);
1185321b17ecSEdward Tomasz Napierala #endif
1186321b17ecSEdward Tomasz Napierala 	ic->ic_max_data_segment_length = ICL_MAX_DATA_SEGMENT_LENGTH;
1187321b17ecSEdward Tomasz Napierala 	ic->ic_name = name;
1188321b17ecSEdward Tomasz Napierala 
1189321b17ecSEdward Tomasz Napierala 	return (ic);
1190321b17ecSEdward Tomasz Napierala }
1191321b17ecSEdward Tomasz Napierala 
1192321b17ecSEdward Tomasz Napierala void
1193321b17ecSEdward Tomasz Napierala icl_soft_conn_free(struct icl_conn *ic)
1194321b17ecSEdward Tomasz Napierala {
1195321b17ecSEdward Tomasz Napierala 
1196321b17ecSEdward Tomasz Napierala 	cv_destroy(&ic->ic_send_cv);
1197321b17ecSEdward Tomasz Napierala 	cv_destroy(&ic->ic_receive_cv);
1198321b17ecSEdward Tomasz Napierala 	kobj_delete((struct kobj *)ic, M_ICL_SOFT);
1199321b17ecSEdward Tomasz Napierala 	refcount_release(&icl_ncons);
1200321b17ecSEdward Tomasz Napierala }
1201321b17ecSEdward Tomasz Napierala 
1202321b17ecSEdward Tomasz Napierala static int
1203321b17ecSEdward Tomasz Napierala icl_conn_start(struct icl_conn *ic)
1204321b17ecSEdward Tomasz Napierala {
1205321b17ecSEdward Tomasz Napierala 	size_t minspace;
1206321b17ecSEdward Tomasz Napierala 	struct sockopt opt;
1207321b17ecSEdward Tomasz Napierala 	int error, one = 1;
1208321b17ecSEdward Tomasz Napierala 
1209321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK(ic);
1210321b17ecSEdward Tomasz Napierala 
1211321b17ecSEdward Tomasz Napierala 	/*
1212321b17ecSEdward Tomasz Napierala 	 * XXX: Ugly hack.
1213321b17ecSEdward Tomasz Napierala 	 */
1214321b17ecSEdward Tomasz Napierala 	if (ic->ic_socket == NULL) {
1215321b17ecSEdward Tomasz Napierala 		ICL_CONN_UNLOCK(ic);
1216321b17ecSEdward Tomasz Napierala 		return (EINVAL);
1217321b17ecSEdward Tomasz Napierala 	}
1218321b17ecSEdward Tomasz Napierala 
1219321b17ecSEdward Tomasz Napierala 	ic->ic_receive_state = ICL_CONN_STATE_BHS;
1220321b17ecSEdward Tomasz Napierala 	ic->ic_receive_len = sizeof(struct iscsi_bhs);
1221321b17ecSEdward Tomasz Napierala 	ic->ic_disconnecting = false;
1222321b17ecSEdward Tomasz Napierala 
1223321b17ecSEdward Tomasz Napierala 	ICL_CONN_UNLOCK(ic);
1224321b17ecSEdward Tomasz Napierala 
1225321b17ecSEdward Tomasz Napierala 	/*
1226321b17ecSEdward Tomasz Napierala 	 * For sendspace, this is required because the current code cannot
1227321b17ecSEdward Tomasz Napierala 	 * send a PDU in pieces; thus, the minimum buffer size is equal
1228321b17ecSEdward Tomasz Napierala 	 * to the maximum PDU size.  "+4" is to account for possible padding.
1229321b17ecSEdward Tomasz Napierala 	 *
1230321b17ecSEdward Tomasz Napierala 	 * What we should actually do here is to use autoscaling, but set
1231321b17ecSEdward Tomasz Napierala 	 * some minimal buffer size to "minspace".  I don't know a way to do
1232321b17ecSEdward Tomasz Napierala 	 * that, though.
1233321b17ecSEdward Tomasz Napierala 	 */
1234321b17ecSEdward Tomasz Napierala 	minspace = sizeof(struct iscsi_bhs) + ic->ic_max_data_segment_length +
1235321b17ecSEdward Tomasz Napierala 	    ISCSI_HEADER_DIGEST_SIZE + ISCSI_DATA_DIGEST_SIZE + 4;
1236321b17ecSEdward Tomasz Napierala 	if (sendspace < minspace) {
1237321b17ecSEdward Tomasz Napierala 		ICL_WARN("kern.icl.sendspace too low; must be at least %zd",
1238321b17ecSEdward Tomasz Napierala 		    minspace);
1239321b17ecSEdward Tomasz Napierala 		sendspace = minspace;
1240321b17ecSEdward Tomasz Napierala 	}
1241321b17ecSEdward Tomasz Napierala 	if (recvspace < minspace) {
1242321b17ecSEdward Tomasz Napierala 		ICL_WARN("kern.icl.recvspace too low; must be at least %zd",
1243321b17ecSEdward Tomasz Napierala 		    minspace);
1244321b17ecSEdward Tomasz Napierala 		recvspace = minspace;
1245321b17ecSEdward Tomasz Napierala 	}
1246321b17ecSEdward Tomasz Napierala 
1247321b17ecSEdward Tomasz Napierala 	error = soreserve(ic->ic_socket, sendspace, recvspace);
1248321b17ecSEdward Tomasz Napierala 	if (error != 0) {
1249321b17ecSEdward Tomasz Napierala 		ICL_WARN("soreserve failed with error %d", error);
1250321b17ecSEdward Tomasz Napierala 		icl_conn_close(ic);
1251321b17ecSEdward Tomasz Napierala 		return (error);
1252321b17ecSEdward Tomasz Napierala 	}
1253321b17ecSEdward Tomasz Napierala 	ic->ic_socket->so_snd.sb_flags |= SB_AUTOSIZE;
1254321b17ecSEdward Tomasz Napierala 	ic->ic_socket->so_rcv.sb_flags |= SB_AUTOSIZE;
1255321b17ecSEdward Tomasz Napierala 
1256321b17ecSEdward Tomasz Napierala 	/*
1257321b17ecSEdward Tomasz Napierala 	 * Disable Nagle.
1258321b17ecSEdward Tomasz Napierala 	 */
1259321b17ecSEdward Tomasz Napierala 	bzero(&opt, sizeof(opt));
1260321b17ecSEdward Tomasz Napierala 	opt.sopt_dir = SOPT_SET;
1261321b17ecSEdward Tomasz Napierala 	opt.sopt_level = IPPROTO_TCP;
1262321b17ecSEdward Tomasz Napierala 	opt.sopt_name = TCP_NODELAY;
1263321b17ecSEdward Tomasz Napierala 	opt.sopt_val = &one;
1264321b17ecSEdward Tomasz Napierala 	opt.sopt_valsize = sizeof(one);
1265321b17ecSEdward Tomasz Napierala 	error = sosetopt(ic->ic_socket, &opt);
1266321b17ecSEdward Tomasz Napierala 	if (error != 0) {
1267321b17ecSEdward Tomasz Napierala 		ICL_WARN("disabling TCP_NODELAY failed with error %d", error);
1268321b17ecSEdward Tomasz Napierala 		icl_conn_close(ic);
1269321b17ecSEdward Tomasz Napierala 		return (error);
1270321b17ecSEdward Tomasz Napierala 	}
1271321b17ecSEdward Tomasz Napierala 
1272321b17ecSEdward Tomasz Napierala 	/*
1273321b17ecSEdward Tomasz Napierala 	 * Start threads.
1274321b17ecSEdward Tomasz Napierala 	 */
1275321b17ecSEdward Tomasz Napierala 	error = kthread_add(icl_send_thread, ic, NULL, NULL, 0, 0, "%stx",
1276321b17ecSEdward Tomasz Napierala 	    ic->ic_name);
1277321b17ecSEdward Tomasz Napierala 	if (error != 0) {
1278321b17ecSEdward Tomasz Napierala 		ICL_WARN("kthread_add(9) failed with error %d", error);
1279321b17ecSEdward Tomasz Napierala 		icl_conn_close(ic);
1280321b17ecSEdward Tomasz Napierala 		return (error);
1281321b17ecSEdward Tomasz Napierala 	}
1282321b17ecSEdward Tomasz Napierala 
1283321b17ecSEdward Tomasz Napierala 	error = kthread_add(icl_receive_thread, ic, NULL, NULL, 0, 0, "%srx",
1284321b17ecSEdward Tomasz Napierala 	    ic->ic_name);
1285321b17ecSEdward Tomasz Napierala 	if (error != 0) {
1286321b17ecSEdward Tomasz Napierala 		ICL_WARN("kthread_add(9) failed with error %d", error);
1287321b17ecSEdward Tomasz Napierala 		icl_conn_close(ic);
1288321b17ecSEdward Tomasz Napierala 		return (error);
1289321b17ecSEdward Tomasz Napierala 	}
1290321b17ecSEdward Tomasz Napierala 
1291321b17ecSEdward Tomasz Napierala 	/*
1292321b17ecSEdward Tomasz Napierala 	 * Register socket upcall, to get notified about incoming PDUs
1293321b17ecSEdward Tomasz Napierala 	 * and free space to send outgoing ones.
1294321b17ecSEdward Tomasz Napierala 	 */
1295321b17ecSEdward Tomasz Napierala 	SOCKBUF_LOCK(&ic->ic_socket->so_snd);
1296321b17ecSEdward Tomasz Napierala 	soupcall_set(ic->ic_socket, SO_SND, icl_soupcall_send, ic);
1297321b17ecSEdward Tomasz Napierala 	SOCKBUF_UNLOCK(&ic->ic_socket->so_snd);
1298321b17ecSEdward Tomasz Napierala 	SOCKBUF_LOCK(&ic->ic_socket->so_rcv);
1299321b17ecSEdward Tomasz Napierala 	soupcall_set(ic->ic_socket, SO_RCV, icl_soupcall_receive, ic);
1300321b17ecSEdward Tomasz Napierala 	SOCKBUF_UNLOCK(&ic->ic_socket->so_rcv);
1301321b17ecSEdward Tomasz Napierala 
1302321b17ecSEdward Tomasz Napierala 	return (0);
1303321b17ecSEdward Tomasz Napierala }
1304321b17ecSEdward Tomasz Napierala 
1305321b17ecSEdward Tomasz Napierala int
1306321b17ecSEdward Tomasz Napierala icl_soft_conn_handoff(struct icl_conn *ic, int fd)
1307321b17ecSEdward Tomasz Napierala {
1308321b17ecSEdward Tomasz Napierala 	struct file *fp;
1309321b17ecSEdward Tomasz Napierala 	struct socket *so;
1310321b17ecSEdward Tomasz Napierala 	cap_rights_t rights;
1311321b17ecSEdward Tomasz Napierala 	int error;
1312321b17ecSEdward Tomasz Napierala 
1313321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK_ASSERT_NOT(ic);
1314321b17ecSEdward Tomasz Napierala 
1315321b17ecSEdward Tomasz Napierala 	/*
1316321b17ecSEdward Tomasz Napierala 	 * Steal the socket from userland.
1317321b17ecSEdward Tomasz Napierala 	 */
1318321b17ecSEdward Tomasz Napierala 	error = fget(curthread, fd,
1319321b17ecSEdward Tomasz Napierala 	    cap_rights_init(&rights, CAP_SOCK_CLIENT), &fp);
1320321b17ecSEdward Tomasz Napierala 	if (error != 0)
1321321b17ecSEdward Tomasz Napierala 		return (error);
1322321b17ecSEdward Tomasz Napierala 	if (fp->f_type != DTYPE_SOCKET) {
1323321b17ecSEdward Tomasz Napierala 		fdrop(fp, curthread);
1324321b17ecSEdward Tomasz Napierala 		return (EINVAL);
1325321b17ecSEdward Tomasz Napierala 	}
1326321b17ecSEdward Tomasz Napierala 	so = fp->f_data;
1327321b17ecSEdward Tomasz Napierala 	if (so->so_type != SOCK_STREAM) {
1328321b17ecSEdward Tomasz Napierala 		fdrop(fp, curthread);
1329321b17ecSEdward Tomasz Napierala 		return (EINVAL);
1330321b17ecSEdward Tomasz Napierala 	}
1331321b17ecSEdward Tomasz Napierala 
1332321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK(ic);
1333321b17ecSEdward Tomasz Napierala 
1334321b17ecSEdward Tomasz Napierala 	if (ic->ic_socket != NULL) {
1335321b17ecSEdward Tomasz Napierala 		ICL_CONN_UNLOCK(ic);
1336321b17ecSEdward Tomasz Napierala 		fdrop(fp, curthread);
1337321b17ecSEdward Tomasz Napierala 		return (EBUSY);
1338321b17ecSEdward Tomasz Napierala 	}
1339321b17ecSEdward Tomasz Napierala 
1340321b17ecSEdward Tomasz Napierala 	ic->ic_socket = fp->f_data;
1341321b17ecSEdward Tomasz Napierala 	fp->f_ops = &badfileops;
1342321b17ecSEdward Tomasz Napierala 	fp->f_data = NULL;
1343321b17ecSEdward Tomasz Napierala 	fdrop(fp, curthread);
1344321b17ecSEdward Tomasz Napierala 	ICL_CONN_UNLOCK(ic);
1345321b17ecSEdward Tomasz Napierala 
1346321b17ecSEdward Tomasz Napierala 	error = icl_conn_start(ic);
1347321b17ecSEdward Tomasz Napierala 
1348321b17ecSEdward Tomasz Napierala 	return (error);
1349321b17ecSEdward Tomasz Napierala }
1350321b17ecSEdward Tomasz Napierala 
1351321b17ecSEdward Tomasz Napierala void
1352321b17ecSEdward Tomasz Napierala icl_conn_close(struct icl_conn *ic)
1353321b17ecSEdward Tomasz Napierala {
1354321b17ecSEdward Tomasz Napierala 	struct icl_pdu *pdu;
1355321b17ecSEdward Tomasz Napierala 
1356321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK_ASSERT_NOT(ic);
1357321b17ecSEdward Tomasz Napierala 
1358321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK(ic);
1359321b17ecSEdward Tomasz Napierala 	if (ic->ic_socket == NULL) {
1360321b17ecSEdward Tomasz Napierala 		ICL_CONN_UNLOCK(ic);
1361321b17ecSEdward Tomasz Napierala 		return;
1362321b17ecSEdward Tomasz Napierala 	}
1363321b17ecSEdward Tomasz Napierala 
1364321b17ecSEdward Tomasz Napierala 	/*
1365321b17ecSEdward Tomasz Napierala 	 * Deregister socket upcalls.
1366321b17ecSEdward Tomasz Napierala 	 */
1367321b17ecSEdward Tomasz Napierala 	ICL_CONN_UNLOCK(ic);
1368321b17ecSEdward Tomasz Napierala 	SOCKBUF_LOCK(&ic->ic_socket->so_snd);
1369321b17ecSEdward Tomasz Napierala 	if (ic->ic_socket->so_snd.sb_upcall != NULL)
1370321b17ecSEdward Tomasz Napierala 		soupcall_clear(ic->ic_socket, SO_SND);
1371321b17ecSEdward Tomasz Napierala 	SOCKBUF_UNLOCK(&ic->ic_socket->so_snd);
1372321b17ecSEdward Tomasz Napierala 	SOCKBUF_LOCK(&ic->ic_socket->so_rcv);
1373321b17ecSEdward Tomasz Napierala 	if (ic->ic_socket->so_rcv.sb_upcall != NULL)
1374321b17ecSEdward Tomasz Napierala 		soupcall_clear(ic->ic_socket, SO_RCV);
1375321b17ecSEdward Tomasz Napierala 	SOCKBUF_UNLOCK(&ic->ic_socket->so_rcv);
1376321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK(ic);
1377321b17ecSEdward Tomasz Napierala 
1378321b17ecSEdward Tomasz Napierala 	ic->ic_disconnecting = true;
1379321b17ecSEdward Tomasz Napierala 
1380321b17ecSEdward Tomasz Napierala 	/*
1381321b17ecSEdward Tomasz Napierala 	 * Wake up the threads, so they can properly terminate.
1382321b17ecSEdward Tomasz Napierala 	 */
1383321b17ecSEdward Tomasz Napierala 	while (ic->ic_receive_running || ic->ic_send_running) {
1384321b17ecSEdward Tomasz Napierala 		//ICL_DEBUG("waiting for send/receive threads to terminate");
1385321b17ecSEdward Tomasz Napierala 		cv_signal(&ic->ic_receive_cv);
1386321b17ecSEdward Tomasz Napierala 		cv_signal(&ic->ic_send_cv);
1387321b17ecSEdward Tomasz Napierala 		cv_wait(&ic->ic_send_cv, ic->ic_lock);
1388321b17ecSEdward Tomasz Napierala 	}
1389321b17ecSEdward Tomasz Napierala 	//ICL_DEBUG("send/receive threads terminated");
1390321b17ecSEdward Tomasz Napierala 
1391321b17ecSEdward Tomasz Napierala 	ICL_CONN_UNLOCK(ic);
1392321b17ecSEdward Tomasz Napierala 	soclose(ic->ic_socket);
1393321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK(ic);
1394321b17ecSEdward Tomasz Napierala 	ic->ic_socket = NULL;
1395321b17ecSEdward Tomasz Napierala 
1396321b17ecSEdward Tomasz Napierala 	if (ic->ic_receive_pdu != NULL) {
1397321b17ecSEdward Tomasz Napierala 		//ICL_DEBUG("freeing partially received PDU");
1398321b17ecSEdward Tomasz Napierala 		icl_pdu_free(ic->ic_receive_pdu);
1399321b17ecSEdward Tomasz Napierala 		ic->ic_receive_pdu = NULL;
1400321b17ecSEdward Tomasz Napierala 	}
1401321b17ecSEdward Tomasz Napierala 
1402321b17ecSEdward Tomasz Napierala 	/*
1403321b17ecSEdward Tomasz Napierala 	 * Remove any outstanding PDUs from the send queue.
1404321b17ecSEdward Tomasz Napierala 	 */
1405321b17ecSEdward Tomasz Napierala 	while (!STAILQ_EMPTY(&ic->ic_to_send)) {
1406321b17ecSEdward Tomasz Napierala 		pdu = STAILQ_FIRST(&ic->ic_to_send);
1407321b17ecSEdward Tomasz Napierala 		STAILQ_REMOVE_HEAD(&ic->ic_to_send, ip_next);
1408321b17ecSEdward Tomasz Napierala 		icl_pdu_free(pdu);
1409321b17ecSEdward Tomasz Napierala 	}
1410321b17ecSEdward Tomasz Napierala 
1411321b17ecSEdward Tomasz Napierala 	KASSERT(STAILQ_EMPTY(&ic->ic_to_send),
1412321b17ecSEdward Tomasz Napierala 	    ("destroying session with non-empty send queue"));
1413321b17ecSEdward Tomasz Napierala #ifdef DIAGNOSTIC
1414321b17ecSEdward Tomasz Napierala 	KASSERT(ic->ic_outstanding_pdus == 0,
1415321b17ecSEdward Tomasz Napierala 	    ("destroying session with %d outstanding PDUs",
1416321b17ecSEdward Tomasz Napierala 	     ic->ic_outstanding_pdus));
1417321b17ecSEdward Tomasz Napierala #endif
1418321b17ecSEdward Tomasz Napierala 	ICL_CONN_UNLOCK(ic);
1419321b17ecSEdward Tomasz Napierala }
1420321b17ecSEdward Tomasz Napierala 
/*
 * Connection-level entry point for closing a connection; all of the work
 * is done by icl_conn_close().
 */
void
icl_soft_conn_close(struct icl_conn *ic)
{

	icl_conn_close(ic);
}
1427321b17ecSEdward Tomasz Napierala 
1428321b17ecSEdward Tomasz Napierala bool
1429321b17ecSEdward Tomasz Napierala icl_soft_conn_connected(struct icl_conn *ic)
1430321b17ecSEdward Tomasz Napierala {
1431321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK_ASSERT_NOT(ic);
1432321b17ecSEdward Tomasz Napierala 
1433321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK(ic);
1434321b17ecSEdward Tomasz Napierala 	if (ic->ic_socket == NULL) {
1435321b17ecSEdward Tomasz Napierala 		ICL_CONN_UNLOCK(ic);
1436321b17ecSEdward Tomasz Napierala 		return (false);
1437321b17ecSEdward Tomasz Napierala 	}
1438321b17ecSEdward Tomasz Napierala 	if (ic->ic_socket->so_error != 0) {
1439321b17ecSEdward Tomasz Napierala 		ICL_CONN_UNLOCK(ic);
1440321b17ecSEdward Tomasz Napierala 		return (false);
1441321b17ecSEdward Tomasz Napierala 	}
1442321b17ecSEdward Tomasz Napierala 	ICL_CONN_UNLOCK(ic);
1443321b17ecSEdward Tomasz Napierala 	return (true);
1444321b17ecSEdward Tomasz Napierala }
1445321b17ecSEdward Tomasz Napierala 
/*
 * Limits callback handed to icl_register(): stores a fixed limit of
 * 128 KiB in "*limitp".  Always returns 0.
 */
static int
icl_soft_limits(size_t *limitp)
{
	const size_t limit = 128 * 1024;

	*limitp = limit;

	return (0);
}
1454321b17ecSEdward Tomasz Napierala 
#ifdef ICL_KERNEL_PROXY
/*
 * Attach an already existing kernel socket to the connection and start it.
 *
 * Must be called without the connection lock held.  Returns EINVAL if "so"
 * is not a SOCK_STREAM socket, EBUSY if the connection already has a
 * socket, and otherwise whatever icl_conn_start() returns.
 */
int
icl_conn_handoff_sock(struct icl_conn *ic, struct socket *so)
{
	bool busy;

	ICL_CONN_LOCK_ASSERT_NOT(ic);

	if (so->so_type != SOCK_STREAM)
		return (EINVAL);

	ICL_CONN_LOCK(ic);
	busy = (ic->ic_socket != NULL);
	if (!busy)
		ic->ic_socket = so;
	ICL_CONN_UNLOCK(ic);

	if (busy)
		return (EBUSY);

	return (icl_conn_start(ic));
}
#endif /* ICL_KERNEL_PROXY */
1479321b17ecSEdward Tomasz Napierala 
1480321b17ecSEdward Tomasz Napierala static int
1481321b17ecSEdward Tomasz Napierala icl_soft_load(void)
1482321b17ecSEdward Tomasz Napierala {
1483321b17ecSEdward Tomasz Napierala 	int error;
1484321b17ecSEdward Tomasz Napierala 
1485321b17ecSEdward Tomasz Napierala 	icl_pdu_zone = uma_zcreate("icl_pdu",
1486321b17ecSEdward Tomasz Napierala 	    sizeof(struct icl_pdu), NULL, NULL, NULL, NULL,
1487321b17ecSEdward Tomasz Napierala 	    UMA_ALIGN_PTR, 0);
1488321b17ecSEdward Tomasz Napierala 	refcount_init(&icl_ncons, 0);
1489321b17ecSEdward Tomasz Napierala 
1490321b17ecSEdward Tomasz Napierala 	/*
1491321b17ecSEdward Tomasz Napierala 	 * The reason we call this "none" is that to the user,
1492321b17ecSEdward Tomasz Napierala 	 * it's known as "offload driver"; "offload driver: soft"
1493321b17ecSEdward Tomasz Napierala 	 * doesn't make much sense.
1494321b17ecSEdward Tomasz Napierala 	 */
1495321b17ecSEdward Tomasz Napierala 	error = icl_register("none", 0, icl_soft_limits, icl_soft_new_conn);
1496321b17ecSEdward Tomasz Napierala 	KASSERT(error == 0, ("failed to register"));
1497321b17ecSEdward Tomasz Napierala 
1498321b17ecSEdward Tomasz Napierala 	return (error);
1499321b17ecSEdward Tomasz Napierala }
1500321b17ecSEdward Tomasz Napierala 
1501321b17ecSEdward Tomasz Napierala static int
1502321b17ecSEdward Tomasz Napierala icl_soft_unload(void)
1503321b17ecSEdward Tomasz Napierala {
1504321b17ecSEdward Tomasz Napierala 
1505321b17ecSEdward Tomasz Napierala 	if (icl_ncons != 0)
1506321b17ecSEdward Tomasz Napierala 		return (EBUSY);
1507321b17ecSEdward Tomasz Napierala 
1508321b17ecSEdward Tomasz Napierala 	icl_unregister("none");
1509321b17ecSEdward Tomasz Napierala 
1510321b17ecSEdward Tomasz Napierala 	uma_zdestroy(icl_pdu_zone);
1511321b17ecSEdward Tomasz Napierala 
1512321b17ecSEdward Tomasz Napierala 	return (0);
1513321b17ecSEdward Tomasz Napierala }
1514321b17ecSEdward Tomasz Napierala 
1515321b17ecSEdward Tomasz Napierala static int
1516321b17ecSEdward Tomasz Napierala icl_soft_modevent(module_t mod, int what, void *arg)
1517321b17ecSEdward Tomasz Napierala {
1518321b17ecSEdward Tomasz Napierala 
1519321b17ecSEdward Tomasz Napierala 	switch (what) {
1520321b17ecSEdward Tomasz Napierala 	case MOD_LOAD:
1521321b17ecSEdward Tomasz Napierala 		return (icl_soft_load());
1522321b17ecSEdward Tomasz Napierala 	case MOD_UNLOAD:
1523321b17ecSEdward Tomasz Napierala 		return (icl_soft_unload());
1524321b17ecSEdward Tomasz Napierala 	default:
1525321b17ecSEdward Tomasz Napierala 		return (EINVAL);
1526321b17ecSEdward Tomasz Napierala 	}
1527321b17ecSEdward Tomasz Napierala }
1528321b17ecSEdward Tomasz Napierala 
1529321b17ecSEdward Tomasz Napierala moduledata_t icl_soft_data = {
1530321b17ecSEdward Tomasz Napierala 	"icl_soft",
1531321b17ecSEdward Tomasz Napierala 	icl_soft_modevent,
1532321b17ecSEdward Tomasz Napierala 	0
1533321b17ecSEdward Tomasz Napierala };
1534321b17ecSEdward Tomasz Napierala 
1535321b17ecSEdward Tomasz Napierala DECLARE_MODULE(icl_soft, icl_soft_data, SI_SUB_DRIVERS, SI_ORDER_MIDDLE);
1536321b17ecSEdward Tomasz Napierala MODULE_DEPEND(icl_soft, icl, 1, 1, 1);
1537*872d2d92SEdward Tomasz Napierala MODULE_VERSION(icl_soft, 1);
1538