xref: /freebsd/sys/dev/iscsi/icl_soft.c (revision d4b195d315907a711640f8a11a2dd636b3ec70ff)
/*-
 * Copyright (c) 2012 The FreeBSD Foundation
 * All rights reserved.
 *
 * This software was developed by Edward Tomasz Napierala under sponsorship
 * from the FreeBSD Foundation.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 */
30321b17ecSEdward Tomasz Napierala 
/*
 * Software implementation of iSCSI Common Layer kobj(9) interface.
 */
34321b17ecSEdward Tomasz Napierala 
35321b17ecSEdward Tomasz Napierala #include <sys/cdefs.h>
36321b17ecSEdward Tomasz Napierala __FBSDID("$FreeBSD$");
37321b17ecSEdward Tomasz Napierala 
38321b17ecSEdward Tomasz Napierala #include <sys/param.h>
39321b17ecSEdward Tomasz Napierala #include <sys/capsicum.h>
40321b17ecSEdward Tomasz Napierala #include <sys/condvar.h>
41321b17ecSEdward Tomasz Napierala #include <sys/conf.h>
42321b17ecSEdward Tomasz Napierala #include <sys/file.h>
43321b17ecSEdward Tomasz Napierala #include <sys/kernel.h>
44321b17ecSEdward Tomasz Napierala #include <sys/kthread.h>
45321b17ecSEdward Tomasz Napierala #include <sys/lock.h>
46321b17ecSEdward Tomasz Napierala #include <sys/mbuf.h>
47321b17ecSEdward Tomasz Napierala #include <sys/mutex.h>
48321b17ecSEdward Tomasz Napierala #include <sys/module.h>
49321b17ecSEdward Tomasz Napierala #include <sys/protosw.h>
50321b17ecSEdward Tomasz Napierala #include <sys/socket.h>
51321b17ecSEdward Tomasz Napierala #include <sys/socketvar.h>
52321b17ecSEdward Tomasz Napierala #include <sys/sysctl.h>
53321b17ecSEdward Tomasz Napierala #include <sys/systm.h>
54321b17ecSEdward Tomasz Napierala #include <sys/sx.h>
55321b17ecSEdward Tomasz Napierala #include <sys/uio.h>
56321b17ecSEdward Tomasz Napierala #include <vm/uma.h>
57321b17ecSEdward Tomasz Napierala #include <netinet/in.h>
58321b17ecSEdward Tomasz Napierala #include <netinet/tcp.h>
59321b17ecSEdward Tomasz Napierala 
60321b17ecSEdward Tomasz Napierala #include <dev/iscsi/icl.h>
61321b17ecSEdward Tomasz Napierala #include <dev/iscsi/iscsi_proto.h>
62321b17ecSEdward Tomasz Napierala #include <icl_conn_if.h>
63321b17ecSEdward Tomasz Napierala 
64321b17ecSEdward Tomasz Napierala static int coalesce = 1;
65321b17ecSEdward Tomasz Napierala SYSCTL_INT(_kern_icl, OID_AUTO, coalesce, CTLFLAG_RWTUN,
66321b17ecSEdward Tomasz Napierala     &coalesce, 0, "Try to coalesce PDUs before sending");
67321b17ecSEdward Tomasz Napierala static int partial_receive_len = 128 * 1024;
68321b17ecSEdward Tomasz Napierala SYSCTL_INT(_kern_icl, OID_AUTO, partial_receive_len, CTLFLAG_RWTUN,
69321b17ecSEdward Tomasz Napierala     &partial_receive_len, 0, "Minimum read size for partially received "
70321b17ecSEdward Tomasz Napierala     "data segment");
71321b17ecSEdward Tomasz Napierala static int sendspace = 1048576;
72321b17ecSEdward Tomasz Napierala SYSCTL_INT(_kern_icl, OID_AUTO, sendspace, CTLFLAG_RWTUN,
73321b17ecSEdward Tomasz Napierala     &sendspace, 0, "Default send socket buffer size");
74321b17ecSEdward Tomasz Napierala static int recvspace = 1048576;
75321b17ecSEdward Tomasz Napierala SYSCTL_INT(_kern_icl, OID_AUTO, recvspace, CTLFLAG_RWTUN,
76321b17ecSEdward Tomasz Napierala     &recvspace, 0, "Default receive socket buffer size");
77321b17ecSEdward Tomasz Napierala 
78321b17ecSEdward Tomasz Napierala static MALLOC_DEFINE(M_ICL_SOFT, "icl_soft", "iSCSI software backend");
79321b17ecSEdward Tomasz Napierala static uma_zone_t icl_pdu_zone;
80321b17ecSEdward Tomasz Napierala 
81321b17ecSEdward Tomasz Napierala static volatile u_int	icl_ncons;
82321b17ecSEdward Tomasz Napierala 
83321b17ecSEdward Tomasz Napierala #define ICL_CONN_LOCK(X)		mtx_lock(X->ic_lock)
84321b17ecSEdward Tomasz Napierala #define ICL_CONN_UNLOCK(X)		mtx_unlock(X->ic_lock)
85321b17ecSEdward Tomasz Napierala #define ICL_CONN_LOCK_ASSERT(X)		mtx_assert(X->ic_lock, MA_OWNED)
86321b17ecSEdward Tomasz Napierala #define ICL_CONN_LOCK_ASSERT_NOT(X)	mtx_assert(X->ic_lock, MA_NOTOWNED)
87321b17ecSEdward Tomasz Napierala 
88321b17ecSEdward Tomasz Napierala STAILQ_HEAD(icl_pdu_stailq, icl_pdu);
89321b17ecSEdward Tomasz Napierala 
90321b17ecSEdward Tomasz Napierala static icl_conn_new_pdu_t	icl_soft_conn_new_pdu;
91321b17ecSEdward Tomasz Napierala static icl_conn_pdu_free_t	icl_soft_conn_pdu_free;
92321b17ecSEdward Tomasz Napierala static icl_conn_pdu_data_segment_length_t
93321b17ecSEdward Tomasz Napierala 				    icl_soft_conn_pdu_data_segment_length;
94321b17ecSEdward Tomasz Napierala static icl_conn_pdu_append_data_t	icl_soft_conn_pdu_append_data;
95321b17ecSEdward Tomasz Napierala static icl_conn_pdu_get_data_t	icl_soft_conn_pdu_get_data;
96321b17ecSEdward Tomasz Napierala static icl_conn_pdu_queue_t	icl_soft_conn_pdu_queue;
97321b17ecSEdward Tomasz Napierala static icl_conn_handoff_t	icl_soft_conn_handoff;
98321b17ecSEdward Tomasz Napierala static icl_conn_free_t		icl_soft_conn_free;
99321b17ecSEdward Tomasz Napierala static icl_conn_close_t		icl_soft_conn_close;
100321b17ecSEdward Tomasz Napierala static icl_conn_connected_t	icl_soft_conn_connected;
101321b17ecSEdward Tomasz Napierala 
102321b17ecSEdward Tomasz Napierala static kobj_method_t icl_soft_methods[] = {
103321b17ecSEdward Tomasz Napierala 	KOBJMETHOD(icl_conn_new_pdu, icl_soft_conn_new_pdu),
104321b17ecSEdward Tomasz Napierala 	KOBJMETHOD(icl_conn_pdu_free, icl_soft_conn_pdu_free),
105321b17ecSEdward Tomasz Napierala 	KOBJMETHOD(icl_conn_pdu_data_segment_length,
106321b17ecSEdward Tomasz Napierala 	    icl_soft_conn_pdu_data_segment_length),
107321b17ecSEdward Tomasz Napierala 	KOBJMETHOD(icl_conn_pdu_append_data, icl_soft_conn_pdu_append_data),
108321b17ecSEdward Tomasz Napierala 	KOBJMETHOD(icl_conn_pdu_get_data, icl_soft_conn_pdu_get_data),
109321b17ecSEdward Tomasz Napierala 	KOBJMETHOD(icl_conn_pdu_queue, icl_soft_conn_pdu_queue),
110321b17ecSEdward Tomasz Napierala 	KOBJMETHOD(icl_conn_handoff, icl_soft_conn_handoff),
111321b17ecSEdward Tomasz Napierala 	KOBJMETHOD(icl_conn_free, icl_soft_conn_free),
112321b17ecSEdward Tomasz Napierala 	KOBJMETHOD(icl_conn_close, icl_soft_conn_close),
113321b17ecSEdward Tomasz Napierala 	KOBJMETHOD(icl_conn_connected, icl_soft_conn_connected),
114321b17ecSEdward Tomasz Napierala 	{ 0, 0 }
115321b17ecSEdward Tomasz Napierala };
116321b17ecSEdward Tomasz Napierala 
117321b17ecSEdward Tomasz Napierala DEFINE_CLASS(icl_soft, icl_soft_methods, sizeof(struct icl_conn));
118321b17ecSEdward Tomasz Napierala 
119321b17ecSEdward Tomasz Napierala static void
120321b17ecSEdward Tomasz Napierala icl_conn_fail(struct icl_conn *ic)
121321b17ecSEdward Tomasz Napierala {
122321b17ecSEdward Tomasz Napierala 	if (ic->ic_socket == NULL)
123321b17ecSEdward Tomasz Napierala 		return;
124321b17ecSEdward Tomasz Napierala 
125321b17ecSEdward Tomasz Napierala 	/*
126321b17ecSEdward Tomasz Napierala 	 * XXX
127321b17ecSEdward Tomasz Napierala 	 */
128321b17ecSEdward Tomasz Napierala 	ic->ic_socket->so_error = EDOOFUS;
129321b17ecSEdward Tomasz Napierala 	(ic->ic_error)(ic);
130321b17ecSEdward Tomasz Napierala }
131321b17ecSEdward Tomasz Napierala 
132321b17ecSEdward Tomasz Napierala static struct mbuf *
133321b17ecSEdward Tomasz Napierala icl_conn_receive(struct icl_conn *ic, size_t len)
134321b17ecSEdward Tomasz Napierala {
135321b17ecSEdward Tomasz Napierala 	struct uio uio;
136321b17ecSEdward Tomasz Napierala 	struct socket *so;
137321b17ecSEdward Tomasz Napierala 	struct mbuf *m;
138321b17ecSEdward Tomasz Napierala 	int error, flags;
139321b17ecSEdward Tomasz Napierala 
140321b17ecSEdward Tomasz Napierala 	so = ic->ic_socket;
141321b17ecSEdward Tomasz Napierala 
142321b17ecSEdward Tomasz Napierala 	memset(&uio, 0, sizeof(uio));
143321b17ecSEdward Tomasz Napierala 	uio.uio_resid = len;
144321b17ecSEdward Tomasz Napierala 
145321b17ecSEdward Tomasz Napierala 	flags = MSG_DONTWAIT;
146321b17ecSEdward Tomasz Napierala 	error = soreceive(so, NULL, &uio, &m, NULL, &flags);
147321b17ecSEdward Tomasz Napierala 	if (error != 0) {
148321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("soreceive error %d", error);
149321b17ecSEdward Tomasz Napierala 		return (NULL);
150321b17ecSEdward Tomasz Napierala 	}
151321b17ecSEdward Tomasz Napierala 	if (uio.uio_resid != 0) {
152321b17ecSEdward Tomasz Napierala 		m_freem(m);
153321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("short read");
154321b17ecSEdward Tomasz Napierala 		return (NULL);
155321b17ecSEdward Tomasz Napierala 	}
156321b17ecSEdward Tomasz Napierala 
157321b17ecSEdward Tomasz Napierala 	return (m);
158321b17ecSEdward Tomasz Napierala }
159321b17ecSEdward Tomasz Napierala 
160321b17ecSEdward Tomasz Napierala static struct icl_pdu *
161321b17ecSEdward Tomasz Napierala icl_pdu_new_empty(struct icl_conn *ic, int flags)
162321b17ecSEdward Tomasz Napierala {
163321b17ecSEdward Tomasz Napierala 	struct icl_pdu *ip;
164321b17ecSEdward Tomasz Napierala 
165321b17ecSEdward Tomasz Napierala #ifdef DIAGNOSTIC
166321b17ecSEdward Tomasz Napierala 	refcount_acquire(&ic->ic_outstanding_pdus);
167321b17ecSEdward Tomasz Napierala #endif
168321b17ecSEdward Tomasz Napierala 	ip = uma_zalloc(icl_pdu_zone, flags | M_ZERO);
169321b17ecSEdward Tomasz Napierala 	if (ip == NULL) {
170321b17ecSEdward Tomasz Napierala 		ICL_WARN("failed to allocate %zd bytes", sizeof(*ip));
171321b17ecSEdward Tomasz Napierala #ifdef DIAGNOSTIC
172321b17ecSEdward Tomasz Napierala 		refcount_release(&ic->ic_outstanding_pdus);
173321b17ecSEdward Tomasz Napierala #endif
174321b17ecSEdward Tomasz Napierala 		return (NULL);
175321b17ecSEdward Tomasz Napierala 	}
176321b17ecSEdward Tomasz Napierala 
177321b17ecSEdward Tomasz Napierala 	ip->ip_conn = ic;
178321b17ecSEdward Tomasz Napierala 
179321b17ecSEdward Tomasz Napierala 	return (ip);
180321b17ecSEdward Tomasz Napierala }
181321b17ecSEdward Tomasz Napierala 
182321b17ecSEdward Tomasz Napierala static void
183321b17ecSEdward Tomasz Napierala icl_pdu_free(struct icl_pdu *ip)
184321b17ecSEdward Tomasz Napierala {
185321b17ecSEdward Tomasz Napierala 	struct icl_conn *ic;
186321b17ecSEdward Tomasz Napierala 
187321b17ecSEdward Tomasz Napierala 	ic = ip->ip_conn;
188321b17ecSEdward Tomasz Napierala 
189321b17ecSEdward Tomasz Napierala 	m_freem(ip->ip_bhs_mbuf);
190321b17ecSEdward Tomasz Napierala 	m_freem(ip->ip_ahs_mbuf);
191321b17ecSEdward Tomasz Napierala 	m_freem(ip->ip_data_mbuf);
192321b17ecSEdward Tomasz Napierala 	uma_zfree(icl_pdu_zone, ip);
193321b17ecSEdward Tomasz Napierala #ifdef DIAGNOSTIC
194321b17ecSEdward Tomasz Napierala 	refcount_release(&ic->ic_outstanding_pdus);
195321b17ecSEdward Tomasz Napierala #endif
196321b17ecSEdward Tomasz Napierala }
197321b17ecSEdward Tomasz Napierala 
/*
 * icl_conn_pdu_free method: hands the PDU to icl_pdu_free().  The
 * connection argument is not consulted.
 */
void
icl_soft_conn_pdu_free(struct icl_conn *ic, struct icl_pdu *ip)
{

	icl_pdu_free(ip);
}
204321b17ecSEdward Tomasz Napierala 
205321b17ecSEdward Tomasz Napierala /*
206321b17ecSEdward Tomasz Napierala  * Allocate icl_pdu with empty BHS to fill up by the caller.
207321b17ecSEdward Tomasz Napierala  */
208321b17ecSEdward Tomasz Napierala struct icl_pdu *
209321b17ecSEdward Tomasz Napierala icl_soft_conn_new_pdu(struct icl_conn *ic, int flags)
210321b17ecSEdward Tomasz Napierala {
211321b17ecSEdward Tomasz Napierala 	struct icl_pdu *ip;
212321b17ecSEdward Tomasz Napierala 
213321b17ecSEdward Tomasz Napierala 	ip = icl_pdu_new_empty(ic, flags);
214321b17ecSEdward Tomasz Napierala 	if (ip == NULL)
215321b17ecSEdward Tomasz Napierala 		return (NULL);
216321b17ecSEdward Tomasz Napierala 
217321b17ecSEdward Tomasz Napierala 	ip->ip_bhs_mbuf = m_getm2(NULL, sizeof(struct iscsi_bhs),
218321b17ecSEdward Tomasz Napierala 	    flags, MT_DATA, M_PKTHDR);
219321b17ecSEdward Tomasz Napierala 	if (ip->ip_bhs_mbuf == NULL) {
220321b17ecSEdward Tomasz Napierala 		ICL_WARN("failed to allocate %zd bytes", sizeof(*ip));
221321b17ecSEdward Tomasz Napierala 		icl_pdu_free(ip);
222321b17ecSEdward Tomasz Napierala 		return (NULL);
223321b17ecSEdward Tomasz Napierala 	}
224321b17ecSEdward Tomasz Napierala 	ip->ip_bhs = mtod(ip->ip_bhs_mbuf, struct iscsi_bhs *);
225321b17ecSEdward Tomasz Napierala 	memset(ip->ip_bhs, 0, sizeof(struct iscsi_bhs));
226321b17ecSEdward Tomasz Napierala 	ip->ip_bhs_mbuf->m_len = sizeof(struct iscsi_bhs);
227321b17ecSEdward Tomasz Napierala 
228321b17ecSEdward Tomasz Napierala 	return (ip);
229321b17ecSEdward Tomasz Napierala }
230321b17ecSEdward Tomasz Napierala 
231321b17ecSEdward Tomasz Napierala static int
232321b17ecSEdward Tomasz Napierala icl_pdu_ahs_length(const struct icl_pdu *request)
233321b17ecSEdward Tomasz Napierala {
234321b17ecSEdward Tomasz Napierala 
235321b17ecSEdward Tomasz Napierala 	return (request->ip_bhs->bhs_total_ahs_len * 4);
236321b17ecSEdward Tomasz Napierala }
237321b17ecSEdward Tomasz Napierala 
238321b17ecSEdward Tomasz Napierala static size_t
239321b17ecSEdward Tomasz Napierala icl_pdu_data_segment_length(const struct icl_pdu *request)
240321b17ecSEdward Tomasz Napierala {
241321b17ecSEdward Tomasz Napierala 	uint32_t len = 0;
242321b17ecSEdward Tomasz Napierala 
243321b17ecSEdward Tomasz Napierala 	len += request->ip_bhs->bhs_data_segment_len[0];
244321b17ecSEdward Tomasz Napierala 	len <<= 8;
245321b17ecSEdward Tomasz Napierala 	len += request->ip_bhs->bhs_data_segment_len[1];
246321b17ecSEdward Tomasz Napierala 	len <<= 8;
247321b17ecSEdward Tomasz Napierala 	len += request->ip_bhs->bhs_data_segment_len[2];
248321b17ecSEdward Tomasz Napierala 
249321b17ecSEdward Tomasz Napierala 	return (len);
250321b17ecSEdward Tomasz Napierala }
251321b17ecSEdward Tomasz Napierala 
/*
 * icl_conn_pdu_data_segment_length method: returns the data segment
 * length recorded in the PDU's BHS.  The connection argument is unused.
 */
size_t
icl_soft_conn_pdu_data_segment_length(struct icl_conn *ic,
    const struct icl_pdu *request)
{
	size_t len;

	len = icl_pdu_data_segment_length(request);
	return (len);
}
259321b17ecSEdward Tomasz Napierala 
260321b17ecSEdward Tomasz Napierala static void
261321b17ecSEdward Tomasz Napierala icl_pdu_set_data_segment_length(struct icl_pdu *response, uint32_t len)
262321b17ecSEdward Tomasz Napierala {
263321b17ecSEdward Tomasz Napierala 
264321b17ecSEdward Tomasz Napierala 	response->ip_bhs->bhs_data_segment_len[2] = len;
265321b17ecSEdward Tomasz Napierala 	response->ip_bhs->bhs_data_segment_len[1] = len >> 8;
266321b17ecSEdward Tomasz Napierala 	response->ip_bhs->bhs_data_segment_len[0] = len >> 16;
267321b17ecSEdward Tomasz Napierala }
268321b17ecSEdward Tomasz Napierala 
269321b17ecSEdward Tomasz Napierala static size_t
270321b17ecSEdward Tomasz Napierala icl_pdu_padding(const struct icl_pdu *ip)
271321b17ecSEdward Tomasz Napierala {
272321b17ecSEdward Tomasz Napierala 
273321b17ecSEdward Tomasz Napierala 	if ((ip->ip_data_len % 4) != 0)
274321b17ecSEdward Tomasz Napierala 		return (4 - (ip->ip_data_len % 4));
275321b17ecSEdward Tomasz Napierala 
276321b17ecSEdward Tomasz Napierala 	return (0);
277321b17ecSEdward Tomasz Napierala }
278321b17ecSEdward Tomasz Napierala 
279321b17ecSEdward Tomasz Napierala static size_t
280321b17ecSEdward Tomasz Napierala icl_pdu_size(const struct icl_pdu *response)
281321b17ecSEdward Tomasz Napierala {
282321b17ecSEdward Tomasz Napierala 	size_t len;
283321b17ecSEdward Tomasz Napierala 
284321b17ecSEdward Tomasz Napierala 	KASSERT(response->ip_ahs_len == 0, ("responding with AHS"));
285321b17ecSEdward Tomasz Napierala 
286321b17ecSEdward Tomasz Napierala 	len = sizeof(struct iscsi_bhs) + response->ip_data_len +
287321b17ecSEdward Tomasz Napierala 	    icl_pdu_padding(response);
288321b17ecSEdward Tomasz Napierala 	if (response->ip_conn->ic_header_crc32c)
289321b17ecSEdward Tomasz Napierala 		len += ISCSI_HEADER_DIGEST_SIZE;
290321b17ecSEdward Tomasz Napierala 	if (response->ip_data_len != 0 && response->ip_conn->ic_data_crc32c)
291321b17ecSEdward Tomasz Napierala 		len += ISCSI_DATA_DIGEST_SIZE;
292321b17ecSEdward Tomasz Napierala 
293321b17ecSEdward Tomasz Napierala 	return (len);
294321b17ecSEdward Tomasz Napierala }
295321b17ecSEdward Tomasz Napierala 
296321b17ecSEdward Tomasz Napierala static int
297321b17ecSEdward Tomasz Napierala icl_pdu_receive_bhs(struct icl_pdu *request, size_t *availablep)
298321b17ecSEdward Tomasz Napierala {
299321b17ecSEdward Tomasz Napierala 	struct mbuf *m;
300321b17ecSEdward Tomasz Napierala 
301321b17ecSEdward Tomasz Napierala 	m = icl_conn_receive(request->ip_conn, sizeof(struct iscsi_bhs));
302321b17ecSEdward Tomasz Napierala 	if (m == NULL) {
303321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("failed to receive BHS");
304321b17ecSEdward Tomasz Napierala 		return (-1);
305321b17ecSEdward Tomasz Napierala 	}
306321b17ecSEdward Tomasz Napierala 
307321b17ecSEdward Tomasz Napierala 	request->ip_bhs_mbuf = m_pullup(m, sizeof(struct iscsi_bhs));
308321b17ecSEdward Tomasz Napierala 	if (request->ip_bhs_mbuf == NULL) {
309321b17ecSEdward Tomasz Napierala 		ICL_WARN("m_pullup failed");
310321b17ecSEdward Tomasz Napierala 		return (-1);
311321b17ecSEdward Tomasz Napierala 	}
312321b17ecSEdward Tomasz Napierala 	request->ip_bhs = mtod(request->ip_bhs_mbuf, struct iscsi_bhs *);
313321b17ecSEdward Tomasz Napierala 
314321b17ecSEdward Tomasz Napierala 	/*
315321b17ecSEdward Tomasz Napierala 	 * XXX: For architectures with strict alignment requirements
316321b17ecSEdward Tomasz Napierala 	 * 	we may need to allocate ip_bhs and copy the data into it.
317321b17ecSEdward Tomasz Napierala 	 * 	For some reason, though, not doing this doesn't seem
318321b17ecSEdward Tomasz Napierala 	 * 	to cause problems; tested on sparc64.
319321b17ecSEdward Tomasz Napierala 	 */
320321b17ecSEdward Tomasz Napierala 
321321b17ecSEdward Tomasz Napierala 	*availablep -= sizeof(struct iscsi_bhs);
322321b17ecSEdward Tomasz Napierala 	return (0);
323321b17ecSEdward Tomasz Napierala }
324321b17ecSEdward Tomasz Napierala 
325321b17ecSEdward Tomasz Napierala static int
326321b17ecSEdward Tomasz Napierala icl_pdu_receive_ahs(struct icl_pdu *request, size_t *availablep)
327321b17ecSEdward Tomasz Napierala {
328321b17ecSEdward Tomasz Napierala 
329321b17ecSEdward Tomasz Napierala 	request->ip_ahs_len = icl_pdu_ahs_length(request);
330321b17ecSEdward Tomasz Napierala 	if (request->ip_ahs_len == 0)
331321b17ecSEdward Tomasz Napierala 		return (0);
332321b17ecSEdward Tomasz Napierala 
333321b17ecSEdward Tomasz Napierala 	request->ip_ahs_mbuf = icl_conn_receive(request->ip_conn,
334321b17ecSEdward Tomasz Napierala 	    request->ip_ahs_len);
335321b17ecSEdward Tomasz Napierala 	if (request->ip_ahs_mbuf == NULL) {
336321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("failed to receive AHS");
337321b17ecSEdward Tomasz Napierala 		return (-1);
338321b17ecSEdward Tomasz Napierala 	}
339321b17ecSEdward Tomasz Napierala 
340321b17ecSEdward Tomasz Napierala 	*availablep -= request->ip_ahs_len;
341321b17ecSEdward Tomasz Napierala 	return (0);
342321b17ecSEdward Tomasz Napierala }
343321b17ecSEdward Tomasz Napierala 
344321b17ecSEdward Tomasz Napierala static uint32_t
345321b17ecSEdward Tomasz Napierala icl_mbuf_to_crc32c(const struct mbuf *m0)
346321b17ecSEdward Tomasz Napierala {
347321b17ecSEdward Tomasz Napierala 	uint32_t digest = 0xffffffff;
348321b17ecSEdward Tomasz Napierala 	const struct mbuf *m;
349321b17ecSEdward Tomasz Napierala 
350321b17ecSEdward Tomasz Napierala 	for (m = m0; m != NULL; m = m->m_next)
351321b17ecSEdward Tomasz Napierala 		digest = calculate_crc32c(digest,
352321b17ecSEdward Tomasz Napierala 		    mtod(m, const void *), m->m_len);
353321b17ecSEdward Tomasz Napierala 
354321b17ecSEdward Tomasz Napierala 	digest = digest ^ 0xffffffff;
355321b17ecSEdward Tomasz Napierala 
356321b17ecSEdward Tomasz Napierala 	return (digest);
357321b17ecSEdward Tomasz Napierala }
358321b17ecSEdward Tomasz Napierala 
359321b17ecSEdward Tomasz Napierala static int
360321b17ecSEdward Tomasz Napierala icl_pdu_check_header_digest(struct icl_pdu *request, size_t *availablep)
361321b17ecSEdward Tomasz Napierala {
362321b17ecSEdward Tomasz Napierala 	struct mbuf *m;
363321b17ecSEdward Tomasz Napierala 	uint32_t received_digest, valid_digest;
364321b17ecSEdward Tomasz Napierala 
365321b17ecSEdward Tomasz Napierala 	if (request->ip_conn->ic_header_crc32c == false)
366321b17ecSEdward Tomasz Napierala 		return (0);
367321b17ecSEdward Tomasz Napierala 
368321b17ecSEdward Tomasz Napierala 	m = icl_conn_receive(request->ip_conn, ISCSI_HEADER_DIGEST_SIZE);
369321b17ecSEdward Tomasz Napierala 	if (m == NULL) {
370321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("failed to receive header digest");
371321b17ecSEdward Tomasz Napierala 		return (-1);
372321b17ecSEdward Tomasz Napierala 	}
373321b17ecSEdward Tomasz Napierala 
374321b17ecSEdward Tomasz Napierala 	CTASSERT(sizeof(received_digest) == ISCSI_HEADER_DIGEST_SIZE);
375321b17ecSEdward Tomasz Napierala 	m_copydata(m, 0, ISCSI_HEADER_DIGEST_SIZE, (void *)&received_digest);
376321b17ecSEdward Tomasz Napierala 	m_freem(m);
377321b17ecSEdward Tomasz Napierala 
378321b17ecSEdward Tomasz Napierala 	*availablep -= ISCSI_HEADER_DIGEST_SIZE;
379321b17ecSEdward Tomasz Napierala 
380321b17ecSEdward Tomasz Napierala 	/*
381321b17ecSEdward Tomasz Napierala 	 * XXX: Handle AHS.
382321b17ecSEdward Tomasz Napierala 	 */
383321b17ecSEdward Tomasz Napierala 	valid_digest = icl_mbuf_to_crc32c(request->ip_bhs_mbuf);
384321b17ecSEdward Tomasz Napierala 	if (received_digest != valid_digest) {
385321b17ecSEdward Tomasz Napierala 		ICL_WARN("header digest check failed; got 0x%x, "
386321b17ecSEdward Tomasz Napierala 		    "should be 0x%x", received_digest, valid_digest);
387321b17ecSEdward Tomasz Napierala 		return (-1);
388321b17ecSEdward Tomasz Napierala 	}
389321b17ecSEdward Tomasz Napierala 
390321b17ecSEdward Tomasz Napierala 	return (0);
391321b17ecSEdward Tomasz Napierala }
392321b17ecSEdward Tomasz Napierala 
393321b17ecSEdward Tomasz Napierala /*
394321b17ecSEdward Tomasz Napierala  * Return the number of bytes that should be waiting in the receive socket
395321b17ecSEdward Tomasz Napierala  * before icl_pdu_receive_data_segment() gets called.
396321b17ecSEdward Tomasz Napierala  */
397321b17ecSEdward Tomasz Napierala static size_t
398321b17ecSEdward Tomasz Napierala icl_pdu_data_segment_receive_len(const struct icl_pdu *request)
399321b17ecSEdward Tomasz Napierala {
400321b17ecSEdward Tomasz Napierala 	size_t len;
401321b17ecSEdward Tomasz Napierala 
402321b17ecSEdward Tomasz Napierala 	len = icl_pdu_data_segment_length(request);
403321b17ecSEdward Tomasz Napierala 	if (len == 0)
404321b17ecSEdward Tomasz Napierala 		return (0);
405321b17ecSEdward Tomasz Napierala 
406321b17ecSEdward Tomasz Napierala 	/*
407321b17ecSEdward Tomasz Napierala 	 * Account for the parts of data segment already read from
408321b17ecSEdward Tomasz Napierala 	 * the socket buffer.
409321b17ecSEdward Tomasz Napierala 	 */
410321b17ecSEdward Tomasz Napierala 	KASSERT(len > request->ip_data_len, ("len <= request->ip_data_len"));
411321b17ecSEdward Tomasz Napierala 	len -= request->ip_data_len;
412321b17ecSEdward Tomasz Napierala 
413321b17ecSEdward Tomasz Napierala 	/*
414321b17ecSEdward Tomasz Napierala 	 * Don't always wait for the full data segment to be delivered
415321b17ecSEdward Tomasz Napierala 	 * to the socket; this might badly affect performance due to
416321b17ecSEdward Tomasz Napierala 	 * TCP window scaling.
417321b17ecSEdward Tomasz Napierala 	 */
418321b17ecSEdward Tomasz Napierala 	if (len > partial_receive_len) {
419321b17ecSEdward Tomasz Napierala #if 0
420321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("need %zd bytes of data, limiting to %zd",
421321b17ecSEdward Tomasz Napierala 		    len, partial_receive_len));
422321b17ecSEdward Tomasz Napierala #endif
423321b17ecSEdward Tomasz Napierala 		len = partial_receive_len;
424321b17ecSEdward Tomasz Napierala 
425321b17ecSEdward Tomasz Napierala 		return (len);
426321b17ecSEdward Tomasz Napierala 	}
427321b17ecSEdward Tomasz Napierala 
428321b17ecSEdward Tomasz Napierala 	/*
429321b17ecSEdward Tomasz Napierala 	 * Account for padding.  Note that due to the way code is written,
430321b17ecSEdward Tomasz Napierala 	 * the icl_pdu_receive_data_segment() must always receive padding
431321b17ecSEdward Tomasz Napierala 	 * along with the last part of data segment, because it would be
432321b17ecSEdward Tomasz Napierala 	 * impossible to tell whether we've already received the full data
433321b17ecSEdward Tomasz Napierala 	 * segment including padding, or without it.
434321b17ecSEdward Tomasz Napierala 	 */
435321b17ecSEdward Tomasz Napierala 	if ((len % 4) != 0)
436321b17ecSEdward Tomasz Napierala 		len += 4 - (len % 4);
437321b17ecSEdward Tomasz Napierala 
438321b17ecSEdward Tomasz Napierala #if 0
439321b17ecSEdward Tomasz Napierala 	ICL_DEBUG("need %zd bytes of data", len));
440321b17ecSEdward Tomasz Napierala #endif
441321b17ecSEdward Tomasz Napierala 
442321b17ecSEdward Tomasz Napierala 	return (len);
443321b17ecSEdward Tomasz Napierala }
444321b17ecSEdward Tomasz Napierala 
445321b17ecSEdward Tomasz Napierala static int
446321b17ecSEdward Tomasz Napierala icl_pdu_receive_data_segment(struct icl_pdu *request,
447321b17ecSEdward Tomasz Napierala     size_t *availablep, bool *more_neededp)
448321b17ecSEdward Tomasz Napierala {
449321b17ecSEdward Tomasz Napierala 	struct icl_conn *ic;
450321b17ecSEdward Tomasz Napierala 	size_t len, padding = 0;
451321b17ecSEdward Tomasz Napierala 	struct mbuf *m;
452321b17ecSEdward Tomasz Napierala 
453321b17ecSEdward Tomasz Napierala 	ic = request->ip_conn;
454321b17ecSEdward Tomasz Napierala 
455321b17ecSEdward Tomasz Napierala 	*more_neededp = false;
456321b17ecSEdward Tomasz Napierala 	ic->ic_receive_len = 0;
457321b17ecSEdward Tomasz Napierala 
458321b17ecSEdward Tomasz Napierala 	len = icl_pdu_data_segment_length(request);
459321b17ecSEdward Tomasz Napierala 	if (len == 0)
460321b17ecSEdward Tomasz Napierala 		return (0);
461321b17ecSEdward Tomasz Napierala 
462321b17ecSEdward Tomasz Napierala 	if ((len % 4) != 0)
463321b17ecSEdward Tomasz Napierala 		padding = 4 - (len % 4);
464321b17ecSEdward Tomasz Napierala 
465321b17ecSEdward Tomasz Napierala 	/*
466321b17ecSEdward Tomasz Napierala 	 * Account for already received parts of data segment.
467321b17ecSEdward Tomasz Napierala 	 */
468321b17ecSEdward Tomasz Napierala 	KASSERT(len > request->ip_data_len, ("len <= request->ip_data_len"));
469321b17ecSEdward Tomasz Napierala 	len -= request->ip_data_len;
470321b17ecSEdward Tomasz Napierala 
471321b17ecSEdward Tomasz Napierala 	if (len + padding > *availablep) {
472321b17ecSEdward Tomasz Napierala 		/*
473321b17ecSEdward Tomasz Napierala 		 * Not enough data in the socket buffer.  Receive as much
474321b17ecSEdward Tomasz Napierala 		 * as we can.  Don't receive padding, since, obviously, it's
475321b17ecSEdward Tomasz Napierala 		 * not the end of data segment yet.
476321b17ecSEdward Tomasz Napierala 		 */
477321b17ecSEdward Tomasz Napierala #if 0
478321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("limited from %zd to %zd",
479321b17ecSEdward Tomasz Napierala 		    len + padding, *availablep - padding));
480321b17ecSEdward Tomasz Napierala #endif
481321b17ecSEdward Tomasz Napierala 		len = *availablep - padding;
482321b17ecSEdward Tomasz Napierala 		*more_neededp = true;
483321b17ecSEdward Tomasz Napierala 		padding = 0;
484321b17ecSEdward Tomasz Napierala 	}
485321b17ecSEdward Tomasz Napierala 
486321b17ecSEdward Tomasz Napierala 	/*
487321b17ecSEdward Tomasz Napierala 	 * Must not try to receive padding without at least one byte
488321b17ecSEdward Tomasz Napierala 	 * of actual data segment.
489321b17ecSEdward Tomasz Napierala 	 */
490321b17ecSEdward Tomasz Napierala 	if (len > 0) {
491321b17ecSEdward Tomasz Napierala 		m = icl_conn_receive(request->ip_conn, len + padding);
492321b17ecSEdward Tomasz Napierala 		if (m == NULL) {
493321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("failed to receive data segment");
494321b17ecSEdward Tomasz Napierala 			return (-1);
495321b17ecSEdward Tomasz Napierala 		}
496321b17ecSEdward Tomasz Napierala 
497321b17ecSEdward Tomasz Napierala 		if (request->ip_data_mbuf == NULL)
498321b17ecSEdward Tomasz Napierala 			request->ip_data_mbuf = m;
499321b17ecSEdward Tomasz Napierala 		else
500321b17ecSEdward Tomasz Napierala 			m_cat(request->ip_data_mbuf, m);
501321b17ecSEdward Tomasz Napierala 
502321b17ecSEdward Tomasz Napierala 		request->ip_data_len += len;
503321b17ecSEdward Tomasz Napierala 		*availablep -= len + padding;
504321b17ecSEdward Tomasz Napierala 	} else
505321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("len 0");
506321b17ecSEdward Tomasz Napierala 
507321b17ecSEdward Tomasz Napierala 	if (*more_neededp)
508321b17ecSEdward Tomasz Napierala 		ic->ic_receive_len =
509321b17ecSEdward Tomasz Napierala 		    icl_pdu_data_segment_receive_len(request);
510321b17ecSEdward Tomasz Napierala 
511321b17ecSEdward Tomasz Napierala 	return (0);
512321b17ecSEdward Tomasz Napierala }
513321b17ecSEdward Tomasz Napierala 
514321b17ecSEdward Tomasz Napierala static int
515321b17ecSEdward Tomasz Napierala icl_pdu_check_data_digest(struct icl_pdu *request, size_t *availablep)
516321b17ecSEdward Tomasz Napierala {
517321b17ecSEdward Tomasz Napierala 	struct mbuf *m;
518321b17ecSEdward Tomasz Napierala 	uint32_t received_digest, valid_digest;
519321b17ecSEdward Tomasz Napierala 
520321b17ecSEdward Tomasz Napierala 	if (request->ip_conn->ic_data_crc32c == false)
521321b17ecSEdward Tomasz Napierala 		return (0);
522321b17ecSEdward Tomasz Napierala 
523321b17ecSEdward Tomasz Napierala 	if (request->ip_data_len == 0)
524321b17ecSEdward Tomasz Napierala 		return (0);
525321b17ecSEdward Tomasz Napierala 
526321b17ecSEdward Tomasz Napierala 	m = icl_conn_receive(request->ip_conn, ISCSI_DATA_DIGEST_SIZE);
527321b17ecSEdward Tomasz Napierala 	if (m == NULL) {
528321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("failed to receive data digest");
529321b17ecSEdward Tomasz Napierala 		return (-1);
530321b17ecSEdward Tomasz Napierala 	}
531321b17ecSEdward Tomasz Napierala 
532321b17ecSEdward Tomasz Napierala 	CTASSERT(sizeof(received_digest) == ISCSI_DATA_DIGEST_SIZE);
533321b17ecSEdward Tomasz Napierala 	m_copydata(m, 0, ISCSI_DATA_DIGEST_SIZE, (void *)&received_digest);
534321b17ecSEdward Tomasz Napierala 	m_freem(m);
535321b17ecSEdward Tomasz Napierala 
536321b17ecSEdward Tomasz Napierala 	*availablep -= ISCSI_DATA_DIGEST_SIZE;
537321b17ecSEdward Tomasz Napierala 
538321b17ecSEdward Tomasz Napierala 	/*
539321b17ecSEdward Tomasz Napierala 	 * Note that ip_data_mbuf also contains padding; since digest
540321b17ecSEdward Tomasz Napierala 	 * calculation is supposed to include that, we iterate over
541321b17ecSEdward Tomasz Napierala 	 * the entire ip_data_mbuf chain, not just ip_data_len bytes of it.
542321b17ecSEdward Tomasz Napierala 	 */
543321b17ecSEdward Tomasz Napierala 	valid_digest = icl_mbuf_to_crc32c(request->ip_data_mbuf);
544321b17ecSEdward Tomasz Napierala 	if (received_digest != valid_digest) {
545321b17ecSEdward Tomasz Napierala 		ICL_WARN("data digest check failed; got 0x%x, "
546321b17ecSEdward Tomasz Napierala 		    "should be 0x%x", received_digest, valid_digest);
547321b17ecSEdward Tomasz Napierala 		return (-1);
548321b17ecSEdward Tomasz Napierala 	}
549321b17ecSEdward Tomasz Napierala 
550321b17ecSEdward Tomasz Napierala 	return (0);
551321b17ecSEdward Tomasz Napierala }
552321b17ecSEdward Tomasz Napierala 
553321b17ecSEdward Tomasz Napierala /*
554321b17ecSEdward Tomasz Napierala  * Somewhat contrary to the name, this attempts to receive only one
555321b17ecSEdward Tomasz Napierala  * "part" of PDU at a time; call it repeatedly until it returns non-NULL.
556321b17ecSEdward Tomasz Napierala  */
557321b17ecSEdward Tomasz Napierala static struct icl_pdu *
558321b17ecSEdward Tomasz Napierala icl_conn_receive_pdu(struct icl_conn *ic, size_t *availablep)
559321b17ecSEdward Tomasz Napierala {
560321b17ecSEdward Tomasz Napierala 	struct icl_pdu *request;
561321b17ecSEdward Tomasz Napierala 	struct socket *so;
562321b17ecSEdward Tomasz Napierala 	size_t len;
563321b17ecSEdward Tomasz Napierala 	int error;
564321b17ecSEdward Tomasz Napierala 	bool more_needed;
565321b17ecSEdward Tomasz Napierala 
566321b17ecSEdward Tomasz Napierala 	so = ic->ic_socket;
567321b17ecSEdward Tomasz Napierala 
568321b17ecSEdward Tomasz Napierala 	if (ic->ic_receive_state == ICL_CONN_STATE_BHS) {
569321b17ecSEdward Tomasz Napierala 		KASSERT(ic->ic_receive_pdu == NULL,
570321b17ecSEdward Tomasz Napierala 		    ("ic->ic_receive_pdu != NULL"));
571321b17ecSEdward Tomasz Napierala 		request = icl_pdu_new_empty(ic, M_NOWAIT);
572321b17ecSEdward Tomasz Napierala 		if (request == NULL) {
573321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("failed to allocate PDU; "
574321b17ecSEdward Tomasz Napierala 			    "dropping connection");
575321b17ecSEdward Tomasz Napierala 			icl_conn_fail(ic);
576321b17ecSEdward Tomasz Napierala 			return (NULL);
577321b17ecSEdward Tomasz Napierala 		}
578321b17ecSEdward Tomasz Napierala 		ic->ic_receive_pdu = request;
579321b17ecSEdward Tomasz Napierala 	} else {
580321b17ecSEdward Tomasz Napierala 		KASSERT(ic->ic_receive_pdu != NULL,
581321b17ecSEdward Tomasz Napierala 		    ("ic->ic_receive_pdu == NULL"));
582321b17ecSEdward Tomasz Napierala 		request = ic->ic_receive_pdu;
583321b17ecSEdward Tomasz Napierala 	}
584321b17ecSEdward Tomasz Napierala 
585321b17ecSEdward Tomasz Napierala 	if (*availablep < ic->ic_receive_len) {
586321b17ecSEdward Tomasz Napierala #if 0
587321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("not enough data; need %zd, "
588321b17ecSEdward Tomasz Napierala 		    "have %zd", ic->ic_receive_len, *availablep);
589321b17ecSEdward Tomasz Napierala #endif
590321b17ecSEdward Tomasz Napierala 		return (NULL);
591321b17ecSEdward Tomasz Napierala 	}
592321b17ecSEdward Tomasz Napierala 
593321b17ecSEdward Tomasz Napierala 	switch (ic->ic_receive_state) {
594321b17ecSEdward Tomasz Napierala 	case ICL_CONN_STATE_BHS:
595321b17ecSEdward Tomasz Napierala 		//ICL_DEBUG("receiving BHS");
596321b17ecSEdward Tomasz Napierala 		error = icl_pdu_receive_bhs(request, availablep);
597321b17ecSEdward Tomasz Napierala 		if (error != 0) {
598321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("failed to receive BHS; "
599321b17ecSEdward Tomasz Napierala 			    "dropping connection");
600321b17ecSEdward Tomasz Napierala 			break;
601321b17ecSEdward Tomasz Napierala 		}
602321b17ecSEdward Tomasz Napierala 
603321b17ecSEdward Tomasz Napierala 		/*
604321b17ecSEdward Tomasz Napierala 		 * We don't enforce any limit for AHS length;
605321b17ecSEdward Tomasz Napierala 		 * its length is stored in 8 bit field.
606321b17ecSEdward Tomasz Napierala 		 */
607321b17ecSEdward Tomasz Napierala 
608321b17ecSEdward Tomasz Napierala 		len = icl_pdu_data_segment_length(request);
609321b17ecSEdward Tomasz Napierala 		if (len > ic->ic_max_data_segment_length) {
610321b17ecSEdward Tomasz Napierala 			ICL_WARN("received data segment "
611321b17ecSEdward Tomasz Napierala 			    "length %zd is larger than negotiated "
612321b17ecSEdward Tomasz Napierala 			    "MaxDataSegmentLength %zd; "
613321b17ecSEdward Tomasz Napierala 			    "dropping connection",
614321b17ecSEdward Tomasz Napierala 			    len, ic->ic_max_data_segment_length);
615321b17ecSEdward Tomasz Napierala 			error = EINVAL;
616321b17ecSEdward Tomasz Napierala 			break;
617321b17ecSEdward Tomasz Napierala 		}
618321b17ecSEdward Tomasz Napierala 
619321b17ecSEdward Tomasz Napierala 		ic->ic_receive_state = ICL_CONN_STATE_AHS;
620321b17ecSEdward Tomasz Napierala 		ic->ic_receive_len = icl_pdu_ahs_length(request);
621321b17ecSEdward Tomasz Napierala 		break;
622321b17ecSEdward Tomasz Napierala 
623321b17ecSEdward Tomasz Napierala 	case ICL_CONN_STATE_AHS:
624321b17ecSEdward Tomasz Napierala 		//ICL_DEBUG("receiving AHS");
625321b17ecSEdward Tomasz Napierala 		error = icl_pdu_receive_ahs(request, availablep);
626321b17ecSEdward Tomasz Napierala 		if (error != 0) {
627321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("failed to receive AHS; "
628321b17ecSEdward Tomasz Napierala 			    "dropping connection");
629321b17ecSEdward Tomasz Napierala 			break;
630321b17ecSEdward Tomasz Napierala 		}
631321b17ecSEdward Tomasz Napierala 		ic->ic_receive_state = ICL_CONN_STATE_HEADER_DIGEST;
632321b17ecSEdward Tomasz Napierala 		if (ic->ic_header_crc32c == false)
633321b17ecSEdward Tomasz Napierala 			ic->ic_receive_len = 0;
634321b17ecSEdward Tomasz Napierala 		else
635321b17ecSEdward Tomasz Napierala 			ic->ic_receive_len = ISCSI_HEADER_DIGEST_SIZE;
636321b17ecSEdward Tomasz Napierala 		break;
637321b17ecSEdward Tomasz Napierala 
638321b17ecSEdward Tomasz Napierala 	case ICL_CONN_STATE_HEADER_DIGEST:
639321b17ecSEdward Tomasz Napierala 		//ICL_DEBUG("receiving header digest");
640321b17ecSEdward Tomasz Napierala 		error = icl_pdu_check_header_digest(request, availablep);
641321b17ecSEdward Tomasz Napierala 		if (error != 0) {
642321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("header digest failed; "
643321b17ecSEdward Tomasz Napierala 			    "dropping connection");
644321b17ecSEdward Tomasz Napierala 			break;
645321b17ecSEdward Tomasz Napierala 		}
646321b17ecSEdward Tomasz Napierala 
647321b17ecSEdward Tomasz Napierala 		ic->ic_receive_state = ICL_CONN_STATE_DATA;
648321b17ecSEdward Tomasz Napierala 		ic->ic_receive_len =
649321b17ecSEdward Tomasz Napierala 		    icl_pdu_data_segment_receive_len(request);
650321b17ecSEdward Tomasz Napierala 		break;
651321b17ecSEdward Tomasz Napierala 
652321b17ecSEdward Tomasz Napierala 	case ICL_CONN_STATE_DATA:
653321b17ecSEdward Tomasz Napierala 		//ICL_DEBUG("receiving data segment");
654321b17ecSEdward Tomasz Napierala 		error = icl_pdu_receive_data_segment(request, availablep,
655321b17ecSEdward Tomasz Napierala 		    &more_needed);
656321b17ecSEdward Tomasz Napierala 		if (error != 0) {
657321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("failed to receive data segment;"
658321b17ecSEdward Tomasz Napierala 			    "dropping connection");
659321b17ecSEdward Tomasz Napierala 			break;
660321b17ecSEdward Tomasz Napierala 		}
661321b17ecSEdward Tomasz Napierala 
662321b17ecSEdward Tomasz Napierala 		if (more_needed)
663321b17ecSEdward Tomasz Napierala 			break;
664321b17ecSEdward Tomasz Napierala 
665321b17ecSEdward Tomasz Napierala 		ic->ic_receive_state = ICL_CONN_STATE_DATA_DIGEST;
666321b17ecSEdward Tomasz Napierala 		if (request->ip_data_len == 0 || ic->ic_data_crc32c == false)
667321b17ecSEdward Tomasz Napierala 			ic->ic_receive_len = 0;
668321b17ecSEdward Tomasz Napierala 		else
669321b17ecSEdward Tomasz Napierala 			ic->ic_receive_len = ISCSI_DATA_DIGEST_SIZE;
670321b17ecSEdward Tomasz Napierala 		break;
671321b17ecSEdward Tomasz Napierala 
672321b17ecSEdward Tomasz Napierala 	case ICL_CONN_STATE_DATA_DIGEST:
673321b17ecSEdward Tomasz Napierala 		//ICL_DEBUG("receiving data digest");
674321b17ecSEdward Tomasz Napierala 		error = icl_pdu_check_data_digest(request, availablep);
675321b17ecSEdward Tomasz Napierala 		if (error != 0) {
676321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("data digest failed; "
677321b17ecSEdward Tomasz Napierala 			    "dropping connection");
678321b17ecSEdward Tomasz Napierala 			break;
679321b17ecSEdward Tomasz Napierala 		}
680321b17ecSEdward Tomasz Napierala 
681321b17ecSEdward Tomasz Napierala 		/*
682321b17ecSEdward Tomasz Napierala 		 * We've received complete PDU; reset the receive state machine
683321b17ecSEdward Tomasz Napierala 		 * and return the PDU.
684321b17ecSEdward Tomasz Napierala 		 */
685321b17ecSEdward Tomasz Napierala 		ic->ic_receive_state = ICL_CONN_STATE_BHS;
686321b17ecSEdward Tomasz Napierala 		ic->ic_receive_len = sizeof(struct iscsi_bhs);
687321b17ecSEdward Tomasz Napierala 		ic->ic_receive_pdu = NULL;
688321b17ecSEdward Tomasz Napierala 		return (request);
689321b17ecSEdward Tomasz Napierala 
690321b17ecSEdward Tomasz Napierala 	default:
691321b17ecSEdward Tomasz Napierala 		panic("invalid ic_receive_state %d\n", ic->ic_receive_state);
692321b17ecSEdward Tomasz Napierala 	}
693321b17ecSEdward Tomasz Napierala 
694321b17ecSEdward Tomasz Napierala 	if (error != 0) {
695321b17ecSEdward Tomasz Napierala 		/*
696321b17ecSEdward Tomasz Napierala 		 * Don't free the PDU; it's pointed to by ic->ic_receive_pdu
6975aabcd7cSEdward Tomasz Napierala 		 * and will get freed in icl_soft_conn_close().
698321b17ecSEdward Tomasz Napierala 		 */
699321b17ecSEdward Tomasz Napierala 		icl_conn_fail(ic);
700321b17ecSEdward Tomasz Napierala 	}
701321b17ecSEdward Tomasz Napierala 
702321b17ecSEdward Tomasz Napierala 	return (NULL);
703321b17ecSEdward Tomasz Napierala }
704321b17ecSEdward Tomasz Napierala 
705321b17ecSEdward Tomasz Napierala static void
706321b17ecSEdward Tomasz Napierala icl_conn_receive_pdus(struct icl_conn *ic, size_t available)
707321b17ecSEdward Tomasz Napierala {
708321b17ecSEdward Tomasz Napierala 	struct icl_pdu *response;
709321b17ecSEdward Tomasz Napierala 	struct socket *so;
710321b17ecSEdward Tomasz Napierala 
711321b17ecSEdward Tomasz Napierala 	so = ic->ic_socket;
712321b17ecSEdward Tomasz Napierala 
713321b17ecSEdward Tomasz Napierala 	/*
714321b17ecSEdward Tomasz Napierala 	 * This can never happen; we're careful to only mess with ic->ic_socket
715321b17ecSEdward Tomasz Napierala 	 * pointer when the send/receive threads are not running.
716321b17ecSEdward Tomasz Napierala 	 */
717321b17ecSEdward Tomasz Napierala 	KASSERT(so != NULL, ("NULL socket"));
718321b17ecSEdward Tomasz Napierala 
719321b17ecSEdward Tomasz Napierala 	for (;;) {
720321b17ecSEdward Tomasz Napierala 		if (ic->ic_disconnecting)
721321b17ecSEdward Tomasz Napierala 			return;
722321b17ecSEdward Tomasz Napierala 
723321b17ecSEdward Tomasz Napierala 		if (so->so_error != 0) {
724321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("connection error %d; "
725321b17ecSEdward Tomasz Napierala 			    "dropping connection", so->so_error);
726321b17ecSEdward Tomasz Napierala 			icl_conn_fail(ic);
727321b17ecSEdward Tomasz Napierala 			return;
728321b17ecSEdward Tomasz Napierala 		}
729321b17ecSEdward Tomasz Napierala 
730321b17ecSEdward Tomasz Napierala 		/*
731321b17ecSEdward Tomasz Napierala 		 * Loop until we have a complete PDU or there is not enough
732321b17ecSEdward Tomasz Napierala 		 * data in the socket buffer.
733321b17ecSEdward Tomasz Napierala 		 */
734321b17ecSEdward Tomasz Napierala 		if (available < ic->ic_receive_len) {
735321b17ecSEdward Tomasz Napierala #if 0
736321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("not enough data; have %zd, "
737321b17ecSEdward Tomasz Napierala 			    "need %zd", available,
738321b17ecSEdward Tomasz Napierala 			    ic->ic_receive_len);
739321b17ecSEdward Tomasz Napierala #endif
740321b17ecSEdward Tomasz Napierala 			return;
741321b17ecSEdward Tomasz Napierala 		}
742321b17ecSEdward Tomasz Napierala 
743321b17ecSEdward Tomasz Napierala 		response = icl_conn_receive_pdu(ic, &available);
744321b17ecSEdward Tomasz Napierala 		if (response == NULL)
745321b17ecSEdward Tomasz Napierala 			continue;
746321b17ecSEdward Tomasz Napierala 
747321b17ecSEdward Tomasz Napierala 		if (response->ip_ahs_len > 0) {
748321b17ecSEdward Tomasz Napierala 			ICL_WARN("received PDU with unsupported "
749321b17ecSEdward Tomasz Napierala 			    "AHS; opcode 0x%x; dropping connection",
750321b17ecSEdward Tomasz Napierala 			    response->ip_bhs->bhs_opcode);
751321b17ecSEdward Tomasz Napierala 			icl_pdu_free(response);
752321b17ecSEdward Tomasz Napierala 			icl_conn_fail(ic);
753321b17ecSEdward Tomasz Napierala 			return;
754321b17ecSEdward Tomasz Napierala 		}
755321b17ecSEdward Tomasz Napierala 
756321b17ecSEdward Tomasz Napierala 		(ic->ic_receive)(response);
757321b17ecSEdward Tomasz Napierala 	}
758321b17ecSEdward Tomasz Napierala }
759321b17ecSEdward Tomasz Napierala 
760321b17ecSEdward Tomasz Napierala static void
761321b17ecSEdward Tomasz Napierala icl_receive_thread(void *arg)
762321b17ecSEdward Tomasz Napierala {
763321b17ecSEdward Tomasz Napierala 	struct icl_conn *ic;
764321b17ecSEdward Tomasz Napierala 	size_t available;
765321b17ecSEdward Tomasz Napierala 	struct socket *so;
766321b17ecSEdward Tomasz Napierala 
767321b17ecSEdward Tomasz Napierala 	ic = arg;
768321b17ecSEdward Tomasz Napierala 	so = ic->ic_socket;
769321b17ecSEdward Tomasz Napierala 
770321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK(ic);
771321b17ecSEdward Tomasz Napierala 	ic->ic_receive_running = true;
772321b17ecSEdward Tomasz Napierala 	ICL_CONN_UNLOCK(ic);
773321b17ecSEdward Tomasz Napierala 
774321b17ecSEdward Tomasz Napierala 	for (;;) {
775321b17ecSEdward Tomasz Napierala 		if (ic->ic_disconnecting) {
776321b17ecSEdward Tomasz Napierala 			//ICL_DEBUG("terminating");
777321b17ecSEdward Tomasz Napierala 			break;
778321b17ecSEdward Tomasz Napierala 		}
779321b17ecSEdward Tomasz Napierala 
780321b17ecSEdward Tomasz Napierala 		/*
781321b17ecSEdward Tomasz Napierala 		 * Set the low watermark, to be checked by
782321b17ecSEdward Tomasz Napierala 		 * soreadable() in icl_soupcall_receive()
783321b17ecSEdward Tomasz Napierala 		 * to avoid unneccessary wakeups until there
784321b17ecSEdward Tomasz Napierala 		 * is enough data received to read the PDU.
785321b17ecSEdward Tomasz Napierala 		 */
786321b17ecSEdward Tomasz Napierala 		SOCKBUF_LOCK(&so->so_rcv);
787321b17ecSEdward Tomasz Napierala 		available = sbavail(&so->so_rcv);
788321b17ecSEdward Tomasz Napierala 		if (available < ic->ic_receive_len) {
789321b17ecSEdward Tomasz Napierala 			so->so_rcv.sb_lowat = ic->ic_receive_len;
790321b17ecSEdward Tomasz Napierala 			cv_wait(&ic->ic_receive_cv, &so->so_rcv.sb_mtx);
791321b17ecSEdward Tomasz Napierala 		} else
792321b17ecSEdward Tomasz Napierala 			so->so_rcv.sb_lowat = so->so_rcv.sb_hiwat + 1;
793321b17ecSEdward Tomasz Napierala 		SOCKBUF_UNLOCK(&so->so_rcv);
794321b17ecSEdward Tomasz Napierala 
795321b17ecSEdward Tomasz Napierala 		icl_conn_receive_pdus(ic, available);
796321b17ecSEdward Tomasz Napierala 	}
797321b17ecSEdward Tomasz Napierala 
798321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK(ic);
799321b17ecSEdward Tomasz Napierala 	ic->ic_receive_running = false;
800321b17ecSEdward Tomasz Napierala 	cv_signal(&ic->ic_send_cv);
801321b17ecSEdward Tomasz Napierala 	ICL_CONN_UNLOCK(ic);
802321b17ecSEdward Tomasz Napierala 	kthread_exit();
803321b17ecSEdward Tomasz Napierala }
804321b17ecSEdward Tomasz Napierala 
805321b17ecSEdward Tomasz Napierala static int
806321b17ecSEdward Tomasz Napierala icl_soupcall_receive(struct socket *so, void *arg, int waitflag)
807321b17ecSEdward Tomasz Napierala {
808321b17ecSEdward Tomasz Napierala 	struct icl_conn *ic;
809321b17ecSEdward Tomasz Napierala 
810321b17ecSEdward Tomasz Napierala 	if (!soreadable(so))
811321b17ecSEdward Tomasz Napierala 		return (SU_OK);
812321b17ecSEdward Tomasz Napierala 
813321b17ecSEdward Tomasz Napierala 	ic = arg;
814321b17ecSEdward Tomasz Napierala 	cv_signal(&ic->ic_receive_cv);
815321b17ecSEdward Tomasz Napierala 	return (SU_OK);
816321b17ecSEdward Tomasz Napierala }
817321b17ecSEdward Tomasz Napierala 
818321b17ecSEdward Tomasz Napierala static int
819321b17ecSEdward Tomasz Napierala icl_pdu_finalize(struct icl_pdu *request)
820321b17ecSEdward Tomasz Napierala {
821321b17ecSEdward Tomasz Napierala 	size_t padding, pdu_len;
822321b17ecSEdward Tomasz Napierala 	uint32_t digest, zero = 0;
823321b17ecSEdward Tomasz Napierala 	int ok;
824321b17ecSEdward Tomasz Napierala 	struct icl_conn *ic;
825321b17ecSEdward Tomasz Napierala 
826321b17ecSEdward Tomasz Napierala 	ic = request->ip_conn;
827321b17ecSEdward Tomasz Napierala 
828321b17ecSEdward Tomasz Napierala 	icl_pdu_set_data_segment_length(request, request->ip_data_len);
829321b17ecSEdward Tomasz Napierala 
830321b17ecSEdward Tomasz Napierala 	pdu_len = icl_pdu_size(request);
831321b17ecSEdward Tomasz Napierala 
832321b17ecSEdward Tomasz Napierala 	if (ic->ic_header_crc32c) {
833321b17ecSEdward Tomasz Napierala 		digest = icl_mbuf_to_crc32c(request->ip_bhs_mbuf);
834321b17ecSEdward Tomasz Napierala 		ok = m_append(request->ip_bhs_mbuf, sizeof(digest),
835321b17ecSEdward Tomasz Napierala 		    (void *)&digest);
836321b17ecSEdward Tomasz Napierala 		if (ok != 1) {
837321b17ecSEdward Tomasz Napierala 			ICL_WARN("failed to append header digest");
838321b17ecSEdward Tomasz Napierala 			return (1);
839321b17ecSEdward Tomasz Napierala 		}
840321b17ecSEdward Tomasz Napierala 	}
841321b17ecSEdward Tomasz Napierala 
842321b17ecSEdward Tomasz Napierala 	if (request->ip_data_len != 0) {
843321b17ecSEdward Tomasz Napierala 		padding = icl_pdu_padding(request);
844321b17ecSEdward Tomasz Napierala 		if (padding > 0) {
845321b17ecSEdward Tomasz Napierala 			ok = m_append(request->ip_data_mbuf, padding,
846321b17ecSEdward Tomasz Napierala 			    (void *)&zero);
847321b17ecSEdward Tomasz Napierala 			if (ok != 1) {
848321b17ecSEdward Tomasz Napierala 				ICL_WARN("failed to append padding");
849321b17ecSEdward Tomasz Napierala 				return (1);
850321b17ecSEdward Tomasz Napierala 			}
851321b17ecSEdward Tomasz Napierala 		}
852321b17ecSEdward Tomasz Napierala 
853321b17ecSEdward Tomasz Napierala 		if (ic->ic_data_crc32c) {
854321b17ecSEdward Tomasz Napierala 			digest = icl_mbuf_to_crc32c(request->ip_data_mbuf);
855321b17ecSEdward Tomasz Napierala 
856321b17ecSEdward Tomasz Napierala 			ok = m_append(request->ip_data_mbuf, sizeof(digest),
857321b17ecSEdward Tomasz Napierala 			    (void *)&digest);
858321b17ecSEdward Tomasz Napierala 			if (ok != 1) {
859321b17ecSEdward Tomasz Napierala 				ICL_WARN("failed to append data digest");
860321b17ecSEdward Tomasz Napierala 				return (1);
861321b17ecSEdward Tomasz Napierala 			}
862321b17ecSEdward Tomasz Napierala 		}
863321b17ecSEdward Tomasz Napierala 
864321b17ecSEdward Tomasz Napierala 		m_cat(request->ip_bhs_mbuf, request->ip_data_mbuf);
865321b17ecSEdward Tomasz Napierala 		request->ip_data_mbuf = NULL;
866321b17ecSEdward Tomasz Napierala 	}
867321b17ecSEdward Tomasz Napierala 
868321b17ecSEdward Tomasz Napierala 	request->ip_bhs_mbuf->m_pkthdr.len = pdu_len;
869321b17ecSEdward Tomasz Napierala 
870321b17ecSEdward Tomasz Napierala 	return (0);
871321b17ecSEdward Tomasz Napierala }
872321b17ecSEdward Tomasz Napierala 
873321b17ecSEdward Tomasz Napierala static void
874321b17ecSEdward Tomasz Napierala icl_conn_send_pdus(struct icl_conn *ic, struct icl_pdu_stailq *queue)
875321b17ecSEdward Tomasz Napierala {
876321b17ecSEdward Tomasz Napierala 	struct icl_pdu *request, *request2;
877321b17ecSEdward Tomasz Napierala 	struct socket *so;
878321b17ecSEdward Tomasz Napierala 	size_t available, size, size2;
879321b17ecSEdward Tomasz Napierala 	int coalesced, error;
880321b17ecSEdward Tomasz Napierala 
881321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK_ASSERT_NOT(ic);
882321b17ecSEdward Tomasz Napierala 
883321b17ecSEdward Tomasz Napierala 	so = ic->ic_socket;
884321b17ecSEdward Tomasz Napierala 
885321b17ecSEdward Tomasz Napierala 	SOCKBUF_LOCK(&so->so_snd);
886321b17ecSEdward Tomasz Napierala 	/*
887321b17ecSEdward Tomasz Napierala 	 * Check how much space do we have for transmit.  We can't just
888321b17ecSEdward Tomasz Napierala 	 * call sosend() and retry when we get EWOULDBLOCK or EMSGSIZE,
889321b17ecSEdward Tomasz Napierala 	 * as it always frees the mbuf chain passed to it, even in case
890321b17ecSEdward Tomasz Napierala 	 * of error.
891321b17ecSEdward Tomasz Napierala 	 */
892321b17ecSEdward Tomasz Napierala 	available = sbspace(&so->so_snd);
893321b17ecSEdward Tomasz Napierala 
894321b17ecSEdward Tomasz Napierala 	/*
895321b17ecSEdward Tomasz Napierala 	 * Notify the socket upcall that we don't need wakeups
896321b17ecSEdward Tomasz Napierala 	 * for the time being.
897321b17ecSEdward Tomasz Napierala 	 */
898321b17ecSEdward Tomasz Napierala 	so->so_snd.sb_lowat = so->so_snd.sb_hiwat + 1;
899321b17ecSEdward Tomasz Napierala 	SOCKBUF_UNLOCK(&so->so_snd);
900321b17ecSEdward Tomasz Napierala 
901321b17ecSEdward Tomasz Napierala 	while (!STAILQ_EMPTY(queue)) {
902321b17ecSEdward Tomasz Napierala 		request = STAILQ_FIRST(queue);
903321b17ecSEdward Tomasz Napierala 		size = icl_pdu_size(request);
904321b17ecSEdward Tomasz Napierala 		if (available < size) {
905321b17ecSEdward Tomasz Napierala 
906321b17ecSEdward Tomasz Napierala 			/*
907321b17ecSEdward Tomasz Napierala 			 * Set the low watermark, to be checked by
908321b17ecSEdward Tomasz Napierala 			 * sowriteable() in icl_soupcall_send()
909321b17ecSEdward Tomasz Napierala 			 * to avoid unneccessary wakeups until there
910321b17ecSEdward Tomasz Napierala 			 * is enough space for the PDU to fit.
911321b17ecSEdward Tomasz Napierala 			 */
912321b17ecSEdward Tomasz Napierala 			SOCKBUF_LOCK(&so->so_snd);
913321b17ecSEdward Tomasz Napierala 			available = sbspace(&so->so_snd);
914321b17ecSEdward Tomasz Napierala 			if (available < size) {
915321b17ecSEdward Tomasz Napierala #if 1
916321b17ecSEdward Tomasz Napierala 				ICL_DEBUG("no space to send; "
917321b17ecSEdward Tomasz Napierala 				    "have %zd, need %zd",
918321b17ecSEdward Tomasz Napierala 				    available, size);
919321b17ecSEdward Tomasz Napierala #endif
920321b17ecSEdward Tomasz Napierala 				so->so_snd.sb_lowat = size;
921321b17ecSEdward Tomasz Napierala 				SOCKBUF_UNLOCK(&so->so_snd);
922321b17ecSEdward Tomasz Napierala 				return;
923321b17ecSEdward Tomasz Napierala 			}
924321b17ecSEdward Tomasz Napierala 			SOCKBUF_UNLOCK(&so->so_snd);
925321b17ecSEdward Tomasz Napierala 		}
926321b17ecSEdward Tomasz Napierala 		STAILQ_REMOVE_HEAD(queue, ip_next);
927321b17ecSEdward Tomasz Napierala 		error = icl_pdu_finalize(request);
928321b17ecSEdward Tomasz Napierala 		if (error != 0) {
929321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("failed to finalize PDU; "
930321b17ecSEdward Tomasz Napierala 			    "dropping connection");
931321b17ecSEdward Tomasz Napierala 			icl_conn_fail(ic);
932321b17ecSEdward Tomasz Napierala 			icl_pdu_free(request);
933321b17ecSEdward Tomasz Napierala 			return;
934321b17ecSEdward Tomasz Napierala 		}
935321b17ecSEdward Tomasz Napierala 		if (coalesce) {
936321b17ecSEdward Tomasz Napierala 			coalesced = 1;
937321b17ecSEdward Tomasz Napierala 			for (;;) {
938321b17ecSEdward Tomasz Napierala 				request2 = STAILQ_FIRST(queue);
939321b17ecSEdward Tomasz Napierala 				if (request2 == NULL)
940321b17ecSEdward Tomasz Napierala 					break;
941321b17ecSEdward Tomasz Napierala 				size2 = icl_pdu_size(request2);
942321b17ecSEdward Tomasz Napierala 				if (available < size + size2)
943321b17ecSEdward Tomasz Napierala 					break;
944321b17ecSEdward Tomasz Napierala 				STAILQ_REMOVE_HEAD(queue, ip_next);
945321b17ecSEdward Tomasz Napierala 				error = icl_pdu_finalize(request2);
946321b17ecSEdward Tomasz Napierala 				if (error != 0) {
947321b17ecSEdward Tomasz Napierala 					ICL_DEBUG("failed to finalize PDU; "
948321b17ecSEdward Tomasz Napierala 					    "dropping connection");
949321b17ecSEdward Tomasz Napierala 					icl_conn_fail(ic);
950321b17ecSEdward Tomasz Napierala 					icl_pdu_free(request);
951321b17ecSEdward Tomasz Napierala 					icl_pdu_free(request2);
952321b17ecSEdward Tomasz Napierala 					return;
953321b17ecSEdward Tomasz Napierala 				}
954321b17ecSEdward Tomasz Napierala 				m_cat(request->ip_bhs_mbuf, request2->ip_bhs_mbuf);
955321b17ecSEdward Tomasz Napierala 				request2->ip_bhs_mbuf = NULL;
956321b17ecSEdward Tomasz Napierala 				request->ip_bhs_mbuf->m_pkthdr.len += size2;
957321b17ecSEdward Tomasz Napierala 				size += size2;
958321b17ecSEdward Tomasz Napierala 				STAILQ_REMOVE_AFTER(queue, request, ip_next);
959321b17ecSEdward Tomasz Napierala 				icl_pdu_free(request2);
960321b17ecSEdward Tomasz Napierala 				coalesced++;
961321b17ecSEdward Tomasz Napierala 			}
962321b17ecSEdward Tomasz Napierala #if 0
963321b17ecSEdward Tomasz Napierala 			if (coalesced > 1) {
964321b17ecSEdward Tomasz Napierala 				ICL_DEBUG("coalesced %d PDUs into %zd bytes",
965321b17ecSEdward Tomasz Napierala 				    coalesced, size);
966321b17ecSEdward Tomasz Napierala 			}
967321b17ecSEdward Tomasz Napierala #endif
968321b17ecSEdward Tomasz Napierala 		}
969321b17ecSEdward Tomasz Napierala 		available -= size;
970321b17ecSEdward Tomasz Napierala 		error = sosend(so, NULL, NULL, request->ip_bhs_mbuf,
971321b17ecSEdward Tomasz Napierala 		    NULL, MSG_DONTWAIT, curthread);
972321b17ecSEdward Tomasz Napierala 		request->ip_bhs_mbuf = NULL; /* Sosend consumes the mbuf. */
973321b17ecSEdward Tomasz Napierala 		if (error != 0) {
974321b17ecSEdward Tomasz Napierala 			ICL_DEBUG("failed to send PDU, error %d; "
975321b17ecSEdward Tomasz Napierala 			    "dropping connection", error);
976321b17ecSEdward Tomasz Napierala 			icl_conn_fail(ic);
977321b17ecSEdward Tomasz Napierala 			icl_pdu_free(request);
978321b17ecSEdward Tomasz Napierala 			return;
979321b17ecSEdward Tomasz Napierala 		}
980321b17ecSEdward Tomasz Napierala 		icl_pdu_free(request);
981321b17ecSEdward Tomasz Napierala 	}
982321b17ecSEdward Tomasz Napierala }
983321b17ecSEdward Tomasz Napierala 
984321b17ecSEdward Tomasz Napierala static void
985321b17ecSEdward Tomasz Napierala icl_send_thread(void *arg)
986321b17ecSEdward Tomasz Napierala {
987321b17ecSEdward Tomasz Napierala 	struct icl_conn *ic;
988321b17ecSEdward Tomasz Napierala 	struct icl_pdu_stailq queue;
989321b17ecSEdward Tomasz Napierala 
990321b17ecSEdward Tomasz Napierala 	ic = arg;
991321b17ecSEdward Tomasz Napierala 
992321b17ecSEdward Tomasz Napierala 	STAILQ_INIT(&queue);
993321b17ecSEdward Tomasz Napierala 
994321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK(ic);
995321b17ecSEdward Tomasz Napierala 	ic->ic_send_running = true;
996321b17ecSEdward Tomasz Napierala 
997321b17ecSEdward Tomasz Napierala 	for (;;) {
998321b17ecSEdward Tomasz Napierala 		for (;;) {
999321b17ecSEdward Tomasz Napierala 			/*
1000321b17ecSEdward Tomasz Napierala 			 * If the local queue is empty, populate it from
1001321b17ecSEdward Tomasz Napierala 			 * the main one.  This way the icl_conn_send_pdus()
1002321b17ecSEdward Tomasz Napierala 			 * can go through all the queued PDUs without holding
1003321b17ecSEdward Tomasz Napierala 			 * any locks.
1004321b17ecSEdward Tomasz Napierala 			 */
1005321b17ecSEdward Tomasz Napierala 			if (STAILQ_EMPTY(&queue))
1006321b17ecSEdward Tomasz Napierala 				STAILQ_SWAP(&ic->ic_to_send, &queue, icl_pdu);
1007321b17ecSEdward Tomasz Napierala 
1008321b17ecSEdward Tomasz Napierala 			ic->ic_check_send_space = false;
1009321b17ecSEdward Tomasz Napierala 			ICL_CONN_UNLOCK(ic);
1010321b17ecSEdward Tomasz Napierala 			icl_conn_send_pdus(ic, &queue);
1011321b17ecSEdward Tomasz Napierala 			ICL_CONN_LOCK(ic);
1012321b17ecSEdward Tomasz Napierala 
1013321b17ecSEdward Tomasz Napierala 			/*
1014321b17ecSEdward Tomasz Napierala 			 * The icl_soupcall_send() was called since the last
1015321b17ecSEdward Tomasz Napierala 			 * call to sbspace(); go around;
1016321b17ecSEdward Tomasz Napierala 			 */
1017321b17ecSEdward Tomasz Napierala 			if (ic->ic_check_send_space)
1018321b17ecSEdward Tomasz Napierala 				continue;
1019321b17ecSEdward Tomasz Napierala 
1020321b17ecSEdward Tomasz Napierala 			/*
1021321b17ecSEdward Tomasz Napierala 			 * Local queue is empty, but we still have PDUs
1022321b17ecSEdward Tomasz Napierala 			 * in the main one; go around.
1023321b17ecSEdward Tomasz Napierala 			 */
1024321b17ecSEdward Tomasz Napierala 			if (STAILQ_EMPTY(&queue) &&
1025321b17ecSEdward Tomasz Napierala 			    !STAILQ_EMPTY(&ic->ic_to_send))
1026321b17ecSEdward Tomasz Napierala 				continue;
1027321b17ecSEdward Tomasz Napierala 
1028321b17ecSEdward Tomasz Napierala 			/*
1029321b17ecSEdward Tomasz Napierala 			 * There might be some stuff in the local queue,
1030321b17ecSEdward Tomasz Napierala 			 * which didn't get sent due to not having enough send
1031321b17ecSEdward Tomasz Napierala 			 * space.  Wait for socket upcall.
1032321b17ecSEdward Tomasz Napierala 			 */
1033321b17ecSEdward Tomasz Napierala 			break;
1034321b17ecSEdward Tomasz Napierala 		}
1035321b17ecSEdward Tomasz Napierala 
1036321b17ecSEdward Tomasz Napierala 		if (ic->ic_disconnecting) {
1037321b17ecSEdward Tomasz Napierala 			//ICL_DEBUG("terminating");
1038321b17ecSEdward Tomasz Napierala 			break;
1039321b17ecSEdward Tomasz Napierala 		}
1040321b17ecSEdward Tomasz Napierala 
1041321b17ecSEdward Tomasz Napierala 		cv_wait(&ic->ic_send_cv, ic->ic_lock);
1042321b17ecSEdward Tomasz Napierala 	}
1043321b17ecSEdward Tomasz Napierala 
1044321b17ecSEdward Tomasz Napierala 	/*
1045321b17ecSEdward Tomasz Napierala 	 * We're exiting; move PDUs back to the main queue, so they can
1046321b17ecSEdward Tomasz Napierala 	 * get freed properly.  At this point ordering doesn't matter.
1047321b17ecSEdward Tomasz Napierala 	 */
1048321b17ecSEdward Tomasz Napierala 	STAILQ_CONCAT(&ic->ic_to_send, &queue);
1049321b17ecSEdward Tomasz Napierala 
1050321b17ecSEdward Tomasz Napierala 	ic->ic_send_running = false;
1051321b17ecSEdward Tomasz Napierala 	cv_signal(&ic->ic_send_cv);
1052321b17ecSEdward Tomasz Napierala 	ICL_CONN_UNLOCK(ic);
1053321b17ecSEdward Tomasz Napierala 	kthread_exit();
1054321b17ecSEdward Tomasz Napierala }
1055321b17ecSEdward Tomasz Napierala 
1056321b17ecSEdward Tomasz Napierala static int
1057321b17ecSEdward Tomasz Napierala icl_soupcall_send(struct socket *so, void *arg, int waitflag)
1058321b17ecSEdward Tomasz Napierala {
1059321b17ecSEdward Tomasz Napierala 	struct icl_conn *ic;
1060321b17ecSEdward Tomasz Napierala 
1061321b17ecSEdward Tomasz Napierala 	if (!sowriteable(so))
1062321b17ecSEdward Tomasz Napierala 		return (SU_OK);
1063321b17ecSEdward Tomasz Napierala 
1064321b17ecSEdward Tomasz Napierala 	ic = arg;
1065321b17ecSEdward Tomasz Napierala 
1066321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK(ic);
1067321b17ecSEdward Tomasz Napierala 	ic->ic_check_send_space = true;
1068321b17ecSEdward Tomasz Napierala 	ICL_CONN_UNLOCK(ic);
1069321b17ecSEdward Tomasz Napierala 
1070321b17ecSEdward Tomasz Napierala 	cv_signal(&ic->ic_send_cv);
1071321b17ecSEdward Tomasz Napierala 
1072321b17ecSEdward Tomasz Napierala 	return (SU_OK);
1073321b17ecSEdward Tomasz Napierala }
1074321b17ecSEdward Tomasz Napierala 
1075321b17ecSEdward Tomasz Napierala static int
1076321b17ecSEdward Tomasz Napierala icl_pdu_append_data(struct icl_pdu *request, const void *addr, size_t len,
1077321b17ecSEdward Tomasz Napierala     int flags)
1078321b17ecSEdward Tomasz Napierala {
1079321b17ecSEdward Tomasz Napierala 	struct mbuf *mb, *newmb;
1080321b17ecSEdward Tomasz Napierala 	size_t copylen, off = 0;
1081321b17ecSEdward Tomasz Napierala 
1082321b17ecSEdward Tomasz Napierala 	KASSERT(len > 0, ("len == 0"));
1083321b17ecSEdward Tomasz Napierala 
1084321b17ecSEdward Tomasz Napierala 	newmb = m_getm2(NULL, len, flags, MT_DATA, M_PKTHDR);
1085321b17ecSEdward Tomasz Napierala 	if (newmb == NULL) {
1086321b17ecSEdward Tomasz Napierala 		ICL_WARN("failed to allocate mbuf for %zd bytes", len);
1087321b17ecSEdward Tomasz Napierala 		return (ENOMEM);
1088321b17ecSEdward Tomasz Napierala 	}
1089321b17ecSEdward Tomasz Napierala 
1090321b17ecSEdward Tomasz Napierala 	for (mb = newmb; mb != NULL; mb = mb->m_next) {
1091321b17ecSEdward Tomasz Napierala 		copylen = min(M_TRAILINGSPACE(mb), len - off);
1092321b17ecSEdward Tomasz Napierala 		memcpy(mtod(mb, char *), (const char *)addr + off, copylen);
1093321b17ecSEdward Tomasz Napierala 		mb->m_len = copylen;
1094321b17ecSEdward Tomasz Napierala 		off += copylen;
1095321b17ecSEdward Tomasz Napierala 	}
1096321b17ecSEdward Tomasz Napierala 	KASSERT(off == len, ("%s: off != len", __func__));
1097321b17ecSEdward Tomasz Napierala 
1098321b17ecSEdward Tomasz Napierala 	if (request->ip_data_mbuf == NULL) {
1099321b17ecSEdward Tomasz Napierala 		request->ip_data_mbuf = newmb;
1100321b17ecSEdward Tomasz Napierala 		request->ip_data_len = len;
1101321b17ecSEdward Tomasz Napierala 	} else {
1102321b17ecSEdward Tomasz Napierala 		m_cat(request->ip_data_mbuf, newmb);
1103321b17ecSEdward Tomasz Napierala 		request->ip_data_len += len;
1104321b17ecSEdward Tomasz Napierala 	}
1105321b17ecSEdward Tomasz Napierala 
1106321b17ecSEdward Tomasz Napierala 	return (0);
1107321b17ecSEdward Tomasz Napierala }
1108321b17ecSEdward Tomasz Napierala 
1109321b17ecSEdward Tomasz Napierala int
1110321b17ecSEdward Tomasz Napierala icl_soft_conn_pdu_append_data(struct icl_conn *ic, struct icl_pdu *request,
1111321b17ecSEdward Tomasz Napierala     const void *addr, size_t len, int flags)
1112321b17ecSEdward Tomasz Napierala {
1113321b17ecSEdward Tomasz Napierala 
1114321b17ecSEdward Tomasz Napierala 	return (icl_pdu_append_data(request, addr, len, flags));
1115321b17ecSEdward Tomasz Napierala }
1116321b17ecSEdward Tomasz Napierala 
1117321b17ecSEdward Tomasz Napierala static void
1118321b17ecSEdward Tomasz Napierala icl_pdu_get_data(struct icl_pdu *ip, size_t off, void *addr, size_t len)
1119321b17ecSEdward Tomasz Napierala {
1120321b17ecSEdward Tomasz Napierala 
1121321b17ecSEdward Tomasz Napierala 	m_copydata(ip->ip_data_mbuf, off, len, addr);
1122321b17ecSEdward Tomasz Napierala }
1123321b17ecSEdward Tomasz Napierala 
1124321b17ecSEdward Tomasz Napierala void
1125321b17ecSEdward Tomasz Napierala icl_soft_conn_pdu_get_data(struct icl_conn *ic, struct icl_pdu *ip,
1126321b17ecSEdward Tomasz Napierala     size_t off, void *addr, size_t len)
1127321b17ecSEdward Tomasz Napierala {
1128321b17ecSEdward Tomasz Napierala 
1129321b17ecSEdward Tomasz Napierala 	return (icl_pdu_get_data(ip, off, addr, len));
1130321b17ecSEdward Tomasz Napierala }
1131321b17ecSEdward Tomasz Napierala 
1132321b17ecSEdward Tomasz Napierala static void
1133321b17ecSEdward Tomasz Napierala icl_pdu_queue(struct icl_pdu *ip)
1134321b17ecSEdward Tomasz Napierala {
1135321b17ecSEdward Tomasz Napierala 	struct icl_conn *ic;
1136321b17ecSEdward Tomasz Napierala 
1137321b17ecSEdward Tomasz Napierala 	ic = ip->ip_conn;
1138321b17ecSEdward Tomasz Napierala 
1139321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK_ASSERT(ic);
1140321b17ecSEdward Tomasz Napierala 
1141321b17ecSEdward Tomasz Napierala 	if (ic->ic_disconnecting || ic->ic_socket == NULL) {
1142321b17ecSEdward Tomasz Napierala 		ICL_DEBUG("icl_pdu_queue on closed connection");
1143321b17ecSEdward Tomasz Napierala 		icl_pdu_free(ip);
1144321b17ecSEdward Tomasz Napierala 		return;
1145321b17ecSEdward Tomasz Napierala 	}
1146321b17ecSEdward Tomasz Napierala 
1147321b17ecSEdward Tomasz Napierala 	if (!STAILQ_EMPTY(&ic->ic_to_send)) {
1148321b17ecSEdward Tomasz Napierala 		STAILQ_INSERT_TAIL(&ic->ic_to_send, ip, ip_next);
1149321b17ecSEdward Tomasz Napierala 		/*
1150321b17ecSEdward Tomasz Napierala 		 * If the queue is not empty, someone else had already
1151321b17ecSEdward Tomasz Napierala 		 * signaled the send thread; no need to do that again,
1152321b17ecSEdward Tomasz Napierala 		 * just return.
1153321b17ecSEdward Tomasz Napierala 		 */
1154321b17ecSEdward Tomasz Napierala 		return;
1155321b17ecSEdward Tomasz Napierala 	}
1156321b17ecSEdward Tomasz Napierala 
1157321b17ecSEdward Tomasz Napierala 	STAILQ_INSERT_TAIL(&ic->ic_to_send, ip, ip_next);
1158321b17ecSEdward Tomasz Napierala 	cv_signal(&ic->ic_send_cv);
1159321b17ecSEdward Tomasz Napierala }
1160321b17ecSEdward Tomasz Napierala 
/*
 * Connection-level entry point for queueing a PDU.  The connection
 * argument is not consulted: icl_pdu_queue() takes the connection from
 * the PDU itself.
 */
void
icl_soft_conn_pdu_queue(struct icl_conn *ic, struct icl_pdu *ip)
{

	icl_pdu_queue(ip);
}
1167321b17ecSEdward Tomasz Napierala 
1168321b17ecSEdward Tomasz Napierala static struct icl_conn *
1169321b17ecSEdward Tomasz Napierala icl_soft_new_conn(const char *name, struct mtx *lock)
1170321b17ecSEdward Tomasz Napierala {
1171321b17ecSEdward Tomasz Napierala 	struct icl_conn *ic;
1172321b17ecSEdward Tomasz Napierala 
1173321b17ecSEdward Tomasz Napierala 	refcount_acquire(&icl_ncons);
1174321b17ecSEdward Tomasz Napierala 
1175321b17ecSEdward Tomasz Napierala 	ic = (struct icl_conn *)kobj_create(&icl_soft_class, M_ICL_SOFT, M_WAITOK | M_ZERO);
1176321b17ecSEdward Tomasz Napierala 
1177321b17ecSEdward Tomasz Napierala 	STAILQ_INIT(&ic->ic_to_send);
1178321b17ecSEdward Tomasz Napierala 	ic->ic_lock = lock;
1179321b17ecSEdward Tomasz Napierala 	cv_init(&ic->ic_send_cv, "icl_tx");
1180321b17ecSEdward Tomasz Napierala 	cv_init(&ic->ic_receive_cv, "icl_rx");
1181321b17ecSEdward Tomasz Napierala #ifdef DIAGNOSTIC
1182321b17ecSEdward Tomasz Napierala 	refcount_init(&ic->ic_outstanding_pdus, 0);
1183321b17ecSEdward Tomasz Napierala #endif
1184321b17ecSEdward Tomasz Napierala 	ic->ic_max_data_segment_length = ICL_MAX_DATA_SEGMENT_LENGTH;
1185321b17ecSEdward Tomasz Napierala 	ic->ic_name = name;
1186*d4b195d3SEdward Tomasz Napierala 	ic->ic_offload = "None";
1187321b17ecSEdward Tomasz Napierala 
1188321b17ecSEdward Tomasz Napierala 	return (ic);
1189321b17ecSEdward Tomasz Napierala }
1190321b17ecSEdward Tomasz Napierala 
1191321b17ecSEdward Tomasz Napierala void
1192321b17ecSEdward Tomasz Napierala icl_soft_conn_free(struct icl_conn *ic)
1193321b17ecSEdward Tomasz Napierala {
1194321b17ecSEdward Tomasz Napierala 
1195321b17ecSEdward Tomasz Napierala 	cv_destroy(&ic->ic_send_cv);
1196321b17ecSEdward Tomasz Napierala 	cv_destroy(&ic->ic_receive_cv);
1197321b17ecSEdward Tomasz Napierala 	kobj_delete((struct kobj *)ic, M_ICL_SOFT);
1198321b17ecSEdward Tomasz Napierala 	refcount_release(&icl_ncons);
1199321b17ecSEdward Tomasz Napierala }
1200321b17ecSEdward Tomasz Napierala 
1201321b17ecSEdward Tomasz Napierala static int
1202321b17ecSEdward Tomasz Napierala icl_conn_start(struct icl_conn *ic)
1203321b17ecSEdward Tomasz Napierala {
1204321b17ecSEdward Tomasz Napierala 	size_t minspace;
1205321b17ecSEdward Tomasz Napierala 	struct sockopt opt;
1206321b17ecSEdward Tomasz Napierala 	int error, one = 1;
1207321b17ecSEdward Tomasz Napierala 
1208321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK(ic);
1209321b17ecSEdward Tomasz Napierala 
1210321b17ecSEdward Tomasz Napierala 	/*
1211321b17ecSEdward Tomasz Napierala 	 * XXX: Ugly hack.
1212321b17ecSEdward Tomasz Napierala 	 */
1213321b17ecSEdward Tomasz Napierala 	if (ic->ic_socket == NULL) {
1214321b17ecSEdward Tomasz Napierala 		ICL_CONN_UNLOCK(ic);
1215321b17ecSEdward Tomasz Napierala 		return (EINVAL);
1216321b17ecSEdward Tomasz Napierala 	}
1217321b17ecSEdward Tomasz Napierala 
1218321b17ecSEdward Tomasz Napierala 	ic->ic_receive_state = ICL_CONN_STATE_BHS;
1219321b17ecSEdward Tomasz Napierala 	ic->ic_receive_len = sizeof(struct iscsi_bhs);
1220321b17ecSEdward Tomasz Napierala 	ic->ic_disconnecting = false;
1221321b17ecSEdward Tomasz Napierala 
1222321b17ecSEdward Tomasz Napierala 	ICL_CONN_UNLOCK(ic);
1223321b17ecSEdward Tomasz Napierala 
1224321b17ecSEdward Tomasz Napierala 	/*
1225321b17ecSEdward Tomasz Napierala 	 * For sendspace, this is required because the current code cannot
1226321b17ecSEdward Tomasz Napierala 	 * send a PDU in pieces; thus, the minimum buffer size is equal
1227321b17ecSEdward Tomasz Napierala 	 * to the maximum PDU size.  "+4" is to account for possible padding.
1228321b17ecSEdward Tomasz Napierala 	 *
1229321b17ecSEdward Tomasz Napierala 	 * What we should actually do here is to use autoscaling, but set
1230321b17ecSEdward Tomasz Napierala 	 * some minimal buffer size to "minspace".  I don't know a way to do
1231321b17ecSEdward Tomasz Napierala 	 * that, though.
1232321b17ecSEdward Tomasz Napierala 	 */
1233321b17ecSEdward Tomasz Napierala 	minspace = sizeof(struct iscsi_bhs) + ic->ic_max_data_segment_length +
1234321b17ecSEdward Tomasz Napierala 	    ISCSI_HEADER_DIGEST_SIZE + ISCSI_DATA_DIGEST_SIZE + 4;
1235321b17ecSEdward Tomasz Napierala 	if (sendspace < minspace) {
1236321b17ecSEdward Tomasz Napierala 		ICL_WARN("kern.icl.sendspace too low; must be at least %zd",
1237321b17ecSEdward Tomasz Napierala 		    minspace);
1238321b17ecSEdward Tomasz Napierala 		sendspace = minspace;
1239321b17ecSEdward Tomasz Napierala 	}
1240321b17ecSEdward Tomasz Napierala 	if (recvspace < minspace) {
1241321b17ecSEdward Tomasz Napierala 		ICL_WARN("kern.icl.recvspace too low; must be at least %zd",
1242321b17ecSEdward Tomasz Napierala 		    minspace);
1243321b17ecSEdward Tomasz Napierala 		recvspace = minspace;
1244321b17ecSEdward Tomasz Napierala 	}
1245321b17ecSEdward Tomasz Napierala 
1246321b17ecSEdward Tomasz Napierala 	error = soreserve(ic->ic_socket, sendspace, recvspace);
1247321b17ecSEdward Tomasz Napierala 	if (error != 0) {
1248321b17ecSEdward Tomasz Napierala 		ICL_WARN("soreserve failed with error %d", error);
12495aabcd7cSEdward Tomasz Napierala 		icl_soft_conn_close(ic);
1250321b17ecSEdward Tomasz Napierala 		return (error);
1251321b17ecSEdward Tomasz Napierala 	}
1252321b17ecSEdward Tomasz Napierala 	ic->ic_socket->so_snd.sb_flags |= SB_AUTOSIZE;
1253321b17ecSEdward Tomasz Napierala 	ic->ic_socket->so_rcv.sb_flags |= SB_AUTOSIZE;
1254321b17ecSEdward Tomasz Napierala 
1255321b17ecSEdward Tomasz Napierala 	/*
1256321b17ecSEdward Tomasz Napierala 	 * Disable Nagle.
1257321b17ecSEdward Tomasz Napierala 	 */
1258321b17ecSEdward Tomasz Napierala 	bzero(&opt, sizeof(opt));
1259321b17ecSEdward Tomasz Napierala 	opt.sopt_dir = SOPT_SET;
1260321b17ecSEdward Tomasz Napierala 	opt.sopt_level = IPPROTO_TCP;
1261321b17ecSEdward Tomasz Napierala 	opt.sopt_name = TCP_NODELAY;
1262321b17ecSEdward Tomasz Napierala 	opt.sopt_val = &one;
1263321b17ecSEdward Tomasz Napierala 	opt.sopt_valsize = sizeof(one);
1264321b17ecSEdward Tomasz Napierala 	error = sosetopt(ic->ic_socket, &opt);
1265321b17ecSEdward Tomasz Napierala 	if (error != 0) {
1266321b17ecSEdward Tomasz Napierala 		ICL_WARN("disabling TCP_NODELAY failed with error %d", error);
12675aabcd7cSEdward Tomasz Napierala 		icl_soft_conn_close(ic);
1268321b17ecSEdward Tomasz Napierala 		return (error);
1269321b17ecSEdward Tomasz Napierala 	}
1270321b17ecSEdward Tomasz Napierala 
1271321b17ecSEdward Tomasz Napierala 	/*
1272321b17ecSEdward Tomasz Napierala 	 * Start threads.
1273321b17ecSEdward Tomasz Napierala 	 */
1274321b17ecSEdward Tomasz Napierala 	error = kthread_add(icl_send_thread, ic, NULL, NULL, 0, 0, "%stx",
1275321b17ecSEdward Tomasz Napierala 	    ic->ic_name);
1276321b17ecSEdward Tomasz Napierala 	if (error != 0) {
1277321b17ecSEdward Tomasz Napierala 		ICL_WARN("kthread_add(9) failed with error %d", error);
12785aabcd7cSEdward Tomasz Napierala 		icl_soft_conn_close(ic);
1279321b17ecSEdward Tomasz Napierala 		return (error);
1280321b17ecSEdward Tomasz Napierala 	}
1281321b17ecSEdward Tomasz Napierala 
1282321b17ecSEdward Tomasz Napierala 	error = kthread_add(icl_receive_thread, ic, NULL, NULL, 0, 0, "%srx",
1283321b17ecSEdward Tomasz Napierala 	    ic->ic_name);
1284321b17ecSEdward Tomasz Napierala 	if (error != 0) {
1285321b17ecSEdward Tomasz Napierala 		ICL_WARN("kthread_add(9) failed with error %d", error);
12865aabcd7cSEdward Tomasz Napierala 		icl_soft_conn_close(ic);
1287321b17ecSEdward Tomasz Napierala 		return (error);
1288321b17ecSEdward Tomasz Napierala 	}
1289321b17ecSEdward Tomasz Napierala 
1290321b17ecSEdward Tomasz Napierala 	/*
1291321b17ecSEdward Tomasz Napierala 	 * Register socket upcall, to get notified about incoming PDUs
1292321b17ecSEdward Tomasz Napierala 	 * and free space to send outgoing ones.
1293321b17ecSEdward Tomasz Napierala 	 */
1294321b17ecSEdward Tomasz Napierala 	SOCKBUF_LOCK(&ic->ic_socket->so_snd);
1295321b17ecSEdward Tomasz Napierala 	soupcall_set(ic->ic_socket, SO_SND, icl_soupcall_send, ic);
1296321b17ecSEdward Tomasz Napierala 	SOCKBUF_UNLOCK(&ic->ic_socket->so_snd);
1297321b17ecSEdward Tomasz Napierala 	SOCKBUF_LOCK(&ic->ic_socket->so_rcv);
1298321b17ecSEdward Tomasz Napierala 	soupcall_set(ic->ic_socket, SO_RCV, icl_soupcall_receive, ic);
1299321b17ecSEdward Tomasz Napierala 	SOCKBUF_UNLOCK(&ic->ic_socket->so_rcv);
1300321b17ecSEdward Tomasz Napierala 
1301321b17ecSEdward Tomasz Napierala 	return (0);
1302321b17ecSEdward Tomasz Napierala }
1303321b17ecSEdward Tomasz Napierala 
1304321b17ecSEdward Tomasz Napierala int
1305321b17ecSEdward Tomasz Napierala icl_soft_conn_handoff(struct icl_conn *ic, int fd)
1306321b17ecSEdward Tomasz Napierala {
1307321b17ecSEdward Tomasz Napierala 	struct file *fp;
1308321b17ecSEdward Tomasz Napierala 	struct socket *so;
1309321b17ecSEdward Tomasz Napierala 	cap_rights_t rights;
1310321b17ecSEdward Tomasz Napierala 	int error;
1311321b17ecSEdward Tomasz Napierala 
1312321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK_ASSERT_NOT(ic);
1313321b17ecSEdward Tomasz Napierala 
1314321b17ecSEdward Tomasz Napierala 	/*
1315321b17ecSEdward Tomasz Napierala 	 * Steal the socket from userland.
1316321b17ecSEdward Tomasz Napierala 	 */
1317321b17ecSEdward Tomasz Napierala 	error = fget(curthread, fd,
1318321b17ecSEdward Tomasz Napierala 	    cap_rights_init(&rights, CAP_SOCK_CLIENT), &fp);
1319321b17ecSEdward Tomasz Napierala 	if (error != 0)
1320321b17ecSEdward Tomasz Napierala 		return (error);
1321321b17ecSEdward Tomasz Napierala 	if (fp->f_type != DTYPE_SOCKET) {
1322321b17ecSEdward Tomasz Napierala 		fdrop(fp, curthread);
1323321b17ecSEdward Tomasz Napierala 		return (EINVAL);
1324321b17ecSEdward Tomasz Napierala 	}
1325321b17ecSEdward Tomasz Napierala 	so = fp->f_data;
1326321b17ecSEdward Tomasz Napierala 	if (so->so_type != SOCK_STREAM) {
1327321b17ecSEdward Tomasz Napierala 		fdrop(fp, curthread);
1328321b17ecSEdward Tomasz Napierala 		return (EINVAL);
1329321b17ecSEdward Tomasz Napierala 	}
1330321b17ecSEdward Tomasz Napierala 
1331321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK(ic);
1332321b17ecSEdward Tomasz Napierala 
1333321b17ecSEdward Tomasz Napierala 	if (ic->ic_socket != NULL) {
1334321b17ecSEdward Tomasz Napierala 		ICL_CONN_UNLOCK(ic);
1335321b17ecSEdward Tomasz Napierala 		fdrop(fp, curthread);
1336321b17ecSEdward Tomasz Napierala 		return (EBUSY);
1337321b17ecSEdward Tomasz Napierala 	}
1338321b17ecSEdward Tomasz Napierala 
1339321b17ecSEdward Tomasz Napierala 	ic->ic_socket = fp->f_data;
1340321b17ecSEdward Tomasz Napierala 	fp->f_ops = &badfileops;
1341321b17ecSEdward Tomasz Napierala 	fp->f_data = NULL;
1342321b17ecSEdward Tomasz Napierala 	fdrop(fp, curthread);
1343321b17ecSEdward Tomasz Napierala 	ICL_CONN_UNLOCK(ic);
1344321b17ecSEdward Tomasz Napierala 
1345321b17ecSEdward Tomasz Napierala 	error = icl_conn_start(ic);
1346321b17ecSEdward Tomasz Napierala 
1347321b17ecSEdward Tomasz Napierala 	return (error);
1348321b17ecSEdward Tomasz Napierala }
1349321b17ecSEdward Tomasz Napierala 
1350321b17ecSEdward Tomasz Napierala void
13515aabcd7cSEdward Tomasz Napierala icl_soft_conn_close(struct icl_conn *ic)
1352321b17ecSEdward Tomasz Napierala {
1353321b17ecSEdward Tomasz Napierala 	struct icl_pdu *pdu;
1354321b17ecSEdward Tomasz Napierala 
1355321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK_ASSERT_NOT(ic);
1356321b17ecSEdward Tomasz Napierala 
1357321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK(ic);
1358321b17ecSEdward Tomasz Napierala 	if (ic->ic_socket == NULL) {
1359321b17ecSEdward Tomasz Napierala 		ICL_CONN_UNLOCK(ic);
1360321b17ecSEdward Tomasz Napierala 		return;
1361321b17ecSEdward Tomasz Napierala 	}
1362321b17ecSEdward Tomasz Napierala 
1363321b17ecSEdward Tomasz Napierala 	/*
1364321b17ecSEdward Tomasz Napierala 	 * Deregister socket upcalls.
1365321b17ecSEdward Tomasz Napierala 	 */
1366321b17ecSEdward Tomasz Napierala 	ICL_CONN_UNLOCK(ic);
1367321b17ecSEdward Tomasz Napierala 	SOCKBUF_LOCK(&ic->ic_socket->so_snd);
1368321b17ecSEdward Tomasz Napierala 	if (ic->ic_socket->so_snd.sb_upcall != NULL)
1369321b17ecSEdward Tomasz Napierala 		soupcall_clear(ic->ic_socket, SO_SND);
1370321b17ecSEdward Tomasz Napierala 	SOCKBUF_UNLOCK(&ic->ic_socket->so_snd);
1371321b17ecSEdward Tomasz Napierala 	SOCKBUF_LOCK(&ic->ic_socket->so_rcv);
1372321b17ecSEdward Tomasz Napierala 	if (ic->ic_socket->so_rcv.sb_upcall != NULL)
1373321b17ecSEdward Tomasz Napierala 		soupcall_clear(ic->ic_socket, SO_RCV);
1374321b17ecSEdward Tomasz Napierala 	SOCKBUF_UNLOCK(&ic->ic_socket->so_rcv);
1375321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK(ic);
1376321b17ecSEdward Tomasz Napierala 
1377321b17ecSEdward Tomasz Napierala 	ic->ic_disconnecting = true;
1378321b17ecSEdward Tomasz Napierala 
1379321b17ecSEdward Tomasz Napierala 	/*
1380321b17ecSEdward Tomasz Napierala 	 * Wake up the threads, so they can properly terminate.
1381321b17ecSEdward Tomasz Napierala 	 */
1382321b17ecSEdward Tomasz Napierala 	while (ic->ic_receive_running || ic->ic_send_running) {
1383321b17ecSEdward Tomasz Napierala 		//ICL_DEBUG("waiting for send/receive threads to terminate");
1384321b17ecSEdward Tomasz Napierala 		cv_signal(&ic->ic_receive_cv);
1385321b17ecSEdward Tomasz Napierala 		cv_signal(&ic->ic_send_cv);
1386321b17ecSEdward Tomasz Napierala 		cv_wait(&ic->ic_send_cv, ic->ic_lock);
1387321b17ecSEdward Tomasz Napierala 	}
1388321b17ecSEdward Tomasz Napierala 	//ICL_DEBUG("send/receive threads terminated");
1389321b17ecSEdward Tomasz Napierala 
1390321b17ecSEdward Tomasz Napierala 	ICL_CONN_UNLOCK(ic);
1391321b17ecSEdward Tomasz Napierala 	soclose(ic->ic_socket);
1392321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK(ic);
1393321b17ecSEdward Tomasz Napierala 	ic->ic_socket = NULL;
1394321b17ecSEdward Tomasz Napierala 
1395321b17ecSEdward Tomasz Napierala 	if (ic->ic_receive_pdu != NULL) {
1396321b17ecSEdward Tomasz Napierala 		//ICL_DEBUG("freeing partially received PDU");
1397321b17ecSEdward Tomasz Napierala 		icl_pdu_free(ic->ic_receive_pdu);
1398321b17ecSEdward Tomasz Napierala 		ic->ic_receive_pdu = NULL;
1399321b17ecSEdward Tomasz Napierala 	}
1400321b17ecSEdward Tomasz Napierala 
1401321b17ecSEdward Tomasz Napierala 	/*
1402321b17ecSEdward Tomasz Napierala 	 * Remove any outstanding PDUs from the send queue.
1403321b17ecSEdward Tomasz Napierala 	 */
1404321b17ecSEdward Tomasz Napierala 	while (!STAILQ_EMPTY(&ic->ic_to_send)) {
1405321b17ecSEdward Tomasz Napierala 		pdu = STAILQ_FIRST(&ic->ic_to_send);
1406321b17ecSEdward Tomasz Napierala 		STAILQ_REMOVE_HEAD(&ic->ic_to_send, ip_next);
1407321b17ecSEdward Tomasz Napierala 		icl_pdu_free(pdu);
1408321b17ecSEdward Tomasz Napierala 	}
1409321b17ecSEdward Tomasz Napierala 
1410321b17ecSEdward Tomasz Napierala 	KASSERT(STAILQ_EMPTY(&ic->ic_to_send),
1411321b17ecSEdward Tomasz Napierala 	    ("destroying session with non-empty send queue"));
1412321b17ecSEdward Tomasz Napierala #ifdef DIAGNOSTIC
1413321b17ecSEdward Tomasz Napierala 	KASSERT(ic->ic_outstanding_pdus == 0,
1414321b17ecSEdward Tomasz Napierala 	    ("destroying session with %d outstanding PDUs",
1415321b17ecSEdward Tomasz Napierala 	     ic->ic_outstanding_pdus));
1416321b17ecSEdward Tomasz Napierala #endif
1417321b17ecSEdward Tomasz Napierala 	ICL_CONN_UNLOCK(ic);
1418321b17ecSEdward Tomasz Napierala }
1419321b17ecSEdward Tomasz Napierala 
1420321b17ecSEdward Tomasz Napierala bool
1421321b17ecSEdward Tomasz Napierala icl_soft_conn_connected(struct icl_conn *ic)
1422321b17ecSEdward Tomasz Napierala {
1423321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK_ASSERT_NOT(ic);
1424321b17ecSEdward Tomasz Napierala 
1425321b17ecSEdward Tomasz Napierala 	ICL_CONN_LOCK(ic);
1426321b17ecSEdward Tomasz Napierala 	if (ic->ic_socket == NULL) {
1427321b17ecSEdward Tomasz Napierala 		ICL_CONN_UNLOCK(ic);
1428321b17ecSEdward Tomasz Napierala 		return (false);
1429321b17ecSEdward Tomasz Napierala 	}
1430321b17ecSEdward Tomasz Napierala 	if (ic->ic_socket->so_error != 0) {
1431321b17ecSEdward Tomasz Napierala 		ICL_CONN_UNLOCK(ic);
1432321b17ecSEdward Tomasz Napierala 		return (false);
1433321b17ecSEdward Tomasz Napierala 	}
1434321b17ecSEdward Tomasz Napierala 	ICL_CONN_UNLOCK(ic);
1435321b17ecSEdward Tomasz Napierala 	return (true);
1436321b17ecSEdward Tomasz Napierala }
1437321b17ecSEdward Tomasz Napierala 
/*
 * Limits callback handed to icl_register().  Stores 128 KiB through
 * "limitp" and always returns 0.
 */
static int
icl_soft_limits(size_t *limitp)
{
	const size_t limit = 128 * 1024;

	*limitp = limit;

	return (0);
}
1446321b17ecSEdward Tomasz Napierala 
#ifdef ICL_KERNEL_PROXY
/*
 * Attach an already existing kernel socket to the connection and start it.
 *
 * Must be called without the connection lock.  Returns EINVAL if "so" is
 * not a SOCK_STREAM socket, EBUSY if the connection already has a socket,
 * and otherwise whatever icl_conn_start() returns.
 */
int
icl_conn_handoff_sock(struct icl_conn *ic, struct socket *so)
{

	ICL_CONN_LOCK_ASSERT_NOT(ic);

	if (so->so_type != SOCK_STREAM)
		return (EINVAL);

	ICL_CONN_LOCK(ic);
	if (ic->ic_socket != NULL) {
		ICL_CONN_UNLOCK(ic);
		return (EBUSY);
	}
	ic->ic_socket = so;
	ICL_CONN_UNLOCK(ic);

	return (icl_conn_start(ic));
}
#endif /* ICL_KERNEL_PROXY */
1471321b17ecSEdward Tomasz Napierala 
1472321b17ecSEdward Tomasz Napierala static int
1473321b17ecSEdward Tomasz Napierala icl_soft_load(void)
1474321b17ecSEdward Tomasz Napierala {
1475321b17ecSEdward Tomasz Napierala 	int error;
1476321b17ecSEdward Tomasz Napierala 
1477321b17ecSEdward Tomasz Napierala 	icl_pdu_zone = uma_zcreate("icl_pdu",
1478321b17ecSEdward Tomasz Napierala 	    sizeof(struct icl_pdu), NULL, NULL, NULL, NULL,
1479321b17ecSEdward Tomasz Napierala 	    UMA_ALIGN_PTR, 0);
1480321b17ecSEdward Tomasz Napierala 	refcount_init(&icl_ncons, 0);
1481321b17ecSEdward Tomasz Napierala 
1482321b17ecSEdward Tomasz Napierala 	/*
1483321b17ecSEdward Tomasz Napierala 	 * The reason we call this "none" is that to the user,
1484321b17ecSEdward Tomasz Napierala 	 * it's known as "offload driver"; "offload driver: soft"
1485321b17ecSEdward Tomasz Napierala 	 * doesn't make much sense.
1486321b17ecSEdward Tomasz Napierala 	 */
1487321b17ecSEdward Tomasz Napierala 	error = icl_register("none", 0, icl_soft_limits, icl_soft_new_conn);
1488321b17ecSEdward Tomasz Napierala 	KASSERT(error == 0, ("failed to register"));
1489321b17ecSEdward Tomasz Napierala 
1490321b17ecSEdward Tomasz Napierala 	return (error);
1491321b17ecSEdward Tomasz Napierala }
1492321b17ecSEdward Tomasz Napierala 
1493321b17ecSEdward Tomasz Napierala static int
1494321b17ecSEdward Tomasz Napierala icl_soft_unload(void)
1495321b17ecSEdward Tomasz Napierala {
1496321b17ecSEdward Tomasz Napierala 
1497321b17ecSEdward Tomasz Napierala 	if (icl_ncons != 0)
1498321b17ecSEdward Tomasz Napierala 		return (EBUSY);
1499321b17ecSEdward Tomasz Napierala 
1500321b17ecSEdward Tomasz Napierala 	icl_unregister("none");
1501321b17ecSEdward Tomasz Napierala 
1502321b17ecSEdward Tomasz Napierala 	uma_zdestroy(icl_pdu_zone);
1503321b17ecSEdward Tomasz Napierala 
1504321b17ecSEdward Tomasz Napierala 	return (0);
1505321b17ecSEdward Tomasz Napierala }
1506321b17ecSEdward Tomasz Napierala 
1507321b17ecSEdward Tomasz Napierala static int
1508321b17ecSEdward Tomasz Napierala icl_soft_modevent(module_t mod, int what, void *arg)
1509321b17ecSEdward Tomasz Napierala {
1510321b17ecSEdward Tomasz Napierala 
1511321b17ecSEdward Tomasz Napierala 	switch (what) {
1512321b17ecSEdward Tomasz Napierala 	case MOD_LOAD:
1513321b17ecSEdward Tomasz Napierala 		return (icl_soft_load());
1514321b17ecSEdward Tomasz Napierala 	case MOD_UNLOAD:
1515321b17ecSEdward Tomasz Napierala 		return (icl_soft_unload());
1516321b17ecSEdward Tomasz Napierala 	default:
1517321b17ecSEdward Tomasz Napierala 		return (EINVAL);
1518321b17ecSEdward Tomasz Napierala 	}
1519321b17ecSEdward Tomasz Napierala }
1520321b17ecSEdward Tomasz Napierala 
1521321b17ecSEdward Tomasz Napierala moduledata_t icl_soft_data = {
1522321b17ecSEdward Tomasz Napierala 	"icl_soft",
1523321b17ecSEdward Tomasz Napierala 	icl_soft_modevent,
1524321b17ecSEdward Tomasz Napierala 	0
1525321b17ecSEdward Tomasz Napierala };
1526321b17ecSEdward Tomasz Napierala 
1527321b17ecSEdward Tomasz Napierala DECLARE_MODULE(icl_soft, icl_soft_data, SI_SUB_DRIVERS, SI_ORDER_MIDDLE);
1528321b17ecSEdward Tomasz Napierala MODULE_DEPEND(icl_soft, icl, 1, 1, 1);
1529872d2d92SEdward Tomasz Napierala MODULE_VERSION(icl_soft, 1);
1530