1321b17ecSEdward Tomasz Napierala /*- 2321b17ecSEdward Tomasz Napierala * Copyright (c) 2012 The FreeBSD Foundation 3321b17ecSEdward Tomasz Napierala * All rights reserved. 4321b17ecSEdward Tomasz Napierala * 5321b17ecSEdward Tomasz Napierala * This software was developed by Edward Tomasz Napierala under sponsorship 6321b17ecSEdward Tomasz Napierala * from the FreeBSD Foundation. 7321b17ecSEdward Tomasz Napierala * 8321b17ecSEdward Tomasz Napierala * Redistribution and use in source and binary forms, with or without 9321b17ecSEdward Tomasz Napierala * modification, are permitted provided that the following conditions 10321b17ecSEdward Tomasz Napierala * are met: 11321b17ecSEdward Tomasz Napierala * 1. Redistributions of source code must retain the above copyright 12321b17ecSEdward Tomasz Napierala * notice, this list of conditions and the following disclaimer. 13321b17ecSEdward Tomasz Napierala * 2. Redistributions in binary form must reproduce the above copyright 14321b17ecSEdward Tomasz Napierala * notice, this list of conditions and the following disclaimer in the 15321b17ecSEdward Tomasz Napierala * documentation and/or other materials provided with the distribution. 16321b17ecSEdward Tomasz Napierala * 17321b17ecSEdward Tomasz Napierala * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 18321b17ecSEdward Tomasz Napierala * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 19321b17ecSEdward Tomasz Napierala * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 20321b17ecSEdward Tomasz Napierala * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 21321b17ecSEdward Tomasz Napierala * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 22321b17ecSEdward Tomasz Napierala * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 23321b17ecSEdward Tomasz Napierala * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 24321b17ecSEdward Tomasz Napierala * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 25321b17ecSEdward Tomasz Napierala * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 26321b17ecSEdward Tomasz Napierala * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 27321b17ecSEdward Tomasz Napierala * SUCH DAMAGE. 28321b17ecSEdward Tomasz Napierala * 29321b17ecSEdward Tomasz Napierala */ 30321b17ecSEdward Tomasz Napierala 31321b17ecSEdward Tomasz Napierala /* 32321b17ecSEdward Tomasz Napierala * iSCSI Common Layer. It's used by both the initiator and target to send 33321b17ecSEdward Tomasz Napierala * and receive iSCSI PDUs. 34321b17ecSEdward Tomasz Napierala */ 35321b17ecSEdward Tomasz Napierala 36321b17ecSEdward Tomasz Napierala #include <sys/cdefs.h> 37321b17ecSEdward Tomasz Napierala __FBSDID("$FreeBSD$"); 38321b17ecSEdward Tomasz Napierala 39321b17ecSEdward Tomasz Napierala #include <sys/param.h> 40321b17ecSEdward Tomasz Napierala #include <sys/capsicum.h> 41321b17ecSEdward Tomasz Napierala #include <sys/condvar.h> 42321b17ecSEdward Tomasz Napierala #include <sys/conf.h> 43321b17ecSEdward Tomasz Napierala #include <sys/file.h> 44321b17ecSEdward Tomasz Napierala #include <sys/kernel.h> 45321b17ecSEdward Tomasz Napierala #include <sys/kthread.h> 46321b17ecSEdward Tomasz Napierala #include <sys/lock.h> 47321b17ecSEdward Tomasz Napierala #include <sys/mbuf.h> 48321b17ecSEdward Tomasz Napierala #include <sys/mutex.h> 49321b17ecSEdward Tomasz Napierala #include <sys/module.h> 50321b17ecSEdward Tomasz Napierala #include <sys/protosw.h> 51321b17ecSEdward Tomasz Napierala #include <sys/socket.h> 52321b17ecSEdward Tomasz Napierala #include <sys/socketvar.h> 53321b17ecSEdward Tomasz Napierala #include <sys/sysctl.h> 54321b17ecSEdward Tomasz Napierala #include <sys/systm.h> 55321b17ecSEdward Tomasz Napierala #include <sys/sx.h> 56321b17ecSEdward Tomasz Napierala #include <sys/uio.h> 57321b17ecSEdward Tomasz Napierala #include <vm/uma.h> 58321b17ecSEdward Tomasz Napierala #include <netinet/in.h> 59321b17ecSEdward Tomasz Napierala #include <netinet/tcp.h> 60321b17ecSEdward Tomasz Napierala 61321b17ecSEdward Tomasz Napierala #include <dev/iscsi/icl.h> 62321b17ecSEdward Tomasz Napierala #include <dev/iscsi/iscsi_proto.h> 63321b17ecSEdward Tomasz Napierala #include <icl_conn_if.h> 64321b17ecSEdward Tomasz Napierala 65321b17ecSEdward Tomasz Napierala static int coalesce = 1; 66321b17ecSEdward Tomasz Napierala SYSCTL_INT(_kern_icl, OID_AUTO, coalesce, CTLFLAG_RWTUN, 67321b17ecSEdward Tomasz Napierala &coalesce, 0, "Try to coalesce PDUs before sending"); 68321b17ecSEdward Tomasz Napierala static int partial_receive_len = 128 * 1024; 69321b17ecSEdward Tomasz Napierala SYSCTL_INT(_kern_icl, OID_AUTO, partial_receive_len, CTLFLAG_RWTUN, 70321b17ecSEdward Tomasz Napierala &partial_receive_len, 0, "Minimum read size for partially received " 71321b17ecSEdward Tomasz Napierala "data segment"); 72321b17ecSEdward Tomasz Napierala static int sendspace = 1048576; 73321b17ecSEdward Tomasz Napierala SYSCTL_INT(_kern_icl, OID_AUTO, sendspace, CTLFLAG_RWTUN, 74321b17ecSEdward Tomasz Napierala &sendspace, 0, "Default send socket buffer size"); 75321b17ecSEdward Tomasz Napierala static int recvspace = 1048576; 76321b17ecSEdward Tomasz Napierala SYSCTL_INT(_kern_icl, OID_AUTO, recvspace, CTLFLAG_RWTUN, 77321b17ecSEdward Tomasz Napierala &recvspace, 0, "Default receive socket buffer size"); 78321b17ecSEdward Tomasz Napierala 79321b17ecSEdward Tomasz Napierala static MALLOC_DEFINE(M_ICL_SOFT, "icl_soft", "iSCSI software backend"); 80321b17ecSEdward Tomasz Napierala static uma_zone_t icl_pdu_zone; 81321b17ecSEdward Tomasz Napierala 82321b17ecSEdward Tomasz Napierala static volatile u_int icl_ncons; 83321b17ecSEdward Tomasz Napierala 84321b17ecSEdward Tomasz Napierala #define ICL_CONN_LOCK(X) mtx_lock(X->ic_lock) 85321b17ecSEdward Tomasz Napierala #define ICL_CONN_UNLOCK(X) mtx_unlock(X->ic_lock) 86321b17ecSEdward Tomasz Napierala #define ICL_CONN_LOCK_ASSERT(X) mtx_assert(X->ic_lock, MA_OWNED) 87321b17ecSEdward Tomasz Napierala #define ICL_CONN_LOCK_ASSERT_NOT(X) mtx_assert(X->ic_lock, MA_NOTOWNED) 88321b17ecSEdward Tomasz Napierala 89321b17ecSEdward Tomasz Napierala STAILQ_HEAD(icl_pdu_stailq, icl_pdu); 90321b17ecSEdward Tomasz Napierala 91321b17ecSEdward Tomasz Napierala static icl_conn_new_pdu_t icl_soft_conn_new_pdu; 92321b17ecSEdward Tomasz Napierala static icl_conn_pdu_free_t icl_soft_conn_pdu_free; 93321b17ecSEdward Tomasz Napierala static icl_conn_pdu_data_segment_length_t 94321b17ecSEdward Tomasz Napierala icl_soft_conn_pdu_data_segment_length; 95321b17ecSEdward Tomasz Napierala static icl_conn_pdu_append_data_t icl_soft_conn_pdu_append_data; 96321b17ecSEdward Tomasz Napierala static icl_conn_pdu_get_data_t icl_soft_conn_pdu_get_data; 97321b17ecSEdward Tomasz Napierala static icl_conn_pdu_queue_t icl_soft_conn_pdu_queue; 98321b17ecSEdward Tomasz Napierala static icl_conn_handoff_t icl_soft_conn_handoff; 99321b17ecSEdward Tomasz Napierala static icl_conn_free_t icl_soft_conn_free; 100321b17ecSEdward Tomasz Napierala static icl_conn_close_t icl_soft_conn_close; 101321b17ecSEdward Tomasz Napierala static icl_conn_connected_t icl_soft_conn_connected; 102321b17ecSEdward Tomasz Napierala 103321b17ecSEdward Tomasz Napierala static kobj_method_t icl_soft_methods[] = { 104321b17ecSEdward Tomasz Napierala KOBJMETHOD(icl_conn_new_pdu, icl_soft_conn_new_pdu), 105321b17ecSEdward Tomasz Napierala KOBJMETHOD(icl_conn_pdu_free, icl_soft_conn_pdu_free), 106321b17ecSEdward Tomasz Napierala KOBJMETHOD(icl_conn_pdu_data_segment_length, 107321b17ecSEdward Tomasz Napierala icl_soft_conn_pdu_data_segment_length), 108321b17ecSEdward Tomasz Napierala KOBJMETHOD(icl_conn_pdu_append_data, icl_soft_conn_pdu_append_data), 109321b17ecSEdward Tomasz Napierala KOBJMETHOD(icl_conn_pdu_get_data, icl_soft_conn_pdu_get_data), 110321b17ecSEdward Tomasz Napierala KOBJMETHOD(icl_conn_pdu_queue, icl_soft_conn_pdu_queue), 111321b17ecSEdward Tomasz Napierala KOBJMETHOD(icl_conn_handoff, icl_soft_conn_handoff), 112321b17ecSEdward Tomasz Napierala KOBJMETHOD(icl_conn_free, icl_soft_conn_free), 113321b17ecSEdward Tomasz Napierala KOBJMETHOD(icl_conn_close, icl_soft_conn_close), 114321b17ecSEdward Tomasz Napierala KOBJMETHOD(icl_conn_connected, icl_soft_conn_connected), 115321b17ecSEdward Tomasz Napierala { 0, 0 } 116321b17ecSEdward Tomasz Napierala }; 117321b17ecSEdward Tomasz Napierala 118321b17ecSEdward Tomasz Napierala DEFINE_CLASS(icl_soft, icl_soft_methods, sizeof(struct icl_conn)); 119321b17ecSEdward Tomasz Napierala 120321b17ecSEdward Tomasz Napierala static void icl_conn_close(struct icl_conn *ic); 121321b17ecSEdward Tomasz Napierala 122321b17ecSEdward Tomasz Napierala static void 123321b17ecSEdward Tomasz Napierala icl_conn_fail(struct icl_conn *ic) 124321b17ecSEdward Tomasz Napierala { 125321b17ecSEdward Tomasz Napierala if (ic->ic_socket == NULL) 126321b17ecSEdward Tomasz Napierala return; 127321b17ecSEdward Tomasz Napierala 128321b17ecSEdward Tomasz Napierala /* 129321b17ecSEdward Tomasz Napierala * XXX 130321b17ecSEdward Tomasz Napierala */ 131321b17ecSEdward Tomasz Napierala ic->ic_socket->so_error = EDOOFUS; 132321b17ecSEdward Tomasz Napierala (ic->ic_error)(ic); 133321b17ecSEdward Tomasz Napierala } 134321b17ecSEdward Tomasz Napierala 135321b17ecSEdward Tomasz Napierala static struct mbuf * 136321b17ecSEdward Tomasz Napierala icl_conn_receive(struct icl_conn *ic, size_t len) 137321b17ecSEdward Tomasz Napierala { 138321b17ecSEdward Tomasz Napierala struct uio uio; 139321b17ecSEdward Tomasz Napierala struct socket *so; 140321b17ecSEdward Tomasz Napierala struct mbuf *m; 141321b17ecSEdward Tomasz Napierala int error, flags; 142321b17ecSEdward Tomasz Napierala 143321b17ecSEdward Tomasz Napierala so = ic->ic_socket; 144321b17ecSEdward Tomasz Napierala 145321b17ecSEdward Tomasz Napierala memset(&uio, 0, sizeof(uio)); 146321b17ecSEdward Tomasz Napierala uio.uio_resid = len; 147321b17ecSEdward Tomasz Napierala 148321b17ecSEdward Tomasz Napierala flags = MSG_DONTWAIT; 149321b17ecSEdward Tomasz Napierala error = soreceive(so, NULL, &uio, &m, NULL, &flags); 150321b17ecSEdward Tomasz Napierala if (error != 0) { 151321b17ecSEdward Tomasz Napierala ICL_DEBUG("soreceive error %d", error); 152321b17ecSEdward Tomasz Napierala return (NULL); 153321b17ecSEdward Tomasz Napierala } 154321b17ecSEdward Tomasz Napierala if (uio.uio_resid != 0) { 155321b17ecSEdward Tomasz Napierala m_freem(m); 156321b17ecSEdward Tomasz Napierala ICL_DEBUG("short read"); 157321b17ecSEdward Tomasz Napierala return (NULL); 158321b17ecSEdward Tomasz Napierala } 159321b17ecSEdward Tomasz Napierala 160321b17ecSEdward Tomasz Napierala return (m); 161321b17ecSEdward Tomasz Napierala } 162321b17ecSEdward Tomasz Napierala 163321b17ecSEdward Tomasz Napierala static struct icl_pdu * 164321b17ecSEdward Tomasz Napierala icl_pdu_new_empty(struct icl_conn *ic, int flags) 165321b17ecSEdward Tomasz Napierala { 166321b17ecSEdward Tomasz Napierala struct icl_pdu *ip; 167321b17ecSEdward Tomasz Napierala 168321b17ecSEdward Tomasz Napierala #ifdef DIAGNOSTIC 169321b17ecSEdward Tomasz Napierala refcount_acquire(&ic->ic_outstanding_pdus); 170321b17ecSEdward Tomasz Napierala #endif 171321b17ecSEdward Tomasz Napierala ip = uma_zalloc(icl_pdu_zone, flags | M_ZERO); 172321b17ecSEdward Tomasz Napierala if (ip == NULL) { 173321b17ecSEdward Tomasz Napierala ICL_WARN("failed to allocate %zd bytes", sizeof(*ip)); 174321b17ecSEdward Tomasz Napierala #ifdef DIAGNOSTIC 175321b17ecSEdward Tomasz Napierala refcount_release(&ic->ic_outstanding_pdus); 176321b17ecSEdward Tomasz Napierala #endif 177321b17ecSEdward Tomasz Napierala return (NULL); 178321b17ecSEdward Tomasz Napierala } 179321b17ecSEdward Tomasz Napierala 180321b17ecSEdward Tomasz Napierala ip->ip_conn = ic; 181321b17ecSEdward Tomasz Napierala 182321b17ecSEdward Tomasz Napierala return (ip); 183321b17ecSEdward Tomasz Napierala } 184321b17ecSEdward Tomasz Napierala 185321b17ecSEdward Tomasz Napierala static void 186321b17ecSEdward Tomasz Napierala icl_pdu_free(struct icl_pdu *ip) 187321b17ecSEdward Tomasz Napierala { 188321b17ecSEdward Tomasz Napierala struct icl_conn *ic; 189321b17ecSEdward Tomasz Napierala 190321b17ecSEdward Tomasz Napierala ic = ip->ip_conn; 191321b17ecSEdward Tomasz Napierala 192321b17ecSEdward Tomasz Napierala m_freem(ip->ip_bhs_mbuf); 193321b17ecSEdward Tomasz Napierala m_freem(ip->ip_ahs_mbuf); 194321b17ecSEdward Tomasz Napierala m_freem(ip->ip_data_mbuf); 195321b17ecSEdward Tomasz Napierala uma_zfree(icl_pdu_zone, ip); 196321b17ecSEdward Tomasz Napierala #ifdef DIAGNOSTIC 197321b17ecSEdward Tomasz Napierala refcount_release(&ic->ic_outstanding_pdus); 198321b17ecSEdward Tomasz Napierala #endif 199321b17ecSEdward Tomasz Napierala } 200321b17ecSEdward Tomasz Napierala 201321b17ecSEdward Tomasz Napierala void 202321b17ecSEdward Tomasz Napierala icl_soft_conn_pdu_free(struct icl_conn *ic, struct icl_pdu *ip) 203321b17ecSEdward Tomasz Napierala { 204321b17ecSEdward Tomasz Napierala icl_pdu_free(ip); 205321b17ecSEdward Tomasz Napierala } 206321b17ecSEdward Tomasz Napierala 207321b17ecSEdward Tomasz Napierala /* 208321b17ecSEdward Tomasz Napierala * Allocate icl_pdu with empty BHS to fill up by the caller. 209321b17ecSEdward Tomasz Napierala */ 210321b17ecSEdward Tomasz Napierala struct icl_pdu * 211321b17ecSEdward Tomasz Napierala icl_soft_conn_new_pdu(struct icl_conn *ic, int flags) 212321b17ecSEdward Tomasz Napierala { 213321b17ecSEdward Tomasz Napierala struct icl_pdu *ip; 214321b17ecSEdward Tomasz Napierala 215321b17ecSEdward Tomasz Napierala ip = icl_pdu_new_empty(ic, flags); 216321b17ecSEdward Tomasz Napierala if (ip == NULL) 217321b17ecSEdward Tomasz Napierala return (NULL); 218321b17ecSEdward Tomasz Napierala 219321b17ecSEdward Tomasz Napierala ip->ip_bhs_mbuf = m_getm2(NULL, sizeof(struct iscsi_bhs), 220321b17ecSEdward Tomasz Napierala flags, MT_DATA, M_PKTHDR); 221321b17ecSEdward Tomasz Napierala if (ip->ip_bhs_mbuf == NULL) { 222321b17ecSEdward Tomasz Napierala ICL_WARN("failed to allocate %zd bytes", sizeof(*ip)); 223321b17ecSEdward Tomasz Napierala icl_pdu_free(ip); 224321b17ecSEdward Tomasz Napierala return (NULL); 225321b17ecSEdward Tomasz Napierala } 226321b17ecSEdward Tomasz Napierala ip->ip_bhs = mtod(ip->ip_bhs_mbuf, struct iscsi_bhs *); 227321b17ecSEdward Tomasz Napierala memset(ip->ip_bhs, 0, sizeof(struct iscsi_bhs)); 228321b17ecSEdward Tomasz Napierala ip->ip_bhs_mbuf->m_len = sizeof(struct iscsi_bhs); 229321b17ecSEdward Tomasz Napierala 230321b17ecSEdward Tomasz Napierala return (ip); 231321b17ecSEdward Tomasz Napierala } 232321b17ecSEdward Tomasz Napierala 233321b17ecSEdward Tomasz Napierala static int 234321b17ecSEdward Tomasz Napierala icl_pdu_ahs_length(const struct icl_pdu *request) 235321b17ecSEdward Tomasz Napierala { 236321b17ecSEdward Tomasz Napierala 237321b17ecSEdward Tomasz Napierala return (request->ip_bhs->bhs_total_ahs_len * 4); 238321b17ecSEdward Tomasz Napierala } 239321b17ecSEdward Tomasz Napierala 240321b17ecSEdward Tomasz Napierala static size_t 241321b17ecSEdward Tomasz Napierala icl_pdu_data_segment_length(const struct icl_pdu *request) 242321b17ecSEdward Tomasz Napierala { 243321b17ecSEdward Tomasz Napierala uint32_t len = 0; 244321b17ecSEdward Tomasz Napierala 245321b17ecSEdward Tomasz Napierala len += request->ip_bhs->bhs_data_segment_len[0]; 246321b17ecSEdward Tomasz Napierala len <<= 8; 247321b17ecSEdward Tomasz Napierala len += request->ip_bhs->bhs_data_segment_len[1]; 248321b17ecSEdward Tomasz Napierala len <<= 8; 249321b17ecSEdward Tomasz Napierala len += request->ip_bhs->bhs_data_segment_len[2]; 250321b17ecSEdward Tomasz Napierala 251321b17ecSEdward Tomasz Napierala return (len); 252321b17ecSEdward Tomasz Napierala } 253321b17ecSEdward Tomasz Napierala 254321b17ecSEdward Tomasz Napierala size_t 255321b17ecSEdward Tomasz Napierala icl_soft_conn_pdu_data_segment_length(struct icl_conn *ic, 256321b17ecSEdward Tomasz Napierala const struct icl_pdu *request) 257321b17ecSEdward Tomasz Napierala { 258321b17ecSEdward Tomasz Napierala 259321b17ecSEdward Tomasz Napierala return (icl_pdu_data_segment_length(request)); 260321b17ecSEdward Tomasz Napierala } 261321b17ecSEdward Tomasz Napierala 262321b17ecSEdward Tomasz Napierala static void 263321b17ecSEdward Tomasz Napierala icl_pdu_set_data_segment_length(struct icl_pdu *response, uint32_t len) 264321b17ecSEdward Tomasz Napierala { 265321b17ecSEdward Tomasz Napierala 266321b17ecSEdward Tomasz Napierala response->ip_bhs->bhs_data_segment_len[2] = len; 267321b17ecSEdward Tomasz Napierala response->ip_bhs->bhs_data_segment_len[1] = len >> 8; 268321b17ecSEdward Tomasz Napierala response->ip_bhs->bhs_data_segment_len[0] = len >> 16; 269321b17ecSEdward Tomasz Napierala } 270321b17ecSEdward Tomasz Napierala 271321b17ecSEdward Tomasz Napierala static size_t 272321b17ecSEdward Tomasz Napierala icl_pdu_padding(const struct icl_pdu *ip) 273321b17ecSEdward Tomasz Napierala { 274321b17ecSEdward Tomasz Napierala 275321b17ecSEdward Tomasz Napierala if ((ip->ip_data_len % 4) != 0) 276321b17ecSEdward Tomasz Napierala return (4 - (ip->ip_data_len % 4)); 277321b17ecSEdward Tomasz Napierala 278321b17ecSEdward Tomasz Napierala return (0); 279321b17ecSEdward Tomasz Napierala } 280321b17ecSEdward Tomasz Napierala 281321b17ecSEdward Tomasz Napierala static size_t 282321b17ecSEdward Tomasz Napierala icl_pdu_size(const struct icl_pdu *response) 283321b17ecSEdward Tomasz Napierala { 284321b17ecSEdward Tomasz Napierala size_t len; 285321b17ecSEdward Tomasz Napierala 286321b17ecSEdward Tomasz Napierala KASSERT(response->ip_ahs_len == 0, ("responding with AHS")); 287321b17ecSEdward Tomasz Napierala 288321b17ecSEdward Tomasz Napierala len = sizeof(struct iscsi_bhs) + response->ip_data_len + 289321b17ecSEdward Tomasz Napierala icl_pdu_padding(response); 290321b17ecSEdward Tomasz Napierala if (response->ip_conn->ic_header_crc32c) 291321b17ecSEdward Tomasz Napierala len += ISCSI_HEADER_DIGEST_SIZE; 292321b17ecSEdward Tomasz Napierala if (response->ip_data_len != 0 && response->ip_conn->ic_data_crc32c) 293321b17ecSEdward Tomasz Napierala len += ISCSI_DATA_DIGEST_SIZE; 294321b17ecSEdward Tomasz Napierala 295321b17ecSEdward Tomasz Napierala return (len); 296321b17ecSEdward Tomasz Napierala } 297321b17ecSEdward Tomasz Napierala 298321b17ecSEdward Tomasz Napierala static int 299321b17ecSEdward Tomasz Napierala icl_pdu_receive_bhs(struct icl_pdu *request, size_t *availablep) 300321b17ecSEdward Tomasz Napierala { 301321b17ecSEdward Tomasz Napierala struct mbuf *m; 302321b17ecSEdward Tomasz Napierala 303321b17ecSEdward Tomasz Napierala m = icl_conn_receive(request->ip_conn, sizeof(struct iscsi_bhs)); 304321b17ecSEdward Tomasz Napierala if (m == NULL) { 305321b17ecSEdward Tomasz Napierala ICL_DEBUG("failed to receive BHS"); 306321b17ecSEdward Tomasz Napierala return (-1); 307321b17ecSEdward Tomasz Napierala } 308321b17ecSEdward Tomasz Napierala 309321b17ecSEdward Tomasz Napierala request->ip_bhs_mbuf = m_pullup(m, sizeof(struct iscsi_bhs)); 310321b17ecSEdward Tomasz Napierala if (request->ip_bhs_mbuf == NULL) { 311321b17ecSEdward Tomasz Napierala ICL_WARN("m_pullup failed"); 312321b17ecSEdward Tomasz Napierala return (-1); 313321b17ecSEdward Tomasz Napierala } 314321b17ecSEdward Tomasz Napierala request->ip_bhs = mtod(request->ip_bhs_mbuf, struct iscsi_bhs *); 315321b17ecSEdward Tomasz Napierala 316321b17ecSEdward Tomasz Napierala /* 317321b17ecSEdward Tomasz Napierala * XXX: For architectures with strict alignment requirements 318321b17ecSEdward Tomasz Napierala * we may need to allocate ip_bhs and copy the data into it. 319321b17ecSEdward Tomasz Napierala * For some reason, though, not doing this doesn't seem 320321b17ecSEdward Tomasz Napierala * to cause problems; tested on sparc64. 321321b17ecSEdward Tomasz Napierala */ 322321b17ecSEdward Tomasz Napierala 323321b17ecSEdward Tomasz Napierala *availablep -= sizeof(struct iscsi_bhs); 324321b17ecSEdward Tomasz Napierala return (0); 325321b17ecSEdward Tomasz Napierala } 326321b17ecSEdward Tomasz Napierala 327321b17ecSEdward Tomasz Napierala static int 328321b17ecSEdward Tomasz Napierala icl_pdu_receive_ahs(struct icl_pdu *request, size_t *availablep) 329321b17ecSEdward Tomasz Napierala { 330321b17ecSEdward Tomasz Napierala 331321b17ecSEdward Tomasz Napierala request->ip_ahs_len = icl_pdu_ahs_length(request); 332321b17ecSEdward Tomasz Napierala if (request->ip_ahs_len == 0) 333321b17ecSEdward Tomasz Napierala return (0); 334321b17ecSEdward Tomasz Napierala 335321b17ecSEdward Tomasz Napierala request->ip_ahs_mbuf = icl_conn_receive(request->ip_conn, 336321b17ecSEdward Tomasz Napierala request->ip_ahs_len); 337321b17ecSEdward Tomasz Napierala if (request->ip_ahs_mbuf == NULL) { 338321b17ecSEdward Tomasz Napierala ICL_DEBUG("failed to receive AHS"); 339321b17ecSEdward Tomasz Napierala return (-1); 340321b17ecSEdward Tomasz Napierala } 341321b17ecSEdward Tomasz Napierala 342321b17ecSEdward Tomasz Napierala *availablep -= request->ip_ahs_len; 343321b17ecSEdward Tomasz Napierala return (0); 344321b17ecSEdward Tomasz Napierala } 345321b17ecSEdward Tomasz Napierala 346321b17ecSEdward Tomasz Napierala static uint32_t 347321b17ecSEdward Tomasz Napierala icl_mbuf_to_crc32c(const struct mbuf *m0) 348321b17ecSEdward Tomasz Napierala { 349321b17ecSEdward Tomasz Napierala uint32_t digest = 0xffffffff; 350321b17ecSEdward Tomasz Napierala const struct mbuf *m; 351321b17ecSEdward Tomasz Napierala 352321b17ecSEdward Tomasz Napierala for (m = m0; m != NULL; m = m->m_next) 353321b17ecSEdward Tomasz Napierala digest = calculate_crc32c(digest, 354321b17ecSEdward Tomasz Napierala mtod(m, const void *), m->m_len); 355321b17ecSEdward Tomasz Napierala 356321b17ecSEdward Tomasz Napierala digest = digest ^ 0xffffffff; 357321b17ecSEdward Tomasz Napierala 358321b17ecSEdward Tomasz Napierala return (digest); 359321b17ecSEdward Tomasz Napierala } 360321b17ecSEdward Tomasz Napierala 361321b17ecSEdward Tomasz Napierala static int 362321b17ecSEdward Tomasz Napierala icl_pdu_check_header_digest(struct icl_pdu *request, size_t *availablep) 363321b17ecSEdward Tomasz Napierala { 364321b17ecSEdward Tomasz Napierala struct mbuf *m; 365321b17ecSEdward Tomasz Napierala uint32_t received_digest, valid_digest; 366321b17ecSEdward Tomasz Napierala 367321b17ecSEdward Tomasz Napierala if (request->ip_conn->ic_header_crc32c == false) 368321b17ecSEdward Tomasz Napierala return (0); 369321b17ecSEdward Tomasz Napierala 370321b17ecSEdward Tomasz Napierala m = icl_conn_receive(request->ip_conn, ISCSI_HEADER_DIGEST_SIZE); 371321b17ecSEdward Tomasz Napierala if (m == NULL) { 372321b17ecSEdward Tomasz Napierala ICL_DEBUG("failed to receive header digest"); 373321b17ecSEdward Tomasz Napierala return (-1); 374321b17ecSEdward Tomasz Napierala } 375321b17ecSEdward Tomasz Napierala 376321b17ecSEdward Tomasz Napierala CTASSERT(sizeof(received_digest) == ISCSI_HEADER_DIGEST_SIZE); 377321b17ecSEdward Tomasz Napierala m_copydata(m, 0, ISCSI_HEADER_DIGEST_SIZE, (void *)&received_digest); 378321b17ecSEdward Tomasz Napierala m_freem(m); 379321b17ecSEdward Tomasz Napierala 380321b17ecSEdward Tomasz Napierala *availablep -= ISCSI_HEADER_DIGEST_SIZE; 381321b17ecSEdward Tomasz Napierala 382321b17ecSEdward Tomasz Napierala /* 383321b17ecSEdward Tomasz Napierala * XXX: Handle AHS. 384321b17ecSEdward Tomasz Napierala */ 385321b17ecSEdward Tomasz Napierala valid_digest = icl_mbuf_to_crc32c(request->ip_bhs_mbuf); 386321b17ecSEdward Tomasz Napierala if (received_digest != valid_digest) { 387321b17ecSEdward Tomasz Napierala ICL_WARN("header digest check failed; got 0x%x, " 388321b17ecSEdward Tomasz Napierala "should be 0x%x", received_digest, valid_digest); 389321b17ecSEdward Tomasz Napierala return (-1); 390321b17ecSEdward Tomasz Napierala } 391321b17ecSEdward Tomasz Napierala 392321b17ecSEdward Tomasz Napierala return (0); 393321b17ecSEdward Tomasz Napierala } 394321b17ecSEdward Tomasz Napierala 395321b17ecSEdward Tomasz Napierala /* 396321b17ecSEdward Tomasz Napierala * Return the number of bytes that should be waiting in the receive socket 397321b17ecSEdward Tomasz Napierala * before icl_pdu_receive_data_segment() gets called. 398321b17ecSEdward Tomasz Napierala */ 399321b17ecSEdward Tomasz Napierala static size_t 400321b17ecSEdward Tomasz Napierala icl_pdu_data_segment_receive_len(const struct icl_pdu *request) 401321b17ecSEdward Tomasz Napierala { 402321b17ecSEdward Tomasz Napierala size_t len; 403321b17ecSEdward Tomasz Napierala 404321b17ecSEdward Tomasz Napierala len = icl_pdu_data_segment_length(request); 405321b17ecSEdward Tomasz Napierala if (len == 0) 406321b17ecSEdward Tomasz Napierala return (0); 407321b17ecSEdward Tomasz Napierala 408321b17ecSEdward Tomasz Napierala /* 409321b17ecSEdward Tomasz Napierala * Account for the parts of data segment already read from 410321b17ecSEdward Tomasz Napierala * the socket buffer. 411321b17ecSEdward Tomasz Napierala */ 412321b17ecSEdward Tomasz Napierala KASSERT(len > request->ip_data_len, ("len <= request->ip_data_len")); 413321b17ecSEdward Tomasz Napierala len -= request->ip_data_len; 414321b17ecSEdward Tomasz Napierala 415321b17ecSEdward Tomasz Napierala /* 416321b17ecSEdward Tomasz Napierala * Don't always wait for the full data segment to be delivered 417321b17ecSEdward Tomasz Napierala * to the socket; this might badly affect performance due to 418321b17ecSEdward Tomasz Napierala * TCP window scaling. 419321b17ecSEdward Tomasz Napierala */ 420321b17ecSEdward Tomasz Napierala if (len > partial_receive_len) { 421321b17ecSEdward Tomasz Napierala #if 0 422321b17ecSEdward Tomasz Napierala ICL_DEBUG("need %zd bytes of data, limiting to %zd", 423321b17ecSEdward Tomasz Napierala len, partial_receive_len)); 424321b17ecSEdward Tomasz Napierala #endif 425321b17ecSEdward Tomasz Napierala len = partial_receive_len; 426321b17ecSEdward Tomasz Napierala 427321b17ecSEdward Tomasz Napierala return (len); 428321b17ecSEdward Tomasz Napierala } 429321b17ecSEdward Tomasz Napierala 430321b17ecSEdward Tomasz Napierala /* 431321b17ecSEdward Tomasz Napierala * Account for padding. Note that due to the way code is written, 432321b17ecSEdward Tomasz Napierala * the icl_pdu_receive_data_segment() must always receive padding 433321b17ecSEdward Tomasz Napierala * along with the last part of data segment, because it would be 434321b17ecSEdward Tomasz Napierala * impossible to tell whether we've already received the full data 435321b17ecSEdward Tomasz Napierala * segment including padding, or without it. 436321b17ecSEdward Tomasz Napierala */ 437321b17ecSEdward Tomasz Napierala if ((len % 4) != 0) 438321b17ecSEdward Tomasz Napierala len += 4 - (len % 4); 439321b17ecSEdward Tomasz Napierala 440321b17ecSEdward Tomasz Napierala #if 0 441321b17ecSEdward Tomasz Napierala ICL_DEBUG("need %zd bytes of data", len)); 442321b17ecSEdward Tomasz Napierala #endif 443321b17ecSEdward Tomasz Napierala 444321b17ecSEdward Tomasz Napierala return (len); 445321b17ecSEdward Tomasz Napierala } 446321b17ecSEdward Tomasz Napierala 447321b17ecSEdward Tomasz Napierala static int 448321b17ecSEdward Tomasz Napierala icl_pdu_receive_data_segment(struct icl_pdu *request, 449321b17ecSEdward Tomasz Napierala size_t *availablep, bool *more_neededp) 450321b17ecSEdward Tomasz Napierala { 451321b17ecSEdward Tomasz Napierala struct icl_conn *ic; 452321b17ecSEdward Tomasz Napierala size_t len, padding = 0; 453321b17ecSEdward Tomasz Napierala struct mbuf *m; 454321b17ecSEdward Tomasz Napierala 455321b17ecSEdward Tomasz Napierala ic = request->ip_conn; 456321b17ecSEdward Tomasz Napierala 457321b17ecSEdward Tomasz Napierala *more_neededp = false; 458321b17ecSEdward Tomasz Napierala ic->ic_receive_len = 0; 459321b17ecSEdward Tomasz Napierala 460321b17ecSEdward Tomasz Napierala len = icl_pdu_data_segment_length(request); 461321b17ecSEdward Tomasz Napierala if (len == 0) 462321b17ecSEdward Tomasz Napierala return (0); 463321b17ecSEdward Tomasz Napierala 464321b17ecSEdward Tomasz Napierala if ((len % 4) != 0) 465321b17ecSEdward Tomasz Napierala padding = 4 - (len % 4); 466321b17ecSEdward Tomasz Napierala 467321b17ecSEdward Tomasz Napierala /* 468321b17ecSEdward Tomasz Napierala * Account for already received parts of data segment. 469321b17ecSEdward Tomasz Napierala */ 470321b17ecSEdward Tomasz Napierala KASSERT(len > request->ip_data_len, ("len <= request->ip_data_len")); 471321b17ecSEdward Tomasz Napierala len -= request->ip_data_len; 472321b17ecSEdward Tomasz Napierala 473321b17ecSEdward Tomasz Napierala if (len + padding > *availablep) { 474321b17ecSEdward Tomasz Napierala /* 475321b17ecSEdward Tomasz Napierala * Not enough data in the socket buffer. Receive as much 476321b17ecSEdward Tomasz Napierala * as we can. Don't receive padding, since, obviously, it's 477321b17ecSEdward Tomasz Napierala * not the end of data segment yet. 478321b17ecSEdward Tomasz Napierala */ 479321b17ecSEdward Tomasz Napierala #if 0 480321b17ecSEdward Tomasz Napierala ICL_DEBUG("limited from %zd to %zd", 481321b17ecSEdward Tomasz Napierala len + padding, *availablep - padding)); 482321b17ecSEdward Tomasz Napierala #endif 483321b17ecSEdward Tomasz Napierala len = *availablep - padding; 484321b17ecSEdward Tomasz Napierala *more_neededp = true; 485321b17ecSEdward Tomasz Napierala padding = 0; 486321b17ecSEdward Tomasz Napierala } 487321b17ecSEdward Tomasz Napierala 488321b17ecSEdward Tomasz Napierala /* 489321b17ecSEdward Tomasz Napierala * Must not try to receive padding without at least one byte 490321b17ecSEdward Tomasz Napierala * of actual data segment. 491321b17ecSEdward Tomasz Napierala */ 492321b17ecSEdward Tomasz Napierala if (len > 0) { 493321b17ecSEdward Tomasz Napierala m = icl_conn_receive(request->ip_conn, len + padding); 494321b17ecSEdward Tomasz Napierala if (m == NULL) { 495321b17ecSEdward Tomasz Napierala ICL_DEBUG("failed to receive data segment"); 496321b17ecSEdward Tomasz Napierala return (-1); 497321b17ecSEdward Tomasz Napierala } 498321b17ecSEdward Tomasz Napierala 499321b17ecSEdward Tomasz Napierala if (request->ip_data_mbuf == NULL) 500321b17ecSEdward Tomasz Napierala request->ip_data_mbuf = m; 501321b17ecSEdward Tomasz Napierala else 502321b17ecSEdward Tomasz Napierala m_cat(request->ip_data_mbuf, m); 503321b17ecSEdward Tomasz Napierala 504321b17ecSEdward Tomasz Napierala request->ip_data_len += len; 505321b17ecSEdward Tomasz Napierala *availablep -= len + padding; 506321b17ecSEdward Tomasz Napierala } else 507321b17ecSEdward Tomasz Napierala ICL_DEBUG("len 0"); 508321b17ecSEdward Tomasz Napierala 509321b17ecSEdward Tomasz Napierala if (*more_neededp) 510321b17ecSEdward Tomasz Napierala ic->ic_receive_len = 511321b17ecSEdward Tomasz Napierala icl_pdu_data_segment_receive_len(request); 512321b17ecSEdward Tomasz Napierala 513321b17ecSEdward Tomasz Napierala return (0); 514321b17ecSEdward Tomasz Napierala } 515321b17ecSEdward Tomasz Napierala 516321b17ecSEdward Tomasz Napierala static int 517321b17ecSEdward Tomasz Napierala icl_pdu_check_data_digest(struct icl_pdu *request, size_t *availablep) 518321b17ecSEdward Tomasz Napierala { 519321b17ecSEdward Tomasz Napierala struct mbuf *m; 520321b17ecSEdward Tomasz Napierala uint32_t received_digest, valid_digest; 521321b17ecSEdward Tomasz Napierala 522321b17ecSEdward Tomasz Napierala if (request->ip_conn->ic_data_crc32c == false) 523321b17ecSEdward Tomasz Napierala return (0); 524321b17ecSEdward Tomasz Napierala 525321b17ecSEdward Tomasz Napierala if (request->ip_data_len == 0) 526321b17ecSEdward Tomasz Napierala return (0); 527321b17ecSEdward Tomasz Napierala 528321b17ecSEdward Tomasz Napierala m = icl_conn_receive(request->ip_conn, ISCSI_DATA_DIGEST_SIZE); 529321b17ecSEdward Tomasz Napierala if (m == NULL) { 530321b17ecSEdward Tomasz Napierala ICL_DEBUG("failed to receive data digest"); 531321b17ecSEdward Tomasz Napierala return (-1); 532321b17ecSEdward Tomasz Napierala } 533321b17ecSEdward Tomasz Napierala 534321b17ecSEdward Tomasz Napierala CTASSERT(sizeof(received_digest) == ISCSI_DATA_DIGEST_SIZE); 535321b17ecSEdward Tomasz Napierala m_copydata(m, 0, ISCSI_DATA_DIGEST_SIZE, (void *)&received_digest); 536321b17ecSEdward Tomasz Napierala m_freem(m); 537321b17ecSEdward Tomasz Napierala 538321b17ecSEdward Tomasz Napierala *availablep -= ISCSI_DATA_DIGEST_SIZE; 539321b17ecSEdward Tomasz Napierala 540321b17ecSEdward Tomasz Napierala /* 541321b17ecSEdward Tomasz Napierala * Note that ip_data_mbuf also contains padding; since digest 542321b17ecSEdward Tomasz Napierala * calculation is supposed to include that, we iterate over 543321b17ecSEdward Tomasz Napierala * the entire ip_data_mbuf chain, not just ip_data_len bytes of it. 544321b17ecSEdward Tomasz Napierala */ 545321b17ecSEdward Tomasz Napierala valid_digest = icl_mbuf_to_crc32c(request->ip_data_mbuf); 546321b17ecSEdward Tomasz Napierala if (received_digest != valid_digest) { 547321b17ecSEdward Tomasz Napierala ICL_WARN("data digest check failed; got 0x%x, " 548321b17ecSEdward Tomasz Napierala "should be 0x%x", received_digest, valid_digest); 549321b17ecSEdward Tomasz Napierala return (-1); 550321b17ecSEdward Tomasz Napierala } 551321b17ecSEdward Tomasz Napierala 552321b17ecSEdward Tomasz Napierala return (0); 553321b17ecSEdward Tomasz Napierala } 554321b17ecSEdward Tomasz Napierala 555321b17ecSEdward Tomasz Napierala /* 556321b17ecSEdward Tomasz Napierala * Somewhat contrary to the name, this attempts to receive only one 557321b17ecSEdward Tomasz Napierala * "part" of PDU at a time; call it repeatedly until it returns non-NULL. 558321b17ecSEdward Tomasz Napierala */ 559321b17ecSEdward Tomasz Napierala static struct icl_pdu * 560321b17ecSEdward Tomasz Napierala icl_conn_receive_pdu(struct icl_conn *ic, size_t *availablep) 561321b17ecSEdward Tomasz Napierala { 562321b17ecSEdward Tomasz Napierala struct icl_pdu *request; 563321b17ecSEdward Tomasz Napierala struct socket *so; 564321b17ecSEdward Tomasz Napierala size_t len; 565321b17ecSEdward Tomasz Napierala int error; 566321b17ecSEdward Tomasz Napierala bool more_needed; 567321b17ecSEdward Tomasz Napierala 568321b17ecSEdward Tomasz Napierala so = ic->ic_socket; 569321b17ecSEdward Tomasz Napierala 570321b17ecSEdward Tomasz Napierala if (ic->ic_receive_state == ICL_CONN_STATE_BHS) { 571321b17ecSEdward Tomasz Napierala KASSERT(ic->ic_receive_pdu == NULL, 572321b17ecSEdward Tomasz Napierala ("ic->ic_receive_pdu != NULL")); 573321b17ecSEdward Tomasz Napierala request = icl_pdu_new_empty(ic, M_NOWAIT); 574321b17ecSEdward Tomasz Napierala if (request == NULL) { 575321b17ecSEdward Tomasz Napierala ICL_DEBUG("failed to allocate PDU; " 576321b17ecSEdward Tomasz Napierala "dropping connection"); 577321b17ecSEdward Tomasz Napierala icl_conn_fail(ic); 578321b17ecSEdward Tomasz Napierala return (NULL); 579321b17ecSEdward Tomasz Napierala } 580321b17ecSEdward Tomasz Napierala ic->ic_receive_pdu = request; 581321b17ecSEdward Tomasz Napierala } else { 582321b17ecSEdward Tomasz Napierala KASSERT(ic->ic_receive_pdu != NULL, 583321b17ecSEdward Tomasz Napierala ("ic->ic_receive_pdu == NULL")); 584321b17ecSEdward Tomasz Napierala request = ic->ic_receive_pdu; 585321b17ecSEdward Tomasz Napierala } 586321b17ecSEdward Tomasz Napierala 587321b17ecSEdward Tomasz Napierala if (*availablep < ic->ic_receive_len) { 588321b17ecSEdward Tomasz Napierala #if 0 589321b17ecSEdward Tomasz Napierala ICL_DEBUG("not enough data; need %zd, " 590321b17ecSEdward Tomasz Napierala "have %zd", ic->ic_receive_len, *availablep); 591321b17ecSEdward Tomasz Napierala #endif 592321b17ecSEdward Tomasz Napierala return (NULL); 593321b17ecSEdward Tomasz Napierala } 594321b17ecSEdward Tomasz Napierala 595321b17ecSEdward Tomasz Napierala switch (ic->ic_receive_state) { 596321b17ecSEdward Tomasz Napierala case ICL_CONN_STATE_BHS: 597321b17ecSEdward Tomasz Napierala //ICL_DEBUG("receiving BHS"); 598321b17ecSEdward Tomasz Napierala error = icl_pdu_receive_bhs(request, availablep); 599321b17ecSEdward Tomasz Napierala if (error != 0) { 600321b17ecSEdward Tomasz Napierala ICL_DEBUG("failed to receive BHS; " 601321b17ecSEdward Tomasz Napierala "dropping connection"); 602321b17ecSEdward Tomasz Napierala break; 603321b17ecSEdward Tomasz Napierala } 604321b17ecSEdward Tomasz Napierala 605321b17ecSEdward Tomasz Napierala /* 606321b17ecSEdward Tomasz Napierala * We don't enforce any limit for AHS length; 607321b17ecSEdward Tomasz Napierala * its length is stored in 8 bit field. 608321b17ecSEdward Tomasz Napierala */ 609321b17ecSEdward Tomasz Napierala 610321b17ecSEdward Tomasz Napierala len = icl_pdu_data_segment_length(request); 611321b17ecSEdward Tomasz Napierala if (len > ic->ic_max_data_segment_length) { 612321b17ecSEdward Tomasz Napierala ICL_WARN("received data segment " 613321b17ecSEdward Tomasz Napierala "length %zd is larger than negotiated " 614321b17ecSEdward Tomasz Napierala "MaxDataSegmentLength %zd; " 615321b17ecSEdward Tomasz Napierala "dropping connection", 616321b17ecSEdward Tomasz Napierala len, ic->ic_max_data_segment_length); 617321b17ecSEdward Tomasz Napierala error = EINVAL; 618321b17ecSEdward Tomasz Napierala break; 619321b17ecSEdward Tomasz Napierala } 620321b17ecSEdward Tomasz Napierala 621321b17ecSEdward Tomasz Napierala ic->ic_receive_state = ICL_CONN_STATE_AHS; 622321b17ecSEdward Tomasz Napierala ic->ic_receive_len = icl_pdu_ahs_length(request); 623321b17ecSEdward Tomasz Napierala break; 624321b17ecSEdward Tomasz Napierala 625321b17ecSEdward Tomasz Napierala case ICL_CONN_STATE_AHS: 626321b17ecSEdward Tomasz Napierala //ICL_DEBUG("receiving AHS"); 627321b17ecSEdward Tomasz Napierala error = icl_pdu_receive_ahs(request, availablep); 628321b17ecSEdward Tomasz Napierala if (error != 0) { 629321b17ecSEdward Tomasz Napierala ICL_DEBUG("failed to receive AHS; " 630321b17ecSEdward Tomasz Napierala "dropping connection"); 631321b17ecSEdward Tomasz Napierala break; 632321b17ecSEdward Tomasz Napierala } 633321b17ecSEdward Tomasz Napierala ic->ic_receive_state = ICL_CONN_STATE_HEADER_DIGEST; 634321b17ecSEdward Tomasz Napierala if (ic->ic_header_crc32c == false) 635321b17ecSEdward Tomasz Napierala ic->ic_receive_len = 0; 636321b17ecSEdward Tomasz Napierala else 637321b17ecSEdward Tomasz Napierala ic->ic_receive_len = ISCSI_HEADER_DIGEST_SIZE; 638321b17ecSEdward Tomasz Napierala break; 639321b17ecSEdward Tomasz Napierala 640321b17ecSEdward Tomasz Napierala case ICL_CONN_STATE_HEADER_DIGEST: 641321b17ecSEdward Tomasz Napierala //ICL_DEBUG("receiving header digest"); 642321b17ecSEdward Tomasz Napierala error = icl_pdu_check_header_digest(request, availablep); 643321b17ecSEdward Tomasz Napierala if (error != 0) { 644321b17ecSEdward Tomasz Napierala ICL_DEBUG("header digest failed; " 645321b17ecSEdward Tomasz Napierala "dropping connection"); 646321b17ecSEdward Tomasz Napierala break; 647321b17ecSEdward Tomasz Napierala } 648321b17ecSEdward Tomasz Napierala 649321b17ecSEdward Tomasz Napierala ic->ic_receive_state = ICL_CONN_STATE_DATA; 650321b17ecSEdward Tomasz Napierala ic->ic_receive_len = 651321b17ecSEdward Tomasz Napierala icl_pdu_data_segment_receive_len(request); 652321b17ecSEdward Tomasz Napierala break; 653321b17ecSEdward Tomasz Napierala 654321b17ecSEdward Tomasz Napierala case ICL_CONN_STATE_DATA: 655321b17ecSEdward Tomasz Napierala //ICL_DEBUG("receiving data segment"); 656321b17ecSEdward Tomasz Napierala error = icl_pdu_receive_data_segment(request, availablep, 657321b17ecSEdward Tomasz Napierala &more_needed); 658321b17ecSEdward Tomasz Napierala if (error != 0) { 659321b17ecSEdward Tomasz Napierala ICL_DEBUG("failed to receive data segment;" 660321b17ecSEdward Tomasz Napierala "dropping connection"); 661321b17ecSEdward Tomasz Napierala break; 662321b17ecSEdward Tomasz Napierala } 663321b17ecSEdward Tomasz Napierala 664321b17ecSEdward Tomasz Napierala if (more_needed) 665321b17ecSEdward Tomasz Napierala break; 666321b17ecSEdward Tomasz Napierala 667321b17ecSEdward Tomasz Napierala ic->ic_receive_state = ICL_CONN_STATE_DATA_DIGEST; 668321b17ecSEdward Tomasz Napierala if (request->ip_data_len == 0 || ic->ic_data_crc32c == false) 669321b17ecSEdward Tomasz Napierala ic->ic_receive_len = 0; 670321b17ecSEdward Tomasz Napierala else 671321b17ecSEdward Tomasz Napierala ic->ic_receive_len = ISCSI_DATA_DIGEST_SIZE; 672321b17ecSEdward Tomasz Napierala break; 673321b17ecSEdward Tomasz Napierala 674321b17ecSEdward Tomasz Napierala case ICL_CONN_STATE_DATA_DIGEST: 675321b17ecSEdward Tomasz Napierala //ICL_DEBUG("receiving data digest"); 676321b17ecSEdward Tomasz Napierala error = icl_pdu_check_data_digest(request, availablep); 677321b17ecSEdward Tomasz Napierala if (error != 0) { 678321b17ecSEdward Tomasz Napierala ICL_DEBUG("data digest failed; " 679321b17ecSEdward Tomasz Napierala "dropping connection"); 680321b17ecSEdward Tomasz Napierala break; 681321b17ecSEdward Tomasz Napierala } 682321b17ecSEdward Tomasz Napierala 683321b17ecSEdward Tomasz Napierala /* 684321b17ecSEdward Tomasz Napierala * We've received complete PDU; reset the receive state machine 685321b17ecSEdward Tomasz Napierala * and return the PDU. 686321b17ecSEdward Tomasz Napierala */ 687321b17ecSEdward Tomasz Napierala ic->ic_receive_state = ICL_CONN_STATE_BHS; 688321b17ecSEdward Tomasz Napierala ic->ic_receive_len = sizeof(struct iscsi_bhs); 689321b17ecSEdward Tomasz Napierala ic->ic_receive_pdu = NULL; 690321b17ecSEdward Tomasz Napierala return (request); 691321b17ecSEdward Tomasz Napierala 692321b17ecSEdward Tomasz Napierala default: 693321b17ecSEdward Tomasz Napierala panic("invalid ic_receive_state %d\n", ic->ic_receive_state); 694321b17ecSEdward Tomasz Napierala } 695321b17ecSEdward Tomasz Napierala 696321b17ecSEdward Tomasz Napierala if (error != 0) { 697321b17ecSEdward Tomasz Napierala /* 698321b17ecSEdward Tomasz Napierala * Don't free the PDU; it's pointed to by ic->ic_receive_pdu 699321b17ecSEdward Tomasz Napierala * and will get freed in icl_conn_close(). 700321b17ecSEdward Tomasz Napierala */ 701321b17ecSEdward Tomasz Napierala icl_conn_fail(ic); 702321b17ecSEdward Tomasz Napierala } 703321b17ecSEdward Tomasz Napierala 704321b17ecSEdward Tomasz Napierala return (NULL); 705321b17ecSEdward Tomasz Napierala } 706321b17ecSEdward Tomasz Napierala 707321b17ecSEdward Tomasz Napierala static void 708321b17ecSEdward Tomasz Napierala icl_conn_receive_pdus(struct icl_conn *ic, size_t available) 709321b17ecSEdward Tomasz Napierala { 710321b17ecSEdward Tomasz Napierala struct icl_pdu *response; 711321b17ecSEdward Tomasz Napierala struct socket *so; 712321b17ecSEdward Tomasz Napierala 713321b17ecSEdward Tomasz Napierala so = ic->ic_socket; 714321b17ecSEdward Tomasz Napierala 715321b17ecSEdward Tomasz Napierala /* 716321b17ecSEdward Tomasz Napierala * This can never happen; we're careful to only mess with ic->ic_socket 717321b17ecSEdward Tomasz Napierala * pointer when the send/receive threads are not running. 718321b17ecSEdward Tomasz Napierala */ 719321b17ecSEdward Tomasz Napierala KASSERT(so != NULL, ("NULL socket")); 720321b17ecSEdward Tomasz Napierala 721321b17ecSEdward Tomasz Napierala for (;;) { 722321b17ecSEdward Tomasz Napierala if (ic->ic_disconnecting) 723321b17ecSEdward Tomasz Napierala return; 724321b17ecSEdward Tomasz Napierala 725321b17ecSEdward Tomasz Napierala if (so->so_error != 0) { 726321b17ecSEdward Tomasz Napierala ICL_DEBUG("connection error %d; " 727321b17ecSEdward Tomasz Napierala "dropping connection", so->so_error); 728321b17ecSEdward Tomasz Napierala icl_conn_fail(ic); 729321b17ecSEdward Tomasz Napierala return; 730321b17ecSEdward Tomasz Napierala } 731321b17ecSEdward Tomasz Napierala 732321b17ecSEdward Tomasz Napierala /* 733321b17ecSEdward Tomasz Napierala * Loop until we have a complete PDU or there is not enough 734321b17ecSEdward Tomasz Napierala * data in the socket buffer. 735321b17ecSEdward Tomasz Napierala */ 736321b17ecSEdward Tomasz Napierala if (available < ic->ic_receive_len) { 737321b17ecSEdward Tomasz Napierala #if 0 738321b17ecSEdward Tomasz Napierala ICL_DEBUG("not enough data; have %zd, " 739321b17ecSEdward Tomasz Napierala "need %zd", available, 740321b17ecSEdward Tomasz Napierala ic->ic_receive_len); 741321b17ecSEdward Tomasz Napierala #endif 742321b17ecSEdward Tomasz Napierala return; 743321b17ecSEdward Tomasz Napierala } 744321b17ecSEdward Tomasz Napierala 745321b17ecSEdward Tomasz Napierala response = icl_conn_receive_pdu(ic, &available); 746321b17ecSEdward Tomasz Napierala if (response == NULL) 747321b17ecSEdward Tomasz Napierala continue; 748321b17ecSEdward Tomasz Napierala 749321b17ecSEdward Tomasz Napierala if (response->ip_ahs_len > 0) { 750321b17ecSEdward Tomasz Napierala ICL_WARN("received PDU with unsupported " 751321b17ecSEdward Tomasz Napierala "AHS; opcode 0x%x; dropping connection", 752321b17ecSEdward Tomasz Napierala response->ip_bhs->bhs_opcode); 753321b17ecSEdward Tomasz Napierala icl_pdu_free(response); 754321b17ecSEdward Tomasz Napierala icl_conn_fail(ic); 755321b17ecSEdward Tomasz Napierala return; 756321b17ecSEdward Tomasz Napierala } 757321b17ecSEdward Tomasz Napierala 758321b17ecSEdward Tomasz Napierala (ic->ic_receive)(response); 759321b17ecSEdward Tomasz Napierala } 760321b17ecSEdward Tomasz Napierala } 761321b17ecSEdward Tomasz Napierala 762321b17ecSEdward Tomasz Napierala static void 763321b17ecSEdward Tomasz Napierala icl_receive_thread(void *arg) 764321b17ecSEdward Tomasz Napierala { 765321b17ecSEdward Tomasz Napierala struct icl_conn *ic; 766321b17ecSEdward Tomasz Napierala size_t available; 767321b17ecSEdward Tomasz Napierala struct socket *so; 768321b17ecSEdward Tomasz Napierala 769321b17ecSEdward Tomasz Napierala ic = arg; 770321b17ecSEdward Tomasz Napierala so = ic->ic_socket; 771321b17ecSEdward Tomasz Napierala 772321b17ecSEdward Tomasz Napierala ICL_CONN_LOCK(ic); 773321b17ecSEdward Tomasz Napierala ic->ic_receive_running = true; 774321b17ecSEdward Tomasz Napierala ICL_CONN_UNLOCK(ic); 775321b17ecSEdward Tomasz Napierala 776321b17ecSEdward Tomasz Napierala for (;;) { 777321b17ecSEdward Tomasz Napierala if (ic->ic_disconnecting) { 778321b17ecSEdward Tomasz Napierala //ICL_DEBUG("terminating"); 779321b17ecSEdward Tomasz Napierala break; 780321b17ecSEdward Tomasz Napierala } 781321b17ecSEdward Tomasz Napierala 782321b17ecSEdward Tomasz Napierala /* 783321b17ecSEdward Tomasz Napierala * Set the low watermark, to be checked by 784321b17ecSEdward Tomasz Napierala * soreadable() in icl_soupcall_receive() 785321b17ecSEdward Tomasz Napierala * to avoid unneccessary wakeups until there 786321b17ecSEdward Tomasz Napierala * is enough data received to read the PDU. 787321b17ecSEdward Tomasz Napierala */ 788321b17ecSEdward Tomasz Napierala SOCKBUF_LOCK(&so->so_rcv); 789321b17ecSEdward Tomasz Napierala available = sbavail(&so->so_rcv); 790321b17ecSEdward Tomasz Napierala if (available < ic->ic_receive_len) { 791321b17ecSEdward Tomasz Napierala so->so_rcv.sb_lowat = ic->ic_receive_len; 792321b17ecSEdward Tomasz Napierala cv_wait(&ic->ic_receive_cv, &so->so_rcv.sb_mtx); 793321b17ecSEdward Tomasz Napierala } else 794321b17ecSEdward Tomasz Napierala so->so_rcv.sb_lowat = so->so_rcv.sb_hiwat + 1; 795321b17ecSEdward Tomasz Napierala SOCKBUF_UNLOCK(&so->so_rcv); 796321b17ecSEdward Tomasz Napierala 797321b17ecSEdward Tomasz Napierala icl_conn_receive_pdus(ic, available); 798321b17ecSEdward Tomasz Napierala } 799321b17ecSEdward Tomasz Napierala 800321b17ecSEdward Tomasz Napierala ICL_CONN_LOCK(ic); 801321b17ecSEdward Tomasz Napierala ic->ic_receive_running = false; 802321b17ecSEdward Tomasz Napierala cv_signal(&ic->ic_send_cv); 803321b17ecSEdward Tomasz Napierala ICL_CONN_UNLOCK(ic); 804321b17ecSEdward Tomasz Napierala kthread_exit(); 805321b17ecSEdward Tomasz Napierala } 806321b17ecSEdward Tomasz Napierala 807321b17ecSEdward Tomasz Napierala static int 808321b17ecSEdward Tomasz Napierala icl_soupcall_receive(struct socket *so, void *arg, int waitflag) 809321b17ecSEdward Tomasz Napierala { 810321b17ecSEdward Tomasz Napierala struct icl_conn *ic; 811321b17ecSEdward Tomasz Napierala 812321b17ecSEdward Tomasz Napierala if (!soreadable(so)) 813321b17ecSEdward Tomasz Napierala return (SU_OK); 814321b17ecSEdward Tomasz Napierala 815321b17ecSEdward Tomasz Napierala ic = arg; 816321b17ecSEdward Tomasz Napierala cv_signal(&ic->ic_receive_cv); 817321b17ecSEdward Tomasz Napierala return (SU_OK); 818321b17ecSEdward Tomasz Napierala } 819321b17ecSEdward Tomasz Napierala 820321b17ecSEdward Tomasz Napierala static int 821321b17ecSEdward Tomasz Napierala icl_pdu_finalize(struct icl_pdu *request) 822321b17ecSEdward Tomasz Napierala { 823321b17ecSEdward Tomasz Napierala size_t padding, pdu_len; 824321b17ecSEdward Tomasz Napierala uint32_t digest, zero = 0; 825321b17ecSEdward Tomasz Napierala int ok; 826321b17ecSEdward Tomasz Napierala struct icl_conn *ic; 827321b17ecSEdward Tomasz Napierala 828321b17ecSEdward Tomasz Napierala ic = request->ip_conn; 829321b17ecSEdward Tomasz Napierala 830321b17ecSEdward Tomasz Napierala icl_pdu_set_data_segment_length(request, request->ip_data_len); 831321b17ecSEdward Tomasz Napierala 832321b17ecSEdward Tomasz Napierala pdu_len = icl_pdu_size(request); 833321b17ecSEdward Tomasz Napierala 834321b17ecSEdward Tomasz Napierala if (ic->ic_header_crc32c) { 835321b17ecSEdward Tomasz Napierala digest = icl_mbuf_to_crc32c(request->ip_bhs_mbuf); 836321b17ecSEdward Tomasz Napierala ok = m_append(request->ip_bhs_mbuf, sizeof(digest), 837321b17ecSEdward Tomasz Napierala (void *)&digest); 838321b17ecSEdward Tomasz Napierala if (ok != 1) { 839321b17ecSEdward Tomasz Napierala ICL_WARN("failed to append header digest"); 840321b17ecSEdward Tomasz Napierala return (1); 841321b17ecSEdward Tomasz Napierala } 842321b17ecSEdward Tomasz Napierala } 843321b17ecSEdward Tomasz Napierala 844321b17ecSEdward Tomasz Napierala if (request->ip_data_len != 0) { 845321b17ecSEdward Tomasz Napierala padding = icl_pdu_padding(request); 846321b17ecSEdward Tomasz Napierala if (padding > 0) { 847321b17ecSEdward Tomasz Napierala ok = m_append(request->ip_data_mbuf, padding, 848321b17ecSEdward Tomasz Napierala (void *)&zero); 849321b17ecSEdward Tomasz Napierala if (ok != 1) { 850321b17ecSEdward Tomasz Napierala ICL_WARN("failed to append padding"); 851321b17ecSEdward Tomasz Napierala return (1); 852321b17ecSEdward Tomasz Napierala } 853321b17ecSEdward Tomasz Napierala } 854321b17ecSEdward Tomasz Napierala 855321b17ecSEdward Tomasz Napierala if (ic->ic_data_crc32c) { 856321b17ecSEdward Tomasz Napierala digest = icl_mbuf_to_crc32c(request->ip_data_mbuf); 857321b17ecSEdward Tomasz Napierala 858321b17ecSEdward Tomasz Napierala ok = m_append(request->ip_data_mbuf, sizeof(digest), 859321b17ecSEdward Tomasz Napierala (void *)&digest); 860321b17ecSEdward Tomasz Napierala if (ok != 1) { 861321b17ecSEdward Tomasz Napierala ICL_WARN("failed to append data digest"); 862321b17ecSEdward Tomasz Napierala return (1); 863321b17ecSEdward Tomasz Napierala } 864321b17ecSEdward Tomasz Napierala } 865321b17ecSEdward Tomasz Napierala 866321b17ecSEdward Tomasz Napierala m_cat(request->ip_bhs_mbuf, request->ip_data_mbuf); 867321b17ecSEdward Tomasz Napierala request->ip_data_mbuf = NULL; 868321b17ecSEdward Tomasz Napierala } 869321b17ecSEdward Tomasz Napierala 870321b17ecSEdward Tomasz Napierala request->ip_bhs_mbuf->m_pkthdr.len = pdu_len; 871321b17ecSEdward Tomasz Napierala 872321b17ecSEdward Tomasz Napierala return (0); 873321b17ecSEdward Tomasz Napierala } 874321b17ecSEdward Tomasz Napierala 875321b17ecSEdward Tomasz Napierala static void 876321b17ecSEdward Tomasz Napierala icl_conn_send_pdus(struct icl_conn *ic, struct icl_pdu_stailq *queue) 877321b17ecSEdward Tomasz Napierala { 878321b17ecSEdward Tomasz Napierala struct icl_pdu *request, *request2; 879321b17ecSEdward Tomasz Napierala struct socket *so; 880321b17ecSEdward Tomasz Napierala size_t available, size, size2; 881321b17ecSEdward Tomasz Napierala int coalesced, error; 882321b17ecSEdward Tomasz Napierala 883321b17ecSEdward Tomasz Napierala ICL_CONN_LOCK_ASSERT_NOT(ic); 884321b17ecSEdward Tomasz Napierala 885321b17ecSEdward Tomasz Napierala so = ic->ic_socket; 886321b17ecSEdward Tomasz Napierala 887321b17ecSEdward Tomasz Napierala SOCKBUF_LOCK(&so->so_snd); 888321b17ecSEdward Tomasz Napierala /* 889321b17ecSEdward Tomasz Napierala * Check how much space do we have for transmit. We can't just 890321b17ecSEdward Tomasz Napierala * call sosend() and retry when we get EWOULDBLOCK or EMSGSIZE, 891321b17ecSEdward Tomasz Napierala * as it always frees the mbuf chain passed to it, even in case 892321b17ecSEdward Tomasz Napierala * of error. 893321b17ecSEdward Tomasz Napierala */ 894321b17ecSEdward Tomasz Napierala available = sbspace(&so->so_snd); 895321b17ecSEdward Tomasz Napierala 896321b17ecSEdward Tomasz Napierala /* 897321b17ecSEdward Tomasz Napierala * Notify the socket upcall that we don't need wakeups 898321b17ecSEdward Tomasz Napierala * for the time being. 899321b17ecSEdward Tomasz Napierala */ 900321b17ecSEdward Tomasz Napierala so->so_snd.sb_lowat = so->so_snd.sb_hiwat + 1; 901321b17ecSEdward Tomasz Napierala SOCKBUF_UNLOCK(&so->so_snd); 902321b17ecSEdward Tomasz Napierala 903321b17ecSEdward Tomasz Napierala while (!STAILQ_EMPTY(queue)) { 904321b17ecSEdward Tomasz Napierala request = STAILQ_FIRST(queue); 905321b17ecSEdward Tomasz Napierala size = icl_pdu_size(request); 906321b17ecSEdward Tomasz Napierala if (available < size) { 907321b17ecSEdward Tomasz Napierala 908321b17ecSEdward Tomasz Napierala /* 909321b17ecSEdward Tomasz Napierala * Set the low watermark, to be checked by 910321b17ecSEdward Tomasz Napierala * sowriteable() in icl_soupcall_send() 911321b17ecSEdward Tomasz Napierala * to avoid unneccessary wakeups until there 912321b17ecSEdward Tomasz Napierala * is enough space for the PDU to fit. 913321b17ecSEdward Tomasz Napierala */ 914321b17ecSEdward Tomasz Napierala SOCKBUF_LOCK(&so->so_snd); 915321b17ecSEdward Tomasz Napierala available = sbspace(&so->so_snd); 916321b17ecSEdward Tomasz Napierala if (available < size) { 917321b17ecSEdward Tomasz Napierala #if 1 918321b17ecSEdward Tomasz Napierala ICL_DEBUG("no space to send; " 919321b17ecSEdward Tomasz Napierala "have %zd, need %zd", 920321b17ecSEdward Tomasz Napierala available, size); 921321b17ecSEdward Tomasz Napierala #endif 922321b17ecSEdward Tomasz Napierala so->so_snd.sb_lowat = size; 923321b17ecSEdward Tomasz Napierala SOCKBUF_UNLOCK(&so->so_snd); 924321b17ecSEdward Tomasz Napierala return; 925321b17ecSEdward Tomasz Napierala } 926321b17ecSEdward Tomasz Napierala SOCKBUF_UNLOCK(&so->so_snd); 927321b17ecSEdward Tomasz Napierala } 928321b17ecSEdward Tomasz Napierala STAILQ_REMOVE_HEAD(queue, ip_next); 929321b17ecSEdward Tomasz Napierala error = icl_pdu_finalize(request); 930321b17ecSEdward Tomasz Napierala if (error != 0) { 931321b17ecSEdward Tomasz Napierala ICL_DEBUG("failed to finalize PDU; " 932321b17ecSEdward Tomasz Napierala "dropping connection"); 933321b17ecSEdward Tomasz Napierala icl_conn_fail(ic); 934321b17ecSEdward Tomasz Napierala icl_pdu_free(request); 935321b17ecSEdward Tomasz Napierala return; 936321b17ecSEdward Tomasz Napierala } 937321b17ecSEdward Tomasz Napierala if (coalesce) { 938321b17ecSEdward Tomasz Napierala coalesced = 1; 939321b17ecSEdward Tomasz Napierala for (;;) { 940321b17ecSEdward Tomasz Napierala request2 = STAILQ_FIRST(queue); 941321b17ecSEdward Tomasz Napierala if (request2 == NULL) 942321b17ecSEdward Tomasz Napierala break; 943321b17ecSEdward Tomasz Napierala size2 = icl_pdu_size(request2); 944321b17ecSEdward Tomasz Napierala if (available < size + size2) 945321b17ecSEdward Tomasz Napierala break; 946321b17ecSEdward Tomasz Napierala STAILQ_REMOVE_HEAD(queue, ip_next); 947321b17ecSEdward Tomasz Napierala error = icl_pdu_finalize(request2); 948321b17ecSEdward Tomasz Napierala if (error != 0) { 949321b17ecSEdward Tomasz Napierala ICL_DEBUG("failed to finalize PDU; " 950321b17ecSEdward Tomasz Napierala "dropping connection"); 951321b17ecSEdward Tomasz Napierala icl_conn_fail(ic); 952321b17ecSEdward Tomasz Napierala icl_pdu_free(request); 953321b17ecSEdward Tomasz Napierala icl_pdu_free(request2); 954321b17ecSEdward Tomasz Napierala return; 955321b17ecSEdward Tomasz Napierala } 956321b17ecSEdward Tomasz Napierala m_cat(request->ip_bhs_mbuf, request2->ip_bhs_mbuf); 957321b17ecSEdward Tomasz Napierala request2->ip_bhs_mbuf = NULL; 958321b17ecSEdward Tomasz Napierala request->ip_bhs_mbuf->m_pkthdr.len += size2; 959321b17ecSEdward Tomasz Napierala size += size2; 960321b17ecSEdward Tomasz Napierala STAILQ_REMOVE_AFTER(queue, request, ip_next); 961321b17ecSEdward Tomasz Napierala icl_pdu_free(request2); 962321b17ecSEdward Tomasz Napierala coalesced++; 963321b17ecSEdward Tomasz Napierala } 964321b17ecSEdward Tomasz Napierala #if 0 965321b17ecSEdward Tomasz Napierala if (coalesced > 1) { 966321b17ecSEdward Tomasz Napierala ICL_DEBUG("coalesced %d PDUs into %zd bytes", 967321b17ecSEdward Tomasz Napierala coalesced, size); 968321b17ecSEdward Tomasz Napierala } 969321b17ecSEdward Tomasz Napierala #endif 970321b17ecSEdward Tomasz Napierala } 971321b17ecSEdward Tomasz Napierala available -= size; 972321b17ecSEdward Tomasz Napierala error = sosend(so, NULL, NULL, request->ip_bhs_mbuf, 973321b17ecSEdward Tomasz Napierala NULL, MSG_DONTWAIT, curthread); 974321b17ecSEdward Tomasz Napierala request->ip_bhs_mbuf = NULL; /* Sosend consumes the mbuf. */ 975321b17ecSEdward Tomasz Napierala if (error != 0) { 976321b17ecSEdward Tomasz Napierala ICL_DEBUG("failed to send PDU, error %d; " 977321b17ecSEdward Tomasz Napierala "dropping connection", error); 978321b17ecSEdward Tomasz Napierala icl_conn_fail(ic); 979321b17ecSEdward Tomasz Napierala icl_pdu_free(request); 980321b17ecSEdward Tomasz Napierala return; 981321b17ecSEdward Tomasz Napierala } 982321b17ecSEdward Tomasz Napierala icl_pdu_free(request); 983321b17ecSEdward Tomasz Napierala } 984321b17ecSEdward Tomasz Napierala } 985321b17ecSEdward Tomasz Napierala 986321b17ecSEdward Tomasz Napierala static void 987321b17ecSEdward Tomasz Napierala icl_send_thread(void *arg) 988321b17ecSEdward Tomasz Napierala { 989321b17ecSEdward Tomasz Napierala struct icl_conn *ic; 990321b17ecSEdward Tomasz Napierala struct icl_pdu_stailq queue; 991321b17ecSEdward Tomasz Napierala 992321b17ecSEdward Tomasz Napierala ic = arg; 993321b17ecSEdward Tomasz Napierala 994321b17ecSEdward Tomasz Napierala STAILQ_INIT(&queue); 995321b17ecSEdward Tomasz Napierala 996321b17ecSEdward Tomasz Napierala ICL_CONN_LOCK(ic); 997321b17ecSEdward Tomasz Napierala ic->ic_send_running = true; 998321b17ecSEdward Tomasz Napierala 999321b17ecSEdward Tomasz Napierala for (;;) { 1000321b17ecSEdward Tomasz Napierala for (;;) { 1001321b17ecSEdward Tomasz Napierala /* 1002321b17ecSEdward Tomasz Napierala * If the local queue is empty, populate it from 1003321b17ecSEdward Tomasz Napierala * the main one. This way the icl_conn_send_pdus() 1004321b17ecSEdward Tomasz Napierala * can go through all the queued PDUs without holding 1005321b17ecSEdward Tomasz Napierala * any locks. 1006321b17ecSEdward Tomasz Napierala */ 1007321b17ecSEdward Tomasz Napierala if (STAILQ_EMPTY(&queue)) 1008321b17ecSEdward Tomasz Napierala STAILQ_SWAP(&ic->ic_to_send, &queue, icl_pdu); 1009321b17ecSEdward Tomasz Napierala 1010321b17ecSEdward Tomasz Napierala ic->ic_check_send_space = false; 1011321b17ecSEdward Tomasz Napierala ICL_CONN_UNLOCK(ic); 1012321b17ecSEdward Tomasz Napierala icl_conn_send_pdus(ic, &queue); 1013321b17ecSEdward Tomasz Napierala ICL_CONN_LOCK(ic); 1014321b17ecSEdward Tomasz Napierala 1015321b17ecSEdward Tomasz Napierala /* 1016321b17ecSEdward Tomasz Napierala * The icl_soupcall_send() was called since the last 1017321b17ecSEdward Tomasz Napierala * call to sbspace(); go around; 1018321b17ecSEdward Tomasz Napierala */ 1019321b17ecSEdward Tomasz Napierala if (ic->ic_check_send_space) 1020321b17ecSEdward Tomasz Napierala continue; 1021321b17ecSEdward Tomasz Napierala 1022321b17ecSEdward Tomasz Napierala /* 1023321b17ecSEdward Tomasz Napierala * Local queue is empty, but we still have PDUs 1024321b17ecSEdward Tomasz Napierala * in the main one; go around. 1025321b17ecSEdward Tomasz Napierala */ 1026321b17ecSEdward Tomasz Napierala if (STAILQ_EMPTY(&queue) && 1027321b17ecSEdward Tomasz Napierala !STAILQ_EMPTY(&ic->ic_to_send)) 1028321b17ecSEdward Tomasz Napierala continue; 1029321b17ecSEdward Tomasz Napierala 1030321b17ecSEdward Tomasz Napierala /* 1031321b17ecSEdward Tomasz Napierala * There might be some stuff in the local queue, 1032321b17ecSEdward Tomasz Napierala * which didn't get sent due to not having enough send 1033321b17ecSEdward Tomasz Napierala * space. Wait for socket upcall. 1034321b17ecSEdward Tomasz Napierala */ 1035321b17ecSEdward Tomasz Napierala break; 1036321b17ecSEdward Tomasz Napierala } 1037321b17ecSEdward Tomasz Napierala 1038321b17ecSEdward Tomasz Napierala if (ic->ic_disconnecting) { 1039321b17ecSEdward Tomasz Napierala //ICL_DEBUG("terminating"); 1040321b17ecSEdward Tomasz Napierala break; 1041321b17ecSEdward Tomasz Napierala } 1042321b17ecSEdward Tomasz Napierala 1043321b17ecSEdward Tomasz Napierala cv_wait(&ic->ic_send_cv, ic->ic_lock); 1044321b17ecSEdward Tomasz Napierala } 1045321b17ecSEdward Tomasz Napierala 1046321b17ecSEdward Tomasz Napierala /* 1047321b17ecSEdward Tomasz Napierala * We're exiting; move PDUs back to the main queue, so they can 1048321b17ecSEdward Tomasz Napierala * get freed properly. At this point ordering doesn't matter. 1049321b17ecSEdward Tomasz Napierala */ 1050321b17ecSEdward Tomasz Napierala STAILQ_CONCAT(&ic->ic_to_send, &queue); 1051321b17ecSEdward Tomasz Napierala 1052321b17ecSEdward Tomasz Napierala ic->ic_send_running = false; 1053321b17ecSEdward Tomasz Napierala cv_signal(&ic->ic_send_cv); 1054321b17ecSEdward Tomasz Napierala ICL_CONN_UNLOCK(ic); 1055321b17ecSEdward Tomasz Napierala kthread_exit(); 1056321b17ecSEdward Tomasz Napierala } 1057321b17ecSEdward Tomasz Napierala 1058321b17ecSEdward Tomasz Napierala static int 1059321b17ecSEdward Tomasz Napierala icl_soupcall_send(struct socket *so, void *arg, int waitflag) 1060321b17ecSEdward Tomasz Napierala { 1061321b17ecSEdward Tomasz Napierala struct icl_conn *ic; 1062321b17ecSEdward Tomasz Napierala 1063321b17ecSEdward Tomasz Napierala if (!sowriteable(so)) 1064321b17ecSEdward Tomasz Napierala return (SU_OK); 1065321b17ecSEdward Tomasz Napierala 1066321b17ecSEdward Tomasz Napierala ic = arg; 1067321b17ecSEdward Tomasz Napierala 1068321b17ecSEdward Tomasz Napierala ICL_CONN_LOCK(ic); 1069321b17ecSEdward Tomasz Napierala ic->ic_check_send_space = true; 1070321b17ecSEdward Tomasz Napierala ICL_CONN_UNLOCK(ic); 1071321b17ecSEdward Tomasz Napierala 1072321b17ecSEdward Tomasz Napierala cv_signal(&ic->ic_send_cv); 1073321b17ecSEdward Tomasz Napierala 1074321b17ecSEdward Tomasz Napierala return (SU_OK); 1075321b17ecSEdward Tomasz Napierala } 1076321b17ecSEdward Tomasz Napierala 1077321b17ecSEdward Tomasz Napierala static int 1078321b17ecSEdward Tomasz Napierala icl_pdu_append_data(struct icl_pdu *request, const void *addr, size_t len, 1079321b17ecSEdward Tomasz Napierala int flags) 1080321b17ecSEdward Tomasz Napierala { 1081321b17ecSEdward Tomasz Napierala struct mbuf *mb, *newmb; 1082321b17ecSEdward Tomasz Napierala size_t copylen, off = 0; 1083321b17ecSEdward Tomasz Napierala 1084321b17ecSEdward Tomasz Napierala KASSERT(len > 0, ("len == 0")); 1085321b17ecSEdward Tomasz Napierala 1086321b17ecSEdward Tomasz Napierala newmb = m_getm2(NULL, len, flags, MT_DATA, M_PKTHDR); 1087321b17ecSEdward Tomasz Napierala if (newmb == NULL) { 1088321b17ecSEdward Tomasz Napierala ICL_WARN("failed to allocate mbuf for %zd bytes", len); 1089321b17ecSEdward Tomasz Napierala return (ENOMEM); 1090321b17ecSEdward Tomasz Napierala } 1091321b17ecSEdward Tomasz Napierala 1092321b17ecSEdward Tomasz Napierala for (mb = newmb; mb != NULL; mb = mb->m_next) { 1093321b17ecSEdward Tomasz Napierala copylen = min(M_TRAILINGSPACE(mb), len - off); 1094321b17ecSEdward Tomasz Napierala memcpy(mtod(mb, char *), (const char *)addr + off, copylen); 1095321b17ecSEdward Tomasz Napierala mb->m_len = copylen; 1096321b17ecSEdward Tomasz Napierala off += copylen; 1097321b17ecSEdward Tomasz Napierala } 1098321b17ecSEdward Tomasz Napierala KASSERT(off == len, ("%s: off != len", __func__)); 1099321b17ecSEdward Tomasz Napierala 1100321b17ecSEdward Tomasz Napierala if (request->ip_data_mbuf == NULL) { 1101321b17ecSEdward Tomasz Napierala request->ip_data_mbuf = newmb; 1102321b17ecSEdward Tomasz Napierala request->ip_data_len = len; 1103321b17ecSEdward Tomasz Napierala } else { 1104321b17ecSEdward Tomasz Napierala m_cat(request->ip_data_mbuf, newmb); 1105321b17ecSEdward Tomasz Napierala request->ip_data_len += len; 1106321b17ecSEdward Tomasz Napierala } 1107321b17ecSEdward Tomasz Napierala 1108321b17ecSEdward Tomasz Napierala return (0); 1109321b17ecSEdward Tomasz Napierala } 1110321b17ecSEdward Tomasz Napierala 1111321b17ecSEdward Tomasz Napierala int 1112321b17ecSEdward Tomasz Napierala icl_soft_conn_pdu_append_data(struct icl_conn *ic, struct icl_pdu *request, 1113321b17ecSEdward Tomasz Napierala const void *addr, size_t len, int flags) 1114321b17ecSEdward Tomasz Napierala { 1115321b17ecSEdward Tomasz Napierala 1116321b17ecSEdward Tomasz Napierala return (icl_pdu_append_data(request, addr, len, flags)); 1117321b17ecSEdward Tomasz Napierala } 1118321b17ecSEdward Tomasz Napierala 1119321b17ecSEdward Tomasz Napierala static void 1120321b17ecSEdward Tomasz Napierala icl_pdu_get_data(struct icl_pdu *ip, size_t off, void *addr, size_t len) 1121321b17ecSEdward Tomasz Napierala { 1122321b17ecSEdward Tomasz Napierala 1123321b17ecSEdward Tomasz Napierala m_copydata(ip->ip_data_mbuf, off, len, addr); 1124321b17ecSEdward Tomasz Napierala } 1125321b17ecSEdward Tomasz Napierala 1126321b17ecSEdward Tomasz Napierala void 1127321b17ecSEdward Tomasz Napierala icl_soft_conn_pdu_get_data(struct icl_conn *ic, struct icl_pdu *ip, 1128321b17ecSEdward Tomasz Napierala size_t off, void *addr, size_t len) 1129321b17ecSEdward Tomasz Napierala { 1130321b17ecSEdward Tomasz Napierala 1131321b17ecSEdward Tomasz Napierala return (icl_pdu_get_data(ip, off, addr, len)); 1132321b17ecSEdward Tomasz Napierala } 1133321b17ecSEdward Tomasz Napierala 1134321b17ecSEdward Tomasz Napierala static void 1135321b17ecSEdward Tomasz Napierala icl_pdu_queue(struct icl_pdu *ip) 1136321b17ecSEdward Tomasz Napierala { 1137321b17ecSEdward Tomasz Napierala struct icl_conn *ic; 1138321b17ecSEdward Tomasz Napierala 1139321b17ecSEdward Tomasz Napierala ic = ip->ip_conn; 1140321b17ecSEdward Tomasz Napierala 1141321b17ecSEdward Tomasz Napierala ICL_CONN_LOCK_ASSERT(ic); 1142321b17ecSEdward Tomasz Napierala 1143321b17ecSEdward Tomasz Napierala if (ic->ic_disconnecting || ic->ic_socket == NULL) { 1144321b17ecSEdward Tomasz Napierala ICL_DEBUG("icl_pdu_queue on closed connection"); 1145321b17ecSEdward Tomasz Napierala icl_pdu_free(ip); 1146321b17ecSEdward Tomasz Napierala return; 1147321b17ecSEdward Tomasz Napierala } 1148321b17ecSEdward Tomasz Napierala 1149321b17ecSEdward Tomasz Napierala if (!STAILQ_EMPTY(&ic->ic_to_send)) { 1150321b17ecSEdward Tomasz Napierala STAILQ_INSERT_TAIL(&ic->ic_to_send, ip, ip_next); 1151321b17ecSEdward Tomasz Napierala /* 1152321b17ecSEdward Tomasz Napierala * If the queue is not empty, someone else had already 1153321b17ecSEdward Tomasz Napierala * signaled the send thread; no need to do that again, 1154321b17ecSEdward Tomasz Napierala * just return. 1155321b17ecSEdward Tomasz Napierala */ 1156321b17ecSEdward Tomasz Napierala return; 1157321b17ecSEdward Tomasz Napierala } 1158321b17ecSEdward Tomasz Napierala 1159321b17ecSEdward Tomasz Napierala STAILQ_INSERT_TAIL(&ic->ic_to_send, ip, ip_next); 1160321b17ecSEdward Tomasz Napierala cv_signal(&ic->ic_send_cv); 1161321b17ecSEdward Tomasz Napierala } 1162321b17ecSEdward Tomasz Napierala 1163321b17ecSEdward Tomasz Napierala void 1164321b17ecSEdward Tomasz Napierala icl_soft_conn_pdu_queue(struct icl_conn *ic, struct icl_pdu *ip) 1165321b17ecSEdward Tomasz Napierala { 1166321b17ecSEdward Tomasz Napierala 1167321b17ecSEdward Tomasz Napierala icl_pdu_queue(ip); 1168321b17ecSEdward Tomasz Napierala } 1169321b17ecSEdward Tomasz Napierala 1170321b17ecSEdward Tomasz Napierala static struct icl_conn * 1171321b17ecSEdward Tomasz Napierala icl_soft_new_conn(const char *name, struct mtx *lock) 1172321b17ecSEdward Tomasz Napierala { 1173321b17ecSEdward Tomasz Napierala struct icl_conn *ic; 1174321b17ecSEdward Tomasz Napierala 1175321b17ecSEdward Tomasz Napierala refcount_acquire(&icl_ncons); 1176321b17ecSEdward Tomasz Napierala 1177321b17ecSEdward Tomasz Napierala ic = (struct icl_conn *)kobj_create(&icl_soft_class, M_ICL_SOFT, M_WAITOK | M_ZERO); 1178321b17ecSEdward Tomasz Napierala 1179321b17ecSEdward Tomasz Napierala STAILQ_INIT(&ic->ic_to_send); 1180321b17ecSEdward Tomasz Napierala ic->ic_lock = lock; 1181321b17ecSEdward Tomasz Napierala cv_init(&ic->ic_send_cv, "icl_tx"); 1182321b17ecSEdward Tomasz Napierala cv_init(&ic->ic_receive_cv, "icl_rx"); 1183321b17ecSEdward Tomasz Napierala #ifdef DIAGNOSTIC 1184321b17ecSEdward Tomasz Napierala refcount_init(&ic->ic_outstanding_pdus, 0); 1185321b17ecSEdward Tomasz Napierala #endif 1186321b17ecSEdward Tomasz Napierala ic->ic_max_data_segment_length = ICL_MAX_DATA_SEGMENT_LENGTH; 1187321b17ecSEdward Tomasz Napierala ic->ic_name = name; 1188321b17ecSEdward Tomasz Napierala 1189321b17ecSEdward Tomasz Napierala return (ic); 1190321b17ecSEdward Tomasz Napierala } 1191321b17ecSEdward Tomasz Napierala 1192321b17ecSEdward Tomasz Napierala void 1193321b17ecSEdward Tomasz Napierala icl_soft_conn_free(struct icl_conn *ic) 1194321b17ecSEdward Tomasz Napierala { 1195321b17ecSEdward Tomasz Napierala 1196321b17ecSEdward Tomasz Napierala cv_destroy(&ic->ic_send_cv); 1197321b17ecSEdward Tomasz Napierala cv_destroy(&ic->ic_receive_cv); 1198321b17ecSEdward Tomasz Napierala kobj_delete((struct kobj *)ic, M_ICL_SOFT); 1199321b17ecSEdward Tomasz Napierala refcount_release(&icl_ncons); 1200321b17ecSEdward Tomasz Napierala } 1201321b17ecSEdward Tomasz Napierala 1202321b17ecSEdward Tomasz Napierala static int 1203321b17ecSEdward Tomasz Napierala icl_conn_start(struct icl_conn *ic) 1204321b17ecSEdward Tomasz Napierala { 1205321b17ecSEdward Tomasz Napierala size_t minspace; 1206321b17ecSEdward Tomasz Napierala struct sockopt opt; 1207321b17ecSEdward Tomasz Napierala int error, one = 1; 1208321b17ecSEdward Tomasz Napierala 1209321b17ecSEdward Tomasz Napierala ICL_CONN_LOCK(ic); 1210321b17ecSEdward Tomasz Napierala 1211321b17ecSEdward Tomasz Napierala /* 1212321b17ecSEdward Tomasz Napierala * XXX: Ugly hack. 1213321b17ecSEdward Tomasz Napierala */ 1214321b17ecSEdward Tomasz Napierala if (ic->ic_socket == NULL) { 1215321b17ecSEdward Tomasz Napierala ICL_CONN_UNLOCK(ic); 1216321b17ecSEdward Tomasz Napierala return (EINVAL); 1217321b17ecSEdward Tomasz Napierala } 1218321b17ecSEdward Tomasz Napierala 1219321b17ecSEdward Tomasz Napierala ic->ic_receive_state = ICL_CONN_STATE_BHS; 1220321b17ecSEdward Tomasz Napierala ic->ic_receive_len = sizeof(struct iscsi_bhs); 1221321b17ecSEdward Tomasz Napierala ic->ic_disconnecting = false; 1222321b17ecSEdward Tomasz Napierala 1223321b17ecSEdward Tomasz Napierala ICL_CONN_UNLOCK(ic); 1224321b17ecSEdward Tomasz Napierala 1225321b17ecSEdward Tomasz Napierala /* 1226321b17ecSEdward Tomasz Napierala * For sendspace, this is required because the current code cannot 1227321b17ecSEdward Tomasz Napierala * send a PDU in pieces; thus, the minimum buffer size is equal 1228321b17ecSEdward Tomasz Napierala * to the maximum PDU size. "+4" is to account for possible padding. 1229321b17ecSEdward Tomasz Napierala * 1230321b17ecSEdward Tomasz Napierala * What we should actually do here is to use autoscaling, but set 1231321b17ecSEdward Tomasz Napierala * some minimal buffer size to "minspace". I don't know a way to do 1232321b17ecSEdward Tomasz Napierala * that, though. 1233321b17ecSEdward Tomasz Napierala */ 1234321b17ecSEdward Tomasz Napierala minspace = sizeof(struct iscsi_bhs) + ic->ic_max_data_segment_length + 1235321b17ecSEdward Tomasz Napierala ISCSI_HEADER_DIGEST_SIZE + ISCSI_DATA_DIGEST_SIZE + 4; 1236321b17ecSEdward Tomasz Napierala if (sendspace < minspace) { 1237321b17ecSEdward Tomasz Napierala ICL_WARN("kern.icl.sendspace too low; must be at least %zd", 1238321b17ecSEdward Tomasz Napierala minspace); 1239321b17ecSEdward Tomasz Napierala sendspace = minspace; 1240321b17ecSEdward Tomasz Napierala } 1241321b17ecSEdward Tomasz Napierala if (recvspace < minspace) { 1242321b17ecSEdward Tomasz Napierala ICL_WARN("kern.icl.recvspace too low; must be at least %zd", 1243321b17ecSEdward Tomasz Napierala minspace); 1244321b17ecSEdward Tomasz Napierala recvspace = minspace; 1245321b17ecSEdward Tomasz Napierala } 1246321b17ecSEdward Tomasz Napierala 1247321b17ecSEdward Tomasz Napierala error = soreserve(ic->ic_socket, sendspace, recvspace); 1248321b17ecSEdward Tomasz Napierala if (error != 0) { 1249321b17ecSEdward Tomasz Napierala ICL_WARN("soreserve failed with error %d", error); 1250321b17ecSEdward Tomasz Napierala icl_conn_close(ic); 1251321b17ecSEdward Tomasz Napierala return (error); 1252321b17ecSEdward Tomasz Napierala } 1253321b17ecSEdward Tomasz Napierala ic->ic_socket->so_snd.sb_flags |= SB_AUTOSIZE; 1254321b17ecSEdward Tomasz Napierala ic->ic_socket->so_rcv.sb_flags |= SB_AUTOSIZE; 1255321b17ecSEdward Tomasz Napierala 1256321b17ecSEdward Tomasz Napierala /* 1257321b17ecSEdward Tomasz Napierala * Disable Nagle. 1258321b17ecSEdward Tomasz Napierala */ 1259321b17ecSEdward Tomasz Napierala bzero(&opt, sizeof(opt)); 1260321b17ecSEdward Tomasz Napierala opt.sopt_dir = SOPT_SET; 1261321b17ecSEdward Tomasz Napierala opt.sopt_level = IPPROTO_TCP; 1262321b17ecSEdward Tomasz Napierala opt.sopt_name = TCP_NODELAY; 1263321b17ecSEdward Tomasz Napierala opt.sopt_val = &one; 1264321b17ecSEdward Tomasz Napierala opt.sopt_valsize = sizeof(one); 1265321b17ecSEdward Tomasz Napierala error = sosetopt(ic->ic_socket, &opt); 1266321b17ecSEdward Tomasz Napierala if (error != 0) { 1267321b17ecSEdward Tomasz Napierala ICL_WARN("disabling TCP_NODELAY failed with error %d", error); 1268321b17ecSEdward Tomasz Napierala icl_conn_close(ic); 1269321b17ecSEdward Tomasz Napierala return (error); 1270321b17ecSEdward Tomasz Napierala } 1271321b17ecSEdward Tomasz Napierala 1272321b17ecSEdward Tomasz Napierala /* 1273321b17ecSEdward Tomasz Napierala * Start threads. 1274321b17ecSEdward Tomasz Napierala */ 1275321b17ecSEdward Tomasz Napierala error = kthread_add(icl_send_thread, ic, NULL, NULL, 0, 0, "%stx", 1276321b17ecSEdward Tomasz Napierala ic->ic_name); 1277321b17ecSEdward Tomasz Napierala if (error != 0) { 1278321b17ecSEdward Tomasz Napierala ICL_WARN("kthread_add(9) failed with error %d", error); 1279321b17ecSEdward Tomasz Napierala icl_conn_close(ic); 1280321b17ecSEdward Tomasz Napierala return (error); 1281321b17ecSEdward Tomasz Napierala } 1282321b17ecSEdward Tomasz Napierala 1283321b17ecSEdward Tomasz Napierala error = kthread_add(icl_receive_thread, ic, NULL, NULL, 0, 0, "%srx", 1284321b17ecSEdward Tomasz Napierala ic->ic_name); 1285321b17ecSEdward Tomasz Napierala if (error != 0) { 1286321b17ecSEdward Tomasz Napierala ICL_WARN("kthread_add(9) failed with error %d", error); 1287321b17ecSEdward Tomasz Napierala icl_conn_close(ic); 1288321b17ecSEdward Tomasz Napierala return (error); 1289321b17ecSEdward Tomasz Napierala } 1290321b17ecSEdward Tomasz Napierala 1291321b17ecSEdward Tomasz Napierala /* 1292321b17ecSEdward Tomasz Napierala * Register socket upcall, to get notified about incoming PDUs 1293321b17ecSEdward Tomasz Napierala * and free space to send outgoing ones. 1294321b17ecSEdward Tomasz Napierala */ 1295321b17ecSEdward Tomasz Napierala SOCKBUF_LOCK(&ic->ic_socket->so_snd); 1296321b17ecSEdward Tomasz Napierala soupcall_set(ic->ic_socket, SO_SND, icl_soupcall_send, ic); 1297321b17ecSEdward Tomasz Napierala SOCKBUF_UNLOCK(&ic->ic_socket->so_snd); 1298321b17ecSEdward Tomasz Napierala SOCKBUF_LOCK(&ic->ic_socket->so_rcv); 1299321b17ecSEdward Tomasz Napierala soupcall_set(ic->ic_socket, SO_RCV, icl_soupcall_receive, ic); 1300321b17ecSEdward Tomasz Napierala SOCKBUF_UNLOCK(&ic->ic_socket->so_rcv); 1301321b17ecSEdward Tomasz Napierala 1302321b17ecSEdward Tomasz Napierala return (0); 1303321b17ecSEdward Tomasz Napierala } 1304321b17ecSEdward Tomasz Napierala 1305321b17ecSEdward Tomasz Napierala int 1306321b17ecSEdward Tomasz Napierala icl_soft_conn_handoff(struct icl_conn *ic, int fd) 1307321b17ecSEdward Tomasz Napierala { 1308321b17ecSEdward Tomasz Napierala struct file *fp; 1309321b17ecSEdward Tomasz Napierala struct socket *so; 1310321b17ecSEdward Tomasz Napierala cap_rights_t rights; 1311321b17ecSEdward Tomasz Napierala int error; 1312321b17ecSEdward Tomasz Napierala 1313321b17ecSEdward Tomasz Napierala ICL_CONN_LOCK_ASSERT_NOT(ic); 1314321b17ecSEdward Tomasz Napierala 1315321b17ecSEdward Tomasz Napierala /* 1316321b17ecSEdward Tomasz Napierala * Steal the socket from userland. 1317321b17ecSEdward Tomasz Napierala */ 1318321b17ecSEdward Tomasz Napierala error = fget(curthread, fd, 1319321b17ecSEdward Tomasz Napierala cap_rights_init(&rights, CAP_SOCK_CLIENT), &fp); 1320321b17ecSEdward Tomasz Napierala if (error != 0) 1321321b17ecSEdward Tomasz Napierala return (error); 1322321b17ecSEdward Tomasz Napierala if (fp->f_type != DTYPE_SOCKET) { 1323321b17ecSEdward Tomasz Napierala fdrop(fp, curthread); 1324321b17ecSEdward Tomasz Napierala return (EINVAL); 1325321b17ecSEdward Tomasz Napierala } 1326321b17ecSEdward Tomasz Napierala so = fp->f_data; 1327321b17ecSEdward Tomasz Napierala if (so->so_type != SOCK_STREAM) { 1328321b17ecSEdward Tomasz Napierala fdrop(fp, curthread); 1329321b17ecSEdward Tomasz Napierala return (EINVAL); 1330321b17ecSEdward Tomasz Napierala } 1331321b17ecSEdward Tomasz Napierala 1332321b17ecSEdward Tomasz Napierala ICL_CONN_LOCK(ic); 1333321b17ecSEdward Tomasz Napierala 1334321b17ecSEdward Tomasz Napierala if (ic->ic_socket != NULL) { 1335321b17ecSEdward Tomasz Napierala ICL_CONN_UNLOCK(ic); 1336321b17ecSEdward Tomasz Napierala fdrop(fp, curthread); 1337321b17ecSEdward Tomasz Napierala return (EBUSY); 1338321b17ecSEdward Tomasz Napierala } 1339321b17ecSEdward Tomasz Napierala 1340321b17ecSEdward Tomasz Napierala ic->ic_socket = fp->f_data; 1341321b17ecSEdward Tomasz Napierala fp->f_ops = &badfileops; 1342321b17ecSEdward Tomasz Napierala fp->f_data = NULL; 1343321b17ecSEdward Tomasz Napierala fdrop(fp, curthread); 1344321b17ecSEdward Tomasz Napierala ICL_CONN_UNLOCK(ic); 1345321b17ecSEdward Tomasz Napierala 1346321b17ecSEdward Tomasz Napierala error = icl_conn_start(ic); 1347321b17ecSEdward Tomasz Napierala 1348321b17ecSEdward Tomasz Napierala return (error); 1349321b17ecSEdward Tomasz Napierala } 1350321b17ecSEdward Tomasz Napierala 1351321b17ecSEdward Tomasz Napierala void 1352321b17ecSEdward Tomasz Napierala icl_conn_close(struct icl_conn *ic) 1353321b17ecSEdward Tomasz Napierala { 1354321b17ecSEdward Tomasz Napierala struct icl_pdu *pdu; 1355321b17ecSEdward Tomasz Napierala 1356321b17ecSEdward Tomasz Napierala ICL_CONN_LOCK_ASSERT_NOT(ic); 1357321b17ecSEdward Tomasz Napierala 1358321b17ecSEdward Tomasz Napierala ICL_CONN_LOCK(ic); 1359321b17ecSEdward Tomasz Napierala if (ic->ic_socket == NULL) { 1360321b17ecSEdward Tomasz Napierala ICL_CONN_UNLOCK(ic); 1361321b17ecSEdward Tomasz Napierala return; 1362321b17ecSEdward Tomasz Napierala } 1363321b17ecSEdward Tomasz Napierala 1364321b17ecSEdward Tomasz Napierala /* 1365321b17ecSEdward Tomasz Napierala * Deregister socket upcalls. 1366321b17ecSEdward Tomasz Napierala */ 1367321b17ecSEdward Tomasz Napierala ICL_CONN_UNLOCK(ic); 1368321b17ecSEdward Tomasz Napierala SOCKBUF_LOCK(&ic->ic_socket->so_snd); 1369321b17ecSEdward Tomasz Napierala if (ic->ic_socket->so_snd.sb_upcall != NULL) 1370321b17ecSEdward Tomasz Napierala soupcall_clear(ic->ic_socket, SO_SND); 1371321b17ecSEdward Tomasz Napierala SOCKBUF_UNLOCK(&ic->ic_socket->so_snd); 1372321b17ecSEdward Tomasz Napierala SOCKBUF_LOCK(&ic->ic_socket->so_rcv); 1373321b17ecSEdward Tomasz Napierala if (ic->ic_socket->so_rcv.sb_upcall != NULL) 1374321b17ecSEdward Tomasz Napierala soupcall_clear(ic->ic_socket, SO_RCV); 1375321b17ecSEdward Tomasz Napierala SOCKBUF_UNLOCK(&ic->ic_socket->so_rcv); 1376321b17ecSEdward Tomasz Napierala ICL_CONN_LOCK(ic); 1377321b17ecSEdward Tomasz Napierala 1378321b17ecSEdward Tomasz Napierala ic->ic_disconnecting = true; 1379321b17ecSEdward Tomasz Napierala 1380321b17ecSEdward Tomasz Napierala /* 1381321b17ecSEdward Tomasz Napierala * Wake up the threads, so they can properly terminate. 1382321b17ecSEdward Tomasz Napierala */ 1383321b17ecSEdward Tomasz Napierala while (ic->ic_receive_running || ic->ic_send_running) { 1384321b17ecSEdward Tomasz Napierala //ICL_DEBUG("waiting for send/receive threads to terminate"); 1385321b17ecSEdward Tomasz Napierala cv_signal(&ic->ic_receive_cv); 1386321b17ecSEdward Tomasz Napierala cv_signal(&ic->ic_send_cv); 1387321b17ecSEdward Tomasz Napierala cv_wait(&ic->ic_send_cv, ic->ic_lock); 1388321b17ecSEdward Tomasz Napierala } 1389321b17ecSEdward Tomasz Napierala //ICL_DEBUG("send/receive threads terminated"); 1390321b17ecSEdward Tomasz Napierala 1391321b17ecSEdward Tomasz Napierala ICL_CONN_UNLOCK(ic); 1392321b17ecSEdward Tomasz Napierala soclose(ic->ic_socket); 1393321b17ecSEdward Tomasz Napierala ICL_CONN_LOCK(ic); 1394321b17ecSEdward Tomasz Napierala ic->ic_socket = NULL; 1395321b17ecSEdward Tomasz Napierala 1396321b17ecSEdward Tomasz Napierala if (ic->ic_receive_pdu != NULL) { 1397321b17ecSEdward Tomasz Napierala //ICL_DEBUG("freeing partially received PDU"); 1398321b17ecSEdward Tomasz Napierala icl_pdu_free(ic->ic_receive_pdu); 1399321b17ecSEdward Tomasz Napierala ic->ic_receive_pdu = NULL; 1400321b17ecSEdward Tomasz Napierala } 1401321b17ecSEdward Tomasz Napierala 1402321b17ecSEdward Tomasz Napierala /* 1403321b17ecSEdward Tomasz Napierala * Remove any outstanding PDUs from the send queue. 1404321b17ecSEdward Tomasz Napierala */ 1405321b17ecSEdward Tomasz Napierala while (!STAILQ_EMPTY(&ic->ic_to_send)) { 1406321b17ecSEdward Tomasz Napierala pdu = STAILQ_FIRST(&ic->ic_to_send); 1407321b17ecSEdward Tomasz Napierala STAILQ_REMOVE_HEAD(&ic->ic_to_send, ip_next); 1408321b17ecSEdward Tomasz Napierala icl_pdu_free(pdu); 1409321b17ecSEdward Tomasz Napierala } 1410321b17ecSEdward Tomasz Napierala 1411321b17ecSEdward Tomasz Napierala KASSERT(STAILQ_EMPTY(&ic->ic_to_send), 1412321b17ecSEdward Tomasz Napierala ("destroying session with non-empty send queue")); 1413321b17ecSEdward Tomasz Napierala #ifdef DIAGNOSTIC 1414321b17ecSEdward Tomasz Napierala KASSERT(ic->ic_outstanding_pdus == 0, 1415321b17ecSEdward Tomasz Napierala ("destroying session with %d outstanding PDUs", 1416321b17ecSEdward Tomasz Napierala ic->ic_outstanding_pdus)); 1417321b17ecSEdward Tomasz Napierala #endif 1418321b17ecSEdward Tomasz Napierala ICL_CONN_UNLOCK(ic); 1419321b17ecSEdward Tomasz Napierala } 1420321b17ecSEdward Tomasz Napierala 1421321b17ecSEdward Tomasz Napierala void 1422321b17ecSEdward Tomasz Napierala icl_soft_conn_close(struct icl_conn *ic) 1423321b17ecSEdward Tomasz Napierala { 1424321b17ecSEdward Tomasz Napierala 1425321b17ecSEdward Tomasz Napierala icl_conn_close(ic); 1426321b17ecSEdward Tomasz Napierala } 1427321b17ecSEdward Tomasz Napierala 1428321b17ecSEdward Tomasz Napierala bool 1429321b17ecSEdward Tomasz Napierala icl_soft_conn_connected(struct icl_conn *ic) 1430321b17ecSEdward Tomasz Napierala { 1431321b17ecSEdward Tomasz Napierala ICL_CONN_LOCK_ASSERT_NOT(ic); 1432321b17ecSEdward Tomasz Napierala 1433321b17ecSEdward Tomasz Napierala ICL_CONN_LOCK(ic); 1434321b17ecSEdward Tomasz Napierala if (ic->ic_socket == NULL) { 1435321b17ecSEdward Tomasz Napierala ICL_CONN_UNLOCK(ic); 1436321b17ecSEdward Tomasz Napierala return (false); 1437321b17ecSEdward Tomasz Napierala } 1438321b17ecSEdward Tomasz Napierala if (ic->ic_socket->so_error != 0) { 1439321b17ecSEdward Tomasz Napierala ICL_CONN_UNLOCK(ic); 1440321b17ecSEdward Tomasz Napierala return (false); 1441321b17ecSEdward Tomasz Napierala } 1442321b17ecSEdward Tomasz Napierala ICL_CONN_UNLOCK(ic); 1443321b17ecSEdward Tomasz Napierala return (true); 1444321b17ecSEdward Tomasz Napierala } 1445321b17ecSEdward Tomasz Napierala 1446321b17ecSEdward Tomasz Napierala static int 1447321b17ecSEdward Tomasz Napierala icl_soft_limits(size_t *limitp) 1448321b17ecSEdward Tomasz Napierala { 1449321b17ecSEdward Tomasz Napierala 1450321b17ecSEdward Tomasz Napierala *limitp = 128 * 1024; 1451321b17ecSEdward Tomasz Napierala 1452321b17ecSEdward Tomasz Napierala return (0); 1453321b17ecSEdward Tomasz Napierala } 1454321b17ecSEdward Tomasz Napierala 1455321b17ecSEdward Tomasz Napierala #ifdef ICL_KERNEL_PROXY 1456321b17ecSEdward Tomasz Napierala int 1457321b17ecSEdward Tomasz Napierala icl_conn_handoff_sock(struct icl_conn *ic, struct socket *so) 1458321b17ecSEdward Tomasz Napierala { 1459321b17ecSEdward Tomasz Napierala int error; 1460321b17ecSEdward Tomasz Napierala 1461321b17ecSEdward Tomasz Napierala ICL_CONN_LOCK_ASSERT_NOT(ic); 1462321b17ecSEdward Tomasz Napierala 1463321b17ecSEdward Tomasz Napierala if (so->so_type != SOCK_STREAM) 1464321b17ecSEdward Tomasz Napierala return (EINVAL); 1465321b17ecSEdward Tomasz Napierala 1466321b17ecSEdward Tomasz Napierala ICL_CONN_LOCK(ic); 1467321b17ecSEdward Tomasz Napierala if (ic->ic_socket != NULL) { 1468321b17ecSEdward Tomasz Napierala ICL_CONN_UNLOCK(ic); 1469321b17ecSEdward Tomasz Napierala return (EBUSY); 1470321b17ecSEdward Tomasz Napierala } 1471321b17ecSEdward Tomasz Napierala ic->ic_socket = so; 1472321b17ecSEdward Tomasz Napierala ICL_CONN_UNLOCK(ic); 1473321b17ecSEdward Tomasz Napierala 1474321b17ecSEdward Tomasz Napierala error = icl_conn_start(ic); 1475321b17ecSEdward Tomasz Napierala 1476321b17ecSEdward Tomasz Napierala return (error); 1477321b17ecSEdward Tomasz Napierala } 1478321b17ecSEdward Tomasz Napierala #endif /* ICL_KERNEL_PROXY */ 1479321b17ecSEdward Tomasz Napierala 1480321b17ecSEdward Tomasz Napierala static int 1481321b17ecSEdward Tomasz Napierala icl_soft_load(void) 1482321b17ecSEdward Tomasz Napierala { 1483321b17ecSEdward Tomasz Napierala int error; 1484321b17ecSEdward Tomasz Napierala 1485321b17ecSEdward Tomasz Napierala icl_pdu_zone = uma_zcreate("icl_pdu", 1486321b17ecSEdward Tomasz Napierala sizeof(struct icl_pdu), NULL, NULL, NULL, NULL, 1487321b17ecSEdward Tomasz Napierala UMA_ALIGN_PTR, 0); 1488321b17ecSEdward Tomasz Napierala refcount_init(&icl_ncons, 0); 1489321b17ecSEdward Tomasz Napierala 1490321b17ecSEdward Tomasz Napierala /* 1491321b17ecSEdward Tomasz Napierala * The reason we call this "none" is that to the user, 1492321b17ecSEdward Tomasz Napierala * it's known as "offload driver"; "offload driver: soft" 1493321b17ecSEdward Tomasz Napierala * doesn't make much sense. 1494321b17ecSEdward Tomasz Napierala */ 1495321b17ecSEdward Tomasz Napierala error = icl_register("none", 0, icl_soft_limits, icl_soft_new_conn); 1496321b17ecSEdward Tomasz Napierala KASSERT(error == 0, ("failed to register")); 1497321b17ecSEdward Tomasz Napierala 1498321b17ecSEdward Tomasz Napierala return (error); 1499321b17ecSEdward Tomasz Napierala } 1500321b17ecSEdward Tomasz Napierala 1501321b17ecSEdward Tomasz Napierala static int 1502321b17ecSEdward Tomasz Napierala icl_soft_unload(void) 1503321b17ecSEdward Tomasz Napierala { 1504321b17ecSEdward Tomasz Napierala 1505321b17ecSEdward Tomasz Napierala if (icl_ncons != 0) 1506321b17ecSEdward Tomasz Napierala return (EBUSY); 1507321b17ecSEdward Tomasz Napierala 1508321b17ecSEdward Tomasz Napierala icl_unregister("none"); 1509321b17ecSEdward Tomasz Napierala 1510321b17ecSEdward Tomasz Napierala uma_zdestroy(icl_pdu_zone); 1511321b17ecSEdward Tomasz Napierala 1512321b17ecSEdward Tomasz Napierala return (0); 1513321b17ecSEdward Tomasz Napierala } 1514321b17ecSEdward Tomasz Napierala 1515321b17ecSEdward Tomasz Napierala static int 1516321b17ecSEdward Tomasz Napierala icl_soft_modevent(module_t mod, int what, void *arg) 1517321b17ecSEdward Tomasz Napierala { 1518321b17ecSEdward Tomasz Napierala 1519321b17ecSEdward Tomasz Napierala switch (what) { 1520321b17ecSEdward Tomasz Napierala case MOD_LOAD: 1521321b17ecSEdward Tomasz Napierala return (icl_soft_load()); 1522321b17ecSEdward Tomasz Napierala case MOD_UNLOAD: 1523321b17ecSEdward Tomasz Napierala return (icl_soft_unload()); 1524321b17ecSEdward Tomasz Napierala default: 1525321b17ecSEdward Tomasz Napierala return (EINVAL); 1526321b17ecSEdward Tomasz Napierala } 1527321b17ecSEdward Tomasz Napierala } 1528321b17ecSEdward Tomasz Napierala 1529321b17ecSEdward Tomasz Napierala moduledata_t icl_soft_data = { 1530321b17ecSEdward Tomasz Napierala "icl_soft", 1531321b17ecSEdward Tomasz Napierala icl_soft_modevent, 1532321b17ecSEdward Tomasz Napierala 0 1533321b17ecSEdward Tomasz Napierala }; 1534321b17ecSEdward Tomasz Napierala 1535321b17ecSEdward Tomasz Napierala DECLARE_MODULE(icl_soft, icl_soft_data, SI_SUB_DRIVERS, SI_ORDER_MIDDLE); 1536321b17ecSEdward Tomasz Napierala MODULE_DEPEND(icl_soft, icl, 1, 1, 1); 1537*872d2d92SEdward Tomasz Napierala MODULE_VERSION(icl_soft, 1); 1538