xref: /titanic_50/usr/src/uts/common/syscall/sendfile.c (revision 3b3d24f3fd8a5920a6c0fa6412113e669fe0129e)
17c478bd9Sstevel@tonic-gate /*
27c478bd9Sstevel@tonic-gate  * CDDL HEADER START
37c478bd9Sstevel@tonic-gate  *
47c478bd9Sstevel@tonic-gate  * The contents of this file are subject to the terms of the
52caf0dcdSrshoaib  * Common Development and Distribution License (the "License").
62caf0dcdSrshoaib  * You may not use this file except in compliance with the License.
77c478bd9Sstevel@tonic-gate  *
87c478bd9Sstevel@tonic-gate  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
97c478bd9Sstevel@tonic-gate  * or http://www.opensolaris.org/os/licensing.
107c478bd9Sstevel@tonic-gate  * See the License for the specific language governing permissions
117c478bd9Sstevel@tonic-gate  * and limitations under the License.
127c478bd9Sstevel@tonic-gate  *
137c478bd9Sstevel@tonic-gate  * When distributing Covered Code, include this CDDL HEADER in each
147c478bd9Sstevel@tonic-gate  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
157c478bd9Sstevel@tonic-gate  * If applicable, add the following below this CDDL HEADER, with the
167c478bd9Sstevel@tonic-gate  * fields enclosed by brackets "[]" replaced with your own identifying
177c478bd9Sstevel@tonic-gate  * information: Portions Copyright [yyyy] [name of copyright owner]
187c478bd9Sstevel@tonic-gate  *
197c478bd9Sstevel@tonic-gate  * CDDL HEADER END
207c478bd9Sstevel@tonic-gate  */
212caf0dcdSrshoaib 
227c478bd9Sstevel@tonic-gate /*
23311e3d4cSgeorges  * Copyright 2008 Sun Microsystems, Inc.  All rights reserved.
247c478bd9Sstevel@tonic-gate  * Use is subject to license terms.
257c478bd9Sstevel@tonic-gate  */
267c478bd9Sstevel@tonic-gate 
277c478bd9Sstevel@tonic-gate #include <sys/types.h>
287c478bd9Sstevel@tonic-gate #include <sys/t_lock.h>
297c478bd9Sstevel@tonic-gate #include <sys/param.h>
307c478bd9Sstevel@tonic-gate #include <sys/systm.h>
317c478bd9Sstevel@tonic-gate #include <sys/buf.h>
327c478bd9Sstevel@tonic-gate #include <sys/conf.h>
337c478bd9Sstevel@tonic-gate #include <sys/cred.h>
347c478bd9Sstevel@tonic-gate #include <sys/kmem.h>
357c478bd9Sstevel@tonic-gate #include <sys/sysmacros.h>
367c478bd9Sstevel@tonic-gate #include <sys/vfs.h>
377c478bd9Sstevel@tonic-gate #include <sys/vnode.h>
387c478bd9Sstevel@tonic-gate #include <sys/debug.h>
397c478bd9Sstevel@tonic-gate #include <sys/errno.h>
407c478bd9Sstevel@tonic-gate #include <sys/time.h>
417c478bd9Sstevel@tonic-gate #include <sys/file.h>
427c478bd9Sstevel@tonic-gate #include <sys/open.h>
437c478bd9Sstevel@tonic-gate #include <sys/user.h>
447c478bd9Sstevel@tonic-gate #include <sys/termios.h>
457c478bd9Sstevel@tonic-gate #include <sys/stream.h>
467c478bd9Sstevel@tonic-gate #include <sys/strsubr.h>
4774024373Spr14459 #include <sys/sunddi.h>
487c478bd9Sstevel@tonic-gate #include <sys/esunddi.h>
497c478bd9Sstevel@tonic-gate #include <sys/flock.h>
507c478bd9Sstevel@tonic-gate #include <sys/modctl.h>
517c478bd9Sstevel@tonic-gate #include <sys/cmn_err.h>
527c478bd9Sstevel@tonic-gate #include <sys/vmsystm.h>
537c478bd9Sstevel@tonic-gate 
547c478bd9Sstevel@tonic-gate #include <sys/socket.h>
557c478bd9Sstevel@tonic-gate #include <sys/socketvar.h>
5645916cd2Sjpk /* swilly code in sys/socketvar.h turns off DEBUG */
5745916cd2Sjpk #ifdef __lint
5845916cd2Sjpk #define	DEBUG
5945916cd2Sjpk #endif
6045916cd2Sjpk 
617c478bd9Sstevel@tonic-gate #include <netinet/in.h>
627c478bd9Sstevel@tonic-gate #include <sys/sendfile.h>
637c478bd9Sstevel@tonic-gate #include <sys/un.h>
647c478bd9Sstevel@tonic-gate #include <sys/tihdr.h>
657c478bd9Sstevel@tonic-gate #include <sys/atomic.h>
667c478bd9Sstevel@tonic-gate 
677c478bd9Sstevel@tonic-gate #include <inet/common.h>
687c478bd9Sstevel@tonic-gate #include <inet/ip.h>
697c478bd9Sstevel@tonic-gate #include <inet/ip6.h>
707c478bd9Sstevel@tonic-gate #include <inet/tcp.h>
717c478bd9Sstevel@tonic-gate 
727c478bd9Sstevel@tonic-gate extern int sosendfile64(file_t *, file_t *, const struct ksendfilevec64 *,
737c478bd9Sstevel@tonic-gate 		ssize32_t *);
742c9e429eSbrutus extern int nl7c_sendfilev(struct sonode *, u_offset_t *, struct sendfilevec *,
752c9e429eSbrutus 		int, ssize_t *);
76*3b3d24f3SJayakara Kini extern int snf_segmap(file_t *, vnode_t *, u_offset_t, u_offset_t, ssize_t *,
77*3b3d24f3SJayakara Kini 		boolean_t);
7874024373Spr14459 
7974024373Spr14459 #define	readflg	(V_WRITELOCK_FALSE)
8074024373Spr14459 #define	rwflag	(V_WRITELOCK_TRUE)
817c478bd9Sstevel@tonic-gate 
82ff550d0eSmasputra /*
83ff550d0eSmasputra  * kstrwritemp() has very similar semantics as that of strwrite().
84ff550d0eSmasputra  * The main difference is it obtains mblks from the caller and also
85ff550d0eSmasputra  * does not do any copy as done in strwrite() from user buffers to
86ff550d0eSmasputra  * kernel buffers.
87ff550d0eSmasputra  *
88ff550d0eSmasputra  * Currently, this routine is used by sendfile to send data allocated
89ff550d0eSmasputra  * within the kernel without any copying. This interface does not use the
90ff550d0eSmasputra  * synchronous stream interface as synch. stream interface implies
91ff550d0eSmasputra  * copying.
92ff550d0eSmasputra  */
93ff550d0eSmasputra int
94ff550d0eSmasputra kstrwritemp(struct vnode *vp, mblk_t *mp, ushort_t fmode)
95ff550d0eSmasputra {
96ff550d0eSmasputra 	struct stdata *stp;
97ff550d0eSmasputra 	struct queue *wqp;
98c28749e9Skais 	mblk_t *newmp;
99ff550d0eSmasputra 	char waitflag;
100ff550d0eSmasputra 	int tempmode;
101ff550d0eSmasputra 	int error = 0;
102ff550d0eSmasputra 	int done = 0;
103ff550d0eSmasputra 	struct sonode *so;
104ff550d0eSmasputra 	boolean_t direct;
105ff550d0eSmasputra 
106ff550d0eSmasputra 	ASSERT(vp->v_stream);
107ff550d0eSmasputra 	stp = vp->v_stream;
108ff550d0eSmasputra 
109ff550d0eSmasputra 	so = VTOSO(vp);
110ff550d0eSmasputra 	direct = (so->so_state & SS_DIRECT);
111ff550d0eSmasputra 
112ff550d0eSmasputra 	/*
113ff550d0eSmasputra 	 * This is the sockfs direct fast path. canputnext() need
114ff550d0eSmasputra 	 * not be accurate so we don't grab the sd_lock here. If
115ff550d0eSmasputra 	 * we get flow-controlled, we grab sd_lock just before the
116ff550d0eSmasputra 	 * do..while loop below to emulate what strwrite() does.
117ff550d0eSmasputra 	 */
118ff550d0eSmasputra 	wqp = stp->sd_wrq;
119ff550d0eSmasputra 	if (canputnext(wqp) && direct &&
120ff550d0eSmasputra 	    !(stp->sd_flag & (STWRERR|STRHUP|STPLEX))) {
121ff550d0eSmasputra 		return (sostream_direct(so, NULL, mp, CRED()));
122ff550d0eSmasputra 	} else if (stp->sd_flag & (STWRERR|STRHUP|STPLEX)) {
123ff550d0eSmasputra 		/* Fast check of flags before acquiring the lock */
124ff550d0eSmasputra 		mutex_enter(&stp->sd_lock);
125ff550d0eSmasputra 		error = strgeterr(stp, STWRERR|STRHUP|STPLEX, 0);
126ff550d0eSmasputra 		mutex_exit(&stp->sd_lock);
127ff550d0eSmasputra 		if (error != 0) {
128ff550d0eSmasputra 			if (!(stp->sd_flag & STPLEX) &&
129ff550d0eSmasputra 			    (stp->sd_wput_opt & SW_SIGPIPE)) {
130ff550d0eSmasputra 				tsignal(curthread, SIGPIPE);
131ff550d0eSmasputra 				error = EPIPE;
132ff550d0eSmasputra 			}
133ff550d0eSmasputra 			return (error);
134ff550d0eSmasputra 		}
135ff550d0eSmasputra 	}
136ff550d0eSmasputra 
137ff550d0eSmasputra 	waitflag = WRITEWAIT;
138ff550d0eSmasputra 	if (stp->sd_flag & OLDNDELAY)
139ff550d0eSmasputra 		tempmode = fmode & ~FNDELAY;
140ff550d0eSmasputra 	else
141ff550d0eSmasputra 		tempmode = fmode;
142ff550d0eSmasputra 
143ff550d0eSmasputra 	mutex_enter(&stp->sd_lock);
144ff550d0eSmasputra 	do {
145ff550d0eSmasputra 		if (canputnext(wqp)) {
146ff550d0eSmasputra 			mutex_exit(&stp->sd_lock);
147c28749e9Skais 			if (stp->sd_wputdatafunc != NULL) {
148c28749e9Skais 				newmp = (stp->sd_wputdatafunc)(vp, mp, NULL,
149c28749e9Skais 				    NULL, NULL, NULL);
150c28749e9Skais 				if (newmp == NULL) {
151c28749e9Skais 					/* The caller will free mp */
152c28749e9Skais 					return (ECOMM);
153c28749e9Skais 				}
154c28749e9Skais 				mp = newmp;
155c28749e9Skais 			}
156ff550d0eSmasputra 			putnext(wqp, mp);
157ff550d0eSmasputra 			return (0);
158ff550d0eSmasputra 		}
159ff550d0eSmasputra 		error = strwaitq(stp, waitflag, (ssize_t)0, tempmode, -1,
160ff550d0eSmasputra 		    &done);
161ff550d0eSmasputra 	} while (error == 0 && !done);
162ff550d0eSmasputra 
163ff550d0eSmasputra 	mutex_exit(&stp->sd_lock);
164ff550d0eSmasputra 	/*
165ff550d0eSmasputra 	 * EAGAIN tells the application to try again. ENOMEM
166ff550d0eSmasputra 	 * is returned only if the memory allocation size
167ff550d0eSmasputra 	 * exceeds the physical limits of the system. ENOMEM
168ff550d0eSmasputra 	 * can't be true here.
169ff550d0eSmasputra 	 */
170ff550d0eSmasputra 	if (error == ENOMEM)
171ff550d0eSmasputra 		error = EAGAIN;
172ff550d0eSmasputra 	return (error);
173ff550d0eSmasputra }
174ff550d0eSmasputra 
1757c478bd9Sstevel@tonic-gate #define	SEND_MAX_CHUNK	16
1767c478bd9Sstevel@tonic-gate 
1777c478bd9Sstevel@tonic-gate #if defined(_SYSCALL32_IMPL) || defined(_ILP32)
1787c478bd9Sstevel@tonic-gate /*
1797c478bd9Sstevel@tonic-gate  * 64 bit offsets for 32 bit applications only running either on
1807c478bd9Sstevel@tonic-gate  * 64 bit kernel or 32 bit kernel. For 32 bit apps, we can't transfer
1817c478bd9Sstevel@tonic-gate  * more than 2GB of data.
1827c478bd9Sstevel@tonic-gate  */
1837c478bd9Sstevel@tonic-gate int
1847c478bd9Sstevel@tonic-gate sendvec_chunk64(file_t *fp, u_offset_t *fileoff, struct ksendfilevec64 *sfv,
1857c478bd9Sstevel@tonic-gate     int copy_cnt, ssize32_t *count)
1867c478bd9Sstevel@tonic-gate {
1877c478bd9Sstevel@tonic-gate 	struct vnode *vp;
1887c478bd9Sstevel@tonic-gate 	ushort_t fflag;
1897c478bd9Sstevel@tonic-gate 	int ioflag;
1907c478bd9Sstevel@tonic-gate 	size32_t cnt;
1917c478bd9Sstevel@tonic-gate 	ssize32_t sfv_len;
1927c478bd9Sstevel@tonic-gate 	ssize32_t tmpcount;
1937c478bd9Sstevel@tonic-gate 	u_offset_t sfv_off;
1947c478bd9Sstevel@tonic-gate 	struct uio auio;
1957c478bd9Sstevel@tonic-gate 	struct iovec aiov;
1967c478bd9Sstevel@tonic-gate 	int i, error;
1977c478bd9Sstevel@tonic-gate 
1987c478bd9Sstevel@tonic-gate 	fflag = fp->f_flag;
1997c478bd9Sstevel@tonic-gate 	vp = fp->f_vnode;
2007c478bd9Sstevel@tonic-gate 	for (i = 0; i < copy_cnt; i++) {
2017c478bd9Sstevel@tonic-gate 
2027c478bd9Sstevel@tonic-gate 		if (ISSIG(curthread, JUSTLOOKING))
2037c478bd9Sstevel@tonic-gate 			return (EINTR);
2047c478bd9Sstevel@tonic-gate 
2057c478bd9Sstevel@tonic-gate 		/*
2067c478bd9Sstevel@tonic-gate 		 * Do similar checks as "write" as we are writing
2077c478bd9Sstevel@tonic-gate 		 * sfv_len bytes into "vp".
2087c478bd9Sstevel@tonic-gate 		 */
2097c478bd9Sstevel@tonic-gate 		sfv_len = (ssize32_t)sfv->sfv_len;
2107c478bd9Sstevel@tonic-gate 
2117c478bd9Sstevel@tonic-gate 		if (sfv_len == 0)
2127c478bd9Sstevel@tonic-gate 			continue;
2137c478bd9Sstevel@tonic-gate 
2147c478bd9Sstevel@tonic-gate 		if (sfv_len < 0)
2157c478bd9Sstevel@tonic-gate 			return (EINVAL);
2167c478bd9Sstevel@tonic-gate 
2177c478bd9Sstevel@tonic-gate 		if (vp->v_type == VREG) {
2187c478bd9Sstevel@tonic-gate 			if (*fileoff >= curproc->p_fsz_ctl) {
2197c478bd9Sstevel@tonic-gate 				mutex_enter(&curproc->p_lock);
2207c478bd9Sstevel@tonic-gate 				(void) rctl_action(
2217c478bd9Sstevel@tonic-gate 				    rctlproc_legacy[RLIMIT_FSIZE],
2227c478bd9Sstevel@tonic-gate 				    curproc->p_rctls, curproc, RCA_SAFE);
2237c478bd9Sstevel@tonic-gate 				mutex_exit(&curproc->p_lock);
2247c478bd9Sstevel@tonic-gate 				return (EFBIG);
2257c478bd9Sstevel@tonic-gate 			}
2267c478bd9Sstevel@tonic-gate 
2277c478bd9Sstevel@tonic-gate 			if (*fileoff >= OFFSET_MAX(fp))
2287c478bd9Sstevel@tonic-gate 				return (EFBIG);
2297c478bd9Sstevel@tonic-gate 
2307c478bd9Sstevel@tonic-gate 			if (*fileoff + sfv_len > OFFSET_MAX(fp))
2317c478bd9Sstevel@tonic-gate 				return (EINVAL);
2327c478bd9Sstevel@tonic-gate 		}
2337c478bd9Sstevel@tonic-gate 
2347c478bd9Sstevel@tonic-gate 		tmpcount = *count + sfv_len;
2357c478bd9Sstevel@tonic-gate 		if (tmpcount < 0)
2367c478bd9Sstevel@tonic-gate 			return (EINVAL);
2377c478bd9Sstevel@tonic-gate 
2387c478bd9Sstevel@tonic-gate 		sfv_off = sfv->sfv_off;
2397c478bd9Sstevel@tonic-gate 
2407c478bd9Sstevel@tonic-gate 		auio.uio_extflg = UIO_COPY_DEFAULT;
2417c478bd9Sstevel@tonic-gate 		if (sfv->sfv_fd == SFV_FD_SELF) {
2427c478bd9Sstevel@tonic-gate 			aiov.iov_len = sfv_len;
2437c478bd9Sstevel@tonic-gate 			aiov.iov_base = (caddr_t)(uintptr_t)sfv_off;
2447c478bd9Sstevel@tonic-gate 			auio.uio_loffset = *fileoff;
2457c478bd9Sstevel@tonic-gate 			auio.uio_iovcnt = 1;
2467c478bd9Sstevel@tonic-gate 			auio.uio_resid = sfv_len;
2477c478bd9Sstevel@tonic-gate 			auio.uio_iov = &aiov;
2487c478bd9Sstevel@tonic-gate 			auio.uio_segflg = UIO_USERSPACE;
2497c478bd9Sstevel@tonic-gate 			auio.uio_llimit = curproc->p_fsz_ctl;
2507c478bd9Sstevel@tonic-gate 			auio.uio_fmode = fflag;
2517c478bd9Sstevel@tonic-gate 			ioflag = auio.uio_fmode & (FAPPEND|FSYNC|FDSYNC|FRSYNC);
2527c478bd9Sstevel@tonic-gate 			while (sfv_len > 0) {
2537c478bd9Sstevel@tonic-gate 				error = VOP_WRITE(vp, &auio, ioflag,
2547c478bd9Sstevel@tonic-gate 				    fp->f_cred, NULL);
2557c478bd9Sstevel@tonic-gate 				cnt = sfv_len - auio.uio_resid;
2567c478bd9Sstevel@tonic-gate 				sfv_len -= cnt;
2577c478bd9Sstevel@tonic-gate 				ttolwp(curthread)->lwp_ru.ioch += (ulong_t)cnt;
2587c478bd9Sstevel@tonic-gate 				if (vp->v_type == VREG)
2597c478bd9Sstevel@tonic-gate 					*fileoff += cnt;
2607c478bd9Sstevel@tonic-gate 				*count += cnt;
2617c478bd9Sstevel@tonic-gate 				if (error != 0)
2627c478bd9Sstevel@tonic-gate 					return (error);
2637c478bd9Sstevel@tonic-gate 			}
2647c478bd9Sstevel@tonic-gate 		} else {
2657c478bd9Sstevel@tonic-gate 			file_t	*ffp;
2667c478bd9Sstevel@tonic-gate 			vnode_t	*readvp;
2677c478bd9Sstevel@tonic-gate 			size_t	size;
2687c478bd9Sstevel@tonic-gate 			caddr_t	ptr;
2697c478bd9Sstevel@tonic-gate 
2707c478bd9Sstevel@tonic-gate 			if ((ffp = getf(sfv->sfv_fd)) == NULL)
2717c478bd9Sstevel@tonic-gate 				return (EBADF);
2727c478bd9Sstevel@tonic-gate 
2737c478bd9Sstevel@tonic-gate 			if ((ffp->f_flag & FREAD) == 0) {
2747c478bd9Sstevel@tonic-gate 				releasef(sfv->sfv_fd);
2757c478bd9Sstevel@tonic-gate 				return (EBADF);
2767c478bd9Sstevel@tonic-gate 			}
2777c478bd9Sstevel@tonic-gate 
2787c478bd9Sstevel@tonic-gate 			readvp = ffp->f_vnode;
2797c478bd9Sstevel@tonic-gate 			if (readvp->v_type != VREG) {
2807c478bd9Sstevel@tonic-gate 				releasef(sfv->sfv_fd);
2817c478bd9Sstevel@tonic-gate 				return (EINVAL);
2827c478bd9Sstevel@tonic-gate 			}
2837c478bd9Sstevel@tonic-gate 
2847c478bd9Sstevel@tonic-gate 			/*
2857c478bd9Sstevel@tonic-gate 			 * No point reading and writing to same vp,
2867c478bd9Sstevel@tonic-gate 			 * as long as both are regular files. readvp is not
2877c478bd9Sstevel@tonic-gate 			 * locked; but since we got it from an open file the
2887c478bd9Sstevel@tonic-gate 			 * contents will be valid during the time of access.
2897c478bd9Sstevel@tonic-gate 			 */
290bfb244baSpr14459 			if (vn_compare(vp, readvp)) {
2917c478bd9Sstevel@tonic-gate 				releasef(sfv->sfv_fd);
2927c478bd9Sstevel@tonic-gate 				return (EINVAL);
2937c478bd9Sstevel@tonic-gate 			}
2947c478bd9Sstevel@tonic-gate 
2957c478bd9Sstevel@tonic-gate 			/*
2967c478bd9Sstevel@tonic-gate 			 * Note: we assume readvp != vp. "vp" is already
2977c478bd9Sstevel@tonic-gate 			 * locked, and "readvp" must not be.
2987c478bd9Sstevel@tonic-gate 			 */
2997c478bd9Sstevel@tonic-gate 			(void) VOP_RWLOCK(readvp, readflg, NULL);
3007c478bd9Sstevel@tonic-gate 
3017c478bd9Sstevel@tonic-gate 			/*
3027c478bd9Sstevel@tonic-gate 			 * Same checks as in pread64.
3037c478bd9Sstevel@tonic-gate 			 */
3047c478bd9Sstevel@tonic-gate 			if (sfv_off > MAXOFFSET_T) {
3057c478bd9Sstevel@tonic-gate 				VOP_RWUNLOCK(readvp, readflg, NULL);
3067c478bd9Sstevel@tonic-gate 				releasef(sfv->sfv_fd);
3077c478bd9Sstevel@tonic-gate 				return (EINVAL);
3087c478bd9Sstevel@tonic-gate 			}
3097c478bd9Sstevel@tonic-gate 
3107c478bd9Sstevel@tonic-gate 			if (sfv_off + sfv_len > MAXOFFSET_T)
3117c478bd9Sstevel@tonic-gate 				sfv_len = (ssize32_t)(MAXOFFSET_T - sfv_off);
3127c478bd9Sstevel@tonic-gate 
3137c478bd9Sstevel@tonic-gate 			/* Find the native blocksize to transfer data */
3147c478bd9Sstevel@tonic-gate 			size = MIN(vp->v_vfsp->vfs_bsize,
3157c478bd9Sstevel@tonic-gate 			    readvp->v_vfsp->vfs_bsize);
3167c478bd9Sstevel@tonic-gate 			size = sfv_len < size ? sfv_len : size;
3177c478bd9Sstevel@tonic-gate 			ptr = kmem_alloc(size, KM_SLEEP);
3187c478bd9Sstevel@tonic-gate 
3197c478bd9Sstevel@tonic-gate 			while (sfv_len > 0) {
3207c478bd9Sstevel@tonic-gate 				size_t	iov_len;
3217c478bd9Sstevel@tonic-gate 
3227c478bd9Sstevel@tonic-gate 				iov_len = MIN(size, sfv_len);
3237c478bd9Sstevel@tonic-gate 				aiov.iov_base = ptr;
3247c478bd9Sstevel@tonic-gate 				aiov.iov_len = iov_len;
3257c478bd9Sstevel@tonic-gate 				auio.uio_loffset = sfv_off;
3267c478bd9Sstevel@tonic-gate 				auio.uio_iov = &aiov;
3277c478bd9Sstevel@tonic-gate 				auio.uio_iovcnt = 1;
3287c478bd9Sstevel@tonic-gate 				auio.uio_resid = iov_len;
3297c478bd9Sstevel@tonic-gate 				auio.uio_segflg = UIO_SYSSPACE;
3307c478bd9Sstevel@tonic-gate 				auio.uio_llimit = MAXOFFSET_T;
3317c478bd9Sstevel@tonic-gate 				auio.uio_fmode = ffp->f_flag;
3327c478bd9Sstevel@tonic-gate 				ioflag = auio.uio_fmode &
3337c478bd9Sstevel@tonic-gate 				    (FAPPEND|FSYNC|FDSYNC|FRSYNC);
3347c478bd9Sstevel@tonic-gate 
3357c478bd9Sstevel@tonic-gate 				/*
3367c478bd9Sstevel@tonic-gate 				 * If read sync is not asked for,
3377c478bd9Sstevel@tonic-gate 				 * filter sync flags
3387c478bd9Sstevel@tonic-gate 				 */
3397c478bd9Sstevel@tonic-gate 				if ((ioflag & FRSYNC) == 0)
3407c478bd9Sstevel@tonic-gate 					ioflag &= ~(FSYNC|FDSYNC);
3417c478bd9Sstevel@tonic-gate 				error = VOP_READ(readvp, &auio, ioflag,
3427c478bd9Sstevel@tonic-gate 				    fp->f_cred, NULL);
3437c478bd9Sstevel@tonic-gate 				if (error) {
3447c478bd9Sstevel@tonic-gate 					kmem_free(ptr, size);
3457c478bd9Sstevel@tonic-gate 					VOP_RWUNLOCK(readvp, readflg, NULL);
3467c478bd9Sstevel@tonic-gate 					releasef(sfv->sfv_fd);
3477c478bd9Sstevel@tonic-gate 					return (error);
3487c478bd9Sstevel@tonic-gate 				}
3497c478bd9Sstevel@tonic-gate 
3507c478bd9Sstevel@tonic-gate 				/*
3517c478bd9Sstevel@tonic-gate 				 * Check how must data was really read.
3527c478bd9Sstevel@tonic-gate 				 * Decrement the 'len' and increment the
3537c478bd9Sstevel@tonic-gate 				 * 'off' appropriately.
3547c478bd9Sstevel@tonic-gate 				 */
3557c478bd9Sstevel@tonic-gate 				cnt = iov_len - auio.uio_resid;
3567c478bd9Sstevel@tonic-gate 				if (cnt == 0) {
3577c478bd9Sstevel@tonic-gate 					/*
3587c478bd9Sstevel@tonic-gate 					 * If we were reading a pipe (currently
3597c478bd9Sstevel@tonic-gate 					 * not implemented), we may now lose
3607c478bd9Sstevel@tonic-gate 					 * data.
3617c478bd9Sstevel@tonic-gate 					 */
3627c478bd9Sstevel@tonic-gate 					kmem_free(ptr, size);
3637c478bd9Sstevel@tonic-gate 					VOP_RWUNLOCK(readvp, readflg, NULL);
3647c478bd9Sstevel@tonic-gate 					releasef(sfv->sfv_fd);
3657c478bd9Sstevel@tonic-gate 					return (EINVAL);
3667c478bd9Sstevel@tonic-gate 				}
3677c478bd9Sstevel@tonic-gate 				sfv_len -= cnt;
3687c478bd9Sstevel@tonic-gate 				sfv_off += cnt;
3697c478bd9Sstevel@tonic-gate 
3707c478bd9Sstevel@tonic-gate 				aiov.iov_base = ptr;
3717c478bd9Sstevel@tonic-gate 				aiov.iov_len = cnt;
3727c478bd9Sstevel@tonic-gate 				auio.uio_loffset = *fileoff;
3737c478bd9Sstevel@tonic-gate 				auio.uio_resid = cnt;
3747c478bd9Sstevel@tonic-gate 				auio.uio_segflg = UIO_SYSSPACE;
3757c478bd9Sstevel@tonic-gate 				auio.uio_llimit = curproc->p_fsz_ctl;
3767c478bd9Sstevel@tonic-gate 				auio.uio_fmode = fflag;
3777c478bd9Sstevel@tonic-gate 				ioflag = auio.uio_fmode &
3787c478bd9Sstevel@tonic-gate 				    (FAPPEND|FSYNC|FDSYNC|FRSYNC);
3797c478bd9Sstevel@tonic-gate 				error = VOP_WRITE(vp, &auio, ioflag,
3807c478bd9Sstevel@tonic-gate 				    fp->f_cred, NULL);
3817c478bd9Sstevel@tonic-gate 
3827c478bd9Sstevel@tonic-gate 				/*
3837c478bd9Sstevel@tonic-gate 				 * Check how much data was written. Increment
3847c478bd9Sstevel@tonic-gate 				 * the 'len' and decrement the 'off' if all
3857c478bd9Sstevel@tonic-gate 				 * the data was not written.
3867c478bd9Sstevel@tonic-gate 				 */
3877c478bd9Sstevel@tonic-gate 				cnt -= auio.uio_resid;
3887c478bd9Sstevel@tonic-gate 				sfv_len += auio.uio_resid;
3897c478bd9Sstevel@tonic-gate 				sfv_off -= auio.uio_resid;
3907c478bd9Sstevel@tonic-gate 				ttolwp(curthread)->lwp_ru.ioch += (ulong_t)cnt;
3917c478bd9Sstevel@tonic-gate 				if (vp->v_type == VREG)
3927c478bd9Sstevel@tonic-gate 					*fileoff += cnt;
3937c478bd9Sstevel@tonic-gate 				*count += cnt;
3947c478bd9Sstevel@tonic-gate 				if (error != 0) {
3957c478bd9Sstevel@tonic-gate 					kmem_free(ptr, size);
3967c478bd9Sstevel@tonic-gate 					VOP_RWUNLOCK(readvp, readflg, NULL);
3977c478bd9Sstevel@tonic-gate 					releasef(sfv->sfv_fd);
3987c478bd9Sstevel@tonic-gate 					return (error);
3997c478bd9Sstevel@tonic-gate 				}
4007c478bd9Sstevel@tonic-gate 			}
4017c478bd9Sstevel@tonic-gate 			VOP_RWUNLOCK(readvp, readflg, NULL);
4027c478bd9Sstevel@tonic-gate 			releasef(sfv->sfv_fd);
4037c478bd9Sstevel@tonic-gate 			kmem_free(ptr, size);
4047c478bd9Sstevel@tonic-gate 		}
4057c478bd9Sstevel@tonic-gate 		sfv++;
4067c478bd9Sstevel@tonic-gate 	}
4077c478bd9Sstevel@tonic-gate 	return (0);
4087c478bd9Sstevel@tonic-gate }
4097c478bd9Sstevel@tonic-gate 
4107c478bd9Sstevel@tonic-gate ssize32_t
4117c478bd9Sstevel@tonic-gate sendvec64(file_t *fp, const struct ksendfilevec64 *vec, int sfvcnt,
4127c478bd9Sstevel@tonic-gate 	size32_t *xferred, int fildes)
4137c478bd9Sstevel@tonic-gate {
4147c478bd9Sstevel@tonic-gate 	u_offset_t		fileoff;
4157c478bd9Sstevel@tonic-gate 	int			copy_cnt;
4167c478bd9Sstevel@tonic-gate 	const struct ksendfilevec64 *copy_vec;
4177c478bd9Sstevel@tonic-gate 	struct ksendfilevec64 sfv[SEND_MAX_CHUNK];
4187c478bd9Sstevel@tonic-gate 	struct vnode *vp;
4197c478bd9Sstevel@tonic-gate 	int error;
4207c478bd9Sstevel@tonic-gate 	ssize32_t count = 0;
4217c478bd9Sstevel@tonic-gate 
4227c478bd9Sstevel@tonic-gate 	vp = fp->f_vnode;
4237c478bd9Sstevel@tonic-gate 	(void) VOP_RWLOCK(vp, rwflag, NULL);
4247c478bd9Sstevel@tonic-gate 
4257c478bd9Sstevel@tonic-gate 	copy_vec = vec;
4267c478bd9Sstevel@tonic-gate 	fileoff = fp->f_offset;
4277c478bd9Sstevel@tonic-gate 
4287c478bd9Sstevel@tonic-gate 	do {
4297c478bd9Sstevel@tonic-gate 		copy_cnt = MIN(sfvcnt, SEND_MAX_CHUNK);
4307c478bd9Sstevel@tonic-gate 		if (copyin(copy_vec, sfv, copy_cnt *
4317c478bd9Sstevel@tonic-gate 		    sizeof (struct ksendfilevec64))) {
4327c478bd9Sstevel@tonic-gate 			error = EFAULT;
4337c478bd9Sstevel@tonic-gate 			break;
4347c478bd9Sstevel@tonic-gate 		}
4357c478bd9Sstevel@tonic-gate 
4367c478bd9Sstevel@tonic-gate 		/*
43774024373Spr14459 		 * Optimize the regular file over
4387c478bd9Sstevel@tonic-gate 		 * the socket case.
4397c478bd9Sstevel@tonic-gate 		 */
44074024373Spr14459 		if (vp->v_type == VSOCK && sfv->sfv_fd != SFV_FD_SELF) {
4417c478bd9Sstevel@tonic-gate 			file_t *rfp;
4427c478bd9Sstevel@tonic-gate 			vnode_t *rvp;
4437c478bd9Sstevel@tonic-gate 
4447c478bd9Sstevel@tonic-gate 			if ((rfp = getf(sfv->sfv_fd)) == NULL) {
4457c478bd9Sstevel@tonic-gate 				error = EBADF;
4467c478bd9Sstevel@tonic-gate 				break;
4477c478bd9Sstevel@tonic-gate 			}
4487c478bd9Sstevel@tonic-gate 			if ((rfp->f_flag & FREAD) == 0) {
4497c478bd9Sstevel@tonic-gate 				releasef(sfv->sfv_fd);
4507c478bd9Sstevel@tonic-gate 				error = EBADF;
4517c478bd9Sstevel@tonic-gate 				break;
4527c478bd9Sstevel@tonic-gate 			}
4537c478bd9Sstevel@tonic-gate 			rvp = rfp->f_vnode;
4547c478bd9Sstevel@tonic-gate 			if (rvp->v_type == VREG) {
4557c478bd9Sstevel@tonic-gate 				error = sosendfile64(fp, rfp, sfv, &count);
45674024373Spr14459 				if (error)
4577c478bd9Sstevel@tonic-gate 					break;
45874024373Spr14459 				copy_vec++;
45974024373Spr14459 				sfvcnt--;
46074024373Spr14459 				continue;
4617c478bd9Sstevel@tonic-gate 			}
4627c478bd9Sstevel@tonic-gate 			releasef(sfv->sfv_fd);
4637c478bd9Sstevel@tonic-gate 		}
4647c478bd9Sstevel@tonic-gate 		error = sendvec_chunk64(fp, &fileoff, sfv, copy_cnt, &count);
4657c478bd9Sstevel@tonic-gate 		if (error != 0)
4667c478bd9Sstevel@tonic-gate 			break;
4677c478bd9Sstevel@tonic-gate 
4687c478bd9Sstevel@tonic-gate 		copy_vec += copy_cnt;
4697c478bd9Sstevel@tonic-gate 		sfvcnt -= copy_cnt;
4707c478bd9Sstevel@tonic-gate 	} while (sfvcnt > 0);
4717c478bd9Sstevel@tonic-gate 
4727c478bd9Sstevel@tonic-gate 	if (vp->v_type == VREG)
4737c478bd9Sstevel@tonic-gate 		fp->f_offset += count;
4747c478bd9Sstevel@tonic-gate 
4757c478bd9Sstevel@tonic-gate 	VOP_RWUNLOCK(vp, rwflag, NULL);
4767c478bd9Sstevel@tonic-gate 	if (copyout(&count, xferred, sizeof (count)))
4777c478bd9Sstevel@tonic-gate 		error = EFAULT;
4787c478bd9Sstevel@tonic-gate 	releasef(fildes);
4797c478bd9Sstevel@tonic-gate 	if (error != 0)
4807c478bd9Sstevel@tonic-gate 		return (set_errno(error));
4817c478bd9Sstevel@tonic-gate 	return (count);
4827c478bd9Sstevel@tonic-gate }
4837c478bd9Sstevel@tonic-gate #endif
4847c478bd9Sstevel@tonic-gate 
4857c478bd9Sstevel@tonic-gate int
4867c478bd9Sstevel@tonic-gate sendvec_small_chunk(file_t *fp, u_offset_t *fileoff, struct sendfilevec *sfv,
4877c478bd9Sstevel@tonic-gate     int copy_cnt, ssize_t total_size, int maxblk, ssize_t *count)
4887c478bd9Sstevel@tonic-gate {
4897c478bd9Sstevel@tonic-gate 	struct vnode *vp;
4907c478bd9Sstevel@tonic-gate 	struct uio auio;
4917c478bd9Sstevel@tonic-gate 	struct iovec aiov;
4927c478bd9Sstevel@tonic-gate 	ushort_t fflag;
4937c478bd9Sstevel@tonic-gate 	int ioflag;
4947c478bd9Sstevel@tonic-gate 	int i, error;
4957c478bd9Sstevel@tonic-gate 	size_t cnt;
4967c478bd9Sstevel@tonic-gate 	ssize_t sfv_len;
4977c478bd9Sstevel@tonic-gate 	u_offset_t sfv_off;
4987c478bd9Sstevel@tonic-gate #ifdef _SYSCALL32_IMPL
4997c478bd9Sstevel@tonic-gate 	model_t model = get_udatamodel();
5007c478bd9Sstevel@tonic-gate 	u_offset_t maxoff = (model == DATAMODEL_ILP32) ?
5017c478bd9Sstevel@tonic-gate 	    MAXOFF32_T : MAXOFFSET_T;
5027c478bd9Sstevel@tonic-gate #else
5037c478bd9Sstevel@tonic-gate 	const u_offset_t maxoff = MAXOFF32_T;
5047c478bd9Sstevel@tonic-gate #endif
5057c478bd9Sstevel@tonic-gate 	mblk_t *dmp = NULL;
5067c478bd9Sstevel@tonic-gate 	int wroff;
5077c478bd9Sstevel@tonic-gate 	int buf_left = 0;
5087c478bd9Sstevel@tonic-gate 	size_t	iov_len;
5097c478bd9Sstevel@tonic-gate 	mblk_t  *head, *tmp;
5107c478bd9Sstevel@tonic-gate 	size_t  size = total_size;
511c28749e9Skais 	size_t  extra;
512c28749e9Skais 	int tail_len;
5137c478bd9Sstevel@tonic-gate 
5147c478bd9Sstevel@tonic-gate 	fflag = fp->f_flag;
5157c478bd9Sstevel@tonic-gate 	vp = fp->f_vnode;
5167c478bd9Sstevel@tonic-gate 
5177c478bd9Sstevel@tonic-gate 	ASSERT(vp->v_type == VSOCK);
5187c478bd9Sstevel@tonic-gate 	ASSERT(maxblk > 0);
5197c478bd9Sstevel@tonic-gate 
5207c478bd9Sstevel@tonic-gate 	wroff = (int)vp->v_stream->sd_wroff;
521c28749e9Skais 	tail_len = (int)vp->v_stream->sd_tail;
522c28749e9Skais 	extra = wroff + tail_len;
523c28749e9Skais 
5247c478bd9Sstevel@tonic-gate 	buf_left = MIN(total_size, maxblk);
525c28749e9Skais 	head = dmp = allocb(buf_left + extra, BPRI_HI);
5267c478bd9Sstevel@tonic-gate 	if (head == NULL)
5277c478bd9Sstevel@tonic-gate 		return (ENOMEM);
5287c478bd9Sstevel@tonic-gate 	head->b_wptr = head->b_rptr = head->b_rptr + wroff;
5297c478bd9Sstevel@tonic-gate 
5307c478bd9Sstevel@tonic-gate 	auio.uio_extflg = UIO_COPY_DEFAULT;
5317c478bd9Sstevel@tonic-gate 	for (i = 0; i < copy_cnt; i++) {
532311e3d4cSgeorges 		if (ISSIG(curthread, JUSTLOOKING)) {
533311e3d4cSgeorges 			freemsg(head);
5347c478bd9Sstevel@tonic-gate 			return (EINTR);
535311e3d4cSgeorges 		}
5367c478bd9Sstevel@tonic-gate 
5377c478bd9Sstevel@tonic-gate 		/*
5387c478bd9Sstevel@tonic-gate 		 * Do similar checks as "write" as we are writing
5397c478bd9Sstevel@tonic-gate 		 * sfv_len bytes into "vp".
5407c478bd9Sstevel@tonic-gate 		 */
5417c478bd9Sstevel@tonic-gate 		sfv_len = (ssize_t)sfv->sfv_len;
5427c478bd9Sstevel@tonic-gate 
5437c478bd9Sstevel@tonic-gate 		if (sfv_len == 0) {
5447c478bd9Sstevel@tonic-gate 			sfv++;
5457c478bd9Sstevel@tonic-gate 			continue;
5467c478bd9Sstevel@tonic-gate 		}
5477c478bd9Sstevel@tonic-gate 
5487c478bd9Sstevel@tonic-gate 		/* Check for overflow */
5497c478bd9Sstevel@tonic-gate #ifdef _SYSCALL32_IMPL
5507c478bd9Sstevel@tonic-gate 		if (model == DATAMODEL_ILP32) {
551311e3d4cSgeorges 			if (((ssize32_t)(*count + sfv_len)) < 0) {
552311e3d4cSgeorges 				freemsg(head);
5537c478bd9Sstevel@tonic-gate 				return (EINVAL);
554311e3d4cSgeorges 			}
5557c478bd9Sstevel@tonic-gate 		} else
5567c478bd9Sstevel@tonic-gate #endif
557311e3d4cSgeorges 		if ((*count + sfv_len) < 0) {
558311e3d4cSgeorges 			freemsg(head);
5597c478bd9Sstevel@tonic-gate 			return (EINVAL);
560311e3d4cSgeorges 		}
5617c478bd9Sstevel@tonic-gate 
5627c478bd9Sstevel@tonic-gate 		sfv_off = (u_offset_t)(ulong_t)sfv->sfv_off;
5637c478bd9Sstevel@tonic-gate 
5647c478bd9Sstevel@tonic-gate 		if (sfv->sfv_fd == SFV_FD_SELF) {
5657c478bd9Sstevel@tonic-gate 			while (sfv_len > 0) {
5667c478bd9Sstevel@tonic-gate 				if (buf_left == 0) {
5677c478bd9Sstevel@tonic-gate 					tmp = dmp;
5687c478bd9Sstevel@tonic-gate 					buf_left = MIN(total_size, maxblk);
5697c478bd9Sstevel@tonic-gate 					iov_len = MIN(buf_left, sfv_len);
570c28749e9Skais 					dmp = allocb(buf_left + extra, BPRI_HI);
5717c478bd9Sstevel@tonic-gate 					if (dmp == NULL) {
5727c478bd9Sstevel@tonic-gate 						freemsg(head);
5737c478bd9Sstevel@tonic-gate 						return (ENOMEM);
5747c478bd9Sstevel@tonic-gate 					}
5757c478bd9Sstevel@tonic-gate 					dmp->b_wptr = dmp->b_rptr =
5767c478bd9Sstevel@tonic-gate 					    dmp->b_rptr + wroff;
5777c478bd9Sstevel@tonic-gate 					tmp->b_cont = dmp;
5787c478bd9Sstevel@tonic-gate 				} else {
5797c478bd9Sstevel@tonic-gate 					iov_len = MIN(buf_left, sfv_len);
5807c478bd9Sstevel@tonic-gate 				}
5817c478bd9Sstevel@tonic-gate 
5827c478bd9Sstevel@tonic-gate 				aiov.iov_len = iov_len;
5837c478bd9Sstevel@tonic-gate 				aiov.iov_base = (caddr_t)(uintptr_t)sfv_off;
5847c478bd9Sstevel@tonic-gate 				auio.uio_loffset = *fileoff;
5857c478bd9Sstevel@tonic-gate 				auio.uio_iovcnt = 1;
5867c478bd9Sstevel@tonic-gate 				auio.uio_resid = iov_len;
5877c478bd9Sstevel@tonic-gate 				auio.uio_iov = &aiov;
5887c478bd9Sstevel@tonic-gate 				auio.uio_segflg = UIO_USERSPACE;
5897c478bd9Sstevel@tonic-gate 				auio.uio_llimit = curproc->p_fsz_ctl;
5907c478bd9Sstevel@tonic-gate 				auio.uio_fmode = fflag;
5917c478bd9Sstevel@tonic-gate 
5927c478bd9Sstevel@tonic-gate 				buf_left -= iov_len;
5937c478bd9Sstevel@tonic-gate 				total_size -= iov_len;
5947c478bd9Sstevel@tonic-gate 				sfv_len -= iov_len;
5957c478bd9Sstevel@tonic-gate 				sfv_off += iov_len;
5967c478bd9Sstevel@tonic-gate 
5977c478bd9Sstevel@tonic-gate 				error = uiomove((caddr_t)dmp->b_wptr,
5987c478bd9Sstevel@tonic-gate 				    iov_len, UIO_WRITE, &auio);
5997c478bd9Sstevel@tonic-gate 				if (error != 0) {
6007c478bd9Sstevel@tonic-gate 					freemsg(head);
6017c478bd9Sstevel@tonic-gate 					return (error);
6027c478bd9Sstevel@tonic-gate 				}
6037c478bd9Sstevel@tonic-gate 				dmp->b_wptr += iov_len;
6047c478bd9Sstevel@tonic-gate 			}
6057c478bd9Sstevel@tonic-gate 		} else {
6067c478bd9Sstevel@tonic-gate 			file_t	*ffp;
6077c478bd9Sstevel@tonic-gate 			vnode_t	*readvp;
6087c478bd9Sstevel@tonic-gate 
6097c478bd9Sstevel@tonic-gate 			if ((ffp = getf(sfv->sfv_fd)) == NULL) {
6107c478bd9Sstevel@tonic-gate 				freemsg(head);
6117c478bd9Sstevel@tonic-gate 				return (EBADF);
6127c478bd9Sstevel@tonic-gate 			}
6137c478bd9Sstevel@tonic-gate 
6147c478bd9Sstevel@tonic-gate 			if ((ffp->f_flag & FREAD) == 0) {
6157c478bd9Sstevel@tonic-gate 				releasef(sfv->sfv_fd);
6167c478bd9Sstevel@tonic-gate 				freemsg(head);
6177c478bd9Sstevel@tonic-gate 				return (EACCES);
6187c478bd9Sstevel@tonic-gate 			}
6197c478bd9Sstevel@tonic-gate 
6207c478bd9Sstevel@tonic-gate 			readvp = ffp->f_vnode;
6217c478bd9Sstevel@tonic-gate 			if (readvp->v_type != VREG) {
6227c478bd9Sstevel@tonic-gate 				releasef(sfv->sfv_fd);
6237c478bd9Sstevel@tonic-gate 				freemsg(head);
6247c478bd9Sstevel@tonic-gate 				return (EINVAL);
6257c478bd9Sstevel@tonic-gate 			}
6267c478bd9Sstevel@tonic-gate 
6277c478bd9Sstevel@tonic-gate 			/*
6287c478bd9Sstevel@tonic-gate 			 * No point reading and writing to same vp,
6297c478bd9Sstevel@tonic-gate 			 * as long as both are regular files. readvp is not
6307c478bd9Sstevel@tonic-gate 			 * locked; but since we got it from an open file the
6317c478bd9Sstevel@tonic-gate 			 * contents will be valid during the time of access.
6327c478bd9Sstevel@tonic-gate 			 */
6337c478bd9Sstevel@tonic-gate 
634bfb244baSpr14459 			if (vn_compare(vp, readvp)) {
6357c478bd9Sstevel@tonic-gate 				releasef(sfv->sfv_fd);
6367c478bd9Sstevel@tonic-gate 				freemsg(head);
6377c478bd9Sstevel@tonic-gate 				return (EINVAL);
6387c478bd9Sstevel@tonic-gate 			}
6397c478bd9Sstevel@tonic-gate 
6407c478bd9Sstevel@tonic-gate 			/*
6417c478bd9Sstevel@tonic-gate 			 * Note: we assume readvp != vp. "vp" is already
6427c478bd9Sstevel@tonic-gate 			 * locked, and "readvp" must not be.
6437c478bd9Sstevel@tonic-gate 			 */
6447c478bd9Sstevel@tonic-gate 
6457c478bd9Sstevel@tonic-gate 			(void) VOP_RWLOCK(readvp, readflg, NULL);
6467c478bd9Sstevel@tonic-gate 
6477c478bd9Sstevel@tonic-gate 			/* Same checks as in pread */
6487c478bd9Sstevel@tonic-gate 			if (sfv_off > maxoff) {
6497c478bd9Sstevel@tonic-gate 				VOP_RWUNLOCK(readvp, readflg, NULL);
6507c478bd9Sstevel@tonic-gate 				releasef(sfv->sfv_fd);
6517c478bd9Sstevel@tonic-gate 				freemsg(head);
6527c478bd9Sstevel@tonic-gate 				return (EINVAL);
6537c478bd9Sstevel@tonic-gate 			}
6547c478bd9Sstevel@tonic-gate 			if (sfv_off + sfv_len > maxoff) {
6550a8433caSrshoaib 				total_size -= (sfv_off + sfv_len - maxoff);
6567c478bd9Sstevel@tonic-gate 				sfv_len = (ssize_t)((offset_t)maxoff -
6577c478bd9Sstevel@tonic-gate 				    sfv_off);
6587c478bd9Sstevel@tonic-gate 			}
6597c478bd9Sstevel@tonic-gate 
6607c478bd9Sstevel@tonic-gate 			while (sfv_len > 0) {
6617c478bd9Sstevel@tonic-gate 				if (buf_left == 0) {
6627c478bd9Sstevel@tonic-gate 					tmp = dmp;
6637c478bd9Sstevel@tonic-gate 					buf_left = MIN(total_size, maxblk);
6647c478bd9Sstevel@tonic-gate 					iov_len = MIN(buf_left, sfv_len);
665c28749e9Skais 					dmp = allocb(buf_left + extra, BPRI_HI);
6667c478bd9Sstevel@tonic-gate 					if (dmp == NULL) {
6677c478bd9Sstevel@tonic-gate 						VOP_RWUNLOCK(readvp, readflg,
6687c478bd9Sstevel@tonic-gate 						    NULL);
6697c478bd9Sstevel@tonic-gate 						releasef(sfv->sfv_fd);
6707c478bd9Sstevel@tonic-gate 						freemsg(head);
6717c478bd9Sstevel@tonic-gate 						return (ENOMEM);
6727c478bd9Sstevel@tonic-gate 					}
6737c478bd9Sstevel@tonic-gate 					dmp->b_wptr = dmp->b_rptr =
6747c478bd9Sstevel@tonic-gate 					    dmp->b_rptr + wroff;
6757c478bd9Sstevel@tonic-gate 					tmp->b_cont = dmp;
6767c478bd9Sstevel@tonic-gate 				} else {
6777c478bd9Sstevel@tonic-gate 					iov_len = MIN(buf_left, sfv_len);
6787c478bd9Sstevel@tonic-gate 				}
6797c478bd9Sstevel@tonic-gate 				aiov.iov_base = (caddr_t)dmp->b_wptr;
6807c478bd9Sstevel@tonic-gate 				aiov.iov_len = iov_len;
6817c478bd9Sstevel@tonic-gate 				auio.uio_loffset = sfv_off;
6827c478bd9Sstevel@tonic-gate 				auio.uio_iov = &aiov;
6837c478bd9Sstevel@tonic-gate 				auio.uio_iovcnt = 1;
6847c478bd9Sstevel@tonic-gate 				auio.uio_resid = iov_len;
6857c478bd9Sstevel@tonic-gate 				auio.uio_segflg = UIO_SYSSPACE;
6867c478bd9Sstevel@tonic-gate 				auio.uio_llimit = MAXOFFSET_T;
6877c478bd9Sstevel@tonic-gate 				auio.uio_fmode = ffp->f_flag;
6887c478bd9Sstevel@tonic-gate 				ioflag = auio.uio_fmode &
6897c478bd9Sstevel@tonic-gate 				    (FAPPEND|FSYNC|FDSYNC|FRSYNC);
6907c478bd9Sstevel@tonic-gate 
6917c478bd9Sstevel@tonic-gate 				/*
6927c478bd9Sstevel@tonic-gate 				 * If read sync is not asked for,
6937c478bd9Sstevel@tonic-gate 				 * filter sync flags
6947c478bd9Sstevel@tonic-gate 				 */
6957c478bd9Sstevel@tonic-gate 				if ((ioflag & FRSYNC) == 0)
6967c478bd9Sstevel@tonic-gate 					ioflag &= ~(FSYNC|FDSYNC);
6977c478bd9Sstevel@tonic-gate 				error = VOP_READ(readvp, &auio, ioflag,
6987c478bd9Sstevel@tonic-gate 				    fp->f_cred, NULL);
6997c478bd9Sstevel@tonic-gate 				if (error != 0) {
7007c478bd9Sstevel@tonic-gate 					/*
7017c478bd9Sstevel@tonic-gate 					 * If we were reading a pipe (currently
7027c478bd9Sstevel@tonic-gate 					 * not implemented), we may now lose
7037c478bd9Sstevel@tonic-gate 					 * data.
7047c478bd9Sstevel@tonic-gate 					 */
7057c478bd9Sstevel@tonic-gate 					VOP_RWUNLOCK(readvp, readflg, NULL);
7067c478bd9Sstevel@tonic-gate 					releasef(sfv->sfv_fd);
7077c478bd9Sstevel@tonic-gate 					freemsg(head);
7087c478bd9Sstevel@tonic-gate 					return (error);
7097c478bd9Sstevel@tonic-gate 				}
7107c478bd9Sstevel@tonic-gate 
7117c478bd9Sstevel@tonic-gate 				/*
7127c478bd9Sstevel@tonic-gate 				 * Check how much data was really read.
7137c478bd9Sstevel@tonic-gate 				 * Decrement the 'len' and increment the
7147c478bd9Sstevel@tonic-gate 				 * 'off' appropriately.
7157c478bd9Sstevel@tonic-gate 				 */
7167c478bd9Sstevel@tonic-gate 				cnt = iov_len - auio.uio_resid;
7177c478bd9Sstevel@tonic-gate 				if (cnt == 0) {
7187c478bd9Sstevel@tonic-gate 					VOP_RWUNLOCK(readvp, readflg, NULL);
7197c478bd9Sstevel@tonic-gate 					releasef(sfv->sfv_fd);
7207c478bd9Sstevel@tonic-gate 					freemsg(head);
7217c478bd9Sstevel@tonic-gate 					return (EINVAL);
7227c478bd9Sstevel@tonic-gate 				}
7237c478bd9Sstevel@tonic-gate 				sfv_len -= cnt;
7247c478bd9Sstevel@tonic-gate 				sfv_off += cnt;
7257c478bd9Sstevel@tonic-gate 				total_size -= cnt;
7267c478bd9Sstevel@tonic-gate 				buf_left -= cnt;
7277c478bd9Sstevel@tonic-gate 
7287c478bd9Sstevel@tonic-gate 				dmp->b_wptr += cnt;
7297c478bd9Sstevel@tonic-gate 			}
7307c478bd9Sstevel@tonic-gate 			VOP_RWUNLOCK(readvp, readflg, NULL);
7317c478bd9Sstevel@tonic-gate 			releasef(sfv->sfv_fd);
7327c478bd9Sstevel@tonic-gate 		}
7337c478bd9Sstevel@tonic-gate 		sfv++;
7347c478bd9Sstevel@tonic-gate 	}
7357c478bd9Sstevel@tonic-gate 
7367c478bd9Sstevel@tonic-gate 	ASSERT(total_size == 0);
7377c478bd9Sstevel@tonic-gate 	error = kstrwritemp(vp, head, fflag);
7387c478bd9Sstevel@tonic-gate 	if (error != 0) {
7397c478bd9Sstevel@tonic-gate 		freemsg(head);
7407c478bd9Sstevel@tonic-gate 		return (error);
7417c478bd9Sstevel@tonic-gate 	}
7427c478bd9Sstevel@tonic-gate 	ttolwp(curthread)->lwp_ru.ioch += (ulong_t)size;
7437c478bd9Sstevel@tonic-gate 	*count += size;
7447c478bd9Sstevel@tonic-gate 
7457c478bd9Sstevel@tonic-gate 	return (0);
7467c478bd9Sstevel@tonic-gate }
7477c478bd9Sstevel@tonic-gate 
7487c478bd9Sstevel@tonic-gate 
7497c478bd9Sstevel@tonic-gate int
7507c478bd9Sstevel@tonic-gate sendvec_chunk(file_t *fp, u_offset_t *fileoff, struct sendfilevec *sfv,
7517c478bd9Sstevel@tonic-gate     int copy_cnt, ssize_t *count)
7527c478bd9Sstevel@tonic-gate {
7537c478bd9Sstevel@tonic-gate 	struct vnode *vp;
7547c478bd9Sstevel@tonic-gate 	struct uio auio;
7557c478bd9Sstevel@tonic-gate 	struct iovec aiov;
7567c478bd9Sstevel@tonic-gate 	ushort_t fflag;
7577c478bd9Sstevel@tonic-gate 	int ioflag;
7587c478bd9Sstevel@tonic-gate 	int i, error;
7597c478bd9Sstevel@tonic-gate 	size_t cnt;
7607c478bd9Sstevel@tonic-gate 	ssize_t sfv_len;
7617c478bd9Sstevel@tonic-gate 	u_offset_t sfv_off;
7627c478bd9Sstevel@tonic-gate #ifdef _SYSCALL32_IMPL
7637c478bd9Sstevel@tonic-gate 	model_t model = get_udatamodel();
7647c478bd9Sstevel@tonic-gate 	u_offset_t maxoff = (model == DATAMODEL_ILP32) ?
7657c478bd9Sstevel@tonic-gate 	    MAXOFF32_T : MAXOFFSET_T;
7667c478bd9Sstevel@tonic-gate #else
7677c478bd9Sstevel@tonic-gate 	const u_offset_t maxoff = MAXOFF32_T;
7687c478bd9Sstevel@tonic-gate #endif
7691574ae68Sjohansen 	mblk_t	*dmp = NULL;
7701574ae68Sjohansen 	char	*buf = NULL;
771c28749e9Skais 	size_t  extra;
772c28749e9Skais 	int maxblk, wroff, tail_len;
773c28749e9Skais 	struct sonode *so;
774c28749e9Skais 	stdata_t *stp;
7757c478bd9Sstevel@tonic-gate 
7767c478bd9Sstevel@tonic-gate 	fflag = fp->f_flag;
7777c478bd9Sstevel@tonic-gate 	vp = fp->f_vnode;
7787c478bd9Sstevel@tonic-gate 
779c28749e9Skais 	if (vp->v_type == VSOCK) {
780c28749e9Skais 		so = VTOSO(vp);
781c28749e9Skais 		stp = vp->v_stream;
782c28749e9Skais 		wroff = (int)stp->sd_wroff;
783c28749e9Skais 		tail_len = (int)stp->sd_tail;
784c28749e9Skais 		maxblk = (int)stp->sd_maxblk;
785c28749e9Skais 		extra = wroff + tail_len;
786c28749e9Skais 	}
787c28749e9Skais 
7887c478bd9Sstevel@tonic-gate 	auio.uio_extflg = UIO_COPY_DEFAULT;
7897c478bd9Sstevel@tonic-gate 	for (i = 0; i < copy_cnt; i++) {
7907c478bd9Sstevel@tonic-gate 		if (ISSIG(curthread, JUSTLOOKING))
7917c478bd9Sstevel@tonic-gate 			return (EINTR);
7927c478bd9Sstevel@tonic-gate 
7937c478bd9Sstevel@tonic-gate 		/*
7947c478bd9Sstevel@tonic-gate 		 * Do similar checks as "write" as we are writing
7957c478bd9Sstevel@tonic-gate 		 * sfv_len bytes into "vp".
7967c478bd9Sstevel@tonic-gate 		 */
7977c478bd9Sstevel@tonic-gate 		sfv_len = (ssize_t)sfv->sfv_len;
7987c478bd9Sstevel@tonic-gate 
7997c478bd9Sstevel@tonic-gate 		if (sfv_len == 0) {
8007c478bd9Sstevel@tonic-gate 			sfv++;
8017c478bd9Sstevel@tonic-gate 			continue;
8027c478bd9Sstevel@tonic-gate 		}
8037c478bd9Sstevel@tonic-gate 
8047c478bd9Sstevel@tonic-gate 		if (vp->v_type == VREG) {
8057c478bd9Sstevel@tonic-gate 			if (*fileoff >= curproc->p_fsz_ctl) {
8067c478bd9Sstevel@tonic-gate 				mutex_enter(&curproc->p_lock);
8077c478bd9Sstevel@tonic-gate 				(void) rctl_action(
8087c478bd9Sstevel@tonic-gate 				    rctlproc_legacy[RLIMIT_FSIZE],
8097c478bd9Sstevel@tonic-gate 				    curproc->p_rctls, curproc, RCA_SAFE);
8107c478bd9Sstevel@tonic-gate 				mutex_exit(&curproc->p_lock);
8117c478bd9Sstevel@tonic-gate 
8127c478bd9Sstevel@tonic-gate 				return (EFBIG);
8137c478bd9Sstevel@tonic-gate 			}
8147c478bd9Sstevel@tonic-gate 
8157c478bd9Sstevel@tonic-gate 			if (*fileoff >= maxoff)
8167c478bd9Sstevel@tonic-gate 				return (EFBIG);
8177c478bd9Sstevel@tonic-gate 
8187c478bd9Sstevel@tonic-gate 			if (*fileoff + sfv_len > maxoff)
8197c478bd9Sstevel@tonic-gate 				return (EINVAL);
8207c478bd9Sstevel@tonic-gate 		}
8217c478bd9Sstevel@tonic-gate 
8227c478bd9Sstevel@tonic-gate 		/* Check for overflow */
8237c478bd9Sstevel@tonic-gate #ifdef _SYSCALL32_IMPL
8247c478bd9Sstevel@tonic-gate 		if (model == DATAMODEL_ILP32) {
8257c478bd9Sstevel@tonic-gate 			if (((ssize32_t)(*count + sfv_len)) < 0)
8267c478bd9Sstevel@tonic-gate 				return (EINVAL);
8277c478bd9Sstevel@tonic-gate 		} else
8287c478bd9Sstevel@tonic-gate #endif
8297c478bd9Sstevel@tonic-gate 		if ((*count + sfv_len) < 0)
8307c478bd9Sstevel@tonic-gate 			return (EINVAL);
8317c478bd9Sstevel@tonic-gate 
8327c478bd9Sstevel@tonic-gate 		sfv_off = (u_offset_t)(ulong_t)sfv->sfv_off;
8337c478bd9Sstevel@tonic-gate 
8347c478bd9Sstevel@tonic-gate 		if (sfv->sfv_fd == SFV_FD_SELF) {
8357c478bd9Sstevel@tonic-gate 			aiov.iov_len = sfv_len;
8367c478bd9Sstevel@tonic-gate 			aiov.iov_base = (caddr_t)(uintptr_t)sfv_off;
8377c478bd9Sstevel@tonic-gate 			auio.uio_loffset = *fileoff;
8387c478bd9Sstevel@tonic-gate 			auio.uio_iovcnt = 1;
8397c478bd9Sstevel@tonic-gate 			auio.uio_resid = sfv_len;
8407c478bd9Sstevel@tonic-gate 			auio.uio_iov = &aiov;
8417c478bd9Sstevel@tonic-gate 			auio.uio_segflg = UIO_USERSPACE;
8427c478bd9Sstevel@tonic-gate 			auio.uio_llimit = curproc->p_fsz_ctl;
8437c478bd9Sstevel@tonic-gate 			auio.uio_fmode = fflag;
8447c478bd9Sstevel@tonic-gate 
8457c478bd9Sstevel@tonic-gate 			if (vp->v_type == VSOCK) {
8467c478bd9Sstevel@tonic-gate 
8477c478bd9Sstevel@tonic-gate 				/*
8487c478bd9Sstevel@tonic-gate 				 * Optimize for the socket case
8497c478bd9Sstevel@tonic-gate 				 */
8507c478bd9Sstevel@tonic-gate 
851c28749e9Skais 				dmp = allocb(sfv_len + extra, BPRI_HI);
8527c478bd9Sstevel@tonic-gate 				if (dmp == NULL)
8537c478bd9Sstevel@tonic-gate 					return (ENOMEM);
8547c478bd9Sstevel@tonic-gate 				dmp->b_wptr = dmp->b_rptr = dmp->b_rptr + wroff;
8557c478bd9Sstevel@tonic-gate 				error = uiomove((caddr_t)dmp->b_wptr,
8567c478bd9Sstevel@tonic-gate 				    sfv_len, UIO_WRITE, &auio);
8577c478bd9Sstevel@tonic-gate 				if (error != 0) {
8587c478bd9Sstevel@tonic-gate 					freeb(dmp);
8597c478bd9Sstevel@tonic-gate 					return (error);
8607c478bd9Sstevel@tonic-gate 				}
8617c478bd9Sstevel@tonic-gate 				dmp->b_wptr += sfv_len;
8627c478bd9Sstevel@tonic-gate 				error = kstrwritemp(vp, dmp, fflag);
8637c478bd9Sstevel@tonic-gate 				if (error != 0) {
8647c478bd9Sstevel@tonic-gate 					freeb(dmp);
8657c478bd9Sstevel@tonic-gate 					return (error);
8667c478bd9Sstevel@tonic-gate 				}
8677c478bd9Sstevel@tonic-gate 				ttolwp(curthread)->lwp_ru.ioch +=
8687c478bd9Sstevel@tonic-gate 				    (ulong_t)sfv_len;
8697c478bd9Sstevel@tonic-gate 				*count += sfv_len;
8707c478bd9Sstevel@tonic-gate 			} else {
8717c478bd9Sstevel@tonic-gate 				ioflag = auio.uio_fmode &
8727c478bd9Sstevel@tonic-gate 				    (FAPPEND|FSYNC|FDSYNC|FRSYNC);
8737c478bd9Sstevel@tonic-gate 				while (sfv_len > 0) {
8747c478bd9Sstevel@tonic-gate 					error = VOP_WRITE(vp, &auio, ioflag,
8757c478bd9Sstevel@tonic-gate 					    fp->f_cred, NULL);
8767c478bd9Sstevel@tonic-gate 					cnt = sfv_len - auio.uio_resid;
8777c478bd9Sstevel@tonic-gate 					sfv_len -= cnt;
8787c478bd9Sstevel@tonic-gate 					ttolwp(curthread)->lwp_ru.ioch +=
8797c478bd9Sstevel@tonic-gate 					    (ulong_t)cnt;
8807c478bd9Sstevel@tonic-gate 					*fileoff += cnt;
8817c478bd9Sstevel@tonic-gate 					*count += cnt;
8827c478bd9Sstevel@tonic-gate 					if (error != 0)
8837c478bd9Sstevel@tonic-gate 						return (error);
8847c478bd9Sstevel@tonic-gate 				}
8857c478bd9Sstevel@tonic-gate 			}
8867c478bd9Sstevel@tonic-gate 		} else {
8877f9ee850Sblu 			int segmapit = 0;
8887c478bd9Sstevel@tonic-gate 			file_t	*ffp;
8897c478bd9Sstevel@tonic-gate 			vnode_t	*readvp;
890bfb244baSpr14459 			struct vnode *realvp;
8917c478bd9Sstevel@tonic-gate 			size_t	size;
8927c478bd9Sstevel@tonic-gate 			caddr_t	ptr;
8937c478bd9Sstevel@tonic-gate 
8947c478bd9Sstevel@tonic-gate 			if ((ffp = getf(sfv->sfv_fd)) == NULL)
8957c478bd9Sstevel@tonic-gate 				return (EBADF);
8967c478bd9Sstevel@tonic-gate 
8977c478bd9Sstevel@tonic-gate 			if ((ffp->f_flag & FREAD) == 0) {
8987c478bd9Sstevel@tonic-gate 				releasef(sfv->sfv_fd);
8997c478bd9Sstevel@tonic-gate 				return (EBADF);
9007c478bd9Sstevel@tonic-gate 			}
9017c478bd9Sstevel@tonic-gate 
9027c478bd9Sstevel@tonic-gate 			readvp = ffp->f_vnode;
903da6c28aaSamw 			if (VOP_REALVP(readvp, &realvp, NULL) == 0)
904bfb244baSpr14459 				readvp = realvp;
9057c478bd9Sstevel@tonic-gate 			if (readvp->v_type != VREG) {
9067c478bd9Sstevel@tonic-gate 				releasef(sfv->sfv_fd);
9077c478bd9Sstevel@tonic-gate 				return (EINVAL);
9087c478bd9Sstevel@tonic-gate 			}
9097c478bd9Sstevel@tonic-gate 
9107c478bd9Sstevel@tonic-gate 			/*
9117c478bd9Sstevel@tonic-gate 			 * No point reading and writing to same vp,
9127c478bd9Sstevel@tonic-gate 			 * as long as both are regular files. readvp is not
9137c478bd9Sstevel@tonic-gate 			 * locked; but since we got it from an open file the
9147c478bd9Sstevel@tonic-gate 			 * contents will be valid during the time of access.
9157c478bd9Sstevel@tonic-gate 			 */
916bfb244baSpr14459 			if (vn_compare(vp, readvp)) {
9177c478bd9Sstevel@tonic-gate 				releasef(sfv->sfv_fd);
9187c478bd9Sstevel@tonic-gate 				return (EINVAL);
9197c478bd9Sstevel@tonic-gate 			}
9207c478bd9Sstevel@tonic-gate 
9217c478bd9Sstevel@tonic-gate 			/*
9227c478bd9Sstevel@tonic-gate 			 * Note: we assume readvp != vp. "vp" is already
9237c478bd9Sstevel@tonic-gate 			 * locked, and "readvp" must not be.
9247c478bd9Sstevel@tonic-gate 			 */
9257c478bd9Sstevel@tonic-gate 			(void) VOP_RWLOCK(readvp, readflg, NULL);
9267c478bd9Sstevel@tonic-gate 
9277c478bd9Sstevel@tonic-gate 			/* Same checks as in pread */
9287c478bd9Sstevel@tonic-gate 			if (sfv_off > maxoff) {
9297c478bd9Sstevel@tonic-gate 				VOP_RWUNLOCK(readvp, readflg, NULL);
9307c478bd9Sstevel@tonic-gate 				releasef(sfv->sfv_fd);
9317c478bd9Sstevel@tonic-gate 				return (EINVAL);
9327c478bd9Sstevel@tonic-gate 			}
9337c478bd9Sstevel@tonic-gate 			if (sfv_off + sfv_len > maxoff) {
9347c478bd9Sstevel@tonic-gate 				sfv_len = (ssize_t)((offset_t)maxoff -
9357c478bd9Sstevel@tonic-gate 				    sfv_off);
9367c478bd9Sstevel@tonic-gate 			}
9377c478bd9Sstevel@tonic-gate 			/* Find the native blocksize to transfer data */
9387c478bd9Sstevel@tonic-gate 			size = MIN(vp->v_vfsp->vfs_bsize,
9397c478bd9Sstevel@tonic-gate 			    readvp->v_vfsp->vfs_bsize);
9407c478bd9Sstevel@tonic-gate 			size = sfv_len < size ? sfv_len : size;
9417c478bd9Sstevel@tonic-gate 
9421574ae68Sjohansen 			if (vp->v_type != VSOCK) {
94374024373Spr14459 				segmapit = 0;
9441574ae68Sjohansen 				buf = kmem_alloc(size, KM_NOSLEEP);
9451574ae68Sjohansen 				if (buf == NULL) {
9461574ae68Sjohansen 					VOP_RWUNLOCK(readvp, readflg, NULL);
9471574ae68Sjohansen 					releasef(sfv->sfv_fd);
9481574ae68Sjohansen 					return (ENOMEM);
9491574ae68Sjohansen 				}
950c28749e9Skais 			} else {
951c28749e9Skais 				/*
952c28749e9Skais 				 * For sockets acting as an SSL proxy, we
953c28749e9Skais 				 * need to adjust the size to the maximum
954c28749e9Skais 				 * SSL record size set in the stream head.
955c28749e9Skais 				 */
956c28749e9Skais 				if (so->so_kssl_ctx != NULL)
957c28749e9Skais 					size = MIN(size, maxblk);
95874024373Spr14459 
95974024373Spr14459 				if (vn_has_flocks(readvp) ||
96074024373Spr14459 				    readvp->v_flag & VNOMAP ||
96174024373Spr14459 				    stp->sd_copyflag & STZCVMUNSAFE) {
96274024373Spr14459 					segmapit = 0;
96374024373Spr14459 				} else if (stp->sd_copyflag & STZCVMSAFE) {
96474024373Spr14459 					segmapit = 1;
96574024373Spr14459 				} else {
96674024373Spr14459 					int on = 1;
96774024373Spr14459 					if (SOP_SETSOCKOPT(VTOSO(vp),
96874024373Spr14459 					    SOL_SOCKET, SO_SND_COPYAVOID,
96974024373Spr14459 					    &on, sizeof (on)) == 0)
97074024373Spr14459 					segmapit = 1;
97174024373Spr14459 				}
97274024373Spr14459 			}
97374024373Spr14459 
97474024373Spr14459 			if (segmapit) {
97574024373Spr14459 				boolean_t nowait;
97674024373Spr14459 
97774024373Spr14459 				nowait = (sfv->sfv_flag & SFV_NOWAIT) != 0;
97874024373Spr14459 				error = snf_segmap(fp, readvp, sfv_off,
979*3b3d24f3SJayakara Kini 				    (u_offset_t)sfv_len, (ssize_t *)&cnt,
980*3b3d24f3SJayakara Kini 				    nowait);
98174024373Spr14459 				releasef(sfv->sfv_fd);
98274024373Spr14459 				*count += cnt;
98374024373Spr14459 				if (error)
98474024373Spr14459 					return (error);
98574024373Spr14459 				sfv++;
98674024373Spr14459 				continue;
9871574ae68Sjohansen 			}
9881574ae68Sjohansen 
9897c478bd9Sstevel@tonic-gate 			while (sfv_len > 0) {
9907c478bd9Sstevel@tonic-gate 				size_t	iov_len;
9917c478bd9Sstevel@tonic-gate 
9927c478bd9Sstevel@tonic-gate 				iov_len = MIN(size, sfv_len);
9937c478bd9Sstevel@tonic-gate 
9941574ae68Sjohansen 				if (vp->v_type == VSOCK) {
995c28749e9Skais 					dmp = allocb(iov_len + extra, BPRI_HI);
9967c478bd9Sstevel@tonic-gate 					if (dmp == NULL) {
9971574ae68Sjohansen 						VOP_RWUNLOCK(readvp, readflg,
9981574ae68Sjohansen 						    NULL);
9997c478bd9Sstevel@tonic-gate 						releasef(sfv->sfv_fd);
10007c478bd9Sstevel@tonic-gate 						return (ENOMEM);
10017c478bd9Sstevel@tonic-gate 					}
1002c28749e9Skais 					dmp->b_wptr = dmp->b_rptr =
1003c28749e9Skais 					    dmp->b_rptr + wroff;
10047c478bd9Sstevel@tonic-gate 					ptr = (caddr_t)dmp->b_rptr;
10051574ae68Sjohansen 				} else {
10061574ae68Sjohansen 					ptr = buf;
10071574ae68Sjohansen 				}
10087c478bd9Sstevel@tonic-gate 
10097c478bd9Sstevel@tonic-gate 				aiov.iov_base = ptr;
10107c478bd9Sstevel@tonic-gate 				aiov.iov_len = iov_len;
10117c478bd9Sstevel@tonic-gate 				auio.uio_loffset = sfv_off;
10127c478bd9Sstevel@tonic-gate 				auio.uio_iov = &aiov;
10137c478bd9Sstevel@tonic-gate 				auio.uio_iovcnt = 1;
10147c478bd9Sstevel@tonic-gate 				auio.uio_resid = iov_len;
10157c478bd9Sstevel@tonic-gate 				auio.uio_segflg = UIO_SYSSPACE;
10167c478bd9Sstevel@tonic-gate 				auio.uio_llimit = MAXOFFSET_T;
10177c478bd9Sstevel@tonic-gate 				auio.uio_fmode = ffp->f_flag;
10187c478bd9Sstevel@tonic-gate 				ioflag = auio.uio_fmode &
10197c478bd9Sstevel@tonic-gate 				    (FAPPEND|FSYNC|FDSYNC|FRSYNC);
10207c478bd9Sstevel@tonic-gate 
10217c478bd9Sstevel@tonic-gate 				/*
10227c478bd9Sstevel@tonic-gate 				 * If read sync is not asked for,
10237c478bd9Sstevel@tonic-gate 				 * filter sync flags
10247c478bd9Sstevel@tonic-gate 				 */
10257c478bd9Sstevel@tonic-gate 				if ((ioflag & FRSYNC) == 0)
10267c478bd9Sstevel@tonic-gate 					ioflag &= ~(FSYNC|FDSYNC);
10277c478bd9Sstevel@tonic-gate 				error = VOP_READ(readvp, &auio, ioflag,
10287c478bd9Sstevel@tonic-gate 				    fp->f_cred, NULL);
10297c478bd9Sstevel@tonic-gate 				if (error != 0) {
10307c478bd9Sstevel@tonic-gate 					/*
10317c478bd9Sstevel@tonic-gate 					 * If we were reading a pipe (currently
10327c478bd9Sstevel@tonic-gate 					 * not implemented), we may now lose
10337c478bd9Sstevel@tonic-gate 					 * data.
10347c478bd9Sstevel@tonic-gate 					 */
10351574ae68Sjohansen 					if (vp->v_type == VSOCK)
10367c478bd9Sstevel@tonic-gate 						freeb(dmp);
10371574ae68Sjohansen 					else
10381574ae68Sjohansen 						kmem_free(buf, size);
10397c478bd9Sstevel@tonic-gate 					VOP_RWUNLOCK(readvp, readflg, NULL);
10407c478bd9Sstevel@tonic-gate 					releasef(sfv->sfv_fd);
10417c478bd9Sstevel@tonic-gate 					return (error);
10427c478bd9Sstevel@tonic-gate 				}
10437c478bd9Sstevel@tonic-gate 
10447c478bd9Sstevel@tonic-gate 				/*
10457c478bd9Sstevel@tonic-gate 				 * Check how much data was really read.
10467c478bd9Sstevel@tonic-gate 				 * Decrement the 'len' and increment the
10477c478bd9Sstevel@tonic-gate 				 * 'off' appropriately.
10487c478bd9Sstevel@tonic-gate 				 */
10497c478bd9Sstevel@tonic-gate 				cnt = iov_len - auio.uio_resid;
10507c478bd9Sstevel@tonic-gate 				if (cnt == 0) {
10511574ae68Sjohansen 					if (vp->v_type == VSOCK)
10527c478bd9Sstevel@tonic-gate 						freeb(dmp);
10531574ae68Sjohansen 					else
10541574ae68Sjohansen 						kmem_free(buf, size);
10557c478bd9Sstevel@tonic-gate 					VOP_RWUNLOCK(readvp, readflg, NULL);
10567c478bd9Sstevel@tonic-gate 					releasef(sfv->sfv_fd);
10577c478bd9Sstevel@tonic-gate 					return (EINVAL);
10587c478bd9Sstevel@tonic-gate 				}
10597c478bd9Sstevel@tonic-gate 				sfv_len -= cnt;
10607c478bd9Sstevel@tonic-gate 				sfv_off += cnt;
10617c478bd9Sstevel@tonic-gate 
10627c478bd9Sstevel@tonic-gate 				if (vp->v_type == VSOCK) {
10637c478bd9Sstevel@tonic-gate 					dmp->b_wptr = dmp->b_rptr + cnt;
10647c478bd9Sstevel@tonic-gate 
10657c478bd9Sstevel@tonic-gate 					error = kstrwritemp(vp, dmp, fflag);
10667c478bd9Sstevel@tonic-gate 					if (error != 0) {
10677c478bd9Sstevel@tonic-gate 						freeb(dmp);
10687c478bd9Sstevel@tonic-gate 						VOP_RWUNLOCK(readvp, readflg,
10697c478bd9Sstevel@tonic-gate 						    NULL);
10707c478bd9Sstevel@tonic-gate 						releasef(sfv->sfv_fd);
10717c478bd9Sstevel@tonic-gate 						return (error);
10727c478bd9Sstevel@tonic-gate 					}
10737c478bd9Sstevel@tonic-gate 
10747c478bd9Sstevel@tonic-gate 					ttolwp(curthread)->lwp_ru.ioch +=
10757c478bd9Sstevel@tonic-gate 					    (ulong_t)cnt;
10767c478bd9Sstevel@tonic-gate 					*count += cnt;
10777c478bd9Sstevel@tonic-gate 				} else {
10787c478bd9Sstevel@tonic-gate 
10797c478bd9Sstevel@tonic-gate 					aiov.iov_base = ptr;
10807c478bd9Sstevel@tonic-gate 					aiov.iov_len = cnt;
10817c478bd9Sstevel@tonic-gate 					auio.uio_loffset = *fileoff;
10827c478bd9Sstevel@tonic-gate 					auio.uio_resid = cnt;
10837c478bd9Sstevel@tonic-gate 					auio.uio_segflg = UIO_SYSSPACE;
10847c478bd9Sstevel@tonic-gate 					auio.uio_llimit = curproc->p_fsz_ctl;
10857c478bd9Sstevel@tonic-gate 					auio.uio_fmode = fflag;
10867c478bd9Sstevel@tonic-gate 					ioflag = auio.uio_fmode &
10877c478bd9Sstevel@tonic-gate 					    (FAPPEND|FSYNC|FDSYNC|FRSYNC);
10887c478bd9Sstevel@tonic-gate 					error = VOP_WRITE(vp, &auio, ioflag,
10897c478bd9Sstevel@tonic-gate 					    fp->f_cred, NULL);
10907c478bd9Sstevel@tonic-gate 
10917c478bd9Sstevel@tonic-gate 					/*
10927c478bd9Sstevel@tonic-gate 					 * Check how much data was written.
10937c478bd9Sstevel@tonic-gate 					 * Increment the 'len' and decrement the
10947c478bd9Sstevel@tonic-gate 					 * 'off' if all the data was not
10957c478bd9Sstevel@tonic-gate 					 * written.
10967c478bd9Sstevel@tonic-gate 					 */
10977c478bd9Sstevel@tonic-gate 					cnt -= auio.uio_resid;
10987c478bd9Sstevel@tonic-gate 					sfv_len += auio.uio_resid;
10997c478bd9Sstevel@tonic-gate 					sfv_off -= auio.uio_resid;
11007c478bd9Sstevel@tonic-gate 					ttolwp(curthread)->lwp_ru.ioch +=
11017c478bd9Sstevel@tonic-gate 					    (ulong_t)cnt;
11027c478bd9Sstevel@tonic-gate 					*fileoff += cnt;
11037c478bd9Sstevel@tonic-gate 					*count += cnt;
11047c478bd9Sstevel@tonic-gate 					if (error != 0) {
11052db6c79fSstevel 						kmem_free(buf, size);
11067c478bd9Sstevel@tonic-gate 						VOP_RWUNLOCK(readvp, readflg,
11077c478bd9Sstevel@tonic-gate 						    NULL);
11087c478bd9Sstevel@tonic-gate 						releasef(sfv->sfv_fd);
11097c478bd9Sstevel@tonic-gate 						return (error);
11107c478bd9Sstevel@tonic-gate 					}
11117c478bd9Sstevel@tonic-gate 				}
11127c478bd9Sstevel@tonic-gate 			}
11131574ae68Sjohansen 			if (buf) {
11141574ae68Sjohansen 				kmem_free(buf, size);
11151574ae68Sjohansen 				buf = NULL;
11161574ae68Sjohansen 			}
11177c478bd9Sstevel@tonic-gate 			VOP_RWUNLOCK(readvp, readflg, NULL);
11187c478bd9Sstevel@tonic-gate 			releasef(sfv->sfv_fd);
11197c478bd9Sstevel@tonic-gate 		}
11207c478bd9Sstevel@tonic-gate 		sfv++;
11217c478bd9Sstevel@tonic-gate 	}
11227c478bd9Sstevel@tonic-gate 	return (0);
11237c478bd9Sstevel@tonic-gate }
11247c478bd9Sstevel@tonic-gate 
11257c478bd9Sstevel@tonic-gate ssize_t
11267c478bd9Sstevel@tonic-gate sendfilev(int opcode, int fildes, const struct sendfilevec *vec, int sfvcnt,
11277c478bd9Sstevel@tonic-gate     size_t *xferred)
11287c478bd9Sstevel@tonic-gate {
1129311e3d4cSgeorges 	int error = 0;
1130311e3d4cSgeorges 	int first_vector_error = 0;
11317c478bd9Sstevel@tonic-gate 	file_t *fp;
11327c478bd9Sstevel@tonic-gate 	struct vnode *vp;
11337c478bd9Sstevel@tonic-gate 	struct sonode *so;
11347c478bd9Sstevel@tonic-gate 	u_offset_t fileoff;
11357c478bd9Sstevel@tonic-gate 	int copy_cnt;
11367c478bd9Sstevel@tonic-gate 	const struct sendfilevec *copy_vec;
11377c478bd9Sstevel@tonic-gate 	struct sendfilevec sfv[SEND_MAX_CHUNK];
11387c478bd9Sstevel@tonic-gate 	ssize_t count = 0;
11397c478bd9Sstevel@tonic-gate #ifdef _SYSCALL32_IMPL
11407c478bd9Sstevel@tonic-gate 	struct ksendfilevec32 sfv32[SEND_MAX_CHUNK];
11417c478bd9Sstevel@tonic-gate #endif
11420a8433caSrshoaib 	ssize_t total_size;
11437c478bd9Sstevel@tonic-gate 	int i;
11447c478bd9Sstevel@tonic-gate 	boolean_t is_sock = B_FALSE;
11457c478bd9Sstevel@tonic-gate 	int maxblk = 0;
11467c478bd9Sstevel@tonic-gate 
11477c478bd9Sstevel@tonic-gate 	if (sfvcnt <= 0)
11487c478bd9Sstevel@tonic-gate 		return (set_errno(EINVAL));
11497c478bd9Sstevel@tonic-gate 
11507c478bd9Sstevel@tonic-gate 	if ((fp = getf(fildes)) == NULL)
11517c478bd9Sstevel@tonic-gate 		return (set_errno(EBADF));
11527c478bd9Sstevel@tonic-gate 
11537c478bd9Sstevel@tonic-gate 	if (((fp->f_flag) & FWRITE) == 0) {
11547c478bd9Sstevel@tonic-gate 		error = EBADF;
11557c478bd9Sstevel@tonic-gate 		goto err;
11567c478bd9Sstevel@tonic-gate 	}
11577c478bd9Sstevel@tonic-gate 
11587c478bd9Sstevel@tonic-gate 	fileoff = fp->f_offset;
11597c478bd9Sstevel@tonic-gate 	vp = fp->f_vnode;
11607c478bd9Sstevel@tonic-gate 
11617c478bd9Sstevel@tonic-gate 	switch (vp->v_type) {
11627c478bd9Sstevel@tonic-gate 	case VSOCK:
11637c478bd9Sstevel@tonic-gate 		so = VTOSO(vp);
11647c478bd9Sstevel@tonic-gate 		/* sendfile not supported for SCTP */
11657c478bd9Sstevel@tonic-gate 		if (so->so_protocol == IPPROTO_SCTP) {
11667c478bd9Sstevel@tonic-gate 			error = EPROTONOSUPPORT;
11677c478bd9Sstevel@tonic-gate 			goto err;
11687c478bd9Sstevel@tonic-gate 		}
11697c478bd9Sstevel@tonic-gate 		is_sock = B_TRUE;
11707c478bd9Sstevel@tonic-gate 		switch (so->so_family) {
11717c478bd9Sstevel@tonic-gate 		case AF_INET:
11727c478bd9Sstevel@tonic-gate 		case AF_INET6:
11737c478bd9Sstevel@tonic-gate 			/*
11747c478bd9Sstevel@tonic-gate 			 * Make similar checks done in SOP_WRITE().
11757c478bd9Sstevel@tonic-gate 			 */
11767c478bd9Sstevel@tonic-gate 			if (so->so_state & SS_CANTSENDMORE) {
11777c478bd9Sstevel@tonic-gate 				tsignal(curthread, SIGPIPE);
11787c478bd9Sstevel@tonic-gate 				error = EPIPE;
11797c478bd9Sstevel@tonic-gate 				goto err;
11807c478bd9Sstevel@tonic-gate 			}
11817c478bd9Sstevel@tonic-gate 			if (so->so_type != SOCK_STREAM) {
11827c478bd9Sstevel@tonic-gate 				error = EOPNOTSUPP;
11837c478bd9Sstevel@tonic-gate 				goto err;
11847c478bd9Sstevel@tonic-gate 			}
11857c478bd9Sstevel@tonic-gate 
11867c478bd9Sstevel@tonic-gate 			if ((so->so_state & (SS_ISCONNECTED|SS_ISBOUND)) !=
11877c478bd9Sstevel@tonic-gate 			    (SS_ISCONNECTED|SS_ISBOUND)) {
11887c478bd9Sstevel@tonic-gate 				error = ENOTCONN;
11897c478bd9Sstevel@tonic-gate 				goto err;
11907c478bd9Sstevel@tonic-gate 			}
11917c478bd9Sstevel@tonic-gate 
1192ff550d0eSmasputra 			if ((so->so_state & SS_DIRECT) &&
1193c28749e9Skais 			    (so->so_priv != NULL) &&
1194c28749e9Skais 			    (so->so_kssl_ctx == NULL)) {
11957c478bd9Sstevel@tonic-gate 				maxblk = ((tcp_t *)so->so_priv)->tcp_mss;
11967c478bd9Sstevel@tonic-gate 			} else {
11977c478bd9Sstevel@tonic-gate 				maxblk = (int)vp->v_stream->sd_maxblk;
11987c478bd9Sstevel@tonic-gate 			}
11997c478bd9Sstevel@tonic-gate 			break;
12007c478bd9Sstevel@tonic-gate 		default:
12017c478bd9Sstevel@tonic-gate 			error = EAFNOSUPPORT;
12027c478bd9Sstevel@tonic-gate 			goto err;
12037c478bd9Sstevel@tonic-gate 		}
12047c478bd9Sstevel@tonic-gate 		break;
12057c478bd9Sstevel@tonic-gate 	case VREG:
12067c478bd9Sstevel@tonic-gate 		break;
12077c478bd9Sstevel@tonic-gate 	default:
12087c478bd9Sstevel@tonic-gate 		error = EINVAL;
12097c478bd9Sstevel@tonic-gate 		goto err;
12107c478bd9Sstevel@tonic-gate 	}
12117c478bd9Sstevel@tonic-gate 
12127c478bd9Sstevel@tonic-gate 	switch (opcode) {
12137c478bd9Sstevel@tonic-gate 	case SENDFILEV :
12147c478bd9Sstevel@tonic-gate 		break;
12157c478bd9Sstevel@tonic-gate #if defined(_SYSCALL32_IMPL) || defined(_ILP32)
12167c478bd9Sstevel@tonic-gate 	case SENDFILEV64 :
12177c478bd9Sstevel@tonic-gate 		return (sendvec64(fp, (struct ksendfilevec64 *)vec, sfvcnt,
12187c478bd9Sstevel@tonic-gate 		    (size32_t *)xferred, fildes));
12197c478bd9Sstevel@tonic-gate #endif
12207c478bd9Sstevel@tonic-gate 	default :
12217c478bd9Sstevel@tonic-gate 		error = ENOSYS;
12227c478bd9Sstevel@tonic-gate 		break;
12237c478bd9Sstevel@tonic-gate 	}
12247c478bd9Sstevel@tonic-gate 
12257c478bd9Sstevel@tonic-gate 	(void) VOP_RWLOCK(vp, V_WRITELOCK_TRUE, NULL);
12267c478bd9Sstevel@tonic-gate 	copy_vec = vec;
12277c478bd9Sstevel@tonic-gate 
12287c478bd9Sstevel@tonic-gate 	do {
12290a8433caSrshoaib 		total_size = 0;
12307c478bd9Sstevel@tonic-gate 		copy_cnt = MIN(sfvcnt, SEND_MAX_CHUNK);
12317c478bd9Sstevel@tonic-gate #ifdef _SYSCALL32_IMPL
12327c478bd9Sstevel@tonic-gate 		/* 32-bit callers need to have their iovec expanded. */
12337c478bd9Sstevel@tonic-gate 		if (get_udatamodel() == DATAMODEL_ILP32) {
12347c478bd9Sstevel@tonic-gate 			if (copyin(copy_vec, sfv32,
12357c478bd9Sstevel@tonic-gate 			    copy_cnt * sizeof (ksendfilevec32_t))) {
12367c478bd9Sstevel@tonic-gate 				error = EFAULT;
12377c478bd9Sstevel@tonic-gate 				break;
12387c478bd9Sstevel@tonic-gate 			}
12397c478bd9Sstevel@tonic-gate 
12407c478bd9Sstevel@tonic-gate 			for (i = 0; i < copy_cnt; i++) {
12417c478bd9Sstevel@tonic-gate 				sfv[i].sfv_fd = sfv32[i].sfv_fd;
12427c478bd9Sstevel@tonic-gate 				sfv[i].sfv_off =
12437c478bd9Sstevel@tonic-gate 				    (off_t)(uint32_t)sfv32[i].sfv_off;
12447c478bd9Sstevel@tonic-gate 				sfv[i].sfv_len = (size_t)sfv32[i].sfv_len;
12457c478bd9Sstevel@tonic-gate 				total_size += sfv[i].sfv_len;
12467c478bd9Sstevel@tonic-gate 				sfv[i].sfv_flag = sfv32[i].sfv_flag;
1247311e3d4cSgeorges 				/*
1248311e3d4cSgeorges 				 * Individual elements of the vector must not
1249311e3d4cSgeorges 				 * wrap or overflow, as later math is signed.
1250311e3d4cSgeorges 				 * Equally total_size needs to be checked after
1251311e3d4cSgeorges 				 * each vector is added in, to be sure that
1252311e3d4cSgeorges 				 * rogue values haven't overflowed the counter.
1253311e3d4cSgeorges 				 */
1254311e3d4cSgeorges 				if (((ssize32_t)sfv[i].sfv_len < 0) ||
1255311e3d4cSgeorges 				    ((ssize32_t)total_size < 0)) {
1256311e3d4cSgeorges 					/*
1257311e3d4cSgeorges 					 * Truncate the vector to send data
1258311e3d4cSgeorges 					 * described by elements before the
1259311e3d4cSgeorges 					 * error.
1260311e3d4cSgeorges 					 */
1261311e3d4cSgeorges 					copy_cnt = i;
1262311e3d4cSgeorges 					first_vector_error = EINVAL;
1263311e3d4cSgeorges 					/* total_size can't be trusted */
1264311e3d4cSgeorges 					if ((ssize32_t)total_size < 0)
1265311e3d4cSgeorges 						error = EINVAL;
1266311e3d4cSgeorges 					break;
12677c478bd9Sstevel@tonic-gate 				}
1268311e3d4cSgeorges 			}
1269311e3d4cSgeorges 			/* Nothing to do, process errors */
1270311e3d4cSgeorges 			if (copy_cnt == 0)
1271311e3d4cSgeorges 				break;
1272311e3d4cSgeorges 
12737c478bd9Sstevel@tonic-gate 		} else {
12747c478bd9Sstevel@tonic-gate #endif
12757c478bd9Sstevel@tonic-gate 			if (copyin(copy_vec, sfv,
12767c478bd9Sstevel@tonic-gate 			    copy_cnt * sizeof (sendfilevec_t))) {
12777c478bd9Sstevel@tonic-gate 				error = EFAULT;
12787c478bd9Sstevel@tonic-gate 				break;
12797c478bd9Sstevel@tonic-gate 			}
12807c478bd9Sstevel@tonic-gate 
12817c478bd9Sstevel@tonic-gate 			for (i = 0; i < copy_cnt; i++) {
12827c478bd9Sstevel@tonic-gate 				total_size += sfv[i].sfv_len;
1283311e3d4cSgeorges 				/*
1284311e3d4cSgeorges 				 * Individual elements of the vector must not
1285311e3d4cSgeorges 				 * wrap or overflow, as later math is signed.
1286311e3d4cSgeorges 				 * Equally total_size needs to be checked after
1287311e3d4cSgeorges 				 * each vector is added in, to be sure that
1288311e3d4cSgeorges 				 * rogue values haven't overflowed the counter.
1289311e3d4cSgeorges 				 */
1290311e3d4cSgeorges 				if (((ssize_t)sfv[i].sfv_len < 0) ||
1291311e3d4cSgeorges 				    (total_size < 0)) {
1292311e3d4cSgeorges 					/*
1293311e3d4cSgeorges 					 * Truncate the vector to send data
1294311e3d4cSgeorges 					 * described by elements before the
1295311e3d4cSgeorges 					 * error.
1296311e3d4cSgeorges 					 */
1297311e3d4cSgeorges 					copy_cnt = i;
1298311e3d4cSgeorges 					first_vector_error = EINVAL;
1299311e3d4cSgeorges 					/* total_size can't be trusted */
1300311e3d4cSgeorges 					if (total_size < 0)
1301311e3d4cSgeorges 						error = EINVAL;
1302311e3d4cSgeorges 					break;
13037c478bd9Sstevel@tonic-gate 				}
1304311e3d4cSgeorges 			}
1305311e3d4cSgeorges 			/* Nothing to do, process errors */
1306311e3d4cSgeorges 			if (copy_cnt == 0)
1307311e3d4cSgeorges 				break;
13087c478bd9Sstevel@tonic-gate #ifdef _SYSCALL32_IMPL
13097c478bd9Sstevel@tonic-gate 		}
13107c478bd9Sstevel@tonic-gate #endif
13117c478bd9Sstevel@tonic-gate 
13127c478bd9Sstevel@tonic-gate 		/*
13137c478bd9Sstevel@tonic-gate 		 * The choice between using sendvec_small_chunk
13147c478bd9Sstevel@tonic-gate 		 * and sendvec_chunk is dependent on multiple things:
13157c478bd9Sstevel@tonic-gate 		 *
13167c478bd9Sstevel@tonic-gate 		 * i) latency is important for smaller files. So if the
13177c478bd9Sstevel@tonic-gate 		 * data is smaller than 'tcp_slow_start_initial' times
13187c478bd9Sstevel@tonic-gate 		 * maxblk, then use sendvec_small_chunk which creates
1319*3b3d24f3SJayakara Kini 		 * maxblk size mblks and chains them together and sends
13207c478bd9Sstevel@tonic-gate 		 * them to TCP in one shot. It also leaves 'wroff' size
13217c478bd9Sstevel@tonic-gate 		 * space for the headers in each mblk.
13227c478bd9Sstevel@tonic-gate 		 *
13237c478bd9Sstevel@tonic-gate 		 * ii) for total size bigger than 'tcp_slow_start_initial'
13247c478bd9Sstevel@tonic-gate 		 * times maxblk, it's probably real file data which is
13257c478bd9Sstevel@tonic-gate 		 * dominating. So it's better to use sendvec_chunk because
13267c478bd9Sstevel@tonic-gate 		 * performance goes to the dogs if we don't do pagesize reads.
13277c478bd9Sstevel@tonic-gate 		 * sendvec_chunk will do pagesize reads and write them
13287c478bd9Sstevel@tonic-gate 		 * in pagesize mblks to TCP.
13297c478bd9Sstevel@tonic-gate 		 *
13307c478bd9Sstevel@tonic-gate 		 * Side Notes: A write to file has not been optimized.
13317c478bd9Sstevel@tonic-gate 		 * Future zero copy code will plug into sendvec_chunk
13327c478bd9Sstevel@tonic-gate 		 * only because doing zero copy for files smaller than
13337c478bd9Sstevel@tonic-gate 		 * pagesize is useless.
13347c478bd9Sstevel@tonic-gate 		 *
13357c478bd9Sstevel@tonic-gate 		 * Note, if socket has NL7C enabled then call NL7C's
13362c9e429eSbrutus 		 * sendfilev() function to consume the sfv[].
13377c478bd9Sstevel@tonic-gate 		 */
13387c478bd9Sstevel@tonic-gate 		if (is_sock) {
13397c478bd9Sstevel@tonic-gate 			switch (so->so_family) {
13407c478bd9Sstevel@tonic-gate 			case AF_INET:
13417c478bd9Sstevel@tonic-gate 			case AF_INET6:
13422c9e429eSbrutus 				if (so->so_nl7c_flags != 0)
13432c9e429eSbrutus 					error = nl7c_sendfilev(so, &fileoff,
13442c9e429eSbrutus 					    sfv, copy_cnt, &count);
1345311e3d4cSgeorges 				else if ((total_size <= (4 * maxblk)) &&
1346311e3d4cSgeorges 				    error == 0)
13477c478bd9Sstevel@tonic-gate 					error = sendvec_small_chunk(fp,
13487c478bd9Sstevel@tonic-gate 					    &fileoff, sfv, copy_cnt,
13497c478bd9Sstevel@tonic-gate 					    total_size, maxblk, &count);
13507c478bd9Sstevel@tonic-gate 				else
13517c478bd9Sstevel@tonic-gate 					error = sendvec_chunk(fp, &fileoff,
13527c478bd9Sstevel@tonic-gate 					    sfv, copy_cnt, &count);
13537c478bd9Sstevel@tonic-gate 				break;
13547c478bd9Sstevel@tonic-gate 			}
13557c478bd9Sstevel@tonic-gate 		} else {
13567c478bd9Sstevel@tonic-gate 			ASSERT(vp->v_type == VREG);
13577c478bd9Sstevel@tonic-gate 			error = sendvec_chunk(fp, &fileoff, sfv, copy_cnt,
13587c478bd9Sstevel@tonic-gate 			    &count);
13597c478bd9Sstevel@tonic-gate 		}
13607c478bd9Sstevel@tonic-gate 
13617c478bd9Sstevel@tonic-gate 
13627c478bd9Sstevel@tonic-gate #ifdef _SYSCALL32_IMPL
13637c478bd9Sstevel@tonic-gate 	if (get_udatamodel() == DATAMODEL_ILP32)
13647c478bd9Sstevel@tonic-gate 		copy_vec = (const struct sendfilevec *)((char *)copy_vec +
13657c478bd9Sstevel@tonic-gate 		    (copy_cnt * sizeof (ksendfilevec32_t)));
13667c478bd9Sstevel@tonic-gate 	else
13677c478bd9Sstevel@tonic-gate #endif
13687c478bd9Sstevel@tonic-gate 		copy_vec += copy_cnt;
13697c478bd9Sstevel@tonic-gate 		sfvcnt -= copy_cnt;
1370311e3d4cSgeorges 
1371311e3d4cSgeorges 	/* Process all vector members up to first error */
1372311e3d4cSgeorges 	} while ((sfvcnt > 0) && first_vector_error == 0 && error == 0);
13737c478bd9Sstevel@tonic-gate 
13747c478bd9Sstevel@tonic-gate 	if (vp->v_type == VREG)
13757c478bd9Sstevel@tonic-gate 		fp->f_offset += count;
13767c478bd9Sstevel@tonic-gate 
13777c478bd9Sstevel@tonic-gate 	VOP_RWUNLOCK(vp, V_WRITELOCK_TRUE, NULL);
13787c478bd9Sstevel@tonic-gate 
13797c478bd9Sstevel@tonic-gate #ifdef _SYSCALL32_IMPL
13807c478bd9Sstevel@tonic-gate 	if (get_udatamodel() == DATAMODEL_ILP32) {
13817c478bd9Sstevel@tonic-gate 		ssize32_t count32 = (ssize32_t)count;
13827c478bd9Sstevel@tonic-gate 		if (copyout(&count32, xferred, sizeof (count32)))
13837c478bd9Sstevel@tonic-gate 			error = EFAULT;
13847c478bd9Sstevel@tonic-gate 		releasef(fildes);
13857c478bd9Sstevel@tonic-gate 		if (error != 0)
13867c478bd9Sstevel@tonic-gate 			return (set_errno(error));
1387311e3d4cSgeorges 		if (first_vector_error != 0)
1388311e3d4cSgeorges 			return (set_errno(first_vector_error));
13897c478bd9Sstevel@tonic-gate 		return (count32);
13907c478bd9Sstevel@tonic-gate 	}
13917c478bd9Sstevel@tonic-gate #endif
13927c478bd9Sstevel@tonic-gate 	if (copyout(&count, xferred, sizeof (count)))
13937c478bd9Sstevel@tonic-gate 		error = EFAULT;
13947c478bd9Sstevel@tonic-gate 	releasef(fildes);
13957c478bd9Sstevel@tonic-gate 	if (error != 0)
13967c478bd9Sstevel@tonic-gate 		return (set_errno(error));
1397311e3d4cSgeorges 	if (first_vector_error != 0)
1398311e3d4cSgeorges 		return (set_errno(first_vector_error));
13997c478bd9Sstevel@tonic-gate 	return (count);
14007c478bd9Sstevel@tonic-gate err:
14017c478bd9Sstevel@tonic-gate 	ASSERT(error != 0);
14027c478bd9Sstevel@tonic-gate 	releasef(fildes);
14037c478bd9Sstevel@tonic-gate 	return (set_errno(error));
14047c478bd9Sstevel@tonic-gate }
1405