xref: /titanic_50/usr/src/uts/common/rpc/rpcmod.c (revision 07e751310052c13869cb1cb2013faf5da656f9f8)
17c478bd9Sstevel@tonic-gate /*
27c478bd9Sstevel@tonic-gate  * CDDL HEADER START
37c478bd9Sstevel@tonic-gate  *
47c478bd9Sstevel@tonic-gate  * The contents of this file are subject to the terms of the
5a26eed27Sgt29601  * Common Development and Distribution License (the "License").
6a26eed27Sgt29601  * You may not use this file except in compliance with the License.
77c478bd9Sstevel@tonic-gate  *
87c478bd9Sstevel@tonic-gate  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
97c478bd9Sstevel@tonic-gate  * or http://www.opensolaris.org/os/licensing.
107c478bd9Sstevel@tonic-gate  * See the License for the specific language governing permissions
117c478bd9Sstevel@tonic-gate  * and limitations under the License.
127c478bd9Sstevel@tonic-gate  *
137c478bd9Sstevel@tonic-gate  * When distributing Covered Code, include this CDDL HEADER in each
147c478bd9Sstevel@tonic-gate  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
157c478bd9Sstevel@tonic-gate  * If applicable, add the following below this CDDL HEADER, with the
167c478bd9Sstevel@tonic-gate  * fields enclosed by brackets "[]" replaced with your own identifying
177c478bd9Sstevel@tonic-gate  * information: Portions Copyright [yyyy] [name of copyright owner]
187c478bd9Sstevel@tonic-gate  *
197c478bd9Sstevel@tonic-gate  * CDDL HEADER END
207c478bd9Sstevel@tonic-gate  */
217c478bd9Sstevel@tonic-gate /*
22fcfe7086Sgeorges  * Copyright 2007 Sun Microsystems, Inc.  All rights reserved.
237c478bd9Sstevel@tonic-gate  * Use is subject to license terms.
247c478bd9Sstevel@tonic-gate  */
257c478bd9Sstevel@tonic-gate /* Copyright (c) 1990 Mentat Inc. */
267c478bd9Sstevel@tonic-gate 
277c478bd9Sstevel@tonic-gate /*	Copyright (c) 1984, 1986, 1987, 1988, 1989 AT&T	*/
287c478bd9Sstevel@tonic-gate /*	  All Rights Reserved  	*/
297c478bd9Sstevel@tonic-gate 
307c478bd9Sstevel@tonic-gate #pragma ident	"%Z%%M%	%I%	%E% SMI"
317c478bd9Sstevel@tonic-gate 
327c478bd9Sstevel@tonic-gate /*
337c478bd9Sstevel@tonic-gate  * Kernel RPC filtering module
347c478bd9Sstevel@tonic-gate  */
357c478bd9Sstevel@tonic-gate 
367c478bd9Sstevel@tonic-gate #include <sys/param.h>
377c478bd9Sstevel@tonic-gate #include <sys/types.h>
387c478bd9Sstevel@tonic-gate #include <sys/stream.h>
397c478bd9Sstevel@tonic-gate #include <sys/stropts.h>
407c478bd9Sstevel@tonic-gate #include <sys/tihdr.h>
417c478bd9Sstevel@tonic-gate #include <sys/timod.h>
427c478bd9Sstevel@tonic-gate #include <sys/tiuser.h>
437c478bd9Sstevel@tonic-gate #include <sys/debug.h>
447c478bd9Sstevel@tonic-gate #include <sys/signal.h>
457c478bd9Sstevel@tonic-gate #include <sys/pcb.h>
467c478bd9Sstevel@tonic-gate #include <sys/user.h>
477c478bd9Sstevel@tonic-gate #include <sys/errno.h>
487c478bd9Sstevel@tonic-gate #include <sys/cred.h>
497c478bd9Sstevel@tonic-gate #include <sys/policy.h>
507c478bd9Sstevel@tonic-gate #include <sys/inline.h>
517c478bd9Sstevel@tonic-gate #include <sys/cmn_err.h>
527c478bd9Sstevel@tonic-gate #include <sys/kmem.h>
537c478bd9Sstevel@tonic-gate #include <sys/file.h>
547c478bd9Sstevel@tonic-gate #include <sys/sysmacros.h>
557c478bd9Sstevel@tonic-gate #include <sys/systm.h>
567c478bd9Sstevel@tonic-gate #include <sys/t_lock.h>
577c478bd9Sstevel@tonic-gate #include <sys/ddi.h>
587c478bd9Sstevel@tonic-gate #include <sys/vtrace.h>
597c478bd9Sstevel@tonic-gate #include <sys/callb.h>
607c478bd9Sstevel@tonic-gate 
617c478bd9Sstevel@tonic-gate #include <sys/strlog.h>
627c478bd9Sstevel@tonic-gate #include <rpc/rpc_com.h>
637c478bd9Sstevel@tonic-gate #include <inet/common.h>
647c478bd9Sstevel@tonic-gate #include <rpc/types.h>
657c478bd9Sstevel@tonic-gate #include <sys/time.h>
667c478bd9Sstevel@tonic-gate #include <rpc/xdr.h>
677c478bd9Sstevel@tonic-gate #include <rpc/auth.h>
687c478bd9Sstevel@tonic-gate #include <rpc/clnt.h>
697c478bd9Sstevel@tonic-gate #include <rpc/rpc_msg.h>
707c478bd9Sstevel@tonic-gate #include <rpc/clnt.h>
717c478bd9Sstevel@tonic-gate #include <rpc/svc.h>
727c478bd9Sstevel@tonic-gate #include <rpc/rpcsys.h>
737c478bd9Sstevel@tonic-gate #include <rpc/rpc_rdma.h>
747c478bd9Sstevel@tonic-gate 
757c478bd9Sstevel@tonic-gate /*
767c478bd9Sstevel@tonic-gate  * This is the loadable module wrapper.
777c478bd9Sstevel@tonic-gate  */
787c478bd9Sstevel@tonic-gate #include <sys/conf.h>
797c478bd9Sstevel@tonic-gate #include <sys/modctl.h>
807c478bd9Sstevel@tonic-gate #include <sys/syscall.h>
817c478bd9Sstevel@tonic-gate 
827c478bd9Sstevel@tonic-gate extern struct streamtab rpcinfo;
837c478bd9Sstevel@tonic-gate 
847c478bd9Sstevel@tonic-gate static struct fmodsw fsw = {
857c478bd9Sstevel@tonic-gate 	"rpcmod",
867c478bd9Sstevel@tonic-gate 	&rpcinfo,
877c478bd9Sstevel@tonic-gate 	D_NEW|D_MP,
887c478bd9Sstevel@tonic-gate };
897c478bd9Sstevel@tonic-gate 
907c478bd9Sstevel@tonic-gate /*
917c478bd9Sstevel@tonic-gate  * Module linkage information for the kernel.
927c478bd9Sstevel@tonic-gate  */
937c478bd9Sstevel@tonic-gate 
947c478bd9Sstevel@tonic-gate static struct modlstrmod modlstrmod = {
957c478bd9Sstevel@tonic-gate 	&mod_strmodops, "rpc interface str mod", &fsw
967c478bd9Sstevel@tonic-gate };
977c478bd9Sstevel@tonic-gate 
987c478bd9Sstevel@tonic-gate /*
997c478bd9Sstevel@tonic-gate  * For the RPC system call.
1007c478bd9Sstevel@tonic-gate  */
1017c478bd9Sstevel@tonic-gate static struct sysent rpcsysent = {
1027c478bd9Sstevel@tonic-gate 	2,
1037c478bd9Sstevel@tonic-gate 	SE_32RVAL1 | SE_ARGC | SE_NOUNLOAD,
1047c478bd9Sstevel@tonic-gate 	rpcsys
1057c478bd9Sstevel@tonic-gate };
1067c478bd9Sstevel@tonic-gate 
1077c478bd9Sstevel@tonic-gate static struct modlsys modlsys = {
1087c478bd9Sstevel@tonic-gate 	&mod_syscallops,
1097c478bd9Sstevel@tonic-gate 	"RPC syscall",
1107c478bd9Sstevel@tonic-gate 	&rpcsysent
1117c478bd9Sstevel@tonic-gate };
1127c478bd9Sstevel@tonic-gate 
#ifdef _SYSCALL32_IMPL
/*
 * Linkage element for the 32-bit flavour of the RPC system call; it
 * shares rpcsysent with the native entry.
 */
static struct modlsys modlsys32 = {
	&mod_syscallops32,	/* 32-bit syscall module ops */
	"32-bit RPC syscall",	/* description string */
	&rpcsysent		/* same sysent entry as modlsys */
};
#endif /* _SYSCALL32_IMPL */
1207c478bd9Sstevel@tonic-gate 
1217c478bd9Sstevel@tonic-gate static struct modlinkage modlinkage = {
1227c478bd9Sstevel@tonic-gate 	MODREV_1,
1237c478bd9Sstevel@tonic-gate 	{
1247c478bd9Sstevel@tonic-gate 		&modlsys,
1257c478bd9Sstevel@tonic-gate #ifdef _SYSCALL32_IMPL
1267c478bd9Sstevel@tonic-gate 		&modlsys32,
1277c478bd9Sstevel@tonic-gate #endif
1287c478bd9Sstevel@tonic-gate 		&modlstrmod,
1297c478bd9Sstevel@tonic-gate 		NULL
1307c478bd9Sstevel@tonic-gate 	}
1317c478bd9Sstevel@tonic-gate };
1327c478bd9Sstevel@tonic-gate 
1337c478bd9Sstevel@tonic-gate int
1347c478bd9Sstevel@tonic-gate _init(void)
1357c478bd9Sstevel@tonic-gate {
1367c478bd9Sstevel@tonic-gate 	int error = 0;
1377c478bd9Sstevel@tonic-gate 	callb_id_t cid;
1387c478bd9Sstevel@tonic-gate 	int status;
1397c478bd9Sstevel@tonic-gate 
1407c478bd9Sstevel@tonic-gate 	svc_init();
1417c478bd9Sstevel@tonic-gate 	clnt_init();
1427c478bd9Sstevel@tonic-gate 	cid = callb_add(connmgr_cpr_reset, 0, CB_CL_CPR_RPC, "rpc");
1437c478bd9Sstevel@tonic-gate 
1447c478bd9Sstevel@tonic-gate 	if (error = mod_install(&modlinkage)) {
1457c478bd9Sstevel@tonic-gate 		/*
1467c478bd9Sstevel@tonic-gate 		 * Could not install module, cleanup previous
1477c478bd9Sstevel@tonic-gate 		 * initialization work.
1487c478bd9Sstevel@tonic-gate 		 */
1497c478bd9Sstevel@tonic-gate 		clnt_fini();
1507c478bd9Sstevel@tonic-gate 		if (cid != NULL)
1517c478bd9Sstevel@tonic-gate 			(void) callb_delete(cid);
1527c478bd9Sstevel@tonic-gate 
1537c478bd9Sstevel@tonic-gate 		return (error);
1547c478bd9Sstevel@tonic-gate 	}
1557c478bd9Sstevel@tonic-gate 
1567c478bd9Sstevel@tonic-gate 	/*
1577c478bd9Sstevel@tonic-gate 	 * Load up the RDMA plugins and initialize the stats. Even if the
1587c478bd9Sstevel@tonic-gate 	 * plugins loadup fails, but rpcmod was successfully installed the
1597c478bd9Sstevel@tonic-gate 	 * counters still get initialized.
1607c478bd9Sstevel@tonic-gate 	 */
1617c478bd9Sstevel@tonic-gate 	rw_init(&rdma_lock, NULL, RW_DEFAULT, NULL);
1627c478bd9Sstevel@tonic-gate 	mutex_init(&rdma_modload_lock, NULL, MUTEX_DEFAULT, NULL);
1637c478bd9Sstevel@tonic-gate 	mt_kstat_init();
1647c478bd9Sstevel@tonic-gate 
1657c478bd9Sstevel@tonic-gate 	/*
1667c478bd9Sstevel@tonic-gate 	 * Get our identification into ldi.  This is used for loading
1677c478bd9Sstevel@tonic-gate 	 * other modules, e.g. rpcib.
1687c478bd9Sstevel@tonic-gate 	 */
1697c478bd9Sstevel@tonic-gate 	status = ldi_ident_from_mod(&modlinkage, &rpcmod_li);
1707c478bd9Sstevel@tonic-gate 	if (status != 0) {
1717c478bd9Sstevel@tonic-gate 		cmn_err(CE_WARN, "ldi_ident_from_mod fails with %d", status);
1727c478bd9Sstevel@tonic-gate 		rpcmod_li = NULL;
1737c478bd9Sstevel@tonic-gate 	}
1747c478bd9Sstevel@tonic-gate 
1757c478bd9Sstevel@tonic-gate 	return (error);
1767c478bd9Sstevel@tonic-gate }
1777c478bd9Sstevel@tonic-gate 
/*
 * _fini - module unload entry point.
 *
 * Unloading is always refused with EBUSY: the rest of kRPC is handed
 * entry points that live inside rpcmod (rpcmod_release()), so the module
 * text has to stay resident.
 */
int
_fini(void)
{
	return (EBUSY);
}
1877c478bd9Sstevel@tonic-gate 
1887c478bd9Sstevel@tonic-gate int
1897c478bd9Sstevel@tonic-gate _info(struct modinfo *modinfop)
1907c478bd9Sstevel@tonic-gate {
1917c478bd9Sstevel@tonic-gate 	return (mod_info(&modlinkage, modinfop));
1927c478bd9Sstevel@tonic-gate }
1937c478bd9Sstevel@tonic-gate 
1947c478bd9Sstevel@tonic-gate extern int nulldev();
1957c478bd9Sstevel@tonic-gate 
1967c478bd9Sstevel@tonic-gate #define	RPCMOD_ID	2049
1977c478bd9Sstevel@tonic-gate 
1987c478bd9Sstevel@tonic-gate int rmm_open(), rmm_close();
1997c478bd9Sstevel@tonic-gate 
2007c478bd9Sstevel@tonic-gate /*
2017c478bd9Sstevel@tonic-gate  * To save instructions, since STREAMS ignores the return value
2027c478bd9Sstevel@tonic-gate  * from these functions, they are defined as void here. Kind of icky, but...
2037c478bd9Sstevel@tonic-gate  */
2047c478bd9Sstevel@tonic-gate void rmm_rput(queue_t *, mblk_t *);
2057c478bd9Sstevel@tonic-gate void rmm_wput(queue_t *, mblk_t *);
2067c478bd9Sstevel@tonic-gate void rmm_rsrv(queue_t *);
2077c478bd9Sstevel@tonic-gate void rmm_wsrv(queue_t *);
2087c478bd9Sstevel@tonic-gate 
2097c478bd9Sstevel@tonic-gate int rpcmodopen(), rpcmodclose();
2107c478bd9Sstevel@tonic-gate void rpcmodrput(), rpcmodwput();
2117c478bd9Sstevel@tonic-gate void rpcmodrsrv(), rpcmodwsrv();
2127c478bd9Sstevel@tonic-gate 
2137c478bd9Sstevel@tonic-gate static	void	rpcmodwput_other(queue_t *, mblk_t *);
2147c478bd9Sstevel@tonic-gate static	int	mir_close(queue_t *q);
2157c478bd9Sstevel@tonic-gate static	int	mir_open(queue_t *q, dev_t *devp, int flag, int sflag,
2167c478bd9Sstevel@tonic-gate 		    cred_t *credp);
2177c478bd9Sstevel@tonic-gate static	void	mir_rput(queue_t *q, mblk_t *mp);
2187c478bd9Sstevel@tonic-gate static	void	mir_rsrv(queue_t *q);
2197c478bd9Sstevel@tonic-gate static	void	mir_wput(queue_t *q, mblk_t *mp);
2207c478bd9Sstevel@tonic-gate static	void	mir_wsrv(queue_t *q);
2217c478bd9Sstevel@tonic-gate 
2227c478bd9Sstevel@tonic-gate static struct module_info rpcmod_info =
2237c478bd9Sstevel@tonic-gate 	{RPCMOD_ID, "rpcmod", 0, INFPSZ, 256*1024, 1024};
2247c478bd9Sstevel@tonic-gate 
2257c478bd9Sstevel@tonic-gate /*
2267c478bd9Sstevel@tonic-gate  * Read side has no service procedure.
2277c478bd9Sstevel@tonic-gate  */
2287c478bd9Sstevel@tonic-gate static struct qinit rpcmodrinit = {
2297c478bd9Sstevel@tonic-gate 	(int (*)())rmm_rput,
2307c478bd9Sstevel@tonic-gate 	(int (*)())rmm_rsrv,
2317c478bd9Sstevel@tonic-gate 	rmm_open,
2327c478bd9Sstevel@tonic-gate 	rmm_close,
2337c478bd9Sstevel@tonic-gate 	nulldev,
2347c478bd9Sstevel@tonic-gate 	&rpcmod_info,
2357c478bd9Sstevel@tonic-gate 	NULL
2367c478bd9Sstevel@tonic-gate };
2377c478bd9Sstevel@tonic-gate 
2387c478bd9Sstevel@tonic-gate /*
2397c478bd9Sstevel@tonic-gate  * The write put procedure is simply putnext to conserve stack space.
2407c478bd9Sstevel@tonic-gate  * The write service procedure is not used to queue data, but instead to
2417c478bd9Sstevel@tonic-gate  * synchronize with flow control.
2427c478bd9Sstevel@tonic-gate  */
2437c478bd9Sstevel@tonic-gate static struct qinit rpcmodwinit = {
2447c478bd9Sstevel@tonic-gate 	(int (*)())rmm_wput,
2457c478bd9Sstevel@tonic-gate 	(int (*)())rmm_wsrv,
2467c478bd9Sstevel@tonic-gate 	rmm_open,
2477c478bd9Sstevel@tonic-gate 	rmm_close,
2487c478bd9Sstevel@tonic-gate 	nulldev,
2497c478bd9Sstevel@tonic-gate 	&rpcmod_info,
2507c478bd9Sstevel@tonic-gate 	NULL
2517c478bd9Sstevel@tonic-gate };
2527c478bd9Sstevel@tonic-gate struct streamtab rpcinfo = { &rpcmodrinit, &rpcmodwinit, NULL, NULL };
2537c478bd9Sstevel@tonic-gate 
/*
 * Per-transport-style operations vector.  The rmm_* entry points look
 * this up through q->q_ptr and forward to the matching member.
 */
struct xprt_style_ops {
	int (*xo_open)();	/* open routine */
	int (*xo_close)();	/* close routine */
	void (*xo_wput)();	/* write-side put */
	void (*xo_wsrv)();	/* write-side service */
	void (*xo_rput)();	/* read-side put */
	void (*xo_rsrv)();	/* read-side service */
};
2627c478bd9Sstevel@tonic-gate 
2637c478bd9Sstevel@tonic-gate static struct xprt_style_ops xprt_clts_ops = {
2647c478bd9Sstevel@tonic-gate 	rpcmodopen,
2657c478bd9Sstevel@tonic-gate 	rpcmodclose,
2667c478bd9Sstevel@tonic-gate 	rpcmodwput,
2677c478bd9Sstevel@tonic-gate 	rpcmodwsrv,
2687c478bd9Sstevel@tonic-gate 	rpcmodrput,
2697c478bd9Sstevel@tonic-gate 	NULL
2707c478bd9Sstevel@tonic-gate };
2717c478bd9Sstevel@tonic-gate 
2727c478bd9Sstevel@tonic-gate static struct xprt_style_ops xprt_cots_ops = {
2737c478bd9Sstevel@tonic-gate 	mir_open,
2747c478bd9Sstevel@tonic-gate 	mir_close,
2757c478bd9Sstevel@tonic-gate 	mir_wput,
2767c478bd9Sstevel@tonic-gate 	mir_wsrv,
2777c478bd9Sstevel@tonic-gate 	mir_rput,
2787c478bd9Sstevel@tonic-gate 	mir_rsrv
2797c478bd9Sstevel@tonic-gate };
2807c478bd9Sstevel@tonic-gate 
2817c478bd9Sstevel@tonic-gate /*
2827c478bd9Sstevel@tonic-gate  * Per rpcmod "slot" data structure. q->q_ptr points to one of these.
2837c478bd9Sstevel@tonic-gate  */
2847c478bd9Sstevel@tonic-gate struct rpcm {
2857c478bd9Sstevel@tonic-gate 	void		*rm_krpc_cell;	/* Reserved for use by KRPC */
2867c478bd9Sstevel@tonic-gate 	struct		xprt_style_ops	*rm_ops;
2877c478bd9Sstevel@tonic-gate 	int		rm_type;	/* Client or server side stream */
2887c478bd9Sstevel@tonic-gate #define	RM_CLOSING	0x1		/* somebody is trying to close slot */
2897c478bd9Sstevel@tonic-gate 	uint_t		rm_state;	/* state of the slot. see above */
2907c478bd9Sstevel@tonic-gate 	uint_t		rm_ref;		/* cnt of external references to slot */
2917c478bd9Sstevel@tonic-gate 	kmutex_t	rm_lock;	/* mutex protecting above fields */
2927c478bd9Sstevel@tonic-gate 	kcondvar_t	rm_cwait;	/* condition for closing */
2937c478bd9Sstevel@tonic-gate 	zoneid_t	rm_zoneid;	/* zone which pushed rpcmod */
2947c478bd9Sstevel@tonic-gate };
2957c478bd9Sstevel@tonic-gate 
2967c478bd9Sstevel@tonic-gate struct temp_slot {
2977c478bd9Sstevel@tonic-gate 	void *cell;
2987c478bd9Sstevel@tonic-gate 	struct xprt_style_ops *ops;
2997c478bd9Sstevel@tonic-gate 	int type;
3007c478bd9Sstevel@tonic-gate 	mblk_t *info_ack;
3017c478bd9Sstevel@tonic-gate 	kmutex_t lock;
3027c478bd9Sstevel@tonic-gate 	kcondvar_t wait;
3037c478bd9Sstevel@tonic-gate };
3047c478bd9Sstevel@tonic-gate 
305fcfe7086Sgeorges typedef struct mir_s {
306fcfe7086Sgeorges 	void	*mir_krpc_cell;	/* Reserved for KRPC use. This field */
307fcfe7086Sgeorges 					/* must be first in the structure. */
308fcfe7086Sgeorges 	struct xprt_style_ops	*rm_ops;
309fcfe7086Sgeorges 	int	mir_type;		/* Client or server side stream */
310fcfe7086Sgeorges 
311fcfe7086Sgeorges 	mblk_t	*mir_head_mp;		/* RPC msg in progress */
312fcfe7086Sgeorges 		/*
313fcfe7086Sgeorges 		 * mir_head_mp points the first mblk being collected in
314fcfe7086Sgeorges 		 * the current RPC message.  Record headers are removed
315fcfe7086Sgeorges 		 * before data is linked into mir_head_mp.
316fcfe7086Sgeorges 		 */
317fcfe7086Sgeorges 	mblk_t	*mir_tail_mp;		/* Last mblk in mir_head_mp */
318fcfe7086Sgeorges 		/*
319fcfe7086Sgeorges 		 * mir_tail_mp points to the last mblk in the message
320fcfe7086Sgeorges 		 * chain starting at mir_head_mp.  It is only valid
321fcfe7086Sgeorges 		 * if mir_head_mp is non-NULL and is used to add new
322fcfe7086Sgeorges 		 * data blocks to the end of chain quickly.
323fcfe7086Sgeorges 		 */
324fcfe7086Sgeorges 
325fcfe7086Sgeorges 	int32_t	mir_frag_len;		/* Bytes seen in the current frag */
326fcfe7086Sgeorges 		/*
327fcfe7086Sgeorges 		 * mir_frag_len starts at -4 for beginning of each fragment.
328fcfe7086Sgeorges 		 * When this length is negative, it indicates the number of
329fcfe7086Sgeorges 		 * bytes that rpcmod needs to complete the record marker
330fcfe7086Sgeorges 		 * header.  When it is positive or zero, it holds the number
331fcfe7086Sgeorges 		 * of bytes that have arrived for the current fragment and
332fcfe7086Sgeorges 		 * are held in mir_header_mp.
333fcfe7086Sgeorges 		 */
334fcfe7086Sgeorges 
335fcfe7086Sgeorges 	int32_t	mir_frag_header;
336fcfe7086Sgeorges 		/*
337fcfe7086Sgeorges 		 * Fragment header as collected for the current fragment.
338fcfe7086Sgeorges 		 * It holds the last-fragment indicator and the number
339fcfe7086Sgeorges 		 * of bytes in the fragment.
340fcfe7086Sgeorges 		 */
341fcfe7086Sgeorges 
342fcfe7086Sgeorges 	unsigned int
343fcfe7086Sgeorges 		mir_ordrel_pending : 1,	/* Sent T_ORDREL_REQ */
344fcfe7086Sgeorges 		mir_hold_inbound : 1,	/* Hold inbound messages on server */
345fcfe7086Sgeorges 					/* side until outbound flow control */
346fcfe7086Sgeorges 					/* is relieved. */
347fcfe7086Sgeorges 		mir_closing : 1,	/* The stream is being closed */
348fcfe7086Sgeorges 		mir_inrservice : 1,	/* data queued or rd srv proc running */
349fcfe7086Sgeorges 		mir_inwservice : 1,	/* data queued or wr srv proc running */
350fcfe7086Sgeorges 		mir_inwflushdata : 1,	/* flush M_DATAs when srv runs */
351fcfe7086Sgeorges 		/*
352fcfe7086Sgeorges 		 * On client streams, mir_clntreq is 0 or 1; it is set
353fcfe7086Sgeorges 		 * to 1 whenever a new request is sent out (mir_wput)
354fcfe7086Sgeorges 		 * and cleared when the timer fires (mir_timer).  If
355fcfe7086Sgeorges 		 * the timer fires with this value equal to 0, then the
356fcfe7086Sgeorges 		 * stream is considered idle and KRPC is notified.
357fcfe7086Sgeorges 		 */
358fcfe7086Sgeorges 		mir_clntreq : 1,
359fcfe7086Sgeorges 		/*
360fcfe7086Sgeorges 		 * On server streams, stop accepting messages
361fcfe7086Sgeorges 		 */
362fcfe7086Sgeorges 		mir_svc_no_more_msgs : 1,
363fcfe7086Sgeorges 		mir_listen_stream : 1,	/* listen end point */
364fcfe7086Sgeorges 		mir_unused : 1,	/* no longer used */
365fcfe7086Sgeorges 		mir_timer_call : 1,
366fcfe7086Sgeorges 		mir_junk_fill_thru_bit_31 : 21;
367fcfe7086Sgeorges 
368fcfe7086Sgeorges 	int	mir_setup_complete;	/* server has initialized everything */
369fcfe7086Sgeorges 	timeout_id_t mir_timer_id;	/* Timer for idle checks */
370fcfe7086Sgeorges 	clock_t	mir_idle_timeout;	/* Allowed idle time before shutdown */
371fcfe7086Sgeorges 		/*
372fcfe7086Sgeorges 		 * This value is copied from clnt_idle_timeout or
373fcfe7086Sgeorges 		 * svc_idle_timeout during the appropriate ioctl.
374fcfe7086Sgeorges 		 * Kept in milliseconds
375fcfe7086Sgeorges 		 */
376fcfe7086Sgeorges 	clock_t	mir_use_timestamp;	/* updated on client with each use */
377fcfe7086Sgeorges 		/*
378fcfe7086Sgeorges 		 * This value is set to lbolt
379fcfe7086Sgeorges 		 * every time a client stream sends or receives data.
380fcfe7086Sgeorges 		 * Even if the timer message arrives, we don't shutdown
381fcfe7086Sgeorges 		 * client unless:
382fcfe7086Sgeorges 		 *    lbolt >= MSEC_TO_TICK(mir_idle_timeout)+mir_use_timestamp.
383fcfe7086Sgeorges 		 * This value is kept in HZ.
384fcfe7086Sgeorges 		 */
385fcfe7086Sgeorges 
386fcfe7086Sgeorges 	uint_t	*mir_max_msg_sizep;	/* Reference to sanity check size */
387fcfe7086Sgeorges 		/*
388fcfe7086Sgeorges 		 * This pointer is set to &clnt_max_msg_size or
389fcfe7086Sgeorges 		 * &svc_max_msg_size during the appropriate ioctl.
390fcfe7086Sgeorges 		 */
391fcfe7086Sgeorges 	zoneid_t mir_zoneid;	/* zone which pushed rpcmod */
392fcfe7086Sgeorges 	/* Server-side fields. */
393fcfe7086Sgeorges 	int	mir_ref_cnt;		/* Reference count: server side only */
394fcfe7086Sgeorges 					/* counts the number of references */
395fcfe7086Sgeorges 					/* that a kernel RPC server thread */
396fcfe7086Sgeorges 					/* (see svc_run()) has on this rpcmod */
397fcfe7086Sgeorges 					/* slot. Effectively, it is the */
398fcfe7086Sgeorges 					/* number * of unprocessed messages */
399fcfe7086Sgeorges 					/* that have been passed up to the */
400fcfe7086Sgeorges 					/* KRPC layer */
401fcfe7086Sgeorges 
402fcfe7086Sgeorges 	mblk_t	*mir_svc_pend_mp;	/* Pending T_ORDREL_IND or */
403fcfe7086Sgeorges 					/* T_DISCON_IND */
404fcfe7086Sgeorges 
405fcfe7086Sgeorges 	/*
406fcfe7086Sgeorges 	 * these fields are for both client and server, but for debugging,
407fcfe7086Sgeorges 	 * it is easier to have these last in the structure.
408fcfe7086Sgeorges 	 */
409fcfe7086Sgeorges 	kmutex_t	mir_mutex;	/* Mutex and condvar for close */
410fcfe7086Sgeorges 	kcondvar_t	mir_condvar;	/* synchronization. */
411fcfe7086Sgeorges 	kcondvar_t	mir_timer_cv;	/* Timer routine sync. */
412fcfe7086Sgeorges } mir_t;
413fcfe7086Sgeorges 
4147c478bd9Sstevel@tonic-gate void tmp_rput(queue_t *q, mblk_t *mp);
4157c478bd9Sstevel@tonic-gate 
4167c478bd9Sstevel@tonic-gate struct xprt_style_ops tmpops = {
4177c478bd9Sstevel@tonic-gate 	NULL,
4187c478bd9Sstevel@tonic-gate 	NULL,
4197c478bd9Sstevel@tonic-gate 	putnext,
4207c478bd9Sstevel@tonic-gate 	NULL,
4217c478bd9Sstevel@tonic-gate 	tmp_rput,
4227c478bd9Sstevel@tonic-gate 	NULL
4237c478bd9Sstevel@tonic-gate };
4247c478bd9Sstevel@tonic-gate 
4257c478bd9Sstevel@tonic-gate void
4267c478bd9Sstevel@tonic-gate tmp_rput(queue_t *q, mblk_t *mp)
4277c478bd9Sstevel@tonic-gate {
4287c478bd9Sstevel@tonic-gate 	struct temp_slot *t = (struct temp_slot *)(q->q_ptr);
4297c478bd9Sstevel@tonic-gate 	struct T_info_ack *pptr;
4307c478bd9Sstevel@tonic-gate 
4317c478bd9Sstevel@tonic-gate 	switch (mp->b_datap->db_type) {
4327c478bd9Sstevel@tonic-gate 	case M_PCPROTO:
4337c478bd9Sstevel@tonic-gate 		pptr = (struct T_info_ack *)mp->b_rptr;
4347c478bd9Sstevel@tonic-gate 		switch (pptr->PRIM_type) {
4357c478bd9Sstevel@tonic-gate 		case T_INFO_ACK:
4367c478bd9Sstevel@tonic-gate 			mutex_enter(&t->lock);
4377c478bd9Sstevel@tonic-gate 			t->info_ack = mp;
4387c478bd9Sstevel@tonic-gate 			cv_signal(&t->wait);
4397c478bd9Sstevel@tonic-gate 			mutex_exit(&t->lock);
4407c478bd9Sstevel@tonic-gate 			return;
4417c478bd9Sstevel@tonic-gate 		default:
4427c478bd9Sstevel@tonic-gate 			break;
4437c478bd9Sstevel@tonic-gate 		}
4447c478bd9Sstevel@tonic-gate 	default:
4457c478bd9Sstevel@tonic-gate 		break;
4467c478bd9Sstevel@tonic-gate 	}
4477c478bd9Sstevel@tonic-gate 
4487c478bd9Sstevel@tonic-gate 	/*
4497c478bd9Sstevel@tonic-gate 	 * Not an info-ack, so free it. This is ok because we should
4507c478bd9Sstevel@tonic-gate 	 * not be receiving data until the open finishes: rpcmod
4517c478bd9Sstevel@tonic-gate 	 * is pushed well before the end-point is bound to an address.
4527c478bd9Sstevel@tonic-gate 	 */
4537c478bd9Sstevel@tonic-gate 	freemsg(mp);
4547c478bd9Sstevel@tonic-gate }
4557c478bd9Sstevel@tonic-gate 
4567c478bd9Sstevel@tonic-gate int
4577c478bd9Sstevel@tonic-gate rmm_open(queue_t *q, dev_t *devp, int flag, int sflag, cred_t *crp)
4587c478bd9Sstevel@tonic-gate {
4597c478bd9Sstevel@tonic-gate 	mblk_t *bp;
4607c478bd9Sstevel@tonic-gate 	struct temp_slot ts, *t;
4617c478bd9Sstevel@tonic-gate 	struct T_info_ack *pptr;
4627c478bd9Sstevel@tonic-gate 	int error = 0;
4637c478bd9Sstevel@tonic-gate 
4647c478bd9Sstevel@tonic-gate 	ASSERT(q != NULL);
4657c478bd9Sstevel@tonic-gate 	/*
4667c478bd9Sstevel@tonic-gate 	 * Check for re-opens.
4677c478bd9Sstevel@tonic-gate 	 */
4687c478bd9Sstevel@tonic-gate 	if (q->q_ptr) {
4697c478bd9Sstevel@tonic-gate 		TRACE_1(TR_FAC_KRPC, TR_RPCMODOPEN_END,
4707c478bd9Sstevel@tonic-gate 		    "rpcmodopen_end:(%s)", "q->qptr");
4717c478bd9Sstevel@tonic-gate 		return (0);
4727c478bd9Sstevel@tonic-gate 	}
4737c478bd9Sstevel@tonic-gate 
4747c478bd9Sstevel@tonic-gate 	t = &ts;
4757c478bd9Sstevel@tonic-gate 	bzero(t, sizeof (*t));
4767c478bd9Sstevel@tonic-gate 	q->q_ptr = (void *)t;
477fcfe7086Sgeorges 	WR(q)->q_ptr = (void *)t;
4787c478bd9Sstevel@tonic-gate 
4797c478bd9Sstevel@tonic-gate 	/*
4807c478bd9Sstevel@tonic-gate 	 * Allocate the required messages upfront.
4817c478bd9Sstevel@tonic-gate 	 */
4827c478bd9Sstevel@tonic-gate 	if ((bp = allocb(sizeof (struct T_info_req) +
4837c478bd9Sstevel@tonic-gate 	    sizeof (struct T_info_ack), BPRI_LO)) == (mblk_t *)NULL) {
4847c478bd9Sstevel@tonic-gate 		return (ENOBUFS);
4857c478bd9Sstevel@tonic-gate 	}
4867c478bd9Sstevel@tonic-gate 
4877c478bd9Sstevel@tonic-gate 	mutex_init(&t->lock, NULL, MUTEX_DEFAULT, NULL);
4887c478bd9Sstevel@tonic-gate 	cv_init(&t->wait, NULL, CV_DEFAULT, NULL);
4897c478bd9Sstevel@tonic-gate 
4907c478bd9Sstevel@tonic-gate 	t->ops = &tmpops;
4917c478bd9Sstevel@tonic-gate 
4927c478bd9Sstevel@tonic-gate 	qprocson(q);
4937c478bd9Sstevel@tonic-gate 	bp->b_datap->db_type = M_PCPROTO;
4947c478bd9Sstevel@tonic-gate 	*(int32_t *)bp->b_wptr = (int32_t)T_INFO_REQ;
4957c478bd9Sstevel@tonic-gate 	bp->b_wptr += sizeof (struct T_info_req);
4967c478bd9Sstevel@tonic-gate 	putnext(WR(q), bp);
4977c478bd9Sstevel@tonic-gate 
4987c478bd9Sstevel@tonic-gate 	mutex_enter(&t->lock);
499fcfe7086Sgeorges 	while (t->info_ack == NULL) {
5007c478bd9Sstevel@tonic-gate 		if (cv_wait_sig(&t->wait, &t->lock) == 0) {
5017c478bd9Sstevel@tonic-gate 			error = EINTR;
5027c478bd9Sstevel@tonic-gate 			break;
5037c478bd9Sstevel@tonic-gate 		}
5047c478bd9Sstevel@tonic-gate 	}
5057c478bd9Sstevel@tonic-gate 	mutex_exit(&t->lock);
506fcfe7086Sgeorges 
5077c478bd9Sstevel@tonic-gate 	if (error)
5087c478bd9Sstevel@tonic-gate 		goto out;
5097c478bd9Sstevel@tonic-gate 
5107c478bd9Sstevel@tonic-gate 	pptr = (struct T_info_ack *)t->info_ack->b_rptr;
5117c478bd9Sstevel@tonic-gate 
5127c478bd9Sstevel@tonic-gate 	if (pptr->SERV_type == T_CLTS) {
513fcfe7086Sgeorges 		if ((error = rpcmodopen(q, devp, flag, sflag, crp)) == 0)
514fcfe7086Sgeorges 			((struct rpcm *)q->q_ptr)->rm_ops = &xprt_clts_ops;
5157c478bd9Sstevel@tonic-gate 	} else {
516fcfe7086Sgeorges 		if ((error = mir_open(q, devp, flag, sflag, crp)) == 0)
517fcfe7086Sgeorges 			((mir_t *)q->q_ptr)->rm_ops = &xprt_cots_ops;
5187c478bd9Sstevel@tonic-gate 	}
5197c478bd9Sstevel@tonic-gate 
5207c478bd9Sstevel@tonic-gate out:
521fcfe7086Sgeorges 	if (error)
5227c478bd9Sstevel@tonic-gate 		qprocsoff(q);
5237c478bd9Sstevel@tonic-gate 
524fcfe7086Sgeorges 	freemsg(t->info_ack);
525fcfe7086Sgeorges 	mutex_destroy(&t->lock);
526fcfe7086Sgeorges 	cv_destroy(&t->wait);
527fcfe7086Sgeorges 
5287c478bd9Sstevel@tonic-gate 	return (error);
5297c478bd9Sstevel@tonic-gate }
5307c478bd9Sstevel@tonic-gate 
5317c478bd9Sstevel@tonic-gate void
5327c478bd9Sstevel@tonic-gate rmm_rput(queue_t *q, mblk_t  *mp)
5337c478bd9Sstevel@tonic-gate {
5347c478bd9Sstevel@tonic-gate 	(*((struct temp_slot *)q->q_ptr)->ops->xo_rput)(q, mp);
5357c478bd9Sstevel@tonic-gate }
5367c478bd9Sstevel@tonic-gate 
5377c478bd9Sstevel@tonic-gate void
5387c478bd9Sstevel@tonic-gate rmm_rsrv(queue_t *q)
5397c478bd9Sstevel@tonic-gate {
5407c478bd9Sstevel@tonic-gate 	(*((struct temp_slot *)q->q_ptr)->ops->xo_rsrv)(q);
5417c478bd9Sstevel@tonic-gate }
5427c478bd9Sstevel@tonic-gate 
5437c478bd9Sstevel@tonic-gate void
5447c478bd9Sstevel@tonic-gate rmm_wput(queue_t *q, mblk_t *mp)
5457c478bd9Sstevel@tonic-gate {
5467c478bd9Sstevel@tonic-gate 	(*((struct temp_slot *)q->q_ptr)->ops->xo_wput)(q, mp);
5477c478bd9Sstevel@tonic-gate }
5487c478bd9Sstevel@tonic-gate 
5497c478bd9Sstevel@tonic-gate void
5507c478bd9Sstevel@tonic-gate rmm_wsrv(queue_t *q)
5517c478bd9Sstevel@tonic-gate {
5527c478bd9Sstevel@tonic-gate 	(*((struct temp_slot *)q->q_ptr)->ops->xo_wsrv)(q);
5537c478bd9Sstevel@tonic-gate }
5547c478bd9Sstevel@tonic-gate 
5557c478bd9Sstevel@tonic-gate int
5567c478bd9Sstevel@tonic-gate rmm_close(queue_t *q, int flag, cred_t *crp)
5577c478bd9Sstevel@tonic-gate {
5587c478bd9Sstevel@tonic-gate 	return ((*((struct temp_slot *)q->q_ptr)->ops->xo_close)(q, flag, crp));
5597c478bd9Sstevel@tonic-gate }
5607c478bd9Sstevel@tonic-gate 
5617c478bd9Sstevel@tonic-gate /*
5627c478bd9Sstevel@tonic-gate  * rpcmodopen -	open routine gets called when the module gets pushed
5637c478bd9Sstevel@tonic-gate  *		onto the stream.
5647c478bd9Sstevel@tonic-gate  */
5657c478bd9Sstevel@tonic-gate /*ARGSUSED*/
5667c478bd9Sstevel@tonic-gate int
5677c478bd9Sstevel@tonic-gate rpcmodopen(queue_t *q, dev_t *devp, int flag, int sflag, cred_t *crp)
5687c478bd9Sstevel@tonic-gate {
5697c478bd9Sstevel@tonic-gate 	struct rpcm *rmp;
5707c478bd9Sstevel@tonic-gate 
5717c478bd9Sstevel@tonic-gate 	extern void (*rpc_rele)(queue_t *, mblk_t *);
5727c478bd9Sstevel@tonic-gate 	static void rpcmod_release(queue_t *, mblk_t *);
5737c478bd9Sstevel@tonic-gate 
5747c478bd9Sstevel@tonic-gate 	TRACE_0(TR_FAC_KRPC, TR_RPCMODOPEN_START, "rpcmodopen_start:");
5757c478bd9Sstevel@tonic-gate 
5767c478bd9Sstevel@tonic-gate 	/*
5777c478bd9Sstevel@tonic-gate 	 * Initialize entry points to release a rpcmod slot (and an input
5787c478bd9Sstevel@tonic-gate 	 * message if supplied) and to send an output message to the module
5797c478bd9Sstevel@tonic-gate 	 * below rpcmod.
5807c478bd9Sstevel@tonic-gate 	 */
5817c478bd9Sstevel@tonic-gate 	if (rpc_rele == NULL)
5827c478bd9Sstevel@tonic-gate 		rpc_rele = rpcmod_release;
5837c478bd9Sstevel@tonic-gate 
5847c478bd9Sstevel@tonic-gate 	/*
5857c478bd9Sstevel@tonic-gate 	 * Only sufficiently privileged users can use this module, and it
5867c478bd9Sstevel@tonic-gate 	 * is assumed that they will use this module properly, and NOT send
5877c478bd9Sstevel@tonic-gate 	 * bulk data from downstream.
5887c478bd9Sstevel@tonic-gate 	 */
5897c478bd9Sstevel@tonic-gate 	if (secpolicy_rpcmod_open(crp) != 0)
5907c478bd9Sstevel@tonic-gate 		return (EPERM);
5917c478bd9Sstevel@tonic-gate 
5927c478bd9Sstevel@tonic-gate 	/*
5937c478bd9Sstevel@tonic-gate 	 * Allocate slot data structure.
5947c478bd9Sstevel@tonic-gate 	 */
5957c478bd9Sstevel@tonic-gate 	rmp = kmem_zalloc(sizeof (*rmp), KM_SLEEP);
5967c478bd9Sstevel@tonic-gate 
5977c478bd9Sstevel@tonic-gate 	mutex_init(&rmp->rm_lock, NULL, MUTEX_DEFAULT, NULL);
5987c478bd9Sstevel@tonic-gate 	cv_init(&rmp->rm_cwait, NULL, CV_DEFAULT, NULL);
599108322fbScarlsonj 	rmp->rm_zoneid = rpc_zoneid();
6007c478bd9Sstevel@tonic-gate 	/*
6017c478bd9Sstevel@tonic-gate 	 * slot type will be set by kRPC client and server ioctl's
6027c478bd9Sstevel@tonic-gate 	 */
6037c478bd9Sstevel@tonic-gate 	rmp->rm_type = 0;
6047c478bd9Sstevel@tonic-gate 
6057c478bd9Sstevel@tonic-gate 	q->q_ptr = (void *)rmp;
6067c478bd9Sstevel@tonic-gate 	WR(q)->q_ptr = (void *)rmp;
6077c478bd9Sstevel@tonic-gate 
6087c478bd9Sstevel@tonic-gate 	TRACE_1(TR_FAC_KRPC, TR_RPCMODOPEN_END, "rpcmodopen_end:(%s)", "end");
6097c478bd9Sstevel@tonic-gate 	return (0);
6107c478bd9Sstevel@tonic-gate }
6117c478bd9Sstevel@tonic-gate 
6127c478bd9Sstevel@tonic-gate /*
6137c478bd9Sstevel@tonic-gate  * rpcmodclose - This routine gets called when the module gets popped
6147c478bd9Sstevel@tonic-gate  * off of the stream.
6157c478bd9Sstevel@tonic-gate  */
6167c478bd9Sstevel@tonic-gate /*ARGSUSED*/
6177c478bd9Sstevel@tonic-gate int
6187c478bd9Sstevel@tonic-gate rpcmodclose(queue_t *q, int flag, cred_t *crp)
6197c478bd9Sstevel@tonic-gate {
6207c478bd9Sstevel@tonic-gate 	struct rpcm *rmp;
6217c478bd9Sstevel@tonic-gate 
6227c478bd9Sstevel@tonic-gate 	ASSERT(q != NULL);
6237c478bd9Sstevel@tonic-gate 	rmp = (struct rpcm *)q->q_ptr;
6247c478bd9Sstevel@tonic-gate 
6257c478bd9Sstevel@tonic-gate 	/*
6267c478bd9Sstevel@tonic-gate 	 * Mark our state as closing.
6277c478bd9Sstevel@tonic-gate 	 */
6287c478bd9Sstevel@tonic-gate 	mutex_enter(&rmp->rm_lock);
6297c478bd9Sstevel@tonic-gate 	rmp->rm_state |= RM_CLOSING;
6307c478bd9Sstevel@tonic-gate 
6317c478bd9Sstevel@tonic-gate 	/*
6327c478bd9Sstevel@tonic-gate 	 * Check and see if there are any messages on the queue.  If so, send
6337c478bd9Sstevel@tonic-gate 	 * the messages, regardless whether the downstream module is ready to
6347c478bd9Sstevel@tonic-gate 	 * accept data.
6357c478bd9Sstevel@tonic-gate 	 */
6367c478bd9Sstevel@tonic-gate 	if (rmp->rm_type == RPC_SERVER) {
6377c478bd9Sstevel@tonic-gate 		flushq(q, FLUSHDATA);
6387c478bd9Sstevel@tonic-gate 
6397c478bd9Sstevel@tonic-gate 		qenable(WR(q));
6407c478bd9Sstevel@tonic-gate 
6417c478bd9Sstevel@tonic-gate 		if (rmp->rm_ref) {
6427c478bd9Sstevel@tonic-gate 			mutex_exit(&rmp->rm_lock);
6437c478bd9Sstevel@tonic-gate 			/*
6447c478bd9Sstevel@tonic-gate 			 * call into SVC to clean the queue
6457c478bd9Sstevel@tonic-gate 			 */
6467c478bd9Sstevel@tonic-gate 			svc_queueclean(q);
6477c478bd9Sstevel@tonic-gate 			mutex_enter(&rmp->rm_lock);
6487c478bd9Sstevel@tonic-gate 
6497c478bd9Sstevel@tonic-gate 			/*
6507c478bd9Sstevel@tonic-gate 			 * Block while there are kRPC threads with a reference
6517c478bd9Sstevel@tonic-gate 			 * to this message.
6527c478bd9Sstevel@tonic-gate 			 */
6537c478bd9Sstevel@tonic-gate 			while (rmp->rm_ref)
6547c478bd9Sstevel@tonic-gate 				cv_wait(&rmp->rm_cwait, &rmp->rm_lock);
6557c478bd9Sstevel@tonic-gate 		}
6567c478bd9Sstevel@tonic-gate 
6577c478bd9Sstevel@tonic-gate 		mutex_exit(&rmp->rm_lock);
6587c478bd9Sstevel@tonic-gate 
6597c478bd9Sstevel@tonic-gate 		/*
6607c478bd9Sstevel@tonic-gate 		 * It is now safe to remove this queue from the stream. No kRPC
6617c478bd9Sstevel@tonic-gate 		 * threads have a reference to the stream, and none ever will,
6627c478bd9Sstevel@tonic-gate 		 * because RM_CLOSING is set.
6637c478bd9Sstevel@tonic-gate 		 */
6647c478bd9Sstevel@tonic-gate 		qprocsoff(q);
6657c478bd9Sstevel@tonic-gate 
6667c478bd9Sstevel@tonic-gate 		/* Notify kRPC that this stream is going away. */
6677c478bd9Sstevel@tonic-gate 		svc_queueclose(q);
6687c478bd9Sstevel@tonic-gate 	} else {
6697c478bd9Sstevel@tonic-gate 		mutex_exit(&rmp->rm_lock);
6707c478bd9Sstevel@tonic-gate 		qprocsoff(q);
6717c478bd9Sstevel@tonic-gate 	}
6727c478bd9Sstevel@tonic-gate 
6737c478bd9Sstevel@tonic-gate 	q->q_ptr = NULL;
6747c478bd9Sstevel@tonic-gate 	WR(q)->q_ptr = NULL;
6757c478bd9Sstevel@tonic-gate 	mutex_destroy(&rmp->rm_lock);
6767c478bd9Sstevel@tonic-gate 	cv_destroy(&rmp->rm_cwait);
6777c478bd9Sstevel@tonic-gate 	kmem_free(rmp, sizeof (*rmp));
6787c478bd9Sstevel@tonic-gate 	return (0);
6797c478bd9Sstevel@tonic-gate }
6807c478bd9Sstevel@tonic-gate 
/*
 * DEBUG-only fault-injection knobs consulted by rpcmodrput():
 *
 *   rpcmod_send_msg_up   while > 0, a copy of the incoming message is also
 *                        passed upstream; decremented for each copy sent.
 *   rpcmod_send_uderr    while > 0, an M_PROTO T_UNITDATA_IND additionally
 *                        produces a synthetic T_UDERROR_IND (ENETDOWN) that
 *                        is passed upstream; decremented for each one sent.
 *   rpcmod_send_dup      when non-zero, a server request is duplicated
 *                        whenever (rpcmod_send_dup_cnt++ % rpcmod_send_dup)
 *                        is non-zero.
 *   rpcmod_send_dup_cnt  running counter used by the rpcmod_send_dup test.
 */
6817c478bd9Sstevel@tonic-gate #ifdef	DEBUG
6827c478bd9Sstevel@tonic-gate int	rpcmod_send_msg_up = 0;
6837c478bd9Sstevel@tonic-gate int	rpcmod_send_uderr = 0;
6847c478bd9Sstevel@tonic-gate int	rpcmod_send_dup = 0;
6857c478bd9Sstevel@tonic-gate int	rpcmod_send_dup_cnt = 0;
6867c478bd9Sstevel@tonic-gate #endif
6877c478bd9Sstevel@tonic-gate 
6887c478bd9Sstevel@tonic-gate /*
 * rpcmodrput -	Module read put procedure.  This is called from
 *		the module, driver, or stream head downstream.
 *
 * Dispatch summary:
 *   - slot type not yet set (rm_type == 0): the message is freed.
 *   - anything other than M_PROTO/M_PCPROTO: passed upstream.
 *   - T_UNITDATA_IND:
 *	  RM_CLOSING set	passed upstream
 *	  RPC_CLIENT		header validated, then handed to
 *				clnt_clts_dispatch_notify()
 *	  RPC_SERVER		rm_ref is raised and the message is handed
 *				to svc_queuereq(); freed when rm_krpc_cell
 *				is not set
 *	  any other type	freed
 *   - T_UDERROR_IND: header validated, message freed (and logged when the
 *     header was sane).
 *   - any other TPI primitive: passed upstream.
 *
 * NOTE: the paths that return directly do not emit TR_RPCMODRPUT_END; only
 * the paths that leave the outer switch via break do.
 */
6927c478bd9Sstevel@tonic-gate void
6937c478bd9Sstevel@tonic-gate rpcmodrput(queue_t *q, mblk_t *mp)
6947c478bd9Sstevel@tonic-gate {
6957c478bd9Sstevel@tonic-gate 	struct rpcm *rmp;
6967c478bd9Sstevel@tonic-gate 	union T_primitives *pptr;
6977c478bd9Sstevel@tonic-gate 	int hdrsz;
6987c478bd9Sstevel@tonic-gate 
6997c478bd9Sstevel@tonic-gate 	TRACE_0(TR_FAC_KRPC, TR_RPCMODRPUT_START, "rpcmodrput_start:");
7007c478bd9Sstevel@tonic-gate 
7017c478bd9Sstevel@tonic-gate 	ASSERT(q != NULL);
7027c478bd9Sstevel@tonic-gate 	rmp = (struct rpcm *)q->q_ptr;
7037c478bd9Sstevel@tonic-gate 
	/*
	 * rm_type stays 0 until rpcmodwput_other() sees the RPC_CLIENT or
	 * RPC_SERVER ioctl; until then incoming messages are dropped.
	 */
7047c478bd9Sstevel@tonic-gate 	if (rmp->rm_type == 0) {
7057c478bd9Sstevel@tonic-gate 		freemsg(mp);
7067c478bd9Sstevel@tonic-gate 		return;
7077c478bd9Sstevel@tonic-gate 	}
7087c478bd9Sstevel@tonic-gate 
7097c478bd9Sstevel@tonic-gate #ifdef DEBUG
	/* Fault injection: also pass a copy of the message upstream. */
7107c478bd9Sstevel@tonic-gate 	if (rpcmod_send_msg_up > 0) {
7117c478bd9Sstevel@tonic-gate 		mblk_t *nmp = copymsg(mp);
7127c478bd9Sstevel@tonic-gate 		if (nmp) {
7137c478bd9Sstevel@tonic-gate 			putnext(q, nmp);
7147c478bd9Sstevel@tonic-gate 			rpcmod_send_msg_up--;
7157c478bd9Sstevel@tonic-gate 		}
7167c478bd9Sstevel@tonic-gate 	}
	/*
	 * Fault injection: build a T_UDERROR_IND (ENETDOWN) from an incoming
	 * T_UNITDATA_IND and pass it upstream.  The original message is left
	 * untouched and is still processed below.
	 */
7177c478bd9Sstevel@tonic-gate 	if ((rpcmod_send_uderr > 0) && mp->b_datap->db_type == M_PROTO) {
7187c478bd9Sstevel@tonic-gate 		mblk_t *nmp;
7197c478bd9Sstevel@tonic-gate 		struct T_unitdata_ind *data;
7207c478bd9Sstevel@tonic-gate 		struct T_uderror_ind *ud;
7217c478bd9Sstevel@tonic-gate 		int d;
7227c478bd9Sstevel@tonic-gate 		data = (struct T_unitdata_ind *)mp->b_rptr;
7237c478bd9Sstevel@tonic-gate 		if (data->PRIM_type == T_UNITDATA_IND) {
			/*
			 * d is the size difference between the two headers;
			 * the address and option offsets are shifted by d in
			 * the synthetic error message.
			 */
7247c478bd9Sstevel@tonic-gate 			d = sizeof (*ud) - sizeof (*data);
7257c478bd9Sstevel@tonic-gate 			nmp = allocb(mp->b_wptr - mp->b_rptr + d, BPRI_HI);
7267c478bd9Sstevel@tonic-gate 			if (nmp) {
7277c478bd9Sstevel@tonic-gate 				ud = (struct T_uderror_ind *)nmp->b_rptr;
7287c478bd9Sstevel@tonic-gate 				ud->PRIM_type = T_UDERROR_IND;
7297c478bd9Sstevel@tonic-gate 				ud->DEST_length = data->SRC_length;
7307c478bd9Sstevel@tonic-gate 				ud->DEST_offset = data->SRC_offset + d;
7317c478bd9Sstevel@tonic-gate 				ud->OPT_length = data->OPT_length;
7327c478bd9Sstevel@tonic-gate 				ud->OPT_offset = data->OPT_offset + d;
7337c478bd9Sstevel@tonic-gate 				ud->ERROR_type = ENETDOWN;
7347c478bd9Sstevel@tonic-gate 				if (data->SRC_length) {
7357c478bd9Sstevel@tonic-gate 					bcopy(mp->b_rptr +
7367c478bd9Sstevel@tonic-gate 					    data->SRC_offset,
7377c478bd9Sstevel@tonic-gate 					    nmp->b_rptr +
7387c478bd9Sstevel@tonic-gate 					    ud->DEST_offset,
7397c478bd9Sstevel@tonic-gate 					    data->SRC_length);
7407c478bd9Sstevel@tonic-gate 				}
7417c478bd9Sstevel@tonic-gate 				if (data->OPT_length) {
7427c478bd9Sstevel@tonic-gate 					bcopy(mp->b_rptr +
7437c478bd9Sstevel@tonic-gate 					    data->OPT_offset,
7447c478bd9Sstevel@tonic-gate 					    nmp->b_rptr +
7457c478bd9Sstevel@tonic-gate 					    ud->OPT_offset,
7467c478bd9Sstevel@tonic-gate 					    data->OPT_length);
7477c478bd9Sstevel@tonic-gate 				}
				/* New length: original block length plus d. */
7487c478bd9Sstevel@tonic-gate 				nmp->b_wptr += d;
7497c478bd9Sstevel@tonic-gate 				nmp->b_wptr += (mp->b_wptr - mp->b_rptr);
7507c478bd9Sstevel@tonic-gate 				nmp->b_datap->db_type = M_PROTO;
7517c478bd9Sstevel@tonic-gate 				putnext(q, nmp);
7527c478bd9Sstevel@tonic-gate 				rpcmod_send_uderr--;
7537c478bd9Sstevel@tonic-gate 			}
7547c478bd9Sstevel@tonic-gate 		}
7557c478bd9Sstevel@tonic-gate 	}
7567c478bd9Sstevel@tonic-gate #endif
7577c478bd9Sstevel@tonic-gate 	switch (mp->b_datap->db_type) {
7587c478bd9Sstevel@tonic-gate 	default:
		/* Not a TPI protocol message: pass it upstream unchanged. */
7597c478bd9Sstevel@tonic-gate 		putnext(q, mp);
7607c478bd9Sstevel@tonic-gate 		break;
7617c478bd9Sstevel@tonic-gate 
7627c478bd9Sstevel@tonic-gate 	case M_PROTO:
7637c478bd9Sstevel@tonic-gate 	case M_PCPROTO:
		/*
		 * The primitive type is read from the first 32-bit word.
		 * The minimum length is only enforced by this ASSERT.
		 */
7647c478bd9Sstevel@tonic-gate 		ASSERT((mp->b_wptr - mp->b_rptr) >= sizeof (int32_t));
7657c478bd9Sstevel@tonic-gate 		pptr = (union T_primitives *)mp->b_rptr;
7667c478bd9Sstevel@tonic-gate 
7677c478bd9Sstevel@tonic-gate 		/*
7687c478bd9Sstevel@tonic-gate 		 * Forward this message to krpc if it is data.
7697c478bd9Sstevel@tonic-gate 		 */
7707c478bd9Sstevel@tonic-gate 		if (pptr->type == T_UNITDATA_IND) {
			/* nmp is only used by the DEBUG duplicate code below */
7717c478bd9Sstevel@tonic-gate 			mblk_t *nmp;
7727c478bd9Sstevel@tonic-gate 
7737c478bd9Sstevel@tonic-gate 		/*
7747c478bd9Sstevel@tonic-gate 		 * Check if the module is being popped.
7757c478bd9Sstevel@tonic-gate 		 */
7767c478bd9Sstevel@tonic-gate 			mutex_enter(&rmp->rm_lock);
7777c478bd9Sstevel@tonic-gate 			if (rmp->rm_state & RM_CLOSING) {
7787c478bd9Sstevel@tonic-gate 				mutex_exit(&rmp->rm_lock);
7797c478bd9Sstevel@tonic-gate 				putnext(q, mp);
7807c478bd9Sstevel@tonic-gate 				break;
7817c478bd9Sstevel@tonic-gate 			}
7827c478bd9Sstevel@tonic-gate 
			/*
			 * rm_lock is held on entry to every case below; each
			 * case releases it on all of its paths.
			 */
7837c478bd9Sstevel@tonic-gate 			switch (rmp->rm_type) {
7847c478bd9Sstevel@tonic-gate 			case RPC_CLIENT:
7857c478bd9Sstevel@tonic-gate 				mutex_exit(&rmp->rm_lock);
7867c478bd9Sstevel@tonic-gate 				hdrsz = mp->b_wptr - mp->b_rptr;
7877c478bd9Sstevel@tonic-gate 
7887c478bd9Sstevel@tonic-gate 				/*
7897c478bd9Sstevel@tonic-gate 				 * Make sure the header is sane.
7907c478bd9Sstevel@tonic-gate 				 */
7917c478bd9Sstevel@tonic-gate 				if (hdrsz < TUNITDATAINDSZ ||
7927c478bd9Sstevel@tonic-gate 				    hdrsz < (pptr->unitdata_ind.OPT_length +
7937c478bd9Sstevel@tonic-gate 				    pptr->unitdata_ind.OPT_offset) ||
7947c478bd9Sstevel@tonic-gate 				    hdrsz < (pptr->unitdata_ind.SRC_length +
7957c478bd9Sstevel@tonic-gate 				    pptr->unitdata_ind.SRC_offset)) {
7967c478bd9Sstevel@tonic-gate 					freemsg(mp);
7977c478bd9Sstevel@tonic-gate 					return;
7987c478bd9Sstevel@tonic-gate 				}
7997c478bd9Sstevel@tonic-gate 
8007c478bd9Sstevel@tonic-gate 				/*
801*07e75131Sgt29601 				 * Call clnt_clts_dispatch_notify, so that it
802*07e75131Sgt29601 				 * can pass the message to the proper caller.
803*07e75131Sgt29601 				 * Don't discard the header just yet since the
804*07e75131Sgt29601 				 * client may need the sender's address.
8057c478bd9Sstevel@tonic-gate 				 */
806*07e75131Sgt29601 				clnt_clts_dispatch_notify(mp, hdrsz,
807*07e75131Sgt29601 				    rmp->rm_zoneid);
8087c478bd9Sstevel@tonic-gate 				return;
8097c478bd9Sstevel@tonic-gate 			case RPC_SERVER:
8107c478bd9Sstevel@tonic-gate 				/*
8117c478bd9Sstevel@tonic-gate 				 * rm_krpc_cell is exclusively used by the kRPC
8127c478bd9Sstevel@tonic-gate 				 * CLTS server
8137c478bd9Sstevel@tonic-gate 				 */
8147c478bd9Sstevel@tonic-gate 				if (rmp->rm_krpc_cell) {
8157c478bd9Sstevel@tonic-gate #ifdef DEBUG
8167c478bd9Sstevel@tonic-gate 					/*
8177c478bd9Sstevel@tonic-gate 					 * Test duplicate request cache and
8187c478bd9Sstevel@tonic-gate 					 * rm_ref count handling by sending a
8197c478bd9Sstevel@tonic-gate 					 * duplicate every so often, if
8207c478bd9Sstevel@tonic-gate 					 * desired.
					 *
					 * As written, a copy is made whenever
					 * the post-incremented counter is not
					 * a multiple of rpcmod_send_dup.
8217c478bd9Sstevel@tonic-gate 					 */
8227c478bd9Sstevel@tonic-gate 					if (rpcmod_send_dup &&
8237c478bd9Sstevel@tonic-gate 					    rpcmod_send_dup_cnt++ %
8247c478bd9Sstevel@tonic-gate 					    rpcmod_send_dup)
8257c478bd9Sstevel@tonic-gate 						nmp = copymsg(mp);
8267c478bd9Sstevel@tonic-gate 					else
8277c478bd9Sstevel@tonic-gate 						nmp = NULL;
8287c478bd9Sstevel@tonic-gate #endif
8297c478bd9Sstevel@tonic-gate 					/*
8307c478bd9Sstevel@tonic-gate 					 * Raise the reference count on this
8317c478bd9Sstevel@tonic-gate 					 * module to prevent it from being
8327c478bd9Sstevel@tonic-gate 					 * popped before krpc generates the
8337c478bd9Sstevel@tonic-gate 					 * reply.
8347c478bd9Sstevel@tonic-gate 					 */
8357c478bd9Sstevel@tonic-gate 					rmp->rm_ref++;
8367c478bd9Sstevel@tonic-gate 					mutex_exit(&rmp->rm_lock);
8377c478bd9Sstevel@tonic-gate 
8387c478bd9Sstevel@tonic-gate 					/*
8397c478bd9Sstevel@tonic-gate 					 * Submit the message to krpc.
8407c478bd9Sstevel@tonic-gate 					 */
8417c478bd9Sstevel@tonic-gate 					svc_queuereq(q, mp);
8427c478bd9Sstevel@tonic-gate #ifdef DEBUG
8437c478bd9Sstevel@tonic-gate 					/*
8447c478bd9Sstevel@tonic-gate 					 * Send duplicate if we created one.
					 * The duplicate takes its own
					 * reference on the slot.
8457c478bd9Sstevel@tonic-gate 					 */
8467c478bd9Sstevel@tonic-gate 					if (nmp) {
8477c478bd9Sstevel@tonic-gate 						mutex_enter(&rmp->rm_lock);
8487c478bd9Sstevel@tonic-gate 						rmp->rm_ref++;
8497c478bd9Sstevel@tonic-gate 						mutex_exit(&rmp->rm_lock);
8507c478bd9Sstevel@tonic-gate 						svc_queuereq(q, nmp);
8517c478bd9Sstevel@tonic-gate 					}
8527c478bd9Sstevel@tonic-gate #endif
8537c478bd9Sstevel@tonic-gate 				} else {
					/* rm_krpc_cell not set: drop the request */
8547c478bd9Sstevel@tonic-gate 					mutex_exit(&rmp->rm_lock);
8557c478bd9Sstevel@tonic-gate 					freemsg(mp);
8567c478bd9Sstevel@tonic-gate 				}
8577c478bd9Sstevel@tonic-gate 				return;
8587c478bd9Sstevel@tonic-gate 			default:
				/* Neither client nor server: drop the message */
8597c478bd9Sstevel@tonic-gate 				mutex_exit(&rmp->rm_lock);
8607c478bd9Sstevel@tonic-gate 				freemsg(mp);
8617c478bd9Sstevel@tonic-gate 				return;
8627c478bd9Sstevel@tonic-gate 			} /* end switch(rmp->rm_type) */
8637c478bd9Sstevel@tonic-gate 		} else if (pptr->type == T_UDERROR_IND) {
8647c478bd9Sstevel@tonic-gate 			mutex_enter(&rmp->rm_lock);
8657c478bd9Sstevel@tonic-gate 			hdrsz = mp->b_wptr - mp->b_rptr;
8667c478bd9Sstevel@tonic-gate 
8677c478bd9Sstevel@tonic-gate 			/*
8687c478bd9Sstevel@tonic-gate 			 * Make sure the header is sane
8697c478bd9Sstevel@tonic-gate 			 */
8707c478bd9Sstevel@tonic-gate 			if (hdrsz < TUDERRORINDSZ ||
8717c478bd9Sstevel@tonic-gate 			    hdrsz < (pptr->uderror_ind.OPT_length +
8727c478bd9Sstevel@tonic-gate 			    pptr->uderror_ind.OPT_offset) ||
8737c478bd9Sstevel@tonic-gate 			    hdrsz < (pptr->uderror_ind.DEST_length +
8747c478bd9Sstevel@tonic-gate 			    pptr->uderror_ind.DEST_offset)) {
8757c478bd9Sstevel@tonic-gate 				mutex_exit(&rmp->rm_lock);
8767c478bd9Sstevel@tonic-gate 				freemsg(mp);
8777c478bd9Sstevel@tonic-gate 				return;
8787c478bd9Sstevel@tonic-gate 			}
8797c478bd9Sstevel@tonic-gate 
8807c478bd9Sstevel@tonic-gate 			/*
8817c478bd9Sstevel@tonic-gate 			 * In the case where a unit data error has been
8827c478bd9Sstevel@tonic-gate 			 * received, all we need to do is clear the message from
8837c478bd9Sstevel@tonic-gate 			 * the queue.
8847c478bd9Sstevel@tonic-gate 			 */
8857c478bd9Sstevel@tonic-gate 			mutex_exit(&rmp->rm_lock);
8867c478bd9Sstevel@tonic-gate 			freemsg(mp);
8877c478bd9Sstevel@tonic-gate 			RPCLOG(32, "rpcmodrput: unitdata error received at "
8887c478bd9Sstevel@tonic-gate 			    "%ld\n", gethrestime_sec());
8897c478bd9Sstevel@tonic-gate 			return;
8907c478bd9Sstevel@tonic-gate 		} /* end else if (pptr->type == T_UDERROR_IND) */
8917c478bd9Sstevel@tonic-gate 
		/* Any other TPI primitive is passed upstream untouched. */
8927c478bd9Sstevel@tonic-gate 		putnext(q, mp);
8937c478bd9Sstevel@tonic-gate 		break;
8947c478bd9Sstevel@tonic-gate 	} /* end switch (mp->b_datap->db_type) */
8957c478bd9Sstevel@tonic-gate 
8967c478bd9Sstevel@tonic-gate 	TRACE_0(TR_FAC_KRPC, TR_RPCMODRPUT_END,
8977c478bd9Sstevel@tonic-gate 	    "rpcmodrput_end:");
8987c478bd9Sstevel@tonic-gate 	/*
8997c478bd9Sstevel@tonic-gate 	 * Return codes are not looked at by the STREAMS framework.
9007c478bd9Sstevel@tonic-gate 	 */
9017c478bd9Sstevel@tonic-gate }
9027c478bd9Sstevel@tonic-gate 
9037c478bd9Sstevel@tonic-gate /*
9047c478bd9Sstevel@tonic-gate  * write put procedure
9057c478bd9Sstevel@tonic-gate  */
9067c478bd9Sstevel@tonic-gate void
9077c478bd9Sstevel@tonic-gate rpcmodwput(queue_t *q, mblk_t *mp)
9087c478bd9Sstevel@tonic-gate {
9097c478bd9Sstevel@tonic-gate 	struct rpcm	*rmp;
9107c478bd9Sstevel@tonic-gate 
9117c478bd9Sstevel@tonic-gate 	ASSERT(q != NULL);
9127c478bd9Sstevel@tonic-gate 
9137c478bd9Sstevel@tonic-gate 	switch (mp->b_datap->db_type) {
9147c478bd9Sstevel@tonic-gate 		case M_PROTO:
9157c478bd9Sstevel@tonic-gate 		case M_PCPROTO:
9167c478bd9Sstevel@tonic-gate 			break;
9177c478bd9Sstevel@tonic-gate 		default:
9187c478bd9Sstevel@tonic-gate 			rpcmodwput_other(q, mp);
9197c478bd9Sstevel@tonic-gate 			return;
9207c478bd9Sstevel@tonic-gate 	}
9217c478bd9Sstevel@tonic-gate 
9227c478bd9Sstevel@tonic-gate 	/*
9237c478bd9Sstevel@tonic-gate 	 * Check to see if we can send the message downstream.
9247c478bd9Sstevel@tonic-gate 	 */
9257c478bd9Sstevel@tonic-gate 	if (canputnext(q)) {
9267c478bd9Sstevel@tonic-gate 		putnext(q, mp);
9277c478bd9Sstevel@tonic-gate 		return;
9287c478bd9Sstevel@tonic-gate 	}
9297c478bd9Sstevel@tonic-gate 
9307c478bd9Sstevel@tonic-gate 	rmp = (struct rpcm *)q->q_ptr;
9317c478bd9Sstevel@tonic-gate 	ASSERT(rmp != NULL);
9327c478bd9Sstevel@tonic-gate 
9337c478bd9Sstevel@tonic-gate 	/*
9347c478bd9Sstevel@tonic-gate 	 * The first canputnext failed.  Try again except this time with the
9357c478bd9Sstevel@tonic-gate 	 * lock held, so that we can check the state of the stream to see if
9367c478bd9Sstevel@tonic-gate 	 * it is closing.  If either of these conditions evaluate to true
9377c478bd9Sstevel@tonic-gate 	 * then send the meesage.
9387c478bd9Sstevel@tonic-gate 	 */
9397c478bd9Sstevel@tonic-gate 	mutex_enter(&rmp->rm_lock);
9407c478bd9Sstevel@tonic-gate 	if (canputnext(q) || (rmp->rm_state & RM_CLOSING)) {
9417c478bd9Sstevel@tonic-gate 		mutex_exit(&rmp->rm_lock);
9427c478bd9Sstevel@tonic-gate 		putnext(q, mp);
9437c478bd9Sstevel@tonic-gate 	} else {
9447c478bd9Sstevel@tonic-gate 		/*
9457c478bd9Sstevel@tonic-gate 		 * canputnext failed again and the stream is not closing.
9467c478bd9Sstevel@tonic-gate 		 * Place the message on the queue and let the service
9477c478bd9Sstevel@tonic-gate 		 * procedure handle the message.
9487c478bd9Sstevel@tonic-gate 		 */
9497c478bd9Sstevel@tonic-gate 		mutex_exit(&rmp->rm_lock);
9507c478bd9Sstevel@tonic-gate 		(void) putq(q, mp);
9517c478bd9Sstevel@tonic-gate 	}
9527c478bd9Sstevel@tonic-gate }
9537c478bd9Sstevel@tonic-gate 
9547c478bd9Sstevel@tonic-gate static void
9557c478bd9Sstevel@tonic-gate rpcmodwput_other(queue_t *q, mblk_t *mp)
9567c478bd9Sstevel@tonic-gate {
9577c478bd9Sstevel@tonic-gate 	struct rpcm	*rmp;
9587c478bd9Sstevel@tonic-gate 	struct iocblk	*iocp;
9597c478bd9Sstevel@tonic-gate 
9607c478bd9Sstevel@tonic-gate 	rmp = (struct rpcm *)q->q_ptr;
9617c478bd9Sstevel@tonic-gate 	ASSERT(rmp != NULL);
9627c478bd9Sstevel@tonic-gate 
9637c478bd9Sstevel@tonic-gate 	switch (mp->b_datap->db_type) {
9647c478bd9Sstevel@tonic-gate 		case M_IOCTL:
9657c478bd9Sstevel@tonic-gate 			iocp = (struct iocblk *)mp->b_rptr;
9667c478bd9Sstevel@tonic-gate 			ASSERT(iocp != NULL);
9677c478bd9Sstevel@tonic-gate 			switch (iocp->ioc_cmd) {
9687c478bd9Sstevel@tonic-gate 				case RPC_CLIENT:
9697c478bd9Sstevel@tonic-gate 				case RPC_SERVER:
9707c478bd9Sstevel@tonic-gate 					mutex_enter(&rmp->rm_lock);
9717c478bd9Sstevel@tonic-gate 					rmp->rm_type = iocp->ioc_cmd;
9727c478bd9Sstevel@tonic-gate 					mutex_exit(&rmp->rm_lock);
9737c478bd9Sstevel@tonic-gate 					mp->b_datap->db_type = M_IOCACK;
9747c478bd9Sstevel@tonic-gate 					qreply(q, mp);
9757c478bd9Sstevel@tonic-gate 					return;
9767c478bd9Sstevel@tonic-gate 				default:
9777c478bd9Sstevel@tonic-gate 				/*
9787c478bd9Sstevel@tonic-gate 				 * pass the ioctl downstream and hope someone
9797c478bd9Sstevel@tonic-gate 				 * down there knows how to handle it.
9807c478bd9Sstevel@tonic-gate 				 */
9817c478bd9Sstevel@tonic-gate 					putnext(q, mp);
9827c478bd9Sstevel@tonic-gate 					return;
9837c478bd9Sstevel@tonic-gate 			}
9847c478bd9Sstevel@tonic-gate 		default:
9857c478bd9Sstevel@tonic-gate 			break;
9867c478bd9Sstevel@tonic-gate 	}
9877c478bd9Sstevel@tonic-gate 	/*
9887c478bd9Sstevel@tonic-gate 	 * This is something we definitely do not know how to handle, just
9897c478bd9Sstevel@tonic-gate 	 * pass the message downstream
9907c478bd9Sstevel@tonic-gate 	 */
9917c478bd9Sstevel@tonic-gate 	putnext(q, mp);
9927c478bd9Sstevel@tonic-gate }
9937c478bd9Sstevel@tonic-gate 
9947c478bd9Sstevel@tonic-gate /*
9957c478bd9Sstevel@tonic-gate  * Module write service procedure. This is called by downstream modules
9967c478bd9Sstevel@tonic-gate  * for back enabling during flow control.
9977c478bd9Sstevel@tonic-gate  */
9987c478bd9Sstevel@tonic-gate void
9997c478bd9Sstevel@tonic-gate rpcmodwsrv(queue_t *q)
10007c478bd9Sstevel@tonic-gate {
10017c478bd9Sstevel@tonic-gate 	struct rpcm	*rmp;
10027c478bd9Sstevel@tonic-gate 	mblk_t		*mp = NULL;
10037c478bd9Sstevel@tonic-gate 
10047c478bd9Sstevel@tonic-gate 	rmp = (struct rpcm *)q->q_ptr;
10057c478bd9Sstevel@tonic-gate 	ASSERT(rmp != NULL);
10067c478bd9Sstevel@tonic-gate 
10077c478bd9Sstevel@tonic-gate 	/*
10087c478bd9Sstevel@tonic-gate 	 * Get messages that may be queued and send them down stream
10097c478bd9Sstevel@tonic-gate 	 */
10107c478bd9Sstevel@tonic-gate 	while ((mp = getq(q)) != NULL) {
10117c478bd9Sstevel@tonic-gate 		/*
10127c478bd9Sstevel@tonic-gate 		 * Optimize the service procedure for the server-side, by
10137c478bd9Sstevel@tonic-gate 		 * avoiding a call to canputnext().
10147c478bd9Sstevel@tonic-gate 		 */
10157c478bd9Sstevel@tonic-gate 		if (rmp->rm_type == RPC_SERVER || canputnext(q)) {
10167c478bd9Sstevel@tonic-gate 			putnext(q, mp);
10177c478bd9Sstevel@tonic-gate 			continue;
10187c478bd9Sstevel@tonic-gate 		}
10197c478bd9Sstevel@tonic-gate 		(void) putbq(q, mp);
10207c478bd9Sstevel@tonic-gate 		return;
10217c478bd9Sstevel@tonic-gate 	}
10227c478bd9Sstevel@tonic-gate }
10237c478bd9Sstevel@tonic-gate 
10247c478bd9Sstevel@tonic-gate static void
10257c478bd9Sstevel@tonic-gate rpcmod_release(queue_t *q, mblk_t *bp)
10267c478bd9Sstevel@tonic-gate {
10277c478bd9Sstevel@tonic-gate 	struct rpcm *rmp;
10287c478bd9Sstevel@tonic-gate 
10297c478bd9Sstevel@tonic-gate 	/*
10307c478bd9Sstevel@tonic-gate 	 * For now, just free the message.
10317c478bd9Sstevel@tonic-gate 	 */
10327c478bd9Sstevel@tonic-gate 	if (bp)
10337c478bd9Sstevel@tonic-gate 		freemsg(bp);
10347c478bd9Sstevel@tonic-gate 	rmp = (struct rpcm *)q->q_ptr;
10357c478bd9Sstevel@tonic-gate 
10367c478bd9Sstevel@tonic-gate 	mutex_enter(&rmp->rm_lock);
10377c478bd9Sstevel@tonic-gate 	rmp->rm_ref--;
10387c478bd9Sstevel@tonic-gate 
10397c478bd9Sstevel@tonic-gate 	if (rmp->rm_ref == 0 && (rmp->rm_state & RM_CLOSING)) {
10407c478bd9Sstevel@tonic-gate 		cv_broadcast(&rmp->rm_cwait);
10417c478bd9Sstevel@tonic-gate 	}
10427c478bd9Sstevel@tonic-gate 
10437c478bd9Sstevel@tonic-gate 	mutex_exit(&rmp->rm_lock);
10447c478bd9Sstevel@tonic-gate }
10457c478bd9Sstevel@tonic-gate 
10467c478bd9Sstevel@tonic-gate /*
10477c478bd9Sstevel@tonic-gate  * This part of rpcmod is pushed on a connection-oriented transport for use
10487c478bd9Sstevel@tonic-gate  * by RPC.  It serves to bypass the Stream head, implements
10497c478bd9Sstevel@tonic-gate  * the record marking protocol, and dispatches incoming RPC messages.
10507c478bd9Sstevel@tonic-gate  */
10517c478bd9Sstevel@tonic-gate 
/* Default idle timer values, in milliseconds */
#define	MIR_CLNT_IDLE_TIMEOUT	(5 * (60 * 1000L))	/* 5 minutes */
#define	MIR_SVC_IDLE_TIMEOUT	(6 * (60 * 1000L))	/* 6 minutes */
#define	MIR_SVC_ORDREL_TIMEOUT	(10 * (60 * 1000L))	/* 10 minutes */
#define	MIR_LASTFRAG	0x80000000	/* Record marker */

/*
 * Data length of a message: msgdsize() when the message has continuation
 * blocks, otherwise the length of the single block.
 * NOTE: the argument is evaluated more than once; pass a side-effect free
 * expression.
 */
#define	DLEN(mp)	\
	((mp)->b_cont ? msgdsize(mp) : ((mp)->b_wptr - (mp)->b_rptr))

/*
 * True when there are no outstanding references on the mir and it is not
 * in the read service procedure.
 */
#define	MIR_SVC_QUIESCED(mir)	\
	((mir)->mir_ref_cnt == 0 && (mir)->mir_inrservice == 0)

/*
 * Clear the "in read service" flag and, for a closing server stream, signal
 * mir_condvar.  Expands to a braced block, not an expression.
 */
#define	MIR_CLEAR_INRSRV(mir_ptr)	{	\
	(mir_ptr)->mir_inrservice = 0;	\
	if ((mir_ptr)->mir_type == RPC_SERVER &&	\
		(mir_ptr)->mir_closing)	\
		cv_signal(&(mir_ptr)->mir_condvar);	\
}

/*
 * Don't block service procedure (and mir_close) if
 * we are in the process of closing.
 */
#define	MIR_WCANPUTNEXT(mir_ptr, write_q)	\
	(canputnext(write_q) || ((mir_ptr)->mir_svc_no_more_msgs == 1))
10767c478bd9Sstevel@tonic-gate 
/*
 * Forward declarations for the file-local routines of the
 * connection-oriented (mir_*) half of rpcmod.
 */
10777c478bd9Sstevel@tonic-gate static int	mir_clnt_dup_request(queue_t *q, mblk_t *mp);
10787c478bd9Sstevel@tonic-gate static void	mir_rput_proto(queue_t *q, mblk_t *mp);
10797c478bd9Sstevel@tonic-gate static int	mir_svc_policy_notify(queue_t *q, int event);
10807c478bd9Sstevel@tonic-gate static void	mir_svc_release(queue_t *wq, mblk_t *mp);
10817c478bd9Sstevel@tonic-gate static void	mir_svc_start(queue_t *wq);
10827c478bd9Sstevel@tonic-gate static void	mir_svc_idle_start(queue_t *, mir_t *);
10837c478bd9Sstevel@tonic-gate static void	mir_svc_idle_stop(queue_t *, mir_t *);
10847c478bd9Sstevel@tonic-gate static void	mir_svc_start_close(queue_t *, mir_t *);
10857c478bd9Sstevel@tonic-gate static void	mir_clnt_idle_do_stop(queue_t *);
10867c478bd9Sstevel@tonic-gate static void	mir_clnt_idle_stop(queue_t *, mir_t *);
10877c478bd9Sstevel@tonic-gate static void	mir_clnt_idle_start(queue_t *, mir_t *);
10887c478bd9Sstevel@tonic-gate static void	mir_wput(queue_t *q, mblk_t *mp);
10897c478bd9Sstevel@tonic-gate static void	mir_wput_other(queue_t *q, mblk_t *mp);
10907c478bd9Sstevel@tonic-gate static void	mir_wsrv(queue_t *q);
10917c478bd9Sstevel@tonic-gate static	void	mir_disconnect(queue_t *, mir_t *ir);
10927c478bd9Sstevel@tonic-gate static	int	mir_check_len(queue_t *, int32_t, mblk_t *);
10937c478bd9Sstevel@tonic-gate static	void	mir_timer(void *);
10947c478bd9Sstevel@tonic-gate 
/*
 * Function-pointer hooks defined outside this file.
 * NOTE(review): presumably set to the mir_* routines above when the module
 * is opened; the assignment is not visible in this part of the file.
 */
10957c478bd9Sstevel@tonic-gate extern void	(*mir_rele)(queue_t *, mblk_t *);
10967c478bd9Sstevel@tonic-gate extern void	(*mir_start)(queue_t *);
10977c478bd9Sstevel@tonic-gate extern void	(*clnt_stop_idle)(queue_t *);
10987c478bd9Sstevel@tonic-gate 
/* Idle timeouts, initialised from the MIR_*_IDLE_TIMEOUT defaults. */
10997c478bd9Sstevel@tonic-gate clock_t	clnt_idle_timeout = MIR_CLNT_IDLE_TIMEOUT;
11007c478bd9Sstevel@tonic-gate clock_t	svc_idle_timeout = MIR_SVC_IDLE_TIMEOUT;
11017c478bd9Sstevel@tonic-gate 
11027c478bd9Sstevel@tonic-gate /*
11037c478bd9Sstevel@tonic-gate  * Timeout for subsequent notifications of idle connection.  This is
11047c478bd9Sstevel@tonic-gate  * typically used to clean up after a wedged orderly release.
11057c478bd9Sstevel@tonic-gate  */
11067c478bd9Sstevel@tonic-gate clock_t	svc_ordrel_timeout = MIR_SVC_ORDREL_TIMEOUT; /* milliseconds */
11077c478bd9Sstevel@tonic-gate 
/*
 * Maximum message sizes, defaulting to RPC_MAXDATASIZE.
 * NOTE(review): the extern pointers presumably get aimed at the two
 * variables below elsewhere in the file -- confirm.
 */
11087c478bd9Sstevel@tonic-gate extern	uint_t	*clnt_max_msg_sizep;
11097c478bd9Sstevel@tonic-gate extern	uint_t	*svc_max_msg_sizep;
11107c478bd9Sstevel@tonic-gate uint_t	clnt_max_msg_size = RPC_MAXDATASIZE;
11117c478bd9Sstevel@tonic-gate uint_t	svc_max_msg_size = RPC_MAXDATASIZE;
/* NOTE(review): no use of mir_krpc_cell_null is visible in this chunk. */
11127c478bd9Sstevel@tonic-gate uint_t	mir_krpc_cell_null;
11137c478bd9Sstevel@tonic-gate 
11147c478bd9Sstevel@tonic-gate static void
11157c478bd9Sstevel@tonic-gate mir_timer_stop(mir_t *mir)
11167c478bd9Sstevel@tonic-gate {
11177c478bd9Sstevel@tonic-gate 	timeout_id_t tid;
11187c478bd9Sstevel@tonic-gate 
11197c478bd9Sstevel@tonic-gate 	ASSERT(MUTEX_HELD(&mir->mir_mutex));
11207c478bd9Sstevel@tonic-gate 
11217c478bd9Sstevel@tonic-gate 	/*
11227c478bd9Sstevel@tonic-gate 	 * Since the mir_mutex lock needs to be released to call
11237c478bd9Sstevel@tonic-gate 	 * untimeout(), we need to make sure that no other thread
11247c478bd9Sstevel@tonic-gate 	 * can start/stop the timer (changing mir_timer_id) during
11257c478bd9Sstevel@tonic-gate 	 * that time.  The mir_timer_call bit and the mir_timer_cv
11267c478bd9Sstevel@tonic-gate 	 * condition variable are used to synchronize this.  Setting
11277c478bd9Sstevel@tonic-gate 	 * mir_timer_call also tells mir_timer() (refer to the comments
11287c478bd9Sstevel@tonic-gate 	 * in mir_timer()) that it does not need to do anything.
11297c478bd9Sstevel@tonic-gate 	 */
11307c478bd9Sstevel@tonic-gate 	while (mir->mir_timer_call)
11317c478bd9Sstevel@tonic-gate 		cv_wait(&mir->mir_timer_cv, &mir->mir_mutex);
11327c478bd9Sstevel@tonic-gate 	mir->mir_timer_call = B_TRUE;
11337c478bd9Sstevel@tonic-gate 
11347c478bd9Sstevel@tonic-gate 	if ((tid = mir->mir_timer_id) != 0) {
11357c478bd9Sstevel@tonic-gate 		mir->mir_timer_id = 0;
11367c478bd9Sstevel@tonic-gate 		mutex_exit(&mir->mir_mutex);
11377c478bd9Sstevel@tonic-gate 		(void) untimeout(tid);
11387c478bd9Sstevel@tonic-gate 		mutex_enter(&mir->mir_mutex);
11397c478bd9Sstevel@tonic-gate 	}
11407c478bd9Sstevel@tonic-gate 	mir->mir_timer_call = B_FALSE;
11417c478bd9Sstevel@tonic-gate 	cv_broadcast(&mir->mir_timer_cv);
11427c478bd9Sstevel@tonic-gate }
11437c478bd9Sstevel@tonic-gate 
11447c478bd9Sstevel@tonic-gate static void
11457c478bd9Sstevel@tonic-gate mir_timer_start(queue_t *q, mir_t *mir, clock_t intrvl)
11467c478bd9Sstevel@tonic-gate {
11477c478bd9Sstevel@tonic-gate 	timeout_id_t tid;
11487c478bd9Sstevel@tonic-gate 
11497c478bd9Sstevel@tonic-gate 	ASSERT(MUTEX_HELD(&mir->mir_mutex));
11507c478bd9Sstevel@tonic-gate 
11517c478bd9Sstevel@tonic-gate 	while (mir->mir_timer_call)
11527c478bd9Sstevel@tonic-gate 		cv_wait(&mir->mir_timer_cv, &mir->mir_mutex);
11537c478bd9Sstevel@tonic-gate 	mir->mir_timer_call = B_TRUE;
11547c478bd9Sstevel@tonic-gate 
11557c478bd9Sstevel@tonic-gate 	if ((tid = mir->mir_timer_id) != 0) {
11567c478bd9Sstevel@tonic-gate 		mutex_exit(&mir->mir_mutex);
11577c478bd9Sstevel@tonic-gate 		(void) untimeout(tid);
11587c478bd9Sstevel@tonic-gate 		mutex_enter(&mir->mir_mutex);
11597c478bd9Sstevel@tonic-gate 	}
11607c478bd9Sstevel@tonic-gate 	/* Only start the timer when it is not closing. */
11617c478bd9Sstevel@tonic-gate 	if (!mir->mir_closing) {
11627c478bd9Sstevel@tonic-gate 		mir->mir_timer_id = timeout(mir_timer, q,
11637c478bd9Sstevel@tonic-gate 		    MSEC_TO_TICK(intrvl));
11647c478bd9Sstevel@tonic-gate 	}
11657c478bd9Sstevel@tonic-gate 	mir->mir_timer_call = B_FALSE;
11667c478bd9Sstevel@tonic-gate 	cv_broadcast(&mir->mir_timer_cv);
11677c478bd9Sstevel@tonic-gate }
11687c478bd9Sstevel@tonic-gate 
11697c478bd9Sstevel@tonic-gate static int
11707c478bd9Sstevel@tonic-gate mir_clnt_dup_request(queue_t *q, mblk_t *mp)
11717c478bd9Sstevel@tonic-gate {
11727c478bd9Sstevel@tonic-gate 	mblk_t  *mp1;
11737c478bd9Sstevel@tonic-gate 	uint32_t  new_xid;
11747c478bd9Sstevel@tonic-gate 	uint32_t  old_xid;
11757c478bd9Sstevel@tonic-gate 
11767c478bd9Sstevel@tonic-gate 	ASSERT(MUTEX_HELD(&((mir_t *)q->q_ptr)->mir_mutex));
11777c478bd9Sstevel@tonic-gate 	new_xid = BE32_TO_U32(&mp->b_rptr[4]);
11787c478bd9Sstevel@tonic-gate 	/*
11797c478bd9Sstevel@tonic-gate 	 * This loop is a bit tacky -- it walks the STREAMS list of
11807c478bd9Sstevel@tonic-gate 	 * flow-controlled messages.
11817c478bd9Sstevel@tonic-gate 	 */
11827c478bd9Sstevel@tonic-gate 	if ((mp1 = q->q_first) != NULL) {
11837c478bd9Sstevel@tonic-gate 		do {
11847c478bd9Sstevel@tonic-gate 			old_xid = BE32_TO_U32(&mp1->b_rptr[4]);
11857c478bd9Sstevel@tonic-gate 			if (new_xid == old_xid)
11867c478bd9Sstevel@tonic-gate 				return (1);
11877c478bd9Sstevel@tonic-gate 		} while ((mp1 = mp1->b_next) != NULL);
11887c478bd9Sstevel@tonic-gate 	}
11897c478bd9Sstevel@tonic-gate 	return (0);
11907c478bd9Sstevel@tonic-gate }
11917c478bd9Sstevel@tonic-gate 
11927c478bd9Sstevel@tonic-gate static int
11937c478bd9Sstevel@tonic-gate mir_close(queue_t *q)
11947c478bd9Sstevel@tonic-gate {
11957c478bd9Sstevel@tonic-gate 	mir_t	*mir;
11967c478bd9Sstevel@tonic-gate 	mblk_t	*mp;
11977c478bd9Sstevel@tonic-gate 	bool_t queue_cleaned = FALSE;
11987c478bd9Sstevel@tonic-gate 
11997c478bd9Sstevel@tonic-gate 	RPCLOG(32, "rpcmod: mir_close of q 0x%p\n", (void *)q);
12007c478bd9Sstevel@tonic-gate 	mir = (mir_t *)q->q_ptr;
12017c478bd9Sstevel@tonic-gate 	ASSERT(MUTEX_NOT_HELD(&mir->mir_mutex));
12027c478bd9Sstevel@tonic-gate 	mutex_enter(&mir->mir_mutex);
12037c478bd9Sstevel@tonic-gate 	if ((mp = mir->mir_head_mp) != NULL) {
12047c478bd9Sstevel@tonic-gate 		mir->mir_head_mp = (mblk_t *)0;
12057c478bd9Sstevel@tonic-gate 		freemsg(mp);
12067c478bd9Sstevel@tonic-gate 	}
12077c478bd9Sstevel@tonic-gate 	/*
12087c478bd9Sstevel@tonic-gate 	 * Set mir_closing so we get notified when MIR_SVC_QUIESCED()
12097c478bd9Sstevel@tonic-gate 	 * is TRUE.  And mir_timer_start() won't start the timer again.
12107c478bd9Sstevel@tonic-gate 	 */
12117c478bd9Sstevel@tonic-gate 	mir->mir_closing = B_TRUE;
12127c478bd9Sstevel@tonic-gate 	mir_timer_stop(mir);
12137c478bd9Sstevel@tonic-gate 
12147c478bd9Sstevel@tonic-gate 	if (mir->mir_type == RPC_SERVER) {
12157c478bd9Sstevel@tonic-gate 		flushq(q, FLUSHDATA);	/* Ditch anything waiting on read q */
12167c478bd9Sstevel@tonic-gate 
12177c478bd9Sstevel@tonic-gate 		/*
12187c478bd9Sstevel@tonic-gate 		 * This will prevent more requests from arriving and
12197c478bd9Sstevel@tonic-gate 		 * will force rpcmod to ignore flow control.
12207c478bd9Sstevel@tonic-gate 		 */
12217c478bd9Sstevel@tonic-gate 		mir_svc_start_close(WR(q), mir);
12227c478bd9Sstevel@tonic-gate 
12237c478bd9Sstevel@tonic-gate 		while ((!MIR_SVC_QUIESCED(mir)) || mir->mir_inwservice == 1) {
12247c478bd9Sstevel@tonic-gate 
12257c478bd9Sstevel@tonic-gate 			if (mir->mir_ref_cnt && !mir->mir_inrservice &&
12267c478bd9Sstevel@tonic-gate 			    (queue_cleaned == FALSE)) {
12277c478bd9Sstevel@tonic-gate 				/*
12287c478bd9Sstevel@tonic-gate 				 * call into SVC to clean the queue
12297c478bd9Sstevel@tonic-gate 				 */
12307c478bd9Sstevel@tonic-gate 				mutex_exit(&mir->mir_mutex);
12317c478bd9Sstevel@tonic-gate 				svc_queueclean(q);
12327c478bd9Sstevel@tonic-gate 				queue_cleaned = TRUE;
12337c478bd9Sstevel@tonic-gate 				mutex_enter(&mir->mir_mutex);
12347c478bd9Sstevel@tonic-gate 				continue;
12357c478bd9Sstevel@tonic-gate 			}
12367c478bd9Sstevel@tonic-gate 
12377c478bd9Sstevel@tonic-gate 			/*
12387c478bd9Sstevel@tonic-gate 			 * Bugid 1253810 - Force the write service
12397c478bd9Sstevel@tonic-gate 			 * procedure to send its messages, regardless
12407c478bd9Sstevel@tonic-gate 			 * whether the downstream  module is ready
12417c478bd9Sstevel@tonic-gate 			 * to accept data.
12427c478bd9Sstevel@tonic-gate 			 */
12437c478bd9Sstevel@tonic-gate 			if (mir->mir_inwservice == 1)
12447c478bd9Sstevel@tonic-gate 				qenable(WR(q));
12457c478bd9Sstevel@tonic-gate 
12467c478bd9Sstevel@tonic-gate 			cv_wait(&mir->mir_condvar, &mir->mir_mutex);
12477c478bd9Sstevel@tonic-gate 		}
12487c478bd9Sstevel@tonic-gate 
12497c478bd9Sstevel@tonic-gate 		mutex_exit(&mir->mir_mutex);
12507c478bd9Sstevel@tonic-gate 		qprocsoff(q);
12517c478bd9Sstevel@tonic-gate 
12527c478bd9Sstevel@tonic-gate 		/* Notify KRPC that this stream is going away. */
12537c478bd9Sstevel@tonic-gate 		svc_queueclose(q);
12547c478bd9Sstevel@tonic-gate 	} else {
12557c478bd9Sstevel@tonic-gate 		mutex_exit(&mir->mir_mutex);
12567c478bd9Sstevel@tonic-gate 		qprocsoff(q);
12577c478bd9Sstevel@tonic-gate 	}
12587c478bd9Sstevel@tonic-gate 
12597c478bd9Sstevel@tonic-gate 	mutex_destroy(&mir->mir_mutex);
12607c478bd9Sstevel@tonic-gate 	cv_destroy(&mir->mir_condvar);
12617c478bd9Sstevel@tonic-gate 	cv_destroy(&mir->mir_timer_cv);
12627c478bd9Sstevel@tonic-gate 	kmem_free(mir, sizeof (mir_t));
12637c478bd9Sstevel@tonic-gate 	return (0);
12647c478bd9Sstevel@tonic-gate }
12657c478bd9Sstevel@tonic-gate 
12667c478bd9Sstevel@tonic-gate /*
12677c478bd9Sstevel@tonic-gate  * This is server side only (RPC_SERVER).
12687c478bd9Sstevel@tonic-gate  *
12697c478bd9Sstevel@tonic-gate  * Exit idle mode.
12707c478bd9Sstevel@tonic-gate  */
12717c478bd9Sstevel@tonic-gate static void
12727c478bd9Sstevel@tonic-gate mir_svc_idle_stop(queue_t *q, mir_t *mir)
12737c478bd9Sstevel@tonic-gate {
12747c478bd9Sstevel@tonic-gate 	ASSERT(MUTEX_HELD(&mir->mir_mutex));
12757c478bd9Sstevel@tonic-gate 	ASSERT((q->q_flag & QREADR) == 0);
12767c478bd9Sstevel@tonic-gate 	ASSERT(mir->mir_type == RPC_SERVER);
12777c478bd9Sstevel@tonic-gate 	RPCLOG(16, "rpcmod: mir_svc_idle_stop of q 0x%p\n", (void *)q);
12787c478bd9Sstevel@tonic-gate 
12797c478bd9Sstevel@tonic-gate 	mir_timer_stop(mir);
12807c478bd9Sstevel@tonic-gate }
12817c478bd9Sstevel@tonic-gate 
12827c478bd9Sstevel@tonic-gate /*
12837c478bd9Sstevel@tonic-gate  * This is server side only (RPC_SERVER).
12847c478bd9Sstevel@tonic-gate  *
12857c478bd9Sstevel@tonic-gate  * Start idle processing, which will include setting idle timer if the
12867c478bd9Sstevel@tonic-gate  * stream is not being closed.
12877c478bd9Sstevel@tonic-gate  */
12887c478bd9Sstevel@tonic-gate static void
12897c478bd9Sstevel@tonic-gate mir_svc_idle_start(queue_t *q, mir_t *mir)
12907c478bd9Sstevel@tonic-gate {
12917c478bd9Sstevel@tonic-gate 	ASSERT(MUTEX_HELD(&mir->mir_mutex));
12927c478bd9Sstevel@tonic-gate 	ASSERT((q->q_flag & QREADR) == 0);
12937c478bd9Sstevel@tonic-gate 	ASSERT(mir->mir_type == RPC_SERVER);
12947c478bd9Sstevel@tonic-gate 	RPCLOG(16, "rpcmod: mir_svc_idle_start q 0x%p\n", (void *)q);
12957c478bd9Sstevel@tonic-gate 
12967c478bd9Sstevel@tonic-gate 	/*
12977c478bd9Sstevel@tonic-gate 	 * Don't re-start idle timer if we are closing queues.
12987c478bd9Sstevel@tonic-gate 	 */
12997c478bd9Sstevel@tonic-gate 	if (mir->mir_closing) {
13007c478bd9Sstevel@tonic-gate 		RPCLOG(16, "mir_svc_idle_start - closing: 0x%p\n",
13017c478bd9Sstevel@tonic-gate 		    (void *)q);
13027c478bd9Sstevel@tonic-gate 
13037c478bd9Sstevel@tonic-gate 		/*
13047c478bd9Sstevel@tonic-gate 		 * We will call mir_svc_idle_start() whenever MIR_SVC_QUIESCED()
13057c478bd9Sstevel@tonic-gate 		 * is true.  When it is true, and we are in the process of
13067c478bd9Sstevel@tonic-gate 		 * closing the stream, signal any thread waiting in
13077c478bd9Sstevel@tonic-gate 		 * mir_close().
13087c478bd9Sstevel@tonic-gate 		 */
13097c478bd9Sstevel@tonic-gate 		if (mir->mir_inwservice == 0)
13107c478bd9Sstevel@tonic-gate 			cv_signal(&mir->mir_condvar);
13117c478bd9Sstevel@tonic-gate 
13127c478bd9Sstevel@tonic-gate 	} else {
13137c478bd9Sstevel@tonic-gate 		RPCLOG(16, "mir_svc_idle_start - reset %s timer\n",
13147c478bd9Sstevel@tonic-gate 		    mir->mir_ordrel_pending ? "ordrel" : "normal");
13157c478bd9Sstevel@tonic-gate 		/*
13167c478bd9Sstevel@tonic-gate 		 * Normal condition, start the idle timer.  If an orderly
13177c478bd9Sstevel@tonic-gate 		 * release has been sent, set the timeout to wait for the
13187c478bd9Sstevel@tonic-gate 		 * client to close its side of the connection.  Otherwise,
13197c478bd9Sstevel@tonic-gate 		 * use the normal idle timeout.
13207c478bd9Sstevel@tonic-gate 		 */
13217c478bd9Sstevel@tonic-gate 		mir_timer_start(q, mir, mir->mir_ordrel_pending ?
13227c478bd9Sstevel@tonic-gate 		    svc_ordrel_timeout : mir->mir_idle_timeout);
13237c478bd9Sstevel@tonic-gate 	}
13247c478bd9Sstevel@tonic-gate }
13257c478bd9Sstevel@tonic-gate 
13267c478bd9Sstevel@tonic-gate /* ARGSUSED */
13277c478bd9Sstevel@tonic-gate static int
13287c478bd9Sstevel@tonic-gate mir_open(queue_t *q, dev_t *devp, int flag, int sflag, cred_t *credp)
13297c478bd9Sstevel@tonic-gate {
13307c478bd9Sstevel@tonic-gate 	mir_t	*mir;
13317c478bd9Sstevel@tonic-gate 
13327c478bd9Sstevel@tonic-gate 	RPCLOG(32, "rpcmod: mir_open of q 0x%p\n", (void *)q);
13337c478bd9Sstevel@tonic-gate 	/* Set variables used directly by KRPC. */
13347c478bd9Sstevel@tonic-gate 	if (!mir_rele)
13357c478bd9Sstevel@tonic-gate 		mir_rele = mir_svc_release;
13367c478bd9Sstevel@tonic-gate 	if (!mir_start)
13377c478bd9Sstevel@tonic-gate 		mir_start = mir_svc_start;
13387c478bd9Sstevel@tonic-gate 	if (!clnt_stop_idle)
13397c478bd9Sstevel@tonic-gate 		clnt_stop_idle = mir_clnt_idle_do_stop;
13407c478bd9Sstevel@tonic-gate 	if (!clnt_max_msg_sizep)
13417c478bd9Sstevel@tonic-gate 		clnt_max_msg_sizep = &clnt_max_msg_size;
13427c478bd9Sstevel@tonic-gate 	if (!svc_max_msg_sizep)
13437c478bd9Sstevel@tonic-gate 		svc_max_msg_sizep = &svc_max_msg_size;
13447c478bd9Sstevel@tonic-gate 
13457c478bd9Sstevel@tonic-gate 	/* Allocate a zero'ed out mir structure for this stream. */
13467c478bd9Sstevel@tonic-gate 	mir = kmem_zalloc(sizeof (mir_t), KM_SLEEP);
13477c478bd9Sstevel@tonic-gate 
13487c478bd9Sstevel@tonic-gate 	/*
13497c478bd9Sstevel@tonic-gate 	 * We set hold inbound here so that incoming messages will
13507c478bd9Sstevel@tonic-gate 	 * be held on the read-side queue until the stream is completely
13517c478bd9Sstevel@tonic-gate 	 * initialized with a RPC_CLIENT or RPC_SERVER ioctl.  During
13527c478bd9Sstevel@tonic-gate 	 * the ioctl processing, the flag is cleared and any messages that
13537c478bd9Sstevel@tonic-gate 	 * arrived between the open and the ioctl are delivered to KRPC.
13547c478bd9Sstevel@tonic-gate 	 *
13557c478bd9Sstevel@tonic-gate 	 * Early data should never arrive on a client stream since
13567c478bd9Sstevel@tonic-gate 	 * servers only respond to our requests and we do not send any.
13577c478bd9Sstevel@tonic-gate 	 * until after the stream is initialized.  Early data is
13587c478bd9Sstevel@tonic-gate 	 * very common on a server stream where the client will start
13597c478bd9Sstevel@tonic-gate 	 * sending data as soon as the connection is made (and this
13607c478bd9Sstevel@tonic-gate 	 * is especially true with TCP where the protocol accepts the
13617c478bd9Sstevel@tonic-gate 	 * connection before nfsd or KRPC is notified about it).
13627c478bd9Sstevel@tonic-gate 	 */
13637c478bd9Sstevel@tonic-gate 
13647c478bd9Sstevel@tonic-gate 	mir->mir_hold_inbound = 1;
13657c478bd9Sstevel@tonic-gate 
13667c478bd9Sstevel@tonic-gate 	/*
13677c478bd9Sstevel@tonic-gate 	 * Start the record marker looking for a 4-byte header.  When
13687c478bd9Sstevel@tonic-gate 	 * this length is negative, it indicates that rpcmod is looking
13697c478bd9Sstevel@tonic-gate 	 * for bytes to consume for the record marker header.  When it
13707c478bd9Sstevel@tonic-gate 	 * is positive, it holds the number of bytes that have arrived
13717c478bd9Sstevel@tonic-gate 	 * for the current fragment and are being held in mir_header_mp.
13727c478bd9Sstevel@tonic-gate 	 */
13737c478bd9Sstevel@tonic-gate 
13747c478bd9Sstevel@tonic-gate 	mir->mir_frag_len = -(int32_t)sizeof (uint32_t);
13757c478bd9Sstevel@tonic-gate 
1376108322fbScarlsonj 	mir->mir_zoneid = rpc_zoneid();
13777c478bd9Sstevel@tonic-gate 	mutex_init(&mir->mir_mutex, NULL, MUTEX_DEFAULT, NULL);
13787c478bd9Sstevel@tonic-gate 	cv_init(&mir->mir_condvar, NULL, CV_DRIVER, NULL);
13797c478bd9Sstevel@tonic-gate 	cv_init(&mir->mir_timer_cv, NULL, CV_DRIVER, NULL);
13807c478bd9Sstevel@tonic-gate 
13817c478bd9Sstevel@tonic-gate 	q->q_ptr = (char *)mir;
13827c478bd9Sstevel@tonic-gate 	WR(q)->q_ptr = (char *)mir;
13837c478bd9Sstevel@tonic-gate 
13847c478bd9Sstevel@tonic-gate 	/*
13857c478bd9Sstevel@tonic-gate 	 * We noenable the read-side queue because we don't want it
13867c478bd9Sstevel@tonic-gate 	 * automatically enabled by putq.  We enable it explicitly
13877c478bd9Sstevel@tonic-gate 	 * in mir_wsrv when appropriate. (See additional comments on
13887c478bd9Sstevel@tonic-gate 	 * flow control at the beginning of mir_rsrv.)
13897c478bd9Sstevel@tonic-gate 	 */
13907c478bd9Sstevel@tonic-gate 	noenable(q);
13917c478bd9Sstevel@tonic-gate 
13927c478bd9Sstevel@tonic-gate 	qprocson(q);
13937c478bd9Sstevel@tonic-gate 	return (0);
13947c478bd9Sstevel@tonic-gate }
13957c478bd9Sstevel@tonic-gate 
13967c478bd9Sstevel@tonic-gate /*
13977c478bd9Sstevel@tonic-gate  * Read-side put routine for both the client and server side.  Does the
13987c478bd9Sstevel@tonic-gate  * record marking for incoming RPC messages, and when complete, dispatches
13997c478bd9Sstevel@tonic-gate  * the message to either the client or server.
14007c478bd9Sstevel@tonic-gate  */
14017c478bd9Sstevel@tonic-gate static void
14027c478bd9Sstevel@tonic-gate mir_do_rput(queue_t *q, mblk_t *mp, int srv)
14037c478bd9Sstevel@tonic-gate {
14047c478bd9Sstevel@tonic-gate 	mblk_t	*cont_mp;
14057c478bd9Sstevel@tonic-gate 	int	excess;
14067c478bd9Sstevel@tonic-gate 	int32_t	frag_len;
14077c478bd9Sstevel@tonic-gate 	int32_t	frag_header;
14087c478bd9Sstevel@tonic-gate 	mblk_t	*head_mp;
14097c478bd9Sstevel@tonic-gate 	int	len;
14107c478bd9Sstevel@tonic-gate 	mir_t	*mir;
14117c478bd9Sstevel@tonic-gate 	mblk_t	*mp1;
14127c478bd9Sstevel@tonic-gate 	unsigned char	*rptr;
14137c478bd9Sstevel@tonic-gate 	mblk_t	*tail_mp;
14147c478bd9Sstevel@tonic-gate 	unsigned char	*wptr;
14157c478bd9Sstevel@tonic-gate 	boolean_t	stop_timer = B_FALSE;
14167c478bd9Sstevel@tonic-gate 
14177c478bd9Sstevel@tonic-gate 	mir = (mir_t *)q->q_ptr;
14187c478bd9Sstevel@tonic-gate 	ASSERT(mir != NULL);
14197c478bd9Sstevel@tonic-gate 
14207c478bd9Sstevel@tonic-gate 	/*
14217c478bd9Sstevel@tonic-gate 	 * If the stream has not been set up as a RPC_CLIENT or RPC_SERVER
14227c478bd9Sstevel@tonic-gate 	 * with the corresponding ioctl, then don't accept
14237c478bd9Sstevel@tonic-gate 	 * any inbound data.  This should never happen for streams
14247c478bd9Sstevel@tonic-gate 	 * created by nfsd or client-side KRPC because they are careful
14257c478bd9Sstevel@tonic-gate 	 * to set the mode of the stream before doing anything else.
14267c478bd9Sstevel@tonic-gate 	 */
14277c478bd9Sstevel@tonic-gate 	if (mir->mir_type == 0) {
14287c478bd9Sstevel@tonic-gate 		freemsg(mp);
14297c478bd9Sstevel@tonic-gate 		return;
14307c478bd9Sstevel@tonic-gate 	}
14317c478bd9Sstevel@tonic-gate 
14327c478bd9Sstevel@tonic-gate 	ASSERT(MUTEX_NOT_HELD(&mir->mir_mutex));
14337c478bd9Sstevel@tonic-gate 
14347c478bd9Sstevel@tonic-gate 	switch (mp->b_datap->db_type) {
14357c478bd9Sstevel@tonic-gate 	case M_DATA:
14367c478bd9Sstevel@tonic-gate 		break;
14377c478bd9Sstevel@tonic-gate 	case M_PROTO:
14387c478bd9Sstevel@tonic-gate 	case M_PCPROTO:
14397c478bd9Sstevel@tonic-gate 		rptr = mp->b_rptr;
14407c478bd9Sstevel@tonic-gate 		if (mp->b_wptr - rptr < sizeof (uint32_t)) {
14417c478bd9Sstevel@tonic-gate 			RPCLOG(1, "mir_rput: runt TPI message (%d bytes)\n",
14427c478bd9Sstevel@tonic-gate 			    (int)(mp->b_wptr - rptr));
14437c478bd9Sstevel@tonic-gate 			freemsg(mp);
14447c478bd9Sstevel@tonic-gate 			return;
14457c478bd9Sstevel@tonic-gate 		}
14467c478bd9Sstevel@tonic-gate 		if (((union T_primitives *)rptr)->type != T_DATA_IND) {
14477c478bd9Sstevel@tonic-gate 			mir_rput_proto(q, mp);
14487c478bd9Sstevel@tonic-gate 			return;
14497c478bd9Sstevel@tonic-gate 		}
14507c478bd9Sstevel@tonic-gate 
14517c478bd9Sstevel@tonic-gate 		/* Throw away the T_DATA_IND block and continue with data. */
14527c478bd9Sstevel@tonic-gate 		mp1 = mp;
14537c478bd9Sstevel@tonic-gate 		mp = mp->b_cont;
14547c478bd9Sstevel@tonic-gate 		freeb(mp1);
14557c478bd9Sstevel@tonic-gate 		break;
14567c478bd9Sstevel@tonic-gate 	case M_SETOPTS:
14577c478bd9Sstevel@tonic-gate 		/*
14587c478bd9Sstevel@tonic-gate 		 * If a module on the stream is trying to set the Stream head's
14597c478bd9Sstevel@tonic-gate 		 * high water mark, then set our hiwater to the requested
14607c478bd9Sstevel@tonic-gate 		 * value.  We are the "stream head" for all inbound
14617c478bd9Sstevel@tonic-gate 		 * data messages since messages are passed directly to KRPC.
14627c478bd9Sstevel@tonic-gate 		 */
14637c478bd9Sstevel@tonic-gate 		if ((mp->b_wptr - mp->b_rptr) >= sizeof (struct stroptions)) {
14647c478bd9Sstevel@tonic-gate 			struct stroptions	*stropts;
14657c478bd9Sstevel@tonic-gate 
14667c478bd9Sstevel@tonic-gate 			stropts = (struct stroptions *)mp->b_rptr;
14677c478bd9Sstevel@tonic-gate 			if ((stropts->so_flags & SO_HIWAT) &&
14687c478bd9Sstevel@tonic-gate 			    !(stropts->so_flags & SO_BAND)) {
14697c478bd9Sstevel@tonic-gate 				(void) strqset(q, QHIWAT, 0, stropts->so_hiwat);
14707c478bd9Sstevel@tonic-gate 			}
14717c478bd9Sstevel@tonic-gate 		}
14727c478bd9Sstevel@tonic-gate 		putnext(q, mp);
14737c478bd9Sstevel@tonic-gate 		return;
14747c478bd9Sstevel@tonic-gate 	case M_FLUSH:
14757c478bd9Sstevel@tonic-gate 		RPCLOG(32, "mir_do_rput: ignoring M_FLUSH on q 0x%p. ",
14767c478bd9Sstevel@tonic-gate 		    (void *)q);
14777c478bd9Sstevel@tonic-gate 		RPCLOG(32, "M_FLUSH is %x\n", (uint_t)*mp->b_rptr);
14787c478bd9Sstevel@tonic-gate 
14797c478bd9Sstevel@tonic-gate 		putnext(q, mp);
14807c478bd9Sstevel@tonic-gate 		return;
14817c478bd9Sstevel@tonic-gate 	default:
14827c478bd9Sstevel@tonic-gate 		putnext(q, mp);
14837c478bd9Sstevel@tonic-gate 		return;
14847c478bd9Sstevel@tonic-gate 	}
14857c478bd9Sstevel@tonic-gate 
14867c478bd9Sstevel@tonic-gate 	mutex_enter(&mir->mir_mutex);
14877c478bd9Sstevel@tonic-gate 
14887c478bd9Sstevel@tonic-gate 	/*
14897c478bd9Sstevel@tonic-gate 	 * If this connection is closing, don't accept any new messages.
14907c478bd9Sstevel@tonic-gate 	 */
14917c478bd9Sstevel@tonic-gate 	if (mir->mir_svc_no_more_msgs) {
14927c478bd9Sstevel@tonic-gate 		ASSERT(mir->mir_type == RPC_SERVER);
14937c478bd9Sstevel@tonic-gate 		mutex_exit(&mir->mir_mutex);
14947c478bd9Sstevel@tonic-gate 		freemsg(mp);
14957c478bd9Sstevel@tonic-gate 		return;
14967c478bd9Sstevel@tonic-gate 	}
14977c478bd9Sstevel@tonic-gate 
14987c478bd9Sstevel@tonic-gate 	/* Get local copies for quicker access. */
14997c478bd9Sstevel@tonic-gate 	frag_len = mir->mir_frag_len;
15007c478bd9Sstevel@tonic-gate 	frag_header = mir->mir_frag_header;
15017c478bd9Sstevel@tonic-gate 	head_mp = mir->mir_head_mp;
15027c478bd9Sstevel@tonic-gate 	tail_mp = mir->mir_tail_mp;
15037c478bd9Sstevel@tonic-gate 
15047c478bd9Sstevel@tonic-gate 	/* Loop, processing each message block in the mp chain separately. */
15057c478bd9Sstevel@tonic-gate 	do {
15067c478bd9Sstevel@tonic-gate 		/*
15077c478bd9Sstevel@tonic-gate 		 * cont_mp is used in the do/while condition below to
15087c478bd9Sstevel@tonic-gate 		 * walk to the next block in the STREAMS message.
15097c478bd9Sstevel@tonic-gate 		 * mp->b_cont may be nil'ed during processing so we
15107c478bd9Sstevel@tonic-gate 		 * can't rely on it to find the next block.
15117c478bd9Sstevel@tonic-gate 		 */
15127c478bd9Sstevel@tonic-gate 		cont_mp = mp->b_cont;
15137c478bd9Sstevel@tonic-gate 
15147c478bd9Sstevel@tonic-gate 		/*
15157c478bd9Sstevel@tonic-gate 		 * Get local copies of rptr and wptr for our processing.
15167c478bd9Sstevel@tonic-gate 		 * These always point into "mp" (the current block being
15177c478bd9Sstevel@tonic-gate 		 * processed), but rptr is updated as we consume any
15187c478bd9Sstevel@tonic-gate 		 * record header in this message, and wptr is updated to
15197c478bd9Sstevel@tonic-gate 		 * point to the end of the data for the current fragment,
15207c478bd9Sstevel@tonic-gate 		 * if it ends in this block.  The main point is that
15217c478bd9Sstevel@tonic-gate 		 * they are not always the same as b_rptr and b_wptr.
15227c478bd9Sstevel@tonic-gate 		 * b_rptr and b_wptr will be updated when appropriate.
15237c478bd9Sstevel@tonic-gate 		 */
15247c478bd9Sstevel@tonic-gate 		rptr = mp->b_rptr;
15257c478bd9Sstevel@tonic-gate 		wptr = mp->b_wptr;
15267c478bd9Sstevel@tonic-gate same_mblk:;
15277c478bd9Sstevel@tonic-gate 		len = (int)(wptr - rptr);
15287c478bd9Sstevel@tonic-gate 		if (len <= 0) {
15297c478bd9Sstevel@tonic-gate 			/*
15307c478bd9Sstevel@tonic-gate 			 * If we have processed all of the data in the message
15317c478bd9Sstevel@tonic-gate 			 * or the block is empty to begin with, then we're
15327c478bd9Sstevel@tonic-gate 			 * done with this block and can go on to cont_mp,
15337c478bd9Sstevel@tonic-gate 			 * if there is one.
15347c478bd9Sstevel@tonic-gate 			 *
15357c478bd9Sstevel@tonic-gate 			 * First, we check to see if the current block is
15367c478bd9Sstevel@tonic-gate 			 * now zero-length and, if so, we free it.
15377c478bd9Sstevel@tonic-gate 			 * This happens when either the block was empty
15387c478bd9Sstevel@tonic-gate 			 * to begin with or we consumed all of the data
15397c478bd9Sstevel@tonic-gate 			 * for the record marking header.
15407c478bd9Sstevel@tonic-gate 			 */
15417c478bd9Sstevel@tonic-gate 			if (rptr <= mp->b_rptr) {
15427c478bd9Sstevel@tonic-gate 				/*
15437c478bd9Sstevel@tonic-gate 				 * If head_mp is non-NULL, add cont_mp to the
15447c478bd9Sstevel@tonic-gate 				 * mblk list. XXX But there is a possibility
15457c478bd9Sstevel@tonic-gate 				 * that tail_mp = mp or even head_mp = mp XXX
15467c478bd9Sstevel@tonic-gate 				 */
15477c478bd9Sstevel@tonic-gate 				if (head_mp) {
15487c478bd9Sstevel@tonic-gate 					if (head_mp == mp)
15497c478bd9Sstevel@tonic-gate 						head_mp = NULL;
15507c478bd9Sstevel@tonic-gate 					else if (tail_mp != mp) {
15517c478bd9Sstevel@tonic-gate 		ASSERT((tail_mp->b_cont == NULL) || (tail_mp->b_cont == mp));
15527c478bd9Sstevel@tonic-gate 						tail_mp->b_cont = cont_mp;
15537c478bd9Sstevel@tonic-gate 						/*
15547c478bd9Sstevel@tonic-gate 						 * It's possible that, because
15557c478bd9Sstevel@tonic-gate 						 * of a very short mblk (0-3
15567c478bd9Sstevel@tonic-gate 						 * bytes), we've ended up here
15577c478bd9Sstevel@tonic-gate 						 * and that cont_mp could be
15587c478bd9Sstevel@tonic-gate 						 * NULL (if we're at the end
15597c478bd9Sstevel@tonic-gate 						 * of an mblk chain). If so,
15607c478bd9Sstevel@tonic-gate 						 * don't set tail_mp to
15617c478bd9Sstevel@tonic-gate 						 * cont_mp, because the next
15627c478bd9Sstevel@tonic-gate 						 * time we access it, we'll
15637c478bd9Sstevel@tonic-gate 						 * dereference a NULL pointer
15647c478bd9Sstevel@tonic-gate 						 * and crash. Just leave
15657c478bd9Sstevel@tonic-gate 						 * tail_mp pointing at the
15667c478bd9Sstevel@tonic-gate 						 * current end of chain.
15677c478bd9Sstevel@tonic-gate 						 */
15687c478bd9Sstevel@tonic-gate 						if (cont_mp)
15697c478bd9Sstevel@tonic-gate 							tail_mp = cont_mp;
15707c478bd9Sstevel@tonic-gate 					} else {
15717c478bd9Sstevel@tonic-gate 						mblk_t *smp = head_mp;
15727c478bd9Sstevel@tonic-gate 
15737c478bd9Sstevel@tonic-gate 						while ((smp->b_cont != NULL) &&
15747c478bd9Sstevel@tonic-gate 						    (smp->b_cont != mp))
15757c478bd9Sstevel@tonic-gate 							smp = smp->b_cont;
15767c478bd9Sstevel@tonic-gate 						smp->b_cont = cont_mp;
15777c478bd9Sstevel@tonic-gate 						/*
15787c478bd9Sstevel@tonic-gate 						 * Don't set tail_mp to cont_mp
15797c478bd9Sstevel@tonic-gate 						 * if it's NULL. Instead, set
15807c478bd9Sstevel@tonic-gate 						 * tail_mp to smp, which is the
15817c478bd9Sstevel@tonic-gate 						 * end of the chain starting
15827c478bd9Sstevel@tonic-gate 						 * at head_mp.
15837c478bd9Sstevel@tonic-gate 						 */
15847c478bd9Sstevel@tonic-gate 						if (cont_mp)
15857c478bd9Sstevel@tonic-gate 							tail_mp = cont_mp;
15867c478bd9Sstevel@tonic-gate 						else
15877c478bd9Sstevel@tonic-gate 							tail_mp = smp;
15887c478bd9Sstevel@tonic-gate 					}
15897c478bd9Sstevel@tonic-gate 				}
15907c478bd9Sstevel@tonic-gate 				freeb(mp);
15917c478bd9Sstevel@tonic-gate 			}
15927c478bd9Sstevel@tonic-gate 			continue;
15937c478bd9Sstevel@tonic-gate 		}
15947c478bd9Sstevel@tonic-gate 
15957c478bd9Sstevel@tonic-gate 		/*
15967c478bd9Sstevel@tonic-gate 		 * frag_len starts at -4 and is incremented past the record
15977c478bd9Sstevel@tonic-gate 		 * marking header to 0, and then becomes positive as real data
15987c478bd9Sstevel@tonic-gate 		 * bytes are received for the message.  While frag_len is less
15997c478bd9Sstevel@tonic-gate 		 * than zero, we need more bytes for the record marking
16007c478bd9Sstevel@tonic-gate 		 * header.
16017c478bd9Sstevel@tonic-gate 		 */
16027c478bd9Sstevel@tonic-gate 		if (frag_len < 0) {
16037c478bd9Sstevel@tonic-gate 			uchar_t	*up = rptr;
16047c478bd9Sstevel@tonic-gate 			/*
16057c478bd9Sstevel@tonic-gate 			 * Collect as many bytes as we need for the record
16067c478bd9Sstevel@tonic-gate 			 * marking header and that are available in this block.
16077c478bd9Sstevel@tonic-gate 			 */
16087c478bd9Sstevel@tonic-gate 			do {
16097c478bd9Sstevel@tonic-gate 				--len;
16107c478bd9Sstevel@tonic-gate 				frag_len++;
16117c478bd9Sstevel@tonic-gate 				frag_header <<= 8;
16127c478bd9Sstevel@tonic-gate 				frag_header += (*up++ & 0xFF);
16137c478bd9Sstevel@tonic-gate 			} while (len > 0 && frag_len < 0);
16147c478bd9Sstevel@tonic-gate 
16157c478bd9Sstevel@tonic-gate 			if (rptr == mp->b_rptr) {
16167c478bd9Sstevel@tonic-gate 				/*
16177c478bd9Sstevel@tonic-gate 				 * The record header is located at the
16187c478bd9Sstevel@tonic-gate 				 * beginning of the block, so just walk
16197c478bd9Sstevel@tonic-gate 				 * b_rptr past it.
16207c478bd9Sstevel@tonic-gate 				 */
16217c478bd9Sstevel@tonic-gate 				mp->b_rptr = rptr = up;
16227c478bd9Sstevel@tonic-gate 			} else {
16237c478bd9Sstevel@tonic-gate 				/*
16247c478bd9Sstevel@tonic-gate 				 * The record header is located in the middle
16257c478bd9Sstevel@tonic-gate 				 * of a block, so copy any remaining data up.
16267c478bd9Sstevel@tonic-gate 				 * This happens when an RPC message is
16277c478bd9Sstevel@tonic-gate 				 * fragmented into multiple pieces and
16287c478bd9Sstevel@tonic-gate 				 * a middle (or end) fragment immediately
16297c478bd9Sstevel@tonic-gate 				 * follows a previous fragment in the same
16307c478bd9Sstevel@tonic-gate 				 * message block.
16317c478bd9Sstevel@tonic-gate 				 */
16327c478bd9Sstevel@tonic-gate 				wptr = &rptr[len];
16337c478bd9Sstevel@tonic-gate 				mp->b_wptr = wptr;
16347c478bd9Sstevel@tonic-gate 				if (len) {
16357c478bd9Sstevel@tonic-gate 					RPCLOG(32, "mir_do_rput: copying %d "
16367c478bd9Sstevel@tonic-gate 					    "bytes of data up", len);
16377c478bd9Sstevel@tonic-gate 					RPCLOG(32, " db_ref %d\n",
16387c478bd9Sstevel@tonic-gate 					    (uint_t)mp->b_datap->db_ref);
16397c478bd9Sstevel@tonic-gate 					bcopy(up, rptr, len);
16407c478bd9Sstevel@tonic-gate 				}
16417c478bd9Sstevel@tonic-gate 			}
16427c478bd9Sstevel@tonic-gate 
16437c478bd9Sstevel@tonic-gate 			/*
16447c478bd9Sstevel@tonic-gate 			 * If we haven't received the complete record header
16457c478bd9Sstevel@tonic-gate 			 * yet, then loop around to get the next block in the
16467c478bd9Sstevel@tonic-gate 			 * STREAMS message. The logic at same_mblk label will
16477c478bd9Sstevel@tonic-gate 			 * free the current block if it has become empty.
16487c478bd9Sstevel@tonic-gate 			 */
16497c478bd9Sstevel@tonic-gate 			if (frag_len < 0) {
16507c478bd9Sstevel@tonic-gate 				RPCLOG(32, "mir_do_rput: frag_len is still < 0 "
16517c478bd9Sstevel@tonic-gate 				"(%d)", len);
16527c478bd9Sstevel@tonic-gate 				goto same_mblk;
16537c478bd9Sstevel@tonic-gate 			}
16547c478bd9Sstevel@tonic-gate 
16557c478bd9Sstevel@tonic-gate #ifdef	RPCDEBUG
16567c478bd9Sstevel@tonic-gate 			if ((frag_header & MIR_LASTFRAG) == 0) {
16577c478bd9Sstevel@tonic-gate 				RPCLOG0(32, "mir_do_rput: multi-fragment "
16587c478bd9Sstevel@tonic-gate 				    "record\n");
16597c478bd9Sstevel@tonic-gate 			}
16607c478bd9Sstevel@tonic-gate 			{
16617c478bd9Sstevel@tonic-gate 				uint_t l = frag_header & ~MIR_LASTFRAG;
16627c478bd9Sstevel@tonic-gate 
16637c478bd9Sstevel@tonic-gate 				if (l != 0 && mir->mir_max_msg_sizep &&
16647c478bd9Sstevel@tonic-gate 				    l >= *mir->mir_max_msg_sizep) {
16657c478bd9Sstevel@tonic-gate 					RPCLOG(32, "mir_do_rput: fragment size"
16667c478bd9Sstevel@tonic-gate 					    " (%d) > maximum", l);
16677c478bd9Sstevel@tonic-gate 					RPCLOG(32, " (%u)\n",
16687c478bd9Sstevel@tonic-gate 					    *mir->mir_max_msg_sizep);
16697c478bd9Sstevel@tonic-gate 				}
16707c478bd9Sstevel@tonic-gate 			}
16717c478bd9Sstevel@tonic-gate #endif
16727c478bd9Sstevel@tonic-gate 			/*
16737c478bd9Sstevel@tonic-gate 			 * At this point we have retrieved the complete record
16747c478bd9Sstevel@tonic-gate 			 * header for this fragment.  If the current block is
16757c478bd9Sstevel@tonic-gate 			 * empty, then we need to free it and walk to the next
16767c478bd9Sstevel@tonic-gate 			 * block.
16777c478bd9Sstevel@tonic-gate 			 */
16787c478bd9Sstevel@tonic-gate 			if (mp->b_rptr >= wptr) {
16797c478bd9Sstevel@tonic-gate 				/*
16807c478bd9Sstevel@tonic-gate 				 * If this is not the last fragment or if we
16817c478bd9Sstevel@tonic-gate 				 * have not received all the data for this
16827c478bd9Sstevel@tonic-gate 				 * RPC message, then loop around to the next
16837c478bd9Sstevel@tonic-gate 				 * block.
16847c478bd9Sstevel@tonic-gate 				 */
16857c478bd9Sstevel@tonic-gate 				if (!(frag_header & MIR_LASTFRAG) ||
16867c478bd9Sstevel@tonic-gate 				    (frag_len -
16877c478bd9Sstevel@tonic-gate 				    (frag_header & ~MIR_LASTFRAG)) ||
16887c478bd9Sstevel@tonic-gate 				    !head_mp)
16897c478bd9Sstevel@tonic-gate 					goto same_mblk;
16907c478bd9Sstevel@tonic-gate 
16917c478bd9Sstevel@tonic-gate 				/*
16927c478bd9Sstevel@tonic-gate 				 * Quick walk to next block in the
16937c478bd9Sstevel@tonic-gate 				 * STREAMS message.
16947c478bd9Sstevel@tonic-gate 				 */
16957c478bd9Sstevel@tonic-gate 				freeb(mp);
16967c478bd9Sstevel@tonic-gate 				continue;
16977c478bd9Sstevel@tonic-gate 			}
16987c478bd9Sstevel@tonic-gate 		}
16997c478bd9Sstevel@tonic-gate 
17007c478bd9Sstevel@tonic-gate 		/*
17017c478bd9Sstevel@tonic-gate 		 * We've collected the complete record header.  The data
17027c478bd9Sstevel@tonic-gate 		 * in the current block is added to the end of the RPC
17037c478bd9Sstevel@tonic-gate 		 * message.  Note that tail_mp is the same as mp after
17047c478bd9Sstevel@tonic-gate 		 * this linkage.
17057c478bd9Sstevel@tonic-gate 		 */
17067c478bd9Sstevel@tonic-gate 		if (!head_mp)
17077c478bd9Sstevel@tonic-gate 			head_mp = mp;
17087c478bd9Sstevel@tonic-gate 		else if (tail_mp != mp) {
17097c478bd9Sstevel@tonic-gate 			ASSERT((tail_mp->b_cont == NULL) ||
17107c478bd9Sstevel@tonic-gate 			    (tail_mp->b_cont == mp));
17117c478bd9Sstevel@tonic-gate 			tail_mp->b_cont = mp;
17127c478bd9Sstevel@tonic-gate 		}
17137c478bd9Sstevel@tonic-gate 		tail_mp = mp;
17147c478bd9Sstevel@tonic-gate 
17157c478bd9Sstevel@tonic-gate 		/*
17167c478bd9Sstevel@tonic-gate 		 * Add the length of this block to the accumulated
17177c478bd9Sstevel@tonic-gate 		 * fragment length.
17187c478bd9Sstevel@tonic-gate 		 */
17197c478bd9Sstevel@tonic-gate 		frag_len += len;
17207c478bd9Sstevel@tonic-gate 		excess = frag_len - (frag_header & ~MIR_LASTFRAG);
17217c478bd9Sstevel@tonic-gate 		/*
17227c478bd9Sstevel@tonic-gate 		 * If we have not received all the data for this fragment,
17237c478bd9Sstevel@tonic-gate 		 * then walk to the next block.
17247c478bd9Sstevel@tonic-gate 		 */
17257c478bd9Sstevel@tonic-gate 		if (excess < 0)
17267c478bd9Sstevel@tonic-gate 			continue;
17277c478bd9Sstevel@tonic-gate 
17287c478bd9Sstevel@tonic-gate 		/*
17297c478bd9Sstevel@tonic-gate 		 * We've received a complete fragment, so reset frag_len
17307c478bd9Sstevel@tonic-gate 		 * for the next one.
17317c478bd9Sstevel@tonic-gate 		 */
17327c478bd9Sstevel@tonic-gate 		frag_len = -(int32_t)sizeof (uint32_t);
17337c478bd9Sstevel@tonic-gate 
17347c478bd9Sstevel@tonic-gate 		/*
17357c478bd9Sstevel@tonic-gate 		 * Update rptr to point to the beginning of the next
17367c478bd9Sstevel@tonic-gate 		 * fragment in this block.  If there are no more bytes
17377c478bd9Sstevel@tonic-gate 		 * in the block (excess is 0), then rptr will be equal
17387c478bd9Sstevel@tonic-gate 		 * to wptr.
17397c478bd9Sstevel@tonic-gate 		 */
17407c478bd9Sstevel@tonic-gate 		rptr = wptr - excess;
17417c478bd9Sstevel@tonic-gate 
17427c478bd9Sstevel@tonic-gate 		/*
17437c478bd9Sstevel@tonic-gate 		 * Now we check to see if this fragment is the last one in
17447c478bd9Sstevel@tonic-gate 		 * the RPC message.
17457c478bd9Sstevel@tonic-gate 		 */
17467c478bd9Sstevel@tonic-gate 		if (!(frag_header & MIR_LASTFRAG)) {
17477c478bd9Sstevel@tonic-gate 			/*
17487c478bd9Sstevel@tonic-gate 			 * This isn't the last one, so start processing the
17497c478bd9Sstevel@tonic-gate 			 * next fragment.
17507c478bd9Sstevel@tonic-gate 			 */
17517c478bd9Sstevel@tonic-gate 			frag_header = 0;
17527c478bd9Sstevel@tonic-gate 
17537c478bd9Sstevel@tonic-gate 			/*
17547c478bd9Sstevel@tonic-gate 			 * If excess is 0, the next fragment
17557c478bd9Sstevel@tonic-gate 			 * starts at the beginning of the next block --
17567c478bd9Sstevel@tonic-gate 			 * we "continue" to the end of the while loop and
17577c478bd9Sstevel@tonic-gate 			 * walk to cont_mp.
17587c478bd9Sstevel@tonic-gate 			 */
17597c478bd9Sstevel@tonic-gate 			if (excess == 0)
17607c478bd9Sstevel@tonic-gate 				continue;
17617c478bd9Sstevel@tonic-gate 			RPCLOG0(32, "mir_do_rput: multi-fragment message with "
17627c478bd9Sstevel@tonic-gate 			    "two or more fragments in one mblk\n");
17637c478bd9Sstevel@tonic-gate 
17647c478bd9Sstevel@tonic-gate 			/*
17657c478bd9Sstevel@tonic-gate 			 * If excess is non-0, then the next fragment starts
17667c478bd9Sstevel@tonic-gate 			 * in this block.  rptr points to the beginning
17677c478bd9Sstevel@tonic-gate 			 * of the next fragment and we "goto same_mblk"
17687c478bd9Sstevel@tonic-gate 			 * to continue processing.
17697c478bd9Sstevel@tonic-gate 			 */
17707c478bd9Sstevel@tonic-gate 			goto same_mblk;
17717c478bd9Sstevel@tonic-gate 		}
17727c478bd9Sstevel@tonic-gate 
17737c478bd9Sstevel@tonic-gate 		/*
17747c478bd9Sstevel@tonic-gate 		 * We've got a complete RPC message.  Before passing it
17757c478bd9Sstevel@tonic-gate 		 * upstream, check to see if there is extra data in this
17767c478bd9Sstevel@tonic-gate 		 * message block. If so, then we separate the excess
17777c478bd9Sstevel@tonic-gate 		 * from the complete message. The excess data is processed
17787c478bd9Sstevel@tonic-gate 		 * after the current message goes upstream.
17797c478bd9Sstevel@tonic-gate 		 */
17807c478bd9Sstevel@tonic-gate 		if (excess > 0) {
17817c478bd9Sstevel@tonic-gate 			RPCLOG(32, "mir_do_rput: end of record, but excess "
17827c478bd9Sstevel@tonic-gate 			    "data (%d bytes) in this mblk. dupb/copyb "
17837c478bd9Sstevel@tonic-gate 			    "needed\n", excess);
17847c478bd9Sstevel@tonic-gate 
17857c478bd9Sstevel@tonic-gate 			/* Duplicate only the overlapping block. */
17867c478bd9Sstevel@tonic-gate 			mp1 = dupb(tail_mp);
17877c478bd9Sstevel@tonic-gate 
17887c478bd9Sstevel@tonic-gate 			/*
17897c478bd9Sstevel@tonic-gate 			 * dupb() might have failed due to ref count wrap around
17907c478bd9Sstevel@tonic-gate 			 * so try a copyb().
17917c478bd9Sstevel@tonic-gate 			 */
17927c478bd9Sstevel@tonic-gate 			if (mp1 == NULL)
17937c478bd9Sstevel@tonic-gate 				mp1 = copyb(tail_mp);
17947c478bd9Sstevel@tonic-gate 
17957c478bd9Sstevel@tonic-gate 			/*
17967c478bd9Sstevel@tonic-gate 			 * Do not use bufcall() to schedule a "buffer
17977c478bd9Sstevel@tonic-gate 			 * availability event."  The reason is that
17987c478bd9Sstevel@tonic-gate 			 * bufcall() has problems.  For example, if memory
17997c478bd9Sstevel@tonic-gate 			 * runs out, bufcall() itself will fail since it
18007c478bd9Sstevel@tonic-gate 			 * needs to allocate memory.  The most appropriate
18017c478bd9Sstevel@tonic-gate 			 * action right now is to disconnect this connection
18027c478bd9Sstevel@tonic-gate 			 * as the system is under stress.  We should try to
18037c478bd9Sstevel@tonic-gate 			 * free up resources.
18047c478bd9Sstevel@tonic-gate 			 */
18057c478bd9Sstevel@tonic-gate 			if (mp1 == NULL) {
18067c478bd9Sstevel@tonic-gate 				freemsg(head_mp);
18077c478bd9Sstevel@tonic-gate 				RPCLOG0(1, "mir_do_rput: dupb/copyb failed\n");
18087c478bd9Sstevel@tonic-gate 				mir->mir_frag_header = 0;
18097c478bd9Sstevel@tonic-gate 				mir->mir_frag_len = -(int)sizeof (uint32_t);
18107c478bd9Sstevel@tonic-gate 				mir->mir_head_mp = NULL;
18117c478bd9Sstevel@tonic-gate 				mir->mir_tail_mp = NULL;
18127c478bd9Sstevel@tonic-gate 
18137c478bd9Sstevel@tonic-gate 				mir_disconnect(q, mir);
18147c478bd9Sstevel@tonic-gate 				return;
18157c478bd9Sstevel@tonic-gate 			}
18167c478bd9Sstevel@tonic-gate 
18177c478bd9Sstevel@tonic-gate 			/*
18187c478bd9Sstevel@tonic-gate 			 * The new message block is linked with the
18197c478bd9Sstevel@tonic-gate 			 * continuation block in cont_mp.  We then point
18207c478bd9Sstevel@tonic-gate 			 * cont_mp to the new block so that we will
18217c478bd9Sstevel@tonic-gate 			 * process it next.
18227c478bd9Sstevel@tonic-gate 			 */
18237c478bd9Sstevel@tonic-gate 			mp1->b_cont = cont_mp;
18247c478bd9Sstevel@tonic-gate 			cont_mp = mp1;
18257c478bd9Sstevel@tonic-gate 			/*
18267c478bd9Sstevel@tonic-gate 			 * Data in the new block begins at the
18277c478bd9Sstevel@tonic-gate 			 * next fragment (rptr).
18287c478bd9Sstevel@tonic-gate 			 */
18297c478bd9Sstevel@tonic-gate 			cont_mp->b_rptr += (rptr - tail_mp->b_rptr);
18307c478bd9Sstevel@tonic-gate 			ASSERT(cont_mp->b_rptr >= cont_mp->b_datap->db_base);
18317c478bd9Sstevel@tonic-gate 			ASSERT(cont_mp->b_rptr <= cont_mp->b_wptr);
18327c478bd9Sstevel@tonic-gate 
18337c478bd9Sstevel@tonic-gate 			/* Data in the current fragment ends at rptr. */
18347c478bd9Sstevel@tonic-gate 			tail_mp->b_wptr = rptr;
18357c478bd9Sstevel@tonic-gate 			ASSERT(tail_mp->b_wptr <= tail_mp->b_datap->db_lim);
18367c478bd9Sstevel@tonic-gate 			ASSERT(tail_mp->b_wptr >= tail_mp->b_rptr);
18377c478bd9Sstevel@tonic-gate 
18387c478bd9Sstevel@tonic-gate 		}
18397c478bd9Sstevel@tonic-gate 
18407c478bd9Sstevel@tonic-gate 		/* tail_mp is the last block with data for this RPC message. */
18417c478bd9Sstevel@tonic-gate 		tail_mp->b_cont = NULL;
18427c478bd9Sstevel@tonic-gate 
18437c478bd9Sstevel@tonic-gate 		/* Pass the RPC message to the current consumer. */
18447c478bd9Sstevel@tonic-gate 		switch (mir->mir_type) {
18457c478bd9Sstevel@tonic-gate 		case RPC_CLIENT:
18467c478bd9Sstevel@tonic-gate 			if (clnt_dispatch_notify(head_mp, mir->mir_zoneid)) {
18477c478bd9Sstevel@tonic-gate 				/*
18487c478bd9Sstevel@tonic-gate 				 * Mark this stream as active.  This marker
18497c478bd9Sstevel@tonic-gate 				 * is used in mir_timer().
18507c478bd9Sstevel@tonic-gate 				 */
18517c478bd9Sstevel@tonic-gate 
18527c478bd9Sstevel@tonic-gate 				mir->mir_clntreq = 1;
18537c478bd9Sstevel@tonic-gate 				mir->mir_use_timestamp = lbolt;
18547c478bd9Sstevel@tonic-gate 			} else
18557c478bd9Sstevel@tonic-gate 				freemsg(head_mp);
18567c478bd9Sstevel@tonic-gate 			break;
18577c478bd9Sstevel@tonic-gate 
18587c478bd9Sstevel@tonic-gate 		case RPC_SERVER:
18597c478bd9Sstevel@tonic-gate 			/*
18607c478bd9Sstevel@tonic-gate 			 * Check for flow control before passing the
18617c478bd9Sstevel@tonic-gate 			 * message to KRPC.
18627c478bd9Sstevel@tonic-gate 			 */
18637c478bd9Sstevel@tonic-gate 
18647c478bd9Sstevel@tonic-gate 			if (!mir->mir_hold_inbound) {
18657c478bd9Sstevel@tonic-gate 				if (mir->mir_krpc_cell) {
18667c478bd9Sstevel@tonic-gate 					/*
18677c478bd9Sstevel@tonic-gate 					 * If the reference count is 0
18687c478bd9Sstevel@tonic-gate 					 * (not including this request),
18697c478bd9Sstevel@tonic-gate 					 * then the stream is transitioning
18707c478bd9Sstevel@tonic-gate 					 * from idle to non-idle.  In this case,
18717c478bd9Sstevel@tonic-gate 					 * we cancel the idle timer.
18727c478bd9Sstevel@tonic-gate 					 */
18737c478bd9Sstevel@tonic-gate 					if (mir->mir_ref_cnt++ == 0)
18747c478bd9Sstevel@tonic-gate 						stop_timer = B_TRUE;
18757c478bd9Sstevel@tonic-gate 					if (mir_check_len(q,
18767c478bd9Sstevel@tonic-gate 					    (int32_t)msgdsize(mp), mp))
18777c478bd9Sstevel@tonic-gate 						return;
18787c478bd9Sstevel@tonic-gate 					svc_queuereq(q, head_mp); /* to KRPC */
18797c478bd9Sstevel@tonic-gate 				} else {
18807c478bd9Sstevel@tonic-gate 					/*
1881*07e75131Sgt29601 					 * Count # of times this happens. Should
1882*07e75131Sgt29601 					 * be never, but experience shows
1883*07e75131Sgt29601 					 * otherwise.
18847c478bd9Sstevel@tonic-gate 					 */
18857c478bd9Sstevel@tonic-gate 					mir_krpc_cell_null++;
18867c478bd9Sstevel@tonic-gate 					freemsg(head_mp);
18877c478bd9Sstevel@tonic-gate 				}
18887c478bd9Sstevel@tonic-gate 
18897c478bd9Sstevel@tonic-gate 			} else {
18907c478bd9Sstevel@tonic-gate 				/*
18917c478bd9Sstevel@tonic-gate 				 * If the outbound side of the stream is
18927c478bd9Sstevel@tonic-gate 				 * flow controlled, then hold this message
18937c478bd9Sstevel@tonic-gate 				 * until client catches up. mir_hold_inbound
18947c478bd9Sstevel@tonic-gate 				 * is set in mir_wput and cleared in mir_wsrv.
18957c478bd9Sstevel@tonic-gate 				 */
18967c478bd9Sstevel@tonic-gate 				if (srv)
18977c478bd9Sstevel@tonic-gate 					(void) putbq(q, head_mp);
18987c478bd9Sstevel@tonic-gate 				else
18997c478bd9Sstevel@tonic-gate 					(void) putq(q, head_mp);
19007c478bd9Sstevel@tonic-gate 				mir->mir_inrservice = B_TRUE;
19017c478bd9Sstevel@tonic-gate 			}
19027c478bd9Sstevel@tonic-gate 			break;
19037c478bd9Sstevel@tonic-gate 		default:
19047c478bd9Sstevel@tonic-gate 			RPCLOG(1, "mir_rput: unknown mir_type %d\n",
19057c478bd9Sstevel@tonic-gate 			    mir->mir_type);
19067c478bd9Sstevel@tonic-gate 			freemsg(head_mp);
19077c478bd9Sstevel@tonic-gate 			break;
19087c478bd9Sstevel@tonic-gate 		}
19097c478bd9Sstevel@tonic-gate 
19107c478bd9Sstevel@tonic-gate 		/*
19117c478bd9Sstevel@tonic-gate 		 * Reset head_mp and frag_header since we're starting on a
19127c478bd9Sstevel@tonic-gate 		 * new RPC fragment and message.
19137c478bd9Sstevel@tonic-gate 		 */
19147c478bd9Sstevel@tonic-gate 		head_mp = NULL;
19157c478bd9Sstevel@tonic-gate 		tail_mp = NULL;
19167c478bd9Sstevel@tonic-gate 		frag_header = 0;
19177c478bd9Sstevel@tonic-gate 	} while ((mp = cont_mp) != NULL);
19187c478bd9Sstevel@tonic-gate 
19197c478bd9Sstevel@tonic-gate 	/*
19207c478bd9Sstevel@tonic-gate 	 * Do a sanity check on the message length.  If this message is
19217c478bd9Sstevel@tonic-gate 	 * getting excessively large, shut down the connection.
19227c478bd9Sstevel@tonic-gate 	 */
19237c478bd9Sstevel@tonic-gate 	if (head_mp != NULL && mir->mir_setup_complete &&
19247c478bd9Sstevel@tonic-gate 	    mir_check_len(q, frag_len, head_mp))
19257c478bd9Sstevel@tonic-gate 		return;
19267c478bd9Sstevel@tonic-gate 
19277c478bd9Sstevel@tonic-gate 	/* Save our local copies back in the mir structure. */
19287c478bd9Sstevel@tonic-gate 	mir->mir_frag_header = frag_header;
19297c478bd9Sstevel@tonic-gate 	mir->mir_frag_len = frag_len;
19307c478bd9Sstevel@tonic-gate 	mir->mir_head_mp = head_mp;
19317c478bd9Sstevel@tonic-gate 	mir->mir_tail_mp = tail_mp;
19327c478bd9Sstevel@tonic-gate 
19337c478bd9Sstevel@tonic-gate 	/*
19347c478bd9Sstevel@tonic-gate 	 * The timer is stopped after the whole message chain is processed.
19357c478bd9Sstevel@tonic-gate 	 * The reason is that stopping the timer releases the mir_mutex
19367c478bd9Sstevel@tonic-gate 	 * lock temporarily.  This means that the request can be serviced
19377c478bd9Sstevel@tonic-gate 	 * while we are still processing the message chain.  This is not
19387c478bd9Sstevel@tonic-gate 	 * good.  So we stop the timer here instead.
19397c478bd9Sstevel@tonic-gate 	 *
19407c478bd9Sstevel@tonic-gate 	 * Note that if the timer fires before we stop it, it will not
19417c478bd9Sstevel@tonic-gate 	 * do any harm as MIR_SVC_QUIESCED() is false and mir_timer()
19427c478bd9Sstevel@tonic-gate 	 * will just return;
19437c478bd9Sstevel@tonic-gate 	 */
19447c478bd9Sstevel@tonic-gate 	if (stop_timer) {
19457c478bd9Sstevel@tonic-gate 		RPCLOG(16, "mir_do_rput stopping idle timer on 0x%p because "
19467c478bd9Sstevel@tonic-gate 		    "ref cnt going to non zero\n", (void *) WR(q));
19477c478bd9Sstevel@tonic-gate 		mir_svc_idle_stop(WR(q), mir);
19487c478bd9Sstevel@tonic-gate 	}
19497c478bd9Sstevel@tonic-gate 	mutex_exit(&mir->mir_mutex);
19507c478bd9Sstevel@tonic-gate }
19517c478bd9Sstevel@tonic-gate 
19527c478bd9Sstevel@tonic-gate static void
19537c478bd9Sstevel@tonic-gate mir_rput(queue_t *q, mblk_t *mp)
19547c478bd9Sstevel@tonic-gate {
19557c478bd9Sstevel@tonic-gate 	mir_do_rput(q, mp, 0);
19567c478bd9Sstevel@tonic-gate }
19577c478bd9Sstevel@tonic-gate 
19587c478bd9Sstevel@tonic-gate static void
19597c478bd9Sstevel@tonic-gate mir_rput_proto(queue_t *q, mblk_t *mp)
19607c478bd9Sstevel@tonic-gate {
19617c478bd9Sstevel@tonic-gate 	mir_t	*mir = (mir_t *)q->q_ptr;
19627c478bd9Sstevel@tonic-gate 	uint32_t	type;
19637c478bd9Sstevel@tonic-gate 	uint32_t reason = 0;
19647c478bd9Sstevel@tonic-gate 
19657c478bd9Sstevel@tonic-gate 	ASSERT(MUTEX_NOT_HELD(&mir->mir_mutex));
19667c478bd9Sstevel@tonic-gate 
19677c478bd9Sstevel@tonic-gate 	type = ((union T_primitives *)mp->b_rptr)->type;
19687c478bd9Sstevel@tonic-gate 	switch (mir->mir_type) {
19697c478bd9Sstevel@tonic-gate 	case RPC_CLIENT:
19707c478bd9Sstevel@tonic-gate 		switch (type) {
19717c478bd9Sstevel@tonic-gate 		case T_DISCON_IND:
1972*07e75131Sgt29601 			reason = ((struct T_discon_ind *)
1973*07e75131Sgt29601 			    (mp->b_rptr))->DISCON_reason;
19747c478bd9Sstevel@tonic-gate 		    /*FALLTHROUGH*/
19757c478bd9Sstevel@tonic-gate 		case T_ORDREL_IND:
19767c478bd9Sstevel@tonic-gate 			mutex_enter(&mir->mir_mutex);
19777c478bd9Sstevel@tonic-gate 			if (mir->mir_head_mp) {
19787c478bd9Sstevel@tonic-gate 				freemsg(mir->mir_head_mp);
19797c478bd9Sstevel@tonic-gate 				mir->mir_head_mp = (mblk_t *)0;
19807c478bd9Sstevel@tonic-gate 				mir->mir_tail_mp = (mblk_t *)0;
19817c478bd9Sstevel@tonic-gate 			}
19827c478bd9Sstevel@tonic-gate 			/*
19837c478bd9Sstevel@tonic-gate 			 * We are disconnecting, but not necessarily
19847c478bd9Sstevel@tonic-gate 			 * closing. By not closing, we will fail to
19857c478bd9Sstevel@tonic-gate 			 * pick up a possibly changed global timeout value,
19867c478bd9Sstevel@tonic-gate 			 * unless we store it now.
19877c478bd9Sstevel@tonic-gate 			 */
19887c478bd9Sstevel@tonic-gate 			mir->mir_idle_timeout = clnt_idle_timeout;
19897c478bd9Sstevel@tonic-gate 			mir_clnt_idle_stop(WR(q), mir);
19907c478bd9Sstevel@tonic-gate 
19917c478bd9Sstevel@tonic-gate 			/*
19927c478bd9Sstevel@tonic-gate 			 * Even though we are unconnected, we still
19937c478bd9Sstevel@tonic-gate 			 * leave the idle timer going on the client. The
19947c478bd9Sstevel@tonic-gate 			 * reason for is that if we've disconnected due
19957c478bd9Sstevel@tonic-gate 			 * to a server-side disconnect, reset, or connection
19967c478bd9Sstevel@tonic-gate 			 * timeout, there is a possibility the client may
19977c478bd9Sstevel@tonic-gate 			 * retry the RPC request. This retry needs to done on
19987c478bd9Sstevel@tonic-gate 			 * the same bound address for the server to interpret
19997c478bd9Sstevel@tonic-gate 			 * it as such. However, we don't want
20007c478bd9Sstevel@tonic-gate 			 * to wait forever for that possibility. If the
20017c478bd9Sstevel@tonic-gate 			 * end-point stays unconnected for mir_idle_timeout
20027c478bd9Sstevel@tonic-gate 			 * units of time, then that is a signal to the
20037c478bd9Sstevel@tonic-gate 			 * connection manager to give up waiting for the
20047c478bd9Sstevel@tonic-gate 			 * application (eg. NFS) to send a retry.
20057c478bd9Sstevel@tonic-gate 			 */
20067c478bd9Sstevel@tonic-gate 			mir_clnt_idle_start(WR(q), mir);
20077c478bd9Sstevel@tonic-gate 			mutex_exit(&mir->mir_mutex);
20087c478bd9Sstevel@tonic-gate 			clnt_dispatch_notifyall(WR(q), type, reason);
20097c478bd9Sstevel@tonic-gate 			freemsg(mp);
20107c478bd9Sstevel@tonic-gate 			return;
20117c478bd9Sstevel@tonic-gate 		case T_ERROR_ACK:
20127c478bd9Sstevel@tonic-gate 		{
20137c478bd9Sstevel@tonic-gate 			struct T_error_ack	*terror;
20147c478bd9Sstevel@tonic-gate 
20157c478bd9Sstevel@tonic-gate 			terror = (struct T_error_ack *)mp->b_rptr;
20167c478bd9Sstevel@tonic-gate 			RPCLOG(1, "mir_rput_proto T_ERROR_ACK for queue 0x%p",
20177c478bd9Sstevel@tonic-gate 			    (void *)q);
20187c478bd9Sstevel@tonic-gate 			RPCLOG(1, " ERROR_prim: %s,",
20197c478bd9Sstevel@tonic-gate 			    rpc_tpiprim2name(terror->ERROR_prim));
20207c478bd9Sstevel@tonic-gate 			RPCLOG(1, " TLI_error: %s,",
20217c478bd9Sstevel@tonic-gate 			    rpc_tpierr2name(terror->TLI_error));
20227c478bd9Sstevel@tonic-gate 			RPCLOG(1, " UNIX_error: %d\n", terror->UNIX_error);
20237c478bd9Sstevel@tonic-gate 			if (terror->ERROR_prim == T_DISCON_REQ)  {
20247c478bd9Sstevel@tonic-gate 				clnt_dispatch_notifyall(WR(q), type, reason);
20257c478bd9Sstevel@tonic-gate 				freemsg(mp);
20267c478bd9Sstevel@tonic-gate 				return;
20277c478bd9Sstevel@tonic-gate 			} else {
20287c478bd9Sstevel@tonic-gate 				if (clnt_dispatch_notifyconn(WR(q), mp))
20297c478bd9Sstevel@tonic-gate 					return;
20307c478bd9Sstevel@tonic-gate 			}
20317c478bd9Sstevel@tonic-gate 			break;
20327c478bd9Sstevel@tonic-gate 		}
20337c478bd9Sstevel@tonic-gate 		case T_OK_ACK:
20347c478bd9Sstevel@tonic-gate 		{
20357c478bd9Sstevel@tonic-gate 			struct T_ok_ack	*tok = (struct T_ok_ack *)mp->b_rptr;
20367c478bd9Sstevel@tonic-gate 
20377c478bd9Sstevel@tonic-gate 			if (tok->CORRECT_prim == T_DISCON_REQ) {
20387c478bd9Sstevel@tonic-gate 				clnt_dispatch_notifyall(WR(q), type, reason);
20397c478bd9Sstevel@tonic-gate 				freemsg(mp);
20407c478bd9Sstevel@tonic-gate 				return;
20417c478bd9Sstevel@tonic-gate 			} else {
20427c478bd9Sstevel@tonic-gate 				if (clnt_dispatch_notifyconn(WR(q), mp))
20437c478bd9Sstevel@tonic-gate 					return;
20447c478bd9Sstevel@tonic-gate 			}
20457c478bd9Sstevel@tonic-gate 			break;
20467c478bd9Sstevel@tonic-gate 		}
20477c478bd9Sstevel@tonic-gate 		case T_CONN_CON:
20487c478bd9Sstevel@tonic-gate 		case T_INFO_ACK:
20497c478bd9Sstevel@tonic-gate 		case T_OPTMGMT_ACK:
20507c478bd9Sstevel@tonic-gate 			if (clnt_dispatch_notifyconn(WR(q), mp))
20517c478bd9Sstevel@tonic-gate 				return;
20527c478bd9Sstevel@tonic-gate 			break;
20537c478bd9Sstevel@tonic-gate 		case T_BIND_ACK:
20547c478bd9Sstevel@tonic-gate 			break;
20557c478bd9Sstevel@tonic-gate 		default:
20567c478bd9Sstevel@tonic-gate 			RPCLOG(1, "mir_rput: unexpected message %d "
20577c478bd9Sstevel@tonic-gate 			    "for KRPC client\n",
20587c478bd9Sstevel@tonic-gate 			    ((union T_primitives *)mp->b_rptr)->type);
20597c478bd9Sstevel@tonic-gate 			break;
20607c478bd9Sstevel@tonic-gate 		}
20617c478bd9Sstevel@tonic-gate 		break;
20627c478bd9Sstevel@tonic-gate 
20637c478bd9Sstevel@tonic-gate 	case RPC_SERVER:
20647c478bd9Sstevel@tonic-gate 		switch (type) {
20657c478bd9Sstevel@tonic-gate 		case T_BIND_ACK:
20667c478bd9Sstevel@tonic-gate 		{
20677c478bd9Sstevel@tonic-gate 			struct T_bind_ack	*tbind;
20687c478bd9Sstevel@tonic-gate 
20697c478bd9Sstevel@tonic-gate 			/*
20707c478bd9Sstevel@tonic-gate 			 * If this is a listening stream, then shut
20717c478bd9Sstevel@tonic-gate 			 * off the idle timer.
20727c478bd9Sstevel@tonic-gate 			 */
20737c478bd9Sstevel@tonic-gate 			tbind = (struct T_bind_ack *)mp->b_rptr;
20747c478bd9Sstevel@tonic-gate 			if (tbind->CONIND_number > 0) {
20757c478bd9Sstevel@tonic-gate 				mutex_enter(&mir->mir_mutex);
20767c478bd9Sstevel@tonic-gate 				mir_svc_idle_stop(WR(q), mir);
20777c478bd9Sstevel@tonic-gate 
20787c478bd9Sstevel@tonic-gate 				/*
20797c478bd9Sstevel@tonic-gate 				 * mark this as a listen endpoint
20807c478bd9Sstevel@tonic-gate 				 * for special handling.
20817c478bd9Sstevel@tonic-gate 				 */
20827c478bd9Sstevel@tonic-gate 
20837c478bd9Sstevel@tonic-gate 				mir->mir_listen_stream = 1;
20847c478bd9Sstevel@tonic-gate 				mutex_exit(&mir->mir_mutex);
20857c478bd9Sstevel@tonic-gate 			}
20867c478bd9Sstevel@tonic-gate 			break;
20877c478bd9Sstevel@tonic-gate 		}
20887c478bd9Sstevel@tonic-gate 		case T_DISCON_IND:
20897c478bd9Sstevel@tonic-gate 		case T_ORDREL_IND:
20907c478bd9Sstevel@tonic-gate 			RPCLOG(16, "mir_rput_proto: got %s indication\n",
20917c478bd9Sstevel@tonic-gate 			    type == T_DISCON_IND ? "disconnect"
20927c478bd9Sstevel@tonic-gate 			    : "orderly release");
20937c478bd9Sstevel@tonic-gate 
20947c478bd9Sstevel@tonic-gate 			/*
20957c478bd9Sstevel@tonic-gate 			 * For listen endpoint just pass
20967c478bd9Sstevel@tonic-gate 			 * on the message.
20977c478bd9Sstevel@tonic-gate 			 */
20987c478bd9Sstevel@tonic-gate 
20997c478bd9Sstevel@tonic-gate 			if (mir->mir_listen_stream)
21007c478bd9Sstevel@tonic-gate 				break;
21017c478bd9Sstevel@tonic-gate 
21027c478bd9Sstevel@tonic-gate 			mutex_enter(&mir->mir_mutex);
21037c478bd9Sstevel@tonic-gate 
21047c478bd9Sstevel@tonic-gate 			/*
21057c478bd9Sstevel@tonic-gate 			 * If client wants to break off connection, record
21067c478bd9Sstevel@tonic-gate 			 * that fact.
21077c478bd9Sstevel@tonic-gate 			 */
21087c478bd9Sstevel@tonic-gate 			mir_svc_start_close(WR(q), mir);
21097c478bd9Sstevel@tonic-gate 
21107c478bd9Sstevel@tonic-gate 			/*
21117c478bd9Sstevel@tonic-gate 			 * If we are idle, then send the orderly release
21127c478bd9Sstevel@tonic-gate 			 * or disconnect indication to nfsd.
21137c478bd9Sstevel@tonic-gate 			 */
21147c478bd9Sstevel@tonic-gate 			if (MIR_SVC_QUIESCED(mir)) {
21157c478bd9Sstevel@tonic-gate 				mutex_exit(&mir->mir_mutex);
21167c478bd9Sstevel@tonic-gate 				break;
21177c478bd9Sstevel@tonic-gate 			}
21187c478bd9Sstevel@tonic-gate 
21197c478bd9Sstevel@tonic-gate 			RPCLOG(16, "mir_rput_proto: not idle, so "
21207c478bd9Sstevel@tonic-gate 			    "disconnect/ord rel indication not passed "
21217c478bd9Sstevel@tonic-gate 			    "upstream on 0x%p\n", (void *)q);
21227c478bd9Sstevel@tonic-gate 
21237c478bd9Sstevel@tonic-gate 			/*
21247c478bd9Sstevel@tonic-gate 			 * Hold the indication until we get idle
21257c478bd9Sstevel@tonic-gate 			 * If there already is an indication stored,
21267c478bd9Sstevel@tonic-gate 			 * replace it if the new one is a disconnect. The
21277c478bd9Sstevel@tonic-gate 			 * reasoning is that disconnection takes less time
21287c478bd9Sstevel@tonic-gate 			 * to process, and once a client decides to
21297c478bd9Sstevel@tonic-gate 			 * disconnect, we should do that.
21307c478bd9Sstevel@tonic-gate 			 */
21317c478bd9Sstevel@tonic-gate 			if (mir->mir_svc_pend_mp) {
21327c478bd9Sstevel@tonic-gate 				if (type == T_DISCON_IND) {
21337c478bd9Sstevel@tonic-gate 					RPCLOG(16, "mir_rput_proto: replacing"
21347c478bd9Sstevel@tonic-gate 					    " held disconnect/ord rel"
21357c478bd9Sstevel@tonic-gate 					    " indication with disconnect on"
21367c478bd9Sstevel@tonic-gate 					    " 0x%p\n", (void *)q);
21377c478bd9Sstevel@tonic-gate 
21387c478bd9Sstevel@tonic-gate 					freemsg(mir->mir_svc_pend_mp);
21397c478bd9Sstevel@tonic-gate 					mir->mir_svc_pend_mp = mp;
21407c478bd9Sstevel@tonic-gate 				} else {
21417c478bd9Sstevel@tonic-gate 					RPCLOG(16, "mir_rput_proto: already "
21427c478bd9Sstevel@tonic-gate 					    "held a disconnect/ord rel "
21437c478bd9Sstevel@tonic-gate 					    "indication. freeing ord rel "
21447c478bd9Sstevel@tonic-gate 					    "ind on 0x%p\n", (void *)q);
21457c478bd9Sstevel@tonic-gate 					freemsg(mp);
21467c478bd9Sstevel@tonic-gate 				}
21477c478bd9Sstevel@tonic-gate 			} else
21487c478bd9Sstevel@tonic-gate 				mir->mir_svc_pend_mp = mp;
21497c478bd9Sstevel@tonic-gate 
21507c478bd9Sstevel@tonic-gate 			mutex_exit(&mir->mir_mutex);
21517c478bd9Sstevel@tonic-gate 			return;
21527c478bd9Sstevel@tonic-gate 
21537c478bd9Sstevel@tonic-gate 		default:
21547c478bd9Sstevel@tonic-gate 			/* nfsd handles server-side non-data messages. */
21557c478bd9Sstevel@tonic-gate 			break;
21567c478bd9Sstevel@tonic-gate 		}
21577c478bd9Sstevel@tonic-gate 		break;
21587c478bd9Sstevel@tonic-gate 
21597c478bd9Sstevel@tonic-gate 	default:
21607c478bd9Sstevel@tonic-gate 		break;
21617c478bd9Sstevel@tonic-gate 	}
21627c478bd9Sstevel@tonic-gate 
21637c478bd9Sstevel@tonic-gate 	putnext(q, mp);
21647c478bd9Sstevel@tonic-gate }
21657c478bd9Sstevel@tonic-gate 
21667c478bd9Sstevel@tonic-gate /*
21677c478bd9Sstevel@tonic-gate  * The server-side read queues are used to hold inbound messages while
21687c478bd9Sstevel@tonic-gate  * outbound flow control is exerted.  When outbound flow control is
21697c478bd9Sstevel@tonic-gate  * relieved, mir_wsrv qenables the read-side queue.  Read-side queues
21707c478bd9Sstevel@tonic-gate  * are not enabled by STREAMS and are explicitly noenable'ed in mir_open.
21717c478bd9Sstevel@tonic-gate  *
21727c478bd9Sstevel@tonic-gate  * For the server side,  we have two types of messages queued. The first type
21737c478bd9Sstevel@tonic-gate  * are messages that are ready to be XDR decoded and and then sent to the
21747c478bd9Sstevel@tonic-gate  * RPC program's dispatch routine. The second type are "raw" messages that
21757c478bd9Sstevel@tonic-gate  * haven't been processed, i.e. assembled from rpc record fragements into
21767c478bd9Sstevel@tonic-gate  * full requests. The only time we will see the second type of message
21777c478bd9Sstevel@tonic-gate  * queued is if we have a memory allocation failure while processing a
21787c478bd9Sstevel@tonic-gate  * a raw message. The field mir_first_non_processed_mblk will mark the
21797c478bd9Sstevel@tonic-gate  * first such raw message. So the flow for server side is:
21807c478bd9Sstevel@tonic-gate  *
21817c478bd9Sstevel@tonic-gate  *	- send processed queued messages to kRPC until we run out or find
21827c478bd9Sstevel@tonic-gate  *	  one that needs additional processing because we were short on memory
21837c478bd9Sstevel@tonic-gate  *	  earlier
21847c478bd9Sstevel@tonic-gate  *	- process a message that was deferred because of lack of
21857c478bd9Sstevel@tonic-gate  *	  memory
21867c478bd9Sstevel@tonic-gate  *	- continue processing messages until the queue empties or we
21877c478bd9Sstevel@tonic-gate  *	  have to stop because of lack of memory
21887c478bd9Sstevel@tonic-gate  *	- during each of the above phase, if the queue is empty and
21897c478bd9Sstevel@tonic-gate  *	  there are no pending messages that were passed to the RPC
21907c478bd9Sstevel@tonic-gate  *	  layer, send upstream the pending disconnect/ordrel indication if
21917c478bd9Sstevel@tonic-gate  *	  there is one
21927c478bd9Sstevel@tonic-gate  *
21937c478bd9Sstevel@tonic-gate  * The read-side queue is also enabled by a bufcall callback if dupmsg
21947c478bd9Sstevel@tonic-gate  * fails in mir_rput.
21957c478bd9Sstevel@tonic-gate  */
21967c478bd9Sstevel@tonic-gate static void
21977c478bd9Sstevel@tonic-gate mir_rsrv(queue_t *q)
21987c478bd9Sstevel@tonic-gate {
21997c478bd9Sstevel@tonic-gate 	mir_t	*mir;
22007c478bd9Sstevel@tonic-gate 	mblk_t	*mp;
22017c478bd9Sstevel@tonic-gate 	mblk_t	*cmp = NULL;
22027c478bd9Sstevel@tonic-gate 	boolean_t stop_timer = B_FALSE;
22037c478bd9Sstevel@tonic-gate 
22047c478bd9Sstevel@tonic-gate 	mir = (mir_t *)q->q_ptr;
22057c478bd9Sstevel@tonic-gate 	mutex_enter(&mir->mir_mutex);
22067c478bd9Sstevel@tonic-gate 
22077c478bd9Sstevel@tonic-gate 	mp = NULL;
22087c478bd9Sstevel@tonic-gate 	switch (mir->mir_type) {
22097c478bd9Sstevel@tonic-gate 	case RPC_SERVER:
22107c478bd9Sstevel@tonic-gate 		if (mir->mir_ref_cnt == 0)
22117c478bd9Sstevel@tonic-gate 			mir->mir_hold_inbound = 0;
22127c478bd9Sstevel@tonic-gate 		if (mir->mir_hold_inbound) {
22137c478bd9Sstevel@tonic-gate 
22147c478bd9Sstevel@tonic-gate 			ASSERT(cmp == NULL);
22157c478bd9Sstevel@tonic-gate 			if (q->q_first == NULL) {
22167c478bd9Sstevel@tonic-gate 
22177c478bd9Sstevel@tonic-gate 				MIR_CLEAR_INRSRV(mir);
22187c478bd9Sstevel@tonic-gate 
22197c478bd9Sstevel@tonic-gate 				if (MIR_SVC_QUIESCED(mir)) {
22207c478bd9Sstevel@tonic-gate 					cmp = mir->mir_svc_pend_mp;
22217c478bd9Sstevel@tonic-gate 					mir->mir_svc_pend_mp = NULL;
22227c478bd9Sstevel@tonic-gate 				}
22237c478bd9Sstevel@tonic-gate 			}
22247c478bd9Sstevel@tonic-gate 
22257c478bd9Sstevel@tonic-gate 			mutex_exit(&mir->mir_mutex);
22267c478bd9Sstevel@tonic-gate 
22277c478bd9Sstevel@tonic-gate 			if (cmp != NULL) {
22287c478bd9Sstevel@tonic-gate 				RPCLOG(16, "mir_rsrv: line %d: sending a held "
22297c478bd9Sstevel@tonic-gate 				    "disconnect/ord rel indication upstream\n",
22307c478bd9Sstevel@tonic-gate 				    __LINE__);
22317c478bd9Sstevel@tonic-gate 				putnext(q, cmp);
22327c478bd9Sstevel@tonic-gate 			}
22337c478bd9Sstevel@tonic-gate 
22347c478bd9Sstevel@tonic-gate 			return;
22357c478bd9Sstevel@tonic-gate 		}
22367c478bd9Sstevel@tonic-gate 		while (mp = getq(q)) {
2237*07e75131Sgt29601 			if (mir->mir_krpc_cell &&
2238*07e75131Sgt29601 			    (mir->mir_svc_no_more_msgs == 0)) {
22397c478bd9Sstevel@tonic-gate 				/*
22407c478bd9Sstevel@tonic-gate 				 * If we were idle, turn off idle timer since
22417c478bd9Sstevel@tonic-gate 				 * we aren't idle any more.
22427c478bd9Sstevel@tonic-gate 				 */
22437c478bd9Sstevel@tonic-gate 				if (mir->mir_ref_cnt++ == 0)
22447c478bd9Sstevel@tonic-gate 					stop_timer = B_TRUE;
22457c478bd9Sstevel@tonic-gate 				if (mir_check_len(q,
22467c478bd9Sstevel@tonic-gate 				    (int32_t)msgdsize(mp), mp))
22477c478bd9Sstevel@tonic-gate 					return;
22487c478bd9Sstevel@tonic-gate 				svc_queuereq(q, mp);
22497c478bd9Sstevel@tonic-gate 			} else {
22507c478bd9Sstevel@tonic-gate 				/*
22517c478bd9Sstevel@tonic-gate 				 * Count # of times this happens. Should be
22527c478bd9Sstevel@tonic-gate 				 * never, but experience shows otherwise.
22537c478bd9Sstevel@tonic-gate 				 */
2254*07e75131Sgt29601 				if (mir->mir_krpc_cell == NULL)
22557c478bd9Sstevel@tonic-gate 					mir_krpc_cell_null++;
22567c478bd9Sstevel@tonic-gate 				freemsg(mp);
22577c478bd9Sstevel@tonic-gate 			}
22587c478bd9Sstevel@tonic-gate 		}
22597c478bd9Sstevel@tonic-gate 		break;
22607c478bd9Sstevel@tonic-gate 	case RPC_CLIENT:
22617c478bd9Sstevel@tonic-gate 		break;
22627c478bd9Sstevel@tonic-gate 	default:
22637c478bd9Sstevel@tonic-gate 		RPCLOG(1, "mir_rsrv: unexpected mir_type %d\n", mir->mir_type);
22647c478bd9Sstevel@tonic-gate 
22657c478bd9Sstevel@tonic-gate 		if (q->q_first == NULL)
22667c478bd9Sstevel@tonic-gate 			MIR_CLEAR_INRSRV(mir);
22677c478bd9Sstevel@tonic-gate 
22687c478bd9Sstevel@tonic-gate 		mutex_exit(&mir->mir_mutex);
22697c478bd9Sstevel@tonic-gate 
22707c478bd9Sstevel@tonic-gate 		return;
22717c478bd9Sstevel@tonic-gate 	}
22727c478bd9Sstevel@tonic-gate 
22737c478bd9Sstevel@tonic-gate 	/*
22747c478bd9Sstevel@tonic-gate 	 * The timer is stopped after all the messages are processed.
22757c478bd9Sstevel@tonic-gate 	 * The reason is that stopping the timer releases the mir_mutex
22767c478bd9Sstevel@tonic-gate 	 * lock temporarily.  This means that the request can be serviced
22777c478bd9Sstevel@tonic-gate 	 * while we are still processing the message queue.  This is not
22787c478bd9Sstevel@tonic-gate 	 * good.  So we stop the timer here instead.
22797c478bd9Sstevel@tonic-gate 	 */
22807c478bd9Sstevel@tonic-gate 	if (stop_timer)  {
22817c478bd9Sstevel@tonic-gate 		RPCLOG(16, "mir_rsrv stopping idle timer on 0x%p because ref "
22827c478bd9Sstevel@tonic-gate 		    "cnt going to non zero\n", (void *)WR(q));
22837c478bd9Sstevel@tonic-gate 		mir_svc_idle_stop(WR(q), mir);
22847c478bd9Sstevel@tonic-gate 	}
22857c478bd9Sstevel@tonic-gate 
22867c478bd9Sstevel@tonic-gate 	if (q->q_first == NULL) {
22877c478bd9Sstevel@tonic-gate 
22887c478bd9Sstevel@tonic-gate 		MIR_CLEAR_INRSRV(mir);
22897c478bd9Sstevel@tonic-gate 
22907c478bd9Sstevel@tonic-gate 		ASSERT(cmp == NULL);
22917c478bd9Sstevel@tonic-gate 		if (mir->mir_type == RPC_SERVER && MIR_SVC_QUIESCED(mir)) {
22927c478bd9Sstevel@tonic-gate 			cmp = mir->mir_svc_pend_mp;
22937c478bd9Sstevel@tonic-gate 			mir->mir_svc_pend_mp = NULL;
22947c478bd9Sstevel@tonic-gate 		}
22957c478bd9Sstevel@tonic-gate 
22967c478bd9Sstevel@tonic-gate 		mutex_exit(&mir->mir_mutex);
22977c478bd9Sstevel@tonic-gate 
22987c478bd9Sstevel@tonic-gate 		if (cmp != NULL) {
22997c478bd9Sstevel@tonic-gate 			RPCLOG(16, "mir_rsrv: line %d: sending a held "
23007c478bd9Sstevel@tonic-gate 			    "disconnect/ord rel indication upstream\n",
23017c478bd9Sstevel@tonic-gate 			    __LINE__);
23027c478bd9Sstevel@tonic-gate 			putnext(q, cmp);
23037c478bd9Sstevel@tonic-gate 		}
23047c478bd9Sstevel@tonic-gate 
23057c478bd9Sstevel@tonic-gate 		return;
23067c478bd9Sstevel@tonic-gate 	}
23077c478bd9Sstevel@tonic-gate 	mutex_exit(&mir->mir_mutex);
23087c478bd9Sstevel@tonic-gate }
23097c478bd9Sstevel@tonic-gate 
23107c478bd9Sstevel@tonic-gate static int mir_svc_policy_fails;
23117c478bd9Sstevel@tonic-gate 
23127c478bd9Sstevel@tonic-gate /*
23137c478bd9Sstevel@tonic-gate  * Called to send an event code to nfsd/lockd so that it initiates
23147c478bd9Sstevel@tonic-gate  * connection close.
23157c478bd9Sstevel@tonic-gate  */
23167c478bd9Sstevel@tonic-gate static int
23177c478bd9Sstevel@tonic-gate mir_svc_policy_notify(queue_t *q, int event)
23187c478bd9Sstevel@tonic-gate {
23197c478bd9Sstevel@tonic-gate 	mblk_t	*mp;
23207c478bd9Sstevel@tonic-gate #ifdef DEBUG
23217c478bd9Sstevel@tonic-gate 	mir_t *mir = (mir_t *)q->q_ptr;
23227c478bd9Sstevel@tonic-gate 	ASSERT(MUTEX_NOT_HELD(&mir->mir_mutex));
23237c478bd9Sstevel@tonic-gate #endif
23247c478bd9Sstevel@tonic-gate 	ASSERT(q->q_flag & QREADR);
23257c478bd9Sstevel@tonic-gate 
23267c478bd9Sstevel@tonic-gate 	/*
23277c478bd9Sstevel@tonic-gate 	 * Create an M_DATA message with the event code and pass it to the
23287c478bd9Sstevel@tonic-gate 	 * Stream head (nfsd or whoever created the stream will consume it).
23297c478bd9Sstevel@tonic-gate 	 */
23307c478bd9Sstevel@tonic-gate 	mp = allocb(sizeof (int), BPRI_HI);
23317c478bd9Sstevel@tonic-gate 
23327c478bd9Sstevel@tonic-gate 	if (!mp) {
23337c478bd9Sstevel@tonic-gate 
23347c478bd9Sstevel@tonic-gate 		mir_svc_policy_fails++;
23357c478bd9Sstevel@tonic-gate 		RPCLOG(16, "mir_svc_policy_notify: could not allocate event "
23367c478bd9Sstevel@tonic-gate 		    "%d\n", event);
23377c478bd9Sstevel@tonic-gate 		return (ENOMEM);
23387c478bd9Sstevel@tonic-gate 	}
23397c478bd9Sstevel@tonic-gate 
23407c478bd9Sstevel@tonic-gate 	U32_TO_BE32(event, mp->b_rptr);
23417c478bd9Sstevel@tonic-gate 	mp->b_wptr = mp->b_rptr + sizeof (int);
23427c478bd9Sstevel@tonic-gate 	putnext(q, mp);
23437c478bd9Sstevel@tonic-gate 	return (0);
23447c478bd9Sstevel@tonic-gate }
23457c478bd9Sstevel@tonic-gate 
23467c478bd9Sstevel@tonic-gate /*
23477c478bd9Sstevel@tonic-gate  * Server side: start the close phase. We want to get this rpcmod slot in an
23487c478bd9Sstevel@tonic-gate  * idle state before mir_close() is called.
23497c478bd9Sstevel@tonic-gate  */
23507c478bd9Sstevel@tonic-gate static void
23517c478bd9Sstevel@tonic-gate mir_svc_start_close(queue_t *wq, mir_t *mir)
23527c478bd9Sstevel@tonic-gate {
23537c478bd9Sstevel@tonic-gate 	ASSERT(MUTEX_HELD(&mir->mir_mutex));
23547c478bd9Sstevel@tonic-gate 	ASSERT((wq->q_flag & QREADR) == 0);
23557c478bd9Sstevel@tonic-gate 	ASSERT(mir->mir_type == RPC_SERVER);
23567c478bd9Sstevel@tonic-gate 
23577c478bd9Sstevel@tonic-gate 
23587c478bd9Sstevel@tonic-gate 	/*
23597c478bd9Sstevel@tonic-gate 	 * Do not accept any more messages.
23607c478bd9Sstevel@tonic-gate 	 */
23617c478bd9Sstevel@tonic-gate 	mir->mir_svc_no_more_msgs = 1;
23627c478bd9Sstevel@tonic-gate 
23637c478bd9Sstevel@tonic-gate 	/*
23647c478bd9Sstevel@tonic-gate 	 * Next two statements will make the read service procedure invoke
23657c478bd9Sstevel@tonic-gate 	 * svc_queuereq() on everything stuck in the streams read queue.
23667c478bd9Sstevel@tonic-gate 	 * It's not necessary because enabling the write queue will
23677c478bd9Sstevel@tonic-gate 	 * have the same effect, but why not speed the process along?
23687c478bd9Sstevel@tonic-gate 	 */
23697c478bd9Sstevel@tonic-gate 	mir->mir_hold_inbound = 0;
23707c478bd9Sstevel@tonic-gate 	qenable(RD(wq));
23717c478bd9Sstevel@tonic-gate 
23727c478bd9Sstevel@tonic-gate 	/*
23737c478bd9Sstevel@tonic-gate 	 * Meanwhile force the write service procedure to send the
23747c478bd9Sstevel@tonic-gate 	 * responses downstream, regardless of flow control.
23757c478bd9Sstevel@tonic-gate 	 */
23767c478bd9Sstevel@tonic-gate 	qenable(wq);
23777c478bd9Sstevel@tonic-gate }
23787c478bd9Sstevel@tonic-gate 
23797c478bd9Sstevel@tonic-gate /*
23807c478bd9Sstevel@tonic-gate  * This routine is called directly by KRPC after a request is completed,
23817c478bd9Sstevel@tonic-gate  * whether a reply was sent or the request was dropped.
23827c478bd9Sstevel@tonic-gate  */
23837c478bd9Sstevel@tonic-gate static void
23847c478bd9Sstevel@tonic-gate mir_svc_release(queue_t *wq, mblk_t *mp)
23857c478bd9Sstevel@tonic-gate {
23867c478bd9Sstevel@tonic-gate 	mir_t   *mir = (mir_t *)wq->q_ptr;
23877c478bd9Sstevel@tonic-gate 	mblk_t	*cmp = NULL;
23887c478bd9Sstevel@tonic-gate 
23897c478bd9Sstevel@tonic-gate 	ASSERT((wq->q_flag & QREADR) == 0);
23907c478bd9Sstevel@tonic-gate 	if (mp)
23917c478bd9Sstevel@tonic-gate 		freemsg(mp);
23927c478bd9Sstevel@tonic-gate 
23937c478bd9Sstevel@tonic-gate 	mutex_enter(&mir->mir_mutex);
23947c478bd9Sstevel@tonic-gate 
23957c478bd9Sstevel@tonic-gate 	/*
23967c478bd9Sstevel@tonic-gate 	 * Start idle processing if this is the last reference.
23977c478bd9Sstevel@tonic-gate 	 */
239893132ae0Smaheshvs 	if ((mir->mir_ref_cnt == 1) && (mir->mir_inrservice == 0)) {
23997c478bd9Sstevel@tonic-gate 
24007c478bd9Sstevel@tonic-gate 		RPCLOG(16, "mir_svc_release starting idle timer on 0x%p "
24017c478bd9Sstevel@tonic-gate 		    "because ref cnt is zero\n", (void *) wq);
24027c478bd9Sstevel@tonic-gate 
24037c478bd9Sstevel@tonic-gate 		cmp = mir->mir_svc_pend_mp;
24047c478bd9Sstevel@tonic-gate 		mir->mir_svc_pend_mp = NULL;
24057c478bd9Sstevel@tonic-gate 		mir_svc_idle_start(wq, mir);
24067c478bd9Sstevel@tonic-gate 	}
24077c478bd9Sstevel@tonic-gate 
240893132ae0Smaheshvs 	mir->mir_ref_cnt--;
240993132ae0Smaheshvs 	ASSERT(mir->mir_ref_cnt >= 0);
241093132ae0Smaheshvs 
241193132ae0Smaheshvs 	/*
241293132ae0Smaheshvs 	 * Wake up the thread waiting to close.
241393132ae0Smaheshvs 	 */
241493132ae0Smaheshvs 
241593132ae0Smaheshvs 	if ((mir->mir_ref_cnt == 0) && mir->mir_closing)
241693132ae0Smaheshvs 		cv_signal(&mir->mir_condvar);
241793132ae0Smaheshvs 
24187c478bd9Sstevel@tonic-gate 	mutex_exit(&mir->mir_mutex);
24197c478bd9Sstevel@tonic-gate 
24207c478bd9Sstevel@tonic-gate 	if (cmp) {
24217c478bd9Sstevel@tonic-gate 		RPCLOG(16, "mir_svc_release: sending a held "
24227c478bd9Sstevel@tonic-gate 		    "disconnect/ord rel indication upstream on queue 0x%p\n",
24237c478bd9Sstevel@tonic-gate 		    (void *)RD(wq));
24247c478bd9Sstevel@tonic-gate 
24257c478bd9Sstevel@tonic-gate 		putnext(RD(wq), cmp);
24267c478bd9Sstevel@tonic-gate 	}
24277c478bd9Sstevel@tonic-gate }
24287c478bd9Sstevel@tonic-gate 
24297c478bd9Sstevel@tonic-gate /*
24307c478bd9Sstevel@tonic-gate  * This routine is called by server-side KRPC when it is ready to
24317c478bd9Sstevel@tonic-gate  * handle inbound messages on the stream.
24327c478bd9Sstevel@tonic-gate  */
24337c478bd9Sstevel@tonic-gate static void
24347c478bd9Sstevel@tonic-gate mir_svc_start(queue_t *wq)
24357c478bd9Sstevel@tonic-gate {
24367c478bd9Sstevel@tonic-gate 	mir_t   *mir = (mir_t *)wq->q_ptr;
24377c478bd9Sstevel@tonic-gate 
2438a26eed27Sgt29601 	/*
2439a26eed27Sgt29601 	 * no longer need to take the mir_mutex because the
2440a26eed27Sgt29601 	 * mir_setup_complete field has been moved out of
2441a26eed27Sgt29601 	 * the binary field protected by the mir_mutex.
2442a26eed27Sgt29601 	 */
2443a26eed27Sgt29601 
24447c478bd9Sstevel@tonic-gate 	mir->mir_setup_complete = 1;
24457c478bd9Sstevel@tonic-gate 	qenable(RD(wq));
24467c478bd9Sstevel@tonic-gate }
24477c478bd9Sstevel@tonic-gate 
24487c478bd9Sstevel@tonic-gate /*
24497c478bd9Sstevel@tonic-gate  * client side wrapper for stopping timer with normal idle timeout.
24507c478bd9Sstevel@tonic-gate  */
24517c478bd9Sstevel@tonic-gate static void
24527c478bd9Sstevel@tonic-gate mir_clnt_idle_stop(queue_t *wq, mir_t *mir)
24537c478bd9Sstevel@tonic-gate {
24547c478bd9Sstevel@tonic-gate 	ASSERT(MUTEX_HELD(&mir->mir_mutex));
24557c478bd9Sstevel@tonic-gate 	ASSERT((wq->q_flag & QREADR) == 0);
24567c478bd9Sstevel@tonic-gate 	ASSERT(mir->mir_type == RPC_CLIENT);
24577c478bd9Sstevel@tonic-gate 
24587c478bd9Sstevel@tonic-gate 	mir_timer_stop(mir);
24597c478bd9Sstevel@tonic-gate }
24607c478bd9Sstevel@tonic-gate 
24617c478bd9Sstevel@tonic-gate /*
24627c478bd9Sstevel@tonic-gate  * client side wrapper for stopping timer with normal idle timeout.
24637c478bd9Sstevel@tonic-gate  */
24647c478bd9Sstevel@tonic-gate static void
24657c478bd9Sstevel@tonic-gate mir_clnt_idle_start(queue_t *wq, mir_t *mir)
24667c478bd9Sstevel@tonic-gate {
24677c478bd9Sstevel@tonic-gate 	ASSERT(MUTEX_HELD(&mir->mir_mutex));
24687c478bd9Sstevel@tonic-gate 	ASSERT((wq->q_flag & QREADR) == 0);
24697c478bd9Sstevel@tonic-gate 	ASSERT(mir->mir_type == RPC_CLIENT);
24707c478bd9Sstevel@tonic-gate 
24717c478bd9Sstevel@tonic-gate 	mir_timer_start(wq, mir, mir->mir_idle_timeout);
24727c478bd9Sstevel@tonic-gate }
24737c478bd9Sstevel@tonic-gate 
24747c478bd9Sstevel@tonic-gate /*
24757c478bd9Sstevel@tonic-gate  * client side only. Forces rpcmod to stop sending T_ORDREL_REQs on
24767c478bd9Sstevel@tonic-gate  * end-points that aren't connected.
24777c478bd9Sstevel@tonic-gate  */
24787c478bd9Sstevel@tonic-gate static void
24797c478bd9Sstevel@tonic-gate mir_clnt_idle_do_stop(queue_t *wq)
24807c478bd9Sstevel@tonic-gate {
24817c478bd9Sstevel@tonic-gate 	mir_t   *mir = (mir_t *)wq->q_ptr;
24827c478bd9Sstevel@tonic-gate 
24837c478bd9Sstevel@tonic-gate 	RPCLOG(1, "mir_clnt_idle_do_stop: wq 0x%p\n", (void *)wq);
24847c478bd9Sstevel@tonic-gate 	ASSERT(MUTEX_NOT_HELD(&mir->mir_mutex));
24857c478bd9Sstevel@tonic-gate 	mutex_enter(&mir->mir_mutex);
24867c478bd9Sstevel@tonic-gate 	mir_clnt_idle_stop(wq, mir);
24877c478bd9Sstevel@tonic-gate 	mutex_exit(&mir->mir_mutex);
24887c478bd9Sstevel@tonic-gate }
24897c478bd9Sstevel@tonic-gate 
24907c478bd9Sstevel@tonic-gate /*
24917c478bd9Sstevel@tonic-gate  * Timer handler.  It handles idle timeout and memory shortage problem.
24927c478bd9Sstevel@tonic-gate  */
24937c478bd9Sstevel@tonic-gate static void
24947c478bd9Sstevel@tonic-gate mir_timer(void *arg)
24957c478bd9Sstevel@tonic-gate {
24967c478bd9Sstevel@tonic-gate 	queue_t *wq = (queue_t *)arg;
24977c478bd9Sstevel@tonic-gate 	mir_t *mir = (mir_t *)wq->q_ptr;
24987c478bd9Sstevel@tonic-gate 	boolean_t notify;
24997c478bd9Sstevel@tonic-gate 
25007c478bd9Sstevel@tonic-gate 	mutex_enter(&mir->mir_mutex);
25017c478bd9Sstevel@tonic-gate 
25027c478bd9Sstevel@tonic-gate 	/*
25037c478bd9Sstevel@tonic-gate 	 * mir_timer_call is set only when either mir_timer_[start|stop]
25047c478bd9Sstevel@tonic-gate 	 * is progressing.  And mir_timer() can only be run while they
25057c478bd9Sstevel@tonic-gate 	 * are progressing if the timer is being stopped.  So just
25067c478bd9Sstevel@tonic-gate 	 * return.
25077c478bd9Sstevel@tonic-gate 	 */
25087c478bd9Sstevel@tonic-gate 	if (mir->mir_timer_call) {
25097c478bd9Sstevel@tonic-gate 		mutex_exit(&mir->mir_mutex);
25107c478bd9Sstevel@tonic-gate 		return;
25117c478bd9Sstevel@tonic-gate 	}
25127c478bd9Sstevel@tonic-gate 	mir->mir_timer_id = 0;
25137c478bd9Sstevel@tonic-gate 
25147c478bd9Sstevel@tonic-gate 	switch (mir->mir_type) {
25157c478bd9Sstevel@tonic-gate 	case RPC_CLIENT:
25167c478bd9Sstevel@tonic-gate 
25177c478bd9Sstevel@tonic-gate 		/*
25187c478bd9Sstevel@tonic-gate 		 * For clients, the timer fires at clnt_idle_timeout
25197c478bd9Sstevel@tonic-gate 		 * intervals.  If the activity marker (mir_clntreq) is
25207c478bd9Sstevel@tonic-gate 		 * zero, then the stream has been idle since the last
25217c478bd9Sstevel@tonic-gate 		 * timer event and we notify KRPC.  If mir_clntreq is
25227c478bd9Sstevel@tonic-gate 		 * non-zero, then the stream is active and we just
25237c478bd9Sstevel@tonic-gate 		 * restart the timer for another interval.  mir_clntreq
25247c478bd9Sstevel@tonic-gate 		 * is set to 1 in mir_wput for every request passed
25257c478bd9Sstevel@tonic-gate 		 * downstream.
25267c478bd9Sstevel@tonic-gate 		 *
25277c478bd9Sstevel@tonic-gate 		 * If this was a memory shortage timer reset the idle
25287c478bd9Sstevel@tonic-gate 		 * timeout regardless; the mir_clntreq will not be a
25297c478bd9Sstevel@tonic-gate 		 * valid indicator.
25307c478bd9Sstevel@tonic-gate 		 *
25317c478bd9Sstevel@tonic-gate 		 * The timer is initially started in mir_wput during
25327c478bd9Sstevel@tonic-gate 		 * RPC_CLIENT ioctl processing.
25337c478bd9Sstevel@tonic-gate 		 *
25347c478bd9Sstevel@tonic-gate 		 * The timer interval can be changed for individual
25357c478bd9Sstevel@tonic-gate 		 * streams with the ND variable "mir_idle_timeout".
25367c478bd9Sstevel@tonic-gate 		 */
25377c478bd9Sstevel@tonic-gate 		if (mir->mir_clntreq > 0 && mir->mir_use_timestamp +
25387c478bd9Sstevel@tonic-gate 		    MSEC_TO_TICK(mir->mir_idle_timeout) - lbolt >= 0) {
25397c478bd9Sstevel@tonic-gate 			clock_t tout;
25407c478bd9Sstevel@tonic-gate 
25417c478bd9Sstevel@tonic-gate 			tout = mir->mir_idle_timeout -
25427c478bd9Sstevel@tonic-gate 			    TICK_TO_MSEC(lbolt - mir->mir_use_timestamp);
25437c478bd9Sstevel@tonic-gate 			if (tout < 0)
25447c478bd9Sstevel@tonic-gate 				tout = 1000;
25457c478bd9Sstevel@tonic-gate #if 0
2546*07e75131Sgt29601 			printf("mir_timer[%d < %d + %d]: reset client timer "
2547*07e75131Sgt29601 			    "to %d (ms)\n", TICK_TO_MSEC(lbolt),
2548*07e75131Sgt29601 			    TICK_TO_MSEC(mir->mir_use_timestamp),
25497c478bd9Sstevel@tonic-gate 			    mir->mir_idle_timeout, tout);
25507c478bd9Sstevel@tonic-gate #endif
25517c478bd9Sstevel@tonic-gate 			mir->mir_clntreq = 0;
25527c478bd9Sstevel@tonic-gate 			mir_timer_start(wq, mir, tout);
25537c478bd9Sstevel@tonic-gate 			mutex_exit(&mir->mir_mutex);
25547c478bd9Sstevel@tonic-gate 			return;
25557c478bd9Sstevel@tonic-gate 		}
25567c478bd9Sstevel@tonic-gate #if 0
25577c478bd9Sstevel@tonic-gate printf("mir_timer[%d]: doing client timeout\n", lbolt / hz);
25587c478bd9Sstevel@tonic-gate #endif
25597c478bd9Sstevel@tonic-gate 		/*
25607c478bd9Sstevel@tonic-gate 		 * We are disconnecting, but not necessarily
25617c478bd9Sstevel@tonic-gate 		 * closing. By not closing, we will fail to
25627c478bd9Sstevel@tonic-gate 		 * pick up a possibly changed global timeout value,
25637c478bd9Sstevel@tonic-gate 		 * unless we store it now.
25647c478bd9Sstevel@tonic-gate 		 */
25657c478bd9Sstevel@tonic-gate 		mir->mir_idle_timeout = clnt_idle_timeout;
25667c478bd9Sstevel@tonic-gate 		mir_clnt_idle_start(wq, mir);
25677c478bd9Sstevel@tonic-gate 
25687c478bd9Sstevel@tonic-gate 		mutex_exit(&mir->mir_mutex);
25697c478bd9Sstevel@tonic-gate 		/*
25707c478bd9Sstevel@tonic-gate 		 * We pass T_ORDREL_REQ as an integer value
25717c478bd9Sstevel@tonic-gate 		 * to KRPC as the indication that the stream
25727c478bd9Sstevel@tonic-gate 		 * is idle.  This is not a T_ORDREL_REQ message,
25737c478bd9Sstevel@tonic-gate 		 * it is just a convenient value since we call
25747c478bd9Sstevel@tonic-gate 		 * the same KRPC routine for T_ORDREL_INDs and
25757c478bd9Sstevel@tonic-gate 		 * T_DISCON_INDs.
25767c478bd9Sstevel@tonic-gate 		 */
25777c478bd9Sstevel@tonic-gate 		clnt_dispatch_notifyall(wq, T_ORDREL_REQ, 0);
25787c478bd9Sstevel@tonic-gate 		return;
25797c478bd9Sstevel@tonic-gate 
25807c478bd9Sstevel@tonic-gate 	case RPC_SERVER:
25817c478bd9Sstevel@tonic-gate 
25827c478bd9Sstevel@tonic-gate 		/*
25837c478bd9Sstevel@tonic-gate 		 * For servers, the timer is only running when the stream
25847c478bd9Sstevel@tonic-gate 		 * is really idle or memory is short.  The timer is started
25857c478bd9Sstevel@tonic-gate 		 * by mir_wput when mir_type is set to RPC_SERVER and
25867c478bd9Sstevel@tonic-gate 		 * by mir_svc_idle_start whenever the stream goes idle
25877c478bd9Sstevel@tonic-gate 		 * (mir_ref_cnt == 0).  The timer is cancelled in
25887c478bd9Sstevel@tonic-gate 		 * mir_rput whenever a new inbound request is passed to KRPC
25897c478bd9Sstevel@tonic-gate 		 * and the stream was previously idle.
25907c478bd9Sstevel@tonic-gate 		 *
25917c478bd9Sstevel@tonic-gate 		 * The timer interval can be changed for individual
25927c478bd9Sstevel@tonic-gate 		 * streams with the ND variable "mir_idle_timeout".
25937c478bd9Sstevel@tonic-gate 		 *
25947c478bd9Sstevel@tonic-gate 		 * If the stream is not idle do nothing.
25957c478bd9Sstevel@tonic-gate 		 */
25967c478bd9Sstevel@tonic-gate 		if (!MIR_SVC_QUIESCED(mir)) {
25977c478bd9Sstevel@tonic-gate 			mutex_exit(&mir->mir_mutex);
25987c478bd9Sstevel@tonic-gate 			return;
25997c478bd9Sstevel@tonic-gate 		}
26007c478bd9Sstevel@tonic-gate 
26017c478bd9Sstevel@tonic-gate 		notify = !mir->mir_inrservice;
26027c478bd9Sstevel@tonic-gate 		mutex_exit(&mir->mir_mutex);
26037c478bd9Sstevel@tonic-gate 
26047c478bd9Sstevel@tonic-gate 		/*
26057c478bd9Sstevel@tonic-gate 		 * If there is no packet queued up in read queue, the stream
26067c478bd9Sstevel@tonic-gate 		 * is really idle so notify nfsd to close it.
26077c478bd9Sstevel@tonic-gate 		 */
26087c478bd9Sstevel@tonic-gate 		if (notify) {
26097c478bd9Sstevel@tonic-gate 			RPCLOG(16, "mir_timer: telling stream head listener "
26107c478bd9Sstevel@tonic-gate 			    "to close stream (0x%p)\n", (void *) RD(wq));
26117c478bd9Sstevel@tonic-gate 			(void) mir_svc_policy_notify(RD(wq), 1);
26127c478bd9Sstevel@tonic-gate 		}
26137c478bd9Sstevel@tonic-gate 		return;
26147c478bd9Sstevel@tonic-gate 	default:
26157c478bd9Sstevel@tonic-gate 		RPCLOG(1, "mir_timer: unexpected mir_type %d\n",
26167c478bd9Sstevel@tonic-gate 		    mir->mir_type);
26177c478bd9Sstevel@tonic-gate 		mutex_exit(&mir->mir_mutex);
26187c478bd9Sstevel@tonic-gate 		return;
26197c478bd9Sstevel@tonic-gate 	}
26207c478bd9Sstevel@tonic-gate }
26217c478bd9Sstevel@tonic-gate 
26227c478bd9Sstevel@tonic-gate /*
26237c478bd9Sstevel@tonic-gate  * Called by the RPC package to send either a call or a return, or a
26247c478bd9Sstevel@tonic-gate  * transport connection request.  Adds the record marking header.
26257c478bd9Sstevel@tonic-gate  */
26267c478bd9Sstevel@tonic-gate static void
26277c478bd9Sstevel@tonic-gate mir_wput(queue_t *q, mblk_t *mp)
26287c478bd9Sstevel@tonic-gate {
26297c478bd9Sstevel@tonic-gate 	uint_t	frag_header;
26307c478bd9Sstevel@tonic-gate 	mir_t	*mir = (mir_t *)q->q_ptr;
26317c478bd9Sstevel@tonic-gate 	uchar_t	*rptr = mp->b_rptr;
26327c478bd9Sstevel@tonic-gate 
26337c478bd9Sstevel@tonic-gate 	if (!mir) {
26347c478bd9Sstevel@tonic-gate 		freemsg(mp);
26357c478bd9Sstevel@tonic-gate 		return;
26367c478bd9Sstevel@tonic-gate 	}
26377c478bd9Sstevel@tonic-gate 
26387c478bd9Sstevel@tonic-gate 	if (mp->b_datap->db_type != M_DATA) {
26397c478bd9Sstevel@tonic-gate 		mir_wput_other(q, mp);
26407c478bd9Sstevel@tonic-gate 		return;
26417c478bd9Sstevel@tonic-gate 	}
26427c478bd9Sstevel@tonic-gate 
26437c478bd9Sstevel@tonic-gate 	if (mir->mir_ordrel_pending == 1) {
26447c478bd9Sstevel@tonic-gate 		freemsg(mp);
26457c478bd9Sstevel@tonic-gate 		RPCLOG(16, "mir_wput wq 0x%p: got data after T_ORDREL_REQ\n",
26467c478bd9Sstevel@tonic-gate 		    (void *)q);
26477c478bd9Sstevel@tonic-gate 		return;
26487c478bd9Sstevel@tonic-gate 	}
26497c478bd9Sstevel@tonic-gate 
26507c478bd9Sstevel@tonic-gate 	frag_header = (uint_t)DLEN(mp);
26517c478bd9Sstevel@tonic-gate 	frag_header |= MIR_LASTFRAG;
26527c478bd9Sstevel@tonic-gate 
26537c478bd9Sstevel@tonic-gate 	/* Stick in the 4 byte record marking header. */
26547c478bd9Sstevel@tonic-gate 	if ((rptr - mp->b_datap->db_base) < sizeof (uint32_t) ||
26557c478bd9Sstevel@tonic-gate 	    !IS_P2ALIGNED(mp->b_rptr, sizeof (uint32_t))) {
26567c478bd9Sstevel@tonic-gate 		/*
26577c478bd9Sstevel@tonic-gate 		 * Since we know that M_DATA messages are created exclusively
26587c478bd9Sstevel@tonic-gate 		 * by KRPC, we expect that KRPC will leave room for our header
26597c478bd9Sstevel@tonic-gate 		 * and 4 byte align which is normal for XDR.
26607c478bd9Sstevel@tonic-gate 		 * If KRPC (or someone else) does not cooperate, then we
26617c478bd9Sstevel@tonic-gate 		 * just throw away the message.
26627c478bd9Sstevel@tonic-gate 		 */
26637c478bd9Sstevel@tonic-gate 		RPCLOG(1, "mir_wput: KRPC did not leave space for record "
26647c478bd9Sstevel@tonic-gate 		    "fragment header (%d bytes left)\n",
26657c478bd9Sstevel@tonic-gate 		    (int)(rptr - mp->b_datap->db_base));
26667c478bd9Sstevel@tonic-gate 		freemsg(mp);
26677c478bd9Sstevel@tonic-gate 		return;
26687c478bd9Sstevel@tonic-gate 	}
26697c478bd9Sstevel@tonic-gate 	rptr -= sizeof (uint32_t);
26707c478bd9Sstevel@tonic-gate 	*(uint32_t *)rptr = htonl(frag_header);
26717c478bd9Sstevel@tonic-gate 	mp->b_rptr = rptr;
26727c478bd9Sstevel@tonic-gate 
26737c478bd9Sstevel@tonic-gate 	mutex_enter(&mir->mir_mutex);
26747c478bd9Sstevel@tonic-gate 	if (mir->mir_type == RPC_CLIENT) {
26757c478bd9Sstevel@tonic-gate 		/*
26767c478bd9Sstevel@tonic-gate 		 * For the client, set mir_clntreq to indicate that the
26777c478bd9Sstevel@tonic-gate 		 * connection is active.
26787c478bd9Sstevel@tonic-gate 		 */
26797c478bd9Sstevel@tonic-gate 		mir->mir_clntreq = 1;
26807c478bd9Sstevel@tonic-gate 		mir->mir_use_timestamp = lbolt;
26817c478bd9Sstevel@tonic-gate 	}
26827c478bd9Sstevel@tonic-gate 
26837c478bd9Sstevel@tonic-gate 	/*
26847c478bd9Sstevel@tonic-gate 	 * If we haven't already queued some data and the downstream module
26857c478bd9Sstevel@tonic-gate 	 * can accept more data, send it on, otherwise we queue the message
26867c478bd9Sstevel@tonic-gate 	 * and take other actions depending on mir_type.
26877c478bd9Sstevel@tonic-gate 	 */
26887c478bd9Sstevel@tonic-gate 	if (!mir->mir_inwservice && MIR_WCANPUTNEXT(mir, q)) {
26897c478bd9Sstevel@tonic-gate 		mutex_exit(&mir->mir_mutex);
26907c478bd9Sstevel@tonic-gate 
26917c478bd9Sstevel@tonic-gate 		/*
26927c478bd9Sstevel@tonic-gate 		 * Now we pass the RPC message downstream.
26937c478bd9Sstevel@tonic-gate 		 */
26947c478bd9Sstevel@tonic-gate 		putnext(q, mp);
26957c478bd9Sstevel@tonic-gate 		return;
26967c478bd9Sstevel@tonic-gate 	}
26977c478bd9Sstevel@tonic-gate 
26987c478bd9Sstevel@tonic-gate 	switch (mir->mir_type) {
26997c478bd9Sstevel@tonic-gate 	case RPC_CLIENT:
27007c478bd9Sstevel@tonic-gate 		/*
27017c478bd9Sstevel@tonic-gate 		 * Check for a previous duplicate request on the
27027c478bd9Sstevel@tonic-gate 		 * queue.  If there is one, then we throw away
27037c478bd9Sstevel@tonic-gate 		 * the current message and let the previous one
27047c478bd9Sstevel@tonic-gate 		 * go through.  If we can't find a duplicate, then
27057c478bd9Sstevel@tonic-gate 		 * send this one.  This tap dance is an effort
27067c478bd9Sstevel@tonic-gate 		 * to reduce traffic and processing requirements
27077c478bd9Sstevel@tonic-gate 		 * under load conditions.
27087c478bd9Sstevel@tonic-gate 		 */
27097c478bd9Sstevel@tonic-gate 		if (mir_clnt_dup_request(q, mp)) {
27107c478bd9Sstevel@tonic-gate 			mutex_exit(&mir->mir_mutex);
27117c478bd9Sstevel@tonic-gate 			freemsg(mp);
27127c478bd9Sstevel@tonic-gate 			return;
27137c478bd9Sstevel@tonic-gate 		}
27147c478bd9Sstevel@tonic-gate 		break;
27157c478bd9Sstevel@tonic-gate 	case RPC_SERVER:
27167c478bd9Sstevel@tonic-gate 		/*
27177c478bd9Sstevel@tonic-gate 		 * Set mir_hold_inbound so that new inbound RPC
27187c478bd9Sstevel@tonic-gate 		 * messages will be held until the client catches
27197c478bd9Sstevel@tonic-gate 		 * up on the earlier replies.  This flag is cleared
27207c478bd9Sstevel@tonic-gate 		 * in mir_wsrv after flow control is relieved;
27217c478bd9Sstevel@tonic-gate 		 * the read-side queue is also enabled at that time.
27227c478bd9Sstevel@tonic-gate 		 */
27237c478bd9Sstevel@tonic-gate 		mir->mir_hold_inbound = 1;
27247c478bd9Sstevel@tonic-gate 		break;
27257c478bd9Sstevel@tonic-gate 	default:
27267c478bd9Sstevel@tonic-gate 		RPCLOG(1, "mir_wput: unexpected mir_type %d\n", mir->mir_type);
27277c478bd9Sstevel@tonic-gate 		break;
27287c478bd9Sstevel@tonic-gate 	}
27297c478bd9Sstevel@tonic-gate 	mir->mir_inwservice = 1;
27307c478bd9Sstevel@tonic-gate 	(void) putq(q, mp);
27317c478bd9Sstevel@tonic-gate 	mutex_exit(&mir->mir_mutex);
27327c478bd9Sstevel@tonic-gate }
27337c478bd9Sstevel@tonic-gate 
27347c478bd9Sstevel@tonic-gate static void
27357c478bd9Sstevel@tonic-gate mir_wput_other(queue_t *q, mblk_t *mp)
27367c478bd9Sstevel@tonic-gate {
27377c478bd9Sstevel@tonic-gate 	mir_t	*mir = (mir_t *)q->q_ptr;
27387c478bd9Sstevel@tonic-gate 	struct iocblk	*iocp;
27397c478bd9Sstevel@tonic-gate 	uchar_t	*rptr = mp->b_rptr;
27407c478bd9Sstevel@tonic-gate 	bool_t	flush_in_svc = FALSE;
27417c478bd9Sstevel@tonic-gate 
27427c478bd9Sstevel@tonic-gate 	ASSERT(MUTEX_NOT_HELD(&mir->mir_mutex));
27437c478bd9Sstevel@tonic-gate 	switch (mp->b_datap->db_type) {
27447c478bd9Sstevel@tonic-gate 	case M_IOCTL:
27457c478bd9Sstevel@tonic-gate 		iocp = (struct iocblk *)rptr;
27467c478bd9Sstevel@tonic-gate 		switch (iocp->ioc_cmd) {
27477c478bd9Sstevel@tonic-gate 		case RPC_CLIENT:
27487c478bd9Sstevel@tonic-gate 			mutex_enter(&mir->mir_mutex);
27497c478bd9Sstevel@tonic-gate 			if (mir->mir_type != 0 &&
27507c478bd9Sstevel@tonic-gate 			    mir->mir_type != iocp->ioc_cmd) {
27517c478bd9Sstevel@tonic-gate ioc_eperm:
27527c478bd9Sstevel@tonic-gate 				mutex_exit(&mir->mir_mutex);
27537c478bd9Sstevel@tonic-gate 				iocp->ioc_error = EPERM;
27547c478bd9Sstevel@tonic-gate 				iocp->ioc_count = 0;
27557c478bd9Sstevel@tonic-gate 				mp->b_datap->db_type = M_IOCACK;
27567c478bd9Sstevel@tonic-gate 				qreply(q, mp);
27577c478bd9Sstevel@tonic-gate 				return;
27587c478bd9Sstevel@tonic-gate 			}
27597c478bd9Sstevel@tonic-gate 
27607c478bd9Sstevel@tonic-gate 			mir->mir_type = iocp->ioc_cmd;
27617c478bd9Sstevel@tonic-gate 
27627c478bd9Sstevel@tonic-gate 			/*
27637c478bd9Sstevel@tonic-gate 			 * Clear mir_hold_inbound which was set to 1 by
27647c478bd9Sstevel@tonic-gate 			 * mir_open.  This flag is not used on client
27657c478bd9Sstevel@tonic-gate 			 * streams.
27667c478bd9Sstevel@tonic-gate 			 */
27677c478bd9Sstevel@tonic-gate 			mir->mir_hold_inbound = 0;
27687c478bd9Sstevel@tonic-gate 			mir->mir_max_msg_sizep = &clnt_max_msg_size;
27697c478bd9Sstevel@tonic-gate 
27707c478bd9Sstevel@tonic-gate 			/*
27717c478bd9Sstevel@tonic-gate 			 * Start the idle timer.  See mir_timer() for more
27727c478bd9Sstevel@tonic-gate 			 * information on how client timers work.
27737c478bd9Sstevel@tonic-gate 			 */
27747c478bd9Sstevel@tonic-gate 			mir->mir_idle_timeout = clnt_idle_timeout;
27757c478bd9Sstevel@tonic-gate 			mir_clnt_idle_start(q, mir);
27767c478bd9Sstevel@tonic-gate 			mutex_exit(&mir->mir_mutex);
27777c478bd9Sstevel@tonic-gate 
27787c478bd9Sstevel@tonic-gate 			mp->b_datap->db_type = M_IOCACK;
27797c478bd9Sstevel@tonic-gate 			qreply(q, mp);
27807c478bd9Sstevel@tonic-gate 			return;
27817c478bd9Sstevel@tonic-gate 		case RPC_SERVER:
27827c478bd9Sstevel@tonic-gate 			mutex_enter(&mir->mir_mutex);
27837c478bd9Sstevel@tonic-gate 			if (mir->mir_type != 0 &&
27847c478bd9Sstevel@tonic-gate 			    mir->mir_type != iocp->ioc_cmd)
27857c478bd9Sstevel@tonic-gate 				goto ioc_eperm;
27867c478bd9Sstevel@tonic-gate 
27877c478bd9Sstevel@tonic-gate 			/*
27887c478bd9Sstevel@tonic-gate 			 * We don't clear mir_hold_inbound here because
27897c478bd9Sstevel@tonic-gate 			 * mir_hold_inbound is used in the flow control
27907c478bd9Sstevel@tonic-gate 			 * model. If we cleared it here, then we'd commit
27917c478bd9Sstevel@tonic-gate 			 * a small violation to the model where the transport
27927c478bd9Sstevel@tonic-gate 			 * might immediately block downstream flow.
27937c478bd9Sstevel@tonic-gate 			 */
27947c478bd9Sstevel@tonic-gate 
27957c478bd9Sstevel@tonic-gate 			mir->mir_type = iocp->ioc_cmd;
27967c478bd9Sstevel@tonic-gate 			mir->mir_max_msg_sizep = &svc_max_msg_size;
27977c478bd9Sstevel@tonic-gate 
27987c478bd9Sstevel@tonic-gate 			/*
27997c478bd9Sstevel@tonic-gate 			 * Start the idle timer.  See mir_timer() for more
28007c478bd9Sstevel@tonic-gate 			 * information on how server timers work.
28017c478bd9Sstevel@tonic-gate 			 *
28027c478bd9Sstevel@tonic-gate 			 * Note that it is important to start the idle timer
28037c478bd9Sstevel@tonic-gate 			 * here so that connections time out even if we
28047c478bd9Sstevel@tonic-gate 			 * never receive any data on them.
28057c478bd9Sstevel@tonic-gate 			 */
28067c478bd9Sstevel@tonic-gate 			mir->mir_idle_timeout = svc_idle_timeout;
28077c478bd9Sstevel@tonic-gate 			RPCLOG(16, "mir_wput_other starting idle timer on 0x%p "
28087c478bd9Sstevel@tonic-gate 			    "because we got RPC_SERVER ioctl\n", (void *)q);
28097c478bd9Sstevel@tonic-gate 			mir_svc_idle_start(q, mir);
28107c478bd9Sstevel@tonic-gate 			mutex_exit(&mir->mir_mutex);
28117c478bd9Sstevel@tonic-gate 
28127c478bd9Sstevel@tonic-gate 			mp->b_datap->db_type = M_IOCACK;
28137c478bd9Sstevel@tonic-gate 			qreply(q, mp);
28147c478bd9Sstevel@tonic-gate 			return;
28157c478bd9Sstevel@tonic-gate 		default:
28167c478bd9Sstevel@tonic-gate 			break;
28177c478bd9Sstevel@tonic-gate 		}
28187c478bd9Sstevel@tonic-gate 		break;
28197c478bd9Sstevel@tonic-gate 
28207c478bd9Sstevel@tonic-gate 	case M_PROTO:
28217c478bd9Sstevel@tonic-gate 		if (mir->mir_type == RPC_CLIENT) {
28227c478bd9Sstevel@tonic-gate 			/*
28237c478bd9Sstevel@tonic-gate 			 * We are likely being called from the context of a
28247c478bd9Sstevel@tonic-gate 			 * service procedure. So we need to enqueue. However
28257c478bd9Sstevel@tonic-gate 			 * enqueueing may put our message behind data messages.
28267c478bd9Sstevel@tonic-gate 			 * So flush the data first.
28277c478bd9Sstevel@tonic-gate 			 */
28287c478bd9Sstevel@tonic-gate 			flush_in_svc = TRUE;
28297c478bd9Sstevel@tonic-gate 		}
28307c478bd9Sstevel@tonic-gate 		if ((mp->b_wptr - rptr) < sizeof (uint32_t) ||
28317c478bd9Sstevel@tonic-gate 		    !IS_P2ALIGNED(rptr, sizeof (uint32_t)))
28327c478bd9Sstevel@tonic-gate 			break;
28337c478bd9Sstevel@tonic-gate 
28347c478bd9Sstevel@tonic-gate 		switch (((union T_primitives *)rptr)->type) {
28357c478bd9Sstevel@tonic-gate 		case T_DATA_REQ:
28367c478bd9Sstevel@tonic-gate 			/* Don't pass T_DATA_REQ messages downstream. */
28377c478bd9Sstevel@tonic-gate 			freemsg(mp);
28387c478bd9Sstevel@tonic-gate 			return;
28397c478bd9Sstevel@tonic-gate 		case T_ORDREL_REQ:
28407c478bd9Sstevel@tonic-gate 			RPCLOG(8, "mir_wput_other wq 0x%p: got T_ORDREL_REQ\n",
28417c478bd9Sstevel@tonic-gate 			    (void *)q);
28427c478bd9Sstevel@tonic-gate 			mutex_enter(&mir->mir_mutex);
28437c478bd9Sstevel@tonic-gate 			if (mir->mir_type != RPC_SERVER) {
28447c478bd9Sstevel@tonic-gate 				/*
28457c478bd9Sstevel@tonic-gate 				 * We are likely being called from
28467c478bd9Sstevel@tonic-gate 				 * clnt_dispatch_notifyall(). Sending
28477c478bd9Sstevel@tonic-gate 				 * a T_ORDREL_REQ will result in
28487c478bd9Sstevel@tonic-gate 				 * a some kind of _IND message being sent,
28497c478bd9Sstevel@tonic-gate 				 * some kind of _IND message being sent,
28507c478bd9Sstevel@tonic-gate 				 * which will cause another call to
28517c478bd9Sstevel@tonic-gate 				 * lean, queue this message.
28527c478bd9Sstevel@tonic-gate 				 */
28537c478bd9Sstevel@tonic-gate 				mir->mir_inwservice = 1;
28547c478bd9Sstevel@tonic-gate 				(void) putq(q, mp);
28557c478bd9Sstevel@tonic-gate 				mutex_exit(&mir->mir_mutex);
28567c478bd9Sstevel@tonic-gate 				return;
28577c478bd9Sstevel@tonic-gate 			}
28587c478bd9Sstevel@tonic-gate 
28597c478bd9Sstevel@tonic-gate 			/*
28607c478bd9Sstevel@tonic-gate 			 * Mark the structure such that we don't accept any
28617c478bd9Sstevel@tonic-gate 			 * more requests from client. We could defer this
28627c478bd9Sstevel@tonic-gate 			 * until we actually send the orderly release
28637c478bd9Sstevel@tonic-gate 			 * request downstream, but all that does is delay
28647c478bd9Sstevel@tonic-gate 			 * the closing of this stream.
28657c478bd9Sstevel@tonic-gate 			 */
28667c478bd9Sstevel@tonic-gate 			RPCLOG(16, "mir_wput_other wq 0x%p: got T_ORDREL_REQ "
28677c478bd9Sstevel@tonic-gate 			    " so calling mir_svc_start_close\n", (void *)q);
28687c478bd9Sstevel@tonic-gate 
28697c478bd9Sstevel@tonic-gate 			mir_svc_start_close(q, mir);
28707c478bd9Sstevel@tonic-gate 
28717c478bd9Sstevel@tonic-gate 			/*
28727c478bd9Sstevel@tonic-gate 			 * If we have sent down a T_ORDREL_REQ, don't send
28737c478bd9Sstevel@tonic-gate 			 * any more.
28747c478bd9Sstevel@tonic-gate 			 */
28757c478bd9Sstevel@tonic-gate 			if (mir->mir_ordrel_pending) {
28767c478bd9Sstevel@tonic-gate 				freemsg(mp);
28777c478bd9Sstevel@tonic-gate 				mutex_exit(&mir->mir_mutex);
28787c478bd9Sstevel@tonic-gate 				return;
28797c478bd9Sstevel@tonic-gate 			}
28807c478bd9Sstevel@tonic-gate 
28817c478bd9Sstevel@tonic-gate 			/*
28827c478bd9Sstevel@tonic-gate 			 * If the stream is not idle, then we hold the
28837c478bd9Sstevel@tonic-gate 			 * orderly release until it becomes idle.  This
28847c478bd9Sstevel@tonic-gate 			 * ensures that KRPC will be able to reply to
28857c478bd9Sstevel@tonic-gate 			 * all requests that we have passed to it.
28867c478bd9Sstevel@tonic-gate 			 *
28877c478bd9Sstevel@tonic-gate 			 * We also queue the request if there is data already
28887c478bd9Sstevel@tonic-gate 			 * queued, because we cannot allow the T_ORDREL_REQ
28897c478bd9Sstevel@tonic-gate 			 * to go before data. When we had a separate reply
28907c478bd9Sstevel@tonic-gate 			 * count, this was not a problem, because the
28917c478bd9Sstevel@tonic-gate 			 * reply count was reconciled when mir_wsrv()
28927c478bd9Sstevel@tonic-gate 			 * completed.
28937c478bd9Sstevel@tonic-gate 			 */
28947c478bd9Sstevel@tonic-gate 			if (!MIR_SVC_QUIESCED(mir) ||
28957c478bd9Sstevel@tonic-gate 			    mir->mir_inwservice == 1) {
28967c478bd9Sstevel@tonic-gate 				mir->mir_inwservice = 1;
28977c478bd9Sstevel@tonic-gate 				(void) putq(q, mp);
28987c478bd9Sstevel@tonic-gate 
28997c478bd9Sstevel@tonic-gate 				RPCLOG(16, "mir_wput_other: queuing "
29007c478bd9Sstevel@tonic-gate 				    "T_ORDREL_REQ on 0x%p\n", (void *)q);
29017c478bd9Sstevel@tonic-gate 
29027c478bd9Sstevel@tonic-gate 				mutex_exit(&mir->mir_mutex);
29037c478bd9Sstevel@tonic-gate 				return;
29047c478bd9Sstevel@tonic-gate 			}
29057c478bd9Sstevel@tonic-gate 
29067c478bd9Sstevel@tonic-gate 			/*
29077c478bd9Sstevel@tonic-gate 			 * Mark the structure so that we know we sent
29087c478bd9Sstevel@tonic-gate 			 * an orderly release request, and reset the idle timer.
29097c478bd9Sstevel@tonic-gate 			 */
29107c478bd9Sstevel@tonic-gate 			mir->mir_ordrel_pending = 1;
29117c478bd9Sstevel@tonic-gate 
29127c478bd9Sstevel@tonic-gate 			RPCLOG(16, "mir_wput_other: calling mir_svc_idle_start"
29137c478bd9Sstevel@tonic-gate 			    " on 0x%p because we got T_ORDREL_REQ\n",
29147c478bd9Sstevel@tonic-gate 			    (void *)q);
29157c478bd9Sstevel@tonic-gate 
29167c478bd9Sstevel@tonic-gate 			mir_svc_idle_start(q, mir);
29177c478bd9Sstevel@tonic-gate 			mutex_exit(&mir->mir_mutex);
29187c478bd9Sstevel@tonic-gate 
29197c478bd9Sstevel@tonic-gate 			/*
29207c478bd9Sstevel@tonic-gate 			 * When we break, we will putnext the T_ORDREL_REQ.
29217c478bd9Sstevel@tonic-gate 			 */
29227c478bd9Sstevel@tonic-gate 			break;
29237c478bd9Sstevel@tonic-gate 
29247c478bd9Sstevel@tonic-gate 		case T_CONN_REQ:
29257c478bd9Sstevel@tonic-gate 			mutex_enter(&mir->mir_mutex);
29267c478bd9Sstevel@tonic-gate 			if (mir->mir_head_mp != NULL) {
29277c478bd9Sstevel@tonic-gate 				freemsg(mir->mir_head_mp);
29287c478bd9Sstevel@tonic-gate 				mir->mir_head_mp = NULL;
29297c478bd9Sstevel@tonic-gate 				mir->mir_tail_mp = NULL;
29307c478bd9Sstevel@tonic-gate 			}
29317c478bd9Sstevel@tonic-gate 			mir->mir_frag_len = -(int32_t)sizeof (uint32_t);
29327c478bd9Sstevel@tonic-gate 			/*
29337c478bd9Sstevel@tonic-gate 			 * Restart timer in case mir_clnt_idle_do_stop() was
29347c478bd9Sstevel@tonic-gate 			 * called.
29357c478bd9Sstevel@tonic-gate 			 */
29367c478bd9Sstevel@tonic-gate 			mir->mir_idle_timeout = clnt_idle_timeout;
29377c478bd9Sstevel@tonic-gate 			mir_clnt_idle_stop(q, mir);
29387c478bd9Sstevel@tonic-gate 			mir_clnt_idle_start(q, mir);
29397c478bd9Sstevel@tonic-gate 			mutex_exit(&mir->mir_mutex);
29407c478bd9Sstevel@tonic-gate 			break;
29417c478bd9Sstevel@tonic-gate 
29427c478bd9Sstevel@tonic-gate 		default:
29437c478bd9Sstevel@tonic-gate 			/*
29447c478bd9Sstevel@tonic-gate 			 * T_DISCON_REQ is one of the interesting default
29457c478bd9Sstevel@tonic-gate 			 * cases here. Ideally, an M_FLUSH is done before
29467c478bd9Sstevel@tonic-gate 			 * T_DISCON_REQ is done. However, that is somewhat
29477c478bd9Sstevel@tonic-gate 			 * cumbersome for clnt_cots.c to do. So we queue
29487c478bd9Sstevel@tonic-gate 			 * T_DISCON_REQ, and let the service procedure
29497c478bd9Sstevel@tonic-gate 			 * flush all M_DATA.
29507c478bd9Sstevel@tonic-gate 			 */
29517c478bd9Sstevel@tonic-gate 			break;
29527c478bd9Sstevel@tonic-gate 		}
29537c478bd9Sstevel@tonic-gate 		/* fallthru */;
29547c478bd9Sstevel@tonic-gate 	default:
29557c478bd9Sstevel@tonic-gate 		if (mp->b_datap->db_type >= QPCTL) {
29567c478bd9Sstevel@tonic-gate 			if (mp->b_datap->db_type == M_FLUSH) {
29577c478bd9Sstevel@tonic-gate 				if (mir->mir_type == RPC_CLIENT &&
29587c478bd9Sstevel@tonic-gate 				    *mp->b_rptr & FLUSHW) {
29597c478bd9Sstevel@tonic-gate 					RPCLOG(32, "mir_wput_other: flushing "
29607c478bd9Sstevel@tonic-gate 					    "wq 0x%p\n", (void *)q);
29617c478bd9Sstevel@tonic-gate 					if (*mp->b_rptr & FLUSHBAND) {
29627c478bd9Sstevel@tonic-gate 						flushband(q, *(mp->b_rptr + 1),
29637c478bd9Sstevel@tonic-gate 						    FLUSHDATA);
29647c478bd9Sstevel@tonic-gate 					} else {
29657c478bd9Sstevel@tonic-gate 						flushq(q, FLUSHDATA);
29667c478bd9Sstevel@tonic-gate 					}
29677c478bd9Sstevel@tonic-gate 				} else {
29687c478bd9Sstevel@tonic-gate 					RPCLOG(32, "mir_wput_other: ignoring "
29697c478bd9Sstevel@tonic-gate 					    "M_FLUSH on wq 0x%p\n", (void *)q);
29707c478bd9Sstevel@tonic-gate 				}
29717c478bd9Sstevel@tonic-gate 			}
29727c478bd9Sstevel@tonic-gate 			break;
29737c478bd9Sstevel@tonic-gate 		}
29747c478bd9Sstevel@tonic-gate 
29757c478bd9Sstevel@tonic-gate 		mutex_enter(&mir->mir_mutex);
29767c478bd9Sstevel@tonic-gate 		if (mir->mir_inwservice == 0 && MIR_WCANPUTNEXT(mir, q)) {
29777c478bd9Sstevel@tonic-gate 			mutex_exit(&mir->mir_mutex);
29787c478bd9Sstevel@tonic-gate 			break;
29797c478bd9Sstevel@tonic-gate 		}
29807c478bd9Sstevel@tonic-gate 		mir->mir_inwservice = 1;
29817c478bd9Sstevel@tonic-gate 		mir->mir_inwflushdata = flush_in_svc;
29827c478bd9Sstevel@tonic-gate 		(void) putq(q, mp);
29837c478bd9Sstevel@tonic-gate 		mutex_exit(&mir->mir_mutex);
29847c478bd9Sstevel@tonic-gate 		qenable(q);
29857c478bd9Sstevel@tonic-gate 
29867c478bd9Sstevel@tonic-gate 		return;
29877c478bd9Sstevel@tonic-gate 	}
29887c478bd9Sstevel@tonic-gate 	putnext(q, mp);
29897c478bd9Sstevel@tonic-gate }
29907c478bd9Sstevel@tonic-gate 
29917c478bd9Sstevel@tonic-gate static void
29927c478bd9Sstevel@tonic-gate mir_wsrv(queue_t *q)
29937c478bd9Sstevel@tonic-gate {
29947c478bd9Sstevel@tonic-gate 	mblk_t	*mp;
29957c478bd9Sstevel@tonic-gate 	mir_t	*mir;
29967c478bd9Sstevel@tonic-gate 	bool_t flushdata;
29977c478bd9Sstevel@tonic-gate 
29987c478bd9Sstevel@tonic-gate 	mir = (mir_t *)q->q_ptr;
29997c478bd9Sstevel@tonic-gate 	mutex_enter(&mir->mir_mutex);
30007c478bd9Sstevel@tonic-gate 
30017c478bd9Sstevel@tonic-gate 	flushdata = mir->mir_inwflushdata;
30027c478bd9Sstevel@tonic-gate 	mir->mir_inwflushdata = 0;
30037c478bd9Sstevel@tonic-gate 
30047c478bd9Sstevel@tonic-gate 	while (mp = getq(q)) {
30057c478bd9Sstevel@tonic-gate 		if (mp->b_datap->db_type == M_DATA) {
30067c478bd9Sstevel@tonic-gate 			/*
30077c478bd9Sstevel@tonic-gate 			 * Do not send any more data if we have sent
30087c478bd9Sstevel@tonic-gate 			 * a T_ORDREL_REQ.
30097c478bd9Sstevel@tonic-gate 			 */
30107c478bd9Sstevel@tonic-gate 			if (flushdata || mir->mir_ordrel_pending == 1) {
30117c478bd9Sstevel@tonic-gate 				freemsg(mp);
30127c478bd9Sstevel@tonic-gate 				continue;
30137c478bd9Sstevel@tonic-gate 			}
30147c478bd9Sstevel@tonic-gate 
30157c478bd9Sstevel@tonic-gate 			/*
30167c478bd9Sstevel@tonic-gate 			 * Make sure that the stream can really handle more
30177c478bd9Sstevel@tonic-gate 			 * data.
30187c478bd9Sstevel@tonic-gate 			 */
30197c478bd9Sstevel@tonic-gate 			if (!MIR_WCANPUTNEXT(mir, q)) {
30207c478bd9Sstevel@tonic-gate 				(void) putbq(q, mp);
30217c478bd9Sstevel@tonic-gate 				mutex_exit(&mir->mir_mutex);
30227c478bd9Sstevel@tonic-gate 				return;
30237c478bd9Sstevel@tonic-gate 			}
30247c478bd9Sstevel@tonic-gate 
30257c478bd9Sstevel@tonic-gate 			/*
30267c478bd9Sstevel@tonic-gate 			 * Now we pass the RPC message downstream.
30277c478bd9Sstevel@tonic-gate 			 */
30287c478bd9Sstevel@tonic-gate 			mutex_exit(&mir->mir_mutex);
30297c478bd9Sstevel@tonic-gate 			putnext(q, mp);
30307c478bd9Sstevel@tonic-gate 			mutex_enter(&mir->mir_mutex);
30317c478bd9Sstevel@tonic-gate 			continue;
30327c478bd9Sstevel@tonic-gate 		}
30337c478bd9Sstevel@tonic-gate 
30347c478bd9Sstevel@tonic-gate 		/*
30357c478bd9Sstevel@tonic-gate 		 * This is not an RPC message, pass it downstream
30367c478bd9Sstevel@tonic-gate 		 * (ignoring flow control) if the server side is not sending a
30377c478bd9Sstevel@tonic-gate 		 * T_ORDREL_REQ downstream.
30387c478bd9Sstevel@tonic-gate 		 */
30397c478bd9Sstevel@tonic-gate 		if (mir->mir_type != RPC_SERVER ||
30407c478bd9Sstevel@tonic-gate 		    ((union T_primitives *)mp->b_rptr)->type !=
30417c478bd9Sstevel@tonic-gate 		    T_ORDREL_REQ) {
30427c478bd9Sstevel@tonic-gate 			mutex_exit(&mir->mir_mutex);
30437c478bd9Sstevel@tonic-gate 			putnext(q, mp);
30447c478bd9Sstevel@tonic-gate 			mutex_enter(&mir->mir_mutex);
30457c478bd9Sstevel@tonic-gate 			continue;
30467c478bd9Sstevel@tonic-gate 		}
30477c478bd9Sstevel@tonic-gate 
30487c478bd9Sstevel@tonic-gate 		if (mir->mir_ordrel_pending == 1) {
30497c478bd9Sstevel@tonic-gate 			/*
30507c478bd9Sstevel@tonic-gate 			 * Don't send two T_ORDRELs
30517c478bd9Sstevel@tonic-gate 			 */
30527c478bd9Sstevel@tonic-gate 			freemsg(mp);
30537c478bd9Sstevel@tonic-gate 			continue;
30547c478bd9Sstevel@tonic-gate 		}
30557c478bd9Sstevel@tonic-gate 
30567c478bd9Sstevel@tonic-gate 		/*
30577c478bd9Sstevel@tonic-gate 		 * Mark the structure so that we know we sent an orderly
30587c478bd9Sstevel@tonic-gate 		 * release request.  We will check to see slot is idle at the
30597c478bd9Sstevel@tonic-gate 		 * end of this routine, and if so, reset the idle timer to
30607c478bd9Sstevel@tonic-gate 		 * handle orderly release timeouts.
30617c478bd9Sstevel@tonic-gate 		 */
30627c478bd9Sstevel@tonic-gate 		mir->mir_ordrel_pending = 1;
30637c478bd9Sstevel@tonic-gate 		RPCLOG(16, "mir_wsrv: sending ordrel req on q 0x%p\n",
30647c478bd9Sstevel@tonic-gate 		    (void *)q);
30657c478bd9Sstevel@tonic-gate 		/*
30667c478bd9Sstevel@tonic-gate 		 * Send the orderly release downstream. If there are other
30677c478bd9Sstevel@tonic-gate 		 * pending replies we won't be able to send them.  However,
30687c478bd9Sstevel@tonic-gate 		 * the only reason we should send the orderly release is if
30697c478bd9Sstevel@tonic-gate 		 * we were idle, or if an unusual event occurred.
30707c478bd9Sstevel@tonic-gate 		 */
30717c478bd9Sstevel@tonic-gate 		mutex_exit(&mir->mir_mutex);
30727c478bd9Sstevel@tonic-gate 		putnext(q, mp);
30737c478bd9Sstevel@tonic-gate 		mutex_enter(&mir->mir_mutex);
30747c478bd9Sstevel@tonic-gate 	}
30757c478bd9Sstevel@tonic-gate 
30767c478bd9Sstevel@tonic-gate 	if (q->q_first == NULL)
30777c478bd9Sstevel@tonic-gate 		/*
30787c478bd9Sstevel@tonic-gate 		 * If we call mir_svc_idle_start() below, then
30797c478bd9Sstevel@tonic-gate 		 * clearing mir_inwservice here will also result in
30807c478bd9Sstevel@tonic-gate 		 * any thread waiting in mir_close() to be signaled.
30817c478bd9Sstevel@tonic-gate 		 */
30827c478bd9Sstevel@tonic-gate 		mir->mir_inwservice = 0;
30837c478bd9Sstevel@tonic-gate 
30847c478bd9Sstevel@tonic-gate 	if (mir->mir_type != RPC_SERVER) {
30857c478bd9Sstevel@tonic-gate 		mutex_exit(&mir->mir_mutex);
30867c478bd9Sstevel@tonic-gate 		return;
30877c478bd9Sstevel@tonic-gate 	}
30887c478bd9Sstevel@tonic-gate 
30897c478bd9Sstevel@tonic-gate 	/*
30907c478bd9Sstevel@tonic-gate 	 * If idle we call mir_svc_idle_start to start the timer (or wakeup
30917c478bd9Sstevel@tonic-gate 	 * a close). Also make sure not to start the idle timer on the
30927c478bd9Sstevel@tonic-gate 	 * listener stream. This can cause nfsd to send an orderly release
30937c478bd9Sstevel@tonic-gate 	 * command on the listener stream.
30947c478bd9Sstevel@tonic-gate 	 */
30957c478bd9Sstevel@tonic-gate 	if (MIR_SVC_QUIESCED(mir) && !(mir->mir_listen_stream)) {
30967c478bd9Sstevel@tonic-gate 		RPCLOG(16, "mir_wsrv: calling mir_svc_idle_start on 0x%p "
30977c478bd9Sstevel@tonic-gate 		    "because mir slot is idle\n", (void *)q);
30987c478bd9Sstevel@tonic-gate 		mir_svc_idle_start(q, mir);
30997c478bd9Sstevel@tonic-gate 	}
31007c478bd9Sstevel@tonic-gate 
31017c478bd9Sstevel@tonic-gate 	/*
31027c478bd9Sstevel@tonic-gate 	 * If outbound flow control has been relieved, then allow new
31037c478bd9Sstevel@tonic-gate 	 * inbound requests to be processed.
31047c478bd9Sstevel@tonic-gate 	 */
31057c478bd9Sstevel@tonic-gate 	if (mir->mir_hold_inbound) {
31067c478bd9Sstevel@tonic-gate 		mir->mir_hold_inbound = 0;
31077c478bd9Sstevel@tonic-gate 		qenable(RD(q));
31087c478bd9Sstevel@tonic-gate 	}
31097c478bd9Sstevel@tonic-gate 	mutex_exit(&mir->mir_mutex);
31107c478bd9Sstevel@tonic-gate }
31117c478bd9Sstevel@tonic-gate 
31127c478bd9Sstevel@tonic-gate static void
31137c478bd9Sstevel@tonic-gate mir_disconnect(queue_t *q, mir_t *mir)
31147c478bd9Sstevel@tonic-gate {
31157c478bd9Sstevel@tonic-gate 	ASSERT(MUTEX_HELD(&mir->mir_mutex));
31167c478bd9Sstevel@tonic-gate 
31177c478bd9Sstevel@tonic-gate 	switch (mir->mir_type) {
31187c478bd9Sstevel@tonic-gate 	case RPC_CLIENT:
31197c478bd9Sstevel@tonic-gate 		/*
31207c478bd9Sstevel@tonic-gate 		 * We are disconnecting, but not necessarily
31217c478bd9Sstevel@tonic-gate 		 * closing. By not closing, we will fail to
31227c478bd9Sstevel@tonic-gate 		 * pick up a possibly changed global timeout value,
31237c478bd9Sstevel@tonic-gate 		 * unless we store it now.
31247c478bd9Sstevel@tonic-gate 		 */
31257c478bd9Sstevel@tonic-gate 		mir->mir_idle_timeout = clnt_idle_timeout;
31267c478bd9Sstevel@tonic-gate 		mir_clnt_idle_start(WR(q), mir);
31277c478bd9Sstevel@tonic-gate 		mutex_exit(&mir->mir_mutex);
31287c478bd9Sstevel@tonic-gate 
31297c478bd9Sstevel@tonic-gate 		/*
31307c478bd9Sstevel@tonic-gate 		 * T_DISCON_REQ is passed to KRPC as an integer value
31317c478bd9Sstevel@tonic-gate 		 * (this is not a TPI message).  It is used as a
31327c478bd9Sstevel@tonic-gate 		 * convenient value to indicate a sanity check
31337c478bd9Sstevel@tonic-gate 		 * failure -- the same KRPC routine is also called
31347c478bd9Sstevel@tonic-gate 		 * for T_DISCON_INDs and T_ORDREL_INDs.
31357c478bd9Sstevel@tonic-gate 		 */
31367c478bd9Sstevel@tonic-gate 		clnt_dispatch_notifyall(WR(q), T_DISCON_REQ, 0);
31377c478bd9Sstevel@tonic-gate 		break;
31387c478bd9Sstevel@tonic-gate 
31397c478bd9Sstevel@tonic-gate 	case RPC_SERVER:
31407c478bd9Sstevel@tonic-gate 		mir->mir_svc_no_more_msgs = 1;
31417c478bd9Sstevel@tonic-gate 		mir_svc_idle_stop(WR(q), mir);
31427c478bd9Sstevel@tonic-gate 		mutex_exit(&mir->mir_mutex);
31437c478bd9Sstevel@tonic-gate 		RPCLOG(16, "mir_disconnect: telling "
31447c478bd9Sstevel@tonic-gate 		    "stream head listener to disconnect stream "
31457c478bd9Sstevel@tonic-gate 		    "(0x%p)\n", (void *) q);
31467c478bd9Sstevel@tonic-gate 		(void) mir_svc_policy_notify(q, 2);
31477c478bd9Sstevel@tonic-gate 		break;
31487c478bd9Sstevel@tonic-gate 
31497c478bd9Sstevel@tonic-gate 	default:
31507c478bd9Sstevel@tonic-gate 		mutex_exit(&mir->mir_mutex);
31517c478bd9Sstevel@tonic-gate 		break;
31527c478bd9Sstevel@tonic-gate 	}
31537c478bd9Sstevel@tonic-gate }
31547c478bd9Sstevel@tonic-gate 
31557c478bd9Sstevel@tonic-gate /*
31567c478bd9Sstevel@tonic-gate  * do a sanity check on the length of the fragment.
31577c478bd9Sstevel@tonic-gate  * returns 1 if bad else 0.
31587c478bd9Sstevel@tonic-gate  */
31597c478bd9Sstevel@tonic-gate static int
31607c478bd9Sstevel@tonic-gate mir_check_len(queue_t *q, int32_t frag_len,
31617c478bd9Sstevel@tonic-gate     mblk_t *head_mp)
31627c478bd9Sstevel@tonic-gate {
31637c478bd9Sstevel@tonic-gate 	mir_t   *mir;
31647c478bd9Sstevel@tonic-gate 
31657c478bd9Sstevel@tonic-gate 	mir = (mir_t *)q->q_ptr;
31667c478bd9Sstevel@tonic-gate 
31677c478bd9Sstevel@tonic-gate 	/*
31687c478bd9Sstevel@tonic-gate 	 * Do a sanity check on the message length.  If this message is
31697c478bd9Sstevel@tonic-gate 	 * getting excessively large, shut down the connection.
31707c478bd9Sstevel@tonic-gate 	 */
31717c478bd9Sstevel@tonic-gate 
31727c478bd9Sstevel@tonic-gate 	if ((frag_len <= 0) || (mir->mir_max_msg_sizep == NULL) ||
31737c478bd9Sstevel@tonic-gate 	    (frag_len <= *mir->mir_max_msg_sizep)) {
31747c478bd9Sstevel@tonic-gate 		return (0);
31757c478bd9Sstevel@tonic-gate 	}
31767c478bd9Sstevel@tonic-gate 
31777c478bd9Sstevel@tonic-gate 	freemsg(head_mp);
31787c478bd9Sstevel@tonic-gate 	mir->mir_head_mp = (mblk_t *)0;
31797c478bd9Sstevel@tonic-gate 	mir->mir_frag_len = -(int)sizeof (uint32_t);
31807c478bd9Sstevel@tonic-gate 	if (mir->mir_type != RPC_SERVER || mir->mir_setup_complete) {
31817c478bd9Sstevel@tonic-gate 		cmn_err(CE_NOTE,
31827c478bd9Sstevel@tonic-gate 		    "KRPC: record fragment from %s of size(%d) exceeds "
31837c478bd9Sstevel@tonic-gate 		    "maximum (%u). Disconnecting",
31847c478bd9Sstevel@tonic-gate 		    (mir->mir_type == RPC_CLIENT) ? "server" :
31857c478bd9Sstevel@tonic-gate 		    (mir->mir_type == RPC_SERVER) ? "client" :
31867c478bd9Sstevel@tonic-gate 		    "test tool",
31877c478bd9Sstevel@tonic-gate 		    frag_len, *mir->mir_max_msg_sizep);
31887c478bd9Sstevel@tonic-gate 	}
31897c478bd9Sstevel@tonic-gate 
31907c478bd9Sstevel@tonic-gate 	mir_disconnect(q, mir);
31917c478bd9Sstevel@tonic-gate 	return (1);
31927c478bd9Sstevel@tonic-gate }
3193