xref: /titanic_51/usr/src/uts/common/os/sunmdi.c (revision ab412e7222cc32794594e5ad31919652d757c81f)
17c478bd9Sstevel@tonic-gate /*
27c478bd9Sstevel@tonic-gate  * CDDL HEADER START
37c478bd9Sstevel@tonic-gate  *
47c478bd9Sstevel@tonic-gate  * The contents of this file are subject to the terms of the
5ee28b439Scm136836  * Common Development and Distribution License (the "License").
6ee28b439Scm136836  * You may not use this file except in compliance with the License.
77c478bd9Sstevel@tonic-gate  *
87c478bd9Sstevel@tonic-gate  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
97c478bd9Sstevel@tonic-gate  * or http://www.opensolaris.org/os/licensing.
107c478bd9Sstevel@tonic-gate  * See the License for the specific language governing permissions
117c478bd9Sstevel@tonic-gate  * and limitations under the License.
127c478bd9Sstevel@tonic-gate  *
137c478bd9Sstevel@tonic-gate  * When distributing Covered Code, include this CDDL HEADER in each
147c478bd9Sstevel@tonic-gate  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
157c478bd9Sstevel@tonic-gate  * If applicable, add the following below this CDDL HEADER, with the
167c478bd9Sstevel@tonic-gate  * fields enclosed by brackets "[]" replaced with your own identifying
177c478bd9Sstevel@tonic-gate  * information: Portions Copyright [yyyy] [name of copyright owner]
187c478bd9Sstevel@tonic-gate  *
197c478bd9Sstevel@tonic-gate  * CDDL HEADER END
207c478bd9Sstevel@tonic-gate  */
217c478bd9Sstevel@tonic-gate /*
2255e592a2SRandall Ralphs  * Copyright 2009 Sun Microsystems, Inc.  All rights reserved.
237c478bd9Sstevel@tonic-gate  * Use is subject to license terms.
247c478bd9Sstevel@tonic-gate  */
257c478bd9Sstevel@tonic-gate 
267c478bd9Sstevel@tonic-gate /*
277c478bd9Sstevel@tonic-gate  * Multipath driver interface (MDI) implementation; see mdi_impl.h for a more
287c478bd9Sstevel@tonic-gate  * detailed discussion of the overall mpxio architecture.
297c478bd9Sstevel@tonic-gate  *
307c478bd9Sstevel@tonic-gate  * Default locking order:
317c478bd9Sstevel@tonic-gate  *
 * _NOTE(LOCK_ORDER(mdi_mutex mdi_vhci::vh_phci_mutex))
 * _NOTE(LOCK_ORDER(mdi_mutex mdi_vhci::vh_client_mutex))
 * _NOTE(LOCK_ORDER(mdi_vhci::vh_phci_mutex mdi_phci::ph_mutex))
 * _NOTE(LOCK_ORDER(mdi_vhci::vh_client_mutex mdi_client::ct_mutex))
367c478bd9Sstevel@tonic-gate  * _NOTE(LOCK_ORDER(mdi_phci::ph_mutex mdi_pathinfo::pi_mutex))
377c478bd9Sstevel@tonic-gate  * _NOTE(LOCK_ORDER(mdi_phci::ph_mutex mdi_client::ct_mutex))
387c478bd9Sstevel@tonic-gate  * _NOTE(LOCK_ORDER(mdi_client::ct_mutex mdi_pathinfo::pi_mutex))
397c478bd9Sstevel@tonic-gate  */
407c478bd9Sstevel@tonic-gate 
417c478bd9Sstevel@tonic-gate #include <sys/note.h>
427c478bd9Sstevel@tonic-gate #include <sys/types.h>
437c478bd9Sstevel@tonic-gate #include <sys/varargs.h>
447c478bd9Sstevel@tonic-gate #include <sys/param.h>
457c478bd9Sstevel@tonic-gate #include <sys/errno.h>
467c478bd9Sstevel@tonic-gate #include <sys/uio.h>
477c478bd9Sstevel@tonic-gate #include <sys/buf.h>
487c478bd9Sstevel@tonic-gate #include <sys/modctl.h>
497c478bd9Sstevel@tonic-gate #include <sys/open.h>
507c478bd9Sstevel@tonic-gate #include <sys/kmem.h>
517c478bd9Sstevel@tonic-gate #include <sys/poll.h>
527c478bd9Sstevel@tonic-gate #include <sys/conf.h>
537c478bd9Sstevel@tonic-gate #include <sys/bootconf.h>
547c478bd9Sstevel@tonic-gate #include <sys/cmn_err.h>
557c478bd9Sstevel@tonic-gate #include <sys/stat.h>
567c478bd9Sstevel@tonic-gate #include <sys/ddi.h>
577c478bd9Sstevel@tonic-gate #include <sys/sunddi.h>
587c478bd9Sstevel@tonic-gate #include <sys/ddipropdefs.h>
597c478bd9Sstevel@tonic-gate #include <sys/sunndi.h>
607c478bd9Sstevel@tonic-gate #include <sys/ndi_impldefs.h>
617c478bd9Sstevel@tonic-gate #include <sys/promif.h>
627c478bd9Sstevel@tonic-gate #include <sys/sunmdi.h>
637c478bd9Sstevel@tonic-gate #include <sys/mdi_impldefs.h>
647c478bd9Sstevel@tonic-gate #include <sys/taskq.h>
657c478bd9Sstevel@tonic-gate #include <sys/epm.h>
667c478bd9Sstevel@tonic-gate #include <sys/sunpm.h>
673c34adc5Sramat #include <sys/modhash.h>
688c4f8890Srs135747 #include <sys/disp.h>
698c4f8890Srs135747 #include <sys/autoconf.h>
70f7209cf2Spramodbg #include <sys/sysmacros.h>
717c478bd9Sstevel@tonic-gate 
/*
 * Debug logging support.
 *
 * On DEBUG kernels MDI_DEBUG(level, (args)) calls i_mdi_log with the
 * parenthesized argument list 'args' when mdi_debug is at least 'level'.
 * MDI_WARN, MDI_NOTE and MDI_CONT each expand to the first two i_mdi_log
 * arguments: a cmn_err level followed by the calling function's name.
 * On non-DEBUG kernels MDI_DEBUG expands to nothing.
 *
 * The DEBUG expansion is wrapped in do { } while (0) so that it is a single
 * statement: a bare "if" would silently capture the "else" of a caller
 * written as "if (x) MDI_DEBUG(...); else ...".
 *
 * mdi_debug_logonly and mdi_debug_consoleonly are only declared in this
 * section; presumably they steer where i_mdi_log sends its output --
 * confirm against i_mdi_log().
 */
#ifdef	DEBUG
#include <sys/debug.h>
int	mdi_debug = 1;
int	mdi_debug_logonly = 0;
#define	MDI_DEBUG(dbglevel, pargs)				\
	do {							\
		if (mdi_debug >= (dbglevel))			\
			i_mdi_log pargs;			\
	_NOTE(CONSTCOND) } while (0)
#define	MDI_WARN	CE_WARN, __func__
#define	MDI_NOTE	CE_NOTE, __func__
#define	MDI_CONT	CE_CONT, __func__
static void i_mdi_log(int, const char *, dev_info_t *, const char *, ...);
#else	/* !DEBUG */
#define	MDI_DEBUG(dbglevel, pargs)
#endif	/* DEBUG */
int	mdi_debug_consoleonly = 0;
857c478bd9Sstevel@tonic-gate 
867c478bd9Sstevel@tonic-gate extern pri_t	minclsyspri;
877c478bd9Sstevel@tonic-gate extern int	modrootloaded;
887c478bd9Sstevel@tonic-gate 
897c478bd9Sstevel@tonic-gate /*
907c478bd9Sstevel@tonic-gate  * Global mutex:
915e3986cbScth  * Protects vHCI list and structure members.
927c478bd9Sstevel@tonic-gate  */
937c478bd9Sstevel@tonic-gate kmutex_t	mdi_mutex;
947c478bd9Sstevel@tonic-gate 
957c478bd9Sstevel@tonic-gate /*
967c478bd9Sstevel@tonic-gate  * Registered vHCI class driver lists
977c478bd9Sstevel@tonic-gate  */
987c478bd9Sstevel@tonic-gate int		mdi_vhci_count;
997c478bd9Sstevel@tonic-gate mdi_vhci_t	*mdi_vhci_head;
1007c478bd9Sstevel@tonic-gate mdi_vhci_t	*mdi_vhci_tail;
1017c478bd9Sstevel@tonic-gate 
1027c478bd9Sstevel@tonic-gate /*
1037c478bd9Sstevel@tonic-gate  * Client Hash Table size
1047c478bd9Sstevel@tonic-gate  */
1057c478bd9Sstevel@tonic-gate static int	mdi_client_table_size = CLIENT_HASH_TABLE_SIZE;
1067c478bd9Sstevel@tonic-gate 
1077c478bd9Sstevel@tonic-gate /*
1087c478bd9Sstevel@tonic-gate  * taskq interface definitions
1097c478bd9Sstevel@tonic-gate  */
1107c478bd9Sstevel@tonic-gate #define	MDI_TASKQ_N_THREADS	8
1117c478bd9Sstevel@tonic-gate #define	MDI_TASKQ_PRI		minclsyspri
1127c478bd9Sstevel@tonic-gate #define	MDI_TASKQ_MINALLOC	(4*mdi_taskq_n_threads)
1137c478bd9Sstevel@tonic-gate #define	MDI_TASKQ_MAXALLOC	(500*mdi_taskq_n_threads)
1147c478bd9Sstevel@tonic-gate 
1157c478bd9Sstevel@tonic-gate taskq_t				*mdi_taskq;
1167c478bd9Sstevel@tonic-gate static uint_t			mdi_taskq_n_threads = MDI_TASKQ_N_THREADS;
1177c478bd9Sstevel@tonic-gate 
/* Number of clock ticks in one second, as computed by drv_usectohz() */
#define	TICKS_PER_SECOND	(drv_usectohz(1000000))

/*
 * vhci cache flushing:
 *
 * mdi_vhcache_flush_delay
 *	The cached vhci data must stay "quiet" for this many seconds before
 *	it is flushed to the disk.
 *
 * mdi_vhcache_flush_daemon_idle_time
 *	Number of seconds the vhcache flush daemon sleeps idle before it
 *	exits.
 */
static int mdi_vhcache_flush_delay = 10;
static int mdi_vhcache_flush_daemon_idle_time = 60;

/*
 * When a bus_config_one fails, MDI falls back to discovering all paths.
 * The tunables below control that fallback.
 *
 * mdi_path_discovery_boot
 *	How many times path discovery is attempted during early boot.
 *	There is probably never a reason to set this above one.
 *
 * mdi_path_discovery_postboot
 *	How many times path discovery is attempted after early boot.
 *	Keep it at two or more so that iscsi paths, which may show up very
 *	late during booting, can still be discovered.
 *
 * mdi_path_discovery_interval
 *	Minimum number of seconds MDI waits between successive discoveries
 *	of all paths.  A value of -1 disables discovery of all paths.
 */
static int mdi_path_discovery_boot = 1;
static int mdi_path_discovery_postboot = 2;
static int mdi_path_discovery_interval = 10;

/*
 * Number of seconds the asynchronous configuration thread sleeps idle
 * before it exits.
 */
static int mdi_async_config_idle_time = 600;

/* Hash size used for the bus config cache */
static int mdi_bus_config_cache_hash_size = 256;

/* When set, turns off multithreaded configuration for certain operations */
static int mdi_mtc_off = 0;
1607c478bd9Sstevel@tonic-gate 
1617c478bd9Sstevel@tonic-gate /*
162602ca9eaScth  * The "path" to a pathinfo node is identical to the /devices path to a
163602ca9eaScth  * devinfo node had the device been enumerated under a pHCI instead of
164602ca9eaScth  * a vHCI.  This pathinfo "path" is associated with a 'path_instance'.
165602ca9eaScth  * This association persists across create/delete of the pathinfo nodes,
166602ca9eaScth  * but not across reboot.
167602ca9eaScth  */
168602ca9eaScth static uint_t		mdi_pathmap_instance = 1;	/* 0 -> any path */
169602ca9eaScth static int		mdi_pathmap_hash_size = 256;
170602ca9eaScth static kmutex_t		mdi_pathmap_mutex;
171602ca9eaScth static mod_hash_t	*mdi_pathmap_bypath;		/* "path"->instance */
172602ca9eaScth static mod_hash_t	*mdi_pathmap_byinstance;	/* instance->"path" */
1734c06356bSdh142964 static mod_hash_t	*mdi_pathmap_sbyinstance;	/* inst->shortpath */
174602ca9eaScth 
/*
 * Name of the MDI component property and the values it may take
 */
const char	*mdi_component_prop = "mpxio-component";
const char	*mdi_component_prop_vhci = "vhci";
const char	*mdi_component_prop_phci = "phci";
const char	*mdi_component_prop_client = "client";

/*
 * Name of the property carrying an MDI client's global unique identifier
 */
const char	*mdi_client_guid_prop = "client-guid";

/*
 * Name of the MDI client load balancing property and the values it may take
 */
const char	*mdi_load_balance = "load-balance";
const char	*mdi_load_balance_none = "none";
const char	*mdi_load_balance_rr = "round-robin";
const char	*mdi_load_balance_lba = "logical-block";
1957c478bd9Sstevel@tonic-gate 
1967c478bd9Sstevel@tonic-gate /*
1977c478bd9Sstevel@tonic-gate  * Obsolete vHCI class definition; to be removed after Leadville update
1987c478bd9Sstevel@tonic-gate  */
1997c478bd9Sstevel@tonic-gate const char *mdi_vhci_class_scsi = MDI_HCI_CLASS_SCSI;
2007c478bd9Sstevel@tonic-gate 
2017c478bd9Sstevel@tonic-gate static char vhci_greeting[] =
2027c478bd9Sstevel@tonic-gate 	"\tThere already exists one vHCI driver for class %s\n"
2037c478bd9Sstevel@tonic-gate 	"\tOnly one vHCI driver for each class is allowed\n";
2047c478bd9Sstevel@tonic-gate 
2057c478bd9Sstevel@tonic-gate /*
2067c478bd9Sstevel@tonic-gate  * Static function prototypes
2077c478bd9Sstevel@tonic-gate  */
2087c478bd9Sstevel@tonic-gate static int		i_mdi_phci_offline(dev_info_t *, uint_t);
2097c478bd9Sstevel@tonic-gate static int		i_mdi_client_offline(dev_info_t *, uint_t);
2107c478bd9Sstevel@tonic-gate static int		i_mdi_phci_pre_detach(dev_info_t *, ddi_detach_cmd_t);
2117c478bd9Sstevel@tonic-gate static void		i_mdi_phci_post_detach(dev_info_t *,
2127c478bd9Sstevel@tonic-gate 			    ddi_detach_cmd_t, int);
2137c478bd9Sstevel@tonic-gate static int		i_mdi_client_pre_detach(dev_info_t *,
2147c478bd9Sstevel@tonic-gate 			    ddi_detach_cmd_t);
2157c478bd9Sstevel@tonic-gate static void		i_mdi_client_post_detach(dev_info_t *,
2167c478bd9Sstevel@tonic-gate 			    ddi_detach_cmd_t, int);
2177c478bd9Sstevel@tonic-gate static void		i_mdi_pm_hold_pip(mdi_pathinfo_t *);
2187c478bd9Sstevel@tonic-gate static void		i_mdi_pm_rele_pip(mdi_pathinfo_t *);
2197c478bd9Sstevel@tonic-gate static int 		i_mdi_lba_lb(mdi_client_t *ct,
2207c478bd9Sstevel@tonic-gate 			    mdi_pathinfo_t **ret_pip, struct buf *buf);
2217c478bd9Sstevel@tonic-gate static void		i_mdi_pm_hold_client(mdi_client_t *, int);
2227c478bd9Sstevel@tonic-gate static void		i_mdi_pm_rele_client(mdi_client_t *, int);
2237c478bd9Sstevel@tonic-gate static void		i_mdi_pm_reset_client(mdi_client_t *);
2247c478bd9Sstevel@tonic-gate static int		i_mdi_power_all_phci(mdi_client_t *);
2258c4f8890Srs135747 static void		i_mdi_log_sysevent(dev_info_t *, char *, char *);
2267c478bd9Sstevel@tonic-gate 
2277c478bd9Sstevel@tonic-gate 
2287c478bd9Sstevel@tonic-gate /*
2297c478bd9Sstevel@tonic-gate  * Internal mdi_pathinfo node functions
2307c478bd9Sstevel@tonic-gate  */
2317c478bd9Sstevel@tonic-gate static void		i_mdi_pi_kstat_destroy(mdi_pathinfo_t *);
2327c478bd9Sstevel@tonic-gate 
2337c478bd9Sstevel@tonic-gate static mdi_vhci_t	*i_mdi_vhci_class2vhci(char *);
2347c478bd9Sstevel@tonic-gate static mdi_vhci_t	*i_devi_get_vhci(dev_info_t *);
2357c478bd9Sstevel@tonic-gate static mdi_phci_t	*i_devi_get_phci(dev_info_t *);
2367c478bd9Sstevel@tonic-gate static void		i_mdi_phci_lock(mdi_phci_t *, mdi_pathinfo_t *);
2377c478bd9Sstevel@tonic-gate static void		i_mdi_phci_unlock(mdi_phci_t *);
2383c34adc5Sramat static mdi_pathinfo_t	*i_mdi_pi_alloc(mdi_phci_t *, char *, mdi_client_t *);
2397c478bd9Sstevel@tonic-gate static void		i_mdi_phci_add_path(mdi_phci_t *, mdi_pathinfo_t *);
2407c478bd9Sstevel@tonic-gate static void		i_mdi_client_add_path(mdi_client_t *, mdi_pathinfo_t *);
2417c478bd9Sstevel@tonic-gate static void		i_mdi_pi_free(mdi_phci_t *ph, mdi_pathinfo_t *,
2427c478bd9Sstevel@tonic-gate 			    mdi_client_t *);
2437c478bd9Sstevel@tonic-gate static void		i_mdi_phci_remove_path(mdi_phci_t *, mdi_pathinfo_t *);
2447c478bd9Sstevel@tonic-gate static void		i_mdi_client_remove_path(mdi_client_t *,
2457c478bd9Sstevel@tonic-gate 			    mdi_pathinfo_t *);
2467c478bd9Sstevel@tonic-gate 
2477c478bd9Sstevel@tonic-gate static int		i_mdi_pi_state_change(mdi_pathinfo_t *,
2487c478bd9Sstevel@tonic-gate 			    mdi_pathinfo_state_t, int);
2497c478bd9Sstevel@tonic-gate static int		i_mdi_pi_offline(mdi_pathinfo_t *, int);
2507c478bd9Sstevel@tonic-gate static dev_info_t	*i_mdi_devinfo_create(mdi_vhci_t *, char *, char *,
2513c34adc5Sramat 			    char **, int);
2527c478bd9Sstevel@tonic-gate static dev_info_t	*i_mdi_devinfo_find(mdi_vhci_t *, char *, char *);
2537c478bd9Sstevel@tonic-gate static int		i_mdi_devinfo_remove(dev_info_t *, dev_info_t *, int);
2547c478bd9Sstevel@tonic-gate static int		i_mdi_is_child_present(dev_info_t *, dev_info_t *);
2553c34adc5Sramat static mdi_client_t	*i_mdi_client_alloc(mdi_vhci_t *, char *, char *);
2567c478bd9Sstevel@tonic-gate static void		i_mdi_client_enlist_table(mdi_vhci_t *, mdi_client_t *);
2577c478bd9Sstevel@tonic-gate static void		i_mdi_client_delist_table(mdi_vhci_t *, mdi_client_t *);
2583c34adc5Sramat static mdi_client_t	*i_mdi_client_find(mdi_vhci_t *, char *, char *);
2597c478bd9Sstevel@tonic-gate static void		i_mdi_client_update_state(mdi_client_t *);
2607c478bd9Sstevel@tonic-gate static int		i_mdi_client_compute_state(mdi_client_t *,
2617c478bd9Sstevel@tonic-gate 			    mdi_phci_t *);
2627c478bd9Sstevel@tonic-gate static void		i_mdi_client_lock(mdi_client_t *, mdi_pathinfo_t *);
2637c478bd9Sstevel@tonic-gate static void		i_mdi_client_unlock(mdi_client_t *);
2647c478bd9Sstevel@tonic-gate static int		i_mdi_client_free(mdi_vhci_t *, mdi_client_t *);
2657c478bd9Sstevel@tonic-gate static mdi_client_t	*i_devi_get_client(dev_info_t *);
266ee28b439Scm136836 /*
267ee28b439Scm136836  * NOTE: this will be removed once the NWS files are changed to use the new
268ee28b439Scm136836  * mdi_{enable,disable}_path interfaces
269ee28b439Scm136836  */
270ee28b439Scm136836 static int		i_mdi_pi_enable_disable(dev_info_t *, dev_info_t *,
271ee28b439Scm136836 				int, int);
272ee28b439Scm136836 static mdi_pathinfo_t 	*i_mdi_enable_disable_path(mdi_pathinfo_t *pip,
273ee28b439Scm136836 				mdi_vhci_t *vh, int flags, int op);
2747c478bd9Sstevel@tonic-gate /*
2757c478bd9Sstevel@tonic-gate  * Failover related function prototypes
2767c478bd9Sstevel@tonic-gate  */
2777c478bd9Sstevel@tonic-gate static int		i_mdi_failover(void *);
2787c478bd9Sstevel@tonic-gate 
2797c478bd9Sstevel@tonic-gate /*
2807c478bd9Sstevel@tonic-gate  * misc internal functions
2817c478bd9Sstevel@tonic-gate  */
2827c478bd9Sstevel@tonic-gate static int		i_mdi_get_hash_key(char *);
2837c478bd9Sstevel@tonic-gate static int		i_map_nvlist_error_to_mdi(int);
2847c478bd9Sstevel@tonic-gate static void		i_mdi_report_path_state(mdi_client_t *,
2857c478bd9Sstevel@tonic-gate 			    mdi_pathinfo_t *);
2867c478bd9Sstevel@tonic-gate 
2873c34adc5Sramat static void		setup_vhci_cache(mdi_vhci_t *);
2883c34adc5Sramat static int		destroy_vhci_cache(mdi_vhci_t *);
2893c34adc5Sramat static int		stop_vhcache_async_threads(mdi_vhci_config_t *);
2903c34adc5Sramat static boolean_t	stop_vhcache_flush_thread(void *, int);
2913c34adc5Sramat static void		free_string_array(char **, int);
2923c34adc5Sramat static void		free_vhcache_phci(mdi_vhcache_phci_t *);
2933c34adc5Sramat static void		free_vhcache_pathinfo(mdi_vhcache_pathinfo_t *);
2943c34adc5Sramat static void		free_vhcache_client(mdi_vhcache_client_t *);
2953c34adc5Sramat static int		mainnvl_to_vhcache(mdi_vhci_cache_t *, nvlist_t *);
2963c34adc5Sramat static nvlist_t		*vhcache_to_mainnvl(mdi_vhci_cache_t *);
2973c34adc5Sramat static void		vhcache_phci_add(mdi_vhci_config_t *, mdi_phci_t *);
2983c34adc5Sramat static void		vhcache_phci_remove(mdi_vhci_config_t *, mdi_phci_t *);
2993c34adc5Sramat static void		vhcache_pi_add(mdi_vhci_config_t *,
3003c34adc5Sramat 			    struct mdi_pathinfo *);
3013c34adc5Sramat static void		vhcache_pi_remove(mdi_vhci_config_t *,
3023c34adc5Sramat 			    struct mdi_pathinfo *);
3033c34adc5Sramat static void		free_phclient_path_list(mdi_phys_path_t *);
3043c34adc5Sramat static void		sort_vhcache_paths(mdi_vhcache_client_t *);
3053c34adc5Sramat static int		flush_vhcache(mdi_vhci_config_t *, int);
3063c34adc5Sramat static void		vhcache_dirty(mdi_vhci_config_t *);
3073c34adc5Sramat static void		free_async_client_config(mdi_async_client_config_t *);
30867e56d35Sramat static void		single_threaded_vhconfig_enter(mdi_vhci_config_t *);
30967e56d35Sramat static void		single_threaded_vhconfig_exit(mdi_vhci_config_t *);
3103c34adc5Sramat static nvlist_t		*read_on_disk_vhci_cache(char *);
3113c34adc5Sramat extern int		fread_nvlist(char *, nvlist_t **);
3123c34adc5Sramat extern int		fwrite_nvlist(char *, nvlist_t *);
3133c34adc5Sramat 
3147c478bd9Sstevel@tonic-gate /* called once when first vhci registers with mdi */
3157c478bd9Sstevel@tonic-gate static void
3167c478bd9Sstevel@tonic-gate i_mdi_init()
3177c478bd9Sstevel@tonic-gate {
3187c478bd9Sstevel@tonic-gate 	static int initialized = 0;
3197c478bd9Sstevel@tonic-gate 
3207c478bd9Sstevel@tonic-gate 	if (initialized)
3217c478bd9Sstevel@tonic-gate 		return;
3227c478bd9Sstevel@tonic-gate 	initialized = 1;
3237c478bd9Sstevel@tonic-gate 
3247c478bd9Sstevel@tonic-gate 	mutex_init(&mdi_mutex, NULL, MUTEX_DEFAULT, NULL);
325602ca9eaScth 
326602ca9eaScth 	/* Create our taskq resources */
3277c478bd9Sstevel@tonic-gate 	mdi_taskq = taskq_create("mdi_taskq", mdi_taskq_n_threads,
3287c478bd9Sstevel@tonic-gate 	    MDI_TASKQ_PRI, MDI_TASKQ_MINALLOC, MDI_TASKQ_MAXALLOC,
3297c478bd9Sstevel@tonic-gate 	    TASKQ_PREPOPULATE | TASKQ_CPR_SAFE);
3307c478bd9Sstevel@tonic-gate 	ASSERT(mdi_taskq != NULL);	/* taskq_create never fails */
331602ca9eaScth 
332602ca9eaScth 	/* Allocate ['path_instance' <-> "path"] maps */
333602ca9eaScth 	mutex_init(&mdi_pathmap_mutex, NULL, MUTEX_DRIVER, NULL);
334602ca9eaScth 	mdi_pathmap_bypath = mod_hash_create_strhash(
335602ca9eaScth 	    "mdi_pathmap_bypath", mdi_pathmap_hash_size,
336602ca9eaScth 	    mod_hash_null_valdtor);
337602ca9eaScth 	mdi_pathmap_byinstance = mod_hash_create_idhash(
338602ca9eaScth 	    "mdi_pathmap_byinstance", mdi_pathmap_hash_size,
339602ca9eaScth 	    mod_hash_null_valdtor);
3404c06356bSdh142964 	mdi_pathmap_sbyinstance = mod_hash_create_idhash(
3414c06356bSdh142964 	    "mdi_pathmap_sbyinstance", mdi_pathmap_hash_size,
3424c06356bSdh142964 	    mod_hash_null_valdtor);
3437c478bd9Sstevel@tonic-gate }
3447c478bd9Sstevel@tonic-gate 
3457c478bd9Sstevel@tonic-gate /*
3467c478bd9Sstevel@tonic-gate  * mdi_get_component_type():
3477c478bd9Sstevel@tonic-gate  *		Return mpxio component type
3487c478bd9Sstevel@tonic-gate  * Return Values:
3497c478bd9Sstevel@tonic-gate  *		MDI_COMPONENT_NONE
3507c478bd9Sstevel@tonic-gate  *		MDI_COMPONENT_VHCI
3517c478bd9Sstevel@tonic-gate  *		MDI_COMPONENT_PHCI
3527c478bd9Sstevel@tonic-gate  *		MDI_COMPONENT_CLIENT
3537c478bd9Sstevel@tonic-gate  * XXX This doesn't work under multi-level MPxIO and should be
3545e3986cbScth  *	removed when clients migrate mdi_component_is_*() interfaces.
3557c478bd9Sstevel@tonic-gate  */
3567c478bd9Sstevel@tonic-gate int
3577c478bd9Sstevel@tonic-gate mdi_get_component_type(dev_info_t *dip)
3587c478bd9Sstevel@tonic-gate {
3597c478bd9Sstevel@tonic-gate 	return (DEVI(dip)->devi_mdi_component);
3607c478bd9Sstevel@tonic-gate }
3617c478bd9Sstevel@tonic-gate 
3627c478bd9Sstevel@tonic-gate /*
3637c478bd9Sstevel@tonic-gate  * mdi_vhci_register():
3647c478bd9Sstevel@tonic-gate  *		Register a vHCI module with the mpxio framework
3657c478bd9Sstevel@tonic-gate  *		mdi_vhci_register() is called by vHCI drivers to register the
3667c478bd9Sstevel@tonic-gate  *		'class_driver' vHCI driver and its MDI entrypoints with the
3677c478bd9Sstevel@tonic-gate  *		mpxio framework.  The vHCI driver must call this interface as
3687c478bd9Sstevel@tonic-gate  *		part of its attach(9e) handler.
3697c478bd9Sstevel@tonic-gate  *		Competing threads may try to attach mdi_vhci_register() as
3707c478bd9Sstevel@tonic-gate  *		the vHCI drivers are loaded and attached as a result of pHCI
3717c478bd9Sstevel@tonic-gate  *		driver instance registration (mdi_phci_register()) with the
3727c478bd9Sstevel@tonic-gate  *		framework.
3737c478bd9Sstevel@tonic-gate  * Return Values:
3747c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
3757c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
3767c478bd9Sstevel@tonic-gate  */
3777c478bd9Sstevel@tonic-gate /*ARGSUSED*/
3787c478bd9Sstevel@tonic-gate int
3797c478bd9Sstevel@tonic-gate mdi_vhci_register(char *class, dev_info_t *vdip, mdi_vhci_ops_t *vops,
3807c478bd9Sstevel@tonic-gate     int flags)
3817c478bd9Sstevel@tonic-gate {
3827c478bd9Sstevel@tonic-gate 	mdi_vhci_t		*vh = NULL;
3837c478bd9Sstevel@tonic-gate 
38455e592a2SRandall Ralphs 	/* Registrant can't be older */
38555e592a2SRandall Ralphs 	ASSERT(vops->vo_revision <= MDI_VHCI_OPS_REV);
38655e592a2SRandall Ralphs 
38700a3eaf3SRamaswamy Tummala #ifdef DEBUG
38800a3eaf3SRamaswamy Tummala 	/*
38900a3eaf3SRamaswamy Tummala 	 * IB nexus driver is loaded only when IB hardware is present.
39000a3eaf3SRamaswamy Tummala 	 * In order to be able to do this there is a need to drive the loading
39100a3eaf3SRamaswamy Tummala 	 * and attaching of the IB nexus driver (especially when an IB hardware
39200a3eaf3SRamaswamy Tummala 	 * is dynamically plugged in) when an IB HCA driver (PHCI)
39300a3eaf3SRamaswamy Tummala 	 * is being attached. Unfortunately this gets into the limitations
39400a3eaf3SRamaswamy Tummala 	 * of devfs as there seems to be no clean way to drive configuration
39500a3eaf3SRamaswamy Tummala 	 * of a subtree from another subtree of a devfs. Hence, do not ASSERT
39600a3eaf3SRamaswamy Tummala 	 * for IB.
39700a3eaf3SRamaswamy Tummala 	 */
39800a3eaf3SRamaswamy Tummala 	if (strcmp(class, MDI_HCI_CLASS_IB) != 0)
3995e3986cbScth 		ASSERT(DEVI_BUSY_OWNED(ddi_get_parent(vdip)));
40000a3eaf3SRamaswamy Tummala #endif
4017c478bd9Sstevel@tonic-gate 
4027c478bd9Sstevel@tonic-gate 	i_mdi_init();
4037c478bd9Sstevel@tonic-gate 
4047c478bd9Sstevel@tonic-gate 	mutex_enter(&mdi_mutex);
4057c478bd9Sstevel@tonic-gate 	/*
4067c478bd9Sstevel@tonic-gate 	 * Scan for already registered vhci
4077c478bd9Sstevel@tonic-gate 	 */
4087c478bd9Sstevel@tonic-gate 	for (vh = mdi_vhci_head; vh != NULL; vh = vh->vh_next) {
4097c478bd9Sstevel@tonic-gate 		if (strcmp(vh->vh_class, class) == 0) {
4107c478bd9Sstevel@tonic-gate 			/*
4117c478bd9Sstevel@tonic-gate 			 * vHCI has already been created.  Check for valid
4127c478bd9Sstevel@tonic-gate 			 * vHCI ops registration.  We only support one vHCI
4137c478bd9Sstevel@tonic-gate 			 * module per class
4147c478bd9Sstevel@tonic-gate 			 */
4157c478bd9Sstevel@tonic-gate 			if (vh->vh_ops != NULL) {
4167c478bd9Sstevel@tonic-gate 				mutex_exit(&mdi_mutex);
4177c478bd9Sstevel@tonic-gate 				cmn_err(CE_NOTE, vhci_greeting, class);
4187c478bd9Sstevel@tonic-gate 				return (MDI_FAILURE);
4197c478bd9Sstevel@tonic-gate 			}
4207c478bd9Sstevel@tonic-gate 			break;
4217c478bd9Sstevel@tonic-gate 		}
4227c478bd9Sstevel@tonic-gate 	}
4237c478bd9Sstevel@tonic-gate 
4247c478bd9Sstevel@tonic-gate 	/*
4257c478bd9Sstevel@tonic-gate 	 * if not yet created, create the vHCI component
4267c478bd9Sstevel@tonic-gate 	 */
4277c478bd9Sstevel@tonic-gate 	if (vh == NULL) {
4287c478bd9Sstevel@tonic-gate 		struct client_hash	*hash = NULL;
4297c478bd9Sstevel@tonic-gate 		char			*load_balance;
4307c478bd9Sstevel@tonic-gate 
4317c478bd9Sstevel@tonic-gate 		/*
4327c478bd9Sstevel@tonic-gate 		 * Allocate and initialize the mdi extensions
4337c478bd9Sstevel@tonic-gate 		 */
4347c478bd9Sstevel@tonic-gate 		vh = kmem_zalloc(sizeof (mdi_vhci_t), KM_SLEEP);
4357c478bd9Sstevel@tonic-gate 		hash = kmem_zalloc(mdi_client_table_size * sizeof (*hash),
4367c478bd9Sstevel@tonic-gate 		    KM_SLEEP);
4377c478bd9Sstevel@tonic-gate 		vh->vh_client_table = hash;
4387c478bd9Sstevel@tonic-gate 		vh->vh_class = kmem_zalloc(strlen(class) + 1, KM_SLEEP);
4397c478bd9Sstevel@tonic-gate 		(void) strcpy(vh->vh_class, class);
4407c478bd9Sstevel@tonic-gate 		vh->vh_lb = LOAD_BALANCE_RR;
4417c478bd9Sstevel@tonic-gate 		if (ddi_prop_lookup_string(DDI_DEV_T_ANY, vdip,
4427c478bd9Sstevel@tonic-gate 		    0, LOAD_BALANCE_PROP, &load_balance) == DDI_SUCCESS) {
4437c478bd9Sstevel@tonic-gate 			if (strcmp(load_balance, LOAD_BALANCE_PROP_NONE) == 0) {
4447c478bd9Sstevel@tonic-gate 				vh->vh_lb = LOAD_BALANCE_NONE;
4457c478bd9Sstevel@tonic-gate 			} else if (strcmp(load_balance, LOAD_BALANCE_PROP_LBA)
4467c478bd9Sstevel@tonic-gate 				    == 0) {
4477c478bd9Sstevel@tonic-gate 				vh->vh_lb = LOAD_BALANCE_LBA;
4487c478bd9Sstevel@tonic-gate 			}
4497c478bd9Sstevel@tonic-gate 			ddi_prop_free(load_balance);
4507c478bd9Sstevel@tonic-gate 		}
4517c478bd9Sstevel@tonic-gate 
4525e3986cbScth 		mutex_init(&vh->vh_phci_mutex, NULL, MUTEX_DEFAULT, NULL);
4535e3986cbScth 		mutex_init(&vh->vh_client_mutex, NULL, MUTEX_DEFAULT, NULL);
4545e3986cbScth 
4557c478bd9Sstevel@tonic-gate 		/*
4567c478bd9Sstevel@tonic-gate 		 * Store the vHCI ops vectors
4577c478bd9Sstevel@tonic-gate 		 */
4587c478bd9Sstevel@tonic-gate 		vh->vh_dip = vdip;
4597c478bd9Sstevel@tonic-gate 		vh->vh_ops = vops;
4607c478bd9Sstevel@tonic-gate 
4613c34adc5Sramat 		setup_vhci_cache(vh);
4627c478bd9Sstevel@tonic-gate 
4637c478bd9Sstevel@tonic-gate 		if (mdi_vhci_head == NULL) {
4647c478bd9Sstevel@tonic-gate 			mdi_vhci_head = vh;
4657c478bd9Sstevel@tonic-gate 		}
4667c478bd9Sstevel@tonic-gate 		if (mdi_vhci_tail) {
4677c478bd9Sstevel@tonic-gate 			mdi_vhci_tail->vh_next = vh;
4687c478bd9Sstevel@tonic-gate 		}
4697c478bd9Sstevel@tonic-gate 		mdi_vhci_tail = vh;
4707c478bd9Sstevel@tonic-gate 		mdi_vhci_count++;
4717c478bd9Sstevel@tonic-gate 	}
4727c478bd9Sstevel@tonic-gate 
4737c478bd9Sstevel@tonic-gate 	/*
4747c478bd9Sstevel@tonic-gate 	 * Claim the devfs node as a vhci component
4757c478bd9Sstevel@tonic-gate 	 */
4767c478bd9Sstevel@tonic-gate 	DEVI(vdip)->devi_mdi_component |= MDI_COMPONENT_VHCI;
4777c478bd9Sstevel@tonic-gate 
4787c478bd9Sstevel@tonic-gate 	/*
4797c478bd9Sstevel@tonic-gate 	 * Initialize our back reference from dev_info node
4807c478bd9Sstevel@tonic-gate 	 */
4817c478bd9Sstevel@tonic-gate 	DEVI(vdip)->devi_mdi_xhci = (caddr_t)vh;
4827c478bd9Sstevel@tonic-gate 	mutex_exit(&mdi_mutex);
4837c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
4847c478bd9Sstevel@tonic-gate }
4857c478bd9Sstevel@tonic-gate 
4867c478bd9Sstevel@tonic-gate /*
4877c478bd9Sstevel@tonic-gate  * mdi_vhci_unregister():
4887c478bd9Sstevel@tonic-gate  *		Unregister a vHCI module from mpxio framework
4897c478bd9Sstevel@tonic-gate  *		mdi_vhci_unregister() is called from the detach(9E) entrypoint
4907c478bd9Sstevel@tonic-gate  * 		of a vhci to unregister it from the framework.
4917c478bd9Sstevel@tonic-gate  * Return Values:
4927c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
4937c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
4947c478bd9Sstevel@tonic-gate  */
4957c478bd9Sstevel@tonic-gate /*ARGSUSED*/
4967c478bd9Sstevel@tonic-gate int
4977c478bd9Sstevel@tonic-gate mdi_vhci_unregister(dev_info_t *vdip, int flags)
4987c478bd9Sstevel@tonic-gate {
4997c478bd9Sstevel@tonic-gate 	mdi_vhci_t	*found, *vh, *prev = NULL;
5007c478bd9Sstevel@tonic-gate 
5015e3986cbScth 	ASSERT(DEVI_BUSY_OWNED(ddi_get_parent(vdip)));
5025e3986cbScth 
5037c478bd9Sstevel@tonic-gate 	/*
5047c478bd9Sstevel@tonic-gate 	 * Check for invalid VHCI
5057c478bd9Sstevel@tonic-gate 	 */
5067c478bd9Sstevel@tonic-gate 	if ((vh = i_devi_get_vhci(vdip)) == NULL)
5077c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
5087c478bd9Sstevel@tonic-gate 
5097c478bd9Sstevel@tonic-gate 	/*
5107c478bd9Sstevel@tonic-gate 	 * Scan the list of registered vHCIs for a match
5117c478bd9Sstevel@tonic-gate 	 */
5125e3986cbScth 	mutex_enter(&mdi_mutex);
5137c478bd9Sstevel@tonic-gate 	for (found = mdi_vhci_head; found != NULL; found = found->vh_next) {
5147c478bd9Sstevel@tonic-gate 		if (found == vh)
5157c478bd9Sstevel@tonic-gate 			break;
5167c478bd9Sstevel@tonic-gate 		prev = found;
5177c478bd9Sstevel@tonic-gate 	}
5187c478bd9Sstevel@tonic-gate 
5197c478bd9Sstevel@tonic-gate 	if (found == NULL) {
5207c478bd9Sstevel@tonic-gate 		mutex_exit(&mdi_mutex);
5217c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
5227c478bd9Sstevel@tonic-gate 	}
5237c478bd9Sstevel@tonic-gate 
5247c478bd9Sstevel@tonic-gate 	/*
5258c4f8890Srs135747 	 * Check the vHCI, pHCI and client count. All the pHCIs and clients
5267c478bd9Sstevel@tonic-gate 	 * should have been unregistered, before a vHCI can be
5277c478bd9Sstevel@tonic-gate 	 * unregistered.
5287c478bd9Sstevel@tonic-gate 	 */
5295e3986cbScth 	MDI_VHCI_PHCI_LOCK(vh);
5305e3986cbScth 	if (vh->vh_refcnt || vh->vh_phci_count || vh->vh_client_count) {
5315e3986cbScth 		MDI_VHCI_PHCI_UNLOCK(vh);
5325e3986cbScth 		mutex_exit(&mdi_mutex);
5335e3986cbScth 		return (MDI_FAILURE);
5345e3986cbScth 	}
5355e3986cbScth 	MDI_VHCI_PHCI_UNLOCK(vh);
5365e3986cbScth 
5375e3986cbScth 	if (destroy_vhci_cache(vh) != MDI_SUCCESS) {
5387c478bd9Sstevel@tonic-gate 		mutex_exit(&mdi_mutex);
5397c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
5407c478bd9Sstevel@tonic-gate 	}
5417c478bd9Sstevel@tonic-gate 
5427c478bd9Sstevel@tonic-gate 	/*
5437c478bd9Sstevel@tonic-gate 	 * Remove the vHCI from the global list
5447c478bd9Sstevel@tonic-gate 	 */
5457c478bd9Sstevel@tonic-gate 	if (vh == mdi_vhci_head) {
5467c478bd9Sstevel@tonic-gate 		mdi_vhci_head = vh->vh_next;
5477c478bd9Sstevel@tonic-gate 	} else {
5487c478bd9Sstevel@tonic-gate 		prev->vh_next = vh->vh_next;
5497c478bd9Sstevel@tonic-gate 	}
5507c478bd9Sstevel@tonic-gate 	if (vh == mdi_vhci_tail) {
5517c478bd9Sstevel@tonic-gate 		mdi_vhci_tail = prev;
5527c478bd9Sstevel@tonic-gate 	}
5537c478bd9Sstevel@tonic-gate 	mdi_vhci_count--;
5547c478bd9Sstevel@tonic-gate 	mutex_exit(&mdi_mutex);
5553c34adc5Sramat 
5563c34adc5Sramat 	vh->vh_ops = NULL;
5577c478bd9Sstevel@tonic-gate 	DEVI(vdip)->devi_mdi_component &= ~MDI_COMPONENT_VHCI;
5587c478bd9Sstevel@tonic-gate 	DEVI(vdip)->devi_mdi_xhci = NULL;
5597c478bd9Sstevel@tonic-gate 	kmem_free(vh->vh_class, strlen(vh->vh_class)+1);
5607c478bd9Sstevel@tonic-gate 	kmem_free(vh->vh_client_table,
5617c478bd9Sstevel@tonic-gate 	    mdi_client_table_size * sizeof (struct client_hash));
5625e3986cbScth 	mutex_destroy(&vh->vh_phci_mutex);
5635e3986cbScth 	mutex_destroy(&vh->vh_client_mutex);
56478dc6db2Sllai1 
5657c478bd9Sstevel@tonic-gate 	kmem_free(vh, sizeof (mdi_vhci_t));
5667c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
5677c478bd9Sstevel@tonic-gate }
5687c478bd9Sstevel@tonic-gate 
5697c478bd9Sstevel@tonic-gate /*
5707c478bd9Sstevel@tonic-gate  * i_mdi_vhci_class2vhci():
5717c478bd9Sstevel@tonic-gate  *		Look for a matching vHCI module given a vHCI class name
5727c478bd9Sstevel@tonic-gate  * Return Values:
5737c478bd9Sstevel@tonic-gate  *		Handle to a vHCI component
5747c478bd9Sstevel@tonic-gate  *		NULL
5757c478bd9Sstevel@tonic-gate  */
5767c478bd9Sstevel@tonic-gate static mdi_vhci_t *
5777c478bd9Sstevel@tonic-gate i_mdi_vhci_class2vhci(char *class)
5787c478bd9Sstevel@tonic-gate {
5797c478bd9Sstevel@tonic-gate 	mdi_vhci_t	*vh = NULL;
5807c478bd9Sstevel@tonic-gate 
5817c478bd9Sstevel@tonic-gate 	ASSERT(!MUTEX_HELD(&mdi_mutex));
5827c478bd9Sstevel@tonic-gate 
5837c478bd9Sstevel@tonic-gate 	mutex_enter(&mdi_mutex);
5847c478bd9Sstevel@tonic-gate 	for (vh = mdi_vhci_head; vh != NULL; vh = vh->vh_next) {
5857c478bd9Sstevel@tonic-gate 		if (strcmp(vh->vh_class, class) == 0) {
5867c478bd9Sstevel@tonic-gate 			break;
5877c478bd9Sstevel@tonic-gate 		}
5887c478bd9Sstevel@tonic-gate 	}
5897c478bd9Sstevel@tonic-gate 	mutex_exit(&mdi_mutex);
5907c478bd9Sstevel@tonic-gate 	return (vh);
5917c478bd9Sstevel@tonic-gate }
5927c478bd9Sstevel@tonic-gate 
5937c478bd9Sstevel@tonic-gate /*
5947c478bd9Sstevel@tonic-gate  * i_devi_get_vhci():
5957c478bd9Sstevel@tonic-gate  *		Utility function to get the handle to a vHCI component
5967c478bd9Sstevel@tonic-gate  * Return Values:
5977c478bd9Sstevel@tonic-gate  *		Handle to a vHCI component
5987c478bd9Sstevel@tonic-gate  *		NULL
5997c478bd9Sstevel@tonic-gate  */
6007c478bd9Sstevel@tonic-gate mdi_vhci_t *
6017c478bd9Sstevel@tonic-gate i_devi_get_vhci(dev_info_t *vdip)
6027c478bd9Sstevel@tonic-gate {
6037c478bd9Sstevel@tonic-gate 	mdi_vhci_t	*vh = NULL;
6047c478bd9Sstevel@tonic-gate 	if (MDI_VHCI(vdip)) {
6057c478bd9Sstevel@tonic-gate 		vh = (mdi_vhci_t *)DEVI(vdip)->devi_mdi_xhci;
6067c478bd9Sstevel@tonic-gate 	}
6077c478bd9Sstevel@tonic-gate 	return (vh);
6087c478bd9Sstevel@tonic-gate }
6097c478bd9Sstevel@tonic-gate 
6107c478bd9Sstevel@tonic-gate /*
6117c478bd9Sstevel@tonic-gate  * mdi_phci_register():
6127c478bd9Sstevel@tonic-gate  *		Register a pHCI module with mpxio framework
6137c478bd9Sstevel@tonic-gate  *		mdi_phci_register() is called by pHCI drivers to register with
6147c478bd9Sstevel@tonic-gate  *		the mpxio framework and a specific 'class_driver' vHCI.  The
6157c478bd9Sstevel@tonic-gate  *		pHCI driver must call this interface as part of its attach(9e)
6167c478bd9Sstevel@tonic-gate  *		handler.
6177c478bd9Sstevel@tonic-gate  * Return Values:
6187c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
6197c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
6207c478bd9Sstevel@tonic-gate  */
6217c478bd9Sstevel@tonic-gate /*ARGSUSED*/
6227c478bd9Sstevel@tonic-gate int
6237c478bd9Sstevel@tonic-gate mdi_phci_register(char *class, dev_info_t *pdip, int flags)
6247c478bd9Sstevel@tonic-gate {
6257c478bd9Sstevel@tonic-gate 	mdi_phci_t		*ph;
6267c478bd9Sstevel@tonic-gate 	mdi_vhci_t		*vh;
6277c478bd9Sstevel@tonic-gate 	char			*data;
6287c478bd9Sstevel@tonic-gate 
6295e3986cbScth 	/*
6305e3986cbScth 	 * Some subsystems, like fcp, perform pHCI registration from a
6315e3986cbScth 	 * different thread than the one doing the pHCI attach(9E) - the
6325e3986cbScth 	 * driver attach code is waiting for this other thread to complete.
6335e3986cbScth 	 * This means we can only ASSERT DEVI_BUSY_CHANGING of parent
6345e3986cbScth 	 * (indicating that some thread has done an ndi_devi_enter of parent)
6355e3986cbScth 	 * not DEVI_BUSY_OWNED (which would indicate that we did the enter).
6365e3986cbScth 	 */
6375e3986cbScth 	ASSERT(DEVI_BUSY_CHANGING(ddi_get_parent(pdip)));
6385e3986cbScth 
6397c478bd9Sstevel@tonic-gate 	/*
6407c478bd9Sstevel@tonic-gate 	 * Check for mpxio-disable property. Enable mpxio if the property is
6417c478bd9Sstevel@tonic-gate 	 * missing or not set to "yes".
6427c478bd9Sstevel@tonic-gate 	 * If the property is set to "yes" then emit a brief message.
6437c478bd9Sstevel@tonic-gate 	 */
6447c478bd9Sstevel@tonic-gate 	if ((ddi_prop_lookup_string(DDI_DEV_T_ANY, pdip, 0, "mpxio-disable",
6457c478bd9Sstevel@tonic-gate 	    &data) == DDI_SUCCESS)) {
6467c478bd9Sstevel@tonic-gate 		if (strcmp(data, "yes") == 0) {
6474c06356bSdh142964 			MDI_DEBUG(1, (MDI_CONT, pdip,
6484c06356bSdh142964 			    "?multipath capabilities disabled via %s.conf.",
6497c478bd9Sstevel@tonic-gate 			    ddi_driver_name(pdip)));
6507c478bd9Sstevel@tonic-gate 			ddi_prop_free(data);
6517c478bd9Sstevel@tonic-gate 			return (MDI_FAILURE);
6527c478bd9Sstevel@tonic-gate 		}
6537c478bd9Sstevel@tonic-gate 		ddi_prop_free(data);
6547c478bd9Sstevel@tonic-gate 	}
6557c478bd9Sstevel@tonic-gate 
6567c478bd9Sstevel@tonic-gate 	/*
6577c478bd9Sstevel@tonic-gate 	 * Search for a matching vHCI
6587c478bd9Sstevel@tonic-gate 	 */
6597c478bd9Sstevel@tonic-gate 	vh = (mdi_vhci_t *)i_mdi_vhci_class2vhci(class);
6607c478bd9Sstevel@tonic-gate 	if (vh == NULL) {
6617c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
6627c478bd9Sstevel@tonic-gate 	}
6637c478bd9Sstevel@tonic-gate 
6647c478bd9Sstevel@tonic-gate 	ph = kmem_zalloc(sizeof (mdi_phci_t), KM_SLEEP);
6657c478bd9Sstevel@tonic-gate 	mutex_init(&ph->ph_mutex, NULL, MUTEX_DEFAULT, NULL);
6667c478bd9Sstevel@tonic-gate 	ph->ph_dip = pdip;
6677c478bd9Sstevel@tonic-gate 	ph->ph_vhci = vh;
6687c478bd9Sstevel@tonic-gate 	ph->ph_next = NULL;
6697c478bd9Sstevel@tonic-gate 	ph->ph_unstable = 0;
6707c478bd9Sstevel@tonic-gate 	ph->ph_vprivate = 0;
6717c478bd9Sstevel@tonic-gate 	cv_init(&ph->ph_unstable_cv, NULL, CV_DRIVER, NULL);
6727c478bd9Sstevel@tonic-gate 
6735e3986cbScth 	MDI_PHCI_LOCK(ph);
6747c478bd9Sstevel@tonic-gate 	MDI_PHCI_SET_POWER_UP(ph);
6755e3986cbScth 	MDI_PHCI_UNLOCK(ph);
6767c478bd9Sstevel@tonic-gate 	DEVI(pdip)->devi_mdi_component |= MDI_COMPONENT_PHCI;
6777c478bd9Sstevel@tonic-gate 	DEVI(pdip)->devi_mdi_xhci = (caddr_t)ph;
6787c478bd9Sstevel@tonic-gate 
6793c34adc5Sramat 	vhcache_phci_add(vh->vh_config, ph);
6803c34adc5Sramat 
6815e3986cbScth 	MDI_VHCI_PHCI_LOCK(vh);
6827c478bd9Sstevel@tonic-gate 	if (vh->vh_phci_head == NULL) {
6837c478bd9Sstevel@tonic-gate 		vh->vh_phci_head = ph;
6847c478bd9Sstevel@tonic-gate 	}
6857c478bd9Sstevel@tonic-gate 	if (vh->vh_phci_tail) {
6867c478bd9Sstevel@tonic-gate 		vh->vh_phci_tail->ph_next = ph;
6877c478bd9Sstevel@tonic-gate 	}
6887c478bd9Sstevel@tonic-gate 	vh->vh_phci_tail = ph;
6897c478bd9Sstevel@tonic-gate 	vh->vh_phci_count++;
6905e3986cbScth 	MDI_VHCI_PHCI_UNLOCK(vh);
6915e3986cbScth 
6928c4f8890Srs135747 	i_mdi_log_sysevent(pdip, class, ESC_DDI_INITIATOR_REGISTER);
6937c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
6947c478bd9Sstevel@tonic-gate }
6957c478bd9Sstevel@tonic-gate 
6967c478bd9Sstevel@tonic-gate /*
6977c478bd9Sstevel@tonic-gate  * mdi_phci_unregister():
6987c478bd9Sstevel@tonic-gate  *		Unregister a pHCI module from mpxio framework
6997c478bd9Sstevel@tonic-gate  *		mdi_phci_unregister() is called by the pHCI drivers from their
7007c478bd9Sstevel@tonic-gate  *		detach(9E) handler to unregister their instances from the
7017c478bd9Sstevel@tonic-gate  *		framework.
7027c478bd9Sstevel@tonic-gate  * Return Values:
7037c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
7047c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
7057c478bd9Sstevel@tonic-gate  */
7067c478bd9Sstevel@tonic-gate /*ARGSUSED*/
7077c478bd9Sstevel@tonic-gate int
7087c478bd9Sstevel@tonic-gate mdi_phci_unregister(dev_info_t *pdip, int flags)
7097c478bd9Sstevel@tonic-gate {
7107c478bd9Sstevel@tonic-gate 	mdi_vhci_t		*vh;
7117c478bd9Sstevel@tonic-gate 	mdi_phci_t		*ph;
7127c478bd9Sstevel@tonic-gate 	mdi_phci_t		*tmp;
7137c478bd9Sstevel@tonic-gate 	mdi_phci_t		*prev = NULL;
7144c06356bSdh142964 	mdi_pathinfo_t		*pip;
7157c478bd9Sstevel@tonic-gate 
7165e3986cbScth 	ASSERT(DEVI_BUSY_CHANGING(ddi_get_parent(pdip)));
7175e3986cbScth 
7187c478bd9Sstevel@tonic-gate 	ph = i_devi_get_phci(pdip);
7197c478bd9Sstevel@tonic-gate 	if (ph == NULL) {
7204c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, pdip, "!not a valid pHCI"));
7217c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
7227c478bd9Sstevel@tonic-gate 	}
7237c478bd9Sstevel@tonic-gate 
7247c478bd9Sstevel@tonic-gate 	vh = ph->ph_vhci;
7257c478bd9Sstevel@tonic-gate 	ASSERT(vh != NULL);
7267c478bd9Sstevel@tonic-gate 	if (vh == NULL) {
7274c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, pdip, "!not a valid vHCI"));
7287c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
7297c478bd9Sstevel@tonic-gate 	}
7307c478bd9Sstevel@tonic-gate 
7315e3986cbScth 	MDI_VHCI_PHCI_LOCK(vh);
7327c478bd9Sstevel@tonic-gate 	tmp = vh->vh_phci_head;
7337c478bd9Sstevel@tonic-gate 	while (tmp) {
7347c478bd9Sstevel@tonic-gate 		if (tmp == ph) {
7357c478bd9Sstevel@tonic-gate 			break;
7367c478bd9Sstevel@tonic-gate 		}
7377c478bd9Sstevel@tonic-gate 		prev = tmp;
7387c478bd9Sstevel@tonic-gate 		tmp = tmp->ph_next;
7397c478bd9Sstevel@tonic-gate 	}
7407c478bd9Sstevel@tonic-gate 
7417c478bd9Sstevel@tonic-gate 	if (ph == vh->vh_phci_head) {
7427c478bd9Sstevel@tonic-gate 		vh->vh_phci_head = ph->ph_next;
7437c478bd9Sstevel@tonic-gate 	} else {
7447c478bd9Sstevel@tonic-gate 		prev->ph_next = ph->ph_next;
7457c478bd9Sstevel@tonic-gate 	}
7467c478bd9Sstevel@tonic-gate 
7477c478bd9Sstevel@tonic-gate 	if (ph == vh->vh_phci_tail) {
7487c478bd9Sstevel@tonic-gate 		vh->vh_phci_tail = prev;
7497c478bd9Sstevel@tonic-gate 	}
7507c478bd9Sstevel@tonic-gate 
7517c478bd9Sstevel@tonic-gate 	vh->vh_phci_count--;
7525e3986cbScth 	MDI_VHCI_PHCI_UNLOCK(vh);
7537c478bd9Sstevel@tonic-gate 
7544c06356bSdh142964 	/* Walk remaining pathinfo nodes and disassociate them from pHCI */
7554c06356bSdh142964 	MDI_PHCI_LOCK(ph);
7564c06356bSdh142964 	for (pip = (mdi_pathinfo_t *)ph->ph_path_head; pip;
7574c06356bSdh142964 	    pip = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link)
7584c06356bSdh142964 		MDI_PI(pip)->pi_phci = NULL;
7594c06356bSdh142964 	MDI_PHCI_UNLOCK(ph);
7604c06356bSdh142964 
7618c4f8890Srs135747 	i_mdi_log_sysevent(pdip, ph->ph_vhci->vh_class,
7628c4f8890Srs135747 	    ESC_DDI_INITIATOR_UNREGISTER);
7633c34adc5Sramat 	vhcache_phci_remove(vh->vh_config, ph);
7647c478bd9Sstevel@tonic-gate 	cv_destroy(&ph->ph_unstable_cv);
7657c478bd9Sstevel@tonic-gate 	mutex_destroy(&ph->ph_mutex);
7667c478bd9Sstevel@tonic-gate 	kmem_free(ph, sizeof (mdi_phci_t));
7677c478bd9Sstevel@tonic-gate 	DEVI(pdip)->devi_mdi_component &= ~MDI_COMPONENT_PHCI;
7687c478bd9Sstevel@tonic-gate 	DEVI(pdip)->devi_mdi_xhci = NULL;
7697c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
7707c478bd9Sstevel@tonic-gate }
7717c478bd9Sstevel@tonic-gate 
7727c478bd9Sstevel@tonic-gate /*
7737c478bd9Sstevel@tonic-gate  * i_devi_get_phci():
7747c478bd9Sstevel@tonic-gate  * 		Utility function to return the phci extensions.
7757c478bd9Sstevel@tonic-gate  */
7767c478bd9Sstevel@tonic-gate static mdi_phci_t *
7777c478bd9Sstevel@tonic-gate i_devi_get_phci(dev_info_t *pdip)
7787c478bd9Sstevel@tonic-gate {
7797c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph = NULL;
78055e592a2SRandall Ralphs 
7817c478bd9Sstevel@tonic-gate 	if (MDI_PHCI(pdip)) {
7827c478bd9Sstevel@tonic-gate 		ph = (mdi_phci_t *)DEVI(pdip)->devi_mdi_xhci;
7837c478bd9Sstevel@tonic-gate 	}
7847c478bd9Sstevel@tonic-gate 	return (ph);
7857c478bd9Sstevel@tonic-gate }
7867c478bd9Sstevel@tonic-gate 
7877c478bd9Sstevel@tonic-gate /*
7885e3986cbScth  * Single thread mdi entry into devinfo node for modifying its children.
7895e3986cbScth  * If necessary we perform an ndi_devi_enter of the vHCI before doing
7905e3986cbScth  * an ndi_devi_enter of 'dip'.  We maintain circular in two parts: one
7915e3986cbScth  * for the vHCI and one for the pHCI.
7925e3986cbScth  */
7935e3986cbScth void
7945e3986cbScth mdi_devi_enter(dev_info_t *phci_dip, int *circular)
7955e3986cbScth {
7965e3986cbScth 	dev_info_t	*vdip;
7975e3986cbScth 	int		vcircular, pcircular;
7985e3986cbScth 
7995e3986cbScth 	/* Verify calling context */
8005e3986cbScth 	ASSERT(MDI_PHCI(phci_dip));
8015e3986cbScth 	vdip = mdi_devi_get_vdip(phci_dip);
8025e3986cbScth 	ASSERT(vdip);			/* A pHCI always has a vHCI */
8035e3986cbScth 
8045e3986cbScth 	/*
8055e3986cbScth 	 * If pHCI is detaching then the framework has already entered the
8065e3986cbScth 	 * vHCI on a threads that went down the code path leading to
8075e3986cbScth 	 * detach_node().  This framework enter of the vHCI during pHCI
8085e3986cbScth 	 * detach is done to avoid deadlock with vHCI power management
8095e3986cbScth 	 * operations which enter the vHCI and the enter down the path
8105e3986cbScth 	 * to the pHCI. If pHCI is detaching then we piggyback this calls
8115e3986cbScth 	 * enter of the vHCI on frameworks vHCI enter that has already
8125e3986cbScth 	 * occurred - this is OK because we know that the framework thread
8135e3986cbScth 	 * doing detach is waiting for our completion.
8145e3986cbScth 	 *
8155e3986cbScth 	 * We should DEVI_IS_DETACHING under an enter of the parent to avoid
8165e3986cbScth 	 * race with detach - but we can't do that because the framework has
8175e3986cbScth 	 * already entered the parent, so we have some complexity instead.
8185e3986cbScth 	 */
8195e3986cbScth 	for (;;) {
8205e3986cbScth 		if (ndi_devi_tryenter(vdip, &vcircular)) {
8215e3986cbScth 			ASSERT(vcircular != -1);
8225e3986cbScth 			if (DEVI_IS_DETACHING(phci_dip)) {
8235e3986cbScth 				ndi_devi_exit(vdip, vcircular);
8245e3986cbScth 				vcircular = -1;
8255e3986cbScth 			}
8265e3986cbScth 			break;
8275e3986cbScth 		} else if (DEVI_IS_DETACHING(phci_dip)) {
8285e3986cbScth 			vcircular = -1;
8295e3986cbScth 			break;
8304c06356bSdh142964 		} else if (servicing_interrupt()) {
8314c06356bSdh142964 			/*
8324c06356bSdh142964 			 * Don't delay an interrupt (and ensure adaptive
8334c06356bSdh142964 			 * mutex inversion support).
8344c06356bSdh142964 			 */
8354c06356bSdh142964 			ndi_devi_enter(vdip, &vcircular);
8364c06356bSdh142964 			break;
8375e3986cbScth 		} else {
8384c06356bSdh142964 			delay_random(2);
8395e3986cbScth 		}
8405e3986cbScth 	}
8415e3986cbScth 
8425e3986cbScth 	ndi_devi_enter(phci_dip, &pcircular);
8435e3986cbScth 	*circular = (vcircular << 16) | (pcircular & 0xFFFF);
8445e3986cbScth }
8455e3986cbScth 
8465e3986cbScth /*
84755e592a2SRandall Ralphs  * Attempt to mdi_devi_enter.
84855e592a2SRandall Ralphs  */
84955e592a2SRandall Ralphs int
85055e592a2SRandall Ralphs mdi_devi_tryenter(dev_info_t *phci_dip, int *circular)
85155e592a2SRandall Ralphs {
85255e592a2SRandall Ralphs 	dev_info_t	*vdip;
85355e592a2SRandall Ralphs 	int		vcircular, pcircular;
85455e592a2SRandall Ralphs 
85555e592a2SRandall Ralphs 	/* Verify calling context */
85655e592a2SRandall Ralphs 	ASSERT(MDI_PHCI(phci_dip));
85755e592a2SRandall Ralphs 	vdip = mdi_devi_get_vdip(phci_dip);
85855e592a2SRandall Ralphs 	ASSERT(vdip);			/* A pHCI always has a vHCI */
85955e592a2SRandall Ralphs 
86055e592a2SRandall Ralphs 	if (ndi_devi_tryenter(vdip, &vcircular)) {
86155e592a2SRandall Ralphs 		if (ndi_devi_tryenter(phci_dip, &pcircular)) {
86255e592a2SRandall Ralphs 			*circular = (vcircular << 16) | (pcircular & 0xFFFF);
86355e592a2SRandall Ralphs 			return (1);	/* locked */
86455e592a2SRandall Ralphs 		}
86555e592a2SRandall Ralphs 		ndi_devi_exit(vdip, vcircular);
86655e592a2SRandall Ralphs 	}
86755e592a2SRandall Ralphs 	return (0);			/* busy */
86855e592a2SRandall Ralphs }
86955e592a2SRandall Ralphs 
87055e592a2SRandall Ralphs /*
8715e3986cbScth  * Release mdi_devi_enter or successful mdi_devi_tryenter.
8725e3986cbScth  */
8735e3986cbScth void
8745e3986cbScth mdi_devi_exit(dev_info_t *phci_dip, int circular)
8755e3986cbScth {
8765e3986cbScth 	dev_info_t	*vdip;
8775e3986cbScth 	int		vcircular, pcircular;
8785e3986cbScth 
8795e3986cbScth 	/* Verify calling context */
8805e3986cbScth 	ASSERT(MDI_PHCI(phci_dip));
8815e3986cbScth 	vdip = mdi_devi_get_vdip(phci_dip);
8825e3986cbScth 	ASSERT(vdip);			/* A pHCI always has a vHCI */
8835e3986cbScth 
8845e3986cbScth 	/* extract two circular recursion values from single int */
8855e3986cbScth 	pcircular = (short)(circular & 0xFFFF);
8865e3986cbScth 	vcircular = (short)((circular >> 16) & 0xFFFF);
8875e3986cbScth 
8885e3986cbScth 	ndi_devi_exit(phci_dip, pcircular);
8895e3986cbScth 	if (vcircular != -1)
8905e3986cbScth 		ndi_devi_exit(vdip, vcircular);
8915e3986cbScth }
8925e3986cbScth 
8935e3986cbScth /*
8945e3986cbScth  * The functions mdi_devi_exit_phci() and mdi_devi_enter_phci() are used
8955e3986cbScth  * around a pHCI drivers calls to mdi_pi_online/offline, after holding
8965e3986cbScth  * the pathinfo node via mdi_hold_path/mdi_rele_path, to avoid deadlock
8975e3986cbScth  * with vHCI power management code during path online/offline.  Each
8985e3986cbScth  * mdi_devi_exit_phci must have a matching mdi_devi_enter_phci, and both must
8995e3986cbScth  * occur within the scope of an active mdi_devi_enter that establishes the
9005e3986cbScth  * circular value.
9015e3986cbScth  */
9025e3986cbScth void
9035e3986cbScth mdi_devi_exit_phci(dev_info_t *phci_dip, int circular)
9045e3986cbScth {
9055e3986cbScth 	int		pcircular;
9065e3986cbScth 
9075e3986cbScth 	/* Verify calling context */
9085e3986cbScth 	ASSERT(MDI_PHCI(phci_dip));
9095e3986cbScth 
9104c06356bSdh142964 	/* Keep hold on pHCI until we reenter in mdi_devi_enter_phci */
9114c06356bSdh142964 	ndi_hold_devi(phci_dip);
9124c06356bSdh142964 
9135e3986cbScth 	pcircular = (short)(circular & 0xFFFF);
9145e3986cbScth 	ndi_devi_exit(phci_dip, pcircular);
9155e3986cbScth }
9165e3986cbScth 
9175e3986cbScth void
9185e3986cbScth mdi_devi_enter_phci(dev_info_t *phci_dip, int *circular)
9195e3986cbScth {
9205e3986cbScth 	int		pcircular;
9215e3986cbScth 
9225e3986cbScth 	/* Verify calling context */
9235e3986cbScth 	ASSERT(MDI_PHCI(phci_dip));
9245e3986cbScth 
9255e3986cbScth 	ndi_devi_enter(phci_dip, &pcircular);
9265e3986cbScth 
9274c06356bSdh142964 	/* Drop hold from mdi_devi_exit_phci. */
9284c06356bSdh142964 	ndi_rele_devi(phci_dip);
9294c06356bSdh142964 
9305e3986cbScth 	/* verify matching mdi_devi_exit_phci/mdi_devi_enter_phci use */
9315e3986cbScth 	ASSERT(pcircular == ((short)(*circular & 0xFFFF)));
9325e3986cbScth }
9335e3986cbScth 
9345e3986cbScth /*
9355e3986cbScth  * mdi_devi_get_vdip():
9365e3986cbScth  *		given a pHCI dip return vHCI dip
9375e3986cbScth  */
9385e3986cbScth dev_info_t *
9395e3986cbScth mdi_devi_get_vdip(dev_info_t *pdip)
9405e3986cbScth {
9415e3986cbScth 	mdi_phci_t	*ph;
9425e3986cbScth 
9435e3986cbScth 	ph = i_devi_get_phci(pdip);
9445e3986cbScth 	if (ph && ph->ph_vhci)
9455e3986cbScth 		return (ph->ph_vhci->vh_dip);
9465e3986cbScth 	return (NULL);
9475e3986cbScth }
9485e3986cbScth 
9495e3986cbScth /*
9505e3986cbScth  * mdi_devi_pdip_entered():
9515e3986cbScth  *		Return 1 if we are vHCI and have done an ndi_devi_enter
9525e3986cbScth  *		of a pHCI
9535e3986cbScth  */
9545e3986cbScth int
9555e3986cbScth mdi_devi_pdip_entered(dev_info_t *vdip)
9565e3986cbScth {
9575e3986cbScth 	mdi_vhci_t	*vh;
9585e3986cbScth 	mdi_phci_t	*ph;
9595e3986cbScth 
9605e3986cbScth 	vh = i_devi_get_vhci(vdip);
9615e3986cbScth 	if (vh == NULL)
9625e3986cbScth 		return (0);
9635e3986cbScth 
9645e3986cbScth 	MDI_VHCI_PHCI_LOCK(vh);
9655e3986cbScth 	ph = vh->vh_phci_head;
9665e3986cbScth 	while (ph) {
9675e3986cbScth 		if (ph->ph_dip && DEVI_BUSY_OWNED(ph->ph_dip)) {
9685e3986cbScth 			MDI_VHCI_PHCI_UNLOCK(vh);
9695e3986cbScth 			return (1);
9705e3986cbScth 		}
9715e3986cbScth 		ph = ph->ph_next;
9725e3986cbScth 	}
9735e3986cbScth 	MDI_VHCI_PHCI_UNLOCK(vh);
9745e3986cbScth 	return (0);
9755e3986cbScth }
9765e3986cbScth 
9775e3986cbScth /*
9787c478bd9Sstevel@tonic-gate  * mdi_phci_path2devinfo():
9797c478bd9Sstevel@tonic-gate  * 		Utility function to search for a valid phci device given
9807c478bd9Sstevel@tonic-gate  *		the devfs pathname.
9817c478bd9Sstevel@tonic-gate  */
9827c478bd9Sstevel@tonic-gate dev_info_t *
9837c478bd9Sstevel@tonic-gate mdi_phci_path2devinfo(dev_info_t *vdip, caddr_t pathname)
9847c478bd9Sstevel@tonic-gate {
9857c478bd9Sstevel@tonic-gate 	char		*temp_pathname;
9867c478bd9Sstevel@tonic-gate 	mdi_vhci_t	*vh;
9877c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
9887c478bd9Sstevel@tonic-gate 	dev_info_t 	*pdip = NULL;
9897c478bd9Sstevel@tonic-gate 
9907c478bd9Sstevel@tonic-gate 	vh = i_devi_get_vhci(vdip);
9917c478bd9Sstevel@tonic-gate 	ASSERT(vh != NULL);
9927c478bd9Sstevel@tonic-gate 
9937c478bd9Sstevel@tonic-gate 	if (vh == NULL) {
9947c478bd9Sstevel@tonic-gate 		/*
9957c478bd9Sstevel@tonic-gate 		 * Invalid vHCI component, return failure
9967c478bd9Sstevel@tonic-gate 		 */
9977c478bd9Sstevel@tonic-gate 		return (NULL);
9987c478bd9Sstevel@tonic-gate 	}
9997c478bd9Sstevel@tonic-gate 
10007c478bd9Sstevel@tonic-gate 	temp_pathname = kmem_zalloc(MAXPATHLEN, KM_SLEEP);
10015e3986cbScth 	MDI_VHCI_PHCI_LOCK(vh);
10027c478bd9Sstevel@tonic-gate 	ph = vh->vh_phci_head;
10037c478bd9Sstevel@tonic-gate 	while (ph != NULL) {
10047c478bd9Sstevel@tonic-gate 		pdip = ph->ph_dip;
10057c478bd9Sstevel@tonic-gate 		ASSERT(pdip != NULL);
10067c478bd9Sstevel@tonic-gate 		*temp_pathname = '\0';
10077c478bd9Sstevel@tonic-gate 		(void) ddi_pathname(pdip, temp_pathname);
10087c478bd9Sstevel@tonic-gate 		if (strcmp(temp_pathname, pathname) == 0) {
10097c478bd9Sstevel@tonic-gate 			break;
10107c478bd9Sstevel@tonic-gate 		}
10117c478bd9Sstevel@tonic-gate 		ph = ph->ph_next;
10127c478bd9Sstevel@tonic-gate 	}
10137c478bd9Sstevel@tonic-gate 	if (ph == NULL) {
10147c478bd9Sstevel@tonic-gate 		pdip = NULL;
10157c478bd9Sstevel@tonic-gate 	}
10165e3986cbScth 	MDI_VHCI_PHCI_UNLOCK(vh);
10177c478bd9Sstevel@tonic-gate 	kmem_free(temp_pathname, MAXPATHLEN);
10187c478bd9Sstevel@tonic-gate 	return (pdip);
10197c478bd9Sstevel@tonic-gate }
10207c478bd9Sstevel@tonic-gate 
10217c478bd9Sstevel@tonic-gate /*
10227c478bd9Sstevel@tonic-gate  * mdi_phci_get_path_count():
10237c478bd9Sstevel@tonic-gate  * 		get number of path information nodes associated with a given
10247c478bd9Sstevel@tonic-gate  *		pHCI device.
10257c478bd9Sstevel@tonic-gate  */
10267c478bd9Sstevel@tonic-gate int
10277c478bd9Sstevel@tonic-gate mdi_phci_get_path_count(dev_info_t *pdip)
10287c478bd9Sstevel@tonic-gate {
10297c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
10307c478bd9Sstevel@tonic-gate 	int		count = 0;
10317c478bd9Sstevel@tonic-gate 
10327c478bd9Sstevel@tonic-gate 	ph = i_devi_get_phci(pdip);
10337c478bd9Sstevel@tonic-gate 	if (ph != NULL) {
10347c478bd9Sstevel@tonic-gate 		count = ph->ph_path_count;
10357c478bd9Sstevel@tonic-gate 	}
10367c478bd9Sstevel@tonic-gate 	return (count);
10377c478bd9Sstevel@tonic-gate }
10387c478bd9Sstevel@tonic-gate 
10397c478bd9Sstevel@tonic-gate /*
10407c478bd9Sstevel@tonic-gate  * i_mdi_phci_lock():
10417c478bd9Sstevel@tonic-gate  *		Lock a pHCI device
10427c478bd9Sstevel@tonic-gate  * Return Values:
10437c478bd9Sstevel@tonic-gate  *		None
10447c478bd9Sstevel@tonic-gate  * Note:
10457c478bd9Sstevel@tonic-gate  *		The default locking order is:
10467c478bd9Sstevel@tonic-gate  *		_NOTE(LOCK_ORDER(mdi_phci::ph_mutex mdi_pathinfo::pi_mutex))
10477c478bd9Sstevel@tonic-gate  *		But there are number of situations where locks need to be
10487c478bd9Sstevel@tonic-gate  *		grabbed in reverse order.  This routine implements try and lock
10497c478bd9Sstevel@tonic-gate  *		mechanism depending on the requested parameter option.
10507c478bd9Sstevel@tonic-gate  */
10517c478bd9Sstevel@tonic-gate static void
10527c478bd9Sstevel@tonic-gate i_mdi_phci_lock(mdi_phci_t *ph, mdi_pathinfo_t *pip)
10537c478bd9Sstevel@tonic-gate {
10547c478bd9Sstevel@tonic-gate 	if (pip) {
10557c478bd9Sstevel@tonic-gate 		/* Reverse locking is requested. */
10567c478bd9Sstevel@tonic-gate 		while (MDI_PHCI_TRYLOCK(ph) == 0) {
10574c06356bSdh142964 			if (servicing_interrupt()) {
10584c06356bSdh142964 				MDI_PI_HOLD(pip);
10594c06356bSdh142964 				MDI_PI_UNLOCK(pip);
10604c06356bSdh142964 				MDI_PHCI_LOCK(ph);
10614c06356bSdh142964 				MDI_PI_LOCK(pip);
10624c06356bSdh142964 				MDI_PI_RELE(pip);
10634c06356bSdh142964 				break;
10644c06356bSdh142964 			} else {
10657c478bd9Sstevel@tonic-gate 				/*
10667c478bd9Sstevel@tonic-gate 				 * tryenter failed. Try to grab again
10677c478bd9Sstevel@tonic-gate 				 * after a small delay
10687c478bd9Sstevel@tonic-gate 				 */
10697c478bd9Sstevel@tonic-gate 				MDI_PI_HOLD(pip);
10707c478bd9Sstevel@tonic-gate 				MDI_PI_UNLOCK(pip);
10714c06356bSdh142964 				delay_random(2);
10727c478bd9Sstevel@tonic-gate 				MDI_PI_LOCK(pip);
10737c478bd9Sstevel@tonic-gate 				MDI_PI_RELE(pip);
10747c478bd9Sstevel@tonic-gate 			}
10754c06356bSdh142964 		}
10767c478bd9Sstevel@tonic-gate 	} else {
10777c478bd9Sstevel@tonic-gate 		MDI_PHCI_LOCK(ph);
10787c478bd9Sstevel@tonic-gate 	}
10797c478bd9Sstevel@tonic-gate }
10807c478bd9Sstevel@tonic-gate 
10817c478bd9Sstevel@tonic-gate /*
10827c478bd9Sstevel@tonic-gate  * i_mdi_phci_unlock():
10837c478bd9Sstevel@tonic-gate  *		Unlock the pHCI component
10847c478bd9Sstevel@tonic-gate  */
10857c478bd9Sstevel@tonic-gate static void
10867c478bd9Sstevel@tonic-gate i_mdi_phci_unlock(mdi_phci_t *ph)
10877c478bd9Sstevel@tonic-gate {
10887c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNLOCK(ph);
10897c478bd9Sstevel@tonic-gate }
10907c478bd9Sstevel@tonic-gate 
10917c478bd9Sstevel@tonic-gate /*
10927c478bd9Sstevel@tonic-gate  * i_mdi_devinfo_create():
10937c478bd9Sstevel@tonic-gate  *		create client device's devinfo node
10947c478bd9Sstevel@tonic-gate  * Return Values:
10957c478bd9Sstevel@tonic-gate  *		dev_info
10967c478bd9Sstevel@tonic-gate  *		NULL
10977c478bd9Sstevel@tonic-gate  * Notes:
10987c478bd9Sstevel@tonic-gate  */
10997c478bd9Sstevel@tonic-gate static dev_info_t *
11007c478bd9Sstevel@tonic-gate i_mdi_devinfo_create(mdi_vhci_t *vh, char *name, char *guid,
11013c34adc5Sramat 	char **compatible, int ncompatible)
11027c478bd9Sstevel@tonic-gate {
11037c478bd9Sstevel@tonic-gate 	dev_info_t *cdip = NULL;
11047c478bd9Sstevel@tonic-gate 
11055e3986cbScth 	ASSERT(MDI_VHCI_CLIENT_LOCKED(vh));
11067c478bd9Sstevel@tonic-gate 
11077c478bd9Sstevel@tonic-gate 	/* Verify for duplicate entry */
11087c478bd9Sstevel@tonic-gate 	cdip = i_mdi_devinfo_find(vh, name, guid);
11097c478bd9Sstevel@tonic-gate 	ASSERT(cdip == NULL);
11107c478bd9Sstevel@tonic-gate 	if (cdip) {
11117c478bd9Sstevel@tonic-gate 		cmn_err(CE_WARN,
11124c06356bSdh142964 		    "i_mdi_devinfo_create: client %s@%s already exists",
11134c06356bSdh142964 			name ? name : "", guid ? guid : "");
11147c478bd9Sstevel@tonic-gate 	}
11157c478bd9Sstevel@tonic-gate 
11163c34adc5Sramat 	ndi_devi_alloc_sleep(vh->vh_dip, name, DEVI_SID_NODEID, &cdip);
11177c478bd9Sstevel@tonic-gate 	if (cdip == NULL)
11187c478bd9Sstevel@tonic-gate 		goto fail;
11197c478bd9Sstevel@tonic-gate 
11207c478bd9Sstevel@tonic-gate 	/*
11217c478bd9Sstevel@tonic-gate 	 * Create component type and Global unique identifier
11227c478bd9Sstevel@tonic-gate 	 * properties
11237c478bd9Sstevel@tonic-gate 	 */
11247c478bd9Sstevel@tonic-gate 	if (ndi_prop_update_string(DDI_DEV_T_NONE, cdip,
11257c478bd9Sstevel@tonic-gate 	    MDI_CLIENT_GUID_PROP, guid) != DDI_PROP_SUCCESS) {
11267c478bd9Sstevel@tonic-gate 		goto fail;
11277c478bd9Sstevel@tonic-gate 	}
11287c478bd9Sstevel@tonic-gate 
11297c478bd9Sstevel@tonic-gate 	/* Decorate the node with compatible property */
11307c478bd9Sstevel@tonic-gate 	if (compatible &&
11317c478bd9Sstevel@tonic-gate 	    (ndi_prop_update_string_array(DDI_DEV_T_NONE, cdip,
11327c478bd9Sstevel@tonic-gate 	    "compatible", compatible, ncompatible) != DDI_PROP_SUCCESS)) {
11337c478bd9Sstevel@tonic-gate 		goto fail;
11347c478bd9Sstevel@tonic-gate 	}
11357c478bd9Sstevel@tonic-gate 
11367c478bd9Sstevel@tonic-gate 	return (cdip);
11377c478bd9Sstevel@tonic-gate 
11387c478bd9Sstevel@tonic-gate fail:
11397c478bd9Sstevel@tonic-gate 	if (cdip) {
11407c478bd9Sstevel@tonic-gate 		(void) ndi_prop_remove_all(cdip);
11417c478bd9Sstevel@tonic-gate 		(void) ndi_devi_free(cdip);
11427c478bd9Sstevel@tonic-gate 	}
11437c478bd9Sstevel@tonic-gate 	return (NULL);
11447c478bd9Sstevel@tonic-gate }
11457c478bd9Sstevel@tonic-gate 
11467c478bd9Sstevel@tonic-gate /*
11477c478bd9Sstevel@tonic-gate  * i_mdi_devinfo_find():
11487c478bd9Sstevel@tonic-gate  *		Find a matching devinfo node for given client node name
11497c478bd9Sstevel@tonic-gate  *		and its guid.
11507c478bd9Sstevel@tonic-gate  * Return Values:
11517c478bd9Sstevel@tonic-gate  *		Handle to a dev_info node or NULL
11527c478bd9Sstevel@tonic-gate  */
11537c478bd9Sstevel@tonic-gate static dev_info_t *
11547c478bd9Sstevel@tonic-gate i_mdi_devinfo_find(mdi_vhci_t *vh, caddr_t name, char *guid)
11557c478bd9Sstevel@tonic-gate {
11567c478bd9Sstevel@tonic-gate 	char			*data;
11577c478bd9Sstevel@tonic-gate 	dev_info_t 		*cdip = NULL;
11587c478bd9Sstevel@tonic-gate 	dev_info_t 		*ndip = NULL;
11597c478bd9Sstevel@tonic-gate 	int			circular;
11607c478bd9Sstevel@tonic-gate 
11617c478bd9Sstevel@tonic-gate 	ndi_devi_enter(vh->vh_dip, &circular);
11627c478bd9Sstevel@tonic-gate 	ndip = (dev_info_t *)DEVI(vh->vh_dip)->devi_child;
11637c478bd9Sstevel@tonic-gate 	while ((cdip = ndip) != NULL) {
11647c478bd9Sstevel@tonic-gate 		ndip = (dev_info_t *)DEVI(cdip)->devi_sibling;
11657c478bd9Sstevel@tonic-gate 
11667c478bd9Sstevel@tonic-gate 		if (strcmp(DEVI(cdip)->devi_node_name, name)) {
11677c478bd9Sstevel@tonic-gate 			continue;
11687c478bd9Sstevel@tonic-gate 		}
11697c478bd9Sstevel@tonic-gate 
11707c478bd9Sstevel@tonic-gate 		if (ddi_prop_lookup_string(DDI_DEV_T_ANY, cdip,
11717c478bd9Sstevel@tonic-gate 		    DDI_PROP_DONTPASS, MDI_CLIENT_GUID_PROP,
11727c478bd9Sstevel@tonic-gate 		    &data) != DDI_PROP_SUCCESS) {
11737c478bd9Sstevel@tonic-gate 			continue;
11747c478bd9Sstevel@tonic-gate 		}
11757c478bd9Sstevel@tonic-gate 
11767c478bd9Sstevel@tonic-gate 		if (strcmp(data, guid) != 0) {
11777c478bd9Sstevel@tonic-gate 			ddi_prop_free(data);
11787c478bd9Sstevel@tonic-gate 			continue;
11797c478bd9Sstevel@tonic-gate 		}
11807c478bd9Sstevel@tonic-gate 		ddi_prop_free(data);
11817c478bd9Sstevel@tonic-gate 		break;
11827c478bd9Sstevel@tonic-gate 	}
11837c478bd9Sstevel@tonic-gate 	ndi_devi_exit(vh->vh_dip, circular);
11847c478bd9Sstevel@tonic-gate 	return (cdip);
11857c478bd9Sstevel@tonic-gate }
11867c478bd9Sstevel@tonic-gate 
11877c478bd9Sstevel@tonic-gate /*
11887c478bd9Sstevel@tonic-gate  * i_mdi_devinfo_remove():
11897c478bd9Sstevel@tonic-gate  *		Remove a client device node
11907c478bd9Sstevel@tonic-gate  */
11917c478bd9Sstevel@tonic-gate static int
11927c478bd9Sstevel@tonic-gate i_mdi_devinfo_remove(dev_info_t *vdip, dev_info_t *cdip, int flags)
11937c478bd9Sstevel@tonic-gate {
11947c478bd9Sstevel@tonic-gate 	int	rv = MDI_SUCCESS;
11955e3986cbScth 
11967c478bd9Sstevel@tonic-gate 	if (i_mdi_is_child_present(vdip, cdip) == MDI_SUCCESS ||
11977c478bd9Sstevel@tonic-gate 	    (flags & MDI_CLIENT_FLAGS_DEV_NOT_SUPPORTED)) {
11984c06356bSdh142964 		rv = ndi_devi_offline(cdip, NDI_DEVFS_CLEAN | NDI_DEVI_REMOVE);
11997c478bd9Sstevel@tonic-gate 		if (rv != NDI_SUCCESS) {
12004c06356bSdh142964 			MDI_DEBUG(1, (MDI_NOTE, cdip,
12014c06356bSdh142964 			    "!failed: cdip %p", (void *)cdip));
12027c478bd9Sstevel@tonic-gate 		}
12037c478bd9Sstevel@tonic-gate 		/*
12047c478bd9Sstevel@tonic-gate 		 * Convert to MDI error code
12057c478bd9Sstevel@tonic-gate 		 */
12067c478bd9Sstevel@tonic-gate 		switch (rv) {
12077c478bd9Sstevel@tonic-gate 		case NDI_SUCCESS:
12087c478bd9Sstevel@tonic-gate 			rv = MDI_SUCCESS;
12097c478bd9Sstevel@tonic-gate 			break;
12107c478bd9Sstevel@tonic-gate 		case NDI_BUSY:
12117c478bd9Sstevel@tonic-gate 			rv = MDI_BUSY;
12127c478bd9Sstevel@tonic-gate 			break;
12137c478bd9Sstevel@tonic-gate 		default:
12147c478bd9Sstevel@tonic-gate 			rv = MDI_FAILURE;
12157c478bd9Sstevel@tonic-gate 			break;
12167c478bd9Sstevel@tonic-gate 		}
12177c478bd9Sstevel@tonic-gate 	}
12187c478bd9Sstevel@tonic-gate 	return (rv);
12197c478bd9Sstevel@tonic-gate }
12207c478bd9Sstevel@tonic-gate 
12217c478bd9Sstevel@tonic-gate /*
12227c478bd9Sstevel@tonic-gate  * i_devi_get_client()
12237c478bd9Sstevel@tonic-gate  *		Utility function to get mpxio component extensions
12247c478bd9Sstevel@tonic-gate  */
12257c478bd9Sstevel@tonic-gate static mdi_client_t *
12267c478bd9Sstevel@tonic-gate i_devi_get_client(dev_info_t *cdip)
12277c478bd9Sstevel@tonic-gate {
12287c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct = NULL;
12295e3986cbScth 
12307c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT(cdip)) {
12317c478bd9Sstevel@tonic-gate 		ct = (mdi_client_t *)DEVI(cdip)->devi_mdi_client;
12327c478bd9Sstevel@tonic-gate 	}
12337c478bd9Sstevel@tonic-gate 	return (ct);
12347c478bd9Sstevel@tonic-gate }
12357c478bd9Sstevel@tonic-gate 
12367c478bd9Sstevel@tonic-gate /*
12377c478bd9Sstevel@tonic-gate  * i_mdi_is_child_present():
12387c478bd9Sstevel@tonic-gate  *		Search for the presence of client device dev_info node
12397c478bd9Sstevel@tonic-gate  */
12407c478bd9Sstevel@tonic-gate static int
12417c478bd9Sstevel@tonic-gate i_mdi_is_child_present(dev_info_t *vdip, dev_info_t *cdip)
12427c478bd9Sstevel@tonic-gate {
12437c478bd9Sstevel@tonic-gate 	int		rv = MDI_FAILURE;
12447c478bd9Sstevel@tonic-gate 	struct dev_info	*dip;
12457c478bd9Sstevel@tonic-gate 	int		circular;
12467c478bd9Sstevel@tonic-gate 
12477c478bd9Sstevel@tonic-gate 	ndi_devi_enter(vdip, &circular);
12487c478bd9Sstevel@tonic-gate 	dip = DEVI(vdip)->devi_child;
12497c478bd9Sstevel@tonic-gate 	while (dip) {
12507c478bd9Sstevel@tonic-gate 		if (dip == DEVI(cdip)) {
12517c478bd9Sstevel@tonic-gate 			rv = MDI_SUCCESS;
12527c478bd9Sstevel@tonic-gate 			break;
12537c478bd9Sstevel@tonic-gate 		}
12547c478bd9Sstevel@tonic-gate 		dip = dip->devi_sibling;
12557c478bd9Sstevel@tonic-gate 	}
12567c478bd9Sstevel@tonic-gate 	ndi_devi_exit(vdip, circular);
12577c478bd9Sstevel@tonic-gate 	return (rv);
12587c478bd9Sstevel@tonic-gate }
12597c478bd9Sstevel@tonic-gate 
12607c478bd9Sstevel@tonic-gate 
12617c478bd9Sstevel@tonic-gate /*
12627c478bd9Sstevel@tonic-gate  * i_mdi_client_lock():
12637c478bd9Sstevel@tonic-gate  *		Grab client component lock
12647c478bd9Sstevel@tonic-gate  * Return Values:
12657c478bd9Sstevel@tonic-gate  *		None
12667c478bd9Sstevel@tonic-gate  * Note:
12677c478bd9Sstevel@tonic-gate  *		The default locking order is:
12687c478bd9Sstevel@tonic-gate  *		_NOTE(LOCK_ORDER(mdi_client::ct_mutex mdi_pathinfo::pi_mutex))
12697c478bd9Sstevel@tonic-gate  *		But there are number of situations where locks need to be
12707c478bd9Sstevel@tonic-gate  *		grabbed in reverse order.  This routine implements try and lock
12717c478bd9Sstevel@tonic-gate  *		mechanism depending on the requested parameter option.
12727c478bd9Sstevel@tonic-gate  */
12737c478bd9Sstevel@tonic-gate static void
12747c478bd9Sstevel@tonic-gate i_mdi_client_lock(mdi_client_t *ct, mdi_pathinfo_t *pip)
12757c478bd9Sstevel@tonic-gate {
12767c478bd9Sstevel@tonic-gate 	if (pip) {
12777c478bd9Sstevel@tonic-gate 		/*
12787c478bd9Sstevel@tonic-gate 		 * Reverse locking is requested.
12797c478bd9Sstevel@tonic-gate 		 */
12807c478bd9Sstevel@tonic-gate 		while (MDI_CLIENT_TRYLOCK(ct) == 0) {
12814c06356bSdh142964 			if (servicing_interrupt()) {
12824c06356bSdh142964 				MDI_PI_HOLD(pip);
12834c06356bSdh142964 				MDI_PI_UNLOCK(pip);
12844c06356bSdh142964 				MDI_CLIENT_LOCK(ct);
12854c06356bSdh142964 				MDI_PI_LOCK(pip);
12864c06356bSdh142964 				MDI_PI_RELE(pip);
12874c06356bSdh142964 				break;
12884c06356bSdh142964 			} else {
12897c478bd9Sstevel@tonic-gate 				/*
12907c478bd9Sstevel@tonic-gate 				 * tryenter failed. Try to grab again
12917c478bd9Sstevel@tonic-gate 				 * after a small delay
12927c478bd9Sstevel@tonic-gate 				 */
12937c478bd9Sstevel@tonic-gate 				MDI_PI_HOLD(pip);
12947c478bd9Sstevel@tonic-gate 				MDI_PI_UNLOCK(pip);
12954c06356bSdh142964 				delay_random(2);
12967c478bd9Sstevel@tonic-gate 				MDI_PI_LOCK(pip);
12977c478bd9Sstevel@tonic-gate 				MDI_PI_RELE(pip);
12987c478bd9Sstevel@tonic-gate 			}
12994c06356bSdh142964 		}
13007c478bd9Sstevel@tonic-gate 	} else {
13017c478bd9Sstevel@tonic-gate 		MDI_CLIENT_LOCK(ct);
13027c478bd9Sstevel@tonic-gate 	}
13037c478bd9Sstevel@tonic-gate }
13047c478bd9Sstevel@tonic-gate 
13057c478bd9Sstevel@tonic-gate /*
13067c478bd9Sstevel@tonic-gate  * i_mdi_client_unlock():
13077c478bd9Sstevel@tonic-gate  *		Unlock a client component
13087c478bd9Sstevel@tonic-gate  */
13097c478bd9Sstevel@tonic-gate static void
13107c478bd9Sstevel@tonic-gate i_mdi_client_unlock(mdi_client_t *ct)
13117c478bd9Sstevel@tonic-gate {
13127c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
13137c478bd9Sstevel@tonic-gate }
13147c478bd9Sstevel@tonic-gate 
13157c478bd9Sstevel@tonic-gate /*
13167c478bd9Sstevel@tonic-gate  * i_mdi_client_alloc():
13177c478bd9Sstevel@tonic-gate  * 		Allocate and initialize a client structure.  Caller should
13185e3986cbScth  *		hold the vhci client lock.
13197c478bd9Sstevel@tonic-gate  * Return Values:
13207c478bd9Sstevel@tonic-gate  *		Handle to a client component
13217c478bd9Sstevel@tonic-gate  */
13227c478bd9Sstevel@tonic-gate /*ARGSUSED*/
13237c478bd9Sstevel@tonic-gate static mdi_client_t *
13243c34adc5Sramat i_mdi_client_alloc(mdi_vhci_t *vh, char *name, char *lguid)
13257c478bd9Sstevel@tonic-gate {
13267c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
13277c478bd9Sstevel@tonic-gate 
13285e3986cbScth 	ASSERT(MDI_VHCI_CLIENT_LOCKED(vh));
13297c478bd9Sstevel@tonic-gate 
13307c478bd9Sstevel@tonic-gate 	/*
13317c478bd9Sstevel@tonic-gate 	 * Allocate and initialize a component structure.
13327c478bd9Sstevel@tonic-gate 	 */
13333c34adc5Sramat 	ct = kmem_zalloc(sizeof (*ct), KM_SLEEP);
13347c478bd9Sstevel@tonic-gate 	mutex_init(&ct->ct_mutex, NULL, MUTEX_DEFAULT, NULL);
13357c478bd9Sstevel@tonic-gate 	ct->ct_hnext = NULL;
13367c478bd9Sstevel@tonic-gate 	ct->ct_hprev = NULL;
13377c478bd9Sstevel@tonic-gate 	ct->ct_dip = NULL;
13387c478bd9Sstevel@tonic-gate 	ct->ct_vhci = vh;
13393c34adc5Sramat 	ct->ct_drvname = kmem_alloc(strlen(name) + 1, KM_SLEEP);
13407c478bd9Sstevel@tonic-gate 	(void) strcpy(ct->ct_drvname, name);
13413c34adc5Sramat 	ct->ct_guid = kmem_alloc(strlen(lguid) + 1, KM_SLEEP);
13427c478bd9Sstevel@tonic-gate 	(void) strcpy(ct->ct_guid, lguid);
13437c478bd9Sstevel@tonic-gate 	ct->ct_cprivate = NULL;
13447c478bd9Sstevel@tonic-gate 	ct->ct_vprivate = NULL;
13457c478bd9Sstevel@tonic-gate 	ct->ct_flags = 0;
13467c478bd9Sstevel@tonic-gate 	ct->ct_state = MDI_CLIENT_STATE_FAILED;
13475e3986cbScth 	MDI_CLIENT_LOCK(ct);
13487c478bd9Sstevel@tonic-gate 	MDI_CLIENT_SET_OFFLINE(ct);
13497c478bd9Sstevel@tonic-gate 	MDI_CLIENT_SET_DETACH(ct);
13507c478bd9Sstevel@tonic-gate 	MDI_CLIENT_SET_POWER_UP(ct);
13515e3986cbScth 	MDI_CLIENT_UNLOCK(ct);
13527c478bd9Sstevel@tonic-gate 	ct->ct_failover_flags = 0;
13537c478bd9Sstevel@tonic-gate 	ct->ct_failover_status = 0;
13547c478bd9Sstevel@tonic-gate 	cv_init(&ct->ct_failover_cv, NULL, CV_DRIVER, NULL);
13557c478bd9Sstevel@tonic-gate 	ct->ct_unstable = 0;
13567c478bd9Sstevel@tonic-gate 	cv_init(&ct->ct_unstable_cv, NULL, CV_DRIVER, NULL);
13577c478bd9Sstevel@tonic-gate 	cv_init(&ct->ct_powerchange_cv, NULL, CV_DRIVER, NULL);
13587c478bd9Sstevel@tonic-gate 	ct->ct_lb = vh->vh_lb;
13593c34adc5Sramat 	ct->ct_lb_args =  kmem_zalloc(sizeof (client_lb_args_t), KM_SLEEP);
13607c478bd9Sstevel@tonic-gate 	ct->ct_lb_args->region_size = LOAD_BALANCE_DEFAULT_REGION_SIZE;
13617c478bd9Sstevel@tonic-gate 	ct->ct_path_count = 0;
13627c478bd9Sstevel@tonic-gate 	ct->ct_path_head = NULL;
13637c478bd9Sstevel@tonic-gate 	ct->ct_path_tail = NULL;
13647c478bd9Sstevel@tonic-gate 	ct->ct_path_last = NULL;
13657c478bd9Sstevel@tonic-gate 
13667c478bd9Sstevel@tonic-gate 	/*
13677c478bd9Sstevel@tonic-gate 	 * Add this client component to our client hash queue
13687c478bd9Sstevel@tonic-gate 	 */
13697c478bd9Sstevel@tonic-gate 	i_mdi_client_enlist_table(vh, ct);
13707c478bd9Sstevel@tonic-gate 	return (ct);
13717c478bd9Sstevel@tonic-gate }
13727c478bd9Sstevel@tonic-gate 
13737c478bd9Sstevel@tonic-gate /*
13747c478bd9Sstevel@tonic-gate  * i_mdi_client_enlist_table():
13757c478bd9Sstevel@tonic-gate  *		Attach the client device to the client hash table. Caller
13765e3986cbScth  *		should hold the vhci client lock.
13777c478bd9Sstevel@tonic-gate  */
13787c478bd9Sstevel@tonic-gate static void
13797c478bd9Sstevel@tonic-gate i_mdi_client_enlist_table(mdi_vhci_t *vh, mdi_client_t *ct)
13807c478bd9Sstevel@tonic-gate {
13817c478bd9Sstevel@tonic-gate 	int 			index;
13827c478bd9Sstevel@tonic-gate 	struct client_hash	*head;
13837c478bd9Sstevel@tonic-gate 
13845e3986cbScth 	ASSERT(MDI_VHCI_CLIENT_LOCKED(vh));
13855e3986cbScth 
13867c478bd9Sstevel@tonic-gate 	index = i_mdi_get_hash_key(ct->ct_guid);
13877c478bd9Sstevel@tonic-gate 	head = &vh->vh_client_table[index];
13887c478bd9Sstevel@tonic-gate 	ct->ct_hnext = (mdi_client_t *)head->ct_hash_head;
13897c478bd9Sstevel@tonic-gate 	head->ct_hash_head = ct;
13907c478bd9Sstevel@tonic-gate 	head->ct_hash_count++;
13917c478bd9Sstevel@tonic-gate 	vh->vh_client_count++;
13927c478bd9Sstevel@tonic-gate }
13937c478bd9Sstevel@tonic-gate 
13947c478bd9Sstevel@tonic-gate /*
13957c478bd9Sstevel@tonic-gate  * i_mdi_client_delist_table():
13967c478bd9Sstevel@tonic-gate  *		Attach the client device to the client hash table.
13975e3986cbScth  *		Caller should hold the vhci client lock.
13987c478bd9Sstevel@tonic-gate  */
13997c478bd9Sstevel@tonic-gate static void
14007c478bd9Sstevel@tonic-gate i_mdi_client_delist_table(mdi_vhci_t *vh, mdi_client_t *ct)
14017c478bd9Sstevel@tonic-gate {
14027c478bd9Sstevel@tonic-gate 	int			index;
14037c478bd9Sstevel@tonic-gate 	char			*guid;
14047c478bd9Sstevel@tonic-gate 	struct client_hash 	*head;
14057c478bd9Sstevel@tonic-gate 	mdi_client_t		*next;
14067c478bd9Sstevel@tonic-gate 	mdi_client_t		*last;
14077c478bd9Sstevel@tonic-gate 
14085e3986cbScth 	ASSERT(MDI_VHCI_CLIENT_LOCKED(vh));
14095e3986cbScth 
14107c478bd9Sstevel@tonic-gate 	guid = ct->ct_guid;
14117c478bd9Sstevel@tonic-gate 	index = i_mdi_get_hash_key(guid);
14127c478bd9Sstevel@tonic-gate 	head = &vh->vh_client_table[index];
14137c478bd9Sstevel@tonic-gate 
14147c478bd9Sstevel@tonic-gate 	last = NULL;
14157c478bd9Sstevel@tonic-gate 	next = (mdi_client_t *)head->ct_hash_head;
14167c478bd9Sstevel@tonic-gate 	while (next != NULL) {
14177c478bd9Sstevel@tonic-gate 		if (next == ct) {
14187c478bd9Sstevel@tonic-gate 			break;
14197c478bd9Sstevel@tonic-gate 		}
14207c478bd9Sstevel@tonic-gate 		last = next;
14217c478bd9Sstevel@tonic-gate 		next = next->ct_hnext;
14227c478bd9Sstevel@tonic-gate 	}
14237c478bd9Sstevel@tonic-gate 
14247c478bd9Sstevel@tonic-gate 	if (next) {
14257c478bd9Sstevel@tonic-gate 		head->ct_hash_count--;
14267c478bd9Sstevel@tonic-gate 		if (last == NULL) {
14277c478bd9Sstevel@tonic-gate 			head->ct_hash_head = ct->ct_hnext;
14287c478bd9Sstevel@tonic-gate 		} else {
14297c478bd9Sstevel@tonic-gate 			last->ct_hnext = ct->ct_hnext;
14307c478bd9Sstevel@tonic-gate 		}
14317c478bd9Sstevel@tonic-gate 		ct->ct_hnext = NULL;
14327c478bd9Sstevel@tonic-gate 		vh->vh_client_count--;
14337c478bd9Sstevel@tonic-gate 	}
14347c478bd9Sstevel@tonic-gate }
14357c478bd9Sstevel@tonic-gate 
14367c478bd9Sstevel@tonic-gate 
14377c478bd9Sstevel@tonic-gate /*
14387c478bd9Sstevel@tonic-gate  * i_mdi_client_free():
14397c478bd9Sstevel@tonic-gate  *		Free a client component
14407c478bd9Sstevel@tonic-gate  */
14417c478bd9Sstevel@tonic-gate static int
14427c478bd9Sstevel@tonic-gate i_mdi_client_free(mdi_vhci_t *vh, mdi_client_t *ct)
14437c478bd9Sstevel@tonic-gate {
14447c478bd9Sstevel@tonic-gate 	int		rv = MDI_SUCCESS;
14457c478bd9Sstevel@tonic-gate 	int		flags = ct->ct_flags;
14467c478bd9Sstevel@tonic-gate 	dev_info_t	*cdip;
14477c478bd9Sstevel@tonic-gate 	dev_info_t	*vdip;
14487c478bd9Sstevel@tonic-gate 
14495e3986cbScth 	ASSERT(MDI_VHCI_CLIENT_LOCKED(vh));
14505e3986cbScth 
14517c478bd9Sstevel@tonic-gate 	vdip = vh->vh_dip;
14527c478bd9Sstevel@tonic-gate 	cdip = ct->ct_dip;
14537c478bd9Sstevel@tonic-gate 
14547c478bd9Sstevel@tonic-gate 	(void) ndi_prop_remove(DDI_DEV_T_NONE, cdip, MDI_CLIENT_GUID_PROP);
14557c478bd9Sstevel@tonic-gate 	DEVI(cdip)->devi_mdi_component &= ~MDI_COMPONENT_CLIENT;
14567c478bd9Sstevel@tonic-gate 	DEVI(cdip)->devi_mdi_client = NULL;
14577c478bd9Sstevel@tonic-gate 
14587c478bd9Sstevel@tonic-gate 	/*
14597c478bd9Sstevel@tonic-gate 	 * Clear out back ref. to dev_info_t node
14607c478bd9Sstevel@tonic-gate 	 */
14617c478bd9Sstevel@tonic-gate 	ct->ct_dip = NULL;
14627c478bd9Sstevel@tonic-gate 
14637c478bd9Sstevel@tonic-gate 	/*
14647c478bd9Sstevel@tonic-gate 	 * Remove this client from our hash queue
14657c478bd9Sstevel@tonic-gate 	 */
14667c478bd9Sstevel@tonic-gate 	i_mdi_client_delist_table(vh, ct);
14677c478bd9Sstevel@tonic-gate 
14687c478bd9Sstevel@tonic-gate 	/*
14697c478bd9Sstevel@tonic-gate 	 * Uninitialize and free the component
14707c478bd9Sstevel@tonic-gate 	 */
14717c478bd9Sstevel@tonic-gate 	kmem_free(ct->ct_drvname, strlen(ct->ct_drvname) + 1);
14727c478bd9Sstevel@tonic-gate 	kmem_free(ct->ct_guid, strlen(ct->ct_guid) + 1);
14737c478bd9Sstevel@tonic-gate 	kmem_free(ct->ct_lb_args, sizeof (client_lb_args_t));
14747c478bd9Sstevel@tonic-gate 	cv_destroy(&ct->ct_failover_cv);
14757c478bd9Sstevel@tonic-gate 	cv_destroy(&ct->ct_unstable_cv);
14767c478bd9Sstevel@tonic-gate 	cv_destroy(&ct->ct_powerchange_cv);
14777c478bd9Sstevel@tonic-gate 	mutex_destroy(&ct->ct_mutex);
14787c478bd9Sstevel@tonic-gate 	kmem_free(ct, sizeof (*ct));
14797c478bd9Sstevel@tonic-gate 
14807c478bd9Sstevel@tonic-gate 	if (cdip != NULL) {
14815e3986cbScth 		MDI_VHCI_CLIENT_UNLOCK(vh);
14827c478bd9Sstevel@tonic-gate 		(void) i_mdi_devinfo_remove(vdip, cdip, flags);
14835e3986cbScth 		MDI_VHCI_CLIENT_LOCK(vh);
14847c478bd9Sstevel@tonic-gate 	}
14857c478bd9Sstevel@tonic-gate 	return (rv);
14867c478bd9Sstevel@tonic-gate }
14877c478bd9Sstevel@tonic-gate 
14887c478bd9Sstevel@tonic-gate /*
14897c478bd9Sstevel@tonic-gate  * i_mdi_client_find():
14907c478bd9Sstevel@tonic-gate  * 		Find the client structure corresponding to a given guid
14915e3986cbScth  *		Caller should hold the vhci client lock.
14927c478bd9Sstevel@tonic-gate  */
14937c478bd9Sstevel@tonic-gate static mdi_client_t *
14943c34adc5Sramat i_mdi_client_find(mdi_vhci_t *vh, char *cname, char *guid)
14957c478bd9Sstevel@tonic-gate {
14967c478bd9Sstevel@tonic-gate 	int			index;
14977c478bd9Sstevel@tonic-gate 	struct client_hash	*head;
14987c478bd9Sstevel@tonic-gate 	mdi_client_t		*ct;
14997c478bd9Sstevel@tonic-gate 
15005e3986cbScth 	ASSERT(MDI_VHCI_CLIENT_LOCKED(vh));
15015e3986cbScth 
15027c478bd9Sstevel@tonic-gate 	index = i_mdi_get_hash_key(guid);
15037c478bd9Sstevel@tonic-gate 	head = &vh->vh_client_table[index];
15047c478bd9Sstevel@tonic-gate 
15057c478bd9Sstevel@tonic-gate 	ct = head->ct_hash_head;
15067c478bd9Sstevel@tonic-gate 	while (ct != NULL) {
15073c34adc5Sramat 		if (strcmp(ct->ct_guid, guid) == 0 &&
15083c34adc5Sramat 		    (cname == NULL || strcmp(ct->ct_drvname, cname) == 0)) {
15097c478bd9Sstevel@tonic-gate 			break;
15107c478bd9Sstevel@tonic-gate 		}
15117c478bd9Sstevel@tonic-gate 		ct = ct->ct_hnext;
15127c478bd9Sstevel@tonic-gate 	}
15137c478bd9Sstevel@tonic-gate 	return (ct);
15147c478bd9Sstevel@tonic-gate }
15157c478bd9Sstevel@tonic-gate 
15167c478bd9Sstevel@tonic-gate /*
15177c478bd9Sstevel@tonic-gate  * i_mdi_client_update_state():
15187c478bd9Sstevel@tonic-gate  *		Compute and update client device state
15197c478bd9Sstevel@tonic-gate  * Notes:
15207c478bd9Sstevel@tonic-gate  *		A client device can be in any of three possible states:
15217c478bd9Sstevel@tonic-gate  *
15227c478bd9Sstevel@tonic-gate  *		MDI_CLIENT_STATE_OPTIMAL - Client in optimal state with more
15237c478bd9Sstevel@tonic-gate  *		one online/standby paths. Can tolerate failures.
15247c478bd9Sstevel@tonic-gate  *		MDI_CLIENT_STATE_DEGRADED - Client device in degraded state with
15257c478bd9Sstevel@tonic-gate  *		no alternate paths available as standby. A failure on the online
15267c478bd9Sstevel@tonic-gate  *		would result in loss of access to device data.
15277c478bd9Sstevel@tonic-gate  *		MDI_CLIENT_STATE_FAILED - Client device in failed state with
15287c478bd9Sstevel@tonic-gate  *		no paths available to access the device.
15297c478bd9Sstevel@tonic-gate  */
15307c478bd9Sstevel@tonic-gate static void
15317c478bd9Sstevel@tonic-gate i_mdi_client_update_state(mdi_client_t *ct)
15327c478bd9Sstevel@tonic-gate {
15337c478bd9Sstevel@tonic-gate 	int state;
15345e3986cbScth 
15355e3986cbScth 	ASSERT(MDI_CLIENT_LOCKED(ct));
15367c478bd9Sstevel@tonic-gate 	state = i_mdi_client_compute_state(ct, NULL);
15377c478bd9Sstevel@tonic-gate 	MDI_CLIENT_SET_STATE(ct, state);
15387c478bd9Sstevel@tonic-gate }
15397c478bd9Sstevel@tonic-gate 
15407c478bd9Sstevel@tonic-gate /*
15417c478bd9Sstevel@tonic-gate  * i_mdi_client_compute_state():
15427c478bd9Sstevel@tonic-gate  *		Compute client device state
15437c478bd9Sstevel@tonic-gate  *
15447c478bd9Sstevel@tonic-gate  *		mdi_phci_t *	Pointer to pHCI structure which should
15457c478bd9Sstevel@tonic-gate  *				while computing the new value.  Used by
15467c478bd9Sstevel@tonic-gate  *				i_mdi_phci_offline() to find the new
15477c478bd9Sstevel@tonic-gate  *				client state after DR of a pHCI.
15487c478bd9Sstevel@tonic-gate  */
15497c478bd9Sstevel@tonic-gate static int
15507c478bd9Sstevel@tonic-gate i_mdi_client_compute_state(mdi_client_t *ct, mdi_phci_t *ph)
15517c478bd9Sstevel@tonic-gate {
15527c478bd9Sstevel@tonic-gate 	int		state;
15537c478bd9Sstevel@tonic-gate 	int		online_count = 0;
15547c478bd9Sstevel@tonic-gate 	int		standby_count = 0;
15557c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*pip, *next;
15567c478bd9Sstevel@tonic-gate 
15575e3986cbScth 	ASSERT(MDI_CLIENT_LOCKED(ct));
15587c478bd9Sstevel@tonic-gate 	pip = ct->ct_path_head;
15597c478bd9Sstevel@tonic-gate 	while (pip != NULL) {
15607c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
15617c478bd9Sstevel@tonic-gate 		next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link;
15627c478bd9Sstevel@tonic-gate 		if (MDI_PI(pip)->pi_phci == ph) {
15637c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
15647c478bd9Sstevel@tonic-gate 			pip = next;
15657c478bd9Sstevel@tonic-gate 			continue;
15667c478bd9Sstevel@tonic-gate 		}
15675e3986cbScth 
15687c478bd9Sstevel@tonic-gate 		if ((MDI_PI(pip)->pi_state & MDI_PATHINFO_STATE_MASK)
15697c478bd9Sstevel@tonic-gate 				== MDI_PATHINFO_STATE_ONLINE)
15707c478bd9Sstevel@tonic-gate 			online_count++;
15717c478bd9Sstevel@tonic-gate 		else if ((MDI_PI(pip)->pi_state & MDI_PATHINFO_STATE_MASK)
15727c478bd9Sstevel@tonic-gate 				== MDI_PATHINFO_STATE_STANDBY)
15737c478bd9Sstevel@tonic-gate 			standby_count++;
15747c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
15757c478bd9Sstevel@tonic-gate 		pip = next;
15767c478bd9Sstevel@tonic-gate 	}
15777c478bd9Sstevel@tonic-gate 
15787c478bd9Sstevel@tonic-gate 	if (online_count == 0) {
15797c478bd9Sstevel@tonic-gate 		if (standby_count == 0) {
15807c478bd9Sstevel@tonic-gate 			state = MDI_CLIENT_STATE_FAILED;
15814c06356bSdh142964 			MDI_DEBUG(2, (MDI_NOTE, ct->ct_dip,
15824c06356bSdh142964 			    "client state failed: ct = %p", (void *)ct));
15837c478bd9Sstevel@tonic-gate 		} else if (standby_count == 1) {
15847c478bd9Sstevel@tonic-gate 			state = MDI_CLIENT_STATE_DEGRADED;
15857c478bd9Sstevel@tonic-gate 		} else {
15867c478bd9Sstevel@tonic-gate 			state = MDI_CLIENT_STATE_OPTIMAL;
15877c478bd9Sstevel@tonic-gate 		}
15887c478bd9Sstevel@tonic-gate 	} else if (online_count == 1) {
15897c478bd9Sstevel@tonic-gate 		if (standby_count == 0) {
15907c478bd9Sstevel@tonic-gate 			state = MDI_CLIENT_STATE_DEGRADED;
15917c478bd9Sstevel@tonic-gate 		} else {
15927c478bd9Sstevel@tonic-gate 			state = MDI_CLIENT_STATE_OPTIMAL;
15937c478bd9Sstevel@tonic-gate 		}
15947c478bd9Sstevel@tonic-gate 	} else {
15957c478bd9Sstevel@tonic-gate 		state = MDI_CLIENT_STATE_OPTIMAL;
15967c478bd9Sstevel@tonic-gate 	}
15977c478bd9Sstevel@tonic-gate 	return (state);
15987c478bd9Sstevel@tonic-gate }
15997c478bd9Sstevel@tonic-gate 
16007c478bd9Sstevel@tonic-gate /*
16017c478bd9Sstevel@tonic-gate  * i_mdi_client2devinfo():
16027c478bd9Sstevel@tonic-gate  *		Utility function
16037c478bd9Sstevel@tonic-gate  */
16047c478bd9Sstevel@tonic-gate dev_info_t *
16057c478bd9Sstevel@tonic-gate i_mdi_client2devinfo(mdi_client_t *ct)
16067c478bd9Sstevel@tonic-gate {
16077c478bd9Sstevel@tonic-gate 	return (ct->ct_dip);
16087c478bd9Sstevel@tonic-gate }
16097c478bd9Sstevel@tonic-gate 
16107c478bd9Sstevel@tonic-gate /*
16117c478bd9Sstevel@tonic-gate  * mdi_client_path2_devinfo():
16127c478bd9Sstevel@tonic-gate  * 		Given the parent devinfo and child devfs pathname, search for
16137c478bd9Sstevel@tonic-gate  *		a valid devfs node handle.
16147c478bd9Sstevel@tonic-gate  */
16157c478bd9Sstevel@tonic-gate dev_info_t *
16167c478bd9Sstevel@tonic-gate mdi_client_path2devinfo(dev_info_t *vdip, char *pathname)
16177c478bd9Sstevel@tonic-gate {
16187c478bd9Sstevel@tonic-gate 	dev_info_t 	*cdip = NULL;
16197c478bd9Sstevel@tonic-gate 	dev_info_t 	*ndip = NULL;
16207c478bd9Sstevel@tonic-gate 	char		*temp_pathname;
16217c478bd9Sstevel@tonic-gate 	int		circular;
16227c478bd9Sstevel@tonic-gate 
16237c478bd9Sstevel@tonic-gate 	/*
16247c478bd9Sstevel@tonic-gate 	 * Allocate temp buffer
16257c478bd9Sstevel@tonic-gate 	 */
16267c478bd9Sstevel@tonic-gate 	temp_pathname = kmem_zalloc(MAXPATHLEN, KM_SLEEP);
16277c478bd9Sstevel@tonic-gate 
16287c478bd9Sstevel@tonic-gate 	/*
16297c478bd9Sstevel@tonic-gate 	 * Lock parent against changes
16307c478bd9Sstevel@tonic-gate 	 */
16317c478bd9Sstevel@tonic-gate 	ndi_devi_enter(vdip, &circular);
16327c478bd9Sstevel@tonic-gate 	ndip = (dev_info_t *)DEVI(vdip)->devi_child;
16337c478bd9Sstevel@tonic-gate 	while ((cdip = ndip) != NULL) {
16347c478bd9Sstevel@tonic-gate 		ndip = (dev_info_t *)DEVI(cdip)->devi_sibling;
16357c478bd9Sstevel@tonic-gate 
16367c478bd9Sstevel@tonic-gate 		*temp_pathname = '\0';
16377c478bd9Sstevel@tonic-gate 		(void) ddi_pathname(cdip, temp_pathname);
16387c478bd9Sstevel@tonic-gate 		if (strcmp(temp_pathname, pathname) == 0) {
16397c478bd9Sstevel@tonic-gate 			break;
16407c478bd9Sstevel@tonic-gate 		}
16417c478bd9Sstevel@tonic-gate 	}
16427c478bd9Sstevel@tonic-gate 	/*
16437c478bd9Sstevel@tonic-gate 	 * Release devinfo lock
16447c478bd9Sstevel@tonic-gate 	 */
16457c478bd9Sstevel@tonic-gate 	ndi_devi_exit(vdip, circular);
16467c478bd9Sstevel@tonic-gate 
16477c478bd9Sstevel@tonic-gate 	/*
16487c478bd9Sstevel@tonic-gate 	 * Free the temp buffer
16497c478bd9Sstevel@tonic-gate 	 */
16507c478bd9Sstevel@tonic-gate 	kmem_free(temp_pathname, MAXPATHLEN);
16517c478bd9Sstevel@tonic-gate 	return (cdip);
16527c478bd9Sstevel@tonic-gate }
16537c478bd9Sstevel@tonic-gate 
16547c478bd9Sstevel@tonic-gate /*
16557c478bd9Sstevel@tonic-gate  * mdi_client_get_path_count():
16567c478bd9Sstevel@tonic-gate  * 		Utility function to get number of path information nodes
16577c478bd9Sstevel@tonic-gate  *		associated with a given client device.
16587c478bd9Sstevel@tonic-gate  */
16597c478bd9Sstevel@tonic-gate int
16607c478bd9Sstevel@tonic-gate mdi_client_get_path_count(dev_info_t *cdip)
16617c478bd9Sstevel@tonic-gate {
16627c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
16637c478bd9Sstevel@tonic-gate 	int		count = 0;
16647c478bd9Sstevel@tonic-gate 
16657c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(cdip);
16667c478bd9Sstevel@tonic-gate 	if (ct != NULL) {
16677c478bd9Sstevel@tonic-gate 		count = ct->ct_path_count;
16687c478bd9Sstevel@tonic-gate 	}
16697c478bd9Sstevel@tonic-gate 	return (count);
16707c478bd9Sstevel@tonic-gate }
16717c478bd9Sstevel@tonic-gate 
16727c478bd9Sstevel@tonic-gate 
16737c478bd9Sstevel@tonic-gate /*
16747c478bd9Sstevel@tonic-gate  * i_mdi_get_hash_key():
16757c478bd9Sstevel@tonic-gate  * 		Create a hash using strings as keys
16767c478bd9Sstevel@tonic-gate  *
16777c478bd9Sstevel@tonic-gate  */
16787c478bd9Sstevel@tonic-gate static int
16797c478bd9Sstevel@tonic-gate i_mdi_get_hash_key(char *str)
16807c478bd9Sstevel@tonic-gate {
16817c478bd9Sstevel@tonic-gate 	uint32_t	g, hash = 0;
16827c478bd9Sstevel@tonic-gate 	char		*p;
16837c478bd9Sstevel@tonic-gate 
16847c478bd9Sstevel@tonic-gate 	for (p = str; *p != '\0'; p++) {
16857c478bd9Sstevel@tonic-gate 		g = *p;
16867c478bd9Sstevel@tonic-gate 		hash += g;
16877c478bd9Sstevel@tonic-gate 	}
16887c478bd9Sstevel@tonic-gate 	return (hash % (CLIENT_HASH_TABLE_SIZE - 1));
16897c478bd9Sstevel@tonic-gate }
16907c478bd9Sstevel@tonic-gate 
16917c478bd9Sstevel@tonic-gate /*
16927c478bd9Sstevel@tonic-gate  * mdi_get_lb_policy():
16937c478bd9Sstevel@tonic-gate  * 		Get current load balancing policy for a given client device
16947c478bd9Sstevel@tonic-gate  */
16957c478bd9Sstevel@tonic-gate client_lb_t
16967c478bd9Sstevel@tonic-gate mdi_get_lb_policy(dev_info_t *cdip)
16977c478bd9Sstevel@tonic-gate {
16987c478bd9Sstevel@tonic-gate 	client_lb_t	lb = LOAD_BALANCE_NONE;
16997c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
17007c478bd9Sstevel@tonic-gate 
17017c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(cdip);
17027c478bd9Sstevel@tonic-gate 	if (ct != NULL) {
17037c478bd9Sstevel@tonic-gate 		lb = ct->ct_lb;
17047c478bd9Sstevel@tonic-gate 	}
17057c478bd9Sstevel@tonic-gate 	return (lb);
17067c478bd9Sstevel@tonic-gate }
17077c478bd9Sstevel@tonic-gate 
17087c478bd9Sstevel@tonic-gate /*
17097c478bd9Sstevel@tonic-gate  * mdi_set_lb_region_size():
17107c478bd9Sstevel@tonic-gate  * 		Set current region size for the load-balance
17117c478bd9Sstevel@tonic-gate  */
17127c478bd9Sstevel@tonic-gate int
17137c478bd9Sstevel@tonic-gate mdi_set_lb_region_size(dev_info_t *cdip, int region_size)
17147c478bd9Sstevel@tonic-gate {
17157c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
17167c478bd9Sstevel@tonic-gate 	int		rv = MDI_FAILURE;
17177c478bd9Sstevel@tonic-gate 
17187c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(cdip);
17197c478bd9Sstevel@tonic-gate 	if (ct != NULL && ct->ct_lb_args != NULL) {
17207c478bd9Sstevel@tonic-gate 		ct->ct_lb_args->region_size = region_size;
17217c478bd9Sstevel@tonic-gate 		rv = MDI_SUCCESS;
17227c478bd9Sstevel@tonic-gate 	}
17237c478bd9Sstevel@tonic-gate 	return (rv);
17247c478bd9Sstevel@tonic-gate }
17257c478bd9Sstevel@tonic-gate 
17267c478bd9Sstevel@tonic-gate /*
17277c478bd9Sstevel@tonic-gate  * mdi_Set_lb_policy():
17287c478bd9Sstevel@tonic-gate  * 		Set current load balancing policy for a given client device
17297c478bd9Sstevel@tonic-gate  */
17307c478bd9Sstevel@tonic-gate int
17317c478bd9Sstevel@tonic-gate mdi_set_lb_policy(dev_info_t *cdip, client_lb_t lb)
17327c478bd9Sstevel@tonic-gate {
17337c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
17347c478bd9Sstevel@tonic-gate 	int		rv = MDI_FAILURE;
17357c478bd9Sstevel@tonic-gate 
17367c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(cdip);
17377c478bd9Sstevel@tonic-gate 	if (ct != NULL) {
17387c478bd9Sstevel@tonic-gate 		ct->ct_lb = lb;
17397c478bd9Sstevel@tonic-gate 		rv = MDI_SUCCESS;
17407c478bd9Sstevel@tonic-gate 	}
17417c478bd9Sstevel@tonic-gate 	return (rv);
17427c478bd9Sstevel@tonic-gate }
17437c478bd9Sstevel@tonic-gate 
17447c478bd9Sstevel@tonic-gate /*
17457c478bd9Sstevel@tonic-gate  * mdi_failover():
17467c478bd9Sstevel@tonic-gate  *		failover function called by the vHCI drivers to initiate
17477c478bd9Sstevel@tonic-gate  *		a failover operation.  This is typically due to non-availability
17487c478bd9Sstevel@tonic-gate  *		of online paths to route I/O requests.  Failover can be
17497c478bd9Sstevel@tonic-gate  *		triggered through user application also.
17507c478bd9Sstevel@tonic-gate  *
17517c478bd9Sstevel@tonic-gate  *		The vHCI driver calls mdi_failover() to initiate a failover
17527c478bd9Sstevel@tonic-gate  *		operation. mdi_failover() calls back into the vHCI driver's
17537c478bd9Sstevel@tonic-gate  *		vo_failover() entry point to perform the actual failover
17547c478bd9Sstevel@tonic-gate  *		operation.  The reason for requiring the vHCI driver to
17557c478bd9Sstevel@tonic-gate  *		initiate failover by calling mdi_failover(), instead of directly
17567c478bd9Sstevel@tonic-gate  *		executing vo_failover() itself, is to ensure that the mdi
17577c478bd9Sstevel@tonic-gate  *		framework can keep track of the client state properly.
17587c478bd9Sstevel@tonic-gate  *		Additionally, mdi_failover() provides as a convenience the
17597c478bd9Sstevel@tonic-gate  *		option of performing the failover operation synchronously or
17607c478bd9Sstevel@tonic-gate  *		asynchronously
17617c478bd9Sstevel@tonic-gate  *
17627c478bd9Sstevel@tonic-gate  *		Upon successful completion of the failover operation, the
17637c478bd9Sstevel@tonic-gate  *		paths that were previously ONLINE will be in the STANDBY state,
17647c478bd9Sstevel@tonic-gate  *		and the newly activated paths will be in the ONLINE state.
17657c478bd9Sstevel@tonic-gate  *
17667c478bd9Sstevel@tonic-gate  *		The flags modifier determines whether the activation is done
17677c478bd9Sstevel@tonic-gate  *		synchronously: MDI_FAILOVER_SYNC
17687c478bd9Sstevel@tonic-gate  * Return Values:
17697c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
17707c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
17717c478bd9Sstevel@tonic-gate  *		MDI_BUSY
17727c478bd9Sstevel@tonic-gate  */
17737c478bd9Sstevel@tonic-gate /*ARGSUSED*/
17747c478bd9Sstevel@tonic-gate int
17757c478bd9Sstevel@tonic-gate mdi_failover(dev_info_t *vdip, dev_info_t *cdip, int flags)
17767c478bd9Sstevel@tonic-gate {
17777c478bd9Sstevel@tonic-gate 	int			rv;
17787c478bd9Sstevel@tonic-gate 	mdi_client_t		*ct;
17797c478bd9Sstevel@tonic-gate 
17807c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(cdip);
17817c478bd9Sstevel@tonic-gate 	ASSERT(ct != NULL);
17827c478bd9Sstevel@tonic-gate 	if (ct == NULL) {
17837c478bd9Sstevel@tonic-gate 		/* cdip is not a valid client device. Nothing more to do. */
17847c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
17857c478bd9Sstevel@tonic-gate 	}
17867c478bd9Sstevel@tonic-gate 
17877c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
17887c478bd9Sstevel@tonic-gate 
17897c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT_IS_PATH_FREE_IN_PROGRESS(ct)) {
17907c478bd9Sstevel@tonic-gate 		/* A path to the client is being freed */
17917c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
17927c478bd9Sstevel@tonic-gate 		return (MDI_BUSY);
17937c478bd9Sstevel@tonic-gate 	}
17947c478bd9Sstevel@tonic-gate 
17957c478bd9Sstevel@tonic-gate 
17967c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT_IS_FAILED(ct)) {
17977c478bd9Sstevel@tonic-gate 		/*
17987c478bd9Sstevel@tonic-gate 		 * Client is in failed state. Nothing more to do.
17997c478bd9Sstevel@tonic-gate 		 */
18007c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
18017c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
18027c478bd9Sstevel@tonic-gate 	}
18037c478bd9Sstevel@tonic-gate 
18047c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT_IS_FAILOVER_IN_PROGRESS(ct)) {
18057c478bd9Sstevel@tonic-gate 		/*
18067c478bd9Sstevel@tonic-gate 		 * Failover is already in progress; return BUSY
18077c478bd9Sstevel@tonic-gate 		 */
18087c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
18097c478bd9Sstevel@tonic-gate 		return (MDI_BUSY);
18107c478bd9Sstevel@tonic-gate 	}
18117c478bd9Sstevel@tonic-gate 	/*
18127c478bd9Sstevel@tonic-gate 	 * Make sure that mdi_pathinfo node state changes are processed.
18137c478bd9Sstevel@tonic-gate 	 * We do not allow failovers to progress while client path state
18147c478bd9Sstevel@tonic-gate 	 * changes are in progress
18157c478bd9Sstevel@tonic-gate 	 */
18167c478bd9Sstevel@tonic-gate 	if (ct->ct_unstable) {
18177c478bd9Sstevel@tonic-gate 		if (flags == MDI_FAILOVER_ASYNC) {
18187c478bd9Sstevel@tonic-gate 			MDI_CLIENT_UNLOCK(ct);
18197c478bd9Sstevel@tonic-gate 			return (MDI_BUSY);
18207c478bd9Sstevel@tonic-gate 		} else {
18217c478bd9Sstevel@tonic-gate 			while (ct->ct_unstable)
18227c478bd9Sstevel@tonic-gate 				cv_wait(&ct->ct_unstable_cv, &ct->ct_mutex);
18237c478bd9Sstevel@tonic-gate 		}
18247c478bd9Sstevel@tonic-gate 	}
18257c478bd9Sstevel@tonic-gate 
18267c478bd9Sstevel@tonic-gate 	/*
18277c478bd9Sstevel@tonic-gate 	 * Client device is in stable state. Before proceeding, perform sanity
18287c478bd9Sstevel@tonic-gate 	 * checks again.
18297c478bd9Sstevel@tonic-gate 	 */
18307c478bd9Sstevel@tonic-gate 	if ((MDI_CLIENT_IS_DETACHED(ct)) || (MDI_CLIENT_IS_FAILED(ct)) ||
1831737d277aScth 	    (!i_ddi_devi_attached(ct->ct_dip))) {
18327c478bd9Sstevel@tonic-gate 		/*
18337c478bd9Sstevel@tonic-gate 		 * Client is in failed state. Nothing more to do.
18347c478bd9Sstevel@tonic-gate 		 */
18357c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
18367c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
18377c478bd9Sstevel@tonic-gate 	}
18387c478bd9Sstevel@tonic-gate 
18397c478bd9Sstevel@tonic-gate 	/*
18407c478bd9Sstevel@tonic-gate 	 * Set the client state as failover in progress.
18417c478bd9Sstevel@tonic-gate 	 */
18427c478bd9Sstevel@tonic-gate 	MDI_CLIENT_SET_FAILOVER_IN_PROGRESS(ct);
18437c478bd9Sstevel@tonic-gate 	ct->ct_failover_flags = flags;
18447c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
18457c478bd9Sstevel@tonic-gate 
18467c478bd9Sstevel@tonic-gate 	if (flags == MDI_FAILOVER_ASYNC) {
18477c478bd9Sstevel@tonic-gate 		/*
18487c478bd9Sstevel@tonic-gate 		 * Submit the initiate failover request via CPR safe
18497c478bd9Sstevel@tonic-gate 		 * taskq threads.
18507c478bd9Sstevel@tonic-gate 		 */
18517c478bd9Sstevel@tonic-gate 		(void) taskq_dispatch(mdi_taskq, (task_func_t *)i_mdi_failover,
18527c478bd9Sstevel@tonic-gate 		    ct, KM_SLEEP);
18537c478bd9Sstevel@tonic-gate 		return (MDI_ACCEPT);
18547c478bd9Sstevel@tonic-gate 	} else {
18557c478bd9Sstevel@tonic-gate 		/*
18567c478bd9Sstevel@tonic-gate 		 * Synchronous failover mode.  Typically invoked from the user
18577c478bd9Sstevel@tonic-gate 		 * land.
18587c478bd9Sstevel@tonic-gate 		 */
18597c478bd9Sstevel@tonic-gate 		rv = i_mdi_failover(ct);
18607c478bd9Sstevel@tonic-gate 	}
18617c478bd9Sstevel@tonic-gate 	return (rv);
18627c478bd9Sstevel@tonic-gate }
18637c478bd9Sstevel@tonic-gate 
18647c478bd9Sstevel@tonic-gate /*
18657c478bd9Sstevel@tonic-gate  * i_mdi_failover():
18667c478bd9Sstevel@tonic-gate  *		internal failover function. Invokes vHCI drivers failover
18677c478bd9Sstevel@tonic-gate  *		callback function and process the failover status
18687c478bd9Sstevel@tonic-gate  * Return Values:
18697c478bd9Sstevel@tonic-gate  *		None
18707c478bd9Sstevel@tonic-gate  *
18717c478bd9Sstevel@tonic-gate  * Note: A client device in failover state can not be detached or freed.
18727c478bd9Sstevel@tonic-gate  */
18737c478bd9Sstevel@tonic-gate static int
18747c478bd9Sstevel@tonic-gate i_mdi_failover(void *arg)
18757c478bd9Sstevel@tonic-gate {
18767c478bd9Sstevel@tonic-gate 	int		rv = MDI_SUCCESS;
18777c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct = (mdi_client_t *)arg;
18787c478bd9Sstevel@tonic-gate 	mdi_vhci_t	*vh = ct->ct_vhci;
18797c478bd9Sstevel@tonic-gate 
18805e3986cbScth 	ASSERT(!MDI_CLIENT_LOCKED(ct));
18817c478bd9Sstevel@tonic-gate 
18827c478bd9Sstevel@tonic-gate 	if (vh->vh_ops->vo_failover != NULL) {
18837c478bd9Sstevel@tonic-gate 		/*
18847c478bd9Sstevel@tonic-gate 		 * Call vHCI drivers callback routine
18857c478bd9Sstevel@tonic-gate 		 */
18867c478bd9Sstevel@tonic-gate 		rv = (*vh->vh_ops->vo_failover)(vh->vh_dip, ct->ct_dip,
18877c478bd9Sstevel@tonic-gate 		    ct->ct_failover_flags);
18887c478bd9Sstevel@tonic-gate 	}
18897c478bd9Sstevel@tonic-gate 
18907c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
18917c478bd9Sstevel@tonic-gate 	MDI_CLIENT_CLEAR_FAILOVER_IN_PROGRESS(ct);
18927c478bd9Sstevel@tonic-gate 
18937c478bd9Sstevel@tonic-gate 	/*
18947c478bd9Sstevel@tonic-gate 	 * Save the failover return status
18957c478bd9Sstevel@tonic-gate 	 */
18967c478bd9Sstevel@tonic-gate 	ct->ct_failover_status = rv;
18977c478bd9Sstevel@tonic-gate 
18987c478bd9Sstevel@tonic-gate 	/*
18997c478bd9Sstevel@tonic-gate 	 * As a result of failover, client status would have been changed.
19007c478bd9Sstevel@tonic-gate 	 * Update the client state and wake up anyone waiting on this client
19017c478bd9Sstevel@tonic-gate 	 * device.
19027c478bd9Sstevel@tonic-gate 	 */
19037c478bd9Sstevel@tonic-gate 	i_mdi_client_update_state(ct);
19047c478bd9Sstevel@tonic-gate 
19057c478bd9Sstevel@tonic-gate 	cv_broadcast(&ct->ct_failover_cv);
19067c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
19077c478bd9Sstevel@tonic-gate 	return (rv);
19087c478bd9Sstevel@tonic-gate }
19097c478bd9Sstevel@tonic-gate 
19107c478bd9Sstevel@tonic-gate /*
19117c478bd9Sstevel@tonic-gate  * Load balancing is logical block.
19127c478bd9Sstevel@tonic-gate  * IOs within the range described by region_size
19137c478bd9Sstevel@tonic-gate  * would go on the same path. This would improve the
19147c478bd9Sstevel@tonic-gate  * performance by cache-hit on some of the RAID devices.
19157c478bd9Sstevel@tonic-gate  * Search only for online paths(At some point we
19167c478bd9Sstevel@tonic-gate  * may want to balance across target ports).
19177c478bd9Sstevel@tonic-gate  * If no paths are found then default to round-robin.
19187c478bd9Sstevel@tonic-gate  */
19197c478bd9Sstevel@tonic-gate static int
19207c478bd9Sstevel@tonic-gate i_mdi_lba_lb(mdi_client_t *ct, mdi_pathinfo_t **ret_pip, struct buf *bp)
19217c478bd9Sstevel@tonic-gate {
19227c478bd9Sstevel@tonic-gate 	int		path_index = -1;
19237c478bd9Sstevel@tonic-gate 	int		online_path_count = 0;
19247c478bd9Sstevel@tonic-gate 	int		online_nonpref_path_count = 0;
19257c478bd9Sstevel@tonic-gate 	int 		region_size = ct->ct_lb_args->region_size;
19267c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*pip;
19277c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*next;
19287c478bd9Sstevel@tonic-gate 	int		preferred, path_cnt;
19297c478bd9Sstevel@tonic-gate 
19307c478bd9Sstevel@tonic-gate 	pip = ct->ct_path_head;
19317c478bd9Sstevel@tonic-gate 	while (pip) {
19327c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
19337c478bd9Sstevel@tonic-gate 		if (MDI_PI(pip)->pi_state ==
19347c478bd9Sstevel@tonic-gate 		    MDI_PATHINFO_STATE_ONLINE && MDI_PI(pip)->pi_preferred) {
19357c478bd9Sstevel@tonic-gate 			online_path_count++;
19367c478bd9Sstevel@tonic-gate 		} else if (MDI_PI(pip)->pi_state ==
19377c478bd9Sstevel@tonic-gate 		    MDI_PATHINFO_STATE_ONLINE && !MDI_PI(pip)->pi_preferred) {
19387c478bd9Sstevel@tonic-gate 			online_nonpref_path_count++;
19397c478bd9Sstevel@tonic-gate 		}
19407c478bd9Sstevel@tonic-gate 		next = (mdi_pathinfo_t *)
19417c478bd9Sstevel@tonic-gate 		    MDI_PI(pip)->pi_client_link;
19427c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
19437c478bd9Sstevel@tonic-gate 		pip = next;
19447c478bd9Sstevel@tonic-gate 	}
19457c478bd9Sstevel@tonic-gate 	/* if found any online/preferred then use this type */
19467c478bd9Sstevel@tonic-gate 	if (online_path_count > 0) {
19477c478bd9Sstevel@tonic-gate 		path_cnt = online_path_count;
19487c478bd9Sstevel@tonic-gate 		preferred = 1;
19497c478bd9Sstevel@tonic-gate 	} else if (online_nonpref_path_count > 0) {
19507c478bd9Sstevel@tonic-gate 		path_cnt = online_nonpref_path_count;
19517c478bd9Sstevel@tonic-gate 		preferred = 0;
19527c478bd9Sstevel@tonic-gate 	} else {
19537c478bd9Sstevel@tonic-gate 		path_cnt = 0;
19547c478bd9Sstevel@tonic-gate 	}
19557c478bd9Sstevel@tonic-gate 	if (path_cnt) {
19567c478bd9Sstevel@tonic-gate 		path_index = (bp->b_blkno >> region_size) % path_cnt;
19577c478bd9Sstevel@tonic-gate 		pip = ct->ct_path_head;
19587c478bd9Sstevel@tonic-gate 		while (pip && path_index != -1) {
19597c478bd9Sstevel@tonic-gate 			MDI_PI_LOCK(pip);
19607c478bd9Sstevel@tonic-gate 			if (path_index == 0 &&
19617c478bd9Sstevel@tonic-gate 			    (MDI_PI(pip)->pi_state ==
19627c478bd9Sstevel@tonic-gate 			    MDI_PATHINFO_STATE_ONLINE) &&
19637c478bd9Sstevel@tonic-gate 				MDI_PI(pip)->pi_preferred == preferred) {
19647c478bd9Sstevel@tonic-gate 				MDI_PI_HOLD(pip);
19657c478bd9Sstevel@tonic-gate 				MDI_PI_UNLOCK(pip);
19667c478bd9Sstevel@tonic-gate 				*ret_pip = pip;
19677c478bd9Sstevel@tonic-gate 				return (MDI_SUCCESS);
19687c478bd9Sstevel@tonic-gate 			}
19697c478bd9Sstevel@tonic-gate 			path_index --;
19707c478bd9Sstevel@tonic-gate 			next = (mdi_pathinfo_t *)
19717c478bd9Sstevel@tonic-gate 			    MDI_PI(pip)->pi_client_link;
19727c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
19737c478bd9Sstevel@tonic-gate 			pip = next;
19747c478bd9Sstevel@tonic-gate 		}
19754c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, ct->ct_dip,
19764c06356bSdh142964 		    "lba %llx: path %s %p",
19774c06356bSdh142964 		    bp->b_lblkno, mdi_pi_spathname(pip), (void *)pip));
19787c478bd9Sstevel@tonic-gate 	}
19797c478bd9Sstevel@tonic-gate 	return (MDI_FAILURE);
19807c478bd9Sstevel@tonic-gate }
19817c478bd9Sstevel@tonic-gate 
/*
 * mdi_select_path():
 *		select a path to access a client device.
 *
 *		mdi_select_path() function is called by the vHCI drivers to
 *		select a path to route the I/O request to.  The caller passes
 *		the block I/O data transfer structure ("buf") as one of the
 *		parameters.  The mpxio framework uses the buf structure
 *		contents to maintain per path statistics (total I/O size /
 *		count pending).  If more than one online path is available to
 *		select, the framework automatically selects a suitable path
 *		for routing the I/O request. If a failover operation is active
 *		for this client device the call shall be failed with MDI_BUSY
 *		error code.
 *
 *		By default this function returns a suitable path in online
 *		state based on the current load balancing policy.  Currently
 *		we support LOAD_BALANCE_NONE (Previously selected online path
 *		will continue to be used till the path is usable),
 *		LOAD_BALANCE_RR (Online paths will be selected in a round
 *		robin fashion) and LOAD_BALANCE_LBA (Online paths will be
 *		selected based on the logical block).  The load balancing
 *		policy is configured through the vHCI driver's configuration
 *		file (driver.conf).
 *
 *		vHCI drivers may override this default behavior by specifying
 *		appropriate flags.  The meaning of the "arg" argument depends
 *		on the flags specified. If MDI_SELECT_PATH_INSTANCE is set
 *		then the argument is the "path instance" of the path to select.
 *		If MDI_SELECT_PATH_INSTANCE is not set then the argument is
 *		"start_pip". A non NULL "start_pip" is the starting point to
 *		walk and find the next appropriate path.  The following values
 *		are currently defined: MDI_SELECT_ONLINE_PATH (to select an
 *		ONLINE path) and/or MDI_SELECT_STANDBY_PATH (to select a
 *		STANDBY path).
 *
 *		The non-standard behavior is used by the scsi_vhci driver,
 *		whenever it has to use a STANDBY/FAULTED path.  Eg. during
 *		attach of client devices (to avoid an unnecessary failover
 *		when the STANDBY path comes up first), during failover
 *		(to activate a STANDBY path as ONLINE).
 *
 *		The selected path is returned in a mdi_hold_path() state
 *		(pi_ref_cnt). Caller should release the hold by calling
 *		mdi_rele_path().
 *
 * Return Values:
 *		MDI_SUCCESS	- Completed successfully
 *		MDI_BUSY 	- Client device is busy failing over
 *		MDI_NOPATH	- Client device is online, but no valid paths
 *				  are available to access this client device
 *		MDI_FAILURE	- Invalid client device or state
 *		MDI_DEVI_ONLINING
 *				- Client device (struct dev_info state) is in
 *				  onlining state.
 */
20377c478bd9Sstevel@tonic-gate 
20387c478bd9Sstevel@tonic-gate /*ARGSUSED*/
20397c478bd9Sstevel@tonic-gate int
20407c478bd9Sstevel@tonic-gate mdi_select_path(dev_info_t *cdip, struct buf *bp, int flags,
2041602ca9eaScth     void *arg, mdi_pathinfo_t **ret_pip)
20427c478bd9Sstevel@tonic-gate {
20437c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
20447c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*pip;
20457c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*next;
20467c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*head;
20477c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*start;
20487c478bd9Sstevel@tonic-gate 	client_lb_t	lbp;	/* load balancing policy */
20497c478bd9Sstevel@tonic-gate 	int		sb = 1;	/* standard behavior */
20507c478bd9Sstevel@tonic-gate 	int		preferred = 1;	/* preferred path */
20517c478bd9Sstevel@tonic-gate 	int		cond, cont = 1;
20527c478bd9Sstevel@tonic-gate 	int		retry = 0;
2053602ca9eaScth 	mdi_pathinfo_t	*start_pip;	/* request starting pathinfo */
2054602ca9eaScth 	int		path_instance;	/* request specific path instance */
2055602ca9eaScth 
2056602ca9eaScth 	/* determine type of arg based on flags */
2057602ca9eaScth 	if (flags & MDI_SELECT_PATH_INSTANCE) {
2058602ca9eaScth 		path_instance = (int)(intptr_t)arg;
2059602ca9eaScth 		start_pip = NULL;
2060602ca9eaScth 	} else {
2061602ca9eaScth 		path_instance = 0;
2062602ca9eaScth 		start_pip = (mdi_pathinfo_t *)arg;
2063602ca9eaScth 	}
20647c478bd9Sstevel@tonic-gate 
20657c478bd9Sstevel@tonic-gate 	if (flags != 0) {
20667c478bd9Sstevel@tonic-gate 		/*
20677c478bd9Sstevel@tonic-gate 		 * disable default behavior
20687c478bd9Sstevel@tonic-gate 		 */
20697c478bd9Sstevel@tonic-gate 		sb = 0;
20707c478bd9Sstevel@tonic-gate 	}
20717c478bd9Sstevel@tonic-gate 
20727c478bd9Sstevel@tonic-gate 	*ret_pip = NULL;
20737c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(cdip);
20747c478bd9Sstevel@tonic-gate 	if (ct == NULL) {
20757c478bd9Sstevel@tonic-gate 		/* mdi extensions are NULL, Nothing more to do */
20767c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
20777c478bd9Sstevel@tonic-gate 	}
20787c478bd9Sstevel@tonic-gate 
20797c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
20807c478bd9Sstevel@tonic-gate 
20817c478bd9Sstevel@tonic-gate 	if (sb) {
20827c478bd9Sstevel@tonic-gate 		if (MDI_CLIENT_IS_FAILED(ct)) {
20837c478bd9Sstevel@tonic-gate 			/*
20847c478bd9Sstevel@tonic-gate 			 * Client is not ready to accept any I/O requests.
20857c478bd9Sstevel@tonic-gate 			 * Fail this request.
20867c478bd9Sstevel@tonic-gate 			 */
20874c06356bSdh142964 			MDI_DEBUG(2, (MDI_NOTE, cdip,
20884c06356bSdh142964 			    "client state offline ct = %p", (void *)ct));
20897c478bd9Sstevel@tonic-gate 			MDI_CLIENT_UNLOCK(ct);
20907c478bd9Sstevel@tonic-gate 			return (MDI_FAILURE);
20917c478bd9Sstevel@tonic-gate 		}
20927c478bd9Sstevel@tonic-gate 
20937c478bd9Sstevel@tonic-gate 		if (MDI_CLIENT_IS_FAILOVER_IN_PROGRESS(ct)) {
20947c478bd9Sstevel@tonic-gate 			/*
20957c478bd9Sstevel@tonic-gate 			 * Check for Failover is in progress. If so tell the
20967c478bd9Sstevel@tonic-gate 			 * caller that this device is busy.
20977c478bd9Sstevel@tonic-gate 			 */
20984c06356bSdh142964 			MDI_DEBUG(2, (MDI_NOTE, cdip,
20994c06356bSdh142964 			    "client failover in progress ct = %p",
21005e3986cbScth 			    (void *)ct));
21017c478bd9Sstevel@tonic-gate 			MDI_CLIENT_UNLOCK(ct);
21027c478bd9Sstevel@tonic-gate 			return (MDI_BUSY);
21037c478bd9Sstevel@tonic-gate 		}
21047c478bd9Sstevel@tonic-gate 
21057c478bd9Sstevel@tonic-gate 		/*
21067c478bd9Sstevel@tonic-gate 		 * Check to see whether the client device is attached.
21077c478bd9Sstevel@tonic-gate 		 * If not so, let the vHCI driver manually select a path
21087c478bd9Sstevel@tonic-gate 		 * (standby) and let the probe/attach process to continue.
21097c478bd9Sstevel@tonic-gate 		 */
2110737d277aScth 		if (MDI_CLIENT_IS_DETACHED(ct) || !i_ddi_devi_attached(cdip)) {
21114c06356bSdh142964 			MDI_DEBUG(4, (MDI_NOTE, cdip,
21124c06356bSdh142964 			    "devi is onlining ct = %p", (void *)ct));
21137c478bd9Sstevel@tonic-gate 			MDI_CLIENT_UNLOCK(ct);
21147c478bd9Sstevel@tonic-gate 			return (MDI_DEVI_ONLINING);
21157c478bd9Sstevel@tonic-gate 		}
21167c478bd9Sstevel@tonic-gate 	}
21177c478bd9Sstevel@tonic-gate 
21187c478bd9Sstevel@tonic-gate 	/*
21197c478bd9Sstevel@tonic-gate 	 * Cache in the client list head.  If head of the list is NULL
21207c478bd9Sstevel@tonic-gate 	 * return MDI_NOPATH
21217c478bd9Sstevel@tonic-gate 	 */
21227c478bd9Sstevel@tonic-gate 	head = ct->ct_path_head;
21237c478bd9Sstevel@tonic-gate 	if (head == NULL) {
21247c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
21257c478bd9Sstevel@tonic-gate 		return (MDI_NOPATH);
21267c478bd9Sstevel@tonic-gate 	}
21277c478bd9Sstevel@tonic-gate 
2128602ca9eaScth 	/* Caller is specifying a specific pathinfo path by path_instance */
2129602ca9eaScth 	if (path_instance) {
2130602ca9eaScth 		/* search for pathinfo with correct path_instance */
2131602ca9eaScth 		for (pip = head;
2132602ca9eaScth 		    pip && (mdi_pi_get_path_instance(pip) != path_instance);
2133602ca9eaScth 		    pip = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link)
2134602ca9eaScth 			;
2135602ca9eaScth 
2136*ab412e72SSrikanth, Ramana 		/* If path can't be selected then MDI_NOPATH is returned. */
2137602ca9eaScth 		if (pip == NULL) {
2138602ca9eaScth 			MDI_CLIENT_UNLOCK(ct);
2139*ab412e72SSrikanth, Ramana 			return (MDI_NOPATH);
2140602ca9eaScth 		}
2141602ca9eaScth 
21424c06356bSdh142964 		/*
21434c06356bSdh142964 		 * Verify state of path. When asked to select a specific
21444c06356bSdh142964 		 * path_instance, we select the requested path in any
21454c06356bSdh142964 		 * state (ONLINE, OFFLINE, STANDBY, FAULT) other than INIT.
21464c06356bSdh142964 		 * We don't however select paths where the pHCI has detached.
21474c06356bSdh142964 		 * NOTE: last pathinfo node of an opened client device may
21484c06356bSdh142964 		 * exist in an OFFLINE state after the pHCI associated with
21494c06356bSdh142964 		 * that path has detached (but pi_phci will be NULL if that
21504c06356bSdh142964 		 * has occurred).
21514c06356bSdh142964 		 */
2152602ca9eaScth 		MDI_PI_LOCK(pip);
21534c06356bSdh142964 		if ((MDI_PI(pip)->pi_state == MDI_PATHINFO_STATE_INIT) ||
21544c06356bSdh142964 		    (MDI_PI(pip)->pi_phci == NULL)) {
2155602ca9eaScth 			MDI_PI_UNLOCK(pip);
2156602ca9eaScth 			MDI_CLIENT_UNLOCK(ct);
2157602ca9eaScth 			return (MDI_FAILURE);
2158602ca9eaScth 		}
2159602ca9eaScth 
2160*ab412e72SSrikanth, Ramana 		/* Return MDI_BUSY if we have a transient condition */
2161*ab412e72SSrikanth, Ramana 		if (MDI_PI_IS_TRANSIENT(pip)) {
2162*ab412e72SSrikanth, Ramana 			MDI_PI_UNLOCK(pip);
2163*ab412e72SSrikanth, Ramana 			MDI_CLIENT_UNLOCK(ct);
2164*ab412e72SSrikanth, Ramana 			return (MDI_BUSY);
2165*ab412e72SSrikanth, Ramana 		}
2166*ab412e72SSrikanth, Ramana 
2167602ca9eaScth 		/*
2168602ca9eaScth 		 * Return the path in hold state. Caller should release the
2169602ca9eaScth 		 * lock by calling mdi_rele_path()
2170602ca9eaScth 		 */
2171602ca9eaScth 		MDI_PI_HOLD(pip);
2172602ca9eaScth 		MDI_PI_UNLOCK(pip);
2173602ca9eaScth 		*ret_pip = pip;
2174602ca9eaScth 		MDI_CLIENT_UNLOCK(ct);
2175602ca9eaScth 		return (MDI_SUCCESS);
2176602ca9eaScth 	}
2177602ca9eaScth 
21787c478bd9Sstevel@tonic-gate 	/*
21797c478bd9Sstevel@tonic-gate 	 * for non default behavior, bypass current
21807c478bd9Sstevel@tonic-gate 	 * load balancing policy and always use LOAD_BALANCE_RR
21817c478bd9Sstevel@tonic-gate 	 * except that the start point will be adjusted based
21827c478bd9Sstevel@tonic-gate 	 * on the provided start_pip
21837c478bd9Sstevel@tonic-gate 	 */
21847c478bd9Sstevel@tonic-gate 	lbp = sb ? ct->ct_lb : LOAD_BALANCE_RR;
21857c478bd9Sstevel@tonic-gate 
21867c478bd9Sstevel@tonic-gate 	switch (lbp) {
21877c478bd9Sstevel@tonic-gate 	case LOAD_BALANCE_NONE:
21887c478bd9Sstevel@tonic-gate 		/*
21897c478bd9Sstevel@tonic-gate 		 * Load balancing is None  or Alternate path mode
21907c478bd9Sstevel@tonic-gate 		 * Start looking for a online mdi_pathinfo node starting from
21917c478bd9Sstevel@tonic-gate 		 * last known selected path
21927c478bd9Sstevel@tonic-gate 		 */
21937c478bd9Sstevel@tonic-gate 		preferred = 1;
21947c478bd9Sstevel@tonic-gate 		pip = (mdi_pathinfo_t *)ct->ct_path_last;
21957c478bd9Sstevel@tonic-gate 		if (pip == NULL) {
21967c478bd9Sstevel@tonic-gate 			pip = head;
21977c478bd9Sstevel@tonic-gate 		}
21987c478bd9Sstevel@tonic-gate 		start = pip;
21997c478bd9Sstevel@tonic-gate 		do {
22007c478bd9Sstevel@tonic-gate 			MDI_PI_LOCK(pip);
22017c478bd9Sstevel@tonic-gate 			/*
22027c478bd9Sstevel@tonic-gate 			 * No need to explicitly check if the path is disabled.
22037c478bd9Sstevel@tonic-gate 			 * Since we are checking for state == ONLINE and the
220455e592a2SRandall Ralphs 			 * same variable is used for DISABLE/ENABLE information.
22057c478bd9Sstevel@tonic-gate 			 */
2206ee28b439Scm136836 			if ((MDI_PI(pip)->pi_state  ==
2207ee28b439Scm136836 				MDI_PATHINFO_STATE_ONLINE) &&
22087c478bd9Sstevel@tonic-gate 				preferred == MDI_PI(pip)->pi_preferred) {
22097c478bd9Sstevel@tonic-gate 				/*
22107c478bd9Sstevel@tonic-gate 				 * Return the path in hold state. Caller should
22117c478bd9Sstevel@tonic-gate 				 * release the lock by calling mdi_rele_path()
22127c478bd9Sstevel@tonic-gate 				 */
22137c478bd9Sstevel@tonic-gate 				MDI_PI_HOLD(pip);
22147c478bd9Sstevel@tonic-gate 				MDI_PI_UNLOCK(pip);
22157c478bd9Sstevel@tonic-gate 				ct->ct_path_last = pip;
22167c478bd9Sstevel@tonic-gate 				*ret_pip = pip;
22177c478bd9Sstevel@tonic-gate 				MDI_CLIENT_UNLOCK(ct);
22187c478bd9Sstevel@tonic-gate 				return (MDI_SUCCESS);
22197c478bd9Sstevel@tonic-gate 			}
22207c478bd9Sstevel@tonic-gate 
22217c478bd9Sstevel@tonic-gate 			/*
22227c478bd9Sstevel@tonic-gate 			 * Path is busy.
22237c478bd9Sstevel@tonic-gate 			 */
22247c478bd9Sstevel@tonic-gate 			if (MDI_PI_IS_DRV_DISABLE_TRANSIENT(pip) ||
22257c478bd9Sstevel@tonic-gate 			    MDI_PI_IS_TRANSIENT(pip))
22267c478bd9Sstevel@tonic-gate 				retry = 1;
22277c478bd9Sstevel@tonic-gate 			/*
22287c478bd9Sstevel@tonic-gate 			 * Keep looking for a next available online path
22297c478bd9Sstevel@tonic-gate 			 */
22307c478bd9Sstevel@tonic-gate 			next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link;
22317c478bd9Sstevel@tonic-gate 			if (next == NULL) {
22327c478bd9Sstevel@tonic-gate 				next = head;
22337c478bd9Sstevel@tonic-gate 			}
22347c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
22357c478bd9Sstevel@tonic-gate 			pip = next;
22367c478bd9Sstevel@tonic-gate 			if (start == pip && preferred) {
22377c478bd9Sstevel@tonic-gate 				preferred = 0;
22387c478bd9Sstevel@tonic-gate 			} else if (start == pip && !preferred) {
22397c478bd9Sstevel@tonic-gate 				cont = 0;
22407c478bd9Sstevel@tonic-gate 			}
22417c478bd9Sstevel@tonic-gate 		} while (cont);
22427c478bd9Sstevel@tonic-gate 		break;
22437c478bd9Sstevel@tonic-gate 
22447c478bd9Sstevel@tonic-gate 	case LOAD_BALANCE_LBA:
22457c478bd9Sstevel@tonic-gate 		/*
22467c478bd9Sstevel@tonic-gate 		 * Make sure we are looking
22477c478bd9Sstevel@tonic-gate 		 * for an online path. Otherwise, if it is for a STANDBY
22487c478bd9Sstevel@tonic-gate 		 * path request, it will go through and fetch an ONLINE
22497c478bd9Sstevel@tonic-gate 		 * path which is not desirable.
22507c478bd9Sstevel@tonic-gate 		 */
22517c478bd9Sstevel@tonic-gate 		if ((ct->ct_lb_args != NULL) &&
22527c478bd9Sstevel@tonic-gate 			    (ct->ct_lb_args->region_size) && bp &&
22537c478bd9Sstevel@tonic-gate 				(sb || (flags == MDI_SELECT_ONLINE_PATH))) {
22547c478bd9Sstevel@tonic-gate 			if (i_mdi_lba_lb(ct, ret_pip, bp)
22557c478bd9Sstevel@tonic-gate 				    == MDI_SUCCESS) {
22567c478bd9Sstevel@tonic-gate 				MDI_CLIENT_UNLOCK(ct);
22577c478bd9Sstevel@tonic-gate 				return (MDI_SUCCESS);
22587c478bd9Sstevel@tonic-gate 			}
22597c478bd9Sstevel@tonic-gate 		}
22607c478bd9Sstevel@tonic-gate 		/* FALLTHROUGH */
22617c478bd9Sstevel@tonic-gate 	case LOAD_BALANCE_RR:
22627c478bd9Sstevel@tonic-gate 		/*
22637c478bd9Sstevel@tonic-gate 		 * Load balancing is Round Robin. Start looking for a online
22647c478bd9Sstevel@tonic-gate 		 * mdi_pathinfo node starting from last known selected path
22657c478bd9Sstevel@tonic-gate 		 * as the start point.  If override flags are specified,
22667c478bd9Sstevel@tonic-gate 		 * process accordingly.
22677c478bd9Sstevel@tonic-gate 		 * If the search is already in effect(start_pip not null),
22687c478bd9Sstevel@tonic-gate 		 * then lets just use the same path preference to continue the
22697c478bd9Sstevel@tonic-gate 		 * traversal.
22707c478bd9Sstevel@tonic-gate 		 */
22717c478bd9Sstevel@tonic-gate 
22727c478bd9Sstevel@tonic-gate 		if (start_pip != NULL) {
22737c478bd9Sstevel@tonic-gate 			preferred = MDI_PI(start_pip)->pi_preferred;
22747c478bd9Sstevel@tonic-gate 		} else {
22757c478bd9Sstevel@tonic-gate 			preferred = 1;
22767c478bd9Sstevel@tonic-gate 		}
22777c478bd9Sstevel@tonic-gate 
22787c478bd9Sstevel@tonic-gate 		start = sb ? (mdi_pathinfo_t *)ct->ct_path_last : start_pip;
22797c478bd9Sstevel@tonic-gate 		if (start == NULL) {
22807c478bd9Sstevel@tonic-gate 			pip = head;
22817c478bd9Sstevel@tonic-gate 		} else {
22827c478bd9Sstevel@tonic-gate 			pip = (mdi_pathinfo_t *)MDI_PI(start)->pi_client_link;
22837c478bd9Sstevel@tonic-gate 			if (pip == NULL) {
2284b08fdaf7SSheshadri Vasudevan 				if ( flags & MDI_SELECT_NO_PREFERRED) {
2285b08fdaf7SSheshadri Vasudevan 					/*
2286b08fdaf7SSheshadri Vasudevan 					 * Return since we hit the end of list
2287b08fdaf7SSheshadri Vasudevan 					 */
2288b08fdaf7SSheshadri Vasudevan 					MDI_CLIENT_UNLOCK(ct);
2289b08fdaf7SSheshadri Vasudevan 					return (MDI_NOPATH);
2290b08fdaf7SSheshadri Vasudevan 				}
2291b08fdaf7SSheshadri Vasudevan 
22927c478bd9Sstevel@tonic-gate 				if (!sb) {
22937c478bd9Sstevel@tonic-gate 					if (preferred == 0) {
22947c478bd9Sstevel@tonic-gate 						/*
22957c478bd9Sstevel@tonic-gate 						 * Looks like we have completed
22967c478bd9Sstevel@tonic-gate 						 * the traversal as preferred
22977c478bd9Sstevel@tonic-gate 						 * value is 0. Time to bail out.
22987c478bd9Sstevel@tonic-gate 						 */
22997c478bd9Sstevel@tonic-gate 						*ret_pip = NULL;
23007c478bd9Sstevel@tonic-gate 						MDI_CLIENT_UNLOCK(ct);
23017c478bd9Sstevel@tonic-gate 						return (MDI_NOPATH);
23027c478bd9Sstevel@tonic-gate 					} else {
23037c478bd9Sstevel@tonic-gate 						/*
23047c478bd9Sstevel@tonic-gate 						 * Looks like we reached the
23057c478bd9Sstevel@tonic-gate 						 * end of the list. Lets enable
23067c478bd9Sstevel@tonic-gate 						 * traversal of non preferred
23077c478bd9Sstevel@tonic-gate 						 * paths.
23087c478bd9Sstevel@tonic-gate 						 */
23097c478bd9Sstevel@tonic-gate 						preferred = 0;
23107c478bd9Sstevel@tonic-gate 					}
23117c478bd9Sstevel@tonic-gate 				}
23127c478bd9Sstevel@tonic-gate 				pip = head;
23137c478bd9Sstevel@tonic-gate 			}
23147c478bd9Sstevel@tonic-gate 		}
23157c478bd9Sstevel@tonic-gate 		start = pip;
23167c478bd9Sstevel@tonic-gate 		do {
23177c478bd9Sstevel@tonic-gate 			MDI_PI_LOCK(pip);
23187c478bd9Sstevel@tonic-gate 			if (sb) {
23197c478bd9Sstevel@tonic-gate 				cond = ((MDI_PI(pip)->pi_state ==
23207c478bd9Sstevel@tonic-gate 				    MDI_PATHINFO_STATE_ONLINE &&
23217c478bd9Sstevel@tonic-gate 					MDI_PI(pip)->pi_preferred ==
23227c478bd9Sstevel@tonic-gate 						preferred) ? 1 : 0);
23237c478bd9Sstevel@tonic-gate 			} else {
23247c478bd9Sstevel@tonic-gate 				if (flags == MDI_SELECT_ONLINE_PATH) {
23257c478bd9Sstevel@tonic-gate 					cond = ((MDI_PI(pip)->pi_state ==
23267c478bd9Sstevel@tonic-gate 					    MDI_PATHINFO_STATE_ONLINE &&
23277c478bd9Sstevel@tonic-gate 						MDI_PI(pip)->pi_preferred ==
23287c478bd9Sstevel@tonic-gate 						preferred) ? 1 : 0);
23297c478bd9Sstevel@tonic-gate 				} else if (flags == MDI_SELECT_STANDBY_PATH) {
23307c478bd9Sstevel@tonic-gate 					cond = ((MDI_PI(pip)->pi_state ==
23317c478bd9Sstevel@tonic-gate 					    MDI_PATHINFO_STATE_STANDBY &&
23327c478bd9Sstevel@tonic-gate 						MDI_PI(pip)->pi_preferred ==
23337c478bd9Sstevel@tonic-gate 						preferred) ? 1 : 0);
23347c478bd9Sstevel@tonic-gate 				} else if (flags == (MDI_SELECT_ONLINE_PATH |
23357c478bd9Sstevel@tonic-gate 				    MDI_SELECT_STANDBY_PATH)) {
23367c478bd9Sstevel@tonic-gate 					cond = (((MDI_PI(pip)->pi_state ==
23377c478bd9Sstevel@tonic-gate 					    MDI_PATHINFO_STATE_ONLINE ||
23387c478bd9Sstevel@tonic-gate 					    (MDI_PI(pip)->pi_state ==
23397c478bd9Sstevel@tonic-gate 					    MDI_PATHINFO_STATE_STANDBY)) &&
23407c478bd9Sstevel@tonic-gate 						MDI_PI(pip)->pi_preferred ==
23417c478bd9Sstevel@tonic-gate 						preferred) ? 1 : 0);
2342ee28b439Scm136836 				} else if (flags ==
2343ee28b439Scm136836 					(MDI_SELECT_STANDBY_PATH |
2344ee28b439Scm136836 					MDI_SELECT_ONLINE_PATH |
2345ee28b439Scm136836 					MDI_SELECT_USER_DISABLE_PATH)) {
2346ee28b439Scm136836 					cond = (((MDI_PI(pip)->pi_state ==
2347ee28b439Scm136836 					    MDI_PATHINFO_STATE_ONLINE ||
2348ee28b439Scm136836 					    (MDI_PI(pip)->pi_state ==
2349ee28b439Scm136836 					    MDI_PATHINFO_STATE_STANDBY) ||
2350ee28b439Scm136836 						(MDI_PI(pip)->pi_state ==
2351ee28b439Scm136836 					    (MDI_PATHINFO_STATE_ONLINE|
2352ee28b439Scm136836 					    MDI_PATHINFO_STATE_USER_DISABLE)) ||
2353ee28b439Scm136836 						(MDI_PI(pip)->pi_state ==
2354ee28b439Scm136836 					    (MDI_PATHINFO_STATE_STANDBY |
2355ee28b439Scm136836 					    MDI_PATHINFO_STATE_USER_DISABLE)))&&
2356ee28b439Scm136836 						MDI_PI(pip)->pi_preferred ==
2357ee28b439Scm136836 						preferred) ? 1 : 0);
2358b08fdaf7SSheshadri Vasudevan 				} else if (flags ==
2359b08fdaf7SSheshadri Vasudevan 				    (MDI_SELECT_STANDBY_PATH |
2360b08fdaf7SSheshadri Vasudevan 				    MDI_SELECT_ONLINE_PATH |
2361b08fdaf7SSheshadri Vasudevan 				    MDI_SELECT_NO_PREFERRED)) {
2362b08fdaf7SSheshadri Vasudevan 					cond = (((MDI_PI(pip)->pi_state ==
2363b08fdaf7SSheshadri Vasudevan 					    MDI_PATHINFO_STATE_ONLINE) ||
2364b08fdaf7SSheshadri Vasudevan 					    (MDI_PI(pip)->pi_state ==
2365b08fdaf7SSheshadri Vasudevan 					    MDI_PATHINFO_STATE_STANDBY))
2366b08fdaf7SSheshadri Vasudevan 					    ? 1 : 0);
23677c478bd9Sstevel@tonic-gate 				} else {
23687c478bd9Sstevel@tonic-gate 					cond = 0;
23697c478bd9Sstevel@tonic-gate 				}
23707c478bd9Sstevel@tonic-gate 			}
23717c478bd9Sstevel@tonic-gate 			/*
23727c478bd9Sstevel@tonic-gate 			 * No need to explicitly check if the path is disabled.
23737c478bd9Sstevel@tonic-gate 			 * Since we are checking for state == ONLINE and the
237455e592a2SRandall Ralphs 			 * same variable is used for DISABLE/ENABLE information.
23757c478bd9Sstevel@tonic-gate 			 */
23767c478bd9Sstevel@tonic-gate 			if (cond) {
23777c478bd9Sstevel@tonic-gate 				/*
23787c478bd9Sstevel@tonic-gate 				 * Return the path in hold state. Caller should
23797c478bd9Sstevel@tonic-gate 				 * release the lock by calling mdi_rele_path()
23807c478bd9Sstevel@tonic-gate 				 */
23817c478bd9Sstevel@tonic-gate 				MDI_PI_HOLD(pip);
23827c478bd9Sstevel@tonic-gate 				MDI_PI_UNLOCK(pip);
23837c478bd9Sstevel@tonic-gate 				if (sb)
23847c478bd9Sstevel@tonic-gate 					ct->ct_path_last = pip;
23857c478bd9Sstevel@tonic-gate 				*ret_pip = pip;
23867c478bd9Sstevel@tonic-gate 				MDI_CLIENT_UNLOCK(ct);
23877c478bd9Sstevel@tonic-gate 				return (MDI_SUCCESS);
23887c478bd9Sstevel@tonic-gate 			}
23897c478bd9Sstevel@tonic-gate 			/*
23907c478bd9Sstevel@tonic-gate 			 * Path is busy.
23917c478bd9Sstevel@tonic-gate 			 */
23927c478bd9Sstevel@tonic-gate 			if (MDI_PI_IS_DRV_DISABLE_TRANSIENT(pip) ||
23937c478bd9Sstevel@tonic-gate 			    MDI_PI_IS_TRANSIENT(pip))
23947c478bd9Sstevel@tonic-gate 				retry = 1;
23957c478bd9Sstevel@tonic-gate 
23967c478bd9Sstevel@tonic-gate 			/*
23977c478bd9Sstevel@tonic-gate 			 * Keep looking for a next available online path
23987c478bd9Sstevel@tonic-gate 			 */
23997c478bd9Sstevel@tonic-gate do_again:
24007c478bd9Sstevel@tonic-gate 			next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link;
24017c478bd9Sstevel@tonic-gate 			if (next == NULL) {
2402b08fdaf7SSheshadri Vasudevan 				if ( flags & MDI_SELECT_NO_PREFERRED) {
2403b08fdaf7SSheshadri Vasudevan 					/*
2404b08fdaf7SSheshadri Vasudevan 					 * Bail out since we hit the end of list
2405b08fdaf7SSheshadri Vasudevan 					 */
2406b08fdaf7SSheshadri Vasudevan 					MDI_PI_UNLOCK(pip);
2407b08fdaf7SSheshadri Vasudevan 					break;
2408b08fdaf7SSheshadri Vasudevan 				}
2409b08fdaf7SSheshadri Vasudevan 
24107c478bd9Sstevel@tonic-gate 				if (!sb) {
24117c478bd9Sstevel@tonic-gate 					if (preferred == 1) {
24127c478bd9Sstevel@tonic-gate 						/*
24137c478bd9Sstevel@tonic-gate 						 * Looks like we reached the
24147c478bd9Sstevel@tonic-gate 						 * end of the list. Lets enable
24157c478bd9Sstevel@tonic-gate 						 * traversal of non preferred
24167c478bd9Sstevel@tonic-gate 						 * paths.
24177c478bd9Sstevel@tonic-gate 						 */
24187c478bd9Sstevel@tonic-gate 						preferred = 0;
24197c478bd9Sstevel@tonic-gate 						next = head;
24207c478bd9Sstevel@tonic-gate 					} else {
24217c478bd9Sstevel@tonic-gate 						/*
24227c478bd9Sstevel@tonic-gate 						 * We have done both the passes
24237c478bd9Sstevel@tonic-gate 						 * Preferred as well as for
24247c478bd9Sstevel@tonic-gate 						 * Non-preferred. Bail out now.
24257c478bd9Sstevel@tonic-gate 						 */
24267c478bd9Sstevel@tonic-gate 						cont = 0;
24277c478bd9Sstevel@tonic-gate 					}
24287c478bd9Sstevel@tonic-gate 				} else {
24297c478bd9Sstevel@tonic-gate 					/*
24307c478bd9Sstevel@tonic-gate 					 * Standard behavior case.
24317c478bd9Sstevel@tonic-gate 					 */
24327c478bd9Sstevel@tonic-gate 					next = head;
24337c478bd9Sstevel@tonic-gate 				}
24347c478bd9Sstevel@tonic-gate 			}
24357c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
24367c478bd9Sstevel@tonic-gate 			if (cont == 0) {
24377c478bd9Sstevel@tonic-gate 				break;
24387c478bd9Sstevel@tonic-gate 			}
24397c478bd9Sstevel@tonic-gate 			pip = next;
24407c478bd9Sstevel@tonic-gate 
24417c478bd9Sstevel@tonic-gate 			if (!sb) {
24427c478bd9Sstevel@tonic-gate 				/*
24437c478bd9Sstevel@tonic-gate 				 * We need to handle the selection of
24447c478bd9Sstevel@tonic-gate 				 * non-preferred path in the following
24457c478bd9Sstevel@tonic-gate 				 * case:
24467c478bd9Sstevel@tonic-gate 				 *
24477c478bd9Sstevel@tonic-gate 				 * +------+   +------+   +------+   +-----+
24487c478bd9Sstevel@tonic-gate 				 * | A : 1| - | B : 1| - | C : 0| - |NULL |
24497c478bd9Sstevel@tonic-gate 				 * +------+   +------+   +------+   +-----+
24507c478bd9Sstevel@tonic-gate 				 *
24517c478bd9Sstevel@tonic-gate 				 * If we start the search with B, we need to
24527c478bd9Sstevel@tonic-gate 				 * skip beyond B to pick C which is non -
24537c478bd9Sstevel@tonic-gate 				 * preferred in the second pass. The following
24547c478bd9Sstevel@tonic-gate 				 * test, if true, will allow us to skip over
24557c478bd9Sstevel@tonic-gate 				 * the 'start'(B in the example) to select
24567c478bd9Sstevel@tonic-gate 				 * other non preferred elements.
24577c478bd9Sstevel@tonic-gate 				 */
24587c478bd9Sstevel@tonic-gate 				if ((start_pip != NULL) && (start_pip == pip) &&
24597c478bd9Sstevel@tonic-gate 				    (MDI_PI(start_pip)->pi_preferred
24607c478bd9Sstevel@tonic-gate 				    != preferred)) {
24617c478bd9Sstevel@tonic-gate 					/*
24627c478bd9Sstevel@tonic-gate 					 * try again after going past the start
24637c478bd9Sstevel@tonic-gate 					 * pip
24647c478bd9Sstevel@tonic-gate 					 */
24657c478bd9Sstevel@tonic-gate 					MDI_PI_LOCK(pip);
24667c478bd9Sstevel@tonic-gate 					goto do_again;
24677c478bd9Sstevel@tonic-gate 				}
24687c478bd9Sstevel@tonic-gate 			} else {
24697c478bd9Sstevel@tonic-gate 				/*
24707c478bd9Sstevel@tonic-gate 				 * Standard behavior case
24717c478bd9Sstevel@tonic-gate 				 */
24727c478bd9Sstevel@tonic-gate 				if (start == pip && preferred) {
24737c478bd9Sstevel@tonic-gate 					/* look for nonpreferred paths */
24747c478bd9Sstevel@tonic-gate 					preferred = 0;
24757c478bd9Sstevel@tonic-gate 				} else if (start == pip && !preferred) {
24767c478bd9Sstevel@tonic-gate 					/*
24777c478bd9Sstevel@tonic-gate 					 * Exit condition
24787c478bd9Sstevel@tonic-gate 					 */
24797c478bd9Sstevel@tonic-gate 					cont = 0;
24807c478bd9Sstevel@tonic-gate 				}
24817c478bd9Sstevel@tonic-gate 			}
24827c478bd9Sstevel@tonic-gate 		} while (cont);
24837c478bd9Sstevel@tonic-gate 		break;
24847c478bd9Sstevel@tonic-gate 	}
24857c478bd9Sstevel@tonic-gate 
24867c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
24877c478bd9Sstevel@tonic-gate 	if (retry == 1) {
24887c478bd9Sstevel@tonic-gate 		return (MDI_BUSY);
24897c478bd9Sstevel@tonic-gate 	} else {
24907c478bd9Sstevel@tonic-gate 		return (MDI_NOPATH);
24917c478bd9Sstevel@tonic-gate 	}
24927c478bd9Sstevel@tonic-gate }
24937c478bd9Sstevel@tonic-gate 
24947c478bd9Sstevel@tonic-gate /*
24957c478bd9Sstevel@tonic-gate  * For a client, return the next available path to any phci
24967c478bd9Sstevel@tonic-gate  *
24977c478bd9Sstevel@tonic-gate  * Note:
24987c478bd9Sstevel@tonic-gate  *		Caller should hold the branch's devinfo node to get a consistent
24997c478bd9Sstevel@tonic-gate  *		snap shot of the mdi_pathinfo nodes.
25007c478bd9Sstevel@tonic-gate  *
25017c478bd9Sstevel@tonic-gate  *		Please note that even the list is stable the mdi_pathinfo
25027c478bd9Sstevel@tonic-gate  *		node state and properties are volatile.  The caller should lock
25037c478bd9Sstevel@tonic-gate  *		and unlock the nodes by calling mdi_pi_lock() and
25047c478bd9Sstevel@tonic-gate  *		mdi_pi_unlock() functions to get a stable properties.
25057c478bd9Sstevel@tonic-gate  *
25067c478bd9Sstevel@tonic-gate  *		If there is a need to use the nodes beyond the hold of the
25077c478bd9Sstevel@tonic-gate  *		devinfo node period (For ex. I/O), then mdi_pathinfo node
25087c478bd9Sstevel@tonic-gate  *		need to be held against unexpected removal by calling
25097c478bd9Sstevel@tonic-gate  *		mdi_hold_path() and should be released by calling
25107c478bd9Sstevel@tonic-gate  *		mdi_rele_path() on completion.
25117c478bd9Sstevel@tonic-gate  */
25127c478bd9Sstevel@tonic-gate mdi_pathinfo_t *
25137c478bd9Sstevel@tonic-gate mdi_get_next_phci_path(dev_info_t *ct_dip, mdi_pathinfo_t *pip)
25147c478bd9Sstevel@tonic-gate {
25157c478bd9Sstevel@tonic-gate 	mdi_client_t *ct;
25167c478bd9Sstevel@tonic-gate 
25177c478bd9Sstevel@tonic-gate 	if (!MDI_CLIENT(ct_dip))
25187c478bd9Sstevel@tonic-gate 		return (NULL);
25197c478bd9Sstevel@tonic-gate 
25207c478bd9Sstevel@tonic-gate 	/*
25217c478bd9Sstevel@tonic-gate 	 * Walk through client link
25227c478bd9Sstevel@tonic-gate 	 */
25237c478bd9Sstevel@tonic-gate 	ct = (mdi_client_t *)DEVI(ct_dip)->devi_mdi_client;
25247c478bd9Sstevel@tonic-gate 	ASSERT(ct != NULL);
25257c478bd9Sstevel@tonic-gate 
25267c478bd9Sstevel@tonic-gate 	if (pip == NULL)
25277c478bd9Sstevel@tonic-gate 		return ((mdi_pathinfo_t *)ct->ct_path_head);
25287c478bd9Sstevel@tonic-gate 
25297c478bd9Sstevel@tonic-gate 	return ((mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link);
25307c478bd9Sstevel@tonic-gate }
25317c478bd9Sstevel@tonic-gate 
25327c478bd9Sstevel@tonic-gate /*
25337c478bd9Sstevel@tonic-gate  * For a phci, return the next available path to any client
25347c478bd9Sstevel@tonic-gate  * Note: ditto mdi_get_next_phci_path()
25357c478bd9Sstevel@tonic-gate  */
25367c478bd9Sstevel@tonic-gate mdi_pathinfo_t *
25377c478bd9Sstevel@tonic-gate mdi_get_next_client_path(dev_info_t *ph_dip, mdi_pathinfo_t *pip)
25387c478bd9Sstevel@tonic-gate {
25397c478bd9Sstevel@tonic-gate 	mdi_phci_t *ph;
25407c478bd9Sstevel@tonic-gate 
25417c478bd9Sstevel@tonic-gate 	if (!MDI_PHCI(ph_dip))
25427c478bd9Sstevel@tonic-gate 		return (NULL);
25437c478bd9Sstevel@tonic-gate 
25447c478bd9Sstevel@tonic-gate 	/*
25457c478bd9Sstevel@tonic-gate 	 * Walk through pHCI link
25467c478bd9Sstevel@tonic-gate 	 */
25477c478bd9Sstevel@tonic-gate 	ph = (mdi_phci_t *)DEVI(ph_dip)->devi_mdi_xhci;
25487c478bd9Sstevel@tonic-gate 	ASSERT(ph != NULL);
25497c478bd9Sstevel@tonic-gate 
25507c478bd9Sstevel@tonic-gate 	if (pip == NULL)
25517c478bd9Sstevel@tonic-gate 		return ((mdi_pathinfo_t *)ph->ph_path_head);
25527c478bd9Sstevel@tonic-gate 
25537c478bd9Sstevel@tonic-gate 	return ((mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link);
25547c478bd9Sstevel@tonic-gate }
25557c478bd9Sstevel@tonic-gate 
25567c478bd9Sstevel@tonic-gate /*
25577c478bd9Sstevel@tonic-gate  * mdi_hold_path():
25587c478bd9Sstevel@tonic-gate  *		Hold the mdi_pathinfo node against unwanted unexpected free.
25597c478bd9Sstevel@tonic-gate  * Return Values:
25607c478bd9Sstevel@tonic-gate  *		None
25617c478bd9Sstevel@tonic-gate  */
25627c478bd9Sstevel@tonic-gate void
25637c478bd9Sstevel@tonic-gate mdi_hold_path(mdi_pathinfo_t *pip)
25647c478bd9Sstevel@tonic-gate {
25657c478bd9Sstevel@tonic-gate 	if (pip) {
25667c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
25677c478bd9Sstevel@tonic-gate 		MDI_PI_HOLD(pip);
25687c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
25697c478bd9Sstevel@tonic-gate 	}
25707c478bd9Sstevel@tonic-gate }
25717c478bd9Sstevel@tonic-gate 
25727c478bd9Sstevel@tonic-gate 
25737c478bd9Sstevel@tonic-gate /*
25747c478bd9Sstevel@tonic-gate  * mdi_rele_path():
25757c478bd9Sstevel@tonic-gate  *		Release the mdi_pathinfo node which was selected
25767c478bd9Sstevel@tonic-gate  *		through mdi_select_path() mechanism or manually held by
25777c478bd9Sstevel@tonic-gate  *		calling mdi_hold_path().
25787c478bd9Sstevel@tonic-gate  * Return Values:
25797c478bd9Sstevel@tonic-gate  *		None
25807c478bd9Sstevel@tonic-gate  */
25817c478bd9Sstevel@tonic-gate void
25827c478bd9Sstevel@tonic-gate mdi_rele_path(mdi_pathinfo_t *pip)
25837c478bd9Sstevel@tonic-gate {
25847c478bd9Sstevel@tonic-gate 	if (pip) {
25857c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
25867c478bd9Sstevel@tonic-gate 		MDI_PI_RELE(pip);
25877c478bd9Sstevel@tonic-gate 		if (MDI_PI(pip)->pi_ref_cnt == 0) {
25887c478bd9Sstevel@tonic-gate 			cv_broadcast(&MDI_PI(pip)->pi_ref_cv);
25897c478bd9Sstevel@tonic-gate 		}
25907c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
25917c478bd9Sstevel@tonic-gate 	}
25927c478bd9Sstevel@tonic-gate }
25937c478bd9Sstevel@tonic-gate 
25947c478bd9Sstevel@tonic-gate /*
25957c478bd9Sstevel@tonic-gate  * mdi_pi_lock():
25967c478bd9Sstevel@tonic-gate  * 		Lock the mdi_pathinfo node.
25977c478bd9Sstevel@tonic-gate  * Note:
25987c478bd9Sstevel@tonic-gate  *		The caller should release the lock by calling mdi_pi_unlock()
25997c478bd9Sstevel@tonic-gate  */
26007c478bd9Sstevel@tonic-gate void
26017c478bd9Sstevel@tonic-gate mdi_pi_lock(mdi_pathinfo_t *pip)
26027c478bd9Sstevel@tonic-gate {
26037c478bd9Sstevel@tonic-gate 	ASSERT(pip != NULL);
26047c478bd9Sstevel@tonic-gate 	if (pip) {
26057c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
26067c478bd9Sstevel@tonic-gate 	}
26077c478bd9Sstevel@tonic-gate }
26087c478bd9Sstevel@tonic-gate 
26097c478bd9Sstevel@tonic-gate 
26107c478bd9Sstevel@tonic-gate /*
26117c478bd9Sstevel@tonic-gate  * mdi_pi_unlock():
26127c478bd9Sstevel@tonic-gate  * 		Unlock the mdi_pathinfo node.
26137c478bd9Sstevel@tonic-gate  * Note:
26147c478bd9Sstevel@tonic-gate  *		The mdi_pathinfo node should have been locked with mdi_pi_lock()
26157c478bd9Sstevel@tonic-gate  */
26167c478bd9Sstevel@tonic-gate void
26177c478bd9Sstevel@tonic-gate mdi_pi_unlock(mdi_pathinfo_t *pip)
26187c478bd9Sstevel@tonic-gate {
26197c478bd9Sstevel@tonic-gate 	ASSERT(pip != NULL);
26207c478bd9Sstevel@tonic-gate 	if (pip) {
26217c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
26227c478bd9Sstevel@tonic-gate 	}
26237c478bd9Sstevel@tonic-gate }
26247c478bd9Sstevel@tonic-gate 
26257c478bd9Sstevel@tonic-gate /*
26267c478bd9Sstevel@tonic-gate  * mdi_pi_find():
26277c478bd9Sstevel@tonic-gate  *		Search the list of mdi_pathinfo nodes attached to the
26287c478bd9Sstevel@tonic-gate  *		pHCI/Client device node whose path address matches "paddr".
26297c478bd9Sstevel@tonic-gate  *		Returns a pointer to the mdi_pathinfo node if a matching node is
26307c478bd9Sstevel@tonic-gate  *		found.
26317c478bd9Sstevel@tonic-gate  * Return Values:
26327c478bd9Sstevel@tonic-gate  *		mdi_pathinfo node handle
26337c478bd9Sstevel@tonic-gate  *		NULL
26347c478bd9Sstevel@tonic-gate  * Notes:
26357c478bd9Sstevel@tonic-gate  *		Caller need not hold any locks to call this function.
26367c478bd9Sstevel@tonic-gate  */
26377c478bd9Sstevel@tonic-gate mdi_pathinfo_t *
26387c478bd9Sstevel@tonic-gate mdi_pi_find(dev_info_t *pdip, char *caddr, char *paddr)
26397c478bd9Sstevel@tonic-gate {
26407c478bd9Sstevel@tonic-gate 	mdi_phci_t		*ph;
26417c478bd9Sstevel@tonic-gate 	mdi_vhci_t		*vh;
26427c478bd9Sstevel@tonic-gate 	mdi_client_t		*ct;
26437c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t		*pip = NULL;
26447c478bd9Sstevel@tonic-gate 
26454c06356bSdh142964 	MDI_DEBUG(2, (MDI_NOTE, pdip,
26464c06356bSdh142964 	    "caddr@%s paddr@%s", caddr ? caddr : "", paddr ? paddr : ""));
26477c478bd9Sstevel@tonic-gate 	if ((pdip == NULL) || (paddr == NULL)) {
26487c478bd9Sstevel@tonic-gate 		return (NULL);
26497c478bd9Sstevel@tonic-gate 	}
26507c478bd9Sstevel@tonic-gate 	ph = i_devi_get_phci(pdip);
26517c478bd9Sstevel@tonic-gate 	if (ph == NULL) {
26527c478bd9Sstevel@tonic-gate 		/*
26537c478bd9Sstevel@tonic-gate 		 * Invalid pHCI device, Nothing more to do.
26547c478bd9Sstevel@tonic-gate 		 */
26554c06356bSdh142964 		MDI_DEBUG(2, (MDI_WARN, pdip, "invalid phci"));
26567c478bd9Sstevel@tonic-gate 		return (NULL);
26577c478bd9Sstevel@tonic-gate 	}
26587c478bd9Sstevel@tonic-gate 
26597c478bd9Sstevel@tonic-gate 	vh = ph->ph_vhci;
26607c478bd9Sstevel@tonic-gate 	if (vh == NULL) {
26617c478bd9Sstevel@tonic-gate 		/*
26627c478bd9Sstevel@tonic-gate 		 * Invalid vHCI device, Nothing more to do.
26637c478bd9Sstevel@tonic-gate 		 */
26644c06356bSdh142964 		MDI_DEBUG(2, (MDI_WARN, pdip, "invalid vhci"));
26657c478bd9Sstevel@tonic-gate 		return (NULL);
26667c478bd9Sstevel@tonic-gate 	}
26677c478bd9Sstevel@tonic-gate 
26687c478bd9Sstevel@tonic-gate 	/*
26695e3986cbScth 	 * Look for pathinfo node identified by paddr.
26707c478bd9Sstevel@tonic-gate 	 */
26717c478bd9Sstevel@tonic-gate 	if (caddr == NULL) {
26727c478bd9Sstevel@tonic-gate 		/*
26737c478bd9Sstevel@tonic-gate 		 * Find a mdi_pathinfo node under pHCI list for a matching
26747c478bd9Sstevel@tonic-gate 		 * unit address.
26757c478bd9Sstevel@tonic-gate 		 */
26765e3986cbScth 		MDI_PHCI_LOCK(ph);
26775e3986cbScth 		if (MDI_PHCI_IS_OFFLINE(ph)) {
26784c06356bSdh142964 			MDI_DEBUG(2, (MDI_WARN, pdip,
26794c06356bSdh142964 			    "offline phci %p", (void *)ph));
26805e3986cbScth 			MDI_PHCI_UNLOCK(ph);
26815e3986cbScth 			return (NULL);
26825e3986cbScth 		}
26837c478bd9Sstevel@tonic-gate 		pip = (mdi_pathinfo_t *)ph->ph_path_head;
26847c478bd9Sstevel@tonic-gate 
26857c478bd9Sstevel@tonic-gate 		while (pip != NULL) {
26867c478bd9Sstevel@tonic-gate 			if (strcmp(MDI_PI(pip)->pi_addr, paddr) == 0) {
26877c478bd9Sstevel@tonic-gate 				break;
26887c478bd9Sstevel@tonic-gate 			}
26897c478bd9Sstevel@tonic-gate 			pip = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
26907c478bd9Sstevel@tonic-gate 		}
26915e3986cbScth 		MDI_PHCI_UNLOCK(ph);
26924c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, pdip,
26934c06356bSdh142964 		    "found %s %p", mdi_pi_spathname(pip), (void *)pip));
26947c478bd9Sstevel@tonic-gate 		return (pip);
26957c478bd9Sstevel@tonic-gate 	}
26967c478bd9Sstevel@tonic-gate 
26977c478bd9Sstevel@tonic-gate 	/*
26983c34adc5Sramat 	 * XXX - Is the rest of the code in this function really necessary?
26993c34adc5Sramat 	 * The consumers of mdi_pi_find() can search for the desired pathinfo
27003c34adc5Sramat 	 * node by calling mdi_pi_find(pdip, NULL, paddr). Irrespective of
27013c34adc5Sramat 	 * whether the search is based on the pathinfo nodes attached to
27023c34adc5Sramat 	 * the pHCI or the client node, the result will be the same.
27033c34adc5Sramat 	 */
27043c34adc5Sramat 
27053c34adc5Sramat 	/*
27067c478bd9Sstevel@tonic-gate 	 * Find the client device corresponding to 'caddr'
27077c478bd9Sstevel@tonic-gate 	 */
27085e3986cbScth 	MDI_VHCI_CLIENT_LOCK(vh);
27093c34adc5Sramat 
27103c34adc5Sramat 	/*
27113c34adc5Sramat 	 * XXX - Passing NULL to the following function works as long as the
27123c34adc5Sramat 	 * the client addresses (caddr) are unique per vhci basis.
27133c34adc5Sramat 	 */
27143c34adc5Sramat 	ct = i_mdi_client_find(vh, NULL, caddr);
27157c478bd9Sstevel@tonic-gate 	if (ct == NULL) {
27167c478bd9Sstevel@tonic-gate 		/*
27177c478bd9Sstevel@tonic-gate 		 * Client not found, Obviously mdi_pathinfo node has not been
27187c478bd9Sstevel@tonic-gate 		 * created yet.
27197c478bd9Sstevel@tonic-gate 		 */
27205e3986cbScth 		MDI_VHCI_CLIENT_UNLOCK(vh);
27214c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, pdip,
27224c06356bSdh142964 		    "client not found for caddr @%s", caddr ? caddr : ""));
27235e3986cbScth 		return (NULL);
27247c478bd9Sstevel@tonic-gate 	}
27257c478bd9Sstevel@tonic-gate 
27267c478bd9Sstevel@tonic-gate 	/*
27277c478bd9Sstevel@tonic-gate 	 * Hold the client lock and look for a mdi_pathinfo node with matching
27287c478bd9Sstevel@tonic-gate 	 * pHCI and paddr
27297c478bd9Sstevel@tonic-gate 	 */
27307c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
27317c478bd9Sstevel@tonic-gate 
27327c478bd9Sstevel@tonic-gate 	/*
27337c478bd9Sstevel@tonic-gate 	 * Release the global mutex as it is no more needed. Note: We always
27347c478bd9Sstevel@tonic-gate 	 * respect the locking order while acquiring.
27357c478bd9Sstevel@tonic-gate 	 */
27365e3986cbScth 	MDI_VHCI_CLIENT_UNLOCK(vh);
27377c478bd9Sstevel@tonic-gate 
27387c478bd9Sstevel@tonic-gate 	pip = (mdi_pathinfo_t *)ct->ct_path_head;
27397c478bd9Sstevel@tonic-gate 	while (pip != NULL) {
27407c478bd9Sstevel@tonic-gate 		/*
27417c478bd9Sstevel@tonic-gate 		 * Compare the unit address
27427c478bd9Sstevel@tonic-gate 		 */
27437c478bd9Sstevel@tonic-gate 		if ((MDI_PI(pip)->pi_phci == ph) &&
27447c478bd9Sstevel@tonic-gate 		    strcmp(MDI_PI(pip)->pi_addr, paddr) == 0) {
27457c478bd9Sstevel@tonic-gate 			break;
27467c478bd9Sstevel@tonic-gate 		}
27477c478bd9Sstevel@tonic-gate 		pip = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link;
27487c478bd9Sstevel@tonic-gate 	}
27497c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
27504c06356bSdh142964 	MDI_DEBUG(2, (MDI_NOTE, pdip,
27514c06356bSdh142964 	    "found: %s %p", mdi_pi_spathname(pip), (void *)pip));
27527c478bd9Sstevel@tonic-gate 	return (pip);
27537c478bd9Sstevel@tonic-gate }
27547c478bd9Sstevel@tonic-gate 
27557c478bd9Sstevel@tonic-gate /*
27567c478bd9Sstevel@tonic-gate  * mdi_pi_alloc():
27577c478bd9Sstevel@tonic-gate  *		Allocate and initialize a new instance of a mdi_pathinfo node.
27587c478bd9Sstevel@tonic-gate  *		The mdi_pathinfo node returned by this function identifies a
27597c478bd9Sstevel@tonic-gate  *		unique device path is capable of having properties attached
27607c478bd9Sstevel@tonic-gate  *		and passed to mdi_pi_online() to fully attach and online the
27617c478bd9Sstevel@tonic-gate  *		path and client device node.
27627c478bd9Sstevel@tonic-gate  *		The mdi_pathinfo node returned by this function must be
27637c478bd9Sstevel@tonic-gate  *		destroyed using mdi_pi_free() if the path is no longer
27647c478bd9Sstevel@tonic-gate  *		operational or if the caller fails to attach a client device
27657c478bd9Sstevel@tonic-gate  *		node when calling mdi_pi_online(). The framework will not free
27667c478bd9Sstevel@tonic-gate  *		the resources allocated.
27677c478bd9Sstevel@tonic-gate  *		This function can be called from both interrupt and kernel
27687c478bd9Sstevel@tonic-gate  *		contexts.  DDI_NOSLEEP flag should be used while calling
27697c478bd9Sstevel@tonic-gate  *		from interrupt contexts.
27707c478bd9Sstevel@tonic-gate  * Return Values:
27717c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
27727c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
27737c478bd9Sstevel@tonic-gate  *		MDI_NOMEM
27747c478bd9Sstevel@tonic-gate  */
27757c478bd9Sstevel@tonic-gate /*ARGSUSED*/
27767c478bd9Sstevel@tonic-gate int
27777c478bd9Sstevel@tonic-gate mdi_pi_alloc_compatible(dev_info_t *pdip, char *cname, char *caddr, char *paddr,
27787c478bd9Sstevel@tonic-gate     char **compatible, int ncompatible, int flags, mdi_pathinfo_t **ret_pip)
27797c478bd9Sstevel@tonic-gate {
27807c478bd9Sstevel@tonic-gate 	mdi_vhci_t	*vh;
27817c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
27827c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
27837c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*pip = NULL;
27847c478bd9Sstevel@tonic-gate 	dev_info_t	*cdip;
27857c478bd9Sstevel@tonic-gate 	int		rv = MDI_NOMEM;
27863c34adc5Sramat 	int		path_allocated = 0;
27877c478bd9Sstevel@tonic-gate 
27884c06356bSdh142964 	MDI_DEBUG(2, (MDI_NOTE, pdip,
27894c06356bSdh142964 	    "cname %s: caddr@%s paddr@%s",
27904c06356bSdh142964 	    cname ? cname : "", caddr ? caddr : "", paddr ? paddr : ""));
27915e3986cbScth 
27927c478bd9Sstevel@tonic-gate 	if (pdip == NULL || cname == NULL || caddr == NULL || paddr == NULL ||
27937c478bd9Sstevel@tonic-gate 	    ret_pip == NULL) {
27947c478bd9Sstevel@tonic-gate 		/* Nothing more to do */
27957c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
27967c478bd9Sstevel@tonic-gate 	}
27977c478bd9Sstevel@tonic-gate 
27987c478bd9Sstevel@tonic-gate 	*ret_pip = NULL;
27995e3986cbScth 
28005e3986cbScth 	/* No allocations on detaching pHCI */
28015e3986cbScth 	if (DEVI_IS_DETACHING(pdip)) {
28025e3986cbScth 		/* Invalid pHCI device, return failure */
28034c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, pdip,
28044c06356bSdh142964 		    "!detaching pHCI=%p", (void *)pdip));
28055e3986cbScth 		return (MDI_FAILURE);
28065e3986cbScth 	}
28075e3986cbScth 
28087c478bd9Sstevel@tonic-gate 	ph = i_devi_get_phci(pdip);
28097c478bd9Sstevel@tonic-gate 	ASSERT(ph != NULL);
28107c478bd9Sstevel@tonic-gate 	if (ph == NULL) {
28117c478bd9Sstevel@tonic-gate 		/* Invalid pHCI device, return failure */
28124c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, pdip,
28134c06356bSdh142964 		    "!invalid pHCI=%p", (void *)pdip));
28147c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
28157c478bd9Sstevel@tonic-gate 	}
28167c478bd9Sstevel@tonic-gate 
28177c478bd9Sstevel@tonic-gate 	MDI_PHCI_LOCK(ph);
28187c478bd9Sstevel@tonic-gate 	vh = ph->ph_vhci;
28197c478bd9Sstevel@tonic-gate 	if (vh == NULL) {
28207c478bd9Sstevel@tonic-gate 		/* Invalid vHCI device, return failure */
28214c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, pdip,
28224c06356bSdh142964 		    "!invalid vHCI=%p", (void *)pdip));
28237c478bd9Sstevel@tonic-gate 		MDI_PHCI_UNLOCK(ph);
28247c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
28257c478bd9Sstevel@tonic-gate 	}
28267c478bd9Sstevel@tonic-gate 
28277c478bd9Sstevel@tonic-gate 	if (MDI_PHCI_IS_READY(ph) == 0) {
28287c478bd9Sstevel@tonic-gate 		/*
28297c478bd9Sstevel@tonic-gate 		 * Do not allow new node creation when pHCI is in
28307c478bd9Sstevel@tonic-gate 		 * offline/suspended states
28317c478bd9Sstevel@tonic-gate 		 */
28324c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, pdip,
28334c06356bSdh142964 		    "pHCI=%p is not ready", (void *)ph));
28347c478bd9Sstevel@tonic-gate 		MDI_PHCI_UNLOCK(ph);
28357c478bd9Sstevel@tonic-gate 		return (MDI_BUSY);
28367c478bd9Sstevel@tonic-gate 	}
28377c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNSTABLE(ph);
28387c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNLOCK(ph);
28397c478bd9Sstevel@tonic-gate 
28403c34adc5Sramat 	/* look for a matching client, create one if not found */
28415e3986cbScth 	MDI_VHCI_CLIENT_LOCK(vh);
28423c34adc5Sramat 	ct = i_mdi_client_find(vh, cname, caddr);
28437c478bd9Sstevel@tonic-gate 	if (ct == NULL) {
28443c34adc5Sramat 		ct = i_mdi_client_alloc(vh, cname, caddr);
28453c34adc5Sramat 		ASSERT(ct != NULL);
28467c478bd9Sstevel@tonic-gate 	}
28477c478bd9Sstevel@tonic-gate 
28487c478bd9Sstevel@tonic-gate 	if (ct->ct_dip == NULL) {
28497c478bd9Sstevel@tonic-gate 		/*
28507c478bd9Sstevel@tonic-gate 		 * Allocate a devinfo node
28517c478bd9Sstevel@tonic-gate 		 */
28527c478bd9Sstevel@tonic-gate 		ct->ct_dip = i_mdi_devinfo_create(vh, cname, caddr,
28533c34adc5Sramat 		    compatible, ncompatible);
28547c478bd9Sstevel@tonic-gate 		if (ct->ct_dip == NULL) {
28557c478bd9Sstevel@tonic-gate 			(void) i_mdi_client_free(vh, ct);
28567c478bd9Sstevel@tonic-gate 			goto fail;
28577c478bd9Sstevel@tonic-gate 		}
28587c478bd9Sstevel@tonic-gate 	}
28597c478bd9Sstevel@tonic-gate 	cdip = ct->ct_dip;
28607c478bd9Sstevel@tonic-gate 
28617c478bd9Sstevel@tonic-gate 	DEVI(cdip)->devi_mdi_component |= MDI_COMPONENT_CLIENT;
28627c478bd9Sstevel@tonic-gate 	DEVI(cdip)->devi_mdi_client = (caddr_t)ct;
28637c478bd9Sstevel@tonic-gate 
28645e3986cbScth 	MDI_CLIENT_LOCK(ct);
28657c478bd9Sstevel@tonic-gate 	pip = (mdi_pathinfo_t *)ct->ct_path_head;
28667c478bd9Sstevel@tonic-gate 	while (pip != NULL) {
28677c478bd9Sstevel@tonic-gate 		/*
28687c478bd9Sstevel@tonic-gate 		 * Compare the unit address
28697c478bd9Sstevel@tonic-gate 		 */
28707c478bd9Sstevel@tonic-gate 		if ((MDI_PI(pip)->pi_phci == ph) &&
28717c478bd9Sstevel@tonic-gate 		    strcmp(MDI_PI(pip)->pi_addr, paddr) == 0) {
28727c478bd9Sstevel@tonic-gate 			break;
28737c478bd9Sstevel@tonic-gate 		}
28747c478bd9Sstevel@tonic-gate 		pip = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link;
28757c478bd9Sstevel@tonic-gate 	}
28765e3986cbScth 	MDI_CLIENT_UNLOCK(ct);
28777c478bd9Sstevel@tonic-gate 
28787c478bd9Sstevel@tonic-gate 	if (pip == NULL) {
28797c478bd9Sstevel@tonic-gate 		/*
28807c478bd9Sstevel@tonic-gate 		 * This is a new path for this client device.  Allocate and
28817c478bd9Sstevel@tonic-gate 		 * initialize a new pathinfo node
28827c478bd9Sstevel@tonic-gate 		 */
28833c34adc5Sramat 		pip = i_mdi_pi_alloc(ph, paddr, ct);
28843c34adc5Sramat 		ASSERT(pip != NULL);
28853c34adc5Sramat 		path_allocated = 1;
28867c478bd9Sstevel@tonic-gate 	}
28877c478bd9Sstevel@tonic-gate 	rv = MDI_SUCCESS;
28887c478bd9Sstevel@tonic-gate 
28897c478bd9Sstevel@tonic-gate fail:
28907c478bd9Sstevel@tonic-gate 	/*
28917c478bd9Sstevel@tonic-gate 	 * Release the global mutex.
28927c478bd9Sstevel@tonic-gate 	 */
28935e3986cbScth 	MDI_VHCI_CLIENT_UNLOCK(vh);
28947c478bd9Sstevel@tonic-gate 
28957c478bd9Sstevel@tonic-gate 	/*
28967c478bd9Sstevel@tonic-gate 	 * Mark the pHCI as stable
28977c478bd9Sstevel@tonic-gate 	 */
28987c478bd9Sstevel@tonic-gate 	MDI_PHCI_LOCK(ph);
28997c478bd9Sstevel@tonic-gate 	MDI_PHCI_STABLE(ph);
29007c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNLOCK(ph);
29017c478bd9Sstevel@tonic-gate 	*ret_pip = pip;
29023c34adc5Sramat 
29034c06356bSdh142964 	MDI_DEBUG(2, (MDI_NOTE, pdip,
29044c06356bSdh142964 	    "alloc %s %p", mdi_pi_spathname(pip), (void *)pip));
29055e3986cbScth 
29063c34adc5Sramat 	if (path_allocated)
29073c34adc5Sramat 		vhcache_pi_add(vh->vh_config, MDI_PI(pip));
29083c34adc5Sramat 
29097c478bd9Sstevel@tonic-gate 	return (rv);
29107c478bd9Sstevel@tonic-gate }
29117c478bd9Sstevel@tonic-gate 
29127c478bd9Sstevel@tonic-gate /*ARGSUSED*/
29137c478bd9Sstevel@tonic-gate int
29147c478bd9Sstevel@tonic-gate mdi_pi_alloc(dev_info_t *pdip, char *cname, char *caddr, char *paddr,
29157c478bd9Sstevel@tonic-gate     int flags, mdi_pathinfo_t **ret_pip)
29167c478bd9Sstevel@tonic-gate {
29177c478bd9Sstevel@tonic-gate 	return (mdi_pi_alloc_compatible(pdip, cname, caddr, paddr, NULL, 0,
29187c478bd9Sstevel@tonic-gate 	    flags, ret_pip));
29197c478bd9Sstevel@tonic-gate }
29207c478bd9Sstevel@tonic-gate 
29217c478bd9Sstevel@tonic-gate /*
29227c478bd9Sstevel@tonic-gate  * i_mdi_pi_alloc():
29237c478bd9Sstevel@tonic-gate  *		Allocate a mdi_pathinfo node and add to the pHCI path list
29247c478bd9Sstevel@tonic-gate  * Return Values:
29257c478bd9Sstevel@tonic-gate  *		mdi_pathinfo
29267c478bd9Sstevel@tonic-gate  */
29277c478bd9Sstevel@tonic-gate /*ARGSUSED*/
29287c478bd9Sstevel@tonic-gate static mdi_pathinfo_t *
29293c34adc5Sramat i_mdi_pi_alloc(mdi_phci_t *ph, char *paddr, mdi_client_t *ct)
29307c478bd9Sstevel@tonic-gate {
29313c34adc5Sramat 	mdi_pathinfo_t	*pip;
29327c478bd9Sstevel@tonic-gate 	int		ct_circular;
29337c478bd9Sstevel@tonic-gate 	int		ph_circular;
29344c06356bSdh142964 	static char	path[MAXPATHLEN];	/* mdi_pathmap_mutex protects */
2935602ca9eaScth 	char		*path_persistent;
2936602ca9eaScth 	int		path_instance;
2937602ca9eaScth 	mod_hash_val_t	hv;
29387c478bd9Sstevel@tonic-gate 
29395e3986cbScth 	ASSERT(MDI_VHCI_CLIENT_LOCKED(ph->ph_vhci));
29405e3986cbScth 
29413c34adc5Sramat 	pip = kmem_zalloc(sizeof (struct mdi_pathinfo), KM_SLEEP);
29427c478bd9Sstevel@tonic-gate 	mutex_init(&MDI_PI(pip)->pi_mutex, NULL, MUTEX_DEFAULT, NULL);
29437c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_state = MDI_PATHINFO_STATE_INIT |
29447c478bd9Sstevel@tonic-gate 	    MDI_PATHINFO_STATE_TRANSIENT;
29457c478bd9Sstevel@tonic-gate 
29467c478bd9Sstevel@tonic-gate 	if (MDI_PHCI_IS_USER_DISABLED(ph))
29477c478bd9Sstevel@tonic-gate 		MDI_PI_SET_USER_DISABLE(pip);
29487c478bd9Sstevel@tonic-gate 
29497c478bd9Sstevel@tonic-gate 	if (MDI_PHCI_IS_DRV_DISABLED_TRANSIENT(ph))
29507c478bd9Sstevel@tonic-gate 		MDI_PI_SET_DRV_DISABLE_TRANS(pip);
29517c478bd9Sstevel@tonic-gate 
29527c478bd9Sstevel@tonic-gate 	if (MDI_PHCI_IS_DRV_DISABLED(ph))
29537c478bd9Sstevel@tonic-gate 		MDI_PI_SET_DRV_DISABLE(pip);
29547c478bd9Sstevel@tonic-gate 
29557c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_old_state = MDI_PATHINFO_STATE_INIT;
29567c478bd9Sstevel@tonic-gate 	cv_init(&MDI_PI(pip)->pi_state_cv, NULL, CV_DEFAULT, NULL);
29577c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_client = ct;
29587c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_phci = ph;
29593c34adc5Sramat 	MDI_PI(pip)->pi_addr = kmem_alloc(strlen(paddr) + 1, KM_SLEEP);
29607c478bd9Sstevel@tonic-gate 	(void) strcpy(MDI_PI(pip)->pi_addr, paddr);
2961602ca9eaScth 
2962602ca9eaScth         /*
2963602ca9eaScth 	 * We form the "path" to the pathinfo node, and see if we have
2964602ca9eaScth 	 * already allocated a 'path_instance' for that "path".  If so,
2965602ca9eaScth 	 * we use the already allocated 'path_instance'.  If not, we
2966602ca9eaScth 	 * allocate a new 'path_instance' and associate it with a copy of
2967602ca9eaScth 	 * the "path" string (which is never freed). The association
2968602ca9eaScth 	 * between a 'path_instance' this "path" string persists until
2969602ca9eaScth 	 * reboot.
2970602ca9eaScth 	 */
2971602ca9eaScth         mutex_enter(&mdi_pathmap_mutex);
2972602ca9eaScth 	(void) ddi_pathname(ph->ph_dip, path);
2973602ca9eaScth 	(void) sprintf(path + strlen(path), "/%s@%s",
297455e592a2SRandall Ralphs 	    mdi_pi_get_node_name(pip), mdi_pi_get_addr(pip));
2975602ca9eaScth         if (mod_hash_find(mdi_pathmap_bypath, (mod_hash_key_t)path, &hv) == 0) {
2976602ca9eaScth                 path_instance = (uint_t)(intptr_t)hv;
2977602ca9eaScth         } else {
2978602ca9eaScth 		/* allocate a new 'path_instance' and persistent "path" */
2979602ca9eaScth 		path_instance = mdi_pathmap_instance++;
2980602ca9eaScth 		path_persistent = i_ddi_strdup(path, KM_SLEEP);
2981602ca9eaScth                 (void) mod_hash_insert(mdi_pathmap_bypath,
2982602ca9eaScth                     (mod_hash_key_t)path_persistent,
2983602ca9eaScth                     (mod_hash_val_t)(intptr_t)path_instance);
2984602ca9eaScth 		(void) mod_hash_insert(mdi_pathmap_byinstance,
2985602ca9eaScth 		    (mod_hash_key_t)(intptr_t)path_instance,
2986602ca9eaScth 		    (mod_hash_val_t)path_persistent);
29874c06356bSdh142964 
29884c06356bSdh142964 		/* create shortpath name */
29894c06356bSdh142964 		(void) snprintf(path, sizeof(path), "%s%d/%s@%s",
29904c06356bSdh142964 		    ddi_driver_name(ph->ph_dip), ddi_get_instance(ph->ph_dip),
29914c06356bSdh142964 		    mdi_pi_get_node_name(pip), mdi_pi_get_addr(pip));
29924c06356bSdh142964 		path_persistent = i_ddi_strdup(path, KM_SLEEP);
29934c06356bSdh142964 		(void) mod_hash_insert(mdi_pathmap_sbyinstance,
29944c06356bSdh142964 		    (mod_hash_key_t)(intptr_t)path_instance,
29954c06356bSdh142964 		    (mod_hash_val_t)path_persistent);
2996602ca9eaScth         }
2997602ca9eaScth         mutex_exit(&mdi_pathmap_mutex);
2998602ca9eaScth 	MDI_PI(pip)->pi_path_instance = path_instance;
2999602ca9eaScth 
30003c34adc5Sramat 	(void) nvlist_alloc(&MDI_PI(pip)->pi_prop, NV_UNIQUE_NAME, KM_SLEEP);
30013c34adc5Sramat 	ASSERT(MDI_PI(pip)->pi_prop != NULL);
30027c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_pprivate = NULL;
30037c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_cprivate = NULL;
30047c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_vprivate = NULL;
30057c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_client_link = NULL;
30067c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_phci_link = NULL;
30077c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_ref_cnt = 0;
30087c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_kstats = NULL;
30097c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_preferred = 1;
30107c478bd9Sstevel@tonic-gate 	cv_init(&MDI_PI(pip)->pi_ref_cv, NULL, CV_DEFAULT, NULL);
30117c478bd9Sstevel@tonic-gate 
30127c478bd9Sstevel@tonic-gate 	/*
30137c478bd9Sstevel@tonic-gate 	 * Lock both dev_info nodes against changes in parallel.
30145e3986cbScth 	 *
30155e3986cbScth 	 * The ndi_devi_enter(Client), is atypical since the client is a leaf.
30165e3986cbScth 	 * This atypical operation is done to synchronize pathinfo nodes
30175e3986cbScth 	 * during devinfo snapshot (see di_register_pip) by 'pretending' that
30185e3986cbScth 	 * the pathinfo nodes are children of the Client.
30197c478bd9Sstevel@tonic-gate 	 */
30207c478bd9Sstevel@tonic-gate 	ndi_devi_enter(ct->ct_dip, &ct_circular);
30217c478bd9Sstevel@tonic-gate 	ndi_devi_enter(ph->ph_dip, &ph_circular);
30227c478bd9Sstevel@tonic-gate 
30237c478bd9Sstevel@tonic-gate 	i_mdi_phci_add_path(ph, pip);
30247c478bd9Sstevel@tonic-gate 	i_mdi_client_add_path(ct, pip);
30257c478bd9Sstevel@tonic-gate 
30267c478bd9Sstevel@tonic-gate 	ndi_devi_exit(ph->ph_dip, ph_circular);
30277c478bd9Sstevel@tonic-gate 	ndi_devi_exit(ct->ct_dip, ct_circular);
30287c478bd9Sstevel@tonic-gate 
30297c478bd9Sstevel@tonic-gate 	return (pip);
30307c478bd9Sstevel@tonic-gate }
30317c478bd9Sstevel@tonic-gate 
30327c478bd9Sstevel@tonic-gate /*
3033602ca9eaScth  * mdi_pi_pathname_by_instance():
3034602ca9eaScth  *	Lookup of "path" by 'path_instance'. Return "path".
3035602ca9eaScth  *	NOTE: returned "path" remains valid forever (until reboot).
3036602ca9eaScth  */
3037602ca9eaScth char *
3038602ca9eaScth mdi_pi_pathname_by_instance(int path_instance)
3039602ca9eaScth {
3040602ca9eaScth 	char		*path;
3041602ca9eaScth 	mod_hash_val_t	hv;
3042602ca9eaScth 
3043602ca9eaScth 	/* mdi_pathmap lookup of "path" by 'path_instance' */
3044602ca9eaScth 	mutex_enter(&mdi_pathmap_mutex);
3045602ca9eaScth 	if (mod_hash_find(mdi_pathmap_byinstance,
3046602ca9eaScth 	    (mod_hash_key_t)(intptr_t)path_instance, &hv) == 0)
3047602ca9eaScth 		path = (char *)hv;
3048602ca9eaScth 	else
3049602ca9eaScth 		path = NULL;
3050602ca9eaScth 	mutex_exit(&mdi_pathmap_mutex);
3051602ca9eaScth 	return (path);
3052602ca9eaScth }
3053602ca9eaScth 
3054602ca9eaScth /*
30554c06356bSdh142964  * mdi_pi_spathname_by_instance():
30564c06356bSdh142964  *	Lookup of "shortpath" by 'path_instance'. Return "shortpath".
30574c06356bSdh142964  *	NOTE: returned "shortpath" remains valid forever (until reboot).
30584c06356bSdh142964  */
30594c06356bSdh142964 char *
30604c06356bSdh142964 mdi_pi_spathname_by_instance(int path_instance)
30614c06356bSdh142964 {
30624c06356bSdh142964 	char		*path;
30634c06356bSdh142964 	mod_hash_val_t	hv;
30644c06356bSdh142964 
30654c06356bSdh142964 	/* mdi_pathmap lookup of "path" by 'path_instance' */
30664c06356bSdh142964 	mutex_enter(&mdi_pathmap_mutex);
30674c06356bSdh142964 	if (mod_hash_find(mdi_pathmap_sbyinstance,
30684c06356bSdh142964 	    (mod_hash_key_t)(intptr_t)path_instance, &hv) == 0)
30694c06356bSdh142964 		path = (char *)hv;
30704c06356bSdh142964 	else
30714c06356bSdh142964 		path = NULL;
30724c06356bSdh142964 	mutex_exit(&mdi_pathmap_mutex);
30734c06356bSdh142964 	return (path);
30744c06356bSdh142964 }
30754c06356bSdh142964 
30764c06356bSdh142964 
30774c06356bSdh142964 /*
30787c478bd9Sstevel@tonic-gate  * i_mdi_phci_add_path():
30797c478bd9Sstevel@tonic-gate  * 		Add a mdi_pathinfo node to pHCI list.
30807c478bd9Sstevel@tonic-gate  * Notes:
30817c478bd9Sstevel@tonic-gate  *		Caller should per-pHCI mutex
30827c478bd9Sstevel@tonic-gate  */
30837c478bd9Sstevel@tonic-gate static void
30847c478bd9Sstevel@tonic-gate i_mdi_phci_add_path(mdi_phci_t *ph, mdi_pathinfo_t *pip)
30857c478bd9Sstevel@tonic-gate {
30867c478bd9Sstevel@tonic-gate 	ASSERT(DEVI_BUSY_OWNED(ph->ph_dip));
30877c478bd9Sstevel@tonic-gate 
30885e3986cbScth 	MDI_PHCI_LOCK(ph);
30897c478bd9Sstevel@tonic-gate 	if (ph->ph_path_head == NULL) {
30907c478bd9Sstevel@tonic-gate 		ph->ph_path_head = pip;
30917c478bd9Sstevel@tonic-gate 	} else {
30927c478bd9Sstevel@tonic-gate 		MDI_PI(ph->ph_path_tail)->pi_phci_link = MDI_PI(pip);
30937c478bd9Sstevel@tonic-gate 	}
30947c478bd9Sstevel@tonic-gate 	ph->ph_path_tail = pip;
30957c478bd9Sstevel@tonic-gate 	ph->ph_path_count++;
30965e3986cbScth 	MDI_PHCI_UNLOCK(ph);
30977c478bd9Sstevel@tonic-gate }
30987c478bd9Sstevel@tonic-gate 
30997c478bd9Sstevel@tonic-gate /*
31007c478bd9Sstevel@tonic-gate  * i_mdi_client_add_path():
31017c478bd9Sstevel@tonic-gate  *		Add mdi_pathinfo node to client list
31027c478bd9Sstevel@tonic-gate  */
31037c478bd9Sstevel@tonic-gate static void
31047c478bd9Sstevel@tonic-gate i_mdi_client_add_path(mdi_client_t *ct, mdi_pathinfo_t *pip)
31057c478bd9Sstevel@tonic-gate {
31067c478bd9Sstevel@tonic-gate 	ASSERT(DEVI_BUSY_OWNED(ct->ct_dip));
31077c478bd9Sstevel@tonic-gate 
31085e3986cbScth 	MDI_CLIENT_LOCK(ct);
31097c478bd9Sstevel@tonic-gate 	if (ct->ct_path_head == NULL) {
31107c478bd9Sstevel@tonic-gate 		ct->ct_path_head = pip;
31117c478bd9Sstevel@tonic-gate 	} else {
31127c478bd9Sstevel@tonic-gate 		MDI_PI(ct->ct_path_tail)->pi_client_link = MDI_PI(pip);
31137c478bd9Sstevel@tonic-gate 	}
31147c478bd9Sstevel@tonic-gate 	ct->ct_path_tail = pip;
31157c478bd9Sstevel@tonic-gate 	ct->ct_path_count++;
31165e3986cbScth 	MDI_CLIENT_UNLOCK(ct);
31177c478bd9Sstevel@tonic-gate }
31187c478bd9Sstevel@tonic-gate 
31197c478bd9Sstevel@tonic-gate /*
31207c478bd9Sstevel@tonic-gate  * mdi_pi_free():
31217c478bd9Sstevel@tonic-gate  *		Free the mdi_pathinfo node and also client device node if this
31227c478bd9Sstevel@tonic-gate  *		is the last path to the device
31237c478bd9Sstevel@tonic-gate  * Return Values:
31247c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
31257c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
31267c478bd9Sstevel@tonic-gate  *		MDI_BUSY
31277c478bd9Sstevel@tonic-gate  */
31287c478bd9Sstevel@tonic-gate /*ARGSUSED*/
31297c478bd9Sstevel@tonic-gate int
31307c478bd9Sstevel@tonic-gate mdi_pi_free(mdi_pathinfo_t *pip, int flags)
31317c478bd9Sstevel@tonic-gate {
3132e9b79356Srs135747 	int		rv = MDI_FAILURE;
31337c478bd9Sstevel@tonic-gate 	mdi_vhci_t	*vh;
31347c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
31357c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
31367c478bd9Sstevel@tonic-gate 	int		(*f)();
31377c478bd9Sstevel@tonic-gate 	int		client_held = 0;
31387c478bd9Sstevel@tonic-gate 
31397c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
31407c478bd9Sstevel@tonic-gate 	ph = MDI_PI(pip)->pi_phci;
31417c478bd9Sstevel@tonic-gate 	ASSERT(ph != NULL);
31427c478bd9Sstevel@tonic-gate 	if (ph == NULL) {
31437c478bd9Sstevel@tonic-gate 		/*
31447c478bd9Sstevel@tonic-gate 		 * Invalid pHCI device, return failure
31457c478bd9Sstevel@tonic-gate 		 */
31464c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, NULL,
31474c06356bSdh142964 		    "!invalid pHCI: pip %s %p",
31484c06356bSdh142964 		    mdi_pi_spathname(pip), (void *)pip));
31497c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
31507c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
31517c478bd9Sstevel@tonic-gate 	}
31527c478bd9Sstevel@tonic-gate 
31537c478bd9Sstevel@tonic-gate 	vh = ph->ph_vhci;
31547c478bd9Sstevel@tonic-gate 	ASSERT(vh != NULL);
31557c478bd9Sstevel@tonic-gate 	if (vh == NULL) {
31567c478bd9Sstevel@tonic-gate 		/* Invalid pHCI device, return failure */
31574c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, ph->ph_dip,
31584c06356bSdh142964 		    "!invalid vHCI: pip %s %p",
31594c06356bSdh142964 		    mdi_pi_spathname(pip), (void *)pip));
31607c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
31617c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
31627c478bd9Sstevel@tonic-gate 	}
31637c478bd9Sstevel@tonic-gate 
31647c478bd9Sstevel@tonic-gate 	ct = MDI_PI(pip)->pi_client;
31657c478bd9Sstevel@tonic-gate 	ASSERT(ct != NULL);
31667c478bd9Sstevel@tonic-gate 	if (ct == NULL) {
31677c478bd9Sstevel@tonic-gate 		/*
31687c478bd9Sstevel@tonic-gate 		 * Invalid Client device, return failure
31697c478bd9Sstevel@tonic-gate 		 */
31704c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, ph->ph_dip,
31714c06356bSdh142964 		    "!invalid client: pip %s %p",
31724c06356bSdh142964 		    mdi_pi_spathname(pip), (void *)pip));
31737c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
31747c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
31757c478bd9Sstevel@tonic-gate 	}
31767c478bd9Sstevel@tonic-gate 
31777c478bd9Sstevel@tonic-gate 	/*
31787c478bd9Sstevel@tonic-gate 	 * Check to see for busy condition.  A mdi_pathinfo can only be freed
31797c478bd9Sstevel@tonic-gate 	 * if the node state is either offline or init and the reference count
31807c478bd9Sstevel@tonic-gate 	 * is zero.
31817c478bd9Sstevel@tonic-gate 	 */
31827c478bd9Sstevel@tonic-gate 	if (!(MDI_PI_IS_OFFLINE(pip) || MDI_PI_IS_INIT(pip) ||
31837c478bd9Sstevel@tonic-gate 	    MDI_PI_IS_INITING(pip))) {
31847c478bd9Sstevel@tonic-gate 		/*
31857c478bd9Sstevel@tonic-gate 		 * Node is busy
31867c478bd9Sstevel@tonic-gate 		 */
31874c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, ct->ct_dip,
31884c06356bSdh142964 		    "!busy: pip %s %p", mdi_pi_spathname(pip), (void *)pip));
31897c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
31907c478bd9Sstevel@tonic-gate 		return (MDI_BUSY);
31917c478bd9Sstevel@tonic-gate 	}
31927c478bd9Sstevel@tonic-gate 
31937c478bd9Sstevel@tonic-gate 	while (MDI_PI(pip)->pi_ref_cnt != 0) {
31947c478bd9Sstevel@tonic-gate 		/*
31957c478bd9Sstevel@tonic-gate 		 * Give a chance for pending I/Os to complete.
31967c478bd9Sstevel@tonic-gate 		 */
31974c06356bSdh142964 		MDI_DEBUG(1, (MDI_NOTE, ct->ct_dip,
31984c06356bSdh142964 		    "!%d cmds still pending on path: %s %p",
31994c06356bSdh142964 		    MDI_PI(pip)->pi_ref_cnt,
32004c06356bSdh142964 		    mdi_pi_spathname(pip), (void *)pip));
32017c478bd9Sstevel@tonic-gate 		if (cv_timedwait(&MDI_PI(pip)->pi_ref_cv,
32027c478bd9Sstevel@tonic-gate 		    &MDI_PI(pip)->pi_mutex,
32037c478bd9Sstevel@tonic-gate 		    ddi_get_lbolt() + drv_usectohz(60 * 1000000)) == -1) {
32047c478bd9Sstevel@tonic-gate 			/*
32057c478bd9Sstevel@tonic-gate 			 * The timeout time reached without ref_cnt being zero
32067c478bd9Sstevel@tonic-gate 			 * being signaled.
32077c478bd9Sstevel@tonic-gate 			 */
32084c06356bSdh142964 			MDI_DEBUG(1, (MDI_NOTE, ct->ct_dip,
32094c06356bSdh142964 			    "!Timeout reached on path %s %p without the cond",
32104c06356bSdh142964 			    mdi_pi_spathname(pip), (void *)pip));
32114c06356bSdh142964 			MDI_DEBUG(1, (MDI_NOTE, ct->ct_dip,
32124c06356bSdh142964 			    "!%d cmds still pending on path %s %p",
32134c06356bSdh142964 			    MDI_PI(pip)->pi_ref_cnt,
32144c06356bSdh142964 			    mdi_pi_spathname(pip), (void *)pip));
32157c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
32167c478bd9Sstevel@tonic-gate 			return (MDI_BUSY);
32177c478bd9Sstevel@tonic-gate 		}
32187c478bd9Sstevel@tonic-gate 	}
32197c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_pm_held) {
32207c478bd9Sstevel@tonic-gate 		client_held = 1;
32217c478bd9Sstevel@tonic-gate 	}
32227c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
32237c478bd9Sstevel@tonic-gate 
32243c34adc5Sramat 	vhcache_pi_remove(vh->vh_config, MDI_PI(pip));
32253c34adc5Sramat 
32267c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
32277c478bd9Sstevel@tonic-gate 
32285e3986cbScth 	/* Prevent further failovers till MDI_VHCI_CLIENT_LOCK is held */
32297c478bd9Sstevel@tonic-gate 	MDI_CLIENT_SET_PATH_FREE_IN_PROGRESS(ct);
32307c478bd9Sstevel@tonic-gate 
32317c478bd9Sstevel@tonic-gate 	/*
32327c478bd9Sstevel@tonic-gate 	 * Wait till failover is complete before removing this node.
32337c478bd9Sstevel@tonic-gate 	 */
32347c478bd9Sstevel@tonic-gate 	while (MDI_CLIENT_IS_FAILOVER_IN_PROGRESS(ct))
32357c478bd9Sstevel@tonic-gate 		cv_wait(&ct->ct_failover_cv, &ct->ct_mutex);
32367c478bd9Sstevel@tonic-gate 
32377c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
32385e3986cbScth 	MDI_VHCI_CLIENT_LOCK(vh);
32397c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
32407c478bd9Sstevel@tonic-gate 	MDI_CLIENT_CLEAR_PATH_FREE_IN_PROGRESS(ct);
32417c478bd9Sstevel@tonic-gate 
32427c478bd9Sstevel@tonic-gate 	if (!MDI_PI_IS_INITING(pip)) {
32437c478bd9Sstevel@tonic-gate 		f = vh->vh_ops->vo_pi_uninit;
32447c478bd9Sstevel@tonic-gate 		if (f != NULL) {
32457c478bd9Sstevel@tonic-gate 			rv = (*f)(vh->vh_dip, pip, 0);
32467c478bd9Sstevel@tonic-gate 		}
32477c478bd9Sstevel@tonic-gate 	}
32487c478bd9Sstevel@tonic-gate 	/*
32497c478bd9Sstevel@tonic-gate 	 * If vo_pi_uninit() completed successfully.
32507c478bd9Sstevel@tonic-gate 	 */
32517c478bd9Sstevel@tonic-gate 	if (rv == MDI_SUCCESS) {
32527c478bd9Sstevel@tonic-gate 		if (client_held) {
32534c06356bSdh142964 			MDI_DEBUG(4, (MDI_NOTE, ct->ct_dip,
32547c478bd9Sstevel@tonic-gate 			    "i_mdi_pm_rele_client\n"));
32557c478bd9Sstevel@tonic-gate 			i_mdi_pm_rele_client(ct, 1);
32567c478bd9Sstevel@tonic-gate 		}
32577c478bd9Sstevel@tonic-gate 		i_mdi_pi_free(ph, pip, ct);
32587c478bd9Sstevel@tonic-gate 		if (ct->ct_path_count == 0) {
32597c478bd9Sstevel@tonic-gate 			/*
32607c478bd9Sstevel@tonic-gate 			 * Client lost its last path.
32617c478bd9Sstevel@tonic-gate 			 * Clean up the client device
32627c478bd9Sstevel@tonic-gate 			 */
32637c478bd9Sstevel@tonic-gate 			MDI_CLIENT_UNLOCK(ct);
32647c478bd9Sstevel@tonic-gate 			(void) i_mdi_client_free(ct->ct_vhci, ct);
32655e3986cbScth 			MDI_VHCI_CLIENT_UNLOCK(vh);
32667c478bd9Sstevel@tonic-gate 			return (rv);
32677c478bd9Sstevel@tonic-gate 		}
32687c478bd9Sstevel@tonic-gate 	}
32697c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
32705e3986cbScth 	MDI_VHCI_CLIENT_UNLOCK(vh);
32713c34adc5Sramat 
32723c34adc5Sramat 	if (rv == MDI_FAILURE)
32733c34adc5Sramat 		vhcache_pi_add(vh->vh_config, MDI_PI(pip));
32743c34adc5Sramat 
32757c478bd9Sstevel@tonic-gate 	return (rv);
32767c478bd9Sstevel@tonic-gate }
32777c478bd9Sstevel@tonic-gate 
32787c478bd9Sstevel@tonic-gate /*
32797c478bd9Sstevel@tonic-gate  * i_mdi_pi_free():
32807c478bd9Sstevel@tonic-gate  *		Free the mdi_pathinfo node
32817c478bd9Sstevel@tonic-gate  */
32827c478bd9Sstevel@tonic-gate static void
32837c478bd9Sstevel@tonic-gate i_mdi_pi_free(mdi_phci_t *ph, mdi_pathinfo_t *pip, mdi_client_t *ct)
32847c478bd9Sstevel@tonic-gate {
32857c478bd9Sstevel@tonic-gate 	int	ct_circular;
32867c478bd9Sstevel@tonic-gate 	int	ph_circular;
32877c478bd9Sstevel@tonic-gate 
32885e3986cbScth 	ASSERT(MDI_CLIENT_LOCKED(ct));
32895e3986cbScth 
32907c478bd9Sstevel@tonic-gate 	/*
32917c478bd9Sstevel@tonic-gate 	 * remove any per-path kstats
32927c478bd9Sstevel@tonic-gate 	 */
32937c478bd9Sstevel@tonic-gate 	i_mdi_pi_kstat_destroy(pip);
32947c478bd9Sstevel@tonic-gate 
32955e3986cbScth 	/* See comments in i_mdi_pi_alloc() */
32967c478bd9Sstevel@tonic-gate 	ndi_devi_enter(ct->ct_dip, &ct_circular);
32977c478bd9Sstevel@tonic-gate 	ndi_devi_enter(ph->ph_dip, &ph_circular);
32987c478bd9Sstevel@tonic-gate 
32997c478bd9Sstevel@tonic-gate 	i_mdi_client_remove_path(ct, pip);
33007c478bd9Sstevel@tonic-gate 	i_mdi_phci_remove_path(ph, pip);
33017c478bd9Sstevel@tonic-gate 
33027c478bd9Sstevel@tonic-gate 	ndi_devi_exit(ph->ph_dip, ph_circular);
33037c478bd9Sstevel@tonic-gate 	ndi_devi_exit(ct->ct_dip, ct_circular);
33047c478bd9Sstevel@tonic-gate 
33057c478bd9Sstevel@tonic-gate 	mutex_destroy(&MDI_PI(pip)->pi_mutex);
33067c478bd9Sstevel@tonic-gate 	cv_destroy(&MDI_PI(pip)->pi_state_cv);
33077c478bd9Sstevel@tonic-gate 	cv_destroy(&MDI_PI(pip)->pi_ref_cv);
33087c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_addr) {
33097c478bd9Sstevel@tonic-gate 		kmem_free(MDI_PI(pip)->pi_addr,
33107c478bd9Sstevel@tonic-gate 		    strlen(MDI_PI(pip)->pi_addr) + 1);
33117c478bd9Sstevel@tonic-gate 		MDI_PI(pip)->pi_addr = NULL;
33127c478bd9Sstevel@tonic-gate 	}
33137c478bd9Sstevel@tonic-gate 
33147c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_prop) {
33157c478bd9Sstevel@tonic-gate 		(void) nvlist_free(MDI_PI(pip)->pi_prop);
33167c478bd9Sstevel@tonic-gate 		MDI_PI(pip)->pi_prop = NULL;
33177c478bd9Sstevel@tonic-gate 	}
33187c478bd9Sstevel@tonic-gate 	kmem_free(pip, sizeof (struct mdi_pathinfo));
33197c478bd9Sstevel@tonic-gate }
33207c478bd9Sstevel@tonic-gate 
33217c478bd9Sstevel@tonic-gate 
33227c478bd9Sstevel@tonic-gate /*
33237c478bd9Sstevel@tonic-gate  * i_mdi_phci_remove_path():
33247c478bd9Sstevel@tonic-gate  * 		Remove a mdi_pathinfo node from pHCI list.
33257c478bd9Sstevel@tonic-gate  * Notes:
33267c478bd9Sstevel@tonic-gate  *		Caller should hold per-pHCI mutex
33277c478bd9Sstevel@tonic-gate  */
33287c478bd9Sstevel@tonic-gate static void
33297c478bd9Sstevel@tonic-gate i_mdi_phci_remove_path(mdi_phci_t *ph, mdi_pathinfo_t *pip)
33307c478bd9Sstevel@tonic-gate {
33317c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*prev = NULL;
33327c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*path = NULL;
33337c478bd9Sstevel@tonic-gate 
33347c478bd9Sstevel@tonic-gate 	ASSERT(DEVI_BUSY_OWNED(ph->ph_dip));
33357c478bd9Sstevel@tonic-gate 
33365e3986cbScth 	MDI_PHCI_LOCK(ph);
33377c478bd9Sstevel@tonic-gate 	path = ph->ph_path_head;
33387c478bd9Sstevel@tonic-gate 	while (path != NULL) {
33397c478bd9Sstevel@tonic-gate 		if (path == pip) {
33407c478bd9Sstevel@tonic-gate 			break;
33417c478bd9Sstevel@tonic-gate 		}
33427c478bd9Sstevel@tonic-gate 		prev = path;
33437c478bd9Sstevel@tonic-gate 		path = (mdi_pathinfo_t *)MDI_PI(path)->pi_phci_link;
33447c478bd9Sstevel@tonic-gate 	}
33457c478bd9Sstevel@tonic-gate 
33467c478bd9Sstevel@tonic-gate 	if (path) {
33477c478bd9Sstevel@tonic-gate 		ph->ph_path_count--;
33487c478bd9Sstevel@tonic-gate 		if (prev) {
33497c478bd9Sstevel@tonic-gate 			MDI_PI(prev)->pi_phci_link = MDI_PI(path)->pi_phci_link;
33507c478bd9Sstevel@tonic-gate 		} else {
33517c478bd9Sstevel@tonic-gate 			ph->ph_path_head =
33527c478bd9Sstevel@tonic-gate 			    (mdi_pathinfo_t *)MDI_PI(path)->pi_phci_link;
33537c478bd9Sstevel@tonic-gate 		}
33547c478bd9Sstevel@tonic-gate 		if (ph->ph_path_tail == path) {
33557c478bd9Sstevel@tonic-gate 			ph->ph_path_tail = prev;
33567c478bd9Sstevel@tonic-gate 		}
33577c478bd9Sstevel@tonic-gate 	}
33587c478bd9Sstevel@tonic-gate 
33597c478bd9Sstevel@tonic-gate 	/*
33607c478bd9Sstevel@tonic-gate 	 * Clear the pHCI link
33617c478bd9Sstevel@tonic-gate 	 */
33627c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_phci_link = NULL;
33637c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_phci = NULL;
33645e3986cbScth 	MDI_PHCI_UNLOCK(ph);
33657c478bd9Sstevel@tonic-gate }
33667c478bd9Sstevel@tonic-gate 
33677c478bd9Sstevel@tonic-gate /*
33687c478bd9Sstevel@tonic-gate  * i_mdi_client_remove_path():
33697c478bd9Sstevel@tonic-gate  * 		Remove a mdi_pathinfo node from client path list.
33707c478bd9Sstevel@tonic-gate  */
33717c478bd9Sstevel@tonic-gate static void
33727c478bd9Sstevel@tonic-gate i_mdi_client_remove_path(mdi_client_t *ct, mdi_pathinfo_t *pip)
33737c478bd9Sstevel@tonic-gate {
33747c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*prev = NULL;
33757c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*path;
33767c478bd9Sstevel@tonic-gate 
33777c478bd9Sstevel@tonic-gate 	ASSERT(DEVI_BUSY_OWNED(ct->ct_dip));
33787c478bd9Sstevel@tonic-gate 
33795e3986cbScth 	ASSERT(MDI_CLIENT_LOCKED(ct));
33807c478bd9Sstevel@tonic-gate 	path = ct->ct_path_head;
33817c478bd9Sstevel@tonic-gate 	while (path != NULL) {
33827c478bd9Sstevel@tonic-gate 		if (path == pip) {
33837c478bd9Sstevel@tonic-gate 			break;
33847c478bd9Sstevel@tonic-gate 		}
33857c478bd9Sstevel@tonic-gate 		prev = path;
33867c478bd9Sstevel@tonic-gate 		path = (mdi_pathinfo_t *)MDI_PI(path)->pi_client_link;
33877c478bd9Sstevel@tonic-gate 	}
33887c478bd9Sstevel@tonic-gate 
33897c478bd9Sstevel@tonic-gate 	if (path) {
33907c478bd9Sstevel@tonic-gate 		ct->ct_path_count--;
33917c478bd9Sstevel@tonic-gate 		if (prev) {
33927c478bd9Sstevel@tonic-gate 			MDI_PI(prev)->pi_client_link =
33937c478bd9Sstevel@tonic-gate 			    MDI_PI(path)->pi_client_link;
33947c478bd9Sstevel@tonic-gate 		} else {
33957c478bd9Sstevel@tonic-gate 			ct->ct_path_head =
33967c478bd9Sstevel@tonic-gate 			    (mdi_pathinfo_t *)MDI_PI(path)->pi_client_link;
33977c478bd9Sstevel@tonic-gate 		}
33987c478bd9Sstevel@tonic-gate 		if (ct->ct_path_tail == path) {
33997c478bd9Sstevel@tonic-gate 			ct->ct_path_tail = prev;
34007c478bd9Sstevel@tonic-gate 		}
34017c478bd9Sstevel@tonic-gate 		if (ct->ct_path_last == path) {
34027c478bd9Sstevel@tonic-gate 			ct->ct_path_last = ct->ct_path_head;
34037c478bd9Sstevel@tonic-gate 		}
34047c478bd9Sstevel@tonic-gate 	}
34057c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_client_link = NULL;
34067c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_client = NULL;
34077c478bd9Sstevel@tonic-gate }
34087c478bd9Sstevel@tonic-gate 
34097c478bd9Sstevel@tonic-gate /*
34107c478bd9Sstevel@tonic-gate  * i_mdi_pi_state_change():
 *		Change the state of a mdi_pathinfo node (online, standby,
 *		fault or offline)
34127c478bd9Sstevel@tonic-gate  *
34137c478bd9Sstevel@tonic-gate  * Return Values:
34147c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
34157c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
34167c478bd9Sstevel@tonic-gate  */
34177c478bd9Sstevel@tonic-gate /*ARGSUSED*/
34187c478bd9Sstevel@tonic-gate static int
34197c478bd9Sstevel@tonic-gate i_mdi_pi_state_change(mdi_pathinfo_t *pip, mdi_pathinfo_state_t state, int flag)
34207c478bd9Sstevel@tonic-gate {
34217c478bd9Sstevel@tonic-gate 	int		rv = MDI_SUCCESS;
34227c478bd9Sstevel@tonic-gate 	mdi_vhci_t	*vh;
34237c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
34247c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
34257c478bd9Sstevel@tonic-gate 	int		(*f)();
34267c478bd9Sstevel@tonic-gate 	dev_info_t	*cdip;
34277c478bd9Sstevel@tonic-gate 
34287c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
34297c478bd9Sstevel@tonic-gate 
34307c478bd9Sstevel@tonic-gate 	ph = MDI_PI(pip)->pi_phci;
34317c478bd9Sstevel@tonic-gate 	ASSERT(ph);
34327c478bd9Sstevel@tonic-gate 	if (ph == NULL) {
34337c478bd9Sstevel@tonic-gate 		/*
34347c478bd9Sstevel@tonic-gate 		 * Invalid pHCI device, fail the request
34357c478bd9Sstevel@tonic-gate 		 */
34367c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
34374c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, NULL,
34384c06356bSdh142964 		    "!invalid phci: pip %s %p",
34394c06356bSdh142964 		    mdi_pi_spathname(pip), (void *)pip));
34407c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
34417c478bd9Sstevel@tonic-gate 	}
34427c478bd9Sstevel@tonic-gate 
34437c478bd9Sstevel@tonic-gate 	vh = ph->ph_vhci;
34447c478bd9Sstevel@tonic-gate 	ASSERT(vh);
34457c478bd9Sstevel@tonic-gate 	if (vh == NULL) {
34467c478bd9Sstevel@tonic-gate 		/*
34477c478bd9Sstevel@tonic-gate 		 * Invalid vHCI device, fail the request
34487c478bd9Sstevel@tonic-gate 		 */
34497c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
34504c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, ph->ph_dip,
34514c06356bSdh142964 		    "!invalid vhci: pip %s %p",
34524c06356bSdh142964 		    mdi_pi_spathname(pip), (void *)pip));
34537c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
34547c478bd9Sstevel@tonic-gate 	}
34557c478bd9Sstevel@tonic-gate 
34567c478bd9Sstevel@tonic-gate 	ct = MDI_PI(pip)->pi_client;
34577c478bd9Sstevel@tonic-gate 	ASSERT(ct != NULL);
34587c478bd9Sstevel@tonic-gate 	if (ct == NULL) {
34597c478bd9Sstevel@tonic-gate 		/*
34607c478bd9Sstevel@tonic-gate 		 * Invalid client device, fail the request
34617c478bd9Sstevel@tonic-gate 		 */
34627c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
34634c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, ph->ph_dip,
34644c06356bSdh142964 		    "!invalid client: pip %s %p",
34654c06356bSdh142964 		    mdi_pi_spathname(pip), (void *)pip));
34667c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
34677c478bd9Sstevel@tonic-gate 	}
34687c478bd9Sstevel@tonic-gate 
34697c478bd9Sstevel@tonic-gate 	/*
34707c478bd9Sstevel@tonic-gate 	 * If this path has not been initialized yet, Callback vHCI driver's
34717c478bd9Sstevel@tonic-gate 	 * pathinfo node initialize entry point
34727c478bd9Sstevel@tonic-gate 	 */
34737c478bd9Sstevel@tonic-gate 
34747c478bd9Sstevel@tonic-gate 	if (MDI_PI_IS_INITING(pip)) {
34757c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
34767c478bd9Sstevel@tonic-gate 		f = vh->vh_ops->vo_pi_init;
34777c478bd9Sstevel@tonic-gate 		if (f != NULL) {
34787c478bd9Sstevel@tonic-gate 			rv = (*f)(vh->vh_dip, pip, 0);
34797c478bd9Sstevel@tonic-gate 			if (rv != MDI_SUCCESS) {
34804c06356bSdh142964 				MDI_DEBUG(1, (MDI_WARN, ct->ct_dip,
34814c06356bSdh142964 				    "!vo_pi_init failed: vHCI %p, pip %s %p",
34824c06356bSdh142964 				    (void *)vh, mdi_pi_spathname(pip),
34834c06356bSdh142964 				    (void *)pip));
34847c478bd9Sstevel@tonic-gate 				return (MDI_FAILURE);
34857c478bd9Sstevel@tonic-gate 			}
34867c478bd9Sstevel@tonic-gate 		}
34877c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
34887c478bd9Sstevel@tonic-gate 		MDI_PI_CLEAR_TRANSIENT(pip);
34897c478bd9Sstevel@tonic-gate 	}
34907c478bd9Sstevel@tonic-gate 
34917c478bd9Sstevel@tonic-gate 	/*
34927c478bd9Sstevel@tonic-gate 	 * Do not allow state transition when pHCI is in offline/suspended
34937c478bd9Sstevel@tonic-gate 	 * states
34947c478bd9Sstevel@tonic-gate 	 */
34957c478bd9Sstevel@tonic-gate 	i_mdi_phci_lock(ph, pip);
34967c478bd9Sstevel@tonic-gate 	if (MDI_PHCI_IS_READY(ph) == 0) {
34974c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, ct->ct_dip,
34984c06356bSdh142964 		    "!pHCI not ready, pHCI=%p", (void *)ph));
34997c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
35007c478bd9Sstevel@tonic-gate 		i_mdi_phci_unlock(ph);
35017c478bd9Sstevel@tonic-gate 		return (MDI_BUSY);
35027c478bd9Sstevel@tonic-gate 	}
35037c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNSTABLE(ph);
35047c478bd9Sstevel@tonic-gate 	i_mdi_phci_unlock(ph);
35057c478bd9Sstevel@tonic-gate 
35067c478bd9Sstevel@tonic-gate 	/*
35077c478bd9Sstevel@tonic-gate 	 * Check if mdi_pathinfo state is in transient state.
35087c478bd9Sstevel@tonic-gate 	 * If yes, offlining is in progress and wait till transient state is
35097c478bd9Sstevel@tonic-gate 	 * cleared.
35107c478bd9Sstevel@tonic-gate 	 */
35117c478bd9Sstevel@tonic-gate 	if (MDI_PI_IS_TRANSIENT(pip)) {
35127c478bd9Sstevel@tonic-gate 		while (MDI_PI_IS_TRANSIENT(pip)) {
35137c478bd9Sstevel@tonic-gate 			cv_wait(&MDI_PI(pip)->pi_state_cv,
35147c478bd9Sstevel@tonic-gate 			    &MDI_PI(pip)->pi_mutex);
35157c478bd9Sstevel@tonic-gate 		}
35167c478bd9Sstevel@tonic-gate 	}
35177c478bd9Sstevel@tonic-gate 
35187c478bd9Sstevel@tonic-gate 	/*
35197c478bd9Sstevel@tonic-gate 	 * Grab the client lock in reverse order sequence and release the
35207c478bd9Sstevel@tonic-gate 	 * mdi_pathinfo mutex.
35217c478bd9Sstevel@tonic-gate 	 */
35227c478bd9Sstevel@tonic-gate 	i_mdi_client_lock(ct, pip);
35237c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
35247c478bd9Sstevel@tonic-gate 
35257c478bd9Sstevel@tonic-gate 	/*
35267c478bd9Sstevel@tonic-gate 	 * Wait till failover state is cleared
35277c478bd9Sstevel@tonic-gate 	 */
35287c478bd9Sstevel@tonic-gate 	while (MDI_CLIENT_IS_FAILOVER_IN_PROGRESS(ct))
35297c478bd9Sstevel@tonic-gate 		cv_wait(&ct->ct_failover_cv, &ct->ct_mutex);
35307c478bd9Sstevel@tonic-gate 
35317c478bd9Sstevel@tonic-gate 	/*
35327c478bd9Sstevel@tonic-gate 	 * Mark the mdi_pathinfo node state as transient
35337c478bd9Sstevel@tonic-gate 	 */
35347c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
35357c478bd9Sstevel@tonic-gate 	switch (state) {
35367c478bd9Sstevel@tonic-gate 	case MDI_PATHINFO_STATE_ONLINE:
35377c478bd9Sstevel@tonic-gate 		MDI_PI_SET_ONLINING(pip);
35387c478bd9Sstevel@tonic-gate 		break;
35397c478bd9Sstevel@tonic-gate 
35407c478bd9Sstevel@tonic-gate 	case MDI_PATHINFO_STATE_STANDBY:
35417c478bd9Sstevel@tonic-gate 		MDI_PI_SET_STANDBYING(pip);
35427c478bd9Sstevel@tonic-gate 		break;
35437c478bd9Sstevel@tonic-gate 
35447c478bd9Sstevel@tonic-gate 	case MDI_PATHINFO_STATE_FAULT:
35457c478bd9Sstevel@tonic-gate 		/*
35467c478bd9Sstevel@tonic-gate 		 * Mark the pathinfo state as FAULTED
35477c478bd9Sstevel@tonic-gate 		 */
35487c478bd9Sstevel@tonic-gate 		MDI_PI_SET_FAULTING(pip);
35497c478bd9Sstevel@tonic-gate 		MDI_PI_ERRSTAT(pip, MDI_PI_HARDERR);
35507c478bd9Sstevel@tonic-gate 		break;
35517c478bd9Sstevel@tonic-gate 
35527c478bd9Sstevel@tonic-gate 	case MDI_PATHINFO_STATE_OFFLINE:
35537c478bd9Sstevel@tonic-gate 		/*
35547c478bd9Sstevel@tonic-gate 		 * ndi_devi_offline() cannot hold pip or ct locks.
35557c478bd9Sstevel@tonic-gate 		 */
35567c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
35574c06356bSdh142964 
35587c478bd9Sstevel@tonic-gate 		/*
		 * If this is a user initiated path online->offline operation
		 * whose success would transition a client from DEGRADED to
		 * FAILED then only proceed if we can offline the client first.
35627c478bd9Sstevel@tonic-gate 		 */
35637c478bd9Sstevel@tonic-gate 		cdip = ct->ct_dip;
35644c06356bSdh142964 		if ((flag & NDI_USER_REQ) &&
35654c06356bSdh142964 		    MDI_PI_IS_ONLINE(pip) &&
35664c06356bSdh142964 		    (MDI_CLIENT_STATE(ct) == MDI_CLIENT_STATE_DEGRADED)) {
35677c478bd9Sstevel@tonic-gate 			i_mdi_client_unlock(ct);
35684c06356bSdh142964 			rv = ndi_devi_offline(cdip, NDI_DEVFS_CLEAN);
35697c478bd9Sstevel@tonic-gate 			if (rv != NDI_SUCCESS) {
35707c478bd9Sstevel@tonic-gate 				/*
35717c478bd9Sstevel@tonic-gate 				 * Convert to MDI error code
35727c478bd9Sstevel@tonic-gate 				 */
35737c478bd9Sstevel@tonic-gate 				switch (rv) {
35747c478bd9Sstevel@tonic-gate 				case NDI_BUSY:
35757c478bd9Sstevel@tonic-gate 					rv = MDI_BUSY;
35767c478bd9Sstevel@tonic-gate 					break;
35777c478bd9Sstevel@tonic-gate 				default:
35787c478bd9Sstevel@tonic-gate 					rv = MDI_FAILURE;
35797c478bd9Sstevel@tonic-gate 					break;
35807c478bd9Sstevel@tonic-gate 				}
35817c478bd9Sstevel@tonic-gate 				goto state_change_exit;
35827c478bd9Sstevel@tonic-gate 			} else {
35837c478bd9Sstevel@tonic-gate 				i_mdi_client_lock(ct, NULL);
35847c478bd9Sstevel@tonic-gate 			}
35857c478bd9Sstevel@tonic-gate 		}
35867c478bd9Sstevel@tonic-gate 		/*
35877c478bd9Sstevel@tonic-gate 		 * Mark the mdi_pathinfo node state as transient
35887c478bd9Sstevel@tonic-gate 		 */
35897c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
35907c478bd9Sstevel@tonic-gate 		MDI_PI_SET_OFFLINING(pip);
35917c478bd9Sstevel@tonic-gate 		break;
35927c478bd9Sstevel@tonic-gate 	}
35937c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
35947c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNSTABLE(ct);
35957c478bd9Sstevel@tonic-gate 	i_mdi_client_unlock(ct);
35967c478bd9Sstevel@tonic-gate 
35977c478bd9Sstevel@tonic-gate 	f = vh->vh_ops->vo_pi_state_change;
35985e3986cbScth 	if (f != NULL)
35997c478bd9Sstevel@tonic-gate 		rv = (*f)(vh->vh_dip, pip, state, 0, flag);
36005e3986cbScth 
36015e3986cbScth 	MDI_CLIENT_LOCK(ct);
36025e3986cbScth 	MDI_PI_LOCK(pip);
36037c478bd9Sstevel@tonic-gate 	if (rv == MDI_NOT_SUPPORTED) {
36047c478bd9Sstevel@tonic-gate 		MDI_CLIENT_SET_DEV_NOT_SUPPORTED(ct);
36057c478bd9Sstevel@tonic-gate 	}
36067c478bd9Sstevel@tonic-gate 	if (rv != MDI_SUCCESS) {
36074c06356bSdh142964 		MDI_DEBUG(2, (MDI_WARN, ct->ct_dip,
36084c06356bSdh142964 		    "vo_pi_state_change failed: rv %x", rv));
36097c478bd9Sstevel@tonic-gate 	}
36107c478bd9Sstevel@tonic-gate 	if (MDI_PI_IS_TRANSIENT(pip)) {
36117c478bd9Sstevel@tonic-gate 		if (rv == MDI_SUCCESS) {
36127c478bd9Sstevel@tonic-gate 			MDI_PI_CLEAR_TRANSIENT(pip);
36137c478bd9Sstevel@tonic-gate 		} else {
36147c478bd9Sstevel@tonic-gate 			MDI_PI(pip)->pi_state = MDI_PI_OLD_STATE(pip);
36157c478bd9Sstevel@tonic-gate 		}
36167c478bd9Sstevel@tonic-gate 	}
36177c478bd9Sstevel@tonic-gate 
36187c478bd9Sstevel@tonic-gate 	/*
36197c478bd9Sstevel@tonic-gate 	 * Wake anyone waiting for this mdi_pathinfo node
36207c478bd9Sstevel@tonic-gate 	 */
36217c478bd9Sstevel@tonic-gate 	cv_broadcast(&MDI_PI(pip)->pi_state_cv);
36227c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
36237c478bd9Sstevel@tonic-gate 
36247c478bd9Sstevel@tonic-gate 	/*
36257c478bd9Sstevel@tonic-gate 	 * Mark the client device as stable
36267c478bd9Sstevel@tonic-gate 	 */
36277c478bd9Sstevel@tonic-gate 	MDI_CLIENT_STABLE(ct);
36287c478bd9Sstevel@tonic-gate 	if (rv == MDI_SUCCESS) {
36297c478bd9Sstevel@tonic-gate 		if (ct->ct_unstable == 0) {
36307c478bd9Sstevel@tonic-gate 			cdip = ct->ct_dip;
36317c478bd9Sstevel@tonic-gate 
36327c478bd9Sstevel@tonic-gate 			/*
36337c478bd9Sstevel@tonic-gate 			 * Onlining the mdi_pathinfo node will impact the
36347c478bd9Sstevel@tonic-gate 			 * client state Update the client and dev_info node
36357c478bd9Sstevel@tonic-gate 			 * state accordingly
36367c478bd9Sstevel@tonic-gate 			 */
36377c478bd9Sstevel@tonic-gate 			rv = NDI_SUCCESS;
36387c478bd9Sstevel@tonic-gate 			i_mdi_client_update_state(ct);
36397c478bd9Sstevel@tonic-gate 			switch (MDI_CLIENT_STATE(ct)) {
36407c478bd9Sstevel@tonic-gate 			case MDI_CLIENT_STATE_OPTIMAL:
36417c478bd9Sstevel@tonic-gate 			case MDI_CLIENT_STATE_DEGRADED:
3642737d277aScth 				if (cdip && !i_ddi_devi_attached(cdip) &&
36437c478bd9Sstevel@tonic-gate 				    ((state == MDI_PATHINFO_STATE_ONLINE) ||
36447c478bd9Sstevel@tonic-gate 				    (state == MDI_PATHINFO_STATE_STANDBY))) {
36457c478bd9Sstevel@tonic-gate 
36467c478bd9Sstevel@tonic-gate 					/*
36477c478bd9Sstevel@tonic-gate 					 * Must do ndi_devi_online() through
36487c478bd9Sstevel@tonic-gate 					 * hotplug thread for deferred
36497c478bd9Sstevel@tonic-gate 					 * attach mechanism to work
36507c478bd9Sstevel@tonic-gate 					 */
36515e3986cbScth 					MDI_CLIENT_UNLOCK(ct);
36527c478bd9Sstevel@tonic-gate 					rv = ndi_devi_online(cdip, 0);
36535e3986cbScth 					MDI_CLIENT_LOCK(ct);
36547c478bd9Sstevel@tonic-gate 					if ((rv != NDI_SUCCESS) &&
36557c478bd9Sstevel@tonic-gate 					    (MDI_CLIENT_STATE(ct) ==
36567c478bd9Sstevel@tonic-gate 					    MDI_CLIENT_STATE_DEGRADED)) {
36577c478bd9Sstevel@tonic-gate 						/*
36587c478bd9Sstevel@tonic-gate 						 * ndi_devi_online failed.
36597c478bd9Sstevel@tonic-gate 						 * Reset client flags to
36607c478bd9Sstevel@tonic-gate 						 * offline.
36617c478bd9Sstevel@tonic-gate 						 */
36624c06356bSdh142964 						MDI_DEBUG(1, (MDI_WARN, cdip,
36634c06356bSdh142964 						    "!ndi_devi_online failed "
36644c06356bSdh142964 						    "error %x", rv));
36657c478bd9Sstevel@tonic-gate 						MDI_CLIENT_SET_OFFLINE(ct);
36667c478bd9Sstevel@tonic-gate 					}
36677c478bd9Sstevel@tonic-gate 					if (rv != NDI_SUCCESS) {
36687c478bd9Sstevel@tonic-gate 						/* Reset the path state */
36697c478bd9Sstevel@tonic-gate 						MDI_PI_LOCK(pip);
36707c478bd9Sstevel@tonic-gate 						MDI_PI(pip)->pi_state =
36717c478bd9Sstevel@tonic-gate 						    MDI_PI_OLD_STATE(pip);
36727c478bd9Sstevel@tonic-gate 						MDI_PI_UNLOCK(pip);
36737c478bd9Sstevel@tonic-gate 					}
36747c478bd9Sstevel@tonic-gate 				}
36757c478bd9Sstevel@tonic-gate 				break;
36767c478bd9Sstevel@tonic-gate 
36777c478bd9Sstevel@tonic-gate 			case MDI_CLIENT_STATE_FAILED:
36787c478bd9Sstevel@tonic-gate 				/*
36797c478bd9Sstevel@tonic-gate 				 * This is the last path case for
36807c478bd9Sstevel@tonic-gate 				 * non-user initiated events.
36817c478bd9Sstevel@tonic-gate 				 */
36824c06356bSdh142964 				if (((flag & NDI_USER_REQ) == 0) &&
36837c478bd9Sstevel@tonic-gate 				    cdip && (i_ddi_node_state(cdip) >=
36847c478bd9Sstevel@tonic-gate 				    DS_INITIALIZED)) {
36855e3986cbScth 					MDI_CLIENT_UNLOCK(ct);
36864c06356bSdh142964 					rv = ndi_devi_offline(cdip,
36874c06356bSdh142964 					    NDI_DEVFS_CLEAN);
36885e3986cbScth 					MDI_CLIENT_LOCK(ct);
36897c478bd9Sstevel@tonic-gate 
36907c478bd9Sstevel@tonic-gate 					if (rv != NDI_SUCCESS) {
36917c478bd9Sstevel@tonic-gate 						/*
36927c478bd9Sstevel@tonic-gate 						 * ndi_devi_offline failed.
36937c478bd9Sstevel@tonic-gate 						 * Reset client flags to
36947c478bd9Sstevel@tonic-gate 						 * online as the path could not
36957c478bd9Sstevel@tonic-gate 						 * be offlined.
36967c478bd9Sstevel@tonic-gate 						 */
36974c06356bSdh142964 						MDI_DEBUG(1, (MDI_WARN, cdip,
36984c06356bSdh142964 						    "!ndi_devi_offline failed: "
36994c06356bSdh142964 						    "error %x", rv));
37007c478bd9Sstevel@tonic-gate 						MDI_CLIENT_SET_ONLINE(ct);
37017c478bd9Sstevel@tonic-gate 					}
37027c478bd9Sstevel@tonic-gate 				}
37037c478bd9Sstevel@tonic-gate 				break;
37047c478bd9Sstevel@tonic-gate 			}
37057c478bd9Sstevel@tonic-gate 			/*
37067c478bd9Sstevel@tonic-gate 			 * Convert to MDI error code
37077c478bd9Sstevel@tonic-gate 			 */
37087c478bd9Sstevel@tonic-gate 			switch (rv) {
37097c478bd9Sstevel@tonic-gate 			case NDI_SUCCESS:
37107c478bd9Sstevel@tonic-gate 				MDI_CLIENT_SET_REPORT_DEV_NEEDED(ct);
37117c478bd9Sstevel@tonic-gate 				i_mdi_report_path_state(ct, pip);
37127c478bd9Sstevel@tonic-gate 				rv = MDI_SUCCESS;
37137c478bd9Sstevel@tonic-gate 				break;
37147c478bd9Sstevel@tonic-gate 			case NDI_BUSY:
37157c478bd9Sstevel@tonic-gate 				rv = MDI_BUSY;
37167c478bd9Sstevel@tonic-gate 				break;
37177c478bd9Sstevel@tonic-gate 			default:
37187c478bd9Sstevel@tonic-gate 				rv = MDI_FAILURE;
37197c478bd9Sstevel@tonic-gate 				break;
37207c478bd9Sstevel@tonic-gate 			}
37217c478bd9Sstevel@tonic-gate 		}
37227c478bd9Sstevel@tonic-gate 	}
37237c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
37247c478bd9Sstevel@tonic-gate 
37257c478bd9Sstevel@tonic-gate state_change_exit:
37267c478bd9Sstevel@tonic-gate 	/*
37277c478bd9Sstevel@tonic-gate 	 * Mark the pHCI as stable again.
37287c478bd9Sstevel@tonic-gate 	 */
37297c478bd9Sstevel@tonic-gate 	MDI_PHCI_LOCK(ph);
37307c478bd9Sstevel@tonic-gate 	MDI_PHCI_STABLE(ph);
37317c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNLOCK(ph);
37327c478bd9Sstevel@tonic-gate 	return (rv);
37337c478bd9Sstevel@tonic-gate }
37347c478bd9Sstevel@tonic-gate 
37357c478bd9Sstevel@tonic-gate /*
37367c478bd9Sstevel@tonic-gate  * mdi_pi_online():
37377c478bd9Sstevel@tonic-gate  *		Place the path_info node in the online state.  The path is
37387c478bd9Sstevel@tonic-gate  *		now available to be selected by mdi_select_path() for
37397c478bd9Sstevel@tonic-gate  *		transporting I/O requests to client devices.
37407c478bd9Sstevel@tonic-gate  * Return Values:
37417c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
37427c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
37437c478bd9Sstevel@tonic-gate  */
37447c478bd9Sstevel@tonic-gate int
37457c478bd9Sstevel@tonic-gate mdi_pi_online(mdi_pathinfo_t *pip, int flags)
37467c478bd9Sstevel@tonic-gate {
37477c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct = MDI_PI(pip)->pi_client;
37487c478bd9Sstevel@tonic-gate 	int		client_held = 0;
37497c478bd9Sstevel@tonic-gate 	int		rv;
37507c478bd9Sstevel@tonic-gate 
37517c478bd9Sstevel@tonic-gate 	ASSERT(ct != NULL);
37527c478bd9Sstevel@tonic-gate 	rv = i_mdi_pi_state_change(pip, MDI_PATHINFO_STATE_ONLINE, flags);
37537c478bd9Sstevel@tonic-gate 	if (rv != MDI_SUCCESS)
37547c478bd9Sstevel@tonic-gate 		return (rv);
37557c478bd9Sstevel@tonic-gate 
37567c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
37577c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_pm_held == 0) {
37584c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, ct->ct_dip,
37594c06356bSdh142964 		    "i_mdi_pm_hold_pip %p", (void *)pip));
37607c478bd9Sstevel@tonic-gate 		i_mdi_pm_hold_pip(pip);
37617c478bd9Sstevel@tonic-gate 		client_held = 1;
37627c478bd9Sstevel@tonic-gate 	}
37637c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
37647c478bd9Sstevel@tonic-gate 
37657c478bd9Sstevel@tonic-gate 	if (client_held) {
37667c478bd9Sstevel@tonic-gate 		MDI_CLIENT_LOCK(ct);
37677c478bd9Sstevel@tonic-gate 		if (ct->ct_power_cnt == 0) {
37687c478bd9Sstevel@tonic-gate 			rv = i_mdi_power_all_phci(ct);
37697c478bd9Sstevel@tonic-gate 		}
37707c478bd9Sstevel@tonic-gate 
37714c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, ct->ct_dip,
37724c06356bSdh142964 		    "i_mdi_pm_hold_client %p", (void *)ct));
37737c478bd9Sstevel@tonic-gate 		i_mdi_pm_hold_client(ct, 1);
37747c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
37757c478bd9Sstevel@tonic-gate 	}
37767c478bd9Sstevel@tonic-gate 
37777c478bd9Sstevel@tonic-gate 	return (rv);
37787c478bd9Sstevel@tonic-gate }
37797c478bd9Sstevel@tonic-gate 
37807c478bd9Sstevel@tonic-gate /*
37817c478bd9Sstevel@tonic-gate  * mdi_pi_standby():
37827c478bd9Sstevel@tonic-gate  *		Place the mdi_pathinfo node in standby state
37837c478bd9Sstevel@tonic-gate  *
37847c478bd9Sstevel@tonic-gate  * Return Values:
37857c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
37867c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
37877c478bd9Sstevel@tonic-gate  */
37887c478bd9Sstevel@tonic-gate int
37897c478bd9Sstevel@tonic-gate mdi_pi_standby(mdi_pathinfo_t *pip, int flags)
37907c478bd9Sstevel@tonic-gate {
37917c478bd9Sstevel@tonic-gate 	return (i_mdi_pi_state_change(pip, MDI_PATHINFO_STATE_STANDBY, flags));
37927c478bd9Sstevel@tonic-gate }
37937c478bd9Sstevel@tonic-gate 
37947c478bd9Sstevel@tonic-gate /*
37957c478bd9Sstevel@tonic-gate  * mdi_pi_fault():
37967c478bd9Sstevel@tonic-gate  *		Place the mdi_pathinfo node in fault'ed state
37977c478bd9Sstevel@tonic-gate  * Return Values:
37987c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
37997c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
38007c478bd9Sstevel@tonic-gate  */
38017c478bd9Sstevel@tonic-gate int
38027c478bd9Sstevel@tonic-gate mdi_pi_fault(mdi_pathinfo_t *pip, int flags)
38037c478bd9Sstevel@tonic-gate {
38047c478bd9Sstevel@tonic-gate 	return (i_mdi_pi_state_change(pip, MDI_PATHINFO_STATE_FAULT, flags));
38057c478bd9Sstevel@tonic-gate }
38067c478bd9Sstevel@tonic-gate 
38077c478bd9Sstevel@tonic-gate /*
38087c478bd9Sstevel@tonic-gate  * mdi_pi_offline():
38097c478bd9Sstevel@tonic-gate  *		Offline a mdi_pathinfo node.
38107c478bd9Sstevel@tonic-gate  * Return Values:
38117c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
38127c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
38137c478bd9Sstevel@tonic-gate  */
38147c478bd9Sstevel@tonic-gate int
38157c478bd9Sstevel@tonic-gate mdi_pi_offline(mdi_pathinfo_t *pip, int flags)
38167c478bd9Sstevel@tonic-gate {
38177c478bd9Sstevel@tonic-gate 	int	ret, client_held = 0;
38187c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
38194c06356bSdh142964 
38204c06356bSdh142964 	/*
38214c06356bSdh142964 	 * Original code overloaded NDI_DEVI_REMOVE to this interface, and
38224c06356bSdh142964 	 * used it to mean "user initiated operation" (i.e. devctl). Callers
38234c06356bSdh142964 	 * should now just use NDI_USER_REQ.
38244c06356bSdh142964 	 */
38254c06356bSdh142964 	if (flags & NDI_DEVI_REMOVE) {
38264c06356bSdh142964 		flags &= ~NDI_DEVI_REMOVE;
38274c06356bSdh142964 		flags |= NDI_USER_REQ;
38284c06356bSdh142964 	}
38297c478bd9Sstevel@tonic-gate 
38307c478bd9Sstevel@tonic-gate 	ret = i_mdi_pi_state_change(pip, MDI_PATHINFO_STATE_OFFLINE, flags);
38317c478bd9Sstevel@tonic-gate 
38327c478bd9Sstevel@tonic-gate 	if (ret == MDI_SUCCESS) {
38337c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
38347c478bd9Sstevel@tonic-gate 		if (MDI_PI(pip)->pi_pm_held) {
38357c478bd9Sstevel@tonic-gate 			client_held = 1;
38367c478bd9Sstevel@tonic-gate 		}
38377c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
38387c478bd9Sstevel@tonic-gate 
38397c478bd9Sstevel@tonic-gate 		if (client_held) {
38407c478bd9Sstevel@tonic-gate 			ct = MDI_PI(pip)->pi_client;
38417c478bd9Sstevel@tonic-gate 			MDI_CLIENT_LOCK(ct);
38424c06356bSdh142964 			MDI_DEBUG(4, (MDI_NOTE, ct->ct_dip,
38434c06356bSdh142964 			    "i_mdi_pm_rele_client\n"));
38447c478bd9Sstevel@tonic-gate 			i_mdi_pm_rele_client(ct, 1);
38457c478bd9Sstevel@tonic-gate 			MDI_CLIENT_UNLOCK(ct);
38467c478bd9Sstevel@tonic-gate 		}
38477c478bd9Sstevel@tonic-gate 	}
38487c478bd9Sstevel@tonic-gate 
38497c478bd9Sstevel@tonic-gate 	return (ret);
38507c478bd9Sstevel@tonic-gate }
38517c478bd9Sstevel@tonic-gate 
38527c478bd9Sstevel@tonic-gate /*
38537c478bd9Sstevel@tonic-gate  * i_mdi_pi_offline():
38547c478bd9Sstevel@tonic-gate  *		Offline a mdi_pathinfo node and call the vHCI driver's callback
38557c478bd9Sstevel@tonic-gate  */
38567c478bd9Sstevel@tonic-gate static int
38577c478bd9Sstevel@tonic-gate i_mdi_pi_offline(mdi_pathinfo_t *pip, int flags)
38587c478bd9Sstevel@tonic-gate {
38597c478bd9Sstevel@tonic-gate 	dev_info_t	*vdip = NULL;
38607c478bd9Sstevel@tonic-gate 	mdi_vhci_t	*vh = NULL;
38617c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct = NULL;
38627c478bd9Sstevel@tonic-gate 	int		(*f)();
38637c478bd9Sstevel@tonic-gate 	int		rv;
38647c478bd9Sstevel@tonic-gate 
38657c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
38667c478bd9Sstevel@tonic-gate 	ct = MDI_PI(pip)->pi_client;
38677c478bd9Sstevel@tonic-gate 	ASSERT(ct != NULL);
38687c478bd9Sstevel@tonic-gate 
38697c478bd9Sstevel@tonic-gate 	while (MDI_PI(pip)->pi_ref_cnt != 0) {
38707c478bd9Sstevel@tonic-gate 		/*
38717c478bd9Sstevel@tonic-gate 		 * Give a chance for pending I/Os to complete.
38727c478bd9Sstevel@tonic-gate 		 */
38734c06356bSdh142964 		MDI_DEBUG(1, (MDI_NOTE, ct->ct_dip,
38744c06356bSdh142964 		    "!%d cmds still pending on path %s %p",
38754c06356bSdh142964 		    MDI_PI(pip)->pi_ref_cnt, mdi_pi_spathname(pip),
38764c06356bSdh142964 		    (void *)pip));
38777c478bd9Sstevel@tonic-gate 		if (cv_timedwait(&MDI_PI(pip)->pi_ref_cv,
38787c478bd9Sstevel@tonic-gate 		    &MDI_PI(pip)->pi_mutex,
38797c478bd9Sstevel@tonic-gate 		    ddi_get_lbolt() + drv_usectohz(60 * 1000000)) == -1) {
38807c478bd9Sstevel@tonic-gate 			/*
38817c478bd9Sstevel@tonic-gate 			 * The timeout time reached without ref_cnt being zero
38827c478bd9Sstevel@tonic-gate 			 * being signaled.
38837c478bd9Sstevel@tonic-gate 			 */
38844c06356bSdh142964 			MDI_DEBUG(1, (MDI_NOTE, ct->ct_dip,
38854c06356bSdh142964 			    "!Timeout reached on path %s %p without the cond",
38864c06356bSdh142964 			    mdi_pi_spathname(pip), (void *)pip));
38874c06356bSdh142964 			MDI_DEBUG(1, (MDI_NOTE, ct->ct_dip,
38884c06356bSdh142964 			    "!%d cmds still pending on path %s %p",
38894c06356bSdh142964 			    MDI_PI(pip)->pi_ref_cnt,
38904c06356bSdh142964 			    mdi_pi_spathname(pip), (void *)pip));
38917c478bd9Sstevel@tonic-gate 		}
38927c478bd9Sstevel@tonic-gate 	}
38937c478bd9Sstevel@tonic-gate 	vh = ct->ct_vhci;
38947c478bd9Sstevel@tonic-gate 	vdip = vh->vh_dip;
38957c478bd9Sstevel@tonic-gate 
38967c478bd9Sstevel@tonic-gate 	/*
38977c478bd9Sstevel@tonic-gate 	 * Notify vHCI that has registered this event
38987c478bd9Sstevel@tonic-gate 	 */
38997c478bd9Sstevel@tonic-gate 	ASSERT(vh->vh_ops);
39007c478bd9Sstevel@tonic-gate 	f = vh->vh_ops->vo_pi_state_change;
39017c478bd9Sstevel@tonic-gate 
39027c478bd9Sstevel@tonic-gate 	if (f != NULL) {
39037c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
39047c478bd9Sstevel@tonic-gate 		if ((rv = (*f)(vdip, pip, MDI_PATHINFO_STATE_OFFLINE, 0,
39057c478bd9Sstevel@tonic-gate 		    flags)) != MDI_SUCCESS) {
39064c06356bSdh142964 			MDI_DEBUG(1, (MDI_WARN, ct->ct_dip,
39074c06356bSdh142964 			    "!vo_path_offline failed: vdip %s%d %p: path %s %p",
39084c06356bSdh142964 			    ddi_driver_name(vdip), ddi_get_instance(vdip),
39094c06356bSdh142964 			    (void *)vdip, mdi_pi_spathname(pip), (void *)pip));
39107c478bd9Sstevel@tonic-gate 		}
39117c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
39127c478bd9Sstevel@tonic-gate 	}
39137c478bd9Sstevel@tonic-gate 
39147c478bd9Sstevel@tonic-gate 	/*
39157c478bd9Sstevel@tonic-gate 	 * Set the mdi_pathinfo node state and clear the transient condition
39167c478bd9Sstevel@tonic-gate 	 */
39177c478bd9Sstevel@tonic-gate 	MDI_PI_SET_OFFLINE(pip);
39187c478bd9Sstevel@tonic-gate 	cv_broadcast(&MDI_PI(pip)->pi_state_cv);
39197c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
39207c478bd9Sstevel@tonic-gate 
39217c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
39227c478bd9Sstevel@tonic-gate 	if (rv == MDI_SUCCESS) {
39237c478bd9Sstevel@tonic-gate 		if (ct->ct_unstable == 0) {
39247c478bd9Sstevel@tonic-gate 			dev_info_t	*cdip = ct->ct_dip;
39257c478bd9Sstevel@tonic-gate 
39267c478bd9Sstevel@tonic-gate 			/*
39277c478bd9Sstevel@tonic-gate 			 * Onlining the mdi_pathinfo node will impact the
39287c478bd9Sstevel@tonic-gate 			 * client state Update the client and dev_info node
39297c478bd9Sstevel@tonic-gate 			 * state accordingly
39307c478bd9Sstevel@tonic-gate 			 */
39317c478bd9Sstevel@tonic-gate 			i_mdi_client_update_state(ct);
39327c478bd9Sstevel@tonic-gate 			rv = NDI_SUCCESS;
39337c478bd9Sstevel@tonic-gate 			if (MDI_CLIENT_STATE(ct) == MDI_CLIENT_STATE_FAILED) {
39347c478bd9Sstevel@tonic-gate 				if (cdip &&
39357c478bd9Sstevel@tonic-gate 				    (i_ddi_node_state(cdip) >=
39367c478bd9Sstevel@tonic-gate 				    DS_INITIALIZED)) {
39377c478bd9Sstevel@tonic-gate 					MDI_CLIENT_UNLOCK(ct);
39384c06356bSdh142964 					rv = ndi_devi_offline(cdip,
39394c06356bSdh142964 					    NDI_DEVFS_CLEAN);
39407c478bd9Sstevel@tonic-gate 					MDI_CLIENT_LOCK(ct);
39417c478bd9Sstevel@tonic-gate 					if (rv != NDI_SUCCESS) {
39427c478bd9Sstevel@tonic-gate 						/*
39437c478bd9Sstevel@tonic-gate 						 * ndi_devi_offline failed.
39447c478bd9Sstevel@tonic-gate 						 * Reset client flags to
39457c478bd9Sstevel@tonic-gate 						 * online.
39467c478bd9Sstevel@tonic-gate 						 */
39474c06356bSdh142964 						MDI_DEBUG(4, (MDI_WARN, cdip,
39484c06356bSdh142964 						    "ndi_devi_offline failed: "
39494c06356bSdh142964 						    "error %x", rv));
39507c478bd9Sstevel@tonic-gate 						MDI_CLIENT_SET_ONLINE(ct);
39517c478bd9Sstevel@tonic-gate 					}
39527c478bd9Sstevel@tonic-gate 				}
39537c478bd9Sstevel@tonic-gate 			}
39547c478bd9Sstevel@tonic-gate 			/*
39557c478bd9Sstevel@tonic-gate 			 * Convert to MDI error code
39567c478bd9Sstevel@tonic-gate 			 */
39577c478bd9Sstevel@tonic-gate 			switch (rv) {
39587c478bd9Sstevel@tonic-gate 			case NDI_SUCCESS:
39597c478bd9Sstevel@tonic-gate 				rv = MDI_SUCCESS;
39607c478bd9Sstevel@tonic-gate 				break;
39617c478bd9Sstevel@tonic-gate 			case NDI_BUSY:
39627c478bd9Sstevel@tonic-gate 				rv = MDI_BUSY;
39637c478bd9Sstevel@tonic-gate 				break;
39647c478bd9Sstevel@tonic-gate 			default:
39657c478bd9Sstevel@tonic-gate 				rv = MDI_FAILURE;
39667c478bd9Sstevel@tonic-gate 				break;
39677c478bd9Sstevel@tonic-gate 			}
39687c478bd9Sstevel@tonic-gate 		}
39697c478bd9Sstevel@tonic-gate 		MDI_CLIENT_SET_REPORT_DEV_NEEDED(ct);
39707c478bd9Sstevel@tonic-gate 		i_mdi_report_path_state(ct, pip);
39717c478bd9Sstevel@tonic-gate 	}
39727c478bd9Sstevel@tonic-gate 
39737c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
39747c478bd9Sstevel@tonic-gate 
39757c478bd9Sstevel@tonic-gate 	/*
39767c478bd9Sstevel@tonic-gate 	 * Change in the mdi_pathinfo node state will impact the client state
39777c478bd9Sstevel@tonic-gate 	 */
39784c06356bSdh142964 	MDI_DEBUG(2, (MDI_NOTE, ct->ct_dip,
39794c06356bSdh142964 	    "ct = %p pip = %p", (void *)ct, (void *)pip));
39807c478bd9Sstevel@tonic-gate 	return (rv);
39817c478bd9Sstevel@tonic-gate }
39827c478bd9Sstevel@tonic-gate 
398355e592a2SRandall Ralphs /*
398455e592a2SRandall Ralphs  * mdi_pi_get_node_name():
398555e592a2SRandall Ralphs  *              Get the name associated with a mdi_pathinfo node.
398655e592a2SRandall Ralphs  *              Since pathinfo nodes are not directly named, we
398755e592a2SRandall Ralphs  *              return the node_name of the client.
398855e592a2SRandall Ralphs  *
398955e592a2SRandall Ralphs  * Return Values:
399055e592a2SRandall Ralphs  *              char *
399155e592a2SRandall Ralphs  */
399255e592a2SRandall Ralphs char *
399355e592a2SRandall Ralphs mdi_pi_get_node_name(mdi_pathinfo_t *pip)
399455e592a2SRandall Ralphs {
399555e592a2SRandall Ralphs 	mdi_client_t    *ct;
399655e592a2SRandall Ralphs 
399755e592a2SRandall Ralphs 	if (pip == NULL)
399855e592a2SRandall Ralphs 		return (NULL);
399955e592a2SRandall Ralphs 	ct = MDI_PI(pip)->pi_client;
400055e592a2SRandall Ralphs 	if ((ct == NULL) || (ct->ct_dip == NULL))
400155e592a2SRandall Ralphs 		return (NULL);
400255e592a2SRandall Ralphs 	return (ddi_node_name(ct->ct_dip));
400355e592a2SRandall Ralphs }
40047c478bd9Sstevel@tonic-gate 
40057c478bd9Sstevel@tonic-gate /*
40067c478bd9Sstevel@tonic-gate  * mdi_pi_get_addr():
40077c478bd9Sstevel@tonic-gate  *		Get the unit address associated with a mdi_pathinfo node
40087c478bd9Sstevel@tonic-gate  *
40097c478bd9Sstevel@tonic-gate  * Return Values:
40107c478bd9Sstevel@tonic-gate  *		char *
40117c478bd9Sstevel@tonic-gate  */
40127c478bd9Sstevel@tonic-gate char *
40137c478bd9Sstevel@tonic-gate mdi_pi_get_addr(mdi_pathinfo_t *pip)
40147c478bd9Sstevel@tonic-gate {
40157c478bd9Sstevel@tonic-gate 	if (pip == NULL)
40167c478bd9Sstevel@tonic-gate 		return (NULL);
40177c478bd9Sstevel@tonic-gate 
401872a50065Scth 	return (MDI_PI(pip)->pi_addr);
40197c478bd9Sstevel@tonic-gate }
40207c478bd9Sstevel@tonic-gate 
40217c478bd9Sstevel@tonic-gate /*
4022602ca9eaScth  * mdi_pi_get_path_instance():
4023602ca9eaScth  *		Get the 'path_instance' of a mdi_pathinfo node
4024602ca9eaScth  *
4025602ca9eaScth  * Return Values:
4026602ca9eaScth  *		path_instance
4027602ca9eaScth  */
4028602ca9eaScth int
4029602ca9eaScth mdi_pi_get_path_instance(mdi_pathinfo_t *pip)
4030602ca9eaScth {
4031602ca9eaScth 	if (pip == NULL)
4032602ca9eaScth 		return (0);
4033602ca9eaScth 
4034602ca9eaScth 	return (MDI_PI(pip)->pi_path_instance);
4035602ca9eaScth }
4036602ca9eaScth 
4037602ca9eaScth /*
4038602ca9eaScth  * mdi_pi_pathname():
4039602ca9eaScth  *		Return pointer to path to pathinfo node.
4040602ca9eaScth  */
4041602ca9eaScth char *
4042602ca9eaScth mdi_pi_pathname(mdi_pathinfo_t *pip)
4043602ca9eaScth {
4044602ca9eaScth 	if (pip == NULL)
4045602ca9eaScth 		return (NULL);
4046602ca9eaScth 	return (mdi_pi_pathname_by_instance(mdi_pi_get_path_instance(pip)));
4047602ca9eaScth }
4048602ca9eaScth 
40494c06356bSdh142964 /*
40504c06356bSdh142964  * mdi_pi_spathname():
40514c06356bSdh142964  *		Return pointer to shortpath to pathinfo node. Used for debug
40524c06356bSdh142964  *		messages, so return "" instead of NULL when unknown.
40534c06356bSdh142964  */
40544c06356bSdh142964 char *
40554c06356bSdh142964 mdi_pi_spathname(mdi_pathinfo_t *pip)
40564c06356bSdh142964 {
40574c06356bSdh142964 	char	*spath = "";
40584c06356bSdh142964 
40594c06356bSdh142964 	if (pip) {
40604c06356bSdh142964 		spath = mdi_pi_spathname_by_instance(
40614c06356bSdh142964 		    mdi_pi_get_path_instance(pip));
40624c06356bSdh142964 		if (spath == NULL)
40634c06356bSdh142964 			spath = "";
40644c06356bSdh142964 	}
40654c06356bSdh142964 	return (spath);
40664c06356bSdh142964 }
40674c06356bSdh142964 
406838c67cbdSjiang wu - Sun Microsystems - Beijing China char *
406938c67cbdSjiang wu - Sun Microsystems - Beijing China mdi_pi_pathname_obp(mdi_pathinfo_t *pip, char *path)
407038c67cbdSjiang wu - Sun Microsystems - Beijing China {
407138c67cbdSjiang wu - Sun Microsystems - Beijing China 	char *obp_path = NULL;
407238c67cbdSjiang wu - Sun Microsystems - Beijing China 	if ((pip == NULL) || (path == NULL))
407338c67cbdSjiang wu - Sun Microsystems - Beijing China 		return (NULL);
407438c67cbdSjiang wu - Sun Microsystems - Beijing China 
407538c67cbdSjiang wu - Sun Microsystems - Beijing China 	if (mdi_prop_lookup_string(pip, "obp-path", &obp_path) == MDI_SUCCESS) {
407638c67cbdSjiang wu - Sun Microsystems - Beijing China 		(void) strcpy(path, obp_path);
407738c67cbdSjiang wu - Sun Microsystems - Beijing China 		(void) mdi_prop_free(obp_path);
407838c67cbdSjiang wu - Sun Microsystems - Beijing China 	} else {
407938c67cbdSjiang wu - Sun Microsystems - Beijing China 		path = NULL;
408038c67cbdSjiang wu - Sun Microsystems - Beijing China 	}
408138c67cbdSjiang wu - Sun Microsystems - Beijing China 	return (path);
408238c67cbdSjiang wu - Sun Microsystems - Beijing China }
408338c67cbdSjiang wu - Sun Microsystems - Beijing China 
408438c67cbdSjiang wu - Sun Microsystems - Beijing China int
408538c67cbdSjiang wu - Sun Microsystems - Beijing China mdi_pi_pathname_obp_set(mdi_pathinfo_t *pip, char *component)
408638c67cbdSjiang wu - Sun Microsystems - Beijing China {
408738c67cbdSjiang wu - Sun Microsystems - Beijing China 	dev_info_t *pdip;
4088caa9369fSjiang wu - Sun Microsystems - Beijing China 	char *obp_path = NULL;
4089caa9369fSjiang wu - Sun Microsystems - Beijing China 	int rc = MDI_FAILURE;
409038c67cbdSjiang wu - Sun Microsystems - Beijing China 
409138c67cbdSjiang wu - Sun Microsystems - Beijing China 	if (pip == NULL)
409238c67cbdSjiang wu - Sun Microsystems - Beijing China 		return (MDI_FAILURE);
409338c67cbdSjiang wu - Sun Microsystems - Beijing China 
409438c67cbdSjiang wu - Sun Microsystems - Beijing China 	pdip = mdi_pi_get_phci(pip);
409538c67cbdSjiang wu - Sun Microsystems - Beijing China 	if (pdip == NULL)
409638c67cbdSjiang wu - Sun Microsystems - Beijing China 		return (MDI_FAILURE);
409738c67cbdSjiang wu - Sun Microsystems - Beijing China 
4098caa9369fSjiang wu - Sun Microsystems - Beijing China 	obp_path = kmem_zalloc(MAXPATHLEN, KM_SLEEP);
4099caa9369fSjiang wu - Sun Microsystems - Beijing China 
410038c67cbdSjiang wu - Sun Microsystems - Beijing China 	if (ddi_pathname_obp(pdip, obp_path) == NULL) {
410138c67cbdSjiang wu - Sun Microsystems - Beijing China 		(void) ddi_pathname(pdip, obp_path);
410238c67cbdSjiang wu - Sun Microsystems - Beijing China 	}
410338c67cbdSjiang wu - Sun Microsystems - Beijing China 
410438c67cbdSjiang wu - Sun Microsystems - Beijing China 	if (component) {
4105caa9369fSjiang wu - Sun Microsystems - Beijing China 		(void) strncat(obp_path, "/", MAXPATHLEN);
4106caa9369fSjiang wu - Sun Microsystems - Beijing China 		(void) strncat(obp_path, component, MAXPATHLEN);
410738c67cbdSjiang wu - Sun Microsystems - Beijing China 	}
4108caa9369fSjiang wu - Sun Microsystems - Beijing China 	rc = mdi_prop_update_string(pip, "obp-path", obp_path);
410938c67cbdSjiang wu - Sun Microsystems - Beijing China 
4110caa9369fSjiang wu - Sun Microsystems - Beijing China 	if (obp_path)
4111caa9369fSjiang wu - Sun Microsystems - Beijing China 		kmem_free(obp_path, MAXPATHLEN);
4112caa9369fSjiang wu - Sun Microsystems - Beijing China 	return (rc);
411338c67cbdSjiang wu - Sun Microsystems - Beijing China }
411438c67cbdSjiang wu - Sun Microsystems - Beijing China 
4115602ca9eaScth /*
41167c478bd9Sstevel@tonic-gate  * mdi_pi_get_client():
41177c478bd9Sstevel@tonic-gate  *		Get the client devinfo associated with a mdi_pathinfo node
41187c478bd9Sstevel@tonic-gate  *
41197c478bd9Sstevel@tonic-gate  * Return Values:
41207c478bd9Sstevel@tonic-gate  *		Handle to client device dev_info node
41217c478bd9Sstevel@tonic-gate  */
41227c478bd9Sstevel@tonic-gate dev_info_t *
41237c478bd9Sstevel@tonic-gate mdi_pi_get_client(mdi_pathinfo_t *pip)
41247c478bd9Sstevel@tonic-gate {
41257c478bd9Sstevel@tonic-gate 	dev_info_t	*dip = NULL;
41267c478bd9Sstevel@tonic-gate 	if (pip) {
41277c478bd9Sstevel@tonic-gate 		dip = MDI_PI(pip)->pi_client->ct_dip;
41287c478bd9Sstevel@tonic-gate 	}
41297c478bd9Sstevel@tonic-gate 	return (dip);
41307c478bd9Sstevel@tonic-gate }
41317c478bd9Sstevel@tonic-gate 
41327c478bd9Sstevel@tonic-gate /*
41337c478bd9Sstevel@tonic-gate  * mdi_pi_get_phci():
41347c478bd9Sstevel@tonic-gate  *		Get the pHCI devinfo associated with the mdi_pathinfo node
41357c478bd9Sstevel@tonic-gate  * Return Values:
41367c478bd9Sstevel@tonic-gate  *		Handle to dev_info node
41377c478bd9Sstevel@tonic-gate  */
41387c478bd9Sstevel@tonic-gate dev_info_t *
41397c478bd9Sstevel@tonic-gate mdi_pi_get_phci(mdi_pathinfo_t *pip)
41407c478bd9Sstevel@tonic-gate {
41417c478bd9Sstevel@tonic-gate 	dev_info_t	*dip = NULL;
41424c06356bSdh142964 	mdi_phci_t	*ph;
41434c06356bSdh142964 
41447c478bd9Sstevel@tonic-gate 	if (pip) {
41454c06356bSdh142964 		ph = MDI_PI(pip)->pi_phci;
41464c06356bSdh142964 		if (ph)
41474c06356bSdh142964 			dip = ph->ph_dip;
41487c478bd9Sstevel@tonic-gate 	}
41497c478bd9Sstevel@tonic-gate 	return (dip);
41507c478bd9Sstevel@tonic-gate }
41517c478bd9Sstevel@tonic-gate 
41527c478bd9Sstevel@tonic-gate /*
41537c478bd9Sstevel@tonic-gate  * mdi_pi_get_client_private():
41547c478bd9Sstevel@tonic-gate  *		Get the client private information associated with the
41557c478bd9Sstevel@tonic-gate  *		mdi_pathinfo node
41567c478bd9Sstevel@tonic-gate  */
41577c478bd9Sstevel@tonic-gate void *
41587c478bd9Sstevel@tonic-gate mdi_pi_get_client_private(mdi_pathinfo_t *pip)
41597c478bd9Sstevel@tonic-gate {
41607c478bd9Sstevel@tonic-gate 	void *cprivate = NULL;
41617c478bd9Sstevel@tonic-gate 	if (pip) {
41627c478bd9Sstevel@tonic-gate 		cprivate = MDI_PI(pip)->pi_cprivate;
41637c478bd9Sstevel@tonic-gate 	}
41647c478bd9Sstevel@tonic-gate 	return (cprivate);
41657c478bd9Sstevel@tonic-gate }
41667c478bd9Sstevel@tonic-gate 
41677c478bd9Sstevel@tonic-gate /*
41687c478bd9Sstevel@tonic-gate  * mdi_pi_set_client_private():
41697c478bd9Sstevel@tonic-gate  *		Set the client private information in the mdi_pathinfo node
41707c478bd9Sstevel@tonic-gate  */
41717c478bd9Sstevel@tonic-gate void
41727c478bd9Sstevel@tonic-gate mdi_pi_set_client_private(mdi_pathinfo_t *pip, void *priv)
41737c478bd9Sstevel@tonic-gate {
41747c478bd9Sstevel@tonic-gate 	if (pip) {
41757c478bd9Sstevel@tonic-gate 		MDI_PI(pip)->pi_cprivate = priv;
41767c478bd9Sstevel@tonic-gate 	}
41777c478bd9Sstevel@tonic-gate }
41787c478bd9Sstevel@tonic-gate 
41797c478bd9Sstevel@tonic-gate /*
41807c478bd9Sstevel@tonic-gate  * mdi_pi_get_phci_private():
41817c478bd9Sstevel@tonic-gate  *		Get the pHCI private information associated with the
41827c478bd9Sstevel@tonic-gate  *		mdi_pathinfo node
41837c478bd9Sstevel@tonic-gate  */
41847c478bd9Sstevel@tonic-gate caddr_t
41857c478bd9Sstevel@tonic-gate mdi_pi_get_phci_private(mdi_pathinfo_t *pip)
41867c478bd9Sstevel@tonic-gate {
41877c478bd9Sstevel@tonic-gate 	caddr_t	pprivate = NULL;
41884c06356bSdh142964 
41897c478bd9Sstevel@tonic-gate 	if (pip) {
41907c478bd9Sstevel@tonic-gate 		pprivate = MDI_PI(pip)->pi_pprivate;
41917c478bd9Sstevel@tonic-gate 	}
41927c478bd9Sstevel@tonic-gate 	return (pprivate);
41937c478bd9Sstevel@tonic-gate }
41947c478bd9Sstevel@tonic-gate 
41957c478bd9Sstevel@tonic-gate /*
41967c478bd9Sstevel@tonic-gate  * mdi_pi_set_phci_private():
41977c478bd9Sstevel@tonic-gate  *		Set the pHCI private information in the mdi_pathinfo node
41987c478bd9Sstevel@tonic-gate  */
41997c478bd9Sstevel@tonic-gate void
42007c478bd9Sstevel@tonic-gate mdi_pi_set_phci_private(mdi_pathinfo_t *pip, caddr_t priv)
42017c478bd9Sstevel@tonic-gate {
42027c478bd9Sstevel@tonic-gate 	if (pip) {
42037c478bd9Sstevel@tonic-gate 		MDI_PI(pip)->pi_pprivate = priv;
42047c478bd9Sstevel@tonic-gate 	}
42057c478bd9Sstevel@tonic-gate }
42067c478bd9Sstevel@tonic-gate 
42077c478bd9Sstevel@tonic-gate /*
42087c478bd9Sstevel@tonic-gate  * mdi_pi_get_state():
42097c478bd9Sstevel@tonic-gate  *		Get the mdi_pathinfo node state. Transient states are internal
42107c478bd9Sstevel@tonic-gate  *		and not provided to the users
42117c478bd9Sstevel@tonic-gate  */
42127c478bd9Sstevel@tonic-gate mdi_pathinfo_state_t
42137c478bd9Sstevel@tonic-gate mdi_pi_get_state(mdi_pathinfo_t *pip)
42147c478bd9Sstevel@tonic-gate {
42157c478bd9Sstevel@tonic-gate 	mdi_pathinfo_state_t    state = MDI_PATHINFO_STATE_INIT;
42167c478bd9Sstevel@tonic-gate 
42177c478bd9Sstevel@tonic-gate 	if (pip) {
42187c478bd9Sstevel@tonic-gate 		if (MDI_PI_IS_TRANSIENT(pip)) {
42197c478bd9Sstevel@tonic-gate 			/*
42207c478bd9Sstevel@tonic-gate 			 * mdi_pathinfo is in state transition.  Return the
42217c478bd9Sstevel@tonic-gate 			 * last good state.
42227c478bd9Sstevel@tonic-gate 			 */
42237c478bd9Sstevel@tonic-gate 			state = MDI_PI_OLD_STATE(pip);
42247c478bd9Sstevel@tonic-gate 		} else {
42257c478bd9Sstevel@tonic-gate 			state = MDI_PI_STATE(pip);
42267c478bd9Sstevel@tonic-gate 		}
42277c478bd9Sstevel@tonic-gate 	}
42287c478bd9Sstevel@tonic-gate 	return (state);
42297c478bd9Sstevel@tonic-gate }
42307c478bd9Sstevel@tonic-gate 
42317c478bd9Sstevel@tonic-gate /*
42324c06356bSdh142964  * mdi_pi_get_flags():
42334c06356bSdh142964  *		Get the mdi_pathinfo node flags.
42344c06356bSdh142964  */
42354c06356bSdh142964 uint_t
42364c06356bSdh142964 mdi_pi_get_flags(mdi_pathinfo_t *pip)
42374c06356bSdh142964 {
42384c06356bSdh142964 	return (pip ? MDI_PI(pip)->pi_flags : 0);
42394c06356bSdh142964 }
42404c06356bSdh142964 
42414c06356bSdh142964 /*
42427c478bd9Sstevel@tonic-gate  * Note that the following function needs to be the new interface for
42437c478bd9Sstevel@tonic-gate  * mdi_pi_get_state when mpxio gets integrated to ON.
42447c478bd9Sstevel@tonic-gate  */
42457c478bd9Sstevel@tonic-gate int
42467c478bd9Sstevel@tonic-gate mdi_pi_get_state2(mdi_pathinfo_t *pip, mdi_pathinfo_state_t *state,
42477c478bd9Sstevel@tonic-gate 		uint32_t *ext_state)
42487c478bd9Sstevel@tonic-gate {
42497c478bd9Sstevel@tonic-gate 	*state = MDI_PATHINFO_STATE_INIT;
42507c478bd9Sstevel@tonic-gate 
42517c478bd9Sstevel@tonic-gate 	if (pip) {
42527c478bd9Sstevel@tonic-gate 		if (MDI_PI_IS_TRANSIENT(pip)) {
42537c478bd9Sstevel@tonic-gate 			/*
42547c478bd9Sstevel@tonic-gate 			 * mdi_pathinfo is in state transition.  Return the
42557c478bd9Sstevel@tonic-gate 			 * last good state.
42567c478bd9Sstevel@tonic-gate 			 */
42577c478bd9Sstevel@tonic-gate 			*state = MDI_PI_OLD_STATE(pip);
42587c478bd9Sstevel@tonic-gate 			*ext_state = MDI_PI_OLD_EXT_STATE(pip);
42597c478bd9Sstevel@tonic-gate 		} else {
42607c478bd9Sstevel@tonic-gate 			*state = MDI_PI_STATE(pip);
42617c478bd9Sstevel@tonic-gate 			*ext_state = MDI_PI_EXT_STATE(pip);
42627c478bd9Sstevel@tonic-gate 		}
42637c478bd9Sstevel@tonic-gate 	}
42647c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
42657c478bd9Sstevel@tonic-gate }
42667c478bd9Sstevel@tonic-gate 
42677c478bd9Sstevel@tonic-gate /*
42687c478bd9Sstevel@tonic-gate  * mdi_pi_get_preferred:
42697c478bd9Sstevel@tonic-gate  *	Get the preferred path flag
42707c478bd9Sstevel@tonic-gate  */
42717c478bd9Sstevel@tonic-gate int
42727c478bd9Sstevel@tonic-gate mdi_pi_get_preferred(mdi_pathinfo_t *pip)
42737c478bd9Sstevel@tonic-gate {
42747c478bd9Sstevel@tonic-gate 	if (pip) {
42757c478bd9Sstevel@tonic-gate 		return (MDI_PI(pip)->pi_preferred);
42767c478bd9Sstevel@tonic-gate 	}
42777c478bd9Sstevel@tonic-gate 	return (0);
42787c478bd9Sstevel@tonic-gate }
42797c478bd9Sstevel@tonic-gate 
42807c478bd9Sstevel@tonic-gate /*
42817c478bd9Sstevel@tonic-gate  * mdi_pi_set_preferred:
42827c478bd9Sstevel@tonic-gate  *	Set the preferred path flag
42837c478bd9Sstevel@tonic-gate  */
42847c478bd9Sstevel@tonic-gate void
42857c478bd9Sstevel@tonic-gate mdi_pi_set_preferred(mdi_pathinfo_t *pip, int preferred)
42867c478bd9Sstevel@tonic-gate {
42877c478bd9Sstevel@tonic-gate 	if (pip) {
42887c478bd9Sstevel@tonic-gate 		MDI_PI(pip)->pi_preferred = preferred;
42897c478bd9Sstevel@tonic-gate 	}
42907c478bd9Sstevel@tonic-gate }
42917c478bd9Sstevel@tonic-gate 
42927c478bd9Sstevel@tonic-gate /*
42937c478bd9Sstevel@tonic-gate  * mdi_pi_set_state():
42947c478bd9Sstevel@tonic-gate  *		Set the mdi_pathinfo node state
42957c478bd9Sstevel@tonic-gate  */
42967c478bd9Sstevel@tonic-gate void
42977c478bd9Sstevel@tonic-gate mdi_pi_set_state(mdi_pathinfo_t *pip, mdi_pathinfo_state_t state)
42987c478bd9Sstevel@tonic-gate {
42997c478bd9Sstevel@tonic-gate 	uint32_t	ext_state;
43007c478bd9Sstevel@tonic-gate 
43017c478bd9Sstevel@tonic-gate 	if (pip) {
43027c478bd9Sstevel@tonic-gate 		ext_state = MDI_PI(pip)->pi_state & MDI_PATHINFO_EXT_STATE_MASK;
43037c478bd9Sstevel@tonic-gate 		MDI_PI(pip)->pi_state = state;
43047c478bd9Sstevel@tonic-gate 		MDI_PI(pip)->pi_state |= ext_state;
43054c06356bSdh142964 
43064c06356bSdh142964 		/* Path has changed state, invalidate DINFOCACHE snap shot. */
43074c06356bSdh142964 		i_ddi_di_cache_invalidate();
43087c478bd9Sstevel@tonic-gate 	}
43097c478bd9Sstevel@tonic-gate }
43107c478bd9Sstevel@tonic-gate 
43117c478bd9Sstevel@tonic-gate /*
43127c478bd9Sstevel@tonic-gate  * Property functions:
43137c478bd9Sstevel@tonic-gate  */
43147c478bd9Sstevel@tonic-gate int
43157c478bd9Sstevel@tonic-gate i_map_nvlist_error_to_mdi(int val)
43167c478bd9Sstevel@tonic-gate {
43177c478bd9Sstevel@tonic-gate 	int rv;
43187c478bd9Sstevel@tonic-gate 
43197c478bd9Sstevel@tonic-gate 	switch (val) {
43207c478bd9Sstevel@tonic-gate 	case 0:
43217c478bd9Sstevel@tonic-gate 		rv = DDI_PROP_SUCCESS;
43227c478bd9Sstevel@tonic-gate 		break;
43237c478bd9Sstevel@tonic-gate 	case EINVAL:
43247c478bd9Sstevel@tonic-gate 	case ENOTSUP:
43257c478bd9Sstevel@tonic-gate 		rv = DDI_PROP_INVAL_ARG;
43267c478bd9Sstevel@tonic-gate 		break;
43277c478bd9Sstevel@tonic-gate 	case ENOMEM:
43287c478bd9Sstevel@tonic-gate 		rv = DDI_PROP_NO_MEMORY;
43297c478bd9Sstevel@tonic-gate 		break;
43307c478bd9Sstevel@tonic-gate 	default:
43317c478bd9Sstevel@tonic-gate 		rv = DDI_PROP_NOT_FOUND;
43327c478bd9Sstevel@tonic-gate 		break;
43337c478bd9Sstevel@tonic-gate 	}
43347c478bd9Sstevel@tonic-gate 	return (rv);
43357c478bd9Sstevel@tonic-gate }
43367c478bd9Sstevel@tonic-gate 
43377c478bd9Sstevel@tonic-gate /*
43387c478bd9Sstevel@tonic-gate  * mdi_pi_get_next_prop():
43397c478bd9Sstevel@tonic-gate  * 		Property walk function.  The caller should hold mdi_pi_lock()
43407c478bd9Sstevel@tonic-gate  *		and release by calling mdi_pi_unlock() at the end of walk to
43417c478bd9Sstevel@tonic-gate  *		get a consistent value.
43427c478bd9Sstevel@tonic-gate  */
43437c478bd9Sstevel@tonic-gate nvpair_t *
43447c478bd9Sstevel@tonic-gate mdi_pi_get_next_prop(mdi_pathinfo_t *pip, nvpair_t *prev)
43457c478bd9Sstevel@tonic-gate {
43467c478bd9Sstevel@tonic-gate 	if ((pip == NULL) || (MDI_PI(pip)->pi_prop == NULL)) {
43477c478bd9Sstevel@tonic-gate 		return (NULL);
43487c478bd9Sstevel@tonic-gate 	}
43495e3986cbScth 	ASSERT(MDI_PI_LOCKED(pip));
43507c478bd9Sstevel@tonic-gate 	return (nvlist_next_nvpair(MDI_PI(pip)->pi_prop, prev));
43517c478bd9Sstevel@tonic-gate }
43527c478bd9Sstevel@tonic-gate 
43537c478bd9Sstevel@tonic-gate /*
43547c478bd9Sstevel@tonic-gate  * mdi_prop_remove():
43557c478bd9Sstevel@tonic-gate  * 		Remove the named property from the named list.
43567c478bd9Sstevel@tonic-gate  */
43577c478bd9Sstevel@tonic-gate int
43587c478bd9Sstevel@tonic-gate mdi_prop_remove(mdi_pathinfo_t *pip, char *name)
43597c478bd9Sstevel@tonic-gate {
43607c478bd9Sstevel@tonic-gate 	if (pip == NULL) {
43617c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
43627c478bd9Sstevel@tonic-gate 	}
43635e3986cbScth 	ASSERT(!MDI_PI_LOCKED(pip));
43647c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
43657c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_prop == NULL) {
43667c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
43677c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
43687c478bd9Sstevel@tonic-gate 	}
43697c478bd9Sstevel@tonic-gate 	if (name) {
43707c478bd9Sstevel@tonic-gate 		(void) nvlist_remove_all(MDI_PI(pip)->pi_prop, name);
43717c478bd9Sstevel@tonic-gate 	} else {
43727c478bd9Sstevel@tonic-gate 		char		nvp_name[MAXNAMELEN];
43737c478bd9Sstevel@tonic-gate 		nvpair_t	*nvp;
43747c478bd9Sstevel@tonic-gate 		nvp = nvlist_next_nvpair(MDI_PI(pip)->pi_prop, NULL);
43757c478bd9Sstevel@tonic-gate 		while (nvp) {
43767c478bd9Sstevel@tonic-gate 			nvpair_t	*next;
43777c478bd9Sstevel@tonic-gate 			next = nvlist_next_nvpair(MDI_PI(pip)->pi_prop, nvp);
43784c06356bSdh142964 			(void) snprintf(nvp_name, sizeof(nvp_name), "%s",
43797c478bd9Sstevel@tonic-gate 			    nvpair_name(nvp));
43807c478bd9Sstevel@tonic-gate 			(void) nvlist_remove_all(MDI_PI(pip)->pi_prop,
43817c478bd9Sstevel@tonic-gate 			    nvp_name);
43827c478bd9Sstevel@tonic-gate 			nvp = next;
43837c478bd9Sstevel@tonic-gate 		}
43847c478bd9Sstevel@tonic-gate 	}
43857c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
43867c478bd9Sstevel@tonic-gate 	return (DDI_PROP_SUCCESS);
43877c478bd9Sstevel@tonic-gate }
43887c478bd9Sstevel@tonic-gate 
43897c478bd9Sstevel@tonic-gate /*
43907c478bd9Sstevel@tonic-gate  * mdi_prop_size():
43917c478bd9Sstevel@tonic-gate  * 		Get buffer size needed to pack the property data.
43927c478bd9Sstevel@tonic-gate  * 		Caller should hold the mdi_pathinfo_t lock to get a consistent
43937c478bd9Sstevel@tonic-gate  *		buffer size.
43947c478bd9Sstevel@tonic-gate  */
43957c478bd9Sstevel@tonic-gate int
43967c478bd9Sstevel@tonic-gate mdi_prop_size(mdi_pathinfo_t *pip, size_t *buflenp)
43977c478bd9Sstevel@tonic-gate {
43987c478bd9Sstevel@tonic-gate 	int	rv;
43997c478bd9Sstevel@tonic-gate 	size_t	bufsize;
44007c478bd9Sstevel@tonic-gate 
44017c478bd9Sstevel@tonic-gate 	*buflenp = 0;
44027c478bd9Sstevel@tonic-gate 	if ((pip == NULL) || (MDI_PI(pip)->pi_prop == NULL)) {
44037c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
44047c478bd9Sstevel@tonic-gate 	}
44055e3986cbScth 	ASSERT(MDI_PI_LOCKED(pip));
44067c478bd9Sstevel@tonic-gate 	rv = nvlist_size(MDI_PI(pip)->pi_prop,
44077c478bd9Sstevel@tonic-gate 	    &bufsize, NV_ENCODE_NATIVE);
44087c478bd9Sstevel@tonic-gate 	*buflenp = bufsize;
44097c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
44107c478bd9Sstevel@tonic-gate }
44117c478bd9Sstevel@tonic-gate 
44127c478bd9Sstevel@tonic-gate /*
44137c478bd9Sstevel@tonic-gate  * mdi_prop_pack():
44147c478bd9Sstevel@tonic-gate  * 		pack the property list.  The caller should hold the
44157c478bd9Sstevel@tonic-gate  *		mdi_pathinfo_t node to get a consistent data
44167c478bd9Sstevel@tonic-gate  */
44177c478bd9Sstevel@tonic-gate int
44187c478bd9Sstevel@tonic-gate mdi_prop_pack(mdi_pathinfo_t *pip, char **bufp, uint_t buflen)
44197c478bd9Sstevel@tonic-gate {
44207c478bd9Sstevel@tonic-gate 	int	rv;
44217c478bd9Sstevel@tonic-gate 	size_t	bufsize;
44227c478bd9Sstevel@tonic-gate 
44237c478bd9Sstevel@tonic-gate 	if ((pip == NULL) || MDI_PI(pip)->pi_prop == NULL) {
44247c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
44257c478bd9Sstevel@tonic-gate 	}
44267c478bd9Sstevel@tonic-gate 
44275e3986cbScth 	ASSERT(MDI_PI_LOCKED(pip));
44287c478bd9Sstevel@tonic-gate 
44297c478bd9Sstevel@tonic-gate 	bufsize = buflen;
44307c478bd9Sstevel@tonic-gate 	rv = nvlist_pack(MDI_PI(pip)->pi_prop, bufp, (size_t *)&bufsize,
44317c478bd9Sstevel@tonic-gate 	    NV_ENCODE_NATIVE, KM_SLEEP);
44327c478bd9Sstevel@tonic-gate 
44337c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
44347c478bd9Sstevel@tonic-gate }
44357c478bd9Sstevel@tonic-gate 
44367c478bd9Sstevel@tonic-gate /*
44377c478bd9Sstevel@tonic-gate  * mdi_prop_update_byte():
44387c478bd9Sstevel@tonic-gate  *		Create/Update a byte property
44397c478bd9Sstevel@tonic-gate  */
44407c478bd9Sstevel@tonic-gate int
44417c478bd9Sstevel@tonic-gate mdi_prop_update_byte(mdi_pathinfo_t *pip, char *name, uchar_t data)
44427c478bd9Sstevel@tonic-gate {
44437c478bd9Sstevel@tonic-gate 	int rv;
44447c478bd9Sstevel@tonic-gate 
44457c478bd9Sstevel@tonic-gate 	if (pip == NULL) {
44467c478bd9Sstevel@tonic-gate 		return (DDI_PROP_INVAL_ARG);
44477c478bd9Sstevel@tonic-gate 	}
44485e3986cbScth 	ASSERT(!MDI_PI_LOCKED(pip));
44497c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
44507c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_prop == NULL) {
44517c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
44527c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
44537c478bd9Sstevel@tonic-gate 	}
44547c478bd9Sstevel@tonic-gate 	rv = nvlist_add_byte(MDI_PI(pip)->pi_prop, name, data);
44557c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
44567c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
44577c478bd9Sstevel@tonic-gate }
44587c478bd9Sstevel@tonic-gate 
44597c478bd9Sstevel@tonic-gate /*
44607c478bd9Sstevel@tonic-gate  * mdi_prop_update_byte_array():
44617c478bd9Sstevel@tonic-gate  *		Create/Update a byte array property
44627c478bd9Sstevel@tonic-gate  */
44637c478bd9Sstevel@tonic-gate int
44647c478bd9Sstevel@tonic-gate mdi_prop_update_byte_array(mdi_pathinfo_t *pip, char *name, uchar_t *data,
44657c478bd9Sstevel@tonic-gate     uint_t nelements)
44667c478bd9Sstevel@tonic-gate {
44677c478bd9Sstevel@tonic-gate 	int rv;
44687c478bd9Sstevel@tonic-gate 
44697c478bd9Sstevel@tonic-gate 	if (pip == NULL) {
44707c478bd9Sstevel@tonic-gate 		return (DDI_PROP_INVAL_ARG);
44717c478bd9Sstevel@tonic-gate 	}
44725e3986cbScth 	ASSERT(!MDI_PI_LOCKED(pip));
44737c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
44747c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_prop == NULL) {
44757c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
44767c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
44777c478bd9Sstevel@tonic-gate 	}
44787c478bd9Sstevel@tonic-gate 	rv = nvlist_add_byte_array(MDI_PI(pip)->pi_prop, name, data, nelements);
44797c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
44807c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
44817c478bd9Sstevel@tonic-gate }
44827c478bd9Sstevel@tonic-gate 
44837c478bd9Sstevel@tonic-gate /*
44847c478bd9Sstevel@tonic-gate  * mdi_prop_update_int():
44857c478bd9Sstevel@tonic-gate  *		Create/Update a 32 bit integer property
44867c478bd9Sstevel@tonic-gate  */
44877c478bd9Sstevel@tonic-gate int
44887c478bd9Sstevel@tonic-gate mdi_prop_update_int(mdi_pathinfo_t *pip, char *name, int data)
44897c478bd9Sstevel@tonic-gate {
44907c478bd9Sstevel@tonic-gate 	int rv;
44917c478bd9Sstevel@tonic-gate 
44927c478bd9Sstevel@tonic-gate 	if (pip == NULL) {
44937c478bd9Sstevel@tonic-gate 		return (DDI_PROP_INVAL_ARG);
44947c478bd9Sstevel@tonic-gate 	}
44955e3986cbScth 	ASSERT(!MDI_PI_LOCKED(pip));
44967c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
44977c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_prop == NULL) {
44987c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
44997c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
45007c478bd9Sstevel@tonic-gate 	}
45017c478bd9Sstevel@tonic-gate 	rv = nvlist_add_int32(MDI_PI(pip)->pi_prop, name, (int32_t)data);
45027c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
45037c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
45047c478bd9Sstevel@tonic-gate }
45057c478bd9Sstevel@tonic-gate 
45067c478bd9Sstevel@tonic-gate /*
45077c478bd9Sstevel@tonic-gate  * mdi_prop_update_int64():
45087c478bd9Sstevel@tonic-gate  *		Create/Update a 64 bit integer property
45097c478bd9Sstevel@tonic-gate  */
45107c478bd9Sstevel@tonic-gate int
45117c478bd9Sstevel@tonic-gate mdi_prop_update_int64(mdi_pathinfo_t *pip, char *name, int64_t data)
45127c478bd9Sstevel@tonic-gate {
45137c478bd9Sstevel@tonic-gate 	int rv;
45147c478bd9Sstevel@tonic-gate 
45157c478bd9Sstevel@tonic-gate 	if (pip == NULL) {
45167c478bd9Sstevel@tonic-gate 		return (DDI_PROP_INVAL_ARG);
45177c478bd9Sstevel@tonic-gate 	}
45185e3986cbScth 	ASSERT(!MDI_PI_LOCKED(pip));
45197c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
45207c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_prop == NULL) {
45217c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
45227c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
45237c478bd9Sstevel@tonic-gate 	}
45247c478bd9Sstevel@tonic-gate 	rv = nvlist_add_int64(MDI_PI(pip)->pi_prop, name, data);
45257c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
45267c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
45277c478bd9Sstevel@tonic-gate }
45287c478bd9Sstevel@tonic-gate 
45297c478bd9Sstevel@tonic-gate /*
45307c478bd9Sstevel@tonic-gate  * mdi_prop_update_int_array():
45317c478bd9Sstevel@tonic-gate  *		Create/Update a int array property
45327c478bd9Sstevel@tonic-gate  */
45337c478bd9Sstevel@tonic-gate int
45347c478bd9Sstevel@tonic-gate mdi_prop_update_int_array(mdi_pathinfo_t *pip, char *name, int *data,
45357c478bd9Sstevel@tonic-gate 	    uint_t nelements)
45367c478bd9Sstevel@tonic-gate {
45377c478bd9Sstevel@tonic-gate 	int rv;
45387c478bd9Sstevel@tonic-gate 
45397c478bd9Sstevel@tonic-gate 	if (pip == NULL) {
45407c478bd9Sstevel@tonic-gate 		return (DDI_PROP_INVAL_ARG);
45417c478bd9Sstevel@tonic-gate 	}
45425e3986cbScth 	ASSERT(!MDI_PI_LOCKED(pip));
45437c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
45447c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_prop == NULL) {
45457c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
45467c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
45477c478bd9Sstevel@tonic-gate 	}
45487c478bd9Sstevel@tonic-gate 	rv = nvlist_add_int32_array(MDI_PI(pip)->pi_prop, name, (int32_t *)data,
45497c478bd9Sstevel@tonic-gate 	    nelements);
45507c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
45517c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
45527c478bd9Sstevel@tonic-gate }
45537c478bd9Sstevel@tonic-gate 
45547c478bd9Sstevel@tonic-gate /*
45557c478bd9Sstevel@tonic-gate  * mdi_prop_update_string():
45567c478bd9Sstevel@tonic-gate  *		Create/Update a string property
45577c478bd9Sstevel@tonic-gate  */
45587c478bd9Sstevel@tonic-gate int
45597c478bd9Sstevel@tonic-gate mdi_prop_update_string(mdi_pathinfo_t *pip, char *name, char *data)
45607c478bd9Sstevel@tonic-gate {
45617c478bd9Sstevel@tonic-gate 	int rv;
45627c478bd9Sstevel@tonic-gate 
45637c478bd9Sstevel@tonic-gate 	if (pip == NULL) {
45647c478bd9Sstevel@tonic-gate 		return (DDI_PROP_INVAL_ARG);
45657c478bd9Sstevel@tonic-gate 	}
45665e3986cbScth 	ASSERT(!MDI_PI_LOCKED(pip));
45677c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
45687c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_prop == NULL) {
45697c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
45707c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
45717c478bd9Sstevel@tonic-gate 	}
45727c478bd9Sstevel@tonic-gate 	rv = nvlist_add_string(MDI_PI(pip)->pi_prop, name, data);
45737c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
45747c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
45757c478bd9Sstevel@tonic-gate }
45767c478bd9Sstevel@tonic-gate 
45777c478bd9Sstevel@tonic-gate /*
45787c478bd9Sstevel@tonic-gate  * mdi_prop_update_string_array():
45797c478bd9Sstevel@tonic-gate  *		Create/Update a string array property
45807c478bd9Sstevel@tonic-gate  */
45817c478bd9Sstevel@tonic-gate int
45827c478bd9Sstevel@tonic-gate mdi_prop_update_string_array(mdi_pathinfo_t *pip, char *name, char **data,
45837c478bd9Sstevel@tonic-gate     uint_t nelements)
45847c478bd9Sstevel@tonic-gate {
45857c478bd9Sstevel@tonic-gate 	int rv;
45867c478bd9Sstevel@tonic-gate 
45877c478bd9Sstevel@tonic-gate 	if (pip == NULL) {
45887c478bd9Sstevel@tonic-gate 		return (DDI_PROP_INVAL_ARG);
45897c478bd9Sstevel@tonic-gate 	}
45905e3986cbScth 	ASSERT(!MDI_PI_LOCKED(pip));
45917c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
45927c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_prop == NULL) {
45937c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
45947c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
45957c478bd9Sstevel@tonic-gate 	}
45967c478bd9Sstevel@tonic-gate 	rv = nvlist_add_string_array(MDI_PI(pip)->pi_prop, name, data,
45977c478bd9Sstevel@tonic-gate 	    nelements);
45987c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
45997c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
46007c478bd9Sstevel@tonic-gate }
46017c478bd9Sstevel@tonic-gate 
46027c478bd9Sstevel@tonic-gate /*
46037c478bd9Sstevel@tonic-gate  * mdi_prop_lookup_byte():
46047c478bd9Sstevel@tonic-gate  * 		Look for byte property identified by name.  The data returned
46057c478bd9Sstevel@tonic-gate  *		is the actual property and valid as long as mdi_pathinfo_t node
46067c478bd9Sstevel@tonic-gate  *		is alive.
46077c478bd9Sstevel@tonic-gate  */
46087c478bd9Sstevel@tonic-gate int
46097c478bd9Sstevel@tonic-gate mdi_prop_lookup_byte(mdi_pathinfo_t *pip, char *name, uchar_t *data)
46107c478bd9Sstevel@tonic-gate {
46117c478bd9Sstevel@tonic-gate 	int rv;
46127c478bd9Sstevel@tonic-gate 
46137c478bd9Sstevel@tonic-gate 	if ((pip == NULL) || (MDI_PI(pip)->pi_prop == NULL)) {
46147c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
46157c478bd9Sstevel@tonic-gate 	}
46167c478bd9Sstevel@tonic-gate 	rv = nvlist_lookup_byte(MDI_PI(pip)->pi_prop, name, data);
46177c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
46187c478bd9Sstevel@tonic-gate }
46197c478bd9Sstevel@tonic-gate 
46207c478bd9Sstevel@tonic-gate 
46217c478bd9Sstevel@tonic-gate /*
46227c478bd9Sstevel@tonic-gate  * mdi_prop_lookup_byte_array():
46237c478bd9Sstevel@tonic-gate  * 		Look for byte array property identified by name.  The data
46247c478bd9Sstevel@tonic-gate  *		returned is the actual property and valid as long as
46257c478bd9Sstevel@tonic-gate  *		mdi_pathinfo_t node is alive.
46267c478bd9Sstevel@tonic-gate  */
46277c478bd9Sstevel@tonic-gate int
46287c478bd9Sstevel@tonic-gate mdi_prop_lookup_byte_array(mdi_pathinfo_t *pip, char *name, uchar_t **data,
46297c478bd9Sstevel@tonic-gate     uint_t *nelements)
46307c478bd9Sstevel@tonic-gate {
46317c478bd9Sstevel@tonic-gate 	int rv;
46327c478bd9Sstevel@tonic-gate 
46337c478bd9Sstevel@tonic-gate 	if ((pip == NULL) || (MDI_PI(pip)->pi_prop == NULL)) {
46347c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
46357c478bd9Sstevel@tonic-gate 	}
46367c478bd9Sstevel@tonic-gate 	rv = nvlist_lookup_byte_array(MDI_PI(pip)->pi_prop, name, data,
46377c478bd9Sstevel@tonic-gate 	    nelements);
46387c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
46397c478bd9Sstevel@tonic-gate }
46407c478bd9Sstevel@tonic-gate 
46417c478bd9Sstevel@tonic-gate /*
46427c478bd9Sstevel@tonic-gate  * mdi_prop_lookup_int():
46437c478bd9Sstevel@tonic-gate  * 		Look for int property identified by name.  The data returned
46447c478bd9Sstevel@tonic-gate  *		is the actual property and valid as long as mdi_pathinfo_t
46457c478bd9Sstevel@tonic-gate  *		node is alive.
46467c478bd9Sstevel@tonic-gate  */
46477c478bd9Sstevel@tonic-gate int
46487c478bd9Sstevel@tonic-gate mdi_prop_lookup_int(mdi_pathinfo_t *pip, char *name, int *data)
46497c478bd9Sstevel@tonic-gate {
46507c478bd9Sstevel@tonic-gate 	int rv;
46517c478bd9Sstevel@tonic-gate 
46527c478bd9Sstevel@tonic-gate 	if ((pip == NULL) || (MDI_PI(pip)->pi_prop == NULL)) {
46537c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
46547c478bd9Sstevel@tonic-gate 	}
46557c478bd9Sstevel@tonic-gate 	rv = nvlist_lookup_int32(MDI_PI(pip)->pi_prop, name, (int32_t *)data);
46567c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
46577c478bd9Sstevel@tonic-gate }
46587c478bd9Sstevel@tonic-gate 
46597c478bd9Sstevel@tonic-gate /*
46607c478bd9Sstevel@tonic-gate  * mdi_prop_lookup_int64():
46617c478bd9Sstevel@tonic-gate  * 		Look for int64 property identified by name.  The data returned
46627c478bd9Sstevel@tonic-gate  *		is the actual property and valid as long as mdi_pathinfo_t node
46637c478bd9Sstevel@tonic-gate  *		is alive.
46647c478bd9Sstevel@tonic-gate  */
46657c478bd9Sstevel@tonic-gate int
46667c478bd9Sstevel@tonic-gate mdi_prop_lookup_int64(mdi_pathinfo_t *pip, char *name, int64_t *data)
46677c478bd9Sstevel@tonic-gate {
46687c478bd9Sstevel@tonic-gate 	int rv;
46697c478bd9Sstevel@tonic-gate 	if ((pip == NULL) || (MDI_PI(pip)->pi_prop == NULL)) {
46707c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
46717c478bd9Sstevel@tonic-gate 	}
46727c478bd9Sstevel@tonic-gate 	rv = nvlist_lookup_int64(MDI_PI(pip)->pi_prop, name, data);
46737c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
46747c478bd9Sstevel@tonic-gate }
46757c478bd9Sstevel@tonic-gate 
46767c478bd9Sstevel@tonic-gate /*
46777c478bd9Sstevel@tonic-gate  * mdi_prop_lookup_int_array():
46787c478bd9Sstevel@tonic-gate  * 		Look for int array property identified by name.  The data
46797c478bd9Sstevel@tonic-gate  *		returned is the actual property and valid as long as
46807c478bd9Sstevel@tonic-gate  *		mdi_pathinfo_t node is alive.
46817c478bd9Sstevel@tonic-gate  */
46827c478bd9Sstevel@tonic-gate int
46837c478bd9Sstevel@tonic-gate mdi_prop_lookup_int_array(mdi_pathinfo_t *pip, char *name, int **data,
46847c478bd9Sstevel@tonic-gate     uint_t *nelements)
46857c478bd9Sstevel@tonic-gate {
46867c478bd9Sstevel@tonic-gate 	int rv;
46877c478bd9Sstevel@tonic-gate 
46887c478bd9Sstevel@tonic-gate 	if ((pip == NULL) || (MDI_PI(pip)->pi_prop == NULL)) {
46897c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
46907c478bd9Sstevel@tonic-gate 	}
46917c478bd9Sstevel@tonic-gate 	rv = nvlist_lookup_int32_array(MDI_PI(pip)->pi_prop, name,
46927c478bd9Sstevel@tonic-gate 	    (int32_t **)data, nelements);
46937c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
46947c478bd9Sstevel@tonic-gate }
46957c478bd9Sstevel@tonic-gate 
46967c478bd9Sstevel@tonic-gate /*
46977c478bd9Sstevel@tonic-gate  * mdi_prop_lookup_string():
46987c478bd9Sstevel@tonic-gate  * 		Look for string property identified by name.  The data
46997c478bd9Sstevel@tonic-gate  *		returned is the actual property and valid as long as
47007c478bd9Sstevel@tonic-gate  *		mdi_pathinfo_t node is alive.
47017c478bd9Sstevel@tonic-gate  */
47027c478bd9Sstevel@tonic-gate int
47037c478bd9Sstevel@tonic-gate mdi_prop_lookup_string(mdi_pathinfo_t *pip, char *name, char **data)
47047c478bd9Sstevel@tonic-gate {
47057c478bd9Sstevel@tonic-gate 	int rv;
47067c478bd9Sstevel@tonic-gate 
47077c478bd9Sstevel@tonic-gate 	if ((pip == NULL) || (MDI_PI(pip)->pi_prop == NULL)) {
47087c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
47097c478bd9Sstevel@tonic-gate 	}
47107c478bd9Sstevel@tonic-gate 	rv = nvlist_lookup_string(MDI_PI(pip)->pi_prop, name, data);
47117c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
47127c478bd9Sstevel@tonic-gate }
47137c478bd9Sstevel@tonic-gate 
47147c478bd9Sstevel@tonic-gate /*
47157c478bd9Sstevel@tonic-gate  * mdi_prop_lookup_string_array():
47167c478bd9Sstevel@tonic-gate  * 		Look for string array property identified by name.  The data
47177c478bd9Sstevel@tonic-gate  *		returned is the actual property and valid as long as
47187c478bd9Sstevel@tonic-gate  *		mdi_pathinfo_t node is alive.
47197c478bd9Sstevel@tonic-gate  */
47207c478bd9Sstevel@tonic-gate int
47217c478bd9Sstevel@tonic-gate mdi_prop_lookup_string_array(mdi_pathinfo_t *pip, char *name, char ***data,
47227c478bd9Sstevel@tonic-gate     uint_t *nelements)
47237c478bd9Sstevel@tonic-gate {
47247c478bd9Sstevel@tonic-gate 	int rv;
47257c478bd9Sstevel@tonic-gate 
47267c478bd9Sstevel@tonic-gate 	if ((pip == NULL) || (MDI_PI(pip)->pi_prop == NULL)) {
47277c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
47287c478bd9Sstevel@tonic-gate 	}
47297c478bd9Sstevel@tonic-gate 	rv = nvlist_lookup_string_array(MDI_PI(pip)->pi_prop, name, data,
47307c478bd9Sstevel@tonic-gate 	    nelements);
47317c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
47327c478bd9Sstevel@tonic-gate }
47337c478bd9Sstevel@tonic-gate 
47347c478bd9Sstevel@tonic-gate /*
47357c478bd9Sstevel@tonic-gate  * mdi_prop_free():
47367c478bd9Sstevel@tonic-gate  * 		Symmetrical function to ddi_prop_free(). nvlist_lookup_xx()
47377c478bd9Sstevel@tonic-gate  *		functions return the pointer to actual property data and not a
47387c478bd9Sstevel@tonic-gate  *		copy of it.  So the data returned is valid as long as
47397c478bd9Sstevel@tonic-gate  *		mdi_pathinfo_t node is valid.
47407c478bd9Sstevel@tonic-gate  */
47417c478bd9Sstevel@tonic-gate /*ARGSUSED*/
47427c478bd9Sstevel@tonic-gate int
47437c478bd9Sstevel@tonic-gate mdi_prop_free(void *data)
47447c478bd9Sstevel@tonic-gate {
47457c478bd9Sstevel@tonic-gate 	return (DDI_PROP_SUCCESS);
47467c478bd9Sstevel@tonic-gate }
47477c478bd9Sstevel@tonic-gate 
47487c478bd9Sstevel@tonic-gate /*ARGSUSED*/
47497c478bd9Sstevel@tonic-gate static void
47507c478bd9Sstevel@tonic-gate i_mdi_report_path_state(mdi_client_t *ct, mdi_pathinfo_t *pip)
47517c478bd9Sstevel@tonic-gate {
47524c06356bSdh142964 	char		*ct_path;
47537c478bd9Sstevel@tonic-gate 	char		*ct_status;
47547c478bd9Sstevel@tonic-gate 	char		*status;
47554c06356bSdh142964 	dev_info_t	*cdip = ct->ct_dip;
47567c478bd9Sstevel@tonic-gate 	char		lb_buf[64];
47574c06356bSdh142964 	int		report_lb_c = 0, report_lb_p = 0;
47587c478bd9Sstevel@tonic-gate 
47595e3986cbScth 	ASSERT(MDI_CLIENT_LOCKED(ct));
47604c06356bSdh142964 	if ((cdip == NULL) || (ddi_get_instance(cdip) == -1) ||
47617c478bd9Sstevel@tonic-gate 	    (MDI_CLIENT_IS_REPORT_DEV_NEEDED(ct) == 0)) {
47627c478bd9Sstevel@tonic-gate 		return;
47637c478bd9Sstevel@tonic-gate 	}
47647c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT_STATE(ct) == MDI_CLIENT_STATE_OPTIMAL) {
47657c478bd9Sstevel@tonic-gate 		ct_status = "optimal";
47664c06356bSdh142964 		report_lb_c = 1;
47677c478bd9Sstevel@tonic-gate 	} else if (MDI_CLIENT_STATE(ct) == MDI_CLIENT_STATE_DEGRADED) {
47687c478bd9Sstevel@tonic-gate 		ct_status = "degraded";
47697c478bd9Sstevel@tonic-gate 	} else if (MDI_CLIENT_STATE(ct) == MDI_CLIENT_STATE_FAILED) {
47707c478bd9Sstevel@tonic-gate 		ct_status = "failed";
47717c478bd9Sstevel@tonic-gate 	} else {
47727c478bd9Sstevel@tonic-gate 		ct_status = "unknown";
47737c478bd9Sstevel@tonic-gate 	}
47747c478bd9Sstevel@tonic-gate 
47754c06356bSdh142964 	lb_buf[0] = 0;		/* not interested in load balancing config */
47764c06356bSdh142964 
47774c06356bSdh142964 	if (MDI_PI_FLAGS_IS_DEVICE_REMOVED(pip)) {
47784c06356bSdh142964 		status = "removed";
47794c06356bSdh142964 	} else if (MDI_PI_IS_OFFLINE(pip)) {
47807c478bd9Sstevel@tonic-gate 		status = "offline";
47817c478bd9Sstevel@tonic-gate 	} else if (MDI_PI_IS_ONLINE(pip)) {
47827c478bd9Sstevel@tonic-gate 		status = "online";
47834c06356bSdh142964 		report_lb_p = 1;
47847c478bd9Sstevel@tonic-gate 	} else if (MDI_PI_IS_STANDBY(pip)) {
47857c478bd9Sstevel@tonic-gate 		status = "standby";
47867c478bd9Sstevel@tonic-gate 	} else if (MDI_PI_IS_FAULT(pip)) {
47877c478bd9Sstevel@tonic-gate 		status = "faulted";
47887c478bd9Sstevel@tonic-gate 	} else {
47897c478bd9Sstevel@tonic-gate 		status = "unknown";
47907c478bd9Sstevel@tonic-gate 	}
47917c478bd9Sstevel@tonic-gate 
47924c06356bSdh142964 	if (cdip) {
47934c06356bSdh142964 		ct_path = kmem_alloc(MAXPATHLEN, KM_SLEEP);
47944c06356bSdh142964 
47954c06356bSdh142964 		/*
47964c06356bSdh142964 		 * NOTE: Keeping "multipath status: %s" and
47974c06356bSdh142964 		 * "Load balancing: %s" format unchanged in case someone
47984c06356bSdh142964 		 * scrubs /var/adm/messages looking for these messages.
47994c06356bSdh142964 		 */
48004c06356bSdh142964 		if (report_lb_c && report_lb_p) {
48017c478bd9Sstevel@tonic-gate 			if (ct->ct_lb == LOAD_BALANCE_LBA) {
48027c478bd9Sstevel@tonic-gate 				(void) snprintf(lb_buf, sizeof (lb_buf),
48037c478bd9Sstevel@tonic-gate 				    "%s, region-size: %d", mdi_load_balance_lba,
48047c478bd9Sstevel@tonic-gate 				    ct->ct_lb_args->region_size);
48057c478bd9Sstevel@tonic-gate 			} else if (ct->ct_lb == LOAD_BALANCE_NONE) {
48067c478bd9Sstevel@tonic-gate 				(void) snprintf(lb_buf, sizeof (lb_buf),
48077c478bd9Sstevel@tonic-gate 				    "%s", mdi_load_balance_none);
48087c478bd9Sstevel@tonic-gate 			} else {
48097c478bd9Sstevel@tonic-gate 				(void) snprintf(lb_buf, sizeof (lb_buf), "%s",
48107c478bd9Sstevel@tonic-gate 				    mdi_load_balance_rr);
48117c478bd9Sstevel@tonic-gate 			}
48127c478bd9Sstevel@tonic-gate 
48134c06356bSdh142964 			cmn_err(mdi_debug_consoleonly ? CE_NOTE : CE_CONT,
48144c06356bSdh142964 			    "?%s (%s%d) multipath status: %s: "
48154c06356bSdh142964 			    "path %d %s is %s: Load balancing: %s\n",
48164c06356bSdh142964 			    ddi_pathname(cdip, ct_path), ddi_driver_name(cdip),
48174c06356bSdh142964 			    ddi_get_instance(cdip), ct_status,
48184c06356bSdh142964 			    mdi_pi_get_path_instance(pip),
48194c06356bSdh142964 			    mdi_pi_spathname(pip), status, lb_buf);
48204c06356bSdh142964 		} else {
48214c06356bSdh142964 			cmn_err(mdi_debug_consoleonly ? CE_NOTE : CE_CONT,
48224c06356bSdh142964 			    "?%s (%s%d) multipath status: %s: "
48234c06356bSdh142964 			    "path %d %s is %s\n",
48244c06356bSdh142964 			    ddi_pathname(cdip, ct_path), ddi_driver_name(cdip),
48254c06356bSdh142964 			    ddi_get_instance(cdip), ct_status,
48264c06356bSdh142964 			    mdi_pi_get_path_instance(pip),
48274c06356bSdh142964 			    mdi_pi_spathname(pip), status);
48284c06356bSdh142964 		}
48294c06356bSdh142964 
48307c478bd9Sstevel@tonic-gate 		kmem_free(ct_path, MAXPATHLEN);
48317c478bd9Sstevel@tonic-gate 		MDI_CLIENT_CLEAR_REPORT_DEV_NEEDED(ct);
48327c478bd9Sstevel@tonic-gate 	}
48337c478bd9Sstevel@tonic-gate }
48347c478bd9Sstevel@tonic-gate 
#ifdef	DEBUG
/*
 * i_mdi_log():
 *		Utility function for error message management
 *
 *		The caller's format string is expanded into a fixed-size
 *		local buffer (longer output is truncated) and handed to
 *		cmn_err() as "mdi: <driver><instance>: <func>: <message>".
 *		The "<driver><instance>: " part is omitted when dip is NULL.
 *
 *		A leading '!', '?' or '^' in the expanded message is stripped
 *		from the message and placed at the start of the cmn_err()
 *		format string instead, unless overridden by
 *		mdi_debug_logonly or mdi_debug_consoleonly.
 *
 *		NOTE: Implementation takes care of trailing \n for cmn_err,
 *		MDI_DEBUG should not terminate fmt strings with \n.
 *
 *		NOTE: If the level is >= 2, and there is no leading !?^
 *		then a leading ! is implied (but can be overridden via
 *		mdi_debug_consoleonly). If you are using kmdb on the console,
 *		consider setting mdi_debug_consoleonly to 1 as an aid.
 */
/*PRINTFLIKE4*/
static void
i_mdi_log(int level, const char *func, dev_info_t *dip, const char *fmt, ...)
{
	char		name[MAXNAMELEN];
	char		buf[512];
	char		*bp;
	va_list		ap;
	int		log_only = 0;
	int		boot_only = 0;
	int		console_only = 0;

	/* Build the "<driver><instance>: " tag; empty when there is no dip */
	if (dip) {
		(void) snprintf(name, sizeof (name), "%s%d: ",
		    ddi_driver_name(dip), ddi_get_instance(dip));
	} else {
		name[0] = 0;
	}

	va_start(ap, fmt);
	(void) vsnprintf(buf, sizeof (buf), fmt, ap);
	va_end(ap);

	/*
	 * Peel off a leading destination character and remember which one
	 * it was; bp points at the message text proper.
	 */
	switch (buf[0]) {
	case '!':
		bp = &buf[1];
		log_only = 1;
		break;
	case '?':
		bp = &buf[1];
		boot_only = 1;
		break;
	case '^':
		bp = &buf[1];
		console_only = 1;
		break;
	default:
		if (level >= 2)
			log_only = 1;		/* ! implied */
		bp = buf;
		break;
	}

	/* Global overrides; consoleonly is checked last and so wins */
	if (mdi_debug_logonly) {
		log_only = 1;
		boot_only = 0;
		console_only = 0;
	}
	if (mdi_debug_consoleonly) {
		log_only = 0;
		boot_only = 0;
		console_only = 1;
		level = CE_NOTE;
		/* enters the CE_WARN/CE_PANIC arm below with level CE_NOTE */
		goto console;
	}

	switch (level) {
	case CE_NOTE:
		level = CE_CONT;
		/* FALLTHROUGH */
	case CE_CONT:
		/* these format strings carry their own trailing newline */
		if (boot_only) {
			cmn_err(level, "?mdi: %s%s: %s\n", name, func, bp);
		} else if (console_only) {
			cmn_err(level, "^mdi: %s%s: %s\n", name, func, bp);
		} else if (log_only) {
			cmn_err(level, "!mdi: %s%s: %s\n", name, func, bp);
		} else {
			cmn_err(level, "mdi: %s%s: %s\n", name, func, bp);
		}
		break;

	case CE_WARN:
	case CE_PANIC:
	console:
		if (boot_only) {
			cmn_err(level, "?mdi: %s%s: %s", name, func, bp);
		} else if (console_only) {
			cmn_err(level, "^mdi: %s%s: %s", name, func, bp);
		} else if (log_only) {
			cmn_err(level, "!mdi: %s%s: %s", name, func, bp);
		} else {
			cmn_err(level, "mdi: %s%s: %s", name, func, bp);
		}
		break;
	default:
		/*
		 * Any other level: no destination prefix is applied, but
		 * the calling function is still reported like in every
		 * other arm.
		 */
		cmn_err(level, "mdi: %s%s: %s", name, func, bp);
		break;
	}
}
#endif	/* DEBUG */
49387c478bd9Sstevel@tonic-gate 
49397c478bd9Sstevel@tonic-gate void
49407c478bd9Sstevel@tonic-gate i_mdi_client_online(dev_info_t *ct_dip)
49417c478bd9Sstevel@tonic-gate {
49427c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
49437c478bd9Sstevel@tonic-gate 
49447c478bd9Sstevel@tonic-gate 	/*
49457c478bd9Sstevel@tonic-gate 	 * Client online notification. Mark client state as online
49467c478bd9Sstevel@tonic-gate 	 * restore our binding with dev_info node
49477c478bd9Sstevel@tonic-gate 	 */
49487c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(ct_dip);
49497c478bd9Sstevel@tonic-gate 	ASSERT(ct != NULL);
49507c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
49517c478bd9Sstevel@tonic-gate 	MDI_CLIENT_SET_ONLINE(ct);
49527c478bd9Sstevel@tonic-gate 	/* catch for any memory leaks */
49537c478bd9Sstevel@tonic-gate 	ASSERT((ct->ct_dip == NULL) || (ct->ct_dip == ct_dip));
49547c478bd9Sstevel@tonic-gate 	ct->ct_dip = ct_dip;
49557c478bd9Sstevel@tonic-gate 
49567c478bd9Sstevel@tonic-gate 	if (ct->ct_power_cnt == 0)
49577c478bd9Sstevel@tonic-gate 		(void) i_mdi_power_all_phci(ct);
49587c478bd9Sstevel@tonic-gate 
49594c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, ct_dip,
49604c06356bSdh142964 	    "i_mdi_pm_hold_client %p", (void *)ct));
49617c478bd9Sstevel@tonic-gate 	i_mdi_pm_hold_client(ct, 1);
49627c478bd9Sstevel@tonic-gate 
49637c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
49647c478bd9Sstevel@tonic-gate }
49657c478bd9Sstevel@tonic-gate 
49667c478bd9Sstevel@tonic-gate void
49677c478bd9Sstevel@tonic-gate i_mdi_phci_online(dev_info_t *ph_dip)
49687c478bd9Sstevel@tonic-gate {
49697c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
49707c478bd9Sstevel@tonic-gate 
49717c478bd9Sstevel@tonic-gate 	/* pHCI online notification. Mark state accordingly */
49727c478bd9Sstevel@tonic-gate 	ph = i_devi_get_phci(ph_dip);
49737c478bd9Sstevel@tonic-gate 	ASSERT(ph != NULL);
49747c478bd9Sstevel@tonic-gate 	MDI_PHCI_LOCK(ph);
49757c478bd9Sstevel@tonic-gate 	MDI_PHCI_SET_ONLINE(ph);
49767c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNLOCK(ph);
49777c478bd9Sstevel@tonic-gate }
49787c478bd9Sstevel@tonic-gate 
49797c478bd9Sstevel@tonic-gate /*
49807c478bd9Sstevel@tonic-gate  * mdi_devi_online():
49817c478bd9Sstevel@tonic-gate  * 		Online notification from NDI framework on pHCI/client
49827c478bd9Sstevel@tonic-gate  *		device online.
49837c478bd9Sstevel@tonic-gate  * Return Values:
49847c478bd9Sstevel@tonic-gate  *		NDI_SUCCESS
49857c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
49867c478bd9Sstevel@tonic-gate  */
49877c478bd9Sstevel@tonic-gate /*ARGSUSED*/
49887c478bd9Sstevel@tonic-gate int
49897c478bd9Sstevel@tonic-gate mdi_devi_online(dev_info_t *dip, uint_t flags)
49907c478bd9Sstevel@tonic-gate {
49917c478bd9Sstevel@tonic-gate 	if (MDI_PHCI(dip)) {
49927c478bd9Sstevel@tonic-gate 		i_mdi_phci_online(dip);
49937c478bd9Sstevel@tonic-gate 	}
49947c478bd9Sstevel@tonic-gate 
49957c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT(dip)) {
49967c478bd9Sstevel@tonic-gate 		i_mdi_client_online(dip);
49977c478bd9Sstevel@tonic-gate 	}
49987c478bd9Sstevel@tonic-gate 	return (NDI_SUCCESS);
49997c478bd9Sstevel@tonic-gate }
50007c478bd9Sstevel@tonic-gate 
50017c478bd9Sstevel@tonic-gate /*
50027c478bd9Sstevel@tonic-gate  * mdi_devi_offline():
50037c478bd9Sstevel@tonic-gate  * 		Offline notification from NDI framework on pHCI/Client device
50047c478bd9Sstevel@tonic-gate  *		offline.
50057c478bd9Sstevel@tonic-gate  *
50067c478bd9Sstevel@tonic-gate  * Return Values:
50077c478bd9Sstevel@tonic-gate  *		NDI_SUCCESS
50087c478bd9Sstevel@tonic-gate  *		NDI_FAILURE
50097c478bd9Sstevel@tonic-gate  */
50107c478bd9Sstevel@tonic-gate /*ARGSUSED*/
50117c478bd9Sstevel@tonic-gate int
50127c478bd9Sstevel@tonic-gate mdi_devi_offline(dev_info_t *dip, uint_t flags)
50137c478bd9Sstevel@tonic-gate {
50147c478bd9Sstevel@tonic-gate 	int		rv = NDI_SUCCESS;
50157c478bd9Sstevel@tonic-gate 
50167c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT(dip)) {
50177c478bd9Sstevel@tonic-gate 		rv = i_mdi_client_offline(dip, flags);
50187c478bd9Sstevel@tonic-gate 		if (rv != NDI_SUCCESS)
50197c478bd9Sstevel@tonic-gate 			return (rv);
50207c478bd9Sstevel@tonic-gate 	}
50217c478bd9Sstevel@tonic-gate 
50227c478bd9Sstevel@tonic-gate 	if (MDI_PHCI(dip)) {
50237c478bd9Sstevel@tonic-gate 		rv = i_mdi_phci_offline(dip, flags);
50245e3986cbScth 
50257c478bd9Sstevel@tonic-gate 		if ((rv != NDI_SUCCESS) && MDI_CLIENT(dip)) {
50267c478bd9Sstevel@tonic-gate 			/* set client back online */
50277c478bd9Sstevel@tonic-gate 			i_mdi_client_online(dip);
50287c478bd9Sstevel@tonic-gate 		}
50297c478bd9Sstevel@tonic-gate 	}
50307c478bd9Sstevel@tonic-gate 
50317c478bd9Sstevel@tonic-gate 	return (rv);
50327c478bd9Sstevel@tonic-gate }
50337c478bd9Sstevel@tonic-gate 
50347c478bd9Sstevel@tonic-gate /*ARGSUSED*/
50357c478bd9Sstevel@tonic-gate static int
50367c478bd9Sstevel@tonic-gate i_mdi_phci_offline(dev_info_t *dip, uint_t flags)
50377c478bd9Sstevel@tonic-gate {
50387c478bd9Sstevel@tonic-gate 	int		rv = NDI_SUCCESS;
50397c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
50407c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
50417c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*pip;
50427c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*next;
50437c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*failed_pip = NULL;
50447c478bd9Sstevel@tonic-gate 	dev_info_t	*cdip;
50457c478bd9Sstevel@tonic-gate 
50467c478bd9Sstevel@tonic-gate 	/*
50477c478bd9Sstevel@tonic-gate 	 * pHCI component offline notification
50487c478bd9Sstevel@tonic-gate 	 * Make sure that this pHCI instance is free to be offlined.
50497c478bd9Sstevel@tonic-gate 	 * If it is OK to proceed, Offline and remove all the child
50507c478bd9Sstevel@tonic-gate 	 * mdi_pathinfo nodes.  This process automatically offlines
50517c478bd9Sstevel@tonic-gate 	 * corresponding client devices, for which this pHCI provides
50527c478bd9Sstevel@tonic-gate 	 * critical services.
50537c478bd9Sstevel@tonic-gate 	 */
50547c478bd9Sstevel@tonic-gate 	ph = i_devi_get_phci(dip);
50554c06356bSdh142964 	MDI_DEBUG(2, (MDI_NOTE, dip,
50564c06356bSdh142964 	    "called %p %p", (void *)dip, (void *)ph));
50577c478bd9Sstevel@tonic-gate 	if (ph == NULL) {
50587c478bd9Sstevel@tonic-gate 		return (rv);
50597c478bd9Sstevel@tonic-gate 	}
50607c478bd9Sstevel@tonic-gate 
50617c478bd9Sstevel@tonic-gate 	MDI_PHCI_LOCK(ph);
50627c478bd9Sstevel@tonic-gate 
50637c478bd9Sstevel@tonic-gate 	if (MDI_PHCI_IS_OFFLINE(ph)) {
50644c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, dip,
50654c06356bSdh142964 		    "!pHCI already offlined: %p", (void *)dip));
50667c478bd9Sstevel@tonic-gate 		MDI_PHCI_UNLOCK(ph);
50677c478bd9Sstevel@tonic-gate 		return (NDI_SUCCESS);
50687c478bd9Sstevel@tonic-gate 	}
50697c478bd9Sstevel@tonic-gate 
50707c478bd9Sstevel@tonic-gate 	/*
50717c478bd9Sstevel@tonic-gate 	 * Check to see if the pHCI can be offlined
50727c478bd9Sstevel@tonic-gate 	 */
50737c478bd9Sstevel@tonic-gate 	if (ph->ph_unstable) {
50744c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, dip,
50754c06356bSdh142964 		    "!One or more target devices are in transient state. "
50764c06356bSdh142964 		    "This device can not be removed at this moment. "
50774c06356bSdh142964 		    "Please try again later."));
50787c478bd9Sstevel@tonic-gate 		MDI_PHCI_UNLOCK(ph);
50797c478bd9Sstevel@tonic-gate 		return (NDI_BUSY);
50807c478bd9Sstevel@tonic-gate 	}
50817c478bd9Sstevel@tonic-gate 
50827c478bd9Sstevel@tonic-gate 	pip = ph->ph_path_head;
50837c478bd9Sstevel@tonic-gate 	while (pip != NULL) {
50847c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
50857c478bd9Sstevel@tonic-gate 		next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
50865e3986cbScth 
50877c478bd9Sstevel@tonic-gate 		/*
50887c478bd9Sstevel@tonic-gate 		 * The mdi_pathinfo state is OK. Check the client state.
50897c478bd9Sstevel@tonic-gate 		 * If failover in progress fail the pHCI from offlining
50907c478bd9Sstevel@tonic-gate 		 */
50917c478bd9Sstevel@tonic-gate 		ct = MDI_PI(pip)->pi_client;
50927c478bd9Sstevel@tonic-gate 		i_mdi_client_lock(ct, pip);
50937c478bd9Sstevel@tonic-gate 		if ((MDI_CLIENT_IS_FAILOVER_IN_PROGRESS(ct)) ||
50947c478bd9Sstevel@tonic-gate 		    (ct->ct_unstable)) {
50957c478bd9Sstevel@tonic-gate 			/*
50967c478bd9Sstevel@tonic-gate 			 * Failover is in progress, Fail the DR
50977c478bd9Sstevel@tonic-gate 			 */
50984c06356bSdh142964 			MDI_DEBUG(1, (MDI_WARN, dip,
50994c06356bSdh142964 			    "!pHCI device is busy. "
51004c06356bSdh142964 			    "This device can not be removed at this moment. "
51014c06356bSdh142964 			    "Please try again later."));
51027c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
51035e3986cbScth 			i_mdi_client_unlock(ct);
51047c478bd9Sstevel@tonic-gate 			MDI_PHCI_UNLOCK(ph);
51057c478bd9Sstevel@tonic-gate 			return (NDI_BUSY);
51067c478bd9Sstevel@tonic-gate 		}
51077c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
51087c478bd9Sstevel@tonic-gate 
51097c478bd9Sstevel@tonic-gate 		/*
51107c478bd9Sstevel@tonic-gate 		 * Check to see of we are removing the last path of this
51117c478bd9Sstevel@tonic-gate 		 * client device...
51127c478bd9Sstevel@tonic-gate 		 */
51137c478bd9Sstevel@tonic-gate 		cdip = ct->ct_dip;
51147c478bd9Sstevel@tonic-gate 		if (cdip && (i_ddi_node_state(cdip) >= DS_INITIALIZED) &&
51157c478bd9Sstevel@tonic-gate 		    (i_mdi_client_compute_state(ct, ph) ==
51167c478bd9Sstevel@tonic-gate 		    MDI_CLIENT_STATE_FAILED)) {
51177c478bd9Sstevel@tonic-gate 			i_mdi_client_unlock(ct);
51187c478bd9Sstevel@tonic-gate 			MDI_PHCI_UNLOCK(ph);
51194c06356bSdh142964 			if (ndi_devi_offline(cdip,
51204c06356bSdh142964 			    NDI_DEVFS_CLEAN) != NDI_SUCCESS) {
51217c478bd9Sstevel@tonic-gate 				/*
51227c478bd9Sstevel@tonic-gate 				 * ndi_devi_offline() failed.
51237c478bd9Sstevel@tonic-gate 				 * This pHCI provides the critical path
51247c478bd9Sstevel@tonic-gate 				 * to one or more client devices.
51257c478bd9Sstevel@tonic-gate 				 * Return busy.
51267c478bd9Sstevel@tonic-gate 				 */
51277c478bd9Sstevel@tonic-gate 				MDI_PHCI_LOCK(ph);
51284c06356bSdh142964 				MDI_DEBUG(1, (MDI_WARN, dip,
51294c06356bSdh142964 				    "!pHCI device is busy. "
51304c06356bSdh142964 				    "This device can not be removed at this "
51314c06356bSdh142964 				    "moment. Please try again later."));
51327c478bd9Sstevel@tonic-gate 				failed_pip = pip;
51337c478bd9Sstevel@tonic-gate 				break;
51347c478bd9Sstevel@tonic-gate 			} else {
51357c478bd9Sstevel@tonic-gate 				MDI_PHCI_LOCK(ph);
51367c478bd9Sstevel@tonic-gate 				pip = next;
51377c478bd9Sstevel@tonic-gate 			}
51387c478bd9Sstevel@tonic-gate 		} else {
51397c478bd9Sstevel@tonic-gate 			i_mdi_client_unlock(ct);
51407c478bd9Sstevel@tonic-gate 			pip = next;
51417c478bd9Sstevel@tonic-gate 		}
51427c478bd9Sstevel@tonic-gate 	}
51437c478bd9Sstevel@tonic-gate 
51447c478bd9Sstevel@tonic-gate 	if (failed_pip) {
51457c478bd9Sstevel@tonic-gate 		pip = ph->ph_path_head;
51467c478bd9Sstevel@tonic-gate 		while (pip != failed_pip) {
51477c478bd9Sstevel@tonic-gate 			MDI_PI_LOCK(pip);
51487c478bd9Sstevel@tonic-gate 			next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
51497c478bd9Sstevel@tonic-gate 			ct = MDI_PI(pip)->pi_client;
51507c478bd9Sstevel@tonic-gate 			i_mdi_client_lock(ct, pip);
51517c478bd9Sstevel@tonic-gate 			cdip = ct->ct_dip;
51527c478bd9Sstevel@tonic-gate 			switch (MDI_CLIENT_STATE(ct)) {
51537c478bd9Sstevel@tonic-gate 			case MDI_CLIENT_STATE_OPTIMAL:
51547c478bd9Sstevel@tonic-gate 			case MDI_CLIENT_STATE_DEGRADED:
51557c478bd9Sstevel@tonic-gate 				if (cdip) {
51567c478bd9Sstevel@tonic-gate 					MDI_PI_UNLOCK(pip);
51577c478bd9Sstevel@tonic-gate 					i_mdi_client_unlock(ct);
51587c478bd9Sstevel@tonic-gate 					MDI_PHCI_UNLOCK(ph);
51597c478bd9Sstevel@tonic-gate 					(void) ndi_devi_online(cdip, 0);
51607c478bd9Sstevel@tonic-gate 					MDI_PHCI_LOCK(ph);
51617c478bd9Sstevel@tonic-gate 					pip = next;
51627c478bd9Sstevel@tonic-gate 					continue;
51637c478bd9Sstevel@tonic-gate 				}
51647c478bd9Sstevel@tonic-gate 				break;
51657c478bd9Sstevel@tonic-gate 
51667c478bd9Sstevel@tonic-gate 			case MDI_CLIENT_STATE_FAILED:
51677c478bd9Sstevel@tonic-gate 				if (cdip) {
51687c478bd9Sstevel@tonic-gate 					MDI_PI_UNLOCK(pip);
51697c478bd9Sstevel@tonic-gate 					i_mdi_client_unlock(ct);
51707c478bd9Sstevel@tonic-gate 					MDI_PHCI_UNLOCK(ph);
51714c06356bSdh142964 					(void) ndi_devi_offline(cdip,
51724c06356bSdh142964 						NDI_DEVFS_CLEAN);
51737c478bd9Sstevel@tonic-gate 					MDI_PHCI_LOCK(ph);
51747c478bd9Sstevel@tonic-gate 					pip = next;
51757c478bd9Sstevel@tonic-gate 					continue;
51767c478bd9Sstevel@tonic-gate 				}
51777c478bd9Sstevel@tonic-gate 				break;
51787c478bd9Sstevel@tonic-gate 			}
51797c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
51807c478bd9Sstevel@tonic-gate 			i_mdi_client_unlock(ct);
51817c478bd9Sstevel@tonic-gate 			pip = next;
51827c478bd9Sstevel@tonic-gate 		}
51837c478bd9Sstevel@tonic-gate 		MDI_PHCI_UNLOCK(ph);
51847c478bd9Sstevel@tonic-gate 		return (NDI_BUSY);
51857c478bd9Sstevel@tonic-gate 	}
51867c478bd9Sstevel@tonic-gate 
51877c478bd9Sstevel@tonic-gate 	/*
51887c478bd9Sstevel@tonic-gate 	 * Mark the pHCI as offline
51897c478bd9Sstevel@tonic-gate 	 */
51907c478bd9Sstevel@tonic-gate 	MDI_PHCI_SET_OFFLINE(ph);
51917c478bd9Sstevel@tonic-gate 
51927c478bd9Sstevel@tonic-gate 	/*
51937c478bd9Sstevel@tonic-gate 	 * Mark the child mdi_pathinfo nodes as transient
51947c478bd9Sstevel@tonic-gate 	 */
51957c478bd9Sstevel@tonic-gate 	pip = ph->ph_path_head;
51967c478bd9Sstevel@tonic-gate 	while (pip != NULL) {
51977c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
51987c478bd9Sstevel@tonic-gate 		next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
51997c478bd9Sstevel@tonic-gate 		MDI_PI_SET_OFFLINING(pip);
52007c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
52017c478bd9Sstevel@tonic-gate 		pip = next;
52027c478bd9Sstevel@tonic-gate 	}
52037c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNLOCK(ph);
52047c478bd9Sstevel@tonic-gate 	/*
52057c478bd9Sstevel@tonic-gate 	 * Give a chance for any pending commands to execute
52067c478bd9Sstevel@tonic-gate 	 */
52074c06356bSdh142964 	delay_random(5);
52087c478bd9Sstevel@tonic-gate 	MDI_PHCI_LOCK(ph);
52097c478bd9Sstevel@tonic-gate 	pip = ph->ph_path_head;
52107c478bd9Sstevel@tonic-gate 	while (pip != NULL) {
52117c478bd9Sstevel@tonic-gate 		next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
52127c478bd9Sstevel@tonic-gate 		(void) i_mdi_pi_offline(pip, flags);
52137c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
52147c478bd9Sstevel@tonic-gate 		ct = MDI_PI(pip)->pi_client;
52157c478bd9Sstevel@tonic-gate 		if (!MDI_PI_IS_OFFLINE(pip)) {
52164c06356bSdh142964 			MDI_DEBUG(1, (MDI_WARN, dip,
52174c06356bSdh142964 			    "!pHCI device is busy. "
52184c06356bSdh142964 			    "This device can not be removed at this moment. "
52194c06356bSdh142964 			    "Please try again later."));
52207c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
52217c478bd9Sstevel@tonic-gate 			MDI_PHCI_SET_ONLINE(ph);
52227c478bd9Sstevel@tonic-gate 			MDI_PHCI_UNLOCK(ph);
52237c478bd9Sstevel@tonic-gate 			return (NDI_BUSY);
52247c478bd9Sstevel@tonic-gate 		}
52257c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
52267c478bd9Sstevel@tonic-gate 		pip = next;
52277c478bd9Sstevel@tonic-gate 	}
52287c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNLOCK(ph);
52297c478bd9Sstevel@tonic-gate 
52307c478bd9Sstevel@tonic-gate 	return (rv);
52317c478bd9Sstevel@tonic-gate }
52327c478bd9Sstevel@tonic-gate 
523325e8c5aaSvikram void
523425e8c5aaSvikram mdi_phci_mark_retiring(dev_info_t *dip, char **cons_array)
523525e8c5aaSvikram {
523625e8c5aaSvikram 	mdi_phci_t	*ph;
523725e8c5aaSvikram 	mdi_client_t	*ct;
523825e8c5aaSvikram 	mdi_pathinfo_t	*pip;
523925e8c5aaSvikram 	mdi_pathinfo_t	*next;
524025e8c5aaSvikram 	dev_info_t	*cdip;
524125e8c5aaSvikram 
524225e8c5aaSvikram 	if (!MDI_PHCI(dip))
524325e8c5aaSvikram 		return;
524425e8c5aaSvikram 
524525e8c5aaSvikram 	ph = i_devi_get_phci(dip);
524625e8c5aaSvikram 	if (ph == NULL) {
524725e8c5aaSvikram 		return;
524825e8c5aaSvikram 	}
524925e8c5aaSvikram 
525025e8c5aaSvikram 	MDI_PHCI_LOCK(ph);
525125e8c5aaSvikram 
525225e8c5aaSvikram 	if (MDI_PHCI_IS_OFFLINE(ph)) {
525325e8c5aaSvikram 		/* has no last path */
525425e8c5aaSvikram 		MDI_PHCI_UNLOCK(ph);
525525e8c5aaSvikram 		return;
525625e8c5aaSvikram 	}
525725e8c5aaSvikram 
525825e8c5aaSvikram 	pip = ph->ph_path_head;
525925e8c5aaSvikram 	while (pip != NULL) {
526025e8c5aaSvikram 		MDI_PI_LOCK(pip);
526125e8c5aaSvikram 		next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
526225e8c5aaSvikram 
526325e8c5aaSvikram 		ct = MDI_PI(pip)->pi_client;
526425e8c5aaSvikram 		i_mdi_client_lock(ct, pip);
526525e8c5aaSvikram 		MDI_PI_UNLOCK(pip);
526625e8c5aaSvikram 
526725e8c5aaSvikram 		cdip = ct->ct_dip;
526825e8c5aaSvikram 		if (cdip && (i_ddi_node_state(cdip) >= DS_INITIALIZED) &&
526925e8c5aaSvikram 		    (i_mdi_client_compute_state(ct, ph) ==
527025e8c5aaSvikram 		    MDI_CLIENT_STATE_FAILED)) {
527125e8c5aaSvikram 			/* Last path. Mark client dip as retiring */
527225e8c5aaSvikram 			i_mdi_client_unlock(ct);
527325e8c5aaSvikram 			MDI_PHCI_UNLOCK(ph);
527425e8c5aaSvikram 			(void) e_ddi_mark_retiring(cdip, cons_array);
527525e8c5aaSvikram 			MDI_PHCI_LOCK(ph);
527625e8c5aaSvikram 			pip = next;
527725e8c5aaSvikram 		} else {
527825e8c5aaSvikram 			i_mdi_client_unlock(ct);
527925e8c5aaSvikram 			pip = next;
528025e8c5aaSvikram 		}
528125e8c5aaSvikram 	}
528225e8c5aaSvikram 
528325e8c5aaSvikram 	MDI_PHCI_UNLOCK(ph);
528425e8c5aaSvikram 
528525e8c5aaSvikram 	return;
528625e8c5aaSvikram }
528725e8c5aaSvikram 
528825e8c5aaSvikram void
528925e8c5aaSvikram mdi_phci_retire_notify(dev_info_t *dip, int *constraint)
529025e8c5aaSvikram {
529125e8c5aaSvikram 	mdi_phci_t	*ph;
529225e8c5aaSvikram 	mdi_client_t	*ct;
529325e8c5aaSvikram 	mdi_pathinfo_t	*pip;
529425e8c5aaSvikram 	mdi_pathinfo_t	*next;
529525e8c5aaSvikram 	dev_info_t	*cdip;
529625e8c5aaSvikram 
529725e8c5aaSvikram 	if (!MDI_PHCI(dip))
529825e8c5aaSvikram 		return;
529925e8c5aaSvikram 
530025e8c5aaSvikram 	ph = i_devi_get_phci(dip);
530125e8c5aaSvikram 	if (ph == NULL)
530225e8c5aaSvikram 		return;
530325e8c5aaSvikram 
530425e8c5aaSvikram 	MDI_PHCI_LOCK(ph);
530525e8c5aaSvikram 
530625e8c5aaSvikram 	if (MDI_PHCI_IS_OFFLINE(ph)) {
530725e8c5aaSvikram 		MDI_PHCI_UNLOCK(ph);
530825e8c5aaSvikram 		/* not last path */
530925e8c5aaSvikram 		return;
531025e8c5aaSvikram 	}
531125e8c5aaSvikram 
531225e8c5aaSvikram 	if (ph->ph_unstable) {
531325e8c5aaSvikram 		MDI_PHCI_UNLOCK(ph);
531425e8c5aaSvikram 		/* can't check for constraints */
531525e8c5aaSvikram 		*constraint = 0;
531625e8c5aaSvikram 		return;
531725e8c5aaSvikram 	}
531825e8c5aaSvikram 
531925e8c5aaSvikram 	pip = ph->ph_path_head;
532025e8c5aaSvikram 	while (pip != NULL) {
532125e8c5aaSvikram 		MDI_PI_LOCK(pip);
532225e8c5aaSvikram 		next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
532325e8c5aaSvikram 
532425e8c5aaSvikram 		/*
532525e8c5aaSvikram 		 * The mdi_pathinfo state is OK. Check the client state.
532625e8c5aaSvikram 		 * If failover in progress fail the pHCI from offlining
532725e8c5aaSvikram 		 */
532825e8c5aaSvikram 		ct = MDI_PI(pip)->pi_client;
532925e8c5aaSvikram 		i_mdi_client_lock(ct, pip);
533025e8c5aaSvikram 		if ((MDI_CLIENT_IS_FAILOVER_IN_PROGRESS(ct)) ||
533125e8c5aaSvikram 		    (ct->ct_unstable)) {
533225e8c5aaSvikram 			/*
533325e8c5aaSvikram 			 * Failover is in progress, can't check for constraints
533425e8c5aaSvikram 			 */
533525e8c5aaSvikram 			MDI_PI_UNLOCK(pip);
533625e8c5aaSvikram 			i_mdi_client_unlock(ct);
533725e8c5aaSvikram 			MDI_PHCI_UNLOCK(ph);
533825e8c5aaSvikram 			*constraint = 0;
533925e8c5aaSvikram 			return;
534025e8c5aaSvikram 		}
534125e8c5aaSvikram 		MDI_PI_UNLOCK(pip);
534225e8c5aaSvikram 
534325e8c5aaSvikram 		/*
534425e8c5aaSvikram 		 * Check to see of we are retiring the last path of this
534525e8c5aaSvikram 		 * client device...
534625e8c5aaSvikram 		 */
534725e8c5aaSvikram 		cdip = ct->ct_dip;
534825e8c5aaSvikram 		if (cdip && (i_ddi_node_state(cdip) >= DS_INITIALIZED) &&
534925e8c5aaSvikram 		    (i_mdi_client_compute_state(ct, ph) ==
535025e8c5aaSvikram 		    MDI_CLIENT_STATE_FAILED)) {
535125e8c5aaSvikram 			i_mdi_client_unlock(ct);
535225e8c5aaSvikram 			MDI_PHCI_UNLOCK(ph);
535325e8c5aaSvikram 			(void) e_ddi_retire_notify(cdip, constraint);
535425e8c5aaSvikram 			MDI_PHCI_LOCK(ph);
535525e8c5aaSvikram 			pip = next;
535625e8c5aaSvikram 		} else {
535725e8c5aaSvikram 			i_mdi_client_unlock(ct);
535825e8c5aaSvikram 			pip = next;
535925e8c5aaSvikram 		}
536025e8c5aaSvikram 	}
536125e8c5aaSvikram 
536225e8c5aaSvikram 	MDI_PHCI_UNLOCK(ph);
536325e8c5aaSvikram 
536425e8c5aaSvikram 	return;
536525e8c5aaSvikram }
536625e8c5aaSvikram 
536725e8c5aaSvikram /*
53684c06356bSdh142964  * offline the path(s) hanging off the pHCI. If the
536925e8c5aaSvikram  * last path to any client, check that constraints
537025e8c5aaSvikram  * have been applied.
537125e8c5aaSvikram  */
537225e8c5aaSvikram void
537325e8c5aaSvikram mdi_phci_retire_finalize(dev_info_t *dip, int phci_only)
537425e8c5aaSvikram {
537525e8c5aaSvikram 	mdi_phci_t	*ph;
537625e8c5aaSvikram 	mdi_client_t	*ct;
537725e8c5aaSvikram 	mdi_pathinfo_t	*pip;
537825e8c5aaSvikram 	mdi_pathinfo_t	*next;
537925e8c5aaSvikram 	dev_info_t	*cdip;
538025e8c5aaSvikram 	int		unstable = 0;
538125e8c5aaSvikram 	int		constraint;
538225e8c5aaSvikram 
538325e8c5aaSvikram 	if (!MDI_PHCI(dip))
538425e8c5aaSvikram 		return;
538525e8c5aaSvikram 
538625e8c5aaSvikram 	ph = i_devi_get_phci(dip);
538725e8c5aaSvikram 	if (ph == NULL) {
538825e8c5aaSvikram 		/* no last path and no pips */
538925e8c5aaSvikram 		return;
539025e8c5aaSvikram 	}
539125e8c5aaSvikram 
539225e8c5aaSvikram 	MDI_PHCI_LOCK(ph);
539325e8c5aaSvikram 
539425e8c5aaSvikram 	if (MDI_PHCI_IS_OFFLINE(ph)) {
539525e8c5aaSvikram 		MDI_PHCI_UNLOCK(ph);
539625e8c5aaSvikram 		/* no last path and no pips */
539725e8c5aaSvikram 		return;
539825e8c5aaSvikram 	}
539925e8c5aaSvikram 
540025e8c5aaSvikram 	/*
540125e8c5aaSvikram 	 * Check to see if the pHCI can be offlined
540225e8c5aaSvikram 	 */
540325e8c5aaSvikram 	if (ph->ph_unstable) {
540425e8c5aaSvikram 		unstable = 1;
540525e8c5aaSvikram 	}
540625e8c5aaSvikram 
540725e8c5aaSvikram 	pip = ph->ph_path_head;
540825e8c5aaSvikram 	while (pip != NULL) {
540925e8c5aaSvikram 		MDI_PI_LOCK(pip);
541025e8c5aaSvikram 		next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
541125e8c5aaSvikram 
541225e8c5aaSvikram 		/*
541325e8c5aaSvikram 		 * if failover in progress fail the pHCI from offlining
541425e8c5aaSvikram 		 */
541525e8c5aaSvikram 		ct = MDI_PI(pip)->pi_client;
541625e8c5aaSvikram 		i_mdi_client_lock(ct, pip);
541725e8c5aaSvikram 		if ((MDI_CLIENT_IS_FAILOVER_IN_PROGRESS(ct)) ||
541825e8c5aaSvikram 		    (ct->ct_unstable)) {
541925e8c5aaSvikram 			unstable = 1;
542025e8c5aaSvikram 		}
542125e8c5aaSvikram 		MDI_PI_UNLOCK(pip);
542225e8c5aaSvikram 
542325e8c5aaSvikram 		/*
542425e8c5aaSvikram 		 * Check to see of we are removing the last path of this
542525e8c5aaSvikram 		 * client device...
542625e8c5aaSvikram 		 */
542725e8c5aaSvikram 		cdip = ct->ct_dip;
542825e8c5aaSvikram 		if (!phci_only && cdip &&
542925e8c5aaSvikram 		    (i_ddi_node_state(cdip) >= DS_INITIALIZED) &&
543025e8c5aaSvikram 		    (i_mdi_client_compute_state(ct, ph) ==
543125e8c5aaSvikram 		    MDI_CLIENT_STATE_FAILED)) {
543225e8c5aaSvikram 			i_mdi_client_unlock(ct);
543325e8c5aaSvikram 			MDI_PHCI_UNLOCK(ph);
543425e8c5aaSvikram 			/*
543525e8c5aaSvikram 			 * We don't retire clients we just retire the
543625e8c5aaSvikram 			 * path to a client. If it is the last path
543725e8c5aaSvikram 			 * to a client, constraints are checked and
543825e8c5aaSvikram 			 * if we pass the last path is offlined. MPXIO will
543925e8c5aaSvikram 			 * then fail all I/Os to the client. Since we don't
544025e8c5aaSvikram 			 * want to retire the client on a path error
544125e8c5aaSvikram 			 * set constraint = 0 so that the client dip
544225e8c5aaSvikram 			 * is not retired.
544325e8c5aaSvikram 			 */
544425e8c5aaSvikram 			constraint = 0;
544525e8c5aaSvikram 			(void) e_ddi_retire_finalize(cdip, &constraint);
544625e8c5aaSvikram 			MDI_PHCI_LOCK(ph);
544725e8c5aaSvikram 			pip = next;
544825e8c5aaSvikram 		} else {
544925e8c5aaSvikram 			i_mdi_client_unlock(ct);
545025e8c5aaSvikram 			pip = next;
545125e8c5aaSvikram 		}
545225e8c5aaSvikram 	}
545325e8c5aaSvikram 
545425e8c5aaSvikram 	/*
545525e8c5aaSvikram 	 * Cannot offline pip(s)
545625e8c5aaSvikram 	 */
545725e8c5aaSvikram 	if (unstable) {
54584c06356bSdh142964 		cmn_err(CE_WARN, "%s%d: mdi_phci_retire_finalize: "
54594c06356bSdh142964 		    "pHCI in transient state, cannot retire",
54604c06356bSdh142964 		    ddi_driver_name(dip), ddi_get_instance(dip));
546125e8c5aaSvikram 		MDI_PHCI_UNLOCK(ph);
546225e8c5aaSvikram 		return;
546325e8c5aaSvikram 	}
546425e8c5aaSvikram 
546525e8c5aaSvikram 	/*
546625e8c5aaSvikram 	 * Mark the pHCI as offline
546725e8c5aaSvikram 	 */
546825e8c5aaSvikram 	MDI_PHCI_SET_OFFLINE(ph);
546925e8c5aaSvikram 
547025e8c5aaSvikram 	/*
547125e8c5aaSvikram 	 * Mark the child mdi_pathinfo nodes as transient
547225e8c5aaSvikram 	 */
547325e8c5aaSvikram 	pip = ph->ph_path_head;
547425e8c5aaSvikram 	while (pip != NULL) {
547525e8c5aaSvikram 		MDI_PI_LOCK(pip);
547625e8c5aaSvikram 		next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
547725e8c5aaSvikram 		MDI_PI_SET_OFFLINING(pip);
547825e8c5aaSvikram 		MDI_PI_UNLOCK(pip);
547925e8c5aaSvikram 		pip = next;
548025e8c5aaSvikram 	}
548125e8c5aaSvikram 	MDI_PHCI_UNLOCK(ph);
548225e8c5aaSvikram 	/*
548325e8c5aaSvikram 	 * Give a chance for any pending commands to execute
548425e8c5aaSvikram 	 */
54854c06356bSdh142964 	delay_random(5);
548625e8c5aaSvikram 	MDI_PHCI_LOCK(ph);
548725e8c5aaSvikram 	pip = ph->ph_path_head;
548825e8c5aaSvikram 	while (pip != NULL) {
548925e8c5aaSvikram 		next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
549025e8c5aaSvikram 		(void) i_mdi_pi_offline(pip, 0);
549125e8c5aaSvikram 		MDI_PI_LOCK(pip);
549225e8c5aaSvikram 		ct = MDI_PI(pip)->pi_client;
549325e8c5aaSvikram 		if (!MDI_PI_IS_OFFLINE(pip)) {
54944c06356bSdh142964 			cmn_err(CE_WARN, "mdi_phci_retire_finalize: "
54954c06356bSdh142964 			    "path %d %s busy, cannot offline",
54964c06356bSdh142964 			    mdi_pi_get_path_instance(pip),
54974c06356bSdh142964 			    mdi_pi_spathname(pip));
549825e8c5aaSvikram 			MDI_PI_UNLOCK(pip);
549925e8c5aaSvikram 			MDI_PHCI_SET_ONLINE(ph);
550025e8c5aaSvikram 			MDI_PHCI_UNLOCK(ph);
550125e8c5aaSvikram 			return;
550225e8c5aaSvikram 		}
550325e8c5aaSvikram 		MDI_PI_UNLOCK(pip);
550425e8c5aaSvikram 		pip = next;
550525e8c5aaSvikram 	}
550625e8c5aaSvikram 	MDI_PHCI_UNLOCK(ph);
550725e8c5aaSvikram 
550825e8c5aaSvikram 	return;
550925e8c5aaSvikram }
551025e8c5aaSvikram 
551125e8c5aaSvikram void
551225e8c5aaSvikram mdi_phci_unretire(dev_info_t *dip)
551325e8c5aaSvikram {
551425e8c5aaSvikram 	ASSERT(MDI_PHCI(dip));
551525e8c5aaSvikram 
551625e8c5aaSvikram 	/*
551725e8c5aaSvikram 	 * Online the phci
551825e8c5aaSvikram 	 */
551925e8c5aaSvikram 	i_mdi_phci_online(dip);
552025e8c5aaSvikram }
552125e8c5aaSvikram 
55227c478bd9Sstevel@tonic-gate /*ARGSUSED*/
55237c478bd9Sstevel@tonic-gate static int
55247c478bd9Sstevel@tonic-gate i_mdi_client_offline(dev_info_t *dip, uint_t flags)
55257c478bd9Sstevel@tonic-gate {
55267c478bd9Sstevel@tonic-gate 	int		rv = NDI_SUCCESS;
55277c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
55287c478bd9Sstevel@tonic-gate 
55297c478bd9Sstevel@tonic-gate 	/*
55307c478bd9Sstevel@tonic-gate 	 * Client component to go offline.  Make sure that we are
55317c478bd9Sstevel@tonic-gate 	 * not in failing over state and update client state
55327c478bd9Sstevel@tonic-gate 	 * accordingly
55337c478bd9Sstevel@tonic-gate 	 */
55347c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(dip);
55354c06356bSdh142964 	MDI_DEBUG(2, (MDI_NOTE, dip,
55364c06356bSdh142964 	    "called %p %p", (void *)dip, (void *)ct));
55377c478bd9Sstevel@tonic-gate 	if (ct != NULL) {
55387c478bd9Sstevel@tonic-gate 		MDI_CLIENT_LOCK(ct);
55397c478bd9Sstevel@tonic-gate 		if (ct->ct_unstable) {
55407c478bd9Sstevel@tonic-gate 			/*
55417c478bd9Sstevel@tonic-gate 			 * One or more paths are in transient state,
55427c478bd9Sstevel@tonic-gate 			 * Dont allow offline of a client device
55437c478bd9Sstevel@tonic-gate 			 */
55444c06356bSdh142964 			MDI_DEBUG(1, (MDI_WARN, dip,
55454c06356bSdh142964 			    "!One or more paths to "
55464c06356bSdh142964 			    "this device are in transient state. "
55474c06356bSdh142964 			    "This device can not be removed at this moment. "
55487c478bd9Sstevel@tonic-gate 			    "Please try again later."));
55497c478bd9Sstevel@tonic-gate 			MDI_CLIENT_UNLOCK(ct);
55507c478bd9Sstevel@tonic-gate 			return (NDI_BUSY);
55517c478bd9Sstevel@tonic-gate 		}
55527c478bd9Sstevel@tonic-gate 		if (MDI_CLIENT_IS_FAILOVER_IN_PROGRESS(ct)) {
55537c478bd9Sstevel@tonic-gate 			/*
55547c478bd9Sstevel@tonic-gate 			 * Failover is in progress, Dont allow DR of
55557c478bd9Sstevel@tonic-gate 			 * a client device
55567c478bd9Sstevel@tonic-gate 			 */
55574c06356bSdh142964 			MDI_DEBUG(1, (MDI_WARN, dip,
55584c06356bSdh142964 			    "!Client device is Busy. "
55594c06356bSdh142964 			    "This device can not be removed at this moment. "
55604c06356bSdh142964 			    "Please try again later."));
55617c478bd9Sstevel@tonic-gate 			MDI_CLIENT_UNLOCK(ct);
55627c478bd9Sstevel@tonic-gate 			return (NDI_BUSY);
55637c478bd9Sstevel@tonic-gate 		}
55647c478bd9Sstevel@tonic-gate 		MDI_CLIENT_SET_OFFLINE(ct);
55657c478bd9Sstevel@tonic-gate 
55667c478bd9Sstevel@tonic-gate 		/*
55677c478bd9Sstevel@tonic-gate 		 * Unbind our relationship with the dev_info node
55687c478bd9Sstevel@tonic-gate 		 */
55697c478bd9Sstevel@tonic-gate 		if (flags & NDI_DEVI_REMOVE) {
55707c478bd9Sstevel@tonic-gate 			ct->ct_dip = NULL;
55717c478bd9Sstevel@tonic-gate 		}
55727c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
55737c478bd9Sstevel@tonic-gate 	}
55747c478bd9Sstevel@tonic-gate 	return (rv);
55757c478bd9Sstevel@tonic-gate }
55767c478bd9Sstevel@tonic-gate 
55777c478bd9Sstevel@tonic-gate /*
55787c478bd9Sstevel@tonic-gate  * mdi_pre_attach():
55797c478bd9Sstevel@tonic-gate  *		Pre attach() notification handler
55807c478bd9Sstevel@tonic-gate  */
55817c478bd9Sstevel@tonic-gate /*ARGSUSED*/
55827c478bd9Sstevel@tonic-gate int
55837c478bd9Sstevel@tonic-gate mdi_pre_attach(dev_info_t *dip, ddi_attach_cmd_t cmd)
55847c478bd9Sstevel@tonic-gate {
55857c478bd9Sstevel@tonic-gate 	/* don't support old DDI_PM_RESUME */
55867c478bd9Sstevel@tonic-gate 	if ((DEVI(dip)->devi_mdi_component != MDI_COMPONENT_NONE) &&
55877c478bd9Sstevel@tonic-gate 	    (cmd == DDI_PM_RESUME))
55887c478bd9Sstevel@tonic-gate 		return (DDI_FAILURE);
55897c478bd9Sstevel@tonic-gate 
55907c478bd9Sstevel@tonic-gate 	return (DDI_SUCCESS);
55917c478bd9Sstevel@tonic-gate }
55927c478bd9Sstevel@tonic-gate 
55937c478bd9Sstevel@tonic-gate /*
55947c478bd9Sstevel@tonic-gate  * mdi_post_attach():
55957c478bd9Sstevel@tonic-gate  *		Post attach() notification handler
55967c478bd9Sstevel@tonic-gate  */
55977c478bd9Sstevel@tonic-gate /*ARGSUSED*/
55987c478bd9Sstevel@tonic-gate void
55997c478bd9Sstevel@tonic-gate mdi_post_attach(dev_info_t *dip, ddi_attach_cmd_t cmd, int error)
56007c478bd9Sstevel@tonic-gate {
56017c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
56027c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
560337fbbce5Scth 	mdi_vhci_t	*vh;
56047c478bd9Sstevel@tonic-gate 
56057c478bd9Sstevel@tonic-gate 	if (MDI_PHCI(dip)) {
56067c478bd9Sstevel@tonic-gate 		ph = i_devi_get_phci(dip);
56077c478bd9Sstevel@tonic-gate 		ASSERT(ph != NULL);
56087c478bd9Sstevel@tonic-gate 
56097c478bd9Sstevel@tonic-gate 		MDI_PHCI_LOCK(ph);
56107c478bd9Sstevel@tonic-gate 		switch (cmd) {
56117c478bd9Sstevel@tonic-gate 		case DDI_ATTACH:
56124c06356bSdh142964 			MDI_DEBUG(2, (MDI_NOTE, dip,
56134c06356bSdh142964 			    "phci post_attach called %p", (void *)ph));
56147c478bd9Sstevel@tonic-gate 			if (error == DDI_SUCCESS) {
56157c478bd9Sstevel@tonic-gate 				MDI_PHCI_SET_ATTACH(ph);
56167c478bd9Sstevel@tonic-gate 			} else {
56174c06356bSdh142964 				MDI_DEBUG(1, (MDI_NOTE, dip,
56184c06356bSdh142964 				    "!pHCI post_attach failed: error %d",
56197c478bd9Sstevel@tonic-gate 				    error));
56207c478bd9Sstevel@tonic-gate 				MDI_PHCI_SET_DETACH(ph);
56217c478bd9Sstevel@tonic-gate 			}
56227c478bd9Sstevel@tonic-gate 			break;
56237c478bd9Sstevel@tonic-gate 
56247c478bd9Sstevel@tonic-gate 		case DDI_RESUME:
56254c06356bSdh142964 			MDI_DEBUG(2, (MDI_NOTE, dip,
56264c06356bSdh142964 			    "pHCI post_resume: called %p", (void *)ph));
56277c478bd9Sstevel@tonic-gate 			if (error == DDI_SUCCESS) {
56287c478bd9Sstevel@tonic-gate 				MDI_PHCI_SET_RESUME(ph);
56297c478bd9Sstevel@tonic-gate 			} else {
56304c06356bSdh142964 				MDI_DEBUG(1, (MDI_NOTE, dip,
56314c06356bSdh142964 				    "!pHCI post_resume failed: error %d",
56327c478bd9Sstevel@tonic-gate 				    error));
56337c478bd9Sstevel@tonic-gate 				MDI_PHCI_SET_SUSPEND(ph);
56347c478bd9Sstevel@tonic-gate 			}
56357c478bd9Sstevel@tonic-gate 			break;
56367c478bd9Sstevel@tonic-gate 		}
56377c478bd9Sstevel@tonic-gate 		MDI_PHCI_UNLOCK(ph);
56387c478bd9Sstevel@tonic-gate 	}
56397c478bd9Sstevel@tonic-gate 
56407c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT(dip)) {
56417c478bd9Sstevel@tonic-gate 		ct = i_devi_get_client(dip);
56427c478bd9Sstevel@tonic-gate 		ASSERT(ct != NULL);
56437c478bd9Sstevel@tonic-gate 
56447c478bd9Sstevel@tonic-gate 		MDI_CLIENT_LOCK(ct);
56457c478bd9Sstevel@tonic-gate 		switch (cmd) {
56467c478bd9Sstevel@tonic-gate 		case DDI_ATTACH:
56474c06356bSdh142964 			MDI_DEBUG(2, (MDI_NOTE, dip,
56484c06356bSdh142964 			    "client post_attach called %p", (void *)ct));
56497c478bd9Sstevel@tonic-gate 			if (error != DDI_SUCCESS) {
56504c06356bSdh142964 				MDI_DEBUG(1, (MDI_NOTE, dip,
56514c06356bSdh142964 				    "!client post_attach failed: error %d",
56527c478bd9Sstevel@tonic-gate 				    error));
56537c478bd9Sstevel@tonic-gate 				MDI_CLIENT_SET_DETACH(ct);
56544c06356bSdh142964 				MDI_DEBUG(4, (MDI_WARN, dip,
56554c06356bSdh142964 				    "i_mdi_pm_reset_client"));
56567c478bd9Sstevel@tonic-gate 				i_mdi_pm_reset_client(ct);
56577c478bd9Sstevel@tonic-gate 				break;
56587c478bd9Sstevel@tonic-gate 			}
56597c478bd9Sstevel@tonic-gate 
56607c478bd9Sstevel@tonic-gate 			/*
566137fbbce5Scth 			 * Client device has successfully attached, inform
566237fbbce5Scth 			 * the vhci.
56637c478bd9Sstevel@tonic-gate 			 */
566437fbbce5Scth 			vh = ct->ct_vhci;
566537fbbce5Scth 			if (vh->vh_ops->vo_client_attached)
566637fbbce5Scth 				(*vh->vh_ops->vo_client_attached)(dip);
566737fbbce5Scth 
56687c478bd9Sstevel@tonic-gate 			MDI_CLIENT_SET_ATTACH(ct);
56697c478bd9Sstevel@tonic-gate 			break;
56707c478bd9Sstevel@tonic-gate 
56717c478bd9Sstevel@tonic-gate 		case DDI_RESUME:
56724c06356bSdh142964 			MDI_DEBUG(2, (MDI_NOTE, dip,
56734c06356bSdh142964 			    "client post_attach: called %p", (void *)ct));
56747c478bd9Sstevel@tonic-gate 			if (error == DDI_SUCCESS) {
56757c478bd9Sstevel@tonic-gate 				MDI_CLIENT_SET_RESUME(ct);
56767c478bd9Sstevel@tonic-gate 			} else {
56774c06356bSdh142964 				MDI_DEBUG(1, (MDI_NOTE, dip,
56784c06356bSdh142964 				    "!client post_resume failed: error %d",
56797c478bd9Sstevel@tonic-gate 				    error));
56807c478bd9Sstevel@tonic-gate 				MDI_CLIENT_SET_SUSPEND(ct);
56817c478bd9Sstevel@tonic-gate 			}
56827c478bd9Sstevel@tonic-gate 			break;
56837c478bd9Sstevel@tonic-gate 		}
56847c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
56857c478bd9Sstevel@tonic-gate 	}
56867c478bd9Sstevel@tonic-gate }
56877c478bd9Sstevel@tonic-gate 
56887c478bd9Sstevel@tonic-gate /*
56897c478bd9Sstevel@tonic-gate  * mdi_pre_detach():
56907c478bd9Sstevel@tonic-gate  *		Pre detach notification handler
56917c478bd9Sstevel@tonic-gate  */
56927c478bd9Sstevel@tonic-gate /*ARGSUSED*/
56937c478bd9Sstevel@tonic-gate int
56947c478bd9Sstevel@tonic-gate mdi_pre_detach(dev_info_t *dip, ddi_detach_cmd_t cmd)
56957c478bd9Sstevel@tonic-gate {
56967c478bd9Sstevel@tonic-gate 	int rv = DDI_SUCCESS;
56977c478bd9Sstevel@tonic-gate 
56987c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT(dip)) {
56997c478bd9Sstevel@tonic-gate 		(void) i_mdi_client_pre_detach(dip, cmd);
57007c478bd9Sstevel@tonic-gate 	}
57017c478bd9Sstevel@tonic-gate 
57027c478bd9Sstevel@tonic-gate 	if (MDI_PHCI(dip)) {
57037c478bd9Sstevel@tonic-gate 		rv = i_mdi_phci_pre_detach(dip, cmd);
57047c478bd9Sstevel@tonic-gate 	}
57057c478bd9Sstevel@tonic-gate 
57067c478bd9Sstevel@tonic-gate 	return (rv);
57077c478bd9Sstevel@tonic-gate }
57087c478bd9Sstevel@tonic-gate 
57097c478bd9Sstevel@tonic-gate /*ARGSUSED*/
57107c478bd9Sstevel@tonic-gate static int
57117c478bd9Sstevel@tonic-gate i_mdi_phci_pre_detach(dev_info_t *dip, ddi_detach_cmd_t cmd)
57127c478bd9Sstevel@tonic-gate {
57137c478bd9Sstevel@tonic-gate 	int		rv = DDI_SUCCESS;
57147c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
57157c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
57167c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*pip;
57177c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*failed_pip = NULL;
57187c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*next;
57197c478bd9Sstevel@tonic-gate 
57207c478bd9Sstevel@tonic-gate 	ph = i_devi_get_phci(dip);
57217c478bd9Sstevel@tonic-gate 	if (ph == NULL) {
57227c478bd9Sstevel@tonic-gate 		return (rv);
57237c478bd9Sstevel@tonic-gate 	}
57247c478bd9Sstevel@tonic-gate 
57257c478bd9Sstevel@tonic-gate 	MDI_PHCI_LOCK(ph);
57267c478bd9Sstevel@tonic-gate 	switch (cmd) {
57277c478bd9Sstevel@tonic-gate 	case DDI_DETACH:
57284c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, dip,
57294c06356bSdh142964 		    "pHCI pre_detach: called %p", (void *)ph));
57307c478bd9Sstevel@tonic-gate 		if (!MDI_PHCI_IS_OFFLINE(ph)) {
57317c478bd9Sstevel@tonic-gate 			/*
57327c478bd9Sstevel@tonic-gate 			 * mdi_pathinfo nodes are still attached to
57337c478bd9Sstevel@tonic-gate 			 * this pHCI. Fail the detach for this pHCI.
57347c478bd9Sstevel@tonic-gate 			 */
57354c06356bSdh142964 			MDI_DEBUG(2, (MDI_WARN, dip,
57364c06356bSdh142964 			    "pHCI pre_detach: paths are still attached %p",
57374c06356bSdh142964 			    (void *)ph));
57387c478bd9Sstevel@tonic-gate 			rv = DDI_FAILURE;
57397c478bd9Sstevel@tonic-gate 			break;
57407c478bd9Sstevel@tonic-gate 		}
57417c478bd9Sstevel@tonic-gate 		MDI_PHCI_SET_DETACH(ph);
57427c478bd9Sstevel@tonic-gate 		break;
57437c478bd9Sstevel@tonic-gate 
57447c478bd9Sstevel@tonic-gate 	case DDI_SUSPEND:
57457c478bd9Sstevel@tonic-gate 		/*
57467c478bd9Sstevel@tonic-gate 		 * pHCI is getting suspended.  Since mpxio client
57477c478bd9Sstevel@tonic-gate 		 * devices may not be suspended at this point, to avoid
57487c478bd9Sstevel@tonic-gate 		 * a potential stack overflow, it is important to suspend
57497c478bd9Sstevel@tonic-gate 		 * client devices before pHCI can be suspended.
57507c478bd9Sstevel@tonic-gate 		 */
57517c478bd9Sstevel@tonic-gate 
57524c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, dip,
57534c06356bSdh142964 		    "pHCI pre_suspend: called %p", (void *)ph));
57547c478bd9Sstevel@tonic-gate 		/*
57557c478bd9Sstevel@tonic-gate 		 * Suspend all the client devices accessible through this pHCI
57567c478bd9Sstevel@tonic-gate 		 */
57577c478bd9Sstevel@tonic-gate 		pip = ph->ph_path_head;
57587c478bd9Sstevel@tonic-gate 		while (pip != NULL && rv == DDI_SUCCESS) {
57597c478bd9Sstevel@tonic-gate 			dev_info_t *cdip;
57607c478bd9Sstevel@tonic-gate 			MDI_PI_LOCK(pip);
57617c478bd9Sstevel@tonic-gate 			next =
57627c478bd9Sstevel@tonic-gate 			    (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
57637c478bd9Sstevel@tonic-gate 			ct = MDI_PI(pip)->pi_client;
57647c478bd9Sstevel@tonic-gate 			i_mdi_client_lock(ct, pip);
57657c478bd9Sstevel@tonic-gate 			cdip = ct->ct_dip;
57667c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
57677c478bd9Sstevel@tonic-gate 			if ((MDI_CLIENT_IS_DETACHED(ct) == 0) &&
57687c478bd9Sstevel@tonic-gate 			    MDI_CLIENT_IS_SUSPENDED(ct) == 0) {
57697c478bd9Sstevel@tonic-gate 				i_mdi_client_unlock(ct);
57707c478bd9Sstevel@tonic-gate 				if ((rv = devi_detach(cdip, DDI_SUSPEND)) !=
57717c478bd9Sstevel@tonic-gate 				    DDI_SUCCESS) {
57727c478bd9Sstevel@tonic-gate 					/*
57737c478bd9Sstevel@tonic-gate 					 * Suspend of one of the client
57747c478bd9Sstevel@tonic-gate 					 * device has failed.
57757c478bd9Sstevel@tonic-gate 					 */
57764c06356bSdh142964 					MDI_DEBUG(1, (MDI_WARN, dip,
57774c06356bSdh142964 					    "!suspend of device (%s%d) failed.",
57787c478bd9Sstevel@tonic-gate 					    ddi_driver_name(cdip),
57797c478bd9Sstevel@tonic-gate 					    ddi_get_instance(cdip)));
57807c478bd9Sstevel@tonic-gate 					failed_pip = pip;
57817c478bd9Sstevel@tonic-gate 					break;
57827c478bd9Sstevel@tonic-gate 				}
57837c478bd9Sstevel@tonic-gate 			} else {
57847c478bd9Sstevel@tonic-gate 				i_mdi_client_unlock(ct);
57857c478bd9Sstevel@tonic-gate 			}
57867c478bd9Sstevel@tonic-gate 			pip = next;
57877c478bd9Sstevel@tonic-gate 		}
57887c478bd9Sstevel@tonic-gate 
57897c478bd9Sstevel@tonic-gate 		if (rv == DDI_SUCCESS) {
57907c478bd9Sstevel@tonic-gate 			/*
57917c478bd9Sstevel@tonic-gate 			 * Suspend of client devices is complete. Proceed
57927c478bd9Sstevel@tonic-gate 			 * with pHCI suspend.
57937c478bd9Sstevel@tonic-gate 			 */
57947c478bd9Sstevel@tonic-gate 			MDI_PHCI_SET_SUSPEND(ph);
57957c478bd9Sstevel@tonic-gate 		} else {
57967c478bd9Sstevel@tonic-gate 			/*
57977c478bd9Sstevel@tonic-gate 			 * Revert back all the suspended client device states
57987c478bd9Sstevel@tonic-gate 			 * to converse.
57997c478bd9Sstevel@tonic-gate 			 */
58007c478bd9Sstevel@tonic-gate 			pip = ph->ph_path_head;
58017c478bd9Sstevel@tonic-gate 			while (pip != failed_pip) {
58027c478bd9Sstevel@tonic-gate 				dev_info_t *cdip;
58037c478bd9Sstevel@tonic-gate 				MDI_PI_LOCK(pip);
58047c478bd9Sstevel@tonic-gate 				next =
58057c478bd9Sstevel@tonic-gate 				    (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
58067c478bd9Sstevel@tonic-gate 				ct = MDI_PI(pip)->pi_client;
58077c478bd9Sstevel@tonic-gate 				i_mdi_client_lock(ct, pip);
58087c478bd9Sstevel@tonic-gate 				cdip = ct->ct_dip;
58097c478bd9Sstevel@tonic-gate 				MDI_PI_UNLOCK(pip);
58107c478bd9Sstevel@tonic-gate 				if (MDI_CLIENT_IS_SUSPENDED(ct)) {
58117c478bd9Sstevel@tonic-gate 					i_mdi_client_unlock(ct);
58127c478bd9Sstevel@tonic-gate 					(void) devi_attach(cdip, DDI_RESUME);
58137c478bd9Sstevel@tonic-gate 				} else {
58147c478bd9Sstevel@tonic-gate 					i_mdi_client_unlock(ct);
58157c478bd9Sstevel@tonic-gate 				}
58167c478bd9Sstevel@tonic-gate 				pip = next;
58177c478bd9Sstevel@tonic-gate 			}
58187c478bd9Sstevel@tonic-gate 		}
58197c478bd9Sstevel@tonic-gate 		break;
58207c478bd9Sstevel@tonic-gate 
58217c478bd9Sstevel@tonic-gate 	default:
58227c478bd9Sstevel@tonic-gate 		rv = DDI_FAILURE;
58237c478bd9Sstevel@tonic-gate 		break;
58247c478bd9Sstevel@tonic-gate 	}
58257c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNLOCK(ph);
58267c478bd9Sstevel@tonic-gate 	return (rv);
58277c478bd9Sstevel@tonic-gate }
58287c478bd9Sstevel@tonic-gate 
58297c478bd9Sstevel@tonic-gate /*ARGSUSED*/
58307c478bd9Sstevel@tonic-gate static int
58317c478bd9Sstevel@tonic-gate i_mdi_client_pre_detach(dev_info_t *dip, ddi_detach_cmd_t cmd)
58327c478bd9Sstevel@tonic-gate {
58337c478bd9Sstevel@tonic-gate 	int		rv = DDI_SUCCESS;
58347c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
58357c478bd9Sstevel@tonic-gate 
58367c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(dip);
58377c478bd9Sstevel@tonic-gate 	if (ct == NULL) {
58387c478bd9Sstevel@tonic-gate 		return (rv);
58397c478bd9Sstevel@tonic-gate 	}
58407c478bd9Sstevel@tonic-gate 
58417c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
58427c478bd9Sstevel@tonic-gate 	switch (cmd) {
58437c478bd9Sstevel@tonic-gate 	case DDI_DETACH:
58444c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, dip,
58454c06356bSdh142964 		    "client pre_detach: called %p",
58464c06356bSdh142964 		     (void *)ct));
58477c478bd9Sstevel@tonic-gate 		MDI_CLIENT_SET_DETACH(ct);
58487c478bd9Sstevel@tonic-gate 		break;
58497c478bd9Sstevel@tonic-gate 
58507c478bd9Sstevel@tonic-gate 	case DDI_SUSPEND:
58514c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, dip,
58524c06356bSdh142964 		    "client pre_suspend: called %p",
58534c06356bSdh142964 		    (void *)ct));
58547c478bd9Sstevel@tonic-gate 		MDI_CLIENT_SET_SUSPEND(ct);
58557c478bd9Sstevel@tonic-gate 		break;
58567c478bd9Sstevel@tonic-gate 
58577c478bd9Sstevel@tonic-gate 	default:
58587c478bd9Sstevel@tonic-gate 		rv = DDI_FAILURE;
58597c478bd9Sstevel@tonic-gate 		break;
58607c478bd9Sstevel@tonic-gate 	}
58617c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
58627c478bd9Sstevel@tonic-gate 	return (rv);
58637c478bd9Sstevel@tonic-gate }
58647c478bd9Sstevel@tonic-gate 
58657c478bd9Sstevel@tonic-gate /*
58667c478bd9Sstevel@tonic-gate  * mdi_post_detach():
58677c478bd9Sstevel@tonic-gate  *		Post detach notification handler
58687c478bd9Sstevel@tonic-gate  */
58697c478bd9Sstevel@tonic-gate /*ARGSUSED*/
58707c478bd9Sstevel@tonic-gate void
58717c478bd9Sstevel@tonic-gate mdi_post_detach(dev_info_t *dip, ddi_detach_cmd_t cmd, int error)
58727c478bd9Sstevel@tonic-gate {
58737c478bd9Sstevel@tonic-gate 	/*
58747c478bd9Sstevel@tonic-gate 	 * Detach/Suspend of mpxio component failed. Update our state
58757c478bd9Sstevel@tonic-gate 	 * too
58767c478bd9Sstevel@tonic-gate 	 */
58777c478bd9Sstevel@tonic-gate 	if (MDI_PHCI(dip))
58787c478bd9Sstevel@tonic-gate 		i_mdi_phci_post_detach(dip, cmd, error);
58797c478bd9Sstevel@tonic-gate 
58807c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT(dip))
58817c478bd9Sstevel@tonic-gate 		i_mdi_client_post_detach(dip, cmd, error);
58827c478bd9Sstevel@tonic-gate }
58837c478bd9Sstevel@tonic-gate 
58847c478bd9Sstevel@tonic-gate /*ARGSUSED*/
58857c478bd9Sstevel@tonic-gate static void
58867c478bd9Sstevel@tonic-gate i_mdi_phci_post_detach(dev_info_t *dip, ddi_detach_cmd_t cmd, int error)
58877c478bd9Sstevel@tonic-gate {
58887c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
58897c478bd9Sstevel@tonic-gate 
58907c478bd9Sstevel@tonic-gate 	/*
58917c478bd9Sstevel@tonic-gate 	 * Detach/Suspend of phci component failed. Update our state
58927c478bd9Sstevel@tonic-gate 	 * too
58937c478bd9Sstevel@tonic-gate 	 */
58947c478bd9Sstevel@tonic-gate 	ph = i_devi_get_phci(dip);
58957c478bd9Sstevel@tonic-gate 	if (ph == NULL) {
58967c478bd9Sstevel@tonic-gate 		return;
58977c478bd9Sstevel@tonic-gate 	}
58987c478bd9Sstevel@tonic-gate 
58997c478bd9Sstevel@tonic-gate 	MDI_PHCI_LOCK(ph);
59007c478bd9Sstevel@tonic-gate 	/*
59017c478bd9Sstevel@tonic-gate 	 * Detach of pHCI failed. Restore back converse
59027c478bd9Sstevel@tonic-gate 	 * state
59037c478bd9Sstevel@tonic-gate 	 */
59047c478bd9Sstevel@tonic-gate 	switch (cmd) {
59057c478bd9Sstevel@tonic-gate 	case DDI_DETACH:
59064c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, dip,
59074c06356bSdh142964 		    "pHCI post_detach: called %p",
59084c06356bSdh142964 		    (void *)ph));
59097c478bd9Sstevel@tonic-gate 		if (error != DDI_SUCCESS)
59107c478bd9Sstevel@tonic-gate 			MDI_PHCI_SET_ATTACH(ph);
59117c478bd9Sstevel@tonic-gate 		break;
59127c478bd9Sstevel@tonic-gate 
59137c478bd9Sstevel@tonic-gate 	case DDI_SUSPEND:
59144c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, dip,
59154c06356bSdh142964 		    "pHCI post_suspend: called %p",
59164c06356bSdh142964 		    (void *)ph));
59177c478bd9Sstevel@tonic-gate 		if (error != DDI_SUCCESS)
59187c478bd9Sstevel@tonic-gate 			MDI_PHCI_SET_RESUME(ph);
59197c478bd9Sstevel@tonic-gate 		break;
59207c478bd9Sstevel@tonic-gate 	}
59217c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNLOCK(ph);
59227c478bd9Sstevel@tonic-gate }
59237c478bd9Sstevel@tonic-gate 
59247c478bd9Sstevel@tonic-gate /*ARGSUSED*/
59257c478bd9Sstevel@tonic-gate static void
59267c478bd9Sstevel@tonic-gate i_mdi_client_post_detach(dev_info_t *dip, ddi_detach_cmd_t cmd, int error)
59277c478bd9Sstevel@tonic-gate {
59287c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
59297c478bd9Sstevel@tonic-gate 
59307c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(dip);
59317c478bd9Sstevel@tonic-gate 	if (ct == NULL) {
59327c478bd9Sstevel@tonic-gate 		return;
59337c478bd9Sstevel@tonic-gate 	}
59347c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
59357c478bd9Sstevel@tonic-gate 	/*
59367c478bd9Sstevel@tonic-gate 	 * Detach of Client failed. Restore back converse
59377c478bd9Sstevel@tonic-gate 	 * state
59387c478bd9Sstevel@tonic-gate 	 */
59397c478bd9Sstevel@tonic-gate 	switch (cmd) {
59407c478bd9Sstevel@tonic-gate 	case DDI_DETACH:
59414c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, dip,
59424c06356bSdh142964 		    "client post_detach: called %p", (void *)ct));
59437c478bd9Sstevel@tonic-gate 		if (DEVI_IS_ATTACHING(ct->ct_dip)) {
59444c06356bSdh142964 			MDI_DEBUG(4, (MDI_NOTE, dip,
59457c478bd9Sstevel@tonic-gate 			    "i_mdi_pm_rele_client\n"));
59467c478bd9Sstevel@tonic-gate 			i_mdi_pm_rele_client(ct, ct->ct_path_count);
59477c478bd9Sstevel@tonic-gate 		} else {
59484c06356bSdh142964 			MDI_DEBUG(4, (MDI_NOTE, dip,
59497c478bd9Sstevel@tonic-gate 			    "i_mdi_pm_reset_client\n"));
59507c478bd9Sstevel@tonic-gate 			i_mdi_pm_reset_client(ct);
59517c478bd9Sstevel@tonic-gate 		}
59527c478bd9Sstevel@tonic-gate 		if (error != DDI_SUCCESS)
59537c478bd9Sstevel@tonic-gate 			MDI_CLIENT_SET_ATTACH(ct);
59547c478bd9Sstevel@tonic-gate 		break;
59557c478bd9Sstevel@tonic-gate 
59567c478bd9Sstevel@tonic-gate 	case DDI_SUSPEND:
59574c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, dip,
59584c06356bSdh142964 		    "called %p", (void *)ct));
59597c478bd9Sstevel@tonic-gate 		if (error != DDI_SUCCESS)
59607c478bd9Sstevel@tonic-gate 			MDI_CLIENT_SET_RESUME(ct);
59617c478bd9Sstevel@tonic-gate 		break;
59627c478bd9Sstevel@tonic-gate 	}
59637c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
59647c478bd9Sstevel@tonic-gate }
59657c478bd9Sstevel@tonic-gate 
596637fbbce5Scth int
596737fbbce5Scth mdi_pi_kstat_exists(mdi_pathinfo_t *pip)
596837fbbce5Scth {
596937fbbce5Scth 	return (MDI_PI(pip)->pi_kstats ? 1 : 0);
597037fbbce5Scth }
597137fbbce5Scth 
59727c478bd9Sstevel@tonic-gate /*
59737c478bd9Sstevel@tonic-gate  * create and install per-path (client - pHCI) statistics
59747c478bd9Sstevel@tonic-gate  * I/O stats supported: nread, nwritten, reads, and writes
59757c478bd9Sstevel@tonic-gate  * Error stats - hard errors, soft errors, & transport errors
59767c478bd9Sstevel@tonic-gate  */
597737fbbce5Scth int
597837fbbce5Scth mdi_pi_kstat_create(mdi_pathinfo_t *pip, char *ksname)
59797c478bd9Sstevel@tonic-gate {
59807c478bd9Sstevel@tonic-gate 	kstat_t			*kiosp, *kerrsp;
59817c478bd9Sstevel@tonic-gate 	struct pi_errs		*nsp;
59827c478bd9Sstevel@tonic-gate 	struct mdi_pi_kstats	*mdi_statp;
59837c478bd9Sstevel@tonic-gate 
59847c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_kstats != NULL)
59857c478bd9Sstevel@tonic-gate 		return (MDI_SUCCESS);
59867c478bd9Sstevel@tonic-gate 
59877c478bd9Sstevel@tonic-gate 	if ((kiosp = kstat_create("mdi", 0, ksname, "iopath",
598837fbbce5Scth 	    KSTAT_TYPE_IO, 1, KSTAT_FLAG_PERSISTENT)) == NULL) {
59897c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
59907c478bd9Sstevel@tonic-gate 	}
59917c478bd9Sstevel@tonic-gate 
599237fbbce5Scth 	(void) strcat(ksname, ",err");
59937c478bd9Sstevel@tonic-gate 	kerrsp = kstat_create("mdi", 0, ksname, "iopath_errors",
59947c478bd9Sstevel@tonic-gate 	    KSTAT_TYPE_NAMED,
59957c478bd9Sstevel@tonic-gate 	    sizeof (struct pi_errs) / sizeof (kstat_named_t), 0);
59967c478bd9Sstevel@tonic-gate 	if (kerrsp == NULL) {
59977c478bd9Sstevel@tonic-gate 		kstat_delete(kiosp);
59987c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
59997c478bd9Sstevel@tonic-gate 	}
60007c478bd9Sstevel@tonic-gate 
60017c478bd9Sstevel@tonic-gate 	nsp = (struct pi_errs *)kerrsp->ks_data;
60027c478bd9Sstevel@tonic-gate 	kstat_named_init(&nsp->pi_softerrs, "Soft Errors", KSTAT_DATA_UINT32);
60037c478bd9Sstevel@tonic-gate 	kstat_named_init(&nsp->pi_harderrs, "Hard Errors", KSTAT_DATA_UINT32);
60047c478bd9Sstevel@tonic-gate 	kstat_named_init(&nsp->pi_transerrs, "Transport Errors",
60057c478bd9Sstevel@tonic-gate 	    KSTAT_DATA_UINT32);
60067c478bd9Sstevel@tonic-gate 	kstat_named_init(&nsp->pi_icnt_busy, "Interconnect Busy",
60077c478bd9Sstevel@tonic-gate 	    KSTAT_DATA_UINT32);
60087c478bd9Sstevel@tonic-gate 	kstat_named_init(&nsp->pi_icnt_errors, "Interconnect Errors",
60097c478bd9Sstevel@tonic-gate 	    KSTAT_DATA_UINT32);
60107c478bd9Sstevel@tonic-gate 	kstat_named_init(&nsp->pi_phci_rsrc, "pHCI No Resources",
60117c478bd9Sstevel@tonic-gate 	    KSTAT_DATA_UINT32);
60127c478bd9Sstevel@tonic-gate 	kstat_named_init(&nsp->pi_phci_localerr, "pHCI Local Errors",
60137c478bd9Sstevel@tonic-gate 	    KSTAT_DATA_UINT32);
60147c478bd9Sstevel@tonic-gate 	kstat_named_init(&nsp->pi_phci_invstate, "pHCI Invalid State",
60157c478bd9Sstevel@tonic-gate 	    KSTAT_DATA_UINT32);
60167c478bd9Sstevel@tonic-gate 	kstat_named_init(&nsp->pi_failedfrom, "Failed From",
60177c478bd9Sstevel@tonic-gate 	    KSTAT_DATA_UINT32);
60187c478bd9Sstevel@tonic-gate 	kstat_named_init(&nsp->pi_failedto, "Failed To", KSTAT_DATA_UINT32);
60197c478bd9Sstevel@tonic-gate 
60207c478bd9Sstevel@tonic-gate 	mdi_statp = kmem_alloc(sizeof (*mdi_statp), KM_SLEEP);
60217c478bd9Sstevel@tonic-gate 	mdi_statp->pi_kstat_ref = 1;
60227c478bd9Sstevel@tonic-gate 	mdi_statp->pi_kstat_iostats = kiosp;
60237c478bd9Sstevel@tonic-gate 	mdi_statp->pi_kstat_errstats = kerrsp;
60247c478bd9Sstevel@tonic-gate 	kstat_install(kiosp);
60257c478bd9Sstevel@tonic-gate 	kstat_install(kerrsp);
60267c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_kstats = mdi_statp;
60277c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
60287c478bd9Sstevel@tonic-gate }
60297c478bd9Sstevel@tonic-gate 
60307c478bd9Sstevel@tonic-gate /*
60317c478bd9Sstevel@tonic-gate  * destroy per-path properties
60327c478bd9Sstevel@tonic-gate  */
60337c478bd9Sstevel@tonic-gate static void
60347c478bd9Sstevel@tonic-gate i_mdi_pi_kstat_destroy(mdi_pathinfo_t *pip)
60357c478bd9Sstevel@tonic-gate {
60367c478bd9Sstevel@tonic-gate 
60377c478bd9Sstevel@tonic-gate 	struct mdi_pi_kstats *mdi_statp;
60387c478bd9Sstevel@tonic-gate 
603937fbbce5Scth 	if (MDI_PI(pip)->pi_kstats == NULL)
604037fbbce5Scth 		return;
60417c478bd9Sstevel@tonic-gate 	if ((mdi_statp = MDI_PI(pip)->pi_kstats) == NULL)
60427c478bd9Sstevel@tonic-gate 		return;
60437c478bd9Sstevel@tonic-gate 
60447c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_kstats = NULL;
60457c478bd9Sstevel@tonic-gate 
60467c478bd9Sstevel@tonic-gate 	/*
60477c478bd9Sstevel@tonic-gate 	 * the kstat may be shared between multiple pathinfo nodes
60487c478bd9Sstevel@tonic-gate 	 * decrement this pathinfo's usage, removing the kstats
60497c478bd9Sstevel@tonic-gate 	 * themselves when the last pathinfo reference is removed.
60507c478bd9Sstevel@tonic-gate 	 */
60517c478bd9Sstevel@tonic-gate 	ASSERT(mdi_statp->pi_kstat_ref > 0);
60527c478bd9Sstevel@tonic-gate 	if (--mdi_statp->pi_kstat_ref != 0)
60537c478bd9Sstevel@tonic-gate 		return;
60547c478bd9Sstevel@tonic-gate 
60557c478bd9Sstevel@tonic-gate 	kstat_delete(mdi_statp->pi_kstat_iostats);
60567c478bd9Sstevel@tonic-gate 	kstat_delete(mdi_statp->pi_kstat_errstats);
60577c478bd9Sstevel@tonic-gate 	kmem_free(mdi_statp, sizeof (*mdi_statp));
60587c478bd9Sstevel@tonic-gate }
60597c478bd9Sstevel@tonic-gate 
60607c478bd9Sstevel@tonic-gate /*
60617c478bd9Sstevel@tonic-gate  * update I/O paths KSTATS
60627c478bd9Sstevel@tonic-gate  */
60637c478bd9Sstevel@tonic-gate void
60647c478bd9Sstevel@tonic-gate mdi_pi_kstat_iosupdate(mdi_pathinfo_t *pip, struct buf *bp)
60657c478bd9Sstevel@tonic-gate {
60667c478bd9Sstevel@tonic-gate 	kstat_t *iostatp;
60677c478bd9Sstevel@tonic-gate 	size_t xfer_cnt;
60687c478bd9Sstevel@tonic-gate 
60697c478bd9Sstevel@tonic-gate 	ASSERT(pip != NULL);
60707c478bd9Sstevel@tonic-gate 
60717c478bd9Sstevel@tonic-gate 	/*
60727c478bd9Sstevel@tonic-gate 	 * I/O can be driven across a path prior to having path
60737c478bd9Sstevel@tonic-gate 	 * statistics available, i.e. probe(9e).
60747c478bd9Sstevel@tonic-gate 	 */
60757c478bd9Sstevel@tonic-gate 	if (bp != NULL && MDI_PI(pip)->pi_kstats != NULL) {
60767c478bd9Sstevel@tonic-gate 		iostatp = MDI_PI(pip)->pi_kstats->pi_kstat_iostats;
60777c478bd9Sstevel@tonic-gate 		xfer_cnt = bp->b_bcount - bp->b_resid;
60787c478bd9Sstevel@tonic-gate 		if (bp->b_flags & B_READ) {
60797c478bd9Sstevel@tonic-gate 			KSTAT_IO_PTR(iostatp)->reads++;
60807c478bd9Sstevel@tonic-gate 			KSTAT_IO_PTR(iostatp)->nread += xfer_cnt;
60817c478bd9Sstevel@tonic-gate 		} else {
60827c478bd9Sstevel@tonic-gate 			KSTAT_IO_PTR(iostatp)->writes++;
60837c478bd9Sstevel@tonic-gate 			KSTAT_IO_PTR(iostatp)->nwritten += xfer_cnt;
60847c478bd9Sstevel@tonic-gate 		}
60857c478bd9Sstevel@tonic-gate 	}
60867c478bd9Sstevel@tonic-gate }
60877c478bd9Sstevel@tonic-gate 
60887c478bd9Sstevel@tonic-gate /*
6089ee28b439Scm136836  * Enable the path(specific client/target/initiator)
6090ee28b439Scm136836  * Enabling a path means that MPxIO may select the enabled path for routing
6091ee28b439Scm136836  * future I/O requests, subject to other path state constraints.
6092ee28b439Scm136836  */
6093ee28b439Scm136836 int
6094ee28b439Scm136836 mdi_pi_enable_path(mdi_pathinfo_t *pip, int flags)
6095ee28b439Scm136836 {
6096ee28b439Scm136836 	mdi_phci_t	*ph;
6097ee28b439Scm136836 
60984c06356bSdh142964 	ph = MDI_PI(pip)->pi_phci;
6099ee28b439Scm136836 	if (ph == NULL) {
61004c06356bSdh142964 		MDI_DEBUG(1, (MDI_NOTE, mdi_pi_get_phci(pip),
61014c06356bSdh142964 		    "!failed: path %s %p: NULL ph",
61024c06356bSdh142964 		    mdi_pi_spathname(pip), (void *)pip));
6103ee28b439Scm136836 		return (MDI_FAILURE);
6104ee28b439Scm136836 	}
6105ee28b439Scm136836 
6106ee28b439Scm136836 	(void) i_mdi_enable_disable_path(pip, ph->ph_vhci, flags,
6107ee28b439Scm136836 		MDI_ENABLE_OP);
61084c06356bSdh142964 	MDI_DEBUG(5, (MDI_NOTE, ph->ph_dip,
61094c06356bSdh142964 	    "!returning success pip = %p. ph = %p",
61105e3986cbScth 	    (void *)pip, (void *)ph));
6111ee28b439Scm136836 	return (MDI_SUCCESS);
6112ee28b439Scm136836 
6113ee28b439Scm136836 }
6114ee28b439Scm136836 
6115ee28b439Scm136836 /*
6116ee28b439Scm136836  * Disable the path (specific client/target/initiator)
6117ee28b439Scm136836  * Disabling a path means that MPxIO will not select the disabled path for
6118ee28b439Scm136836  * routing any new I/O requests.
6119ee28b439Scm136836  */
6120ee28b439Scm136836 int
6121ee28b439Scm136836 mdi_pi_disable_path(mdi_pathinfo_t *pip, int flags)
6122ee28b439Scm136836 {
6123ee28b439Scm136836 	mdi_phci_t	*ph;
6124ee28b439Scm136836 
61254c06356bSdh142964 	ph = MDI_PI(pip)->pi_phci;
6126ee28b439Scm136836 	if (ph == NULL) {
61274c06356bSdh142964 		MDI_DEBUG(1, (MDI_NOTE, mdi_pi_get_phci(pip),
61284c06356bSdh142964 		    "!failed: path %s %p: NULL ph",
61294c06356bSdh142964 		    mdi_pi_spathname(pip), (void *)pip));
6130ee28b439Scm136836 		return (MDI_FAILURE);
6131ee28b439Scm136836 	}
6132ee28b439Scm136836 
6133ee28b439Scm136836 	(void) i_mdi_enable_disable_path(pip,
6134ee28b439Scm136836 	    ph->ph_vhci, flags, MDI_DISABLE_OP);
61354c06356bSdh142964 	MDI_DEBUG(5, (MDI_NOTE, ph->ph_dip,
61364c06356bSdh142964 	    "!returning success pip = %p. ph = %p",
61375e3986cbScth 	    (void *)pip, (void *)ph));
6138ee28b439Scm136836 	return (MDI_SUCCESS);
6139ee28b439Scm136836 }
6140ee28b439Scm136836 
6141ee28b439Scm136836 /*
61427c478bd9Sstevel@tonic-gate  * disable the path to a particular pHCI (pHCI specified in the phci_path
61437c478bd9Sstevel@tonic-gate  * argument) for a particular client (specified in the client_path argument).
61447c478bd9Sstevel@tonic-gate  * Disabling a path means that MPxIO will not select the disabled path for
61457c478bd9Sstevel@tonic-gate  * routing any new I/O requests.
6146ee28b439Scm136836  * NOTE: this will be removed once the NWS files are changed to use the new
6147ee28b439Scm136836  * mdi_{enable,disable}_path interfaces
61487c478bd9Sstevel@tonic-gate  */
61497c478bd9Sstevel@tonic-gate int
61507c478bd9Sstevel@tonic-gate mdi_pi_disable(dev_info_t *cdip, dev_info_t *pdip, int flags)
61517c478bd9Sstevel@tonic-gate {
61527c478bd9Sstevel@tonic-gate 	return (i_mdi_pi_enable_disable(cdip, pdip, flags, MDI_DISABLE_OP));
61537c478bd9Sstevel@tonic-gate }
61547c478bd9Sstevel@tonic-gate 
61557c478bd9Sstevel@tonic-gate /*
61567c478bd9Sstevel@tonic-gate  * Enable the path to a particular pHCI (pHCI specified in the phci_path
61577c478bd9Sstevel@tonic-gate  * argument) for a particular client (specified in the client_path argument).
61587c478bd9Sstevel@tonic-gate  * Enabling a path means that MPxIO may select the enabled path for routing
61597c478bd9Sstevel@tonic-gate  * future I/O requests, subject to other path state constraints.
6160ee28b439Scm136836  * NOTE: this will be removed once the NWS files are changed to use the new
6161ee28b439Scm136836  * mdi_{enable,disable}_path interfaces
61627c478bd9Sstevel@tonic-gate  */
61637c478bd9Sstevel@tonic-gate 
61647c478bd9Sstevel@tonic-gate int
61657c478bd9Sstevel@tonic-gate mdi_pi_enable(dev_info_t *cdip, dev_info_t *pdip, int flags)
61667c478bd9Sstevel@tonic-gate {
61677c478bd9Sstevel@tonic-gate 	return (i_mdi_pi_enable_disable(cdip, pdip, flags, MDI_ENABLE_OP));
61687c478bd9Sstevel@tonic-gate }
61697c478bd9Sstevel@tonic-gate 
6170ee28b439Scm136836 /*
6171ee28b439Scm136836  * Common routine for doing enable/disable.
6172ee28b439Scm136836  */
6173ee28b439Scm136836 static mdi_pathinfo_t *
6174ee28b439Scm136836 i_mdi_enable_disable_path(mdi_pathinfo_t *pip, mdi_vhci_t *vh, int flags,
6175ee28b439Scm136836 		int op)
6176ee28b439Scm136836 {
6177ee28b439Scm136836 	int		sync_flag = 0;
6178ee28b439Scm136836 	int		rv;
6179ee28b439Scm136836 	mdi_pathinfo_t 	*next;
6180ee28b439Scm136836 	int		(*f)() = NULL;
6181ee28b439Scm136836 
61826c8e19d4SZach Kissel 	/*
61836c8e19d4SZach Kissel 	 * Check to make sure the path is not already in the
61846c8e19d4SZach Kissel 	 * requested state. If it is just return the next path
61856c8e19d4SZach Kissel 	 * as we have nothing to do here.
61866c8e19d4SZach Kissel 	 */
61876c8e19d4SZach Kissel 	if ((MDI_PI_IS_DISABLE(pip) && op == MDI_DISABLE_OP) ||
61886c8e19d4SZach Kissel 	    (!MDI_PI_IS_DISABLE(pip) && op == MDI_ENABLE_OP)) {
61896c8e19d4SZach Kissel 		MDI_PI_LOCK(pip);
61906c8e19d4SZach Kissel 		next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
61916c8e19d4SZach Kissel 		MDI_PI_UNLOCK(pip);
61926c8e19d4SZach Kissel 		return (next);
61936c8e19d4SZach Kissel 	}
61946c8e19d4SZach Kissel 
6195ee28b439Scm136836 	f = vh->vh_ops->vo_pi_state_change;
6196ee28b439Scm136836 
6197ee28b439Scm136836 	sync_flag = (flags << 8) & 0xf00;
6198ee28b439Scm136836 
6199ee28b439Scm136836 	/*
6200ee28b439Scm136836 	 * Do a callback into the mdi consumer to let it
6201ee28b439Scm136836 	 * know that path is about to get enabled/disabled.
6202ee28b439Scm136836 	 */
6203ee28b439Scm136836 	if (f != NULL) {
6204ee28b439Scm136836 		rv = (*f)(vh->vh_dip, pip, 0,
6205ee28b439Scm136836 			MDI_PI_EXT_STATE(pip),
6206ee28b439Scm136836 			MDI_EXT_STATE_CHANGE | sync_flag |
6207ee28b439Scm136836 			op | MDI_BEFORE_STATE_CHANGE);
6208ee28b439Scm136836 		if (rv != MDI_SUCCESS) {
62094c06356bSdh142964 			MDI_DEBUG(2, (MDI_WARN, vh->vh_dip,
62104c06356bSdh142964 			    "vo_pi_state_change: failed rv = %x", rv));
6211ee28b439Scm136836 		}
6212ee28b439Scm136836 	}
6213ee28b439Scm136836 	MDI_PI_LOCK(pip);
6214ee28b439Scm136836 	next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
6215ee28b439Scm136836 
6216ee28b439Scm136836 	switch (flags) {
6217ee28b439Scm136836 		case USER_DISABLE:
62185e3986cbScth 			if (op == MDI_DISABLE_OP) {
6219ee28b439Scm136836 				MDI_PI_SET_USER_DISABLE(pip);
62205e3986cbScth 			} else {
6221ee28b439Scm136836 				MDI_PI_SET_USER_ENABLE(pip);
62225e3986cbScth 			}
6223ee28b439Scm136836 			break;
6224ee28b439Scm136836 		case DRIVER_DISABLE:
62255e3986cbScth 			if (op == MDI_DISABLE_OP) {
6226ee28b439Scm136836 				MDI_PI_SET_DRV_DISABLE(pip);
62275e3986cbScth 			} else {
6228ee28b439Scm136836 				MDI_PI_SET_DRV_ENABLE(pip);
62295e3986cbScth 			}
6230ee28b439Scm136836 			break;
6231ee28b439Scm136836 		case DRIVER_DISABLE_TRANSIENT:
62325e3986cbScth 			if (op == MDI_DISABLE_OP && rv == MDI_SUCCESS) {
6233ee28b439Scm136836 				MDI_PI_SET_DRV_DISABLE_TRANS(pip);
62345e3986cbScth 			} else {
6235ee28b439Scm136836 				MDI_PI_SET_DRV_ENABLE_TRANS(pip);
62365e3986cbScth 			}
6237ee28b439Scm136836 			break;
6238ee28b439Scm136836 	}
6239ee28b439Scm136836 	MDI_PI_UNLOCK(pip);
6240ee28b439Scm136836 	/*
6241ee28b439Scm136836 	 * Do a callback into the mdi consumer to let it
6242ee28b439Scm136836 	 * know that path is now enabled/disabled.
6243ee28b439Scm136836 	 */
6244ee28b439Scm136836 	if (f != NULL) {
6245ee28b439Scm136836 		rv = (*f)(vh->vh_dip, pip, 0,
6246ee28b439Scm136836 			MDI_PI_EXT_STATE(pip),
6247ee28b439Scm136836 			MDI_EXT_STATE_CHANGE | sync_flag |
6248ee28b439Scm136836 			op | MDI_AFTER_STATE_CHANGE);
6249ee28b439Scm136836 		if (rv != MDI_SUCCESS) {
62504c06356bSdh142964 			MDI_DEBUG(2, (MDI_WARN, vh->vh_dip,
62514c06356bSdh142964 			    "vo_pi_state_change failed: rv = %x", rv));
6252ee28b439Scm136836 		}
6253ee28b439Scm136836 	}
6254ee28b439Scm136836 	return (next);
6255ee28b439Scm136836 }
62567c478bd9Sstevel@tonic-gate 
62577c478bd9Sstevel@tonic-gate /*
62587c478bd9Sstevel@tonic-gate  * Common routine for doing enable/disable.
6259ee28b439Scm136836  * NOTE: this will be removed once the NWS files are changed to use the new
6260ee28b439Scm136836  * mdi_{enable,disable}_path has been putback
62617c478bd9Sstevel@tonic-gate  */
62627c478bd9Sstevel@tonic-gate int
62637c478bd9Sstevel@tonic-gate i_mdi_pi_enable_disable(dev_info_t *cdip, dev_info_t *pdip, int flags, int op)
62647c478bd9Sstevel@tonic-gate {
62657c478bd9Sstevel@tonic-gate 
62667c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
62677c478bd9Sstevel@tonic-gate 	mdi_vhci_t	*vh = NULL;
62687c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
62697c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*next, *pip;
62707c478bd9Sstevel@tonic-gate 	int		found_it;
62717c478bd9Sstevel@tonic-gate 
62727c478bd9Sstevel@tonic-gate 	ph = i_devi_get_phci(pdip);
62734c06356bSdh142964 	MDI_DEBUG(5, (MDI_NOTE, cdip ? cdip : pdip,
62744c06356bSdh142964 	    "!op = %d pdip = %p cdip = %p", op, (void *)pdip,
62755e3986cbScth 	    (void *)cdip));
62767c478bd9Sstevel@tonic-gate 	if (ph == NULL) {
62774c06356bSdh142964 		MDI_DEBUG(1, (MDI_NOTE, cdip ? cdip : pdip,
62784c06356bSdh142964 		    "!failed: operation %d: NULL ph", op));
62797c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
62807c478bd9Sstevel@tonic-gate 	}
62817c478bd9Sstevel@tonic-gate 
62827c478bd9Sstevel@tonic-gate 	if ((op != MDI_ENABLE_OP) && (op != MDI_DISABLE_OP)) {
62834c06356bSdh142964 		MDI_DEBUG(1, (MDI_NOTE, cdip ? cdip : pdip,
62844c06356bSdh142964 		    "!failed: invalid operation %d", op));
62857c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
62867c478bd9Sstevel@tonic-gate 	}
62877c478bd9Sstevel@tonic-gate 
62887c478bd9Sstevel@tonic-gate 	vh = ph->ph_vhci;
62897c478bd9Sstevel@tonic-gate 
62907c478bd9Sstevel@tonic-gate 	if (cdip == NULL) {
62917c478bd9Sstevel@tonic-gate 		/*
62927c478bd9Sstevel@tonic-gate 		 * Need to mark the Phci as enabled/disabled.
62937c478bd9Sstevel@tonic-gate 		 */
62944c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, cdip ? cdip : pdip,
62954c06356bSdh142964 		    "op %d for the phci", op));
62967c478bd9Sstevel@tonic-gate 		MDI_PHCI_LOCK(ph);
62977c478bd9Sstevel@tonic-gate 		switch (flags) {
62987c478bd9Sstevel@tonic-gate 			case USER_DISABLE:
62995e3986cbScth 				if (op == MDI_DISABLE_OP) {
63007c478bd9Sstevel@tonic-gate 					MDI_PHCI_SET_USER_DISABLE(ph);
63015e3986cbScth 				} else {
63027c478bd9Sstevel@tonic-gate 					MDI_PHCI_SET_USER_ENABLE(ph);
63035e3986cbScth 				}
63047c478bd9Sstevel@tonic-gate 				break;
63057c478bd9Sstevel@tonic-gate 			case DRIVER_DISABLE:
63065e3986cbScth 				if (op == MDI_DISABLE_OP) {
63077c478bd9Sstevel@tonic-gate 					MDI_PHCI_SET_DRV_DISABLE(ph);
63085e3986cbScth 				} else {
63097c478bd9Sstevel@tonic-gate 					MDI_PHCI_SET_DRV_ENABLE(ph);
63105e3986cbScth 				}
63117c478bd9Sstevel@tonic-gate 				break;
63127c478bd9Sstevel@tonic-gate 			case DRIVER_DISABLE_TRANSIENT:
63135e3986cbScth 				if (op == MDI_DISABLE_OP) {
63147c478bd9Sstevel@tonic-gate 					MDI_PHCI_SET_DRV_DISABLE_TRANSIENT(ph);
63155e3986cbScth 				} else {
63167c478bd9Sstevel@tonic-gate 					MDI_PHCI_SET_DRV_ENABLE_TRANSIENT(ph);
63175e3986cbScth 				}
63187c478bd9Sstevel@tonic-gate 				break;
63197c478bd9Sstevel@tonic-gate 			default:
63207c478bd9Sstevel@tonic-gate 				MDI_PHCI_UNLOCK(ph);
63214c06356bSdh142964 				MDI_DEBUG(1, (MDI_NOTE, cdip ? cdip : pdip,
63224c06356bSdh142964 				    "!invalid flag argument= %d", flags));
63237c478bd9Sstevel@tonic-gate 		}
63247c478bd9Sstevel@tonic-gate 
63257c478bd9Sstevel@tonic-gate 		/*
63267c478bd9Sstevel@tonic-gate 		 * Phci has been disabled. Now try to enable/disable
63277c478bd9Sstevel@tonic-gate 		 * path info's to each client.
63287c478bd9Sstevel@tonic-gate 		 */
63297c478bd9Sstevel@tonic-gate 		pip = ph->ph_path_head;
63307c478bd9Sstevel@tonic-gate 		while (pip != NULL) {
6331ee28b439Scm136836 			pip = i_mdi_enable_disable_path(pip, vh, flags, op);
63327c478bd9Sstevel@tonic-gate 		}
63337c478bd9Sstevel@tonic-gate 		MDI_PHCI_UNLOCK(ph);
63347c478bd9Sstevel@tonic-gate 	} else {
63357c478bd9Sstevel@tonic-gate 
63367c478bd9Sstevel@tonic-gate 		/*
63377c478bd9Sstevel@tonic-gate 		 * Disable a specific client.
63387c478bd9Sstevel@tonic-gate 		 */
63397c478bd9Sstevel@tonic-gate 		ct = i_devi_get_client(cdip);
63407c478bd9Sstevel@tonic-gate 		if (ct == NULL) {
63414c06356bSdh142964 			MDI_DEBUG(1, (MDI_NOTE, cdip ? cdip : pdip,
63424c06356bSdh142964 			    "!failed: operation = %d: NULL ct", op));
63437c478bd9Sstevel@tonic-gate 			return (MDI_FAILURE);
63447c478bd9Sstevel@tonic-gate 		}
63457c478bd9Sstevel@tonic-gate 
63467c478bd9Sstevel@tonic-gate 		MDI_CLIENT_LOCK(ct);
63477c478bd9Sstevel@tonic-gate 		pip = ct->ct_path_head;
63487c478bd9Sstevel@tonic-gate 		found_it = 0;
63497c478bd9Sstevel@tonic-gate 		while (pip != NULL) {
63507c478bd9Sstevel@tonic-gate 			MDI_PI_LOCK(pip);
63517c478bd9Sstevel@tonic-gate 			next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link;
63527c478bd9Sstevel@tonic-gate 			if (MDI_PI(pip)->pi_phci == ph) {
63537c478bd9Sstevel@tonic-gate 				MDI_PI_UNLOCK(pip);
63547c478bd9Sstevel@tonic-gate 				found_it = 1;
63557c478bd9Sstevel@tonic-gate 				break;
63567c478bd9Sstevel@tonic-gate 			}
63577c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
63587c478bd9Sstevel@tonic-gate 			pip = next;
63597c478bd9Sstevel@tonic-gate 		}
63607c478bd9Sstevel@tonic-gate 
6361ee28b439Scm136836 
63627c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
63637c478bd9Sstevel@tonic-gate 		if (found_it == 0) {
63644c06356bSdh142964 			MDI_DEBUG(1, (MDI_NOTE, cdip ? cdip : pdip,
63654c06356bSdh142964 			    "!failed. Could not find corresponding pip\n"));
63667c478bd9Sstevel@tonic-gate 			return (MDI_FAILURE);
63677c478bd9Sstevel@tonic-gate 		}
6368ee28b439Scm136836 
6369ee28b439Scm136836 		(void) i_mdi_enable_disable_path(pip, vh, flags, op);
63707c478bd9Sstevel@tonic-gate 	}
63717c478bd9Sstevel@tonic-gate 
63724c06356bSdh142964 	MDI_DEBUG(5, (MDI_NOTE, cdip ? cdip : pdip,
63734c06356bSdh142964 	    "!op %d returning success pdip = %p cdip = %p",
63745e3986cbScth 	    op, (void *)pdip, (void *)cdip));
63757c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
63767c478bd9Sstevel@tonic-gate }
63777c478bd9Sstevel@tonic-gate 
63787c478bd9Sstevel@tonic-gate /*
63797c478bd9Sstevel@tonic-gate  * Ensure phci powered up
63807c478bd9Sstevel@tonic-gate  */
63817c478bd9Sstevel@tonic-gate static void
63827c478bd9Sstevel@tonic-gate i_mdi_pm_hold_pip(mdi_pathinfo_t *pip)
63837c478bd9Sstevel@tonic-gate {
63847c478bd9Sstevel@tonic-gate 	dev_info_t	*ph_dip;
63857c478bd9Sstevel@tonic-gate 
63867c478bd9Sstevel@tonic-gate 	ASSERT(pip != NULL);
63875e3986cbScth 	ASSERT(MDI_PI_LOCKED(pip));
63887c478bd9Sstevel@tonic-gate 
63897c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_pm_held) {
63907c478bd9Sstevel@tonic-gate 		return;
63917c478bd9Sstevel@tonic-gate 	}
63927c478bd9Sstevel@tonic-gate 
63937c478bd9Sstevel@tonic-gate 	ph_dip = mdi_pi_get_phci(pip);
63944c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, ph_dip,
63954c06356bSdh142964 	    "%s %p", mdi_pi_spathname(pip), (void *)pip));
63967c478bd9Sstevel@tonic-gate 	if (ph_dip == NULL) {
63977c478bd9Sstevel@tonic-gate 		return;
63987c478bd9Sstevel@tonic-gate 	}
63997c478bd9Sstevel@tonic-gate 
64007c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
64014c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, ph_dip, "kidsupcnt was %d",
64027c478bd9Sstevel@tonic-gate 	    DEVI(ph_dip)->devi_pm_kidsupcnt));
64037c478bd9Sstevel@tonic-gate 	pm_hold_power(ph_dip);
64044c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, ph_dip, "kidsupcnt is %d",
64057c478bd9Sstevel@tonic-gate 	    DEVI(ph_dip)->devi_pm_kidsupcnt));
64067c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
64077c478bd9Sstevel@tonic-gate 
64085e3986cbScth 	/* If PM_GET_PM_INFO is NULL the pm_hold_power above was a noop */
64095e3986cbScth 	if (DEVI(ph_dip)->devi_pm_info)
64107c478bd9Sstevel@tonic-gate 		MDI_PI(pip)->pi_pm_held = 1;
64117c478bd9Sstevel@tonic-gate }
64127c478bd9Sstevel@tonic-gate 
64137c478bd9Sstevel@tonic-gate /*
64147c478bd9Sstevel@tonic-gate  * Allow phci powered down
64157c478bd9Sstevel@tonic-gate  */
64167c478bd9Sstevel@tonic-gate static void
64177c478bd9Sstevel@tonic-gate i_mdi_pm_rele_pip(mdi_pathinfo_t *pip)
64187c478bd9Sstevel@tonic-gate {
64197c478bd9Sstevel@tonic-gate 	dev_info_t	*ph_dip = NULL;
64207c478bd9Sstevel@tonic-gate 
64217c478bd9Sstevel@tonic-gate 	ASSERT(pip != NULL);
64225e3986cbScth 	ASSERT(MDI_PI_LOCKED(pip));
64237c478bd9Sstevel@tonic-gate 
64247c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_pm_held == 0) {
64257c478bd9Sstevel@tonic-gate 		return;
64267c478bd9Sstevel@tonic-gate 	}
64277c478bd9Sstevel@tonic-gate 
64287c478bd9Sstevel@tonic-gate 	ph_dip = mdi_pi_get_phci(pip);
64297c478bd9Sstevel@tonic-gate 	ASSERT(ph_dip != NULL);
64307c478bd9Sstevel@tonic-gate 
64314c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, ph_dip,
64324c06356bSdh142964 	    "%s %p", mdi_pi_spathname(pip), (void *)pip));
64334c06356bSdh142964 
64347c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
64354c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, ph_dip,
64364c06356bSdh142964 	    "kidsupcnt was %d", DEVI(ph_dip)->devi_pm_kidsupcnt));
64377c478bd9Sstevel@tonic-gate 	pm_rele_power(ph_dip);
64384c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, ph_dip,
64394c06356bSdh142964 	    "kidsupcnt is %d", DEVI(ph_dip)->devi_pm_kidsupcnt));
64407c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
64414c06356bSdh142964 
64427c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_pm_held = 0;
64437c478bd9Sstevel@tonic-gate }
64447c478bd9Sstevel@tonic-gate 
64457c478bd9Sstevel@tonic-gate static void
64467c478bd9Sstevel@tonic-gate i_mdi_pm_hold_client(mdi_client_t *ct, int incr)
64477c478bd9Sstevel@tonic-gate {
64485e3986cbScth 	ASSERT(MDI_CLIENT_LOCKED(ct));
64497c478bd9Sstevel@tonic-gate 
64507c478bd9Sstevel@tonic-gate 	ct->ct_power_cnt += incr;
64514c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, ct->ct_dip,
64524c06356bSdh142964 	    "%p ct_power_cnt = %d incr = %d",
64534c06356bSdh142964 	    (void *)ct, ct->ct_power_cnt, incr));
64547c478bd9Sstevel@tonic-gate 	ASSERT(ct->ct_power_cnt >= 0);
64557c478bd9Sstevel@tonic-gate }
64567c478bd9Sstevel@tonic-gate 
64577c478bd9Sstevel@tonic-gate static void
64587c478bd9Sstevel@tonic-gate i_mdi_rele_all_phci(mdi_client_t *ct)
64597c478bd9Sstevel@tonic-gate {
64607c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t  *pip;
64617c478bd9Sstevel@tonic-gate 
64625e3986cbScth 	ASSERT(MDI_CLIENT_LOCKED(ct));
64637c478bd9Sstevel@tonic-gate 	pip = (mdi_pathinfo_t *)ct->ct_path_head;
64647c478bd9Sstevel@tonic-gate 	while (pip != NULL) {
64657c478bd9Sstevel@tonic-gate 		mdi_hold_path(pip);
64667c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
64677c478bd9Sstevel@tonic-gate 		i_mdi_pm_rele_pip(pip);
64687c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
64697c478bd9Sstevel@tonic-gate 		mdi_rele_path(pip);
64707c478bd9Sstevel@tonic-gate 		pip = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link;
64717c478bd9Sstevel@tonic-gate 	}
64727c478bd9Sstevel@tonic-gate }
64737c478bd9Sstevel@tonic-gate 
64747c478bd9Sstevel@tonic-gate static void
64757c478bd9Sstevel@tonic-gate i_mdi_pm_rele_client(mdi_client_t *ct, int decr)
64767c478bd9Sstevel@tonic-gate {
64775e3986cbScth 	ASSERT(MDI_CLIENT_LOCKED(ct));
64787c478bd9Sstevel@tonic-gate 
6479737d277aScth 	if (i_ddi_devi_attached(ct->ct_dip)) {
64807c478bd9Sstevel@tonic-gate 		ct->ct_power_cnt -= decr;
64814c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, ct->ct_dip,
64824c06356bSdh142964 		    "%p ct_power_cnt = %d decr = %d",
64835e3986cbScth 		    (void *)ct, ct->ct_power_cnt, decr));
64847c478bd9Sstevel@tonic-gate 	}
64857c478bd9Sstevel@tonic-gate 
64867c478bd9Sstevel@tonic-gate 	ASSERT(ct->ct_power_cnt >= 0);
64877c478bd9Sstevel@tonic-gate 	if (ct->ct_power_cnt == 0) {
64887c478bd9Sstevel@tonic-gate 		i_mdi_rele_all_phci(ct);
64897c478bd9Sstevel@tonic-gate 		return;
64907c478bd9Sstevel@tonic-gate 	}
64917c478bd9Sstevel@tonic-gate }
64927c478bd9Sstevel@tonic-gate 
64937c478bd9Sstevel@tonic-gate static void
64947c478bd9Sstevel@tonic-gate i_mdi_pm_reset_client(mdi_client_t *ct)
64957c478bd9Sstevel@tonic-gate {
64964c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, ct->ct_dip,
64974c06356bSdh142964 	    "%p ct_power_cnt = %d", (void *)ct, ct->ct_power_cnt));
64985e3986cbScth 	ASSERT(MDI_CLIENT_LOCKED(ct));
64997c478bd9Sstevel@tonic-gate 	ct->ct_power_cnt = 0;
65007c478bd9Sstevel@tonic-gate 	i_mdi_rele_all_phci(ct);
650178dc6db2Sllai1 	ct->ct_powercnt_config = 0;
650278dc6db2Sllai1 	ct->ct_powercnt_unconfig = 0;
65037c478bd9Sstevel@tonic-gate 	ct->ct_powercnt_reset = 1;
65047c478bd9Sstevel@tonic-gate }
65057c478bd9Sstevel@tonic-gate 
65067c478bd9Sstevel@tonic-gate static int
65077c478bd9Sstevel@tonic-gate i_mdi_power_one_phci(mdi_pathinfo_t *pip)
65087c478bd9Sstevel@tonic-gate {
65097c478bd9Sstevel@tonic-gate 	int		ret;
65107c478bd9Sstevel@tonic-gate 	dev_info_t	*ph_dip;
65117c478bd9Sstevel@tonic-gate 
65127c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
65137c478bd9Sstevel@tonic-gate 	i_mdi_pm_hold_pip(pip);
65147c478bd9Sstevel@tonic-gate 
65157c478bd9Sstevel@tonic-gate 	ph_dip = mdi_pi_get_phci(pip);
65167c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
65177c478bd9Sstevel@tonic-gate 
65187c478bd9Sstevel@tonic-gate 	/* bring all components of phci to full power */
65194c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, ph_dip,
65204c06356bSdh142964 	    "pm_powerup for %s%d %p", ddi_driver_name(ph_dip),
65215e3986cbScth 	    ddi_get_instance(ph_dip), (void *)pip));
65227c478bd9Sstevel@tonic-gate 
65237c478bd9Sstevel@tonic-gate 	ret = pm_powerup(ph_dip);
65247c478bd9Sstevel@tonic-gate 
65257c478bd9Sstevel@tonic-gate 	if (ret == DDI_FAILURE) {
65264c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, ph_dip,
65274c06356bSdh142964 		    "pm_powerup FAILED for %s%d %p",
652855e592a2SRandall Ralphs 		    ddi_driver_name(ph_dip), ddi_get_instance(ph_dip),
65295e3986cbScth 		    (void *)pip));
65307c478bd9Sstevel@tonic-gate 
65317c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
65327c478bd9Sstevel@tonic-gate 		i_mdi_pm_rele_pip(pip);
65337c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
65347c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
65357c478bd9Sstevel@tonic-gate 	}
65367c478bd9Sstevel@tonic-gate 
65377c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
65387c478bd9Sstevel@tonic-gate }
65397c478bd9Sstevel@tonic-gate 
65407c478bd9Sstevel@tonic-gate static int
65417c478bd9Sstevel@tonic-gate i_mdi_power_all_phci(mdi_client_t *ct)
65427c478bd9Sstevel@tonic-gate {
65437c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t  *pip;
65447c478bd9Sstevel@tonic-gate 	int		succeeded = 0;
65457c478bd9Sstevel@tonic-gate 
65465e3986cbScth 	ASSERT(MDI_CLIENT_LOCKED(ct));
65477c478bd9Sstevel@tonic-gate 	pip = (mdi_pathinfo_t *)ct->ct_path_head;
65487c478bd9Sstevel@tonic-gate 	while (pip != NULL) {
65495e3986cbScth 		/*
65505e3986cbScth 		 * Don't power if MDI_PATHINFO_STATE_FAULT
65515e3986cbScth 		 * or MDI_PATHINFO_STATE_OFFLINE.
65525e3986cbScth 		 */
65535e3986cbScth 		if (MDI_PI_IS_INIT(pip) ||
65545e3986cbScth 		    MDI_PI_IS_ONLINE(pip) || MDI_PI_IS_STANDBY(pip)) {
65557c478bd9Sstevel@tonic-gate 			mdi_hold_path(pip);
65567c478bd9Sstevel@tonic-gate 			MDI_CLIENT_UNLOCK(ct);
65577c478bd9Sstevel@tonic-gate 			if (i_mdi_power_one_phci(pip) == MDI_SUCCESS)
65587c478bd9Sstevel@tonic-gate 				succeeded = 1;
65597c478bd9Sstevel@tonic-gate 
65607c478bd9Sstevel@tonic-gate 			ASSERT(ct == MDI_PI(pip)->pi_client);
65617c478bd9Sstevel@tonic-gate 			MDI_CLIENT_LOCK(ct);
65627c478bd9Sstevel@tonic-gate 			mdi_rele_path(pip);
65635e3986cbScth 		}
65647c478bd9Sstevel@tonic-gate 		pip = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link;
65657c478bd9Sstevel@tonic-gate 	}
65667c478bd9Sstevel@tonic-gate 
65677c478bd9Sstevel@tonic-gate 	return (succeeded ? MDI_SUCCESS : MDI_FAILURE);
65687c478bd9Sstevel@tonic-gate }
65697c478bd9Sstevel@tonic-gate 
65707c478bd9Sstevel@tonic-gate /*
65717c478bd9Sstevel@tonic-gate  * mdi_bus_power():
65727c478bd9Sstevel@tonic-gate  *		1. Place the phci(s) into powered up state so that
65737c478bd9Sstevel@tonic-gate  *		   client can do power management
65747c478bd9Sstevel@tonic-gate  *		2. Ensure phci powered up as client power managing
65757c478bd9Sstevel@tonic-gate  * Return Values:
65767c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
65777c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
65787c478bd9Sstevel@tonic-gate  */
65797c478bd9Sstevel@tonic-gate int
65807c478bd9Sstevel@tonic-gate mdi_bus_power(dev_info_t *parent, void *impl_arg, pm_bus_power_op_t op,
65817c478bd9Sstevel@tonic-gate     void *arg, void *result)
65827c478bd9Sstevel@tonic-gate {
65837c478bd9Sstevel@tonic-gate 	int			ret = MDI_SUCCESS;
65847c478bd9Sstevel@tonic-gate 	pm_bp_child_pwrchg_t	*bpc;
65857c478bd9Sstevel@tonic-gate 	mdi_client_t		*ct;
65867c478bd9Sstevel@tonic-gate 	dev_info_t		*cdip;
65877c478bd9Sstevel@tonic-gate 	pm_bp_has_changed_t	*bphc;
65887c478bd9Sstevel@tonic-gate 
65897c478bd9Sstevel@tonic-gate 	/*
65907c478bd9Sstevel@tonic-gate 	 * BUS_POWER_NOINVOL not supported
65917c478bd9Sstevel@tonic-gate 	 */
65927c478bd9Sstevel@tonic-gate 	if (op == BUS_POWER_NOINVOL)
65937c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
65947c478bd9Sstevel@tonic-gate 
65957c478bd9Sstevel@tonic-gate 	/*
65967c478bd9Sstevel@tonic-gate 	 * ignore other OPs.
65977c478bd9Sstevel@tonic-gate 	 * return quickly to save cou cycles on the ct processing
65987c478bd9Sstevel@tonic-gate 	 */
65997c478bd9Sstevel@tonic-gate 	switch (op) {
66007c478bd9Sstevel@tonic-gate 	case BUS_POWER_PRE_NOTIFICATION:
66017c478bd9Sstevel@tonic-gate 	case BUS_POWER_POST_NOTIFICATION:
66027c478bd9Sstevel@tonic-gate 		bpc = (pm_bp_child_pwrchg_t *)arg;
66037c478bd9Sstevel@tonic-gate 		cdip = bpc->bpc_dip;
66047c478bd9Sstevel@tonic-gate 		break;
66057c478bd9Sstevel@tonic-gate 	case BUS_POWER_HAS_CHANGED:
66067c478bd9Sstevel@tonic-gate 		bphc = (pm_bp_has_changed_t *)arg;
66077c478bd9Sstevel@tonic-gate 		cdip = bphc->bphc_dip;
66087c478bd9Sstevel@tonic-gate 		break;
66097c478bd9Sstevel@tonic-gate 	default:
66107c478bd9Sstevel@tonic-gate 		return (pm_busop_bus_power(parent, impl_arg, op, arg, result));
66117c478bd9Sstevel@tonic-gate 	}
66127c478bd9Sstevel@tonic-gate 
66137c478bd9Sstevel@tonic-gate 	ASSERT(MDI_CLIENT(cdip));
66147c478bd9Sstevel@tonic-gate 
66157c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(cdip);
66167c478bd9Sstevel@tonic-gate 	if (ct == NULL)
66177c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
66187c478bd9Sstevel@tonic-gate 
66197c478bd9Sstevel@tonic-gate 	/*
66207c478bd9Sstevel@tonic-gate 	 * wait till the mdi_pathinfo node state change are processed
66217c478bd9Sstevel@tonic-gate 	 */
66227c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
66237c478bd9Sstevel@tonic-gate 	switch (op) {
66247c478bd9Sstevel@tonic-gate 	case BUS_POWER_PRE_NOTIFICATION:
66254c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, bpc->bpc_dip,
66267c478bd9Sstevel@tonic-gate 		    "BUS_POWER_PRE_NOTIFICATION:"
66274c06356bSdh142964 		    "%s@%s, olevel=%d, nlevel=%d, comp=%d",
66284c06356bSdh142964 		    ddi_node_name(bpc->bpc_dip), PM_ADDR(bpc->bpc_dip),
66297c478bd9Sstevel@tonic-gate 		    bpc->bpc_olevel, bpc->bpc_nlevel, bpc->bpc_comp));
66307c478bd9Sstevel@tonic-gate 
66317c478bd9Sstevel@tonic-gate 		/* serialize power level change per client */
66327c478bd9Sstevel@tonic-gate 		while (MDI_CLIENT_IS_POWER_TRANSITION(ct))
66337c478bd9Sstevel@tonic-gate 			cv_wait(&ct->ct_powerchange_cv, &ct->ct_mutex);
66347c478bd9Sstevel@tonic-gate 
66357c478bd9Sstevel@tonic-gate 		MDI_CLIENT_SET_POWER_TRANSITION(ct);
66367c478bd9Sstevel@tonic-gate 
66377c478bd9Sstevel@tonic-gate 		if (ct->ct_power_cnt == 0) {
66387c478bd9Sstevel@tonic-gate 			ret = i_mdi_power_all_phci(ct);
66397c478bd9Sstevel@tonic-gate 		}
66407c478bd9Sstevel@tonic-gate 
66417c478bd9Sstevel@tonic-gate 		/*
66427c478bd9Sstevel@tonic-gate 		 * if new_level > 0:
66437c478bd9Sstevel@tonic-gate 		 *	- hold phci(s)
66447c478bd9Sstevel@tonic-gate 		 *	- power up phci(s) if not already
66457c478bd9Sstevel@tonic-gate 		 * ignore power down
66467c478bd9Sstevel@tonic-gate 		 */
66477c478bd9Sstevel@tonic-gate 		if (bpc->bpc_nlevel > 0) {
66487c478bd9Sstevel@tonic-gate 			if (!DEVI_IS_ATTACHING(ct->ct_dip)) {
66494c06356bSdh142964 				MDI_DEBUG(4, (MDI_NOTE, bpc->bpc_dip,
66504c06356bSdh142964 				    "i_mdi_pm_hold_client\n"));
66517c478bd9Sstevel@tonic-gate 				i_mdi_pm_hold_client(ct, ct->ct_path_count);
66527c478bd9Sstevel@tonic-gate 			}
66537c478bd9Sstevel@tonic-gate 		}
66547c478bd9Sstevel@tonic-gate 		break;
66557c478bd9Sstevel@tonic-gate 	case BUS_POWER_POST_NOTIFICATION:
66564c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, bpc->bpc_dip,
66577c478bd9Sstevel@tonic-gate 		    "BUS_POWER_POST_NOTIFICATION:"
66584c06356bSdh142964 		    "%s@%s, olevel=%d, nlevel=%d, comp=%d result=%d",
66594c06356bSdh142964 		    ddi_node_name(bpc->bpc_dip), PM_ADDR(bpc->bpc_dip),
66607c478bd9Sstevel@tonic-gate 		    bpc->bpc_olevel, bpc->bpc_nlevel, bpc->bpc_comp,
66617c478bd9Sstevel@tonic-gate 		    *(int *)result));
66627c478bd9Sstevel@tonic-gate 
66637c478bd9Sstevel@tonic-gate 		if (*(int *)result == DDI_SUCCESS) {
66647c478bd9Sstevel@tonic-gate 			if (bpc->bpc_nlevel > 0) {
66657c478bd9Sstevel@tonic-gate 				MDI_CLIENT_SET_POWER_UP(ct);
66667c478bd9Sstevel@tonic-gate 			} else {
66677c478bd9Sstevel@tonic-gate 				MDI_CLIENT_SET_POWER_DOWN(ct);
66687c478bd9Sstevel@tonic-gate 			}
66697c478bd9Sstevel@tonic-gate 		}
66707c478bd9Sstevel@tonic-gate 
66717c478bd9Sstevel@tonic-gate 		/* release the hold we did in pre-notification */
66727c478bd9Sstevel@tonic-gate 		if (bpc->bpc_nlevel > 0 && (*(int *)result != DDI_SUCCESS) &&
66737c478bd9Sstevel@tonic-gate 		    !DEVI_IS_ATTACHING(ct->ct_dip)) {
66744c06356bSdh142964 			MDI_DEBUG(4, (MDI_NOTE, bpc->bpc_dip,
66754c06356bSdh142964 			    "i_mdi_pm_rele_client\n"));
66767c478bd9Sstevel@tonic-gate 			i_mdi_pm_rele_client(ct, ct->ct_path_count);
66777c478bd9Sstevel@tonic-gate 		}
66787c478bd9Sstevel@tonic-gate 
66797c478bd9Sstevel@tonic-gate 		if (bpc->bpc_nlevel == 0 && (*(int *)result == DDI_SUCCESS)) {
66807c478bd9Sstevel@tonic-gate 			/* another thread might started attaching */
66817c478bd9Sstevel@tonic-gate 			if (DEVI_IS_ATTACHING(ct->ct_dip)) {
66824c06356bSdh142964 				MDI_DEBUG(4, (MDI_NOTE, bpc->bpc_dip,
66834c06356bSdh142964 				    "i_mdi_pm_rele_client\n"));
66847c478bd9Sstevel@tonic-gate 				i_mdi_pm_rele_client(ct, ct->ct_path_count);
66857c478bd9Sstevel@tonic-gate 			/* detaching has been taken care in pm_post_unconfig */
66867c478bd9Sstevel@tonic-gate 			} else if (!DEVI_IS_DETACHING(ct->ct_dip)) {
66874c06356bSdh142964 				MDI_DEBUG(4, (MDI_NOTE, bpc->bpc_dip,
66884c06356bSdh142964 				    "i_mdi_pm_reset_client\n"));
66897c478bd9Sstevel@tonic-gate 				i_mdi_pm_reset_client(ct);
66907c478bd9Sstevel@tonic-gate 			}
66917c478bd9Sstevel@tonic-gate 		}
66927c478bd9Sstevel@tonic-gate 
66937c478bd9Sstevel@tonic-gate 		MDI_CLIENT_CLEAR_POWER_TRANSITION(ct);
66947c478bd9Sstevel@tonic-gate 		cv_broadcast(&ct->ct_powerchange_cv);
66957c478bd9Sstevel@tonic-gate 
66967c478bd9Sstevel@tonic-gate 		break;
66977c478bd9Sstevel@tonic-gate 
66987c478bd9Sstevel@tonic-gate 	/* need to do more */
66997c478bd9Sstevel@tonic-gate 	case BUS_POWER_HAS_CHANGED:
67004c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, bphc->bphc_dip,
67017c478bd9Sstevel@tonic-gate 		    "BUS_POWER_HAS_CHANGED:"
67024c06356bSdh142964 		    "%s@%s, olevel=%d, nlevel=%d, comp=%d",
67034c06356bSdh142964 		    ddi_node_name(bphc->bphc_dip), PM_ADDR(bphc->bphc_dip),
67047c478bd9Sstevel@tonic-gate 		    bphc->bphc_olevel, bphc->bphc_nlevel, bphc->bphc_comp));
67057c478bd9Sstevel@tonic-gate 
67067c478bd9Sstevel@tonic-gate 		if (bphc->bphc_nlevel > 0 &&
67077c478bd9Sstevel@tonic-gate 		    bphc->bphc_nlevel > bphc->bphc_olevel) {
67087c478bd9Sstevel@tonic-gate 			if (ct->ct_power_cnt == 0) {
67097c478bd9Sstevel@tonic-gate 				ret = i_mdi_power_all_phci(ct);
67107c478bd9Sstevel@tonic-gate 			}
67114c06356bSdh142964 			MDI_DEBUG(4, (MDI_NOTE, bphc->bphc_dip,
67124c06356bSdh142964 			    "i_mdi_pm_hold_client\n"));
67137c478bd9Sstevel@tonic-gate 			i_mdi_pm_hold_client(ct, ct->ct_path_count);
67147c478bd9Sstevel@tonic-gate 		}
67157c478bd9Sstevel@tonic-gate 
67167c478bd9Sstevel@tonic-gate 		if (bphc->bphc_nlevel == 0 && bphc->bphc_olevel != -1) {
67174c06356bSdh142964 			MDI_DEBUG(4, (MDI_NOTE, bphc->bphc_dip,
67184c06356bSdh142964 			    "i_mdi_pm_rele_client\n"));
67197c478bd9Sstevel@tonic-gate 			i_mdi_pm_rele_client(ct, ct->ct_path_count);
67207c478bd9Sstevel@tonic-gate 		}
67217c478bd9Sstevel@tonic-gate 		break;
67227c478bd9Sstevel@tonic-gate 	}
67237c478bd9Sstevel@tonic-gate 
67247c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
67257c478bd9Sstevel@tonic-gate 	return (ret);
67267c478bd9Sstevel@tonic-gate }
67277c478bd9Sstevel@tonic-gate 
67287c478bd9Sstevel@tonic-gate static int
67297c478bd9Sstevel@tonic-gate i_mdi_pm_pre_config_one(dev_info_t *child)
67307c478bd9Sstevel@tonic-gate {
67317c478bd9Sstevel@tonic-gate 	int		ret = MDI_SUCCESS;
67327c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
67337c478bd9Sstevel@tonic-gate 
67347c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(child);
67357c478bd9Sstevel@tonic-gate 	if (ct == NULL)
67367c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
67377c478bd9Sstevel@tonic-gate 
67387c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
67397c478bd9Sstevel@tonic-gate 	while (MDI_CLIENT_IS_POWER_TRANSITION(ct))
67407c478bd9Sstevel@tonic-gate 		cv_wait(&ct->ct_powerchange_cv, &ct->ct_mutex);
67417c478bd9Sstevel@tonic-gate 
67427c478bd9Sstevel@tonic-gate 	if (!MDI_CLIENT_IS_FAILED(ct)) {
67437c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
67444c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "already configured\n"));
67457c478bd9Sstevel@tonic-gate 		return (MDI_SUCCESS);
67467c478bd9Sstevel@tonic-gate 	}
67477c478bd9Sstevel@tonic-gate 
674878dc6db2Sllai1 	if (ct->ct_powercnt_config) {
67497c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
67504c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "already held\n"));
67517c478bd9Sstevel@tonic-gate 		return (MDI_SUCCESS);
67527c478bd9Sstevel@tonic-gate 	}
67537c478bd9Sstevel@tonic-gate 
67547c478bd9Sstevel@tonic-gate 	if (ct->ct_power_cnt == 0) {
67557c478bd9Sstevel@tonic-gate 		ret = i_mdi_power_all_phci(ct);
67567c478bd9Sstevel@tonic-gate 	}
67574c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, child, "i_mdi_pm_hold_client\n"));
67587c478bd9Sstevel@tonic-gate 	i_mdi_pm_hold_client(ct, ct->ct_path_count);
675978dc6db2Sllai1 	ct->ct_powercnt_config = 1;
67607c478bd9Sstevel@tonic-gate 	ct->ct_powercnt_reset = 0;
67617c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
67627c478bd9Sstevel@tonic-gate 	return (ret);
67637c478bd9Sstevel@tonic-gate }
67647c478bd9Sstevel@tonic-gate 
67657c478bd9Sstevel@tonic-gate static int
67665e3986cbScth i_mdi_pm_pre_config(dev_info_t *vdip, dev_info_t *child)
67677c478bd9Sstevel@tonic-gate {
67687c478bd9Sstevel@tonic-gate 	int			ret = MDI_SUCCESS;
67697c478bd9Sstevel@tonic-gate 	dev_info_t		*cdip;
67707c478bd9Sstevel@tonic-gate 	int			circ;
67717c478bd9Sstevel@tonic-gate 
67725e3986cbScth 	ASSERT(MDI_VHCI(vdip));
67737c478bd9Sstevel@tonic-gate 
67747c478bd9Sstevel@tonic-gate 	/* ndi_devi_config_one */
67757c478bd9Sstevel@tonic-gate 	if (child) {
67765e3986cbScth 		ASSERT(DEVI_BUSY_OWNED(vdip));
67777c478bd9Sstevel@tonic-gate 		return (i_mdi_pm_pre_config_one(child));
67787c478bd9Sstevel@tonic-gate 	}
67797c478bd9Sstevel@tonic-gate 
67807c478bd9Sstevel@tonic-gate 	/* devi_config_common */
67815e3986cbScth 	ndi_devi_enter(vdip, &circ);
67825e3986cbScth 	cdip = ddi_get_child(vdip);
67837c478bd9Sstevel@tonic-gate 	while (cdip) {
67847c478bd9Sstevel@tonic-gate 		dev_info_t *next = ddi_get_next_sibling(cdip);
67857c478bd9Sstevel@tonic-gate 
67867c478bd9Sstevel@tonic-gate 		ret = i_mdi_pm_pre_config_one(cdip);
67877c478bd9Sstevel@tonic-gate 		if (ret != MDI_SUCCESS)
67887c478bd9Sstevel@tonic-gate 			break;
67897c478bd9Sstevel@tonic-gate 		cdip = next;
67907c478bd9Sstevel@tonic-gate 	}
67915e3986cbScth 	ndi_devi_exit(vdip, circ);
67927c478bd9Sstevel@tonic-gate 	return (ret);
67937c478bd9Sstevel@tonic-gate }
67947c478bd9Sstevel@tonic-gate 
67957c478bd9Sstevel@tonic-gate static int
67967c478bd9Sstevel@tonic-gate i_mdi_pm_pre_unconfig_one(dev_info_t *child, int *held, int flags)
67977c478bd9Sstevel@tonic-gate {
67987c478bd9Sstevel@tonic-gate 	int		ret = MDI_SUCCESS;
67997c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
68007c478bd9Sstevel@tonic-gate 
68017c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(child);
68027c478bd9Sstevel@tonic-gate 	if (ct == NULL)
68037c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
68047c478bd9Sstevel@tonic-gate 
68057c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
68067c478bd9Sstevel@tonic-gate 	while (MDI_CLIENT_IS_POWER_TRANSITION(ct))
68077c478bd9Sstevel@tonic-gate 		cv_wait(&ct->ct_powerchange_cv, &ct->ct_mutex);
68087c478bd9Sstevel@tonic-gate 
6809737d277aScth 	if (!i_ddi_devi_attached(ct->ct_dip)) {
68104c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "node detached already\n"));
68117c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
68127c478bd9Sstevel@tonic-gate 		return (MDI_SUCCESS);
68137c478bd9Sstevel@tonic-gate 	}
68147c478bd9Sstevel@tonic-gate 
68157c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT_IS_POWERED_DOWN(ct) &&
68167c478bd9Sstevel@tonic-gate 	    (flags & NDI_AUTODETACH)) {
68174c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "auto-modunload\n"));
68187c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
68197c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
68207c478bd9Sstevel@tonic-gate 	}
68217c478bd9Sstevel@tonic-gate 
682278dc6db2Sllai1 	if (ct->ct_powercnt_unconfig) {
68234c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "ct_powercnt_held\n"));
68247c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
68257c478bd9Sstevel@tonic-gate 		*held = 1;
68267c478bd9Sstevel@tonic-gate 		return (MDI_SUCCESS);
68277c478bd9Sstevel@tonic-gate 	}
68287c478bd9Sstevel@tonic-gate 
68297c478bd9Sstevel@tonic-gate 	if (ct->ct_power_cnt == 0) {
68307c478bd9Sstevel@tonic-gate 		ret = i_mdi_power_all_phci(ct);
68317c478bd9Sstevel@tonic-gate 	}
68324c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, child, "i_mdi_pm_hold_client\n"));
68337c478bd9Sstevel@tonic-gate 	i_mdi_pm_hold_client(ct, ct->ct_path_count);
683478dc6db2Sllai1 	ct->ct_powercnt_unconfig = 1;
68357c478bd9Sstevel@tonic-gate 	ct->ct_powercnt_reset = 0;
68367c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
68377c478bd9Sstevel@tonic-gate 	if (ret == MDI_SUCCESS)
68387c478bd9Sstevel@tonic-gate 		*held = 1;
68397c478bd9Sstevel@tonic-gate 	return (ret);
68407c478bd9Sstevel@tonic-gate }
68417c478bd9Sstevel@tonic-gate 
68427c478bd9Sstevel@tonic-gate static int
68435e3986cbScth i_mdi_pm_pre_unconfig(dev_info_t *vdip, dev_info_t *child, int *held,
68447c478bd9Sstevel@tonic-gate     int flags)
68457c478bd9Sstevel@tonic-gate {
68467c478bd9Sstevel@tonic-gate 	int			ret = MDI_SUCCESS;
68477c478bd9Sstevel@tonic-gate 	dev_info_t		*cdip;
68487c478bd9Sstevel@tonic-gate 	int			circ;
68497c478bd9Sstevel@tonic-gate 
68505e3986cbScth 	ASSERT(MDI_VHCI(vdip));
68517c478bd9Sstevel@tonic-gate 	*held = 0;
68527c478bd9Sstevel@tonic-gate 
68537c478bd9Sstevel@tonic-gate 	/* ndi_devi_unconfig_one */
68547c478bd9Sstevel@tonic-gate 	if (child) {
68555e3986cbScth 		ASSERT(DEVI_BUSY_OWNED(vdip));
68567c478bd9Sstevel@tonic-gate 		return (i_mdi_pm_pre_unconfig_one(child, held, flags));
68577c478bd9Sstevel@tonic-gate 	}
68587c478bd9Sstevel@tonic-gate 
68597c478bd9Sstevel@tonic-gate 	/* devi_unconfig_common */
68605e3986cbScth 	ndi_devi_enter(vdip, &circ);
68615e3986cbScth 	cdip = ddi_get_child(vdip);
68627c478bd9Sstevel@tonic-gate 	while (cdip) {
68637c478bd9Sstevel@tonic-gate 		dev_info_t *next = ddi_get_next_sibling(cdip);
68647c478bd9Sstevel@tonic-gate 
68657c478bd9Sstevel@tonic-gate 		ret = i_mdi_pm_pre_unconfig_one(cdip, held, flags);
68667c478bd9Sstevel@tonic-gate 		cdip = next;
68677c478bd9Sstevel@tonic-gate 	}
68685e3986cbScth 	ndi_devi_exit(vdip, circ);
68697c478bd9Sstevel@tonic-gate 
68707c478bd9Sstevel@tonic-gate 	if (*held)
68717c478bd9Sstevel@tonic-gate 		ret = MDI_SUCCESS;
68727c478bd9Sstevel@tonic-gate 
68737c478bd9Sstevel@tonic-gate 	return (ret);
68747c478bd9Sstevel@tonic-gate }
68757c478bd9Sstevel@tonic-gate 
68767c478bd9Sstevel@tonic-gate static void
68777c478bd9Sstevel@tonic-gate i_mdi_pm_post_config_one(dev_info_t *child)
68787c478bd9Sstevel@tonic-gate {
68797c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
68807c478bd9Sstevel@tonic-gate 
68817c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(child);
68827c478bd9Sstevel@tonic-gate 	if (ct == NULL)
68837c478bd9Sstevel@tonic-gate 		return;
68847c478bd9Sstevel@tonic-gate 
68857c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
68867c478bd9Sstevel@tonic-gate 	while (MDI_CLIENT_IS_POWER_TRANSITION(ct))
68877c478bd9Sstevel@tonic-gate 		cv_wait(&ct->ct_powerchange_cv, &ct->ct_mutex);
68887c478bd9Sstevel@tonic-gate 
688978dc6db2Sllai1 	if (ct->ct_powercnt_reset || !ct->ct_powercnt_config) {
68904c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "not configured\n"));
68917c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
68927c478bd9Sstevel@tonic-gate 		return;
68937c478bd9Sstevel@tonic-gate 	}
68947c478bd9Sstevel@tonic-gate 
68957c478bd9Sstevel@tonic-gate 	/* client has not been updated */
68967c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT_IS_FAILED(ct)) {
68974c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "client failed\n"));
68987c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
68997c478bd9Sstevel@tonic-gate 		return;
69007c478bd9Sstevel@tonic-gate 	}
69017c478bd9Sstevel@tonic-gate 
69027c478bd9Sstevel@tonic-gate 	/* another thread might have powered it down or detached it */
69037c478bd9Sstevel@tonic-gate 	if ((MDI_CLIENT_IS_POWERED_DOWN(ct) &&
69047c478bd9Sstevel@tonic-gate 	    !DEVI_IS_ATTACHING(ct->ct_dip)) ||
6905737d277aScth 	    (!i_ddi_devi_attached(ct->ct_dip) &&
69067c478bd9Sstevel@tonic-gate 	    !DEVI_IS_ATTACHING(ct->ct_dip))) {
69074c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "i_mdi_pm_reset_client\n"));
69087c478bd9Sstevel@tonic-gate 		i_mdi_pm_reset_client(ct);
69097c478bd9Sstevel@tonic-gate 	} else {
69107c478bd9Sstevel@tonic-gate 		mdi_pathinfo_t  *pip, *next;
69117c478bd9Sstevel@tonic-gate 		int	valid_path_count = 0;
69127c478bd9Sstevel@tonic-gate 
69134c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "i_mdi_pm_rele_client\n"));
69147c478bd9Sstevel@tonic-gate 		pip = ct->ct_path_head;
69157c478bd9Sstevel@tonic-gate 		while (pip != NULL) {
69167c478bd9Sstevel@tonic-gate 			MDI_PI_LOCK(pip);
69177c478bd9Sstevel@tonic-gate 			next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link;
691878dc6db2Sllai1 			if (MDI_PI_IS_ONLINE(pip) || MDI_PI_IS_STANDBY(pip))
69197c478bd9Sstevel@tonic-gate 				valid_path_count ++;
69207c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
69217c478bd9Sstevel@tonic-gate 			pip = next;
69227c478bd9Sstevel@tonic-gate 		}
69237c478bd9Sstevel@tonic-gate 		i_mdi_pm_rele_client(ct, valid_path_count);
69247c478bd9Sstevel@tonic-gate 	}
692578dc6db2Sllai1 	ct->ct_powercnt_config = 0;
69267c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
69277c478bd9Sstevel@tonic-gate }
69287c478bd9Sstevel@tonic-gate 
69297c478bd9Sstevel@tonic-gate static void
69305e3986cbScth i_mdi_pm_post_config(dev_info_t *vdip, dev_info_t *child)
69317c478bd9Sstevel@tonic-gate {
69327c478bd9Sstevel@tonic-gate 	int		circ;
69337c478bd9Sstevel@tonic-gate 	dev_info_t	*cdip;
69345e3986cbScth 
69355e3986cbScth 	ASSERT(MDI_VHCI(vdip));
69367c478bd9Sstevel@tonic-gate 
69377c478bd9Sstevel@tonic-gate 	/* ndi_devi_config_one */
69387c478bd9Sstevel@tonic-gate 	if (child) {
69395e3986cbScth 		ASSERT(DEVI_BUSY_OWNED(vdip));
69407c478bd9Sstevel@tonic-gate 		i_mdi_pm_post_config_one(child);
69417c478bd9Sstevel@tonic-gate 		return;
69427c478bd9Sstevel@tonic-gate 	}
69437c478bd9Sstevel@tonic-gate 
69447c478bd9Sstevel@tonic-gate 	/* devi_config_common */
69455e3986cbScth 	ndi_devi_enter(vdip, &circ);
69465e3986cbScth 	cdip = ddi_get_child(vdip);
69477c478bd9Sstevel@tonic-gate 	while (cdip) {
69487c478bd9Sstevel@tonic-gate 		dev_info_t *next = ddi_get_next_sibling(cdip);
69497c478bd9Sstevel@tonic-gate 
69507c478bd9Sstevel@tonic-gate 		i_mdi_pm_post_config_one(cdip);
69517c478bd9Sstevel@tonic-gate 		cdip = next;
69527c478bd9Sstevel@tonic-gate 	}
69535e3986cbScth 	ndi_devi_exit(vdip, circ);
69547c478bd9Sstevel@tonic-gate }
69557c478bd9Sstevel@tonic-gate 
69567c478bd9Sstevel@tonic-gate static void
69577c478bd9Sstevel@tonic-gate i_mdi_pm_post_unconfig_one(dev_info_t *child)
69587c478bd9Sstevel@tonic-gate {
69597c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
69607c478bd9Sstevel@tonic-gate 
69617c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(child);
69627c478bd9Sstevel@tonic-gate 	if (ct == NULL)
69637c478bd9Sstevel@tonic-gate 		return;
69647c478bd9Sstevel@tonic-gate 
69657c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
69667c478bd9Sstevel@tonic-gate 	while (MDI_CLIENT_IS_POWER_TRANSITION(ct))
69677c478bd9Sstevel@tonic-gate 		cv_wait(&ct->ct_powerchange_cv, &ct->ct_mutex);
69687c478bd9Sstevel@tonic-gate 
696978dc6db2Sllai1 	if (!ct->ct_powercnt_unconfig || ct->ct_powercnt_reset) {
69704c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "not held\n"));
69717c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
69727c478bd9Sstevel@tonic-gate 		return;
69737c478bd9Sstevel@tonic-gate 	}
69747c478bd9Sstevel@tonic-gate 
69757c478bd9Sstevel@tonic-gate 	/* failure detaching or another thread just attached it */
69767c478bd9Sstevel@tonic-gate 	if ((MDI_CLIENT_IS_POWERED_DOWN(ct) &&
6977737d277aScth 	    i_ddi_devi_attached(ct->ct_dip)) ||
6978737d277aScth 	    (!i_ddi_devi_attached(ct->ct_dip) &&
69797c478bd9Sstevel@tonic-gate 	    !DEVI_IS_ATTACHING(ct->ct_dip))) {
69804c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "i_mdi_pm_reset_client\n"));
69817c478bd9Sstevel@tonic-gate 		i_mdi_pm_reset_client(ct);
698278dc6db2Sllai1 	} else {
698378dc6db2Sllai1 		mdi_pathinfo_t  *pip, *next;
698478dc6db2Sllai1 		int	valid_path_count = 0;
69857c478bd9Sstevel@tonic-gate 
69864c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "i_mdi_pm_rele_client\n"));
698778dc6db2Sllai1 		pip = ct->ct_path_head;
698878dc6db2Sllai1 		while (pip != NULL) {
698978dc6db2Sllai1 			MDI_PI_LOCK(pip);
699078dc6db2Sllai1 			next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link;
699178dc6db2Sllai1 			if (MDI_PI_IS_ONLINE(pip) || MDI_PI_IS_STANDBY(pip))
699278dc6db2Sllai1 				valid_path_count ++;
699378dc6db2Sllai1 			MDI_PI_UNLOCK(pip);
699478dc6db2Sllai1 			pip = next;
699578dc6db2Sllai1 		}
699678dc6db2Sllai1 		i_mdi_pm_rele_client(ct, valid_path_count);
699778dc6db2Sllai1 		ct->ct_powercnt_unconfig = 0;
699878dc6db2Sllai1 	}
699978dc6db2Sllai1 
70007c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
70017c478bd9Sstevel@tonic-gate }
70027c478bd9Sstevel@tonic-gate 
70037c478bd9Sstevel@tonic-gate static void
70045e3986cbScth i_mdi_pm_post_unconfig(dev_info_t *vdip, dev_info_t *child, int held)
70057c478bd9Sstevel@tonic-gate {
70067c478bd9Sstevel@tonic-gate 	int			circ;
70077c478bd9Sstevel@tonic-gate 	dev_info_t		*cdip;
70087c478bd9Sstevel@tonic-gate 
70095e3986cbScth 	ASSERT(MDI_VHCI(vdip));
70107c478bd9Sstevel@tonic-gate 
70117c478bd9Sstevel@tonic-gate 	if (!held) {
70124c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, vdip, "held = %d", held));
70137c478bd9Sstevel@tonic-gate 		return;
70147c478bd9Sstevel@tonic-gate 	}
70157c478bd9Sstevel@tonic-gate 
70167c478bd9Sstevel@tonic-gate 	if (child) {
70175e3986cbScth 		ASSERT(DEVI_BUSY_OWNED(vdip));
70187c478bd9Sstevel@tonic-gate 		i_mdi_pm_post_unconfig_one(child);
70197c478bd9Sstevel@tonic-gate 		return;
70207c478bd9Sstevel@tonic-gate 	}
70217c478bd9Sstevel@tonic-gate 
70225e3986cbScth 	ndi_devi_enter(vdip, &circ);
70235e3986cbScth 	cdip = ddi_get_child(vdip);
70247c478bd9Sstevel@tonic-gate 	while (cdip) {
70257c478bd9Sstevel@tonic-gate 		dev_info_t *next = ddi_get_next_sibling(cdip);
70267c478bd9Sstevel@tonic-gate 
70277c478bd9Sstevel@tonic-gate 		i_mdi_pm_post_unconfig_one(cdip);
70287c478bd9Sstevel@tonic-gate 		cdip = next;
70297c478bd9Sstevel@tonic-gate 	}
70305e3986cbScth 	ndi_devi_exit(vdip, circ);
70317c478bd9Sstevel@tonic-gate }
70327c478bd9Sstevel@tonic-gate 
70337c478bd9Sstevel@tonic-gate int
70347c478bd9Sstevel@tonic-gate mdi_power(dev_info_t *vdip, mdi_pm_op_t op, void *args, char *devnm, int flags)
70357c478bd9Sstevel@tonic-gate {
70367c478bd9Sstevel@tonic-gate 	int			circ, ret = MDI_SUCCESS;
70377c478bd9Sstevel@tonic-gate 	dev_info_t		*client_dip = NULL;
70387c478bd9Sstevel@tonic-gate 	mdi_client_t		*ct;
70397c478bd9Sstevel@tonic-gate 
70407c478bd9Sstevel@tonic-gate 	/*
70417c478bd9Sstevel@tonic-gate 	 * Handling ndi_devi_config_one and ndi_devi_unconfig_one.
70427c478bd9Sstevel@tonic-gate 	 * Power up pHCI for the named client device.
70437c478bd9Sstevel@tonic-gate 	 * Note: Before the client is enumerated under vhci by phci,
70447c478bd9Sstevel@tonic-gate 	 * client_dip can be NULL. Then proceed to power up all the
70457c478bd9Sstevel@tonic-gate 	 * pHCIs.
70467c478bd9Sstevel@tonic-gate 	 */
70477c478bd9Sstevel@tonic-gate 	if (devnm != NULL) {
70487c478bd9Sstevel@tonic-gate 		ndi_devi_enter(vdip, &circ);
70497c478bd9Sstevel@tonic-gate 		client_dip = ndi_devi_findchild(vdip, devnm);
70507c478bd9Sstevel@tonic-gate 	}
70517c478bd9Sstevel@tonic-gate 
70524c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, vdip,
70534c06356bSdh142964 	    "op = %d %s %p", op, devnm ? devnm : "", (void *)client_dip));
70547c478bd9Sstevel@tonic-gate 
70557c478bd9Sstevel@tonic-gate 	switch (op) {
70567c478bd9Sstevel@tonic-gate 	case MDI_PM_PRE_CONFIG:
70577c478bd9Sstevel@tonic-gate 		ret = i_mdi_pm_pre_config(vdip, client_dip);
7058c73a93f2Sdm120769 		break;
70595e3986cbScth 
70607c478bd9Sstevel@tonic-gate 	case MDI_PM_PRE_UNCONFIG:
70617c478bd9Sstevel@tonic-gate 		ret = i_mdi_pm_pre_unconfig(vdip, client_dip, (int *)args,
70627c478bd9Sstevel@tonic-gate 		    flags);
7063c73a93f2Sdm120769 		break;
70645e3986cbScth 
70657c478bd9Sstevel@tonic-gate 	case MDI_PM_POST_CONFIG:
70667c478bd9Sstevel@tonic-gate 		i_mdi_pm_post_config(vdip, client_dip);
7067c73a93f2Sdm120769 		break;
70685e3986cbScth 
70697c478bd9Sstevel@tonic-gate 	case MDI_PM_POST_UNCONFIG:
70707c478bd9Sstevel@tonic-gate 		i_mdi_pm_post_unconfig(vdip, client_dip, *(int *)args);
7071c73a93f2Sdm120769 		break;
70725e3986cbScth 
70737c478bd9Sstevel@tonic-gate 	case MDI_PM_HOLD_POWER:
70747c478bd9Sstevel@tonic-gate 	case MDI_PM_RELE_POWER:
70757c478bd9Sstevel@tonic-gate 		ASSERT(args);
70767c478bd9Sstevel@tonic-gate 
70777c478bd9Sstevel@tonic-gate 		client_dip = (dev_info_t *)args;
70787c478bd9Sstevel@tonic-gate 		ASSERT(MDI_CLIENT(client_dip));
70797c478bd9Sstevel@tonic-gate 
70807c478bd9Sstevel@tonic-gate 		ct = i_devi_get_client(client_dip);
70817c478bd9Sstevel@tonic-gate 		MDI_CLIENT_LOCK(ct);
70827c478bd9Sstevel@tonic-gate 
70837c478bd9Sstevel@tonic-gate 		if (op == MDI_PM_HOLD_POWER) {
70847c478bd9Sstevel@tonic-gate 			if (ct->ct_power_cnt == 0) {
70857c478bd9Sstevel@tonic-gate 				(void) i_mdi_power_all_phci(ct);
70864c06356bSdh142964 				MDI_DEBUG(4, (MDI_NOTE, client_dip,
70874c06356bSdh142964 				    "i_mdi_pm_hold_client\n"));
70887c478bd9Sstevel@tonic-gate 				i_mdi_pm_hold_client(ct, ct->ct_path_count);
70897c478bd9Sstevel@tonic-gate 			}
70907c478bd9Sstevel@tonic-gate 		} else {
70917c478bd9Sstevel@tonic-gate 			if (DEVI_IS_ATTACHING(ct->ct_dip)) {
70924c06356bSdh142964 				MDI_DEBUG(4, (MDI_NOTE, client_dip,
70934c06356bSdh142964 				    "i_mdi_pm_rele_client\n"));
70947c478bd9Sstevel@tonic-gate 				i_mdi_pm_rele_client(ct, ct->ct_path_count);
70957c478bd9Sstevel@tonic-gate 			} else {
70964c06356bSdh142964 				MDI_DEBUG(4, (MDI_NOTE, client_dip,
70974c06356bSdh142964 				    "i_mdi_pm_reset_client\n"));
70987c478bd9Sstevel@tonic-gate 				i_mdi_pm_reset_client(ct);
70997c478bd9Sstevel@tonic-gate 			}
71007c478bd9Sstevel@tonic-gate 		}
71017c478bd9Sstevel@tonic-gate 
71027c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
71037c478bd9Sstevel@tonic-gate 		break;
71045e3986cbScth 
71057c478bd9Sstevel@tonic-gate 	default:
71067c478bd9Sstevel@tonic-gate 		break;
71077c478bd9Sstevel@tonic-gate 	}
71087c478bd9Sstevel@tonic-gate 
71095e3986cbScth 	if (devnm)
71105e3986cbScth 		ndi_devi_exit(vdip, circ);
71115e3986cbScth 
71127c478bd9Sstevel@tonic-gate 	return (ret);
71137c478bd9Sstevel@tonic-gate }
71147c478bd9Sstevel@tonic-gate 
71157c478bd9Sstevel@tonic-gate int
71167c478bd9Sstevel@tonic-gate mdi_component_is_vhci(dev_info_t *dip, const char **mdi_class)
71177c478bd9Sstevel@tonic-gate {
71187c478bd9Sstevel@tonic-gate 	mdi_vhci_t *vhci;
71197c478bd9Sstevel@tonic-gate 
71207c478bd9Sstevel@tonic-gate 	if (!MDI_VHCI(dip))
71217c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
71227c478bd9Sstevel@tonic-gate 
71237c478bd9Sstevel@tonic-gate 	if (mdi_class) {
71247c478bd9Sstevel@tonic-gate 		vhci = DEVI(dip)->devi_mdi_xhci;
71257c478bd9Sstevel@tonic-gate 		ASSERT(vhci);
71267c478bd9Sstevel@tonic-gate 		*mdi_class = vhci->vh_class;
71277c478bd9Sstevel@tonic-gate 	}
71287c478bd9Sstevel@tonic-gate 
71297c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
71307c478bd9Sstevel@tonic-gate }
71317c478bd9Sstevel@tonic-gate 
71327c478bd9Sstevel@tonic-gate int
71337c478bd9Sstevel@tonic-gate mdi_component_is_phci(dev_info_t *dip, const char **mdi_class)
71347c478bd9Sstevel@tonic-gate {
71357c478bd9Sstevel@tonic-gate 	mdi_phci_t *phci;
71367c478bd9Sstevel@tonic-gate 
71377c478bd9Sstevel@tonic-gate 	if (!MDI_PHCI(dip))
71387c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
71397c478bd9Sstevel@tonic-gate 
71407c478bd9Sstevel@tonic-gate 	if (mdi_class) {
71417c478bd9Sstevel@tonic-gate 		phci = DEVI(dip)->devi_mdi_xhci;
71427c478bd9Sstevel@tonic-gate 		ASSERT(phci);
71437c478bd9Sstevel@tonic-gate 		*mdi_class = phci->ph_vhci->vh_class;
71447c478bd9Sstevel@tonic-gate 	}
71457c478bd9Sstevel@tonic-gate 
71467c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
71477c478bd9Sstevel@tonic-gate }
71487c478bd9Sstevel@tonic-gate 
71497c478bd9Sstevel@tonic-gate int
71507c478bd9Sstevel@tonic-gate mdi_component_is_client(dev_info_t *dip, const char **mdi_class)
71517c478bd9Sstevel@tonic-gate {
71527c478bd9Sstevel@tonic-gate 	mdi_client_t *client;
71537c478bd9Sstevel@tonic-gate 
71547c478bd9Sstevel@tonic-gate 	if (!MDI_CLIENT(dip))
71557c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
71567c478bd9Sstevel@tonic-gate 
71577c478bd9Sstevel@tonic-gate 	if (mdi_class) {
71587c478bd9Sstevel@tonic-gate 		client = DEVI(dip)->devi_mdi_client;
71597c478bd9Sstevel@tonic-gate 		ASSERT(client);
71607c478bd9Sstevel@tonic-gate 		*mdi_class = client->ct_vhci->vh_class;
71617c478bd9Sstevel@tonic-gate 	}
71627c478bd9Sstevel@tonic-gate 
71637c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
71647c478bd9Sstevel@tonic-gate }
71657c478bd9Sstevel@tonic-gate 
71667c478bd9Sstevel@tonic-gate void *
71677c478bd9Sstevel@tonic-gate mdi_client_get_vhci_private(dev_info_t *dip)
71687c478bd9Sstevel@tonic-gate {
71697c478bd9Sstevel@tonic-gate 	ASSERT(mdi_component_is_client(dip, NULL) == MDI_SUCCESS);
71707c478bd9Sstevel@tonic-gate 	if (mdi_component_is_client(dip, NULL) == MDI_SUCCESS) {
71717c478bd9Sstevel@tonic-gate 		mdi_client_t	*ct;
71727c478bd9Sstevel@tonic-gate 		ct = i_devi_get_client(dip);
71737c478bd9Sstevel@tonic-gate 		return (ct->ct_vprivate);
71747c478bd9Sstevel@tonic-gate 	}
71757c478bd9Sstevel@tonic-gate 	return (NULL);
71767c478bd9Sstevel@tonic-gate }
71777c478bd9Sstevel@tonic-gate 
71787c478bd9Sstevel@tonic-gate void
71797c478bd9Sstevel@tonic-gate mdi_client_set_vhci_private(dev_info_t *dip, void *data)
71807c478bd9Sstevel@tonic-gate {
71817c478bd9Sstevel@tonic-gate 	ASSERT(mdi_component_is_client(dip, NULL) == MDI_SUCCESS);
71827c478bd9Sstevel@tonic-gate 	if (mdi_component_is_client(dip, NULL) == MDI_SUCCESS) {
71837c478bd9Sstevel@tonic-gate 		mdi_client_t	*ct;
71847c478bd9Sstevel@tonic-gate 		ct = i_devi_get_client(dip);
71857c478bd9Sstevel@tonic-gate 		ct->ct_vprivate = data;
71867c478bd9Sstevel@tonic-gate 	}
71877c478bd9Sstevel@tonic-gate }
71887c478bd9Sstevel@tonic-gate /*
71897c478bd9Sstevel@tonic-gate  * mdi_pi_get_vhci_private():
71907c478bd9Sstevel@tonic-gate  *		Get the vhci private information associated with the
71917c478bd9Sstevel@tonic-gate  *		mdi_pathinfo node
71927c478bd9Sstevel@tonic-gate  */
71937c478bd9Sstevel@tonic-gate void *
71947c478bd9Sstevel@tonic-gate mdi_pi_get_vhci_private(mdi_pathinfo_t *pip)
71957c478bd9Sstevel@tonic-gate {
71967c478bd9Sstevel@tonic-gate 	caddr_t	vprivate = NULL;
71977c478bd9Sstevel@tonic-gate 	if (pip) {
71987c478bd9Sstevel@tonic-gate 		vprivate = MDI_PI(pip)->pi_vprivate;
71997c478bd9Sstevel@tonic-gate 	}
72007c478bd9Sstevel@tonic-gate 	return (vprivate);
72017c478bd9Sstevel@tonic-gate }
72027c478bd9Sstevel@tonic-gate 
72037c478bd9Sstevel@tonic-gate /*
72047c478bd9Sstevel@tonic-gate  * mdi_pi_set_vhci_private():
72057c478bd9Sstevel@tonic-gate  *		Set the vhci private information in the mdi_pathinfo node
72067c478bd9Sstevel@tonic-gate  */
72077c478bd9Sstevel@tonic-gate void
72087c478bd9Sstevel@tonic-gate mdi_pi_set_vhci_private(mdi_pathinfo_t *pip, void *priv)
72097c478bd9Sstevel@tonic-gate {
72107c478bd9Sstevel@tonic-gate 	if (pip) {
72117c478bd9Sstevel@tonic-gate 		MDI_PI(pip)->pi_vprivate = priv;
72127c478bd9Sstevel@tonic-gate 	}
72137c478bd9Sstevel@tonic-gate }
72147c478bd9Sstevel@tonic-gate 
72157c478bd9Sstevel@tonic-gate /*
72167c478bd9Sstevel@tonic-gate  * mdi_phci_get_vhci_private():
72177c478bd9Sstevel@tonic-gate  *		Get the vhci private information associated with the
72187c478bd9Sstevel@tonic-gate  *		mdi_phci node
72197c478bd9Sstevel@tonic-gate  */
72207c478bd9Sstevel@tonic-gate void *
72217c478bd9Sstevel@tonic-gate mdi_phci_get_vhci_private(dev_info_t *dip)
72227c478bd9Sstevel@tonic-gate {
72237c478bd9Sstevel@tonic-gate 	ASSERT(mdi_component_is_phci(dip, NULL) == MDI_SUCCESS);
72247c478bd9Sstevel@tonic-gate 	if (mdi_component_is_phci(dip, NULL) == MDI_SUCCESS) {
72257c478bd9Sstevel@tonic-gate 		mdi_phci_t	*ph;
72267c478bd9Sstevel@tonic-gate 		ph = i_devi_get_phci(dip);
72277c478bd9Sstevel@tonic-gate 		return (ph->ph_vprivate);
72287c478bd9Sstevel@tonic-gate 	}
72297c478bd9Sstevel@tonic-gate 	return (NULL);
72307c478bd9Sstevel@tonic-gate }
72317c478bd9Sstevel@tonic-gate 
72327c478bd9Sstevel@tonic-gate /*
72337c478bd9Sstevel@tonic-gate  * mdi_phci_set_vhci_private():
72347c478bd9Sstevel@tonic-gate  *		Set the vhci private information in the mdi_phci node
72357c478bd9Sstevel@tonic-gate  */
72367c478bd9Sstevel@tonic-gate void
72377c478bd9Sstevel@tonic-gate mdi_phci_set_vhci_private(dev_info_t *dip, void *priv)
72387c478bd9Sstevel@tonic-gate {
72397c478bd9Sstevel@tonic-gate 	ASSERT(mdi_component_is_phci(dip, NULL) == MDI_SUCCESS);
72407c478bd9Sstevel@tonic-gate 	if (mdi_component_is_phci(dip, NULL) == MDI_SUCCESS) {
72417c478bd9Sstevel@tonic-gate 		mdi_phci_t	*ph;
72427c478bd9Sstevel@tonic-gate 		ph = i_devi_get_phci(dip);
72437c478bd9Sstevel@tonic-gate 		ph->ph_vprivate = priv;
72447c478bd9Sstevel@tonic-gate 	}
72457c478bd9Sstevel@tonic-gate }
72463c34adc5Sramat 
72474c06356bSdh142964 int
72484c06356bSdh142964 mdi_pi_ishidden(mdi_pathinfo_t *pip)
72494c06356bSdh142964 {
72504c06356bSdh142964 	return (MDI_PI_FLAGS_IS_HIDDEN(pip));
72514c06356bSdh142964 }
72524c06356bSdh142964 
72534c06356bSdh142964 int
72544c06356bSdh142964 mdi_pi_device_isremoved(mdi_pathinfo_t *pip)
72554c06356bSdh142964 {
72564c06356bSdh142964 	return (MDI_PI_FLAGS_IS_DEVICE_REMOVED(pip));
72574c06356bSdh142964 }
72584c06356bSdh142964 
72594c06356bSdh142964 /*
72604c06356bSdh142964  * When processing hotplug, if mdi_pi_offline-mdi_pi_free fails then this
72614c06356bSdh142964  * interface is used to represent device removal.
72624c06356bSdh142964  */
72634c06356bSdh142964 int
72644c06356bSdh142964 mdi_pi_device_remove(mdi_pathinfo_t *pip)
72654c06356bSdh142964 {
72664c06356bSdh142964 	MDI_PI_LOCK(pip);
72674c06356bSdh142964 	if (mdi_pi_device_isremoved(pip)) {
72684c06356bSdh142964 		MDI_PI_UNLOCK(pip);
72694c06356bSdh142964 		return (0);
72704c06356bSdh142964 	}
72714c06356bSdh142964 	MDI_PI_FLAGS_SET_DEVICE_REMOVED(pip);
72724c06356bSdh142964 	MDI_PI_FLAGS_SET_HIDDEN(pip);
72734c06356bSdh142964 	MDI_PI_UNLOCK(pip);
72744c06356bSdh142964 
72754c06356bSdh142964 	i_ddi_di_cache_invalidate();
72764c06356bSdh142964 
72774c06356bSdh142964 	return (1);
72784c06356bSdh142964 }
72794c06356bSdh142964 
72804c06356bSdh142964 /*
72814c06356bSdh142964  * When processing hotplug, if a path marked mdi_pi_device_isremoved()
72824c06356bSdh142964  * is now accessible then this interfaces is used to represent device insertion.
72834c06356bSdh142964  */
72844c06356bSdh142964 int
72854c06356bSdh142964 mdi_pi_device_insert(mdi_pathinfo_t *pip)
72864c06356bSdh142964 {
72874c06356bSdh142964 	MDI_PI_LOCK(pip);
72884c06356bSdh142964 	if (!mdi_pi_device_isremoved(pip)) {
72894c06356bSdh142964 		MDI_PI_UNLOCK(pip);
72904c06356bSdh142964 		return (0);
72914c06356bSdh142964 	}
72924c06356bSdh142964 	MDI_PI_FLAGS_CLR_DEVICE_REMOVED(pip);
72934c06356bSdh142964 	MDI_PI_FLAGS_CLR_HIDDEN(pip);
72944c06356bSdh142964 	MDI_PI_UNLOCK(pip);
72954c06356bSdh142964 
72964c06356bSdh142964 	i_ddi_di_cache_invalidate();
72974c06356bSdh142964 
72984c06356bSdh142964 	return (1);
72994c06356bSdh142964 }
73004c06356bSdh142964 
73013c34adc5Sramat /*
73023c34adc5Sramat  * List of vhci class names:
73033c34adc5Sramat  * A vhci class name must be in this list only if the corresponding vhci
73043c34adc5Sramat  * driver intends to use the mdi provided bus config implementation
73053c34adc5Sramat  * (i.e., mdi_vhci_bus_config()).
73063c34adc5Sramat  */
73073c34adc5Sramat static char *vhci_class_list[] = { MDI_HCI_CLASS_SCSI, MDI_HCI_CLASS_IB };
73083c34adc5Sramat #define	N_VHCI_CLASSES	(sizeof (vhci_class_list) / sizeof (char *))
73093c34adc5Sramat 
73103c34adc5Sramat /*
73113c34adc5Sramat  * During boot time, the on-disk vhci cache for every vhci class is read
73123c34adc5Sramat  * in the form of an nvlist and stored here.
73133c34adc5Sramat  */
73143c34adc5Sramat static nvlist_t *vhcache_nvl[N_VHCI_CLASSES];
73153c34adc5Sramat 
73163c34adc5Sramat /* nvpair names in vhci cache nvlist */
73173c34adc5Sramat #define	MDI_VHCI_CACHE_VERSION	1
73183c34adc5Sramat #define	MDI_NVPNAME_VERSION	"version"
73193c34adc5Sramat #define	MDI_NVPNAME_PHCIS	"phcis"
73203c34adc5Sramat #define	MDI_NVPNAME_CTADDRMAP	"clientaddrmap"
73213c34adc5Sramat 
73223c34adc5Sramat /*
73233c34adc5Sramat  * Given vhci class name, return its on-disk vhci cache filename.
73243c34adc5Sramat  * Memory for the returned filename which includes the full path is allocated
73253c34adc5Sramat  * by this function.
73263c34adc5Sramat  */
73273c34adc5Sramat static char *
73283c34adc5Sramat vhclass2vhcache_filename(char *vhclass)
73293c34adc5Sramat {
73303c34adc5Sramat 	char *filename;
73313c34adc5Sramat 	int len;
73323c34adc5Sramat 	static char *fmt = "/etc/devices/mdi_%s_cache";
73333c34adc5Sramat 
73343c34adc5Sramat 	/*
73353c34adc5Sramat 	 * fmt contains the on-disk vhci cache file name format;
73363c34adc5Sramat 	 * for scsi_vhci the filename is "/etc/devices/mdi_scsi_vhci_cache".
73373c34adc5Sramat 	 */
73383c34adc5Sramat 
73393c34adc5Sramat 	/* the -1 below is to account for "%s" in the format string */
73403c34adc5Sramat 	len = strlen(fmt) + strlen(vhclass) - 1;
73413c34adc5Sramat 	filename = kmem_alloc(len, KM_SLEEP);
73423c34adc5Sramat 	(void) snprintf(filename, len, fmt, vhclass);
73433c34adc5Sramat 	ASSERT(len == (strlen(filename) + 1));
73443c34adc5Sramat 	return (filename);
73453c34adc5Sramat }
73463c34adc5Sramat 
73473c34adc5Sramat /*
73483c34adc5Sramat  * initialize the vhci cache related data structures and read the on-disk
73493c34adc5Sramat  * vhci cached data into memory.
73503c34adc5Sramat  */
73513c34adc5Sramat static void
73523c34adc5Sramat setup_vhci_cache(mdi_vhci_t *vh)
73533c34adc5Sramat {
73543c34adc5Sramat 	mdi_vhci_config_t *vhc;
73553c34adc5Sramat 	mdi_vhci_cache_t *vhcache;
73563c34adc5Sramat 	int i;
73573c34adc5Sramat 	nvlist_t *nvl = NULL;
73583c34adc5Sramat 
73593c34adc5Sramat 	vhc = kmem_zalloc(sizeof (mdi_vhci_config_t), KM_SLEEP);
73603c34adc5Sramat 	vh->vh_config = vhc;
73613c34adc5Sramat 	vhcache = &vhc->vhc_vhcache;
73623c34adc5Sramat 
73633c34adc5Sramat 	vhc->vhc_vhcache_filename = vhclass2vhcache_filename(vh->vh_class);
73643c34adc5Sramat 
73653c34adc5Sramat 	mutex_init(&vhc->vhc_lock, NULL, MUTEX_DEFAULT, NULL);
73663c34adc5Sramat 	cv_init(&vhc->vhc_cv, NULL, CV_DRIVER, NULL);
73673c34adc5Sramat 
73683c34adc5Sramat 	rw_init(&vhcache->vhcache_lock, NULL, RW_DRIVER, NULL);
73693c34adc5Sramat 
73703c34adc5Sramat 	/*
73713c34adc5Sramat 	 * Create string hash; same as mod_hash_create_strhash() except that
73723c34adc5Sramat 	 * we use NULL key destructor.
73733c34adc5Sramat 	 */
73743c34adc5Sramat 	vhcache->vhcache_client_hash = mod_hash_create_extended(vh->vh_class,
73753c34adc5Sramat 	    mdi_bus_config_cache_hash_size,
73763c34adc5Sramat 	    mod_hash_null_keydtor, mod_hash_null_valdtor,
73773c34adc5Sramat 	    mod_hash_bystr, NULL, mod_hash_strkey_cmp, KM_SLEEP);
73783c34adc5Sramat 
73793c34adc5Sramat 	/*
73803c34adc5Sramat 	 * The on-disk vhci cache is read during booting prior to the
73813c34adc5Sramat 	 * lights-out period by mdi_read_devices_files().
73823c34adc5Sramat 	 */
73833c34adc5Sramat 	for (i = 0; i < N_VHCI_CLASSES; i++) {
73843c34adc5Sramat 		if (strcmp(vhci_class_list[i], vh->vh_class) == 0) {
73853c34adc5Sramat 			nvl = vhcache_nvl[i];
73863c34adc5Sramat 			vhcache_nvl[i] = NULL;
73873c34adc5Sramat 			break;
73883c34adc5Sramat 		}
73893c34adc5Sramat 	}
73903c34adc5Sramat 
73913c34adc5Sramat 	/*
73923c34adc5Sramat 	 * this is to cover the case of some one manually causing unloading
73933c34adc5Sramat 	 * (or detaching) and reloading (or attaching) of a vhci driver.
73943c34adc5Sramat 	 */
73953c34adc5Sramat 	if (nvl == NULL && modrootloaded)
73963c34adc5Sramat 		nvl = read_on_disk_vhci_cache(vh->vh_class);
73973c34adc5Sramat 
73983c34adc5Sramat 	if (nvl != NULL) {
73993c34adc5Sramat 		rw_enter(&vhcache->vhcache_lock, RW_WRITER);
74003c34adc5Sramat 		if (mainnvl_to_vhcache(vhcache, nvl) == MDI_SUCCESS)
74013c34adc5Sramat 			vhcache->vhcache_flags |= MDI_VHCI_CACHE_SETUP_DONE;
74023c34adc5Sramat 		else  {
74033c34adc5Sramat 			cmn_err(CE_WARN,
74044c06356bSdh142964 			    "%s: data file corrupted, will recreate",
74053c34adc5Sramat 			    vhc->vhc_vhcache_filename);
74063c34adc5Sramat 		}
74073c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
74083c34adc5Sramat 		nvlist_free(nvl);
74093c34adc5Sramat 	}
74103c34adc5Sramat 
74113c34adc5Sramat 	vhc->vhc_cbid = callb_add(stop_vhcache_flush_thread, vhc,
74123c34adc5Sramat 	    CB_CL_UADMIN_PRE_VFS, "mdi_vhcache_flush");
741367e56d35Sramat 
741467e56d35Sramat 	vhc->vhc_path_discovery_boot = mdi_path_discovery_boot;
741567e56d35Sramat 	vhc->vhc_path_discovery_postboot = mdi_path_discovery_postboot;
74163c34adc5Sramat }
74173c34adc5Sramat 
74183c34adc5Sramat /*
74193c34adc5Sramat  * free all vhci cache related resources
74203c34adc5Sramat  */
74213c34adc5Sramat static int
74223c34adc5Sramat destroy_vhci_cache(mdi_vhci_t *vh)
74233c34adc5Sramat {
74243c34adc5Sramat 	mdi_vhci_config_t *vhc = vh->vh_config;
74253c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
74263c34adc5Sramat 	mdi_vhcache_phci_t *cphci, *cphci_next;
74273c34adc5Sramat 	mdi_vhcache_client_t *cct, *cct_next;
74283c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi, *cpi_next;
74293c34adc5Sramat 
74303c34adc5Sramat 	if (stop_vhcache_async_threads(vhc) != MDI_SUCCESS)
74313c34adc5Sramat 		return (MDI_FAILURE);
74323c34adc5Sramat 
74333c34adc5Sramat 	kmem_free(vhc->vhc_vhcache_filename,
74343c34adc5Sramat 	    strlen(vhc->vhc_vhcache_filename) + 1);
74353c34adc5Sramat 
74363c34adc5Sramat 	mod_hash_destroy_strhash(vhcache->vhcache_client_hash);
74373c34adc5Sramat 
74383c34adc5Sramat 	for (cphci = vhcache->vhcache_phci_head; cphci != NULL;
74393c34adc5Sramat 	    cphci = cphci_next) {
74403c34adc5Sramat 		cphci_next = cphci->cphci_next;
74413c34adc5Sramat 		free_vhcache_phci(cphci);
74423c34adc5Sramat 	}
74433c34adc5Sramat 
74443c34adc5Sramat 	for (cct = vhcache->vhcache_client_head; cct != NULL; cct = cct_next) {
74453c34adc5Sramat 		cct_next = cct->cct_next;
74463c34adc5Sramat 		for (cpi = cct->cct_cpi_head; cpi != NULL; cpi = cpi_next) {
74473c34adc5Sramat 			cpi_next = cpi->cpi_next;
74483c34adc5Sramat 			free_vhcache_pathinfo(cpi);
74493c34adc5Sramat 		}
74503c34adc5Sramat 		free_vhcache_client(cct);
74513c34adc5Sramat 	}
74523c34adc5Sramat 
74533c34adc5Sramat 	rw_destroy(&vhcache->vhcache_lock);
74543c34adc5Sramat 
74553c34adc5Sramat 	mutex_destroy(&vhc->vhc_lock);
74563c34adc5Sramat 	cv_destroy(&vhc->vhc_cv);
74573c34adc5Sramat 	kmem_free(vhc, sizeof (mdi_vhci_config_t));
74583c34adc5Sramat 	return (MDI_SUCCESS);
74593c34adc5Sramat }
74603c34adc5Sramat 
74613c34adc5Sramat /*
74623c34adc5Sramat  * Stop all vhci cache related async threads and free their resources.
74633c34adc5Sramat  */
74643c34adc5Sramat static int
74653c34adc5Sramat stop_vhcache_async_threads(mdi_vhci_config_t *vhc)
74663c34adc5Sramat {
74673c34adc5Sramat 	mdi_async_client_config_t *acc, *acc_next;
74683c34adc5Sramat 
74693c34adc5Sramat 	mutex_enter(&vhc->vhc_lock);
74703c34adc5Sramat 	vhc->vhc_flags |= MDI_VHC_EXIT;
74713c34adc5Sramat 	ASSERT(vhc->vhc_acc_thrcount >= 0);
74723c34adc5Sramat 	cv_broadcast(&vhc->vhc_cv);
74733c34adc5Sramat 
74743c34adc5Sramat 	while ((vhc->vhc_flags & MDI_VHC_VHCACHE_FLUSH_THREAD) ||
74753c34adc5Sramat 	    vhc->vhc_acc_thrcount != 0) {
74763c34adc5Sramat 		mutex_exit(&vhc->vhc_lock);
74774c06356bSdh142964 		delay_random(5);
74783c34adc5Sramat 		mutex_enter(&vhc->vhc_lock);
74793c34adc5Sramat 	}
74803c34adc5Sramat 
74813c34adc5Sramat 	vhc->vhc_flags &= ~MDI_VHC_EXIT;
74823c34adc5Sramat 
74833c34adc5Sramat 	for (acc = vhc->vhc_acc_list_head; acc != NULL; acc = acc_next) {
74843c34adc5Sramat 		acc_next = acc->acc_next;
74853c34adc5Sramat 		free_async_client_config(acc);
74863c34adc5Sramat 	}
74873c34adc5Sramat 	vhc->vhc_acc_list_head = NULL;
74883c34adc5Sramat 	vhc->vhc_acc_list_tail = NULL;
74893c34adc5Sramat 	vhc->vhc_acc_count = 0;
74903c34adc5Sramat 
74913c34adc5Sramat 	if (vhc->vhc_flags & MDI_VHC_VHCACHE_DIRTY) {
74923c34adc5Sramat 		vhc->vhc_flags &= ~MDI_VHC_VHCACHE_DIRTY;
74933c34adc5Sramat 		mutex_exit(&vhc->vhc_lock);
74943c34adc5Sramat 		if (flush_vhcache(vhc, 0) != MDI_SUCCESS) {
74953c34adc5Sramat 			vhcache_dirty(vhc);
74963c34adc5Sramat 			return (MDI_FAILURE);
74973c34adc5Sramat 		}
74983c34adc5Sramat 	} else
74993c34adc5Sramat 		mutex_exit(&vhc->vhc_lock);
75003c34adc5Sramat 
75013c34adc5Sramat 	if (callb_delete(vhc->vhc_cbid) != 0)
75023c34adc5Sramat 		return (MDI_FAILURE);
75033c34adc5Sramat 
75043c34adc5Sramat 	return (MDI_SUCCESS);
75053c34adc5Sramat }
75063c34adc5Sramat 
75073c34adc5Sramat /*
75083c34adc5Sramat  * Stop vhci cache flush thread
75093c34adc5Sramat  */
75103c34adc5Sramat /* ARGSUSED */
75113c34adc5Sramat static boolean_t
75123c34adc5Sramat stop_vhcache_flush_thread(void *arg, int code)
75133c34adc5Sramat {
75143c34adc5Sramat 	mdi_vhci_config_t *vhc = (mdi_vhci_config_t *)arg;
75153c34adc5Sramat 
75163c34adc5Sramat 	mutex_enter(&vhc->vhc_lock);
75173c34adc5Sramat 	vhc->vhc_flags |= MDI_VHC_EXIT;
75183c34adc5Sramat 	cv_broadcast(&vhc->vhc_cv);
75193c34adc5Sramat 
75203c34adc5Sramat 	while (vhc->vhc_flags & MDI_VHC_VHCACHE_FLUSH_THREAD) {
75213c34adc5Sramat 		mutex_exit(&vhc->vhc_lock);
75224c06356bSdh142964 		delay_random(5);
75233c34adc5Sramat 		mutex_enter(&vhc->vhc_lock);
75243c34adc5Sramat 	}
75253c34adc5Sramat 
75263c34adc5Sramat 	if (vhc->vhc_flags & MDI_VHC_VHCACHE_DIRTY) {
75273c34adc5Sramat 		vhc->vhc_flags &= ~MDI_VHC_VHCACHE_DIRTY;
75283c34adc5Sramat 		mutex_exit(&vhc->vhc_lock);
75293c34adc5Sramat 		(void) flush_vhcache(vhc, 1);
75303c34adc5Sramat 	} else
75313c34adc5Sramat 		mutex_exit(&vhc->vhc_lock);
75323c34adc5Sramat 
75333c34adc5Sramat 	return (B_TRUE);
75343c34adc5Sramat }
75353c34adc5Sramat 
75363c34adc5Sramat /*
75373c34adc5Sramat  * Enqueue the vhcache phci (cphci) at the tail of the list
75383c34adc5Sramat  */
75393c34adc5Sramat static void
75403c34adc5Sramat enqueue_vhcache_phci(mdi_vhci_cache_t *vhcache, mdi_vhcache_phci_t *cphci)
75413c34adc5Sramat {
75423c34adc5Sramat 	cphci->cphci_next = NULL;
75433c34adc5Sramat 	if (vhcache->vhcache_phci_head == NULL)
75443c34adc5Sramat 		vhcache->vhcache_phci_head = cphci;
75453c34adc5Sramat 	else
75463c34adc5Sramat 		vhcache->vhcache_phci_tail->cphci_next = cphci;
75473c34adc5Sramat 	vhcache->vhcache_phci_tail = cphci;
75483c34adc5Sramat }
75493c34adc5Sramat 
75503c34adc5Sramat /*
75513c34adc5Sramat  * Enqueue the vhcache pathinfo (cpi) at the tail of the list
75523c34adc5Sramat  */
75533c34adc5Sramat static void
75543c34adc5Sramat enqueue_tail_vhcache_pathinfo(mdi_vhcache_client_t *cct,
75553c34adc5Sramat     mdi_vhcache_pathinfo_t *cpi)
75563c34adc5Sramat {
75573c34adc5Sramat 	cpi->cpi_next = NULL;
75583c34adc5Sramat 	if (cct->cct_cpi_head == NULL)
75593c34adc5Sramat 		cct->cct_cpi_head = cpi;
75603c34adc5Sramat 	else
75613c34adc5Sramat 		cct->cct_cpi_tail->cpi_next = cpi;
75623c34adc5Sramat 	cct->cct_cpi_tail = cpi;
75633c34adc5Sramat }
75643c34adc5Sramat 
75653c34adc5Sramat /*
75663c34adc5Sramat  * Enqueue the vhcache pathinfo (cpi) at the correct location in the
75673c34adc5Sramat  * ordered list. All cpis which do not have MDI_CPI_HINT_PATH_DOES_NOT_EXIST
75683c34adc5Sramat  * flag set come at the beginning of the list. All cpis which have this
75693c34adc5Sramat  * flag set come at the end of the list.
75703c34adc5Sramat  */
75713c34adc5Sramat static void
75723c34adc5Sramat enqueue_vhcache_pathinfo(mdi_vhcache_client_t *cct,
75733c34adc5Sramat     mdi_vhcache_pathinfo_t *newcpi)
75743c34adc5Sramat {
75753c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi, *prev_cpi;
75763c34adc5Sramat 
75773c34adc5Sramat 	if (cct->cct_cpi_head == NULL ||
75783c34adc5Sramat 	    (newcpi->cpi_flags & MDI_CPI_HINT_PATH_DOES_NOT_EXIST))
75793c34adc5Sramat 		enqueue_tail_vhcache_pathinfo(cct, newcpi);
75803c34adc5Sramat 	else {
75813c34adc5Sramat 		for (cpi = cct->cct_cpi_head, prev_cpi = NULL; cpi != NULL &&
75823c34adc5Sramat 		    !(cpi->cpi_flags & MDI_CPI_HINT_PATH_DOES_NOT_EXIST);
75833c34adc5Sramat 		    prev_cpi = cpi, cpi = cpi->cpi_next)
75843c34adc5Sramat 			;
75853c34adc5Sramat 
75863c34adc5Sramat 		if (prev_cpi == NULL)
75873c34adc5Sramat 			cct->cct_cpi_head = newcpi;
75883c34adc5Sramat 		else
75893c34adc5Sramat 			prev_cpi->cpi_next = newcpi;
75903c34adc5Sramat 
75913c34adc5Sramat 		newcpi->cpi_next = cpi;
75923c34adc5Sramat 
75933c34adc5Sramat 		if (cpi == NULL)
75943c34adc5Sramat 			cct->cct_cpi_tail = newcpi;
75953c34adc5Sramat 	}
75963c34adc5Sramat }
75973c34adc5Sramat 
75983c34adc5Sramat /*
75993c34adc5Sramat  * Enqueue the vhcache client (cct) at the tail of the list
76003c34adc5Sramat  */
76013c34adc5Sramat static void
76023c34adc5Sramat enqueue_vhcache_client(mdi_vhci_cache_t *vhcache,
76033c34adc5Sramat     mdi_vhcache_client_t *cct)
76043c34adc5Sramat {
76053c34adc5Sramat 	cct->cct_next = NULL;
76063c34adc5Sramat 	if (vhcache->vhcache_client_head == NULL)
76073c34adc5Sramat 		vhcache->vhcache_client_head = cct;
76083c34adc5Sramat 	else
76093c34adc5Sramat 		vhcache->vhcache_client_tail->cct_next = cct;
76103c34adc5Sramat 	vhcache->vhcache_client_tail = cct;
76113c34adc5Sramat }
76123c34adc5Sramat 
/*
 * Free an array of 'nelem' NUL-terminated strings along with the array
 * itself.  A NULL array is ignored, as are NULL elements within it.  Each
 * string is freed with a size of strlen() + 1.
 */
static void
free_string_array(char **str, int nelem)
{
	int idx;

	if (str == NULL)
		return;

	for (idx = 0; idx < nelem; idx++) {
		if (str[idx] == NULL)
			continue;
		kmem_free(str[idx], strlen(str[idx]) + 1);
	}

	kmem_free(str, sizeof (char *) * nelem);
}
76263c34adc5Sramat 
76273c34adc5Sramat static void
76283c34adc5Sramat free_vhcache_phci(mdi_vhcache_phci_t *cphci)
76293c34adc5Sramat {
76303c34adc5Sramat 	kmem_free(cphci->cphci_path, strlen(cphci->cphci_path) + 1);
76313c34adc5Sramat 	kmem_free(cphci, sizeof (*cphci));
76323c34adc5Sramat }
76333c34adc5Sramat 
76343c34adc5Sramat static void
76353c34adc5Sramat free_vhcache_pathinfo(mdi_vhcache_pathinfo_t *cpi)
76363c34adc5Sramat {
76373c34adc5Sramat 	kmem_free(cpi->cpi_addr, strlen(cpi->cpi_addr) + 1);
76383c34adc5Sramat 	kmem_free(cpi, sizeof (*cpi));
76393c34adc5Sramat }
76403c34adc5Sramat 
76413c34adc5Sramat static void
76423c34adc5Sramat free_vhcache_client(mdi_vhcache_client_t *cct)
76433c34adc5Sramat {
76443c34adc5Sramat 	kmem_free(cct->cct_name_addr, strlen(cct->cct_name_addr) + 1);
76453c34adc5Sramat 	kmem_free(cct, sizeof (*cct));
76463c34adc5Sramat }
76473c34adc5Sramat 
76483c34adc5Sramat static char *
76493c34adc5Sramat vhcache_mknameaddr(char *ct_name, char *ct_addr, int *ret_len)
76503c34adc5Sramat {
76513c34adc5Sramat 	char *name_addr;
76523c34adc5Sramat 	int len;
76533c34adc5Sramat 
76543c34adc5Sramat 	len = strlen(ct_name) + strlen(ct_addr) + 2;
76553c34adc5Sramat 	name_addr = kmem_alloc(len, KM_SLEEP);
76563c34adc5Sramat 	(void) snprintf(name_addr, len, "%s@%s", ct_name, ct_addr);
76573c34adc5Sramat 
76583c34adc5Sramat 	if (ret_len)
76593c34adc5Sramat 		*ret_len = len;
76603c34adc5Sramat 	return (name_addr);
76613c34adc5Sramat }
76623c34adc5Sramat 
76633c34adc5Sramat /*
76643c34adc5Sramat  * Copy the contents of paddrnvl to vhci cache.
76653c34adc5Sramat  * paddrnvl nvlist contains path information for a vhci client.
76663c34adc5Sramat  * See the comment in mainnvl_to_vhcache() for the format of this nvlist.
76673c34adc5Sramat  */
76683c34adc5Sramat static void
76693c34adc5Sramat paddrnvl_to_vhcache(nvlist_t *nvl, mdi_vhcache_phci_t *cphci_list[],
76703c34adc5Sramat     mdi_vhcache_client_t *cct)
76713c34adc5Sramat {
76723c34adc5Sramat 	nvpair_t *nvp = NULL;
76733c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi;
76743c34adc5Sramat 	uint_t nelem;
76753c34adc5Sramat 	uint32_t *val;
76763c34adc5Sramat 
76773c34adc5Sramat 	while ((nvp = nvlist_next_nvpair(nvl, nvp)) != NULL) {
76783c34adc5Sramat 		ASSERT(nvpair_type(nvp) == DATA_TYPE_UINT32_ARRAY);
76793c34adc5Sramat 		cpi = kmem_zalloc(sizeof (*cpi), KM_SLEEP);
76803c34adc5Sramat 		cpi->cpi_addr = i_ddi_strdup(nvpair_name(nvp), KM_SLEEP);
76813c34adc5Sramat 		(void) nvpair_value_uint32_array(nvp, &val, &nelem);
76823c34adc5Sramat 		ASSERT(nelem == 2);
76833c34adc5Sramat 		cpi->cpi_cphci = cphci_list[val[0]];
76843c34adc5Sramat 		cpi->cpi_flags = val[1];
76853c34adc5Sramat 		enqueue_tail_vhcache_pathinfo(cct, cpi);
76863c34adc5Sramat 	}
76873c34adc5Sramat }
76883c34adc5Sramat 
76893c34adc5Sramat /*
76903c34adc5Sramat  * Copy the contents of caddrmapnvl to vhci cache.
76913c34adc5Sramat  * caddrmapnvl nvlist contains vhci client address to phci client address
76923c34adc5Sramat  * mappings. See the comment in mainnvl_to_vhcache() for the format of
76933c34adc5Sramat  * this nvlist.
76943c34adc5Sramat  */
76953c34adc5Sramat static void
76963c34adc5Sramat caddrmapnvl_to_vhcache(mdi_vhci_cache_t *vhcache, nvlist_t *nvl,
76973c34adc5Sramat     mdi_vhcache_phci_t *cphci_list[])
76983c34adc5Sramat {
76993c34adc5Sramat 	nvpair_t *nvp = NULL;
77003c34adc5Sramat 	nvlist_t *paddrnvl;
77013c34adc5Sramat 	mdi_vhcache_client_t *cct;
77023c34adc5Sramat 
77033c34adc5Sramat 	while ((nvp = nvlist_next_nvpair(nvl, nvp)) != NULL) {
77043c34adc5Sramat 		ASSERT(nvpair_type(nvp) == DATA_TYPE_NVLIST);
77053c34adc5Sramat 		cct = kmem_zalloc(sizeof (*cct), KM_SLEEP);
77063c34adc5Sramat 		cct->cct_name_addr = i_ddi_strdup(nvpair_name(nvp), KM_SLEEP);
77073c34adc5Sramat 		(void) nvpair_value_nvlist(nvp, &paddrnvl);
77083c34adc5Sramat 		paddrnvl_to_vhcache(paddrnvl, cphci_list, cct);
77093c34adc5Sramat 		/* the client must contain at least one path */
77103c34adc5Sramat 		ASSERT(cct->cct_cpi_head != NULL);
77113c34adc5Sramat 
77123c34adc5Sramat 		enqueue_vhcache_client(vhcache, cct);
77133c34adc5Sramat 		(void) mod_hash_insert(vhcache->vhcache_client_hash,
77143c34adc5Sramat 		    (mod_hash_key_t)cct->cct_name_addr, (mod_hash_val_t)cct);
77153c34adc5Sramat 	}
77163c34adc5Sramat }
77173c34adc5Sramat 
77183c34adc5Sramat /*
77193c34adc5Sramat  * Copy the contents of the main nvlist to vhci cache.
77203c34adc5Sramat  *
77213c34adc5Sramat  * VHCI busconfig cached data is stored in the form of a nvlist on the disk.
77223c34adc5Sramat  * The nvlist contains the mappings between the vhci client addresses and
77233c34adc5Sramat  * their corresponding phci client addresses.
77243c34adc5Sramat  *
77253c34adc5Sramat  * The structure of the nvlist is as follows:
77263c34adc5Sramat  *
77273c34adc5Sramat  * Main nvlist:
77283c34adc5Sramat  *	NAME		TYPE		DATA
77293c34adc5Sramat  *	version		int32		version number
77303c34adc5Sramat  *	phcis		string array	array of phci paths
77313c34adc5Sramat  *	clientaddrmap	nvlist_t	c2paddrs_nvl (see below)
77323c34adc5Sramat  *
77333c34adc5Sramat  * structure of c2paddrs_nvl:
77343c34adc5Sramat  *	NAME		TYPE		DATA
77353c34adc5Sramat  *	caddr1		nvlist_t	paddrs_nvl1
77363c34adc5Sramat  *	caddr2		nvlist_t	paddrs_nvl2
77373c34adc5Sramat  *	...
77383c34adc5Sramat  * where caddr1, caddr2, ... are vhci client name and addresses in the
77393c34adc5Sramat  * form of "<clientname>@<clientaddress>".
77403c34adc5Sramat  * (for example: "ssd@2000002037cd9f72");
77413c34adc5Sramat  * paddrs_nvl1, paddrs_nvl2, .. are nvlists that contain path information.
77423c34adc5Sramat  *
77433c34adc5Sramat  * structure of paddrs_nvl:
77443c34adc5Sramat  *	NAME		TYPE		DATA
77453c34adc5Sramat  *	pi_addr1	uint32_array	(phci-id, cpi_flags)
77463c34adc5Sramat  *	pi_addr2	uint32_array	(phci-id, cpi_flags)
77473c34adc5Sramat  *	...
77483c34adc5Sramat  * where pi_addr1, pi_addr2, ... are bus specific addresses of pathinfo nodes
77493c34adc5Sramat  * (so called pi_addrs, for example: "w2100002037cd9f72,0");
77504c06356bSdh142964  * phci-ids are integers that identify pHCIs to which the
77513c34adc5Sramat  * the bus specific address belongs to. These integers are used as an index
77524c06356bSdh142964  * into to the phcis string array in the main nvlist to get the pHCI path.
77533c34adc5Sramat  */
77543c34adc5Sramat static int
77553c34adc5Sramat mainnvl_to_vhcache(mdi_vhci_cache_t *vhcache, nvlist_t *nvl)
77563c34adc5Sramat {
77573c34adc5Sramat 	char **phcis, **phci_namep;
77583c34adc5Sramat 	uint_t nphcis;
77593c34adc5Sramat 	mdi_vhcache_phci_t *cphci, **cphci_list;
77603c34adc5Sramat 	nvlist_t *caddrmapnvl;
77613c34adc5Sramat 	int32_t ver;
77623c34adc5Sramat 	int i;
77633c34adc5Sramat 	size_t cphci_list_size;
77643c34adc5Sramat 
77653c34adc5Sramat 	ASSERT(RW_WRITE_HELD(&vhcache->vhcache_lock));
77663c34adc5Sramat 
77673c34adc5Sramat 	if (nvlist_lookup_int32(nvl, MDI_NVPNAME_VERSION, &ver) != 0 ||
77683c34adc5Sramat 	    ver != MDI_VHCI_CACHE_VERSION)
77693c34adc5Sramat 		return (MDI_FAILURE);
77703c34adc5Sramat 
77713c34adc5Sramat 	if (nvlist_lookup_string_array(nvl, MDI_NVPNAME_PHCIS, &phcis,
77723c34adc5Sramat 	    &nphcis) != 0)
77733c34adc5Sramat 		return (MDI_SUCCESS);
77743c34adc5Sramat 
77753c34adc5Sramat 	ASSERT(nphcis > 0);
77763c34adc5Sramat 
77773c34adc5Sramat 	cphci_list_size = sizeof (mdi_vhcache_phci_t *) * nphcis;
77783c34adc5Sramat 	cphci_list = kmem_alloc(cphci_list_size, KM_SLEEP);
77793c34adc5Sramat 	for (i = 0, phci_namep = phcis; i < nphcis; i++, phci_namep++) {
77803c34adc5Sramat 		cphci = kmem_zalloc(sizeof (mdi_vhcache_phci_t), KM_SLEEP);
77813c34adc5Sramat 		cphci->cphci_path = i_ddi_strdup(*phci_namep, KM_SLEEP);
77823c34adc5Sramat 		enqueue_vhcache_phci(vhcache, cphci);
77833c34adc5Sramat 		cphci_list[i] = cphci;
77843c34adc5Sramat 	}
77853c34adc5Sramat 
77863c34adc5Sramat 	ASSERT(vhcache->vhcache_phci_head != NULL);
77873c34adc5Sramat 
77883c34adc5Sramat 	if (nvlist_lookup_nvlist(nvl, MDI_NVPNAME_CTADDRMAP, &caddrmapnvl) == 0)
77893c34adc5Sramat 		caddrmapnvl_to_vhcache(vhcache, caddrmapnvl, cphci_list);
77903c34adc5Sramat 
77913c34adc5Sramat 	kmem_free(cphci_list, cphci_list_size);
77923c34adc5Sramat 	return (MDI_SUCCESS);
77933c34adc5Sramat }
77943c34adc5Sramat 
77953c34adc5Sramat /*
77963c34adc5Sramat  * Build paddrnvl for the specified client using the information in the
77973c34adc5Sramat  * vhci cache and add it to the caddrmapnnvl.
77983c34adc5Sramat  * Returns 0 on success, errno on failure.
77993c34adc5Sramat  */
78003c34adc5Sramat static int
78013c34adc5Sramat vhcache_to_paddrnvl(mdi_vhci_cache_t *vhcache, mdi_vhcache_client_t *cct,
78023c34adc5Sramat     nvlist_t *caddrmapnvl)
78033c34adc5Sramat {
78043c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi;
78053c34adc5Sramat 	nvlist_t *nvl;
78063c34adc5Sramat 	int err;
78073c34adc5Sramat 	uint32_t val[2];
78083c34adc5Sramat 
78093c34adc5Sramat 	ASSERT(RW_LOCK_HELD(&vhcache->vhcache_lock));
78103c34adc5Sramat 
78113c34adc5Sramat 	if ((err = nvlist_alloc(&nvl, 0, KM_SLEEP)) != 0)
78123c34adc5Sramat 		return (err);
78133c34adc5Sramat 
78143c34adc5Sramat 	for (cpi = cct->cct_cpi_head; cpi != NULL; cpi = cpi->cpi_next) {
78153c34adc5Sramat 		val[0] = cpi->cpi_cphci->cphci_id;
78163c34adc5Sramat 		val[1] = cpi->cpi_flags;
78173c34adc5Sramat 		if ((err = nvlist_add_uint32_array(nvl, cpi->cpi_addr, val, 2))
78183c34adc5Sramat 		    != 0)
78193c34adc5Sramat 			goto out;
78203c34adc5Sramat 	}
78213c34adc5Sramat 
78223c34adc5Sramat 	err = nvlist_add_nvlist(caddrmapnvl, cct->cct_name_addr, nvl);
78233c34adc5Sramat out:
78243c34adc5Sramat 	nvlist_free(nvl);
78253c34adc5Sramat 	return (err);
78263c34adc5Sramat }
78273c34adc5Sramat 
78283c34adc5Sramat /*
78293c34adc5Sramat  * Build caddrmapnvl using the information in the vhci cache
78303c34adc5Sramat  * and add it to the mainnvl.
78313c34adc5Sramat  * Returns 0 on success, errno on failure.
78323c34adc5Sramat  */
78333c34adc5Sramat static int
78343c34adc5Sramat vhcache_to_caddrmapnvl(mdi_vhci_cache_t *vhcache, nvlist_t *mainnvl)
78353c34adc5Sramat {
78363c34adc5Sramat 	mdi_vhcache_client_t *cct;
78373c34adc5Sramat 	nvlist_t *nvl;
78383c34adc5Sramat 	int err;
78393c34adc5Sramat 
78403c34adc5Sramat 	ASSERT(RW_LOCK_HELD(&vhcache->vhcache_lock));
78413c34adc5Sramat 
78423c34adc5Sramat 	if ((err = nvlist_alloc(&nvl, NV_UNIQUE_NAME, KM_SLEEP)) != 0)
78433c34adc5Sramat 		return (err);
78443c34adc5Sramat 
78453c34adc5Sramat 	for (cct = vhcache->vhcache_client_head; cct != NULL;
78463c34adc5Sramat 	    cct = cct->cct_next) {
78473c34adc5Sramat 		if ((err = vhcache_to_paddrnvl(vhcache, cct, nvl)) != 0)
78483c34adc5Sramat 			goto out;
78493c34adc5Sramat 	}
78503c34adc5Sramat 
78513c34adc5Sramat 	err = nvlist_add_nvlist(mainnvl, MDI_NVPNAME_CTADDRMAP, nvl);
78523c34adc5Sramat out:
78533c34adc5Sramat 	nvlist_free(nvl);
78543c34adc5Sramat 	return (err);
78553c34adc5Sramat }
78563c34adc5Sramat 
78573c34adc5Sramat /*
78583c34adc5Sramat  * Build nvlist using the information in the vhci cache.
78593c34adc5Sramat  * See the comment in mainnvl_to_vhcache() for the format of the nvlist.
78603c34adc5Sramat  * Returns nvl on success, NULL on failure.
78613c34adc5Sramat  */
78623c34adc5Sramat static nvlist_t *
78633c34adc5Sramat vhcache_to_mainnvl(mdi_vhci_cache_t *vhcache)
78643c34adc5Sramat {
78653c34adc5Sramat 	mdi_vhcache_phci_t *cphci;
78663c34adc5Sramat 	uint_t phci_count;
78673c34adc5Sramat 	char **phcis;
78683c34adc5Sramat 	nvlist_t *nvl;
78693c34adc5Sramat 	int err, i;
78703c34adc5Sramat 
78713c34adc5Sramat 	if ((err = nvlist_alloc(&nvl, NV_UNIQUE_NAME, KM_SLEEP)) != 0) {
78723c34adc5Sramat 		nvl = NULL;
78733c34adc5Sramat 		goto out;
78743c34adc5Sramat 	}
78753c34adc5Sramat 
78763c34adc5Sramat 	if ((err = nvlist_add_int32(nvl, MDI_NVPNAME_VERSION,
78773c34adc5Sramat 	    MDI_VHCI_CACHE_VERSION)) != 0)
78783c34adc5Sramat 		goto out;
78793c34adc5Sramat 
78803c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_READER);
78813c34adc5Sramat 	if (vhcache->vhcache_phci_head == NULL) {
78823c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
78833c34adc5Sramat 		return (nvl);
78843c34adc5Sramat 	}
78853c34adc5Sramat 
78863c34adc5Sramat 	phci_count = 0;
78873c34adc5Sramat 	for (cphci = vhcache->vhcache_phci_head; cphci != NULL;
78883c34adc5Sramat 	    cphci = cphci->cphci_next)
78893c34adc5Sramat 		cphci->cphci_id = phci_count++;
78903c34adc5Sramat 
78913c34adc5Sramat 	/* build phci pathname list */
78923c34adc5Sramat 	phcis = kmem_alloc(sizeof (char *) * phci_count, KM_SLEEP);
78933c34adc5Sramat 	for (cphci = vhcache->vhcache_phci_head, i = 0; cphci != NULL;
78943c34adc5Sramat 	    cphci = cphci->cphci_next, i++)
78953c34adc5Sramat 		phcis[i] = i_ddi_strdup(cphci->cphci_path, KM_SLEEP);
78963c34adc5Sramat 
78973c34adc5Sramat 	err = nvlist_add_string_array(nvl, MDI_NVPNAME_PHCIS, phcis,
78983c34adc5Sramat 	    phci_count);
78993c34adc5Sramat 	free_string_array(phcis, phci_count);
79003c34adc5Sramat 
79013c34adc5Sramat 	if (err == 0 &&
79023c34adc5Sramat 	    (err = vhcache_to_caddrmapnvl(vhcache, nvl)) == 0) {
79033c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
79043c34adc5Sramat 		return (nvl);
79053c34adc5Sramat 	}
79063c34adc5Sramat 
79073c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
79083c34adc5Sramat out:
79093c34adc5Sramat 	if (nvl)
79103c34adc5Sramat 		nvlist_free(nvl);
79113c34adc5Sramat 	return (NULL);
79123c34adc5Sramat }
79133c34adc5Sramat 
79143c34adc5Sramat /*
79153c34adc5Sramat  * Lookup vhcache phci structure for the specified phci path.
79163c34adc5Sramat  */
79173c34adc5Sramat static mdi_vhcache_phci_t *
79183c34adc5Sramat lookup_vhcache_phci_by_name(mdi_vhci_cache_t *vhcache, char *phci_path)
79193c34adc5Sramat {
79203c34adc5Sramat 	mdi_vhcache_phci_t *cphci;
79213c34adc5Sramat 
79223c34adc5Sramat 	ASSERT(RW_LOCK_HELD(&vhcache->vhcache_lock));
79233c34adc5Sramat 
79243c34adc5Sramat 	for (cphci = vhcache->vhcache_phci_head; cphci != NULL;
79253c34adc5Sramat 	    cphci = cphci->cphci_next) {
79263c34adc5Sramat 		if (strcmp(cphci->cphci_path, phci_path) == 0)
79273c34adc5Sramat 			return (cphci);
79283c34adc5Sramat 	}
79293c34adc5Sramat 
79303c34adc5Sramat 	return (NULL);
79313c34adc5Sramat }
79323c34adc5Sramat 
79333c34adc5Sramat /*
79343c34adc5Sramat  * Lookup vhcache phci structure for the specified phci.
79353c34adc5Sramat  */
79363c34adc5Sramat static mdi_vhcache_phci_t *
79373c34adc5Sramat lookup_vhcache_phci_by_addr(mdi_vhci_cache_t *vhcache, mdi_phci_t *ph)
79383c34adc5Sramat {
79393c34adc5Sramat 	mdi_vhcache_phci_t *cphci;
79403c34adc5Sramat 
79413c34adc5Sramat 	ASSERT(RW_LOCK_HELD(&vhcache->vhcache_lock));
79423c34adc5Sramat 
79433c34adc5Sramat 	for (cphci = vhcache->vhcache_phci_head; cphci != NULL;
79443c34adc5Sramat 	    cphci = cphci->cphci_next) {
79453c34adc5Sramat 		if (cphci->cphci_phci == ph)
79463c34adc5Sramat 			return (cphci);
79473c34adc5Sramat 	}
79483c34adc5Sramat 
79493c34adc5Sramat 	return (NULL);
79503c34adc5Sramat }
79513c34adc5Sramat 
79523c34adc5Sramat /*
79533c34adc5Sramat  * Add the specified phci to the vhci cache if not already present.
79543c34adc5Sramat  */
79553c34adc5Sramat static void
79563c34adc5Sramat vhcache_phci_add(mdi_vhci_config_t *vhc, mdi_phci_t *ph)
79573c34adc5Sramat {
79583c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
79593c34adc5Sramat 	mdi_vhcache_phci_t *cphci;
79603c34adc5Sramat 	char *pathname;
79613c34adc5Sramat 	int cache_updated;
79623c34adc5Sramat 
79633c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_WRITER);
79643c34adc5Sramat 
79653c34adc5Sramat 	pathname = kmem_alloc(MAXPATHLEN, KM_SLEEP);
79663c34adc5Sramat 	(void) ddi_pathname(ph->ph_dip, pathname);
79673c34adc5Sramat 	if ((cphci = lookup_vhcache_phci_by_name(vhcache, pathname))
79683c34adc5Sramat 	    != NULL) {
79693c34adc5Sramat 		cphci->cphci_phci = ph;
79703c34adc5Sramat 		cache_updated = 0;
79713c34adc5Sramat 	} else {
79723c34adc5Sramat 		cphci = kmem_zalloc(sizeof (*cphci), KM_SLEEP);
79733c34adc5Sramat 		cphci->cphci_path = i_ddi_strdup(pathname, KM_SLEEP);
79743c34adc5Sramat 		cphci->cphci_phci = ph;
79753c34adc5Sramat 		enqueue_vhcache_phci(vhcache, cphci);
79763c34adc5Sramat 		cache_updated = 1;
79773c34adc5Sramat 	}
797867e56d35Sramat 
79793c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
79803c34adc5Sramat 
798167e56d35Sramat 	/*
798267e56d35Sramat 	 * Since a new phci has been added, reset
798367e56d35Sramat 	 * vhc_path_discovery_cutoff_time to allow for discovery of paths
798467e56d35Sramat 	 * during next vhcache_discover_paths().
798567e56d35Sramat 	 */
798667e56d35Sramat 	mutex_enter(&vhc->vhc_lock);
798767e56d35Sramat 	vhc->vhc_path_discovery_cutoff_time = 0;
798867e56d35Sramat 	mutex_exit(&vhc->vhc_lock);
798967e56d35Sramat 
79903c34adc5Sramat 	kmem_free(pathname, MAXPATHLEN);
79913c34adc5Sramat 	if (cache_updated)
79923c34adc5Sramat 		vhcache_dirty(vhc);
79933c34adc5Sramat }
79943c34adc5Sramat 
79953c34adc5Sramat /*
79963c34adc5Sramat  * Remove the reference to the specified phci from the vhci cache.
79973c34adc5Sramat  */
79983c34adc5Sramat static void
79993c34adc5Sramat vhcache_phci_remove(mdi_vhci_config_t *vhc, mdi_phci_t *ph)
80003c34adc5Sramat {
80013c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
80023c34adc5Sramat 	mdi_vhcache_phci_t *cphci;
80033c34adc5Sramat 
80043c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_WRITER);
80053c34adc5Sramat 	if ((cphci = lookup_vhcache_phci_by_addr(vhcache, ph)) != NULL) {
80063c34adc5Sramat 		/* do not remove the actual mdi_vhcache_phci structure */
80073c34adc5Sramat 		cphci->cphci_phci = NULL;
80083c34adc5Sramat 	}
80093c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
80103c34adc5Sramat }
80113c34adc5Sramat 
80123c34adc5Sramat static void
80133c34adc5Sramat init_vhcache_lookup_token(mdi_vhcache_lookup_token_t *dst,
80143c34adc5Sramat     mdi_vhcache_lookup_token_t *src)
80153c34adc5Sramat {
80163c34adc5Sramat 	if (src == NULL) {
80173c34adc5Sramat 		dst->lt_cct = NULL;
80183c34adc5Sramat 		dst->lt_cct_lookup_time = 0;
80193c34adc5Sramat 	} else {
80203c34adc5Sramat 		dst->lt_cct = src->lt_cct;
80213c34adc5Sramat 		dst->lt_cct_lookup_time = src->lt_cct_lookup_time;
80223c34adc5Sramat 	}
80233c34adc5Sramat }
80243c34adc5Sramat 
80253c34adc5Sramat /*
80263c34adc5Sramat  * Look up vhcache client for the specified client.
80273c34adc5Sramat  */
80283c34adc5Sramat static mdi_vhcache_client_t *
80293c34adc5Sramat lookup_vhcache_client(mdi_vhci_cache_t *vhcache, char *ct_name, char *ct_addr,
80303c34adc5Sramat     mdi_vhcache_lookup_token_t *token)
80313c34adc5Sramat {
80323c34adc5Sramat 	mod_hash_val_t hv;
80333c34adc5Sramat 	char *name_addr;
80343c34adc5Sramat 	int len;
80353c34adc5Sramat 
80363c34adc5Sramat 	ASSERT(RW_LOCK_HELD(&vhcache->vhcache_lock));
80373c34adc5Sramat 
80383c34adc5Sramat 	/*
80393c34adc5Sramat 	 * If no vhcache clean occurred since the last lookup, we can
80403c34adc5Sramat 	 * simply return the cct from the last lookup operation.
80413c34adc5Sramat 	 * It works because ccts are never freed except during the vhcache
80423c34adc5Sramat 	 * cleanup operation.
80433c34adc5Sramat 	 */
80443c34adc5Sramat 	if (token != NULL &&
80453c34adc5Sramat 	    vhcache->vhcache_clean_time < token->lt_cct_lookup_time)
80463c34adc5Sramat 		return (token->lt_cct);
80473c34adc5Sramat 
80483c34adc5Sramat 	name_addr = vhcache_mknameaddr(ct_name, ct_addr, &len);
80493c34adc5Sramat 	if (mod_hash_find(vhcache->vhcache_client_hash,
80503c34adc5Sramat 	    (mod_hash_key_t)name_addr, &hv) == 0) {
80513c34adc5Sramat 		if (token) {
80523c34adc5Sramat 			token->lt_cct = (mdi_vhcache_client_t *)hv;
80533c34adc5Sramat 			token->lt_cct_lookup_time = lbolt64;
80543c34adc5Sramat 		}
80553c34adc5Sramat 	} else {
80563c34adc5Sramat 		if (token) {
80573c34adc5Sramat 			token->lt_cct = NULL;
80583c34adc5Sramat 			token->lt_cct_lookup_time = 0;
80593c34adc5Sramat 		}
80603c34adc5Sramat 		hv = NULL;
80613c34adc5Sramat 	}
80623c34adc5Sramat 	kmem_free(name_addr, len);
80633c34adc5Sramat 	return ((mdi_vhcache_client_t *)hv);
80643c34adc5Sramat }
80653c34adc5Sramat 
80663c34adc5Sramat /*
80673c34adc5Sramat  * Add the specified path to the vhci cache if not already present.
80683c34adc5Sramat  * Also add the vhcache client for the client corresponding to this path
80693c34adc5Sramat  * if it doesn't already exist.
80703c34adc5Sramat  */
80713c34adc5Sramat static void
80723c34adc5Sramat vhcache_pi_add(mdi_vhci_config_t *vhc, struct mdi_pathinfo *pip)
80733c34adc5Sramat {
80743c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
80753c34adc5Sramat 	mdi_vhcache_client_t *cct;
80763c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi;
80773c34adc5Sramat 	mdi_phci_t *ph = pip->pi_phci;
80783c34adc5Sramat 	mdi_client_t *ct = pip->pi_client;
80793c34adc5Sramat 	int cache_updated = 0;
80803c34adc5Sramat 
80813c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_WRITER);
80823c34adc5Sramat 
80833c34adc5Sramat 	/* if vhcache client for this pip doesn't already exist, add it */
80843c34adc5Sramat 	if ((cct = lookup_vhcache_client(vhcache, ct->ct_drvname, ct->ct_guid,
80853c34adc5Sramat 	    NULL)) == NULL) {
80863c34adc5Sramat 		cct = kmem_zalloc(sizeof (*cct), KM_SLEEP);
80873c34adc5Sramat 		cct->cct_name_addr = vhcache_mknameaddr(ct->ct_drvname,
80883c34adc5Sramat 		    ct->ct_guid, NULL);
80893c34adc5Sramat 		enqueue_vhcache_client(vhcache, cct);
80903c34adc5Sramat 		(void) mod_hash_insert(vhcache->vhcache_client_hash,
80913c34adc5Sramat 		    (mod_hash_key_t)cct->cct_name_addr, (mod_hash_val_t)cct);
80923c34adc5Sramat 		cache_updated = 1;
80933c34adc5Sramat 	}
80943c34adc5Sramat 
80953c34adc5Sramat 	for (cpi = cct->cct_cpi_head; cpi != NULL; cpi = cpi->cpi_next) {
80963c34adc5Sramat 		if (cpi->cpi_cphci->cphci_phci == ph &&
80973c34adc5Sramat 		    strcmp(cpi->cpi_addr, pip->pi_addr) == 0) {
80983c34adc5Sramat 			cpi->cpi_pip = pip;
80993c34adc5Sramat 			if (cpi->cpi_flags & MDI_CPI_HINT_PATH_DOES_NOT_EXIST) {
81003c34adc5Sramat 				cpi->cpi_flags &=
81013c34adc5Sramat 				    ~MDI_CPI_HINT_PATH_DOES_NOT_EXIST;
81023c34adc5Sramat 				sort_vhcache_paths(cct);
81033c34adc5Sramat 				cache_updated = 1;
81043c34adc5Sramat 			}
81053c34adc5Sramat 			break;
81063c34adc5Sramat 		}
81073c34adc5Sramat 	}
81083c34adc5Sramat 
81093c34adc5Sramat 	if (cpi == NULL) {
81103c34adc5Sramat 		cpi = kmem_zalloc(sizeof (*cpi), KM_SLEEP);
81113c34adc5Sramat 		cpi->cpi_addr = i_ddi_strdup(pip->pi_addr, KM_SLEEP);
81123c34adc5Sramat 		cpi->cpi_cphci = lookup_vhcache_phci_by_addr(vhcache, ph);
81133c34adc5Sramat 		ASSERT(cpi->cpi_cphci != NULL);
81143c34adc5Sramat 		cpi->cpi_pip = pip;
81153c34adc5Sramat 		enqueue_vhcache_pathinfo(cct, cpi);
81163c34adc5Sramat 		cache_updated = 1;
81173c34adc5Sramat 	}
81183c34adc5Sramat 
81193c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
81203c34adc5Sramat 
81213c34adc5Sramat 	if (cache_updated)
81223c34adc5Sramat 		vhcache_dirty(vhc);
81233c34adc5Sramat }
81243c34adc5Sramat 
81253c34adc5Sramat /*
81263c34adc5Sramat  * Remove the reference to the specified path from the vhci cache.
81273c34adc5Sramat  */
81283c34adc5Sramat static void
81293c34adc5Sramat vhcache_pi_remove(mdi_vhci_config_t *vhc, struct mdi_pathinfo *pip)
81303c34adc5Sramat {
81313c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
81323c34adc5Sramat 	mdi_client_t *ct = pip->pi_client;
81333c34adc5Sramat 	mdi_vhcache_client_t *cct;
81343c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi;
81353c34adc5Sramat 
81363c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_WRITER);
81373c34adc5Sramat 	if ((cct = lookup_vhcache_client(vhcache, ct->ct_drvname, ct->ct_guid,
81383c34adc5Sramat 	    NULL)) != NULL) {
81393c34adc5Sramat 		for (cpi = cct->cct_cpi_head; cpi != NULL;
81403c34adc5Sramat 		    cpi = cpi->cpi_next) {
81413c34adc5Sramat 			if (cpi->cpi_pip == pip) {
81423c34adc5Sramat 				cpi->cpi_pip = NULL;
81433c34adc5Sramat 				break;
81443c34adc5Sramat 			}
81453c34adc5Sramat 		}
81463c34adc5Sramat 	}
81473c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
81483c34adc5Sramat }
81493c34adc5Sramat 
81503c34adc5Sramat /*
81513c34adc5Sramat  * Flush the vhci cache to disk.
81523c34adc5Sramat  * Returns MDI_SUCCESS on success, MDI_FAILURE on failure.
81533c34adc5Sramat  */
81543c34adc5Sramat static int
81553c34adc5Sramat flush_vhcache(mdi_vhci_config_t *vhc, int force_flag)
81563c34adc5Sramat {
81573c34adc5Sramat 	nvlist_t *nvl;
81583c34adc5Sramat 	int err;
81593c34adc5Sramat 	int rv;
81603c34adc5Sramat 
81613c34adc5Sramat 	/*
81623c34adc5Sramat 	 * It is possible that the system may shutdown before
81633c34adc5Sramat 	 * i_ddi_io_initialized (during stmsboot for example). To allow for
81643c34adc5Sramat 	 * flushing the cache in this case do not check for
81653c34adc5Sramat 	 * i_ddi_io_initialized when force flag is set.
81663c34adc5Sramat 	 */
81673c34adc5Sramat 	if (force_flag == 0 && !i_ddi_io_initialized())
81683c34adc5Sramat 		return (MDI_FAILURE);
81693c34adc5Sramat 
81703c34adc5Sramat 	if ((nvl = vhcache_to_mainnvl(&vhc->vhc_vhcache)) != NULL) {
81713c34adc5Sramat 		err = fwrite_nvlist(vhc->vhc_vhcache_filename, nvl);
81723c34adc5Sramat 		nvlist_free(nvl);
81733c34adc5Sramat 	} else
81743c34adc5Sramat 		err = EFAULT;
81753c34adc5Sramat 
81763c34adc5Sramat 	rv = MDI_SUCCESS;
81773c34adc5Sramat 	mutex_enter(&vhc->vhc_lock);
81783c34adc5Sramat 	if (err != 0) {
81793c34adc5Sramat 		if (err == EROFS) {
81803c34adc5Sramat 			vhc->vhc_flags |= MDI_VHC_READONLY_FS;
81813c34adc5Sramat 			vhc->vhc_flags &= ~(MDI_VHC_VHCACHE_FLUSH_ERROR |
81823c34adc5Sramat 			    MDI_VHC_VHCACHE_DIRTY);
81833c34adc5Sramat 		} else {
81843c34adc5Sramat 			if (!(vhc->vhc_flags & MDI_VHC_VHCACHE_FLUSH_ERROR)) {
81853c34adc5Sramat 				cmn_err(CE_CONT, "%s: update failed\n",
81863c34adc5Sramat 				    vhc->vhc_vhcache_filename);
81873c34adc5Sramat 				vhc->vhc_flags |= MDI_VHC_VHCACHE_FLUSH_ERROR;
81883c34adc5Sramat 			}
81893c34adc5Sramat 			rv = MDI_FAILURE;
81903c34adc5Sramat 		}
81913c34adc5Sramat 	} else if (vhc->vhc_flags & MDI_VHC_VHCACHE_FLUSH_ERROR) {
81923c34adc5Sramat 		cmn_err(CE_CONT,
81933c34adc5Sramat 		    "%s: update now ok\n", vhc->vhc_vhcache_filename);
81943c34adc5Sramat 		vhc->vhc_flags &= ~MDI_VHC_VHCACHE_FLUSH_ERROR;
81953c34adc5Sramat 	}
81963c34adc5Sramat 	mutex_exit(&vhc->vhc_lock);
81973c34adc5Sramat 
81983c34adc5Sramat 	return (rv);
81993c34adc5Sramat }
82003c34adc5Sramat 
82013c34adc5Sramat /*
82023c34adc5Sramat  * Call flush_vhcache() to flush the vhci cache at the scheduled time.
82033c34adc5Sramat  * Exits itself if left idle for the idle timeout period.
82043c34adc5Sramat  */
82053c34adc5Sramat static void
82063c34adc5Sramat vhcache_flush_thread(void *arg)
82073c34adc5Sramat {
82083c34adc5Sramat 	mdi_vhci_config_t *vhc = (mdi_vhci_config_t *)arg;
82093c34adc5Sramat 	clock_t idle_time, quit_at_ticks;
82103c34adc5Sramat 	callb_cpr_t cprinfo;
82113c34adc5Sramat 
82123c34adc5Sramat 	/* number of seconds to sleep idle before exiting */
82133c34adc5Sramat 	idle_time = mdi_vhcache_flush_daemon_idle_time * TICKS_PER_SECOND;
82143c34adc5Sramat 
82153c34adc5Sramat 	CALLB_CPR_INIT(&cprinfo, &vhc->vhc_lock, callb_generic_cpr,
82163c34adc5Sramat 	    "mdi_vhcache_flush");
82173c34adc5Sramat 	mutex_enter(&vhc->vhc_lock);
82183c34adc5Sramat 	for (; ; ) {
82193c34adc5Sramat 		while (!(vhc->vhc_flags & MDI_VHC_EXIT) &&
82203c34adc5Sramat 		    (vhc->vhc_flags & MDI_VHC_VHCACHE_DIRTY)) {
82213c34adc5Sramat 			if (ddi_get_lbolt() < vhc->vhc_flush_at_ticks) {
82223c34adc5Sramat 				CALLB_CPR_SAFE_BEGIN(&cprinfo);
82233c34adc5Sramat 				(void) cv_timedwait(&vhc->vhc_cv,
82243c34adc5Sramat 				    &vhc->vhc_lock, vhc->vhc_flush_at_ticks);
82253c34adc5Sramat 				CALLB_CPR_SAFE_END(&cprinfo, &vhc->vhc_lock);
82263c34adc5Sramat 			} else {
82273c34adc5Sramat 				vhc->vhc_flags &= ~MDI_VHC_VHCACHE_DIRTY;
82283c34adc5Sramat 				mutex_exit(&vhc->vhc_lock);
82293c34adc5Sramat 
82303c34adc5Sramat 				if (flush_vhcache(vhc, 0) != MDI_SUCCESS)
82313c34adc5Sramat 					vhcache_dirty(vhc);
82323c34adc5Sramat 
82333c34adc5Sramat 				mutex_enter(&vhc->vhc_lock);
82343c34adc5Sramat 			}
82353c34adc5Sramat 		}
82363c34adc5Sramat 
82373c34adc5Sramat 		quit_at_ticks = ddi_get_lbolt() + idle_time;
82383c34adc5Sramat 
82393c34adc5Sramat 		while (!(vhc->vhc_flags & MDI_VHC_EXIT) &&
82403c34adc5Sramat 		    !(vhc->vhc_flags & MDI_VHC_VHCACHE_DIRTY) &&
82413c34adc5Sramat 		    ddi_get_lbolt() < quit_at_ticks) {
82423c34adc5Sramat 			CALLB_CPR_SAFE_BEGIN(&cprinfo);
82433c34adc5Sramat 			(void) cv_timedwait(&vhc->vhc_cv, &vhc->vhc_lock,
82443c34adc5Sramat 			    quit_at_ticks);
82453c34adc5Sramat 			CALLB_CPR_SAFE_END(&cprinfo, &vhc->vhc_lock);
82463c34adc5Sramat 		}
82473c34adc5Sramat 
82483c34adc5Sramat 		if ((vhc->vhc_flags & MDI_VHC_EXIT) ||
82493c34adc5Sramat 		    !(vhc->vhc_flags & MDI_VHC_VHCACHE_DIRTY))
82503c34adc5Sramat 			goto out;
82513c34adc5Sramat 	}
82523c34adc5Sramat 
82533c34adc5Sramat out:
82543c34adc5Sramat 	vhc->vhc_flags &= ~MDI_VHC_VHCACHE_FLUSH_THREAD;
82553c34adc5Sramat 	/* CALLB_CPR_EXIT releases the vhc->vhc_lock */
82563c34adc5Sramat 	CALLB_CPR_EXIT(&cprinfo);
82573c34adc5Sramat }
82583c34adc5Sramat 
82593c34adc5Sramat /*
82603c34adc5Sramat  * Make vhci cache dirty and schedule flushing by vhcache flush thread.
82613c34adc5Sramat  */
82623c34adc5Sramat static void
82633c34adc5Sramat vhcache_dirty(mdi_vhci_config_t *vhc)
82643c34adc5Sramat {
82653c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
82663c34adc5Sramat 	int create_thread;
82673c34adc5Sramat 
82683c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_READER);
82693c34adc5Sramat 	/* do not flush cache until the cache is fully built */
82703c34adc5Sramat 	if (!(vhcache->vhcache_flags & MDI_VHCI_CACHE_SETUP_DONE)) {
82713c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
82723c34adc5Sramat 		return;
82733c34adc5Sramat 	}
82743c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
82753c34adc5Sramat 
82763c34adc5Sramat 	mutex_enter(&vhc->vhc_lock);
82773c34adc5Sramat 	if (vhc->vhc_flags & MDI_VHC_READONLY_FS) {
82783c34adc5Sramat 		mutex_exit(&vhc->vhc_lock);
82793c34adc5Sramat 		return;
82803c34adc5Sramat 	}
82813c34adc5Sramat 
82823c34adc5Sramat 	vhc->vhc_flags |= MDI_VHC_VHCACHE_DIRTY;
82833c34adc5Sramat 	vhc->vhc_flush_at_ticks = ddi_get_lbolt() +
82843c34adc5Sramat 	    mdi_vhcache_flush_delay * TICKS_PER_SECOND;
82853c34adc5Sramat 	if (vhc->vhc_flags & MDI_VHC_VHCACHE_FLUSH_THREAD) {
82863c34adc5Sramat 		cv_broadcast(&vhc->vhc_cv);
82873c34adc5Sramat 		create_thread = 0;
82883c34adc5Sramat 	} else {
82893c34adc5Sramat 		vhc->vhc_flags |= MDI_VHC_VHCACHE_FLUSH_THREAD;
82903c34adc5Sramat 		create_thread = 1;
82913c34adc5Sramat 	}
82923c34adc5Sramat 	mutex_exit(&vhc->vhc_lock);
82933c34adc5Sramat 
82943c34adc5Sramat 	if (create_thread)
82953c34adc5Sramat 		(void) thread_create(NULL, 0, vhcache_flush_thread, vhc,
82963c34adc5Sramat 		    0, &p0, TS_RUN, minclsyspri);
82973c34adc5Sramat }
82983c34adc5Sramat 
/*
 * phci bus config structure - one for each phci bus config operation that
 * we initiate on behalf of a vhci.
 */
struct mdi_vhci_bus_config_s;

struct mdi_phci_bus_config_s {
	char *phbc_phci_path;		/* path of the phci to configure */
	struct mdi_vhci_bus_config_s *phbc_vhbusconfig;	/* vhci bus config */
	struct mdi_phci_bus_config_s *phbc_next;	/* next in list */
};

typedef struct mdi_phci_bus_config_s mdi_phci_bus_config_t;
83083c34adc5Sramat 
83093c34adc5Sramat /* vhci bus config structure - one for each vhci bus config operation */
83103c34adc5Sramat typedef struct mdi_vhci_bus_config_s {
83113c34adc5Sramat 	ddi_bus_config_op_t vhbc_op;	/* bus config op */
83123c34adc5Sramat 	major_t vhbc_op_major;		/* bus config op major */
83133c34adc5Sramat 	uint_t vhbc_op_flags;		/* bus config op flags */
83143c34adc5Sramat 	kmutex_t vhbc_lock;
83153c34adc5Sramat 	kcondvar_t vhbc_cv;
83163c34adc5Sramat 	int vhbc_thr_count;
83173c34adc5Sramat } mdi_vhci_bus_config_t;
83183c34adc5Sramat 
83193c34adc5Sramat /*
83203c34adc5Sramat  * bus config the specified phci
83213c34adc5Sramat  */
83223c34adc5Sramat static void
83233c34adc5Sramat bus_config_phci(void *arg)
83243c34adc5Sramat {
83253c34adc5Sramat 	mdi_phci_bus_config_t *phbc = (mdi_phci_bus_config_t *)arg;
83263c34adc5Sramat 	mdi_vhci_bus_config_t *vhbc = phbc->phbc_vhbusconfig;
83273c34adc5Sramat 	dev_info_t *ph_dip;
83283c34adc5Sramat 
83293c34adc5Sramat 	/*
83303c34adc5Sramat 	 * first configure all path components upto phci and then configure
83313c34adc5Sramat 	 * the phci children.
83323c34adc5Sramat 	 */
83333c34adc5Sramat 	if ((ph_dip = e_ddi_hold_devi_by_path(phbc->phbc_phci_path, 0))
83343c34adc5Sramat 	    != NULL) {
83353c34adc5Sramat 		if (vhbc->vhbc_op == BUS_CONFIG_DRIVER ||
83363c34adc5Sramat 		    vhbc->vhbc_op == BUS_UNCONFIG_DRIVER) {
83373c34adc5Sramat 			(void) ndi_devi_config_driver(ph_dip,
83383c34adc5Sramat 			    vhbc->vhbc_op_flags,
83393c34adc5Sramat 			    vhbc->vhbc_op_major);
83403c34adc5Sramat 		} else
83413c34adc5Sramat 			(void) ndi_devi_config(ph_dip,
83423c34adc5Sramat 			    vhbc->vhbc_op_flags);
83433c34adc5Sramat 
83443c34adc5Sramat 		/* release the hold that e_ddi_hold_devi_by_path() placed */
83453c34adc5Sramat 		ndi_rele_devi(ph_dip);
83463c34adc5Sramat 	}
83473c34adc5Sramat 
83483c34adc5Sramat 	kmem_free(phbc->phbc_phci_path, strlen(phbc->phbc_phci_path) + 1);
83493c34adc5Sramat 	kmem_free(phbc, sizeof (*phbc));
83503c34adc5Sramat 
83513c34adc5Sramat 	mutex_enter(&vhbc->vhbc_lock);
83523c34adc5Sramat 	vhbc->vhbc_thr_count--;
83533c34adc5Sramat 	if (vhbc->vhbc_thr_count == 0)
83543c34adc5Sramat 		cv_broadcast(&vhbc->vhbc_cv);
83553c34adc5Sramat 	mutex_exit(&vhbc->vhbc_lock);
83563c34adc5Sramat }
83573c34adc5Sramat 
83583c34adc5Sramat /*
83593c34adc5Sramat  * Bus config all phcis associated with the vhci in parallel.
83603c34adc5Sramat  * op must be BUS_CONFIG_DRIVER or BUS_CONFIG_ALL.
83613c34adc5Sramat  */
83623c34adc5Sramat static void
83633c34adc5Sramat bus_config_all_phcis(mdi_vhci_cache_t *vhcache, uint_t flags,
83643c34adc5Sramat     ddi_bus_config_op_t op, major_t maj)
83653c34adc5Sramat {
83663c34adc5Sramat 	mdi_phci_bus_config_t *phbc_head = NULL, *phbc, *phbc_next;
83673c34adc5Sramat 	mdi_vhci_bus_config_t *vhbc;
83683c34adc5Sramat 	mdi_vhcache_phci_t *cphci;
83693c34adc5Sramat 
83703c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_READER);
83713c34adc5Sramat 	if (vhcache->vhcache_phci_head == NULL) {
83723c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
83733c34adc5Sramat 		return;
83743c34adc5Sramat 	}
83753c34adc5Sramat 
83763c34adc5Sramat 	vhbc = kmem_zalloc(sizeof (*vhbc), KM_SLEEP);
83773c34adc5Sramat 
83783c34adc5Sramat 	for (cphci = vhcache->vhcache_phci_head; cphci != NULL;
83793c34adc5Sramat 	    cphci = cphci->cphci_next) {
8380273f4511Sgp87344 		/* skip phcis that haven't attached before root is available */
8381273f4511Sgp87344 		if (!modrootloaded && (cphci->cphci_phci == NULL))
8382273f4511Sgp87344 			continue;
83833c34adc5Sramat 		phbc = kmem_zalloc(sizeof (*phbc), KM_SLEEP);
83843c34adc5Sramat 		phbc->phbc_phci_path = i_ddi_strdup(cphci->cphci_path,
83853c34adc5Sramat 		    KM_SLEEP);
83863c34adc5Sramat 		phbc->phbc_vhbusconfig = vhbc;
83873c34adc5Sramat 		phbc->phbc_next = phbc_head;
83883c34adc5Sramat 		phbc_head = phbc;
83893c34adc5Sramat 		vhbc->vhbc_thr_count++;
83903c34adc5Sramat 	}
83913c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
83923c34adc5Sramat 
83933c34adc5Sramat 	vhbc->vhbc_op = op;
83943c34adc5Sramat 	vhbc->vhbc_op_major = maj;
83953c34adc5Sramat 	vhbc->vhbc_op_flags = NDI_NO_EVENT |
83963c34adc5Sramat 	    (flags & (NDI_CONFIG_REPROBE | NDI_DRV_CONF_REPROBE));
83973c34adc5Sramat 	mutex_init(&vhbc->vhbc_lock, NULL, MUTEX_DEFAULT, NULL);
83983c34adc5Sramat 	cv_init(&vhbc->vhbc_cv, NULL, CV_DRIVER, NULL);
83993c34adc5Sramat 
84003c34adc5Sramat 	/* now create threads to initiate bus config on all phcis in parallel */
84013c34adc5Sramat 	for (phbc = phbc_head; phbc != NULL; phbc = phbc_next) {
84023c34adc5Sramat 		phbc_next = phbc->phbc_next;
84033c34adc5Sramat 		if (mdi_mtc_off)
84043c34adc5Sramat 			bus_config_phci((void *)phbc);
84053c34adc5Sramat 		else
84063c34adc5Sramat 			(void) thread_create(NULL, 0, bus_config_phci, phbc,
84073c34adc5Sramat 			    0, &p0, TS_RUN, minclsyspri);
84083c34adc5Sramat 	}
84093c34adc5Sramat 
84103c34adc5Sramat 	mutex_enter(&vhbc->vhbc_lock);
84113c34adc5Sramat 	/* wait until all threads exit */
84123c34adc5Sramat 	while (vhbc->vhbc_thr_count > 0)
84133c34adc5Sramat 		cv_wait(&vhbc->vhbc_cv, &vhbc->vhbc_lock);
84143c34adc5Sramat 	mutex_exit(&vhbc->vhbc_lock);
84153c34adc5Sramat 
84163c34adc5Sramat 	mutex_destroy(&vhbc->vhbc_lock);
84173c34adc5Sramat 	cv_destroy(&vhbc->vhbc_cv);
84183c34adc5Sramat 	kmem_free(vhbc, sizeof (*vhbc));
84193c34adc5Sramat }
84203c34adc5Sramat 
84213c34adc5Sramat /*
842267e56d35Sramat  * Single threaded version of bus_config_all_phcis()
842367e56d35Sramat  */
842467e56d35Sramat static void
842567e56d35Sramat st_bus_config_all_phcis(mdi_vhci_config_t *vhc, uint_t flags,
842667e56d35Sramat     ddi_bus_config_op_t op, major_t maj)
842767e56d35Sramat {
842867e56d35Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
842967e56d35Sramat 
843067e56d35Sramat 	single_threaded_vhconfig_enter(vhc);
843167e56d35Sramat 	bus_config_all_phcis(vhcache, flags, op, maj);
843267e56d35Sramat 	single_threaded_vhconfig_exit(vhc);
843367e56d35Sramat }
843467e56d35Sramat 
843567e56d35Sramat /*
84363c34adc5Sramat  * Perform BUS_CONFIG_ONE on the specified child of the phci.
84373c34adc5Sramat  * The path includes the child component in addition to the phci path.
84383c34adc5Sramat  */
84393c34adc5Sramat static int
84403c34adc5Sramat bus_config_one_phci_child(char *path)
84413c34adc5Sramat {
84423c34adc5Sramat 	dev_info_t *ph_dip, *child;
84433c34adc5Sramat 	char *devnm;
84443c34adc5Sramat 	int rv = MDI_FAILURE;
84453c34adc5Sramat 
84463c34adc5Sramat 	/* extract the child component of the phci */
84473c34adc5Sramat 	devnm = strrchr(path, '/');
84483c34adc5Sramat 	*devnm++ = '\0';
84493c34adc5Sramat 
84503c34adc5Sramat 	/*
84513c34adc5Sramat 	 * first configure all path components upto phci and then
84523c34adc5Sramat 	 * configure the phci child.
84533c34adc5Sramat 	 */
84543c34adc5Sramat 	if ((ph_dip = e_ddi_hold_devi_by_path(path, 0)) != NULL) {
84553c34adc5Sramat 		if (ndi_devi_config_one(ph_dip, devnm, &child, NDI_NO_EVENT) ==
84563c34adc5Sramat 		    NDI_SUCCESS) {
84573c34adc5Sramat 			/*
84583c34adc5Sramat 			 * release the hold that ndi_devi_config_one() placed
84593c34adc5Sramat 			 */
84603c34adc5Sramat 			ndi_rele_devi(child);
84613c34adc5Sramat 			rv = MDI_SUCCESS;
84623c34adc5Sramat 		}
84633c34adc5Sramat 
84643c34adc5Sramat 		/* release the hold that e_ddi_hold_devi_by_path() placed */
84653c34adc5Sramat 		ndi_rele_devi(ph_dip);
84663c34adc5Sramat 	}
84673c34adc5Sramat 
84683c34adc5Sramat 	devnm--;
84693c34adc5Sramat 	*devnm = '/';
84703c34adc5Sramat 	return (rv);
84713c34adc5Sramat }
84723c34adc5Sramat 
84733c34adc5Sramat /*
84743c34adc5Sramat  * Build a list of phci client paths for the specified vhci client.
84753c34adc5Sramat  * The list includes only those phci client paths which aren't configured yet.
84763c34adc5Sramat  */
84773c34adc5Sramat static mdi_phys_path_t *
84783c34adc5Sramat build_phclient_path_list(mdi_vhcache_client_t *cct, char *ct_name)
84793c34adc5Sramat {
84803c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi;
84813c34adc5Sramat 	mdi_phys_path_t *pp_head = NULL, *pp_tail = NULL, *pp;
84823c34adc5Sramat 	int config_path, len;
84833c34adc5Sramat 
84843c34adc5Sramat 	for (cpi = cct->cct_cpi_head; cpi != NULL; cpi = cpi->cpi_next) {
84853c34adc5Sramat 		/*
84863c34adc5Sramat 		 * include only those paths that aren't configured.
84873c34adc5Sramat 		 */
84883c34adc5Sramat 		config_path = 0;
84893c34adc5Sramat 		if (cpi->cpi_pip == NULL)
84903c34adc5Sramat 			config_path = 1;
84913c34adc5Sramat 		else {
84923c34adc5Sramat 			MDI_PI_LOCK(cpi->cpi_pip);
84933c34adc5Sramat 			if (MDI_PI_IS_INIT(cpi->cpi_pip))
84943c34adc5Sramat 				config_path = 1;
84953c34adc5Sramat 			MDI_PI_UNLOCK(cpi->cpi_pip);
84963c34adc5Sramat 		}
84973c34adc5Sramat 
84983c34adc5Sramat 		if (config_path) {
84993c34adc5Sramat 			pp = kmem_alloc(sizeof (*pp), KM_SLEEP);
85003c34adc5Sramat 			len = strlen(cpi->cpi_cphci->cphci_path) +
85013c34adc5Sramat 			    strlen(ct_name) + strlen(cpi->cpi_addr) + 3;
85023c34adc5Sramat 			pp->phys_path = kmem_alloc(len, KM_SLEEP);
85033c34adc5Sramat 			(void) snprintf(pp->phys_path, len, "%s/%s@%s",
85043c34adc5Sramat 			    cpi->cpi_cphci->cphci_path, ct_name,
85053c34adc5Sramat 			    cpi->cpi_addr);
85063c34adc5Sramat 			pp->phys_path_next = NULL;
85073c34adc5Sramat 
85083c34adc5Sramat 			if (pp_head == NULL)
85093c34adc5Sramat 				pp_head = pp;
85103c34adc5Sramat 			else
85113c34adc5Sramat 				pp_tail->phys_path_next = pp;
85123c34adc5Sramat 			pp_tail = pp;
85133c34adc5Sramat 		}
85143c34adc5Sramat 	}
85153c34adc5Sramat 
85163c34adc5Sramat 	return (pp_head);
85173c34adc5Sramat }
85183c34adc5Sramat 
85193c34adc5Sramat /*
85203c34adc5Sramat  * Free the memory allocated for phci client path list.
85213c34adc5Sramat  */
85223c34adc5Sramat static void
85233c34adc5Sramat free_phclient_path_list(mdi_phys_path_t *pp_head)
85243c34adc5Sramat {
85253c34adc5Sramat 	mdi_phys_path_t *pp, *pp_next;
85263c34adc5Sramat 
85273c34adc5Sramat 	for (pp = pp_head; pp != NULL; pp = pp_next) {
85283c34adc5Sramat 		pp_next = pp->phys_path_next;
85293c34adc5Sramat 		kmem_free(pp->phys_path, strlen(pp->phys_path) + 1);
85303c34adc5Sramat 		kmem_free(pp, sizeof (*pp));
85313c34adc5Sramat 	}
85323c34adc5Sramat }
85333c34adc5Sramat 
85343c34adc5Sramat /*
85353c34adc5Sramat  * Allocated async client structure and initialize with the specified values.
85363c34adc5Sramat  */
85373c34adc5Sramat static mdi_async_client_config_t *
85383c34adc5Sramat alloc_async_client_config(char *ct_name, char *ct_addr,
85393c34adc5Sramat     mdi_phys_path_t *pp_head, mdi_vhcache_lookup_token_t *tok)
85403c34adc5Sramat {
85413c34adc5Sramat 	mdi_async_client_config_t *acc;
85423c34adc5Sramat 
85433c34adc5Sramat 	acc = kmem_alloc(sizeof (*acc), KM_SLEEP);
85443c34adc5Sramat 	acc->acc_ct_name = i_ddi_strdup(ct_name, KM_SLEEP);
85453c34adc5Sramat 	acc->acc_ct_addr = i_ddi_strdup(ct_addr, KM_SLEEP);
85463c34adc5Sramat 	acc->acc_phclient_path_list_head = pp_head;
85473c34adc5Sramat 	init_vhcache_lookup_token(&acc->acc_token, tok);
85483c34adc5Sramat 	acc->acc_next = NULL;
85493c34adc5Sramat 	return (acc);
85503c34adc5Sramat }
85513c34adc5Sramat 
85523c34adc5Sramat /*
85533c34adc5Sramat  * Free the memory allocated for the async client structure and their members.
85543c34adc5Sramat  */
85553c34adc5Sramat static void
85563c34adc5Sramat free_async_client_config(mdi_async_client_config_t *acc)
85573c34adc5Sramat {
85583c34adc5Sramat 	if (acc->acc_phclient_path_list_head)
85593c34adc5Sramat 		free_phclient_path_list(acc->acc_phclient_path_list_head);
85603c34adc5Sramat 	kmem_free(acc->acc_ct_name, strlen(acc->acc_ct_name) + 1);
85613c34adc5Sramat 	kmem_free(acc->acc_ct_addr, strlen(acc->acc_ct_addr) + 1);
85623c34adc5Sramat 	kmem_free(acc, sizeof (*acc));
85633c34adc5Sramat }
85643c34adc5Sramat 
85653c34adc5Sramat /*
85663c34adc5Sramat  * Sort vhcache pathinfos (cpis) of the specified client.
85673c34adc5Sramat  * All cpis which do not have MDI_CPI_HINT_PATH_DOES_NOT_EXIST
85683c34adc5Sramat  * flag set come at the beginning of the list. All cpis which have this
85693c34adc5Sramat  * flag set come at the end of the list.
85703c34adc5Sramat  */
85713c34adc5Sramat static void
85723c34adc5Sramat sort_vhcache_paths(mdi_vhcache_client_t *cct)
85733c34adc5Sramat {
85743c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi, *cpi_next, *cpi_head;
85753c34adc5Sramat 
85763c34adc5Sramat 	cpi_head = cct->cct_cpi_head;
85773c34adc5Sramat 	cct->cct_cpi_head = cct->cct_cpi_tail = NULL;
85783c34adc5Sramat 	for (cpi = cpi_head; cpi != NULL; cpi = cpi_next) {
85793c34adc5Sramat 		cpi_next = cpi->cpi_next;
85803c34adc5Sramat 		enqueue_vhcache_pathinfo(cct, cpi);
85813c34adc5Sramat 	}
85823c34adc5Sramat }
85833c34adc5Sramat 
85843c34adc5Sramat /*
85853c34adc5Sramat  * Verify whether MDI_CPI_HINT_PATH_DOES_NOT_EXIST flag setting is correct for
85863c34adc5Sramat  * every vhcache pathinfo of the specified client. If not adjust the flag
85873c34adc5Sramat  * setting appropriately.
85883c34adc5Sramat  *
85893c34adc5Sramat  * Note that MDI_CPI_HINT_PATH_DOES_NOT_EXIST flag is persisted in the
85903c34adc5Sramat  * on-disk vhci cache. So every time this flag is updated the cache must be
85913c34adc5Sramat  * flushed.
85923c34adc5Sramat  */
85933c34adc5Sramat static void
85943c34adc5Sramat adjust_sort_vhcache_paths(mdi_vhci_config_t *vhc, char *ct_name, char *ct_addr,
85953c34adc5Sramat     mdi_vhcache_lookup_token_t *tok)
85963c34adc5Sramat {
85973c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
85983c34adc5Sramat 	mdi_vhcache_client_t *cct;
85993c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi;
86003c34adc5Sramat 
86013c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_READER);
86023c34adc5Sramat 	if ((cct = lookup_vhcache_client(vhcache, ct_name, ct_addr, tok))
86033c34adc5Sramat 	    == NULL) {
86043c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
86053c34adc5Sramat 		return;
86063c34adc5Sramat 	}
86073c34adc5Sramat 
86083c34adc5Sramat 	/*
86093c34adc5Sramat 	 * to avoid unnecessary on-disk cache updates, first check if an
86103c34adc5Sramat 	 * update is really needed. If no update is needed simply return.
86113c34adc5Sramat 	 */
86123c34adc5Sramat 	for (cpi = cct->cct_cpi_head; cpi != NULL; cpi = cpi->cpi_next) {
86133c34adc5Sramat 		if ((cpi->cpi_pip != NULL &&
86143c34adc5Sramat 		    (cpi->cpi_flags & MDI_CPI_HINT_PATH_DOES_NOT_EXIST)) ||
86153c34adc5Sramat 		    (cpi->cpi_pip == NULL &&
86163c34adc5Sramat 		    !(cpi->cpi_flags & MDI_CPI_HINT_PATH_DOES_NOT_EXIST))) {
86173c34adc5Sramat 			break;
86183c34adc5Sramat 		}
86193c34adc5Sramat 	}
86203c34adc5Sramat 	if (cpi == NULL) {
86213c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
86223c34adc5Sramat 		return;
86233c34adc5Sramat 	}
86243c34adc5Sramat 
86253c34adc5Sramat 	if (rw_tryupgrade(&vhcache->vhcache_lock) == 0) {
86263c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
86273c34adc5Sramat 		rw_enter(&vhcache->vhcache_lock, RW_WRITER);
86283c34adc5Sramat 		if ((cct = lookup_vhcache_client(vhcache, ct_name, ct_addr,
86293c34adc5Sramat 		    tok)) == NULL) {
86303c34adc5Sramat 			rw_exit(&vhcache->vhcache_lock);
86313c34adc5Sramat 			return;
86323c34adc5Sramat 		}
86333c34adc5Sramat 	}
86343c34adc5Sramat 
86353c34adc5Sramat 	for (cpi = cct->cct_cpi_head; cpi != NULL; cpi = cpi->cpi_next) {
86363c34adc5Sramat 		if (cpi->cpi_pip != NULL)
86373c34adc5Sramat 			cpi->cpi_flags &= ~MDI_CPI_HINT_PATH_DOES_NOT_EXIST;
86383c34adc5Sramat 		else
86393c34adc5Sramat 			cpi->cpi_flags |= MDI_CPI_HINT_PATH_DOES_NOT_EXIST;
86403c34adc5Sramat 	}
86413c34adc5Sramat 	sort_vhcache_paths(cct);
86423c34adc5Sramat 
86433c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
86443c34adc5Sramat 	vhcache_dirty(vhc);
86453c34adc5Sramat }
86463c34adc5Sramat 
86473c34adc5Sramat /*
86483c34adc5Sramat  * Configure all specified paths of the client.
86493c34adc5Sramat  */
86503c34adc5Sramat static void
86513c34adc5Sramat config_client_paths_sync(mdi_vhci_config_t *vhc, char *ct_name, char *ct_addr,
86523c34adc5Sramat     mdi_phys_path_t *pp_head, mdi_vhcache_lookup_token_t *tok)
86533c34adc5Sramat {
86543c34adc5Sramat 	mdi_phys_path_t *pp;
86553c34adc5Sramat 
86563c34adc5Sramat 	for (pp = pp_head; pp != NULL; pp = pp->phys_path_next)
86573c34adc5Sramat 		(void) bus_config_one_phci_child(pp->phys_path);
86583c34adc5Sramat 	adjust_sort_vhcache_paths(vhc, ct_name, ct_addr, tok);
86593c34adc5Sramat }
86603c34adc5Sramat 
86613c34adc5Sramat /*
86623c34adc5Sramat  * Dequeue elements from vhci async client config list and bus configure
86633c34adc5Sramat  * their corresponding phci clients.
86643c34adc5Sramat  */
86653c34adc5Sramat static void
86663c34adc5Sramat config_client_paths_thread(void *arg)
86673c34adc5Sramat {
86683c34adc5Sramat 	mdi_vhci_config_t *vhc = (mdi_vhci_config_t *)arg;
86693c34adc5Sramat 	mdi_async_client_config_t *acc;
86703c34adc5Sramat 	clock_t quit_at_ticks;
86713c34adc5Sramat 	clock_t idle_time = mdi_async_config_idle_time * TICKS_PER_SECOND;
86723c34adc5Sramat 	callb_cpr_t cprinfo;
86733c34adc5Sramat 
86743c34adc5Sramat 	CALLB_CPR_INIT(&cprinfo, &vhc->vhc_lock, callb_generic_cpr,
86753c34adc5Sramat 	    "mdi_config_client_paths");
86763c34adc5Sramat 
86773c34adc5Sramat 	for (; ; ) {
86783c34adc5Sramat 		quit_at_ticks = ddi_get_lbolt() + idle_time;
86793c34adc5Sramat 
86803c34adc5Sramat 		mutex_enter(&vhc->vhc_lock);
86813c34adc5Sramat 		while (!(vhc->vhc_flags & MDI_VHC_EXIT) &&
86823c34adc5Sramat 		    vhc->vhc_acc_list_head == NULL &&
86833c34adc5Sramat 		    ddi_get_lbolt() < quit_at_ticks) {
86843c34adc5Sramat 			CALLB_CPR_SAFE_BEGIN(&cprinfo);
86853c34adc5Sramat 			(void) cv_timedwait(&vhc->vhc_cv, &vhc->vhc_lock,
86863c34adc5Sramat 			    quit_at_ticks);
86873c34adc5Sramat 			CALLB_CPR_SAFE_END(&cprinfo, &vhc->vhc_lock);
86883c34adc5Sramat 		}
86893c34adc5Sramat 
86903c34adc5Sramat 		if ((vhc->vhc_flags & MDI_VHC_EXIT) ||
86913c34adc5Sramat 		    vhc->vhc_acc_list_head == NULL)
86923c34adc5Sramat 			goto out;
86933c34adc5Sramat 
86943c34adc5Sramat 		acc = vhc->vhc_acc_list_head;
86953c34adc5Sramat 		vhc->vhc_acc_list_head = acc->acc_next;
86963c34adc5Sramat 		if (vhc->vhc_acc_list_head == NULL)
86973c34adc5Sramat 			vhc->vhc_acc_list_tail = NULL;
86983c34adc5Sramat 		vhc->vhc_acc_count--;
86993c34adc5Sramat 		mutex_exit(&vhc->vhc_lock);
87003c34adc5Sramat 
87013c34adc5Sramat 		config_client_paths_sync(vhc, acc->acc_ct_name,
87023c34adc5Sramat 		    acc->acc_ct_addr, acc->acc_phclient_path_list_head,
87033c34adc5Sramat 		    &acc->acc_token);
87043c34adc5Sramat 
87053c34adc5Sramat 		free_async_client_config(acc);
87063c34adc5Sramat 	}
87073c34adc5Sramat 
87083c34adc5Sramat out:
87093c34adc5Sramat 	vhc->vhc_acc_thrcount--;
87103c34adc5Sramat 	/* CALLB_CPR_EXIT releases the vhc->vhc_lock */
87113c34adc5Sramat 	CALLB_CPR_EXIT(&cprinfo);
87123c34adc5Sramat }
87133c34adc5Sramat 
87143c34adc5Sramat /*
87153c34adc5Sramat  * Arrange for all the phci client paths (pp_head) for the specified client
87163c34adc5Sramat  * to be bus configured asynchronously by a thread.
87173c34adc5Sramat  */
87183c34adc5Sramat static void
87193c34adc5Sramat config_client_paths_async(mdi_vhci_config_t *vhc, char *ct_name, char *ct_addr,
87203c34adc5Sramat     mdi_phys_path_t *pp_head, mdi_vhcache_lookup_token_t *tok)
87213c34adc5Sramat {
87223c34adc5Sramat 	mdi_async_client_config_t *acc, *newacc;
87233c34adc5Sramat 	int create_thread;
87243c34adc5Sramat 
87253c34adc5Sramat 	if (pp_head == NULL)
87263c34adc5Sramat 		return;
87273c34adc5Sramat 
87283c34adc5Sramat 	if (mdi_mtc_off) {
87293c34adc5Sramat 		config_client_paths_sync(vhc, ct_name, ct_addr, pp_head, tok);
87303c34adc5Sramat 		free_phclient_path_list(pp_head);
87313c34adc5Sramat 		return;
87323c34adc5Sramat 	}
87333c34adc5Sramat 
87343c34adc5Sramat 	newacc = alloc_async_client_config(ct_name, ct_addr, pp_head, tok);
87353c34adc5Sramat 	ASSERT(newacc);
87363c34adc5Sramat 
87373c34adc5Sramat 	mutex_enter(&vhc->vhc_lock);
87383c34adc5Sramat 	for (acc = vhc->vhc_acc_list_head; acc != NULL; acc = acc->acc_next) {
87393c34adc5Sramat 		if (strcmp(ct_name, acc->acc_ct_name) == 0 &&
87403c34adc5Sramat 		    strcmp(ct_addr, acc->acc_ct_addr) == 0) {
87413c34adc5Sramat 			free_async_client_config(newacc);
87423c34adc5Sramat 			mutex_exit(&vhc->vhc_lock);
87433c34adc5Sramat 			return;
87443c34adc5Sramat 		}
87453c34adc5Sramat 	}
87463c34adc5Sramat 
87473c34adc5Sramat 	if (vhc->vhc_acc_list_head == NULL)
87483c34adc5Sramat 		vhc->vhc_acc_list_head = newacc;
87493c34adc5Sramat 	else
87503c34adc5Sramat 		vhc->vhc_acc_list_tail->acc_next = newacc;
87513c34adc5Sramat 	vhc->vhc_acc_list_tail = newacc;
87523c34adc5Sramat 	vhc->vhc_acc_count++;
87533c34adc5Sramat 	if (vhc->vhc_acc_count <= vhc->vhc_acc_thrcount) {
87543c34adc5Sramat 		cv_broadcast(&vhc->vhc_cv);
87553c34adc5Sramat 		create_thread = 0;
87563c34adc5Sramat 	} else {
87573c34adc5Sramat 		vhc->vhc_acc_thrcount++;
87583c34adc5Sramat 		create_thread = 1;
87593c34adc5Sramat 	}
87603c34adc5Sramat 	mutex_exit(&vhc->vhc_lock);
87613c34adc5Sramat 
87623c34adc5Sramat 	if (create_thread)
87633c34adc5Sramat 		(void) thread_create(NULL, 0, config_client_paths_thread, vhc,
87643c34adc5Sramat 		    0, &p0, TS_RUN, minclsyspri);
87653c34adc5Sramat }
87663c34adc5Sramat 
87673c34adc5Sramat /*
87683c34adc5Sramat  * Return number of online paths for the specified client.
87693c34adc5Sramat  */
87703c34adc5Sramat static int
87713c34adc5Sramat nonline_paths(mdi_vhcache_client_t *cct)
87723c34adc5Sramat {
87733c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi;
87743c34adc5Sramat 	int online_count = 0;
87753c34adc5Sramat 
87763c34adc5Sramat 	for (cpi = cct->cct_cpi_head; cpi != NULL; cpi = cpi->cpi_next) {
87773c34adc5Sramat 		if (cpi->cpi_pip != NULL) {
87783c34adc5Sramat 			MDI_PI_LOCK(cpi->cpi_pip);
87793c34adc5Sramat 			if (cpi->cpi_pip->pi_state == MDI_PATHINFO_STATE_ONLINE)
87803c34adc5Sramat 				online_count++;
87813c34adc5Sramat 			MDI_PI_UNLOCK(cpi->cpi_pip);
87823c34adc5Sramat 		}
87833c34adc5Sramat 	}
87843c34adc5Sramat 
87853c34adc5Sramat 	return (online_count);
87863c34adc5Sramat }
87873c34adc5Sramat 
87883c34adc5Sramat /*
87893c34adc5Sramat  * Bus configure all paths for the specified vhci client.
87903c34adc5Sramat  * If at least one path for the client is already online, the remaining paths
87913c34adc5Sramat  * will be configured asynchronously. Otherwise, it synchronously configures
87923c34adc5Sramat  * the paths until at least one path is online and then rest of the paths
87933c34adc5Sramat  * will be configured asynchronously.
87943c34adc5Sramat  */
87953c34adc5Sramat static void
87963c34adc5Sramat config_client_paths(mdi_vhci_config_t *vhc, char *ct_name, char *ct_addr)
87973c34adc5Sramat {
87983c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
87993c34adc5Sramat 	mdi_phys_path_t *pp_head, *pp;
88003c34adc5Sramat 	mdi_vhcache_client_t *cct;
88013c34adc5Sramat 	mdi_vhcache_lookup_token_t tok;
88023c34adc5Sramat 
88033c34adc5Sramat 	ASSERT(RW_LOCK_HELD(&vhcache->vhcache_lock));
88043c34adc5Sramat 
88053c34adc5Sramat 	init_vhcache_lookup_token(&tok, NULL);
88063c34adc5Sramat 
88073c34adc5Sramat 	if (ct_name == NULL || ct_addr == NULL ||
88083c34adc5Sramat 	    (cct = lookup_vhcache_client(vhcache, ct_name, ct_addr, &tok))
88093c34adc5Sramat 	    == NULL ||
88103c34adc5Sramat 	    (pp_head = build_phclient_path_list(cct, ct_name)) == NULL) {
88113c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
88123c34adc5Sramat 		return;
88133c34adc5Sramat 	}
88143c34adc5Sramat 
88153c34adc5Sramat 	/* if at least one path is online, configure the rest asynchronously */
88163c34adc5Sramat 	if (nonline_paths(cct) > 0) {
88173c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
88183c34adc5Sramat 		config_client_paths_async(vhc, ct_name, ct_addr, pp_head, &tok);
88193c34adc5Sramat 		return;
88203c34adc5Sramat 	}
88213c34adc5Sramat 
88223c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
88233c34adc5Sramat 
88243c34adc5Sramat 	for (pp = pp_head; pp != NULL; pp = pp->phys_path_next) {
88253c34adc5Sramat 		if (bus_config_one_phci_child(pp->phys_path) == MDI_SUCCESS) {
88263c34adc5Sramat 			rw_enter(&vhcache->vhcache_lock, RW_READER);
88273c34adc5Sramat 
88283c34adc5Sramat 			if ((cct = lookup_vhcache_client(vhcache, ct_name,
88293c34adc5Sramat 			    ct_addr, &tok)) == NULL) {
88303c34adc5Sramat 				rw_exit(&vhcache->vhcache_lock);
88313c34adc5Sramat 				goto out;
88323c34adc5Sramat 			}
88333c34adc5Sramat 
88343c34adc5Sramat 			if (nonline_paths(cct) > 0 &&
88353c34adc5Sramat 			    pp->phys_path_next != NULL) {
88363c34adc5Sramat 				rw_exit(&vhcache->vhcache_lock);
88373c34adc5Sramat 				config_client_paths_async(vhc, ct_name, ct_addr,
88383c34adc5Sramat 				    pp->phys_path_next, &tok);
88393c34adc5Sramat 				pp->phys_path_next = NULL;
88403c34adc5Sramat 				goto out;
88413c34adc5Sramat 			}
88423c34adc5Sramat 
88433c34adc5Sramat 			rw_exit(&vhcache->vhcache_lock);
88443c34adc5Sramat 		}
88453c34adc5Sramat 	}
88463c34adc5Sramat 
88473c34adc5Sramat 	adjust_sort_vhcache_paths(vhc, ct_name, ct_addr, &tok);
88483c34adc5Sramat out:
88493c34adc5Sramat 	free_phclient_path_list(pp_head);
88503c34adc5Sramat }
88513c34adc5Sramat 
88523c34adc5Sramat static void
88533c34adc5Sramat single_threaded_vhconfig_enter(mdi_vhci_config_t *vhc)
88543c34adc5Sramat {
88553c34adc5Sramat 	mutex_enter(&vhc->vhc_lock);
88563c34adc5Sramat 	while (vhc->vhc_flags & MDI_VHC_SINGLE_THREADED)
88573c34adc5Sramat 		cv_wait(&vhc->vhc_cv, &vhc->vhc_lock);
88583c34adc5Sramat 	vhc->vhc_flags |= MDI_VHC_SINGLE_THREADED;
88593c34adc5Sramat 	mutex_exit(&vhc->vhc_lock);
88603c34adc5Sramat }
88613c34adc5Sramat 
88623c34adc5Sramat static void
88633c34adc5Sramat single_threaded_vhconfig_exit(mdi_vhci_config_t *vhc)
88643c34adc5Sramat {
88653c34adc5Sramat 	mutex_enter(&vhc->vhc_lock);
88663c34adc5Sramat 	vhc->vhc_flags &= ~MDI_VHC_SINGLE_THREADED;
88673c34adc5Sramat 	cv_broadcast(&vhc->vhc_cv);
88683c34adc5Sramat 	mutex_exit(&vhc->vhc_lock);
88693c34adc5Sramat }
88703c34adc5Sramat 
/*
 * One entry of a built-in phci driver table.
 */
typedef struct mdi_phci_driver_info {
	char	*phdriver_name;	/* name of the phci driver */

	/* set to non zero if the phci driver supports root device */
	int	phdriver_root_support;
} mdi_phci_driver_info_t;

/*
 * vhci class and root support capability of a phci driver can be
 * specified using ddi-vhci-class and ddi-no-root-support properties in the
 * phci driver.conf file. The built-in tables below contain this information
 * for those phci drivers whose driver.conf files don't yet contain this info.
 *
 * All phci drivers except iscsi have root device support.
 */
static mdi_phci_driver_info_t scsi_phci_driver_list[] = {
	{ "fp", 1 },
	{ "iscsi", 0 },
	{ "ibsrp", 1 }
};

/* Fully braced so the single entry is an explicit struct initializer. */
static mdi_phci_driver_info_t ib_phci_driver_list[] = {
	{ "tavor", 1 }
};
889352cac543Sramat 
889452cac543Sramat static void *
889552cac543Sramat mdi_realloc(void *old_ptr, size_t old_size, size_t new_size)
889652cac543Sramat {
889752cac543Sramat 	void *new_ptr;
889852cac543Sramat 
889952cac543Sramat 	new_ptr = kmem_zalloc(new_size, KM_SLEEP);
890052cac543Sramat 	if (old_ptr) {
8901f7209cf2Spramodbg 		bcopy(old_ptr, new_ptr, MIN(old_size, new_size));
890252cac543Sramat 		kmem_free(old_ptr, old_size);
890352cac543Sramat 	}
890452cac543Sramat 	return (new_ptr);
890552cac543Sramat }
890652cac543Sramat 
890752cac543Sramat static void
890852cac543Sramat add_to_phci_list(char ***driver_list, int **root_support_list,
890952cac543Sramat     int *cur_elements, int *max_elements, char *driver_name, int root_support)
891052cac543Sramat {
891152cac543Sramat 	ASSERT(*cur_elements <= *max_elements);
891252cac543Sramat 	if (*cur_elements == *max_elements) {
891352cac543Sramat 		*max_elements += 10;
891452cac543Sramat 		*driver_list = mdi_realloc(*driver_list,
891552cac543Sramat 		    sizeof (char *) * (*cur_elements),
891652cac543Sramat 		    sizeof (char *) * (*max_elements));
891752cac543Sramat 		*root_support_list = mdi_realloc(*root_support_list,
891852cac543Sramat 		    sizeof (int) * (*cur_elements),
891952cac543Sramat 		    sizeof (int) * (*max_elements));
892052cac543Sramat 	}
892152cac543Sramat 	(*driver_list)[*cur_elements] = i_ddi_strdup(driver_name, KM_SLEEP);
892252cac543Sramat 	(*root_support_list)[*cur_elements] = root_support;
892352cac543Sramat 	(*cur_elements)++;
892452cac543Sramat }
892552cac543Sramat 
892652cac543Sramat static void
892752cac543Sramat get_phci_driver_list(char *vhci_class, char ***driver_list,
892852cac543Sramat     int **root_support_list, int *cur_elements, int *max_elements)
892952cac543Sramat {
893052cac543Sramat 	mdi_phci_driver_info_t	*st_driver_list, *p;
893152cac543Sramat 	int		st_ndrivers, root_support, i, j, driver_conf_count;
893252cac543Sramat 	major_t		m;
893352cac543Sramat 	struct devnames	*dnp;
893452cac543Sramat 	ddi_prop_t	*propp;
893552cac543Sramat 
893652cac543Sramat 	*driver_list = NULL;
893752cac543Sramat 	*root_support_list = NULL;
893852cac543Sramat 	*cur_elements = 0;
893952cac543Sramat 	*max_elements = 0;
894052cac543Sramat 
894152cac543Sramat 	/* add the phci drivers derived from the phci driver.conf files */
894252cac543Sramat 	for (m = 0; m < devcnt; m++) {
894352cac543Sramat 		dnp = &devnamesp[m];
894452cac543Sramat 
894552cac543Sramat 		if (dnp->dn_flags & DN_PHCI_DRIVER) {
894652cac543Sramat 			LOCK_DEV_OPS(&dnp->dn_lock);
894752cac543Sramat 			if (dnp->dn_global_prop_ptr != NULL &&
894852cac543Sramat 			    (propp = i_ddi_prop_search(DDI_DEV_T_ANY,
894952cac543Sramat 			    DDI_VHCI_CLASS, DDI_PROP_TYPE_STRING,
895052cac543Sramat 			    &dnp->dn_global_prop_ptr->prop_list)) != NULL &&
895152cac543Sramat 			    strcmp(propp->prop_val, vhci_class) == 0) {
895252cac543Sramat 
895352cac543Sramat 				root_support = (i_ddi_prop_search(DDI_DEV_T_ANY,
895452cac543Sramat 				    DDI_NO_ROOT_SUPPORT, DDI_PROP_TYPE_INT,
895552cac543Sramat 				    &dnp->dn_global_prop_ptr->prop_list)
895652cac543Sramat 				    == NULL) ? 1 : 0;
895752cac543Sramat 
895852cac543Sramat 				add_to_phci_list(driver_list, root_support_list,
895952cac543Sramat 				    cur_elements, max_elements, dnp->dn_name,
896052cac543Sramat 				    root_support);
896152cac543Sramat 
896252cac543Sramat 				UNLOCK_DEV_OPS(&dnp->dn_lock);
896352cac543Sramat 			} else
896452cac543Sramat 				UNLOCK_DEV_OPS(&dnp->dn_lock);
896552cac543Sramat 		}
896652cac543Sramat 	}
896752cac543Sramat 
896852cac543Sramat 	driver_conf_count = *cur_elements;
896952cac543Sramat 
897052cac543Sramat 	/* add the phci drivers specified in the built-in tables */
897152cac543Sramat 	if (strcmp(vhci_class, MDI_HCI_CLASS_SCSI) == 0) {
897252cac543Sramat 		st_driver_list = scsi_phci_driver_list;
897352cac543Sramat 		st_ndrivers = sizeof (scsi_phci_driver_list) /
897452cac543Sramat 		    sizeof (mdi_phci_driver_info_t);
897552cac543Sramat 	} else if (strcmp(vhci_class, MDI_HCI_CLASS_IB) == 0) {
897652cac543Sramat 		st_driver_list = ib_phci_driver_list;
897752cac543Sramat 		st_ndrivers = sizeof (ib_phci_driver_list) /
897852cac543Sramat 		    sizeof (mdi_phci_driver_info_t);
897952cac543Sramat 	} else {
898052cac543Sramat 		st_driver_list = NULL;
898152cac543Sramat 		st_ndrivers = 0;
898252cac543Sramat 	}
898352cac543Sramat 
898452cac543Sramat 	for (i = 0, p = st_driver_list; i < st_ndrivers; i++, p++) {
898552cac543Sramat 		/* add this phci driver if not already added before */
898652cac543Sramat 		for (j = 0; j < driver_conf_count; j++) {
898752cac543Sramat 			if (strcmp((*driver_list)[j], p->phdriver_name) == 0)
898852cac543Sramat 				break;
898952cac543Sramat 		}
899052cac543Sramat 		if (j == driver_conf_count) {
899152cac543Sramat 			add_to_phci_list(driver_list, root_support_list,
899252cac543Sramat 			    cur_elements, max_elements, p->phdriver_name,
899352cac543Sramat 			    p->phdriver_root_support);
899452cac543Sramat 		}
899552cac543Sramat 	}
899652cac543Sramat }
899752cac543Sramat 
899852cac543Sramat /*
899952cac543Sramat  * Attach the phci driver instances associated with the specified vhci class.
90003c34adc5Sramat  * If root is mounted attach all phci driver instances.
90013c34adc5Sramat  * If root is not mounted, attach the instances of only those phci
90023c34adc5Sramat  * drivers that have the root support.
90033c34adc5Sramat  */
90043c34adc5Sramat static void
900552cac543Sramat attach_phci_drivers(char *vhci_class)
90063c34adc5Sramat {
900752cac543Sramat 	char	**driver_list, **p;
900852cac543Sramat 	int	*root_support_list;
900952cac543Sramat 	int	cur_elements, max_elements, i;
90103c34adc5Sramat 	major_t	m;
90113c34adc5Sramat 
901252cac543Sramat 	get_phci_driver_list(vhci_class, &driver_list, &root_support_list,
901352cac543Sramat 	    &cur_elements, &max_elements);
90143c34adc5Sramat 
901552cac543Sramat 	for (i = 0; i < cur_elements; i++) {
901652cac543Sramat 		if (modrootloaded || root_support_list[i]) {
901752cac543Sramat 			m = ddi_name_to_major(driver_list[i]);
9018a204de77Scth 			if (m != DDI_MAJOR_T_NONE &&
9019a204de77Scth 			    ddi_hold_installed_driver(m))
90203c34adc5Sramat 				ddi_rele_driver(m);
90213c34adc5Sramat 		}
90223c34adc5Sramat 	}
902352cac543Sramat 
902452cac543Sramat 	if (driver_list) {
902552cac543Sramat 		for (i = 0, p = driver_list; i < cur_elements; i++, p++)
902652cac543Sramat 			kmem_free(*p, strlen(*p) + 1);
902752cac543Sramat 		kmem_free(driver_list, sizeof (char *) * max_elements);
902852cac543Sramat 		kmem_free(root_support_list, sizeof (int) * max_elements);
902952cac543Sramat 	}
90303c34adc5Sramat }
90313c34adc5Sramat 
90323c34adc5Sramat /*
90333c34adc5Sramat  * Build vhci cache:
90343c34adc5Sramat  *
90353c34adc5Sramat  * Attach phci driver instances and then drive BUS_CONFIG_ALL on
90363c34adc5Sramat  * the phci driver instances. During this process the cache gets built.
90373c34adc5Sramat  *
903867e56d35Sramat  * Cache is built fully if the root is mounted.
90393c34adc5Sramat  * If the root is not mounted, phci drivers that do not have root support
90403c34adc5Sramat  * are not attached. As a result the cache is built partially. The entries
90413c34adc5Sramat  * in the cache reflect only those phci drivers that have root support.
90423c34adc5Sramat  */
904367e56d35Sramat static int
904452cac543Sramat build_vhci_cache(mdi_vhci_t *vh)
90453c34adc5Sramat {
904652cac543Sramat 	mdi_vhci_config_t *vhc = vh->vh_config;
90473c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
90483c34adc5Sramat 
904967e56d35Sramat 	single_threaded_vhconfig_enter(vhc);
905067e56d35Sramat 
90513c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_READER);
90523c34adc5Sramat 	if (vhcache->vhcache_flags & MDI_VHCI_CACHE_SETUP_DONE) {
90533c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
905467e56d35Sramat 		single_threaded_vhconfig_exit(vhc);
905567e56d35Sramat 		return (0);
90563c34adc5Sramat 	}
90573c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
90583c34adc5Sramat 
905952cac543Sramat 	attach_phci_drivers(vh->vh_class);
90603c34adc5Sramat 	bus_config_all_phcis(vhcache, NDI_DRV_CONF_REPROBE | NDI_NO_EVENT,
9061a204de77Scth 	    BUS_CONFIG_ALL, DDI_MAJOR_T_NONE);
90623c34adc5Sramat 
90633c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_WRITER);
90643c34adc5Sramat 	vhcache->vhcache_flags |= MDI_VHCI_CACHE_SETUP_DONE;
90653c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
906667e56d35Sramat 
906767e56d35Sramat 	single_threaded_vhconfig_exit(vhc);
90683c34adc5Sramat 	vhcache_dirty(vhc);
906967e56d35Sramat 	return (1);
90703c34adc5Sramat }
90713c34adc5Sramat 
90723c34adc5Sramat /*
907367e56d35Sramat  * Determine if discovery of paths is needed.
90743c34adc5Sramat  */
90753c34adc5Sramat static int
907667e56d35Sramat vhcache_do_discovery(mdi_vhci_config_t *vhc)
90773c34adc5Sramat {
907867e56d35Sramat 	int rv = 1;
907967e56d35Sramat 
908067e56d35Sramat 	mutex_enter(&vhc->vhc_lock);
908167e56d35Sramat 	if (i_ddi_io_initialized() == 0) {
908267e56d35Sramat 		if (vhc->vhc_path_discovery_boot > 0) {
908367e56d35Sramat 			vhc->vhc_path_discovery_boot--;
908467e56d35Sramat 			goto out;
908567e56d35Sramat 		}
908667e56d35Sramat 	} else {
908767e56d35Sramat 		if (vhc->vhc_path_discovery_postboot > 0) {
908867e56d35Sramat 			vhc->vhc_path_discovery_postboot--;
908967e56d35Sramat 			goto out;
909067e56d35Sramat 		}
909167e56d35Sramat 	}
909267e56d35Sramat 
909367e56d35Sramat 	/*
909467e56d35Sramat 	 * Do full path discovery at most once per mdi_path_discovery_interval.
909567e56d35Sramat 	 * This is to avoid a series of full path discoveries when opening
909667e56d35Sramat 	 * stale /dev/[r]dsk links.
909767e56d35Sramat 	 */
909867e56d35Sramat 	if (mdi_path_discovery_interval != -1 &&
909967e56d35Sramat 	    lbolt64 >= vhc->vhc_path_discovery_cutoff_time)
910067e56d35Sramat 		goto out;
910167e56d35Sramat 
910267e56d35Sramat 	rv = 0;
910367e56d35Sramat out:
910467e56d35Sramat 	mutex_exit(&vhc->vhc_lock);
910567e56d35Sramat 	return (rv);
910667e56d35Sramat }
910767e56d35Sramat 
910867e56d35Sramat /*
910967e56d35Sramat  * Discover all paths:
911067e56d35Sramat  *
911167e56d35Sramat  * Attach phci driver instances and then drive BUS_CONFIG_ALL on all the phci
911267e56d35Sramat  * driver instances. During this process all paths will be discovered.
911367e56d35Sramat  */
911467e56d35Sramat static int
911552cac543Sramat vhcache_discover_paths(mdi_vhci_t *vh)
911667e56d35Sramat {
911752cac543Sramat 	mdi_vhci_config_t *vhc = vh->vh_config;
911867e56d35Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
911967e56d35Sramat 	int rv = 0;
91203c34adc5Sramat 
91213c34adc5Sramat 	single_threaded_vhconfig_enter(vhc);
91223c34adc5Sramat 
912367e56d35Sramat 	if (vhcache_do_discovery(vhc)) {
912452cac543Sramat 		attach_phci_drivers(vh->vh_class);
912567e56d35Sramat 		bus_config_all_phcis(vhcache, NDI_DRV_CONF_REPROBE |
9126a204de77Scth 		    NDI_NO_EVENT, BUS_CONFIG_ALL, DDI_MAJOR_T_NONE);
912767e56d35Sramat 
91283c34adc5Sramat 		mutex_enter(&vhc->vhc_lock);
912967e56d35Sramat 		vhc->vhc_path_discovery_cutoff_time = lbolt64 +
913067e56d35Sramat 		    mdi_path_discovery_interval * TICKS_PER_SECOND;
91313c34adc5Sramat 		mutex_exit(&vhc->vhc_lock);
913267e56d35Sramat 		rv = 1;
91333c34adc5Sramat 	}
91343c34adc5Sramat 
91353c34adc5Sramat 	single_threaded_vhconfig_exit(vhc);
91363c34adc5Sramat 	return (rv);
91373c34adc5Sramat }
91383c34adc5Sramat 
91393c34adc5Sramat /*
91403c34adc5Sramat  * Generic vhci bus config implementation:
91413c34adc5Sramat  *
91423c34adc5Sramat  * Parameters
91433c34adc5Sramat  *	vdip	vhci dip
91443c34adc5Sramat  *	flags	bus config flags
91453c34adc5Sramat  *	op	bus config operation
91463c34adc5Sramat  *	The remaining parameters are bus config operation specific
91473c34adc5Sramat  *
91483c34adc5Sramat  * for BUS_CONFIG_ONE
91493c34adc5Sramat  *	arg	pointer to name@addr
91503c34adc5Sramat  *	child	upon successful return from this function, *child will be
91513c34adc5Sramat  *		set to the configured and held devinfo child node of vdip.
91523c34adc5Sramat  *	ct_addr	pointer to client address (i.e. GUID)
91533c34adc5Sramat  *
91543c34adc5Sramat  * for BUS_CONFIG_DRIVER
91553c34adc5Sramat  *	arg	major number of the driver
91563c34adc5Sramat  *	child and ct_addr parameters are ignored
91573c34adc5Sramat  *
91583c34adc5Sramat  * for BUS_CONFIG_ALL
91593c34adc5Sramat  *	arg, child, and ct_addr parameters are ignored
91603c34adc5Sramat  *
91613c34adc5Sramat  * Note that for the rest of the bus config operations, this function simply
91623c34adc5Sramat  * calls the framework provided default bus config routine.
91633c34adc5Sramat  */
91643c34adc5Sramat int
91653c34adc5Sramat mdi_vhci_bus_config(dev_info_t *vdip, uint_t flags, ddi_bus_config_op_t op,
91663c34adc5Sramat     void *arg, dev_info_t **child, char *ct_addr)
91673c34adc5Sramat {
91683c34adc5Sramat 	mdi_vhci_t *vh = i_devi_get_vhci(vdip);
91693c34adc5Sramat 	mdi_vhci_config_t *vhc = vh->vh_config;
91703c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
917167e56d35Sramat 	int rv = 0;
917267e56d35Sramat 	int params_valid = 0;
91733c34adc5Sramat 	char *cp;
91743c34adc5Sramat 
91753c34adc5Sramat 	/*
91765e3986cbScth 	 * To bus config vhcis we relay operation, possibly using another
91775e3986cbScth 	 * thread, to phcis. The phci driver then interacts with MDI to cause
91785e3986cbScth 	 * vhci child nodes to be enumerated under the vhci node.  Adding a
91795e3986cbScth 	 * vhci child requires an ndi_devi_enter of the vhci. Since another
91805e3986cbScth 	 * thread may be adding the child, to avoid deadlock we can't wait
91815e3986cbScth 	 * for the relayed operations to complete if we have already entered
91825e3986cbScth 	 * the vhci node.
91833c34adc5Sramat 	 */
91843c34adc5Sramat 	if (DEVI_BUSY_OWNED(vdip)) {
91854c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, vdip,
91864c06356bSdh142964 		    "vhci dip is busy owned %p", (void *)vdip));
91873c34adc5Sramat 		goto default_bus_config;
91883c34adc5Sramat 	}
91893c34adc5Sramat 
91903c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_READER);
91913c34adc5Sramat 	if (!(vhcache->vhcache_flags & MDI_VHCI_CACHE_SETUP_DONE)) {
91923c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
919352cac543Sramat 		rv = build_vhci_cache(vh);
91943c34adc5Sramat 		rw_enter(&vhcache->vhcache_lock, RW_READER);
91953c34adc5Sramat 	}
91963c34adc5Sramat 
91973c34adc5Sramat 	switch (op) {
91983c34adc5Sramat 	case BUS_CONFIG_ONE:
919967e56d35Sramat 		if (arg != NULL && ct_addr != NULL) {
92003c34adc5Sramat 			/* extract node name */
92013c34adc5Sramat 			cp = (char *)arg;
92023c34adc5Sramat 			while (*cp != '\0' && *cp != '@')
92033c34adc5Sramat 				cp++;
92043c34adc5Sramat 			if (*cp == '@') {
920567e56d35Sramat 				params_valid = 1;
92063c34adc5Sramat 				*cp = '\0';
92073c34adc5Sramat 				config_client_paths(vhc, (char *)arg, ct_addr);
920867e56d35Sramat 				/* config_client_paths() releases cache_lock */
92093c34adc5Sramat 				*cp = '@';
921067e56d35Sramat 				break;
921167e56d35Sramat 			}
921267e56d35Sramat 		}
921367e56d35Sramat 
92143c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
92153c34adc5Sramat 		break;
92163c34adc5Sramat 
92173c34adc5Sramat 	case BUS_CONFIG_DRIVER:
92183c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
921967e56d35Sramat 		if (rv == 0)
922067e56d35Sramat 			st_bus_config_all_phcis(vhc, flags, op,
92213c34adc5Sramat 			    (major_t)(uintptr_t)arg);
92223c34adc5Sramat 		break;
92233c34adc5Sramat 
92243c34adc5Sramat 	case BUS_CONFIG_ALL:
92253c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
922667e56d35Sramat 		if (rv == 0)
922767e56d35Sramat 			st_bus_config_all_phcis(vhc, flags, op, -1);
92283c34adc5Sramat 		break;
92293c34adc5Sramat 
92303c34adc5Sramat 	default:
92313c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
92323c34adc5Sramat 		break;
92333c34adc5Sramat 	}
92343c34adc5Sramat 
92353c34adc5Sramat 
92363c34adc5Sramat default_bus_config:
92373c34adc5Sramat 	/*
92383c34adc5Sramat 	 * All requested child nodes are enumerated under the vhci.
92393c34adc5Sramat 	 * Now configure them.
92403c34adc5Sramat 	 */
92413c34adc5Sramat 	if (ndi_busop_bus_config(vdip, flags, op, arg, child, 0) ==
92423c34adc5Sramat 	    NDI_SUCCESS) {
92433c34adc5Sramat 		return (MDI_SUCCESS);
924467e56d35Sramat 	} else if (op == BUS_CONFIG_ONE && rv == 0 && params_valid) {
924567e56d35Sramat 		/* discover all paths and try configuring again */
924652cac543Sramat 		if (vhcache_discover_paths(vh) &&
924767e56d35Sramat 		    ndi_busop_bus_config(vdip, flags, op, arg, child, 0) ==
924867e56d35Sramat 		    NDI_SUCCESS)
924967e56d35Sramat 			return (MDI_SUCCESS);
92503c34adc5Sramat 	}
92513c34adc5Sramat 
92523c34adc5Sramat 	return (MDI_FAILURE);
92533c34adc5Sramat }
92543c34adc5Sramat 
92553c34adc5Sramat /*
92563c34adc5Sramat  * Read the on-disk vhci cache into an nvlist for the specified vhci class.
92573c34adc5Sramat  */
92583c34adc5Sramat static nvlist_t *
92593c34adc5Sramat read_on_disk_vhci_cache(char *vhci_class)
92603c34adc5Sramat {
92613c34adc5Sramat 	nvlist_t *nvl;
92623c34adc5Sramat 	int err;
92633c34adc5Sramat 	char *filename;
92643c34adc5Sramat 
92653c34adc5Sramat 	filename = vhclass2vhcache_filename(vhci_class);
92663c34adc5Sramat 
92673c34adc5Sramat 	if ((err = fread_nvlist(filename, &nvl)) == 0) {
92683c34adc5Sramat 		kmem_free(filename, strlen(filename) + 1);
92693c34adc5Sramat 		return (nvl);
92703c34adc5Sramat 	} else if (err == EIO)
92714c06356bSdh142964 		cmn_err(CE_WARN, "%s: I/O error, will recreate", filename);
92723c34adc5Sramat 	else if (err == EINVAL)
92733c34adc5Sramat 		cmn_err(CE_WARN,
92744c06356bSdh142964 		    "%s: data file corrupted, will recreate", filename);
92753c34adc5Sramat 
92763c34adc5Sramat 	kmem_free(filename, strlen(filename) + 1);
92773c34adc5Sramat 	return (NULL);
92783c34adc5Sramat }
92793c34adc5Sramat 
92803c34adc5Sramat /*
92813c34adc5Sramat  * Read on-disk vhci cache into nvlists for all vhci classes.
92823c34adc5Sramat  * Called during booting by i_ddi_read_devices_files().
92833c34adc5Sramat  */
92843c34adc5Sramat void
92853c34adc5Sramat mdi_read_devices_files(void)
92863c34adc5Sramat {
92873c34adc5Sramat 	int i;
92883c34adc5Sramat 
92893c34adc5Sramat 	for (i = 0; i < N_VHCI_CLASSES; i++)
92903c34adc5Sramat 		vhcache_nvl[i] = read_on_disk_vhci_cache(vhci_class_list[i]);
92913c34adc5Sramat }
92923c34adc5Sramat 
92933c34adc5Sramat /*
92943c34adc5Sramat  * Remove all stale entries from vhci cache.
92953c34adc5Sramat  */
92963c34adc5Sramat static void
92973c34adc5Sramat clean_vhcache(mdi_vhci_config_t *vhc)
92983c34adc5Sramat {
92993c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
93003c34adc5Sramat 	mdi_vhcache_phci_t *cphci, *cphci_head, *cphci_next;
93013c34adc5Sramat 	mdi_vhcache_client_t *cct, *cct_head, *cct_next;
93023c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi, *cpi_head, *cpi_next;
93033c34adc5Sramat 
93043c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_WRITER);
93053c34adc5Sramat 
93063c34adc5Sramat 	cct_head = vhcache->vhcache_client_head;
93073c34adc5Sramat 	vhcache->vhcache_client_head = vhcache->vhcache_client_tail = NULL;
93083c34adc5Sramat 	for (cct = cct_head; cct != NULL; cct = cct_next) {
93093c34adc5Sramat 		cct_next = cct->cct_next;
93103c34adc5Sramat 
93113c34adc5Sramat 		cpi_head = cct->cct_cpi_head;
93123c34adc5Sramat 		cct->cct_cpi_head = cct->cct_cpi_tail = NULL;
93133c34adc5Sramat 		for (cpi = cpi_head; cpi != NULL; cpi = cpi_next) {
93143c34adc5Sramat 			cpi_next = cpi->cpi_next;
93153c34adc5Sramat 			if (cpi->cpi_pip != NULL) {
93163c34adc5Sramat 				ASSERT(cpi->cpi_cphci->cphci_phci != NULL);
93173c34adc5Sramat 				enqueue_tail_vhcache_pathinfo(cct, cpi);
93183c34adc5Sramat 			} else
93193c34adc5Sramat 				free_vhcache_pathinfo(cpi);
93203c34adc5Sramat 		}
93213c34adc5Sramat 
93223c34adc5Sramat 		if (cct->cct_cpi_head != NULL)
93233c34adc5Sramat 			enqueue_vhcache_client(vhcache, cct);
93243c34adc5Sramat 		else {
93253c34adc5Sramat 			(void) mod_hash_destroy(vhcache->vhcache_client_hash,
93263c34adc5Sramat 			    (mod_hash_key_t)cct->cct_name_addr);
93273c34adc5Sramat 			free_vhcache_client(cct);
93283c34adc5Sramat 		}
93293c34adc5Sramat 	}
93303c34adc5Sramat 
93313c34adc5Sramat 	cphci_head = vhcache->vhcache_phci_head;
93323c34adc5Sramat 	vhcache->vhcache_phci_head = vhcache->vhcache_phci_tail = NULL;
93333c34adc5Sramat 	for (cphci = cphci_head; cphci != NULL; cphci = cphci_next) {
93343c34adc5Sramat 		cphci_next = cphci->cphci_next;
93353c34adc5Sramat 		if (cphci->cphci_phci != NULL)
93363c34adc5Sramat 			enqueue_vhcache_phci(vhcache, cphci);
93373c34adc5Sramat 		else
93383c34adc5Sramat 			free_vhcache_phci(cphci);
93393c34adc5Sramat 	}
93403c34adc5Sramat 
93413c34adc5Sramat 	vhcache->vhcache_clean_time = lbolt64;
93423c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
93433c34adc5Sramat 	vhcache_dirty(vhc);
93443c34adc5Sramat }
93453c34adc5Sramat 
93463c34adc5Sramat /*
93473c34adc5Sramat  * Remove all stale entries from vhci cache.
93483c34adc5Sramat  * Called by i_ddi_clean_devices_files() during the execution of devfsadm -C
93493c34adc5Sramat  */
93503c34adc5Sramat void
93513c34adc5Sramat mdi_clean_vhcache(void)
93523c34adc5Sramat {
93533c34adc5Sramat 	mdi_vhci_t *vh;
93543c34adc5Sramat 
93553c34adc5Sramat 	mutex_enter(&mdi_mutex);
93563c34adc5Sramat 	for (vh = mdi_vhci_head; vh != NULL; vh = vh->vh_next) {
93573c34adc5Sramat 		vh->vh_refcnt++;
93583c34adc5Sramat 		mutex_exit(&mdi_mutex);
93593c34adc5Sramat 		clean_vhcache(vh->vh_config);
93603c34adc5Sramat 		mutex_enter(&mdi_mutex);
93613c34adc5Sramat 		vh->vh_refcnt--;
93623c34adc5Sramat 	}
93633c34adc5Sramat 	mutex_exit(&mdi_mutex);
93643c34adc5Sramat }
93658c4f8890Srs135747 
93668c4f8890Srs135747 /*
93678c4f8890Srs135747  * mdi_vhci_walk_clients():
93688c4f8890Srs135747  *		Walker routine to traverse client dev_info nodes
93698c4f8890Srs135747  * ddi_walk_devs(ddi_get_child(vdip), f, arg) returns the entire tree
93708c4f8890Srs135747  * below the client, including nexus devices, which we dont want.
93718c4f8890Srs135747  * So we just traverse the immediate siblings, starting from 1st client.
93728c4f8890Srs135747  */
93738c4f8890Srs135747 void
93748c4f8890Srs135747 mdi_vhci_walk_clients(dev_info_t *vdip,
93758c4f8890Srs135747     int (*f)(dev_info_t *, void *), void *arg)
93768c4f8890Srs135747 {
93775e3986cbScth 	mdi_vhci_t	*vh = i_devi_get_vhci(vdip);
93788c4f8890Srs135747 	dev_info_t	*cdip;
93798c4f8890Srs135747 	mdi_client_t	*ct;
93808c4f8890Srs135747 
93815e3986cbScth 	MDI_VHCI_CLIENT_LOCK(vh);
93828c4f8890Srs135747 	cdip = ddi_get_child(vdip);
93838c4f8890Srs135747 	while (cdip) {
93848c4f8890Srs135747 		ct = i_devi_get_client(cdip);
93858c4f8890Srs135747 		MDI_CLIENT_LOCK(ct);
93868c4f8890Srs135747 
93875e3986cbScth 		if (((*f)(cdip, arg)) == DDI_WALK_CONTINUE)
93888c4f8890Srs135747 			cdip = ddi_get_next_sibling(cdip);
93895e3986cbScth 		else
93905e3986cbScth 			cdip = NULL;
9391c73a93f2Sdm120769 
9392c73a93f2Sdm120769 		MDI_CLIENT_UNLOCK(ct);
93938c4f8890Srs135747 	}
93945e3986cbScth 	MDI_VHCI_CLIENT_UNLOCK(vh);
93958c4f8890Srs135747 }
93968c4f8890Srs135747 
93978c4f8890Srs135747 /*
93988c4f8890Srs135747  * mdi_vhci_walk_phcis():
93998c4f8890Srs135747  *		Walker routine to traverse phci dev_info nodes
94008c4f8890Srs135747  */
94018c4f8890Srs135747 void
94028c4f8890Srs135747 mdi_vhci_walk_phcis(dev_info_t *vdip,
94038c4f8890Srs135747     int (*f)(dev_info_t *, void *), void *arg)
94048c4f8890Srs135747 {
94055e3986cbScth 	mdi_vhci_t	*vh = i_devi_get_vhci(vdip);
94065e3986cbScth 	mdi_phci_t	*ph, *next;
94078c4f8890Srs135747 
94085e3986cbScth 	MDI_VHCI_PHCI_LOCK(vh);
94098c4f8890Srs135747 	ph = vh->vh_phci_head;
94108c4f8890Srs135747 	while (ph) {
94118c4f8890Srs135747 		MDI_PHCI_LOCK(ph);
94128c4f8890Srs135747 
94135e3986cbScth 		if (((*f)(ph->ph_dip, arg)) == DDI_WALK_CONTINUE)
94145e3986cbScth 			next = ph->ph_next;
94155e3986cbScth 		else
94165e3986cbScth 			next = NULL;
9417c73a93f2Sdm120769 
9418c73a93f2Sdm120769 		MDI_PHCI_UNLOCK(ph);
94195e3986cbScth 		ph = next;
94208c4f8890Srs135747 	}
94215e3986cbScth 	MDI_VHCI_PHCI_UNLOCK(vh);
94228c4f8890Srs135747 }
94238c4f8890Srs135747 
94248c4f8890Srs135747 
94258c4f8890Srs135747 /*
94268c4f8890Srs135747  * mdi_walk_vhcis():
94278c4f8890Srs135747  *		Walker routine to traverse vhci dev_info nodes
94288c4f8890Srs135747  */
94298c4f8890Srs135747 void
94308c4f8890Srs135747 mdi_walk_vhcis(int (*f)(dev_info_t *, void *), void *arg)
94318c4f8890Srs135747 {
94328c4f8890Srs135747 	mdi_vhci_t	*vh = NULL;
94338c4f8890Srs135747 
94348c4f8890Srs135747 	mutex_enter(&mdi_mutex);
94358c4f8890Srs135747 	/*
94368c4f8890Srs135747 	 * Scan for already registered vhci
94378c4f8890Srs135747 	 */
94388c4f8890Srs135747 	for (vh = mdi_vhci_head; vh != NULL; vh = vh->vh_next) {
94398c4f8890Srs135747 		vh->vh_refcnt++;
94408c4f8890Srs135747 		mutex_exit(&mdi_mutex);
94418c4f8890Srs135747 		if (((*f)(vh->vh_dip, arg)) != DDI_WALK_CONTINUE) {
94428c4f8890Srs135747 			mutex_enter(&mdi_mutex);
94438c4f8890Srs135747 			vh->vh_refcnt--;
94448c4f8890Srs135747 			break;
94458c4f8890Srs135747 		} else {
94468c4f8890Srs135747 			mutex_enter(&mdi_mutex);
94478c4f8890Srs135747 			vh->vh_refcnt--;
94488c4f8890Srs135747 		}
94498c4f8890Srs135747 	}
94508c4f8890Srs135747 
94518c4f8890Srs135747 	mutex_exit(&mdi_mutex);
94528c4f8890Srs135747 }
94538c4f8890Srs135747 
94548c4f8890Srs135747 /*
94558c4f8890Srs135747  * i_mdi_log_sysevent():
94568c4f8890Srs135747  *		Logs events for pickup by syseventd
94578c4f8890Srs135747  */
94588c4f8890Srs135747 static void
94598c4f8890Srs135747 i_mdi_log_sysevent(dev_info_t *dip, char *ph_vh_class, char *subclass)
94608c4f8890Srs135747 {
94618c4f8890Srs135747 	char		*path_name;
94628c4f8890Srs135747 	nvlist_t	*attr_list;
94638c4f8890Srs135747 
94648c4f8890Srs135747 	if (nvlist_alloc(&attr_list, NV_UNIQUE_NAME_TYPE,
94658c4f8890Srs135747 	    KM_SLEEP) != DDI_SUCCESS) {
94668c4f8890Srs135747 		goto alloc_failed;
94678c4f8890Srs135747 	}
94688c4f8890Srs135747 
94698c4f8890Srs135747 	path_name = kmem_zalloc(MAXPATHLEN, KM_SLEEP);
94708c4f8890Srs135747 	(void) ddi_pathname(dip, path_name);
94718c4f8890Srs135747 
94728c4f8890Srs135747 	if (nvlist_add_string(attr_list, DDI_DRIVER_NAME,
94738c4f8890Srs135747 	    ddi_driver_name(dip)) != DDI_SUCCESS) {
94748c4f8890Srs135747 		goto error;
94758c4f8890Srs135747 	}
94768c4f8890Srs135747 
94778c4f8890Srs135747 	if (nvlist_add_int32(attr_list, DDI_DRIVER_MAJOR,
94788c4f8890Srs135747 	    (int32_t)ddi_driver_major(dip)) != DDI_SUCCESS) {
94798c4f8890Srs135747 		goto error;
94808c4f8890Srs135747 	}
94818c4f8890Srs135747 
94828c4f8890Srs135747 	if (nvlist_add_int32(attr_list, DDI_INSTANCE,
94838c4f8890Srs135747 	    (int32_t)ddi_get_instance(dip)) != DDI_SUCCESS) {
94848c4f8890Srs135747 		goto error;
94858c4f8890Srs135747 	}
94868c4f8890Srs135747 
94878c4f8890Srs135747 	if (nvlist_add_string(attr_list, DDI_PATHNAME,
94888c4f8890Srs135747 	    path_name) != DDI_SUCCESS) {
94898c4f8890Srs135747 		goto error;
94908c4f8890Srs135747 	}
94918c4f8890Srs135747 
94928c4f8890Srs135747 	if (nvlist_add_string(attr_list, DDI_CLASS,
94938c4f8890Srs135747 	    ph_vh_class) != DDI_SUCCESS) {
94948c4f8890Srs135747 		goto error;
94958c4f8890Srs135747 	}
94968c4f8890Srs135747 
94978c4f8890Srs135747 	(void) ddi_log_sysevent(dip, DDI_VENDOR_SUNW, EC_DDI, subclass,
94988c4f8890Srs135747 	    attr_list, NULL, DDI_SLEEP);
94998c4f8890Srs135747 
95008c4f8890Srs135747 error:
95018c4f8890Srs135747 	kmem_free(path_name, MAXPATHLEN);
95028c4f8890Srs135747 	nvlist_free(attr_list);
95038c4f8890Srs135747 	return;
95048c4f8890Srs135747 
95058c4f8890Srs135747 alloc_failed:
95064c06356bSdh142964 	MDI_DEBUG(1, (MDI_WARN, dip, "!unable to send sysevent"));
95078c4f8890Srs135747 }
9508f7209cf2Spramodbg 
9509f7209cf2Spramodbg char **
9510f7209cf2Spramodbg mdi_get_phci_driver_list(char *vhci_class, int	*ndrivers)
9511f7209cf2Spramodbg {
9512f7209cf2Spramodbg 	char	**driver_list, **ret_driver_list = NULL;
9513f7209cf2Spramodbg 	int	*root_support_list;
9514f7209cf2Spramodbg 	int	cur_elements, max_elements;
9515f7209cf2Spramodbg 
9516f7209cf2Spramodbg 	get_phci_driver_list(vhci_class, &driver_list, &root_support_list,
9517f7209cf2Spramodbg 	    &cur_elements, &max_elements);
9518f7209cf2Spramodbg 
9519f7209cf2Spramodbg 
9520f7209cf2Spramodbg 	if (driver_list) {
9521f7209cf2Spramodbg 		kmem_free(root_support_list, sizeof (int) * max_elements);
9522f7209cf2Spramodbg 		ret_driver_list = mdi_realloc(driver_list, sizeof (char *)
9523f7209cf2Spramodbg 		    * max_elements, sizeof (char *) * cur_elements);
9524f7209cf2Spramodbg 	}
9525f7209cf2Spramodbg 	*ndrivers = cur_elements;
9526f7209cf2Spramodbg 
9527f7209cf2Spramodbg 	return (ret_driver_list);
9528f7209cf2Spramodbg 
9529f7209cf2Spramodbg }
9530f7209cf2Spramodbg 
9531f7209cf2Spramodbg void
9532f7209cf2Spramodbg mdi_free_phci_driver_list(char **driver_list, int ndrivers)
9533f7209cf2Spramodbg {
9534f7209cf2Spramodbg 	char	**p;
9535f7209cf2Spramodbg 	int	i;
9536f7209cf2Spramodbg 
9537f7209cf2Spramodbg 	if (driver_list) {
9538f7209cf2Spramodbg 		for (i = 0, p = driver_list; i < ndrivers; i++, p++)
9539f7209cf2Spramodbg 			kmem_free(*p, strlen(*p) + 1);
9540f7209cf2Spramodbg 		kmem_free(driver_list, sizeof (char *) * ndrivers);
9541f7209cf2Spramodbg 	}
9542f7209cf2Spramodbg }
954355e592a2SRandall Ralphs 
954455e592a2SRandall Ralphs /*
954555e592a2SRandall Ralphs  * mdi_is_dev_supported():
954655e592a2SRandall Ralphs  *		function called by pHCI bus config operation to determine if a
954755e592a2SRandall Ralphs  *		device should be represented as a child of the vHCI or the
954855e592a2SRandall Ralphs  *		pHCI.  This decision is made by the vHCI, using cinfo idenity
954955e592a2SRandall Ralphs  *		information passed by the pHCI - specifics of the cinfo
955055e592a2SRandall Ralphs  *		representation are by agreement between the pHCI and vHCI.
955155e592a2SRandall Ralphs  * Return Values:
955255e592a2SRandall Ralphs  *		MDI_SUCCESS
955355e592a2SRandall Ralphs  *		MDI_FAILURE
955455e592a2SRandall Ralphs  */
955555e592a2SRandall Ralphs int
955655e592a2SRandall Ralphs mdi_is_dev_supported(char *class, dev_info_t *pdip, void *cinfo)
955755e592a2SRandall Ralphs {
955855e592a2SRandall Ralphs 	mdi_vhci_t	*vh;
955955e592a2SRandall Ralphs 
956055e592a2SRandall Ralphs 	ASSERT(class && pdip);
956155e592a2SRandall Ralphs 
956255e592a2SRandall Ralphs 	/*
956355e592a2SRandall Ralphs 	 * For dev_supported, mdi_phci_register() must have established pdip as
956455e592a2SRandall Ralphs 	 * a pHCI.
956555e592a2SRandall Ralphs 	 *
956655e592a2SRandall Ralphs 	 * NOTE: mdi_phci_register() does "mpxio-disable" processing, and
956755e592a2SRandall Ralphs 	 * MDI_PHCI(pdip) will return false if mpxio is disabled.
956855e592a2SRandall Ralphs 	 */
956955e592a2SRandall Ralphs 	if (!MDI_PHCI(pdip))
957055e592a2SRandall Ralphs 		return (MDI_FAILURE);
957155e592a2SRandall Ralphs 
957255e592a2SRandall Ralphs 	/* Return MDI_FAILURE if vHCI does not support asking the question. */
957355e592a2SRandall Ralphs 	vh = (mdi_vhci_t *)i_mdi_vhci_class2vhci(class);
957455e592a2SRandall Ralphs 	if ((vh == NULL) || (vh->vh_ops->vo_is_dev_supported == NULL)) {
957555e592a2SRandall Ralphs 		return (MDI_FAILURE);
957655e592a2SRandall Ralphs 	}
957755e592a2SRandall Ralphs 
957855e592a2SRandall Ralphs 	/* Return vHCI answer */
957955e592a2SRandall Ralphs 	return (vh->vh_ops->vo_is_dev_supported(vh->vh_dip, pdip, cinfo));
958055e592a2SRandall Ralphs }
958155e592a2SRandall Ralphs 
958255e592a2SRandall Ralphs int
958355e592a2SRandall Ralphs mdi_dc_return_dev_state(mdi_pathinfo_t *pip, struct devctl_iocdata *dcp)
958455e592a2SRandall Ralphs {
958555e592a2SRandall Ralphs 	uint_t devstate = 0;
958655e592a2SRandall Ralphs 	dev_info_t *cdip;
958755e592a2SRandall Ralphs 
958855e592a2SRandall Ralphs 	if ((pip == NULL) || (dcp == NULL))
958955e592a2SRandall Ralphs 		return (MDI_FAILURE);
959055e592a2SRandall Ralphs 
959155e592a2SRandall Ralphs 	cdip = mdi_pi_get_client(pip);
959255e592a2SRandall Ralphs 
959355e592a2SRandall Ralphs 	switch (mdi_pi_get_state(pip)) {
959455e592a2SRandall Ralphs 	case MDI_PATHINFO_STATE_INIT:
959555e592a2SRandall Ralphs 		devstate = DEVICE_DOWN;
959655e592a2SRandall Ralphs 		break;
959755e592a2SRandall Ralphs 	case MDI_PATHINFO_STATE_ONLINE:
959855e592a2SRandall Ralphs 		devstate = DEVICE_ONLINE;
959955e592a2SRandall Ralphs 		if ((cdip) && (devi_stillreferenced(cdip) == DEVI_REFERENCED))
960055e592a2SRandall Ralphs 			devstate |= DEVICE_BUSY;
960155e592a2SRandall Ralphs 		break;
960255e592a2SRandall Ralphs 	case MDI_PATHINFO_STATE_STANDBY:
960355e592a2SRandall Ralphs 		devstate = DEVICE_ONLINE;
960455e592a2SRandall Ralphs 		break;
960555e592a2SRandall Ralphs 	case MDI_PATHINFO_STATE_FAULT:
960655e592a2SRandall Ralphs 		devstate = DEVICE_DOWN;
960755e592a2SRandall Ralphs 		break;
960855e592a2SRandall Ralphs 	case MDI_PATHINFO_STATE_OFFLINE:
960955e592a2SRandall Ralphs 		devstate = DEVICE_OFFLINE;
961055e592a2SRandall Ralphs 		break;
961155e592a2SRandall Ralphs 	default:
961255e592a2SRandall Ralphs 		ASSERT(MDI_PI(pip)->pi_state);
961355e592a2SRandall Ralphs 	}
961455e592a2SRandall Ralphs 
961555e592a2SRandall Ralphs 	if (copyout(&devstate, dcp->cpyout_buf, sizeof (uint_t)) != 0)
961655e592a2SRandall Ralphs 		return (MDI_FAILURE);
961755e592a2SRandall Ralphs 
961855e592a2SRandall Ralphs 	return (MDI_SUCCESS);
961955e592a2SRandall Ralphs }
9620