xref: /titanic_51/usr/src/uts/common/os/sunmdi.c (revision d3d50737e566cade9a08d73d2af95105ac7cd960)
17c478bd9Sstevel@tonic-gate /*
27c478bd9Sstevel@tonic-gate  * CDDL HEADER START
37c478bd9Sstevel@tonic-gate  *
47c478bd9Sstevel@tonic-gate  * The contents of this file are subject to the terms of the
5ee28b439Scm136836  * Common Development and Distribution License (the "License").
6ee28b439Scm136836  * You may not use this file except in compliance with the License.
77c478bd9Sstevel@tonic-gate  *
87c478bd9Sstevel@tonic-gate  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
97c478bd9Sstevel@tonic-gate  * or http://www.opensolaris.org/os/licensing.
107c478bd9Sstevel@tonic-gate  * See the License for the specific language governing permissions
117c478bd9Sstevel@tonic-gate  * and limitations under the License.
127c478bd9Sstevel@tonic-gate  *
137c478bd9Sstevel@tonic-gate  * When distributing Covered Code, include this CDDL HEADER in each
147c478bd9Sstevel@tonic-gate  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
157c478bd9Sstevel@tonic-gate  * If applicable, add the following below this CDDL HEADER, with the
167c478bd9Sstevel@tonic-gate  * fields enclosed by brackets "[]" replaced with your own identifying
177c478bd9Sstevel@tonic-gate  * information: Portions Copyright [yyyy] [name of copyright owner]
187c478bd9Sstevel@tonic-gate  *
197c478bd9Sstevel@tonic-gate  * CDDL HEADER END
207c478bd9Sstevel@tonic-gate  */
217c478bd9Sstevel@tonic-gate /*
2255e592a2SRandall Ralphs  * Copyright 2009 Sun Microsystems, Inc.  All rights reserved.
237c478bd9Sstevel@tonic-gate  * Use is subject to license terms.
247c478bd9Sstevel@tonic-gate  */
257c478bd9Sstevel@tonic-gate 
/*
 * Multipath driver interface (MDI) implementation; see mdi_impldefs.h for a
 * more detailed discussion of the overall mpxio architecture.
 *
 * Default locking order:
 *
 * _NOTE(LOCK_ORDER(mdi_mutex mdi_vhci::vh_phci_mutex))
 * _NOTE(LOCK_ORDER(mdi_mutex mdi_vhci::vh_client_mutex))
 * _NOTE(LOCK_ORDER(mdi_vhci::vh_phci_mutex mdi_phci::ph_mutex))
 * _NOTE(LOCK_ORDER(mdi_vhci::vh_client_mutex mdi_client::ct_mutex))
 * _NOTE(LOCK_ORDER(mdi_phci::ph_mutex mdi_pathinfo::pi_mutex))
 * _NOTE(LOCK_ORDER(mdi_phci::ph_mutex mdi_client::ct_mutex))
 * _NOTE(LOCK_ORDER(mdi_client::ct_mutex mdi_pathinfo::pi_mutex))
 */
407c478bd9Sstevel@tonic-gate 
417c478bd9Sstevel@tonic-gate #include <sys/note.h>
427c478bd9Sstevel@tonic-gate #include <sys/types.h>
437c478bd9Sstevel@tonic-gate #include <sys/varargs.h>
447c478bd9Sstevel@tonic-gate #include <sys/param.h>
457c478bd9Sstevel@tonic-gate #include <sys/errno.h>
467c478bd9Sstevel@tonic-gate #include <sys/uio.h>
477c478bd9Sstevel@tonic-gate #include <sys/buf.h>
487c478bd9Sstevel@tonic-gate #include <sys/modctl.h>
497c478bd9Sstevel@tonic-gate #include <sys/open.h>
507c478bd9Sstevel@tonic-gate #include <sys/kmem.h>
517c478bd9Sstevel@tonic-gate #include <sys/poll.h>
527c478bd9Sstevel@tonic-gate #include <sys/conf.h>
537c478bd9Sstevel@tonic-gate #include <sys/bootconf.h>
547c478bd9Sstevel@tonic-gate #include <sys/cmn_err.h>
557c478bd9Sstevel@tonic-gate #include <sys/stat.h>
567c478bd9Sstevel@tonic-gate #include <sys/ddi.h>
577c478bd9Sstevel@tonic-gate #include <sys/sunddi.h>
587c478bd9Sstevel@tonic-gate #include <sys/ddipropdefs.h>
597c478bd9Sstevel@tonic-gate #include <sys/sunndi.h>
607c478bd9Sstevel@tonic-gate #include <sys/ndi_impldefs.h>
617c478bd9Sstevel@tonic-gate #include <sys/promif.h>
627c478bd9Sstevel@tonic-gate #include <sys/sunmdi.h>
637c478bd9Sstevel@tonic-gate #include <sys/mdi_impldefs.h>
647c478bd9Sstevel@tonic-gate #include <sys/taskq.h>
657c478bd9Sstevel@tonic-gate #include <sys/epm.h>
667c478bd9Sstevel@tonic-gate #include <sys/sunpm.h>
673c34adc5Sramat #include <sys/modhash.h>
688c4f8890Srs135747 #include <sys/disp.h>
698c4f8890Srs135747 #include <sys/autoconf.h>
70f7209cf2Spramodbg #include <sys/sysmacros.h>
717c478bd9Sstevel@tonic-gate 
/*
 * Debug logging support.
 *
 * On DEBUG kernels, MDI_DEBUG(level, (MDI_WARN, dip, fmt, ...)) passes the
 * parenthesized argument list to i_mdi_log() when the mdi_debug tunable is
 * at least 'level'.  MDI_WARN, MDI_NOTE and MDI_CONT each expand to a
 * cmn_err level followed by the calling function's name, i.e. the first two
 * arguments of i_mdi_log().
 *
 * The DEBUG form is wrapped in do { } while (0) so that an invocation is
 * always exactly one statement.  A bare "if (...) call" expansion would
 * capture the "else" of an enclosing unbraced if/else at the call site.
 *
 * On non-DEBUG kernels MDI_DEBUG() expands to nothing, so its arguments are
 * never evaluated; they must not carry side effects.
 */
#ifdef	DEBUG
#include <sys/debug.h>
int	mdi_debug = 1;			/* messages at or below this level */
int	mdi_debug_logonly = 0;		/* presumably read by i_mdi_log() */
#define	MDI_DEBUG(dbglevel, pargs)		\
	do {					\
		if (mdi_debug >= (dbglevel))	\
			i_mdi_log pargs;	\
	_NOTE(CONSTCOND) } while (0)
#define	MDI_WARN	CE_WARN, __func__
#define	MDI_NOTE	CE_NOTE, __func__
#define	MDI_CONT	CE_CONT, __func__
static void i_mdi_log(int, const char *, dev_info_t *, const char *, ...);
#else	/* !DEBUG */
#define	MDI_DEBUG(dbglevel, pargs)
#endif	/* DEBUG */

/*
 * Defined for both DEBUG and non-DEBUG kernels.
 * NOTE(review): the consumers of these two tunables are outside this part of
 * the file; their exact meaning should be confirmed there.
 */
int	mdi_debug_consoleonly = 0;
int	mdi_delay = 3;
867c478bd9Sstevel@tonic-gate 
877c478bd9Sstevel@tonic-gate extern pri_t	minclsyspri;
887c478bd9Sstevel@tonic-gate extern int	modrootloaded;
897c478bd9Sstevel@tonic-gate 
907c478bd9Sstevel@tonic-gate /*
917c478bd9Sstevel@tonic-gate  * Global mutex:
925e3986cbScth  * Protects vHCI list and structure members.
937c478bd9Sstevel@tonic-gate  */
947c478bd9Sstevel@tonic-gate kmutex_t	mdi_mutex;
957c478bd9Sstevel@tonic-gate 
967c478bd9Sstevel@tonic-gate /*
977c478bd9Sstevel@tonic-gate  * Registered vHCI class driver lists
987c478bd9Sstevel@tonic-gate  */
997c478bd9Sstevel@tonic-gate int		mdi_vhci_count;
1007c478bd9Sstevel@tonic-gate mdi_vhci_t	*mdi_vhci_head;
1017c478bd9Sstevel@tonic-gate mdi_vhci_t	*mdi_vhci_tail;
1027c478bd9Sstevel@tonic-gate 
1037c478bd9Sstevel@tonic-gate /*
1047c478bd9Sstevel@tonic-gate  * Client Hash Table size
1057c478bd9Sstevel@tonic-gate  */
1067c478bd9Sstevel@tonic-gate static int	mdi_client_table_size = CLIENT_HASH_TABLE_SIZE;
1077c478bd9Sstevel@tonic-gate 
1087c478bd9Sstevel@tonic-gate /*
1097c478bd9Sstevel@tonic-gate  * taskq interface definitions
1107c478bd9Sstevel@tonic-gate  */
1117c478bd9Sstevel@tonic-gate #define	MDI_TASKQ_N_THREADS	8
1127c478bd9Sstevel@tonic-gate #define	MDI_TASKQ_PRI		minclsyspri
1137c478bd9Sstevel@tonic-gate #define	MDI_TASKQ_MINALLOC	(4*mdi_taskq_n_threads)
1147c478bd9Sstevel@tonic-gate #define	MDI_TASKQ_MAXALLOC	(500*mdi_taskq_n_threads)
1157c478bd9Sstevel@tonic-gate 
1167c478bd9Sstevel@tonic-gate taskq_t				*mdi_taskq;
1177c478bd9Sstevel@tonic-gate static uint_t			mdi_taskq_n_threads = MDI_TASKQ_N_THREADS;
1187c478bd9Sstevel@tonic-gate 
/* Clock ticks in one second (1000000 microseconds). */
#define	TICKS_PER_SECOND	(drv_usectohz(1000000))

/*
 * vhci cache flushing.
 *
 * mdi_vhcache_flush_delay
 *	The cached vhci data must be "quiet" for this many seconds before it
 *	is flushed to the disk.
 *
 * mdi_vhcache_flush_daemon_idle_time
 *	Number of seconds the vhcache flush daemon will sleep idle before
 *	exiting.
 */
static int mdi_vhcache_flush_delay = 10;
static int mdi_vhcache_flush_daemon_idle_time = 60;

/*
 * Path discovery.
 *
 * When a bus_config_one fails, MDI falls back to discovery of all paths.
 * The parameters below tune that fallback.
 *
 * mdi_path_discovery_boot
 *	Number of times path discovery will be attempted during early boot.
 *	Probably there is no reason to ever set this value to greater than
 *	one.
 *
 * mdi_path_discovery_postboot
 *	Number of times path discovery will be attempted after early boot.
 *	Set it to a minimum of two to allow for discovery of iscsi paths
 *	which may happen very late during booting.
 *
 * mdi_path_discovery_interval
 *	Minimum number of seconds MDI will wait between successive
 *	discoveries of all paths.  Set it to -1 to disable discovery of all
 *	paths.
 */
static int mdi_path_discovery_boot = 1;
static int mdi_path_discovery_postboot = 2;
static int mdi_path_discovery_interval = 10;

/*
 * Asynchronous configuration.
 *
 * mdi_async_config_idle_time
 *	Number of seconds the asynchronous configuration thread will sleep
 *	idle before exiting.
 *
 * mdi_bus_config_cache_hash_size
 *	Size used for the bus config cache hash.
 *
 * mdi_mtc_off
 *	When set, turns off multithreaded configuration for certain
 *	operations.
 */
static int mdi_async_config_idle_time = 600;
static int mdi_bus_config_cache_hash_size = 256;
static int mdi_mtc_off = 0;
1617c478bd9Sstevel@tonic-gate 
1627c478bd9Sstevel@tonic-gate /*
163602ca9eaScth  * The "path" to a pathinfo node is identical to the /devices path to a
164602ca9eaScth  * devinfo node had the device been enumerated under a pHCI instead of
165602ca9eaScth  * a vHCI.  This pathinfo "path" is associated with a 'path_instance'.
166602ca9eaScth  * This association persists across create/delete of the pathinfo nodes,
167602ca9eaScth  * but not across reboot.
168602ca9eaScth  */
169602ca9eaScth static uint_t		mdi_pathmap_instance = 1;	/* 0 -> any path */
170602ca9eaScth static int		mdi_pathmap_hash_size = 256;
171602ca9eaScth static kmutex_t		mdi_pathmap_mutex;
172602ca9eaScth static mod_hash_t	*mdi_pathmap_bypath;		/* "path"->instance */
173602ca9eaScth static mod_hash_t	*mdi_pathmap_byinstance;	/* instance->"path" */
1744c06356bSdh142964 static mod_hash_t	*mdi_pathmap_sbyinstance;	/* inst->shortpath */
175602ca9eaScth 
/*
 * MDI component property: its name, followed by the values it can take.
 */
const char *mdi_component_prop = "mpxio-component";
const char *mdi_component_prop_vhci = "vhci";
const char *mdi_component_prop_phci = "phci";
const char *mdi_component_prop_client = "client";

/*
 * Name of the property carrying an MDI client's global unique identifier.
 */
const char *mdi_client_guid_prop = "client-guid";

/*
 * MDI client load balancing property: its name, followed by the values it
 * can take.
 */
const char *mdi_load_balance = "load-balance";
const char *mdi_load_balance_none = "none";
const char *mdi_load_balance_rr = "round-robin";
const char *mdi_load_balance_lba = "logical-block";
1967c478bd9Sstevel@tonic-gate 
1977c478bd9Sstevel@tonic-gate /*
1987c478bd9Sstevel@tonic-gate  * Obsolete vHCI class definition; to be removed after Leadville update
1997c478bd9Sstevel@tonic-gate  */
2007c478bd9Sstevel@tonic-gate const char *mdi_vhci_class_scsi = MDI_HCI_CLASS_SCSI;
2017c478bd9Sstevel@tonic-gate 
2027c478bd9Sstevel@tonic-gate static char vhci_greeting[] =
2037c478bd9Sstevel@tonic-gate 	"\tThere already exists one vHCI driver for class %s\n"
2047c478bd9Sstevel@tonic-gate 	"\tOnly one vHCI driver for each class is allowed\n";
2057c478bd9Sstevel@tonic-gate 
2067c478bd9Sstevel@tonic-gate /*
2077c478bd9Sstevel@tonic-gate  * Static function prototypes
2087c478bd9Sstevel@tonic-gate  */
2097c478bd9Sstevel@tonic-gate static int		i_mdi_phci_offline(dev_info_t *, uint_t);
2107c478bd9Sstevel@tonic-gate static int		i_mdi_client_offline(dev_info_t *, uint_t);
2117c478bd9Sstevel@tonic-gate static int		i_mdi_phci_pre_detach(dev_info_t *, ddi_detach_cmd_t);
2127c478bd9Sstevel@tonic-gate static void		i_mdi_phci_post_detach(dev_info_t *,
2137c478bd9Sstevel@tonic-gate 			    ddi_detach_cmd_t, int);
2147c478bd9Sstevel@tonic-gate static int		i_mdi_client_pre_detach(dev_info_t *,
2157c478bd9Sstevel@tonic-gate 			    ddi_detach_cmd_t);
2167c478bd9Sstevel@tonic-gate static void		i_mdi_client_post_detach(dev_info_t *,
2177c478bd9Sstevel@tonic-gate 			    ddi_detach_cmd_t, int);
2187c478bd9Sstevel@tonic-gate static void		i_mdi_pm_hold_pip(mdi_pathinfo_t *);
2197c478bd9Sstevel@tonic-gate static void		i_mdi_pm_rele_pip(mdi_pathinfo_t *);
2207c478bd9Sstevel@tonic-gate static int 		i_mdi_lba_lb(mdi_client_t *ct,
2217c478bd9Sstevel@tonic-gate 			    mdi_pathinfo_t **ret_pip, struct buf *buf);
2227c478bd9Sstevel@tonic-gate static void		i_mdi_pm_hold_client(mdi_client_t *, int);
2237c478bd9Sstevel@tonic-gate static void		i_mdi_pm_rele_client(mdi_client_t *, int);
2247c478bd9Sstevel@tonic-gate static void		i_mdi_pm_reset_client(mdi_client_t *);
2257c478bd9Sstevel@tonic-gate static int		i_mdi_power_all_phci(mdi_client_t *);
2268c4f8890Srs135747 static void		i_mdi_log_sysevent(dev_info_t *, char *, char *);
2277c478bd9Sstevel@tonic-gate 
2287c478bd9Sstevel@tonic-gate 
2297c478bd9Sstevel@tonic-gate /*
2307c478bd9Sstevel@tonic-gate  * Internal mdi_pathinfo node functions
2317c478bd9Sstevel@tonic-gate  */
2327c478bd9Sstevel@tonic-gate static void		i_mdi_pi_kstat_destroy(mdi_pathinfo_t *);
2337c478bd9Sstevel@tonic-gate 
2347c478bd9Sstevel@tonic-gate static mdi_vhci_t	*i_mdi_vhci_class2vhci(char *);
2357c478bd9Sstevel@tonic-gate static mdi_vhci_t	*i_devi_get_vhci(dev_info_t *);
2367c478bd9Sstevel@tonic-gate static mdi_phci_t	*i_devi_get_phci(dev_info_t *);
2377c478bd9Sstevel@tonic-gate static void		i_mdi_phci_lock(mdi_phci_t *, mdi_pathinfo_t *);
2387c478bd9Sstevel@tonic-gate static void		i_mdi_phci_unlock(mdi_phci_t *);
2393c34adc5Sramat static mdi_pathinfo_t	*i_mdi_pi_alloc(mdi_phci_t *, char *, mdi_client_t *);
2407c478bd9Sstevel@tonic-gate static void		i_mdi_phci_add_path(mdi_phci_t *, mdi_pathinfo_t *);
2417c478bd9Sstevel@tonic-gate static void		i_mdi_client_add_path(mdi_client_t *, mdi_pathinfo_t *);
2427c478bd9Sstevel@tonic-gate static void		i_mdi_pi_free(mdi_phci_t *ph, mdi_pathinfo_t *,
2437c478bd9Sstevel@tonic-gate 			    mdi_client_t *);
2447c478bd9Sstevel@tonic-gate static void		i_mdi_phci_remove_path(mdi_phci_t *, mdi_pathinfo_t *);
2457c478bd9Sstevel@tonic-gate static void		i_mdi_client_remove_path(mdi_client_t *,
2467c478bd9Sstevel@tonic-gate 			    mdi_pathinfo_t *);
2477c478bd9Sstevel@tonic-gate 
2487c478bd9Sstevel@tonic-gate static int		i_mdi_pi_state_change(mdi_pathinfo_t *,
2497c478bd9Sstevel@tonic-gate 			    mdi_pathinfo_state_t, int);
2507c478bd9Sstevel@tonic-gate static int		i_mdi_pi_offline(mdi_pathinfo_t *, int);
2517c478bd9Sstevel@tonic-gate static dev_info_t	*i_mdi_devinfo_create(mdi_vhci_t *, char *, char *,
2523c34adc5Sramat 			    char **, int);
2537c478bd9Sstevel@tonic-gate static dev_info_t	*i_mdi_devinfo_find(mdi_vhci_t *, char *, char *);
2547c478bd9Sstevel@tonic-gate static int		i_mdi_devinfo_remove(dev_info_t *, dev_info_t *, int);
2557c478bd9Sstevel@tonic-gate static int		i_mdi_is_child_present(dev_info_t *, dev_info_t *);
2563c34adc5Sramat static mdi_client_t	*i_mdi_client_alloc(mdi_vhci_t *, char *, char *);
2577c478bd9Sstevel@tonic-gate static void		i_mdi_client_enlist_table(mdi_vhci_t *, mdi_client_t *);
2587c478bd9Sstevel@tonic-gate static void		i_mdi_client_delist_table(mdi_vhci_t *, mdi_client_t *);
2593c34adc5Sramat static mdi_client_t	*i_mdi_client_find(mdi_vhci_t *, char *, char *);
2607c478bd9Sstevel@tonic-gate static void		i_mdi_client_update_state(mdi_client_t *);
2617c478bd9Sstevel@tonic-gate static int		i_mdi_client_compute_state(mdi_client_t *,
2627c478bd9Sstevel@tonic-gate 			    mdi_phci_t *);
2637c478bd9Sstevel@tonic-gate static void		i_mdi_client_lock(mdi_client_t *, mdi_pathinfo_t *);
2647c478bd9Sstevel@tonic-gate static void		i_mdi_client_unlock(mdi_client_t *);
2657c478bd9Sstevel@tonic-gate static int		i_mdi_client_free(mdi_vhci_t *, mdi_client_t *);
2667c478bd9Sstevel@tonic-gate static mdi_client_t	*i_devi_get_client(dev_info_t *);
267ee28b439Scm136836 /*
268ee28b439Scm136836  * NOTE: this will be removed once the NWS files are changed to use the new
269ee28b439Scm136836  * mdi_{enable,disable}_path interfaces
270ee28b439Scm136836  */
271ee28b439Scm136836 static int		i_mdi_pi_enable_disable(dev_info_t *, dev_info_t *,
272ee28b439Scm136836 				int, int);
273ee28b439Scm136836 static mdi_pathinfo_t 	*i_mdi_enable_disable_path(mdi_pathinfo_t *pip,
274ee28b439Scm136836 				mdi_vhci_t *vh, int flags, int op);
2757c478bd9Sstevel@tonic-gate /*
2767c478bd9Sstevel@tonic-gate  * Failover related function prototypes
2777c478bd9Sstevel@tonic-gate  */
2787c478bd9Sstevel@tonic-gate static int		i_mdi_failover(void *);
2797c478bd9Sstevel@tonic-gate 
2807c478bd9Sstevel@tonic-gate /*
2817c478bd9Sstevel@tonic-gate  * misc internal functions
2827c478bd9Sstevel@tonic-gate  */
2837c478bd9Sstevel@tonic-gate static int		i_mdi_get_hash_key(char *);
2847c478bd9Sstevel@tonic-gate static int		i_map_nvlist_error_to_mdi(int);
2857c478bd9Sstevel@tonic-gate static void		i_mdi_report_path_state(mdi_client_t *,
2867c478bd9Sstevel@tonic-gate 			    mdi_pathinfo_t *);
2877c478bd9Sstevel@tonic-gate 
2883c34adc5Sramat static void		setup_vhci_cache(mdi_vhci_t *);
2893c34adc5Sramat static int		destroy_vhci_cache(mdi_vhci_t *);
2903c34adc5Sramat static int		stop_vhcache_async_threads(mdi_vhci_config_t *);
2913c34adc5Sramat static boolean_t	stop_vhcache_flush_thread(void *, int);
2923c34adc5Sramat static void		free_string_array(char **, int);
2933c34adc5Sramat static void		free_vhcache_phci(mdi_vhcache_phci_t *);
2943c34adc5Sramat static void		free_vhcache_pathinfo(mdi_vhcache_pathinfo_t *);
2953c34adc5Sramat static void		free_vhcache_client(mdi_vhcache_client_t *);
2963c34adc5Sramat static int		mainnvl_to_vhcache(mdi_vhci_cache_t *, nvlist_t *);
2973c34adc5Sramat static nvlist_t		*vhcache_to_mainnvl(mdi_vhci_cache_t *);
2983c34adc5Sramat static void		vhcache_phci_add(mdi_vhci_config_t *, mdi_phci_t *);
2993c34adc5Sramat static void		vhcache_phci_remove(mdi_vhci_config_t *, mdi_phci_t *);
3003c34adc5Sramat static void		vhcache_pi_add(mdi_vhci_config_t *,
3013c34adc5Sramat 			    struct mdi_pathinfo *);
3023c34adc5Sramat static void		vhcache_pi_remove(mdi_vhci_config_t *,
3033c34adc5Sramat 			    struct mdi_pathinfo *);
3043c34adc5Sramat static void		free_phclient_path_list(mdi_phys_path_t *);
3053c34adc5Sramat static void		sort_vhcache_paths(mdi_vhcache_client_t *);
3063c34adc5Sramat static int		flush_vhcache(mdi_vhci_config_t *, int);
3073c34adc5Sramat static void		vhcache_dirty(mdi_vhci_config_t *);
3083c34adc5Sramat static void		free_async_client_config(mdi_async_client_config_t *);
30967e56d35Sramat static void		single_threaded_vhconfig_enter(mdi_vhci_config_t *);
31067e56d35Sramat static void		single_threaded_vhconfig_exit(mdi_vhci_config_t *);
3113c34adc5Sramat static nvlist_t		*read_on_disk_vhci_cache(char *);
3123c34adc5Sramat extern int		fread_nvlist(char *, nvlist_t **);
3133c34adc5Sramat extern int		fwrite_nvlist(char *, nvlist_t *);
3143c34adc5Sramat 
3157c478bd9Sstevel@tonic-gate /* called once when first vhci registers with mdi */
3167c478bd9Sstevel@tonic-gate static void
3177c478bd9Sstevel@tonic-gate i_mdi_init()
3187c478bd9Sstevel@tonic-gate {
3197c478bd9Sstevel@tonic-gate 	static int initialized = 0;
3207c478bd9Sstevel@tonic-gate 
3217c478bd9Sstevel@tonic-gate 	if (initialized)
3227c478bd9Sstevel@tonic-gate 		return;
3237c478bd9Sstevel@tonic-gate 	initialized = 1;
3247c478bd9Sstevel@tonic-gate 
3257c478bd9Sstevel@tonic-gate 	mutex_init(&mdi_mutex, NULL, MUTEX_DEFAULT, NULL);
326602ca9eaScth 
327602ca9eaScth 	/* Create our taskq resources */
3287c478bd9Sstevel@tonic-gate 	mdi_taskq = taskq_create("mdi_taskq", mdi_taskq_n_threads,
3297c478bd9Sstevel@tonic-gate 	    MDI_TASKQ_PRI, MDI_TASKQ_MINALLOC, MDI_TASKQ_MAXALLOC,
3307c478bd9Sstevel@tonic-gate 	    TASKQ_PREPOPULATE | TASKQ_CPR_SAFE);
3317c478bd9Sstevel@tonic-gate 	ASSERT(mdi_taskq != NULL);	/* taskq_create never fails */
332602ca9eaScth 
333602ca9eaScth 	/* Allocate ['path_instance' <-> "path"] maps */
334602ca9eaScth 	mutex_init(&mdi_pathmap_mutex, NULL, MUTEX_DRIVER, NULL);
335602ca9eaScth 	mdi_pathmap_bypath = mod_hash_create_strhash(
336602ca9eaScth 	    "mdi_pathmap_bypath", mdi_pathmap_hash_size,
337602ca9eaScth 	    mod_hash_null_valdtor);
338602ca9eaScth 	mdi_pathmap_byinstance = mod_hash_create_idhash(
339602ca9eaScth 	    "mdi_pathmap_byinstance", mdi_pathmap_hash_size,
340602ca9eaScth 	    mod_hash_null_valdtor);
3414c06356bSdh142964 	mdi_pathmap_sbyinstance = mod_hash_create_idhash(
3424c06356bSdh142964 	    "mdi_pathmap_sbyinstance", mdi_pathmap_hash_size,
3434c06356bSdh142964 	    mod_hash_null_valdtor);
3447c478bd9Sstevel@tonic-gate }
3457c478bd9Sstevel@tonic-gate 
3467c478bd9Sstevel@tonic-gate /*
3477c478bd9Sstevel@tonic-gate  * mdi_get_component_type():
3487c478bd9Sstevel@tonic-gate  *		Return mpxio component type
3497c478bd9Sstevel@tonic-gate  * Return Values:
3507c478bd9Sstevel@tonic-gate  *		MDI_COMPONENT_NONE
3517c478bd9Sstevel@tonic-gate  *		MDI_COMPONENT_VHCI
3527c478bd9Sstevel@tonic-gate  *		MDI_COMPONENT_PHCI
3537c478bd9Sstevel@tonic-gate  *		MDI_COMPONENT_CLIENT
3547c478bd9Sstevel@tonic-gate  * XXX This doesn't work under multi-level MPxIO and should be
3555e3986cbScth  *	removed when clients migrate mdi_component_is_*() interfaces.
3567c478bd9Sstevel@tonic-gate  */
3577c478bd9Sstevel@tonic-gate int
3587c478bd9Sstevel@tonic-gate mdi_get_component_type(dev_info_t *dip)
3597c478bd9Sstevel@tonic-gate {
3607c478bd9Sstevel@tonic-gate 	return (DEVI(dip)->devi_mdi_component);
3617c478bd9Sstevel@tonic-gate }
3627c478bd9Sstevel@tonic-gate 
3637c478bd9Sstevel@tonic-gate /*
3647c478bd9Sstevel@tonic-gate  * mdi_vhci_register():
3657c478bd9Sstevel@tonic-gate  *		Register a vHCI module with the mpxio framework
3667c478bd9Sstevel@tonic-gate  *		mdi_vhci_register() is called by vHCI drivers to register the
3677c478bd9Sstevel@tonic-gate  *		'class_driver' vHCI driver and its MDI entrypoints with the
3687c478bd9Sstevel@tonic-gate  *		mpxio framework.  The vHCI driver must call this interface as
3697c478bd9Sstevel@tonic-gate  *		part of its attach(9e) handler.
3707c478bd9Sstevel@tonic-gate  *		Competing threads may try to attach mdi_vhci_register() as
3717c478bd9Sstevel@tonic-gate  *		the vHCI drivers are loaded and attached as a result of pHCI
3727c478bd9Sstevel@tonic-gate  *		driver instance registration (mdi_phci_register()) with the
3737c478bd9Sstevel@tonic-gate  *		framework.
3747c478bd9Sstevel@tonic-gate  * Return Values:
3757c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
3767c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
3777c478bd9Sstevel@tonic-gate  */
3787c478bd9Sstevel@tonic-gate /*ARGSUSED*/
3797c478bd9Sstevel@tonic-gate int
3807c478bd9Sstevel@tonic-gate mdi_vhci_register(char *class, dev_info_t *vdip, mdi_vhci_ops_t *vops,
3817c478bd9Sstevel@tonic-gate     int flags)
3827c478bd9Sstevel@tonic-gate {
3837c478bd9Sstevel@tonic-gate 	mdi_vhci_t		*vh = NULL;
3847c478bd9Sstevel@tonic-gate 
38555e592a2SRandall Ralphs 	/* Registrant can't be older */
38655e592a2SRandall Ralphs 	ASSERT(vops->vo_revision <= MDI_VHCI_OPS_REV);
38755e592a2SRandall Ralphs 
38800a3eaf3SRamaswamy Tummala #ifdef DEBUG
38900a3eaf3SRamaswamy Tummala 	/*
39000a3eaf3SRamaswamy Tummala 	 * IB nexus driver is loaded only when IB hardware is present.
39100a3eaf3SRamaswamy Tummala 	 * In order to be able to do this there is a need to drive the loading
39200a3eaf3SRamaswamy Tummala 	 * and attaching of the IB nexus driver (especially when an IB hardware
39300a3eaf3SRamaswamy Tummala 	 * is dynamically plugged in) when an IB HCA driver (PHCI)
39400a3eaf3SRamaswamy Tummala 	 * is being attached. Unfortunately this gets into the limitations
39500a3eaf3SRamaswamy Tummala 	 * of devfs as there seems to be no clean way to drive configuration
39600a3eaf3SRamaswamy Tummala 	 * of a subtree from another subtree of a devfs. Hence, do not ASSERT
39700a3eaf3SRamaswamy Tummala 	 * for IB.
39800a3eaf3SRamaswamy Tummala 	 */
39900a3eaf3SRamaswamy Tummala 	if (strcmp(class, MDI_HCI_CLASS_IB) != 0)
4005e3986cbScth 		ASSERT(DEVI_BUSY_OWNED(ddi_get_parent(vdip)));
40100a3eaf3SRamaswamy Tummala #endif
4027c478bd9Sstevel@tonic-gate 
4037c478bd9Sstevel@tonic-gate 	i_mdi_init();
4047c478bd9Sstevel@tonic-gate 
4057c478bd9Sstevel@tonic-gate 	mutex_enter(&mdi_mutex);
4067c478bd9Sstevel@tonic-gate 	/*
4077c478bd9Sstevel@tonic-gate 	 * Scan for already registered vhci
4087c478bd9Sstevel@tonic-gate 	 */
4097c478bd9Sstevel@tonic-gate 	for (vh = mdi_vhci_head; vh != NULL; vh = vh->vh_next) {
4107c478bd9Sstevel@tonic-gate 		if (strcmp(vh->vh_class, class) == 0) {
4117c478bd9Sstevel@tonic-gate 			/*
4127c478bd9Sstevel@tonic-gate 			 * vHCI has already been created.  Check for valid
4137c478bd9Sstevel@tonic-gate 			 * vHCI ops registration.  We only support one vHCI
4147c478bd9Sstevel@tonic-gate 			 * module per class
4157c478bd9Sstevel@tonic-gate 			 */
4167c478bd9Sstevel@tonic-gate 			if (vh->vh_ops != NULL) {
4177c478bd9Sstevel@tonic-gate 				mutex_exit(&mdi_mutex);
4187c478bd9Sstevel@tonic-gate 				cmn_err(CE_NOTE, vhci_greeting, class);
4197c478bd9Sstevel@tonic-gate 				return (MDI_FAILURE);
4207c478bd9Sstevel@tonic-gate 			}
4217c478bd9Sstevel@tonic-gate 			break;
4227c478bd9Sstevel@tonic-gate 		}
4237c478bd9Sstevel@tonic-gate 	}
4247c478bd9Sstevel@tonic-gate 
4257c478bd9Sstevel@tonic-gate 	/*
4267c478bd9Sstevel@tonic-gate 	 * if not yet created, create the vHCI component
4277c478bd9Sstevel@tonic-gate 	 */
4287c478bd9Sstevel@tonic-gate 	if (vh == NULL) {
4297c478bd9Sstevel@tonic-gate 		struct client_hash	*hash = NULL;
4307c478bd9Sstevel@tonic-gate 		char			*load_balance;
4317c478bd9Sstevel@tonic-gate 
4327c478bd9Sstevel@tonic-gate 		/*
4337c478bd9Sstevel@tonic-gate 		 * Allocate and initialize the mdi extensions
4347c478bd9Sstevel@tonic-gate 		 */
4357c478bd9Sstevel@tonic-gate 		vh = kmem_zalloc(sizeof (mdi_vhci_t), KM_SLEEP);
4367c478bd9Sstevel@tonic-gate 		hash = kmem_zalloc(mdi_client_table_size * sizeof (*hash),
4377c478bd9Sstevel@tonic-gate 		    KM_SLEEP);
4387c478bd9Sstevel@tonic-gate 		vh->vh_client_table = hash;
4397c478bd9Sstevel@tonic-gate 		vh->vh_class = kmem_zalloc(strlen(class) + 1, KM_SLEEP);
4407c478bd9Sstevel@tonic-gate 		(void) strcpy(vh->vh_class, class);
4417c478bd9Sstevel@tonic-gate 		vh->vh_lb = LOAD_BALANCE_RR;
4427c478bd9Sstevel@tonic-gate 		if (ddi_prop_lookup_string(DDI_DEV_T_ANY, vdip,
4437c478bd9Sstevel@tonic-gate 		    0, LOAD_BALANCE_PROP, &load_balance) == DDI_SUCCESS) {
4447c478bd9Sstevel@tonic-gate 			if (strcmp(load_balance, LOAD_BALANCE_PROP_NONE) == 0) {
4457c478bd9Sstevel@tonic-gate 				vh->vh_lb = LOAD_BALANCE_NONE;
4467c478bd9Sstevel@tonic-gate 			} else if (strcmp(load_balance, LOAD_BALANCE_PROP_LBA)
4477c478bd9Sstevel@tonic-gate 				    == 0) {
4487c478bd9Sstevel@tonic-gate 				vh->vh_lb = LOAD_BALANCE_LBA;
4497c478bd9Sstevel@tonic-gate 			}
4507c478bd9Sstevel@tonic-gate 			ddi_prop_free(load_balance);
4517c478bd9Sstevel@tonic-gate 		}
4527c478bd9Sstevel@tonic-gate 
4535e3986cbScth 		mutex_init(&vh->vh_phci_mutex, NULL, MUTEX_DEFAULT, NULL);
4545e3986cbScth 		mutex_init(&vh->vh_client_mutex, NULL, MUTEX_DEFAULT, NULL);
4555e3986cbScth 
4567c478bd9Sstevel@tonic-gate 		/*
4577c478bd9Sstevel@tonic-gate 		 * Store the vHCI ops vectors
4587c478bd9Sstevel@tonic-gate 		 */
4597c478bd9Sstevel@tonic-gate 		vh->vh_dip = vdip;
4607c478bd9Sstevel@tonic-gate 		vh->vh_ops = vops;
4617c478bd9Sstevel@tonic-gate 
4623c34adc5Sramat 		setup_vhci_cache(vh);
4637c478bd9Sstevel@tonic-gate 
4647c478bd9Sstevel@tonic-gate 		if (mdi_vhci_head == NULL) {
4657c478bd9Sstevel@tonic-gate 			mdi_vhci_head = vh;
4667c478bd9Sstevel@tonic-gate 		}
4677c478bd9Sstevel@tonic-gate 		if (mdi_vhci_tail) {
4687c478bd9Sstevel@tonic-gate 			mdi_vhci_tail->vh_next = vh;
4697c478bd9Sstevel@tonic-gate 		}
4707c478bd9Sstevel@tonic-gate 		mdi_vhci_tail = vh;
4717c478bd9Sstevel@tonic-gate 		mdi_vhci_count++;
4727c478bd9Sstevel@tonic-gate 	}
4737c478bd9Sstevel@tonic-gate 
4747c478bd9Sstevel@tonic-gate 	/*
4757c478bd9Sstevel@tonic-gate 	 * Claim the devfs node as a vhci component
4767c478bd9Sstevel@tonic-gate 	 */
4777c478bd9Sstevel@tonic-gate 	DEVI(vdip)->devi_mdi_component |= MDI_COMPONENT_VHCI;
4787c478bd9Sstevel@tonic-gate 
4797c478bd9Sstevel@tonic-gate 	/*
4807c478bd9Sstevel@tonic-gate 	 * Initialize our back reference from dev_info node
4817c478bd9Sstevel@tonic-gate 	 */
4827c478bd9Sstevel@tonic-gate 	DEVI(vdip)->devi_mdi_xhci = (caddr_t)vh;
4837c478bd9Sstevel@tonic-gate 	mutex_exit(&mdi_mutex);
4847c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
4857c478bd9Sstevel@tonic-gate }
4867c478bd9Sstevel@tonic-gate 
4877c478bd9Sstevel@tonic-gate /*
4887c478bd9Sstevel@tonic-gate  * mdi_vhci_unregister():
4897c478bd9Sstevel@tonic-gate  *		Unregister a vHCI module from mpxio framework
4907c478bd9Sstevel@tonic-gate  *		mdi_vhci_unregister() is called from the detach(9E) entrypoint
4917c478bd9Sstevel@tonic-gate  * 		of a vhci to unregister it from the framework.
4927c478bd9Sstevel@tonic-gate  * Return Values:
4937c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
4947c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
4957c478bd9Sstevel@tonic-gate  */
4967c478bd9Sstevel@tonic-gate /*ARGSUSED*/
4977c478bd9Sstevel@tonic-gate int
4987c478bd9Sstevel@tonic-gate mdi_vhci_unregister(dev_info_t *vdip, int flags)
4997c478bd9Sstevel@tonic-gate {
5007c478bd9Sstevel@tonic-gate 	mdi_vhci_t	*found, *vh, *prev = NULL;
5017c478bd9Sstevel@tonic-gate 
5025e3986cbScth 	ASSERT(DEVI_BUSY_OWNED(ddi_get_parent(vdip)));
5035e3986cbScth 
5047c478bd9Sstevel@tonic-gate 	/*
5057c478bd9Sstevel@tonic-gate 	 * Check for invalid VHCI
5067c478bd9Sstevel@tonic-gate 	 */
5077c478bd9Sstevel@tonic-gate 	if ((vh = i_devi_get_vhci(vdip)) == NULL)
5087c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
5097c478bd9Sstevel@tonic-gate 
5107c478bd9Sstevel@tonic-gate 	/*
5117c478bd9Sstevel@tonic-gate 	 * Scan the list of registered vHCIs for a match
5127c478bd9Sstevel@tonic-gate 	 */
5135e3986cbScth 	mutex_enter(&mdi_mutex);
5147c478bd9Sstevel@tonic-gate 	for (found = mdi_vhci_head; found != NULL; found = found->vh_next) {
5157c478bd9Sstevel@tonic-gate 		if (found == vh)
5167c478bd9Sstevel@tonic-gate 			break;
5177c478bd9Sstevel@tonic-gate 		prev = found;
5187c478bd9Sstevel@tonic-gate 	}
5197c478bd9Sstevel@tonic-gate 
5207c478bd9Sstevel@tonic-gate 	if (found == NULL) {
5217c478bd9Sstevel@tonic-gate 		mutex_exit(&mdi_mutex);
5227c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
5237c478bd9Sstevel@tonic-gate 	}
5247c478bd9Sstevel@tonic-gate 
5257c478bd9Sstevel@tonic-gate 	/*
5268c4f8890Srs135747 	 * Check the vHCI, pHCI and client count. All the pHCIs and clients
5277c478bd9Sstevel@tonic-gate 	 * should have been unregistered, before a vHCI can be
5287c478bd9Sstevel@tonic-gate 	 * unregistered.
5297c478bd9Sstevel@tonic-gate 	 */
5305e3986cbScth 	MDI_VHCI_PHCI_LOCK(vh);
5315e3986cbScth 	if (vh->vh_refcnt || vh->vh_phci_count || vh->vh_client_count) {
5325e3986cbScth 		MDI_VHCI_PHCI_UNLOCK(vh);
5335e3986cbScth 		mutex_exit(&mdi_mutex);
5345e3986cbScth 		return (MDI_FAILURE);
5355e3986cbScth 	}
5365e3986cbScth 	MDI_VHCI_PHCI_UNLOCK(vh);
5375e3986cbScth 
5385e3986cbScth 	if (destroy_vhci_cache(vh) != MDI_SUCCESS) {
5397c478bd9Sstevel@tonic-gate 		mutex_exit(&mdi_mutex);
5407c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
5417c478bd9Sstevel@tonic-gate 	}
5427c478bd9Sstevel@tonic-gate 
5437c478bd9Sstevel@tonic-gate 	/*
5447c478bd9Sstevel@tonic-gate 	 * Remove the vHCI from the global list
5457c478bd9Sstevel@tonic-gate 	 */
5467c478bd9Sstevel@tonic-gate 	if (vh == mdi_vhci_head) {
5477c478bd9Sstevel@tonic-gate 		mdi_vhci_head = vh->vh_next;
5487c478bd9Sstevel@tonic-gate 	} else {
5497c478bd9Sstevel@tonic-gate 		prev->vh_next = vh->vh_next;
5507c478bd9Sstevel@tonic-gate 	}
5517c478bd9Sstevel@tonic-gate 	if (vh == mdi_vhci_tail) {
5527c478bd9Sstevel@tonic-gate 		mdi_vhci_tail = prev;
5537c478bd9Sstevel@tonic-gate 	}
5547c478bd9Sstevel@tonic-gate 	mdi_vhci_count--;
5557c478bd9Sstevel@tonic-gate 	mutex_exit(&mdi_mutex);
5563c34adc5Sramat 
5573c34adc5Sramat 	vh->vh_ops = NULL;
5587c478bd9Sstevel@tonic-gate 	DEVI(vdip)->devi_mdi_component &= ~MDI_COMPONENT_VHCI;
5597c478bd9Sstevel@tonic-gate 	DEVI(vdip)->devi_mdi_xhci = NULL;
5607c478bd9Sstevel@tonic-gate 	kmem_free(vh->vh_class, strlen(vh->vh_class)+1);
5617c478bd9Sstevel@tonic-gate 	kmem_free(vh->vh_client_table,
5627c478bd9Sstevel@tonic-gate 	    mdi_client_table_size * sizeof (struct client_hash));
5635e3986cbScth 	mutex_destroy(&vh->vh_phci_mutex);
5645e3986cbScth 	mutex_destroy(&vh->vh_client_mutex);
56578dc6db2Sllai1 
5667c478bd9Sstevel@tonic-gate 	kmem_free(vh, sizeof (mdi_vhci_t));
5677c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
5687c478bd9Sstevel@tonic-gate }
5697c478bd9Sstevel@tonic-gate 
5707c478bd9Sstevel@tonic-gate /*
5717c478bd9Sstevel@tonic-gate  * i_mdi_vhci_class2vhci():
5727c478bd9Sstevel@tonic-gate  *		Look for a matching vHCI module given a vHCI class name
5737c478bd9Sstevel@tonic-gate  * Return Values:
5747c478bd9Sstevel@tonic-gate  *		Handle to a vHCI component
5757c478bd9Sstevel@tonic-gate  *		NULL
5767c478bd9Sstevel@tonic-gate  */
5777c478bd9Sstevel@tonic-gate static mdi_vhci_t *
5787c478bd9Sstevel@tonic-gate i_mdi_vhci_class2vhci(char *class)
5797c478bd9Sstevel@tonic-gate {
5807c478bd9Sstevel@tonic-gate 	mdi_vhci_t	*vh = NULL;
5817c478bd9Sstevel@tonic-gate 
5827c478bd9Sstevel@tonic-gate 	ASSERT(!MUTEX_HELD(&mdi_mutex));
5837c478bd9Sstevel@tonic-gate 
5847c478bd9Sstevel@tonic-gate 	mutex_enter(&mdi_mutex);
5857c478bd9Sstevel@tonic-gate 	for (vh = mdi_vhci_head; vh != NULL; vh = vh->vh_next) {
5867c478bd9Sstevel@tonic-gate 		if (strcmp(vh->vh_class, class) == 0) {
5877c478bd9Sstevel@tonic-gate 			break;
5887c478bd9Sstevel@tonic-gate 		}
5897c478bd9Sstevel@tonic-gate 	}
5907c478bd9Sstevel@tonic-gate 	mutex_exit(&mdi_mutex);
5917c478bd9Sstevel@tonic-gate 	return (vh);
5927c478bd9Sstevel@tonic-gate }
5937c478bd9Sstevel@tonic-gate 
5947c478bd9Sstevel@tonic-gate /*
5957c478bd9Sstevel@tonic-gate  * i_devi_get_vhci():
5967c478bd9Sstevel@tonic-gate  *		Utility function to get the handle to a vHCI component
5977c478bd9Sstevel@tonic-gate  * Return Values:
5987c478bd9Sstevel@tonic-gate  *		Handle to a vHCI component
5997c478bd9Sstevel@tonic-gate  *		NULL
6007c478bd9Sstevel@tonic-gate  */
6017c478bd9Sstevel@tonic-gate mdi_vhci_t *
6027c478bd9Sstevel@tonic-gate i_devi_get_vhci(dev_info_t *vdip)
6037c478bd9Sstevel@tonic-gate {
6047c478bd9Sstevel@tonic-gate 	mdi_vhci_t	*vh = NULL;
6057c478bd9Sstevel@tonic-gate 	if (MDI_VHCI(vdip)) {
6067c478bd9Sstevel@tonic-gate 		vh = (mdi_vhci_t *)DEVI(vdip)->devi_mdi_xhci;
6077c478bd9Sstevel@tonic-gate 	}
6087c478bd9Sstevel@tonic-gate 	return (vh);
6097c478bd9Sstevel@tonic-gate }
6107c478bd9Sstevel@tonic-gate 
6117c478bd9Sstevel@tonic-gate /*
6127c478bd9Sstevel@tonic-gate  * mdi_phci_register():
6137c478bd9Sstevel@tonic-gate  *		Register a pHCI module with mpxio framework
6147c478bd9Sstevel@tonic-gate  *		mdi_phci_register() is called by pHCI drivers to register with
6157c478bd9Sstevel@tonic-gate  *		the mpxio framework and a specific 'class_driver' vHCI.  The
6167c478bd9Sstevel@tonic-gate  *		pHCI driver must call this interface as part of its attach(9e)
6177c478bd9Sstevel@tonic-gate  *		handler.
6187c478bd9Sstevel@tonic-gate  * Return Values:
6197c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
6207c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
6217c478bd9Sstevel@tonic-gate  */
6227c478bd9Sstevel@tonic-gate /*ARGSUSED*/
6237c478bd9Sstevel@tonic-gate int
6247c478bd9Sstevel@tonic-gate mdi_phci_register(char *class, dev_info_t *pdip, int flags)
6257c478bd9Sstevel@tonic-gate {
6267c478bd9Sstevel@tonic-gate 	mdi_phci_t		*ph;
6277c478bd9Sstevel@tonic-gate 	mdi_vhci_t		*vh;
6287c478bd9Sstevel@tonic-gate 	char			*data;
6297c478bd9Sstevel@tonic-gate 
6305e3986cbScth 	/*
6315e3986cbScth 	 * Some subsystems, like fcp, perform pHCI registration from a
6325e3986cbScth 	 * different thread than the one doing the pHCI attach(9E) - the
6335e3986cbScth 	 * driver attach code is waiting for this other thread to complete.
6345e3986cbScth 	 * This means we can only ASSERT DEVI_BUSY_CHANGING of parent
6355e3986cbScth 	 * (indicating that some thread has done an ndi_devi_enter of parent)
6365e3986cbScth 	 * not DEVI_BUSY_OWNED (which would indicate that we did the enter).
6375e3986cbScth 	 */
6385e3986cbScth 	ASSERT(DEVI_BUSY_CHANGING(ddi_get_parent(pdip)));
6395e3986cbScth 
6407c478bd9Sstevel@tonic-gate 	/*
6417c478bd9Sstevel@tonic-gate 	 * Check for mpxio-disable property. Enable mpxio if the property is
6427c478bd9Sstevel@tonic-gate 	 * missing or not set to "yes".
6437c478bd9Sstevel@tonic-gate 	 * If the property is set to "yes" then emit a brief message.
6447c478bd9Sstevel@tonic-gate 	 */
6457c478bd9Sstevel@tonic-gate 	if ((ddi_prop_lookup_string(DDI_DEV_T_ANY, pdip, 0, "mpxio-disable",
6467c478bd9Sstevel@tonic-gate 	    &data) == DDI_SUCCESS)) {
6477c478bd9Sstevel@tonic-gate 		if (strcmp(data, "yes") == 0) {
6484c06356bSdh142964 			MDI_DEBUG(1, (MDI_CONT, pdip,
6494c06356bSdh142964 			    "?multipath capabilities disabled via %s.conf.",
6507c478bd9Sstevel@tonic-gate 			    ddi_driver_name(pdip)));
6517c478bd9Sstevel@tonic-gate 			ddi_prop_free(data);
6527c478bd9Sstevel@tonic-gate 			return (MDI_FAILURE);
6537c478bd9Sstevel@tonic-gate 		}
6547c478bd9Sstevel@tonic-gate 		ddi_prop_free(data);
6557c478bd9Sstevel@tonic-gate 	}
6567c478bd9Sstevel@tonic-gate 
6577c478bd9Sstevel@tonic-gate 	/*
6587c478bd9Sstevel@tonic-gate 	 * Search for a matching vHCI
6597c478bd9Sstevel@tonic-gate 	 */
6607c478bd9Sstevel@tonic-gate 	vh = (mdi_vhci_t *)i_mdi_vhci_class2vhci(class);
6617c478bd9Sstevel@tonic-gate 	if (vh == NULL) {
6627c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
6637c478bd9Sstevel@tonic-gate 	}
6647c478bd9Sstevel@tonic-gate 
6657c478bd9Sstevel@tonic-gate 	ph = kmem_zalloc(sizeof (mdi_phci_t), KM_SLEEP);
6667c478bd9Sstevel@tonic-gate 	mutex_init(&ph->ph_mutex, NULL, MUTEX_DEFAULT, NULL);
6677c478bd9Sstevel@tonic-gate 	ph->ph_dip = pdip;
6687c478bd9Sstevel@tonic-gate 	ph->ph_vhci = vh;
6697c478bd9Sstevel@tonic-gate 	ph->ph_next = NULL;
6707c478bd9Sstevel@tonic-gate 	ph->ph_unstable = 0;
6717c478bd9Sstevel@tonic-gate 	ph->ph_vprivate = 0;
6727c478bd9Sstevel@tonic-gate 	cv_init(&ph->ph_unstable_cv, NULL, CV_DRIVER, NULL);
6737c478bd9Sstevel@tonic-gate 
6745e3986cbScth 	MDI_PHCI_LOCK(ph);
6757c478bd9Sstevel@tonic-gate 	MDI_PHCI_SET_POWER_UP(ph);
6765e3986cbScth 	MDI_PHCI_UNLOCK(ph);
6777c478bd9Sstevel@tonic-gate 	DEVI(pdip)->devi_mdi_component |= MDI_COMPONENT_PHCI;
6787c478bd9Sstevel@tonic-gate 	DEVI(pdip)->devi_mdi_xhci = (caddr_t)ph;
6797c478bd9Sstevel@tonic-gate 
6803c34adc5Sramat 	vhcache_phci_add(vh->vh_config, ph);
6813c34adc5Sramat 
6825e3986cbScth 	MDI_VHCI_PHCI_LOCK(vh);
6837c478bd9Sstevel@tonic-gate 	if (vh->vh_phci_head == NULL) {
6847c478bd9Sstevel@tonic-gate 		vh->vh_phci_head = ph;
6857c478bd9Sstevel@tonic-gate 	}
6867c478bd9Sstevel@tonic-gate 	if (vh->vh_phci_tail) {
6877c478bd9Sstevel@tonic-gate 		vh->vh_phci_tail->ph_next = ph;
6887c478bd9Sstevel@tonic-gate 	}
6897c478bd9Sstevel@tonic-gate 	vh->vh_phci_tail = ph;
6907c478bd9Sstevel@tonic-gate 	vh->vh_phci_count++;
6915e3986cbScth 	MDI_VHCI_PHCI_UNLOCK(vh);
6925e3986cbScth 
6938c4f8890Srs135747 	i_mdi_log_sysevent(pdip, class, ESC_DDI_INITIATOR_REGISTER);
6947c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
6957c478bd9Sstevel@tonic-gate }
6967c478bd9Sstevel@tonic-gate 
6977c478bd9Sstevel@tonic-gate /*
6987c478bd9Sstevel@tonic-gate  * mdi_phci_unregister():
6997c478bd9Sstevel@tonic-gate  *		Unregister a pHCI module from mpxio framework
7007c478bd9Sstevel@tonic-gate  *		mdi_phci_unregister() is called by the pHCI drivers from their
7017c478bd9Sstevel@tonic-gate  *		detach(9E) handler to unregister their instances from the
7027c478bd9Sstevel@tonic-gate  *		framework.
7037c478bd9Sstevel@tonic-gate  * Return Values:
7047c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
7057c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
7067c478bd9Sstevel@tonic-gate  */
7077c478bd9Sstevel@tonic-gate /*ARGSUSED*/
7087c478bd9Sstevel@tonic-gate int
7097c478bd9Sstevel@tonic-gate mdi_phci_unregister(dev_info_t *pdip, int flags)
7107c478bd9Sstevel@tonic-gate {
7117c478bd9Sstevel@tonic-gate 	mdi_vhci_t		*vh;
7127c478bd9Sstevel@tonic-gate 	mdi_phci_t		*ph;
7137c478bd9Sstevel@tonic-gate 	mdi_phci_t		*tmp;
7147c478bd9Sstevel@tonic-gate 	mdi_phci_t		*prev = NULL;
7154c06356bSdh142964 	mdi_pathinfo_t		*pip;
7167c478bd9Sstevel@tonic-gate 
7175e3986cbScth 	ASSERT(DEVI_BUSY_CHANGING(ddi_get_parent(pdip)));
7185e3986cbScth 
7197c478bd9Sstevel@tonic-gate 	ph = i_devi_get_phci(pdip);
7207c478bd9Sstevel@tonic-gate 	if (ph == NULL) {
7214c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, pdip, "!not a valid pHCI"));
7227c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
7237c478bd9Sstevel@tonic-gate 	}
7247c478bd9Sstevel@tonic-gate 
7257c478bd9Sstevel@tonic-gate 	vh = ph->ph_vhci;
7267c478bd9Sstevel@tonic-gate 	ASSERT(vh != NULL);
7277c478bd9Sstevel@tonic-gate 	if (vh == NULL) {
7284c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, pdip, "!not a valid vHCI"));
7297c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
7307c478bd9Sstevel@tonic-gate 	}
7317c478bd9Sstevel@tonic-gate 
7325e3986cbScth 	MDI_VHCI_PHCI_LOCK(vh);
7337c478bd9Sstevel@tonic-gate 	tmp = vh->vh_phci_head;
7347c478bd9Sstevel@tonic-gate 	while (tmp) {
7357c478bd9Sstevel@tonic-gate 		if (tmp == ph) {
7367c478bd9Sstevel@tonic-gate 			break;
7377c478bd9Sstevel@tonic-gate 		}
7387c478bd9Sstevel@tonic-gate 		prev = tmp;
7397c478bd9Sstevel@tonic-gate 		tmp = tmp->ph_next;
7407c478bd9Sstevel@tonic-gate 	}
7417c478bd9Sstevel@tonic-gate 
7427c478bd9Sstevel@tonic-gate 	if (ph == vh->vh_phci_head) {
7437c478bd9Sstevel@tonic-gate 		vh->vh_phci_head = ph->ph_next;
7447c478bd9Sstevel@tonic-gate 	} else {
7457c478bd9Sstevel@tonic-gate 		prev->ph_next = ph->ph_next;
7467c478bd9Sstevel@tonic-gate 	}
7477c478bd9Sstevel@tonic-gate 
7487c478bd9Sstevel@tonic-gate 	if (ph == vh->vh_phci_tail) {
7497c478bd9Sstevel@tonic-gate 		vh->vh_phci_tail = prev;
7507c478bd9Sstevel@tonic-gate 	}
7517c478bd9Sstevel@tonic-gate 
7527c478bd9Sstevel@tonic-gate 	vh->vh_phci_count--;
7535e3986cbScth 	MDI_VHCI_PHCI_UNLOCK(vh);
7547c478bd9Sstevel@tonic-gate 
7554c06356bSdh142964 	/* Walk remaining pathinfo nodes and disassociate them from pHCI */
7564c06356bSdh142964 	MDI_PHCI_LOCK(ph);
7574c06356bSdh142964 	for (pip = (mdi_pathinfo_t *)ph->ph_path_head; pip;
7584c06356bSdh142964 	    pip = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link)
7594c06356bSdh142964 		MDI_PI(pip)->pi_phci = NULL;
7604c06356bSdh142964 	MDI_PHCI_UNLOCK(ph);
7614c06356bSdh142964 
7628c4f8890Srs135747 	i_mdi_log_sysevent(pdip, ph->ph_vhci->vh_class,
7638c4f8890Srs135747 	    ESC_DDI_INITIATOR_UNREGISTER);
7643c34adc5Sramat 	vhcache_phci_remove(vh->vh_config, ph);
7657c478bd9Sstevel@tonic-gate 	cv_destroy(&ph->ph_unstable_cv);
7667c478bd9Sstevel@tonic-gate 	mutex_destroy(&ph->ph_mutex);
7677c478bd9Sstevel@tonic-gate 	kmem_free(ph, sizeof (mdi_phci_t));
7687c478bd9Sstevel@tonic-gate 	DEVI(pdip)->devi_mdi_component &= ~MDI_COMPONENT_PHCI;
7697c478bd9Sstevel@tonic-gate 	DEVI(pdip)->devi_mdi_xhci = NULL;
7707c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
7717c478bd9Sstevel@tonic-gate }
7727c478bd9Sstevel@tonic-gate 
7737c478bd9Sstevel@tonic-gate /*
7747c478bd9Sstevel@tonic-gate  * i_devi_get_phci():
7757c478bd9Sstevel@tonic-gate  * 		Utility function to return the phci extensions.
7767c478bd9Sstevel@tonic-gate  */
7777c478bd9Sstevel@tonic-gate static mdi_phci_t *
7787c478bd9Sstevel@tonic-gate i_devi_get_phci(dev_info_t *pdip)
7797c478bd9Sstevel@tonic-gate {
7807c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph = NULL;
78155e592a2SRandall Ralphs 
7827c478bd9Sstevel@tonic-gate 	if (MDI_PHCI(pdip)) {
7837c478bd9Sstevel@tonic-gate 		ph = (mdi_phci_t *)DEVI(pdip)->devi_mdi_xhci;
7847c478bd9Sstevel@tonic-gate 	}
7857c478bd9Sstevel@tonic-gate 	return (ph);
7867c478bd9Sstevel@tonic-gate }
7877c478bd9Sstevel@tonic-gate 
7887c478bd9Sstevel@tonic-gate /*
7895e3986cbScth  * Single thread mdi entry into devinfo node for modifying its children.
7905e3986cbScth  * If necessary we perform an ndi_devi_enter of the vHCI before doing
7915e3986cbScth  * an ndi_devi_enter of 'dip'.  We maintain circular in two parts: one
7925e3986cbScth  * for the vHCI and one for the pHCI.
7935e3986cbScth  */
7945e3986cbScth void
7955e3986cbScth mdi_devi_enter(dev_info_t *phci_dip, int *circular)
7965e3986cbScth {
7975e3986cbScth 	dev_info_t	*vdip;
7985e3986cbScth 	int		vcircular, pcircular;
7995e3986cbScth 
8005e3986cbScth 	/* Verify calling context */
8015e3986cbScth 	ASSERT(MDI_PHCI(phci_dip));
8025e3986cbScth 	vdip = mdi_devi_get_vdip(phci_dip);
8035e3986cbScth 	ASSERT(vdip);			/* A pHCI always has a vHCI */
8045e3986cbScth 
8055e3986cbScth 	/*
8065e3986cbScth 	 * If pHCI is detaching then the framework has already entered the
8075e3986cbScth 	 * vHCI on a threads that went down the code path leading to
8085e3986cbScth 	 * detach_node().  This framework enter of the vHCI during pHCI
8095e3986cbScth 	 * detach is done to avoid deadlock with vHCI power management
8105e3986cbScth 	 * operations which enter the vHCI and the enter down the path
8115e3986cbScth 	 * to the pHCI. If pHCI is detaching then we piggyback this calls
8125e3986cbScth 	 * enter of the vHCI on frameworks vHCI enter that has already
8135e3986cbScth 	 * occurred - this is OK because we know that the framework thread
8145e3986cbScth 	 * doing detach is waiting for our completion.
8155e3986cbScth 	 *
8165e3986cbScth 	 * We should DEVI_IS_DETACHING under an enter of the parent to avoid
8175e3986cbScth 	 * race with detach - but we can't do that because the framework has
8185e3986cbScth 	 * already entered the parent, so we have some complexity instead.
8195e3986cbScth 	 */
8205e3986cbScth 	for (;;) {
8215e3986cbScth 		if (ndi_devi_tryenter(vdip, &vcircular)) {
8225e3986cbScth 			ASSERT(vcircular != -1);
8235e3986cbScth 			if (DEVI_IS_DETACHING(phci_dip)) {
8245e3986cbScth 				ndi_devi_exit(vdip, vcircular);
8255e3986cbScth 				vcircular = -1;
8265e3986cbScth 			}
8275e3986cbScth 			break;
8285e3986cbScth 		} else if (DEVI_IS_DETACHING(phci_dip)) {
8295e3986cbScth 			vcircular = -1;
8305e3986cbScth 			break;
8314c06356bSdh142964 		} else if (servicing_interrupt()) {
8324c06356bSdh142964 			/*
8334c06356bSdh142964 			 * Don't delay an interrupt (and ensure adaptive
8344c06356bSdh142964 			 * mutex inversion support).
8354c06356bSdh142964 			 */
8364c06356bSdh142964 			ndi_devi_enter(vdip, &vcircular);
8374c06356bSdh142964 			break;
8385e3986cbScth 		} else {
83996c4a178SChris Horne 			delay_random(mdi_delay);
8405e3986cbScth 		}
8415e3986cbScth 	}
8425e3986cbScth 
8435e3986cbScth 	ndi_devi_enter(phci_dip, &pcircular);
8445e3986cbScth 	*circular = (vcircular << 16) | (pcircular & 0xFFFF);
8455e3986cbScth }
8465e3986cbScth 
8475e3986cbScth /*
84855e592a2SRandall Ralphs  * Attempt to mdi_devi_enter.
84955e592a2SRandall Ralphs  */
85055e592a2SRandall Ralphs int
85155e592a2SRandall Ralphs mdi_devi_tryenter(dev_info_t *phci_dip, int *circular)
85255e592a2SRandall Ralphs {
85355e592a2SRandall Ralphs 	dev_info_t	*vdip;
85455e592a2SRandall Ralphs 	int		vcircular, pcircular;
85555e592a2SRandall Ralphs 
85655e592a2SRandall Ralphs 	/* Verify calling context */
85755e592a2SRandall Ralphs 	ASSERT(MDI_PHCI(phci_dip));
85855e592a2SRandall Ralphs 	vdip = mdi_devi_get_vdip(phci_dip);
85955e592a2SRandall Ralphs 	ASSERT(vdip);			/* A pHCI always has a vHCI */
86055e592a2SRandall Ralphs 
86155e592a2SRandall Ralphs 	if (ndi_devi_tryenter(vdip, &vcircular)) {
86255e592a2SRandall Ralphs 		if (ndi_devi_tryenter(phci_dip, &pcircular)) {
86355e592a2SRandall Ralphs 			*circular = (vcircular << 16) | (pcircular & 0xFFFF);
86455e592a2SRandall Ralphs 			return (1);	/* locked */
86555e592a2SRandall Ralphs 		}
86655e592a2SRandall Ralphs 		ndi_devi_exit(vdip, vcircular);
86755e592a2SRandall Ralphs 	}
86855e592a2SRandall Ralphs 	return (0);			/* busy */
86955e592a2SRandall Ralphs }
87055e592a2SRandall Ralphs 
87155e592a2SRandall Ralphs /*
8725e3986cbScth  * Release mdi_devi_enter or successful mdi_devi_tryenter.
8735e3986cbScth  */
8745e3986cbScth void
8755e3986cbScth mdi_devi_exit(dev_info_t *phci_dip, int circular)
8765e3986cbScth {
8775e3986cbScth 	dev_info_t	*vdip;
8785e3986cbScth 	int		vcircular, pcircular;
8795e3986cbScth 
8805e3986cbScth 	/* Verify calling context */
8815e3986cbScth 	ASSERT(MDI_PHCI(phci_dip));
8825e3986cbScth 	vdip = mdi_devi_get_vdip(phci_dip);
8835e3986cbScth 	ASSERT(vdip);			/* A pHCI always has a vHCI */
8845e3986cbScth 
8855e3986cbScth 	/* extract two circular recursion values from single int */
8865e3986cbScth 	pcircular = (short)(circular & 0xFFFF);
8875e3986cbScth 	vcircular = (short)((circular >> 16) & 0xFFFF);
8885e3986cbScth 
8895e3986cbScth 	ndi_devi_exit(phci_dip, pcircular);
8905e3986cbScth 	if (vcircular != -1)
8915e3986cbScth 		ndi_devi_exit(vdip, vcircular);
8925e3986cbScth }
8935e3986cbScth 
8945e3986cbScth /*
8955e3986cbScth  * The functions mdi_devi_exit_phci() and mdi_devi_enter_phci() are used
8965e3986cbScth  * around a pHCI drivers calls to mdi_pi_online/offline, after holding
8975e3986cbScth  * the pathinfo node via mdi_hold_path/mdi_rele_path, to avoid deadlock
8985e3986cbScth  * with vHCI power management code during path online/offline.  Each
8995e3986cbScth  * mdi_devi_exit_phci must have a matching mdi_devi_enter_phci, and both must
9005e3986cbScth  * occur within the scope of an active mdi_devi_enter that establishes the
9015e3986cbScth  * circular value.
9025e3986cbScth  */
9035e3986cbScth void
9045e3986cbScth mdi_devi_exit_phci(dev_info_t *phci_dip, int circular)
9055e3986cbScth {
9065e3986cbScth 	int		pcircular;
9075e3986cbScth 
9085e3986cbScth 	/* Verify calling context */
9095e3986cbScth 	ASSERT(MDI_PHCI(phci_dip));
9105e3986cbScth 
9114c06356bSdh142964 	/* Keep hold on pHCI until we reenter in mdi_devi_enter_phci */
9124c06356bSdh142964 	ndi_hold_devi(phci_dip);
9134c06356bSdh142964 
9145e3986cbScth 	pcircular = (short)(circular & 0xFFFF);
9155e3986cbScth 	ndi_devi_exit(phci_dip, pcircular);
9165e3986cbScth }
9175e3986cbScth 
9185e3986cbScth void
9195e3986cbScth mdi_devi_enter_phci(dev_info_t *phci_dip, int *circular)
9205e3986cbScth {
9215e3986cbScth 	int		pcircular;
9225e3986cbScth 
9235e3986cbScth 	/* Verify calling context */
9245e3986cbScth 	ASSERT(MDI_PHCI(phci_dip));
9255e3986cbScth 
9265e3986cbScth 	ndi_devi_enter(phci_dip, &pcircular);
9275e3986cbScth 
9284c06356bSdh142964 	/* Drop hold from mdi_devi_exit_phci. */
9294c06356bSdh142964 	ndi_rele_devi(phci_dip);
9304c06356bSdh142964 
9315e3986cbScth 	/* verify matching mdi_devi_exit_phci/mdi_devi_enter_phci use */
9325e3986cbScth 	ASSERT(pcircular == ((short)(*circular & 0xFFFF)));
9335e3986cbScth }
9345e3986cbScth 
9355e3986cbScth /*
9365e3986cbScth  * mdi_devi_get_vdip():
9375e3986cbScth  *		given a pHCI dip return vHCI dip
9385e3986cbScth  */
9395e3986cbScth dev_info_t *
9405e3986cbScth mdi_devi_get_vdip(dev_info_t *pdip)
9415e3986cbScth {
9425e3986cbScth 	mdi_phci_t	*ph;
9435e3986cbScth 
9445e3986cbScth 	ph = i_devi_get_phci(pdip);
9455e3986cbScth 	if (ph && ph->ph_vhci)
9465e3986cbScth 		return (ph->ph_vhci->vh_dip);
9475e3986cbScth 	return (NULL);
9485e3986cbScth }
9495e3986cbScth 
9505e3986cbScth /*
9515e3986cbScth  * mdi_devi_pdip_entered():
9525e3986cbScth  *		Return 1 if we are vHCI and have done an ndi_devi_enter
9535e3986cbScth  *		of a pHCI
9545e3986cbScth  */
9555e3986cbScth int
9565e3986cbScth mdi_devi_pdip_entered(dev_info_t *vdip)
9575e3986cbScth {
9585e3986cbScth 	mdi_vhci_t	*vh;
9595e3986cbScth 	mdi_phci_t	*ph;
9605e3986cbScth 
9615e3986cbScth 	vh = i_devi_get_vhci(vdip);
9625e3986cbScth 	if (vh == NULL)
9635e3986cbScth 		return (0);
9645e3986cbScth 
9655e3986cbScth 	MDI_VHCI_PHCI_LOCK(vh);
9665e3986cbScth 	ph = vh->vh_phci_head;
9675e3986cbScth 	while (ph) {
9685e3986cbScth 		if (ph->ph_dip && DEVI_BUSY_OWNED(ph->ph_dip)) {
9695e3986cbScth 			MDI_VHCI_PHCI_UNLOCK(vh);
9705e3986cbScth 			return (1);
9715e3986cbScth 		}
9725e3986cbScth 		ph = ph->ph_next;
9735e3986cbScth 	}
9745e3986cbScth 	MDI_VHCI_PHCI_UNLOCK(vh);
9755e3986cbScth 	return (0);
9765e3986cbScth }
9775e3986cbScth 
9785e3986cbScth /*
9797c478bd9Sstevel@tonic-gate  * mdi_phci_path2devinfo():
9807c478bd9Sstevel@tonic-gate  * 		Utility function to search for a valid phci device given
9817c478bd9Sstevel@tonic-gate  *		the devfs pathname.
9827c478bd9Sstevel@tonic-gate  */
9837c478bd9Sstevel@tonic-gate dev_info_t *
9847c478bd9Sstevel@tonic-gate mdi_phci_path2devinfo(dev_info_t *vdip, caddr_t pathname)
9857c478bd9Sstevel@tonic-gate {
9867c478bd9Sstevel@tonic-gate 	char		*temp_pathname;
9877c478bd9Sstevel@tonic-gate 	mdi_vhci_t	*vh;
9887c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
9897c478bd9Sstevel@tonic-gate 	dev_info_t 	*pdip = NULL;
9907c478bd9Sstevel@tonic-gate 
9917c478bd9Sstevel@tonic-gate 	vh = i_devi_get_vhci(vdip);
9927c478bd9Sstevel@tonic-gate 	ASSERT(vh != NULL);
9937c478bd9Sstevel@tonic-gate 
9947c478bd9Sstevel@tonic-gate 	if (vh == NULL) {
9957c478bd9Sstevel@tonic-gate 		/*
9967c478bd9Sstevel@tonic-gate 		 * Invalid vHCI component, return failure
9977c478bd9Sstevel@tonic-gate 		 */
9987c478bd9Sstevel@tonic-gate 		return (NULL);
9997c478bd9Sstevel@tonic-gate 	}
10007c478bd9Sstevel@tonic-gate 
10017c478bd9Sstevel@tonic-gate 	temp_pathname = kmem_zalloc(MAXPATHLEN, KM_SLEEP);
10025e3986cbScth 	MDI_VHCI_PHCI_LOCK(vh);
10037c478bd9Sstevel@tonic-gate 	ph = vh->vh_phci_head;
10047c478bd9Sstevel@tonic-gate 	while (ph != NULL) {
10057c478bd9Sstevel@tonic-gate 		pdip = ph->ph_dip;
10067c478bd9Sstevel@tonic-gate 		ASSERT(pdip != NULL);
10077c478bd9Sstevel@tonic-gate 		*temp_pathname = '\0';
10087c478bd9Sstevel@tonic-gate 		(void) ddi_pathname(pdip, temp_pathname);
10097c478bd9Sstevel@tonic-gate 		if (strcmp(temp_pathname, pathname) == 0) {
10107c478bd9Sstevel@tonic-gate 			break;
10117c478bd9Sstevel@tonic-gate 		}
10127c478bd9Sstevel@tonic-gate 		ph = ph->ph_next;
10137c478bd9Sstevel@tonic-gate 	}
10147c478bd9Sstevel@tonic-gate 	if (ph == NULL) {
10157c478bd9Sstevel@tonic-gate 		pdip = NULL;
10167c478bd9Sstevel@tonic-gate 	}
10175e3986cbScth 	MDI_VHCI_PHCI_UNLOCK(vh);
10187c478bd9Sstevel@tonic-gate 	kmem_free(temp_pathname, MAXPATHLEN);
10197c478bd9Sstevel@tonic-gate 	return (pdip);
10207c478bd9Sstevel@tonic-gate }
10217c478bd9Sstevel@tonic-gate 
10227c478bd9Sstevel@tonic-gate /*
10237c478bd9Sstevel@tonic-gate  * mdi_phci_get_path_count():
10247c478bd9Sstevel@tonic-gate  * 		get number of path information nodes associated with a given
10257c478bd9Sstevel@tonic-gate  *		pHCI device.
10267c478bd9Sstevel@tonic-gate  */
10277c478bd9Sstevel@tonic-gate int
10287c478bd9Sstevel@tonic-gate mdi_phci_get_path_count(dev_info_t *pdip)
10297c478bd9Sstevel@tonic-gate {
10307c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
10317c478bd9Sstevel@tonic-gate 	int		count = 0;
10327c478bd9Sstevel@tonic-gate 
10337c478bd9Sstevel@tonic-gate 	ph = i_devi_get_phci(pdip);
10347c478bd9Sstevel@tonic-gate 	if (ph != NULL) {
10357c478bd9Sstevel@tonic-gate 		count = ph->ph_path_count;
10367c478bd9Sstevel@tonic-gate 	}
10377c478bd9Sstevel@tonic-gate 	return (count);
10387c478bd9Sstevel@tonic-gate }
10397c478bd9Sstevel@tonic-gate 
10407c478bd9Sstevel@tonic-gate /*
10417c478bd9Sstevel@tonic-gate  * i_mdi_phci_lock():
10427c478bd9Sstevel@tonic-gate  *		Lock a pHCI device
10437c478bd9Sstevel@tonic-gate  * Return Values:
10447c478bd9Sstevel@tonic-gate  *		None
10457c478bd9Sstevel@tonic-gate  * Note:
10467c478bd9Sstevel@tonic-gate  *		The default locking order is:
10477c478bd9Sstevel@tonic-gate  *		_NOTE(LOCK_ORDER(mdi_phci::ph_mutex mdi_pathinfo::pi_mutex))
10487c478bd9Sstevel@tonic-gate  *		But there are number of situations where locks need to be
10497c478bd9Sstevel@tonic-gate  *		grabbed in reverse order.  This routine implements try and lock
10507c478bd9Sstevel@tonic-gate  *		mechanism depending on the requested parameter option.
10517c478bd9Sstevel@tonic-gate  */
10527c478bd9Sstevel@tonic-gate static void
10537c478bd9Sstevel@tonic-gate i_mdi_phci_lock(mdi_phci_t *ph, mdi_pathinfo_t *pip)
10547c478bd9Sstevel@tonic-gate {
10557c478bd9Sstevel@tonic-gate 	if (pip) {
10567c478bd9Sstevel@tonic-gate 		/* Reverse locking is requested. */
10577c478bd9Sstevel@tonic-gate 		while (MDI_PHCI_TRYLOCK(ph) == 0) {
10584c06356bSdh142964 			if (servicing_interrupt()) {
10594c06356bSdh142964 				MDI_PI_HOLD(pip);
10604c06356bSdh142964 				MDI_PI_UNLOCK(pip);
10614c06356bSdh142964 				MDI_PHCI_LOCK(ph);
10624c06356bSdh142964 				MDI_PI_LOCK(pip);
10634c06356bSdh142964 				MDI_PI_RELE(pip);
10644c06356bSdh142964 				break;
10654c06356bSdh142964 			} else {
10667c478bd9Sstevel@tonic-gate 				/*
10677c478bd9Sstevel@tonic-gate 				 * tryenter failed. Try to grab again
10687c478bd9Sstevel@tonic-gate 				 * after a small delay
10697c478bd9Sstevel@tonic-gate 				 */
10707c478bd9Sstevel@tonic-gate 				MDI_PI_HOLD(pip);
10717c478bd9Sstevel@tonic-gate 				MDI_PI_UNLOCK(pip);
107296c4a178SChris Horne 				delay_random(mdi_delay);
10737c478bd9Sstevel@tonic-gate 				MDI_PI_LOCK(pip);
10747c478bd9Sstevel@tonic-gate 				MDI_PI_RELE(pip);
10757c478bd9Sstevel@tonic-gate 			}
10764c06356bSdh142964 		}
10777c478bd9Sstevel@tonic-gate 	} else {
10787c478bd9Sstevel@tonic-gate 		MDI_PHCI_LOCK(ph);
10797c478bd9Sstevel@tonic-gate 	}
10807c478bd9Sstevel@tonic-gate }
10817c478bd9Sstevel@tonic-gate 
10827c478bd9Sstevel@tonic-gate /*
10837c478bd9Sstevel@tonic-gate  * i_mdi_phci_unlock():
10847c478bd9Sstevel@tonic-gate  *		Unlock the pHCI component
10857c478bd9Sstevel@tonic-gate  */
10867c478bd9Sstevel@tonic-gate static void
10877c478bd9Sstevel@tonic-gate i_mdi_phci_unlock(mdi_phci_t *ph)
10887c478bd9Sstevel@tonic-gate {
10897c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNLOCK(ph);
10907c478bd9Sstevel@tonic-gate }
10917c478bd9Sstevel@tonic-gate 
10927c478bd9Sstevel@tonic-gate /*
10937c478bd9Sstevel@tonic-gate  * i_mdi_devinfo_create():
10947c478bd9Sstevel@tonic-gate  *		create client device's devinfo node
10957c478bd9Sstevel@tonic-gate  * Return Values:
10967c478bd9Sstevel@tonic-gate  *		dev_info
10977c478bd9Sstevel@tonic-gate  *		NULL
10987c478bd9Sstevel@tonic-gate  * Notes:
10997c478bd9Sstevel@tonic-gate  */
11007c478bd9Sstevel@tonic-gate static dev_info_t *
11017c478bd9Sstevel@tonic-gate i_mdi_devinfo_create(mdi_vhci_t *vh, char *name, char *guid,
11023c34adc5Sramat 	char **compatible, int ncompatible)
11037c478bd9Sstevel@tonic-gate {
11047c478bd9Sstevel@tonic-gate 	dev_info_t *cdip = NULL;
11057c478bd9Sstevel@tonic-gate 
11065e3986cbScth 	ASSERT(MDI_VHCI_CLIENT_LOCKED(vh));
11077c478bd9Sstevel@tonic-gate 
11087c478bd9Sstevel@tonic-gate 	/* Verify for duplicate entry */
11097c478bd9Sstevel@tonic-gate 	cdip = i_mdi_devinfo_find(vh, name, guid);
11107c478bd9Sstevel@tonic-gate 	ASSERT(cdip == NULL);
11117c478bd9Sstevel@tonic-gate 	if (cdip) {
11127c478bd9Sstevel@tonic-gate 		cmn_err(CE_WARN,
11134c06356bSdh142964 		    "i_mdi_devinfo_create: client %s@%s already exists",
11144c06356bSdh142964 			name ? name : "", guid ? guid : "");
11157c478bd9Sstevel@tonic-gate 	}
11167c478bd9Sstevel@tonic-gate 
11173c34adc5Sramat 	ndi_devi_alloc_sleep(vh->vh_dip, name, DEVI_SID_NODEID, &cdip);
11187c478bd9Sstevel@tonic-gate 	if (cdip == NULL)
11197c478bd9Sstevel@tonic-gate 		goto fail;
11207c478bd9Sstevel@tonic-gate 
11217c478bd9Sstevel@tonic-gate 	/*
11227c478bd9Sstevel@tonic-gate 	 * Create component type and Global unique identifier
11237c478bd9Sstevel@tonic-gate 	 * properties
11247c478bd9Sstevel@tonic-gate 	 */
11257c478bd9Sstevel@tonic-gate 	if (ndi_prop_update_string(DDI_DEV_T_NONE, cdip,
11267c478bd9Sstevel@tonic-gate 	    MDI_CLIENT_GUID_PROP, guid) != DDI_PROP_SUCCESS) {
11277c478bd9Sstevel@tonic-gate 		goto fail;
11287c478bd9Sstevel@tonic-gate 	}
11297c478bd9Sstevel@tonic-gate 
11307c478bd9Sstevel@tonic-gate 	/* Decorate the node with compatible property */
11317c478bd9Sstevel@tonic-gate 	if (compatible &&
11327c478bd9Sstevel@tonic-gate 	    (ndi_prop_update_string_array(DDI_DEV_T_NONE, cdip,
11337c478bd9Sstevel@tonic-gate 	    "compatible", compatible, ncompatible) != DDI_PROP_SUCCESS)) {
11347c478bd9Sstevel@tonic-gate 		goto fail;
11357c478bd9Sstevel@tonic-gate 	}
11367c478bd9Sstevel@tonic-gate 
11377c478bd9Sstevel@tonic-gate 	return (cdip);
11387c478bd9Sstevel@tonic-gate 
11397c478bd9Sstevel@tonic-gate fail:
11407c478bd9Sstevel@tonic-gate 	if (cdip) {
11417c478bd9Sstevel@tonic-gate 		(void) ndi_prop_remove_all(cdip);
11427c478bd9Sstevel@tonic-gate 		(void) ndi_devi_free(cdip);
11437c478bd9Sstevel@tonic-gate 	}
11447c478bd9Sstevel@tonic-gate 	return (NULL);
11457c478bd9Sstevel@tonic-gate }
11467c478bd9Sstevel@tonic-gate 
11477c478bd9Sstevel@tonic-gate /*
11487c478bd9Sstevel@tonic-gate  * i_mdi_devinfo_find():
11497c478bd9Sstevel@tonic-gate  *		Find a matching devinfo node for given client node name
11507c478bd9Sstevel@tonic-gate  *		and its guid.
11517c478bd9Sstevel@tonic-gate  * Return Values:
11527c478bd9Sstevel@tonic-gate  *		Handle to a dev_info node or NULL
11537c478bd9Sstevel@tonic-gate  */
11547c478bd9Sstevel@tonic-gate static dev_info_t *
11557c478bd9Sstevel@tonic-gate i_mdi_devinfo_find(mdi_vhci_t *vh, caddr_t name, char *guid)
11567c478bd9Sstevel@tonic-gate {
11577c478bd9Sstevel@tonic-gate 	char			*data;
11587c478bd9Sstevel@tonic-gate 	dev_info_t 		*cdip = NULL;
11597c478bd9Sstevel@tonic-gate 	dev_info_t 		*ndip = NULL;
11607c478bd9Sstevel@tonic-gate 	int			circular;
11617c478bd9Sstevel@tonic-gate 
11627c478bd9Sstevel@tonic-gate 	ndi_devi_enter(vh->vh_dip, &circular);
11637c478bd9Sstevel@tonic-gate 	ndip = (dev_info_t *)DEVI(vh->vh_dip)->devi_child;
11647c478bd9Sstevel@tonic-gate 	while ((cdip = ndip) != NULL) {
11657c478bd9Sstevel@tonic-gate 		ndip = (dev_info_t *)DEVI(cdip)->devi_sibling;
11667c478bd9Sstevel@tonic-gate 
11677c478bd9Sstevel@tonic-gate 		if (strcmp(DEVI(cdip)->devi_node_name, name)) {
11687c478bd9Sstevel@tonic-gate 			continue;
11697c478bd9Sstevel@tonic-gate 		}
11707c478bd9Sstevel@tonic-gate 
11717c478bd9Sstevel@tonic-gate 		if (ddi_prop_lookup_string(DDI_DEV_T_ANY, cdip,
11727c478bd9Sstevel@tonic-gate 		    DDI_PROP_DONTPASS, MDI_CLIENT_GUID_PROP,
11737c478bd9Sstevel@tonic-gate 		    &data) != DDI_PROP_SUCCESS) {
11747c478bd9Sstevel@tonic-gate 			continue;
11757c478bd9Sstevel@tonic-gate 		}
11767c478bd9Sstevel@tonic-gate 
11777c478bd9Sstevel@tonic-gate 		if (strcmp(data, guid) != 0) {
11787c478bd9Sstevel@tonic-gate 			ddi_prop_free(data);
11797c478bd9Sstevel@tonic-gate 			continue;
11807c478bd9Sstevel@tonic-gate 		}
11817c478bd9Sstevel@tonic-gate 		ddi_prop_free(data);
11827c478bd9Sstevel@tonic-gate 		break;
11837c478bd9Sstevel@tonic-gate 	}
11847c478bd9Sstevel@tonic-gate 	ndi_devi_exit(vh->vh_dip, circular);
11857c478bd9Sstevel@tonic-gate 	return (cdip);
11867c478bd9Sstevel@tonic-gate }
11877c478bd9Sstevel@tonic-gate 
11887c478bd9Sstevel@tonic-gate /*
11897c478bd9Sstevel@tonic-gate  * i_mdi_devinfo_remove():
11907c478bd9Sstevel@tonic-gate  *		Remove a client device node
11917c478bd9Sstevel@tonic-gate  */
11927c478bd9Sstevel@tonic-gate static int
11937c478bd9Sstevel@tonic-gate i_mdi_devinfo_remove(dev_info_t *vdip, dev_info_t *cdip, int flags)
11947c478bd9Sstevel@tonic-gate {
11957c478bd9Sstevel@tonic-gate 	int	rv = MDI_SUCCESS;
11965e3986cbScth 
11977c478bd9Sstevel@tonic-gate 	if (i_mdi_is_child_present(vdip, cdip) == MDI_SUCCESS ||
11987c478bd9Sstevel@tonic-gate 	    (flags & MDI_CLIENT_FLAGS_DEV_NOT_SUPPORTED)) {
11994c06356bSdh142964 		rv = ndi_devi_offline(cdip, NDI_DEVFS_CLEAN | NDI_DEVI_REMOVE);
12007c478bd9Sstevel@tonic-gate 		if (rv != NDI_SUCCESS) {
12014c06356bSdh142964 			MDI_DEBUG(1, (MDI_NOTE, cdip,
12024c06356bSdh142964 			    "!failed: cdip %p", (void *)cdip));
12037c478bd9Sstevel@tonic-gate 		}
12047c478bd9Sstevel@tonic-gate 		/*
12057c478bd9Sstevel@tonic-gate 		 * Convert to MDI error code
12067c478bd9Sstevel@tonic-gate 		 */
12077c478bd9Sstevel@tonic-gate 		switch (rv) {
12087c478bd9Sstevel@tonic-gate 		case NDI_SUCCESS:
12097c478bd9Sstevel@tonic-gate 			rv = MDI_SUCCESS;
12107c478bd9Sstevel@tonic-gate 			break;
12117c478bd9Sstevel@tonic-gate 		case NDI_BUSY:
12127c478bd9Sstevel@tonic-gate 			rv = MDI_BUSY;
12137c478bd9Sstevel@tonic-gate 			break;
12147c478bd9Sstevel@tonic-gate 		default:
12157c478bd9Sstevel@tonic-gate 			rv = MDI_FAILURE;
12167c478bd9Sstevel@tonic-gate 			break;
12177c478bd9Sstevel@tonic-gate 		}
12187c478bd9Sstevel@tonic-gate 	}
12197c478bd9Sstevel@tonic-gate 	return (rv);
12207c478bd9Sstevel@tonic-gate }
12217c478bd9Sstevel@tonic-gate 
12227c478bd9Sstevel@tonic-gate /*
12237c478bd9Sstevel@tonic-gate  * i_devi_get_client()
12247c478bd9Sstevel@tonic-gate  *		Utility function to get mpxio component extensions
12257c478bd9Sstevel@tonic-gate  */
12267c478bd9Sstevel@tonic-gate static mdi_client_t *
12277c478bd9Sstevel@tonic-gate i_devi_get_client(dev_info_t *cdip)
12287c478bd9Sstevel@tonic-gate {
12297c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct = NULL;
12305e3986cbScth 
12317c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT(cdip)) {
12327c478bd9Sstevel@tonic-gate 		ct = (mdi_client_t *)DEVI(cdip)->devi_mdi_client;
12337c478bd9Sstevel@tonic-gate 	}
12347c478bd9Sstevel@tonic-gate 	return (ct);
12357c478bd9Sstevel@tonic-gate }
12367c478bd9Sstevel@tonic-gate 
12377c478bd9Sstevel@tonic-gate /*
12387c478bd9Sstevel@tonic-gate  * i_mdi_is_child_present():
12397c478bd9Sstevel@tonic-gate  *		Search for the presence of client device dev_info node
12407c478bd9Sstevel@tonic-gate  */
12417c478bd9Sstevel@tonic-gate static int
12427c478bd9Sstevel@tonic-gate i_mdi_is_child_present(dev_info_t *vdip, dev_info_t *cdip)
12437c478bd9Sstevel@tonic-gate {
12447c478bd9Sstevel@tonic-gate 	int		rv = MDI_FAILURE;
12457c478bd9Sstevel@tonic-gate 	struct dev_info	*dip;
12467c478bd9Sstevel@tonic-gate 	int		circular;
12477c478bd9Sstevel@tonic-gate 
12487c478bd9Sstevel@tonic-gate 	ndi_devi_enter(vdip, &circular);
12497c478bd9Sstevel@tonic-gate 	dip = DEVI(vdip)->devi_child;
12507c478bd9Sstevel@tonic-gate 	while (dip) {
12517c478bd9Sstevel@tonic-gate 		if (dip == DEVI(cdip)) {
12527c478bd9Sstevel@tonic-gate 			rv = MDI_SUCCESS;
12537c478bd9Sstevel@tonic-gate 			break;
12547c478bd9Sstevel@tonic-gate 		}
12557c478bd9Sstevel@tonic-gate 		dip = dip->devi_sibling;
12567c478bd9Sstevel@tonic-gate 	}
12577c478bd9Sstevel@tonic-gate 	ndi_devi_exit(vdip, circular);
12587c478bd9Sstevel@tonic-gate 	return (rv);
12597c478bd9Sstevel@tonic-gate }
12607c478bd9Sstevel@tonic-gate 
12617c478bd9Sstevel@tonic-gate 
12627c478bd9Sstevel@tonic-gate /*
12637c478bd9Sstevel@tonic-gate  * i_mdi_client_lock():
12647c478bd9Sstevel@tonic-gate  *		Grab client component lock
12657c478bd9Sstevel@tonic-gate  * Return Values:
12667c478bd9Sstevel@tonic-gate  *		None
12677c478bd9Sstevel@tonic-gate  * Note:
12687c478bd9Sstevel@tonic-gate  *		The default locking order is:
12697c478bd9Sstevel@tonic-gate  *		_NOTE(LOCK_ORDER(mdi_client::ct_mutex mdi_pathinfo::pi_mutex))
12707c478bd9Sstevel@tonic-gate  *		But there are number of situations where locks need to be
12717c478bd9Sstevel@tonic-gate  *		grabbed in reverse order.  This routine implements try and lock
12727c478bd9Sstevel@tonic-gate  *		mechanism depending on the requested parameter option.
12737c478bd9Sstevel@tonic-gate  */
12747c478bd9Sstevel@tonic-gate static void
12757c478bd9Sstevel@tonic-gate i_mdi_client_lock(mdi_client_t *ct, mdi_pathinfo_t *pip)
12767c478bd9Sstevel@tonic-gate {
12777c478bd9Sstevel@tonic-gate 	if (pip) {
12787c478bd9Sstevel@tonic-gate 		/*
12797c478bd9Sstevel@tonic-gate 		 * Reverse locking is requested.
12807c478bd9Sstevel@tonic-gate 		 */
12817c478bd9Sstevel@tonic-gate 		while (MDI_CLIENT_TRYLOCK(ct) == 0) {
12824c06356bSdh142964 			if (servicing_interrupt()) {
12834c06356bSdh142964 				MDI_PI_HOLD(pip);
12844c06356bSdh142964 				MDI_PI_UNLOCK(pip);
12854c06356bSdh142964 				MDI_CLIENT_LOCK(ct);
12864c06356bSdh142964 				MDI_PI_LOCK(pip);
12874c06356bSdh142964 				MDI_PI_RELE(pip);
12884c06356bSdh142964 				break;
12894c06356bSdh142964 			} else {
12907c478bd9Sstevel@tonic-gate 				/*
12917c478bd9Sstevel@tonic-gate 				 * tryenter failed. Try to grab again
12927c478bd9Sstevel@tonic-gate 				 * after a small delay
12937c478bd9Sstevel@tonic-gate 				 */
12947c478bd9Sstevel@tonic-gate 				MDI_PI_HOLD(pip);
12957c478bd9Sstevel@tonic-gate 				MDI_PI_UNLOCK(pip);
129696c4a178SChris Horne 				delay_random(mdi_delay);
12977c478bd9Sstevel@tonic-gate 				MDI_PI_LOCK(pip);
12987c478bd9Sstevel@tonic-gate 				MDI_PI_RELE(pip);
12997c478bd9Sstevel@tonic-gate 			}
13004c06356bSdh142964 		}
13017c478bd9Sstevel@tonic-gate 	} else {
13027c478bd9Sstevel@tonic-gate 		MDI_CLIENT_LOCK(ct);
13037c478bd9Sstevel@tonic-gate 	}
13047c478bd9Sstevel@tonic-gate }
13057c478bd9Sstevel@tonic-gate 
13067c478bd9Sstevel@tonic-gate /*
13077c478bd9Sstevel@tonic-gate  * i_mdi_client_unlock():
13087c478bd9Sstevel@tonic-gate  *		Unlock a client component
13097c478bd9Sstevel@tonic-gate  */
13107c478bd9Sstevel@tonic-gate static void
13117c478bd9Sstevel@tonic-gate i_mdi_client_unlock(mdi_client_t *ct)
13127c478bd9Sstevel@tonic-gate {
13137c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
13147c478bd9Sstevel@tonic-gate }
13157c478bd9Sstevel@tonic-gate 
13167c478bd9Sstevel@tonic-gate /*
13177c478bd9Sstevel@tonic-gate  * i_mdi_client_alloc():
13187c478bd9Sstevel@tonic-gate  * 		Allocate and initialize a client structure.  Caller should
13195e3986cbScth  *		hold the vhci client lock.
13207c478bd9Sstevel@tonic-gate  * Return Values:
13217c478bd9Sstevel@tonic-gate  *		Handle to a client component
13227c478bd9Sstevel@tonic-gate  */
13237c478bd9Sstevel@tonic-gate /*ARGSUSED*/
13247c478bd9Sstevel@tonic-gate static mdi_client_t *
13253c34adc5Sramat i_mdi_client_alloc(mdi_vhci_t *vh, char *name, char *lguid)
13267c478bd9Sstevel@tonic-gate {
13277c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
13287c478bd9Sstevel@tonic-gate 
13295e3986cbScth 	ASSERT(MDI_VHCI_CLIENT_LOCKED(vh));
13307c478bd9Sstevel@tonic-gate 
13317c478bd9Sstevel@tonic-gate 	/*
13327c478bd9Sstevel@tonic-gate 	 * Allocate and initialize a component structure.
13337c478bd9Sstevel@tonic-gate 	 */
13343c34adc5Sramat 	ct = kmem_zalloc(sizeof (*ct), KM_SLEEP);
13357c478bd9Sstevel@tonic-gate 	mutex_init(&ct->ct_mutex, NULL, MUTEX_DEFAULT, NULL);
13367c478bd9Sstevel@tonic-gate 	ct->ct_hnext = NULL;
13377c478bd9Sstevel@tonic-gate 	ct->ct_hprev = NULL;
13387c478bd9Sstevel@tonic-gate 	ct->ct_dip = NULL;
13397c478bd9Sstevel@tonic-gate 	ct->ct_vhci = vh;
13403c34adc5Sramat 	ct->ct_drvname = kmem_alloc(strlen(name) + 1, KM_SLEEP);
13417c478bd9Sstevel@tonic-gate 	(void) strcpy(ct->ct_drvname, name);
13423c34adc5Sramat 	ct->ct_guid = kmem_alloc(strlen(lguid) + 1, KM_SLEEP);
13437c478bd9Sstevel@tonic-gate 	(void) strcpy(ct->ct_guid, lguid);
13447c478bd9Sstevel@tonic-gate 	ct->ct_cprivate = NULL;
13457c478bd9Sstevel@tonic-gate 	ct->ct_vprivate = NULL;
13467c478bd9Sstevel@tonic-gate 	ct->ct_flags = 0;
13477c478bd9Sstevel@tonic-gate 	ct->ct_state = MDI_CLIENT_STATE_FAILED;
13485e3986cbScth 	MDI_CLIENT_LOCK(ct);
13497c478bd9Sstevel@tonic-gate 	MDI_CLIENT_SET_OFFLINE(ct);
13507c478bd9Sstevel@tonic-gate 	MDI_CLIENT_SET_DETACH(ct);
13517c478bd9Sstevel@tonic-gate 	MDI_CLIENT_SET_POWER_UP(ct);
13525e3986cbScth 	MDI_CLIENT_UNLOCK(ct);
13537c478bd9Sstevel@tonic-gate 	ct->ct_failover_flags = 0;
13547c478bd9Sstevel@tonic-gate 	ct->ct_failover_status = 0;
13557c478bd9Sstevel@tonic-gate 	cv_init(&ct->ct_failover_cv, NULL, CV_DRIVER, NULL);
13567c478bd9Sstevel@tonic-gate 	ct->ct_unstable = 0;
13577c478bd9Sstevel@tonic-gate 	cv_init(&ct->ct_unstable_cv, NULL, CV_DRIVER, NULL);
13587c478bd9Sstevel@tonic-gate 	cv_init(&ct->ct_powerchange_cv, NULL, CV_DRIVER, NULL);
13597c478bd9Sstevel@tonic-gate 	ct->ct_lb = vh->vh_lb;
13603c34adc5Sramat 	ct->ct_lb_args =  kmem_zalloc(sizeof (client_lb_args_t), KM_SLEEP);
13617c478bd9Sstevel@tonic-gate 	ct->ct_lb_args->region_size = LOAD_BALANCE_DEFAULT_REGION_SIZE;
13627c478bd9Sstevel@tonic-gate 	ct->ct_path_count = 0;
13637c478bd9Sstevel@tonic-gate 	ct->ct_path_head = NULL;
13647c478bd9Sstevel@tonic-gate 	ct->ct_path_tail = NULL;
13657c478bd9Sstevel@tonic-gate 	ct->ct_path_last = NULL;
13667c478bd9Sstevel@tonic-gate 
13677c478bd9Sstevel@tonic-gate 	/*
13687c478bd9Sstevel@tonic-gate 	 * Add this client component to our client hash queue
13697c478bd9Sstevel@tonic-gate 	 */
13707c478bd9Sstevel@tonic-gate 	i_mdi_client_enlist_table(vh, ct);
13717c478bd9Sstevel@tonic-gate 	return (ct);
13727c478bd9Sstevel@tonic-gate }
13737c478bd9Sstevel@tonic-gate 
13747c478bd9Sstevel@tonic-gate /*
13757c478bd9Sstevel@tonic-gate  * i_mdi_client_enlist_table():
13767c478bd9Sstevel@tonic-gate  *		Attach the client device to the client hash table. Caller
13775e3986cbScth  *		should hold the vhci client lock.
13787c478bd9Sstevel@tonic-gate  */
13797c478bd9Sstevel@tonic-gate static void
13807c478bd9Sstevel@tonic-gate i_mdi_client_enlist_table(mdi_vhci_t *vh, mdi_client_t *ct)
13817c478bd9Sstevel@tonic-gate {
13827c478bd9Sstevel@tonic-gate 	int 			index;
13837c478bd9Sstevel@tonic-gate 	struct client_hash	*head;
13847c478bd9Sstevel@tonic-gate 
13855e3986cbScth 	ASSERT(MDI_VHCI_CLIENT_LOCKED(vh));
13865e3986cbScth 
13877c478bd9Sstevel@tonic-gate 	index = i_mdi_get_hash_key(ct->ct_guid);
13887c478bd9Sstevel@tonic-gate 	head = &vh->vh_client_table[index];
13897c478bd9Sstevel@tonic-gate 	ct->ct_hnext = (mdi_client_t *)head->ct_hash_head;
13907c478bd9Sstevel@tonic-gate 	head->ct_hash_head = ct;
13917c478bd9Sstevel@tonic-gate 	head->ct_hash_count++;
13927c478bd9Sstevel@tonic-gate 	vh->vh_client_count++;
13937c478bd9Sstevel@tonic-gate }
13947c478bd9Sstevel@tonic-gate 
13957c478bd9Sstevel@tonic-gate /*
13967c478bd9Sstevel@tonic-gate  * i_mdi_client_delist_table():
13977c478bd9Sstevel@tonic-gate  *		Attach the client device to the client hash table.
13985e3986cbScth  *		Caller should hold the vhci client lock.
13997c478bd9Sstevel@tonic-gate  */
14007c478bd9Sstevel@tonic-gate static void
14017c478bd9Sstevel@tonic-gate i_mdi_client_delist_table(mdi_vhci_t *vh, mdi_client_t *ct)
14027c478bd9Sstevel@tonic-gate {
14037c478bd9Sstevel@tonic-gate 	int			index;
14047c478bd9Sstevel@tonic-gate 	char			*guid;
14057c478bd9Sstevel@tonic-gate 	struct client_hash 	*head;
14067c478bd9Sstevel@tonic-gate 	mdi_client_t		*next;
14077c478bd9Sstevel@tonic-gate 	mdi_client_t		*last;
14087c478bd9Sstevel@tonic-gate 
14095e3986cbScth 	ASSERT(MDI_VHCI_CLIENT_LOCKED(vh));
14105e3986cbScth 
14117c478bd9Sstevel@tonic-gate 	guid = ct->ct_guid;
14127c478bd9Sstevel@tonic-gate 	index = i_mdi_get_hash_key(guid);
14137c478bd9Sstevel@tonic-gate 	head = &vh->vh_client_table[index];
14147c478bd9Sstevel@tonic-gate 
14157c478bd9Sstevel@tonic-gate 	last = NULL;
14167c478bd9Sstevel@tonic-gate 	next = (mdi_client_t *)head->ct_hash_head;
14177c478bd9Sstevel@tonic-gate 	while (next != NULL) {
14187c478bd9Sstevel@tonic-gate 		if (next == ct) {
14197c478bd9Sstevel@tonic-gate 			break;
14207c478bd9Sstevel@tonic-gate 		}
14217c478bd9Sstevel@tonic-gate 		last = next;
14227c478bd9Sstevel@tonic-gate 		next = next->ct_hnext;
14237c478bd9Sstevel@tonic-gate 	}
14247c478bd9Sstevel@tonic-gate 
14257c478bd9Sstevel@tonic-gate 	if (next) {
14267c478bd9Sstevel@tonic-gate 		head->ct_hash_count--;
14277c478bd9Sstevel@tonic-gate 		if (last == NULL) {
14287c478bd9Sstevel@tonic-gate 			head->ct_hash_head = ct->ct_hnext;
14297c478bd9Sstevel@tonic-gate 		} else {
14307c478bd9Sstevel@tonic-gate 			last->ct_hnext = ct->ct_hnext;
14317c478bd9Sstevel@tonic-gate 		}
14327c478bd9Sstevel@tonic-gate 		ct->ct_hnext = NULL;
14337c478bd9Sstevel@tonic-gate 		vh->vh_client_count--;
14347c478bd9Sstevel@tonic-gate 	}
14357c478bd9Sstevel@tonic-gate }
14367c478bd9Sstevel@tonic-gate 
14377c478bd9Sstevel@tonic-gate 
14387c478bd9Sstevel@tonic-gate /*
14397c478bd9Sstevel@tonic-gate  * i_mdi_client_free():
14407c478bd9Sstevel@tonic-gate  *		Free a client component
14417c478bd9Sstevel@tonic-gate  */
14427c478bd9Sstevel@tonic-gate static int
14437c478bd9Sstevel@tonic-gate i_mdi_client_free(mdi_vhci_t *vh, mdi_client_t *ct)
14447c478bd9Sstevel@tonic-gate {
14457c478bd9Sstevel@tonic-gate 	int		rv = MDI_SUCCESS;
14467c478bd9Sstevel@tonic-gate 	int		flags = ct->ct_flags;
14477c478bd9Sstevel@tonic-gate 	dev_info_t	*cdip;
14487c478bd9Sstevel@tonic-gate 	dev_info_t	*vdip;
14497c478bd9Sstevel@tonic-gate 
14505e3986cbScth 	ASSERT(MDI_VHCI_CLIENT_LOCKED(vh));
14515e3986cbScth 
14527c478bd9Sstevel@tonic-gate 	vdip = vh->vh_dip;
14537c478bd9Sstevel@tonic-gate 	cdip = ct->ct_dip;
14547c478bd9Sstevel@tonic-gate 
14557c478bd9Sstevel@tonic-gate 	(void) ndi_prop_remove(DDI_DEV_T_NONE, cdip, MDI_CLIENT_GUID_PROP);
14567c478bd9Sstevel@tonic-gate 	DEVI(cdip)->devi_mdi_component &= ~MDI_COMPONENT_CLIENT;
14577c478bd9Sstevel@tonic-gate 	DEVI(cdip)->devi_mdi_client = NULL;
14587c478bd9Sstevel@tonic-gate 
14597c478bd9Sstevel@tonic-gate 	/*
14607c478bd9Sstevel@tonic-gate 	 * Clear out back ref. to dev_info_t node
14617c478bd9Sstevel@tonic-gate 	 */
14627c478bd9Sstevel@tonic-gate 	ct->ct_dip = NULL;
14637c478bd9Sstevel@tonic-gate 
14647c478bd9Sstevel@tonic-gate 	/*
14657c478bd9Sstevel@tonic-gate 	 * Remove this client from our hash queue
14667c478bd9Sstevel@tonic-gate 	 */
14677c478bd9Sstevel@tonic-gate 	i_mdi_client_delist_table(vh, ct);
14687c478bd9Sstevel@tonic-gate 
14697c478bd9Sstevel@tonic-gate 	/*
14707c478bd9Sstevel@tonic-gate 	 * Uninitialize and free the component
14717c478bd9Sstevel@tonic-gate 	 */
14727c478bd9Sstevel@tonic-gate 	kmem_free(ct->ct_drvname, strlen(ct->ct_drvname) + 1);
14737c478bd9Sstevel@tonic-gate 	kmem_free(ct->ct_guid, strlen(ct->ct_guid) + 1);
14747c478bd9Sstevel@tonic-gate 	kmem_free(ct->ct_lb_args, sizeof (client_lb_args_t));
14757c478bd9Sstevel@tonic-gate 	cv_destroy(&ct->ct_failover_cv);
14767c478bd9Sstevel@tonic-gate 	cv_destroy(&ct->ct_unstable_cv);
14777c478bd9Sstevel@tonic-gate 	cv_destroy(&ct->ct_powerchange_cv);
14787c478bd9Sstevel@tonic-gate 	mutex_destroy(&ct->ct_mutex);
14797c478bd9Sstevel@tonic-gate 	kmem_free(ct, sizeof (*ct));
14807c478bd9Sstevel@tonic-gate 
14817c478bd9Sstevel@tonic-gate 	if (cdip != NULL) {
14825e3986cbScth 		MDI_VHCI_CLIENT_UNLOCK(vh);
14837c478bd9Sstevel@tonic-gate 		(void) i_mdi_devinfo_remove(vdip, cdip, flags);
14845e3986cbScth 		MDI_VHCI_CLIENT_LOCK(vh);
14857c478bd9Sstevel@tonic-gate 	}
14867c478bd9Sstevel@tonic-gate 	return (rv);
14877c478bd9Sstevel@tonic-gate }
14887c478bd9Sstevel@tonic-gate 
14897c478bd9Sstevel@tonic-gate /*
14907c478bd9Sstevel@tonic-gate  * i_mdi_client_find():
14917c478bd9Sstevel@tonic-gate  * 		Find the client structure corresponding to a given guid
14925e3986cbScth  *		Caller should hold the vhci client lock.
14937c478bd9Sstevel@tonic-gate  */
14947c478bd9Sstevel@tonic-gate static mdi_client_t *
14953c34adc5Sramat i_mdi_client_find(mdi_vhci_t *vh, char *cname, char *guid)
14967c478bd9Sstevel@tonic-gate {
14977c478bd9Sstevel@tonic-gate 	int			index;
14987c478bd9Sstevel@tonic-gate 	struct client_hash	*head;
14997c478bd9Sstevel@tonic-gate 	mdi_client_t		*ct;
15007c478bd9Sstevel@tonic-gate 
15015e3986cbScth 	ASSERT(MDI_VHCI_CLIENT_LOCKED(vh));
15025e3986cbScth 
15037c478bd9Sstevel@tonic-gate 	index = i_mdi_get_hash_key(guid);
15047c478bd9Sstevel@tonic-gate 	head = &vh->vh_client_table[index];
15057c478bd9Sstevel@tonic-gate 
15067c478bd9Sstevel@tonic-gate 	ct = head->ct_hash_head;
15077c478bd9Sstevel@tonic-gate 	while (ct != NULL) {
15083c34adc5Sramat 		if (strcmp(ct->ct_guid, guid) == 0 &&
15093c34adc5Sramat 		    (cname == NULL || strcmp(ct->ct_drvname, cname) == 0)) {
15107c478bd9Sstevel@tonic-gate 			break;
15117c478bd9Sstevel@tonic-gate 		}
15127c478bd9Sstevel@tonic-gate 		ct = ct->ct_hnext;
15137c478bd9Sstevel@tonic-gate 	}
15147c478bd9Sstevel@tonic-gate 	return (ct);
15157c478bd9Sstevel@tonic-gate }
15167c478bd9Sstevel@tonic-gate 
15177c478bd9Sstevel@tonic-gate /*
15187c478bd9Sstevel@tonic-gate  * i_mdi_client_update_state():
15197c478bd9Sstevel@tonic-gate  *		Compute and update client device state
15207c478bd9Sstevel@tonic-gate  * Notes:
15217c478bd9Sstevel@tonic-gate  *		A client device can be in any of three possible states:
15227c478bd9Sstevel@tonic-gate  *
15237c478bd9Sstevel@tonic-gate  *		MDI_CLIENT_STATE_OPTIMAL - Client in optimal state with more
15247c478bd9Sstevel@tonic-gate  *		one online/standby paths. Can tolerate failures.
15257c478bd9Sstevel@tonic-gate  *		MDI_CLIENT_STATE_DEGRADED - Client device in degraded state with
15267c478bd9Sstevel@tonic-gate  *		no alternate paths available as standby. A failure on the online
15277c478bd9Sstevel@tonic-gate  *		would result in loss of access to device data.
15287c478bd9Sstevel@tonic-gate  *		MDI_CLIENT_STATE_FAILED - Client device in failed state with
15297c478bd9Sstevel@tonic-gate  *		no paths available to access the device.
15307c478bd9Sstevel@tonic-gate  */
15317c478bd9Sstevel@tonic-gate static void
15327c478bd9Sstevel@tonic-gate i_mdi_client_update_state(mdi_client_t *ct)
15337c478bd9Sstevel@tonic-gate {
15347c478bd9Sstevel@tonic-gate 	int state;
15355e3986cbScth 
15365e3986cbScth 	ASSERT(MDI_CLIENT_LOCKED(ct));
15377c478bd9Sstevel@tonic-gate 	state = i_mdi_client_compute_state(ct, NULL);
15387c478bd9Sstevel@tonic-gate 	MDI_CLIENT_SET_STATE(ct, state);
15397c478bd9Sstevel@tonic-gate }
15407c478bd9Sstevel@tonic-gate 
15417c478bd9Sstevel@tonic-gate /*
15427c478bd9Sstevel@tonic-gate  * i_mdi_client_compute_state():
15437c478bd9Sstevel@tonic-gate  *		Compute client device state
15447c478bd9Sstevel@tonic-gate  *
15457c478bd9Sstevel@tonic-gate  *		mdi_phci_t *	Pointer to pHCI structure which should
15467c478bd9Sstevel@tonic-gate  *				while computing the new value.  Used by
15477c478bd9Sstevel@tonic-gate  *				i_mdi_phci_offline() to find the new
15487c478bd9Sstevel@tonic-gate  *				client state after DR of a pHCI.
15497c478bd9Sstevel@tonic-gate  */
15507c478bd9Sstevel@tonic-gate static int
15517c478bd9Sstevel@tonic-gate i_mdi_client_compute_state(mdi_client_t *ct, mdi_phci_t *ph)
15527c478bd9Sstevel@tonic-gate {
15537c478bd9Sstevel@tonic-gate 	int		state;
15547c478bd9Sstevel@tonic-gate 	int		online_count = 0;
15557c478bd9Sstevel@tonic-gate 	int		standby_count = 0;
15567c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*pip, *next;
15577c478bd9Sstevel@tonic-gate 
15585e3986cbScth 	ASSERT(MDI_CLIENT_LOCKED(ct));
15597c478bd9Sstevel@tonic-gate 	pip = ct->ct_path_head;
15607c478bd9Sstevel@tonic-gate 	while (pip != NULL) {
15617c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
15627c478bd9Sstevel@tonic-gate 		next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link;
15637c478bd9Sstevel@tonic-gate 		if (MDI_PI(pip)->pi_phci == ph) {
15647c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
15657c478bd9Sstevel@tonic-gate 			pip = next;
15667c478bd9Sstevel@tonic-gate 			continue;
15677c478bd9Sstevel@tonic-gate 		}
15685e3986cbScth 
15697c478bd9Sstevel@tonic-gate 		if ((MDI_PI(pip)->pi_state & MDI_PATHINFO_STATE_MASK)
15707c478bd9Sstevel@tonic-gate 				== MDI_PATHINFO_STATE_ONLINE)
15717c478bd9Sstevel@tonic-gate 			online_count++;
15727c478bd9Sstevel@tonic-gate 		else if ((MDI_PI(pip)->pi_state & MDI_PATHINFO_STATE_MASK)
15737c478bd9Sstevel@tonic-gate 				== MDI_PATHINFO_STATE_STANDBY)
15747c478bd9Sstevel@tonic-gate 			standby_count++;
15757c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
15767c478bd9Sstevel@tonic-gate 		pip = next;
15777c478bd9Sstevel@tonic-gate 	}
15787c478bd9Sstevel@tonic-gate 
15797c478bd9Sstevel@tonic-gate 	if (online_count == 0) {
15807c478bd9Sstevel@tonic-gate 		if (standby_count == 0) {
15817c478bd9Sstevel@tonic-gate 			state = MDI_CLIENT_STATE_FAILED;
15824c06356bSdh142964 			MDI_DEBUG(2, (MDI_NOTE, ct->ct_dip,
15834c06356bSdh142964 			    "client state failed: ct = %p", (void *)ct));
15847c478bd9Sstevel@tonic-gate 		} else if (standby_count == 1) {
15857c478bd9Sstevel@tonic-gate 			state = MDI_CLIENT_STATE_DEGRADED;
15867c478bd9Sstevel@tonic-gate 		} else {
15877c478bd9Sstevel@tonic-gate 			state = MDI_CLIENT_STATE_OPTIMAL;
15887c478bd9Sstevel@tonic-gate 		}
15897c478bd9Sstevel@tonic-gate 	} else if (online_count == 1) {
15907c478bd9Sstevel@tonic-gate 		if (standby_count == 0) {
15917c478bd9Sstevel@tonic-gate 			state = MDI_CLIENT_STATE_DEGRADED;
15927c478bd9Sstevel@tonic-gate 		} else {
15937c478bd9Sstevel@tonic-gate 			state = MDI_CLIENT_STATE_OPTIMAL;
15947c478bd9Sstevel@tonic-gate 		}
15957c478bd9Sstevel@tonic-gate 	} else {
15967c478bd9Sstevel@tonic-gate 		state = MDI_CLIENT_STATE_OPTIMAL;
15977c478bd9Sstevel@tonic-gate 	}
15987c478bd9Sstevel@tonic-gate 	return (state);
15997c478bd9Sstevel@tonic-gate }
16007c478bd9Sstevel@tonic-gate 
16017c478bd9Sstevel@tonic-gate /*
16027c478bd9Sstevel@tonic-gate  * i_mdi_client2devinfo():
16037c478bd9Sstevel@tonic-gate  *		Utility function
16047c478bd9Sstevel@tonic-gate  */
16057c478bd9Sstevel@tonic-gate dev_info_t *
16067c478bd9Sstevel@tonic-gate i_mdi_client2devinfo(mdi_client_t *ct)
16077c478bd9Sstevel@tonic-gate {
16087c478bd9Sstevel@tonic-gate 	return (ct->ct_dip);
16097c478bd9Sstevel@tonic-gate }
16107c478bd9Sstevel@tonic-gate 
16117c478bd9Sstevel@tonic-gate /*
16127c478bd9Sstevel@tonic-gate  * mdi_client_path2_devinfo():
16137c478bd9Sstevel@tonic-gate  * 		Given the parent devinfo and child devfs pathname, search for
16147c478bd9Sstevel@tonic-gate  *		a valid devfs node handle.
16157c478bd9Sstevel@tonic-gate  */
16167c478bd9Sstevel@tonic-gate dev_info_t *
16177c478bd9Sstevel@tonic-gate mdi_client_path2devinfo(dev_info_t *vdip, char *pathname)
16187c478bd9Sstevel@tonic-gate {
16197c478bd9Sstevel@tonic-gate 	dev_info_t 	*cdip = NULL;
16207c478bd9Sstevel@tonic-gate 	dev_info_t 	*ndip = NULL;
16217c478bd9Sstevel@tonic-gate 	char		*temp_pathname;
16227c478bd9Sstevel@tonic-gate 	int		circular;
16237c478bd9Sstevel@tonic-gate 
16247c478bd9Sstevel@tonic-gate 	/*
16257c478bd9Sstevel@tonic-gate 	 * Allocate temp buffer
16267c478bd9Sstevel@tonic-gate 	 */
16277c478bd9Sstevel@tonic-gate 	temp_pathname = kmem_zalloc(MAXPATHLEN, KM_SLEEP);
16287c478bd9Sstevel@tonic-gate 
16297c478bd9Sstevel@tonic-gate 	/*
16307c478bd9Sstevel@tonic-gate 	 * Lock parent against changes
16317c478bd9Sstevel@tonic-gate 	 */
16327c478bd9Sstevel@tonic-gate 	ndi_devi_enter(vdip, &circular);
16337c478bd9Sstevel@tonic-gate 	ndip = (dev_info_t *)DEVI(vdip)->devi_child;
16347c478bd9Sstevel@tonic-gate 	while ((cdip = ndip) != NULL) {
16357c478bd9Sstevel@tonic-gate 		ndip = (dev_info_t *)DEVI(cdip)->devi_sibling;
16367c478bd9Sstevel@tonic-gate 
16377c478bd9Sstevel@tonic-gate 		*temp_pathname = '\0';
16387c478bd9Sstevel@tonic-gate 		(void) ddi_pathname(cdip, temp_pathname);
16397c478bd9Sstevel@tonic-gate 		if (strcmp(temp_pathname, pathname) == 0) {
16407c478bd9Sstevel@tonic-gate 			break;
16417c478bd9Sstevel@tonic-gate 		}
16427c478bd9Sstevel@tonic-gate 	}
16437c478bd9Sstevel@tonic-gate 	/*
16447c478bd9Sstevel@tonic-gate 	 * Release devinfo lock
16457c478bd9Sstevel@tonic-gate 	 */
16467c478bd9Sstevel@tonic-gate 	ndi_devi_exit(vdip, circular);
16477c478bd9Sstevel@tonic-gate 
16487c478bd9Sstevel@tonic-gate 	/*
16497c478bd9Sstevel@tonic-gate 	 * Free the temp buffer
16507c478bd9Sstevel@tonic-gate 	 */
16517c478bd9Sstevel@tonic-gate 	kmem_free(temp_pathname, MAXPATHLEN);
16527c478bd9Sstevel@tonic-gate 	return (cdip);
16537c478bd9Sstevel@tonic-gate }
16547c478bd9Sstevel@tonic-gate 
16557c478bd9Sstevel@tonic-gate /*
16567c478bd9Sstevel@tonic-gate  * mdi_client_get_path_count():
16577c478bd9Sstevel@tonic-gate  * 		Utility function to get number of path information nodes
16587c478bd9Sstevel@tonic-gate  *		associated with a given client device.
16597c478bd9Sstevel@tonic-gate  */
16607c478bd9Sstevel@tonic-gate int
16617c478bd9Sstevel@tonic-gate mdi_client_get_path_count(dev_info_t *cdip)
16627c478bd9Sstevel@tonic-gate {
16637c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
16647c478bd9Sstevel@tonic-gate 	int		count = 0;
16657c478bd9Sstevel@tonic-gate 
16667c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(cdip);
16677c478bd9Sstevel@tonic-gate 	if (ct != NULL) {
16687c478bd9Sstevel@tonic-gate 		count = ct->ct_path_count;
16697c478bd9Sstevel@tonic-gate 	}
16707c478bd9Sstevel@tonic-gate 	return (count);
16717c478bd9Sstevel@tonic-gate }
16727c478bd9Sstevel@tonic-gate 
16737c478bd9Sstevel@tonic-gate 
16747c478bd9Sstevel@tonic-gate /*
16757c478bd9Sstevel@tonic-gate  * i_mdi_get_hash_key():
16767c478bd9Sstevel@tonic-gate  * 		Create a hash using strings as keys
16777c478bd9Sstevel@tonic-gate  *
16787c478bd9Sstevel@tonic-gate  */
16797c478bd9Sstevel@tonic-gate static int
16807c478bd9Sstevel@tonic-gate i_mdi_get_hash_key(char *str)
16817c478bd9Sstevel@tonic-gate {
16827c478bd9Sstevel@tonic-gate 	uint32_t	g, hash = 0;
16837c478bd9Sstevel@tonic-gate 	char		*p;
16847c478bd9Sstevel@tonic-gate 
16857c478bd9Sstevel@tonic-gate 	for (p = str; *p != '\0'; p++) {
16867c478bd9Sstevel@tonic-gate 		g = *p;
16877c478bd9Sstevel@tonic-gate 		hash += g;
16887c478bd9Sstevel@tonic-gate 	}
16897c478bd9Sstevel@tonic-gate 	return (hash % (CLIENT_HASH_TABLE_SIZE - 1));
16907c478bd9Sstevel@tonic-gate }
16917c478bd9Sstevel@tonic-gate 
16927c478bd9Sstevel@tonic-gate /*
16937c478bd9Sstevel@tonic-gate  * mdi_get_lb_policy():
16947c478bd9Sstevel@tonic-gate  * 		Get current load balancing policy for a given client device
16957c478bd9Sstevel@tonic-gate  */
16967c478bd9Sstevel@tonic-gate client_lb_t
16977c478bd9Sstevel@tonic-gate mdi_get_lb_policy(dev_info_t *cdip)
16987c478bd9Sstevel@tonic-gate {
16997c478bd9Sstevel@tonic-gate 	client_lb_t	lb = LOAD_BALANCE_NONE;
17007c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
17017c478bd9Sstevel@tonic-gate 
17027c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(cdip);
17037c478bd9Sstevel@tonic-gate 	if (ct != NULL) {
17047c478bd9Sstevel@tonic-gate 		lb = ct->ct_lb;
17057c478bd9Sstevel@tonic-gate 	}
17067c478bd9Sstevel@tonic-gate 	return (lb);
17077c478bd9Sstevel@tonic-gate }
17087c478bd9Sstevel@tonic-gate 
17097c478bd9Sstevel@tonic-gate /*
17107c478bd9Sstevel@tonic-gate  * mdi_set_lb_region_size():
17117c478bd9Sstevel@tonic-gate  * 		Set current region size for the load-balance
17127c478bd9Sstevel@tonic-gate  */
17137c478bd9Sstevel@tonic-gate int
17147c478bd9Sstevel@tonic-gate mdi_set_lb_region_size(dev_info_t *cdip, int region_size)
17157c478bd9Sstevel@tonic-gate {
17167c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
17177c478bd9Sstevel@tonic-gate 	int		rv = MDI_FAILURE;
17187c478bd9Sstevel@tonic-gate 
17197c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(cdip);
17207c478bd9Sstevel@tonic-gate 	if (ct != NULL && ct->ct_lb_args != NULL) {
17217c478bd9Sstevel@tonic-gate 		ct->ct_lb_args->region_size = region_size;
17227c478bd9Sstevel@tonic-gate 		rv = MDI_SUCCESS;
17237c478bd9Sstevel@tonic-gate 	}
17247c478bd9Sstevel@tonic-gate 	return (rv);
17257c478bd9Sstevel@tonic-gate }
17267c478bd9Sstevel@tonic-gate 
17277c478bd9Sstevel@tonic-gate /*
17287c478bd9Sstevel@tonic-gate  * mdi_Set_lb_policy():
17297c478bd9Sstevel@tonic-gate  * 		Set current load balancing policy for a given client device
17307c478bd9Sstevel@tonic-gate  */
17317c478bd9Sstevel@tonic-gate int
17327c478bd9Sstevel@tonic-gate mdi_set_lb_policy(dev_info_t *cdip, client_lb_t lb)
17337c478bd9Sstevel@tonic-gate {
17347c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
17357c478bd9Sstevel@tonic-gate 	int		rv = MDI_FAILURE;
17367c478bd9Sstevel@tonic-gate 
17377c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(cdip);
17387c478bd9Sstevel@tonic-gate 	if (ct != NULL) {
17397c478bd9Sstevel@tonic-gate 		ct->ct_lb = lb;
17407c478bd9Sstevel@tonic-gate 		rv = MDI_SUCCESS;
17417c478bd9Sstevel@tonic-gate 	}
17427c478bd9Sstevel@tonic-gate 	return (rv);
17437c478bd9Sstevel@tonic-gate }
17447c478bd9Sstevel@tonic-gate 
17457c478bd9Sstevel@tonic-gate /*
17467c478bd9Sstevel@tonic-gate  * mdi_failover():
17477c478bd9Sstevel@tonic-gate  *		failover function called by the vHCI drivers to initiate
17487c478bd9Sstevel@tonic-gate  *		a failover operation.  This is typically due to non-availability
17497c478bd9Sstevel@tonic-gate  *		of online paths to route I/O requests.  Failover can be
17507c478bd9Sstevel@tonic-gate  *		triggered through user application also.
17517c478bd9Sstevel@tonic-gate  *
17527c478bd9Sstevel@tonic-gate  *		The vHCI driver calls mdi_failover() to initiate a failover
17537c478bd9Sstevel@tonic-gate  *		operation. mdi_failover() calls back into the vHCI driver's
17547c478bd9Sstevel@tonic-gate  *		vo_failover() entry point to perform the actual failover
17557c478bd9Sstevel@tonic-gate  *		operation.  The reason for requiring the vHCI driver to
17567c478bd9Sstevel@tonic-gate  *		initiate failover by calling mdi_failover(), instead of directly
17577c478bd9Sstevel@tonic-gate  *		executing vo_failover() itself, is to ensure that the mdi
17587c478bd9Sstevel@tonic-gate  *		framework can keep track of the client state properly.
17597c478bd9Sstevel@tonic-gate  *		Additionally, mdi_failover() provides as a convenience the
17607c478bd9Sstevel@tonic-gate  *		option of performing the failover operation synchronously or
17617c478bd9Sstevel@tonic-gate  *		asynchronously
17627c478bd9Sstevel@tonic-gate  *
17637c478bd9Sstevel@tonic-gate  *		Upon successful completion of the failover operation, the
17647c478bd9Sstevel@tonic-gate  *		paths that were previously ONLINE will be in the STANDBY state,
17657c478bd9Sstevel@tonic-gate  *		and the newly activated paths will be in the ONLINE state.
17667c478bd9Sstevel@tonic-gate  *
17677c478bd9Sstevel@tonic-gate  *		The flags modifier determines whether the activation is done
17687c478bd9Sstevel@tonic-gate  *		synchronously: MDI_FAILOVER_SYNC
17697c478bd9Sstevel@tonic-gate  * Return Values:
17707c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
17717c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
17727c478bd9Sstevel@tonic-gate  *		MDI_BUSY
17737c478bd9Sstevel@tonic-gate  */
17747c478bd9Sstevel@tonic-gate /*ARGSUSED*/
17757c478bd9Sstevel@tonic-gate int
17767c478bd9Sstevel@tonic-gate mdi_failover(dev_info_t *vdip, dev_info_t *cdip, int flags)
17777c478bd9Sstevel@tonic-gate {
17787c478bd9Sstevel@tonic-gate 	int			rv;
17797c478bd9Sstevel@tonic-gate 	mdi_client_t		*ct;
17807c478bd9Sstevel@tonic-gate 
17817c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(cdip);
17827c478bd9Sstevel@tonic-gate 	ASSERT(ct != NULL);
17837c478bd9Sstevel@tonic-gate 	if (ct == NULL) {
17847c478bd9Sstevel@tonic-gate 		/* cdip is not a valid client device. Nothing more to do. */
17857c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
17867c478bd9Sstevel@tonic-gate 	}
17877c478bd9Sstevel@tonic-gate 
17887c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
17897c478bd9Sstevel@tonic-gate 
17907c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT_IS_PATH_FREE_IN_PROGRESS(ct)) {
17917c478bd9Sstevel@tonic-gate 		/* A path to the client is being freed */
17927c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
17937c478bd9Sstevel@tonic-gate 		return (MDI_BUSY);
17947c478bd9Sstevel@tonic-gate 	}
17957c478bd9Sstevel@tonic-gate 
17967c478bd9Sstevel@tonic-gate 
17977c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT_IS_FAILED(ct)) {
17987c478bd9Sstevel@tonic-gate 		/*
17997c478bd9Sstevel@tonic-gate 		 * Client is in failed state. Nothing more to do.
18007c478bd9Sstevel@tonic-gate 		 */
18017c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
18027c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
18037c478bd9Sstevel@tonic-gate 	}
18047c478bd9Sstevel@tonic-gate 
18057c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT_IS_FAILOVER_IN_PROGRESS(ct)) {
18067c478bd9Sstevel@tonic-gate 		/*
18077c478bd9Sstevel@tonic-gate 		 * Failover is already in progress; return BUSY
18087c478bd9Sstevel@tonic-gate 		 */
18097c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
18107c478bd9Sstevel@tonic-gate 		return (MDI_BUSY);
18117c478bd9Sstevel@tonic-gate 	}
18127c478bd9Sstevel@tonic-gate 	/*
18137c478bd9Sstevel@tonic-gate 	 * Make sure that mdi_pathinfo node state changes are processed.
18147c478bd9Sstevel@tonic-gate 	 * We do not allow failovers to progress while client path state
18157c478bd9Sstevel@tonic-gate 	 * changes are in progress
18167c478bd9Sstevel@tonic-gate 	 */
18177c478bd9Sstevel@tonic-gate 	if (ct->ct_unstable) {
18187c478bd9Sstevel@tonic-gate 		if (flags == MDI_FAILOVER_ASYNC) {
18197c478bd9Sstevel@tonic-gate 			MDI_CLIENT_UNLOCK(ct);
18207c478bd9Sstevel@tonic-gate 			return (MDI_BUSY);
18217c478bd9Sstevel@tonic-gate 		} else {
18227c478bd9Sstevel@tonic-gate 			while (ct->ct_unstable)
18237c478bd9Sstevel@tonic-gate 				cv_wait(&ct->ct_unstable_cv, &ct->ct_mutex);
18247c478bd9Sstevel@tonic-gate 		}
18257c478bd9Sstevel@tonic-gate 	}
18267c478bd9Sstevel@tonic-gate 
18277c478bd9Sstevel@tonic-gate 	/*
18287c478bd9Sstevel@tonic-gate 	 * Client device is in stable state. Before proceeding, perform sanity
18297c478bd9Sstevel@tonic-gate 	 * checks again.
18307c478bd9Sstevel@tonic-gate 	 */
18317c478bd9Sstevel@tonic-gate 	if ((MDI_CLIENT_IS_DETACHED(ct)) || (MDI_CLIENT_IS_FAILED(ct)) ||
1832737d277aScth 	    (!i_ddi_devi_attached(ct->ct_dip))) {
18337c478bd9Sstevel@tonic-gate 		/*
18347c478bd9Sstevel@tonic-gate 		 * Client is in failed state. Nothing more to do.
18357c478bd9Sstevel@tonic-gate 		 */
18367c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
18377c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
18387c478bd9Sstevel@tonic-gate 	}
18397c478bd9Sstevel@tonic-gate 
18407c478bd9Sstevel@tonic-gate 	/*
18417c478bd9Sstevel@tonic-gate 	 * Set the client state as failover in progress.
18427c478bd9Sstevel@tonic-gate 	 */
18437c478bd9Sstevel@tonic-gate 	MDI_CLIENT_SET_FAILOVER_IN_PROGRESS(ct);
18447c478bd9Sstevel@tonic-gate 	ct->ct_failover_flags = flags;
18457c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
18467c478bd9Sstevel@tonic-gate 
18477c478bd9Sstevel@tonic-gate 	if (flags == MDI_FAILOVER_ASYNC) {
18487c478bd9Sstevel@tonic-gate 		/*
18497c478bd9Sstevel@tonic-gate 		 * Submit the initiate failover request via CPR safe
18507c478bd9Sstevel@tonic-gate 		 * taskq threads.
18517c478bd9Sstevel@tonic-gate 		 */
18527c478bd9Sstevel@tonic-gate 		(void) taskq_dispatch(mdi_taskq, (task_func_t *)i_mdi_failover,
18537c478bd9Sstevel@tonic-gate 		    ct, KM_SLEEP);
18547c478bd9Sstevel@tonic-gate 		return (MDI_ACCEPT);
18557c478bd9Sstevel@tonic-gate 	} else {
18567c478bd9Sstevel@tonic-gate 		/*
18577c478bd9Sstevel@tonic-gate 		 * Synchronous failover mode.  Typically invoked from the user
18587c478bd9Sstevel@tonic-gate 		 * land.
18597c478bd9Sstevel@tonic-gate 		 */
18607c478bd9Sstevel@tonic-gate 		rv = i_mdi_failover(ct);
18617c478bd9Sstevel@tonic-gate 	}
18627c478bd9Sstevel@tonic-gate 	return (rv);
18637c478bd9Sstevel@tonic-gate }
18647c478bd9Sstevel@tonic-gate 
18657c478bd9Sstevel@tonic-gate /*
18667c478bd9Sstevel@tonic-gate  * i_mdi_failover():
18677c478bd9Sstevel@tonic-gate  *		internal failover function. Invokes vHCI drivers failover
18687c478bd9Sstevel@tonic-gate  *		callback function and process the failover status
18697c478bd9Sstevel@tonic-gate  * Return Values:
18707c478bd9Sstevel@tonic-gate  *		None
18717c478bd9Sstevel@tonic-gate  *
18727c478bd9Sstevel@tonic-gate  * Note: A client device in failover state can not be detached or freed.
18737c478bd9Sstevel@tonic-gate  */
18747c478bd9Sstevel@tonic-gate static int
18757c478bd9Sstevel@tonic-gate i_mdi_failover(void *arg)
18767c478bd9Sstevel@tonic-gate {
18777c478bd9Sstevel@tonic-gate 	int		rv = MDI_SUCCESS;
18787c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct = (mdi_client_t *)arg;
18797c478bd9Sstevel@tonic-gate 	mdi_vhci_t	*vh = ct->ct_vhci;
18807c478bd9Sstevel@tonic-gate 
18815e3986cbScth 	ASSERT(!MDI_CLIENT_LOCKED(ct));
18827c478bd9Sstevel@tonic-gate 
18837c478bd9Sstevel@tonic-gate 	if (vh->vh_ops->vo_failover != NULL) {
18847c478bd9Sstevel@tonic-gate 		/*
18857c478bd9Sstevel@tonic-gate 		 * Call vHCI drivers callback routine
18867c478bd9Sstevel@tonic-gate 		 */
18877c478bd9Sstevel@tonic-gate 		rv = (*vh->vh_ops->vo_failover)(vh->vh_dip, ct->ct_dip,
18887c478bd9Sstevel@tonic-gate 		    ct->ct_failover_flags);
18897c478bd9Sstevel@tonic-gate 	}
18907c478bd9Sstevel@tonic-gate 
18917c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
18927c478bd9Sstevel@tonic-gate 	MDI_CLIENT_CLEAR_FAILOVER_IN_PROGRESS(ct);
18937c478bd9Sstevel@tonic-gate 
18947c478bd9Sstevel@tonic-gate 	/*
18957c478bd9Sstevel@tonic-gate 	 * Save the failover return status
18967c478bd9Sstevel@tonic-gate 	 */
18977c478bd9Sstevel@tonic-gate 	ct->ct_failover_status = rv;
18987c478bd9Sstevel@tonic-gate 
18997c478bd9Sstevel@tonic-gate 	/*
19007c478bd9Sstevel@tonic-gate 	 * As a result of failover, client status would have been changed.
19017c478bd9Sstevel@tonic-gate 	 * Update the client state and wake up anyone waiting on this client
19027c478bd9Sstevel@tonic-gate 	 * device.
19037c478bd9Sstevel@tonic-gate 	 */
19047c478bd9Sstevel@tonic-gate 	i_mdi_client_update_state(ct);
19057c478bd9Sstevel@tonic-gate 
19067c478bd9Sstevel@tonic-gate 	cv_broadcast(&ct->ct_failover_cv);
19077c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
19087c478bd9Sstevel@tonic-gate 	return (rv);
19097c478bd9Sstevel@tonic-gate }
19107c478bd9Sstevel@tonic-gate 
19117c478bd9Sstevel@tonic-gate /*
19127c478bd9Sstevel@tonic-gate  * Load balancing is logical block.
19137c478bd9Sstevel@tonic-gate  * IOs within the range described by region_size
19147c478bd9Sstevel@tonic-gate  * would go on the same path. This would improve the
19157c478bd9Sstevel@tonic-gate  * performance by cache-hit on some of the RAID devices.
19167c478bd9Sstevel@tonic-gate  * Search only for online paths(At some point we
19177c478bd9Sstevel@tonic-gate  * may want to balance across target ports).
19187c478bd9Sstevel@tonic-gate  * If no paths are found then default to round-robin.
19197c478bd9Sstevel@tonic-gate  */
19207c478bd9Sstevel@tonic-gate static int
19217c478bd9Sstevel@tonic-gate i_mdi_lba_lb(mdi_client_t *ct, mdi_pathinfo_t **ret_pip, struct buf *bp)
19227c478bd9Sstevel@tonic-gate {
19237c478bd9Sstevel@tonic-gate 	int		path_index = -1;
19247c478bd9Sstevel@tonic-gate 	int		online_path_count = 0;
19257c478bd9Sstevel@tonic-gate 	int		online_nonpref_path_count = 0;
19267c478bd9Sstevel@tonic-gate 	int 		region_size = ct->ct_lb_args->region_size;
19277c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*pip;
19287c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*next;
19297c478bd9Sstevel@tonic-gate 	int		preferred, path_cnt;
19307c478bd9Sstevel@tonic-gate 
19317c478bd9Sstevel@tonic-gate 	pip = ct->ct_path_head;
19327c478bd9Sstevel@tonic-gate 	while (pip) {
19337c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
19347c478bd9Sstevel@tonic-gate 		if (MDI_PI(pip)->pi_state ==
19357c478bd9Sstevel@tonic-gate 		    MDI_PATHINFO_STATE_ONLINE && MDI_PI(pip)->pi_preferred) {
19367c478bd9Sstevel@tonic-gate 			online_path_count++;
19377c478bd9Sstevel@tonic-gate 		} else if (MDI_PI(pip)->pi_state ==
19387c478bd9Sstevel@tonic-gate 		    MDI_PATHINFO_STATE_ONLINE && !MDI_PI(pip)->pi_preferred) {
19397c478bd9Sstevel@tonic-gate 			online_nonpref_path_count++;
19407c478bd9Sstevel@tonic-gate 		}
19417c478bd9Sstevel@tonic-gate 		next = (mdi_pathinfo_t *)
19427c478bd9Sstevel@tonic-gate 		    MDI_PI(pip)->pi_client_link;
19437c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
19447c478bd9Sstevel@tonic-gate 		pip = next;
19457c478bd9Sstevel@tonic-gate 	}
19467c478bd9Sstevel@tonic-gate 	/* if found any online/preferred then use this type */
19477c478bd9Sstevel@tonic-gate 	if (online_path_count > 0) {
19487c478bd9Sstevel@tonic-gate 		path_cnt = online_path_count;
19497c478bd9Sstevel@tonic-gate 		preferred = 1;
19507c478bd9Sstevel@tonic-gate 	} else if (online_nonpref_path_count > 0) {
19517c478bd9Sstevel@tonic-gate 		path_cnt = online_nonpref_path_count;
19527c478bd9Sstevel@tonic-gate 		preferred = 0;
19537c478bd9Sstevel@tonic-gate 	} else {
19547c478bd9Sstevel@tonic-gate 		path_cnt = 0;
19557c478bd9Sstevel@tonic-gate 	}
19567c478bd9Sstevel@tonic-gate 	if (path_cnt) {
19577c478bd9Sstevel@tonic-gate 		path_index = (bp->b_blkno >> region_size) % path_cnt;
19587c478bd9Sstevel@tonic-gate 		pip = ct->ct_path_head;
19597c478bd9Sstevel@tonic-gate 		while (pip && path_index != -1) {
19607c478bd9Sstevel@tonic-gate 			MDI_PI_LOCK(pip);
19617c478bd9Sstevel@tonic-gate 			if (path_index == 0 &&
19627c478bd9Sstevel@tonic-gate 			    (MDI_PI(pip)->pi_state ==
19637c478bd9Sstevel@tonic-gate 			    MDI_PATHINFO_STATE_ONLINE) &&
19647c478bd9Sstevel@tonic-gate 				MDI_PI(pip)->pi_preferred == preferred) {
19657c478bd9Sstevel@tonic-gate 				MDI_PI_HOLD(pip);
19667c478bd9Sstevel@tonic-gate 				MDI_PI_UNLOCK(pip);
19677c478bd9Sstevel@tonic-gate 				*ret_pip = pip;
19687c478bd9Sstevel@tonic-gate 				return (MDI_SUCCESS);
19697c478bd9Sstevel@tonic-gate 			}
19707c478bd9Sstevel@tonic-gate 			path_index --;
19717c478bd9Sstevel@tonic-gate 			next = (mdi_pathinfo_t *)
19727c478bd9Sstevel@tonic-gate 			    MDI_PI(pip)->pi_client_link;
19737c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
19747c478bd9Sstevel@tonic-gate 			pip = next;
19757c478bd9Sstevel@tonic-gate 		}
19764c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, ct->ct_dip,
19774c06356bSdh142964 		    "lba %llx: path %s %p",
19784c06356bSdh142964 		    bp->b_lblkno, mdi_pi_spathname(pip), (void *)pip));
19797c478bd9Sstevel@tonic-gate 	}
19807c478bd9Sstevel@tonic-gate 	return (MDI_FAILURE);
19817c478bd9Sstevel@tonic-gate }
19827c478bd9Sstevel@tonic-gate 
19837c478bd9Sstevel@tonic-gate /*
19847c478bd9Sstevel@tonic-gate  * mdi_select_path():
19857c478bd9Sstevel@tonic-gate  *		select a path to access a client device.
19867c478bd9Sstevel@tonic-gate  *
19877c478bd9Sstevel@tonic-gate  *		mdi_select_path() function is called by the vHCI drivers to
19887c478bd9Sstevel@tonic-gate  *		select a path to route the I/O request to.  The caller passes
19897c478bd9Sstevel@tonic-gate  *		the block I/O data transfer structure ("buf") as one of the
19907c478bd9Sstevel@tonic-gate  *		parameters.  The mpxio framework uses the buf structure
19917c478bd9Sstevel@tonic-gate  *		contents to maintain per path statistics (total I/O size /
19927c478bd9Sstevel@tonic-gate  *		count pending).  If more than one online paths are available to
19937c478bd9Sstevel@tonic-gate  *		select, the framework automatically selects a suitable path
19947c478bd9Sstevel@tonic-gate  *		for routing I/O request. If a failover operation is active for
19957c478bd9Sstevel@tonic-gate  *		this client device the call shall be failed with MDI_BUSY error
19967c478bd9Sstevel@tonic-gate  *		code.
19977c478bd9Sstevel@tonic-gate  *
19987c478bd9Sstevel@tonic-gate  *		By default this function returns a suitable path in online
19997c478bd9Sstevel@tonic-gate  *		state based on the current load balancing policy.  Currently
20007c478bd9Sstevel@tonic-gate  *		we support LOAD_BALANCE_NONE (Previously selected online path
20017c478bd9Sstevel@tonic-gate  *		will continue to be used till the path is usable) and
20027c478bd9Sstevel@tonic-gate  *		LOAD_BALANCE_RR (Online paths will be selected in a round
 *		robin fashion), LOAD_BALANCE_LBA (Online paths will be selected
 *		based on the logical block).  The load balancing policy is
 *		configured through the vHCI driver's configuration file
 *		(driver.conf).
20067c478bd9Sstevel@tonic-gate  *
20077c478bd9Sstevel@tonic-gate  *		vHCI drivers may override this default behavior by specifying
 *		appropriate flags.  The meaning of the fourth argument depends
2009602ca9eaScth  *		on the flags specified. If MDI_SELECT_PATH_INSTANCE is set
2010602ca9eaScth  *		then the argument is the "path instance" of the path to select.
2011602ca9eaScth  *		If MDI_SELECT_PATH_INSTANCE is not set then the argument is
2012602ca9eaScth  *		"start_pip". A non NULL "start_pip" is the starting point to
2013602ca9eaScth  *		walk and find the next appropriate path.  The following values
2014602ca9eaScth  *		are currently defined: MDI_SELECT_ONLINE_PATH (to select an
2015602ca9eaScth  *		ONLINE path) and/or MDI_SELECT_STANDBY_PATH (to select an
2016602ca9eaScth  *		STANDBY path).
20177c478bd9Sstevel@tonic-gate  *
20187c478bd9Sstevel@tonic-gate  *		The non-standard behavior is used by the scsi_vhci driver,
20197c478bd9Sstevel@tonic-gate  *		whenever it has to use a STANDBY/FAULTED path.  Eg. during
20207c478bd9Sstevel@tonic-gate  *		attach of client devices (to avoid an unnecessary failover
20217c478bd9Sstevel@tonic-gate  *		when the STANDBY path comes up first), during failover
20227c478bd9Sstevel@tonic-gate  *		(to activate a STANDBY path as ONLINE).
20237c478bd9Sstevel@tonic-gate  *
 *		The selected path is returned in a mdi_hold_path() state
20255e3986cbScth  *		(pi_ref_cnt). Caller should release the hold by calling
20265e3986cbScth  *		mdi_rele_path().
20277c478bd9Sstevel@tonic-gate  *
20287c478bd9Sstevel@tonic-gate  * Return Values:
20297c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS	- Completed successfully
20307c478bd9Sstevel@tonic-gate  *		MDI_BUSY 	- Client device is busy failing over
20317c478bd9Sstevel@tonic-gate  *		MDI_NOPATH	- Client device is online, but no valid path are
20327c478bd9Sstevel@tonic-gate  *				  available to access this client device
20337c478bd9Sstevel@tonic-gate  *		MDI_FAILURE	- Invalid client device or state
20347c478bd9Sstevel@tonic-gate  *		MDI_DEVI_ONLINING
20357c478bd9Sstevel@tonic-gate  *				- Client device (struct dev_info state) is in
20367c478bd9Sstevel@tonic-gate  *				  onlining state.
20377c478bd9Sstevel@tonic-gate  */
20387c478bd9Sstevel@tonic-gate 
20397c478bd9Sstevel@tonic-gate /*ARGSUSED*/
20407c478bd9Sstevel@tonic-gate int
20417c478bd9Sstevel@tonic-gate mdi_select_path(dev_info_t *cdip, struct buf *bp, int flags,
2042602ca9eaScth     void *arg, mdi_pathinfo_t **ret_pip)
20437c478bd9Sstevel@tonic-gate {
20447c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
20457c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*pip;
20467c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*next;
20477c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*head;
20487c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*start;
20497c478bd9Sstevel@tonic-gate 	client_lb_t	lbp;	/* load balancing policy */
20507c478bd9Sstevel@tonic-gate 	int		sb = 1;	/* standard behavior */
20517c478bd9Sstevel@tonic-gate 	int		preferred = 1;	/* preferred path */
20527c478bd9Sstevel@tonic-gate 	int		cond, cont = 1;
20537c478bd9Sstevel@tonic-gate 	int		retry = 0;
2054602ca9eaScth 	mdi_pathinfo_t	*start_pip;	/* request starting pathinfo */
2055602ca9eaScth 	int		path_instance;	/* request specific path instance */
2056602ca9eaScth 
2057602ca9eaScth 	/* determine type of arg based on flags */
2058602ca9eaScth 	if (flags & MDI_SELECT_PATH_INSTANCE) {
2059602ca9eaScth 		path_instance = (int)(intptr_t)arg;
2060602ca9eaScth 		start_pip = NULL;
2061602ca9eaScth 	} else {
2062602ca9eaScth 		path_instance = 0;
2063602ca9eaScth 		start_pip = (mdi_pathinfo_t *)arg;
2064602ca9eaScth 	}
20657c478bd9Sstevel@tonic-gate 
20667c478bd9Sstevel@tonic-gate 	if (flags != 0) {
20677c478bd9Sstevel@tonic-gate 		/*
20687c478bd9Sstevel@tonic-gate 		 * disable default behavior
20697c478bd9Sstevel@tonic-gate 		 */
20707c478bd9Sstevel@tonic-gate 		sb = 0;
20717c478bd9Sstevel@tonic-gate 	}
20727c478bd9Sstevel@tonic-gate 
20737c478bd9Sstevel@tonic-gate 	*ret_pip = NULL;
20747c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(cdip);
20757c478bd9Sstevel@tonic-gate 	if (ct == NULL) {
20767c478bd9Sstevel@tonic-gate 		/* mdi extensions are NULL, Nothing more to do */
20777c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
20787c478bd9Sstevel@tonic-gate 	}
20797c478bd9Sstevel@tonic-gate 
20807c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
20817c478bd9Sstevel@tonic-gate 
20827c478bd9Sstevel@tonic-gate 	if (sb) {
20837c478bd9Sstevel@tonic-gate 		if (MDI_CLIENT_IS_FAILED(ct)) {
20847c478bd9Sstevel@tonic-gate 			/*
20857c478bd9Sstevel@tonic-gate 			 * Client is not ready to accept any I/O requests.
20867c478bd9Sstevel@tonic-gate 			 * Fail this request.
20877c478bd9Sstevel@tonic-gate 			 */
20884c06356bSdh142964 			MDI_DEBUG(2, (MDI_NOTE, cdip,
20894c06356bSdh142964 			    "client state offline ct = %p", (void *)ct));
20907c478bd9Sstevel@tonic-gate 			MDI_CLIENT_UNLOCK(ct);
20917c478bd9Sstevel@tonic-gate 			return (MDI_FAILURE);
20927c478bd9Sstevel@tonic-gate 		}
20937c478bd9Sstevel@tonic-gate 
20947c478bd9Sstevel@tonic-gate 		if (MDI_CLIENT_IS_FAILOVER_IN_PROGRESS(ct)) {
20957c478bd9Sstevel@tonic-gate 			/*
20967c478bd9Sstevel@tonic-gate 			 * Check for Failover is in progress. If so tell the
20977c478bd9Sstevel@tonic-gate 			 * caller that this device is busy.
20987c478bd9Sstevel@tonic-gate 			 */
20994c06356bSdh142964 			MDI_DEBUG(2, (MDI_NOTE, cdip,
21004c06356bSdh142964 			    "client failover in progress ct = %p",
21015e3986cbScth 			    (void *)ct));
21027c478bd9Sstevel@tonic-gate 			MDI_CLIENT_UNLOCK(ct);
21037c478bd9Sstevel@tonic-gate 			return (MDI_BUSY);
21047c478bd9Sstevel@tonic-gate 		}
21057c478bd9Sstevel@tonic-gate 
21067c478bd9Sstevel@tonic-gate 		/*
21077c478bd9Sstevel@tonic-gate 		 * Check to see whether the client device is attached.
21087c478bd9Sstevel@tonic-gate 		 * If not so, let the vHCI driver manually select a path
21097c478bd9Sstevel@tonic-gate 		 * (standby) and let the probe/attach process to continue.
21107c478bd9Sstevel@tonic-gate 		 */
2111737d277aScth 		if (MDI_CLIENT_IS_DETACHED(ct) || !i_ddi_devi_attached(cdip)) {
21124c06356bSdh142964 			MDI_DEBUG(4, (MDI_NOTE, cdip,
21134c06356bSdh142964 			    "devi is onlining ct = %p", (void *)ct));
21147c478bd9Sstevel@tonic-gate 			MDI_CLIENT_UNLOCK(ct);
21157c478bd9Sstevel@tonic-gate 			return (MDI_DEVI_ONLINING);
21167c478bd9Sstevel@tonic-gate 		}
21177c478bd9Sstevel@tonic-gate 	}
21187c478bd9Sstevel@tonic-gate 
21197c478bd9Sstevel@tonic-gate 	/*
21207c478bd9Sstevel@tonic-gate 	 * Cache in the client list head.  If head of the list is NULL
21217c478bd9Sstevel@tonic-gate 	 * return MDI_NOPATH
21227c478bd9Sstevel@tonic-gate 	 */
21237c478bd9Sstevel@tonic-gate 	head = ct->ct_path_head;
21247c478bd9Sstevel@tonic-gate 	if (head == NULL) {
21257c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
21267c478bd9Sstevel@tonic-gate 		return (MDI_NOPATH);
21277c478bd9Sstevel@tonic-gate 	}
21287c478bd9Sstevel@tonic-gate 
2129602ca9eaScth 	/* Caller is specifying a specific pathinfo path by path_instance */
2130602ca9eaScth 	if (path_instance) {
2131602ca9eaScth 		/* search for pathinfo with correct path_instance */
2132602ca9eaScth 		for (pip = head;
2133602ca9eaScth 		    pip && (mdi_pi_get_path_instance(pip) != path_instance);
2134602ca9eaScth 		    pip = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link)
2135602ca9eaScth 			;
2136602ca9eaScth 
2137ab412e72SSrikanth, Ramana 		/* If path can't be selected then MDI_NOPATH is returned. */
2138602ca9eaScth 		if (pip == NULL) {
2139602ca9eaScth 			MDI_CLIENT_UNLOCK(ct);
2140ab412e72SSrikanth, Ramana 			return (MDI_NOPATH);
2141602ca9eaScth 		}
2142602ca9eaScth 
21434c06356bSdh142964 		/*
21444c06356bSdh142964 		 * Verify state of path. When asked to select a specific
21454c06356bSdh142964 		 * path_instance, we select the requested path in any
21464c06356bSdh142964 		 * state (ONLINE, OFFLINE, STANDBY, FAULT) other than INIT.
21474c06356bSdh142964 		 * We don't however select paths where the pHCI has detached.
21484c06356bSdh142964 		 * NOTE: last pathinfo node of an opened client device may
21494c06356bSdh142964 		 * exist in an OFFLINE state after the pHCI associated with
21504c06356bSdh142964 		 * that path has detached (but pi_phci will be NULL if that
21514c06356bSdh142964 		 * has occurred).
21524c06356bSdh142964 		 */
2153602ca9eaScth 		MDI_PI_LOCK(pip);
21544c06356bSdh142964 		if ((MDI_PI(pip)->pi_state == MDI_PATHINFO_STATE_INIT) ||
21554c06356bSdh142964 		    (MDI_PI(pip)->pi_phci == NULL)) {
2156602ca9eaScth 			MDI_PI_UNLOCK(pip);
2157602ca9eaScth 			MDI_CLIENT_UNLOCK(ct);
2158602ca9eaScth 			return (MDI_FAILURE);
2159602ca9eaScth 		}
2160602ca9eaScth 
2161ab412e72SSrikanth, Ramana 		/* Return MDI_BUSY if we have a transient condition */
2162ab412e72SSrikanth, Ramana 		if (MDI_PI_IS_TRANSIENT(pip)) {
2163ab412e72SSrikanth, Ramana 			MDI_PI_UNLOCK(pip);
2164ab412e72SSrikanth, Ramana 			MDI_CLIENT_UNLOCK(ct);
2165ab412e72SSrikanth, Ramana 			return (MDI_BUSY);
2166ab412e72SSrikanth, Ramana 		}
2167ab412e72SSrikanth, Ramana 
2168602ca9eaScth 		/*
2169602ca9eaScth 		 * Return the path in hold state. Caller should release the
2170602ca9eaScth 		 * lock by calling mdi_rele_path()
2171602ca9eaScth 		 */
2172602ca9eaScth 		MDI_PI_HOLD(pip);
2173602ca9eaScth 		MDI_PI_UNLOCK(pip);
2174602ca9eaScth 		*ret_pip = pip;
2175602ca9eaScth 		MDI_CLIENT_UNLOCK(ct);
2176602ca9eaScth 		return (MDI_SUCCESS);
2177602ca9eaScth 	}
2178602ca9eaScth 
21797c478bd9Sstevel@tonic-gate 	/*
21807c478bd9Sstevel@tonic-gate 	 * for non default behavior, bypass current
21817c478bd9Sstevel@tonic-gate 	 * load balancing policy and always use LOAD_BALANCE_RR
21827c478bd9Sstevel@tonic-gate 	 * except that the start point will be adjusted based
21837c478bd9Sstevel@tonic-gate 	 * on the provided start_pip
21847c478bd9Sstevel@tonic-gate 	 */
21857c478bd9Sstevel@tonic-gate 	lbp = sb ? ct->ct_lb : LOAD_BALANCE_RR;
21867c478bd9Sstevel@tonic-gate 
21877c478bd9Sstevel@tonic-gate 	switch (lbp) {
21887c478bd9Sstevel@tonic-gate 	case LOAD_BALANCE_NONE:
21897c478bd9Sstevel@tonic-gate 		/*
21907c478bd9Sstevel@tonic-gate 		 * Load balancing is None  or Alternate path mode
21917c478bd9Sstevel@tonic-gate 		 * Start looking for a online mdi_pathinfo node starting from
21927c478bd9Sstevel@tonic-gate 		 * last known selected path
21937c478bd9Sstevel@tonic-gate 		 */
21947c478bd9Sstevel@tonic-gate 		preferred = 1;
21957c478bd9Sstevel@tonic-gate 		pip = (mdi_pathinfo_t *)ct->ct_path_last;
21967c478bd9Sstevel@tonic-gate 		if (pip == NULL) {
21977c478bd9Sstevel@tonic-gate 			pip = head;
21987c478bd9Sstevel@tonic-gate 		}
21997c478bd9Sstevel@tonic-gate 		start = pip;
22007c478bd9Sstevel@tonic-gate 		do {
22017c478bd9Sstevel@tonic-gate 			MDI_PI_LOCK(pip);
22027c478bd9Sstevel@tonic-gate 			/*
22037c478bd9Sstevel@tonic-gate 			 * No need to explicitly check if the path is disabled.
22047c478bd9Sstevel@tonic-gate 			 * Since we are checking for state == ONLINE and the
220555e592a2SRandall Ralphs 			 * same variable is used for DISABLE/ENABLE information.
22067c478bd9Sstevel@tonic-gate 			 */
2207ee28b439Scm136836 			if ((MDI_PI(pip)->pi_state  ==
2208ee28b439Scm136836 				MDI_PATHINFO_STATE_ONLINE) &&
22097c478bd9Sstevel@tonic-gate 				preferred == MDI_PI(pip)->pi_preferred) {
22107c478bd9Sstevel@tonic-gate 				/*
22117c478bd9Sstevel@tonic-gate 				 * Return the path in hold state. Caller should
22127c478bd9Sstevel@tonic-gate 				 * release the lock by calling mdi_rele_path()
22137c478bd9Sstevel@tonic-gate 				 */
22147c478bd9Sstevel@tonic-gate 				MDI_PI_HOLD(pip);
22157c478bd9Sstevel@tonic-gate 				MDI_PI_UNLOCK(pip);
22167c478bd9Sstevel@tonic-gate 				ct->ct_path_last = pip;
22177c478bd9Sstevel@tonic-gate 				*ret_pip = pip;
22187c478bd9Sstevel@tonic-gate 				MDI_CLIENT_UNLOCK(ct);
22197c478bd9Sstevel@tonic-gate 				return (MDI_SUCCESS);
22207c478bd9Sstevel@tonic-gate 			}
22217c478bd9Sstevel@tonic-gate 
22227c478bd9Sstevel@tonic-gate 			/*
22237c478bd9Sstevel@tonic-gate 			 * Path is busy.
22247c478bd9Sstevel@tonic-gate 			 */
22257c478bd9Sstevel@tonic-gate 			if (MDI_PI_IS_DRV_DISABLE_TRANSIENT(pip) ||
22267c478bd9Sstevel@tonic-gate 			    MDI_PI_IS_TRANSIENT(pip))
22277c478bd9Sstevel@tonic-gate 				retry = 1;
22287c478bd9Sstevel@tonic-gate 			/*
22297c478bd9Sstevel@tonic-gate 			 * Keep looking for a next available online path
22307c478bd9Sstevel@tonic-gate 			 */
22317c478bd9Sstevel@tonic-gate 			next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link;
22327c478bd9Sstevel@tonic-gate 			if (next == NULL) {
22337c478bd9Sstevel@tonic-gate 				next = head;
22347c478bd9Sstevel@tonic-gate 			}
22357c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
22367c478bd9Sstevel@tonic-gate 			pip = next;
22377c478bd9Sstevel@tonic-gate 			if (start == pip && preferred) {
22387c478bd9Sstevel@tonic-gate 				preferred = 0;
22397c478bd9Sstevel@tonic-gate 			} else if (start == pip && !preferred) {
22407c478bd9Sstevel@tonic-gate 				cont = 0;
22417c478bd9Sstevel@tonic-gate 			}
22427c478bd9Sstevel@tonic-gate 		} while (cont);
22437c478bd9Sstevel@tonic-gate 		break;
22447c478bd9Sstevel@tonic-gate 
22457c478bd9Sstevel@tonic-gate 	case LOAD_BALANCE_LBA:
22467c478bd9Sstevel@tonic-gate 		/*
22477c478bd9Sstevel@tonic-gate 		 * Make sure we are looking
22487c478bd9Sstevel@tonic-gate 		 * for an online path. Otherwise, if it is for a STANDBY
22497c478bd9Sstevel@tonic-gate 		 * path request, it will go through and fetch an ONLINE
22507c478bd9Sstevel@tonic-gate 		 * path which is not desirable.
22517c478bd9Sstevel@tonic-gate 		 */
22527c478bd9Sstevel@tonic-gate 		if ((ct->ct_lb_args != NULL) &&
22537c478bd9Sstevel@tonic-gate 			    (ct->ct_lb_args->region_size) && bp &&
22547c478bd9Sstevel@tonic-gate 				(sb || (flags == MDI_SELECT_ONLINE_PATH))) {
22557c478bd9Sstevel@tonic-gate 			if (i_mdi_lba_lb(ct, ret_pip, bp)
22567c478bd9Sstevel@tonic-gate 				    == MDI_SUCCESS) {
22577c478bd9Sstevel@tonic-gate 				MDI_CLIENT_UNLOCK(ct);
22587c478bd9Sstevel@tonic-gate 				return (MDI_SUCCESS);
22597c478bd9Sstevel@tonic-gate 			}
22607c478bd9Sstevel@tonic-gate 		}
22617c478bd9Sstevel@tonic-gate 		/* FALLTHROUGH */
22627c478bd9Sstevel@tonic-gate 	case LOAD_BALANCE_RR:
22637c478bd9Sstevel@tonic-gate 		/*
22647c478bd9Sstevel@tonic-gate 		 * Load balancing is Round Robin. Start looking for a online
22657c478bd9Sstevel@tonic-gate 		 * mdi_pathinfo node starting from last known selected path
22667c478bd9Sstevel@tonic-gate 		 * as the start point.  If override flags are specified,
22677c478bd9Sstevel@tonic-gate 		 * process accordingly.
22687c478bd9Sstevel@tonic-gate 		 * If the search is already in effect(start_pip not null),
22697c478bd9Sstevel@tonic-gate 		 * then lets just use the same path preference to continue the
22707c478bd9Sstevel@tonic-gate 		 * traversal.
22717c478bd9Sstevel@tonic-gate 		 */
22727c478bd9Sstevel@tonic-gate 
22737c478bd9Sstevel@tonic-gate 		if (start_pip != NULL) {
22747c478bd9Sstevel@tonic-gate 			preferred = MDI_PI(start_pip)->pi_preferred;
22757c478bd9Sstevel@tonic-gate 		} else {
22767c478bd9Sstevel@tonic-gate 			preferred = 1;
22777c478bd9Sstevel@tonic-gate 		}
22787c478bd9Sstevel@tonic-gate 
22797c478bd9Sstevel@tonic-gate 		start = sb ? (mdi_pathinfo_t *)ct->ct_path_last : start_pip;
22807c478bd9Sstevel@tonic-gate 		if (start == NULL) {
22817c478bd9Sstevel@tonic-gate 			pip = head;
22827c478bd9Sstevel@tonic-gate 		} else {
22837c478bd9Sstevel@tonic-gate 			pip = (mdi_pathinfo_t *)MDI_PI(start)->pi_client_link;
22847c478bd9Sstevel@tonic-gate 			if (pip == NULL) {
2285b08fdaf7SSheshadri Vasudevan 				if ( flags & MDI_SELECT_NO_PREFERRED) {
2286b08fdaf7SSheshadri Vasudevan 					/*
2287b08fdaf7SSheshadri Vasudevan 					 * Return since we hit the end of list
2288b08fdaf7SSheshadri Vasudevan 					 */
2289b08fdaf7SSheshadri Vasudevan 					MDI_CLIENT_UNLOCK(ct);
2290b08fdaf7SSheshadri Vasudevan 					return (MDI_NOPATH);
2291b08fdaf7SSheshadri Vasudevan 				}
2292b08fdaf7SSheshadri Vasudevan 
22937c478bd9Sstevel@tonic-gate 				if (!sb) {
22947c478bd9Sstevel@tonic-gate 					if (preferred == 0) {
22957c478bd9Sstevel@tonic-gate 						/*
22967c478bd9Sstevel@tonic-gate 						 * Looks like we have completed
22977c478bd9Sstevel@tonic-gate 						 * the traversal as preferred
22987c478bd9Sstevel@tonic-gate 						 * value is 0. Time to bail out.
22997c478bd9Sstevel@tonic-gate 						 */
23007c478bd9Sstevel@tonic-gate 						*ret_pip = NULL;
23017c478bd9Sstevel@tonic-gate 						MDI_CLIENT_UNLOCK(ct);
23027c478bd9Sstevel@tonic-gate 						return (MDI_NOPATH);
23037c478bd9Sstevel@tonic-gate 					} else {
23047c478bd9Sstevel@tonic-gate 						/*
23057c478bd9Sstevel@tonic-gate 						 * Looks like we reached the
23067c478bd9Sstevel@tonic-gate 						 * end of the list. Lets enable
23077c478bd9Sstevel@tonic-gate 						 * traversal of non preferred
23087c478bd9Sstevel@tonic-gate 						 * paths.
23097c478bd9Sstevel@tonic-gate 						 */
23107c478bd9Sstevel@tonic-gate 						preferred = 0;
23117c478bd9Sstevel@tonic-gate 					}
23127c478bd9Sstevel@tonic-gate 				}
23137c478bd9Sstevel@tonic-gate 				pip = head;
23147c478bd9Sstevel@tonic-gate 			}
23157c478bd9Sstevel@tonic-gate 		}
23167c478bd9Sstevel@tonic-gate 		start = pip;
23177c478bd9Sstevel@tonic-gate 		do {
23187c478bd9Sstevel@tonic-gate 			MDI_PI_LOCK(pip);
23197c478bd9Sstevel@tonic-gate 			if (sb) {
23207c478bd9Sstevel@tonic-gate 				cond = ((MDI_PI(pip)->pi_state ==
23217c478bd9Sstevel@tonic-gate 				    MDI_PATHINFO_STATE_ONLINE &&
23227c478bd9Sstevel@tonic-gate 					MDI_PI(pip)->pi_preferred ==
23237c478bd9Sstevel@tonic-gate 						preferred) ? 1 : 0);
23247c478bd9Sstevel@tonic-gate 			} else {
23257c478bd9Sstevel@tonic-gate 				if (flags == MDI_SELECT_ONLINE_PATH) {
23267c478bd9Sstevel@tonic-gate 					cond = ((MDI_PI(pip)->pi_state ==
23277c478bd9Sstevel@tonic-gate 					    MDI_PATHINFO_STATE_ONLINE &&
23287c478bd9Sstevel@tonic-gate 						MDI_PI(pip)->pi_preferred ==
23297c478bd9Sstevel@tonic-gate 						preferred) ? 1 : 0);
23307c478bd9Sstevel@tonic-gate 				} else if (flags == MDI_SELECT_STANDBY_PATH) {
23317c478bd9Sstevel@tonic-gate 					cond = ((MDI_PI(pip)->pi_state ==
23327c478bd9Sstevel@tonic-gate 					    MDI_PATHINFO_STATE_STANDBY &&
23337c478bd9Sstevel@tonic-gate 						MDI_PI(pip)->pi_preferred ==
23347c478bd9Sstevel@tonic-gate 						preferred) ? 1 : 0);
23357c478bd9Sstevel@tonic-gate 				} else if (flags == (MDI_SELECT_ONLINE_PATH |
23367c478bd9Sstevel@tonic-gate 				    MDI_SELECT_STANDBY_PATH)) {
23377c478bd9Sstevel@tonic-gate 					cond = (((MDI_PI(pip)->pi_state ==
23387c478bd9Sstevel@tonic-gate 					    MDI_PATHINFO_STATE_ONLINE ||
23397c478bd9Sstevel@tonic-gate 					    (MDI_PI(pip)->pi_state ==
23407c478bd9Sstevel@tonic-gate 					    MDI_PATHINFO_STATE_STANDBY)) &&
23417c478bd9Sstevel@tonic-gate 						MDI_PI(pip)->pi_preferred ==
23427c478bd9Sstevel@tonic-gate 						preferred) ? 1 : 0);
2343ee28b439Scm136836 				} else if (flags ==
2344ee28b439Scm136836 					(MDI_SELECT_STANDBY_PATH |
2345ee28b439Scm136836 					MDI_SELECT_ONLINE_PATH |
2346ee28b439Scm136836 					MDI_SELECT_USER_DISABLE_PATH)) {
2347ee28b439Scm136836 					cond = (((MDI_PI(pip)->pi_state ==
2348ee28b439Scm136836 					    MDI_PATHINFO_STATE_ONLINE ||
2349ee28b439Scm136836 					    (MDI_PI(pip)->pi_state ==
2350ee28b439Scm136836 					    MDI_PATHINFO_STATE_STANDBY) ||
2351ee28b439Scm136836 						(MDI_PI(pip)->pi_state ==
2352ee28b439Scm136836 					    (MDI_PATHINFO_STATE_ONLINE|
2353ee28b439Scm136836 					    MDI_PATHINFO_STATE_USER_DISABLE)) ||
2354ee28b439Scm136836 						(MDI_PI(pip)->pi_state ==
2355ee28b439Scm136836 					    (MDI_PATHINFO_STATE_STANDBY |
2356ee28b439Scm136836 					    MDI_PATHINFO_STATE_USER_DISABLE)))&&
2357ee28b439Scm136836 						MDI_PI(pip)->pi_preferred ==
2358ee28b439Scm136836 						preferred) ? 1 : 0);
2359b08fdaf7SSheshadri Vasudevan 				} else if (flags ==
2360b08fdaf7SSheshadri Vasudevan 				    (MDI_SELECT_STANDBY_PATH |
2361b08fdaf7SSheshadri Vasudevan 				    MDI_SELECT_ONLINE_PATH |
2362b08fdaf7SSheshadri Vasudevan 				    MDI_SELECT_NO_PREFERRED)) {
2363b08fdaf7SSheshadri Vasudevan 					cond = (((MDI_PI(pip)->pi_state ==
2364b08fdaf7SSheshadri Vasudevan 					    MDI_PATHINFO_STATE_ONLINE) ||
2365b08fdaf7SSheshadri Vasudevan 					    (MDI_PI(pip)->pi_state ==
2366b08fdaf7SSheshadri Vasudevan 					    MDI_PATHINFO_STATE_STANDBY))
2367b08fdaf7SSheshadri Vasudevan 					    ? 1 : 0);
23687c478bd9Sstevel@tonic-gate 				} else {
23697c478bd9Sstevel@tonic-gate 					cond = 0;
23707c478bd9Sstevel@tonic-gate 				}
23717c478bd9Sstevel@tonic-gate 			}
23727c478bd9Sstevel@tonic-gate 			/*
23737c478bd9Sstevel@tonic-gate 			 * No need to explicitly check if the path is disabled.
23747c478bd9Sstevel@tonic-gate 			 * Since we are checking for state == ONLINE and the
237555e592a2SRandall Ralphs 			 * same variable is used for DISABLE/ENABLE information.
23767c478bd9Sstevel@tonic-gate 			 */
23777c478bd9Sstevel@tonic-gate 			if (cond) {
23787c478bd9Sstevel@tonic-gate 				/*
23797c478bd9Sstevel@tonic-gate 				 * Return the path in hold state. Caller should
23807c478bd9Sstevel@tonic-gate 				 * release the lock by calling mdi_rele_path()
23817c478bd9Sstevel@tonic-gate 				 */
23827c478bd9Sstevel@tonic-gate 				MDI_PI_HOLD(pip);
23837c478bd9Sstevel@tonic-gate 				MDI_PI_UNLOCK(pip);
23847c478bd9Sstevel@tonic-gate 				if (sb)
23857c478bd9Sstevel@tonic-gate 					ct->ct_path_last = pip;
23867c478bd9Sstevel@tonic-gate 				*ret_pip = pip;
23877c478bd9Sstevel@tonic-gate 				MDI_CLIENT_UNLOCK(ct);
23887c478bd9Sstevel@tonic-gate 				return (MDI_SUCCESS);
23897c478bd9Sstevel@tonic-gate 			}
23907c478bd9Sstevel@tonic-gate 			/*
23917c478bd9Sstevel@tonic-gate 			 * Path is busy.
23927c478bd9Sstevel@tonic-gate 			 */
23937c478bd9Sstevel@tonic-gate 			if (MDI_PI_IS_DRV_DISABLE_TRANSIENT(pip) ||
23947c478bd9Sstevel@tonic-gate 			    MDI_PI_IS_TRANSIENT(pip))
23957c478bd9Sstevel@tonic-gate 				retry = 1;
23967c478bd9Sstevel@tonic-gate 
23977c478bd9Sstevel@tonic-gate 			/*
23987c478bd9Sstevel@tonic-gate 			 * Keep looking for a next available online path
23997c478bd9Sstevel@tonic-gate 			 */
24007c478bd9Sstevel@tonic-gate do_again:
24017c478bd9Sstevel@tonic-gate 			next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link;
24027c478bd9Sstevel@tonic-gate 			if (next == NULL) {
2403b08fdaf7SSheshadri Vasudevan 				if ( flags & MDI_SELECT_NO_PREFERRED) {
2404b08fdaf7SSheshadri Vasudevan 					/*
2405b08fdaf7SSheshadri Vasudevan 					 * Bail out since we hit the end of list
2406b08fdaf7SSheshadri Vasudevan 					 */
2407b08fdaf7SSheshadri Vasudevan 					MDI_PI_UNLOCK(pip);
2408b08fdaf7SSheshadri Vasudevan 					break;
2409b08fdaf7SSheshadri Vasudevan 				}
2410b08fdaf7SSheshadri Vasudevan 
24117c478bd9Sstevel@tonic-gate 				if (!sb) {
24127c478bd9Sstevel@tonic-gate 					if (preferred == 1) {
24137c478bd9Sstevel@tonic-gate 						/*
24147c478bd9Sstevel@tonic-gate 						 * Looks like we reached the
24157c478bd9Sstevel@tonic-gate 						 * end of the list. Lets enable
24167c478bd9Sstevel@tonic-gate 						 * traversal of non preferred
24177c478bd9Sstevel@tonic-gate 						 * paths.
24187c478bd9Sstevel@tonic-gate 						 */
24197c478bd9Sstevel@tonic-gate 						preferred = 0;
24207c478bd9Sstevel@tonic-gate 						next = head;
24217c478bd9Sstevel@tonic-gate 					} else {
24227c478bd9Sstevel@tonic-gate 						/*
24237c478bd9Sstevel@tonic-gate 						 * We have done both the passes
24247c478bd9Sstevel@tonic-gate 						 * Preferred as well as for
24257c478bd9Sstevel@tonic-gate 						 * Non-preferred. Bail out now.
24267c478bd9Sstevel@tonic-gate 						 */
24277c478bd9Sstevel@tonic-gate 						cont = 0;
24287c478bd9Sstevel@tonic-gate 					}
24297c478bd9Sstevel@tonic-gate 				} else {
24307c478bd9Sstevel@tonic-gate 					/*
24317c478bd9Sstevel@tonic-gate 					 * Standard behavior case.
24327c478bd9Sstevel@tonic-gate 					 */
24337c478bd9Sstevel@tonic-gate 					next = head;
24347c478bd9Sstevel@tonic-gate 				}
24357c478bd9Sstevel@tonic-gate 			}
24367c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
24377c478bd9Sstevel@tonic-gate 			if (cont == 0) {
24387c478bd9Sstevel@tonic-gate 				break;
24397c478bd9Sstevel@tonic-gate 			}
24407c478bd9Sstevel@tonic-gate 			pip = next;
24417c478bd9Sstevel@tonic-gate 
24427c478bd9Sstevel@tonic-gate 			if (!sb) {
24437c478bd9Sstevel@tonic-gate 				/*
24447c478bd9Sstevel@tonic-gate 				 * We need to handle the selection of
24457c478bd9Sstevel@tonic-gate 				 * non-preferred path in the following
24467c478bd9Sstevel@tonic-gate 				 * case:
24477c478bd9Sstevel@tonic-gate 				 *
24487c478bd9Sstevel@tonic-gate 				 * +------+   +------+   +------+   +-----+
24497c478bd9Sstevel@tonic-gate 				 * | A : 1| - | B : 1| - | C : 0| - |NULL |
24507c478bd9Sstevel@tonic-gate 				 * +------+   +------+   +------+   +-----+
24517c478bd9Sstevel@tonic-gate 				 *
24527c478bd9Sstevel@tonic-gate 				 * If we start the search with B, we need to
24537c478bd9Sstevel@tonic-gate 				 * skip beyond B to pick C which is non -
24547c478bd9Sstevel@tonic-gate 				 * preferred in the second pass. The following
24557c478bd9Sstevel@tonic-gate 				 * test, if true, will allow us to skip over
24567c478bd9Sstevel@tonic-gate 				 * the 'start'(B in the example) to select
24577c478bd9Sstevel@tonic-gate 				 * other non preferred elements.
24587c478bd9Sstevel@tonic-gate 				 */
24597c478bd9Sstevel@tonic-gate 				if ((start_pip != NULL) && (start_pip == pip) &&
24607c478bd9Sstevel@tonic-gate 				    (MDI_PI(start_pip)->pi_preferred
24617c478bd9Sstevel@tonic-gate 				    != preferred)) {
24627c478bd9Sstevel@tonic-gate 					/*
24637c478bd9Sstevel@tonic-gate 					 * try again after going past the start
24647c478bd9Sstevel@tonic-gate 					 * pip
24657c478bd9Sstevel@tonic-gate 					 */
24667c478bd9Sstevel@tonic-gate 					MDI_PI_LOCK(pip);
24677c478bd9Sstevel@tonic-gate 					goto do_again;
24687c478bd9Sstevel@tonic-gate 				}
24697c478bd9Sstevel@tonic-gate 			} else {
24707c478bd9Sstevel@tonic-gate 				/*
24717c478bd9Sstevel@tonic-gate 				 * Standard behavior case
24727c478bd9Sstevel@tonic-gate 				 */
24737c478bd9Sstevel@tonic-gate 				if (start == pip && preferred) {
24747c478bd9Sstevel@tonic-gate 					/* look for nonpreferred paths */
24757c478bd9Sstevel@tonic-gate 					preferred = 0;
24767c478bd9Sstevel@tonic-gate 				} else if (start == pip && !preferred) {
24777c478bd9Sstevel@tonic-gate 					/*
24787c478bd9Sstevel@tonic-gate 					 * Exit condition
24797c478bd9Sstevel@tonic-gate 					 */
24807c478bd9Sstevel@tonic-gate 					cont = 0;
24817c478bd9Sstevel@tonic-gate 				}
24827c478bd9Sstevel@tonic-gate 			}
24837c478bd9Sstevel@tonic-gate 		} while (cont);
24847c478bd9Sstevel@tonic-gate 		break;
24857c478bd9Sstevel@tonic-gate 	}
24867c478bd9Sstevel@tonic-gate 
24877c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
24887c478bd9Sstevel@tonic-gate 	if (retry == 1) {
24897c478bd9Sstevel@tonic-gate 		return (MDI_BUSY);
24907c478bd9Sstevel@tonic-gate 	} else {
24917c478bd9Sstevel@tonic-gate 		return (MDI_NOPATH);
24927c478bd9Sstevel@tonic-gate 	}
24937c478bd9Sstevel@tonic-gate }
24947c478bd9Sstevel@tonic-gate 
24957c478bd9Sstevel@tonic-gate /*
24967c478bd9Sstevel@tonic-gate  * For a client, return the next available path to any phci
24977c478bd9Sstevel@tonic-gate  *
24987c478bd9Sstevel@tonic-gate  * Note:
24997c478bd9Sstevel@tonic-gate  *		Caller should hold the branch's devinfo node to get a consistent
25007c478bd9Sstevel@tonic-gate  *		snap shot of the mdi_pathinfo nodes.
25017c478bd9Sstevel@tonic-gate  *
25027c478bd9Sstevel@tonic-gate  *		Please note that even the list is stable the mdi_pathinfo
25037c478bd9Sstevel@tonic-gate  *		node state and properties are volatile.  The caller should lock
25047c478bd9Sstevel@tonic-gate  *		and unlock the nodes by calling mdi_pi_lock() and
25057c478bd9Sstevel@tonic-gate  *		mdi_pi_unlock() functions to get a stable properties.
25067c478bd9Sstevel@tonic-gate  *
25077c478bd9Sstevel@tonic-gate  *		If there is a need to use the nodes beyond the hold of the
25087c478bd9Sstevel@tonic-gate  *		devinfo node period (For ex. I/O), then mdi_pathinfo node
25097c478bd9Sstevel@tonic-gate  *		need to be held against unexpected removal by calling
25107c478bd9Sstevel@tonic-gate  *		mdi_hold_path() and should be released by calling
25117c478bd9Sstevel@tonic-gate  *		mdi_rele_path() on completion.
25127c478bd9Sstevel@tonic-gate  */
25137c478bd9Sstevel@tonic-gate mdi_pathinfo_t *
25147c478bd9Sstevel@tonic-gate mdi_get_next_phci_path(dev_info_t *ct_dip, mdi_pathinfo_t *pip)
25157c478bd9Sstevel@tonic-gate {
25167c478bd9Sstevel@tonic-gate 	mdi_client_t *ct;
25177c478bd9Sstevel@tonic-gate 
25187c478bd9Sstevel@tonic-gate 	if (!MDI_CLIENT(ct_dip))
25197c478bd9Sstevel@tonic-gate 		return (NULL);
25207c478bd9Sstevel@tonic-gate 
25217c478bd9Sstevel@tonic-gate 	/*
25227c478bd9Sstevel@tonic-gate 	 * Walk through client link
25237c478bd9Sstevel@tonic-gate 	 */
25247c478bd9Sstevel@tonic-gate 	ct = (mdi_client_t *)DEVI(ct_dip)->devi_mdi_client;
25257c478bd9Sstevel@tonic-gate 	ASSERT(ct != NULL);
25267c478bd9Sstevel@tonic-gate 
25277c478bd9Sstevel@tonic-gate 	if (pip == NULL)
25287c478bd9Sstevel@tonic-gate 		return ((mdi_pathinfo_t *)ct->ct_path_head);
25297c478bd9Sstevel@tonic-gate 
25307c478bd9Sstevel@tonic-gate 	return ((mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link);
25317c478bd9Sstevel@tonic-gate }
25327c478bd9Sstevel@tonic-gate 
25337c478bd9Sstevel@tonic-gate /*
25347c478bd9Sstevel@tonic-gate  * For a phci, return the next available path to any client
25357c478bd9Sstevel@tonic-gate  * Note: ditto mdi_get_next_phci_path()
25367c478bd9Sstevel@tonic-gate  */
25377c478bd9Sstevel@tonic-gate mdi_pathinfo_t *
25387c478bd9Sstevel@tonic-gate mdi_get_next_client_path(dev_info_t *ph_dip, mdi_pathinfo_t *pip)
25397c478bd9Sstevel@tonic-gate {
25407c478bd9Sstevel@tonic-gate 	mdi_phci_t *ph;
25417c478bd9Sstevel@tonic-gate 
25427c478bd9Sstevel@tonic-gate 	if (!MDI_PHCI(ph_dip))
25437c478bd9Sstevel@tonic-gate 		return (NULL);
25447c478bd9Sstevel@tonic-gate 
25457c478bd9Sstevel@tonic-gate 	/*
25467c478bd9Sstevel@tonic-gate 	 * Walk through pHCI link
25477c478bd9Sstevel@tonic-gate 	 */
25487c478bd9Sstevel@tonic-gate 	ph = (mdi_phci_t *)DEVI(ph_dip)->devi_mdi_xhci;
25497c478bd9Sstevel@tonic-gate 	ASSERT(ph != NULL);
25507c478bd9Sstevel@tonic-gate 
25517c478bd9Sstevel@tonic-gate 	if (pip == NULL)
25527c478bd9Sstevel@tonic-gate 		return ((mdi_pathinfo_t *)ph->ph_path_head);
25537c478bd9Sstevel@tonic-gate 
25547c478bd9Sstevel@tonic-gate 	return ((mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link);
25557c478bd9Sstevel@tonic-gate }
25567c478bd9Sstevel@tonic-gate 
25577c478bd9Sstevel@tonic-gate /*
25587c478bd9Sstevel@tonic-gate  * mdi_hold_path():
25597c478bd9Sstevel@tonic-gate  *		Hold the mdi_pathinfo node against unwanted unexpected free.
25607c478bd9Sstevel@tonic-gate  * Return Values:
25617c478bd9Sstevel@tonic-gate  *		None
25627c478bd9Sstevel@tonic-gate  */
25637c478bd9Sstevel@tonic-gate void
25647c478bd9Sstevel@tonic-gate mdi_hold_path(mdi_pathinfo_t *pip)
25657c478bd9Sstevel@tonic-gate {
25667c478bd9Sstevel@tonic-gate 	if (pip) {
25677c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
25687c478bd9Sstevel@tonic-gate 		MDI_PI_HOLD(pip);
25697c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
25707c478bd9Sstevel@tonic-gate 	}
25717c478bd9Sstevel@tonic-gate }
25727c478bd9Sstevel@tonic-gate 
25737c478bd9Sstevel@tonic-gate 
25747c478bd9Sstevel@tonic-gate /*
25757c478bd9Sstevel@tonic-gate  * mdi_rele_path():
25767c478bd9Sstevel@tonic-gate  *		Release the mdi_pathinfo node which was selected
25777c478bd9Sstevel@tonic-gate  *		through mdi_select_path() mechanism or manually held by
25787c478bd9Sstevel@tonic-gate  *		calling mdi_hold_path().
25797c478bd9Sstevel@tonic-gate  * Return Values:
25807c478bd9Sstevel@tonic-gate  *		None
25817c478bd9Sstevel@tonic-gate  */
25827c478bd9Sstevel@tonic-gate void
25837c478bd9Sstevel@tonic-gate mdi_rele_path(mdi_pathinfo_t *pip)
25847c478bd9Sstevel@tonic-gate {
25857c478bd9Sstevel@tonic-gate 	if (pip) {
25867c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
25877c478bd9Sstevel@tonic-gate 		MDI_PI_RELE(pip);
25887c478bd9Sstevel@tonic-gate 		if (MDI_PI(pip)->pi_ref_cnt == 0) {
25897c478bd9Sstevel@tonic-gate 			cv_broadcast(&MDI_PI(pip)->pi_ref_cv);
25907c478bd9Sstevel@tonic-gate 		}
25917c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
25927c478bd9Sstevel@tonic-gate 	}
25937c478bd9Sstevel@tonic-gate }
25947c478bd9Sstevel@tonic-gate 
25957c478bd9Sstevel@tonic-gate /*
25967c478bd9Sstevel@tonic-gate  * mdi_pi_lock():
25977c478bd9Sstevel@tonic-gate  * 		Lock the mdi_pathinfo node.
25987c478bd9Sstevel@tonic-gate  * Note:
25997c478bd9Sstevel@tonic-gate  *		The caller should release the lock by calling mdi_pi_unlock()
26007c478bd9Sstevel@tonic-gate  */
26017c478bd9Sstevel@tonic-gate void
26027c478bd9Sstevel@tonic-gate mdi_pi_lock(mdi_pathinfo_t *pip)
26037c478bd9Sstevel@tonic-gate {
26047c478bd9Sstevel@tonic-gate 	ASSERT(pip != NULL);
26057c478bd9Sstevel@tonic-gate 	if (pip) {
26067c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
26077c478bd9Sstevel@tonic-gate 	}
26087c478bd9Sstevel@tonic-gate }
26097c478bd9Sstevel@tonic-gate 
26107c478bd9Sstevel@tonic-gate 
26117c478bd9Sstevel@tonic-gate /*
26127c478bd9Sstevel@tonic-gate  * mdi_pi_unlock():
26137c478bd9Sstevel@tonic-gate  * 		Unlock the mdi_pathinfo node.
26147c478bd9Sstevel@tonic-gate  * Note:
26157c478bd9Sstevel@tonic-gate  *		The mdi_pathinfo node should have been locked with mdi_pi_lock()
26167c478bd9Sstevel@tonic-gate  */
26177c478bd9Sstevel@tonic-gate void
26187c478bd9Sstevel@tonic-gate mdi_pi_unlock(mdi_pathinfo_t *pip)
26197c478bd9Sstevel@tonic-gate {
26207c478bd9Sstevel@tonic-gate 	ASSERT(pip != NULL);
26217c478bd9Sstevel@tonic-gate 	if (pip) {
26227c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
26237c478bd9Sstevel@tonic-gate 	}
26247c478bd9Sstevel@tonic-gate }
26257c478bd9Sstevel@tonic-gate 
26267c478bd9Sstevel@tonic-gate /*
26277c478bd9Sstevel@tonic-gate  * mdi_pi_find():
26287c478bd9Sstevel@tonic-gate  *		Search the list of mdi_pathinfo nodes attached to the
26297c478bd9Sstevel@tonic-gate  *		pHCI/Client device node whose path address matches "paddr".
26307c478bd9Sstevel@tonic-gate  *		Returns a pointer to the mdi_pathinfo node if a matching node is
26317c478bd9Sstevel@tonic-gate  *		found.
26327c478bd9Sstevel@tonic-gate  * Return Values:
26337c478bd9Sstevel@tonic-gate  *		mdi_pathinfo node handle
26347c478bd9Sstevel@tonic-gate  *		NULL
26357c478bd9Sstevel@tonic-gate  * Notes:
26367c478bd9Sstevel@tonic-gate  *		Caller need not hold any locks to call this function.
26377c478bd9Sstevel@tonic-gate  */
26387c478bd9Sstevel@tonic-gate mdi_pathinfo_t *
26397c478bd9Sstevel@tonic-gate mdi_pi_find(dev_info_t *pdip, char *caddr, char *paddr)
26407c478bd9Sstevel@tonic-gate {
26417c478bd9Sstevel@tonic-gate 	mdi_phci_t		*ph;
26427c478bd9Sstevel@tonic-gate 	mdi_vhci_t		*vh;
26437c478bd9Sstevel@tonic-gate 	mdi_client_t		*ct;
26447c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t		*pip = NULL;
26457c478bd9Sstevel@tonic-gate 
26464c06356bSdh142964 	MDI_DEBUG(2, (MDI_NOTE, pdip,
26474c06356bSdh142964 	    "caddr@%s paddr@%s", caddr ? caddr : "", paddr ? paddr : ""));
26487c478bd9Sstevel@tonic-gate 	if ((pdip == NULL) || (paddr == NULL)) {
26497c478bd9Sstevel@tonic-gate 		return (NULL);
26507c478bd9Sstevel@tonic-gate 	}
26517c478bd9Sstevel@tonic-gate 	ph = i_devi_get_phci(pdip);
26527c478bd9Sstevel@tonic-gate 	if (ph == NULL) {
26537c478bd9Sstevel@tonic-gate 		/*
26547c478bd9Sstevel@tonic-gate 		 * Invalid pHCI device, Nothing more to do.
26557c478bd9Sstevel@tonic-gate 		 */
26564c06356bSdh142964 		MDI_DEBUG(2, (MDI_WARN, pdip, "invalid phci"));
26577c478bd9Sstevel@tonic-gate 		return (NULL);
26587c478bd9Sstevel@tonic-gate 	}
26597c478bd9Sstevel@tonic-gate 
26607c478bd9Sstevel@tonic-gate 	vh = ph->ph_vhci;
26617c478bd9Sstevel@tonic-gate 	if (vh == NULL) {
26627c478bd9Sstevel@tonic-gate 		/*
26637c478bd9Sstevel@tonic-gate 		 * Invalid vHCI device, Nothing more to do.
26647c478bd9Sstevel@tonic-gate 		 */
26654c06356bSdh142964 		MDI_DEBUG(2, (MDI_WARN, pdip, "invalid vhci"));
26667c478bd9Sstevel@tonic-gate 		return (NULL);
26677c478bd9Sstevel@tonic-gate 	}
26687c478bd9Sstevel@tonic-gate 
26697c478bd9Sstevel@tonic-gate 	/*
26705e3986cbScth 	 * Look for pathinfo node identified by paddr.
26717c478bd9Sstevel@tonic-gate 	 */
26727c478bd9Sstevel@tonic-gate 	if (caddr == NULL) {
26737c478bd9Sstevel@tonic-gate 		/*
26747c478bd9Sstevel@tonic-gate 		 * Find a mdi_pathinfo node under pHCI list for a matching
26757c478bd9Sstevel@tonic-gate 		 * unit address.
26767c478bd9Sstevel@tonic-gate 		 */
26775e3986cbScth 		MDI_PHCI_LOCK(ph);
26785e3986cbScth 		if (MDI_PHCI_IS_OFFLINE(ph)) {
26794c06356bSdh142964 			MDI_DEBUG(2, (MDI_WARN, pdip,
26804c06356bSdh142964 			    "offline phci %p", (void *)ph));
26815e3986cbScth 			MDI_PHCI_UNLOCK(ph);
26825e3986cbScth 			return (NULL);
26835e3986cbScth 		}
26847c478bd9Sstevel@tonic-gate 		pip = (mdi_pathinfo_t *)ph->ph_path_head;
26857c478bd9Sstevel@tonic-gate 
26867c478bd9Sstevel@tonic-gate 		while (pip != NULL) {
26877c478bd9Sstevel@tonic-gate 			if (strcmp(MDI_PI(pip)->pi_addr, paddr) == 0) {
26887c478bd9Sstevel@tonic-gate 				break;
26897c478bd9Sstevel@tonic-gate 			}
26907c478bd9Sstevel@tonic-gate 			pip = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
26917c478bd9Sstevel@tonic-gate 		}
26925e3986cbScth 		MDI_PHCI_UNLOCK(ph);
26934c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, pdip,
26944c06356bSdh142964 		    "found %s %p", mdi_pi_spathname(pip), (void *)pip));
26957c478bd9Sstevel@tonic-gate 		return (pip);
26967c478bd9Sstevel@tonic-gate 	}
26977c478bd9Sstevel@tonic-gate 
26987c478bd9Sstevel@tonic-gate 	/*
26993c34adc5Sramat 	 * XXX - Is the rest of the code in this function really necessary?
27003c34adc5Sramat 	 * The consumers of mdi_pi_find() can search for the desired pathinfo
27013c34adc5Sramat 	 * node by calling mdi_pi_find(pdip, NULL, paddr). Irrespective of
27023c34adc5Sramat 	 * whether the search is based on the pathinfo nodes attached to
27033c34adc5Sramat 	 * the pHCI or the client node, the result will be the same.
27043c34adc5Sramat 	 */
27053c34adc5Sramat 
27063c34adc5Sramat 	/*
27077c478bd9Sstevel@tonic-gate 	 * Find the client device corresponding to 'caddr'
27087c478bd9Sstevel@tonic-gate 	 */
27095e3986cbScth 	MDI_VHCI_CLIENT_LOCK(vh);
27103c34adc5Sramat 
27113c34adc5Sramat 	/*
27123c34adc5Sramat 	 * XXX - Passing NULL to the following function works as long as the
27133c34adc5Sramat 	 * the client addresses (caddr) are unique per vhci basis.
27143c34adc5Sramat 	 */
27153c34adc5Sramat 	ct = i_mdi_client_find(vh, NULL, caddr);
27167c478bd9Sstevel@tonic-gate 	if (ct == NULL) {
27177c478bd9Sstevel@tonic-gate 		/*
27187c478bd9Sstevel@tonic-gate 		 * Client not found, Obviously mdi_pathinfo node has not been
27197c478bd9Sstevel@tonic-gate 		 * created yet.
27207c478bd9Sstevel@tonic-gate 		 */
27215e3986cbScth 		MDI_VHCI_CLIENT_UNLOCK(vh);
27224c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, pdip,
27234c06356bSdh142964 		    "client not found for caddr @%s", caddr ? caddr : ""));
27245e3986cbScth 		return (NULL);
27257c478bd9Sstevel@tonic-gate 	}
27267c478bd9Sstevel@tonic-gate 
27277c478bd9Sstevel@tonic-gate 	/*
27287c478bd9Sstevel@tonic-gate 	 * Hold the client lock and look for a mdi_pathinfo node with matching
27297c478bd9Sstevel@tonic-gate 	 * pHCI and paddr
27307c478bd9Sstevel@tonic-gate 	 */
27317c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
27327c478bd9Sstevel@tonic-gate 
27337c478bd9Sstevel@tonic-gate 	/*
27347c478bd9Sstevel@tonic-gate 	 * Release the global mutex as it is no more needed. Note: We always
27357c478bd9Sstevel@tonic-gate 	 * respect the locking order while acquiring.
27367c478bd9Sstevel@tonic-gate 	 */
27375e3986cbScth 	MDI_VHCI_CLIENT_UNLOCK(vh);
27387c478bd9Sstevel@tonic-gate 
27397c478bd9Sstevel@tonic-gate 	pip = (mdi_pathinfo_t *)ct->ct_path_head;
27407c478bd9Sstevel@tonic-gate 	while (pip != NULL) {
27417c478bd9Sstevel@tonic-gate 		/*
27427c478bd9Sstevel@tonic-gate 		 * Compare the unit address
27437c478bd9Sstevel@tonic-gate 		 */
27447c478bd9Sstevel@tonic-gate 		if ((MDI_PI(pip)->pi_phci == ph) &&
27457c478bd9Sstevel@tonic-gate 		    strcmp(MDI_PI(pip)->pi_addr, paddr) == 0) {
27467c478bd9Sstevel@tonic-gate 			break;
27477c478bd9Sstevel@tonic-gate 		}
27487c478bd9Sstevel@tonic-gate 		pip = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link;
27497c478bd9Sstevel@tonic-gate 	}
27507c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
27514c06356bSdh142964 	MDI_DEBUG(2, (MDI_NOTE, pdip,
27524c06356bSdh142964 	    "found: %s %p", mdi_pi_spathname(pip), (void *)pip));
27537c478bd9Sstevel@tonic-gate 	return (pip);
27547c478bd9Sstevel@tonic-gate }
27557c478bd9Sstevel@tonic-gate 
27567c478bd9Sstevel@tonic-gate /*
27577c478bd9Sstevel@tonic-gate  * mdi_pi_alloc():
27587c478bd9Sstevel@tonic-gate  *		Allocate and initialize a new instance of a mdi_pathinfo node.
27597c478bd9Sstevel@tonic-gate  *		The mdi_pathinfo node returned by this function identifies a
27607c478bd9Sstevel@tonic-gate  *		unique device path is capable of having properties attached
27617c478bd9Sstevel@tonic-gate  *		and passed to mdi_pi_online() to fully attach and online the
27627c478bd9Sstevel@tonic-gate  *		path and client device node.
27637c478bd9Sstevel@tonic-gate  *		The mdi_pathinfo node returned by this function must be
27647c478bd9Sstevel@tonic-gate  *		destroyed using mdi_pi_free() if the path is no longer
27657c478bd9Sstevel@tonic-gate  *		operational or if the caller fails to attach a client device
27667c478bd9Sstevel@tonic-gate  *		node when calling mdi_pi_online(). The framework will not free
27677c478bd9Sstevel@tonic-gate  *		the resources allocated.
27687c478bd9Sstevel@tonic-gate  *		This function can be called from both interrupt and kernel
27697c478bd9Sstevel@tonic-gate  *		contexts.  DDI_NOSLEEP flag should be used while calling
27707c478bd9Sstevel@tonic-gate  *		from interrupt contexts.
27717c478bd9Sstevel@tonic-gate  * Return Values:
27727c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
27737c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
27747c478bd9Sstevel@tonic-gate  *		MDI_NOMEM
27757c478bd9Sstevel@tonic-gate  */
27767c478bd9Sstevel@tonic-gate /*ARGSUSED*/
27777c478bd9Sstevel@tonic-gate int
27787c478bd9Sstevel@tonic-gate mdi_pi_alloc_compatible(dev_info_t *pdip, char *cname, char *caddr, char *paddr,
27797c478bd9Sstevel@tonic-gate     char **compatible, int ncompatible, int flags, mdi_pathinfo_t **ret_pip)
27807c478bd9Sstevel@tonic-gate {
27817c478bd9Sstevel@tonic-gate 	mdi_vhci_t	*vh;
27827c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
27837c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
27847c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*pip = NULL;
27857c478bd9Sstevel@tonic-gate 	dev_info_t	*cdip;
27867c478bd9Sstevel@tonic-gate 	int		rv = MDI_NOMEM;
27873c34adc5Sramat 	int		path_allocated = 0;
27887c478bd9Sstevel@tonic-gate 
27894c06356bSdh142964 	MDI_DEBUG(2, (MDI_NOTE, pdip,
27904c06356bSdh142964 	    "cname %s: caddr@%s paddr@%s",
27914c06356bSdh142964 	    cname ? cname : "", caddr ? caddr : "", paddr ? paddr : ""));
27925e3986cbScth 
27937c478bd9Sstevel@tonic-gate 	if (pdip == NULL || cname == NULL || caddr == NULL || paddr == NULL ||
27947c478bd9Sstevel@tonic-gate 	    ret_pip == NULL) {
27957c478bd9Sstevel@tonic-gate 		/* Nothing more to do */
27967c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
27977c478bd9Sstevel@tonic-gate 	}
27987c478bd9Sstevel@tonic-gate 
27997c478bd9Sstevel@tonic-gate 	*ret_pip = NULL;
28005e3986cbScth 
28015e3986cbScth 	/* No allocations on detaching pHCI */
28025e3986cbScth 	if (DEVI_IS_DETACHING(pdip)) {
28035e3986cbScth 		/* Invalid pHCI device, return failure */
28044c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, pdip,
28054c06356bSdh142964 		    "!detaching pHCI=%p", (void *)pdip));
28065e3986cbScth 		return (MDI_FAILURE);
28075e3986cbScth 	}
28085e3986cbScth 
28097c478bd9Sstevel@tonic-gate 	ph = i_devi_get_phci(pdip);
28107c478bd9Sstevel@tonic-gate 	ASSERT(ph != NULL);
28117c478bd9Sstevel@tonic-gate 	if (ph == NULL) {
28127c478bd9Sstevel@tonic-gate 		/* Invalid pHCI device, return failure */
28134c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, pdip,
28144c06356bSdh142964 		    "!invalid pHCI=%p", (void *)pdip));
28157c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
28167c478bd9Sstevel@tonic-gate 	}
28177c478bd9Sstevel@tonic-gate 
28187c478bd9Sstevel@tonic-gate 	MDI_PHCI_LOCK(ph);
28197c478bd9Sstevel@tonic-gate 	vh = ph->ph_vhci;
28207c478bd9Sstevel@tonic-gate 	if (vh == NULL) {
28217c478bd9Sstevel@tonic-gate 		/* Invalid vHCI device, return failure */
28224c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, pdip,
28234c06356bSdh142964 		    "!invalid vHCI=%p", (void *)pdip));
28247c478bd9Sstevel@tonic-gate 		MDI_PHCI_UNLOCK(ph);
28257c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
28267c478bd9Sstevel@tonic-gate 	}
28277c478bd9Sstevel@tonic-gate 
28287c478bd9Sstevel@tonic-gate 	if (MDI_PHCI_IS_READY(ph) == 0) {
28297c478bd9Sstevel@tonic-gate 		/*
28307c478bd9Sstevel@tonic-gate 		 * Do not allow new node creation when pHCI is in
28317c478bd9Sstevel@tonic-gate 		 * offline/suspended states
28327c478bd9Sstevel@tonic-gate 		 */
28334c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, pdip,
28344c06356bSdh142964 		    "pHCI=%p is not ready", (void *)ph));
28357c478bd9Sstevel@tonic-gate 		MDI_PHCI_UNLOCK(ph);
28367c478bd9Sstevel@tonic-gate 		return (MDI_BUSY);
28377c478bd9Sstevel@tonic-gate 	}
28387c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNSTABLE(ph);
28397c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNLOCK(ph);
28407c478bd9Sstevel@tonic-gate 
28413c34adc5Sramat 	/* look for a matching client, create one if not found */
28425e3986cbScth 	MDI_VHCI_CLIENT_LOCK(vh);
28433c34adc5Sramat 	ct = i_mdi_client_find(vh, cname, caddr);
28447c478bd9Sstevel@tonic-gate 	if (ct == NULL) {
28453c34adc5Sramat 		ct = i_mdi_client_alloc(vh, cname, caddr);
28463c34adc5Sramat 		ASSERT(ct != NULL);
28477c478bd9Sstevel@tonic-gate 	}
28487c478bd9Sstevel@tonic-gate 
28497c478bd9Sstevel@tonic-gate 	if (ct->ct_dip == NULL) {
28507c478bd9Sstevel@tonic-gate 		/*
28517c478bd9Sstevel@tonic-gate 		 * Allocate a devinfo node
28527c478bd9Sstevel@tonic-gate 		 */
28537c478bd9Sstevel@tonic-gate 		ct->ct_dip = i_mdi_devinfo_create(vh, cname, caddr,
28543c34adc5Sramat 		    compatible, ncompatible);
28557c478bd9Sstevel@tonic-gate 		if (ct->ct_dip == NULL) {
28567c478bd9Sstevel@tonic-gate 			(void) i_mdi_client_free(vh, ct);
28577c478bd9Sstevel@tonic-gate 			goto fail;
28587c478bd9Sstevel@tonic-gate 		}
28597c478bd9Sstevel@tonic-gate 	}
28607c478bd9Sstevel@tonic-gate 	cdip = ct->ct_dip;
28617c478bd9Sstevel@tonic-gate 
28627c478bd9Sstevel@tonic-gate 	DEVI(cdip)->devi_mdi_component |= MDI_COMPONENT_CLIENT;
28637c478bd9Sstevel@tonic-gate 	DEVI(cdip)->devi_mdi_client = (caddr_t)ct;
28647c478bd9Sstevel@tonic-gate 
28655e3986cbScth 	MDI_CLIENT_LOCK(ct);
28667c478bd9Sstevel@tonic-gate 	pip = (mdi_pathinfo_t *)ct->ct_path_head;
28677c478bd9Sstevel@tonic-gate 	while (pip != NULL) {
28687c478bd9Sstevel@tonic-gate 		/*
28697c478bd9Sstevel@tonic-gate 		 * Compare the unit address
28707c478bd9Sstevel@tonic-gate 		 */
28717c478bd9Sstevel@tonic-gate 		if ((MDI_PI(pip)->pi_phci == ph) &&
28727c478bd9Sstevel@tonic-gate 		    strcmp(MDI_PI(pip)->pi_addr, paddr) == 0) {
28737c478bd9Sstevel@tonic-gate 			break;
28747c478bd9Sstevel@tonic-gate 		}
28757c478bd9Sstevel@tonic-gate 		pip = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link;
28767c478bd9Sstevel@tonic-gate 	}
28775e3986cbScth 	MDI_CLIENT_UNLOCK(ct);
28787c478bd9Sstevel@tonic-gate 
28797c478bd9Sstevel@tonic-gate 	if (pip == NULL) {
28807c478bd9Sstevel@tonic-gate 		/*
28817c478bd9Sstevel@tonic-gate 		 * This is a new path for this client device.  Allocate and
28827c478bd9Sstevel@tonic-gate 		 * initialize a new pathinfo node
28837c478bd9Sstevel@tonic-gate 		 */
28843c34adc5Sramat 		pip = i_mdi_pi_alloc(ph, paddr, ct);
28853c34adc5Sramat 		ASSERT(pip != NULL);
28863c34adc5Sramat 		path_allocated = 1;
28877c478bd9Sstevel@tonic-gate 	}
28887c478bd9Sstevel@tonic-gate 	rv = MDI_SUCCESS;
28897c478bd9Sstevel@tonic-gate 
28907c478bd9Sstevel@tonic-gate fail:
28917c478bd9Sstevel@tonic-gate 	/*
28927c478bd9Sstevel@tonic-gate 	 * Release the global mutex.
28937c478bd9Sstevel@tonic-gate 	 */
28945e3986cbScth 	MDI_VHCI_CLIENT_UNLOCK(vh);
28957c478bd9Sstevel@tonic-gate 
28967c478bd9Sstevel@tonic-gate 	/*
28977c478bd9Sstevel@tonic-gate 	 * Mark the pHCI as stable
28987c478bd9Sstevel@tonic-gate 	 */
28997c478bd9Sstevel@tonic-gate 	MDI_PHCI_LOCK(ph);
29007c478bd9Sstevel@tonic-gate 	MDI_PHCI_STABLE(ph);
29017c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNLOCK(ph);
29027c478bd9Sstevel@tonic-gate 	*ret_pip = pip;
29033c34adc5Sramat 
29044c06356bSdh142964 	MDI_DEBUG(2, (MDI_NOTE, pdip,
29054c06356bSdh142964 	    "alloc %s %p", mdi_pi_spathname(pip), (void *)pip));
29065e3986cbScth 
29073c34adc5Sramat 	if (path_allocated)
29083c34adc5Sramat 		vhcache_pi_add(vh->vh_config, MDI_PI(pip));
29093c34adc5Sramat 
29107c478bd9Sstevel@tonic-gate 	return (rv);
29117c478bd9Sstevel@tonic-gate }
29127c478bd9Sstevel@tonic-gate 
29137c478bd9Sstevel@tonic-gate /*ARGSUSED*/
29147c478bd9Sstevel@tonic-gate int
29157c478bd9Sstevel@tonic-gate mdi_pi_alloc(dev_info_t *pdip, char *cname, char *caddr, char *paddr,
29167c478bd9Sstevel@tonic-gate     int flags, mdi_pathinfo_t **ret_pip)
29177c478bd9Sstevel@tonic-gate {
29187c478bd9Sstevel@tonic-gate 	return (mdi_pi_alloc_compatible(pdip, cname, caddr, paddr, NULL, 0,
29197c478bd9Sstevel@tonic-gate 	    flags, ret_pip));
29207c478bd9Sstevel@tonic-gate }
29217c478bd9Sstevel@tonic-gate 
29227c478bd9Sstevel@tonic-gate /*
29237c478bd9Sstevel@tonic-gate  * i_mdi_pi_alloc():
29247c478bd9Sstevel@tonic-gate  *		Allocate a mdi_pathinfo node and add to the pHCI path list
29257c478bd9Sstevel@tonic-gate  * Return Values:
29267c478bd9Sstevel@tonic-gate  *		mdi_pathinfo
29277c478bd9Sstevel@tonic-gate  */
29287c478bd9Sstevel@tonic-gate /*ARGSUSED*/
29297c478bd9Sstevel@tonic-gate static mdi_pathinfo_t *
29303c34adc5Sramat i_mdi_pi_alloc(mdi_phci_t *ph, char *paddr, mdi_client_t *ct)
29317c478bd9Sstevel@tonic-gate {
29323c34adc5Sramat 	mdi_pathinfo_t	*pip;
29337c478bd9Sstevel@tonic-gate 	int		ct_circular;
29347c478bd9Sstevel@tonic-gate 	int		ph_circular;
29354c06356bSdh142964 	static char	path[MAXPATHLEN];	/* mdi_pathmap_mutex protects */
2936602ca9eaScth 	char		*path_persistent;
2937602ca9eaScth 	int		path_instance;
2938602ca9eaScth 	mod_hash_val_t	hv;
29397c478bd9Sstevel@tonic-gate 
29405e3986cbScth 	ASSERT(MDI_VHCI_CLIENT_LOCKED(ph->ph_vhci));
29415e3986cbScth 
29423c34adc5Sramat 	pip = kmem_zalloc(sizeof (struct mdi_pathinfo), KM_SLEEP);
29437c478bd9Sstevel@tonic-gate 	mutex_init(&MDI_PI(pip)->pi_mutex, NULL, MUTEX_DEFAULT, NULL);
29447c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_state = MDI_PATHINFO_STATE_INIT |
29457c478bd9Sstevel@tonic-gate 	    MDI_PATHINFO_STATE_TRANSIENT;
29467c478bd9Sstevel@tonic-gate 
29477c478bd9Sstevel@tonic-gate 	if (MDI_PHCI_IS_USER_DISABLED(ph))
29487c478bd9Sstevel@tonic-gate 		MDI_PI_SET_USER_DISABLE(pip);
29497c478bd9Sstevel@tonic-gate 
29507c478bd9Sstevel@tonic-gate 	if (MDI_PHCI_IS_DRV_DISABLED_TRANSIENT(ph))
29517c478bd9Sstevel@tonic-gate 		MDI_PI_SET_DRV_DISABLE_TRANS(pip);
29527c478bd9Sstevel@tonic-gate 
29537c478bd9Sstevel@tonic-gate 	if (MDI_PHCI_IS_DRV_DISABLED(ph))
29547c478bd9Sstevel@tonic-gate 		MDI_PI_SET_DRV_DISABLE(pip);
29557c478bd9Sstevel@tonic-gate 
29567c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_old_state = MDI_PATHINFO_STATE_INIT;
29577c478bd9Sstevel@tonic-gate 	cv_init(&MDI_PI(pip)->pi_state_cv, NULL, CV_DEFAULT, NULL);
29587c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_client = ct;
29597c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_phci = ph;
29603c34adc5Sramat 	MDI_PI(pip)->pi_addr = kmem_alloc(strlen(paddr) + 1, KM_SLEEP);
29617c478bd9Sstevel@tonic-gate 	(void) strcpy(MDI_PI(pip)->pi_addr, paddr);
2962602ca9eaScth 
2963602ca9eaScth         /*
2964602ca9eaScth 	 * We form the "path" to the pathinfo node, and see if we have
2965602ca9eaScth 	 * already allocated a 'path_instance' for that "path".  If so,
2966602ca9eaScth 	 * we use the already allocated 'path_instance'.  If not, we
2967602ca9eaScth 	 * allocate a new 'path_instance' and associate it with a copy of
2968602ca9eaScth 	 * the "path" string (which is never freed). The association
2969602ca9eaScth 	 * between a 'path_instance' this "path" string persists until
2970602ca9eaScth 	 * reboot.
2971602ca9eaScth 	 */
2972602ca9eaScth         mutex_enter(&mdi_pathmap_mutex);
2973602ca9eaScth 	(void) ddi_pathname(ph->ph_dip, path);
2974602ca9eaScth 	(void) sprintf(path + strlen(path), "/%s@%s",
297555e592a2SRandall Ralphs 	    mdi_pi_get_node_name(pip), mdi_pi_get_addr(pip));
2976602ca9eaScth         if (mod_hash_find(mdi_pathmap_bypath, (mod_hash_key_t)path, &hv) == 0) {
2977602ca9eaScth                 path_instance = (uint_t)(intptr_t)hv;
2978602ca9eaScth         } else {
2979602ca9eaScth 		/* allocate a new 'path_instance' and persistent "path" */
2980602ca9eaScth 		path_instance = mdi_pathmap_instance++;
2981602ca9eaScth 		path_persistent = i_ddi_strdup(path, KM_SLEEP);
2982602ca9eaScth                 (void) mod_hash_insert(mdi_pathmap_bypath,
2983602ca9eaScth                     (mod_hash_key_t)path_persistent,
2984602ca9eaScth                     (mod_hash_val_t)(intptr_t)path_instance);
2985602ca9eaScth 		(void) mod_hash_insert(mdi_pathmap_byinstance,
2986602ca9eaScth 		    (mod_hash_key_t)(intptr_t)path_instance,
2987602ca9eaScth 		    (mod_hash_val_t)path_persistent);
29884c06356bSdh142964 
29894c06356bSdh142964 		/* create shortpath name */
29904c06356bSdh142964 		(void) snprintf(path, sizeof(path), "%s%d/%s@%s",
29914c06356bSdh142964 		    ddi_driver_name(ph->ph_dip), ddi_get_instance(ph->ph_dip),
29924c06356bSdh142964 		    mdi_pi_get_node_name(pip), mdi_pi_get_addr(pip));
29934c06356bSdh142964 		path_persistent = i_ddi_strdup(path, KM_SLEEP);
29944c06356bSdh142964 		(void) mod_hash_insert(mdi_pathmap_sbyinstance,
29954c06356bSdh142964 		    (mod_hash_key_t)(intptr_t)path_instance,
29964c06356bSdh142964 		    (mod_hash_val_t)path_persistent);
2997602ca9eaScth         }
2998602ca9eaScth         mutex_exit(&mdi_pathmap_mutex);
2999602ca9eaScth 	MDI_PI(pip)->pi_path_instance = path_instance;
3000602ca9eaScth 
30013c34adc5Sramat 	(void) nvlist_alloc(&MDI_PI(pip)->pi_prop, NV_UNIQUE_NAME, KM_SLEEP);
30023c34adc5Sramat 	ASSERT(MDI_PI(pip)->pi_prop != NULL);
30037c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_pprivate = NULL;
30047c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_cprivate = NULL;
30057c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_vprivate = NULL;
30067c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_client_link = NULL;
30077c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_phci_link = NULL;
30087c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_ref_cnt = 0;
30097c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_kstats = NULL;
30107c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_preferred = 1;
30117c478bd9Sstevel@tonic-gate 	cv_init(&MDI_PI(pip)->pi_ref_cv, NULL, CV_DEFAULT, NULL);
30127c478bd9Sstevel@tonic-gate 
30137c478bd9Sstevel@tonic-gate 	/*
30147c478bd9Sstevel@tonic-gate 	 * Lock both dev_info nodes against changes in parallel.
30155e3986cbScth 	 *
30165e3986cbScth 	 * The ndi_devi_enter(Client), is atypical since the client is a leaf.
30175e3986cbScth 	 * This atypical operation is done to synchronize pathinfo nodes
30185e3986cbScth 	 * during devinfo snapshot (see di_register_pip) by 'pretending' that
30195e3986cbScth 	 * the pathinfo nodes are children of the Client.
30207c478bd9Sstevel@tonic-gate 	 */
30217c478bd9Sstevel@tonic-gate 	ndi_devi_enter(ct->ct_dip, &ct_circular);
30227c478bd9Sstevel@tonic-gate 	ndi_devi_enter(ph->ph_dip, &ph_circular);
30237c478bd9Sstevel@tonic-gate 
30247c478bd9Sstevel@tonic-gate 	i_mdi_phci_add_path(ph, pip);
30257c478bd9Sstevel@tonic-gate 	i_mdi_client_add_path(ct, pip);
30267c478bd9Sstevel@tonic-gate 
30277c478bd9Sstevel@tonic-gate 	ndi_devi_exit(ph->ph_dip, ph_circular);
30287c478bd9Sstevel@tonic-gate 	ndi_devi_exit(ct->ct_dip, ct_circular);
30297c478bd9Sstevel@tonic-gate 
30307c478bd9Sstevel@tonic-gate 	return (pip);
30317c478bd9Sstevel@tonic-gate }
30327c478bd9Sstevel@tonic-gate 
30337c478bd9Sstevel@tonic-gate /*
3034602ca9eaScth  * mdi_pi_pathname_by_instance():
3035602ca9eaScth  *	Lookup of "path" by 'path_instance'. Return "path".
3036602ca9eaScth  *	NOTE: returned "path" remains valid forever (until reboot).
3037602ca9eaScth  */
3038602ca9eaScth char *
3039602ca9eaScth mdi_pi_pathname_by_instance(int path_instance)
3040602ca9eaScth {
3041602ca9eaScth 	char		*path;
3042602ca9eaScth 	mod_hash_val_t	hv;
3043602ca9eaScth 
3044602ca9eaScth 	/* mdi_pathmap lookup of "path" by 'path_instance' */
3045602ca9eaScth 	mutex_enter(&mdi_pathmap_mutex);
3046602ca9eaScth 	if (mod_hash_find(mdi_pathmap_byinstance,
3047602ca9eaScth 	    (mod_hash_key_t)(intptr_t)path_instance, &hv) == 0)
3048602ca9eaScth 		path = (char *)hv;
3049602ca9eaScth 	else
3050602ca9eaScth 		path = NULL;
3051602ca9eaScth 	mutex_exit(&mdi_pathmap_mutex);
3052602ca9eaScth 	return (path);
3053602ca9eaScth }
3054602ca9eaScth 
3055602ca9eaScth /*
30564c06356bSdh142964  * mdi_pi_spathname_by_instance():
30574c06356bSdh142964  *	Lookup of "shortpath" by 'path_instance'. Return "shortpath".
30584c06356bSdh142964  *	NOTE: returned "shortpath" remains valid forever (until reboot).
30594c06356bSdh142964  */
30604c06356bSdh142964 char *
30614c06356bSdh142964 mdi_pi_spathname_by_instance(int path_instance)
30624c06356bSdh142964 {
30634c06356bSdh142964 	char		*path;
30644c06356bSdh142964 	mod_hash_val_t	hv;
30654c06356bSdh142964 
30664c06356bSdh142964 	/* mdi_pathmap lookup of "path" by 'path_instance' */
30674c06356bSdh142964 	mutex_enter(&mdi_pathmap_mutex);
30684c06356bSdh142964 	if (mod_hash_find(mdi_pathmap_sbyinstance,
30694c06356bSdh142964 	    (mod_hash_key_t)(intptr_t)path_instance, &hv) == 0)
30704c06356bSdh142964 		path = (char *)hv;
30714c06356bSdh142964 	else
30724c06356bSdh142964 		path = NULL;
30734c06356bSdh142964 	mutex_exit(&mdi_pathmap_mutex);
30744c06356bSdh142964 	return (path);
30754c06356bSdh142964 }
30764c06356bSdh142964 
30774c06356bSdh142964 
30784c06356bSdh142964 /*
30797c478bd9Sstevel@tonic-gate  * i_mdi_phci_add_path():
30807c478bd9Sstevel@tonic-gate  * 		Add a mdi_pathinfo node to pHCI list.
30817c478bd9Sstevel@tonic-gate  * Notes:
30827c478bd9Sstevel@tonic-gate  *		Caller should per-pHCI mutex
30837c478bd9Sstevel@tonic-gate  */
30847c478bd9Sstevel@tonic-gate static void
30857c478bd9Sstevel@tonic-gate i_mdi_phci_add_path(mdi_phci_t *ph, mdi_pathinfo_t *pip)
30867c478bd9Sstevel@tonic-gate {
30877c478bd9Sstevel@tonic-gate 	ASSERT(DEVI_BUSY_OWNED(ph->ph_dip));
30887c478bd9Sstevel@tonic-gate 
30895e3986cbScth 	MDI_PHCI_LOCK(ph);
30907c478bd9Sstevel@tonic-gate 	if (ph->ph_path_head == NULL) {
30917c478bd9Sstevel@tonic-gate 		ph->ph_path_head = pip;
30927c478bd9Sstevel@tonic-gate 	} else {
30937c478bd9Sstevel@tonic-gate 		MDI_PI(ph->ph_path_tail)->pi_phci_link = MDI_PI(pip);
30947c478bd9Sstevel@tonic-gate 	}
30957c478bd9Sstevel@tonic-gate 	ph->ph_path_tail = pip;
30967c478bd9Sstevel@tonic-gate 	ph->ph_path_count++;
30975e3986cbScth 	MDI_PHCI_UNLOCK(ph);
30987c478bd9Sstevel@tonic-gate }
30997c478bd9Sstevel@tonic-gate 
31007c478bd9Sstevel@tonic-gate /*
31017c478bd9Sstevel@tonic-gate  * i_mdi_client_add_path():
31027c478bd9Sstevel@tonic-gate  *		Add mdi_pathinfo node to client list
31037c478bd9Sstevel@tonic-gate  */
31047c478bd9Sstevel@tonic-gate static void
31057c478bd9Sstevel@tonic-gate i_mdi_client_add_path(mdi_client_t *ct, mdi_pathinfo_t *pip)
31067c478bd9Sstevel@tonic-gate {
31077c478bd9Sstevel@tonic-gate 	ASSERT(DEVI_BUSY_OWNED(ct->ct_dip));
31087c478bd9Sstevel@tonic-gate 
31095e3986cbScth 	MDI_CLIENT_LOCK(ct);
31107c478bd9Sstevel@tonic-gate 	if (ct->ct_path_head == NULL) {
31117c478bd9Sstevel@tonic-gate 		ct->ct_path_head = pip;
31127c478bd9Sstevel@tonic-gate 	} else {
31137c478bd9Sstevel@tonic-gate 		MDI_PI(ct->ct_path_tail)->pi_client_link = MDI_PI(pip);
31147c478bd9Sstevel@tonic-gate 	}
31157c478bd9Sstevel@tonic-gate 	ct->ct_path_tail = pip;
31167c478bd9Sstevel@tonic-gate 	ct->ct_path_count++;
31175e3986cbScth 	MDI_CLIENT_UNLOCK(ct);
31187c478bd9Sstevel@tonic-gate }
31197c478bd9Sstevel@tonic-gate 
31207c478bd9Sstevel@tonic-gate /*
31217c478bd9Sstevel@tonic-gate  * mdi_pi_free():
31227c478bd9Sstevel@tonic-gate  *		Free the mdi_pathinfo node and also client device node if this
31237c478bd9Sstevel@tonic-gate  *		is the last path to the device
31247c478bd9Sstevel@tonic-gate  * Return Values:
31257c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
31267c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
31277c478bd9Sstevel@tonic-gate  *		MDI_BUSY
31287c478bd9Sstevel@tonic-gate  */
31297c478bd9Sstevel@tonic-gate /*ARGSUSED*/
31307c478bd9Sstevel@tonic-gate int
31317c478bd9Sstevel@tonic-gate mdi_pi_free(mdi_pathinfo_t *pip, int flags)
31327c478bd9Sstevel@tonic-gate {
3133e9b79356Srs135747 	int		rv = MDI_FAILURE;
31347c478bd9Sstevel@tonic-gate 	mdi_vhci_t	*vh;
31357c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
31367c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
31377c478bd9Sstevel@tonic-gate 	int		(*f)();
31387c478bd9Sstevel@tonic-gate 	int		client_held = 0;
31397c478bd9Sstevel@tonic-gate 
31407c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
31417c478bd9Sstevel@tonic-gate 	ph = MDI_PI(pip)->pi_phci;
31427c478bd9Sstevel@tonic-gate 	ASSERT(ph != NULL);
31437c478bd9Sstevel@tonic-gate 	if (ph == NULL) {
31447c478bd9Sstevel@tonic-gate 		/*
31457c478bd9Sstevel@tonic-gate 		 * Invalid pHCI device, return failure
31467c478bd9Sstevel@tonic-gate 		 */
31474c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, NULL,
31484c06356bSdh142964 		    "!invalid pHCI: pip %s %p",
31494c06356bSdh142964 		    mdi_pi_spathname(pip), (void *)pip));
31507c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
31517c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
31527c478bd9Sstevel@tonic-gate 	}
31537c478bd9Sstevel@tonic-gate 
31547c478bd9Sstevel@tonic-gate 	vh = ph->ph_vhci;
31557c478bd9Sstevel@tonic-gate 	ASSERT(vh != NULL);
31567c478bd9Sstevel@tonic-gate 	if (vh == NULL) {
31577c478bd9Sstevel@tonic-gate 		/* Invalid pHCI device, return failure */
31584c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, ph->ph_dip,
31594c06356bSdh142964 		    "!invalid vHCI: pip %s %p",
31604c06356bSdh142964 		    mdi_pi_spathname(pip), (void *)pip));
31617c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
31627c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
31637c478bd9Sstevel@tonic-gate 	}
31647c478bd9Sstevel@tonic-gate 
31657c478bd9Sstevel@tonic-gate 	ct = MDI_PI(pip)->pi_client;
31667c478bd9Sstevel@tonic-gate 	ASSERT(ct != NULL);
31677c478bd9Sstevel@tonic-gate 	if (ct == NULL) {
31687c478bd9Sstevel@tonic-gate 		/*
31697c478bd9Sstevel@tonic-gate 		 * Invalid Client device, return failure
31707c478bd9Sstevel@tonic-gate 		 */
31714c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, ph->ph_dip,
31724c06356bSdh142964 		    "!invalid client: pip %s %p",
31734c06356bSdh142964 		    mdi_pi_spathname(pip), (void *)pip));
31747c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
31757c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
31767c478bd9Sstevel@tonic-gate 	}
31777c478bd9Sstevel@tonic-gate 
31787c478bd9Sstevel@tonic-gate 	/*
31797c478bd9Sstevel@tonic-gate 	 * Check to see for busy condition.  A mdi_pathinfo can only be freed
31807c478bd9Sstevel@tonic-gate 	 * if the node state is either offline or init and the reference count
31817c478bd9Sstevel@tonic-gate 	 * is zero.
31827c478bd9Sstevel@tonic-gate 	 */
31837c478bd9Sstevel@tonic-gate 	if (!(MDI_PI_IS_OFFLINE(pip) || MDI_PI_IS_INIT(pip) ||
31847c478bd9Sstevel@tonic-gate 	    MDI_PI_IS_INITING(pip))) {
31857c478bd9Sstevel@tonic-gate 		/*
31867c478bd9Sstevel@tonic-gate 		 * Node is busy
31877c478bd9Sstevel@tonic-gate 		 */
31884c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, ct->ct_dip,
31894c06356bSdh142964 		    "!busy: pip %s %p", mdi_pi_spathname(pip), (void *)pip));
31907c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
31917c478bd9Sstevel@tonic-gate 		return (MDI_BUSY);
31927c478bd9Sstevel@tonic-gate 	}
31937c478bd9Sstevel@tonic-gate 
31947c478bd9Sstevel@tonic-gate 	while (MDI_PI(pip)->pi_ref_cnt != 0) {
31957c478bd9Sstevel@tonic-gate 		/*
31967c478bd9Sstevel@tonic-gate 		 * Give a chance for pending I/Os to complete.
31977c478bd9Sstevel@tonic-gate 		 */
31984c06356bSdh142964 		MDI_DEBUG(1, (MDI_NOTE, ct->ct_dip,
31994c06356bSdh142964 		    "!%d cmds still pending on path: %s %p",
32004c06356bSdh142964 		    MDI_PI(pip)->pi_ref_cnt,
32014c06356bSdh142964 		    mdi_pi_spathname(pip), (void *)pip));
3202*d3d50737SRafael Vanoni 		if (cv_reltimedwait(&MDI_PI(pip)->pi_ref_cv,
3203*d3d50737SRafael Vanoni 		    &MDI_PI(pip)->pi_mutex, drv_usectohz(60 * 1000000),
3204*d3d50737SRafael Vanoni 		    TR_CLOCK_TICK) == -1) {
32057c478bd9Sstevel@tonic-gate 			/*
32067c478bd9Sstevel@tonic-gate 			 * The timeout time reached without ref_cnt being zero
32077c478bd9Sstevel@tonic-gate 			 * being signaled.
32087c478bd9Sstevel@tonic-gate 			 */
32094c06356bSdh142964 			MDI_DEBUG(1, (MDI_NOTE, ct->ct_dip,
32104c06356bSdh142964 			    "!Timeout reached on path %s %p without the cond",
32114c06356bSdh142964 			    mdi_pi_spathname(pip), (void *)pip));
32124c06356bSdh142964 			MDI_DEBUG(1, (MDI_NOTE, ct->ct_dip,
32134c06356bSdh142964 			    "!%d cmds still pending on path %s %p",
32144c06356bSdh142964 			    MDI_PI(pip)->pi_ref_cnt,
32154c06356bSdh142964 			    mdi_pi_spathname(pip), (void *)pip));
32167c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
32177c478bd9Sstevel@tonic-gate 			return (MDI_BUSY);
32187c478bd9Sstevel@tonic-gate 		}
32197c478bd9Sstevel@tonic-gate 	}
32207c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_pm_held) {
32217c478bd9Sstevel@tonic-gate 		client_held = 1;
32227c478bd9Sstevel@tonic-gate 	}
32237c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
32247c478bd9Sstevel@tonic-gate 
32253c34adc5Sramat 	vhcache_pi_remove(vh->vh_config, MDI_PI(pip));
32263c34adc5Sramat 
32277c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
32287c478bd9Sstevel@tonic-gate 
32295e3986cbScth 	/* Prevent further failovers till MDI_VHCI_CLIENT_LOCK is held */
32307c478bd9Sstevel@tonic-gate 	MDI_CLIENT_SET_PATH_FREE_IN_PROGRESS(ct);
32317c478bd9Sstevel@tonic-gate 
32327c478bd9Sstevel@tonic-gate 	/*
32337c478bd9Sstevel@tonic-gate 	 * Wait till failover is complete before removing this node.
32347c478bd9Sstevel@tonic-gate 	 */
32357c478bd9Sstevel@tonic-gate 	while (MDI_CLIENT_IS_FAILOVER_IN_PROGRESS(ct))
32367c478bd9Sstevel@tonic-gate 		cv_wait(&ct->ct_failover_cv, &ct->ct_mutex);
32377c478bd9Sstevel@tonic-gate 
32387c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
32395e3986cbScth 	MDI_VHCI_CLIENT_LOCK(vh);
32407c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
32417c478bd9Sstevel@tonic-gate 	MDI_CLIENT_CLEAR_PATH_FREE_IN_PROGRESS(ct);
32427c478bd9Sstevel@tonic-gate 
32437c478bd9Sstevel@tonic-gate 	if (!MDI_PI_IS_INITING(pip)) {
32447c478bd9Sstevel@tonic-gate 		f = vh->vh_ops->vo_pi_uninit;
32457c478bd9Sstevel@tonic-gate 		if (f != NULL) {
32467c478bd9Sstevel@tonic-gate 			rv = (*f)(vh->vh_dip, pip, 0);
32477c478bd9Sstevel@tonic-gate 		}
32487c478bd9Sstevel@tonic-gate 	}
32497c478bd9Sstevel@tonic-gate 	/*
32507c478bd9Sstevel@tonic-gate 	 * If vo_pi_uninit() completed successfully.
32517c478bd9Sstevel@tonic-gate 	 */
32527c478bd9Sstevel@tonic-gate 	if (rv == MDI_SUCCESS) {
32537c478bd9Sstevel@tonic-gate 		if (client_held) {
32544c06356bSdh142964 			MDI_DEBUG(4, (MDI_NOTE, ct->ct_dip,
32557c478bd9Sstevel@tonic-gate 			    "i_mdi_pm_rele_client\n"));
32567c478bd9Sstevel@tonic-gate 			i_mdi_pm_rele_client(ct, 1);
32577c478bd9Sstevel@tonic-gate 		}
32587c478bd9Sstevel@tonic-gate 		i_mdi_pi_free(ph, pip, ct);
32597c478bd9Sstevel@tonic-gate 		if (ct->ct_path_count == 0) {
32607c478bd9Sstevel@tonic-gate 			/*
32617c478bd9Sstevel@tonic-gate 			 * Client lost its last path.
32627c478bd9Sstevel@tonic-gate 			 * Clean up the client device
32637c478bd9Sstevel@tonic-gate 			 */
32647c478bd9Sstevel@tonic-gate 			MDI_CLIENT_UNLOCK(ct);
32657c478bd9Sstevel@tonic-gate 			(void) i_mdi_client_free(ct->ct_vhci, ct);
32665e3986cbScth 			MDI_VHCI_CLIENT_UNLOCK(vh);
32677c478bd9Sstevel@tonic-gate 			return (rv);
32687c478bd9Sstevel@tonic-gate 		}
32697c478bd9Sstevel@tonic-gate 	}
32707c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
32715e3986cbScth 	MDI_VHCI_CLIENT_UNLOCK(vh);
32723c34adc5Sramat 
32733c34adc5Sramat 	if (rv == MDI_FAILURE)
32743c34adc5Sramat 		vhcache_pi_add(vh->vh_config, MDI_PI(pip));
32753c34adc5Sramat 
32767c478bd9Sstevel@tonic-gate 	return (rv);
32777c478bd9Sstevel@tonic-gate }
32787c478bd9Sstevel@tonic-gate 
32797c478bd9Sstevel@tonic-gate /*
32807c478bd9Sstevel@tonic-gate  * i_mdi_pi_free():
32817c478bd9Sstevel@tonic-gate  *		Free the mdi_pathinfo node
32827c478bd9Sstevel@tonic-gate  */
32837c478bd9Sstevel@tonic-gate static void
32847c478bd9Sstevel@tonic-gate i_mdi_pi_free(mdi_phci_t *ph, mdi_pathinfo_t *pip, mdi_client_t *ct)
32857c478bd9Sstevel@tonic-gate {
32867c478bd9Sstevel@tonic-gate 	int	ct_circular;
32877c478bd9Sstevel@tonic-gate 	int	ph_circular;
32887c478bd9Sstevel@tonic-gate 
32895e3986cbScth 	ASSERT(MDI_CLIENT_LOCKED(ct));
32905e3986cbScth 
32917c478bd9Sstevel@tonic-gate 	/*
32927c478bd9Sstevel@tonic-gate 	 * remove any per-path kstats
32937c478bd9Sstevel@tonic-gate 	 */
32947c478bd9Sstevel@tonic-gate 	i_mdi_pi_kstat_destroy(pip);
32957c478bd9Sstevel@tonic-gate 
32965e3986cbScth 	/* See comments in i_mdi_pi_alloc() */
32977c478bd9Sstevel@tonic-gate 	ndi_devi_enter(ct->ct_dip, &ct_circular);
32987c478bd9Sstevel@tonic-gate 	ndi_devi_enter(ph->ph_dip, &ph_circular);
32997c478bd9Sstevel@tonic-gate 
33007c478bd9Sstevel@tonic-gate 	i_mdi_client_remove_path(ct, pip);
33017c478bd9Sstevel@tonic-gate 	i_mdi_phci_remove_path(ph, pip);
33027c478bd9Sstevel@tonic-gate 
33037c478bd9Sstevel@tonic-gate 	ndi_devi_exit(ph->ph_dip, ph_circular);
33047c478bd9Sstevel@tonic-gate 	ndi_devi_exit(ct->ct_dip, ct_circular);
33057c478bd9Sstevel@tonic-gate 
33067c478bd9Sstevel@tonic-gate 	mutex_destroy(&MDI_PI(pip)->pi_mutex);
33077c478bd9Sstevel@tonic-gate 	cv_destroy(&MDI_PI(pip)->pi_state_cv);
33087c478bd9Sstevel@tonic-gate 	cv_destroy(&MDI_PI(pip)->pi_ref_cv);
33097c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_addr) {
33107c478bd9Sstevel@tonic-gate 		kmem_free(MDI_PI(pip)->pi_addr,
33117c478bd9Sstevel@tonic-gate 		    strlen(MDI_PI(pip)->pi_addr) + 1);
33127c478bd9Sstevel@tonic-gate 		MDI_PI(pip)->pi_addr = NULL;
33137c478bd9Sstevel@tonic-gate 	}
33147c478bd9Sstevel@tonic-gate 
33157c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_prop) {
33167c478bd9Sstevel@tonic-gate 		(void) nvlist_free(MDI_PI(pip)->pi_prop);
33177c478bd9Sstevel@tonic-gate 		MDI_PI(pip)->pi_prop = NULL;
33187c478bd9Sstevel@tonic-gate 	}
33197c478bd9Sstevel@tonic-gate 	kmem_free(pip, sizeof (struct mdi_pathinfo));
33207c478bd9Sstevel@tonic-gate }
33217c478bd9Sstevel@tonic-gate 
33227c478bd9Sstevel@tonic-gate 
33237c478bd9Sstevel@tonic-gate /*
33247c478bd9Sstevel@tonic-gate  * i_mdi_phci_remove_path():
33257c478bd9Sstevel@tonic-gate  * 		Remove a mdi_pathinfo node from pHCI list.
33267c478bd9Sstevel@tonic-gate  * Notes:
33277c478bd9Sstevel@tonic-gate  *		Caller should hold per-pHCI mutex
33287c478bd9Sstevel@tonic-gate  */
33297c478bd9Sstevel@tonic-gate static void
33307c478bd9Sstevel@tonic-gate i_mdi_phci_remove_path(mdi_phci_t *ph, mdi_pathinfo_t *pip)
33317c478bd9Sstevel@tonic-gate {
33327c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*prev = NULL;
33337c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*path = NULL;
33347c478bd9Sstevel@tonic-gate 
33357c478bd9Sstevel@tonic-gate 	ASSERT(DEVI_BUSY_OWNED(ph->ph_dip));
33367c478bd9Sstevel@tonic-gate 
33375e3986cbScth 	MDI_PHCI_LOCK(ph);
33387c478bd9Sstevel@tonic-gate 	path = ph->ph_path_head;
33397c478bd9Sstevel@tonic-gate 	while (path != NULL) {
33407c478bd9Sstevel@tonic-gate 		if (path == pip) {
33417c478bd9Sstevel@tonic-gate 			break;
33427c478bd9Sstevel@tonic-gate 		}
33437c478bd9Sstevel@tonic-gate 		prev = path;
33447c478bd9Sstevel@tonic-gate 		path = (mdi_pathinfo_t *)MDI_PI(path)->pi_phci_link;
33457c478bd9Sstevel@tonic-gate 	}
33467c478bd9Sstevel@tonic-gate 
33477c478bd9Sstevel@tonic-gate 	if (path) {
33487c478bd9Sstevel@tonic-gate 		ph->ph_path_count--;
33497c478bd9Sstevel@tonic-gate 		if (prev) {
33507c478bd9Sstevel@tonic-gate 			MDI_PI(prev)->pi_phci_link = MDI_PI(path)->pi_phci_link;
33517c478bd9Sstevel@tonic-gate 		} else {
33527c478bd9Sstevel@tonic-gate 			ph->ph_path_head =
33537c478bd9Sstevel@tonic-gate 			    (mdi_pathinfo_t *)MDI_PI(path)->pi_phci_link;
33547c478bd9Sstevel@tonic-gate 		}
33557c478bd9Sstevel@tonic-gate 		if (ph->ph_path_tail == path) {
33567c478bd9Sstevel@tonic-gate 			ph->ph_path_tail = prev;
33577c478bd9Sstevel@tonic-gate 		}
33587c478bd9Sstevel@tonic-gate 	}
33597c478bd9Sstevel@tonic-gate 
33607c478bd9Sstevel@tonic-gate 	/*
33617c478bd9Sstevel@tonic-gate 	 * Clear the pHCI link
33627c478bd9Sstevel@tonic-gate 	 */
33637c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_phci_link = NULL;
33647c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_phci = NULL;
33655e3986cbScth 	MDI_PHCI_UNLOCK(ph);
33667c478bd9Sstevel@tonic-gate }
33677c478bd9Sstevel@tonic-gate 
33687c478bd9Sstevel@tonic-gate /*
33697c478bd9Sstevel@tonic-gate  * i_mdi_client_remove_path():
33707c478bd9Sstevel@tonic-gate  * 		Remove a mdi_pathinfo node from client path list.
33717c478bd9Sstevel@tonic-gate  */
33727c478bd9Sstevel@tonic-gate static void
33737c478bd9Sstevel@tonic-gate i_mdi_client_remove_path(mdi_client_t *ct, mdi_pathinfo_t *pip)
33747c478bd9Sstevel@tonic-gate {
33757c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*prev = NULL;
33767c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*path;
33777c478bd9Sstevel@tonic-gate 
33787c478bd9Sstevel@tonic-gate 	ASSERT(DEVI_BUSY_OWNED(ct->ct_dip));
33797c478bd9Sstevel@tonic-gate 
33805e3986cbScth 	ASSERT(MDI_CLIENT_LOCKED(ct));
33817c478bd9Sstevel@tonic-gate 	path = ct->ct_path_head;
33827c478bd9Sstevel@tonic-gate 	while (path != NULL) {
33837c478bd9Sstevel@tonic-gate 		if (path == pip) {
33847c478bd9Sstevel@tonic-gate 			break;
33857c478bd9Sstevel@tonic-gate 		}
33867c478bd9Sstevel@tonic-gate 		prev = path;
33877c478bd9Sstevel@tonic-gate 		path = (mdi_pathinfo_t *)MDI_PI(path)->pi_client_link;
33887c478bd9Sstevel@tonic-gate 	}
33897c478bd9Sstevel@tonic-gate 
33907c478bd9Sstevel@tonic-gate 	if (path) {
33917c478bd9Sstevel@tonic-gate 		ct->ct_path_count--;
33927c478bd9Sstevel@tonic-gate 		if (prev) {
33937c478bd9Sstevel@tonic-gate 			MDI_PI(prev)->pi_client_link =
33947c478bd9Sstevel@tonic-gate 			    MDI_PI(path)->pi_client_link;
33957c478bd9Sstevel@tonic-gate 		} else {
33967c478bd9Sstevel@tonic-gate 			ct->ct_path_head =
33977c478bd9Sstevel@tonic-gate 			    (mdi_pathinfo_t *)MDI_PI(path)->pi_client_link;
33987c478bd9Sstevel@tonic-gate 		}
33997c478bd9Sstevel@tonic-gate 		if (ct->ct_path_tail == path) {
34007c478bd9Sstevel@tonic-gate 			ct->ct_path_tail = prev;
34017c478bd9Sstevel@tonic-gate 		}
34027c478bd9Sstevel@tonic-gate 		if (ct->ct_path_last == path) {
34037c478bd9Sstevel@tonic-gate 			ct->ct_path_last = ct->ct_path_head;
34047c478bd9Sstevel@tonic-gate 		}
34057c478bd9Sstevel@tonic-gate 	}
34067c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_client_link = NULL;
34077c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_client = NULL;
34087c478bd9Sstevel@tonic-gate }
34097c478bd9Sstevel@tonic-gate 
34107c478bd9Sstevel@tonic-gate /*
34117c478bd9Sstevel@tonic-gate  * i_mdi_pi_state_change():
34127c478bd9Sstevel@tonic-gate  *		online a mdi_pathinfo node
34137c478bd9Sstevel@tonic-gate  *
34147c478bd9Sstevel@tonic-gate  * Return Values:
34157c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
34167c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
34177c478bd9Sstevel@tonic-gate  */
34187c478bd9Sstevel@tonic-gate /*ARGSUSED*/
34197c478bd9Sstevel@tonic-gate static int
34207c478bd9Sstevel@tonic-gate i_mdi_pi_state_change(mdi_pathinfo_t *pip, mdi_pathinfo_state_t state, int flag)
34217c478bd9Sstevel@tonic-gate {
34227c478bd9Sstevel@tonic-gate 	int		rv = MDI_SUCCESS;
34237c478bd9Sstevel@tonic-gate 	mdi_vhci_t	*vh;
34247c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
34257c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
34267c478bd9Sstevel@tonic-gate 	int		(*f)();
34277c478bd9Sstevel@tonic-gate 	dev_info_t	*cdip;
34287c478bd9Sstevel@tonic-gate 
34297c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
34307c478bd9Sstevel@tonic-gate 
34317c478bd9Sstevel@tonic-gate 	ph = MDI_PI(pip)->pi_phci;
34327c478bd9Sstevel@tonic-gate 	ASSERT(ph);
34337c478bd9Sstevel@tonic-gate 	if (ph == NULL) {
34347c478bd9Sstevel@tonic-gate 		/*
34357c478bd9Sstevel@tonic-gate 		 * Invalid pHCI device, fail the request
34367c478bd9Sstevel@tonic-gate 		 */
34377c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
34384c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, NULL,
34394c06356bSdh142964 		    "!invalid phci: pip %s %p",
34404c06356bSdh142964 		    mdi_pi_spathname(pip), (void *)pip));
34417c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
34427c478bd9Sstevel@tonic-gate 	}
34437c478bd9Sstevel@tonic-gate 
34447c478bd9Sstevel@tonic-gate 	vh = ph->ph_vhci;
34457c478bd9Sstevel@tonic-gate 	ASSERT(vh);
34467c478bd9Sstevel@tonic-gate 	if (vh == NULL) {
34477c478bd9Sstevel@tonic-gate 		/*
34487c478bd9Sstevel@tonic-gate 		 * Invalid vHCI device, fail the request
34497c478bd9Sstevel@tonic-gate 		 */
34507c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
34514c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, ph->ph_dip,
34524c06356bSdh142964 		    "!invalid vhci: pip %s %p",
34534c06356bSdh142964 		    mdi_pi_spathname(pip), (void *)pip));
34547c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
34557c478bd9Sstevel@tonic-gate 	}
34567c478bd9Sstevel@tonic-gate 
34577c478bd9Sstevel@tonic-gate 	ct = MDI_PI(pip)->pi_client;
34587c478bd9Sstevel@tonic-gate 	ASSERT(ct != NULL);
34597c478bd9Sstevel@tonic-gate 	if (ct == NULL) {
34607c478bd9Sstevel@tonic-gate 		/*
34617c478bd9Sstevel@tonic-gate 		 * Invalid client device, fail the request
34627c478bd9Sstevel@tonic-gate 		 */
34637c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
34644c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, ph->ph_dip,
34654c06356bSdh142964 		    "!invalid client: pip %s %p",
34664c06356bSdh142964 		    mdi_pi_spathname(pip), (void *)pip));
34677c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
34687c478bd9Sstevel@tonic-gate 	}
34697c478bd9Sstevel@tonic-gate 
34707c478bd9Sstevel@tonic-gate 	/*
34717c478bd9Sstevel@tonic-gate 	 * If this path has not been initialized yet, Callback vHCI driver's
34727c478bd9Sstevel@tonic-gate 	 * pathinfo node initialize entry point
34737c478bd9Sstevel@tonic-gate 	 */
34747c478bd9Sstevel@tonic-gate 
34757c478bd9Sstevel@tonic-gate 	if (MDI_PI_IS_INITING(pip)) {
34767c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
34777c478bd9Sstevel@tonic-gate 		f = vh->vh_ops->vo_pi_init;
34787c478bd9Sstevel@tonic-gate 		if (f != NULL) {
34797c478bd9Sstevel@tonic-gate 			rv = (*f)(vh->vh_dip, pip, 0);
34807c478bd9Sstevel@tonic-gate 			if (rv != MDI_SUCCESS) {
34814c06356bSdh142964 				MDI_DEBUG(1, (MDI_WARN, ct->ct_dip,
34824c06356bSdh142964 				    "!vo_pi_init failed: vHCI %p, pip %s %p",
34834c06356bSdh142964 				    (void *)vh, mdi_pi_spathname(pip),
34844c06356bSdh142964 				    (void *)pip));
34857c478bd9Sstevel@tonic-gate 				return (MDI_FAILURE);
34867c478bd9Sstevel@tonic-gate 			}
34877c478bd9Sstevel@tonic-gate 		}
34887c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
34897c478bd9Sstevel@tonic-gate 		MDI_PI_CLEAR_TRANSIENT(pip);
34907c478bd9Sstevel@tonic-gate 	}
34917c478bd9Sstevel@tonic-gate 
34927c478bd9Sstevel@tonic-gate 	/*
34937c478bd9Sstevel@tonic-gate 	 * Do not allow state transition when pHCI is in offline/suspended
34947c478bd9Sstevel@tonic-gate 	 * states
34957c478bd9Sstevel@tonic-gate 	 */
34967c478bd9Sstevel@tonic-gate 	i_mdi_phci_lock(ph, pip);
34977c478bd9Sstevel@tonic-gate 	if (MDI_PHCI_IS_READY(ph) == 0) {
34984c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, ct->ct_dip,
34994c06356bSdh142964 		    "!pHCI not ready, pHCI=%p", (void *)ph));
35007c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
35017c478bd9Sstevel@tonic-gate 		i_mdi_phci_unlock(ph);
35027c478bd9Sstevel@tonic-gate 		return (MDI_BUSY);
35037c478bd9Sstevel@tonic-gate 	}
35047c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNSTABLE(ph);
35057c478bd9Sstevel@tonic-gate 	i_mdi_phci_unlock(ph);
35067c478bd9Sstevel@tonic-gate 
35077c478bd9Sstevel@tonic-gate 	/*
35087c478bd9Sstevel@tonic-gate 	 * Check if mdi_pathinfo state is in transient state.
35097c478bd9Sstevel@tonic-gate 	 * If yes, offlining is in progress and wait till transient state is
35107c478bd9Sstevel@tonic-gate 	 * cleared.
35117c478bd9Sstevel@tonic-gate 	 */
35127c478bd9Sstevel@tonic-gate 	if (MDI_PI_IS_TRANSIENT(pip)) {
35137c478bd9Sstevel@tonic-gate 		while (MDI_PI_IS_TRANSIENT(pip)) {
35147c478bd9Sstevel@tonic-gate 			cv_wait(&MDI_PI(pip)->pi_state_cv,
35157c478bd9Sstevel@tonic-gate 			    &MDI_PI(pip)->pi_mutex);
35167c478bd9Sstevel@tonic-gate 		}
35177c478bd9Sstevel@tonic-gate 	}
35187c478bd9Sstevel@tonic-gate 
35197c478bd9Sstevel@tonic-gate 	/*
35207c478bd9Sstevel@tonic-gate 	 * Grab the client lock in reverse order sequence and release the
35217c478bd9Sstevel@tonic-gate 	 * mdi_pathinfo mutex.
35227c478bd9Sstevel@tonic-gate 	 */
35237c478bd9Sstevel@tonic-gate 	i_mdi_client_lock(ct, pip);
35247c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
35257c478bd9Sstevel@tonic-gate 
35267c478bd9Sstevel@tonic-gate 	/*
35277c478bd9Sstevel@tonic-gate 	 * Wait till failover state is cleared
35287c478bd9Sstevel@tonic-gate 	 */
35297c478bd9Sstevel@tonic-gate 	while (MDI_CLIENT_IS_FAILOVER_IN_PROGRESS(ct))
35307c478bd9Sstevel@tonic-gate 		cv_wait(&ct->ct_failover_cv, &ct->ct_mutex);
35317c478bd9Sstevel@tonic-gate 
35327c478bd9Sstevel@tonic-gate 	/*
35337c478bd9Sstevel@tonic-gate 	 * Mark the mdi_pathinfo node state as transient
35347c478bd9Sstevel@tonic-gate 	 */
35357c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
35367c478bd9Sstevel@tonic-gate 	switch (state) {
35377c478bd9Sstevel@tonic-gate 	case MDI_PATHINFO_STATE_ONLINE:
35387c478bd9Sstevel@tonic-gate 		MDI_PI_SET_ONLINING(pip);
35397c478bd9Sstevel@tonic-gate 		break;
35407c478bd9Sstevel@tonic-gate 
35417c478bd9Sstevel@tonic-gate 	case MDI_PATHINFO_STATE_STANDBY:
35427c478bd9Sstevel@tonic-gate 		MDI_PI_SET_STANDBYING(pip);
35437c478bd9Sstevel@tonic-gate 		break;
35447c478bd9Sstevel@tonic-gate 
35457c478bd9Sstevel@tonic-gate 	case MDI_PATHINFO_STATE_FAULT:
35467c478bd9Sstevel@tonic-gate 		/*
35477c478bd9Sstevel@tonic-gate 		 * Mark the pathinfo state as FAULTED
35487c478bd9Sstevel@tonic-gate 		 */
35497c478bd9Sstevel@tonic-gate 		MDI_PI_SET_FAULTING(pip);
35507c478bd9Sstevel@tonic-gate 		MDI_PI_ERRSTAT(pip, MDI_PI_HARDERR);
35517c478bd9Sstevel@tonic-gate 		break;
35527c478bd9Sstevel@tonic-gate 
35537c478bd9Sstevel@tonic-gate 	case MDI_PATHINFO_STATE_OFFLINE:
35547c478bd9Sstevel@tonic-gate 		/*
35557c478bd9Sstevel@tonic-gate 		 * ndi_devi_offline() cannot hold pip or ct locks.
35567c478bd9Sstevel@tonic-gate 		 */
35577c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
35584c06356bSdh142964 
35597c478bd9Sstevel@tonic-gate 		/*
35604c06356bSdh142964 		 * If this is a user initiated path online->offline operation
35614c06356bSdh142964 		 * who's success would transition a client from DEGRADED to
35624c06356bSdh142964 		 * FAILED then only proceed if we can offline the client first.
35637c478bd9Sstevel@tonic-gate 		 */
35647c478bd9Sstevel@tonic-gate 		cdip = ct->ct_dip;
35654c06356bSdh142964 		if ((flag & NDI_USER_REQ) &&
35664c06356bSdh142964 		    MDI_PI_IS_ONLINE(pip) &&
35674c06356bSdh142964 		    (MDI_CLIENT_STATE(ct) == MDI_CLIENT_STATE_DEGRADED)) {
35687c478bd9Sstevel@tonic-gate 			i_mdi_client_unlock(ct);
35694c06356bSdh142964 			rv = ndi_devi_offline(cdip, NDI_DEVFS_CLEAN);
35707c478bd9Sstevel@tonic-gate 			if (rv != NDI_SUCCESS) {
35717c478bd9Sstevel@tonic-gate 				/*
35727c478bd9Sstevel@tonic-gate 				 * Convert to MDI error code
35737c478bd9Sstevel@tonic-gate 				 */
35747c478bd9Sstevel@tonic-gate 				switch (rv) {
35757c478bd9Sstevel@tonic-gate 				case NDI_BUSY:
35767c478bd9Sstevel@tonic-gate 					rv = MDI_BUSY;
35777c478bd9Sstevel@tonic-gate 					break;
35787c478bd9Sstevel@tonic-gate 				default:
35797c478bd9Sstevel@tonic-gate 					rv = MDI_FAILURE;
35807c478bd9Sstevel@tonic-gate 					break;
35817c478bd9Sstevel@tonic-gate 				}
35827c478bd9Sstevel@tonic-gate 				goto state_change_exit;
35837c478bd9Sstevel@tonic-gate 			} else {
35847c478bd9Sstevel@tonic-gate 				i_mdi_client_lock(ct, NULL);
35857c478bd9Sstevel@tonic-gate 			}
35867c478bd9Sstevel@tonic-gate 		}
35877c478bd9Sstevel@tonic-gate 		/*
35887c478bd9Sstevel@tonic-gate 		 * Mark the mdi_pathinfo node state as transient
35897c478bd9Sstevel@tonic-gate 		 */
35907c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
35917c478bd9Sstevel@tonic-gate 		MDI_PI_SET_OFFLINING(pip);
35927c478bd9Sstevel@tonic-gate 		break;
35937c478bd9Sstevel@tonic-gate 	}
35947c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
35957c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNSTABLE(ct);
35967c478bd9Sstevel@tonic-gate 	i_mdi_client_unlock(ct);
35977c478bd9Sstevel@tonic-gate 
35987c478bd9Sstevel@tonic-gate 	f = vh->vh_ops->vo_pi_state_change;
35995e3986cbScth 	if (f != NULL)
36007c478bd9Sstevel@tonic-gate 		rv = (*f)(vh->vh_dip, pip, state, 0, flag);
36015e3986cbScth 
36025e3986cbScth 	MDI_CLIENT_LOCK(ct);
36035e3986cbScth 	MDI_PI_LOCK(pip);
36047c478bd9Sstevel@tonic-gate 	if (rv == MDI_NOT_SUPPORTED) {
36057c478bd9Sstevel@tonic-gate 		MDI_CLIENT_SET_DEV_NOT_SUPPORTED(ct);
36067c478bd9Sstevel@tonic-gate 	}
36077c478bd9Sstevel@tonic-gate 	if (rv != MDI_SUCCESS) {
36084c06356bSdh142964 		MDI_DEBUG(2, (MDI_WARN, ct->ct_dip,
36094c06356bSdh142964 		    "vo_pi_state_change failed: rv %x", rv));
36107c478bd9Sstevel@tonic-gate 	}
36117c478bd9Sstevel@tonic-gate 	if (MDI_PI_IS_TRANSIENT(pip)) {
36127c478bd9Sstevel@tonic-gate 		if (rv == MDI_SUCCESS) {
36137c478bd9Sstevel@tonic-gate 			MDI_PI_CLEAR_TRANSIENT(pip);
36147c478bd9Sstevel@tonic-gate 		} else {
36157c478bd9Sstevel@tonic-gate 			MDI_PI(pip)->pi_state = MDI_PI_OLD_STATE(pip);
36167c478bd9Sstevel@tonic-gate 		}
36177c478bd9Sstevel@tonic-gate 	}
36187c478bd9Sstevel@tonic-gate 
36197c478bd9Sstevel@tonic-gate 	/*
36207c478bd9Sstevel@tonic-gate 	 * Wake anyone waiting for this mdi_pathinfo node
36217c478bd9Sstevel@tonic-gate 	 */
36227c478bd9Sstevel@tonic-gate 	cv_broadcast(&MDI_PI(pip)->pi_state_cv);
36237c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
36247c478bd9Sstevel@tonic-gate 
36257c478bd9Sstevel@tonic-gate 	/*
36267c478bd9Sstevel@tonic-gate 	 * Mark the client device as stable
36277c478bd9Sstevel@tonic-gate 	 */
36287c478bd9Sstevel@tonic-gate 	MDI_CLIENT_STABLE(ct);
36297c478bd9Sstevel@tonic-gate 	if (rv == MDI_SUCCESS) {
36307c478bd9Sstevel@tonic-gate 		if (ct->ct_unstable == 0) {
36317c478bd9Sstevel@tonic-gate 			cdip = ct->ct_dip;
36327c478bd9Sstevel@tonic-gate 
36337c478bd9Sstevel@tonic-gate 			/*
36347c478bd9Sstevel@tonic-gate 			 * Onlining the mdi_pathinfo node will impact the
36357c478bd9Sstevel@tonic-gate 			 * client state Update the client and dev_info node
36367c478bd9Sstevel@tonic-gate 			 * state accordingly
36377c478bd9Sstevel@tonic-gate 			 */
36387c478bd9Sstevel@tonic-gate 			rv = NDI_SUCCESS;
36397c478bd9Sstevel@tonic-gate 			i_mdi_client_update_state(ct);
36407c478bd9Sstevel@tonic-gate 			switch (MDI_CLIENT_STATE(ct)) {
36417c478bd9Sstevel@tonic-gate 			case MDI_CLIENT_STATE_OPTIMAL:
36427c478bd9Sstevel@tonic-gate 			case MDI_CLIENT_STATE_DEGRADED:
3643737d277aScth 				if (cdip && !i_ddi_devi_attached(cdip) &&
36447c478bd9Sstevel@tonic-gate 				    ((state == MDI_PATHINFO_STATE_ONLINE) ||
36457c478bd9Sstevel@tonic-gate 				    (state == MDI_PATHINFO_STATE_STANDBY))) {
36467c478bd9Sstevel@tonic-gate 
36477c478bd9Sstevel@tonic-gate 					/*
36487c478bd9Sstevel@tonic-gate 					 * Must do ndi_devi_online() through
36497c478bd9Sstevel@tonic-gate 					 * hotplug thread for deferred
36507c478bd9Sstevel@tonic-gate 					 * attach mechanism to work
36517c478bd9Sstevel@tonic-gate 					 */
36525e3986cbScth 					MDI_CLIENT_UNLOCK(ct);
36537c478bd9Sstevel@tonic-gate 					rv = ndi_devi_online(cdip, 0);
36545e3986cbScth 					MDI_CLIENT_LOCK(ct);
36557c478bd9Sstevel@tonic-gate 					if ((rv != NDI_SUCCESS) &&
36567c478bd9Sstevel@tonic-gate 					    (MDI_CLIENT_STATE(ct) ==
36577c478bd9Sstevel@tonic-gate 					    MDI_CLIENT_STATE_DEGRADED)) {
36587c478bd9Sstevel@tonic-gate 						/*
36597c478bd9Sstevel@tonic-gate 						 * ndi_devi_online failed.
36607c478bd9Sstevel@tonic-gate 						 * Reset client flags to
36617c478bd9Sstevel@tonic-gate 						 * offline.
36627c478bd9Sstevel@tonic-gate 						 */
36634c06356bSdh142964 						MDI_DEBUG(1, (MDI_WARN, cdip,
36644c06356bSdh142964 						    "!ndi_devi_online failed "
36654c06356bSdh142964 						    "error %x", rv));
36667c478bd9Sstevel@tonic-gate 						MDI_CLIENT_SET_OFFLINE(ct);
36677c478bd9Sstevel@tonic-gate 					}
36687c478bd9Sstevel@tonic-gate 					if (rv != NDI_SUCCESS) {
36697c478bd9Sstevel@tonic-gate 						/* Reset the path state */
36707c478bd9Sstevel@tonic-gate 						MDI_PI_LOCK(pip);
36717c478bd9Sstevel@tonic-gate 						MDI_PI(pip)->pi_state =
36727c478bd9Sstevel@tonic-gate 						    MDI_PI_OLD_STATE(pip);
36737c478bd9Sstevel@tonic-gate 						MDI_PI_UNLOCK(pip);
36747c478bd9Sstevel@tonic-gate 					}
36757c478bd9Sstevel@tonic-gate 				}
36767c478bd9Sstevel@tonic-gate 				break;
36777c478bd9Sstevel@tonic-gate 
36787c478bd9Sstevel@tonic-gate 			case MDI_CLIENT_STATE_FAILED:
36797c478bd9Sstevel@tonic-gate 				/*
36807c478bd9Sstevel@tonic-gate 				 * This is the last path case for
36817c478bd9Sstevel@tonic-gate 				 * non-user initiated events.
36827c478bd9Sstevel@tonic-gate 				 */
36834c06356bSdh142964 				if (((flag & NDI_USER_REQ) == 0) &&
36847c478bd9Sstevel@tonic-gate 				    cdip && (i_ddi_node_state(cdip) >=
36857c478bd9Sstevel@tonic-gate 				    DS_INITIALIZED)) {
36865e3986cbScth 					MDI_CLIENT_UNLOCK(ct);
36874c06356bSdh142964 					rv = ndi_devi_offline(cdip,
36884c06356bSdh142964 					    NDI_DEVFS_CLEAN);
36895e3986cbScth 					MDI_CLIENT_LOCK(ct);
36907c478bd9Sstevel@tonic-gate 
36917c478bd9Sstevel@tonic-gate 					if (rv != NDI_SUCCESS) {
36927c478bd9Sstevel@tonic-gate 						/*
36937c478bd9Sstevel@tonic-gate 						 * ndi_devi_offline failed.
36947c478bd9Sstevel@tonic-gate 						 * Reset client flags to
36957c478bd9Sstevel@tonic-gate 						 * online as the path could not
36967c478bd9Sstevel@tonic-gate 						 * be offlined.
36977c478bd9Sstevel@tonic-gate 						 */
36984c06356bSdh142964 						MDI_DEBUG(1, (MDI_WARN, cdip,
36994c06356bSdh142964 						    "!ndi_devi_offline failed: "
37004c06356bSdh142964 						    "error %x", rv));
37017c478bd9Sstevel@tonic-gate 						MDI_CLIENT_SET_ONLINE(ct);
37027c478bd9Sstevel@tonic-gate 					}
37037c478bd9Sstevel@tonic-gate 				}
37047c478bd9Sstevel@tonic-gate 				break;
37057c478bd9Sstevel@tonic-gate 			}
37067c478bd9Sstevel@tonic-gate 			/*
37077c478bd9Sstevel@tonic-gate 			 * Convert to MDI error code
37087c478bd9Sstevel@tonic-gate 			 */
37097c478bd9Sstevel@tonic-gate 			switch (rv) {
37107c478bd9Sstevel@tonic-gate 			case NDI_SUCCESS:
37117c478bd9Sstevel@tonic-gate 				MDI_CLIENT_SET_REPORT_DEV_NEEDED(ct);
37127c478bd9Sstevel@tonic-gate 				i_mdi_report_path_state(ct, pip);
37137c478bd9Sstevel@tonic-gate 				rv = MDI_SUCCESS;
37147c478bd9Sstevel@tonic-gate 				break;
37157c478bd9Sstevel@tonic-gate 			case NDI_BUSY:
37167c478bd9Sstevel@tonic-gate 				rv = MDI_BUSY;
37177c478bd9Sstevel@tonic-gate 				break;
37187c478bd9Sstevel@tonic-gate 			default:
37197c478bd9Sstevel@tonic-gate 				rv = MDI_FAILURE;
37207c478bd9Sstevel@tonic-gate 				break;
37217c478bd9Sstevel@tonic-gate 			}
37227c478bd9Sstevel@tonic-gate 		}
37237c478bd9Sstevel@tonic-gate 	}
37247c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
37257c478bd9Sstevel@tonic-gate 
37267c478bd9Sstevel@tonic-gate state_change_exit:
37277c478bd9Sstevel@tonic-gate 	/*
37287c478bd9Sstevel@tonic-gate 	 * Mark the pHCI as stable again.
37297c478bd9Sstevel@tonic-gate 	 */
37307c478bd9Sstevel@tonic-gate 	MDI_PHCI_LOCK(ph);
37317c478bd9Sstevel@tonic-gate 	MDI_PHCI_STABLE(ph);
37327c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNLOCK(ph);
37337c478bd9Sstevel@tonic-gate 	return (rv);
37347c478bd9Sstevel@tonic-gate }
37357c478bd9Sstevel@tonic-gate 
37367c478bd9Sstevel@tonic-gate /*
37377c478bd9Sstevel@tonic-gate  * mdi_pi_online():
37387c478bd9Sstevel@tonic-gate  *		Place the path_info node in the online state.  The path is
37397c478bd9Sstevel@tonic-gate  *		now available to be selected by mdi_select_path() for
37407c478bd9Sstevel@tonic-gate  *		transporting I/O requests to client devices.
37417c478bd9Sstevel@tonic-gate  * Return Values:
37427c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
37437c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
37447c478bd9Sstevel@tonic-gate  */
37457c478bd9Sstevel@tonic-gate int
37467c478bd9Sstevel@tonic-gate mdi_pi_online(mdi_pathinfo_t *pip, int flags)
37477c478bd9Sstevel@tonic-gate {
37487c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct = MDI_PI(pip)->pi_client;
37497c478bd9Sstevel@tonic-gate 	int		client_held = 0;
37507c478bd9Sstevel@tonic-gate 	int		rv;
37517c478bd9Sstevel@tonic-gate 
37527c478bd9Sstevel@tonic-gate 	ASSERT(ct != NULL);
37537c478bd9Sstevel@tonic-gate 	rv = i_mdi_pi_state_change(pip, MDI_PATHINFO_STATE_ONLINE, flags);
37547c478bd9Sstevel@tonic-gate 	if (rv != MDI_SUCCESS)
37557c478bd9Sstevel@tonic-gate 		return (rv);
37567c478bd9Sstevel@tonic-gate 
37577c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
37587c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_pm_held == 0) {
37594c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, ct->ct_dip,
37604c06356bSdh142964 		    "i_mdi_pm_hold_pip %p", (void *)pip));
37617c478bd9Sstevel@tonic-gate 		i_mdi_pm_hold_pip(pip);
37627c478bd9Sstevel@tonic-gate 		client_held = 1;
37637c478bd9Sstevel@tonic-gate 	}
37647c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
37657c478bd9Sstevel@tonic-gate 
37667c478bd9Sstevel@tonic-gate 	if (client_held) {
37677c478bd9Sstevel@tonic-gate 		MDI_CLIENT_LOCK(ct);
37687c478bd9Sstevel@tonic-gate 		if (ct->ct_power_cnt == 0) {
37697c478bd9Sstevel@tonic-gate 			rv = i_mdi_power_all_phci(ct);
37707c478bd9Sstevel@tonic-gate 		}
37717c478bd9Sstevel@tonic-gate 
37724c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, ct->ct_dip,
37734c06356bSdh142964 		    "i_mdi_pm_hold_client %p", (void *)ct));
37747c478bd9Sstevel@tonic-gate 		i_mdi_pm_hold_client(ct, 1);
37757c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
37767c478bd9Sstevel@tonic-gate 	}
37777c478bd9Sstevel@tonic-gate 
37787c478bd9Sstevel@tonic-gate 	return (rv);
37797c478bd9Sstevel@tonic-gate }
37807c478bd9Sstevel@tonic-gate 
37817c478bd9Sstevel@tonic-gate /*
37827c478bd9Sstevel@tonic-gate  * mdi_pi_standby():
37837c478bd9Sstevel@tonic-gate  *		Place the mdi_pathinfo node in standby state
37847c478bd9Sstevel@tonic-gate  *
37857c478bd9Sstevel@tonic-gate  * Return Values:
37867c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
37877c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
37887c478bd9Sstevel@tonic-gate  */
37897c478bd9Sstevel@tonic-gate int
37907c478bd9Sstevel@tonic-gate mdi_pi_standby(mdi_pathinfo_t *pip, int flags)
37917c478bd9Sstevel@tonic-gate {
37927c478bd9Sstevel@tonic-gate 	return (i_mdi_pi_state_change(pip, MDI_PATHINFO_STATE_STANDBY, flags));
37937c478bd9Sstevel@tonic-gate }
37947c478bd9Sstevel@tonic-gate 
37957c478bd9Sstevel@tonic-gate /*
37967c478bd9Sstevel@tonic-gate  * mdi_pi_fault():
37977c478bd9Sstevel@tonic-gate  *		Place the mdi_pathinfo node in fault'ed state
37987c478bd9Sstevel@tonic-gate  * Return Values:
37997c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
38007c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
38017c478bd9Sstevel@tonic-gate  */
38027c478bd9Sstevel@tonic-gate int
38037c478bd9Sstevel@tonic-gate mdi_pi_fault(mdi_pathinfo_t *pip, int flags)
38047c478bd9Sstevel@tonic-gate {
38057c478bd9Sstevel@tonic-gate 	return (i_mdi_pi_state_change(pip, MDI_PATHINFO_STATE_FAULT, flags));
38067c478bd9Sstevel@tonic-gate }
38077c478bd9Sstevel@tonic-gate 
38087c478bd9Sstevel@tonic-gate /*
38097c478bd9Sstevel@tonic-gate  * mdi_pi_offline():
38107c478bd9Sstevel@tonic-gate  *		Offline a mdi_pathinfo node.
38117c478bd9Sstevel@tonic-gate  * Return Values:
38127c478bd9Sstevel@tonic-gate  *		MDI_SUCCESS
38137c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
38147c478bd9Sstevel@tonic-gate  */
38157c478bd9Sstevel@tonic-gate int
38167c478bd9Sstevel@tonic-gate mdi_pi_offline(mdi_pathinfo_t *pip, int flags)
38177c478bd9Sstevel@tonic-gate {
38187c478bd9Sstevel@tonic-gate 	int	ret, client_held = 0;
38197c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
38204c06356bSdh142964 
38214c06356bSdh142964 	/*
38224c06356bSdh142964 	 * Original code overloaded NDI_DEVI_REMOVE to this interface, and
38234c06356bSdh142964 	 * used it to mean "user initiated operation" (i.e. devctl). Callers
38244c06356bSdh142964 	 * should now just use NDI_USER_REQ.
38254c06356bSdh142964 	 */
38264c06356bSdh142964 	if (flags & NDI_DEVI_REMOVE) {
38274c06356bSdh142964 		flags &= ~NDI_DEVI_REMOVE;
38284c06356bSdh142964 		flags |= NDI_USER_REQ;
38294c06356bSdh142964 	}
38307c478bd9Sstevel@tonic-gate 
38317c478bd9Sstevel@tonic-gate 	ret = i_mdi_pi_state_change(pip, MDI_PATHINFO_STATE_OFFLINE, flags);
38327c478bd9Sstevel@tonic-gate 
38337c478bd9Sstevel@tonic-gate 	if (ret == MDI_SUCCESS) {
38347c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
38357c478bd9Sstevel@tonic-gate 		if (MDI_PI(pip)->pi_pm_held) {
38367c478bd9Sstevel@tonic-gate 			client_held = 1;
38377c478bd9Sstevel@tonic-gate 		}
38387c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
38397c478bd9Sstevel@tonic-gate 
38407c478bd9Sstevel@tonic-gate 		if (client_held) {
38417c478bd9Sstevel@tonic-gate 			ct = MDI_PI(pip)->pi_client;
38427c478bd9Sstevel@tonic-gate 			MDI_CLIENT_LOCK(ct);
38434c06356bSdh142964 			MDI_DEBUG(4, (MDI_NOTE, ct->ct_dip,
38444c06356bSdh142964 			    "i_mdi_pm_rele_client\n"));
38457c478bd9Sstevel@tonic-gate 			i_mdi_pm_rele_client(ct, 1);
38467c478bd9Sstevel@tonic-gate 			MDI_CLIENT_UNLOCK(ct);
38477c478bd9Sstevel@tonic-gate 		}
38487c478bd9Sstevel@tonic-gate 	}
38497c478bd9Sstevel@tonic-gate 
38507c478bd9Sstevel@tonic-gate 	return (ret);
38517c478bd9Sstevel@tonic-gate }
38527c478bd9Sstevel@tonic-gate 
38537c478bd9Sstevel@tonic-gate /*
38547c478bd9Sstevel@tonic-gate  * i_mdi_pi_offline():
38557c478bd9Sstevel@tonic-gate  *		Offline a mdi_pathinfo node and call the vHCI driver's callback
38567c478bd9Sstevel@tonic-gate  */
38577c478bd9Sstevel@tonic-gate static int
38587c478bd9Sstevel@tonic-gate i_mdi_pi_offline(mdi_pathinfo_t *pip, int flags)
38597c478bd9Sstevel@tonic-gate {
38607c478bd9Sstevel@tonic-gate 	dev_info_t	*vdip = NULL;
38617c478bd9Sstevel@tonic-gate 	mdi_vhci_t	*vh = NULL;
38627c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct = NULL;
38637c478bd9Sstevel@tonic-gate 	int		(*f)();
38647c478bd9Sstevel@tonic-gate 	int		rv;
38657c478bd9Sstevel@tonic-gate 
38667c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
38677c478bd9Sstevel@tonic-gate 	ct = MDI_PI(pip)->pi_client;
38687c478bd9Sstevel@tonic-gate 	ASSERT(ct != NULL);
38697c478bd9Sstevel@tonic-gate 
38707c478bd9Sstevel@tonic-gate 	while (MDI_PI(pip)->pi_ref_cnt != 0) {
38717c478bd9Sstevel@tonic-gate 		/*
38727c478bd9Sstevel@tonic-gate 		 * Give a chance for pending I/Os to complete.
38737c478bd9Sstevel@tonic-gate 		 */
38744c06356bSdh142964 		MDI_DEBUG(1, (MDI_NOTE, ct->ct_dip,
38754c06356bSdh142964 		    "!%d cmds still pending on path %s %p",
38764c06356bSdh142964 		    MDI_PI(pip)->pi_ref_cnt, mdi_pi_spathname(pip),
38774c06356bSdh142964 		    (void *)pip));
3878*d3d50737SRafael Vanoni 		if (cv_reltimedwait(&MDI_PI(pip)->pi_ref_cv,
3879*d3d50737SRafael Vanoni 		    &MDI_PI(pip)->pi_mutex, drv_usectohz(60 * 1000000),
3880*d3d50737SRafael Vanoni 		    TR_CLOCK_TICK) == -1) {
38817c478bd9Sstevel@tonic-gate 			/*
38827c478bd9Sstevel@tonic-gate 			 * The timeout time reached without ref_cnt being zero
38837c478bd9Sstevel@tonic-gate 			 * being signaled.
38847c478bd9Sstevel@tonic-gate 			 */
38854c06356bSdh142964 			MDI_DEBUG(1, (MDI_NOTE, ct->ct_dip,
38864c06356bSdh142964 			    "!Timeout reached on path %s %p without the cond",
38874c06356bSdh142964 			    mdi_pi_spathname(pip), (void *)pip));
38884c06356bSdh142964 			MDI_DEBUG(1, (MDI_NOTE, ct->ct_dip,
38894c06356bSdh142964 			    "!%d cmds still pending on path %s %p",
38904c06356bSdh142964 			    MDI_PI(pip)->pi_ref_cnt,
38914c06356bSdh142964 			    mdi_pi_spathname(pip), (void *)pip));
38927c478bd9Sstevel@tonic-gate 		}
38937c478bd9Sstevel@tonic-gate 	}
38947c478bd9Sstevel@tonic-gate 	vh = ct->ct_vhci;
38957c478bd9Sstevel@tonic-gate 	vdip = vh->vh_dip;
38967c478bd9Sstevel@tonic-gate 
38977c478bd9Sstevel@tonic-gate 	/*
38987c478bd9Sstevel@tonic-gate 	 * Notify vHCI that has registered this event
38997c478bd9Sstevel@tonic-gate 	 */
39007c478bd9Sstevel@tonic-gate 	ASSERT(vh->vh_ops);
39017c478bd9Sstevel@tonic-gate 	f = vh->vh_ops->vo_pi_state_change;
39027c478bd9Sstevel@tonic-gate 
39037c478bd9Sstevel@tonic-gate 	if (f != NULL) {
39047c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
39057c478bd9Sstevel@tonic-gate 		if ((rv = (*f)(vdip, pip, MDI_PATHINFO_STATE_OFFLINE, 0,
39067c478bd9Sstevel@tonic-gate 		    flags)) != MDI_SUCCESS) {
39074c06356bSdh142964 			MDI_DEBUG(1, (MDI_WARN, ct->ct_dip,
39084c06356bSdh142964 			    "!vo_path_offline failed: vdip %s%d %p: path %s %p",
39094c06356bSdh142964 			    ddi_driver_name(vdip), ddi_get_instance(vdip),
39104c06356bSdh142964 			    (void *)vdip, mdi_pi_spathname(pip), (void *)pip));
39117c478bd9Sstevel@tonic-gate 		}
39127c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
39137c478bd9Sstevel@tonic-gate 	}
39147c478bd9Sstevel@tonic-gate 
39157c478bd9Sstevel@tonic-gate 	/*
39167c478bd9Sstevel@tonic-gate 	 * Set the mdi_pathinfo node state and clear the transient condition
39177c478bd9Sstevel@tonic-gate 	 */
39187c478bd9Sstevel@tonic-gate 	MDI_PI_SET_OFFLINE(pip);
39197c478bd9Sstevel@tonic-gate 	cv_broadcast(&MDI_PI(pip)->pi_state_cv);
39207c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
39217c478bd9Sstevel@tonic-gate 
39227c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
39237c478bd9Sstevel@tonic-gate 	if (rv == MDI_SUCCESS) {
39247c478bd9Sstevel@tonic-gate 		if (ct->ct_unstable == 0) {
39257c478bd9Sstevel@tonic-gate 			dev_info_t	*cdip = ct->ct_dip;
39267c478bd9Sstevel@tonic-gate 
39277c478bd9Sstevel@tonic-gate 			/*
39287c478bd9Sstevel@tonic-gate 			 * Onlining the mdi_pathinfo node will impact the
39297c478bd9Sstevel@tonic-gate 			 * client state Update the client and dev_info node
39307c478bd9Sstevel@tonic-gate 			 * state accordingly
39317c478bd9Sstevel@tonic-gate 			 */
39327c478bd9Sstevel@tonic-gate 			i_mdi_client_update_state(ct);
39337c478bd9Sstevel@tonic-gate 			rv = NDI_SUCCESS;
39347c478bd9Sstevel@tonic-gate 			if (MDI_CLIENT_STATE(ct) == MDI_CLIENT_STATE_FAILED) {
39357c478bd9Sstevel@tonic-gate 				if (cdip &&
39367c478bd9Sstevel@tonic-gate 				    (i_ddi_node_state(cdip) >=
39377c478bd9Sstevel@tonic-gate 				    DS_INITIALIZED)) {
39387c478bd9Sstevel@tonic-gate 					MDI_CLIENT_UNLOCK(ct);
39394c06356bSdh142964 					rv = ndi_devi_offline(cdip,
39404c06356bSdh142964 					    NDI_DEVFS_CLEAN);
39417c478bd9Sstevel@tonic-gate 					MDI_CLIENT_LOCK(ct);
39427c478bd9Sstevel@tonic-gate 					if (rv != NDI_SUCCESS) {
39437c478bd9Sstevel@tonic-gate 						/*
39447c478bd9Sstevel@tonic-gate 						 * ndi_devi_offline failed.
39457c478bd9Sstevel@tonic-gate 						 * Reset client flags to
39467c478bd9Sstevel@tonic-gate 						 * online.
39477c478bd9Sstevel@tonic-gate 						 */
39484c06356bSdh142964 						MDI_DEBUG(4, (MDI_WARN, cdip,
39494c06356bSdh142964 						    "ndi_devi_offline failed: "
39504c06356bSdh142964 						    "error %x", rv));
39517c478bd9Sstevel@tonic-gate 						MDI_CLIENT_SET_ONLINE(ct);
39527c478bd9Sstevel@tonic-gate 					}
39537c478bd9Sstevel@tonic-gate 				}
39547c478bd9Sstevel@tonic-gate 			}
39557c478bd9Sstevel@tonic-gate 			/*
39567c478bd9Sstevel@tonic-gate 			 * Convert to MDI error code
39577c478bd9Sstevel@tonic-gate 			 */
39587c478bd9Sstevel@tonic-gate 			switch (rv) {
39597c478bd9Sstevel@tonic-gate 			case NDI_SUCCESS:
39607c478bd9Sstevel@tonic-gate 				rv = MDI_SUCCESS;
39617c478bd9Sstevel@tonic-gate 				break;
39627c478bd9Sstevel@tonic-gate 			case NDI_BUSY:
39637c478bd9Sstevel@tonic-gate 				rv = MDI_BUSY;
39647c478bd9Sstevel@tonic-gate 				break;
39657c478bd9Sstevel@tonic-gate 			default:
39667c478bd9Sstevel@tonic-gate 				rv = MDI_FAILURE;
39677c478bd9Sstevel@tonic-gate 				break;
39687c478bd9Sstevel@tonic-gate 			}
39697c478bd9Sstevel@tonic-gate 		}
39707c478bd9Sstevel@tonic-gate 		MDI_CLIENT_SET_REPORT_DEV_NEEDED(ct);
39717c478bd9Sstevel@tonic-gate 		i_mdi_report_path_state(ct, pip);
39727c478bd9Sstevel@tonic-gate 	}
39737c478bd9Sstevel@tonic-gate 
39747c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
39757c478bd9Sstevel@tonic-gate 
39767c478bd9Sstevel@tonic-gate 	/*
39777c478bd9Sstevel@tonic-gate 	 * Change in the mdi_pathinfo node state will impact the client state
39787c478bd9Sstevel@tonic-gate 	 */
39794c06356bSdh142964 	MDI_DEBUG(2, (MDI_NOTE, ct->ct_dip,
39804c06356bSdh142964 	    "ct = %p pip = %p", (void *)ct, (void *)pip));
39817c478bd9Sstevel@tonic-gate 	return (rv);
39827c478bd9Sstevel@tonic-gate }
39837c478bd9Sstevel@tonic-gate 
398455e592a2SRandall Ralphs /*
398555e592a2SRandall Ralphs  * mdi_pi_get_node_name():
398655e592a2SRandall Ralphs  *              Get the name associated with a mdi_pathinfo node.
398755e592a2SRandall Ralphs  *              Since pathinfo nodes are not directly named, we
398855e592a2SRandall Ralphs  *              return the node_name of the client.
398955e592a2SRandall Ralphs  *
399055e592a2SRandall Ralphs  * Return Values:
399155e592a2SRandall Ralphs  *              char *
399255e592a2SRandall Ralphs  */
399355e592a2SRandall Ralphs char *
399455e592a2SRandall Ralphs mdi_pi_get_node_name(mdi_pathinfo_t *pip)
399555e592a2SRandall Ralphs {
399655e592a2SRandall Ralphs 	mdi_client_t    *ct;
399755e592a2SRandall Ralphs 
399855e592a2SRandall Ralphs 	if (pip == NULL)
399955e592a2SRandall Ralphs 		return (NULL);
400055e592a2SRandall Ralphs 	ct = MDI_PI(pip)->pi_client;
400155e592a2SRandall Ralphs 	if ((ct == NULL) || (ct->ct_dip == NULL))
400255e592a2SRandall Ralphs 		return (NULL);
400355e592a2SRandall Ralphs 	return (ddi_node_name(ct->ct_dip));
400455e592a2SRandall Ralphs }
40057c478bd9Sstevel@tonic-gate 
40067c478bd9Sstevel@tonic-gate /*
40077c478bd9Sstevel@tonic-gate  * mdi_pi_get_addr():
40087c478bd9Sstevel@tonic-gate  *		Get the unit address associated with a mdi_pathinfo node
40097c478bd9Sstevel@tonic-gate  *
40107c478bd9Sstevel@tonic-gate  * Return Values:
40117c478bd9Sstevel@tonic-gate  *		char *
40127c478bd9Sstevel@tonic-gate  */
40137c478bd9Sstevel@tonic-gate char *
40147c478bd9Sstevel@tonic-gate mdi_pi_get_addr(mdi_pathinfo_t *pip)
40157c478bd9Sstevel@tonic-gate {
40167c478bd9Sstevel@tonic-gate 	if (pip == NULL)
40177c478bd9Sstevel@tonic-gate 		return (NULL);
40187c478bd9Sstevel@tonic-gate 
401972a50065Scth 	return (MDI_PI(pip)->pi_addr);
40207c478bd9Sstevel@tonic-gate }
40217c478bd9Sstevel@tonic-gate 
40227c478bd9Sstevel@tonic-gate /*
4023602ca9eaScth  * mdi_pi_get_path_instance():
4024602ca9eaScth  *		Get the 'path_instance' of a mdi_pathinfo node
4025602ca9eaScth  *
4026602ca9eaScth  * Return Values:
4027602ca9eaScth  *		path_instance
4028602ca9eaScth  */
4029602ca9eaScth int
4030602ca9eaScth mdi_pi_get_path_instance(mdi_pathinfo_t *pip)
4031602ca9eaScth {
4032602ca9eaScth 	if (pip == NULL)
4033602ca9eaScth 		return (0);
4034602ca9eaScth 
4035602ca9eaScth 	return (MDI_PI(pip)->pi_path_instance);
4036602ca9eaScth }
4037602ca9eaScth 
4038602ca9eaScth /*
4039602ca9eaScth  * mdi_pi_pathname():
4040602ca9eaScth  *		Return pointer to path to pathinfo node.
4041602ca9eaScth  */
4042602ca9eaScth char *
4043602ca9eaScth mdi_pi_pathname(mdi_pathinfo_t *pip)
4044602ca9eaScth {
4045602ca9eaScth 	if (pip == NULL)
4046602ca9eaScth 		return (NULL);
4047602ca9eaScth 	return (mdi_pi_pathname_by_instance(mdi_pi_get_path_instance(pip)));
4048602ca9eaScth }
4049602ca9eaScth 
40504c06356bSdh142964 /*
40514c06356bSdh142964  * mdi_pi_spathname():
40524c06356bSdh142964  *		Return pointer to shortpath to pathinfo node. Used for debug
40534c06356bSdh142964  *		messages, so return "" instead of NULL when unknown.
40544c06356bSdh142964  */
40554c06356bSdh142964 char *
40564c06356bSdh142964 mdi_pi_spathname(mdi_pathinfo_t *pip)
40574c06356bSdh142964 {
40584c06356bSdh142964 	char	*spath = "";
40594c06356bSdh142964 
40604c06356bSdh142964 	if (pip) {
40614c06356bSdh142964 		spath = mdi_pi_spathname_by_instance(
40624c06356bSdh142964 		    mdi_pi_get_path_instance(pip));
40634c06356bSdh142964 		if (spath == NULL)
40644c06356bSdh142964 			spath = "";
40654c06356bSdh142964 	}
40664c06356bSdh142964 	return (spath);
40674c06356bSdh142964 }
40684c06356bSdh142964 
406938c67cbdSjiang wu - Sun Microsystems - Beijing China char *
407038c67cbdSjiang wu - Sun Microsystems - Beijing China mdi_pi_pathname_obp(mdi_pathinfo_t *pip, char *path)
407138c67cbdSjiang wu - Sun Microsystems - Beijing China {
407238c67cbdSjiang wu - Sun Microsystems - Beijing China 	char *obp_path = NULL;
407338c67cbdSjiang wu - Sun Microsystems - Beijing China 	if ((pip == NULL) || (path == NULL))
407438c67cbdSjiang wu - Sun Microsystems - Beijing China 		return (NULL);
407538c67cbdSjiang wu - Sun Microsystems - Beijing China 
407638c67cbdSjiang wu - Sun Microsystems - Beijing China 	if (mdi_prop_lookup_string(pip, "obp-path", &obp_path) == MDI_SUCCESS) {
407738c67cbdSjiang wu - Sun Microsystems - Beijing China 		(void) strcpy(path, obp_path);
407838c67cbdSjiang wu - Sun Microsystems - Beijing China 		(void) mdi_prop_free(obp_path);
407938c67cbdSjiang wu - Sun Microsystems - Beijing China 	} else {
408038c67cbdSjiang wu - Sun Microsystems - Beijing China 		path = NULL;
408138c67cbdSjiang wu - Sun Microsystems - Beijing China 	}
408238c67cbdSjiang wu - Sun Microsystems - Beijing China 	return (path);
408338c67cbdSjiang wu - Sun Microsystems - Beijing China }
408438c67cbdSjiang wu - Sun Microsystems - Beijing China 
408538c67cbdSjiang wu - Sun Microsystems - Beijing China int
408638c67cbdSjiang wu - Sun Microsystems - Beijing China mdi_pi_pathname_obp_set(mdi_pathinfo_t *pip, char *component)
408738c67cbdSjiang wu - Sun Microsystems - Beijing China {
408838c67cbdSjiang wu - Sun Microsystems - Beijing China 	dev_info_t *pdip;
4089caa9369fSjiang wu - Sun Microsystems - Beijing China 	char *obp_path = NULL;
4090caa9369fSjiang wu - Sun Microsystems - Beijing China 	int rc = MDI_FAILURE;
409138c67cbdSjiang wu - Sun Microsystems - Beijing China 
409238c67cbdSjiang wu - Sun Microsystems - Beijing China 	if (pip == NULL)
409338c67cbdSjiang wu - Sun Microsystems - Beijing China 		return (MDI_FAILURE);
409438c67cbdSjiang wu - Sun Microsystems - Beijing China 
409538c67cbdSjiang wu - Sun Microsystems - Beijing China 	pdip = mdi_pi_get_phci(pip);
409638c67cbdSjiang wu - Sun Microsystems - Beijing China 	if (pdip == NULL)
409738c67cbdSjiang wu - Sun Microsystems - Beijing China 		return (MDI_FAILURE);
409838c67cbdSjiang wu - Sun Microsystems - Beijing China 
4099caa9369fSjiang wu - Sun Microsystems - Beijing China 	obp_path = kmem_zalloc(MAXPATHLEN, KM_SLEEP);
4100caa9369fSjiang wu - Sun Microsystems - Beijing China 
410138c67cbdSjiang wu - Sun Microsystems - Beijing China 	if (ddi_pathname_obp(pdip, obp_path) == NULL) {
410238c67cbdSjiang wu - Sun Microsystems - Beijing China 		(void) ddi_pathname(pdip, obp_path);
410338c67cbdSjiang wu - Sun Microsystems - Beijing China 	}
410438c67cbdSjiang wu - Sun Microsystems - Beijing China 
410538c67cbdSjiang wu - Sun Microsystems - Beijing China 	if (component) {
4106caa9369fSjiang wu - Sun Microsystems - Beijing China 		(void) strncat(obp_path, "/", MAXPATHLEN);
4107caa9369fSjiang wu - Sun Microsystems - Beijing China 		(void) strncat(obp_path, component, MAXPATHLEN);
410838c67cbdSjiang wu - Sun Microsystems - Beijing China 	}
4109caa9369fSjiang wu - Sun Microsystems - Beijing China 	rc = mdi_prop_update_string(pip, "obp-path", obp_path);
411038c67cbdSjiang wu - Sun Microsystems - Beijing China 
4111caa9369fSjiang wu - Sun Microsystems - Beijing China 	if (obp_path)
4112caa9369fSjiang wu - Sun Microsystems - Beijing China 		kmem_free(obp_path, MAXPATHLEN);
4113caa9369fSjiang wu - Sun Microsystems - Beijing China 	return (rc);
411438c67cbdSjiang wu - Sun Microsystems - Beijing China }
411538c67cbdSjiang wu - Sun Microsystems - Beijing China 
4116602ca9eaScth /*
41177c478bd9Sstevel@tonic-gate  * mdi_pi_get_client():
41187c478bd9Sstevel@tonic-gate  *		Get the client devinfo associated with a mdi_pathinfo node
41197c478bd9Sstevel@tonic-gate  *
41207c478bd9Sstevel@tonic-gate  * Return Values:
41217c478bd9Sstevel@tonic-gate  *		Handle to client device dev_info node
41227c478bd9Sstevel@tonic-gate  */
41237c478bd9Sstevel@tonic-gate dev_info_t *
41247c478bd9Sstevel@tonic-gate mdi_pi_get_client(mdi_pathinfo_t *pip)
41257c478bd9Sstevel@tonic-gate {
41267c478bd9Sstevel@tonic-gate 	dev_info_t	*dip = NULL;
41277c478bd9Sstevel@tonic-gate 	if (pip) {
41287c478bd9Sstevel@tonic-gate 		dip = MDI_PI(pip)->pi_client->ct_dip;
41297c478bd9Sstevel@tonic-gate 	}
41307c478bd9Sstevel@tonic-gate 	return (dip);
41317c478bd9Sstevel@tonic-gate }
41327c478bd9Sstevel@tonic-gate 
41337c478bd9Sstevel@tonic-gate /*
41347c478bd9Sstevel@tonic-gate  * mdi_pi_get_phci():
41357c478bd9Sstevel@tonic-gate  *		Get the pHCI devinfo associated with the mdi_pathinfo node
41367c478bd9Sstevel@tonic-gate  * Return Values:
41377c478bd9Sstevel@tonic-gate  *		Handle to dev_info node
41387c478bd9Sstevel@tonic-gate  */
41397c478bd9Sstevel@tonic-gate dev_info_t *
41407c478bd9Sstevel@tonic-gate mdi_pi_get_phci(mdi_pathinfo_t *pip)
41417c478bd9Sstevel@tonic-gate {
41427c478bd9Sstevel@tonic-gate 	dev_info_t	*dip = NULL;
41434c06356bSdh142964 	mdi_phci_t	*ph;
41444c06356bSdh142964 
41457c478bd9Sstevel@tonic-gate 	if (pip) {
41464c06356bSdh142964 		ph = MDI_PI(pip)->pi_phci;
41474c06356bSdh142964 		if (ph)
41484c06356bSdh142964 			dip = ph->ph_dip;
41497c478bd9Sstevel@tonic-gate 	}
41507c478bd9Sstevel@tonic-gate 	return (dip);
41517c478bd9Sstevel@tonic-gate }
41527c478bd9Sstevel@tonic-gate 
41537c478bd9Sstevel@tonic-gate /*
41547c478bd9Sstevel@tonic-gate  * mdi_pi_get_client_private():
41557c478bd9Sstevel@tonic-gate  *		Get the client private information associated with the
41567c478bd9Sstevel@tonic-gate  *		mdi_pathinfo node
41577c478bd9Sstevel@tonic-gate  */
41587c478bd9Sstevel@tonic-gate void *
41597c478bd9Sstevel@tonic-gate mdi_pi_get_client_private(mdi_pathinfo_t *pip)
41607c478bd9Sstevel@tonic-gate {
41617c478bd9Sstevel@tonic-gate 	void *cprivate = NULL;
41627c478bd9Sstevel@tonic-gate 	if (pip) {
41637c478bd9Sstevel@tonic-gate 		cprivate = MDI_PI(pip)->pi_cprivate;
41647c478bd9Sstevel@tonic-gate 	}
41657c478bd9Sstevel@tonic-gate 	return (cprivate);
41667c478bd9Sstevel@tonic-gate }
41677c478bd9Sstevel@tonic-gate 
41687c478bd9Sstevel@tonic-gate /*
41697c478bd9Sstevel@tonic-gate  * mdi_pi_set_client_private():
41707c478bd9Sstevel@tonic-gate  *		Set the client private information in the mdi_pathinfo node
41717c478bd9Sstevel@tonic-gate  */
41727c478bd9Sstevel@tonic-gate void
41737c478bd9Sstevel@tonic-gate mdi_pi_set_client_private(mdi_pathinfo_t *pip, void *priv)
41747c478bd9Sstevel@tonic-gate {
41757c478bd9Sstevel@tonic-gate 	if (pip) {
41767c478bd9Sstevel@tonic-gate 		MDI_PI(pip)->pi_cprivate = priv;
41777c478bd9Sstevel@tonic-gate 	}
41787c478bd9Sstevel@tonic-gate }
41797c478bd9Sstevel@tonic-gate 
41807c478bd9Sstevel@tonic-gate /*
41817c478bd9Sstevel@tonic-gate  * mdi_pi_get_phci_private():
41827c478bd9Sstevel@tonic-gate  *		Get the pHCI private information associated with the
41837c478bd9Sstevel@tonic-gate  *		mdi_pathinfo node
41847c478bd9Sstevel@tonic-gate  */
41857c478bd9Sstevel@tonic-gate caddr_t
41867c478bd9Sstevel@tonic-gate mdi_pi_get_phci_private(mdi_pathinfo_t *pip)
41877c478bd9Sstevel@tonic-gate {
41887c478bd9Sstevel@tonic-gate 	caddr_t	pprivate = NULL;
41894c06356bSdh142964 
41907c478bd9Sstevel@tonic-gate 	if (pip) {
41917c478bd9Sstevel@tonic-gate 		pprivate = MDI_PI(pip)->pi_pprivate;
41927c478bd9Sstevel@tonic-gate 	}
41937c478bd9Sstevel@tonic-gate 	return (pprivate);
41947c478bd9Sstevel@tonic-gate }
41957c478bd9Sstevel@tonic-gate 
41967c478bd9Sstevel@tonic-gate /*
41977c478bd9Sstevel@tonic-gate  * mdi_pi_set_phci_private():
41987c478bd9Sstevel@tonic-gate  *		Set the pHCI private information in the mdi_pathinfo node
41997c478bd9Sstevel@tonic-gate  */
42007c478bd9Sstevel@tonic-gate void
42017c478bd9Sstevel@tonic-gate mdi_pi_set_phci_private(mdi_pathinfo_t *pip, caddr_t priv)
42027c478bd9Sstevel@tonic-gate {
42037c478bd9Sstevel@tonic-gate 	if (pip) {
42047c478bd9Sstevel@tonic-gate 		MDI_PI(pip)->pi_pprivate = priv;
42057c478bd9Sstevel@tonic-gate 	}
42067c478bd9Sstevel@tonic-gate }
42077c478bd9Sstevel@tonic-gate 
42087c478bd9Sstevel@tonic-gate /*
42097c478bd9Sstevel@tonic-gate  * mdi_pi_get_state():
42107c478bd9Sstevel@tonic-gate  *		Get the mdi_pathinfo node state. Transient states are internal
42117c478bd9Sstevel@tonic-gate  *		and not provided to the users
42127c478bd9Sstevel@tonic-gate  */
42137c478bd9Sstevel@tonic-gate mdi_pathinfo_state_t
42147c478bd9Sstevel@tonic-gate mdi_pi_get_state(mdi_pathinfo_t *pip)
42157c478bd9Sstevel@tonic-gate {
42167c478bd9Sstevel@tonic-gate 	mdi_pathinfo_state_t    state = MDI_PATHINFO_STATE_INIT;
42177c478bd9Sstevel@tonic-gate 
42187c478bd9Sstevel@tonic-gate 	if (pip) {
42197c478bd9Sstevel@tonic-gate 		if (MDI_PI_IS_TRANSIENT(pip)) {
42207c478bd9Sstevel@tonic-gate 			/*
42217c478bd9Sstevel@tonic-gate 			 * mdi_pathinfo is in state transition.  Return the
42227c478bd9Sstevel@tonic-gate 			 * last good state.
42237c478bd9Sstevel@tonic-gate 			 */
42247c478bd9Sstevel@tonic-gate 			state = MDI_PI_OLD_STATE(pip);
42257c478bd9Sstevel@tonic-gate 		} else {
42267c478bd9Sstevel@tonic-gate 			state = MDI_PI_STATE(pip);
42277c478bd9Sstevel@tonic-gate 		}
42287c478bd9Sstevel@tonic-gate 	}
42297c478bd9Sstevel@tonic-gate 	return (state);
42307c478bd9Sstevel@tonic-gate }
42317c478bd9Sstevel@tonic-gate 
42327c478bd9Sstevel@tonic-gate /*
42334c06356bSdh142964  * mdi_pi_get_flags():
42344c06356bSdh142964  *		Get the mdi_pathinfo node flags.
42354c06356bSdh142964  */
42364c06356bSdh142964 uint_t
42374c06356bSdh142964 mdi_pi_get_flags(mdi_pathinfo_t *pip)
42384c06356bSdh142964 {
42394c06356bSdh142964 	return (pip ? MDI_PI(pip)->pi_flags : 0);
42404c06356bSdh142964 }
42414c06356bSdh142964 
42424c06356bSdh142964 /*
42437c478bd9Sstevel@tonic-gate  * Note that the following function needs to be the new interface for
42447c478bd9Sstevel@tonic-gate  * mdi_pi_get_state when mpxio gets integrated to ON.
42457c478bd9Sstevel@tonic-gate  */
42467c478bd9Sstevel@tonic-gate int
42477c478bd9Sstevel@tonic-gate mdi_pi_get_state2(mdi_pathinfo_t *pip, mdi_pathinfo_state_t *state,
42487c478bd9Sstevel@tonic-gate 		uint32_t *ext_state)
42497c478bd9Sstevel@tonic-gate {
42507c478bd9Sstevel@tonic-gate 	*state = MDI_PATHINFO_STATE_INIT;
42517c478bd9Sstevel@tonic-gate 
42527c478bd9Sstevel@tonic-gate 	if (pip) {
42537c478bd9Sstevel@tonic-gate 		if (MDI_PI_IS_TRANSIENT(pip)) {
42547c478bd9Sstevel@tonic-gate 			/*
42557c478bd9Sstevel@tonic-gate 			 * mdi_pathinfo is in state transition.  Return the
42567c478bd9Sstevel@tonic-gate 			 * last good state.
42577c478bd9Sstevel@tonic-gate 			 */
42587c478bd9Sstevel@tonic-gate 			*state = MDI_PI_OLD_STATE(pip);
42597c478bd9Sstevel@tonic-gate 			*ext_state = MDI_PI_OLD_EXT_STATE(pip);
42607c478bd9Sstevel@tonic-gate 		} else {
42617c478bd9Sstevel@tonic-gate 			*state = MDI_PI_STATE(pip);
42627c478bd9Sstevel@tonic-gate 			*ext_state = MDI_PI_EXT_STATE(pip);
42637c478bd9Sstevel@tonic-gate 		}
42647c478bd9Sstevel@tonic-gate 	}
42657c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
42667c478bd9Sstevel@tonic-gate }
42677c478bd9Sstevel@tonic-gate 
42687c478bd9Sstevel@tonic-gate /*
42697c478bd9Sstevel@tonic-gate  * mdi_pi_get_preferred:
42707c478bd9Sstevel@tonic-gate  *	Get the preferred path flag
42717c478bd9Sstevel@tonic-gate  */
42727c478bd9Sstevel@tonic-gate int
42737c478bd9Sstevel@tonic-gate mdi_pi_get_preferred(mdi_pathinfo_t *pip)
42747c478bd9Sstevel@tonic-gate {
42757c478bd9Sstevel@tonic-gate 	if (pip) {
42767c478bd9Sstevel@tonic-gate 		return (MDI_PI(pip)->pi_preferred);
42777c478bd9Sstevel@tonic-gate 	}
42787c478bd9Sstevel@tonic-gate 	return (0);
42797c478bd9Sstevel@tonic-gate }
42807c478bd9Sstevel@tonic-gate 
42817c478bd9Sstevel@tonic-gate /*
42827c478bd9Sstevel@tonic-gate  * mdi_pi_set_preferred:
42837c478bd9Sstevel@tonic-gate  *	Set the preferred path flag
42847c478bd9Sstevel@tonic-gate  */
42857c478bd9Sstevel@tonic-gate void
42867c478bd9Sstevel@tonic-gate mdi_pi_set_preferred(mdi_pathinfo_t *pip, int preferred)
42877c478bd9Sstevel@tonic-gate {
42887c478bd9Sstevel@tonic-gate 	if (pip) {
42897c478bd9Sstevel@tonic-gate 		MDI_PI(pip)->pi_preferred = preferred;
42907c478bd9Sstevel@tonic-gate 	}
42917c478bd9Sstevel@tonic-gate }
42927c478bd9Sstevel@tonic-gate 
42937c478bd9Sstevel@tonic-gate /*
42947c478bd9Sstevel@tonic-gate  * mdi_pi_set_state():
42957c478bd9Sstevel@tonic-gate  *		Set the mdi_pathinfo node state
42967c478bd9Sstevel@tonic-gate  */
42977c478bd9Sstevel@tonic-gate void
42987c478bd9Sstevel@tonic-gate mdi_pi_set_state(mdi_pathinfo_t *pip, mdi_pathinfo_state_t state)
42997c478bd9Sstevel@tonic-gate {
43007c478bd9Sstevel@tonic-gate 	uint32_t	ext_state;
43017c478bd9Sstevel@tonic-gate 
43027c478bd9Sstevel@tonic-gate 	if (pip) {
43037c478bd9Sstevel@tonic-gate 		ext_state = MDI_PI(pip)->pi_state & MDI_PATHINFO_EXT_STATE_MASK;
43047c478bd9Sstevel@tonic-gate 		MDI_PI(pip)->pi_state = state;
43057c478bd9Sstevel@tonic-gate 		MDI_PI(pip)->pi_state |= ext_state;
43064c06356bSdh142964 
43074c06356bSdh142964 		/* Path has changed state, invalidate DINFOCACHE snap shot. */
43084c06356bSdh142964 		i_ddi_di_cache_invalidate();
43097c478bd9Sstevel@tonic-gate 	}
43107c478bd9Sstevel@tonic-gate }
43117c478bd9Sstevel@tonic-gate 
43127c478bd9Sstevel@tonic-gate /*
43137c478bd9Sstevel@tonic-gate  * Property functions:
43147c478bd9Sstevel@tonic-gate  */
43157c478bd9Sstevel@tonic-gate int
43167c478bd9Sstevel@tonic-gate i_map_nvlist_error_to_mdi(int val)
43177c478bd9Sstevel@tonic-gate {
43187c478bd9Sstevel@tonic-gate 	int rv;
43197c478bd9Sstevel@tonic-gate 
43207c478bd9Sstevel@tonic-gate 	switch (val) {
43217c478bd9Sstevel@tonic-gate 	case 0:
43227c478bd9Sstevel@tonic-gate 		rv = DDI_PROP_SUCCESS;
43237c478bd9Sstevel@tonic-gate 		break;
43247c478bd9Sstevel@tonic-gate 	case EINVAL:
43257c478bd9Sstevel@tonic-gate 	case ENOTSUP:
43267c478bd9Sstevel@tonic-gate 		rv = DDI_PROP_INVAL_ARG;
43277c478bd9Sstevel@tonic-gate 		break;
43287c478bd9Sstevel@tonic-gate 	case ENOMEM:
43297c478bd9Sstevel@tonic-gate 		rv = DDI_PROP_NO_MEMORY;
43307c478bd9Sstevel@tonic-gate 		break;
43317c478bd9Sstevel@tonic-gate 	default:
43327c478bd9Sstevel@tonic-gate 		rv = DDI_PROP_NOT_FOUND;
43337c478bd9Sstevel@tonic-gate 		break;
43347c478bd9Sstevel@tonic-gate 	}
43357c478bd9Sstevel@tonic-gate 	return (rv);
43367c478bd9Sstevel@tonic-gate }
43377c478bd9Sstevel@tonic-gate 
43387c478bd9Sstevel@tonic-gate /*
43397c478bd9Sstevel@tonic-gate  * mdi_pi_get_next_prop():
43407c478bd9Sstevel@tonic-gate  * 		Property walk function.  The caller should hold mdi_pi_lock()
43417c478bd9Sstevel@tonic-gate  *		and release by calling mdi_pi_unlock() at the end of walk to
43427c478bd9Sstevel@tonic-gate  *		get a consistent value.
43437c478bd9Sstevel@tonic-gate  */
43447c478bd9Sstevel@tonic-gate nvpair_t *
43457c478bd9Sstevel@tonic-gate mdi_pi_get_next_prop(mdi_pathinfo_t *pip, nvpair_t *prev)
43467c478bd9Sstevel@tonic-gate {
43477c478bd9Sstevel@tonic-gate 	if ((pip == NULL) || (MDI_PI(pip)->pi_prop == NULL)) {
43487c478bd9Sstevel@tonic-gate 		return (NULL);
43497c478bd9Sstevel@tonic-gate 	}
43505e3986cbScth 	ASSERT(MDI_PI_LOCKED(pip));
43517c478bd9Sstevel@tonic-gate 	return (nvlist_next_nvpair(MDI_PI(pip)->pi_prop, prev));
43527c478bd9Sstevel@tonic-gate }
43537c478bd9Sstevel@tonic-gate 
43547c478bd9Sstevel@tonic-gate /*
43557c478bd9Sstevel@tonic-gate  * mdi_prop_remove():
43567c478bd9Sstevel@tonic-gate  * 		Remove the named property from the named list.
43577c478bd9Sstevel@tonic-gate  */
43587c478bd9Sstevel@tonic-gate int
43597c478bd9Sstevel@tonic-gate mdi_prop_remove(mdi_pathinfo_t *pip, char *name)
43607c478bd9Sstevel@tonic-gate {
43617c478bd9Sstevel@tonic-gate 	if (pip == NULL) {
43627c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
43637c478bd9Sstevel@tonic-gate 	}
43645e3986cbScth 	ASSERT(!MDI_PI_LOCKED(pip));
43657c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
43667c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_prop == NULL) {
43677c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
43687c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
43697c478bd9Sstevel@tonic-gate 	}
43707c478bd9Sstevel@tonic-gate 	if (name) {
43717c478bd9Sstevel@tonic-gate 		(void) nvlist_remove_all(MDI_PI(pip)->pi_prop, name);
43727c478bd9Sstevel@tonic-gate 	} else {
43737c478bd9Sstevel@tonic-gate 		char		nvp_name[MAXNAMELEN];
43747c478bd9Sstevel@tonic-gate 		nvpair_t	*nvp;
43757c478bd9Sstevel@tonic-gate 		nvp = nvlist_next_nvpair(MDI_PI(pip)->pi_prop, NULL);
43767c478bd9Sstevel@tonic-gate 		while (nvp) {
43777c478bd9Sstevel@tonic-gate 			nvpair_t	*next;
43787c478bd9Sstevel@tonic-gate 			next = nvlist_next_nvpair(MDI_PI(pip)->pi_prop, nvp);
43794c06356bSdh142964 			(void) snprintf(nvp_name, sizeof(nvp_name), "%s",
43807c478bd9Sstevel@tonic-gate 			    nvpair_name(nvp));
43817c478bd9Sstevel@tonic-gate 			(void) nvlist_remove_all(MDI_PI(pip)->pi_prop,
43827c478bd9Sstevel@tonic-gate 			    nvp_name);
43837c478bd9Sstevel@tonic-gate 			nvp = next;
43847c478bd9Sstevel@tonic-gate 		}
43857c478bd9Sstevel@tonic-gate 	}
43867c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
43877c478bd9Sstevel@tonic-gate 	return (DDI_PROP_SUCCESS);
43887c478bd9Sstevel@tonic-gate }
43897c478bd9Sstevel@tonic-gate 
43907c478bd9Sstevel@tonic-gate /*
43917c478bd9Sstevel@tonic-gate  * mdi_prop_size():
43927c478bd9Sstevel@tonic-gate  * 		Get buffer size needed to pack the property data.
43937c478bd9Sstevel@tonic-gate  * 		Caller should hold the mdi_pathinfo_t lock to get a consistent
43947c478bd9Sstevel@tonic-gate  *		buffer size.
43957c478bd9Sstevel@tonic-gate  */
43967c478bd9Sstevel@tonic-gate int
43977c478bd9Sstevel@tonic-gate mdi_prop_size(mdi_pathinfo_t *pip, size_t *buflenp)
43987c478bd9Sstevel@tonic-gate {
43997c478bd9Sstevel@tonic-gate 	int	rv;
44007c478bd9Sstevel@tonic-gate 	size_t	bufsize;
44017c478bd9Sstevel@tonic-gate 
44027c478bd9Sstevel@tonic-gate 	*buflenp = 0;
44037c478bd9Sstevel@tonic-gate 	if ((pip == NULL) || (MDI_PI(pip)->pi_prop == NULL)) {
44047c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
44057c478bd9Sstevel@tonic-gate 	}
44065e3986cbScth 	ASSERT(MDI_PI_LOCKED(pip));
44077c478bd9Sstevel@tonic-gate 	rv = nvlist_size(MDI_PI(pip)->pi_prop,
44087c478bd9Sstevel@tonic-gate 	    &bufsize, NV_ENCODE_NATIVE);
44097c478bd9Sstevel@tonic-gate 	*buflenp = bufsize;
44107c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
44117c478bd9Sstevel@tonic-gate }
44127c478bd9Sstevel@tonic-gate 
44137c478bd9Sstevel@tonic-gate /*
44147c478bd9Sstevel@tonic-gate  * mdi_prop_pack():
44157c478bd9Sstevel@tonic-gate  * 		pack the property list.  The caller should hold the
44167c478bd9Sstevel@tonic-gate  *		mdi_pathinfo_t node to get a consistent data
44177c478bd9Sstevel@tonic-gate  */
44187c478bd9Sstevel@tonic-gate int
44197c478bd9Sstevel@tonic-gate mdi_prop_pack(mdi_pathinfo_t *pip, char **bufp, uint_t buflen)
44207c478bd9Sstevel@tonic-gate {
44217c478bd9Sstevel@tonic-gate 	int	rv;
44227c478bd9Sstevel@tonic-gate 	size_t	bufsize;
44237c478bd9Sstevel@tonic-gate 
44247c478bd9Sstevel@tonic-gate 	if ((pip == NULL) || MDI_PI(pip)->pi_prop == NULL) {
44257c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
44267c478bd9Sstevel@tonic-gate 	}
44277c478bd9Sstevel@tonic-gate 
44285e3986cbScth 	ASSERT(MDI_PI_LOCKED(pip));
44297c478bd9Sstevel@tonic-gate 
44307c478bd9Sstevel@tonic-gate 	bufsize = buflen;
44317c478bd9Sstevel@tonic-gate 	rv = nvlist_pack(MDI_PI(pip)->pi_prop, bufp, (size_t *)&bufsize,
44327c478bd9Sstevel@tonic-gate 	    NV_ENCODE_NATIVE, KM_SLEEP);
44337c478bd9Sstevel@tonic-gate 
44347c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
44357c478bd9Sstevel@tonic-gate }
44367c478bd9Sstevel@tonic-gate 
44377c478bd9Sstevel@tonic-gate /*
44387c478bd9Sstevel@tonic-gate  * mdi_prop_update_byte():
44397c478bd9Sstevel@tonic-gate  *		Create/Update a byte property
44407c478bd9Sstevel@tonic-gate  */
44417c478bd9Sstevel@tonic-gate int
44427c478bd9Sstevel@tonic-gate mdi_prop_update_byte(mdi_pathinfo_t *pip, char *name, uchar_t data)
44437c478bd9Sstevel@tonic-gate {
44447c478bd9Sstevel@tonic-gate 	int rv;
44457c478bd9Sstevel@tonic-gate 
44467c478bd9Sstevel@tonic-gate 	if (pip == NULL) {
44477c478bd9Sstevel@tonic-gate 		return (DDI_PROP_INVAL_ARG);
44487c478bd9Sstevel@tonic-gate 	}
44495e3986cbScth 	ASSERT(!MDI_PI_LOCKED(pip));
44507c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
44517c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_prop == NULL) {
44527c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
44537c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
44547c478bd9Sstevel@tonic-gate 	}
44557c478bd9Sstevel@tonic-gate 	rv = nvlist_add_byte(MDI_PI(pip)->pi_prop, name, data);
44567c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
44577c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
44587c478bd9Sstevel@tonic-gate }
44597c478bd9Sstevel@tonic-gate 
44607c478bd9Sstevel@tonic-gate /*
44617c478bd9Sstevel@tonic-gate  * mdi_prop_update_byte_array():
44627c478bd9Sstevel@tonic-gate  *		Create/Update a byte array property
44637c478bd9Sstevel@tonic-gate  */
44647c478bd9Sstevel@tonic-gate int
44657c478bd9Sstevel@tonic-gate mdi_prop_update_byte_array(mdi_pathinfo_t *pip, char *name, uchar_t *data,
44667c478bd9Sstevel@tonic-gate     uint_t nelements)
44677c478bd9Sstevel@tonic-gate {
44687c478bd9Sstevel@tonic-gate 	int rv;
44697c478bd9Sstevel@tonic-gate 
44707c478bd9Sstevel@tonic-gate 	if (pip == NULL) {
44717c478bd9Sstevel@tonic-gate 		return (DDI_PROP_INVAL_ARG);
44727c478bd9Sstevel@tonic-gate 	}
44735e3986cbScth 	ASSERT(!MDI_PI_LOCKED(pip));
44747c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
44757c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_prop == NULL) {
44767c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
44777c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
44787c478bd9Sstevel@tonic-gate 	}
44797c478bd9Sstevel@tonic-gate 	rv = nvlist_add_byte_array(MDI_PI(pip)->pi_prop, name, data, nelements);
44807c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
44817c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
44827c478bd9Sstevel@tonic-gate }
44837c478bd9Sstevel@tonic-gate 
44847c478bd9Sstevel@tonic-gate /*
44857c478bd9Sstevel@tonic-gate  * mdi_prop_update_int():
44867c478bd9Sstevel@tonic-gate  *		Create/Update a 32 bit integer property
44877c478bd9Sstevel@tonic-gate  */
44887c478bd9Sstevel@tonic-gate int
44897c478bd9Sstevel@tonic-gate mdi_prop_update_int(mdi_pathinfo_t *pip, char *name, int data)
44907c478bd9Sstevel@tonic-gate {
44917c478bd9Sstevel@tonic-gate 	int rv;
44927c478bd9Sstevel@tonic-gate 
44937c478bd9Sstevel@tonic-gate 	if (pip == NULL) {
44947c478bd9Sstevel@tonic-gate 		return (DDI_PROP_INVAL_ARG);
44957c478bd9Sstevel@tonic-gate 	}
44965e3986cbScth 	ASSERT(!MDI_PI_LOCKED(pip));
44977c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
44987c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_prop == NULL) {
44997c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
45007c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
45017c478bd9Sstevel@tonic-gate 	}
45027c478bd9Sstevel@tonic-gate 	rv = nvlist_add_int32(MDI_PI(pip)->pi_prop, name, (int32_t)data);
45037c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
45047c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
45057c478bd9Sstevel@tonic-gate }
45067c478bd9Sstevel@tonic-gate 
45077c478bd9Sstevel@tonic-gate /*
45087c478bd9Sstevel@tonic-gate  * mdi_prop_update_int64():
45097c478bd9Sstevel@tonic-gate  *		Create/Update a 64 bit integer property
45107c478bd9Sstevel@tonic-gate  */
45117c478bd9Sstevel@tonic-gate int
45127c478bd9Sstevel@tonic-gate mdi_prop_update_int64(mdi_pathinfo_t *pip, char *name, int64_t data)
45137c478bd9Sstevel@tonic-gate {
45147c478bd9Sstevel@tonic-gate 	int rv;
45157c478bd9Sstevel@tonic-gate 
45167c478bd9Sstevel@tonic-gate 	if (pip == NULL) {
45177c478bd9Sstevel@tonic-gate 		return (DDI_PROP_INVAL_ARG);
45187c478bd9Sstevel@tonic-gate 	}
45195e3986cbScth 	ASSERT(!MDI_PI_LOCKED(pip));
45207c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
45217c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_prop == NULL) {
45227c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
45237c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
45247c478bd9Sstevel@tonic-gate 	}
45257c478bd9Sstevel@tonic-gate 	rv = nvlist_add_int64(MDI_PI(pip)->pi_prop, name, data);
45267c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
45277c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
45287c478bd9Sstevel@tonic-gate }
45297c478bd9Sstevel@tonic-gate 
45307c478bd9Sstevel@tonic-gate /*
45317c478bd9Sstevel@tonic-gate  * mdi_prop_update_int_array():
45327c478bd9Sstevel@tonic-gate  *		Create/Update a int array property
45337c478bd9Sstevel@tonic-gate  */
45347c478bd9Sstevel@tonic-gate int
45357c478bd9Sstevel@tonic-gate mdi_prop_update_int_array(mdi_pathinfo_t *pip, char *name, int *data,
45367c478bd9Sstevel@tonic-gate 	    uint_t nelements)
45377c478bd9Sstevel@tonic-gate {
45387c478bd9Sstevel@tonic-gate 	int rv;
45397c478bd9Sstevel@tonic-gate 
45407c478bd9Sstevel@tonic-gate 	if (pip == NULL) {
45417c478bd9Sstevel@tonic-gate 		return (DDI_PROP_INVAL_ARG);
45427c478bd9Sstevel@tonic-gate 	}
45435e3986cbScth 	ASSERT(!MDI_PI_LOCKED(pip));
45447c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
45457c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_prop == NULL) {
45467c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
45477c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
45487c478bd9Sstevel@tonic-gate 	}
45497c478bd9Sstevel@tonic-gate 	rv = nvlist_add_int32_array(MDI_PI(pip)->pi_prop, name, (int32_t *)data,
45507c478bd9Sstevel@tonic-gate 	    nelements);
45517c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
45527c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
45537c478bd9Sstevel@tonic-gate }
45547c478bd9Sstevel@tonic-gate 
45557c478bd9Sstevel@tonic-gate /*
45567c478bd9Sstevel@tonic-gate  * mdi_prop_update_string():
45577c478bd9Sstevel@tonic-gate  *		Create/Update a string property
45587c478bd9Sstevel@tonic-gate  */
45597c478bd9Sstevel@tonic-gate int
45607c478bd9Sstevel@tonic-gate mdi_prop_update_string(mdi_pathinfo_t *pip, char *name, char *data)
45617c478bd9Sstevel@tonic-gate {
45627c478bd9Sstevel@tonic-gate 	int rv;
45637c478bd9Sstevel@tonic-gate 
45647c478bd9Sstevel@tonic-gate 	if (pip == NULL) {
45657c478bd9Sstevel@tonic-gate 		return (DDI_PROP_INVAL_ARG);
45667c478bd9Sstevel@tonic-gate 	}
45675e3986cbScth 	ASSERT(!MDI_PI_LOCKED(pip));
45687c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
45697c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_prop == NULL) {
45707c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
45717c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
45727c478bd9Sstevel@tonic-gate 	}
45737c478bd9Sstevel@tonic-gate 	rv = nvlist_add_string(MDI_PI(pip)->pi_prop, name, data);
45747c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
45757c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
45767c478bd9Sstevel@tonic-gate }
45777c478bd9Sstevel@tonic-gate 
45787c478bd9Sstevel@tonic-gate /*
45797c478bd9Sstevel@tonic-gate  * mdi_prop_update_string_array():
45807c478bd9Sstevel@tonic-gate  *		Create/Update a string array property
45817c478bd9Sstevel@tonic-gate  */
45827c478bd9Sstevel@tonic-gate int
45837c478bd9Sstevel@tonic-gate mdi_prop_update_string_array(mdi_pathinfo_t *pip, char *name, char **data,
45847c478bd9Sstevel@tonic-gate     uint_t nelements)
45857c478bd9Sstevel@tonic-gate {
45867c478bd9Sstevel@tonic-gate 	int rv;
45877c478bd9Sstevel@tonic-gate 
45887c478bd9Sstevel@tonic-gate 	if (pip == NULL) {
45897c478bd9Sstevel@tonic-gate 		return (DDI_PROP_INVAL_ARG);
45907c478bd9Sstevel@tonic-gate 	}
45915e3986cbScth 	ASSERT(!MDI_PI_LOCKED(pip));
45927c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
45937c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_prop == NULL) {
45947c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
45957c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
45967c478bd9Sstevel@tonic-gate 	}
45977c478bd9Sstevel@tonic-gate 	rv = nvlist_add_string_array(MDI_PI(pip)->pi_prop, name, data,
45987c478bd9Sstevel@tonic-gate 	    nelements);
45997c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
46007c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
46017c478bd9Sstevel@tonic-gate }
46027c478bd9Sstevel@tonic-gate 
46037c478bd9Sstevel@tonic-gate /*
46047c478bd9Sstevel@tonic-gate  * mdi_prop_lookup_byte():
46057c478bd9Sstevel@tonic-gate  * 		Look for byte property identified by name.  The data returned
46067c478bd9Sstevel@tonic-gate  *		is the actual property and valid as long as mdi_pathinfo_t node
46077c478bd9Sstevel@tonic-gate  *		is alive.
46087c478bd9Sstevel@tonic-gate  */
46097c478bd9Sstevel@tonic-gate int
46107c478bd9Sstevel@tonic-gate mdi_prop_lookup_byte(mdi_pathinfo_t *pip, char *name, uchar_t *data)
46117c478bd9Sstevel@tonic-gate {
46127c478bd9Sstevel@tonic-gate 	int rv;
46137c478bd9Sstevel@tonic-gate 
46147c478bd9Sstevel@tonic-gate 	if ((pip == NULL) || (MDI_PI(pip)->pi_prop == NULL)) {
46157c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
46167c478bd9Sstevel@tonic-gate 	}
46177c478bd9Sstevel@tonic-gate 	rv = nvlist_lookup_byte(MDI_PI(pip)->pi_prop, name, data);
46187c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
46197c478bd9Sstevel@tonic-gate }
46207c478bd9Sstevel@tonic-gate 
46217c478bd9Sstevel@tonic-gate 
46227c478bd9Sstevel@tonic-gate /*
46237c478bd9Sstevel@tonic-gate  * mdi_prop_lookup_byte_array():
46247c478bd9Sstevel@tonic-gate  * 		Look for byte array property identified by name.  The data
46257c478bd9Sstevel@tonic-gate  *		returned is the actual property and valid as long as
46267c478bd9Sstevel@tonic-gate  *		mdi_pathinfo_t node is alive.
46277c478bd9Sstevel@tonic-gate  */
46287c478bd9Sstevel@tonic-gate int
46297c478bd9Sstevel@tonic-gate mdi_prop_lookup_byte_array(mdi_pathinfo_t *pip, char *name, uchar_t **data,
46307c478bd9Sstevel@tonic-gate     uint_t *nelements)
46317c478bd9Sstevel@tonic-gate {
46327c478bd9Sstevel@tonic-gate 	int rv;
46337c478bd9Sstevel@tonic-gate 
46347c478bd9Sstevel@tonic-gate 	if ((pip == NULL) || (MDI_PI(pip)->pi_prop == NULL)) {
46357c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
46367c478bd9Sstevel@tonic-gate 	}
46377c478bd9Sstevel@tonic-gate 	rv = nvlist_lookup_byte_array(MDI_PI(pip)->pi_prop, name, data,
46387c478bd9Sstevel@tonic-gate 	    nelements);
46397c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
46407c478bd9Sstevel@tonic-gate }
46417c478bd9Sstevel@tonic-gate 
46427c478bd9Sstevel@tonic-gate /*
46437c478bd9Sstevel@tonic-gate  * mdi_prop_lookup_int():
46447c478bd9Sstevel@tonic-gate  * 		Look for int property identified by name.  The data returned
46457c478bd9Sstevel@tonic-gate  *		is the actual property and valid as long as mdi_pathinfo_t
46467c478bd9Sstevel@tonic-gate  *		node is alive.
46477c478bd9Sstevel@tonic-gate  */
46487c478bd9Sstevel@tonic-gate int
46497c478bd9Sstevel@tonic-gate mdi_prop_lookup_int(mdi_pathinfo_t *pip, char *name, int *data)
46507c478bd9Sstevel@tonic-gate {
46517c478bd9Sstevel@tonic-gate 	int rv;
46527c478bd9Sstevel@tonic-gate 
46537c478bd9Sstevel@tonic-gate 	if ((pip == NULL) || (MDI_PI(pip)->pi_prop == NULL)) {
46547c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
46557c478bd9Sstevel@tonic-gate 	}
46567c478bd9Sstevel@tonic-gate 	rv = nvlist_lookup_int32(MDI_PI(pip)->pi_prop, name, (int32_t *)data);
46577c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
46587c478bd9Sstevel@tonic-gate }
46597c478bd9Sstevel@tonic-gate 
46607c478bd9Sstevel@tonic-gate /*
46617c478bd9Sstevel@tonic-gate  * mdi_prop_lookup_int64():
46627c478bd9Sstevel@tonic-gate  * 		Look for int64 property identified by name.  The data returned
46637c478bd9Sstevel@tonic-gate  *		is the actual property and valid as long as mdi_pathinfo_t node
46647c478bd9Sstevel@tonic-gate  *		is alive.
46657c478bd9Sstevel@tonic-gate  */
46667c478bd9Sstevel@tonic-gate int
46677c478bd9Sstevel@tonic-gate mdi_prop_lookup_int64(mdi_pathinfo_t *pip, char *name, int64_t *data)
46687c478bd9Sstevel@tonic-gate {
46697c478bd9Sstevel@tonic-gate 	int rv;
46707c478bd9Sstevel@tonic-gate 	if ((pip == NULL) || (MDI_PI(pip)->pi_prop == NULL)) {
46717c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
46727c478bd9Sstevel@tonic-gate 	}
46737c478bd9Sstevel@tonic-gate 	rv = nvlist_lookup_int64(MDI_PI(pip)->pi_prop, name, data);
46747c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
46757c478bd9Sstevel@tonic-gate }
46767c478bd9Sstevel@tonic-gate 
46777c478bd9Sstevel@tonic-gate /*
46787c478bd9Sstevel@tonic-gate  * mdi_prop_lookup_int_array():
46797c478bd9Sstevel@tonic-gate  * 		Look for int array property identified by name.  The data
46807c478bd9Sstevel@tonic-gate  *		returned is the actual property and valid as long as
46817c478bd9Sstevel@tonic-gate  *		mdi_pathinfo_t node is alive.
46827c478bd9Sstevel@tonic-gate  */
46837c478bd9Sstevel@tonic-gate int
46847c478bd9Sstevel@tonic-gate mdi_prop_lookup_int_array(mdi_pathinfo_t *pip, char *name, int **data,
46857c478bd9Sstevel@tonic-gate     uint_t *nelements)
46867c478bd9Sstevel@tonic-gate {
46877c478bd9Sstevel@tonic-gate 	int rv;
46887c478bd9Sstevel@tonic-gate 
46897c478bd9Sstevel@tonic-gate 	if ((pip == NULL) || (MDI_PI(pip)->pi_prop == NULL)) {
46907c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
46917c478bd9Sstevel@tonic-gate 	}
46927c478bd9Sstevel@tonic-gate 	rv = nvlist_lookup_int32_array(MDI_PI(pip)->pi_prop, name,
46937c478bd9Sstevel@tonic-gate 	    (int32_t **)data, nelements);
46947c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
46957c478bd9Sstevel@tonic-gate }
46967c478bd9Sstevel@tonic-gate 
46977c478bd9Sstevel@tonic-gate /*
46987c478bd9Sstevel@tonic-gate  * mdi_prop_lookup_string():
46997c478bd9Sstevel@tonic-gate  * 		Look for string property identified by name.  The data
47007c478bd9Sstevel@tonic-gate  *		returned is the actual property and valid as long as
47017c478bd9Sstevel@tonic-gate  *		mdi_pathinfo_t node is alive.
47027c478bd9Sstevel@tonic-gate  */
47037c478bd9Sstevel@tonic-gate int
47047c478bd9Sstevel@tonic-gate mdi_prop_lookup_string(mdi_pathinfo_t *pip, char *name, char **data)
47057c478bd9Sstevel@tonic-gate {
47067c478bd9Sstevel@tonic-gate 	int rv;
47077c478bd9Sstevel@tonic-gate 
47087c478bd9Sstevel@tonic-gate 	if ((pip == NULL) || (MDI_PI(pip)->pi_prop == NULL)) {
47097c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
47107c478bd9Sstevel@tonic-gate 	}
47117c478bd9Sstevel@tonic-gate 	rv = nvlist_lookup_string(MDI_PI(pip)->pi_prop, name, data);
47127c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
47137c478bd9Sstevel@tonic-gate }
47147c478bd9Sstevel@tonic-gate 
47157c478bd9Sstevel@tonic-gate /*
47167c478bd9Sstevel@tonic-gate  * mdi_prop_lookup_string_array():
47177c478bd9Sstevel@tonic-gate  * 		Look for string array property identified by name.  The data
47187c478bd9Sstevel@tonic-gate  *		returned is the actual property and valid as long as
47197c478bd9Sstevel@tonic-gate  *		mdi_pathinfo_t node is alive.
47207c478bd9Sstevel@tonic-gate  */
47217c478bd9Sstevel@tonic-gate int
47227c478bd9Sstevel@tonic-gate mdi_prop_lookup_string_array(mdi_pathinfo_t *pip, char *name, char ***data,
47237c478bd9Sstevel@tonic-gate     uint_t *nelements)
47247c478bd9Sstevel@tonic-gate {
47257c478bd9Sstevel@tonic-gate 	int rv;
47267c478bd9Sstevel@tonic-gate 
47277c478bd9Sstevel@tonic-gate 	if ((pip == NULL) || (MDI_PI(pip)->pi_prop == NULL)) {
47287c478bd9Sstevel@tonic-gate 		return (DDI_PROP_NOT_FOUND);
47297c478bd9Sstevel@tonic-gate 	}
47307c478bd9Sstevel@tonic-gate 	rv = nvlist_lookup_string_array(MDI_PI(pip)->pi_prop, name, data,
47317c478bd9Sstevel@tonic-gate 	    nelements);
47327c478bd9Sstevel@tonic-gate 	return (i_map_nvlist_error_to_mdi(rv));
47337c478bd9Sstevel@tonic-gate }
47347c478bd9Sstevel@tonic-gate 
47357c478bd9Sstevel@tonic-gate /*
47367c478bd9Sstevel@tonic-gate  * mdi_prop_free():
47377c478bd9Sstevel@tonic-gate  * 		Symmetrical function to ddi_prop_free(). nvlist_lookup_xx()
47387c478bd9Sstevel@tonic-gate  *		functions return the pointer to actual property data and not a
47397c478bd9Sstevel@tonic-gate  *		copy of it.  So the data returned is valid as long as
47407c478bd9Sstevel@tonic-gate  *		mdi_pathinfo_t node is valid.
47417c478bd9Sstevel@tonic-gate  */
47427c478bd9Sstevel@tonic-gate /*ARGSUSED*/
47437c478bd9Sstevel@tonic-gate int
47447c478bd9Sstevel@tonic-gate mdi_prop_free(void *data)
47457c478bd9Sstevel@tonic-gate {
47467c478bd9Sstevel@tonic-gate 	return (DDI_PROP_SUCCESS);
47477c478bd9Sstevel@tonic-gate }
47487c478bd9Sstevel@tonic-gate 
47497c478bd9Sstevel@tonic-gate /*ARGSUSED*/
47507c478bd9Sstevel@tonic-gate static void
47517c478bd9Sstevel@tonic-gate i_mdi_report_path_state(mdi_client_t *ct, mdi_pathinfo_t *pip)
47527c478bd9Sstevel@tonic-gate {
47534c06356bSdh142964 	char		*ct_path;
47547c478bd9Sstevel@tonic-gate 	char		*ct_status;
47557c478bd9Sstevel@tonic-gate 	char		*status;
47564c06356bSdh142964 	dev_info_t	*cdip = ct->ct_dip;
47577c478bd9Sstevel@tonic-gate 	char		lb_buf[64];
47584c06356bSdh142964 	int		report_lb_c = 0, report_lb_p = 0;
47597c478bd9Sstevel@tonic-gate 
47605e3986cbScth 	ASSERT(MDI_CLIENT_LOCKED(ct));
47614c06356bSdh142964 	if ((cdip == NULL) || (ddi_get_instance(cdip) == -1) ||
47627c478bd9Sstevel@tonic-gate 	    (MDI_CLIENT_IS_REPORT_DEV_NEEDED(ct) == 0)) {
47637c478bd9Sstevel@tonic-gate 		return;
47647c478bd9Sstevel@tonic-gate 	}
47657c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT_STATE(ct) == MDI_CLIENT_STATE_OPTIMAL) {
47667c478bd9Sstevel@tonic-gate 		ct_status = "optimal";
47674c06356bSdh142964 		report_lb_c = 1;
47687c478bd9Sstevel@tonic-gate 	} else if (MDI_CLIENT_STATE(ct) == MDI_CLIENT_STATE_DEGRADED) {
47697c478bd9Sstevel@tonic-gate 		ct_status = "degraded";
47707c478bd9Sstevel@tonic-gate 	} else if (MDI_CLIENT_STATE(ct) == MDI_CLIENT_STATE_FAILED) {
47717c478bd9Sstevel@tonic-gate 		ct_status = "failed";
47727c478bd9Sstevel@tonic-gate 	} else {
47737c478bd9Sstevel@tonic-gate 		ct_status = "unknown";
47747c478bd9Sstevel@tonic-gate 	}
47757c478bd9Sstevel@tonic-gate 
47764c06356bSdh142964 	lb_buf[0] = 0;		/* not interested in load balancing config */
47774c06356bSdh142964 
47784c06356bSdh142964 	if (MDI_PI_FLAGS_IS_DEVICE_REMOVED(pip)) {
47794c06356bSdh142964 		status = "removed";
47804c06356bSdh142964 	} else if (MDI_PI_IS_OFFLINE(pip)) {
47817c478bd9Sstevel@tonic-gate 		status = "offline";
47827c478bd9Sstevel@tonic-gate 	} else if (MDI_PI_IS_ONLINE(pip)) {
47837c478bd9Sstevel@tonic-gate 		status = "online";
47844c06356bSdh142964 		report_lb_p = 1;
47857c478bd9Sstevel@tonic-gate 	} else if (MDI_PI_IS_STANDBY(pip)) {
47867c478bd9Sstevel@tonic-gate 		status = "standby";
47877c478bd9Sstevel@tonic-gate 	} else if (MDI_PI_IS_FAULT(pip)) {
47887c478bd9Sstevel@tonic-gate 		status = "faulted";
47897c478bd9Sstevel@tonic-gate 	} else {
47907c478bd9Sstevel@tonic-gate 		status = "unknown";
47917c478bd9Sstevel@tonic-gate 	}
47927c478bd9Sstevel@tonic-gate 
47934c06356bSdh142964 	if (cdip) {
47944c06356bSdh142964 		ct_path = kmem_alloc(MAXPATHLEN, KM_SLEEP);
47954c06356bSdh142964 
47964c06356bSdh142964 		/*
47974c06356bSdh142964 		 * NOTE: Keeping "multipath status: %s" and
47984c06356bSdh142964 		 * "Load balancing: %s" format unchanged in case someone
47994c06356bSdh142964 		 * scrubs /var/adm/messages looking for these messages.
48004c06356bSdh142964 		 */
48014c06356bSdh142964 		if (report_lb_c && report_lb_p) {
48027c478bd9Sstevel@tonic-gate 			if (ct->ct_lb == LOAD_BALANCE_LBA) {
48037c478bd9Sstevel@tonic-gate 				(void) snprintf(lb_buf, sizeof (lb_buf),
48047c478bd9Sstevel@tonic-gate 				    "%s, region-size: %d", mdi_load_balance_lba,
48057c478bd9Sstevel@tonic-gate 				    ct->ct_lb_args->region_size);
48067c478bd9Sstevel@tonic-gate 			} else if (ct->ct_lb == LOAD_BALANCE_NONE) {
48077c478bd9Sstevel@tonic-gate 				(void) snprintf(lb_buf, sizeof (lb_buf),
48087c478bd9Sstevel@tonic-gate 				    "%s", mdi_load_balance_none);
48097c478bd9Sstevel@tonic-gate 			} else {
48107c478bd9Sstevel@tonic-gate 				(void) snprintf(lb_buf, sizeof (lb_buf), "%s",
48117c478bd9Sstevel@tonic-gate 				    mdi_load_balance_rr);
48127c478bd9Sstevel@tonic-gate 			}
48137c478bd9Sstevel@tonic-gate 
48144c06356bSdh142964 			cmn_err(mdi_debug_consoleonly ? CE_NOTE : CE_CONT,
48154c06356bSdh142964 			    "?%s (%s%d) multipath status: %s: "
48164c06356bSdh142964 			    "path %d %s is %s: Load balancing: %s\n",
48174c06356bSdh142964 			    ddi_pathname(cdip, ct_path), ddi_driver_name(cdip),
48184c06356bSdh142964 			    ddi_get_instance(cdip), ct_status,
48194c06356bSdh142964 			    mdi_pi_get_path_instance(pip),
48204c06356bSdh142964 			    mdi_pi_spathname(pip), status, lb_buf);
48214c06356bSdh142964 		} else {
48224c06356bSdh142964 			cmn_err(mdi_debug_consoleonly ? CE_NOTE : CE_CONT,
48234c06356bSdh142964 			    "?%s (%s%d) multipath status: %s: "
48244c06356bSdh142964 			    "path %d %s is %s\n",
48254c06356bSdh142964 			    ddi_pathname(cdip, ct_path), ddi_driver_name(cdip),
48264c06356bSdh142964 			    ddi_get_instance(cdip), ct_status,
48274c06356bSdh142964 			    mdi_pi_get_path_instance(pip),
48284c06356bSdh142964 			    mdi_pi_spathname(pip), status);
48294c06356bSdh142964 		}
48304c06356bSdh142964 
48317c478bd9Sstevel@tonic-gate 		kmem_free(ct_path, MAXPATHLEN);
48327c478bd9Sstevel@tonic-gate 		MDI_CLIENT_CLEAR_REPORT_DEV_NEEDED(ct);
48337c478bd9Sstevel@tonic-gate 	}
48347c478bd9Sstevel@tonic-gate }
48357c478bd9Sstevel@tonic-gate 
48367c478bd9Sstevel@tonic-gate #ifdef	DEBUG
48377c478bd9Sstevel@tonic-gate /*
48387c478bd9Sstevel@tonic-gate  * i_mdi_log():
48397c478bd9Sstevel@tonic-gate  *		Utility function for error message management
48407c478bd9Sstevel@tonic-gate  *
48414c06356bSdh142964  *		NOTE: Implementation takes care of trailing \n for cmn_err,
48424c06356bSdh142964  *		MDI_DEBUG should not terminate fmt strings with \n.
48434c06356bSdh142964  *
48444c06356bSdh142964  *		NOTE: If the level is >= 2, and there is no leading !?^
48454c06356bSdh142964  *		then a leading ! is implied (but can be overriden via
48464c06356bSdh142964  *		mdi_debug_consoleonly). If you are using kmdb on the console,
48474c06356bSdh142964  *		consider setting mdi_debug_consoleonly to 1 as an aid.
48487c478bd9Sstevel@tonic-gate  */
48494c06356bSdh142964 /*PRINTFLIKE4*/
48507c478bd9Sstevel@tonic-gate static void
48514c06356bSdh142964 i_mdi_log(int level, const char *func, dev_info_t *dip, const char *fmt, ...)
48527c478bd9Sstevel@tonic-gate {
4853c73a93f2Sdm120769 	char		name[MAXNAMELEN];
48544c06356bSdh142964 	char		buf[512];
48555e3986cbScth 	char		*bp;
48567c478bd9Sstevel@tonic-gate 	va_list		ap;
48577c478bd9Sstevel@tonic-gate 	int		log_only = 0;
48587c478bd9Sstevel@tonic-gate 	int		boot_only = 0;
48597c478bd9Sstevel@tonic-gate 	int		console_only = 0;
48607c478bd9Sstevel@tonic-gate 
48617c478bd9Sstevel@tonic-gate 	if (dip) {
48624c06356bSdh142964 		(void) snprintf(name, sizeof(name), "%s%d: ",
486355e592a2SRandall Ralphs 		    ddi_driver_name(dip), ddi_get_instance(dip));
4864c73a93f2Sdm120769 	} else {
48655e3986cbScth 		name[0] = 0;
48667c478bd9Sstevel@tonic-gate 	}
48677c478bd9Sstevel@tonic-gate 
48687c478bd9Sstevel@tonic-gate 	va_start(ap, fmt);
48694c06356bSdh142964 	(void) vsnprintf(buf, sizeof(buf), fmt, ap);
48707c478bd9Sstevel@tonic-gate 	va_end(ap);
48717c478bd9Sstevel@tonic-gate 
48727c478bd9Sstevel@tonic-gate 	switch (buf[0]) {
48737c478bd9Sstevel@tonic-gate 	case '!':
48745e3986cbScth 		bp = &buf[1];
48757c478bd9Sstevel@tonic-gate 		log_only = 1;
48767c478bd9Sstevel@tonic-gate 		break;
48777c478bd9Sstevel@tonic-gate 	case '?':
48785e3986cbScth 		bp = &buf[1];
48797c478bd9Sstevel@tonic-gate 		boot_only = 1;
48807c478bd9Sstevel@tonic-gate 		break;
48817c478bd9Sstevel@tonic-gate 	case '^':
48825e3986cbScth 		bp = &buf[1];
48837c478bd9Sstevel@tonic-gate 		console_only = 1;
48847c478bd9Sstevel@tonic-gate 		break;
48855e3986cbScth 	default:
48864c06356bSdh142964 		if (level >= 2)
48874c06356bSdh142964 			log_only = 1;		/* ! implied */
48885e3986cbScth 		bp = buf;
48895e3986cbScth 		break;
48905e3986cbScth 	}
48915e3986cbScth 	if (mdi_debug_logonly) {
48925e3986cbScth 		log_only = 1;
48935e3986cbScth 		boot_only = 0;
48945e3986cbScth 		console_only = 0;
48957c478bd9Sstevel@tonic-gate 	}
48964c06356bSdh142964 	if (mdi_debug_consoleonly) {
48974c06356bSdh142964 		log_only = 0;
48984c06356bSdh142964 		boot_only = 0;
48994c06356bSdh142964 		console_only = 1;
49004c06356bSdh142964 		level = CE_NOTE;
49014c06356bSdh142964 		goto console;
49024c06356bSdh142964 	}
49037c478bd9Sstevel@tonic-gate 
49047c478bd9Sstevel@tonic-gate 	switch (level) {
49057c478bd9Sstevel@tonic-gate 	case CE_NOTE:
49067c478bd9Sstevel@tonic-gate 		level = CE_CONT;
49077c478bd9Sstevel@tonic-gate 		/* FALLTHROUGH */
49087c478bd9Sstevel@tonic-gate 	case CE_CONT:
49094c06356bSdh142964 		if (boot_only) {
49104c06356bSdh142964 			cmn_err(level, "?mdi: %s%s: %s\n", name, func, bp);
49114c06356bSdh142964 		} else if (console_only) {
49124c06356bSdh142964 			cmn_err(level, "^mdi: %s%s: %s\n", name, func, bp);
49134c06356bSdh142964 		} else if (log_only) {
49144c06356bSdh142964 			cmn_err(level, "!mdi: %s%s: %s\n", name, func, bp);
49154c06356bSdh142964 		} else {
49164c06356bSdh142964 			cmn_err(level, "mdi: %s%s: %s\n", name, func, bp);
49174c06356bSdh142964 		}
49184c06356bSdh142964 		break;
49194c06356bSdh142964 
49207c478bd9Sstevel@tonic-gate 	case CE_WARN:
49217c478bd9Sstevel@tonic-gate 	case CE_PANIC:
49224c06356bSdh142964 	console:
49237c478bd9Sstevel@tonic-gate 		if (boot_only) {
49244c06356bSdh142964 			cmn_err(level, "?mdi: %s%s: %s", name, func, bp);
49257c478bd9Sstevel@tonic-gate 		} else if (console_only) {
49264c06356bSdh142964 			cmn_err(level, "^mdi: %s%s: %s", name, func, bp);
49277c478bd9Sstevel@tonic-gate 		} else if (log_only) {
49284c06356bSdh142964 			cmn_err(level, "!mdi: %s%s: %s", name, func, bp);
49297c478bd9Sstevel@tonic-gate 		} else {
49304c06356bSdh142964 			cmn_err(level, "mdi: %s%s: %s", name, func, bp);
49317c478bd9Sstevel@tonic-gate 		}
49327c478bd9Sstevel@tonic-gate 		break;
49337c478bd9Sstevel@tonic-gate 	default:
49345e3986cbScth 		cmn_err(level, "mdi: %s%s", name, bp);
49357c478bd9Sstevel@tonic-gate 		break;
49367c478bd9Sstevel@tonic-gate 	}
49377c478bd9Sstevel@tonic-gate }
49387c478bd9Sstevel@tonic-gate #endif	/* DEBUG */
49397c478bd9Sstevel@tonic-gate 
49407c478bd9Sstevel@tonic-gate void
49417c478bd9Sstevel@tonic-gate i_mdi_client_online(dev_info_t *ct_dip)
49427c478bd9Sstevel@tonic-gate {
49437c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
49447c478bd9Sstevel@tonic-gate 
49457c478bd9Sstevel@tonic-gate 	/*
49467c478bd9Sstevel@tonic-gate 	 * Client online notification. Mark client state as online
49477c478bd9Sstevel@tonic-gate 	 * restore our binding with dev_info node
49487c478bd9Sstevel@tonic-gate 	 */
49497c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(ct_dip);
49507c478bd9Sstevel@tonic-gate 	ASSERT(ct != NULL);
49517c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
49527c478bd9Sstevel@tonic-gate 	MDI_CLIENT_SET_ONLINE(ct);
49537c478bd9Sstevel@tonic-gate 	/* catch for any memory leaks */
49547c478bd9Sstevel@tonic-gate 	ASSERT((ct->ct_dip == NULL) || (ct->ct_dip == ct_dip));
49557c478bd9Sstevel@tonic-gate 	ct->ct_dip = ct_dip;
49567c478bd9Sstevel@tonic-gate 
49577c478bd9Sstevel@tonic-gate 	if (ct->ct_power_cnt == 0)
49587c478bd9Sstevel@tonic-gate 		(void) i_mdi_power_all_phci(ct);
49597c478bd9Sstevel@tonic-gate 
49604c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, ct_dip,
49614c06356bSdh142964 	    "i_mdi_pm_hold_client %p", (void *)ct));
49627c478bd9Sstevel@tonic-gate 	i_mdi_pm_hold_client(ct, 1);
49637c478bd9Sstevel@tonic-gate 
49647c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
49657c478bd9Sstevel@tonic-gate }
49667c478bd9Sstevel@tonic-gate 
49677c478bd9Sstevel@tonic-gate void
49687c478bd9Sstevel@tonic-gate i_mdi_phci_online(dev_info_t *ph_dip)
49697c478bd9Sstevel@tonic-gate {
49707c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
49717c478bd9Sstevel@tonic-gate 
49727c478bd9Sstevel@tonic-gate 	/* pHCI online notification. Mark state accordingly */
49737c478bd9Sstevel@tonic-gate 	ph = i_devi_get_phci(ph_dip);
49747c478bd9Sstevel@tonic-gate 	ASSERT(ph != NULL);
49757c478bd9Sstevel@tonic-gate 	MDI_PHCI_LOCK(ph);
49767c478bd9Sstevel@tonic-gate 	MDI_PHCI_SET_ONLINE(ph);
49777c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNLOCK(ph);
49787c478bd9Sstevel@tonic-gate }
49797c478bd9Sstevel@tonic-gate 
49807c478bd9Sstevel@tonic-gate /*
49817c478bd9Sstevel@tonic-gate  * mdi_devi_online():
49827c478bd9Sstevel@tonic-gate  * 		Online notification from NDI framework on pHCI/client
49837c478bd9Sstevel@tonic-gate  *		device online.
49847c478bd9Sstevel@tonic-gate  * Return Values:
49857c478bd9Sstevel@tonic-gate  *		NDI_SUCCESS
49867c478bd9Sstevel@tonic-gate  *		MDI_FAILURE
49877c478bd9Sstevel@tonic-gate  */
49887c478bd9Sstevel@tonic-gate /*ARGSUSED*/
49897c478bd9Sstevel@tonic-gate int
49907c478bd9Sstevel@tonic-gate mdi_devi_online(dev_info_t *dip, uint_t flags)
49917c478bd9Sstevel@tonic-gate {
49927c478bd9Sstevel@tonic-gate 	if (MDI_PHCI(dip)) {
49937c478bd9Sstevel@tonic-gate 		i_mdi_phci_online(dip);
49947c478bd9Sstevel@tonic-gate 	}
49957c478bd9Sstevel@tonic-gate 
49967c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT(dip)) {
49977c478bd9Sstevel@tonic-gate 		i_mdi_client_online(dip);
49987c478bd9Sstevel@tonic-gate 	}
49997c478bd9Sstevel@tonic-gate 	return (NDI_SUCCESS);
50007c478bd9Sstevel@tonic-gate }
50017c478bd9Sstevel@tonic-gate 
50027c478bd9Sstevel@tonic-gate /*
50037c478bd9Sstevel@tonic-gate  * mdi_devi_offline():
50047c478bd9Sstevel@tonic-gate  * 		Offline notification from NDI framework on pHCI/Client device
50057c478bd9Sstevel@tonic-gate  *		offline.
50067c478bd9Sstevel@tonic-gate  *
50077c478bd9Sstevel@tonic-gate  * Return Values:
50087c478bd9Sstevel@tonic-gate  *		NDI_SUCCESS
50097c478bd9Sstevel@tonic-gate  *		NDI_FAILURE
50107c478bd9Sstevel@tonic-gate  */
50117c478bd9Sstevel@tonic-gate /*ARGSUSED*/
50127c478bd9Sstevel@tonic-gate int
50137c478bd9Sstevel@tonic-gate mdi_devi_offline(dev_info_t *dip, uint_t flags)
50147c478bd9Sstevel@tonic-gate {
50157c478bd9Sstevel@tonic-gate 	int		rv = NDI_SUCCESS;
50167c478bd9Sstevel@tonic-gate 
50177c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT(dip)) {
50187c478bd9Sstevel@tonic-gate 		rv = i_mdi_client_offline(dip, flags);
50197c478bd9Sstevel@tonic-gate 		if (rv != NDI_SUCCESS)
50207c478bd9Sstevel@tonic-gate 			return (rv);
50217c478bd9Sstevel@tonic-gate 	}
50227c478bd9Sstevel@tonic-gate 
50237c478bd9Sstevel@tonic-gate 	if (MDI_PHCI(dip)) {
50247c478bd9Sstevel@tonic-gate 		rv = i_mdi_phci_offline(dip, flags);
50255e3986cbScth 
50267c478bd9Sstevel@tonic-gate 		if ((rv != NDI_SUCCESS) && MDI_CLIENT(dip)) {
50277c478bd9Sstevel@tonic-gate 			/* set client back online */
50287c478bd9Sstevel@tonic-gate 			i_mdi_client_online(dip);
50297c478bd9Sstevel@tonic-gate 		}
50307c478bd9Sstevel@tonic-gate 	}
50317c478bd9Sstevel@tonic-gate 
50327c478bd9Sstevel@tonic-gate 	return (rv);
50337c478bd9Sstevel@tonic-gate }
50347c478bd9Sstevel@tonic-gate 
50357c478bd9Sstevel@tonic-gate /*ARGSUSED*/
50367c478bd9Sstevel@tonic-gate static int
50377c478bd9Sstevel@tonic-gate i_mdi_phci_offline(dev_info_t *dip, uint_t flags)
50387c478bd9Sstevel@tonic-gate {
50397c478bd9Sstevel@tonic-gate 	int		rv = NDI_SUCCESS;
50407c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
50417c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
50427c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*pip;
50437c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*next;
50447c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*failed_pip = NULL;
50457c478bd9Sstevel@tonic-gate 	dev_info_t	*cdip;
50467c478bd9Sstevel@tonic-gate 
50477c478bd9Sstevel@tonic-gate 	/*
50487c478bd9Sstevel@tonic-gate 	 * pHCI component offline notification
50497c478bd9Sstevel@tonic-gate 	 * Make sure that this pHCI instance is free to be offlined.
50507c478bd9Sstevel@tonic-gate 	 * If it is OK to proceed, Offline and remove all the child
50517c478bd9Sstevel@tonic-gate 	 * mdi_pathinfo nodes.  This process automatically offlines
50527c478bd9Sstevel@tonic-gate 	 * corresponding client devices, for which this pHCI provides
50537c478bd9Sstevel@tonic-gate 	 * critical services.
50547c478bd9Sstevel@tonic-gate 	 */
50557c478bd9Sstevel@tonic-gate 	ph = i_devi_get_phci(dip);
50564c06356bSdh142964 	MDI_DEBUG(2, (MDI_NOTE, dip,
50574c06356bSdh142964 	    "called %p %p", (void *)dip, (void *)ph));
50587c478bd9Sstevel@tonic-gate 	if (ph == NULL) {
50597c478bd9Sstevel@tonic-gate 		return (rv);
50607c478bd9Sstevel@tonic-gate 	}
50617c478bd9Sstevel@tonic-gate 
50627c478bd9Sstevel@tonic-gate 	MDI_PHCI_LOCK(ph);
50637c478bd9Sstevel@tonic-gate 
50647c478bd9Sstevel@tonic-gate 	if (MDI_PHCI_IS_OFFLINE(ph)) {
50654c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, dip,
50664c06356bSdh142964 		    "!pHCI already offlined: %p", (void *)dip));
50677c478bd9Sstevel@tonic-gate 		MDI_PHCI_UNLOCK(ph);
50687c478bd9Sstevel@tonic-gate 		return (NDI_SUCCESS);
50697c478bd9Sstevel@tonic-gate 	}
50707c478bd9Sstevel@tonic-gate 
50717c478bd9Sstevel@tonic-gate 	/*
50727c478bd9Sstevel@tonic-gate 	 * Check to see if the pHCI can be offlined
50737c478bd9Sstevel@tonic-gate 	 */
50747c478bd9Sstevel@tonic-gate 	if (ph->ph_unstable) {
50754c06356bSdh142964 		MDI_DEBUG(1, (MDI_WARN, dip,
50764c06356bSdh142964 		    "!One or more target devices are in transient state. "
50774c06356bSdh142964 		    "This device can not be removed at this moment. "
50784c06356bSdh142964 		    "Please try again later."));
50797c478bd9Sstevel@tonic-gate 		MDI_PHCI_UNLOCK(ph);
50807c478bd9Sstevel@tonic-gate 		return (NDI_BUSY);
50817c478bd9Sstevel@tonic-gate 	}
50827c478bd9Sstevel@tonic-gate 
50837c478bd9Sstevel@tonic-gate 	pip = ph->ph_path_head;
50847c478bd9Sstevel@tonic-gate 	while (pip != NULL) {
50857c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
50867c478bd9Sstevel@tonic-gate 		next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
50875e3986cbScth 
50887c478bd9Sstevel@tonic-gate 		/*
50897c478bd9Sstevel@tonic-gate 		 * The mdi_pathinfo state is OK. Check the client state.
50907c478bd9Sstevel@tonic-gate 		 * If failover in progress fail the pHCI from offlining
50917c478bd9Sstevel@tonic-gate 		 */
50927c478bd9Sstevel@tonic-gate 		ct = MDI_PI(pip)->pi_client;
50937c478bd9Sstevel@tonic-gate 		i_mdi_client_lock(ct, pip);
50947c478bd9Sstevel@tonic-gate 		if ((MDI_CLIENT_IS_FAILOVER_IN_PROGRESS(ct)) ||
50957c478bd9Sstevel@tonic-gate 		    (ct->ct_unstable)) {
50967c478bd9Sstevel@tonic-gate 			/*
50977c478bd9Sstevel@tonic-gate 			 * Failover is in progress, Fail the DR
50987c478bd9Sstevel@tonic-gate 			 */
50994c06356bSdh142964 			MDI_DEBUG(1, (MDI_WARN, dip,
51004c06356bSdh142964 			    "!pHCI device is busy. "
51014c06356bSdh142964 			    "This device can not be removed at this moment. "
51024c06356bSdh142964 			    "Please try again later."));
51037c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
51045e3986cbScth 			i_mdi_client_unlock(ct);
51057c478bd9Sstevel@tonic-gate 			MDI_PHCI_UNLOCK(ph);
51067c478bd9Sstevel@tonic-gate 			return (NDI_BUSY);
51077c478bd9Sstevel@tonic-gate 		}
51087c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
51097c478bd9Sstevel@tonic-gate 
51107c478bd9Sstevel@tonic-gate 		/*
51117c478bd9Sstevel@tonic-gate 		 * Check to see of we are removing the last path of this
51127c478bd9Sstevel@tonic-gate 		 * client device...
51137c478bd9Sstevel@tonic-gate 		 */
51147c478bd9Sstevel@tonic-gate 		cdip = ct->ct_dip;
51157c478bd9Sstevel@tonic-gate 		if (cdip && (i_ddi_node_state(cdip) >= DS_INITIALIZED) &&
51167c478bd9Sstevel@tonic-gate 		    (i_mdi_client_compute_state(ct, ph) ==
51177c478bd9Sstevel@tonic-gate 		    MDI_CLIENT_STATE_FAILED)) {
51187c478bd9Sstevel@tonic-gate 			i_mdi_client_unlock(ct);
51197c478bd9Sstevel@tonic-gate 			MDI_PHCI_UNLOCK(ph);
51204c06356bSdh142964 			if (ndi_devi_offline(cdip,
51214c06356bSdh142964 			    NDI_DEVFS_CLEAN) != NDI_SUCCESS) {
51227c478bd9Sstevel@tonic-gate 				/*
51237c478bd9Sstevel@tonic-gate 				 * ndi_devi_offline() failed.
51247c478bd9Sstevel@tonic-gate 				 * This pHCI provides the critical path
51257c478bd9Sstevel@tonic-gate 				 * to one or more client devices.
51267c478bd9Sstevel@tonic-gate 				 * Return busy.
51277c478bd9Sstevel@tonic-gate 				 */
51287c478bd9Sstevel@tonic-gate 				MDI_PHCI_LOCK(ph);
51294c06356bSdh142964 				MDI_DEBUG(1, (MDI_WARN, dip,
51304c06356bSdh142964 				    "!pHCI device is busy. "
51314c06356bSdh142964 				    "This device can not be removed at this "
51324c06356bSdh142964 				    "moment. Please try again later."));
51337c478bd9Sstevel@tonic-gate 				failed_pip = pip;
51347c478bd9Sstevel@tonic-gate 				break;
51357c478bd9Sstevel@tonic-gate 			} else {
51367c478bd9Sstevel@tonic-gate 				MDI_PHCI_LOCK(ph);
51377c478bd9Sstevel@tonic-gate 				pip = next;
51387c478bd9Sstevel@tonic-gate 			}
51397c478bd9Sstevel@tonic-gate 		} else {
51407c478bd9Sstevel@tonic-gate 			i_mdi_client_unlock(ct);
51417c478bd9Sstevel@tonic-gate 			pip = next;
51427c478bd9Sstevel@tonic-gate 		}
51437c478bd9Sstevel@tonic-gate 	}
51447c478bd9Sstevel@tonic-gate 
51457c478bd9Sstevel@tonic-gate 	if (failed_pip) {
51467c478bd9Sstevel@tonic-gate 		pip = ph->ph_path_head;
51477c478bd9Sstevel@tonic-gate 		while (pip != failed_pip) {
51487c478bd9Sstevel@tonic-gate 			MDI_PI_LOCK(pip);
51497c478bd9Sstevel@tonic-gate 			next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
51507c478bd9Sstevel@tonic-gate 			ct = MDI_PI(pip)->pi_client;
51517c478bd9Sstevel@tonic-gate 			i_mdi_client_lock(ct, pip);
51527c478bd9Sstevel@tonic-gate 			cdip = ct->ct_dip;
51537c478bd9Sstevel@tonic-gate 			switch (MDI_CLIENT_STATE(ct)) {
51547c478bd9Sstevel@tonic-gate 			case MDI_CLIENT_STATE_OPTIMAL:
51557c478bd9Sstevel@tonic-gate 			case MDI_CLIENT_STATE_DEGRADED:
51567c478bd9Sstevel@tonic-gate 				if (cdip) {
51577c478bd9Sstevel@tonic-gate 					MDI_PI_UNLOCK(pip);
51587c478bd9Sstevel@tonic-gate 					i_mdi_client_unlock(ct);
51597c478bd9Sstevel@tonic-gate 					MDI_PHCI_UNLOCK(ph);
51607c478bd9Sstevel@tonic-gate 					(void) ndi_devi_online(cdip, 0);
51617c478bd9Sstevel@tonic-gate 					MDI_PHCI_LOCK(ph);
51627c478bd9Sstevel@tonic-gate 					pip = next;
51637c478bd9Sstevel@tonic-gate 					continue;
51647c478bd9Sstevel@tonic-gate 				}
51657c478bd9Sstevel@tonic-gate 				break;
51667c478bd9Sstevel@tonic-gate 
51677c478bd9Sstevel@tonic-gate 			case MDI_CLIENT_STATE_FAILED:
51687c478bd9Sstevel@tonic-gate 				if (cdip) {
51697c478bd9Sstevel@tonic-gate 					MDI_PI_UNLOCK(pip);
51707c478bd9Sstevel@tonic-gate 					i_mdi_client_unlock(ct);
51717c478bd9Sstevel@tonic-gate 					MDI_PHCI_UNLOCK(ph);
51724c06356bSdh142964 					(void) ndi_devi_offline(cdip,
51734c06356bSdh142964 						NDI_DEVFS_CLEAN);
51747c478bd9Sstevel@tonic-gate 					MDI_PHCI_LOCK(ph);
51757c478bd9Sstevel@tonic-gate 					pip = next;
51767c478bd9Sstevel@tonic-gate 					continue;
51777c478bd9Sstevel@tonic-gate 				}
51787c478bd9Sstevel@tonic-gate 				break;
51797c478bd9Sstevel@tonic-gate 			}
51807c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
51817c478bd9Sstevel@tonic-gate 			i_mdi_client_unlock(ct);
51827c478bd9Sstevel@tonic-gate 			pip = next;
51837c478bd9Sstevel@tonic-gate 		}
51847c478bd9Sstevel@tonic-gate 		MDI_PHCI_UNLOCK(ph);
51857c478bd9Sstevel@tonic-gate 		return (NDI_BUSY);
51867c478bd9Sstevel@tonic-gate 	}
51877c478bd9Sstevel@tonic-gate 
51887c478bd9Sstevel@tonic-gate 	/*
51897c478bd9Sstevel@tonic-gate 	 * Mark the pHCI as offline
51907c478bd9Sstevel@tonic-gate 	 */
51917c478bd9Sstevel@tonic-gate 	MDI_PHCI_SET_OFFLINE(ph);
51927c478bd9Sstevel@tonic-gate 
51937c478bd9Sstevel@tonic-gate 	/*
51947c478bd9Sstevel@tonic-gate 	 * Mark the child mdi_pathinfo nodes as transient
51957c478bd9Sstevel@tonic-gate 	 */
51967c478bd9Sstevel@tonic-gate 	pip = ph->ph_path_head;
51977c478bd9Sstevel@tonic-gate 	while (pip != NULL) {
51987c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
51997c478bd9Sstevel@tonic-gate 		next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
52007c478bd9Sstevel@tonic-gate 		MDI_PI_SET_OFFLINING(pip);
52017c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
52027c478bd9Sstevel@tonic-gate 		pip = next;
52037c478bd9Sstevel@tonic-gate 	}
52047c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNLOCK(ph);
52057c478bd9Sstevel@tonic-gate 	/*
52067c478bd9Sstevel@tonic-gate 	 * Give a chance for any pending commands to execute
52077c478bd9Sstevel@tonic-gate 	 */
520896c4a178SChris Horne 	delay_random(mdi_delay);
52097c478bd9Sstevel@tonic-gate 	MDI_PHCI_LOCK(ph);
52107c478bd9Sstevel@tonic-gate 	pip = ph->ph_path_head;
52117c478bd9Sstevel@tonic-gate 	while (pip != NULL) {
52127c478bd9Sstevel@tonic-gate 		next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
52137c478bd9Sstevel@tonic-gate 		(void) i_mdi_pi_offline(pip, flags);
52147c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
52157c478bd9Sstevel@tonic-gate 		ct = MDI_PI(pip)->pi_client;
52167c478bd9Sstevel@tonic-gate 		if (!MDI_PI_IS_OFFLINE(pip)) {
52174c06356bSdh142964 			MDI_DEBUG(1, (MDI_WARN, dip,
52184c06356bSdh142964 			    "!pHCI device is busy. "
52194c06356bSdh142964 			    "This device can not be removed at this moment. "
52204c06356bSdh142964 			    "Please try again later."));
52217c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
52227c478bd9Sstevel@tonic-gate 			MDI_PHCI_SET_ONLINE(ph);
52237c478bd9Sstevel@tonic-gate 			MDI_PHCI_UNLOCK(ph);
52247c478bd9Sstevel@tonic-gate 			return (NDI_BUSY);
52257c478bd9Sstevel@tonic-gate 		}
52267c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
52277c478bd9Sstevel@tonic-gate 		pip = next;
52287c478bd9Sstevel@tonic-gate 	}
52297c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNLOCK(ph);
52307c478bd9Sstevel@tonic-gate 
52317c478bd9Sstevel@tonic-gate 	return (rv);
52327c478bd9Sstevel@tonic-gate }
52337c478bd9Sstevel@tonic-gate 
523425e8c5aaSvikram void
523525e8c5aaSvikram mdi_phci_mark_retiring(dev_info_t *dip, char **cons_array)
523625e8c5aaSvikram {
523725e8c5aaSvikram 	mdi_phci_t	*ph;
523825e8c5aaSvikram 	mdi_client_t	*ct;
523925e8c5aaSvikram 	mdi_pathinfo_t	*pip;
524025e8c5aaSvikram 	mdi_pathinfo_t	*next;
524125e8c5aaSvikram 	dev_info_t	*cdip;
524225e8c5aaSvikram 
524325e8c5aaSvikram 	if (!MDI_PHCI(dip))
524425e8c5aaSvikram 		return;
524525e8c5aaSvikram 
524625e8c5aaSvikram 	ph = i_devi_get_phci(dip);
524725e8c5aaSvikram 	if (ph == NULL) {
524825e8c5aaSvikram 		return;
524925e8c5aaSvikram 	}
525025e8c5aaSvikram 
525125e8c5aaSvikram 	MDI_PHCI_LOCK(ph);
525225e8c5aaSvikram 
525325e8c5aaSvikram 	if (MDI_PHCI_IS_OFFLINE(ph)) {
525425e8c5aaSvikram 		/* has no last path */
525525e8c5aaSvikram 		MDI_PHCI_UNLOCK(ph);
525625e8c5aaSvikram 		return;
525725e8c5aaSvikram 	}
525825e8c5aaSvikram 
525925e8c5aaSvikram 	pip = ph->ph_path_head;
526025e8c5aaSvikram 	while (pip != NULL) {
526125e8c5aaSvikram 		MDI_PI_LOCK(pip);
526225e8c5aaSvikram 		next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
526325e8c5aaSvikram 
526425e8c5aaSvikram 		ct = MDI_PI(pip)->pi_client;
526525e8c5aaSvikram 		i_mdi_client_lock(ct, pip);
526625e8c5aaSvikram 		MDI_PI_UNLOCK(pip);
526725e8c5aaSvikram 
526825e8c5aaSvikram 		cdip = ct->ct_dip;
526925e8c5aaSvikram 		if (cdip && (i_ddi_node_state(cdip) >= DS_INITIALIZED) &&
527025e8c5aaSvikram 		    (i_mdi_client_compute_state(ct, ph) ==
527125e8c5aaSvikram 		    MDI_CLIENT_STATE_FAILED)) {
527225e8c5aaSvikram 			/* Last path. Mark client dip as retiring */
527325e8c5aaSvikram 			i_mdi_client_unlock(ct);
527425e8c5aaSvikram 			MDI_PHCI_UNLOCK(ph);
527525e8c5aaSvikram 			(void) e_ddi_mark_retiring(cdip, cons_array);
527625e8c5aaSvikram 			MDI_PHCI_LOCK(ph);
527725e8c5aaSvikram 			pip = next;
527825e8c5aaSvikram 		} else {
527925e8c5aaSvikram 			i_mdi_client_unlock(ct);
528025e8c5aaSvikram 			pip = next;
528125e8c5aaSvikram 		}
528225e8c5aaSvikram 	}
528325e8c5aaSvikram 
528425e8c5aaSvikram 	MDI_PHCI_UNLOCK(ph);
528525e8c5aaSvikram 
528625e8c5aaSvikram 	return;
528725e8c5aaSvikram }
528825e8c5aaSvikram 
528925e8c5aaSvikram void
529025e8c5aaSvikram mdi_phci_retire_notify(dev_info_t *dip, int *constraint)
529125e8c5aaSvikram {
529225e8c5aaSvikram 	mdi_phci_t	*ph;
529325e8c5aaSvikram 	mdi_client_t	*ct;
529425e8c5aaSvikram 	mdi_pathinfo_t	*pip;
529525e8c5aaSvikram 	mdi_pathinfo_t	*next;
529625e8c5aaSvikram 	dev_info_t	*cdip;
529725e8c5aaSvikram 
529825e8c5aaSvikram 	if (!MDI_PHCI(dip))
529925e8c5aaSvikram 		return;
530025e8c5aaSvikram 
530125e8c5aaSvikram 	ph = i_devi_get_phci(dip);
530225e8c5aaSvikram 	if (ph == NULL)
530325e8c5aaSvikram 		return;
530425e8c5aaSvikram 
530525e8c5aaSvikram 	MDI_PHCI_LOCK(ph);
530625e8c5aaSvikram 
530725e8c5aaSvikram 	if (MDI_PHCI_IS_OFFLINE(ph)) {
530825e8c5aaSvikram 		MDI_PHCI_UNLOCK(ph);
530925e8c5aaSvikram 		/* not last path */
531025e8c5aaSvikram 		return;
531125e8c5aaSvikram 	}
531225e8c5aaSvikram 
531325e8c5aaSvikram 	if (ph->ph_unstable) {
531425e8c5aaSvikram 		MDI_PHCI_UNLOCK(ph);
531525e8c5aaSvikram 		/* can't check for constraints */
531625e8c5aaSvikram 		*constraint = 0;
531725e8c5aaSvikram 		return;
531825e8c5aaSvikram 	}
531925e8c5aaSvikram 
532025e8c5aaSvikram 	pip = ph->ph_path_head;
532125e8c5aaSvikram 	while (pip != NULL) {
532225e8c5aaSvikram 		MDI_PI_LOCK(pip);
532325e8c5aaSvikram 		next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
532425e8c5aaSvikram 
532525e8c5aaSvikram 		/*
532625e8c5aaSvikram 		 * The mdi_pathinfo state is OK. Check the client state.
532725e8c5aaSvikram 		 * If failover in progress fail the pHCI from offlining
532825e8c5aaSvikram 		 */
532925e8c5aaSvikram 		ct = MDI_PI(pip)->pi_client;
533025e8c5aaSvikram 		i_mdi_client_lock(ct, pip);
533125e8c5aaSvikram 		if ((MDI_CLIENT_IS_FAILOVER_IN_PROGRESS(ct)) ||
533225e8c5aaSvikram 		    (ct->ct_unstable)) {
533325e8c5aaSvikram 			/*
533425e8c5aaSvikram 			 * Failover is in progress, can't check for constraints
533525e8c5aaSvikram 			 */
533625e8c5aaSvikram 			MDI_PI_UNLOCK(pip);
533725e8c5aaSvikram 			i_mdi_client_unlock(ct);
533825e8c5aaSvikram 			MDI_PHCI_UNLOCK(ph);
533925e8c5aaSvikram 			*constraint = 0;
534025e8c5aaSvikram 			return;
534125e8c5aaSvikram 		}
534225e8c5aaSvikram 		MDI_PI_UNLOCK(pip);
534325e8c5aaSvikram 
534425e8c5aaSvikram 		/*
534525e8c5aaSvikram 		 * Check to see of we are retiring the last path of this
534625e8c5aaSvikram 		 * client device...
534725e8c5aaSvikram 		 */
534825e8c5aaSvikram 		cdip = ct->ct_dip;
534925e8c5aaSvikram 		if (cdip && (i_ddi_node_state(cdip) >= DS_INITIALIZED) &&
535025e8c5aaSvikram 		    (i_mdi_client_compute_state(ct, ph) ==
535125e8c5aaSvikram 		    MDI_CLIENT_STATE_FAILED)) {
535225e8c5aaSvikram 			i_mdi_client_unlock(ct);
535325e8c5aaSvikram 			MDI_PHCI_UNLOCK(ph);
535425e8c5aaSvikram 			(void) e_ddi_retire_notify(cdip, constraint);
535525e8c5aaSvikram 			MDI_PHCI_LOCK(ph);
535625e8c5aaSvikram 			pip = next;
535725e8c5aaSvikram 		} else {
535825e8c5aaSvikram 			i_mdi_client_unlock(ct);
535925e8c5aaSvikram 			pip = next;
536025e8c5aaSvikram 		}
536125e8c5aaSvikram 	}
536225e8c5aaSvikram 
536325e8c5aaSvikram 	MDI_PHCI_UNLOCK(ph);
536425e8c5aaSvikram 
536525e8c5aaSvikram 	return;
536625e8c5aaSvikram }
536725e8c5aaSvikram 
536825e8c5aaSvikram /*
53694c06356bSdh142964  * offline the path(s) hanging off the pHCI. If the
537025e8c5aaSvikram  * last path to any client, check that constraints
537125e8c5aaSvikram  * have been applied.
537225e8c5aaSvikram  */
537325e8c5aaSvikram void
537425e8c5aaSvikram mdi_phci_retire_finalize(dev_info_t *dip, int phci_only)
537525e8c5aaSvikram {
537625e8c5aaSvikram 	mdi_phci_t	*ph;
537725e8c5aaSvikram 	mdi_client_t	*ct;
537825e8c5aaSvikram 	mdi_pathinfo_t	*pip;
537925e8c5aaSvikram 	mdi_pathinfo_t	*next;
538025e8c5aaSvikram 	dev_info_t	*cdip;
538125e8c5aaSvikram 	int		unstable = 0;
538225e8c5aaSvikram 	int		constraint;
538325e8c5aaSvikram 
538425e8c5aaSvikram 	if (!MDI_PHCI(dip))
538525e8c5aaSvikram 		return;
538625e8c5aaSvikram 
538725e8c5aaSvikram 	ph = i_devi_get_phci(dip);
538825e8c5aaSvikram 	if (ph == NULL) {
538925e8c5aaSvikram 		/* no last path and no pips */
539025e8c5aaSvikram 		return;
539125e8c5aaSvikram 	}
539225e8c5aaSvikram 
539325e8c5aaSvikram 	MDI_PHCI_LOCK(ph);
539425e8c5aaSvikram 
539525e8c5aaSvikram 	if (MDI_PHCI_IS_OFFLINE(ph)) {
539625e8c5aaSvikram 		MDI_PHCI_UNLOCK(ph);
539725e8c5aaSvikram 		/* no last path and no pips */
539825e8c5aaSvikram 		return;
539925e8c5aaSvikram 	}
540025e8c5aaSvikram 
540125e8c5aaSvikram 	/*
540225e8c5aaSvikram 	 * Check to see if the pHCI can be offlined
540325e8c5aaSvikram 	 */
540425e8c5aaSvikram 	if (ph->ph_unstable) {
540525e8c5aaSvikram 		unstable = 1;
540625e8c5aaSvikram 	}
540725e8c5aaSvikram 
540825e8c5aaSvikram 	pip = ph->ph_path_head;
540925e8c5aaSvikram 	while (pip != NULL) {
541025e8c5aaSvikram 		MDI_PI_LOCK(pip);
541125e8c5aaSvikram 		next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
541225e8c5aaSvikram 
541325e8c5aaSvikram 		/*
541425e8c5aaSvikram 		 * if failover in progress fail the pHCI from offlining
541525e8c5aaSvikram 		 */
541625e8c5aaSvikram 		ct = MDI_PI(pip)->pi_client;
541725e8c5aaSvikram 		i_mdi_client_lock(ct, pip);
541825e8c5aaSvikram 		if ((MDI_CLIENT_IS_FAILOVER_IN_PROGRESS(ct)) ||
541925e8c5aaSvikram 		    (ct->ct_unstable)) {
542025e8c5aaSvikram 			unstable = 1;
542125e8c5aaSvikram 		}
542225e8c5aaSvikram 		MDI_PI_UNLOCK(pip);
542325e8c5aaSvikram 
542425e8c5aaSvikram 		/*
542525e8c5aaSvikram 		 * Check to see of we are removing the last path of this
542625e8c5aaSvikram 		 * client device...
542725e8c5aaSvikram 		 */
542825e8c5aaSvikram 		cdip = ct->ct_dip;
542925e8c5aaSvikram 		if (!phci_only && cdip &&
543025e8c5aaSvikram 		    (i_ddi_node_state(cdip) >= DS_INITIALIZED) &&
543125e8c5aaSvikram 		    (i_mdi_client_compute_state(ct, ph) ==
543225e8c5aaSvikram 		    MDI_CLIENT_STATE_FAILED)) {
543325e8c5aaSvikram 			i_mdi_client_unlock(ct);
543425e8c5aaSvikram 			MDI_PHCI_UNLOCK(ph);
543525e8c5aaSvikram 			/*
543625e8c5aaSvikram 			 * We don't retire clients we just retire the
543725e8c5aaSvikram 			 * path to a client. If it is the last path
543825e8c5aaSvikram 			 * to a client, constraints are checked and
543925e8c5aaSvikram 			 * if we pass the last path is offlined. MPXIO will
544025e8c5aaSvikram 			 * then fail all I/Os to the client. Since we don't
544125e8c5aaSvikram 			 * want to retire the client on a path error
544225e8c5aaSvikram 			 * set constraint = 0 so that the client dip
544325e8c5aaSvikram 			 * is not retired.
544425e8c5aaSvikram 			 */
544525e8c5aaSvikram 			constraint = 0;
544625e8c5aaSvikram 			(void) e_ddi_retire_finalize(cdip, &constraint);
544725e8c5aaSvikram 			MDI_PHCI_LOCK(ph);
544825e8c5aaSvikram 			pip = next;
544925e8c5aaSvikram 		} else {
545025e8c5aaSvikram 			i_mdi_client_unlock(ct);
545125e8c5aaSvikram 			pip = next;
545225e8c5aaSvikram 		}
545325e8c5aaSvikram 	}
545425e8c5aaSvikram 
545525e8c5aaSvikram 	/*
545625e8c5aaSvikram 	 * Cannot offline pip(s)
545725e8c5aaSvikram 	 */
545825e8c5aaSvikram 	if (unstable) {
54594c06356bSdh142964 		cmn_err(CE_WARN, "%s%d: mdi_phci_retire_finalize: "
54604c06356bSdh142964 		    "pHCI in transient state, cannot retire",
54614c06356bSdh142964 		    ddi_driver_name(dip), ddi_get_instance(dip));
546225e8c5aaSvikram 		MDI_PHCI_UNLOCK(ph);
546325e8c5aaSvikram 		return;
546425e8c5aaSvikram 	}
546525e8c5aaSvikram 
546625e8c5aaSvikram 	/*
546725e8c5aaSvikram 	 * Mark the pHCI as offline
546825e8c5aaSvikram 	 */
546925e8c5aaSvikram 	MDI_PHCI_SET_OFFLINE(ph);
547025e8c5aaSvikram 
547125e8c5aaSvikram 	/*
547225e8c5aaSvikram 	 * Mark the child mdi_pathinfo nodes as transient
547325e8c5aaSvikram 	 */
547425e8c5aaSvikram 	pip = ph->ph_path_head;
547525e8c5aaSvikram 	while (pip != NULL) {
547625e8c5aaSvikram 		MDI_PI_LOCK(pip);
547725e8c5aaSvikram 		next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
547825e8c5aaSvikram 		MDI_PI_SET_OFFLINING(pip);
547925e8c5aaSvikram 		MDI_PI_UNLOCK(pip);
548025e8c5aaSvikram 		pip = next;
548125e8c5aaSvikram 	}
548225e8c5aaSvikram 	MDI_PHCI_UNLOCK(ph);
548325e8c5aaSvikram 	/*
548425e8c5aaSvikram 	 * Give a chance for any pending commands to execute
548525e8c5aaSvikram 	 */
548696c4a178SChris Horne 	delay_random(mdi_delay);
548725e8c5aaSvikram 	MDI_PHCI_LOCK(ph);
548825e8c5aaSvikram 	pip = ph->ph_path_head;
548925e8c5aaSvikram 	while (pip != NULL) {
549025e8c5aaSvikram 		next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
549125e8c5aaSvikram 		(void) i_mdi_pi_offline(pip, 0);
549225e8c5aaSvikram 		MDI_PI_LOCK(pip);
549325e8c5aaSvikram 		ct = MDI_PI(pip)->pi_client;
549425e8c5aaSvikram 		if (!MDI_PI_IS_OFFLINE(pip)) {
54954c06356bSdh142964 			cmn_err(CE_WARN, "mdi_phci_retire_finalize: "
54964c06356bSdh142964 			    "path %d %s busy, cannot offline",
54974c06356bSdh142964 			    mdi_pi_get_path_instance(pip),
54984c06356bSdh142964 			    mdi_pi_spathname(pip));
549925e8c5aaSvikram 			MDI_PI_UNLOCK(pip);
550025e8c5aaSvikram 			MDI_PHCI_SET_ONLINE(ph);
550125e8c5aaSvikram 			MDI_PHCI_UNLOCK(ph);
550225e8c5aaSvikram 			return;
550325e8c5aaSvikram 		}
550425e8c5aaSvikram 		MDI_PI_UNLOCK(pip);
550525e8c5aaSvikram 		pip = next;
550625e8c5aaSvikram 	}
550725e8c5aaSvikram 	MDI_PHCI_UNLOCK(ph);
550825e8c5aaSvikram 
550925e8c5aaSvikram 	return;
551025e8c5aaSvikram }
551125e8c5aaSvikram 
551225e8c5aaSvikram void
551325e8c5aaSvikram mdi_phci_unretire(dev_info_t *dip)
551425e8c5aaSvikram {
551525e8c5aaSvikram 	ASSERT(MDI_PHCI(dip));
551625e8c5aaSvikram 
551725e8c5aaSvikram 	/*
551825e8c5aaSvikram 	 * Online the phci
551925e8c5aaSvikram 	 */
552025e8c5aaSvikram 	i_mdi_phci_online(dip);
552125e8c5aaSvikram }
552225e8c5aaSvikram 
55237c478bd9Sstevel@tonic-gate /*ARGSUSED*/
55247c478bd9Sstevel@tonic-gate static int
55257c478bd9Sstevel@tonic-gate i_mdi_client_offline(dev_info_t *dip, uint_t flags)
55267c478bd9Sstevel@tonic-gate {
55277c478bd9Sstevel@tonic-gate 	int		rv = NDI_SUCCESS;
55287c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
55297c478bd9Sstevel@tonic-gate 
55307c478bd9Sstevel@tonic-gate 	/*
55317c478bd9Sstevel@tonic-gate 	 * Client component to go offline.  Make sure that we are
55327c478bd9Sstevel@tonic-gate 	 * not in failing over state and update client state
55337c478bd9Sstevel@tonic-gate 	 * accordingly
55347c478bd9Sstevel@tonic-gate 	 */
55357c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(dip);
55364c06356bSdh142964 	MDI_DEBUG(2, (MDI_NOTE, dip,
55374c06356bSdh142964 	    "called %p %p", (void *)dip, (void *)ct));
55387c478bd9Sstevel@tonic-gate 	if (ct != NULL) {
55397c478bd9Sstevel@tonic-gate 		MDI_CLIENT_LOCK(ct);
55407c478bd9Sstevel@tonic-gate 		if (ct->ct_unstable) {
55417c478bd9Sstevel@tonic-gate 			/*
55427c478bd9Sstevel@tonic-gate 			 * One or more paths are in transient state,
55437c478bd9Sstevel@tonic-gate 			 * Dont allow offline of a client device
55447c478bd9Sstevel@tonic-gate 			 */
55454c06356bSdh142964 			MDI_DEBUG(1, (MDI_WARN, dip,
55464c06356bSdh142964 			    "!One or more paths to "
55474c06356bSdh142964 			    "this device are in transient state. "
55484c06356bSdh142964 			    "This device can not be removed at this moment. "
55497c478bd9Sstevel@tonic-gate 			    "Please try again later."));
55507c478bd9Sstevel@tonic-gate 			MDI_CLIENT_UNLOCK(ct);
55517c478bd9Sstevel@tonic-gate 			return (NDI_BUSY);
55527c478bd9Sstevel@tonic-gate 		}
55537c478bd9Sstevel@tonic-gate 		if (MDI_CLIENT_IS_FAILOVER_IN_PROGRESS(ct)) {
55547c478bd9Sstevel@tonic-gate 			/*
55557c478bd9Sstevel@tonic-gate 			 * Failover is in progress, Dont allow DR of
55567c478bd9Sstevel@tonic-gate 			 * a client device
55577c478bd9Sstevel@tonic-gate 			 */
55584c06356bSdh142964 			MDI_DEBUG(1, (MDI_WARN, dip,
55594c06356bSdh142964 			    "!Client device is Busy. "
55604c06356bSdh142964 			    "This device can not be removed at this moment. "
55614c06356bSdh142964 			    "Please try again later."));
55627c478bd9Sstevel@tonic-gate 			MDI_CLIENT_UNLOCK(ct);
55637c478bd9Sstevel@tonic-gate 			return (NDI_BUSY);
55647c478bd9Sstevel@tonic-gate 		}
55657c478bd9Sstevel@tonic-gate 		MDI_CLIENT_SET_OFFLINE(ct);
55667c478bd9Sstevel@tonic-gate 
55677c478bd9Sstevel@tonic-gate 		/*
55687c478bd9Sstevel@tonic-gate 		 * Unbind our relationship with the dev_info node
55697c478bd9Sstevel@tonic-gate 		 */
55707c478bd9Sstevel@tonic-gate 		if (flags & NDI_DEVI_REMOVE) {
55717c478bd9Sstevel@tonic-gate 			ct->ct_dip = NULL;
55727c478bd9Sstevel@tonic-gate 		}
55737c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
55747c478bd9Sstevel@tonic-gate 	}
55757c478bd9Sstevel@tonic-gate 	return (rv);
55767c478bd9Sstevel@tonic-gate }
55777c478bd9Sstevel@tonic-gate 
55787c478bd9Sstevel@tonic-gate /*
55797c478bd9Sstevel@tonic-gate  * mdi_pre_attach():
55807c478bd9Sstevel@tonic-gate  *		Pre attach() notification handler
55817c478bd9Sstevel@tonic-gate  */
55827c478bd9Sstevel@tonic-gate /*ARGSUSED*/
55837c478bd9Sstevel@tonic-gate int
55847c478bd9Sstevel@tonic-gate mdi_pre_attach(dev_info_t *dip, ddi_attach_cmd_t cmd)
55857c478bd9Sstevel@tonic-gate {
55867c478bd9Sstevel@tonic-gate 	/* don't support old DDI_PM_RESUME */
55877c478bd9Sstevel@tonic-gate 	if ((DEVI(dip)->devi_mdi_component != MDI_COMPONENT_NONE) &&
55887c478bd9Sstevel@tonic-gate 	    (cmd == DDI_PM_RESUME))
55897c478bd9Sstevel@tonic-gate 		return (DDI_FAILURE);
55907c478bd9Sstevel@tonic-gate 
55917c478bd9Sstevel@tonic-gate 	return (DDI_SUCCESS);
55927c478bd9Sstevel@tonic-gate }
55937c478bd9Sstevel@tonic-gate 
55947c478bd9Sstevel@tonic-gate /*
55957c478bd9Sstevel@tonic-gate  * mdi_post_attach():
55967c478bd9Sstevel@tonic-gate  *		Post attach() notification handler
55977c478bd9Sstevel@tonic-gate  */
55987c478bd9Sstevel@tonic-gate /*ARGSUSED*/
55997c478bd9Sstevel@tonic-gate void
56007c478bd9Sstevel@tonic-gate mdi_post_attach(dev_info_t *dip, ddi_attach_cmd_t cmd, int error)
56017c478bd9Sstevel@tonic-gate {
56027c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
56037c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
560437fbbce5Scth 	mdi_vhci_t	*vh;
56057c478bd9Sstevel@tonic-gate 
56067c478bd9Sstevel@tonic-gate 	if (MDI_PHCI(dip)) {
56077c478bd9Sstevel@tonic-gate 		ph = i_devi_get_phci(dip);
56087c478bd9Sstevel@tonic-gate 		ASSERT(ph != NULL);
56097c478bd9Sstevel@tonic-gate 
56107c478bd9Sstevel@tonic-gate 		MDI_PHCI_LOCK(ph);
56117c478bd9Sstevel@tonic-gate 		switch (cmd) {
56127c478bd9Sstevel@tonic-gate 		case DDI_ATTACH:
56134c06356bSdh142964 			MDI_DEBUG(2, (MDI_NOTE, dip,
56144c06356bSdh142964 			    "phci post_attach called %p", (void *)ph));
56157c478bd9Sstevel@tonic-gate 			if (error == DDI_SUCCESS) {
56167c478bd9Sstevel@tonic-gate 				MDI_PHCI_SET_ATTACH(ph);
56177c478bd9Sstevel@tonic-gate 			} else {
56184c06356bSdh142964 				MDI_DEBUG(1, (MDI_NOTE, dip,
56194c06356bSdh142964 				    "!pHCI post_attach failed: error %d",
56207c478bd9Sstevel@tonic-gate 				    error));
56217c478bd9Sstevel@tonic-gate 				MDI_PHCI_SET_DETACH(ph);
56227c478bd9Sstevel@tonic-gate 			}
56237c478bd9Sstevel@tonic-gate 			break;
56247c478bd9Sstevel@tonic-gate 
56257c478bd9Sstevel@tonic-gate 		case DDI_RESUME:
56264c06356bSdh142964 			MDI_DEBUG(2, (MDI_NOTE, dip,
56274c06356bSdh142964 			    "pHCI post_resume: called %p", (void *)ph));
56287c478bd9Sstevel@tonic-gate 			if (error == DDI_SUCCESS) {
56297c478bd9Sstevel@tonic-gate 				MDI_PHCI_SET_RESUME(ph);
56307c478bd9Sstevel@tonic-gate 			} else {
56314c06356bSdh142964 				MDI_DEBUG(1, (MDI_NOTE, dip,
56324c06356bSdh142964 				    "!pHCI post_resume failed: error %d",
56337c478bd9Sstevel@tonic-gate 				    error));
56347c478bd9Sstevel@tonic-gate 				MDI_PHCI_SET_SUSPEND(ph);
56357c478bd9Sstevel@tonic-gate 			}
56367c478bd9Sstevel@tonic-gate 			break;
56377c478bd9Sstevel@tonic-gate 		}
56387c478bd9Sstevel@tonic-gate 		MDI_PHCI_UNLOCK(ph);
56397c478bd9Sstevel@tonic-gate 	}
56407c478bd9Sstevel@tonic-gate 
56417c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT(dip)) {
56427c478bd9Sstevel@tonic-gate 		ct = i_devi_get_client(dip);
56437c478bd9Sstevel@tonic-gate 		ASSERT(ct != NULL);
56447c478bd9Sstevel@tonic-gate 
56457c478bd9Sstevel@tonic-gate 		MDI_CLIENT_LOCK(ct);
56467c478bd9Sstevel@tonic-gate 		switch (cmd) {
56477c478bd9Sstevel@tonic-gate 		case DDI_ATTACH:
56484c06356bSdh142964 			MDI_DEBUG(2, (MDI_NOTE, dip,
56494c06356bSdh142964 			    "client post_attach called %p", (void *)ct));
56507c478bd9Sstevel@tonic-gate 			if (error != DDI_SUCCESS) {
56514c06356bSdh142964 				MDI_DEBUG(1, (MDI_NOTE, dip,
56524c06356bSdh142964 				    "!client post_attach failed: error %d",
56537c478bd9Sstevel@tonic-gate 				    error));
56547c478bd9Sstevel@tonic-gate 				MDI_CLIENT_SET_DETACH(ct);
56554c06356bSdh142964 				MDI_DEBUG(4, (MDI_WARN, dip,
56564c06356bSdh142964 				    "i_mdi_pm_reset_client"));
56577c478bd9Sstevel@tonic-gate 				i_mdi_pm_reset_client(ct);
56587c478bd9Sstevel@tonic-gate 				break;
56597c478bd9Sstevel@tonic-gate 			}
56607c478bd9Sstevel@tonic-gate 
56617c478bd9Sstevel@tonic-gate 			/*
566237fbbce5Scth 			 * Client device has successfully attached, inform
566337fbbce5Scth 			 * the vhci.
56647c478bd9Sstevel@tonic-gate 			 */
566537fbbce5Scth 			vh = ct->ct_vhci;
566637fbbce5Scth 			if (vh->vh_ops->vo_client_attached)
566737fbbce5Scth 				(*vh->vh_ops->vo_client_attached)(dip);
566837fbbce5Scth 
56697c478bd9Sstevel@tonic-gate 			MDI_CLIENT_SET_ATTACH(ct);
56707c478bd9Sstevel@tonic-gate 			break;
56717c478bd9Sstevel@tonic-gate 
56727c478bd9Sstevel@tonic-gate 		case DDI_RESUME:
56734c06356bSdh142964 			MDI_DEBUG(2, (MDI_NOTE, dip,
56744c06356bSdh142964 			    "client post_attach: called %p", (void *)ct));
56757c478bd9Sstevel@tonic-gate 			if (error == DDI_SUCCESS) {
56767c478bd9Sstevel@tonic-gate 				MDI_CLIENT_SET_RESUME(ct);
56777c478bd9Sstevel@tonic-gate 			} else {
56784c06356bSdh142964 				MDI_DEBUG(1, (MDI_NOTE, dip,
56794c06356bSdh142964 				    "!client post_resume failed: error %d",
56807c478bd9Sstevel@tonic-gate 				    error));
56817c478bd9Sstevel@tonic-gate 				MDI_CLIENT_SET_SUSPEND(ct);
56827c478bd9Sstevel@tonic-gate 			}
56837c478bd9Sstevel@tonic-gate 			break;
56847c478bd9Sstevel@tonic-gate 		}
56857c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
56867c478bd9Sstevel@tonic-gate 	}
56877c478bd9Sstevel@tonic-gate }
56887c478bd9Sstevel@tonic-gate 
56897c478bd9Sstevel@tonic-gate /*
56907c478bd9Sstevel@tonic-gate  * mdi_pre_detach():
56917c478bd9Sstevel@tonic-gate  *		Pre detach notification handler
56927c478bd9Sstevel@tonic-gate  */
56937c478bd9Sstevel@tonic-gate /*ARGSUSED*/
56947c478bd9Sstevel@tonic-gate int
56957c478bd9Sstevel@tonic-gate mdi_pre_detach(dev_info_t *dip, ddi_detach_cmd_t cmd)
56967c478bd9Sstevel@tonic-gate {
56977c478bd9Sstevel@tonic-gate 	int rv = DDI_SUCCESS;
56987c478bd9Sstevel@tonic-gate 
56997c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT(dip)) {
57007c478bd9Sstevel@tonic-gate 		(void) i_mdi_client_pre_detach(dip, cmd);
57017c478bd9Sstevel@tonic-gate 	}
57027c478bd9Sstevel@tonic-gate 
57037c478bd9Sstevel@tonic-gate 	if (MDI_PHCI(dip)) {
57047c478bd9Sstevel@tonic-gate 		rv = i_mdi_phci_pre_detach(dip, cmd);
57057c478bd9Sstevel@tonic-gate 	}
57067c478bd9Sstevel@tonic-gate 
57077c478bd9Sstevel@tonic-gate 	return (rv);
57087c478bd9Sstevel@tonic-gate }
57097c478bd9Sstevel@tonic-gate 
57107c478bd9Sstevel@tonic-gate /*ARGSUSED*/
57117c478bd9Sstevel@tonic-gate static int
57127c478bd9Sstevel@tonic-gate i_mdi_phci_pre_detach(dev_info_t *dip, ddi_detach_cmd_t cmd)
57137c478bd9Sstevel@tonic-gate {
57147c478bd9Sstevel@tonic-gate 	int		rv = DDI_SUCCESS;
57157c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
57167c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
57177c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*pip;
57187c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*failed_pip = NULL;
57197c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*next;
57207c478bd9Sstevel@tonic-gate 
57217c478bd9Sstevel@tonic-gate 	ph = i_devi_get_phci(dip);
57227c478bd9Sstevel@tonic-gate 	if (ph == NULL) {
57237c478bd9Sstevel@tonic-gate 		return (rv);
57247c478bd9Sstevel@tonic-gate 	}
57257c478bd9Sstevel@tonic-gate 
57267c478bd9Sstevel@tonic-gate 	MDI_PHCI_LOCK(ph);
57277c478bd9Sstevel@tonic-gate 	switch (cmd) {
57287c478bd9Sstevel@tonic-gate 	case DDI_DETACH:
57294c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, dip,
57304c06356bSdh142964 		    "pHCI pre_detach: called %p", (void *)ph));
57317c478bd9Sstevel@tonic-gate 		if (!MDI_PHCI_IS_OFFLINE(ph)) {
57327c478bd9Sstevel@tonic-gate 			/*
57337c478bd9Sstevel@tonic-gate 			 * mdi_pathinfo nodes are still attached to
57347c478bd9Sstevel@tonic-gate 			 * this pHCI. Fail the detach for this pHCI.
57357c478bd9Sstevel@tonic-gate 			 */
57364c06356bSdh142964 			MDI_DEBUG(2, (MDI_WARN, dip,
57374c06356bSdh142964 			    "pHCI pre_detach: paths are still attached %p",
57384c06356bSdh142964 			    (void *)ph));
57397c478bd9Sstevel@tonic-gate 			rv = DDI_FAILURE;
57407c478bd9Sstevel@tonic-gate 			break;
57417c478bd9Sstevel@tonic-gate 		}
57427c478bd9Sstevel@tonic-gate 		MDI_PHCI_SET_DETACH(ph);
57437c478bd9Sstevel@tonic-gate 		break;
57447c478bd9Sstevel@tonic-gate 
57457c478bd9Sstevel@tonic-gate 	case DDI_SUSPEND:
57467c478bd9Sstevel@tonic-gate 		/*
57477c478bd9Sstevel@tonic-gate 		 * pHCI is getting suspended.  Since mpxio client
57487c478bd9Sstevel@tonic-gate 		 * devices may not be suspended at this point, to avoid
57497c478bd9Sstevel@tonic-gate 		 * a potential stack overflow, it is important to suspend
57507c478bd9Sstevel@tonic-gate 		 * client devices before pHCI can be suspended.
57517c478bd9Sstevel@tonic-gate 		 */
57527c478bd9Sstevel@tonic-gate 
57534c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, dip,
57544c06356bSdh142964 		    "pHCI pre_suspend: called %p", (void *)ph));
57557c478bd9Sstevel@tonic-gate 		/*
57567c478bd9Sstevel@tonic-gate 		 * Suspend all the client devices accessible through this pHCI
57577c478bd9Sstevel@tonic-gate 		 */
57587c478bd9Sstevel@tonic-gate 		pip = ph->ph_path_head;
57597c478bd9Sstevel@tonic-gate 		while (pip != NULL && rv == DDI_SUCCESS) {
57607c478bd9Sstevel@tonic-gate 			dev_info_t *cdip;
57617c478bd9Sstevel@tonic-gate 			MDI_PI_LOCK(pip);
57627c478bd9Sstevel@tonic-gate 			next =
57637c478bd9Sstevel@tonic-gate 			    (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
57647c478bd9Sstevel@tonic-gate 			ct = MDI_PI(pip)->pi_client;
57657c478bd9Sstevel@tonic-gate 			i_mdi_client_lock(ct, pip);
57667c478bd9Sstevel@tonic-gate 			cdip = ct->ct_dip;
57677c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
57687c478bd9Sstevel@tonic-gate 			if ((MDI_CLIENT_IS_DETACHED(ct) == 0) &&
57697c478bd9Sstevel@tonic-gate 			    MDI_CLIENT_IS_SUSPENDED(ct) == 0) {
57707c478bd9Sstevel@tonic-gate 				i_mdi_client_unlock(ct);
57717c478bd9Sstevel@tonic-gate 				if ((rv = devi_detach(cdip, DDI_SUSPEND)) !=
57727c478bd9Sstevel@tonic-gate 				    DDI_SUCCESS) {
57737c478bd9Sstevel@tonic-gate 					/*
57747c478bd9Sstevel@tonic-gate 					 * Suspend of one of the client
57757c478bd9Sstevel@tonic-gate 					 * device has failed.
57767c478bd9Sstevel@tonic-gate 					 */
57774c06356bSdh142964 					MDI_DEBUG(1, (MDI_WARN, dip,
57784c06356bSdh142964 					    "!suspend of device (%s%d) failed.",
57797c478bd9Sstevel@tonic-gate 					    ddi_driver_name(cdip),
57807c478bd9Sstevel@tonic-gate 					    ddi_get_instance(cdip)));
57817c478bd9Sstevel@tonic-gate 					failed_pip = pip;
57827c478bd9Sstevel@tonic-gate 					break;
57837c478bd9Sstevel@tonic-gate 				}
57847c478bd9Sstevel@tonic-gate 			} else {
57857c478bd9Sstevel@tonic-gate 				i_mdi_client_unlock(ct);
57867c478bd9Sstevel@tonic-gate 			}
57877c478bd9Sstevel@tonic-gate 			pip = next;
57887c478bd9Sstevel@tonic-gate 		}
57897c478bd9Sstevel@tonic-gate 
57907c478bd9Sstevel@tonic-gate 		if (rv == DDI_SUCCESS) {
57917c478bd9Sstevel@tonic-gate 			/*
57927c478bd9Sstevel@tonic-gate 			 * Suspend of client devices is complete. Proceed
57937c478bd9Sstevel@tonic-gate 			 * with pHCI suspend.
57947c478bd9Sstevel@tonic-gate 			 */
57957c478bd9Sstevel@tonic-gate 			MDI_PHCI_SET_SUSPEND(ph);
57967c478bd9Sstevel@tonic-gate 		} else {
57977c478bd9Sstevel@tonic-gate 			/*
57987c478bd9Sstevel@tonic-gate 			 * Revert back all the suspended client device states
57997c478bd9Sstevel@tonic-gate 			 * to converse.
58007c478bd9Sstevel@tonic-gate 			 */
58017c478bd9Sstevel@tonic-gate 			pip = ph->ph_path_head;
58027c478bd9Sstevel@tonic-gate 			while (pip != failed_pip) {
58037c478bd9Sstevel@tonic-gate 				dev_info_t *cdip;
58047c478bd9Sstevel@tonic-gate 				MDI_PI_LOCK(pip);
58057c478bd9Sstevel@tonic-gate 				next =
58067c478bd9Sstevel@tonic-gate 				    (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
58077c478bd9Sstevel@tonic-gate 				ct = MDI_PI(pip)->pi_client;
58087c478bd9Sstevel@tonic-gate 				i_mdi_client_lock(ct, pip);
58097c478bd9Sstevel@tonic-gate 				cdip = ct->ct_dip;
58107c478bd9Sstevel@tonic-gate 				MDI_PI_UNLOCK(pip);
58117c478bd9Sstevel@tonic-gate 				if (MDI_CLIENT_IS_SUSPENDED(ct)) {
58127c478bd9Sstevel@tonic-gate 					i_mdi_client_unlock(ct);
58137c478bd9Sstevel@tonic-gate 					(void) devi_attach(cdip, DDI_RESUME);
58147c478bd9Sstevel@tonic-gate 				} else {
58157c478bd9Sstevel@tonic-gate 					i_mdi_client_unlock(ct);
58167c478bd9Sstevel@tonic-gate 				}
58177c478bd9Sstevel@tonic-gate 				pip = next;
58187c478bd9Sstevel@tonic-gate 			}
58197c478bd9Sstevel@tonic-gate 		}
58207c478bd9Sstevel@tonic-gate 		break;
58217c478bd9Sstevel@tonic-gate 
58227c478bd9Sstevel@tonic-gate 	default:
58237c478bd9Sstevel@tonic-gate 		rv = DDI_FAILURE;
58247c478bd9Sstevel@tonic-gate 		break;
58257c478bd9Sstevel@tonic-gate 	}
58267c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNLOCK(ph);
58277c478bd9Sstevel@tonic-gate 	return (rv);
58287c478bd9Sstevel@tonic-gate }
58297c478bd9Sstevel@tonic-gate 
58307c478bd9Sstevel@tonic-gate /*ARGSUSED*/
58317c478bd9Sstevel@tonic-gate static int
58327c478bd9Sstevel@tonic-gate i_mdi_client_pre_detach(dev_info_t *dip, ddi_detach_cmd_t cmd)
58337c478bd9Sstevel@tonic-gate {
58347c478bd9Sstevel@tonic-gate 	int		rv = DDI_SUCCESS;
58357c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
58367c478bd9Sstevel@tonic-gate 
58377c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(dip);
58387c478bd9Sstevel@tonic-gate 	if (ct == NULL) {
58397c478bd9Sstevel@tonic-gate 		return (rv);
58407c478bd9Sstevel@tonic-gate 	}
58417c478bd9Sstevel@tonic-gate 
58427c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
58437c478bd9Sstevel@tonic-gate 	switch (cmd) {
58447c478bd9Sstevel@tonic-gate 	case DDI_DETACH:
58454c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, dip,
58464c06356bSdh142964 		    "client pre_detach: called %p",
58474c06356bSdh142964 		     (void *)ct));
58487c478bd9Sstevel@tonic-gate 		MDI_CLIENT_SET_DETACH(ct);
58497c478bd9Sstevel@tonic-gate 		break;
58507c478bd9Sstevel@tonic-gate 
58517c478bd9Sstevel@tonic-gate 	case DDI_SUSPEND:
58524c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, dip,
58534c06356bSdh142964 		    "client pre_suspend: called %p",
58544c06356bSdh142964 		    (void *)ct));
58557c478bd9Sstevel@tonic-gate 		MDI_CLIENT_SET_SUSPEND(ct);
58567c478bd9Sstevel@tonic-gate 		break;
58577c478bd9Sstevel@tonic-gate 
58587c478bd9Sstevel@tonic-gate 	default:
58597c478bd9Sstevel@tonic-gate 		rv = DDI_FAILURE;
58607c478bd9Sstevel@tonic-gate 		break;
58617c478bd9Sstevel@tonic-gate 	}
58627c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
58637c478bd9Sstevel@tonic-gate 	return (rv);
58647c478bd9Sstevel@tonic-gate }
58657c478bd9Sstevel@tonic-gate 
58667c478bd9Sstevel@tonic-gate /*
58677c478bd9Sstevel@tonic-gate  * mdi_post_detach():
58687c478bd9Sstevel@tonic-gate  *		Post detach notification handler
58697c478bd9Sstevel@tonic-gate  */
58707c478bd9Sstevel@tonic-gate /*ARGSUSED*/
58717c478bd9Sstevel@tonic-gate void
58727c478bd9Sstevel@tonic-gate mdi_post_detach(dev_info_t *dip, ddi_detach_cmd_t cmd, int error)
58737c478bd9Sstevel@tonic-gate {
58747c478bd9Sstevel@tonic-gate 	/*
58757c478bd9Sstevel@tonic-gate 	 * Detach/Suspend of mpxio component failed. Update our state
58767c478bd9Sstevel@tonic-gate 	 * too
58777c478bd9Sstevel@tonic-gate 	 */
58787c478bd9Sstevel@tonic-gate 	if (MDI_PHCI(dip))
58797c478bd9Sstevel@tonic-gate 		i_mdi_phci_post_detach(dip, cmd, error);
58807c478bd9Sstevel@tonic-gate 
58817c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT(dip))
58827c478bd9Sstevel@tonic-gate 		i_mdi_client_post_detach(dip, cmd, error);
58837c478bd9Sstevel@tonic-gate }
58847c478bd9Sstevel@tonic-gate 
58857c478bd9Sstevel@tonic-gate /*ARGSUSED*/
58867c478bd9Sstevel@tonic-gate static void
58877c478bd9Sstevel@tonic-gate i_mdi_phci_post_detach(dev_info_t *dip, ddi_detach_cmd_t cmd, int error)
58887c478bd9Sstevel@tonic-gate {
58897c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
58907c478bd9Sstevel@tonic-gate 
58917c478bd9Sstevel@tonic-gate 	/*
58927c478bd9Sstevel@tonic-gate 	 * Detach/Suspend of phci component failed. Update our state
58937c478bd9Sstevel@tonic-gate 	 * too
58947c478bd9Sstevel@tonic-gate 	 */
58957c478bd9Sstevel@tonic-gate 	ph = i_devi_get_phci(dip);
58967c478bd9Sstevel@tonic-gate 	if (ph == NULL) {
58977c478bd9Sstevel@tonic-gate 		return;
58987c478bd9Sstevel@tonic-gate 	}
58997c478bd9Sstevel@tonic-gate 
59007c478bd9Sstevel@tonic-gate 	MDI_PHCI_LOCK(ph);
59017c478bd9Sstevel@tonic-gate 	/*
59027c478bd9Sstevel@tonic-gate 	 * Detach of pHCI failed. Restore back converse
59037c478bd9Sstevel@tonic-gate 	 * state
59047c478bd9Sstevel@tonic-gate 	 */
59057c478bd9Sstevel@tonic-gate 	switch (cmd) {
59067c478bd9Sstevel@tonic-gate 	case DDI_DETACH:
59074c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, dip,
59084c06356bSdh142964 		    "pHCI post_detach: called %p",
59094c06356bSdh142964 		    (void *)ph));
59107c478bd9Sstevel@tonic-gate 		if (error != DDI_SUCCESS)
59117c478bd9Sstevel@tonic-gate 			MDI_PHCI_SET_ATTACH(ph);
59127c478bd9Sstevel@tonic-gate 		break;
59137c478bd9Sstevel@tonic-gate 
59147c478bd9Sstevel@tonic-gate 	case DDI_SUSPEND:
59154c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, dip,
59164c06356bSdh142964 		    "pHCI post_suspend: called %p",
59174c06356bSdh142964 		    (void *)ph));
59187c478bd9Sstevel@tonic-gate 		if (error != DDI_SUCCESS)
59197c478bd9Sstevel@tonic-gate 			MDI_PHCI_SET_RESUME(ph);
59207c478bd9Sstevel@tonic-gate 		break;
59217c478bd9Sstevel@tonic-gate 	}
59227c478bd9Sstevel@tonic-gate 	MDI_PHCI_UNLOCK(ph);
59237c478bd9Sstevel@tonic-gate }
59247c478bd9Sstevel@tonic-gate 
59257c478bd9Sstevel@tonic-gate /*ARGSUSED*/
59267c478bd9Sstevel@tonic-gate static void
59277c478bd9Sstevel@tonic-gate i_mdi_client_post_detach(dev_info_t *dip, ddi_detach_cmd_t cmd, int error)
59287c478bd9Sstevel@tonic-gate {
59297c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
59307c478bd9Sstevel@tonic-gate 
59317c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(dip);
59327c478bd9Sstevel@tonic-gate 	if (ct == NULL) {
59337c478bd9Sstevel@tonic-gate 		return;
59347c478bd9Sstevel@tonic-gate 	}
59357c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
59367c478bd9Sstevel@tonic-gate 	/*
59377c478bd9Sstevel@tonic-gate 	 * Detach of Client failed. Restore back converse
59387c478bd9Sstevel@tonic-gate 	 * state
59397c478bd9Sstevel@tonic-gate 	 */
59407c478bd9Sstevel@tonic-gate 	switch (cmd) {
59417c478bd9Sstevel@tonic-gate 	case DDI_DETACH:
59424c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, dip,
59434c06356bSdh142964 		    "client post_detach: called %p", (void *)ct));
59447c478bd9Sstevel@tonic-gate 		if (DEVI_IS_ATTACHING(ct->ct_dip)) {
59454c06356bSdh142964 			MDI_DEBUG(4, (MDI_NOTE, dip,
59467c478bd9Sstevel@tonic-gate 			    "i_mdi_pm_rele_client\n"));
59477c478bd9Sstevel@tonic-gate 			i_mdi_pm_rele_client(ct, ct->ct_path_count);
59487c478bd9Sstevel@tonic-gate 		} else {
59494c06356bSdh142964 			MDI_DEBUG(4, (MDI_NOTE, dip,
59507c478bd9Sstevel@tonic-gate 			    "i_mdi_pm_reset_client\n"));
59517c478bd9Sstevel@tonic-gate 			i_mdi_pm_reset_client(ct);
59527c478bd9Sstevel@tonic-gate 		}
59537c478bd9Sstevel@tonic-gate 		if (error != DDI_SUCCESS)
59547c478bd9Sstevel@tonic-gate 			MDI_CLIENT_SET_ATTACH(ct);
59557c478bd9Sstevel@tonic-gate 		break;
59567c478bd9Sstevel@tonic-gate 
59577c478bd9Sstevel@tonic-gate 	case DDI_SUSPEND:
59584c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, dip,
59594c06356bSdh142964 		    "called %p", (void *)ct));
59607c478bd9Sstevel@tonic-gate 		if (error != DDI_SUCCESS)
59617c478bd9Sstevel@tonic-gate 			MDI_CLIENT_SET_RESUME(ct);
59627c478bd9Sstevel@tonic-gate 		break;
59637c478bd9Sstevel@tonic-gate 	}
59647c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
59657c478bd9Sstevel@tonic-gate }
59667c478bd9Sstevel@tonic-gate 
596737fbbce5Scth int
596837fbbce5Scth mdi_pi_kstat_exists(mdi_pathinfo_t *pip)
596937fbbce5Scth {
597037fbbce5Scth 	return (MDI_PI(pip)->pi_kstats ? 1 : 0);
597137fbbce5Scth }
597237fbbce5Scth 
59737c478bd9Sstevel@tonic-gate /*
59747c478bd9Sstevel@tonic-gate  * create and install per-path (client - pHCI) statistics
59757c478bd9Sstevel@tonic-gate  * I/O stats supported: nread, nwritten, reads, and writes
59767c478bd9Sstevel@tonic-gate  * Error stats - hard errors, soft errors, & transport errors
59777c478bd9Sstevel@tonic-gate  */
597837fbbce5Scth int
597937fbbce5Scth mdi_pi_kstat_create(mdi_pathinfo_t *pip, char *ksname)
59807c478bd9Sstevel@tonic-gate {
59817c478bd9Sstevel@tonic-gate 	kstat_t			*kiosp, *kerrsp;
59827c478bd9Sstevel@tonic-gate 	struct pi_errs		*nsp;
59837c478bd9Sstevel@tonic-gate 	struct mdi_pi_kstats	*mdi_statp;
59847c478bd9Sstevel@tonic-gate 
59857c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_kstats != NULL)
59867c478bd9Sstevel@tonic-gate 		return (MDI_SUCCESS);
59877c478bd9Sstevel@tonic-gate 
59887c478bd9Sstevel@tonic-gate 	if ((kiosp = kstat_create("mdi", 0, ksname, "iopath",
598937fbbce5Scth 	    KSTAT_TYPE_IO, 1, KSTAT_FLAG_PERSISTENT)) == NULL) {
59907c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
59917c478bd9Sstevel@tonic-gate 	}
59927c478bd9Sstevel@tonic-gate 
599337fbbce5Scth 	(void) strcat(ksname, ",err");
59947c478bd9Sstevel@tonic-gate 	kerrsp = kstat_create("mdi", 0, ksname, "iopath_errors",
59957c478bd9Sstevel@tonic-gate 	    KSTAT_TYPE_NAMED,
59967c478bd9Sstevel@tonic-gate 	    sizeof (struct pi_errs) / sizeof (kstat_named_t), 0);
59977c478bd9Sstevel@tonic-gate 	if (kerrsp == NULL) {
59987c478bd9Sstevel@tonic-gate 		kstat_delete(kiosp);
59997c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
60007c478bd9Sstevel@tonic-gate 	}
60017c478bd9Sstevel@tonic-gate 
60027c478bd9Sstevel@tonic-gate 	nsp = (struct pi_errs *)kerrsp->ks_data;
60037c478bd9Sstevel@tonic-gate 	kstat_named_init(&nsp->pi_softerrs, "Soft Errors", KSTAT_DATA_UINT32);
60047c478bd9Sstevel@tonic-gate 	kstat_named_init(&nsp->pi_harderrs, "Hard Errors", KSTAT_DATA_UINT32);
60057c478bd9Sstevel@tonic-gate 	kstat_named_init(&nsp->pi_transerrs, "Transport Errors",
60067c478bd9Sstevel@tonic-gate 	    KSTAT_DATA_UINT32);
60077c478bd9Sstevel@tonic-gate 	kstat_named_init(&nsp->pi_icnt_busy, "Interconnect Busy",
60087c478bd9Sstevel@tonic-gate 	    KSTAT_DATA_UINT32);
60097c478bd9Sstevel@tonic-gate 	kstat_named_init(&nsp->pi_icnt_errors, "Interconnect Errors",
60107c478bd9Sstevel@tonic-gate 	    KSTAT_DATA_UINT32);
60117c478bd9Sstevel@tonic-gate 	kstat_named_init(&nsp->pi_phci_rsrc, "pHCI No Resources",
60127c478bd9Sstevel@tonic-gate 	    KSTAT_DATA_UINT32);
60137c478bd9Sstevel@tonic-gate 	kstat_named_init(&nsp->pi_phci_localerr, "pHCI Local Errors",
60147c478bd9Sstevel@tonic-gate 	    KSTAT_DATA_UINT32);
60157c478bd9Sstevel@tonic-gate 	kstat_named_init(&nsp->pi_phci_invstate, "pHCI Invalid State",
60167c478bd9Sstevel@tonic-gate 	    KSTAT_DATA_UINT32);
60177c478bd9Sstevel@tonic-gate 	kstat_named_init(&nsp->pi_failedfrom, "Failed From",
60187c478bd9Sstevel@tonic-gate 	    KSTAT_DATA_UINT32);
60197c478bd9Sstevel@tonic-gate 	kstat_named_init(&nsp->pi_failedto, "Failed To", KSTAT_DATA_UINT32);
60207c478bd9Sstevel@tonic-gate 
60217c478bd9Sstevel@tonic-gate 	mdi_statp = kmem_alloc(sizeof (*mdi_statp), KM_SLEEP);
60227c478bd9Sstevel@tonic-gate 	mdi_statp->pi_kstat_ref = 1;
60237c478bd9Sstevel@tonic-gate 	mdi_statp->pi_kstat_iostats = kiosp;
60247c478bd9Sstevel@tonic-gate 	mdi_statp->pi_kstat_errstats = kerrsp;
60257c478bd9Sstevel@tonic-gate 	kstat_install(kiosp);
60267c478bd9Sstevel@tonic-gate 	kstat_install(kerrsp);
60277c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_kstats = mdi_statp;
60287c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
60297c478bd9Sstevel@tonic-gate }
60307c478bd9Sstevel@tonic-gate 
60317c478bd9Sstevel@tonic-gate /*
60327c478bd9Sstevel@tonic-gate  * destroy per-path properties
60337c478bd9Sstevel@tonic-gate  */
60347c478bd9Sstevel@tonic-gate static void
60357c478bd9Sstevel@tonic-gate i_mdi_pi_kstat_destroy(mdi_pathinfo_t *pip)
60367c478bd9Sstevel@tonic-gate {
60377c478bd9Sstevel@tonic-gate 
60387c478bd9Sstevel@tonic-gate 	struct mdi_pi_kstats *mdi_statp;
60397c478bd9Sstevel@tonic-gate 
604037fbbce5Scth 	if (MDI_PI(pip)->pi_kstats == NULL)
604137fbbce5Scth 		return;
60427c478bd9Sstevel@tonic-gate 	if ((mdi_statp = MDI_PI(pip)->pi_kstats) == NULL)
60437c478bd9Sstevel@tonic-gate 		return;
60447c478bd9Sstevel@tonic-gate 
60457c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_kstats = NULL;
60467c478bd9Sstevel@tonic-gate 
60477c478bd9Sstevel@tonic-gate 	/*
60487c478bd9Sstevel@tonic-gate 	 * the kstat may be shared between multiple pathinfo nodes
60497c478bd9Sstevel@tonic-gate 	 * decrement this pathinfo's usage, removing the kstats
60507c478bd9Sstevel@tonic-gate 	 * themselves when the last pathinfo reference is removed.
60517c478bd9Sstevel@tonic-gate 	 */
60527c478bd9Sstevel@tonic-gate 	ASSERT(mdi_statp->pi_kstat_ref > 0);
60537c478bd9Sstevel@tonic-gate 	if (--mdi_statp->pi_kstat_ref != 0)
60547c478bd9Sstevel@tonic-gate 		return;
60557c478bd9Sstevel@tonic-gate 
60567c478bd9Sstevel@tonic-gate 	kstat_delete(mdi_statp->pi_kstat_iostats);
60577c478bd9Sstevel@tonic-gate 	kstat_delete(mdi_statp->pi_kstat_errstats);
60587c478bd9Sstevel@tonic-gate 	kmem_free(mdi_statp, sizeof (*mdi_statp));
60597c478bd9Sstevel@tonic-gate }
60607c478bd9Sstevel@tonic-gate 
60617c478bd9Sstevel@tonic-gate /*
60627c478bd9Sstevel@tonic-gate  * update I/O paths KSTATS
60637c478bd9Sstevel@tonic-gate  */
60647c478bd9Sstevel@tonic-gate void
60657c478bd9Sstevel@tonic-gate mdi_pi_kstat_iosupdate(mdi_pathinfo_t *pip, struct buf *bp)
60667c478bd9Sstevel@tonic-gate {
60677c478bd9Sstevel@tonic-gate 	kstat_t *iostatp;
60687c478bd9Sstevel@tonic-gate 	size_t xfer_cnt;
60697c478bd9Sstevel@tonic-gate 
60707c478bd9Sstevel@tonic-gate 	ASSERT(pip != NULL);
60717c478bd9Sstevel@tonic-gate 
60727c478bd9Sstevel@tonic-gate 	/*
60737c478bd9Sstevel@tonic-gate 	 * I/O can be driven across a path prior to having path
60747c478bd9Sstevel@tonic-gate 	 * statistics available, i.e. probe(9e).
60757c478bd9Sstevel@tonic-gate 	 */
60767c478bd9Sstevel@tonic-gate 	if (bp != NULL && MDI_PI(pip)->pi_kstats != NULL) {
60777c478bd9Sstevel@tonic-gate 		iostatp = MDI_PI(pip)->pi_kstats->pi_kstat_iostats;
60787c478bd9Sstevel@tonic-gate 		xfer_cnt = bp->b_bcount - bp->b_resid;
60797c478bd9Sstevel@tonic-gate 		if (bp->b_flags & B_READ) {
60807c478bd9Sstevel@tonic-gate 			KSTAT_IO_PTR(iostatp)->reads++;
60817c478bd9Sstevel@tonic-gate 			KSTAT_IO_PTR(iostatp)->nread += xfer_cnt;
60827c478bd9Sstevel@tonic-gate 		} else {
60837c478bd9Sstevel@tonic-gate 			KSTAT_IO_PTR(iostatp)->writes++;
60847c478bd9Sstevel@tonic-gate 			KSTAT_IO_PTR(iostatp)->nwritten += xfer_cnt;
60857c478bd9Sstevel@tonic-gate 		}
60867c478bd9Sstevel@tonic-gate 	}
60877c478bd9Sstevel@tonic-gate }
60887c478bd9Sstevel@tonic-gate 
60897c478bd9Sstevel@tonic-gate /*
6090ee28b439Scm136836  * Enable the path(specific client/target/initiator)
6091ee28b439Scm136836  * Enabling a path means that MPxIO may select the enabled path for routing
6092ee28b439Scm136836  * future I/O requests, subject to other path state constraints.
6093ee28b439Scm136836  */
6094ee28b439Scm136836 int
6095ee28b439Scm136836 mdi_pi_enable_path(mdi_pathinfo_t *pip, int flags)
6096ee28b439Scm136836 {
6097ee28b439Scm136836 	mdi_phci_t	*ph;
6098ee28b439Scm136836 
60994c06356bSdh142964 	ph = MDI_PI(pip)->pi_phci;
6100ee28b439Scm136836 	if (ph == NULL) {
61014c06356bSdh142964 		MDI_DEBUG(1, (MDI_NOTE, mdi_pi_get_phci(pip),
61024c06356bSdh142964 		    "!failed: path %s %p: NULL ph",
61034c06356bSdh142964 		    mdi_pi_spathname(pip), (void *)pip));
6104ee28b439Scm136836 		return (MDI_FAILURE);
6105ee28b439Scm136836 	}
6106ee28b439Scm136836 
6107ee28b439Scm136836 	(void) i_mdi_enable_disable_path(pip, ph->ph_vhci, flags,
6108ee28b439Scm136836 		MDI_ENABLE_OP);
61094c06356bSdh142964 	MDI_DEBUG(5, (MDI_NOTE, ph->ph_dip,
61104c06356bSdh142964 	    "!returning success pip = %p. ph = %p",
61115e3986cbScth 	    (void *)pip, (void *)ph));
6112ee28b439Scm136836 	return (MDI_SUCCESS);
6113ee28b439Scm136836 
6114ee28b439Scm136836 }
6115ee28b439Scm136836 
6116ee28b439Scm136836 /*
6117ee28b439Scm136836  * Disable the path (specific client/target/initiator)
6118ee28b439Scm136836  * Disabling a path means that MPxIO will not select the disabled path for
6119ee28b439Scm136836  * routing any new I/O requests.
6120ee28b439Scm136836  */
6121ee28b439Scm136836 int
6122ee28b439Scm136836 mdi_pi_disable_path(mdi_pathinfo_t *pip, int flags)
6123ee28b439Scm136836 {
6124ee28b439Scm136836 	mdi_phci_t	*ph;
6125ee28b439Scm136836 
61264c06356bSdh142964 	ph = MDI_PI(pip)->pi_phci;
6127ee28b439Scm136836 	if (ph == NULL) {
61284c06356bSdh142964 		MDI_DEBUG(1, (MDI_NOTE, mdi_pi_get_phci(pip),
61294c06356bSdh142964 		    "!failed: path %s %p: NULL ph",
61304c06356bSdh142964 		    mdi_pi_spathname(pip), (void *)pip));
6131ee28b439Scm136836 		return (MDI_FAILURE);
6132ee28b439Scm136836 	}
6133ee28b439Scm136836 
6134ee28b439Scm136836 	(void) i_mdi_enable_disable_path(pip,
6135ee28b439Scm136836 	    ph->ph_vhci, flags, MDI_DISABLE_OP);
61364c06356bSdh142964 	MDI_DEBUG(5, (MDI_NOTE, ph->ph_dip,
61374c06356bSdh142964 	    "!returning success pip = %p. ph = %p",
61385e3986cbScth 	    (void *)pip, (void *)ph));
6139ee28b439Scm136836 	return (MDI_SUCCESS);
6140ee28b439Scm136836 }
6141ee28b439Scm136836 
6142ee28b439Scm136836 /*
61437c478bd9Sstevel@tonic-gate  * disable the path to a particular pHCI (pHCI specified in the phci_path
61447c478bd9Sstevel@tonic-gate  * argument) for a particular client (specified in the client_path argument).
61457c478bd9Sstevel@tonic-gate  * Disabling a path means that MPxIO will not select the disabled path for
61467c478bd9Sstevel@tonic-gate  * routing any new I/O requests.
6147ee28b439Scm136836  * NOTE: this will be removed once the NWS files are changed to use the new
6148ee28b439Scm136836  * mdi_{enable,disable}_path interfaces
61497c478bd9Sstevel@tonic-gate  */
61507c478bd9Sstevel@tonic-gate int
61517c478bd9Sstevel@tonic-gate mdi_pi_disable(dev_info_t *cdip, dev_info_t *pdip, int flags)
61527c478bd9Sstevel@tonic-gate {
61537c478bd9Sstevel@tonic-gate 	return (i_mdi_pi_enable_disable(cdip, pdip, flags, MDI_DISABLE_OP));
61547c478bd9Sstevel@tonic-gate }
61557c478bd9Sstevel@tonic-gate 
61567c478bd9Sstevel@tonic-gate /*
61577c478bd9Sstevel@tonic-gate  * Enable the path to a particular pHCI (pHCI specified in the phci_path
61587c478bd9Sstevel@tonic-gate  * argument) for a particular client (specified in the client_path argument).
61597c478bd9Sstevel@tonic-gate  * Enabling a path means that MPxIO may select the enabled path for routing
61607c478bd9Sstevel@tonic-gate  * future I/O requests, subject to other path state constraints.
6161ee28b439Scm136836  * NOTE: this will be removed once the NWS files are changed to use the new
6162ee28b439Scm136836  * mdi_{enable,disable}_path interfaces
61637c478bd9Sstevel@tonic-gate  */
61647c478bd9Sstevel@tonic-gate 
61657c478bd9Sstevel@tonic-gate int
61667c478bd9Sstevel@tonic-gate mdi_pi_enable(dev_info_t *cdip, dev_info_t *pdip, int flags)
61677c478bd9Sstevel@tonic-gate {
61687c478bd9Sstevel@tonic-gate 	return (i_mdi_pi_enable_disable(cdip, pdip, flags, MDI_ENABLE_OP));
61697c478bd9Sstevel@tonic-gate }
61707c478bd9Sstevel@tonic-gate 
6171ee28b439Scm136836 /*
6172ee28b439Scm136836  * Common routine for doing enable/disable.
6173ee28b439Scm136836  */
6174ee28b439Scm136836 static mdi_pathinfo_t *
6175ee28b439Scm136836 i_mdi_enable_disable_path(mdi_pathinfo_t *pip, mdi_vhci_t *vh, int flags,
6176ee28b439Scm136836 		int op)
6177ee28b439Scm136836 {
6178ee28b439Scm136836 	int		sync_flag = 0;
6179ee28b439Scm136836 	int		rv;
6180ee28b439Scm136836 	mdi_pathinfo_t 	*next;
6181ee28b439Scm136836 	int		(*f)() = NULL;
6182ee28b439Scm136836 
61836c8e19d4SZach Kissel 	/*
61846c8e19d4SZach Kissel 	 * Check to make sure the path is not already in the
61856c8e19d4SZach Kissel 	 * requested state. If it is just return the next path
61866c8e19d4SZach Kissel 	 * as we have nothing to do here.
61876c8e19d4SZach Kissel 	 */
61886c8e19d4SZach Kissel 	if ((MDI_PI_IS_DISABLE(pip) && op == MDI_DISABLE_OP) ||
61896c8e19d4SZach Kissel 	    (!MDI_PI_IS_DISABLE(pip) && op == MDI_ENABLE_OP)) {
61906c8e19d4SZach Kissel 		MDI_PI_LOCK(pip);
61916c8e19d4SZach Kissel 		next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
61926c8e19d4SZach Kissel 		MDI_PI_UNLOCK(pip);
61936c8e19d4SZach Kissel 		return (next);
61946c8e19d4SZach Kissel 	}
61956c8e19d4SZach Kissel 
6196ee28b439Scm136836 	f = vh->vh_ops->vo_pi_state_change;
6197ee28b439Scm136836 
6198ee28b439Scm136836 	sync_flag = (flags << 8) & 0xf00;
6199ee28b439Scm136836 
6200ee28b439Scm136836 	/*
6201ee28b439Scm136836 	 * Do a callback into the mdi consumer to let it
6202ee28b439Scm136836 	 * know that path is about to get enabled/disabled.
6203ee28b439Scm136836 	 */
6204ee28b439Scm136836 	if (f != NULL) {
6205ee28b439Scm136836 		rv = (*f)(vh->vh_dip, pip, 0,
6206ee28b439Scm136836 			MDI_PI_EXT_STATE(pip),
6207ee28b439Scm136836 			MDI_EXT_STATE_CHANGE | sync_flag |
6208ee28b439Scm136836 			op | MDI_BEFORE_STATE_CHANGE);
6209ee28b439Scm136836 		if (rv != MDI_SUCCESS) {
62104c06356bSdh142964 			MDI_DEBUG(2, (MDI_WARN, vh->vh_dip,
62114c06356bSdh142964 			    "vo_pi_state_change: failed rv = %x", rv));
6212ee28b439Scm136836 		}
6213ee28b439Scm136836 	}
6214ee28b439Scm136836 	MDI_PI_LOCK(pip);
6215ee28b439Scm136836 	next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_phci_link;
6216ee28b439Scm136836 
6217ee28b439Scm136836 	switch (flags) {
6218ee28b439Scm136836 		case USER_DISABLE:
62195e3986cbScth 			if (op == MDI_DISABLE_OP) {
6220ee28b439Scm136836 				MDI_PI_SET_USER_DISABLE(pip);
62215e3986cbScth 			} else {
6222ee28b439Scm136836 				MDI_PI_SET_USER_ENABLE(pip);
62235e3986cbScth 			}
6224ee28b439Scm136836 			break;
6225ee28b439Scm136836 		case DRIVER_DISABLE:
62265e3986cbScth 			if (op == MDI_DISABLE_OP) {
6227ee28b439Scm136836 				MDI_PI_SET_DRV_DISABLE(pip);
62285e3986cbScth 			} else {
6229ee28b439Scm136836 				MDI_PI_SET_DRV_ENABLE(pip);
62305e3986cbScth 			}
6231ee28b439Scm136836 			break;
6232ee28b439Scm136836 		case DRIVER_DISABLE_TRANSIENT:
62335e3986cbScth 			if (op == MDI_DISABLE_OP && rv == MDI_SUCCESS) {
6234ee28b439Scm136836 				MDI_PI_SET_DRV_DISABLE_TRANS(pip);
62355e3986cbScth 			} else {
6236ee28b439Scm136836 				MDI_PI_SET_DRV_ENABLE_TRANS(pip);
62375e3986cbScth 			}
6238ee28b439Scm136836 			break;
6239ee28b439Scm136836 	}
6240ee28b439Scm136836 	MDI_PI_UNLOCK(pip);
6241ee28b439Scm136836 	/*
6242ee28b439Scm136836 	 * Do a callback into the mdi consumer to let it
6243ee28b439Scm136836 	 * know that path is now enabled/disabled.
6244ee28b439Scm136836 	 */
6245ee28b439Scm136836 	if (f != NULL) {
6246ee28b439Scm136836 		rv = (*f)(vh->vh_dip, pip, 0,
6247ee28b439Scm136836 			MDI_PI_EXT_STATE(pip),
6248ee28b439Scm136836 			MDI_EXT_STATE_CHANGE | sync_flag |
6249ee28b439Scm136836 			op | MDI_AFTER_STATE_CHANGE);
6250ee28b439Scm136836 		if (rv != MDI_SUCCESS) {
62514c06356bSdh142964 			MDI_DEBUG(2, (MDI_WARN, vh->vh_dip,
62524c06356bSdh142964 			    "vo_pi_state_change failed: rv = %x", rv));
6253ee28b439Scm136836 		}
6254ee28b439Scm136836 	}
6255ee28b439Scm136836 	return (next);
6256ee28b439Scm136836 }
62577c478bd9Sstevel@tonic-gate 
62587c478bd9Sstevel@tonic-gate /*
62597c478bd9Sstevel@tonic-gate  * Common routine for doing enable/disable.
6260ee28b439Scm136836  * NOTE: this will be removed once the NWS files are changed to use the new
6261ee28b439Scm136836  * mdi_{enable,disable}_path has been putback
62627c478bd9Sstevel@tonic-gate  */
62637c478bd9Sstevel@tonic-gate int
62647c478bd9Sstevel@tonic-gate i_mdi_pi_enable_disable(dev_info_t *cdip, dev_info_t *pdip, int flags, int op)
62657c478bd9Sstevel@tonic-gate {
62667c478bd9Sstevel@tonic-gate 
62677c478bd9Sstevel@tonic-gate 	mdi_phci_t	*ph;
62687c478bd9Sstevel@tonic-gate 	mdi_vhci_t	*vh = NULL;
62697c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
62707c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t	*next, *pip;
62717c478bd9Sstevel@tonic-gate 	int		found_it;
62727c478bd9Sstevel@tonic-gate 
62737c478bd9Sstevel@tonic-gate 	ph = i_devi_get_phci(pdip);
62744c06356bSdh142964 	MDI_DEBUG(5, (MDI_NOTE, cdip ? cdip : pdip,
62754c06356bSdh142964 	    "!op = %d pdip = %p cdip = %p", op, (void *)pdip,
62765e3986cbScth 	    (void *)cdip));
62777c478bd9Sstevel@tonic-gate 	if (ph == NULL) {
62784c06356bSdh142964 		MDI_DEBUG(1, (MDI_NOTE, cdip ? cdip : pdip,
62794c06356bSdh142964 		    "!failed: operation %d: NULL ph", op));
62807c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
62817c478bd9Sstevel@tonic-gate 	}
62827c478bd9Sstevel@tonic-gate 
62837c478bd9Sstevel@tonic-gate 	if ((op != MDI_ENABLE_OP) && (op != MDI_DISABLE_OP)) {
62844c06356bSdh142964 		MDI_DEBUG(1, (MDI_NOTE, cdip ? cdip : pdip,
62854c06356bSdh142964 		    "!failed: invalid operation %d", op));
62867c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
62877c478bd9Sstevel@tonic-gate 	}
62887c478bd9Sstevel@tonic-gate 
62897c478bd9Sstevel@tonic-gate 	vh = ph->ph_vhci;
62907c478bd9Sstevel@tonic-gate 
62917c478bd9Sstevel@tonic-gate 	if (cdip == NULL) {
62927c478bd9Sstevel@tonic-gate 		/*
62937c478bd9Sstevel@tonic-gate 		 * Need to mark the Phci as enabled/disabled.
62947c478bd9Sstevel@tonic-gate 		 */
62954c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, cdip ? cdip : pdip,
62964c06356bSdh142964 		    "op %d for the phci", op));
62977c478bd9Sstevel@tonic-gate 		MDI_PHCI_LOCK(ph);
62987c478bd9Sstevel@tonic-gate 		switch (flags) {
62997c478bd9Sstevel@tonic-gate 			case USER_DISABLE:
63005e3986cbScth 				if (op == MDI_DISABLE_OP) {
63017c478bd9Sstevel@tonic-gate 					MDI_PHCI_SET_USER_DISABLE(ph);
63025e3986cbScth 				} else {
63037c478bd9Sstevel@tonic-gate 					MDI_PHCI_SET_USER_ENABLE(ph);
63045e3986cbScth 				}
63057c478bd9Sstevel@tonic-gate 				break;
63067c478bd9Sstevel@tonic-gate 			case DRIVER_DISABLE:
63075e3986cbScth 				if (op == MDI_DISABLE_OP) {
63087c478bd9Sstevel@tonic-gate 					MDI_PHCI_SET_DRV_DISABLE(ph);
63095e3986cbScth 				} else {
63107c478bd9Sstevel@tonic-gate 					MDI_PHCI_SET_DRV_ENABLE(ph);
63115e3986cbScth 				}
63127c478bd9Sstevel@tonic-gate 				break;
63137c478bd9Sstevel@tonic-gate 			case DRIVER_DISABLE_TRANSIENT:
63145e3986cbScth 				if (op == MDI_DISABLE_OP) {
63157c478bd9Sstevel@tonic-gate 					MDI_PHCI_SET_DRV_DISABLE_TRANSIENT(ph);
63165e3986cbScth 				} else {
63177c478bd9Sstevel@tonic-gate 					MDI_PHCI_SET_DRV_ENABLE_TRANSIENT(ph);
63185e3986cbScth 				}
63197c478bd9Sstevel@tonic-gate 				break;
63207c478bd9Sstevel@tonic-gate 			default:
63217c478bd9Sstevel@tonic-gate 				MDI_PHCI_UNLOCK(ph);
63224c06356bSdh142964 				MDI_DEBUG(1, (MDI_NOTE, cdip ? cdip : pdip,
63234c06356bSdh142964 				    "!invalid flag argument= %d", flags));
63247c478bd9Sstevel@tonic-gate 		}
63257c478bd9Sstevel@tonic-gate 
63267c478bd9Sstevel@tonic-gate 		/*
63277c478bd9Sstevel@tonic-gate 		 * Phci has been disabled. Now try to enable/disable
63287c478bd9Sstevel@tonic-gate 		 * path info's to each client.
63297c478bd9Sstevel@tonic-gate 		 */
63307c478bd9Sstevel@tonic-gate 		pip = ph->ph_path_head;
63317c478bd9Sstevel@tonic-gate 		while (pip != NULL) {
6332ee28b439Scm136836 			pip = i_mdi_enable_disable_path(pip, vh, flags, op);
63337c478bd9Sstevel@tonic-gate 		}
63347c478bd9Sstevel@tonic-gate 		MDI_PHCI_UNLOCK(ph);
63357c478bd9Sstevel@tonic-gate 	} else {
63367c478bd9Sstevel@tonic-gate 
63377c478bd9Sstevel@tonic-gate 		/*
63387c478bd9Sstevel@tonic-gate 		 * Disable a specific client.
63397c478bd9Sstevel@tonic-gate 		 */
63407c478bd9Sstevel@tonic-gate 		ct = i_devi_get_client(cdip);
63417c478bd9Sstevel@tonic-gate 		if (ct == NULL) {
63424c06356bSdh142964 			MDI_DEBUG(1, (MDI_NOTE, cdip ? cdip : pdip,
63434c06356bSdh142964 			    "!failed: operation = %d: NULL ct", op));
63447c478bd9Sstevel@tonic-gate 			return (MDI_FAILURE);
63457c478bd9Sstevel@tonic-gate 		}
63467c478bd9Sstevel@tonic-gate 
63477c478bd9Sstevel@tonic-gate 		MDI_CLIENT_LOCK(ct);
63487c478bd9Sstevel@tonic-gate 		pip = ct->ct_path_head;
63497c478bd9Sstevel@tonic-gate 		found_it = 0;
63507c478bd9Sstevel@tonic-gate 		while (pip != NULL) {
63517c478bd9Sstevel@tonic-gate 			MDI_PI_LOCK(pip);
63527c478bd9Sstevel@tonic-gate 			next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link;
63537c478bd9Sstevel@tonic-gate 			if (MDI_PI(pip)->pi_phci == ph) {
63547c478bd9Sstevel@tonic-gate 				MDI_PI_UNLOCK(pip);
63557c478bd9Sstevel@tonic-gate 				found_it = 1;
63567c478bd9Sstevel@tonic-gate 				break;
63577c478bd9Sstevel@tonic-gate 			}
63587c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
63597c478bd9Sstevel@tonic-gate 			pip = next;
63607c478bd9Sstevel@tonic-gate 		}
63617c478bd9Sstevel@tonic-gate 
6362ee28b439Scm136836 
63637c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
63647c478bd9Sstevel@tonic-gate 		if (found_it == 0) {
63654c06356bSdh142964 			MDI_DEBUG(1, (MDI_NOTE, cdip ? cdip : pdip,
63664c06356bSdh142964 			    "!failed. Could not find corresponding pip\n"));
63677c478bd9Sstevel@tonic-gate 			return (MDI_FAILURE);
63687c478bd9Sstevel@tonic-gate 		}
6369ee28b439Scm136836 
6370ee28b439Scm136836 		(void) i_mdi_enable_disable_path(pip, vh, flags, op);
63717c478bd9Sstevel@tonic-gate 	}
63727c478bd9Sstevel@tonic-gate 
63734c06356bSdh142964 	MDI_DEBUG(5, (MDI_NOTE, cdip ? cdip : pdip,
63744c06356bSdh142964 	    "!op %d returning success pdip = %p cdip = %p",
63755e3986cbScth 	    op, (void *)pdip, (void *)cdip));
63767c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
63777c478bd9Sstevel@tonic-gate }
63787c478bd9Sstevel@tonic-gate 
63797c478bd9Sstevel@tonic-gate /*
63807c478bd9Sstevel@tonic-gate  * Ensure phci powered up
63817c478bd9Sstevel@tonic-gate  */
63827c478bd9Sstevel@tonic-gate static void
63837c478bd9Sstevel@tonic-gate i_mdi_pm_hold_pip(mdi_pathinfo_t *pip)
63847c478bd9Sstevel@tonic-gate {
63857c478bd9Sstevel@tonic-gate 	dev_info_t	*ph_dip;
63867c478bd9Sstevel@tonic-gate 
63877c478bd9Sstevel@tonic-gate 	ASSERT(pip != NULL);
63885e3986cbScth 	ASSERT(MDI_PI_LOCKED(pip));
63897c478bd9Sstevel@tonic-gate 
63907c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_pm_held) {
63917c478bd9Sstevel@tonic-gate 		return;
63927c478bd9Sstevel@tonic-gate 	}
63937c478bd9Sstevel@tonic-gate 
63947c478bd9Sstevel@tonic-gate 	ph_dip = mdi_pi_get_phci(pip);
63954c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, ph_dip,
63964c06356bSdh142964 	    "%s %p", mdi_pi_spathname(pip), (void *)pip));
63977c478bd9Sstevel@tonic-gate 	if (ph_dip == NULL) {
63987c478bd9Sstevel@tonic-gate 		return;
63997c478bd9Sstevel@tonic-gate 	}
64007c478bd9Sstevel@tonic-gate 
64017c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
64024c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, ph_dip, "kidsupcnt was %d",
64037c478bd9Sstevel@tonic-gate 	    DEVI(ph_dip)->devi_pm_kidsupcnt));
64047c478bd9Sstevel@tonic-gate 	pm_hold_power(ph_dip);
64054c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, ph_dip, "kidsupcnt is %d",
64067c478bd9Sstevel@tonic-gate 	    DEVI(ph_dip)->devi_pm_kidsupcnt));
64077c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
64087c478bd9Sstevel@tonic-gate 
64095e3986cbScth 	/* If PM_GET_PM_INFO is NULL the pm_hold_power above was a noop */
64105e3986cbScth 	if (DEVI(ph_dip)->devi_pm_info)
64117c478bd9Sstevel@tonic-gate 		MDI_PI(pip)->pi_pm_held = 1;
64127c478bd9Sstevel@tonic-gate }
64137c478bd9Sstevel@tonic-gate 
64147c478bd9Sstevel@tonic-gate /*
64157c478bd9Sstevel@tonic-gate  * Allow phci powered down
64167c478bd9Sstevel@tonic-gate  */
64177c478bd9Sstevel@tonic-gate static void
64187c478bd9Sstevel@tonic-gate i_mdi_pm_rele_pip(mdi_pathinfo_t *pip)
64197c478bd9Sstevel@tonic-gate {
64207c478bd9Sstevel@tonic-gate 	dev_info_t	*ph_dip = NULL;
64217c478bd9Sstevel@tonic-gate 
64227c478bd9Sstevel@tonic-gate 	ASSERT(pip != NULL);
64235e3986cbScth 	ASSERT(MDI_PI_LOCKED(pip));
64247c478bd9Sstevel@tonic-gate 
64257c478bd9Sstevel@tonic-gate 	if (MDI_PI(pip)->pi_pm_held == 0) {
64267c478bd9Sstevel@tonic-gate 		return;
64277c478bd9Sstevel@tonic-gate 	}
64287c478bd9Sstevel@tonic-gate 
64297c478bd9Sstevel@tonic-gate 	ph_dip = mdi_pi_get_phci(pip);
64307c478bd9Sstevel@tonic-gate 	ASSERT(ph_dip != NULL);
64317c478bd9Sstevel@tonic-gate 
64324c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, ph_dip,
64334c06356bSdh142964 	    "%s %p", mdi_pi_spathname(pip), (void *)pip));
64344c06356bSdh142964 
64357c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
64364c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, ph_dip,
64374c06356bSdh142964 	    "kidsupcnt was %d", DEVI(ph_dip)->devi_pm_kidsupcnt));
64387c478bd9Sstevel@tonic-gate 	pm_rele_power(ph_dip);
64394c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, ph_dip,
64404c06356bSdh142964 	    "kidsupcnt is %d", DEVI(ph_dip)->devi_pm_kidsupcnt));
64417c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
64424c06356bSdh142964 
64437c478bd9Sstevel@tonic-gate 	MDI_PI(pip)->pi_pm_held = 0;
64447c478bd9Sstevel@tonic-gate }
64457c478bd9Sstevel@tonic-gate 
64467c478bd9Sstevel@tonic-gate static void
64477c478bd9Sstevel@tonic-gate i_mdi_pm_hold_client(mdi_client_t *ct, int incr)
64487c478bd9Sstevel@tonic-gate {
64495e3986cbScth 	ASSERT(MDI_CLIENT_LOCKED(ct));
64507c478bd9Sstevel@tonic-gate 
64517c478bd9Sstevel@tonic-gate 	ct->ct_power_cnt += incr;
64524c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, ct->ct_dip,
64534c06356bSdh142964 	    "%p ct_power_cnt = %d incr = %d",
64544c06356bSdh142964 	    (void *)ct, ct->ct_power_cnt, incr));
64557c478bd9Sstevel@tonic-gate 	ASSERT(ct->ct_power_cnt >= 0);
64567c478bd9Sstevel@tonic-gate }
64577c478bd9Sstevel@tonic-gate 
64587c478bd9Sstevel@tonic-gate static void
64597c478bd9Sstevel@tonic-gate i_mdi_rele_all_phci(mdi_client_t *ct)
64607c478bd9Sstevel@tonic-gate {
64617c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t  *pip;
64627c478bd9Sstevel@tonic-gate 
64635e3986cbScth 	ASSERT(MDI_CLIENT_LOCKED(ct));
64647c478bd9Sstevel@tonic-gate 	pip = (mdi_pathinfo_t *)ct->ct_path_head;
64657c478bd9Sstevel@tonic-gate 	while (pip != NULL) {
64667c478bd9Sstevel@tonic-gate 		mdi_hold_path(pip);
64677c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
64687c478bd9Sstevel@tonic-gate 		i_mdi_pm_rele_pip(pip);
64697c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
64707c478bd9Sstevel@tonic-gate 		mdi_rele_path(pip);
64717c478bd9Sstevel@tonic-gate 		pip = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link;
64727c478bd9Sstevel@tonic-gate 	}
64737c478bd9Sstevel@tonic-gate }
64747c478bd9Sstevel@tonic-gate 
64757c478bd9Sstevel@tonic-gate static void
64767c478bd9Sstevel@tonic-gate i_mdi_pm_rele_client(mdi_client_t *ct, int decr)
64777c478bd9Sstevel@tonic-gate {
64785e3986cbScth 	ASSERT(MDI_CLIENT_LOCKED(ct));
64797c478bd9Sstevel@tonic-gate 
6480737d277aScth 	if (i_ddi_devi_attached(ct->ct_dip)) {
64817c478bd9Sstevel@tonic-gate 		ct->ct_power_cnt -= decr;
64824c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, ct->ct_dip,
64834c06356bSdh142964 		    "%p ct_power_cnt = %d decr = %d",
64845e3986cbScth 		    (void *)ct, ct->ct_power_cnt, decr));
64857c478bd9Sstevel@tonic-gate 	}
64867c478bd9Sstevel@tonic-gate 
64877c478bd9Sstevel@tonic-gate 	ASSERT(ct->ct_power_cnt >= 0);
64887c478bd9Sstevel@tonic-gate 	if (ct->ct_power_cnt == 0) {
64897c478bd9Sstevel@tonic-gate 		i_mdi_rele_all_phci(ct);
64907c478bd9Sstevel@tonic-gate 		return;
64917c478bd9Sstevel@tonic-gate 	}
64927c478bd9Sstevel@tonic-gate }
64937c478bd9Sstevel@tonic-gate 
64947c478bd9Sstevel@tonic-gate static void
64957c478bd9Sstevel@tonic-gate i_mdi_pm_reset_client(mdi_client_t *ct)
64967c478bd9Sstevel@tonic-gate {
64974c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, ct->ct_dip,
64984c06356bSdh142964 	    "%p ct_power_cnt = %d", (void *)ct, ct->ct_power_cnt));
64995e3986cbScth 	ASSERT(MDI_CLIENT_LOCKED(ct));
65007c478bd9Sstevel@tonic-gate 	ct->ct_power_cnt = 0;
65017c478bd9Sstevel@tonic-gate 	i_mdi_rele_all_phci(ct);
650278dc6db2Sllai1 	ct->ct_powercnt_config = 0;
650378dc6db2Sllai1 	ct->ct_powercnt_unconfig = 0;
65047c478bd9Sstevel@tonic-gate 	ct->ct_powercnt_reset = 1;
65057c478bd9Sstevel@tonic-gate }
65067c478bd9Sstevel@tonic-gate 
65077c478bd9Sstevel@tonic-gate static int
65087c478bd9Sstevel@tonic-gate i_mdi_power_one_phci(mdi_pathinfo_t *pip)
65097c478bd9Sstevel@tonic-gate {
65107c478bd9Sstevel@tonic-gate 	int		ret;
65117c478bd9Sstevel@tonic-gate 	dev_info_t	*ph_dip;
65127c478bd9Sstevel@tonic-gate 
65137c478bd9Sstevel@tonic-gate 	MDI_PI_LOCK(pip);
65147c478bd9Sstevel@tonic-gate 	i_mdi_pm_hold_pip(pip);
65157c478bd9Sstevel@tonic-gate 
65167c478bd9Sstevel@tonic-gate 	ph_dip = mdi_pi_get_phci(pip);
65177c478bd9Sstevel@tonic-gate 	MDI_PI_UNLOCK(pip);
65187c478bd9Sstevel@tonic-gate 
65197c478bd9Sstevel@tonic-gate 	/* bring all components of phci to full power */
65204c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, ph_dip,
65214c06356bSdh142964 	    "pm_powerup for %s%d %p", ddi_driver_name(ph_dip),
65225e3986cbScth 	    ddi_get_instance(ph_dip), (void *)pip));
65237c478bd9Sstevel@tonic-gate 
65247c478bd9Sstevel@tonic-gate 	ret = pm_powerup(ph_dip);
65257c478bd9Sstevel@tonic-gate 
65267c478bd9Sstevel@tonic-gate 	if (ret == DDI_FAILURE) {
65274c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, ph_dip,
65284c06356bSdh142964 		    "pm_powerup FAILED for %s%d %p",
652955e592a2SRandall Ralphs 		    ddi_driver_name(ph_dip), ddi_get_instance(ph_dip),
65305e3986cbScth 		    (void *)pip));
65317c478bd9Sstevel@tonic-gate 
65327c478bd9Sstevel@tonic-gate 		MDI_PI_LOCK(pip);
65337c478bd9Sstevel@tonic-gate 		i_mdi_pm_rele_pip(pip);
65347c478bd9Sstevel@tonic-gate 		MDI_PI_UNLOCK(pip);
65357c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
65367c478bd9Sstevel@tonic-gate 	}
65377c478bd9Sstevel@tonic-gate 
65387c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
65397c478bd9Sstevel@tonic-gate }
65407c478bd9Sstevel@tonic-gate 
65417c478bd9Sstevel@tonic-gate static int
65427c478bd9Sstevel@tonic-gate i_mdi_power_all_phci(mdi_client_t *ct)
65437c478bd9Sstevel@tonic-gate {
65447c478bd9Sstevel@tonic-gate 	mdi_pathinfo_t  *pip;
65457c478bd9Sstevel@tonic-gate 	int		succeeded = 0;
65467c478bd9Sstevel@tonic-gate 
65475e3986cbScth 	ASSERT(MDI_CLIENT_LOCKED(ct));
65487c478bd9Sstevel@tonic-gate 	pip = (mdi_pathinfo_t *)ct->ct_path_head;
65497c478bd9Sstevel@tonic-gate 	while (pip != NULL) {
65505e3986cbScth 		/*
65515e3986cbScth 		 * Don't power if MDI_PATHINFO_STATE_FAULT
65525e3986cbScth 		 * or MDI_PATHINFO_STATE_OFFLINE.
65535e3986cbScth 		 */
65545e3986cbScth 		if (MDI_PI_IS_INIT(pip) ||
65555e3986cbScth 		    MDI_PI_IS_ONLINE(pip) || MDI_PI_IS_STANDBY(pip)) {
65567c478bd9Sstevel@tonic-gate 			mdi_hold_path(pip);
65577c478bd9Sstevel@tonic-gate 			MDI_CLIENT_UNLOCK(ct);
65587c478bd9Sstevel@tonic-gate 			if (i_mdi_power_one_phci(pip) == MDI_SUCCESS)
65597c478bd9Sstevel@tonic-gate 				succeeded = 1;
65607c478bd9Sstevel@tonic-gate 
65617c478bd9Sstevel@tonic-gate 			ASSERT(ct == MDI_PI(pip)->pi_client);
65627c478bd9Sstevel@tonic-gate 			MDI_CLIENT_LOCK(ct);
65637c478bd9Sstevel@tonic-gate 			mdi_rele_path(pip);
65645e3986cbScth 		}
65657c478bd9Sstevel@tonic-gate 		pip = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link;
65667c478bd9Sstevel@tonic-gate 	}
65677c478bd9Sstevel@tonic-gate 
65687c478bd9Sstevel@tonic-gate 	return (succeeded ? MDI_SUCCESS : MDI_FAILURE);
65697c478bd9Sstevel@tonic-gate }
65707c478bd9Sstevel@tonic-gate 
/*
 * mdi_bus_power():
 *		1. Place the phci(s) into powered up state so that
 *		   client can do power management
 *		2. Ensure phci powered up as client power managing
 *
 *		Only BUS_POWER_PRE_NOTIFICATION, BUS_POWER_POST_NOTIFICATION
 *		and BUS_POWER_HAS_CHANGED are processed here.
 *		BUS_POWER_NOINVOL is rejected and every other operation is
 *		handed to pm_busop_bus_power().
 * Return Values:
 *		MDI_SUCCESS
 *		MDI_FAILURE
 *		(for operations passed through, whatever
 *		pm_busop_bus_power() returns)
 */
int
mdi_bus_power(dev_info_t *parent, void *impl_arg, pm_bus_power_op_t op,
    void *arg, void *result)
{
	int			ret = MDI_SUCCESS;
	pm_bp_child_pwrchg_t	*bpc;
	mdi_client_t		*ct;
	dev_info_t		*cdip;
	pm_bp_has_changed_t	*bphc;

	/*
	 * BUS_POWER_NOINVOL not supported
	 */
	if (op == BUS_POWER_NOINVOL)
		return (MDI_FAILURE);

	/*
	 * ignore other OPs.
	 * return quickly to save cpu cycles on the ct processing
	 */
	switch (op) {
	case BUS_POWER_PRE_NOTIFICATION:
	case BUS_POWER_POST_NOTIFICATION:
		/* arg describes a child power level change request */
		bpc = (pm_bp_child_pwrchg_t *)arg;
		cdip = bpc->bpc_dip;
		break;
	case BUS_POWER_HAS_CHANGED:
		/* arg describes a power level change that already happened */
		bphc = (pm_bp_has_changed_t *)arg;
		cdip = bphc->bphc_dip;
		break;
	default:
		return (pm_busop_bus_power(parent, impl_arg, op, arg, result));
	}

	ASSERT(MDI_CLIENT(cdip));

	ct = i_devi_get_client(cdip);
	if (ct == NULL)
		return (MDI_FAILURE);

	/*
	 * wait till the mdi_pathinfo node state change are processed
	 */
	MDI_CLIENT_LOCK(ct);
	switch (op) {
	case BUS_POWER_PRE_NOTIFICATION:
		MDI_DEBUG(4, (MDI_NOTE, bpc->bpc_dip,
		    "BUS_POWER_PRE_NOTIFICATION:"
		    "%s@%s, olevel=%d, nlevel=%d, comp=%d",
		    ddi_node_name(bpc->bpc_dip), PM_ADDR(bpc->bpc_dip),
		    bpc->bpc_olevel, bpc->bpc_nlevel, bpc->bpc_comp));

		/* serialize power level change per client */
		while (MDI_CLIENT_IS_POWER_TRANSITION(ct))
			cv_wait(&ct->ct_powerchange_cv, &ct->ct_mutex);

		/*
		 * Mark the transition as in progress; it is cleared again in
		 * the BUS_POWER_POST_NOTIFICATION case below.
		 */
		MDI_CLIENT_SET_POWER_TRANSITION(ct);

		/* nothing holds the phci(s) yet: power them up first */
		if (ct->ct_power_cnt == 0) {
			ret = i_mdi_power_all_phci(ct);
		}

		/*
		 * if new_level > 0:
		 *	- hold phci(s)
		 *	- power up phci(s) if not already
		 * ignore power down
		 */
		if (bpc->bpc_nlevel > 0) {
			if (!DEVI_IS_ATTACHING(ct->ct_dip)) {
				MDI_DEBUG(4, (MDI_NOTE, bpc->bpc_dip,
				    "i_mdi_pm_hold_client\n"));
				i_mdi_pm_hold_client(ct, ct->ct_path_count);
			}
		}
		break;
	case BUS_POWER_POST_NOTIFICATION:
		MDI_DEBUG(4, (MDI_NOTE, bpc->bpc_dip,
		    "BUS_POWER_POST_NOTIFICATION:"
		    "%s@%s, olevel=%d, nlevel=%d, comp=%d result=%d",
		    ddi_node_name(bpc->bpc_dip), PM_ADDR(bpc->bpc_dip),
		    bpc->bpc_olevel, bpc->bpc_nlevel, bpc->bpc_comp,
		    *(int *)result));

		/* record the client's new power state if the change worked */
		if (*(int *)result == DDI_SUCCESS) {
			if (bpc->bpc_nlevel > 0) {
				MDI_CLIENT_SET_POWER_UP(ct);
			} else {
				MDI_CLIENT_SET_POWER_DOWN(ct);
			}
		}

		/* release the hold we did in pre-notification */
		if (bpc->bpc_nlevel > 0 && (*(int *)result != DDI_SUCCESS) &&
		    !DEVI_IS_ATTACHING(ct->ct_dip)) {
			MDI_DEBUG(4, (MDI_NOTE, bpc->bpc_dip,
			    "i_mdi_pm_rele_client\n"));
			i_mdi_pm_rele_client(ct, ct->ct_path_count);
		}

		/* successful power down */
		if (bpc->bpc_nlevel == 0 && (*(int *)result == DDI_SUCCESS)) {
			/* another thread might started attaching */
			if (DEVI_IS_ATTACHING(ct->ct_dip)) {
				MDI_DEBUG(4, (MDI_NOTE, bpc->bpc_dip,
				    "i_mdi_pm_rele_client\n"));
				i_mdi_pm_rele_client(ct, ct->ct_path_count);
			/* detaching has been taken care in pm_post_unconfig */
			} else if (!DEVI_IS_DETACHING(ct->ct_dip)) {
				MDI_DEBUG(4, (MDI_NOTE, bpc->bpc_dip,
				    "i_mdi_pm_reset_client\n"));
				i_mdi_pm_reset_client(ct);
			}
		}

		/* transition finished: wake up anybody waiting for it */
		MDI_CLIENT_CLEAR_POWER_TRANSITION(ct);
		cv_broadcast(&ct->ct_powerchange_cv);

		break;

	/* need to do more */
	case BUS_POWER_HAS_CHANGED:
		MDI_DEBUG(4, (MDI_NOTE, bphc->bphc_dip,
		    "BUS_POWER_HAS_CHANGED:"
		    "%s@%s, olevel=%d, nlevel=%d, comp=%d",
		    ddi_node_name(bphc->bphc_dip), PM_ADDR(bphc->bphc_dip),
		    bphc->bphc_olevel, bphc->bphc_nlevel, bphc->bphc_comp));

		/* power level went up: power and hold the phci(s) */
		if (bphc->bphc_nlevel > 0 &&
		    bphc->bphc_nlevel > bphc->bphc_olevel) {
			if (ct->ct_power_cnt == 0) {
				ret = i_mdi_power_all_phci(ct);
			}
			MDI_DEBUG(4, (MDI_NOTE, bphc->bphc_dip,
			    "i_mdi_pm_hold_client\n"));
			i_mdi_pm_hold_client(ct, ct->ct_path_count);
		}

		/* powered down from a level other than -1: drop the hold */
		if (bphc->bphc_nlevel == 0 && bphc->bphc_olevel != -1) {
			MDI_DEBUG(4, (MDI_NOTE, bphc->bphc_dip,
			    "i_mdi_pm_rele_client\n"));
			i_mdi_pm_rele_client(ct, ct->ct_path_count);
		}
		break;
	}

	MDI_CLIENT_UNLOCK(ct);
	return (ret);
}
67287c478bd9Sstevel@tonic-gate 
67297c478bd9Sstevel@tonic-gate static int
67307c478bd9Sstevel@tonic-gate i_mdi_pm_pre_config_one(dev_info_t *child)
67317c478bd9Sstevel@tonic-gate {
67327c478bd9Sstevel@tonic-gate 	int		ret = MDI_SUCCESS;
67337c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
67347c478bd9Sstevel@tonic-gate 
67357c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(child);
67367c478bd9Sstevel@tonic-gate 	if (ct == NULL)
67377c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
67387c478bd9Sstevel@tonic-gate 
67397c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
67407c478bd9Sstevel@tonic-gate 	while (MDI_CLIENT_IS_POWER_TRANSITION(ct))
67417c478bd9Sstevel@tonic-gate 		cv_wait(&ct->ct_powerchange_cv, &ct->ct_mutex);
67427c478bd9Sstevel@tonic-gate 
67437c478bd9Sstevel@tonic-gate 	if (!MDI_CLIENT_IS_FAILED(ct)) {
67447c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
67454c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "already configured\n"));
67467c478bd9Sstevel@tonic-gate 		return (MDI_SUCCESS);
67477c478bd9Sstevel@tonic-gate 	}
67487c478bd9Sstevel@tonic-gate 
674978dc6db2Sllai1 	if (ct->ct_powercnt_config) {
67507c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
67514c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "already held\n"));
67527c478bd9Sstevel@tonic-gate 		return (MDI_SUCCESS);
67537c478bd9Sstevel@tonic-gate 	}
67547c478bd9Sstevel@tonic-gate 
67557c478bd9Sstevel@tonic-gate 	if (ct->ct_power_cnt == 0) {
67567c478bd9Sstevel@tonic-gate 		ret = i_mdi_power_all_phci(ct);
67577c478bd9Sstevel@tonic-gate 	}
67584c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, child, "i_mdi_pm_hold_client\n"));
67597c478bd9Sstevel@tonic-gate 	i_mdi_pm_hold_client(ct, ct->ct_path_count);
676078dc6db2Sllai1 	ct->ct_powercnt_config = 1;
67617c478bd9Sstevel@tonic-gate 	ct->ct_powercnt_reset = 0;
67627c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
67637c478bd9Sstevel@tonic-gate 	return (ret);
67647c478bd9Sstevel@tonic-gate }
67657c478bd9Sstevel@tonic-gate 
67667c478bd9Sstevel@tonic-gate static int
67675e3986cbScth i_mdi_pm_pre_config(dev_info_t *vdip, dev_info_t *child)
67687c478bd9Sstevel@tonic-gate {
67697c478bd9Sstevel@tonic-gate 	int			ret = MDI_SUCCESS;
67707c478bd9Sstevel@tonic-gate 	dev_info_t		*cdip;
67717c478bd9Sstevel@tonic-gate 	int			circ;
67727c478bd9Sstevel@tonic-gate 
67735e3986cbScth 	ASSERT(MDI_VHCI(vdip));
67747c478bd9Sstevel@tonic-gate 
67757c478bd9Sstevel@tonic-gate 	/* ndi_devi_config_one */
67767c478bd9Sstevel@tonic-gate 	if (child) {
67775e3986cbScth 		ASSERT(DEVI_BUSY_OWNED(vdip));
67787c478bd9Sstevel@tonic-gate 		return (i_mdi_pm_pre_config_one(child));
67797c478bd9Sstevel@tonic-gate 	}
67807c478bd9Sstevel@tonic-gate 
67817c478bd9Sstevel@tonic-gate 	/* devi_config_common */
67825e3986cbScth 	ndi_devi_enter(vdip, &circ);
67835e3986cbScth 	cdip = ddi_get_child(vdip);
67847c478bd9Sstevel@tonic-gate 	while (cdip) {
67857c478bd9Sstevel@tonic-gate 		dev_info_t *next = ddi_get_next_sibling(cdip);
67867c478bd9Sstevel@tonic-gate 
67877c478bd9Sstevel@tonic-gate 		ret = i_mdi_pm_pre_config_one(cdip);
67887c478bd9Sstevel@tonic-gate 		if (ret != MDI_SUCCESS)
67897c478bd9Sstevel@tonic-gate 			break;
67907c478bd9Sstevel@tonic-gate 		cdip = next;
67917c478bd9Sstevel@tonic-gate 	}
67925e3986cbScth 	ndi_devi_exit(vdip, circ);
67937c478bd9Sstevel@tonic-gate 	return (ret);
67947c478bd9Sstevel@tonic-gate }
67957c478bd9Sstevel@tonic-gate 
67967c478bd9Sstevel@tonic-gate static int
67977c478bd9Sstevel@tonic-gate i_mdi_pm_pre_unconfig_one(dev_info_t *child, int *held, int flags)
67987c478bd9Sstevel@tonic-gate {
67997c478bd9Sstevel@tonic-gate 	int		ret = MDI_SUCCESS;
68007c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
68017c478bd9Sstevel@tonic-gate 
68027c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(child);
68037c478bd9Sstevel@tonic-gate 	if (ct == NULL)
68047c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
68057c478bd9Sstevel@tonic-gate 
68067c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
68077c478bd9Sstevel@tonic-gate 	while (MDI_CLIENT_IS_POWER_TRANSITION(ct))
68087c478bd9Sstevel@tonic-gate 		cv_wait(&ct->ct_powerchange_cv, &ct->ct_mutex);
68097c478bd9Sstevel@tonic-gate 
6810737d277aScth 	if (!i_ddi_devi_attached(ct->ct_dip)) {
68114c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "node detached already\n"));
68127c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
68137c478bd9Sstevel@tonic-gate 		return (MDI_SUCCESS);
68147c478bd9Sstevel@tonic-gate 	}
68157c478bd9Sstevel@tonic-gate 
68167c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT_IS_POWERED_DOWN(ct) &&
68177c478bd9Sstevel@tonic-gate 	    (flags & NDI_AUTODETACH)) {
68184c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "auto-modunload\n"));
68197c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
68207c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
68217c478bd9Sstevel@tonic-gate 	}
68227c478bd9Sstevel@tonic-gate 
682378dc6db2Sllai1 	if (ct->ct_powercnt_unconfig) {
68244c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "ct_powercnt_held\n"));
68257c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
68267c478bd9Sstevel@tonic-gate 		*held = 1;
68277c478bd9Sstevel@tonic-gate 		return (MDI_SUCCESS);
68287c478bd9Sstevel@tonic-gate 	}
68297c478bd9Sstevel@tonic-gate 
68307c478bd9Sstevel@tonic-gate 	if (ct->ct_power_cnt == 0) {
68317c478bd9Sstevel@tonic-gate 		ret = i_mdi_power_all_phci(ct);
68327c478bd9Sstevel@tonic-gate 	}
68334c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, child, "i_mdi_pm_hold_client\n"));
68347c478bd9Sstevel@tonic-gate 	i_mdi_pm_hold_client(ct, ct->ct_path_count);
683578dc6db2Sllai1 	ct->ct_powercnt_unconfig = 1;
68367c478bd9Sstevel@tonic-gate 	ct->ct_powercnt_reset = 0;
68377c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
68387c478bd9Sstevel@tonic-gate 	if (ret == MDI_SUCCESS)
68397c478bd9Sstevel@tonic-gate 		*held = 1;
68407c478bd9Sstevel@tonic-gate 	return (ret);
68417c478bd9Sstevel@tonic-gate }
68427c478bd9Sstevel@tonic-gate 
68437c478bd9Sstevel@tonic-gate static int
68445e3986cbScth i_mdi_pm_pre_unconfig(dev_info_t *vdip, dev_info_t *child, int *held,
68457c478bd9Sstevel@tonic-gate     int flags)
68467c478bd9Sstevel@tonic-gate {
68477c478bd9Sstevel@tonic-gate 	int			ret = MDI_SUCCESS;
68487c478bd9Sstevel@tonic-gate 	dev_info_t		*cdip;
68497c478bd9Sstevel@tonic-gate 	int			circ;
68507c478bd9Sstevel@tonic-gate 
68515e3986cbScth 	ASSERT(MDI_VHCI(vdip));
68527c478bd9Sstevel@tonic-gate 	*held = 0;
68537c478bd9Sstevel@tonic-gate 
68547c478bd9Sstevel@tonic-gate 	/* ndi_devi_unconfig_one */
68557c478bd9Sstevel@tonic-gate 	if (child) {
68565e3986cbScth 		ASSERT(DEVI_BUSY_OWNED(vdip));
68577c478bd9Sstevel@tonic-gate 		return (i_mdi_pm_pre_unconfig_one(child, held, flags));
68587c478bd9Sstevel@tonic-gate 	}
68597c478bd9Sstevel@tonic-gate 
68607c478bd9Sstevel@tonic-gate 	/* devi_unconfig_common */
68615e3986cbScth 	ndi_devi_enter(vdip, &circ);
68625e3986cbScth 	cdip = ddi_get_child(vdip);
68637c478bd9Sstevel@tonic-gate 	while (cdip) {
68647c478bd9Sstevel@tonic-gate 		dev_info_t *next = ddi_get_next_sibling(cdip);
68657c478bd9Sstevel@tonic-gate 
68667c478bd9Sstevel@tonic-gate 		ret = i_mdi_pm_pre_unconfig_one(cdip, held, flags);
68677c478bd9Sstevel@tonic-gate 		cdip = next;
68687c478bd9Sstevel@tonic-gate 	}
68695e3986cbScth 	ndi_devi_exit(vdip, circ);
68707c478bd9Sstevel@tonic-gate 
68717c478bd9Sstevel@tonic-gate 	if (*held)
68727c478bd9Sstevel@tonic-gate 		ret = MDI_SUCCESS;
68737c478bd9Sstevel@tonic-gate 
68747c478bd9Sstevel@tonic-gate 	return (ret);
68757c478bd9Sstevel@tonic-gate }
68767c478bd9Sstevel@tonic-gate 
68777c478bd9Sstevel@tonic-gate static void
68787c478bd9Sstevel@tonic-gate i_mdi_pm_post_config_one(dev_info_t *child)
68797c478bd9Sstevel@tonic-gate {
68807c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
68817c478bd9Sstevel@tonic-gate 
68827c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(child);
68837c478bd9Sstevel@tonic-gate 	if (ct == NULL)
68847c478bd9Sstevel@tonic-gate 		return;
68857c478bd9Sstevel@tonic-gate 
68867c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
68877c478bd9Sstevel@tonic-gate 	while (MDI_CLIENT_IS_POWER_TRANSITION(ct))
68887c478bd9Sstevel@tonic-gate 		cv_wait(&ct->ct_powerchange_cv, &ct->ct_mutex);
68897c478bd9Sstevel@tonic-gate 
689078dc6db2Sllai1 	if (ct->ct_powercnt_reset || !ct->ct_powercnt_config) {
68914c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "not configured\n"));
68927c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
68937c478bd9Sstevel@tonic-gate 		return;
68947c478bd9Sstevel@tonic-gate 	}
68957c478bd9Sstevel@tonic-gate 
68967c478bd9Sstevel@tonic-gate 	/* client has not been updated */
68977c478bd9Sstevel@tonic-gate 	if (MDI_CLIENT_IS_FAILED(ct)) {
68984c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "client failed\n"));
68997c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
69007c478bd9Sstevel@tonic-gate 		return;
69017c478bd9Sstevel@tonic-gate 	}
69027c478bd9Sstevel@tonic-gate 
69037c478bd9Sstevel@tonic-gate 	/* another thread might have powered it down or detached it */
69047c478bd9Sstevel@tonic-gate 	if ((MDI_CLIENT_IS_POWERED_DOWN(ct) &&
69057c478bd9Sstevel@tonic-gate 	    !DEVI_IS_ATTACHING(ct->ct_dip)) ||
6906737d277aScth 	    (!i_ddi_devi_attached(ct->ct_dip) &&
69077c478bd9Sstevel@tonic-gate 	    !DEVI_IS_ATTACHING(ct->ct_dip))) {
69084c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "i_mdi_pm_reset_client\n"));
69097c478bd9Sstevel@tonic-gate 		i_mdi_pm_reset_client(ct);
69107c478bd9Sstevel@tonic-gate 	} else {
69117c478bd9Sstevel@tonic-gate 		mdi_pathinfo_t  *pip, *next;
69127c478bd9Sstevel@tonic-gate 		int	valid_path_count = 0;
69137c478bd9Sstevel@tonic-gate 
69144c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "i_mdi_pm_rele_client\n"));
69157c478bd9Sstevel@tonic-gate 		pip = ct->ct_path_head;
69167c478bd9Sstevel@tonic-gate 		while (pip != NULL) {
69177c478bd9Sstevel@tonic-gate 			MDI_PI_LOCK(pip);
69187c478bd9Sstevel@tonic-gate 			next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link;
691978dc6db2Sllai1 			if (MDI_PI_IS_ONLINE(pip) || MDI_PI_IS_STANDBY(pip))
69207c478bd9Sstevel@tonic-gate 				valid_path_count ++;
69217c478bd9Sstevel@tonic-gate 			MDI_PI_UNLOCK(pip);
69227c478bd9Sstevel@tonic-gate 			pip = next;
69237c478bd9Sstevel@tonic-gate 		}
69247c478bd9Sstevel@tonic-gate 		i_mdi_pm_rele_client(ct, valid_path_count);
69257c478bd9Sstevel@tonic-gate 	}
692678dc6db2Sllai1 	ct->ct_powercnt_config = 0;
69277c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
69287c478bd9Sstevel@tonic-gate }
69297c478bd9Sstevel@tonic-gate 
69307c478bd9Sstevel@tonic-gate static void
69315e3986cbScth i_mdi_pm_post_config(dev_info_t *vdip, dev_info_t *child)
69327c478bd9Sstevel@tonic-gate {
69337c478bd9Sstevel@tonic-gate 	int		circ;
69347c478bd9Sstevel@tonic-gate 	dev_info_t	*cdip;
69355e3986cbScth 
69365e3986cbScth 	ASSERT(MDI_VHCI(vdip));
69377c478bd9Sstevel@tonic-gate 
69387c478bd9Sstevel@tonic-gate 	/* ndi_devi_config_one */
69397c478bd9Sstevel@tonic-gate 	if (child) {
69405e3986cbScth 		ASSERT(DEVI_BUSY_OWNED(vdip));
69417c478bd9Sstevel@tonic-gate 		i_mdi_pm_post_config_one(child);
69427c478bd9Sstevel@tonic-gate 		return;
69437c478bd9Sstevel@tonic-gate 	}
69447c478bd9Sstevel@tonic-gate 
69457c478bd9Sstevel@tonic-gate 	/* devi_config_common */
69465e3986cbScth 	ndi_devi_enter(vdip, &circ);
69475e3986cbScth 	cdip = ddi_get_child(vdip);
69487c478bd9Sstevel@tonic-gate 	while (cdip) {
69497c478bd9Sstevel@tonic-gate 		dev_info_t *next = ddi_get_next_sibling(cdip);
69507c478bd9Sstevel@tonic-gate 
69517c478bd9Sstevel@tonic-gate 		i_mdi_pm_post_config_one(cdip);
69527c478bd9Sstevel@tonic-gate 		cdip = next;
69537c478bd9Sstevel@tonic-gate 	}
69545e3986cbScth 	ndi_devi_exit(vdip, circ);
69557c478bd9Sstevel@tonic-gate }
69567c478bd9Sstevel@tonic-gate 
69577c478bd9Sstevel@tonic-gate static void
69587c478bd9Sstevel@tonic-gate i_mdi_pm_post_unconfig_one(dev_info_t *child)
69597c478bd9Sstevel@tonic-gate {
69607c478bd9Sstevel@tonic-gate 	mdi_client_t	*ct;
69617c478bd9Sstevel@tonic-gate 
69627c478bd9Sstevel@tonic-gate 	ct = i_devi_get_client(child);
69637c478bd9Sstevel@tonic-gate 	if (ct == NULL)
69647c478bd9Sstevel@tonic-gate 		return;
69657c478bd9Sstevel@tonic-gate 
69667c478bd9Sstevel@tonic-gate 	MDI_CLIENT_LOCK(ct);
69677c478bd9Sstevel@tonic-gate 	while (MDI_CLIENT_IS_POWER_TRANSITION(ct))
69687c478bd9Sstevel@tonic-gate 		cv_wait(&ct->ct_powerchange_cv, &ct->ct_mutex);
69697c478bd9Sstevel@tonic-gate 
697078dc6db2Sllai1 	if (!ct->ct_powercnt_unconfig || ct->ct_powercnt_reset) {
69714c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "not held\n"));
69727c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
69737c478bd9Sstevel@tonic-gate 		return;
69747c478bd9Sstevel@tonic-gate 	}
69757c478bd9Sstevel@tonic-gate 
69767c478bd9Sstevel@tonic-gate 	/* failure detaching or another thread just attached it */
69777c478bd9Sstevel@tonic-gate 	if ((MDI_CLIENT_IS_POWERED_DOWN(ct) &&
6978737d277aScth 	    i_ddi_devi_attached(ct->ct_dip)) ||
6979737d277aScth 	    (!i_ddi_devi_attached(ct->ct_dip) &&
69807c478bd9Sstevel@tonic-gate 	    !DEVI_IS_ATTACHING(ct->ct_dip))) {
69814c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "i_mdi_pm_reset_client\n"));
69827c478bd9Sstevel@tonic-gate 		i_mdi_pm_reset_client(ct);
698378dc6db2Sllai1 	} else {
698478dc6db2Sllai1 		mdi_pathinfo_t  *pip, *next;
698578dc6db2Sllai1 		int	valid_path_count = 0;
69867c478bd9Sstevel@tonic-gate 
69874c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, child, "i_mdi_pm_rele_client\n"));
698878dc6db2Sllai1 		pip = ct->ct_path_head;
698978dc6db2Sllai1 		while (pip != NULL) {
699078dc6db2Sllai1 			MDI_PI_LOCK(pip);
699178dc6db2Sllai1 			next = (mdi_pathinfo_t *)MDI_PI(pip)->pi_client_link;
699278dc6db2Sllai1 			if (MDI_PI_IS_ONLINE(pip) || MDI_PI_IS_STANDBY(pip))
699378dc6db2Sllai1 				valid_path_count ++;
699478dc6db2Sllai1 			MDI_PI_UNLOCK(pip);
699578dc6db2Sllai1 			pip = next;
699678dc6db2Sllai1 		}
699778dc6db2Sllai1 		i_mdi_pm_rele_client(ct, valid_path_count);
699878dc6db2Sllai1 		ct->ct_powercnt_unconfig = 0;
699978dc6db2Sllai1 	}
700078dc6db2Sllai1 
70017c478bd9Sstevel@tonic-gate 	MDI_CLIENT_UNLOCK(ct);
70027c478bd9Sstevel@tonic-gate }
70037c478bd9Sstevel@tonic-gate 
70047c478bd9Sstevel@tonic-gate static void
70055e3986cbScth i_mdi_pm_post_unconfig(dev_info_t *vdip, dev_info_t *child, int held)
70067c478bd9Sstevel@tonic-gate {
70077c478bd9Sstevel@tonic-gate 	int			circ;
70087c478bd9Sstevel@tonic-gate 	dev_info_t		*cdip;
70097c478bd9Sstevel@tonic-gate 
70105e3986cbScth 	ASSERT(MDI_VHCI(vdip));
70117c478bd9Sstevel@tonic-gate 
70127c478bd9Sstevel@tonic-gate 	if (!held) {
70134c06356bSdh142964 		MDI_DEBUG(4, (MDI_NOTE, vdip, "held = %d", held));
70147c478bd9Sstevel@tonic-gate 		return;
70157c478bd9Sstevel@tonic-gate 	}
70167c478bd9Sstevel@tonic-gate 
70177c478bd9Sstevel@tonic-gate 	if (child) {
70185e3986cbScth 		ASSERT(DEVI_BUSY_OWNED(vdip));
70197c478bd9Sstevel@tonic-gate 		i_mdi_pm_post_unconfig_one(child);
70207c478bd9Sstevel@tonic-gate 		return;
70217c478bd9Sstevel@tonic-gate 	}
70227c478bd9Sstevel@tonic-gate 
70235e3986cbScth 	ndi_devi_enter(vdip, &circ);
70245e3986cbScth 	cdip = ddi_get_child(vdip);
70257c478bd9Sstevel@tonic-gate 	while (cdip) {
70267c478bd9Sstevel@tonic-gate 		dev_info_t *next = ddi_get_next_sibling(cdip);
70277c478bd9Sstevel@tonic-gate 
70287c478bd9Sstevel@tonic-gate 		i_mdi_pm_post_unconfig_one(cdip);
70297c478bd9Sstevel@tonic-gate 		cdip = next;
70307c478bd9Sstevel@tonic-gate 	}
70315e3986cbScth 	ndi_devi_exit(vdip, circ);
70327c478bd9Sstevel@tonic-gate }
70337c478bd9Sstevel@tonic-gate 
70347c478bd9Sstevel@tonic-gate int
70357c478bd9Sstevel@tonic-gate mdi_power(dev_info_t *vdip, mdi_pm_op_t op, void *args, char *devnm, int flags)
70367c478bd9Sstevel@tonic-gate {
70377c478bd9Sstevel@tonic-gate 	int			circ, ret = MDI_SUCCESS;
70387c478bd9Sstevel@tonic-gate 	dev_info_t		*client_dip = NULL;
70397c478bd9Sstevel@tonic-gate 	mdi_client_t		*ct;
70407c478bd9Sstevel@tonic-gate 
70417c478bd9Sstevel@tonic-gate 	/*
70427c478bd9Sstevel@tonic-gate 	 * Handling ndi_devi_config_one and ndi_devi_unconfig_one.
70437c478bd9Sstevel@tonic-gate 	 * Power up pHCI for the named client device.
70447c478bd9Sstevel@tonic-gate 	 * Note: Before the client is enumerated under vhci by phci,
70457c478bd9Sstevel@tonic-gate 	 * client_dip can be NULL. Then proceed to power up all the
70467c478bd9Sstevel@tonic-gate 	 * pHCIs.
70477c478bd9Sstevel@tonic-gate 	 */
70487c478bd9Sstevel@tonic-gate 	if (devnm != NULL) {
70497c478bd9Sstevel@tonic-gate 		ndi_devi_enter(vdip, &circ);
70507c478bd9Sstevel@tonic-gate 		client_dip = ndi_devi_findchild(vdip, devnm);
70517c478bd9Sstevel@tonic-gate 	}
70527c478bd9Sstevel@tonic-gate 
70534c06356bSdh142964 	MDI_DEBUG(4, (MDI_NOTE, vdip,
70544c06356bSdh142964 	    "op = %d %s %p", op, devnm ? devnm : "", (void *)client_dip));
70557c478bd9Sstevel@tonic-gate 
70567c478bd9Sstevel@tonic-gate 	switch (op) {
70577c478bd9Sstevel@tonic-gate 	case MDI_PM_PRE_CONFIG:
70587c478bd9Sstevel@tonic-gate 		ret = i_mdi_pm_pre_config(vdip, client_dip);
7059c73a93f2Sdm120769 		break;
70605e3986cbScth 
70617c478bd9Sstevel@tonic-gate 	case MDI_PM_PRE_UNCONFIG:
70627c478bd9Sstevel@tonic-gate 		ret = i_mdi_pm_pre_unconfig(vdip, client_dip, (int *)args,
70637c478bd9Sstevel@tonic-gate 		    flags);
7064c73a93f2Sdm120769 		break;
70655e3986cbScth 
70667c478bd9Sstevel@tonic-gate 	case MDI_PM_POST_CONFIG:
70677c478bd9Sstevel@tonic-gate 		i_mdi_pm_post_config(vdip, client_dip);
7068c73a93f2Sdm120769 		break;
70695e3986cbScth 
70707c478bd9Sstevel@tonic-gate 	case MDI_PM_POST_UNCONFIG:
70717c478bd9Sstevel@tonic-gate 		i_mdi_pm_post_unconfig(vdip, client_dip, *(int *)args);
7072c73a93f2Sdm120769 		break;
70735e3986cbScth 
70747c478bd9Sstevel@tonic-gate 	case MDI_PM_HOLD_POWER:
70757c478bd9Sstevel@tonic-gate 	case MDI_PM_RELE_POWER:
70767c478bd9Sstevel@tonic-gate 		ASSERT(args);
70777c478bd9Sstevel@tonic-gate 
70787c478bd9Sstevel@tonic-gate 		client_dip = (dev_info_t *)args;
70797c478bd9Sstevel@tonic-gate 		ASSERT(MDI_CLIENT(client_dip));
70807c478bd9Sstevel@tonic-gate 
70817c478bd9Sstevel@tonic-gate 		ct = i_devi_get_client(client_dip);
70827c478bd9Sstevel@tonic-gate 		MDI_CLIENT_LOCK(ct);
70837c478bd9Sstevel@tonic-gate 
70847c478bd9Sstevel@tonic-gate 		if (op == MDI_PM_HOLD_POWER) {
70857c478bd9Sstevel@tonic-gate 			if (ct->ct_power_cnt == 0) {
70867c478bd9Sstevel@tonic-gate 				(void) i_mdi_power_all_phci(ct);
70874c06356bSdh142964 				MDI_DEBUG(4, (MDI_NOTE, client_dip,
70884c06356bSdh142964 				    "i_mdi_pm_hold_client\n"));
70897c478bd9Sstevel@tonic-gate 				i_mdi_pm_hold_client(ct, ct->ct_path_count);
70907c478bd9Sstevel@tonic-gate 			}
70917c478bd9Sstevel@tonic-gate 		} else {
70927c478bd9Sstevel@tonic-gate 			if (DEVI_IS_ATTACHING(ct->ct_dip)) {
70934c06356bSdh142964 				MDI_DEBUG(4, (MDI_NOTE, client_dip,
70944c06356bSdh142964 				    "i_mdi_pm_rele_client\n"));
70957c478bd9Sstevel@tonic-gate 				i_mdi_pm_rele_client(ct, ct->ct_path_count);
70967c478bd9Sstevel@tonic-gate 			} else {
70974c06356bSdh142964 				MDI_DEBUG(4, (MDI_NOTE, client_dip,
70984c06356bSdh142964 				    "i_mdi_pm_reset_client\n"));
70997c478bd9Sstevel@tonic-gate 				i_mdi_pm_reset_client(ct);
71007c478bd9Sstevel@tonic-gate 			}
71017c478bd9Sstevel@tonic-gate 		}
71027c478bd9Sstevel@tonic-gate 
71037c478bd9Sstevel@tonic-gate 		MDI_CLIENT_UNLOCK(ct);
71047c478bd9Sstevel@tonic-gate 		break;
71055e3986cbScth 
71067c478bd9Sstevel@tonic-gate 	default:
71077c478bd9Sstevel@tonic-gate 		break;
71087c478bd9Sstevel@tonic-gate 	}
71097c478bd9Sstevel@tonic-gate 
71105e3986cbScth 	if (devnm)
71115e3986cbScth 		ndi_devi_exit(vdip, circ);
71125e3986cbScth 
71137c478bd9Sstevel@tonic-gate 	return (ret);
71147c478bd9Sstevel@tonic-gate }
71157c478bd9Sstevel@tonic-gate 
71167c478bd9Sstevel@tonic-gate int
71177c478bd9Sstevel@tonic-gate mdi_component_is_vhci(dev_info_t *dip, const char **mdi_class)
71187c478bd9Sstevel@tonic-gate {
71197c478bd9Sstevel@tonic-gate 	mdi_vhci_t *vhci;
71207c478bd9Sstevel@tonic-gate 
71217c478bd9Sstevel@tonic-gate 	if (!MDI_VHCI(dip))
71227c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
71237c478bd9Sstevel@tonic-gate 
71247c478bd9Sstevel@tonic-gate 	if (mdi_class) {
71257c478bd9Sstevel@tonic-gate 		vhci = DEVI(dip)->devi_mdi_xhci;
71267c478bd9Sstevel@tonic-gate 		ASSERT(vhci);
71277c478bd9Sstevel@tonic-gate 		*mdi_class = vhci->vh_class;
71287c478bd9Sstevel@tonic-gate 	}
71297c478bd9Sstevel@tonic-gate 
71307c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
71317c478bd9Sstevel@tonic-gate }
71327c478bd9Sstevel@tonic-gate 
71337c478bd9Sstevel@tonic-gate int
71347c478bd9Sstevel@tonic-gate mdi_component_is_phci(dev_info_t *dip, const char **mdi_class)
71357c478bd9Sstevel@tonic-gate {
71367c478bd9Sstevel@tonic-gate 	mdi_phci_t *phci;
71377c478bd9Sstevel@tonic-gate 
71387c478bd9Sstevel@tonic-gate 	if (!MDI_PHCI(dip))
71397c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
71407c478bd9Sstevel@tonic-gate 
71417c478bd9Sstevel@tonic-gate 	if (mdi_class) {
71427c478bd9Sstevel@tonic-gate 		phci = DEVI(dip)->devi_mdi_xhci;
71437c478bd9Sstevel@tonic-gate 		ASSERT(phci);
71447c478bd9Sstevel@tonic-gate 		*mdi_class = phci->ph_vhci->vh_class;
71457c478bd9Sstevel@tonic-gate 	}
71467c478bd9Sstevel@tonic-gate 
71477c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
71487c478bd9Sstevel@tonic-gate }
71497c478bd9Sstevel@tonic-gate 
71507c478bd9Sstevel@tonic-gate int
71517c478bd9Sstevel@tonic-gate mdi_component_is_client(dev_info_t *dip, const char **mdi_class)
71527c478bd9Sstevel@tonic-gate {
71537c478bd9Sstevel@tonic-gate 	mdi_client_t *client;
71547c478bd9Sstevel@tonic-gate 
71557c478bd9Sstevel@tonic-gate 	if (!MDI_CLIENT(dip))
71567c478bd9Sstevel@tonic-gate 		return (MDI_FAILURE);
71577c478bd9Sstevel@tonic-gate 
71587c478bd9Sstevel@tonic-gate 	if (mdi_class) {
71597c478bd9Sstevel@tonic-gate 		client = DEVI(dip)->devi_mdi_client;
71607c478bd9Sstevel@tonic-gate 		ASSERT(client);
71617c478bd9Sstevel@tonic-gate 		*mdi_class = client->ct_vhci->vh_class;
71627c478bd9Sstevel@tonic-gate 	}
71637c478bd9Sstevel@tonic-gate 
71647c478bd9Sstevel@tonic-gate 	return (MDI_SUCCESS);
71657c478bd9Sstevel@tonic-gate }
71667c478bd9Sstevel@tonic-gate 
71677c478bd9Sstevel@tonic-gate void *
71687c478bd9Sstevel@tonic-gate mdi_client_get_vhci_private(dev_info_t *dip)
71697c478bd9Sstevel@tonic-gate {
71707c478bd9Sstevel@tonic-gate 	ASSERT(mdi_component_is_client(dip, NULL) == MDI_SUCCESS);
71717c478bd9Sstevel@tonic-gate 	if (mdi_component_is_client(dip, NULL) == MDI_SUCCESS) {
71727c478bd9Sstevel@tonic-gate 		mdi_client_t	*ct;
71737c478bd9Sstevel@tonic-gate 		ct = i_devi_get_client(dip);
71747c478bd9Sstevel@tonic-gate 		return (ct->ct_vprivate);
71757c478bd9Sstevel@tonic-gate 	}
71767c478bd9Sstevel@tonic-gate 	return (NULL);
71777c478bd9Sstevel@tonic-gate }
71787c478bd9Sstevel@tonic-gate 
71797c478bd9Sstevel@tonic-gate void
71807c478bd9Sstevel@tonic-gate mdi_client_set_vhci_private(dev_info_t *dip, void *data)
71817c478bd9Sstevel@tonic-gate {
71827c478bd9Sstevel@tonic-gate 	ASSERT(mdi_component_is_client(dip, NULL) == MDI_SUCCESS);
71837c478bd9Sstevel@tonic-gate 	if (mdi_component_is_client(dip, NULL) == MDI_SUCCESS) {
71847c478bd9Sstevel@tonic-gate 		mdi_client_t	*ct;
71857c478bd9Sstevel@tonic-gate 		ct = i_devi_get_client(dip);
71867c478bd9Sstevel@tonic-gate 		ct->ct_vprivate = data;
71877c478bd9Sstevel@tonic-gate 	}
71887c478bd9Sstevel@tonic-gate }
71897c478bd9Sstevel@tonic-gate /*
71907c478bd9Sstevel@tonic-gate  * mdi_pi_get_vhci_private():
71917c478bd9Sstevel@tonic-gate  *		Get the vhci private information associated with the
71927c478bd9Sstevel@tonic-gate  *		mdi_pathinfo node
71937c478bd9Sstevel@tonic-gate  */
71947c478bd9Sstevel@tonic-gate void *
71957c478bd9Sstevel@tonic-gate mdi_pi_get_vhci_private(mdi_pathinfo_t *pip)
71967c478bd9Sstevel@tonic-gate {
71977c478bd9Sstevel@tonic-gate 	caddr_t	vprivate = NULL;
71987c478bd9Sstevel@tonic-gate 	if (pip) {
71997c478bd9Sstevel@tonic-gate 		vprivate = MDI_PI(pip)->pi_vprivate;
72007c478bd9Sstevel@tonic-gate 	}
72017c478bd9Sstevel@tonic-gate 	return (vprivate);
72027c478bd9Sstevel@tonic-gate }
72037c478bd9Sstevel@tonic-gate 
72047c478bd9Sstevel@tonic-gate /*
72057c478bd9Sstevel@tonic-gate  * mdi_pi_set_vhci_private():
72067c478bd9Sstevel@tonic-gate  *		Set the vhci private information in the mdi_pathinfo node
72077c478bd9Sstevel@tonic-gate  */
72087c478bd9Sstevel@tonic-gate void
72097c478bd9Sstevel@tonic-gate mdi_pi_set_vhci_private(mdi_pathinfo_t *pip, void *priv)
72107c478bd9Sstevel@tonic-gate {
72117c478bd9Sstevel@tonic-gate 	if (pip) {
72127c478bd9Sstevel@tonic-gate 		MDI_PI(pip)->pi_vprivate = priv;
72137c478bd9Sstevel@tonic-gate 	}
72147c478bd9Sstevel@tonic-gate }
72157c478bd9Sstevel@tonic-gate 
72167c478bd9Sstevel@tonic-gate /*
72177c478bd9Sstevel@tonic-gate  * mdi_phci_get_vhci_private():
72187c478bd9Sstevel@tonic-gate  *		Get the vhci private information associated with the
72197c478bd9Sstevel@tonic-gate  *		mdi_phci node
72207c478bd9Sstevel@tonic-gate  */
72217c478bd9Sstevel@tonic-gate void *
72227c478bd9Sstevel@tonic-gate mdi_phci_get_vhci_private(dev_info_t *dip)
72237c478bd9Sstevel@tonic-gate {
72247c478bd9Sstevel@tonic-gate 	ASSERT(mdi_component_is_phci(dip, NULL) == MDI_SUCCESS);
72257c478bd9Sstevel@tonic-gate 	if (mdi_component_is_phci(dip, NULL) == MDI_SUCCESS) {
72267c478bd9Sstevel@tonic-gate 		mdi_phci_t	*ph;
72277c478bd9Sstevel@tonic-gate 		ph = i_devi_get_phci(dip);
72287c478bd9Sstevel@tonic-gate 		return (ph->ph_vprivate);
72297c478bd9Sstevel@tonic-gate 	}
72307c478bd9Sstevel@tonic-gate 	return (NULL);
72317c478bd9Sstevel@tonic-gate }
72327c478bd9Sstevel@tonic-gate 
72337c478bd9Sstevel@tonic-gate /*
72347c478bd9Sstevel@tonic-gate  * mdi_phci_set_vhci_private():
72357c478bd9Sstevel@tonic-gate  *		Set the vhci private information in the mdi_phci node
72367c478bd9Sstevel@tonic-gate  */
72377c478bd9Sstevel@tonic-gate void
72387c478bd9Sstevel@tonic-gate mdi_phci_set_vhci_private(dev_info_t *dip, void *priv)
72397c478bd9Sstevel@tonic-gate {
72407c478bd9Sstevel@tonic-gate 	ASSERT(mdi_component_is_phci(dip, NULL) == MDI_SUCCESS);
72417c478bd9Sstevel@tonic-gate 	if (mdi_component_is_phci(dip, NULL) == MDI_SUCCESS) {
72427c478bd9Sstevel@tonic-gate 		mdi_phci_t	*ph;
72437c478bd9Sstevel@tonic-gate 		ph = i_devi_get_phci(dip);
72447c478bd9Sstevel@tonic-gate 		ph->ph_vprivate = priv;
72457c478bd9Sstevel@tonic-gate 	}
72467c478bd9Sstevel@tonic-gate }
72473c34adc5Sramat 
72484c06356bSdh142964 int
72494c06356bSdh142964 mdi_pi_ishidden(mdi_pathinfo_t *pip)
72504c06356bSdh142964 {
72514c06356bSdh142964 	return (MDI_PI_FLAGS_IS_HIDDEN(pip));
72524c06356bSdh142964 }
72534c06356bSdh142964 
72544c06356bSdh142964 int
72554c06356bSdh142964 mdi_pi_device_isremoved(mdi_pathinfo_t *pip)
72564c06356bSdh142964 {
72574c06356bSdh142964 	return (MDI_PI_FLAGS_IS_DEVICE_REMOVED(pip));
72584c06356bSdh142964 }
72594c06356bSdh142964 
72604c06356bSdh142964 /*
72614c06356bSdh142964  * When processing hotplug, if mdi_pi_offline-mdi_pi_free fails then this
72624c06356bSdh142964  * interface is used to represent device removal.
72634c06356bSdh142964  */
72644c06356bSdh142964 int
72654c06356bSdh142964 mdi_pi_device_remove(mdi_pathinfo_t *pip)
72664c06356bSdh142964 {
72674c06356bSdh142964 	MDI_PI_LOCK(pip);
72684c06356bSdh142964 	if (mdi_pi_device_isremoved(pip)) {
72694c06356bSdh142964 		MDI_PI_UNLOCK(pip);
72704c06356bSdh142964 		return (0);
72714c06356bSdh142964 	}
72724c06356bSdh142964 	MDI_PI_FLAGS_SET_DEVICE_REMOVED(pip);
72734c06356bSdh142964 	MDI_PI_FLAGS_SET_HIDDEN(pip);
72744c06356bSdh142964 	MDI_PI_UNLOCK(pip);
72754c06356bSdh142964 
72764c06356bSdh142964 	i_ddi_di_cache_invalidate();
72774c06356bSdh142964 
72784c06356bSdh142964 	return (1);
72794c06356bSdh142964 }
72804c06356bSdh142964 
72814c06356bSdh142964 /*
72824c06356bSdh142964  * When processing hotplug, if a path marked mdi_pi_device_isremoved()
72834c06356bSdh142964  * is now accessible then this interfaces is used to represent device insertion.
72844c06356bSdh142964  */
72854c06356bSdh142964 int
72864c06356bSdh142964 mdi_pi_device_insert(mdi_pathinfo_t *pip)
72874c06356bSdh142964 {
72884c06356bSdh142964 	MDI_PI_LOCK(pip);
72894c06356bSdh142964 	if (!mdi_pi_device_isremoved(pip)) {
72904c06356bSdh142964 		MDI_PI_UNLOCK(pip);
72914c06356bSdh142964 		return (0);
72924c06356bSdh142964 	}
72934c06356bSdh142964 	MDI_PI_FLAGS_CLR_DEVICE_REMOVED(pip);
72944c06356bSdh142964 	MDI_PI_FLAGS_CLR_HIDDEN(pip);
72954c06356bSdh142964 	MDI_PI_UNLOCK(pip);
72964c06356bSdh142964 
72974c06356bSdh142964 	i_ddi_di_cache_invalidate();
72984c06356bSdh142964 
72994c06356bSdh142964 	return (1);
73004c06356bSdh142964 }
73014c06356bSdh142964 
73023c34adc5Sramat /*
73033c34adc5Sramat  * List of vhci class names:
73043c34adc5Sramat  * A vhci class name must be in this list only if the corresponding vhci
73053c34adc5Sramat  * driver intends to use the mdi provided bus config implementation
73063c34adc5Sramat  * (i.e., mdi_vhci_bus_config()).
73073c34adc5Sramat  */
73083c34adc5Sramat static char *vhci_class_list[] = { MDI_HCI_CLASS_SCSI, MDI_HCI_CLASS_IB };
73093c34adc5Sramat #define	N_VHCI_CLASSES	(sizeof (vhci_class_list) / sizeof (char *))
73103c34adc5Sramat 
73113c34adc5Sramat /*
73123c34adc5Sramat  * During boot time, the on-disk vhci cache for every vhci class is read
73133c34adc5Sramat  * in the form of an nvlist and stored here.
73143c34adc5Sramat  */
73153c34adc5Sramat static nvlist_t *vhcache_nvl[N_VHCI_CLASSES];
73163c34adc5Sramat 
73173c34adc5Sramat /* nvpair names in vhci cache nvlist */
73183c34adc5Sramat #define	MDI_VHCI_CACHE_VERSION	1
73193c34adc5Sramat #define	MDI_NVPNAME_VERSION	"version"
73203c34adc5Sramat #define	MDI_NVPNAME_PHCIS	"phcis"
73213c34adc5Sramat #define	MDI_NVPNAME_CTADDRMAP	"clientaddrmap"
73223c34adc5Sramat 
73233c34adc5Sramat /*
73243c34adc5Sramat  * Given vhci class name, return its on-disk vhci cache filename.
73253c34adc5Sramat  * Memory for the returned filename which includes the full path is allocated
73263c34adc5Sramat  * by this function.
73273c34adc5Sramat  */
73283c34adc5Sramat static char *
73293c34adc5Sramat vhclass2vhcache_filename(char *vhclass)
73303c34adc5Sramat {
73313c34adc5Sramat 	char *filename;
73323c34adc5Sramat 	int len;
73333c34adc5Sramat 	static char *fmt = "/etc/devices/mdi_%s_cache";
73343c34adc5Sramat 
73353c34adc5Sramat 	/*
73363c34adc5Sramat 	 * fmt contains the on-disk vhci cache file name format;
73373c34adc5Sramat 	 * for scsi_vhci the filename is "/etc/devices/mdi_scsi_vhci_cache".
73383c34adc5Sramat 	 */
73393c34adc5Sramat 
73403c34adc5Sramat 	/* the -1 below is to account for "%s" in the format string */
73413c34adc5Sramat 	len = strlen(fmt) + strlen(vhclass) - 1;
73423c34adc5Sramat 	filename = kmem_alloc(len, KM_SLEEP);
73433c34adc5Sramat 	(void) snprintf(filename, len, fmt, vhclass);
73443c34adc5Sramat 	ASSERT(len == (strlen(filename) + 1));
73453c34adc5Sramat 	return (filename);
73463c34adc5Sramat }
73473c34adc5Sramat 
73483c34adc5Sramat /*
73493c34adc5Sramat  * initialize the vhci cache related data structures and read the on-disk
73503c34adc5Sramat  * vhci cached data into memory.
73513c34adc5Sramat  */
73523c34adc5Sramat static void
73533c34adc5Sramat setup_vhci_cache(mdi_vhci_t *vh)
73543c34adc5Sramat {
73553c34adc5Sramat 	mdi_vhci_config_t *vhc;
73563c34adc5Sramat 	mdi_vhci_cache_t *vhcache;
73573c34adc5Sramat 	int i;
73583c34adc5Sramat 	nvlist_t *nvl = NULL;
73593c34adc5Sramat 
73603c34adc5Sramat 	vhc = kmem_zalloc(sizeof (mdi_vhci_config_t), KM_SLEEP);
73613c34adc5Sramat 	vh->vh_config = vhc;
73623c34adc5Sramat 	vhcache = &vhc->vhc_vhcache;
73633c34adc5Sramat 
73643c34adc5Sramat 	vhc->vhc_vhcache_filename = vhclass2vhcache_filename(vh->vh_class);
73653c34adc5Sramat 
73663c34adc5Sramat 	mutex_init(&vhc->vhc_lock, NULL, MUTEX_DEFAULT, NULL);
73673c34adc5Sramat 	cv_init(&vhc->vhc_cv, NULL, CV_DRIVER, NULL);
73683c34adc5Sramat 
73693c34adc5Sramat 	rw_init(&vhcache->vhcache_lock, NULL, RW_DRIVER, NULL);
73703c34adc5Sramat 
73713c34adc5Sramat 	/*
73723c34adc5Sramat 	 * Create string hash; same as mod_hash_create_strhash() except that
73733c34adc5Sramat 	 * we use NULL key destructor.
73743c34adc5Sramat 	 */
73753c34adc5Sramat 	vhcache->vhcache_client_hash = mod_hash_create_extended(vh->vh_class,
73763c34adc5Sramat 	    mdi_bus_config_cache_hash_size,
73773c34adc5Sramat 	    mod_hash_null_keydtor, mod_hash_null_valdtor,
73783c34adc5Sramat 	    mod_hash_bystr, NULL, mod_hash_strkey_cmp, KM_SLEEP);
73793c34adc5Sramat 
73803c34adc5Sramat 	/*
73813c34adc5Sramat 	 * The on-disk vhci cache is read during booting prior to the
73823c34adc5Sramat 	 * lights-out period by mdi_read_devices_files().
73833c34adc5Sramat 	 */
73843c34adc5Sramat 	for (i = 0; i < N_VHCI_CLASSES; i++) {
73853c34adc5Sramat 		if (strcmp(vhci_class_list[i], vh->vh_class) == 0) {
73863c34adc5Sramat 			nvl = vhcache_nvl[i];
73873c34adc5Sramat 			vhcache_nvl[i] = NULL;
73883c34adc5Sramat 			break;
73893c34adc5Sramat 		}
73903c34adc5Sramat 	}
73913c34adc5Sramat 
73923c34adc5Sramat 	/*
73933c34adc5Sramat 	 * this is to cover the case of some one manually causing unloading
73943c34adc5Sramat 	 * (or detaching) and reloading (or attaching) of a vhci driver.
73953c34adc5Sramat 	 */
73963c34adc5Sramat 	if (nvl == NULL && modrootloaded)
73973c34adc5Sramat 		nvl = read_on_disk_vhci_cache(vh->vh_class);
73983c34adc5Sramat 
73993c34adc5Sramat 	if (nvl != NULL) {
74003c34adc5Sramat 		rw_enter(&vhcache->vhcache_lock, RW_WRITER);
74013c34adc5Sramat 		if (mainnvl_to_vhcache(vhcache, nvl) == MDI_SUCCESS)
74023c34adc5Sramat 			vhcache->vhcache_flags |= MDI_VHCI_CACHE_SETUP_DONE;
74033c34adc5Sramat 		else  {
74043c34adc5Sramat 			cmn_err(CE_WARN,
74054c06356bSdh142964 			    "%s: data file corrupted, will recreate",
74063c34adc5Sramat 			    vhc->vhc_vhcache_filename);
74073c34adc5Sramat 		}
74083c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
74093c34adc5Sramat 		nvlist_free(nvl);
74103c34adc5Sramat 	}
74113c34adc5Sramat 
74123c34adc5Sramat 	vhc->vhc_cbid = callb_add(stop_vhcache_flush_thread, vhc,
74133c34adc5Sramat 	    CB_CL_UADMIN_PRE_VFS, "mdi_vhcache_flush");
741467e56d35Sramat 
741567e56d35Sramat 	vhc->vhc_path_discovery_boot = mdi_path_discovery_boot;
741667e56d35Sramat 	vhc->vhc_path_discovery_postboot = mdi_path_discovery_postboot;
74173c34adc5Sramat }
74183c34adc5Sramat 
74193c34adc5Sramat /*
74203c34adc5Sramat  * free all vhci cache related resources
74213c34adc5Sramat  */
74223c34adc5Sramat static int
74233c34adc5Sramat destroy_vhci_cache(mdi_vhci_t *vh)
74243c34adc5Sramat {
74253c34adc5Sramat 	mdi_vhci_config_t *vhc = vh->vh_config;
74263c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
74273c34adc5Sramat 	mdi_vhcache_phci_t *cphci, *cphci_next;
74283c34adc5Sramat 	mdi_vhcache_client_t *cct, *cct_next;
74293c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi, *cpi_next;
74303c34adc5Sramat 
74313c34adc5Sramat 	if (stop_vhcache_async_threads(vhc) != MDI_SUCCESS)
74323c34adc5Sramat 		return (MDI_FAILURE);
74333c34adc5Sramat 
74343c34adc5Sramat 	kmem_free(vhc->vhc_vhcache_filename,
74353c34adc5Sramat 	    strlen(vhc->vhc_vhcache_filename) + 1);
74363c34adc5Sramat 
74373c34adc5Sramat 	mod_hash_destroy_strhash(vhcache->vhcache_client_hash);
74383c34adc5Sramat 
74393c34adc5Sramat 	for (cphci = vhcache->vhcache_phci_head; cphci != NULL;
74403c34adc5Sramat 	    cphci = cphci_next) {
74413c34adc5Sramat 		cphci_next = cphci->cphci_next;
74423c34adc5Sramat 		free_vhcache_phci(cphci);
74433c34adc5Sramat 	}
74443c34adc5Sramat 
74453c34adc5Sramat 	for (cct = vhcache->vhcache_client_head; cct != NULL; cct = cct_next) {
74463c34adc5Sramat 		cct_next = cct->cct_next;
74473c34adc5Sramat 		for (cpi = cct->cct_cpi_head; cpi != NULL; cpi = cpi_next) {
74483c34adc5Sramat 			cpi_next = cpi->cpi_next;
74493c34adc5Sramat 			free_vhcache_pathinfo(cpi);
74503c34adc5Sramat 		}
74513c34adc5Sramat 		free_vhcache_client(cct);
74523c34adc5Sramat 	}
74533c34adc5Sramat 
74543c34adc5Sramat 	rw_destroy(&vhcache->vhcache_lock);
74553c34adc5Sramat 
74563c34adc5Sramat 	mutex_destroy(&vhc->vhc_lock);
74573c34adc5Sramat 	cv_destroy(&vhc->vhc_cv);
74583c34adc5Sramat 	kmem_free(vhc, sizeof (mdi_vhci_config_t));
74593c34adc5Sramat 	return (MDI_SUCCESS);
74603c34adc5Sramat }
74613c34adc5Sramat 
74623c34adc5Sramat /*
74633c34adc5Sramat  * Stop all vhci cache related async threads and free their resources.
74643c34adc5Sramat  */
74653c34adc5Sramat static int
74663c34adc5Sramat stop_vhcache_async_threads(mdi_vhci_config_t *vhc)
74673c34adc5Sramat {
74683c34adc5Sramat 	mdi_async_client_config_t *acc, *acc_next;
74693c34adc5Sramat 
74703c34adc5Sramat 	mutex_enter(&vhc->vhc_lock);
74713c34adc5Sramat 	vhc->vhc_flags |= MDI_VHC_EXIT;
74723c34adc5Sramat 	ASSERT(vhc->vhc_acc_thrcount >= 0);
74733c34adc5Sramat 	cv_broadcast(&vhc->vhc_cv);
74743c34adc5Sramat 
74753c34adc5Sramat 	while ((vhc->vhc_flags & MDI_VHC_VHCACHE_FLUSH_THREAD) ||
74763c34adc5Sramat 	    vhc->vhc_acc_thrcount != 0) {
74773c34adc5Sramat 		mutex_exit(&vhc->vhc_lock);
747896c4a178SChris Horne 		delay_random(mdi_delay);
74793c34adc5Sramat 		mutex_enter(&vhc->vhc_lock);
74803c34adc5Sramat 	}
74813c34adc5Sramat 
74823c34adc5Sramat 	vhc->vhc_flags &= ~MDI_VHC_EXIT;
74833c34adc5Sramat 
74843c34adc5Sramat 	for (acc = vhc->vhc_acc_list_head; acc != NULL; acc = acc_next) {
74853c34adc5Sramat 		acc_next = acc->acc_next;
74863c34adc5Sramat 		free_async_client_config(acc);
74873c34adc5Sramat 	}
74883c34adc5Sramat 	vhc->vhc_acc_list_head = NULL;
74893c34adc5Sramat 	vhc->vhc_acc_list_tail = NULL;
74903c34adc5Sramat 	vhc->vhc_acc_count = 0;
74913c34adc5Sramat 
74923c34adc5Sramat 	if (vhc->vhc_flags & MDI_VHC_VHCACHE_DIRTY) {
74933c34adc5Sramat 		vhc->vhc_flags &= ~MDI_VHC_VHCACHE_DIRTY;
74943c34adc5Sramat 		mutex_exit(&vhc->vhc_lock);
74953c34adc5Sramat 		if (flush_vhcache(vhc, 0) != MDI_SUCCESS) {
74963c34adc5Sramat 			vhcache_dirty(vhc);
74973c34adc5Sramat 			return (MDI_FAILURE);
74983c34adc5Sramat 		}
74993c34adc5Sramat 	} else
75003c34adc5Sramat 		mutex_exit(&vhc->vhc_lock);
75013c34adc5Sramat 
75023c34adc5Sramat 	if (callb_delete(vhc->vhc_cbid) != 0)
75033c34adc5Sramat 		return (MDI_FAILURE);
75043c34adc5Sramat 
75053c34adc5Sramat 	return (MDI_SUCCESS);
75063c34adc5Sramat }
75073c34adc5Sramat 
75083c34adc5Sramat /*
75093c34adc5Sramat  * Stop vhci cache flush thread
75103c34adc5Sramat  */
75113c34adc5Sramat /* ARGSUSED */
75123c34adc5Sramat static boolean_t
75133c34adc5Sramat stop_vhcache_flush_thread(void *arg, int code)
75143c34adc5Sramat {
75153c34adc5Sramat 	mdi_vhci_config_t *vhc = (mdi_vhci_config_t *)arg;
75163c34adc5Sramat 
75173c34adc5Sramat 	mutex_enter(&vhc->vhc_lock);
75183c34adc5Sramat 	vhc->vhc_flags |= MDI_VHC_EXIT;
75193c34adc5Sramat 	cv_broadcast(&vhc->vhc_cv);
75203c34adc5Sramat 
75213c34adc5Sramat 	while (vhc->vhc_flags & MDI_VHC_VHCACHE_FLUSH_THREAD) {
75223c34adc5Sramat 		mutex_exit(&vhc->vhc_lock);
752396c4a178SChris Horne 		delay_random(mdi_delay);
75243c34adc5Sramat 		mutex_enter(&vhc->vhc_lock);
75253c34adc5Sramat 	}
75263c34adc5Sramat 
75273c34adc5Sramat 	if (vhc->vhc_flags & MDI_VHC_VHCACHE_DIRTY) {
75283c34adc5Sramat 		vhc->vhc_flags &= ~MDI_VHC_VHCACHE_DIRTY;
75293c34adc5Sramat 		mutex_exit(&vhc->vhc_lock);
75303c34adc5Sramat 		(void) flush_vhcache(vhc, 1);
75313c34adc5Sramat 	} else
75323c34adc5Sramat 		mutex_exit(&vhc->vhc_lock);
75333c34adc5Sramat 
75343c34adc5Sramat 	return (B_TRUE);
75353c34adc5Sramat }
75363c34adc5Sramat 
75373c34adc5Sramat /*
75383c34adc5Sramat  * Enqueue the vhcache phci (cphci) at the tail of the list
75393c34adc5Sramat  */
75403c34adc5Sramat static void
75413c34adc5Sramat enqueue_vhcache_phci(mdi_vhci_cache_t *vhcache, mdi_vhcache_phci_t *cphci)
75423c34adc5Sramat {
75433c34adc5Sramat 	cphci->cphci_next = NULL;
75443c34adc5Sramat 	if (vhcache->vhcache_phci_head == NULL)
75453c34adc5Sramat 		vhcache->vhcache_phci_head = cphci;
75463c34adc5Sramat 	else
75473c34adc5Sramat 		vhcache->vhcache_phci_tail->cphci_next = cphci;
75483c34adc5Sramat 	vhcache->vhcache_phci_tail = cphci;
75493c34adc5Sramat }
75503c34adc5Sramat 
75513c34adc5Sramat /*
75523c34adc5Sramat  * Enqueue the vhcache pathinfo (cpi) at the tail of the list
75533c34adc5Sramat  */
75543c34adc5Sramat static void
75553c34adc5Sramat enqueue_tail_vhcache_pathinfo(mdi_vhcache_client_t *cct,
75563c34adc5Sramat     mdi_vhcache_pathinfo_t *cpi)
75573c34adc5Sramat {
75583c34adc5Sramat 	cpi->cpi_next = NULL;
75593c34adc5Sramat 	if (cct->cct_cpi_head == NULL)
75603c34adc5Sramat 		cct->cct_cpi_head = cpi;
75613c34adc5Sramat 	else
75623c34adc5Sramat 		cct->cct_cpi_tail->cpi_next = cpi;
75633c34adc5Sramat 	cct->cct_cpi_tail = cpi;
75643c34adc5Sramat }
75653c34adc5Sramat 
75663c34adc5Sramat /*
75673c34adc5Sramat  * Enqueue the vhcache pathinfo (cpi) at the correct location in the
75683c34adc5Sramat  * ordered list. All cpis which do not have MDI_CPI_HINT_PATH_DOES_NOT_EXIST
75693c34adc5Sramat  * flag set come at the beginning of the list. All cpis which have this
75703c34adc5Sramat  * flag set come at the end of the list.
75713c34adc5Sramat  */
75723c34adc5Sramat static void
75733c34adc5Sramat enqueue_vhcache_pathinfo(mdi_vhcache_client_t *cct,
75743c34adc5Sramat     mdi_vhcache_pathinfo_t *newcpi)
75753c34adc5Sramat {
75763c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi, *prev_cpi;
75773c34adc5Sramat 
75783c34adc5Sramat 	if (cct->cct_cpi_head == NULL ||
75793c34adc5Sramat 	    (newcpi->cpi_flags & MDI_CPI_HINT_PATH_DOES_NOT_EXIST))
75803c34adc5Sramat 		enqueue_tail_vhcache_pathinfo(cct, newcpi);
75813c34adc5Sramat 	else {
75823c34adc5Sramat 		for (cpi = cct->cct_cpi_head, prev_cpi = NULL; cpi != NULL &&
75833c34adc5Sramat 		    !(cpi->cpi_flags & MDI_CPI_HINT_PATH_DOES_NOT_EXIST);
75843c34adc5Sramat 		    prev_cpi = cpi, cpi = cpi->cpi_next)
75853c34adc5Sramat 			;
75863c34adc5Sramat 
75873c34adc5Sramat 		if (prev_cpi == NULL)
75883c34adc5Sramat 			cct->cct_cpi_head = newcpi;
75893c34adc5Sramat 		else
75903c34adc5Sramat 			prev_cpi->cpi_next = newcpi;
75913c34adc5Sramat 
75923c34adc5Sramat 		newcpi->cpi_next = cpi;
75933c34adc5Sramat 
75943c34adc5Sramat 		if (cpi == NULL)
75953c34adc5Sramat 			cct->cct_cpi_tail = newcpi;
75963c34adc5Sramat 	}
75973c34adc5Sramat }
75983c34adc5Sramat 
75993c34adc5Sramat /*
76003c34adc5Sramat  * Enqueue the vhcache client (cct) at the tail of the list
76013c34adc5Sramat  */
76023c34adc5Sramat static void
76033c34adc5Sramat enqueue_vhcache_client(mdi_vhci_cache_t *vhcache,
76043c34adc5Sramat     mdi_vhcache_client_t *cct)
76053c34adc5Sramat {
76063c34adc5Sramat 	cct->cct_next = NULL;
76073c34adc5Sramat 	if (vhcache->vhcache_client_head == NULL)
76083c34adc5Sramat 		vhcache->vhcache_client_head = cct;
76093c34adc5Sramat 	else
76103c34adc5Sramat 		vhcache->vhcache_client_tail->cct_next = cct;
76113c34adc5Sramat 	vhcache->vhcache_client_tail = cct;
76123c34adc5Sramat }
76133c34adc5Sramat 
76143c34adc5Sramat static void
76153c34adc5Sramat free_string_array(char **str, int nelem)
76163c34adc5Sramat {
76173c34adc5Sramat 	int i;
76183c34adc5Sramat 
76193c34adc5Sramat 	if (str) {
76203c34adc5Sramat 		for (i = 0; i < nelem; i++) {
76213c34adc5Sramat 			if (str[i])
76223c34adc5Sramat 				kmem_free(str[i], strlen(str[i]) + 1);
76233c34adc5Sramat 		}
76243c34adc5Sramat 		kmem_free(str, sizeof (char *) * nelem);
76253c34adc5Sramat 	}
76263c34adc5Sramat }
76273c34adc5Sramat 
76283c34adc5Sramat static void
76293c34adc5Sramat free_vhcache_phci(mdi_vhcache_phci_t *cphci)
76303c34adc5Sramat {
76313c34adc5Sramat 	kmem_free(cphci->cphci_path, strlen(cphci->cphci_path) + 1);
76323c34adc5Sramat 	kmem_free(cphci, sizeof (*cphci));
76333c34adc5Sramat }
76343c34adc5Sramat 
76353c34adc5Sramat static void
76363c34adc5Sramat free_vhcache_pathinfo(mdi_vhcache_pathinfo_t *cpi)
76373c34adc5Sramat {
76383c34adc5Sramat 	kmem_free(cpi->cpi_addr, strlen(cpi->cpi_addr) + 1);
76393c34adc5Sramat 	kmem_free(cpi, sizeof (*cpi));
76403c34adc5Sramat }
76413c34adc5Sramat 
76423c34adc5Sramat static void
76433c34adc5Sramat free_vhcache_client(mdi_vhcache_client_t *cct)
76443c34adc5Sramat {
76453c34adc5Sramat 	kmem_free(cct->cct_name_addr, strlen(cct->cct_name_addr) + 1);
76463c34adc5Sramat 	kmem_free(cct, sizeof (*cct));
76473c34adc5Sramat }
76483c34adc5Sramat 
76493c34adc5Sramat static char *
76503c34adc5Sramat vhcache_mknameaddr(char *ct_name, char *ct_addr, int *ret_len)
76513c34adc5Sramat {
76523c34adc5Sramat 	char *name_addr;
76533c34adc5Sramat 	int len;
76543c34adc5Sramat 
76553c34adc5Sramat 	len = strlen(ct_name) + strlen(ct_addr) + 2;
76563c34adc5Sramat 	name_addr = kmem_alloc(len, KM_SLEEP);
76573c34adc5Sramat 	(void) snprintf(name_addr, len, "%s@%s", ct_name, ct_addr);
76583c34adc5Sramat 
76593c34adc5Sramat 	if (ret_len)
76603c34adc5Sramat 		*ret_len = len;
76613c34adc5Sramat 	return (name_addr);
76623c34adc5Sramat }
76633c34adc5Sramat 
76643c34adc5Sramat /*
76653c34adc5Sramat  * Copy the contents of paddrnvl to vhci cache.
76663c34adc5Sramat  * paddrnvl nvlist contains path information for a vhci client.
76673c34adc5Sramat  * See the comment in mainnvl_to_vhcache() for the format of this nvlist.
76683c34adc5Sramat  */
76693c34adc5Sramat static void
76703c34adc5Sramat paddrnvl_to_vhcache(nvlist_t *nvl, mdi_vhcache_phci_t *cphci_list[],
76713c34adc5Sramat     mdi_vhcache_client_t *cct)
76723c34adc5Sramat {
76733c34adc5Sramat 	nvpair_t *nvp = NULL;
76743c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi;
76753c34adc5Sramat 	uint_t nelem;
76763c34adc5Sramat 	uint32_t *val;
76773c34adc5Sramat 
76783c34adc5Sramat 	while ((nvp = nvlist_next_nvpair(nvl, nvp)) != NULL) {
76793c34adc5Sramat 		ASSERT(nvpair_type(nvp) == DATA_TYPE_UINT32_ARRAY);
76803c34adc5Sramat 		cpi = kmem_zalloc(sizeof (*cpi), KM_SLEEP);
76813c34adc5Sramat 		cpi->cpi_addr = i_ddi_strdup(nvpair_name(nvp), KM_SLEEP);
76823c34adc5Sramat 		(void) nvpair_value_uint32_array(nvp, &val, &nelem);
76833c34adc5Sramat 		ASSERT(nelem == 2);
76843c34adc5Sramat 		cpi->cpi_cphci = cphci_list[val[0]];
76853c34adc5Sramat 		cpi->cpi_flags = val[1];
76863c34adc5Sramat 		enqueue_tail_vhcache_pathinfo(cct, cpi);
76873c34adc5Sramat 	}
76883c34adc5Sramat }
76893c34adc5Sramat 
76903c34adc5Sramat /*
76913c34adc5Sramat  * Copy the contents of caddrmapnvl to vhci cache.
76923c34adc5Sramat  * caddrmapnvl nvlist contains vhci client address to phci client address
76933c34adc5Sramat  * mappings. See the comment in mainnvl_to_vhcache() for the format of
76943c34adc5Sramat  * this nvlist.
76953c34adc5Sramat  */
76963c34adc5Sramat static void
76973c34adc5Sramat caddrmapnvl_to_vhcache(mdi_vhci_cache_t *vhcache, nvlist_t *nvl,
76983c34adc5Sramat     mdi_vhcache_phci_t *cphci_list[])
76993c34adc5Sramat {
77003c34adc5Sramat 	nvpair_t *nvp = NULL;
77013c34adc5Sramat 	nvlist_t *paddrnvl;
77023c34adc5Sramat 	mdi_vhcache_client_t *cct;
77033c34adc5Sramat 
77043c34adc5Sramat 	while ((nvp = nvlist_next_nvpair(nvl, nvp)) != NULL) {
77053c34adc5Sramat 		ASSERT(nvpair_type(nvp) == DATA_TYPE_NVLIST);
77063c34adc5Sramat 		cct = kmem_zalloc(sizeof (*cct), KM_SLEEP);
77073c34adc5Sramat 		cct->cct_name_addr = i_ddi_strdup(nvpair_name(nvp), KM_SLEEP);
77083c34adc5Sramat 		(void) nvpair_value_nvlist(nvp, &paddrnvl);
77093c34adc5Sramat 		paddrnvl_to_vhcache(paddrnvl, cphci_list, cct);
77103c34adc5Sramat 		/* the client must contain at least one path */
77113c34adc5Sramat 		ASSERT(cct->cct_cpi_head != NULL);
77123c34adc5Sramat 
77133c34adc5Sramat 		enqueue_vhcache_client(vhcache, cct);
77143c34adc5Sramat 		(void) mod_hash_insert(vhcache->vhcache_client_hash,
77153c34adc5Sramat 		    (mod_hash_key_t)cct->cct_name_addr, (mod_hash_val_t)cct);
77163c34adc5Sramat 	}
77173c34adc5Sramat }
77183c34adc5Sramat 
77193c34adc5Sramat /*
77203c34adc5Sramat  * Copy the contents of the main nvlist to vhci cache.
77213c34adc5Sramat  *
77223c34adc5Sramat  * VHCI busconfig cached data is stored in the form of a nvlist on the disk.
77233c34adc5Sramat  * The nvlist contains the mappings between the vhci client addresses and
77243c34adc5Sramat  * their corresponding phci client addresses.
77253c34adc5Sramat  *
77263c34adc5Sramat  * The structure of the nvlist is as follows:
77273c34adc5Sramat  *
77283c34adc5Sramat  * Main nvlist:
77293c34adc5Sramat  *	NAME		TYPE		DATA
77303c34adc5Sramat  *	version		int32		version number
77313c34adc5Sramat  *	phcis		string array	array of phci paths
77323c34adc5Sramat  *	clientaddrmap	nvlist_t	c2paddrs_nvl (see below)
77333c34adc5Sramat  *
77343c34adc5Sramat  * structure of c2paddrs_nvl:
77353c34adc5Sramat  *	NAME		TYPE		DATA
77363c34adc5Sramat  *	caddr1		nvlist_t	paddrs_nvl1
77373c34adc5Sramat  *	caddr2		nvlist_t	paddrs_nvl2
77383c34adc5Sramat  *	...
77393c34adc5Sramat  * where caddr1, caddr2, ... are vhci client name and addresses in the
77403c34adc5Sramat  * form of "<clientname>@<clientaddress>".
77413c34adc5Sramat  * (for example: "ssd@2000002037cd9f72");
77423c34adc5Sramat  * paddrs_nvl1, paddrs_nvl2, .. are nvlists that contain path information.
77433c34adc5Sramat  *
77443c34adc5Sramat  * structure of paddrs_nvl:
77453c34adc5Sramat  *	NAME		TYPE		DATA
77463c34adc5Sramat  *	pi_addr1	uint32_array	(phci-id, cpi_flags)
77473c34adc5Sramat  *	pi_addr2	uint32_array	(phci-id, cpi_flags)
77483c34adc5Sramat  *	...
77493c34adc5Sramat  * where pi_addr1, pi_addr2, ... are bus specific addresses of pathinfo nodes
77503c34adc5Sramat  * (so called pi_addrs, for example: "w2100002037cd9f72,0");
77514c06356bSdh142964  * phci-ids are integers that identify pHCIs to which the
77523c34adc5Sramat  * the bus specific address belongs to. These integers are used as an index
77534c06356bSdh142964  * into to the phcis string array in the main nvlist to get the pHCI path.
77543c34adc5Sramat  */
77553c34adc5Sramat static int
77563c34adc5Sramat mainnvl_to_vhcache(mdi_vhci_cache_t *vhcache, nvlist_t *nvl)
77573c34adc5Sramat {
77583c34adc5Sramat 	char **phcis, **phci_namep;
77593c34adc5Sramat 	uint_t nphcis;
77603c34adc5Sramat 	mdi_vhcache_phci_t *cphci, **cphci_list;
77613c34adc5Sramat 	nvlist_t *caddrmapnvl;
77623c34adc5Sramat 	int32_t ver;
77633c34adc5Sramat 	int i;
77643c34adc5Sramat 	size_t cphci_list_size;
77653c34adc5Sramat 
77663c34adc5Sramat 	ASSERT(RW_WRITE_HELD(&vhcache->vhcache_lock));
77673c34adc5Sramat 
77683c34adc5Sramat 	if (nvlist_lookup_int32(nvl, MDI_NVPNAME_VERSION, &ver) != 0 ||
77693c34adc5Sramat 	    ver != MDI_VHCI_CACHE_VERSION)
77703c34adc5Sramat 		return (MDI_FAILURE);
77713c34adc5Sramat 
77723c34adc5Sramat 	if (nvlist_lookup_string_array(nvl, MDI_NVPNAME_PHCIS, &phcis,
77733c34adc5Sramat 	    &nphcis) != 0)
77743c34adc5Sramat 		return (MDI_SUCCESS);
77753c34adc5Sramat 
77763c34adc5Sramat 	ASSERT(nphcis > 0);
77773c34adc5Sramat 
77783c34adc5Sramat 	cphci_list_size = sizeof (mdi_vhcache_phci_t *) * nphcis;
77793c34adc5Sramat 	cphci_list = kmem_alloc(cphci_list_size, KM_SLEEP);
77803c34adc5Sramat 	for (i = 0, phci_namep = phcis; i < nphcis; i++, phci_namep++) {
77813c34adc5Sramat 		cphci = kmem_zalloc(sizeof (mdi_vhcache_phci_t), KM_SLEEP);
77823c34adc5Sramat 		cphci->cphci_path = i_ddi_strdup(*phci_namep, KM_SLEEP);
77833c34adc5Sramat 		enqueue_vhcache_phci(vhcache, cphci);
77843c34adc5Sramat 		cphci_list[i] = cphci;
77853c34adc5Sramat 	}
77863c34adc5Sramat 
77873c34adc5Sramat 	ASSERT(vhcache->vhcache_phci_head != NULL);
77883c34adc5Sramat 
77893c34adc5Sramat 	if (nvlist_lookup_nvlist(nvl, MDI_NVPNAME_CTADDRMAP, &caddrmapnvl) == 0)
77903c34adc5Sramat 		caddrmapnvl_to_vhcache(vhcache, caddrmapnvl, cphci_list);
77913c34adc5Sramat 
77923c34adc5Sramat 	kmem_free(cphci_list, cphci_list_size);
77933c34adc5Sramat 	return (MDI_SUCCESS);
77943c34adc5Sramat }
77953c34adc5Sramat 
77963c34adc5Sramat /*
77973c34adc5Sramat  * Build paddrnvl for the specified client using the information in the
77983c34adc5Sramat  * vhci cache and add it to the caddrmapnnvl.
77993c34adc5Sramat  * Returns 0 on success, errno on failure.
78003c34adc5Sramat  */
78013c34adc5Sramat static int
78023c34adc5Sramat vhcache_to_paddrnvl(mdi_vhci_cache_t *vhcache, mdi_vhcache_client_t *cct,
78033c34adc5Sramat     nvlist_t *caddrmapnvl)
78043c34adc5Sramat {
78053c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi;
78063c34adc5Sramat 	nvlist_t *nvl;
78073c34adc5Sramat 	int err;
78083c34adc5Sramat 	uint32_t val[2];
78093c34adc5Sramat 
78103c34adc5Sramat 	ASSERT(RW_LOCK_HELD(&vhcache->vhcache_lock));
78113c34adc5Sramat 
78123c34adc5Sramat 	if ((err = nvlist_alloc(&nvl, 0, KM_SLEEP)) != 0)
78133c34adc5Sramat 		return (err);
78143c34adc5Sramat 
78153c34adc5Sramat 	for (cpi = cct->cct_cpi_head; cpi != NULL; cpi = cpi->cpi_next) {
78163c34adc5Sramat 		val[0] = cpi->cpi_cphci->cphci_id;
78173c34adc5Sramat 		val[1] = cpi->cpi_flags;
78183c34adc5Sramat 		if ((err = nvlist_add_uint32_array(nvl, cpi->cpi_addr, val, 2))
78193c34adc5Sramat 		    != 0)
78203c34adc5Sramat 			goto out;
78213c34adc5Sramat 	}
78223c34adc5Sramat 
78233c34adc5Sramat 	err = nvlist_add_nvlist(caddrmapnvl, cct->cct_name_addr, nvl);
78243c34adc5Sramat out:
78253c34adc5Sramat 	nvlist_free(nvl);
78263c34adc5Sramat 	return (err);
78273c34adc5Sramat }
78283c34adc5Sramat 
78293c34adc5Sramat /*
78303c34adc5Sramat  * Build caddrmapnvl using the information in the vhci cache
78313c34adc5Sramat  * and add it to the mainnvl.
78323c34adc5Sramat  * Returns 0 on success, errno on failure.
78333c34adc5Sramat  */
78343c34adc5Sramat static int
78353c34adc5Sramat vhcache_to_caddrmapnvl(mdi_vhci_cache_t *vhcache, nvlist_t *mainnvl)
78363c34adc5Sramat {
78373c34adc5Sramat 	mdi_vhcache_client_t *cct;
78383c34adc5Sramat 	nvlist_t *nvl;
78393c34adc5Sramat 	int err;
78403c34adc5Sramat 
78413c34adc5Sramat 	ASSERT(RW_LOCK_HELD(&vhcache->vhcache_lock));
78423c34adc5Sramat 
78433c34adc5Sramat 	if ((err = nvlist_alloc(&nvl, NV_UNIQUE_NAME, KM_SLEEP)) != 0)
78443c34adc5Sramat 		return (err);
78453c34adc5Sramat 
78463c34adc5Sramat 	for (cct = vhcache->vhcache_client_head; cct != NULL;
78473c34adc5Sramat 	    cct = cct->cct_next) {
78483c34adc5Sramat 		if ((err = vhcache_to_paddrnvl(vhcache, cct, nvl)) != 0)
78493c34adc5Sramat 			goto out;
78503c34adc5Sramat 	}
78513c34adc5Sramat 
78523c34adc5Sramat 	err = nvlist_add_nvlist(mainnvl, MDI_NVPNAME_CTADDRMAP, nvl);
78533c34adc5Sramat out:
78543c34adc5Sramat 	nvlist_free(nvl);
78553c34adc5Sramat 	return (err);
78563c34adc5Sramat }
78573c34adc5Sramat 
78583c34adc5Sramat /*
78593c34adc5Sramat  * Build nvlist using the information in the vhci cache.
78603c34adc5Sramat  * See the comment in mainnvl_to_vhcache() for the format of the nvlist.
78613c34adc5Sramat  * Returns nvl on success, NULL on failure.
78623c34adc5Sramat  */
78633c34adc5Sramat static nvlist_t *
78643c34adc5Sramat vhcache_to_mainnvl(mdi_vhci_cache_t *vhcache)
78653c34adc5Sramat {
78663c34adc5Sramat 	mdi_vhcache_phci_t *cphci;
78673c34adc5Sramat 	uint_t phci_count;
78683c34adc5Sramat 	char **phcis;
78693c34adc5Sramat 	nvlist_t *nvl;
78703c34adc5Sramat 	int err, i;
78713c34adc5Sramat 
78723c34adc5Sramat 	if ((err = nvlist_alloc(&nvl, NV_UNIQUE_NAME, KM_SLEEP)) != 0) {
78733c34adc5Sramat 		nvl = NULL;
78743c34adc5Sramat 		goto out;
78753c34adc5Sramat 	}
78763c34adc5Sramat 
78773c34adc5Sramat 	if ((err = nvlist_add_int32(nvl, MDI_NVPNAME_VERSION,
78783c34adc5Sramat 	    MDI_VHCI_CACHE_VERSION)) != 0)
78793c34adc5Sramat 		goto out;
78803c34adc5Sramat 
78813c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_READER);
78823c34adc5Sramat 	if (vhcache->vhcache_phci_head == NULL) {
78833c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
78843c34adc5Sramat 		return (nvl);
78853c34adc5Sramat 	}
78863c34adc5Sramat 
78873c34adc5Sramat 	phci_count = 0;
78883c34adc5Sramat 	for (cphci = vhcache->vhcache_phci_head; cphci != NULL;
78893c34adc5Sramat 	    cphci = cphci->cphci_next)
78903c34adc5Sramat 		cphci->cphci_id = phci_count++;
78913c34adc5Sramat 
78923c34adc5Sramat 	/* build phci pathname list */
78933c34adc5Sramat 	phcis = kmem_alloc(sizeof (char *) * phci_count, KM_SLEEP);
78943c34adc5Sramat 	for (cphci = vhcache->vhcache_phci_head, i = 0; cphci != NULL;
78953c34adc5Sramat 	    cphci = cphci->cphci_next, i++)
78963c34adc5Sramat 		phcis[i] = i_ddi_strdup(cphci->cphci_path, KM_SLEEP);
78973c34adc5Sramat 
78983c34adc5Sramat 	err = nvlist_add_string_array(nvl, MDI_NVPNAME_PHCIS, phcis,
78993c34adc5Sramat 	    phci_count);
79003c34adc5Sramat 	free_string_array(phcis, phci_count);
79013c34adc5Sramat 
79023c34adc5Sramat 	if (err == 0 &&
79033c34adc5Sramat 	    (err = vhcache_to_caddrmapnvl(vhcache, nvl)) == 0) {
79043c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
79053c34adc5Sramat 		return (nvl);
79063c34adc5Sramat 	}
79073c34adc5Sramat 
79083c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
79093c34adc5Sramat out:
79103c34adc5Sramat 	if (nvl)
79113c34adc5Sramat 		nvlist_free(nvl);
79123c34adc5Sramat 	return (NULL);
79133c34adc5Sramat }
79143c34adc5Sramat 
79153c34adc5Sramat /*
79163c34adc5Sramat  * Lookup vhcache phci structure for the specified phci path.
79173c34adc5Sramat  */
79183c34adc5Sramat static mdi_vhcache_phci_t *
79193c34adc5Sramat lookup_vhcache_phci_by_name(mdi_vhci_cache_t *vhcache, char *phci_path)
79203c34adc5Sramat {
79213c34adc5Sramat 	mdi_vhcache_phci_t *cphci;
79223c34adc5Sramat 
79233c34adc5Sramat 	ASSERT(RW_LOCK_HELD(&vhcache->vhcache_lock));
79243c34adc5Sramat 
79253c34adc5Sramat 	for (cphci = vhcache->vhcache_phci_head; cphci != NULL;
79263c34adc5Sramat 	    cphci = cphci->cphci_next) {
79273c34adc5Sramat 		if (strcmp(cphci->cphci_path, phci_path) == 0)
79283c34adc5Sramat 			return (cphci);
79293c34adc5Sramat 	}
79303c34adc5Sramat 
79313c34adc5Sramat 	return (NULL);
79323c34adc5Sramat }
79333c34adc5Sramat 
79343c34adc5Sramat /*
79353c34adc5Sramat  * Lookup vhcache phci structure for the specified phci.
79363c34adc5Sramat  */
79373c34adc5Sramat static mdi_vhcache_phci_t *
79383c34adc5Sramat lookup_vhcache_phci_by_addr(mdi_vhci_cache_t *vhcache, mdi_phci_t *ph)
79393c34adc5Sramat {
79403c34adc5Sramat 	mdi_vhcache_phci_t *cphci;
79413c34adc5Sramat 
79423c34adc5Sramat 	ASSERT(RW_LOCK_HELD(&vhcache->vhcache_lock));
79433c34adc5Sramat 
79443c34adc5Sramat 	for (cphci = vhcache->vhcache_phci_head; cphci != NULL;
79453c34adc5Sramat 	    cphci = cphci->cphci_next) {
79463c34adc5Sramat 		if (cphci->cphci_phci == ph)
79473c34adc5Sramat 			return (cphci);
79483c34adc5Sramat 	}
79493c34adc5Sramat 
79503c34adc5Sramat 	return (NULL);
79513c34adc5Sramat }
79523c34adc5Sramat 
79533c34adc5Sramat /*
79543c34adc5Sramat  * Add the specified phci to the vhci cache if not already present.
79553c34adc5Sramat  */
79563c34adc5Sramat static void
79573c34adc5Sramat vhcache_phci_add(mdi_vhci_config_t *vhc, mdi_phci_t *ph)
79583c34adc5Sramat {
79593c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
79603c34adc5Sramat 	mdi_vhcache_phci_t *cphci;
79613c34adc5Sramat 	char *pathname;
79623c34adc5Sramat 	int cache_updated;
79633c34adc5Sramat 
79643c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_WRITER);
79653c34adc5Sramat 
79663c34adc5Sramat 	pathname = kmem_alloc(MAXPATHLEN, KM_SLEEP);
79673c34adc5Sramat 	(void) ddi_pathname(ph->ph_dip, pathname);
79683c34adc5Sramat 	if ((cphci = lookup_vhcache_phci_by_name(vhcache, pathname))
79693c34adc5Sramat 	    != NULL) {
79703c34adc5Sramat 		cphci->cphci_phci = ph;
79713c34adc5Sramat 		cache_updated = 0;
79723c34adc5Sramat 	} else {
79733c34adc5Sramat 		cphci = kmem_zalloc(sizeof (*cphci), KM_SLEEP);
79743c34adc5Sramat 		cphci->cphci_path = i_ddi_strdup(pathname, KM_SLEEP);
79753c34adc5Sramat 		cphci->cphci_phci = ph;
79763c34adc5Sramat 		enqueue_vhcache_phci(vhcache, cphci);
79773c34adc5Sramat 		cache_updated = 1;
79783c34adc5Sramat 	}
797967e56d35Sramat 
79803c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
79813c34adc5Sramat 
798267e56d35Sramat 	/*
798367e56d35Sramat 	 * Since a new phci has been added, reset
798467e56d35Sramat 	 * vhc_path_discovery_cutoff_time to allow for discovery of paths
798567e56d35Sramat 	 * during next vhcache_discover_paths().
798667e56d35Sramat 	 */
798767e56d35Sramat 	mutex_enter(&vhc->vhc_lock);
798867e56d35Sramat 	vhc->vhc_path_discovery_cutoff_time = 0;
798967e56d35Sramat 	mutex_exit(&vhc->vhc_lock);
799067e56d35Sramat 
79913c34adc5Sramat 	kmem_free(pathname, MAXPATHLEN);
79923c34adc5Sramat 	if (cache_updated)
79933c34adc5Sramat 		vhcache_dirty(vhc);
79943c34adc5Sramat }
79953c34adc5Sramat 
79963c34adc5Sramat /*
79973c34adc5Sramat  * Remove the reference to the specified phci from the vhci cache.
79983c34adc5Sramat  */
79993c34adc5Sramat static void
80003c34adc5Sramat vhcache_phci_remove(mdi_vhci_config_t *vhc, mdi_phci_t *ph)
80013c34adc5Sramat {
80023c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
80033c34adc5Sramat 	mdi_vhcache_phci_t *cphci;
80043c34adc5Sramat 
80053c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_WRITER);
80063c34adc5Sramat 	if ((cphci = lookup_vhcache_phci_by_addr(vhcache, ph)) != NULL) {
80073c34adc5Sramat 		/* do not remove the actual mdi_vhcache_phci structure */
80083c34adc5Sramat 		cphci->cphci_phci = NULL;
80093c34adc5Sramat 	}
80103c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
80113c34adc5Sramat }
80123c34adc5Sramat 
80133c34adc5Sramat static void
80143c34adc5Sramat init_vhcache_lookup_token(mdi_vhcache_lookup_token_t *dst,
80153c34adc5Sramat     mdi_vhcache_lookup_token_t *src)
80163c34adc5Sramat {
80173c34adc5Sramat 	if (src == NULL) {
80183c34adc5Sramat 		dst->lt_cct = NULL;
80193c34adc5Sramat 		dst->lt_cct_lookup_time = 0;
80203c34adc5Sramat 	} else {
80213c34adc5Sramat 		dst->lt_cct = src->lt_cct;
80223c34adc5Sramat 		dst->lt_cct_lookup_time = src->lt_cct_lookup_time;
80233c34adc5Sramat 	}
80243c34adc5Sramat }
80253c34adc5Sramat 
80263c34adc5Sramat /*
80273c34adc5Sramat  * Look up vhcache client for the specified client.
80283c34adc5Sramat  */
80293c34adc5Sramat static mdi_vhcache_client_t *
80303c34adc5Sramat lookup_vhcache_client(mdi_vhci_cache_t *vhcache, char *ct_name, char *ct_addr,
80313c34adc5Sramat     mdi_vhcache_lookup_token_t *token)
80323c34adc5Sramat {
80333c34adc5Sramat 	mod_hash_val_t hv;
80343c34adc5Sramat 	char *name_addr;
80353c34adc5Sramat 	int len;
80363c34adc5Sramat 
80373c34adc5Sramat 	ASSERT(RW_LOCK_HELD(&vhcache->vhcache_lock));
80383c34adc5Sramat 
80393c34adc5Sramat 	/*
80403c34adc5Sramat 	 * If no vhcache clean occurred since the last lookup, we can
80413c34adc5Sramat 	 * simply return the cct from the last lookup operation.
80423c34adc5Sramat 	 * It works because ccts are never freed except during the vhcache
80433c34adc5Sramat 	 * cleanup operation.
80443c34adc5Sramat 	 */
80453c34adc5Sramat 	if (token != NULL &&
80463c34adc5Sramat 	    vhcache->vhcache_clean_time < token->lt_cct_lookup_time)
80473c34adc5Sramat 		return (token->lt_cct);
80483c34adc5Sramat 
80493c34adc5Sramat 	name_addr = vhcache_mknameaddr(ct_name, ct_addr, &len);
80503c34adc5Sramat 	if (mod_hash_find(vhcache->vhcache_client_hash,
80513c34adc5Sramat 	    (mod_hash_key_t)name_addr, &hv) == 0) {
80523c34adc5Sramat 		if (token) {
80533c34adc5Sramat 			token->lt_cct = (mdi_vhcache_client_t *)hv;
8054*d3d50737SRafael Vanoni 			token->lt_cct_lookup_time = ddi_get_lbolt64();
80553c34adc5Sramat 		}
80563c34adc5Sramat 	} else {
80573c34adc5Sramat 		if (token) {
80583c34adc5Sramat 			token->lt_cct = NULL;
80593c34adc5Sramat 			token->lt_cct_lookup_time = 0;
80603c34adc5Sramat 		}
80613c34adc5Sramat 		hv = NULL;
80623c34adc5Sramat 	}
80633c34adc5Sramat 	kmem_free(name_addr, len);
80643c34adc5Sramat 	return ((mdi_vhcache_client_t *)hv);
80653c34adc5Sramat }
80663c34adc5Sramat 
80673c34adc5Sramat /*
80683c34adc5Sramat  * Add the specified path to the vhci cache if not already present.
80693c34adc5Sramat  * Also add the vhcache client for the client corresponding to this path
80703c34adc5Sramat  * if it doesn't already exist.
80713c34adc5Sramat  */
80723c34adc5Sramat static void
80733c34adc5Sramat vhcache_pi_add(mdi_vhci_config_t *vhc, struct mdi_pathinfo *pip)
80743c34adc5Sramat {
80753c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
80763c34adc5Sramat 	mdi_vhcache_client_t *cct;
80773c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi;
80783c34adc5Sramat 	mdi_phci_t *ph = pip->pi_phci;
80793c34adc5Sramat 	mdi_client_t *ct = pip->pi_client;
80803c34adc5Sramat 	int cache_updated = 0;
80813c34adc5Sramat 
80823c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_WRITER);
80833c34adc5Sramat 
80843c34adc5Sramat 	/* if vhcache client for this pip doesn't already exist, add it */
80853c34adc5Sramat 	if ((cct = lookup_vhcache_client(vhcache, ct->ct_drvname, ct->ct_guid,
80863c34adc5Sramat 	    NULL)) == NULL) {
80873c34adc5Sramat 		cct = kmem_zalloc(sizeof (*cct), KM_SLEEP);
80883c34adc5Sramat 		cct->cct_name_addr = vhcache_mknameaddr(ct->ct_drvname,
80893c34adc5Sramat 		    ct->ct_guid, NULL);
80903c34adc5Sramat 		enqueue_vhcache_client(vhcache, cct);
80913c34adc5Sramat 		(void) mod_hash_insert(vhcache->vhcache_client_hash,
80923c34adc5Sramat 		    (mod_hash_key_t)cct->cct_name_addr, (mod_hash_val_t)cct);
80933c34adc5Sramat 		cache_updated = 1;
80943c34adc5Sramat 	}
80953c34adc5Sramat 
80963c34adc5Sramat 	for (cpi = cct->cct_cpi_head; cpi != NULL; cpi = cpi->cpi_next) {
80973c34adc5Sramat 		if (cpi->cpi_cphci->cphci_phci == ph &&
80983c34adc5Sramat 		    strcmp(cpi->cpi_addr, pip->pi_addr) == 0) {
80993c34adc5Sramat 			cpi->cpi_pip = pip;
81003c34adc5Sramat 			if (cpi->cpi_flags & MDI_CPI_HINT_PATH_DOES_NOT_EXIST) {
81013c34adc5Sramat 				cpi->cpi_flags &=
81023c34adc5Sramat 				    ~MDI_CPI_HINT_PATH_DOES_NOT_EXIST;
81033c34adc5Sramat 				sort_vhcache_paths(cct);
81043c34adc5Sramat 				cache_updated = 1;
81053c34adc5Sramat 			}
81063c34adc5Sramat 			break;
81073c34adc5Sramat 		}
81083c34adc5Sramat 	}
81093c34adc5Sramat 
81103c34adc5Sramat 	if (cpi == NULL) {
81113c34adc5Sramat 		cpi = kmem_zalloc(sizeof (*cpi), KM_SLEEP);
81123c34adc5Sramat 		cpi->cpi_addr = i_ddi_strdup(pip->pi_addr, KM_SLEEP);
81133c34adc5Sramat 		cpi->cpi_cphci = lookup_vhcache_phci_by_addr(vhcache, ph);
81143c34adc5Sramat 		ASSERT(cpi->cpi_cphci != NULL);
81153c34adc5Sramat 		cpi->cpi_pip = pip;
81163c34adc5Sramat 		enqueue_vhcache_pathinfo(cct, cpi);
81173c34adc5Sramat 		cache_updated = 1;
81183c34adc5Sramat 	}
81193c34adc5Sramat 
81203c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
81213c34adc5Sramat 
81223c34adc5Sramat 	if (cache_updated)
81233c34adc5Sramat 		vhcache_dirty(vhc);
81243c34adc5Sramat }
81253c34adc5Sramat 
81263c34adc5Sramat /*
81273c34adc5Sramat  * Remove the reference to the specified path from the vhci cache.
81283c34adc5Sramat  */
81293c34adc5Sramat static void
81303c34adc5Sramat vhcache_pi_remove(mdi_vhci_config_t *vhc, struct mdi_pathinfo *pip)
81313c34adc5Sramat {
81323c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
81333c34adc5Sramat 	mdi_client_t *ct = pip->pi_client;
81343c34adc5Sramat 	mdi_vhcache_client_t *cct;
81353c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi;
81363c34adc5Sramat 
81373c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_WRITER);
81383c34adc5Sramat 	if ((cct = lookup_vhcache_client(vhcache, ct->ct_drvname, ct->ct_guid,
81393c34adc5Sramat 	    NULL)) != NULL) {
81403c34adc5Sramat 		for (cpi = cct->cct_cpi_head; cpi != NULL;
81413c34adc5Sramat 		    cpi = cpi->cpi_next) {
81423c34adc5Sramat 			if (cpi->cpi_pip == pip) {
81433c34adc5Sramat 				cpi->cpi_pip = NULL;
81443c34adc5Sramat 				break;
81453c34adc5Sramat 			}
81463c34adc5Sramat 		}
81473c34adc5Sramat 	}
81483c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
81493c34adc5Sramat }
81503c34adc5Sramat 
81513c34adc5Sramat /*
81523c34adc5Sramat  * Flush the vhci cache to disk.
81533c34adc5Sramat  * Returns MDI_SUCCESS on success, MDI_FAILURE on failure.
81543c34adc5Sramat  */
81553c34adc5Sramat static int
81563c34adc5Sramat flush_vhcache(mdi_vhci_config_t *vhc, int force_flag)
81573c34adc5Sramat {
81583c34adc5Sramat 	nvlist_t *nvl;
81593c34adc5Sramat 	int err;
81603c34adc5Sramat 	int rv;
81613c34adc5Sramat 
81623c34adc5Sramat 	/*
81633c34adc5Sramat 	 * It is possible that the system may shutdown before
81643c34adc5Sramat 	 * i_ddi_io_initialized (during stmsboot for example). To allow for
81653c34adc5Sramat 	 * flushing the cache in this case do not check for
81663c34adc5Sramat 	 * i_ddi_io_initialized when force flag is set.
81673c34adc5Sramat 	 */
81683c34adc5Sramat 	if (force_flag == 0 && !i_ddi_io_initialized())
81693c34adc5Sramat 		return (MDI_FAILURE);
81703c34adc5Sramat 
81713c34adc5Sramat 	if ((nvl = vhcache_to_mainnvl(&vhc->vhc_vhcache)) != NULL) {
81723c34adc5Sramat 		err = fwrite_nvlist(vhc->vhc_vhcache_filename, nvl);
81733c34adc5Sramat 		nvlist_free(nvl);
81743c34adc5Sramat 	} else
81753c34adc5Sramat 		err = EFAULT;
81763c34adc5Sramat 
81773c34adc5Sramat 	rv = MDI_SUCCESS;
81783c34adc5Sramat 	mutex_enter(&vhc->vhc_lock);
81793c34adc5Sramat 	if (err != 0) {
81803c34adc5Sramat 		if (err == EROFS) {
81813c34adc5Sramat 			vhc->vhc_flags |= MDI_VHC_READONLY_FS;
81823c34adc5Sramat 			vhc->vhc_flags &= ~(MDI_VHC_VHCACHE_FLUSH_ERROR |
81833c34adc5Sramat 			    MDI_VHC_VHCACHE_DIRTY);
81843c34adc5Sramat 		} else {
81853c34adc5Sramat 			if (!(vhc->vhc_flags & MDI_VHC_VHCACHE_FLUSH_ERROR)) {
81863c34adc5Sramat 				cmn_err(CE_CONT, "%s: update failed\n",
81873c34adc5Sramat 				    vhc->vhc_vhcache_filename);
81883c34adc5Sramat 				vhc->vhc_flags |= MDI_VHC_VHCACHE_FLUSH_ERROR;
81893c34adc5Sramat 			}
81903c34adc5Sramat 			rv = MDI_FAILURE;
81913c34adc5Sramat 		}
81923c34adc5Sramat 	} else if (vhc->vhc_flags & MDI_VHC_VHCACHE_FLUSH_ERROR) {
81933c34adc5Sramat 		cmn_err(CE_CONT,
81943c34adc5Sramat 		    "%s: update now ok\n", vhc->vhc_vhcache_filename);
81953c34adc5Sramat 		vhc->vhc_flags &= ~MDI_VHC_VHCACHE_FLUSH_ERROR;
81963c34adc5Sramat 	}
81973c34adc5Sramat 	mutex_exit(&vhc->vhc_lock);
81983c34adc5Sramat 
81993c34adc5Sramat 	return (rv);
82003c34adc5Sramat }
82013c34adc5Sramat 
82023c34adc5Sramat /*
82033c34adc5Sramat  * Call flush_vhcache() to flush the vhci cache at the scheduled time.
82043c34adc5Sramat  * Exits itself if left idle for the idle timeout period.
82053c34adc5Sramat  */
82063c34adc5Sramat static void
82073c34adc5Sramat vhcache_flush_thread(void *arg)
82083c34adc5Sramat {
82093c34adc5Sramat 	mdi_vhci_config_t *vhc = (mdi_vhci_config_t *)arg;
82103c34adc5Sramat 	clock_t idle_time, quit_at_ticks;
82113c34adc5Sramat 	callb_cpr_t cprinfo;
82123c34adc5Sramat 
82133c34adc5Sramat 	/* number of seconds to sleep idle before exiting */
82143c34adc5Sramat 	idle_time = mdi_vhcache_flush_daemon_idle_time * TICKS_PER_SECOND;
82153c34adc5Sramat 
82163c34adc5Sramat 	CALLB_CPR_INIT(&cprinfo, &vhc->vhc_lock, callb_generic_cpr,
82173c34adc5Sramat 	    "mdi_vhcache_flush");
82183c34adc5Sramat 	mutex_enter(&vhc->vhc_lock);
82193c34adc5Sramat 	for (; ; ) {
82203c34adc5Sramat 		while (!(vhc->vhc_flags & MDI_VHC_EXIT) &&
82213c34adc5Sramat 		    (vhc->vhc_flags & MDI_VHC_VHCACHE_DIRTY)) {
82223c34adc5Sramat 			if (ddi_get_lbolt() < vhc->vhc_flush_at_ticks) {
82233c34adc5Sramat 				CALLB_CPR_SAFE_BEGIN(&cprinfo);
82243c34adc5Sramat 				(void) cv_timedwait(&vhc->vhc_cv,
82253c34adc5Sramat 				    &vhc->vhc_lock, vhc->vhc_flush_at_ticks);
82263c34adc5Sramat 				CALLB_CPR_SAFE_END(&cprinfo, &vhc->vhc_lock);
82273c34adc5Sramat 			} else {
82283c34adc5Sramat 				vhc->vhc_flags &= ~MDI_VHC_VHCACHE_DIRTY;
82293c34adc5Sramat 				mutex_exit(&vhc->vhc_lock);
82303c34adc5Sramat 
82313c34adc5Sramat 				if (flush_vhcache(vhc, 0) != MDI_SUCCESS)
82323c34adc5Sramat 					vhcache_dirty(vhc);
82333c34adc5Sramat 
82343c34adc5Sramat 				mutex_enter(&vhc->vhc_lock);
82353c34adc5Sramat 			}
82363c34adc5Sramat 		}
82373c34adc5Sramat 
82383c34adc5Sramat 		quit_at_ticks = ddi_get_lbolt() + idle_time;
82393c34adc5Sramat 
82403c34adc5Sramat 		while (!(vhc->vhc_flags & MDI_VHC_EXIT) &&
82413c34adc5Sramat 		    !(vhc->vhc_flags & MDI_VHC_VHCACHE_DIRTY) &&
82423c34adc5Sramat 		    ddi_get_lbolt() < quit_at_ticks) {
82433c34adc5Sramat 			CALLB_CPR_SAFE_BEGIN(&cprinfo);
82443c34adc5Sramat 			(void) cv_timedwait(&vhc->vhc_cv, &vhc->vhc_lock,
82453c34adc5Sramat 			    quit_at_ticks);
82463c34adc5Sramat 			CALLB_CPR_SAFE_END(&cprinfo, &vhc->vhc_lock);
82473c34adc5Sramat 		}
82483c34adc5Sramat 
82493c34adc5Sramat 		if ((vhc->vhc_flags & MDI_VHC_EXIT) ||
82503c34adc5Sramat 		    !(vhc->vhc_flags & MDI_VHC_VHCACHE_DIRTY))
82513c34adc5Sramat 			goto out;
82523c34adc5Sramat 	}
82533c34adc5Sramat 
82543c34adc5Sramat out:
82553c34adc5Sramat 	vhc->vhc_flags &= ~MDI_VHC_VHCACHE_FLUSH_THREAD;
82563c34adc5Sramat 	/* CALLB_CPR_EXIT releases the vhc->vhc_lock */
82573c34adc5Sramat 	CALLB_CPR_EXIT(&cprinfo);
82583c34adc5Sramat }
82593c34adc5Sramat 
82603c34adc5Sramat /*
82613c34adc5Sramat  * Make vhci cache dirty and schedule flushing by vhcache flush thread.
82623c34adc5Sramat  */
82633c34adc5Sramat static void
82643c34adc5Sramat vhcache_dirty(mdi_vhci_config_t *vhc)
82653c34adc5Sramat {
82663c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
82673c34adc5Sramat 	int create_thread;
82683c34adc5Sramat 
82693c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_READER);
82703c34adc5Sramat 	/* do not flush cache until the cache is fully built */
82713c34adc5Sramat 	if (!(vhcache->vhcache_flags & MDI_VHCI_CACHE_SETUP_DONE)) {
82723c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
82733c34adc5Sramat 		return;
82743c34adc5Sramat 	}
82753c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
82763c34adc5Sramat 
82773c34adc5Sramat 	mutex_enter(&vhc->vhc_lock);
82783c34adc5Sramat 	if (vhc->vhc_flags & MDI_VHC_READONLY_FS) {
82793c34adc5Sramat 		mutex_exit(&vhc->vhc_lock);
82803c34adc5Sramat 		return;
82813c34adc5Sramat 	}
82823c34adc5Sramat 
82833c34adc5Sramat 	vhc->vhc_flags |= MDI_VHC_VHCACHE_DIRTY;
82843c34adc5Sramat 	vhc->vhc_flush_at_ticks = ddi_get_lbolt() +
82853c34adc5Sramat 	    mdi_vhcache_flush_delay * TICKS_PER_SECOND;
82863c34adc5Sramat 	if (vhc->vhc_flags & MDI_VHC_VHCACHE_FLUSH_THREAD) {
82873c34adc5Sramat 		cv_broadcast(&vhc->vhc_cv);
82883c34adc5Sramat 		create_thread = 0;
82893c34adc5Sramat 	} else {
82903c34adc5Sramat 		vhc->vhc_flags |= MDI_VHC_VHCACHE_FLUSH_THREAD;
82913c34adc5Sramat 		create_thread = 1;
82923c34adc5Sramat 	}
82933c34adc5Sramat 	mutex_exit(&vhc->vhc_lock);
82943c34adc5Sramat 
82953c34adc5Sramat 	if (create_thread)
82963c34adc5Sramat 		(void) thread_create(NULL, 0, vhcache_flush_thread, vhc,
82973c34adc5Sramat 		    0, &p0, TS_RUN, minclsyspri);
82983c34adc5Sramat }
82993c34adc5Sramat 
83003c34adc5Sramat /*
83013c34adc5Sramat  * phci bus config structure - one for for each phci bus config operation that
83023c34adc5Sramat  * we initiate on behalf of a vhci.
83033c34adc5Sramat  */
83043c34adc5Sramat typedef struct mdi_phci_bus_config_s {
83053c34adc5Sramat 	char *phbc_phci_path;
83063c34adc5Sramat 	struct mdi_vhci_bus_config_s *phbc_vhbusconfig;	/* vhci bus config */
83073c34adc5Sramat 	struct mdi_phci_bus_config_s *phbc_next;
83083c34adc5Sramat } mdi_phci_bus_config_t;
83093c34adc5Sramat 
83103c34adc5Sramat /* vhci bus config structure - one for each vhci bus config operation */
83113c34adc5Sramat typedef struct mdi_vhci_bus_config_s {
83123c34adc5Sramat 	ddi_bus_config_op_t vhbc_op;	/* bus config op */
83133c34adc5Sramat 	major_t vhbc_op_major;		/* bus config op major */
83143c34adc5Sramat 	uint_t vhbc_op_flags;		/* bus config op flags */
83153c34adc5Sramat 	kmutex_t vhbc_lock;
83163c34adc5Sramat 	kcondvar_t vhbc_cv;
83173c34adc5Sramat 	int vhbc_thr_count;
83183c34adc5Sramat } mdi_vhci_bus_config_t;
83193c34adc5Sramat 
83203c34adc5Sramat /*
83213c34adc5Sramat  * bus config the specified phci
83223c34adc5Sramat  */
83233c34adc5Sramat static void
83243c34adc5Sramat bus_config_phci(void *arg)
83253c34adc5Sramat {
83263c34adc5Sramat 	mdi_phci_bus_config_t *phbc = (mdi_phci_bus_config_t *)arg;
83273c34adc5Sramat 	mdi_vhci_bus_config_t *vhbc = phbc->phbc_vhbusconfig;
83283c34adc5Sramat 	dev_info_t *ph_dip;
83293c34adc5Sramat 
83303c34adc5Sramat 	/*
83313c34adc5Sramat 	 * first configure all path components upto phci and then configure
83323c34adc5Sramat 	 * the phci children.
83333c34adc5Sramat 	 */
83343c34adc5Sramat 	if ((ph_dip = e_ddi_hold_devi_by_path(phbc->phbc_phci_path, 0))
83353c34adc5Sramat 	    != NULL) {
83363c34adc5Sramat 		if (vhbc->vhbc_op == BUS_CONFIG_DRIVER ||
83373c34adc5Sramat 		    vhbc->vhbc_op == BUS_UNCONFIG_DRIVER) {
83383c34adc5Sramat 			(void) ndi_devi_config_driver(ph_dip,
83393c34adc5Sramat 			    vhbc->vhbc_op_flags,
83403c34adc5Sramat 			    vhbc->vhbc_op_major);
83413c34adc5Sramat 		} else
83423c34adc5Sramat 			(void) ndi_devi_config(ph_dip,
83433c34adc5Sramat 			    vhbc->vhbc_op_flags);
83443c34adc5Sramat 
83453c34adc5Sramat 		/* release the hold that e_ddi_hold_devi_by_path() placed */
83463c34adc5Sramat 		ndi_rele_devi(ph_dip);
83473c34adc5Sramat 	}
83483c34adc5Sramat 
83493c34adc5Sramat 	kmem_free(phbc->phbc_phci_path, strlen(phbc->phbc_phci_path) + 1);
83503c34adc5Sramat 	kmem_free(phbc, sizeof (*phbc));
83513c34adc5Sramat 
83523c34adc5Sramat 	mutex_enter(&vhbc->vhbc_lock);
83533c34adc5Sramat 	vhbc->vhbc_thr_count--;
83543c34adc5Sramat 	if (vhbc->vhbc_thr_count == 0)
83553c34adc5Sramat 		cv_broadcast(&vhbc->vhbc_cv);
83563c34adc5Sramat 	mutex_exit(&vhbc->vhbc_lock);
83573c34adc5Sramat }
83583c34adc5Sramat 
83593c34adc5Sramat /*
83603c34adc5Sramat  * Bus config all phcis associated with the vhci in parallel.
83613c34adc5Sramat  * op must be BUS_CONFIG_DRIVER or BUS_CONFIG_ALL.
83623c34adc5Sramat  */
83633c34adc5Sramat static void
83643c34adc5Sramat bus_config_all_phcis(mdi_vhci_cache_t *vhcache, uint_t flags,
83653c34adc5Sramat     ddi_bus_config_op_t op, major_t maj)
83663c34adc5Sramat {
83673c34adc5Sramat 	mdi_phci_bus_config_t *phbc_head = NULL, *phbc, *phbc_next;
83683c34adc5Sramat 	mdi_vhci_bus_config_t *vhbc;
83693c34adc5Sramat 	mdi_vhcache_phci_t *cphci;
83703c34adc5Sramat 
83713c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_READER);
83723c34adc5Sramat 	if (vhcache->vhcache_phci_head == NULL) {
83733c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
83743c34adc5Sramat 		return;
83753c34adc5Sramat 	}
83763c34adc5Sramat 
83773c34adc5Sramat 	vhbc = kmem_zalloc(sizeof (*vhbc), KM_SLEEP);
83783c34adc5Sramat 
83793c34adc5Sramat 	for (cphci = vhcache->vhcache_phci_head; cphci != NULL;
83803c34adc5Sramat 	    cphci = cphci->cphci_next) {
8381273f4511Sgp87344 		/* skip phcis that haven't attached before root is available */
8382273f4511Sgp87344 		if (!modrootloaded && (cphci->cphci_phci == NULL))
8383273f4511Sgp87344 			continue;
83843c34adc5Sramat 		phbc = kmem_zalloc(sizeof (*phbc), KM_SLEEP);
83853c34adc5Sramat 		phbc->phbc_phci_path = i_ddi_strdup(cphci->cphci_path,
83863c34adc5Sramat 		    KM_SLEEP);
83873c34adc5Sramat 		phbc->phbc_vhbusconfig = vhbc;
83883c34adc5Sramat 		phbc->phbc_next = phbc_head;
83893c34adc5Sramat 		phbc_head = phbc;
83903c34adc5Sramat 		vhbc->vhbc_thr_count++;
83913c34adc5Sramat 	}
83923c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
83933c34adc5Sramat 
83943c34adc5Sramat 	vhbc->vhbc_op = op;
83953c34adc5Sramat 	vhbc->vhbc_op_major = maj;
83963c34adc5Sramat 	vhbc->vhbc_op_flags = NDI_NO_EVENT |
83973c34adc5Sramat 	    (flags & (NDI_CONFIG_REPROBE | NDI_DRV_CONF_REPROBE));
83983c34adc5Sramat 	mutex_init(&vhbc->vhbc_lock, NULL, MUTEX_DEFAULT, NULL);
83993c34adc5Sramat 	cv_init(&vhbc->vhbc_cv, NULL, CV_DRIVER, NULL);
84003c34adc5Sramat 
84013c34adc5Sramat 	/* now create threads to initiate bus config on all phcis in parallel */
84023c34adc5Sramat 	for (phbc = phbc_head; phbc != NULL; phbc = phbc_next) {
84033c34adc5Sramat 		phbc_next = phbc->phbc_next;
84043c34adc5Sramat 		if (mdi_mtc_off)
84053c34adc5Sramat 			bus_config_phci((void *)phbc);
84063c34adc5Sramat 		else
84073c34adc5Sramat 			(void) thread_create(NULL, 0, bus_config_phci, phbc,
84083c34adc5Sramat 			    0, &p0, TS_RUN, minclsyspri);
84093c34adc5Sramat 	}
84103c34adc5Sramat 
84113c34adc5Sramat 	mutex_enter(&vhbc->vhbc_lock);
84123c34adc5Sramat 	/* wait until all threads exit */
84133c34adc5Sramat 	while (vhbc->vhbc_thr_count > 0)
84143c34adc5Sramat 		cv_wait(&vhbc->vhbc_cv, &vhbc->vhbc_lock);
84153c34adc5Sramat 	mutex_exit(&vhbc->vhbc_lock);
84163c34adc5Sramat 
84173c34adc5Sramat 	mutex_destroy(&vhbc->vhbc_lock);
84183c34adc5Sramat 	cv_destroy(&vhbc->vhbc_cv);
84193c34adc5Sramat 	kmem_free(vhbc, sizeof (*vhbc));
84203c34adc5Sramat }
84213c34adc5Sramat 
84223c34adc5Sramat /*
842367e56d35Sramat  * Single threaded version of bus_config_all_phcis()
842467e56d35Sramat  */
842567e56d35Sramat static void
842667e56d35Sramat st_bus_config_all_phcis(mdi_vhci_config_t *vhc, uint_t flags,
842767e56d35Sramat     ddi_bus_config_op_t op, major_t maj)
842867e56d35Sramat {
842967e56d35Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
843067e56d35Sramat 
843167e56d35Sramat 	single_threaded_vhconfig_enter(vhc);
843267e56d35Sramat 	bus_config_all_phcis(vhcache, flags, op, maj);
843367e56d35Sramat 	single_threaded_vhconfig_exit(vhc);
843467e56d35Sramat }
843567e56d35Sramat 
843667e56d35Sramat /*
84373c34adc5Sramat  * Perform BUS_CONFIG_ONE on the specified child of the phci.
84383c34adc5Sramat  * The path includes the child component in addition to the phci path.
84393c34adc5Sramat  */
84403c34adc5Sramat static int
84413c34adc5Sramat bus_config_one_phci_child(char *path)
84423c34adc5Sramat {
84433c34adc5Sramat 	dev_info_t *ph_dip, *child;
84443c34adc5Sramat 	char *devnm;
84453c34adc5Sramat 	int rv = MDI_FAILURE;
84463c34adc5Sramat 
84473c34adc5Sramat 	/* extract the child component of the phci */
84483c34adc5Sramat 	devnm = strrchr(path, '/');
84493c34adc5Sramat 	*devnm++ = '\0';
84503c34adc5Sramat 
84513c34adc5Sramat 	/*
84523c34adc5Sramat 	 * first configure all path components upto phci and then
84533c34adc5Sramat 	 * configure the phci child.
84543c34adc5Sramat 	 */
84553c34adc5Sramat 	if ((ph_dip = e_ddi_hold_devi_by_path(path, 0)) != NULL) {
84563c34adc5Sramat 		if (ndi_devi_config_one(ph_dip, devnm, &child, NDI_NO_EVENT) ==
84573c34adc5Sramat 		    NDI_SUCCESS) {
84583c34adc5Sramat 			/*
84593c34adc5Sramat 			 * release the hold that ndi_devi_config_one() placed
84603c34adc5Sramat 			 */
84613c34adc5Sramat 			ndi_rele_devi(child);
84623c34adc5Sramat 			rv = MDI_SUCCESS;
84633c34adc5Sramat 		}
84643c34adc5Sramat 
84653c34adc5Sramat 		/* release the hold that e_ddi_hold_devi_by_path() placed */
84663c34adc5Sramat 		ndi_rele_devi(ph_dip);
84673c34adc5Sramat 	}
84683c34adc5Sramat 
84693c34adc5Sramat 	devnm--;
84703c34adc5Sramat 	*devnm = '/';
84713c34adc5Sramat 	return (rv);
84723c34adc5Sramat }
84733c34adc5Sramat 
84743c34adc5Sramat /*
84753c34adc5Sramat  * Build a list of phci client paths for the specified vhci client.
84763c34adc5Sramat  * The list includes only those phci client paths which aren't configured yet.
84773c34adc5Sramat  */
84783c34adc5Sramat static mdi_phys_path_t *
84793c34adc5Sramat build_phclient_path_list(mdi_vhcache_client_t *cct, char *ct_name)
84803c34adc5Sramat {
84813c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi;
84823c34adc5Sramat 	mdi_phys_path_t *pp_head = NULL, *pp_tail = NULL, *pp;
84833c34adc5Sramat 	int config_path, len;
84843c34adc5Sramat 
84853c34adc5Sramat 	for (cpi = cct->cct_cpi_head; cpi != NULL; cpi = cpi->cpi_next) {
84863c34adc5Sramat 		/*
84873c34adc5Sramat 		 * include only those paths that aren't configured.
84883c34adc5Sramat 		 */
84893c34adc5Sramat 		config_path = 0;
84903c34adc5Sramat 		if (cpi->cpi_pip == NULL)
84913c34adc5Sramat 			config_path = 1;
84923c34adc5Sramat 		else {
84933c34adc5Sramat 			MDI_PI_LOCK(cpi->cpi_pip);
84943c34adc5Sramat 			if (MDI_PI_IS_INIT(cpi->cpi_pip))
84953c34adc5Sramat 				config_path = 1;
84963c34adc5Sramat 			MDI_PI_UNLOCK(cpi->cpi_pip);
84973c34adc5Sramat 		}
84983c34adc5Sramat 
84993c34adc5Sramat 		if (config_path) {
85003c34adc5Sramat 			pp = kmem_alloc(sizeof (*pp), KM_SLEEP);
85013c34adc5Sramat 			len = strlen(cpi->cpi_cphci->cphci_path) +
85023c34adc5Sramat 			    strlen(ct_name) + strlen(cpi->cpi_addr) + 3;
85033c34adc5Sramat 			pp->phys_path = kmem_alloc(len, KM_SLEEP);
85043c34adc5Sramat 			(void) snprintf(pp->phys_path, len, "%s/%s@%s",
85053c34adc5Sramat 			    cpi->cpi_cphci->cphci_path, ct_name,
85063c34adc5Sramat 			    cpi->cpi_addr);
85073c34adc5Sramat 			pp->phys_path_next = NULL;
85083c34adc5Sramat 
85093c34adc5Sramat 			if (pp_head == NULL)
85103c34adc5Sramat 				pp_head = pp;
85113c34adc5Sramat 			else
85123c34adc5Sramat 				pp_tail->phys_path_next = pp;
85133c34adc5Sramat 			pp_tail = pp;
85143c34adc5Sramat 		}
85153c34adc5Sramat 	}
85163c34adc5Sramat 
85173c34adc5Sramat 	return (pp_head);
85183c34adc5Sramat }
85193c34adc5Sramat 
85203c34adc5Sramat /*
85213c34adc5Sramat  * Free the memory allocated for phci client path list.
85223c34adc5Sramat  */
85233c34adc5Sramat static void
85243c34adc5Sramat free_phclient_path_list(mdi_phys_path_t *pp_head)
85253c34adc5Sramat {
85263c34adc5Sramat 	mdi_phys_path_t *pp, *pp_next;
85273c34adc5Sramat 
85283c34adc5Sramat 	for (pp = pp_head; pp != NULL; pp = pp_next) {
85293c34adc5Sramat 		pp_next = pp->phys_path_next;
85303c34adc5Sramat 		kmem_free(pp->phys_path, strlen(pp->phys_path) + 1);
85313c34adc5Sramat 		kmem_free(pp, sizeof (*pp));
85323c34adc5Sramat 	}
85333c34adc5Sramat }
85343c34adc5Sramat 
85353c34adc5Sramat /*
85363c34adc5Sramat  * Allocated async client structure and initialize with the specified values.
85373c34adc5Sramat  */
85383c34adc5Sramat static mdi_async_client_config_t *
85393c34adc5Sramat alloc_async_client_config(char *ct_name, char *ct_addr,
85403c34adc5Sramat     mdi_phys_path_t *pp_head, mdi_vhcache_lookup_token_t *tok)
85413c34adc5Sramat {
85423c34adc5Sramat 	mdi_async_client_config_t *acc;
85433c34adc5Sramat 
85443c34adc5Sramat 	acc = kmem_alloc(sizeof (*acc), KM_SLEEP);
85453c34adc5Sramat 	acc->acc_ct_name = i_ddi_strdup(ct_name, KM_SLEEP);
85463c34adc5Sramat 	acc->acc_ct_addr = i_ddi_strdup(ct_addr, KM_SLEEP);
85473c34adc5Sramat 	acc->acc_phclient_path_list_head = pp_head;
85483c34adc5Sramat 	init_vhcache_lookup_token(&acc->acc_token, tok);
85493c34adc5Sramat 	acc->acc_next = NULL;
85503c34adc5Sramat 	return (acc);
85513c34adc5Sramat }
85523c34adc5Sramat 
85533c34adc5Sramat /*
85543c34adc5Sramat  * Free the memory allocated for the async client structure and their members.
85553c34adc5Sramat  */
85563c34adc5Sramat static void
85573c34adc5Sramat free_async_client_config(mdi_async_client_config_t *acc)
85583c34adc5Sramat {
85593c34adc5Sramat 	if (acc->acc_phclient_path_list_head)
85603c34adc5Sramat 		free_phclient_path_list(acc->acc_phclient_path_list_head);
85613c34adc5Sramat 	kmem_free(acc->acc_ct_name, strlen(acc->acc_ct_name) + 1);
85623c34adc5Sramat 	kmem_free(acc->acc_ct_addr, strlen(acc->acc_ct_addr) + 1);
85633c34adc5Sramat 	kmem_free(acc, sizeof (*acc));
85643c34adc5Sramat }
85653c34adc5Sramat 
85663c34adc5Sramat /*
85673c34adc5Sramat  * Sort vhcache pathinfos (cpis) of the specified client.
85683c34adc5Sramat  * All cpis which do not have MDI_CPI_HINT_PATH_DOES_NOT_EXIST
85693c34adc5Sramat  * flag set come at the beginning of the list. All cpis which have this
85703c34adc5Sramat  * flag set come at the end of the list.
85713c34adc5Sramat  */
85723c34adc5Sramat static void
85733c34adc5Sramat sort_vhcache_paths(mdi_vhcache_client_t *cct)
85743c34adc5Sramat {
85753c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi, *cpi_next, *cpi_head;
85763c34adc5Sramat 
85773c34adc5Sramat 	cpi_head = cct->cct_cpi_head;
85783c34adc5Sramat 	cct->cct_cpi_head = cct->cct_cpi_tail = NULL;
85793c34adc5Sramat 	for (cpi = cpi_head; cpi != NULL; cpi = cpi_next) {
85803c34adc5Sramat 		cpi_next = cpi->cpi_next;
85813c34adc5Sramat 		enqueue_vhcache_pathinfo(cct, cpi);
85823c34adc5Sramat 	}
85833c34adc5Sramat }
85843c34adc5Sramat 
85853c34adc5Sramat /*
85863c34adc5Sramat  * Verify whether MDI_CPI_HINT_PATH_DOES_NOT_EXIST flag setting is correct for
85873c34adc5Sramat  * every vhcache pathinfo of the specified client. If not adjust the flag
85883c34adc5Sramat  * setting appropriately.
85893c34adc5Sramat  *
85903c34adc5Sramat  * Note that MDI_CPI_HINT_PATH_DOES_NOT_EXIST flag is persisted in the
85913c34adc5Sramat  * on-disk vhci cache. So every time this flag is updated the cache must be
85923c34adc5Sramat  * flushed.
85933c34adc5Sramat  */
85943c34adc5Sramat static void
85953c34adc5Sramat adjust_sort_vhcache_paths(mdi_vhci_config_t *vhc, char *ct_name, char *ct_addr,
85963c34adc5Sramat     mdi_vhcache_lookup_token_t *tok)
85973c34adc5Sramat {
85983c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
85993c34adc5Sramat 	mdi_vhcache_client_t *cct;
86003c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi;
86013c34adc5Sramat 
86023c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_READER);
86033c34adc5Sramat 	if ((cct = lookup_vhcache_client(vhcache, ct_name, ct_addr, tok))
86043c34adc5Sramat 	    == NULL) {
86053c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
86063c34adc5Sramat 		return;
86073c34adc5Sramat 	}
86083c34adc5Sramat 
86093c34adc5Sramat 	/*
86103c34adc5Sramat 	 * to avoid unnecessary on-disk cache updates, first check if an
86113c34adc5Sramat 	 * update is really needed. If no update is needed simply return.
86123c34adc5Sramat 	 */
86133c34adc5Sramat 	for (cpi = cct->cct_cpi_head; cpi != NULL; cpi = cpi->cpi_next) {
86143c34adc5Sramat 		if ((cpi->cpi_pip != NULL &&
86153c34adc5Sramat 		    (cpi->cpi_flags & MDI_CPI_HINT_PATH_DOES_NOT_EXIST)) ||
86163c34adc5Sramat 		    (cpi->cpi_pip == NULL &&
86173c34adc5Sramat 		    !(cpi->cpi_flags & MDI_CPI_HINT_PATH_DOES_NOT_EXIST))) {
86183c34adc5Sramat 			break;
86193c34adc5Sramat 		}
86203c34adc5Sramat 	}
86213c34adc5Sramat 	if (cpi == NULL) {
86223c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
86233c34adc5Sramat 		return;
86243c34adc5Sramat 	}
86253c34adc5Sramat 
86263c34adc5Sramat 	if (rw_tryupgrade(&vhcache->vhcache_lock) == 0) {
86273c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
86283c34adc5Sramat 		rw_enter(&vhcache->vhcache_lock, RW_WRITER);
86293c34adc5Sramat 		if ((cct = lookup_vhcache_client(vhcache, ct_name, ct_addr,
86303c34adc5Sramat 		    tok)) == NULL) {
86313c34adc5Sramat 			rw_exit(&vhcache->vhcache_lock);
86323c34adc5Sramat 			return;
86333c34adc5Sramat 		}
86343c34adc5Sramat 	}
86353c34adc5Sramat 
86363c34adc5Sramat 	for (cpi = cct->cct_cpi_head; cpi != NULL; cpi = cpi->cpi_next) {
86373c34adc5Sramat 		if (cpi->cpi_pip != NULL)
86383c34adc5Sramat 			cpi->cpi_flags &= ~MDI_CPI_HINT_PATH_DOES_NOT_EXIST;
86393c34adc5Sramat 		else
86403c34adc5Sramat 			cpi->cpi_flags |= MDI_CPI_HINT_PATH_DOES_NOT_EXIST;
86413c34adc5Sramat 	}
86423c34adc5Sramat 	sort_vhcache_paths(cct);
86433c34adc5Sramat 
86443c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
86453c34adc5Sramat 	vhcache_dirty(vhc);
86463c34adc5Sramat }
86473c34adc5Sramat 
86483c34adc5Sramat /*
86493c34adc5Sramat  * Configure all specified paths of the client.
86503c34adc5Sramat  */
86513c34adc5Sramat static void
86523c34adc5Sramat config_client_paths_sync(mdi_vhci_config_t *vhc, char *ct_name, char *ct_addr,
86533c34adc5Sramat     mdi_phys_path_t *pp_head, mdi_vhcache_lookup_token_t *tok)
86543c34adc5Sramat {
86553c34adc5Sramat 	mdi_phys_path_t *pp;
86563c34adc5Sramat 
86573c34adc5Sramat 	for (pp = pp_head; pp != NULL; pp = pp->phys_path_next)
86583c34adc5Sramat 		(void) bus_config_one_phci_child(pp->phys_path);
86593c34adc5Sramat 	adjust_sort_vhcache_paths(vhc, ct_name, ct_addr, tok);
86603c34adc5Sramat }
86613c34adc5Sramat 
86623c34adc5Sramat /*
86633c34adc5Sramat  * Dequeue elements from vhci async client config list and bus configure
86643c34adc5Sramat  * their corresponding phci clients.
86653c34adc5Sramat  */
86663c34adc5Sramat static void
86673c34adc5Sramat config_client_paths_thread(void *arg)
86683c34adc5Sramat {
86693c34adc5Sramat 	mdi_vhci_config_t *vhc = (mdi_vhci_config_t *)arg;
86703c34adc5Sramat 	mdi_async_client_config_t *acc;
86713c34adc5Sramat 	clock_t quit_at_ticks;
86723c34adc5Sramat 	clock_t idle_time = mdi_async_config_idle_time * TICKS_PER_SECOND;
86733c34adc5Sramat 	callb_cpr_t cprinfo;
86743c34adc5Sramat 
86753c34adc5Sramat 	CALLB_CPR_INIT(&cprinfo, &vhc->vhc_lock, callb_generic_cpr,
86763c34adc5Sramat 	    "mdi_config_client_paths");
86773c34adc5Sramat 
86783c34adc5Sramat 	for (; ; ) {
86793c34adc5Sramat 		quit_at_ticks = ddi_get_lbolt() + idle_time;
86803c34adc5Sramat 
86813c34adc5Sramat 		mutex_enter(&vhc->vhc_lock);
86823c34adc5Sramat 		while (!(vhc->vhc_flags & MDI_VHC_EXIT) &&
86833c34adc5Sramat 		    vhc->vhc_acc_list_head == NULL &&
86843c34adc5Sramat 		    ddi_get_lbolt() < quit_at_ticks) {
86853c34adc5Sramat 			CALLB_CPR_SAFE_BEGIN(&cprinfo);
86863c34adc5Sramat 			(void) cv_timedwait(&vhc->vhc_cv, &vhc->vhc_lock,
86873c34adc5Sramat 			    quit_at_ticks);
86883c34adc5Sramat 			CALLB_CPR_SAFE_END(&cprinfo, &vhc->vhc_lock);
86893c34adc5Sramat 		}
86903c34adc5Sramat 
86913c34adc5Sramat 		if ((vhc->vhc_flags & MDI_VHC_EXIT) ||
86923c34adc5Sramat 		    vhc->vhc_acc_list_head == NULL)
86933c34adc5Sramat 			goto out;
86943c34adc5Sramat 
86953c34adc5Sramat 		acc = vhc->vhc_acc_list_head;
86963c34adc5Sramat 		vhc->vhc_acc_list_head = acc->acc_next;
86973c34adc5Sramat 		if (vhc->vhc_acc_list_head == NULL)
86983c34adc5Sramat 			vhc->vhc_acc_list_tail = NULL;
86993c34adc5Sramat 		vhc->vhc_acc_count--;
87003c34adc5Sramat 		mutex_exit(&vhc->vhc_lock);
87013c34adc5Sramat 
87023c34adc5Sramat 		config_client_paths_sync(vhc, acc->acc_ct_name,
87033c34adc5Sramat 		    acc->acc_ct_addr, acc->acc_phclient_path_list_head,
87043c34adc5Sramat 		    &acc->acc_token);
87053c34adc5Sramat 
87063c34adc5Sramat 		free_async_client_config(acc);
87073c34adc5Sramat 	}
87083c34adc5Sramat 
87093c34adc5Sramat out:
87103c34adc5Sramat 	vhc->vhc_acc_thrcount--;
87113c34adc5Sramat 	/* CALLB_CPR_EXIT releases the vhc->vhc_lock */
87123c34adc5Sramat 	CALLB_CPR_EXIT(&cprinfo);
87133c34adc5Sramat }
87143c34adc5Sramat 
87153c34adc5Sramat /*
87163c34adc5Sramat  * Arrange for all the phci client paths (pp_head) for the specified client
87173c34adc5Sramat  * to be bus configured asynchronously by a thread.
87183c34adc5Sramat  */
87193c34adc5Sramat static void
87203c34adc5Sramat config_client_paths_async(mdi_vhci_config_t *vhc, char *ct_name, char *ct_addr,
87213c34adc5Sramat     mdi_phys_path_t *pp_head, mdi_vhcache_lookup_token_t *tok)
87223c34adc5Sramat {
87233c34adc5Sramat 	mdi_async_client_config_t *acc, *newacc;
87243c34adc5Sramat 	int create_thread;
87253c34adc5Sramat 
87263c34adc5Sramat 	if (pp_head == NULL)
87273c34adc5Sramat 		return;
87283c34adc5Sramat 
87293c34adc5Sramat 	if (mdi_mtc_off) {
87303c34adc5Sramat 		config_client_paths_sync(vhc, ct_name, ct_addr, pp_head, tok);
87313c34adc5Sramat 		free_phclient_path_list(pp_head);
87323c34adc5Sramat 		return;
87333c34adc5Sramat 	}
87343c34adc5Sramat 
87353c34adc5Sramat 	newacc = alloc_async_client_config(ct_name, ct_addr, pp_head, tok);
87363c34adc5Sramat 	ASSERT(newacc);
87373c34adc5Sramat 
87383c34adc5Sramat 	mutex_enter(&vhc->vhc_lock);
87393c34adc5Sramat 	for (acc = vhc->vhc_acc_list_head; acc != NULL; acc = acc->acc_next) {
87403c34adc5Sramat 		if (strcmp(ct_name, acc->acc_ct_name) == 0 &&
87413c34adc5Sramat 		    strcmp(ct_addr, acc->acc_ct_addr) == 0) {
87423c34adc5Sramat 			free_async_client_config(newacc);
87433c34adc5Sramat 			mutex_exit(&vhc->vhc_lock);
87443c34adc5Sramat 			return;
87453c34adc5Sramat 		}
87463c34adc5Sramat 	}
87473c34adc5Sramat 
87483c34adc5Sramat 	if (vhc->vhc_acc_list_head == NULL)
87493c34adc5Sramat 		vhc->vhc_acc_list_head = newacc;
87503c34adc5Sramat 	else
87513c34adc5Sramat 		vhc->vhc_acc_list_tail->acc_next = newacc;
87523c34adc5Sramat 	vhc->vhc_acc_list_tail = newacc;
87533c34adc5Sramat 	vhc->vhc_acc_count++;
87543c34adc5Sramat 	if (vhc->vhc_acc_count <= vhc->vhc_acc_thrcount) {
87553c34adc5Sramat 		cv_broadcast(&vhc->vhc_cv);
87563c34adc5Sramat 		create_thread = 0;
87573c34adc5Sramat 	} else {
87583c34adc5Sramat 		vhc->vhc_acc_thrcount++;
87593c34adc5Sramat 		create_thread = 1;
87603c34adc5Sramat 	}
87613c34adc5Sramat 	mutex_exit(&vhc->vhc_lock);
87623c34adc5Sramat 
87633c34adc5Sramat 	if (create_thread)
87643c34adc5Sramat 		(void) thread_create(NULL, 0, config_client_paths_thread, vhc,
87653c34adc5Sramat 		    0, &p0, TS_RUN, minclsyspri);
87663c34adc5Sramat }
87673c34adc5Sramat 
87683c34adc5Sramat /*
87693c34adc5Sramat  * Return number of online paths for the specified client.
87703c34adc5Sramat  */
87713c34adc5Sramat static int
87723c34adc5Sramat nonline_paths(mdi_vhcache_client_t *cct)
87733c34adc5Sramat {
87743c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi;
87753c34adc5Sramat 	int online_count = 0;
87763c34adc5Sramat 
87773c34adc5Sramat 	for (cpi = cct->cct_cpi_head; cpi != NULL; cpi = cpi->cpi_next) {
87783c34adc5Sramat 		if (cpi->cpi_pip != NULL) {
87793c34adc5Sramat 			MDI_PI_LOCK(cpi->cpi_pip);
87803c34adc5Sramat 			if (cpi->cpi_pip->pi_state == MDI_PATHINFO_STATE_ONLINE)
87813c34adc5Sramat 				online_count++;
87823c34adc5Sramat 			MDI_PI_UNLOCK(cpi->cpi_pip);
87833c34adc5Sramat 		}
87843c34adc5Sramat 	}
87853c34adc5Sramat 
87863c34adc5Sramat 	return (online_count);
87873c34adc5Sramat }
87883c34adc5Sramat 
87893c34adc5Sramat /*
87903c34adc5Sramat  * Bus configure all paths for the specified vhci client.
87913c34adc5Sramat  * If at least one path for the client is already online, the remaining paths
87923c34adc5Sramat  * will be configured asynchronously. Otherwise, it synchronously configures
87933c34adc5Sramat  * the paths until at least one path is online and then rest of the paths
87943c34adc5Sramat  * will be configured asynchronously.
87953c34adc5Sramat  */
87963c34adc5Sramat static void
87973c34adc5Sramat config_client_paths(mdi_vhci_config_t *vhc, char *ct_name, char *ct_addr)
87983c34adc5Sramat {
87993c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
88003c34adc5Sramat 	mdi_phys_path_t *pp_head, *pp;
88013c34adc5Sramat 	mdi_vhcache_client_t *cct;
88023c34adc5Sramat 	mdi_vhcache_lookup_token_t tok;
88033c34adc5Sramat 
88043c34adc5Sramat 	ASSERT(RW_LOCK_HELD(&vhcache->vhcache_lock));
88053c34adc5Sramat 
88063c34adc5Sramat 	init_vhcache_lookup_token(&tok, NULL);
88073c34adc5Sramat 
88083c34adc5Sramat 	if (ct_name == NULL || ct_addr == NULL ||
88093c34adc5Sramat 	    (cct = lookup_vhcache_client(vhcache, ct_name, ct_addr, &tok))
88103c34adc5Sramat 	    == NULL ||
88113c34adc5Sramat 	    (pp_head = build_phclient_path_list(cct, ct_name)) == NULL) {
88123c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
88133c34adc5Sramat 		return;
88143c34adc5Sramat 	}
88153c34adc5Sramat 
88163c34adc5Sramat 	/* if at least one path is online, configure the rest asynchronously */
88173c34adc5Sramat 	if (nonline_paths(cct) > 0) {
88183c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
88193c34adc5Sramat 		config_client_paths_async(vhc, ct_name, ct_addr, pp_head, &tok);
88203c34adc5Sramat 		return;
88213c34adc5Sramat 	}
88223c34adc5Sramat 
88233c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
88243c34adc5Sramat 
88253c34adc5Sramat 	for (pp = pp_head; pp != NULL; pp = pp->phys_path_next) {
88263c34adc5Sramat 		if (bus_config_one_phci_child(pp->phys_path) == MDI_SUCCESS) {
88273c34adc5Sramat 			rw_enter(&vhcache->vhcache_lock, RW_READER);
88283c34adc5Sramat 
88293c34adc5Sramat 			if ((cct = lookup_vhcache_client(vhcache, ct_name,
88303c34adc5Sramat 			    ct_addr, &tok)) == NULL) {
88313c34adc5Sramat 				rw_exit(&vhcache->vhcache_lock);
88323c34adc5Sramat 				goto out;
88333c34adc5Sramat 			}
88343c34adc5Sramat 
88353c34adc5Sramat 			if (nonline_paths(cct) > 0 &&
88363c34adc5Sramat 			    pp->phys_path_next != NULL) {
88373c34adc5Sramat 				rw_exit(&vhcache->vhcache_lock);
88383c34adc5Sramat 				config_client_paths_async(vhc, ct_name, ct_addr,
88393c34adc5Sramat 				    pp->phys_path_next, &tok);
88403c34adc5Sramat 				pp->phys_path_next = NULL;
88413c34adc5Sramat 				goto out;
88423c34adc5Sramat 			}
88433c34adc5Sramat 
88443c34adc5Sramat 			rw_exit(&vhcache->vhcache_lock);
88453c34adc5Sramat 		}
88463c34adc5Sramat 	}
88473c34adc5Sramat 
88483c34adc5Sramat 	adjust_sort_vhcache_paths(vhc, ct_name, ct_addr, &tok);
88493c34adc5Sramat out:
88503c34adc5Sramat 	free_phclient_path_list(pp_head);
88513c34adc5Sramat }
88523c34adc5Sramat 
88533c34adc5Sramat static void
88543c34adc5Sramat single_threaded_vhconfig_enter(mdi_vhci_config_t *vhc)
88553c34adc5Sramat {
88563c34adc5Sramat 	mutex_enter(&vhc->vhc_lock);
88573c34adc5Sramat 	while (vhc->vhc_flags & MDI_VHC_SINGLE_THREADED)
88583c34adc5Sramat 		cv_wait(&vhc->vhc_cv, &vhc->vhc_lock);
88593c34adc5Sramat 	vhc->vhc_flags |= MDI_VHC_SINGLE_THREADED;
88603c34adc5Sramat 	mutex_exit(&vhc->vhc_lock);
88613c34adc5Sramat }
88623c34adc5Sramat 
88633c34adc5Sramat static void
88643c34adc5Sramat single_threaded_vhconfig_exit(mdi_vhci_config_t *vhc)
88653c34adc5Sramat {
88663c34adc5Sramat 	mutex_enter(&vhc->vhc_lock);
88673c34adc5Sramat 	vhc->vhc_flags &= ~MDI_VHC_SINGLE_THREADED;
88683c34adc5Sramat 	cv_broadcast(&vhc->vhc_cv);
88693c34adc5Sramat 	mutex_exit(&vhc->vhc_lock);
88703c34adc5Sramat }
88713c34adc5Sramat 
/*
 * One entry of a built-in phci driver table: the driver name together with
 * a flag telling whether the driver supports the root device.
 */
typedef struct mdi_phci_driver_info {
	char	*phdriver_name;		/* name of the phci driver */
	int	phdriver_root_support;	/* non zero: supports root device */
} mdi_phci_driver_info_t;
887852cac543Sramat 
88793c34adc5Sramat /*
888052cac543Sramat  * vhci class and root support capability of a phci driver can be
888152cac543Sramat  * specified using ddi-vhci-class and ddi-no-root-support properties in the
888252cac543Sramat  * phci driver.conf file. The built-in tables below contain this information
888352cac543Sramat  * for those phci drivers whose driver.conf files don't yet contain this info.
888452cac543Sramat  *
888552cac543Sramat  * All phci drivers expect iscsi have root device support.
888652cac543Sramat  */
888752cac543Sramat static mdi_phci_driver_info_t scsi_phci_driver_list[] = {
888852cac543Sramat 	{ "fp", 1 },
888952cac543Sramat 	{ "iscsi", 0 },
889052cac543Sramat 	{ "ibsrp", 1 }
889152cac543Sramat 	};
889252cac543Sramat 
889352cac543Sramat static mdi_phci_driver_info_t ib_phci_driver_list[] = { "tavor", 1 };
889452cac543Sramat 
889552cac543Sramat static void *
889652cac543Sramat mdi_realloc(void *old_ptr, size_t old_size, size_t new_size)
889752cac543Sramat {
889852cac543Sramat 	void *new_ptr;
889952cac543Sramat 
890052cac543Sramat 	new_ptr = kmem_zalloc(new_size, KM_SLEEP);
890152cac543Sramat 	if (old_ptr) {
8902f7209cf2Spramodbg 		bcopy(old_ptr, new_ptr, MIN(old_size, new_size));
890352cac543Sramat 		kmem_free(old_ptr, old_size);
890452cac543Sramat 	}
890552cac543Sramat 	return (new_ptr);
890652cac543Sramat }
890752cac543Sramat 
890852cac543Sramat static void
890952cac543Sramat add_to_phci_list(char ***driver_list, int **root_support_list,
891052cac543Sramat     int *cur_elements, int *max_elements, char *driver_name, int root_support)
891152cac543Sramat {
891252cac543Sramat 	ASSERT(*cur_elements <= *max_elements);
891352cac543Sramat 	if (*cur_elements == *max_elements) {
891452cac543Sramat 		*max_elements += 10;
891552cac543Sramat 		*driver_list = mdi_realloc(*driver_list,
891652cac543Sramat 		    sizeof (char *) * (*cur_elements),
891752cac543Sramat 		    sizeof (char *) * (*max_elements));
891852cac543Sramat 		*root_support_list = mdi_realloc(*root_support_list,
891952cac543Sramat 		    sizeof (int) * (*cur_elements),
892052cac543Sramat 		    sizeof (int) * (*max_elements));
892152cac543Sramat 	}
892252cac543Sramat 	(*driver_list)[*cur_elements] = i_ddi_strdup(driver_name, KM_SLEEP);
892352cac543Sramat 	(*root_support_list)[*cur_elements] = root_support;
892452cac543Sramat 	(*cur_elements)++;
892552cac543Sramat }
892652cac543Sramat 
892752cac543Sramat static void
892852cac543Sramat get_phci_driver_list(char *vhci_class, char ***driver_list,
892952cac543Sramat     int **root_support_list, int *cur_elements, int *max_elements)
893052cac543Sramat {
893152cac543Sramat 	mdi_phci_driver_info_t	*st_driver_list, *p;
893252cac543Sramat 	int		st_ndrivers, root_support, i, j, driver_conf_count;
893352cac543Sramat 	major_t		m;
893452cac543Sramat 	struct devnames	*dnp;
893552cac543Sramat 	ddi_prop_t	*propp;
893652cac543Sramat 
893752cac543Sramat 	*driver_list = NULL;
893852cac543Sramat 	*root_support_list = NULL;
893952cac543Sramat 	*cur_elements = 0;
894052cac543Sramat 	*max_elements = 0;
894152cac543Sramat 
894252cac543Sramat 	/* add the phci drivers derived from the phci driver.conf files */
894352cac543Sramat 	for (m = 0; m < devcnt; m++) {
894452cac543Sramat 		dnp = &devnamesp[m];
894552cac543Sramat 
894652cac543Sramat 		if (dnp->dn_flags & DN_PHCI_DRIVER) {
894752cac543Sramat 			LOCK_DEV_OPS(&dnp->dn_lock);
894852cac543Sramat 			if (dnp->dn_global_prop_ptr != NULL &&
894952cac543Sramat 			    (propp = i_ddi_prop_search(DDI_DEV_T_ANY,
895052cac543Sramat 			    DDI_VHCI_CLASS, DDI_PROP_TYPE_STRING,
895152cac543Sramat 			    &dnp->dn_global_prop_ptr->prop_list)) != NULL &&
895252cac543Sramat 			    strcmp(propp->prop_val, vhci_class) == 0) {
895352cac543Sramat 
895452cac543Sramat 				root_support = (i_ddi_prop_search(DDI_DEV_T_ANY,
895552cac543Sramat 				    DDI_NO_ROOT_SUPPORT, DDI_PROP_TYPE_INT,
895652cac543Sramat 				    &dnp->dn_global_prop_ptr->prop_list)
895752cac543Sramat 				    == NULL) ? 1 : 0;
895852cac543Sramat 
895952cac543Sramat 				add_to_phci_list(driver_list, root_support_list,
896052cac543Sramat 				    cur_elements, max_elements, dnp->dn_name,
896152cac543Sramat 				    root_support);
896252cac543Sramat 
896352cac543Sramat 				UNLOCK_DEV_OPS(&dnp->dn_lock);
896452cac543Sramat 			} else
896552cac543Sramat 				UNLOCK_DEV_OPS(&dnp->dn_lock);
896652cac543Sramat 		}
896752cac543Sramat 	}
896852cac543Sramat 
896952cac543Sramat 	driver_conf_count = *cur_elements;
897052cac543Sramat 
897152cac543Sramat 	/* add the phci drivers specified in the built-in tables */
897252cac543Sramat 	if (strcmp(vhci_class, MDI_HCI_CLASS_SCSI) == 0) {
897352cac543Sramat 		st_driver_list = scsi_phci_driver_list;
897452cac543Sramat 		st_ndrivers = sizeof (scsi_phci_driver_list) /
897552cac543Sramat 		    sizeof (mdi_phci_driver_info_t);
897652cac543Sramat 	} else if (strcmp(vhci_class, MDI_HCI_CLASS_IB) == 0) {
897752cac543Sramat 		st_driver_list = ib_phci_driver_list;
897852cac543Sramat 		st_ndrivers = sizeof (ib_phci_driver_list) /
897952cac543Sramat 		    sizeof (mdi_phci_driver_info_t);
898052cac543Sramat 	} else {
898152cac543Sramat 		st_driver_list = NULL;
898252cac543Sramat 		st_ndrivers = 0;
898352cac543Sramat 	}
898452cac543Sramat 
898552cac543Sramat 	for (i = 0, p = st_driver_list; i < st_ndrivers; i++, p++) {
898652cac543Sramat 		/* add this phci driver if not already added before */
898752cac543Sramat 		for (j = 0; j < driver_conf_count; j++) {
898852cac543Sramat 			if (strcmp((*driver_list)[j], p->phdriver_name) == 0)
898952cac543Sramat 				break;
899052cac543Sramat 		}
899152cac543Sramat 		if (j == driver_conf_count) {
899252cac543Sramat 			add_to_phci_list(driver_list, root_support_list,
899352cac543Sramat 			    cur_elements, max_elements, p->phdriver_name,
899452cac543Sramat 			    p->phdriver_root_support);
899552cac543Sramat 		}
899652cac543Sramat 	}
899752cac543Sramat }
899852cac543Sramat 
899952cac543Sramat /*
900052cac543Sramat  * Attach the phci driver instances associated with the specified vhci class.
90013c34adc5Sramat  * If root is mounted attach all phci driver instances.
90023c34adc5Sramat  * If root is not mounted, attach the instances of only those phci
90033c34adc5Sramat  * drivers that have the root support.
90043c34adc5Sramat  */
90053c34adc5Sramat static void
900652cac543Sramat attach_phci_drivers(char *vhci_class)
90073c34adc5Sramat {
900852cac543Sramat 	char	**driver_list, **p;
900952cac543Sramat 	int	*root_support_list;
901052cac543Sramat 	int	cur_elements, max_elements, i;
90113c34adc5Sramat 	major_t	m;
90123c34adc5Sramat 
901352cac543Sramat 	get_phci_driver_list(vhci_class, &driver_list, &root_support_list,
901452cac543Sramat 	    &cur_elements, &max_elements);
90153c34adc5Sramat 
901652cac543Sramat 	for (i = 0; i < cur_elements; i++) {
901752cac543Sramat 		if (modrootloaded || root_support_list[i]) {
901852cac543Sramat 			m = ddi_name_to_major(driver_list[i]);
9019a204de77Scth 			if (m != DDI_MAJOR_T_NONE &&
9020a204de77Scth 			    ddi_hold_installed_driver(m))
90213c34adc5Sramat 				ddi_rele_driver(m);
90223c34adc5Sramat 		}
90233c34adc5Sramat 	}
902452cac543Sramat 
902552cac543Sramat 	if (driver_list) {
902652cac543Sramat 		for (i = 0, p = driver_list; i < cur_elements; i++, p++)
902752cac543Sramat 			kmem_free(*p, strlen(*p) + 1);
902852cac543Sramat 		kmem_free(driver_list, sizeof (char *) * max_elements);
902952cac543Sramat 		kmem_free(root_support_list, sizeof (int) * max_elements);
903052cac543Sramat 	}
90313c34adc5Sramat }
90323c34adc5Sramat 
90333c34adc5Sramat /*
90343c34adc5Sramat  * Build vhci cache:
90353c34adc5Sramat  *
90363c34adc5Sramat  * Attach phci driver instances and then drive BUS_CONFIG_ALL on
90373c34adc5Sramat  * the phci driver instances. During this process the cache gets built.
90383c34adc5Sramat  *
903967e56d35Sramat  * Cache is built fully if the root is mounted.
90403c34adc5Sramat  * If the root is not mounted, phci drivers that do not have root support
90413c34adc5Sramat  * are not attached. As a result the cache is built partially. The entries
90423c34adc5Sramat  * in the cache reflect only those phci drivers that have root support.
90433c34adc5Sramat  */
904467e56d35Sramat static int
904552cac543Sramat build_vhci_cache(mdi_vhci_t *vh)
90463c34adc5Sramat {
904752cac543Sramat 	mdi_vhci_config_t *vhc = vh->vh_config;
90483c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
90493c34adc5Sramat 
905067e56d35Sramat 	single_threaded_vhconfig_enter(vhc);
905167e56d35Sramat 
90523c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_READER);
90533c34adc5Sramat 	if (vhcache->vhcache_flags & MDI_VHCI_CACHE_SETUP_DONE) {
90543c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
905567e56d35Sramat 		single_threaded_vhconfig_exit(vhc);
905667e56d35Sramat 		return (0);
90573c34adc5Sramat 	}
90583c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
90593c34adc5Sramat 
906052cac543Sramat 	attach_phci_drivers(vh->vh_class);
90613c34adc5Sramat 	bus_config_all_phcis(vhcache, NDI_DRV_CONF_REPROBE | NDI_NO_EVENT,
9062a204de77Scth 	    BUS_CONFIG_ALL, DDI_MAJOR_T_NONE);
90633c34adc5Sramat 
90643c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_WRITER);
90653c34adc5Sramat 	vhcache->vhcache_flags |= MDI_VHCI_CACHE_SETUP_DONE;
90663c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
906767e56d35Sramat 
906867e56d35Sramat 	single_threaded_vhconfig_exit(vhc);
90693c34adc5Sramat 	vhcache_dirty(vhc);
907067e56d35Sramat 	return (1);
90713c34adc5Sramat }
90723c34adc5Sramat 
90733c34adc5Sramat /*
907467e56d35Sramat  * Determine if discovery of paths is needed.
90753c34adc5Sramat  */
90763c34adc5Sramat static int
907767e56d35Sramat vhcache_do_discovery(mdi_vhci_config_t *vhc)
90783c34adc5Sramat {
907967e56d35Sramat 	int rv = 1;
908067e56d35Sramat 
908167e56d35Sramat 	mutex_enter(&vhc->vhc_lock);
908267e56d35Sramat 	if (i_ddi_io_initialized() == 0) {
908367e56d35Sramat 		if (vhc->vhc_path_discovery_boot > 0) {
908467e56d35Sramat 			vhc->vhc_path_discovery_boot--;
908567e56d35Sramat 			goto out;
908667e56d35Sramat 		}
908767e56d35Sramat 	} else {
908867e56d35Sramat 		if (vhc->vhc_path_discovery_postboot > 0) {
908967e56d35Sramat 			vhc->vhc_path_discovery_postboot--;
909067e56d35Sramat 			goto out;
909167e56d35Sramat 		}
909267e56d35Sramat 	}
909367e56d35Sramat 
909467e56d35Sramat 	/*
909567e56d35Sramat 	 * Do full path discovery at most once per mdi_path_discovery_interval.
909667e56d35Sramat 	 * This is to avoid a series of full path discoveries when opening
909767e56d35Sramat 	 * stale /dev/[r]dsk links.
909867e56d35Sramat 	 */
909967e56d35Sramat 	if (mdi_path_discovery_interval != -1 &&
9100*d3d50737SRafael Vanoni 	    ddi_get_lbolt64() >= vhc->vhc_path_discovery_cutoff_time)
910167e56d35Sramat 		goto out;
910267e56d35Sramat 
910367e56d35Sramat 	rv = 0;
910467e56d35Sramat out:
910567e56d35Sramat 	mutex_exit(&vhc->vhc_lock);
910667e56d35Sramat 	return (rv);
910767e56d35Sramat }
910867e56d35Sramat 
910967e56d35Sramat /*
911067e56d35Sramat  * Discover all paths:
911167e56d35Sramat  *
911267e56d35Sramat  * Attach phci driver instances and then drive BUS_CONFIG_ALL on all the phci
911367e56d35Sramat  * driver instances. During this process all paths will be discovered.
911467e56d35Sramat  */
911567e56d35Sramat static int
911652cac543Sramat vhcache_discover_paths(mdi_vhci_t *vh)
911767e56d35Sramat {
911852cac543Sramat 	mdi_vhci_config_t *vhc = vh->vh_config;
911967e56d35Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
912067e56d35Sramat 	int rv = 0;
91213c34adc5Sramat 
91223c34adc5Sramat 	single_threaded_vhconfig_enter(vhc);
91233c34adc5Sramat 
912467e56d35Sramat 	if (vhcache_do_discovery(vhc)) {
912552cac543Sramat 		attach_phci_drivers(vh->vh_class);
912667e56d35Sramat 		bus_config_all_phcis(vhcache, NDI_DRV_CONF_REPROBE |
9127a204de77Scth 		    NDI_NO_EVENT, BUS_CONFIG_ALL, DDI_MAJOR_T_NONE);
912867e56d35Sramat 
91293c34adc5Sramat 		mutex_enter(&vhc->vhc_lock);
9130*d3d50737SRafael Vanoni 		vhc->vhc_path_discovery_cutoff_time = ddi_get_lbolt64() +
913167e56d35Sramat 		    mdi_path_discovery_interval * TICKS_PER_SECOND;
91323c34adc5Sramat 		mutex_exit(&vhc->vhc_lock);
913367e56d35Sramat 		rv = 1;
91343c34adc5Sramat 	}
91353c34adc5Sramat 
91363c34adc5Sramat 	single_threaded_vhconfig_exit(vhc);
91373c34adc5Sramat 	return (rv);
91383c34adc5Sramat }
91393c34adc5Sramat 
91403c34adc5Sramat /*
91413c34adc5Sramat  * Generic vhci bus config implementation:
91423c34adc5Sramat  *
91433c34adc5Sramat  * Parameters
91443c34adc5Sramat  *	vdip	vhci dip
91453c34adc5Sramat  *	flags	bus config flags
91463c34adc5Sramat  *	op	bus config operation
91473c34adc5Sramat  *	The remaining parameters are bus config operation specific
91483c34adc5Sramat  *
91493c34adc5Sramat  * for BUS_CONFIG_ONE
91503c34adc5Sramat  *	arg	pointer to name@addr
91513c34adc5Sramat  *	child	upon successful return from this function, *child will be
91523c34adc5Sramat  *		set to the configured and held devinfo child node of vdip.
91533c34adc5Sramat  *	ct_addr	pointer to client address (i.e. GUID)
91543c34adc5Sramat  *
91553c34adc5Sramat  * for BUS_CONFIG_DRIVER
91563c34adc5Sramat  *	arg	major number of the driver
91573c34adc5Sramat  *	child and ct_addr parameters are ignored
91583c34adc5Sramat  *
91593c34adc5Sramat  * for BUS_CONFIG_ALL
91603c34adc5Sramat  *	arg, child, and ct_addr parameters are ignored
91613c34adc5Sramat  *
91623c34adc5Sramat  * Note that for the rest of the bus config operations, this function simply
91633c34adc5Sramat  * calls the framework provided default bus config routine.
91643c34adc5Sramat  */
91653c34adc5Sramat int
91663c34adc5Sramat mdi_vhci_bus_config(dev_info_t *vdip, uint_t flags, ddi_bus_config_op_t op,
91673c34adc5Sramat     void *arg, dev_info_t **child, char *ct_addr)
91683c34adc5Sramat {
91693c34adc5Sramat 	mdi_vhci_t *vh = i_devi_get_vhci(vdip);
91703c34adc5Sramat 	mdi_vhci_config_t *vhc = vh->vh_config;
91713c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
917267e56d35Sramat 	int rv = 0;
917367e56d35Sramat 	int params_valid = 0;
91743c34adc5Sramat 	char *cp;
91753c34adc5Sramat 
91763c34adc5Sramat 	/*
91775e3986cbScth 	 * To bus config vhcis we relay operation, possibly using another
91785e3986cbScth 	 * thread, to phcis. The phci driver then interacts with MDI to cause
91795e3986cbScth 	 * vhci child nodes to be enumerated under the vhci node.  Adding a
91805e3986cbScth 	 * vhci child requires an ndi_devi_enter of the vhci. Since another
91815e3986cbScth 	 * thread may be adding the child, to avoid deadlock we can't wait
91825e3986cbScth 	 * for the relayed operations to complete if we have already entered
91835e3986cbScth 	 * the vhci node.
91843c34adc5Sramat 	 */
91853c34adc5Sramat 	if (DEVI_BUSY_OWNED(vdip)) {
91864c06356bSdh142964 		MDI_DEBUG(2, (MDI_NOTE, vdip,
91874c06356bSdh142964 		    "vhci dip is busy owned %p", (void *)vdip));
91883c34adc5Sramat 		goto default_bus_config;
91893c34adc5Sramat 	}
91903c34adc5Sramat 
91913c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_READER);
91923c34adc5Sramat 	if (!(vhcache->vhcache_flags & MDI_VHCI_CACHE_SETUP_DONE)) {
91933c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
919452cac543Sramat 		rv = build_vhci_cache(vh);
91953c34adc5Sramat 		rw_enter(&vhcache->vhcache_lock, RW_READER);
91963c34adc5Sramat 	}
91973c34adc5Sramat 
91983c34adc5Sramat 	switch (op) {
91993c34adc5Sramat 	case BUS_CONFIG_ONE:
920067e56d35Sramat 		if (arg != NULL && ct_addr != NULL) {
92013c34adc5Sramat 			/* extract node name */
92023c34adc5Sramat 			cp = (char *)arg;
92033c34adc5Sramat 			while (*cp != '\0' && *cp != '@')
92043c34adc5Sramat 				cp++;
92053c34adc5Sramat 			if (*cp == '@') {
920667e56d35Sramat 				params_valid = 1;
92073c34adc5Sramat 				*cp = '\0';
92083c34adc5Sramat 				config_client_paths(vhc, (char *)arg, ct_addr);
920967e56d35Sramat 				/* config_client_paths() releases cache_lock */
92103c34adc5Sramat 				*cp = '@';
921167e56d35Sramat 				break;
921267e56d35Sramat 			}
921367e56d35Sramat 		}
921467e56d35Sramat 
92153c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
92163c34adc5Sramat 		break;
92173c34adc5Sramat 
92183c34adc5Sramat 	case BUS_CONFIG_DRIVER:
92193c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
922067e56d35Sramat 		if (rv == 0)
922167e56d35Sramat 			st_bus_config_all_phcis(vhc, flags, op,
92223c34adc5Sramat 			    (major_t)(uintptr_t)arg);
92233c34adc5Sramat 		break;
92243c34adc5Sramat 
92253c34adc5Sramat 	case BUS_CONFIG_ALL:
92263c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
922767e56d35Sramat 		if (rv == 0)
922867e56d35Sramat 			st_bus_config_all_phcis(vhc, flags, op, -1);
92293c34adc5Sramat 		break;
92303c34adc5Sramat 
92313c34adc5Sramat 	default:
92323c34adc5Sramat 		rw_exit(&vhcache->vhcache_lock);
92333c34adc5Sramat 		break;
92343c34adc5Sramat 	}
92353c34adc5Sramat 
92363c34adc5Sramat 
92373c34adc5Sramat default_bus_config:
92383c34adc5Sramat 	/*
92393c34adc5Sramat 	 * All requested child nodes are enumerated under the vhci.
92403c34adc5Sramat 	 * Now configure them.
92413c34adc5Sramat 	 */
92423c34adc5Sramat 	if (ndi_busop_bus_config(vdip, flags, op, arg, child, 0) ==
92433c34adc5Sramat 	    NDI_SUCCESS) {
92443c34adc5Sramat 		return (MDI_SUCCESS);
924567e56d35Sramat 	} else if (op == BUS_CONFIG_ONE && rv == 0 && params_valid) {
924667e56d35Sramat 		/* discover all paths and try configuring again */
924752cac543Sramat 		if (vhcache_discover_paths(vh) &&
924867e56d35Sramat 		    ndi_busop_bus_config(vdip, flags, op, arg, child, 0) ==
924967e56d35Sramat 		    NDI_SUCCESS)
925067e56d35Sramat 			return (MDI_SUCCESS);
92513c34adc5Sramat 	}
92523c34adc5Sramat 
92533c34adc5Sramat 	return (MDI_FAILURE);
92543c34adc5Sramat }
92553c34adc5Sramat 
92563c34adc5Sramat /*
92573c34adc5Sramat  * Read the on-disk vhci cache into an nvlist for the specified vhci class.
92583c34adc5Sramat  */
92593c34adc5Sramat static nvlist_t *
92603c34adc5Sramat read_on_disk_vhci_cache(char *vhci_class)
92613c34adc5Sramat {
92623c34adc5Sramat 	nvlist_t *nvl;
92633c34adc5Sramat 	int err;
92643c34adc5Sramat 	char *filename;
92653c34adc5Sramat 
92663c34adc5Sramat 	filename = vhclass2vhcache_filename(vhci_class);
92673c34adc5Sramat 
92683c34adc5Sramat 	if ((err = fread_nvlist(filename, &nvl)) == 0) {
92693c34adc5Sramat 		kmem_free(filename, strlen(filename) + 1);
92703c34adc5Sramat 		return (nvl);
92713c34adc5Sramat 	} else if (err == EIO)
92724c06356bSdh142964 		cmn_err(CE_WARN, "%s: I/O error, will recreate", filename);
92733c34adc5Sramat 	else if (err == EINVAL)
92743c34adc5Sramat 		cmn_err(CE_WARN,
92754c06356bSdh142964 		    "%s: data file corrupted, will recreate", filename);
92763c34adc5Sramat 
92773c34adc5Sramat 	kmem_free(filename, strlen(filename) + 1);
92783c34adc5Sramat 	return (NULL);
92793c34adc5Sramat }
92803c34adc5Sramat 
92813c34adc5Sramat /*
92823c34adc5Sramat  * Read on-disk vhci cache into nvlists for all vhci classes.
92833c34adc5Sramat  * Called during booting by i_ddi_read_devices_files().
92843c34adc5Sramat  */
92853c34adc5Sramat void
92863c34adc5Sramat mdi_read_devices_files(void)
92873c34adc5Sramat {
92883c34adc5Sramat 	int i;
92893c34adc5Sramat 
92903c34adc5Sramat 	for (i = 0; i < N_VHCI_CLASSES; i++)
92913c34adc5Sramat 		vhcache_nvl[i] = read_on_disk_vhci_cache(vhci_class_list[i]);
92923c34adc5Sramat }
92933c34adc5Sramat 
92943c34adc5Sramat /*
92953c34adc5Sramat  * Remove all stale entries from vhci cache.
92963c34adc5Sramat  */
92973c34adc5Sramat static void
92983c34adc5Sramat clean_vhcache(mdi_vhci_config_t *vhc)
92993c34adc5Sramat {
93003c34adc5Sramat 	mdi_vhci_cache_t *vhcache = &vhc->vhc_vhcache;
93013c34adc5Sramat 	mdi_vhcache_phci_t *cphci, *cphci_head, *cphci_next;
93023c34adc5Sramat 	mdi_vhcache_client_t *cct, *cct_head, *cct_next;
93033c34adc5Sramat 	mdi_vhcache_pathinfo_t *cpi, *cpi_head, *cpi_next;
93043c34adc5Sramat 
93053c34adc5Sramat 	rw_enter(&vhcache->vhcache_lock, RW_WRITER);
93063c34adc5Sramat 
93073c34adc5Sramat 	cct_head = vhcache->vhcache_client_head;
93083c34adc5Sramat 	vhcache->vhcache_client_head = vhcache->vhcache_client_tail = NULL;
93093c34adc5Sramat 	for (cct = cct_head; cct != NULL; cct = cct_next) {
93103c34adc5Sramat 		cct_next = cct->cct_next;
93113c34adc5Sramat 
93123c34adc5Sramat 		cpi_head = cct->cct_cpi_head;
93133c34adc5Sramat 		cct->cct_cpi_head = cct->cct_cpi_tail = NULL;
93143c34adc5Sramat 		for (cpi = cpi_head; cpi != NULL; cpi = cpi_next) {
93153c34adc5Sramat 			cpi_next = cpi->cpi_next;
93163c34adc5Sramat 			if (cpi->cpi_pip != NULL) {
93173c34adc5Sramat 				ASSERT(cpi->cpi_cphci->cphci_phci != NULL);
93183c34adc5Sramat 				enqueue_tail_vhcache_pathinfo(cct, cpi);
93193c34adc5Sramat 			} else
93203c34adc5Sramat 				free_vhcache_pathinfo(cpi);
93213c34adc5Sramat 		}
93223c34adc5Sramat 
93233c34adc5Sramat 		if (cct->cct_cpi_head != NULL)
93243c34adc5Sramat 			enqueue_vhcache_client(vhcache, cct);
93253c34adc5Sramat 		else {
93263c34adc5Sramat 			(void) mod_hash_destroy(vhcache->vhcache_client_hash,
93273c34adc5Sramat 			    (mod_hash_key_t)cct->cct_name_addr);
93283c34adc5Sramat 			free_vhcache_client(cct);
93293c34adc5Sramat 		}
93303c34adc5Sramat 	}
93313c34adc5Sramat 
93323c34adc5Sramat 	cphci_head = vhcache->vhcache_phci_head;
93333c34adc5Sramat 	vhcache->vhcache_phci_head = vhcache->vhcache_phci_tail = NULL;
93343c34adc5Sramat 	for (cphci = cphci_head; cphci != NULL; cphci = cphci_next) {
93353c34adc5Sramat 		cphci_next = cphci->cphci_next;
93363c34adc5Sramat 		if (cphci->cphci_phci != NULL)
93373c34adc5Sramat 			enqueue_vhcache_phci(vhcache, cphci);
93383c34adc5Sramat 		else
93393c34adc5Sramat 			free_vhcache_phci(cphci);
93403c34adc5Sramat 	}
93413c34adc5Sramat 
9342*d3d50737SRafael Vanoni 	vhcache->vhcache_clean_time = ddi_get_lbolt64();
93433c34adc5Sramat 	rw_exit(&vhcache->vhcache_lock);
93443c34adc5Sramat 	vhcache_dirty(vhc);
93453c34adc5Sramat }
93463c34adc5Sramat 
93473c34adc5Sramat /*
93483c34adc5Sramat  * Remove all stale entries from vhci cache.
93493c34adc5Sramat  * Called by i_ddi_clean_devices_files() during the execution of devfsadm -C
93503c34adc5Sramat  */
93513c34adc5Sramat void
93523c34adc5Sramat mdi_clean_vhcache(void)
93533c34adc5Sramat {
93543c34adc5Sramat 	mdi_vhci_t *vh;
93553c34adc5Sramat 
93563c34adc5Sramat 	mutex_enter(&mdi_mutex);
93573c34adc5Sramat 	for (vh = mdi_vhci_head; vh != NULL; vh = vh->vh_next) {
93583c34adc5Sramat 		vh->vh_refcnt++;
93593c34adc5Sramat 		mutex_exit(&mdi_mutex);
93603c34adc5Sramat 		clean_vhcache(vh->vh_config);
93613c34adc5Sramat 		mutex_enter(&mdi_mutex);
93623c34adc5Sramat 		vh->vh_refcnt--;
93633c34adc5Sramat 	}
93643c34adc5Sramat 	mutex_exit(&mdi_mutex);
93653c34adc5Sramat }
93668c4f8890Srs135747 
93678c4f8890Srs135747 /*
93688c4f8890Srs135747  * mdi_vhci_walk_clients():
93698c4f8890Srs135747  *		Walker routine to traverse client dev_info nodes
93708c4f8890Srs135747  * ddi_walk_devs(ddi_get_child(vdip), f, arg) returns the entire tree
93718c4f8890Srs135747  * below the client, including nexus devices, which we dont want.
93728c4f8890Srs135747  * So we just traverse the immediate siblings, starting from 1st client.
93738c4f8890Srs135747  */
93748c4f8890Srs135747 void
93758c4f8890Srs135747 mdi_vhci_walk_clients(dev_info_t *vdip,
93768c4f8890Srs135747     int (*f)(dev_info_t *, void *), void *arg)
93778c4f8890Srs135747 {
93785e3986cbScth 	mdi_vhci_t	*vh = i_devi_get_vhci(vdip);
93798c4f8890Srs135747 	dev_info_t	*cdip;
93808c4f8890Srs135747 	mdi_client_t	*ct;
93818c4f8890Srs135747 
93825e3986cbScth 	MDI_VHCI_CLIENT_LOCK(vh);
93838c4f8890Srs135747 	cdip = ddi_get_child(vdip);
93848c4f8890Srs135747 	while (cdip) {
93858c4f8890Srs135747 		ct = i_devi_get_client(cdip);
93868c4f8890Srs135747 		MDI_CLIENT_LOCK(ct);
93878c4f8890Srs135747 
93885e3986cbScth 		if (((*f)(cdip, arg)) == DDI_WALK_CONTINUE)
93898c4f8890Srs135747 			cdip = ddi_get_next_sibling(cdip);
93905e3986cbScth 		else
93915e3986cbScth 			cdip = NULL;
9392c73a93f2Sdm120769 
9393c73a93f2Sdm120769 		MDI_CLIENT_UNLOCK(ct);
93948c4f8890Srs135747 	}
93955e3986cbScth 	MDI_VHCI_CLIENT_UNLOCK(vh);
93968c4f8890Srs135747 }
93978c4f8890Srs135747 
93988c4f8890Srs135747 /*
93998c4f8890Srs135747  * mdi_vhci_walk_phcis():
94008c4f8890Srs135747  *		Walker routine to traverse phci dev_info nodes
94018c4f8890Srs135747  */
94028c4f8890Srs135747 void
94038c4f8890Srs135747 mdi_vhci_walk_phcis(dev_info_t *vdip,
94048c4f8890Srs135747     int (*f)(dev_info_t *, void *), void *arg)
94058c4f8890Srs135747 {
94065e3986cbScth 	mdi_vhci_t	*vh = i_devi_get_vhci(vdip);
94075e3986cbScth 	mdi_phci_t	*ph, *next;
94088c4f8890Srs135747 
94095e3986cbScth 	MDI_VHCI_PHCI_LOCK(vh);
94108c4f8890Srs135747 	ph = vh->vh_phci_head;
94118c4f8890Srs135747 	while (ph) {
94128c4f8890Srs135747 		MDI_PHCI_LOCK(ph);
94138c4f8890Srs135747 
94145e3986cbScth 		if (((*f)(ph->ph_dip, arg)) == DDI_WALK_CONTINUE)
94155e3986cbScth 			next = ph->ph_next;
94165e3986cbScth 		else
94175e3986cbScth 			next = NULL;
9418c73a93f2Sdm120769 
9419c73a93f2Sdm120769 		MDI_PHCI_UNLOCK(ph);
94205e3986cbScth 		ph = next;
94218c4f8890Srs135747 	}
94225e3986cbScth 	MDI_VHCI_PHCI_UNLOCK(vh);
94238c4f8890Srs135747 }
94248c4f8890Srs135747 
94258c4f8890Srs135747 
94268c4f8890Srs135747 /*
94278c4f8890Srs135747  * mdi_walk_vhcis():
94288c4f8890Srs135747  *		Walker routine to traverse vhci dev_info nodes
94298c4f8890Srs135747  */
94308c4f8890Srs135747 void
94318c4f8890Srs135747 mdi_walk_vhcis(int (*f)(dev_info_t *, void *), void *arg)
94328c4f8890Srs135747 {
94338c4f8890Srs135747 	mdi_vhci_t	*vh = NULL;
94348c4f8890Srs135747 
94358c4f8890Srs135747 	mutex_enter(&mdi_mutex);
94368c4f8890Srs135747 	/*
94378c4f8890Srs135747 	 * Scan for already registered vhci
94388c4f8890Srs135747 	 */
94398c4f8890Srs135747 	for (vh = mdi_vhci_head; vh != NULL; vh = vh->vh_next) {
94408c4f8890Srs135747 		vh->vh_refcnt++;
94418c4f8890Srs135747 		mutex_exit(&mdi_mutex);
94428c4f8890Srs135747 		if (((*f)(vh->vh_dip, arg)) != DDI_WALK_CONTINUE) {
94438c4f8890Srs135747 			mutex_enter(&mdi_mutex);
94448c4f8890Srs135747 			vh->vh_refcnt--;
94458c4f8890Srs135747 			break;
94468c4f8890Srs135747 		} else {
94478c4f8890Srs135747 			mutex_enter(&mdi_mutex);
94488c4f8890Srs135747 			vh->vh_refcnt--;
94498c4f8890Srs135747 		}
94508c4f8890Srs135747 	}
94518c4f8890Srs135747 
94528c4f8890Srs135747 	mutex_exit(&mdi_mutex);
94538c4f8890Srs135747 }
94548c4f8890Srs135747 
94558c4f8890Srs135747 /*
94568c4f8890Srs135747  * i_mdi_log_sysevent():
94578c4f8890Srs135747  *		Logs events for pickup by syseventd
94588c4f8890Srs135747  */
94598c4f8890Srs135747 static void
94608c4f8890Srs135747 i_mdi_log_sysevent(dev_info_t *dip, char *ph_vh_class, char *subclass)
94618c4f8890Srs135747 {
94628c4f8890Srs135747 	char		*path_name;
94638c4f8890Srs135747 	nvlist_t	*attr_list;
94648c4f8890Srs135747 
94658c4f8890Srs135747 	if (nvlist_alloc(&attr_list, NV_UNIQUE_NAME_TYPE,
94668c4f8890Srs135747 	    KM_SLEEP) != DDI_SUCCESS) {
94678c4f8890Srs135747 		goto alloc_failed;
94688c4f8890Srs135747 	}
94698c4f8890Srs135747 
94708c4f8890Srs135747 	path_name = kmem_zalloc(MAXPATHLEN, KM_SLEEP);
94718c4f8890Srs135747 	(void) ddi_pathname(dip, path_name);
94728c4f8890Srs135747 
94738c4f8890Srs135747 	if (nvlist_add_string(attr_list, DDI_DRIVER_NAME,
94748c4f8890Srs135747 	    ddi_driver_name(dip)) != DDI_SUCCESS) {
94758c4f8890Srs135747 		goto error;
94768c4f8890Srs135747 	}
94778c4f8890Srs135747 
94788c4f8890Srs135747 	if (nvlist_add_int32(attr_list, DDI_DRIVER_MAJOR,
94798c4f8890Srs135747 	    (int32_t)ddi_driver_major(dip)) != DDI_SUCCESS) {
94808c4f8890Srs135747 		goto error;
94818c4f8890Srs135747 	}
94828c4f8890Srs135747 
94838c4f8890Srs135747 	if (nvlist_add_int32(attr_list, DDI_INSTANCE,
94848c4f8890Srs135747 	    (int32_t)ddi_get_instance(dip)) != DDI_SUCCESS) {
94858c4f8890Srs135747 		goto error;
94868c4f8890Srs135747 	}
94878c4f8890Srs135747 
94888c4f8890Srs135747 	if (nvlist_add_string(attr_list, DDI_PATHNAME,
94898c4f8890Srs135747 	    path_name) != DDI_SUCCESS) {
94908c4f8890Srs135747 		goto error;
94918c4f8890Srs135747 	}
94928c4f8890Srs135747 
94938c4f8890Srs135747 	if (nvlist_add_string(attr_list, DDI_CLASS,
94948c4f8890Srs135747 	    ph_vh_class) != DDI_SUCCESS) {
94958c4f8890Srs135747 		goto error;
94968c4f8890Srs135747 	}
94978c4f8890Srs135747 
94988c4f8890Srs135747 	(void) ddi_log_sysevent(dip, DDI_VENDOR_SUNW, EC_DDI, subclass,
94998c4f8890Srs135747 	    attr_list, NULL, DDI_SLEEP);
95008c4f8890Srs135747 
95018c4f8890Srs135747 error:
95028c4f8890Srs135747 	kmem_free(path_name, MAXPATHLEN);
95038c4f8890Srs135747 	nvlist_free(attr_list);
95048c4f8890Srs135747 	return;
95058c4f8890Srs135747 
95068c4f8890Srs135747 alloc_failed:
95074c06356bSdh142964 	MDI_DEBUG(1, (MDI_WARN, dip, "!unable to send sysevent"));
95088c4f8890Srs135747 }
9509f7209cf2Spramodbg 
9510f7209cf2Spramodbg char **
9511f7209cf2Spramodbg mdi_get_phci_driver_list(char *vhci_class, int	*ndrivers)
9512f7209cf2Spramodbg {
9513f7209cf2Spramodbg 	char	**driver_list, **ret_driver_list = NULL;
9514f7209cf2Spramodbg 	int	*root_support_list;
9515f7209cf2Spramodbg 	int	cur_elements, max_elements;
9516f7209cf2Spramodbg 
9517f7209cf2Spramodbg 	get_phci_driver_list(vhci_class, &driver_list, &root_support_list,
9518f7209cf2Spramodbg 	    &cur_elements, &max_elements);
9519f7209cf2Spramodbg 
9520f7209cf2Spramodbg 
9521f7209cf2Spramodbg 	if (driver_list) {
9522f7209cf2Spramodbg 		kmem_free(root_support_list, sizeof (int) * max_elements);
9523f7209cf2Spramodbg 		ret_driver_list = mdi_realloc(driver_list, sizeof (char *)
9524f7209cf2Spramodbg 		    * max_elements, sizeof (char *) * cur_elements);
9525f7209cf2Spramodbg 	}
9526f7209cf2Spramodbg 	*ndrivers = cur_elements;
9527f7209cf2Spramodbg 
9528f7209cf2Spramodbg 	return (ret_driver_list);
9529f7209cf2Spramodbg 
9530f7209cf2Spramodbg }
9531f7209cf2Spramodbg 
/*
 * mdi_free_phci_driver_list():
 *		Release a driver list of ndrivers entries.  Each string is
 *		freed with a size of strlen() + 1, then the pointer array
 *		itself is freed as ndrivers pointers.  A NULL driver_list is
 *		a no-op.
 */
void
mdi_free_phci_driver_list(char **driver_list, int ndrivers)
{
	int	idx;

	if (driver_list == NULL)
		return;

	for (idx = 0; idx < ndrivers; idx++)
		kmem_free(driver_list[idx], strlen(driver_list[idx]) + 1);

	kmem_free(driver_list, sizeof (char *) * ndrivers);
}
954455e592a2SRandall Ralphs 
954555e592a2SRandall Ralphs /*
954655e592a2SRandall Ralphs  * mdi_is_dev_supported():
954755e592a2SRandall Ralphs  *		function called by pHCI bus config operation to determine if a
954855e592a2SRandall Ralphs  *		device should be represented as a child of the vHCI or the
954955e592a2SRandall Ralphs  *		pHCI.  This decision is made by the vHCI, using cinfo idenity
955055e592a2SRandall Ralphs  *		information passed by the pHCI - specifics of the cinfo
955155e592a2SRandall Ralphs  *		representation are by agreement between the pHCI and vHCI.
955255e592a2SRandall Ralphs  * Return Values:
955355e592a2SRandall Ralphs  *		MDI_SUCCESS
955455e592a2SRandall Ralphs  *		MDI_FAILURE
955555e592a2SRandall Ralphs  */
955655e592a2SRandall Ralphs int
955755e592a2SRandall Ralphs mdi_is_dev_supported(char *class, dev_info_t *pdip, void *cinfo)
955855e592a2SRandall Ralphs {
955955e592a2SRandall Ralphs 	mdi_vhci_t	*vh;
956055e592a2SRandall Ralphs 
956155e592a2SRandall Ralphs 	ASSERT(class && pdip);
956255e592a2SRandall Ralphs 
956355e592a2SRandall Ralphs 	/*
956455e592a2SRandall Ralphs 	 * For dev_supported, mdi_phci_register() must have established pdip as
956555e592a2SRandall Ralphs 	 * a pHCI.
956655e592a2SRandall Ralphs 	 *
956755e592a2SRandall Ralphs 	 * NOTE: mdi_phci_register() does "mpxio-disable" processing, and
956855e592a2SRandall Ralphs 	 * MDI_PHCI(pdip) will return false if mpxio is disabled.
956955e592a2SRandall Ralphs 	 */
957055e592a2SRandall Ralphs 	if (!MDI_PHCI(pdip))
957155e592a2SRandall Ralphs 		return (MDI_FAILURE);
957255e592a2SRandall Ralphs 
957355e592a2SRandall Ralphs 	/* Return MDI_FAILURE if vHCI does not support asking the question. */
957455e592a2SRandall Ralphs 	vh = (mdi_vhci_t *)i_mdi_vhci_class2vhci(class);
957555e592a2SRandall Ralphs 	if ((vh == NULL) || (vh->vh_ops->vo_is_dev_supported == NULL)) {
957655e592a2SRandall Ralphs 		return (MDI_FAILURE);
957755e592a2SRandall Ralphs 	}
957855e592a2SRandall Ralphs 
957955e592a2SRandall Ralphs 	/* Return vHCI answer */
958055e592a2SRandall Ralphs 	return (vh->vh_ops->vo_is_dev_supported(vh->vh_dip, pdip, cinfo));
958155e592a2SRandall Ralphs }
958255e592a2SRandall Ralphs 
958355e592a2SRandall Ralphs int
958455e592a2SRandall Ralphs mdi_dc_return_dev_state(mdi_pathinfo_t *pip, struct devctl_iocdata *dcp)
958555e592a2SRandall Ralphs {
958655e592a2SRandall Ralphs 	uint_t devstate = 0;
958755e592a2SRandall Ralphs 	dev_info_t *cdip;
958855e592a2SRandall Ralphs 
958955e592a2SRandall Ralphs 	if ((pip == NULL) || (dcp == NULL))
959055e592a2SRandall Ralphs 		return (MDI_FAILURE);
959155e592a2SRandall Ralphs 
959255e592a2SRandall Ralphs 	cdip = mdi_pi_get_client(pip);
959355e592a2SRandall Ralphs 
959455e592a2SRandall Ralphs 	switch (mdi_pi_get_state(pip)) {
959555e592a2SRandall Ralphs 	case MDI_PATHINFO_STATE_INIT:
959655e592a2SRandall Ralphs 		devstate = DEVICE_DOWN;
959755e592a2SRandall Ralphs 		break;
959855e592a2SRandall Ralphs 	case MDI_PATHINFO_STATE_ONLINE:
959955e592a2SRandall Ralphs 		devstate = DEVICE_ONLINE;
960055e592a2SRandall Ralphs 		if ((cdip) && (devi_stillreferenced(cdip) == DEVI_REFERENCED))
960155e592a2SRandall Ralphs 			devstate |= DEVICE_BUSY;
960255e592a2SRandall Ralphs 		break;
960355e592a2SRandall Ralphs 	case MDI_PATHINFO_STATE_STANDBY:
960455e592a2SRandall Ralphs 		devstate = DEVICE_ONLINE;
960555e592a2SRandall Ralphs 		break;
960655e592a2SRandall Ralphs 	case MDI_PATHINFO_STATE_FAULT:
960755e592a2SRandall Ralphs 		devstate = DEVICE_DOWN;
960855e592a2SRandall Ralphs 		break;
960955e592a2SRandall Ralphs 	case MDI_PATHINFO_STATE_OFFLINE:
961055e592a2SRandall Ralphs 		devstate = DEVICE_OFFLINE;
961155e592a2SRandall Ralphs 		break;
961255e592a2SRandall Ralphs 	default:
961355e592a2SRandall Ralphs 		ASSERT(MDI_PI(pip)->pi_state);
961455e592a2SRandall Ralphs 	}
961555e592a2SRandall Ralphs 
961655e592a2SRandall Ralphs 	if (copyout(&devstate, dcp->cpyout_buf, sizeof (uint_t)) != 0)
961755e592a2SRandall Ralphs 		return (MDI_FAILURE);
961855e592a2SRandall Ralphs 
961955e592a2SRandall Ralphs 	return (MDI_SUCCESS);
962055e592a2SRandall Ralphs }
9621