xref: /titanic_53/usr/src/uts/sun4v/io/vsw.c (revision 71bdf9368645e130091ae5ff46e027dd75e4fc3a)
11ae08745Sheppo /*
21ae08745Sheppo  * CDDL HEADER START
31ae08745Sheppo  *
41ae08745Sheppo  * The contents of this file are subject to the terms of the
51ae08745Sheppo  * Common Development and Distribution License (the "License").
61ae08745Sheppo  * You may not use this file except in compliance with the License.
71ae08745Sheppo  *
81ae08745Sheppo  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
91ae08745Sheppo  * or http://www.opensolaris.org/os/licensing.
101ae08745Sheppo  * See the License for the specific language governing permissions
111ae08745Sheppo  * and limitations under the License.
121ae08745Sheppo  *
131ae08745Sheppo  * When distributing Covered Code, include this CDDL HEADER in each
141ae08745Sheppo  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
151ae08745Sheppo  * If applicable, add the following below this CDDL HEADER, with the
161ae08745Sheppo  * fields enclosed by brackets "[]" replaced with your own identifying
171ae08745Sheppo  * information: Portions Copyright [yyyy] [name of copyright owner]
181ae08745Sheppo  *
191ae08745Sheppo  * CDDL HEADER END
201ae08745Sheppo  */
211ae08745Sheppo 
221ae08745Sheppo /*
23f0ca1d9aSsb155480  * Copyright 2008 Sun Microsystems, Inc.  All rights reserved.
241ae08745Sheppo  * Use is subject to license terms.
251ae08745Sheppo  */
261ae08745Sheppo 
271ae08745Sheppo #include <sys/types.h>
281ae08745Sheppo #include <sys/errno.h>
291ae08745Sheppo #include <sys/debug.h>
301ae08745Sheppo #include <sys/time.h>
311ae08745Sheppo #include <sys/sysmacros.h>
321ae08745Sheppo #include <sys/systm.h>
331ae08745Sheppo #include <sys/user.h>
341ae08745Sheppo #include <sys/stropts.h>
351ae08745Sheppo #include <sys/stream.h>
361ae08745Sheppo #include <sys/strlog.h>
371ae08745Sheppo #include <sys/strsubr.h>
381ae08745Sheppo #include <sys/cmn_err.h>
391ae08745Sheppo #include <sys/cpu.h>
401ae08745Sheppo #include <sys/kmem.h>
411ae08745Sheppo #include <sys/conf.h>
421ae08745Sheppo #include <sys/ddi.h>
431ae08745Sheppo #include <sys/sunddi.h>
441ae08745Sheppo #include <sys/ksynch.h>
451ae08745Sheppo #include <sys/stat.h>
461ae08745Sheppo #include <sys/kstat.h>
471ae08745Sheppo #include <sys/vtrace.h>
481ae08745Sheppo #include <sys/strsun.h>
491ae08745Sheppo #include <sys/dlpi.h>
501ae08745Sheppo #include <sys/ethernet.h>
511ae08745Sheppo #include <net/if.h>
521ae08745Sheppo #include <sys/varargs.h>
531ae08745Sheppo #include <sys/machsystm.h>
541ae08745Sheppo #include <sys/modctl.h>
551ae08745Sheppo #include <sys/modhash.h>
561ae08745Sheppo #include <sys/mac.h>
57ba2e4443Sseb #include <sys/mac_ether.h>
581ae08745Sheppo #include <sys/taskq.h>
591ae08745Sheppo #include <sys/note.h>
601ae08745Sheppo #include <sys/mach_descrip.h>
611ae08745Sheppo #include <sys/mac.h>
621ae08745Sheppo #include <sys/mdeg.h>
631ae08745Sheppo #include <sys/ldc.h>
641ae08745Sheppo #include <sys/vsw_fdb.h>
651ae08745Sheppo #include <sys/vsw.h>
661ae08745Sheppo #include <sys/vio_mailbox.h>
671ae08745Sheppo #include <sys/vnet_mailbox.h>
681ae08745Sheppo #include <sys/vnet_common.h>
69d10e4ef2Snarayan #include <sys/vio_util.h>
70d10e4ef2Snarayan #include <sys/sdt.h>
7119b65a69Ssb155480 #include <sys/atomic.h>
7206db247cSraghuram #include <sys/callb.h>
73c1c61f44Ssb155480 #include <sys/vlan.h>
741ae08745Sheppo 
751ae08745Sheppo /*
761ae08745Sheppo  * Function prototypes.
771ae08745Sheppo  */
781ae08745Sheppo static	int vsw_attach(dev_info_t *, ddi_attach_cmd_t);
791ae08745Sheppo static	int vsw_detach(dev_info_t *, ddi_detach_cmd_t);
8034683adeSsg70180 static	int vsw_get_md_physname(vsw_t *, md_t *, mde_cookie_t, char *);
8134683adeSsg70180 static	int vsw_get_md_smodes(vsw_t *, md_t *, mde_cookie_t, uint8_t *, int *);
821ae08745Sheppo 
831ae08745Sheppo /* MDEG routines */
8434683adeSsg70180 static	int vsw_mdeg_register(vsw_t *vswp);
851ae08745Sheppo static	void vsw_mdeg_unregister(vsw_t *vswp);
861ae08745Sheppo static	int vsw_mdeg_cb(void *cb_argp, mdeg_result_t *);
8734683adeSsg70180 static	int vsw_port_mdeg_cb(void *cb_argp, mdeg_result_t *);
8819b65a69Ssb155480 static	int vsw_get_initial_md_properties(vsw_t *vswp, md_t *, mde_cookie_t);
89c1c61f44Ssb155480 static	int vsw_read_mdprops(vsw_t *vswp);
90c1c61f44Ssb155480 static	void vsw_vlan_read_ids(void *arg, int type, md_t *mdp,
91c1c61f44Ssb155480 	mde_cookie_t node, uint16_t *pvidp, uint16_t **vidspp,
92c1c61f44Ssb155480 	uint16_t *nvidsp, uint16_t *default_idp);
93c1c61f44Ssb155480 static	int vsw_port_read_props(vsw_port_t *portp, vsw_t *vswp,
94c1c61f44Ssb155480 	md_t *mdp, mde_cookie_t *node);
95f0ca1d9aSsb155480 static	void vsw_read_pri_eth_types(vsw_t *vswp, md_t *mdp,
96f0ca1d9aSsb155480 	mde_cookie_t node);
977b1f684aSSriharsha Basavapatna static	void vsw_mtu_read(vsw_t *vswp, md_t *mdp, mde_cookie_t node,
987b1f684aSSriharsha Basavapatna 	uint32_t *mtu);
997b1f684aSSriharsha Basavapatna static	int vsw_mtu_update(vsw_t *vswp, uint32_t mtu);
10034683adeSsg70180 static	void vsw_update_md_prop(vsw_t *, md_t *, mde_cookie_t);
10119b65a69Ssb155480 static void vsw_save_lmacaddr(vsw_t *vswp, uint64_t macaddr);
1021ae08745Sheppo 
10306db247cSraghuram /* Mac driver related routines */
10406db247cSraghuram static int vsw_mac_register(vsw_t *);
10506db247cSraghuram static int vsw_mac_unregister(vsw_t *);
10606db247cSraghuram static int vsw_m_stat(void *, uint_t, uint64_t *);
10706db247cSraghuram static void vsw_m_stop(void *arg);
10806db247cSraghuram static int vsw_m_start(void *arg);
10906db247cSraghuram static int vsw_m_unicst(void *arg, const uint8_t *);
11006db247cSraghuram static int vsw_m_multicst(void *arg, boolean_t, const uint8_t *);
11106db247cSraghuram static int vsw_m_promisc(void *arg, boolean_t);
11206db247cSraghuram static mblk_t *vsw_m_tx(void *arg, mblk_t *);
113f0ca1d9aSsb155480 void vsw_mac_rx(vsw_t *vswp, mac_resource_handle_t mrh,
114f0ca1d9aSsb155480     mblk_t *mp, vsw_macrx_flags_t flags);
1151ae08745Sheppo 
11606db247cSraghuram /*
11706db247cSraghuram  * Functions imported from other files.
11806db247cSraghuram  */
11906db247cSraghuram extern void vsw_setup_switching_timeout(void *arg);
12006db247cSraghuram extern void vsw_stop_switching_timeout(vsw_t *vswp);
12106db247cSraghuram extern int vsw_setup_switching(vsw_t *);
1227a327842Swentaoy extern void vsw_switch_frame_nop(vsw_t *vswp, mblk_t *mp, int caller,
1237a327842Swentaoy     vsw_port_t *port, mac_resource_handle_t mrh);
12406db247cSraghuram extern int vsw_add_mcst(vsw_t *, uint8_t, uint64_t, void *);
12506db247cSraghuram extern int vsw_del_mcst(vsw_t *, uint8_t, uint64_t, void *);
12606db247cSraghuram extern void vsw_del_mcst_vsw(vsw_t *);
12706db247cSraghuram extern mcst_addr_t *vsw_del_addr(uint8_t devtype, void *arg, uint64_t addr);
12806db247cSraghuram extern int vsw_detach_ports(vsw_t *vswp);
12906db247cSraghuram extern int vsw_port_add(vsw_t *vswp, md_t *mdp, mde_cookie_t *node);
13006db247cSraghuram extern int vsw_port_detach(vsw_t *vswp, int p_instance);
131c1c61f44Ssb155480 static int vsw_port_update(vsw_t *vswp, md_t *curr_mdp, mde_cookie_t curr_mdex,
132c1c61f44Ssb155480 	md_t *prev_mdp, mde_cookie_t prev_mdex);
133c1c61f44Ssb155480 extern	int vsw_port_attach(vsw_port_t *port);
13406db247cSraghuram extern vsw_port_t *vsw_lookup_port(vsw_t *vswp, int p_instance);
13506db247cSraghuram extern int vsw_mac_attach(vsw_t *vswp);
13606db247cSraghuram extern void vsw_mac_detach(vsw_t *vswp);
13706db247cSraghuram extern int vsw_mac_open(vsw_t *vswp);
13806db247cSraghuram extern void vsw_mac_close(vsw_t *vswp);
13906db247cSraghuram extern int vsw_set_hw(vsw_t *, vsw_port_t *, int);
14006db247cSraghuram extern int vsw_unset_hw(vsw_t *, vsw_port_t *, int);
14106db247cSraghuram extern void vsw_reconfig_hw(vsw_t *);
14206db247cSraghuram extern void vsw_unset_addrs(vsw_t *vswp);
143*71bdf936SWENTAO YANG extern void vsw_setup_layer2_post_process(vsw_t *vswp);
144c1c61f44Ssb155480 extern void vsw_create_vlans(void *arg, int type);
145c1c61f44Ssb155480 extern void vsw_destroy_vlans(void *arg, int type);
146c1c61f44Ssb155480 extern void vsw_vlan_add_ids(void *arg, int type);
147c1c61f44Ssb155480 extern void vsw_vlan_remove_ids(void *arg, int type);
148c1c61f44Ssb155480 extern void vsw_vlan_unaware_port_reset(vsw_port_t *portp);
149c1c61f44Ssb155480 extern uint32_t vsw_vlan_frame_untag(void *arg, int type, mblk_t **np,
150c1c61f44Ssb155480 	mblk_t **npt);
151c1c61f44Ssb155480 extern mblk_t *vsw_vlan_frame_pretag(void *arg, int type, mblk_t *mp);
152678453a8Sspeer extern void vsw_hio_cleanup(vsw_t *vswp);
1537b1f684aSSriharsha Basavapatna extern void vsw_reset_ports(vsw_t *vswp);
1547b1f684aSSriharsha Basavapatna extern void vsw_port_reset(vsw_port_t *portp);
155678453a8Sspeer void vsw_hio_port_update(vsw_port_t *portp, boolean_t hio_enabled);
15606db247cSraghuram 
15706db247cSraghuram /*
15806db247cSraghuram  * Internal tunables.
15906db247cSraghuram  */
160445b4c2eSsb155480 int	vsw_num_handshakes = VNET_NUM_HANDSHAKES; /* # of handshake attempts */
1611ae08745Sheppo int	vsw_wretries = 100;		/* # of write attempts */
162d10e4ef2Snarayan int	vsw_desc_delay = 0;		/* delay in us */
163d10e4ef2Snarayan int	vsw_read_attempts = 5;		/* # of reads of descriptor */
16419b65a69Ssb155480 int	vsw_setup_switching_delay = 3;	/* setup sw timeout interval in sec */
1650e8b4070Ssb155480 int	vsw_mac_open_retries = 300;	/* max # of mac_open() retries */
1660e8b4070Ssb155480 					/* 300*3 = 900sec(15min) of max tmout */
16706db247cSraghuram int	vsw_ldc_tx_delay = 5;		/* delay(ticks) for tx retries */
16806db247cSraghuram int	vsw_ldc_tx_retries = 10;	/* # of ldc tx retries */
16906db247cSraghuram boolean_t vsw_ldc_rxthr_enabled = B_TRUE;	/* LDC Rx thread enabled */
17006db247cSraghuram boolean_t vsw_ldc_txthr_enabled = B_TRUE;	/* LDC Tx thread enabled */
171d10e4ef2Snarayan 
/* Number of chains in the fdb hash table. */
uint32_t	vsw_fdb_nchains = 8;

/* Number of chains in the vlan id hash table. */
uint32_t	vsw_vlan_nchains = 4;

/* MTU of the device. */
uint32_t	vsw_ethermtu = 1500;
175c1c61f44Ssb155480 
1767a327842Swentaoy /* sw timeout for boot delay only, in milliseconds */
1777a327842Swentaoy int vsw_setup_switching_boot_delay = 100 * MILLISEC;
1787a327842Swentaoy 
/*
 * Time, in usec, to wait for all references on a fdb entry to be dropped.
 */
uint32_t vsw_fdbe_refcnt_delay = 10;

/*
 * Fallback vlan id, used internally only when the MD device node carries
 * no "default-vlan-id" property. Do not treat this as a tunable: if the
 * value is changed here, the corresponding variable in every vnet
 * connected to this vsw has to be changed to the same value.
 */
uint16_t	vsw_default_vlan_id = 1;
189c1c61f44Ssb155480 
190f0ca1d9aSsb155480 /*
191f0ca1d9aSsb155480  * Workaround for a version handshake bug in obp's vnet.
192f0ca1d9aSsb155480  * If vsw initiates version negotiation starting from the highest version,
193f0ca1d9aSsb155480  * obp sends a nack and terminates version handshake. To workaround
194f0ca1d9aSsb155480  * this, we do not initiate version handshake when the channel comes up.
195f0ca1d9aSsb155480  * Instead, we wait for the peer to send its version info msg and go through
196f0ca1d9aSsb155480  * the version protocol exchange. If we successfully negotiate a version,
197f0ca1d9aSsb155480  * before sending the ack, we send our version info msg to the peer
198f0ca1d9aSsb155480  * using the <major,minor> version that we are about to ack.
199f0ca1d9aSsb155480  */
200f0ca1d9aSsb155480 boolean_t vsw_obp_ver_proto_workaround = B_TRUE;
201f0ca1d9aSsb155480 
/*
 * Single priority ethertype, settable through this internal tunable when
 * the MD has no "priority-ether-types" property.
 */
uint64_t vsw_pri_eth_type = 0;

/*
 * Count of transmit priority buffers preallocated per device. The value
 * is deliberately small so that transmission of priority packets is
 * throttled. Note: vio_create_mblks() requires a power of 2.
 */
uint32_t vsw_pri_tx_nmblks = 64;

/*
 * How many RARP packets are sent to announce macaddr to the physical
 * switch, either after vsw's physical device is changed dynamically or
 * after a guest (client vnet) is live migrated in.
 */
uint32_t vsw_publish_macaddr_count = 3;
22151aa9d07Ssb155480 
222678453a8Sspeer boolean_t vsw_hio_enabled = B_TRUE;	/* Enable/disable HybridIO */
223678453a8Sspeer int vsw_hio_max_cleanup_retries = 10;	/* Max retries for HybridIO cleanp */
224678453a8Sspeer int vsw_hio_cleanup_delay = 10000;	/* 10ms */
225678453a8Sspeer 
22606db247cSraghuram /*
22706db247cSraghuram  * External tunables.
22806db247cSraghuram  */
22906db247cSraghuram /*
23006db247cSraghuram  * Enable/disable thread per ring. This is a mode selection
23106db247cSraghuram  * that is done a vsw driver attach time.
23206db247cSraghuram  */
23306db247cSraghuram boolean_t vsw_multi_ring_enable = B_FALSE;
23406db247cSraghuram int vsw_mac_rx_rings = VSW_MAC_RX_RINGS;
23506db247cSraghuram 
236f0ca1d9aSsb155480 /* Number of transmit descriptors -  must be power of 2 */
237f0ca1d9aSsb155480 uint32_t vsw_ntxds = VSW_RING_NUM_EL;
238f0ca1d9aSsb155480 
23906db247cSraghuram /*
24006db247cSraghuram  * Max number of mblks received in one receive operation.
24106db247cSraghuram  */
24206db247cSraghuram uint32_t vsw_chain_len = (VSW_NUM_MBLKS * 0.6);
24306db247cSraghuram 
24406db247cSraghuram /*
2457b1f684aSSriharsha Basavapatna  * Internal tunables for receive buffer pools, that is,  the size and number of
2467b1f684aSSriharsha Basavapatna  * mblks for each pool. At least 3 sizes must be specified if these are used.
2477b1f684aSSriharsha Basavapatna  * The sizes must be specified in increasing order. Non-zero value of the first
2487b1f684aSSriharsha Basavapatna  * size will be used as a hint to use these values instead of the algorithm
2497b1f684aSSriharsha Basavapatna  * that determines the sizes based on MTU.
25006db247cSraghuram  */
2517b1f684aSSriharsha Basavapatna uint32_t vsw_mblk_size1 = 0;
2527b1f684aSSriharsha Basavapatna uint32_t vsw_mblk_size2 = 0;
2537b1f684aSSriharsha Basavapatna uint32_t vsw_mblk_size3 = 0;
2547b1f684aSSriharsha Basavapatna uint32_t vsw_mblk_size4 = 0;
25506db247cSraghuram uint32_t vsw_num_mblks1 = VSW_NUM_MBLKS;	/* number of mblks for pool1 */
25606db247cSraghuram uint32_t vsw_num_mblks2 = VSW_NUM_MBLKS;	/* number of mblks for pool2 */
25706db247cSraghuram uint32_t vsw_num_mblks3 = VSW_NUM_MBLKS;	/* number of mblks for pool3 */
2587b1f684aSSriharsha Basavapatna uint32_t vsw_num_mblks4 = VSW_NUM_MBLKS;	/* number of mblks for pool4 */
2597b1f684aSSriharsha Basavapatna 
2607b1f684aSSriharsha Basavapatna /*
2617b1f684aSSriharsha Basavapatna  * Set this to non-zero to enable additional internal receive buffer pools
2627b1f684aSSriharsha Basavapatna  * based on the MTU of the device for better performance at the cost of more
2637b1f684aSSriharsha Basavapatna  * memory consumption. This is turned off by default, to use allocb(9F) for
2647b1f684aSSriharsha Basavapatna  * receive buffer allocations of sizes > 2K.
2657b1f684aSSriharsha Basavapatna  */
2667b1f684aSSriharsha Basavapatna boolean_t vsw_jumbo_rxpools = B_FALSE;
26706db247cSraghuram 
26806db247cSraghuram /*
269f0ca1d9aSsb155480  * vsw_max_tx_qcount is the maximum # of packets that can be queued
270f0ca1d9aSsb155480  * before the tx worker thread begins processing the queue. Its value
271f0ca1d9aSsb155480  * is chosen to be 4x the default length of tx descriptor ring.
272f0ca1d9aSsb155480  */
273f0ca1d9aSsb155480 uint32_t vsw_max_tx_qcount = 4 * VSW_RING_NUM_EL;
274f0ca1d9aSsb155480 
275f0ca1d9aSsb155480 /*
27606db247cSraghuram  * MAC callbacks
27706db247cSraghuram  */
278ba2e4443Sseb static	mac_callbacks_t	vsw_m_callbacks = {
279ba2e4443Sseb 	0,
280ba2e4443Sseb 	vsw_m_stat,
281ba2e4443Sseb 	vsw_m_start,
282ba2e4443Sseb 	vsw_m_stop,
283ba2e4443Sseb 	vsw_m_promisc,
284ba2e4443Sseb 	vsw_m_multicst,
285ba2e4443Sseb 	vsw_m_unicst,
286ba2e4443Sseb 	vsw_m_tx,
287ba2e4443Sseb 	NULL,
288ba2e4443Sseb 	NULL,
289ba2e4443Sseb 	NULL
290ba2e4443Sseb };
291ba2e4443Sseb 
2921ae08745Sheppo static	struct	cb_ops	vsw_cb_ops = {
2931ae08745Sheppo 	nulldev,			/* cb_open */
2941ae08745Sheppo 	nulldev,			/* cb_close */
2951ae08745Sheppo 	nodev,				/* cb_strategy */
2961ae08745Sheppo 	nodev,				/* cb_print */
2971ae08745Sheppo 	nodev,				/* cb_dump */
2981ae08745Sheppo 	nodev,				/* cb_read */
2991ae08745Sheppo 	nodev,				/* cb_write */
3001ae08745Sheppo 	nodev,				/* cb_ioctl */
3011ae08745Sheppo 	nodev,				/* cb_devmap */
3021ae08745Sheppo 	nodev,				/* cb_mmap */
3031ae08745Sheppo 	nodev,				/* cb_segmap */
3041ae08745Sheppo 	nochpoll,			/* cb_chpoll */
3051ae08745Sheppo 	ddi_prop_op,			/* cb_prop_op */
3061ae08745Sheppo 	NULL,				/* cb_stream */
3071ae08745Sheppo 	D_MP,				/* cb_flag */
3081ae08745Sheppo 	CB_REV,				/* rev */
3091ae08745Sheppo 	nodev,				/* int (*cb_aread)() */
3101ae08745Sheppo 	nodev				/* int (*cb_awrite)() */
3111ae08745Sheppo };
3121ae08745Sheppo 
3131ae08745Sheppo static	struct	dev_ops	vsw_ops = {
3141ae08745Sheppo 	DEVO_REV,		/* devo_rev */
3151ae08745Sheppo 	0,			/* devo_refcnt */
31671184a40SWENTAO YANG 	NULL,			/* devo_getinfo */
3171ae08745Sheppo 	nulldev,		/* devo_identify */
3181ae08745Sheppo 	nulldev,		/* devo_probe */
3191ae08745Sheppo 	vsw_attach,		/* devo_attach */
3201ae08745Sheppo 	vsw_detach,		/* devo_detach */
3211ae08745Sheppo 	nodev,			/* devo_reset */
3221ae08745Sheppo 	&vsw_cb_ops,		/* devo_cb_ops */
3231ae08745Sheppo 	(struct bus_ops *)NULL,	/* devo_bus_ops */
3241ae08745Sheppo 	ddi_power		/* devo_power */
3251ae08745Sheppo };
3261ae08745Sheppo 
3271ae08745Sheppo extern	struct	mod_ops	mod_driverops;
3281ae08745Sheppo static struct modldrv vswmodldrv = {
3291ae08745Sheppo 	&mod_driverops,
330205eeb1aSlm66018 	"sun4v Virtual Switch",
3311ae08745Sheppo 	&vsw_ops,
3321ae08745Sheppo };
3331ae08745Sheppo 
/*
 * Acquire / release the three per-channel locks. They are taken in the
 * order ldc_cblock, ldc_rxlock, ldc_txlock and dropped in the reverse
 * order.
 *
 * NOTE(review): each macro expands to three bare statements, the last one
 * already terminated by a semicolon, so neither is safe as the only
 * statement of an unbraced if/else.
 */
#define	LDC_ENTER_LOCK(ldcp)				\
	mutex_enter(&((ldcp)->ldc_cblock));		\
	mutex_enter(&((ldcp)->ldc_rxlock));		\
	mutex_enter(&((ldcp)->ldc_txlock));
#define	LDC_EXIT_LOCK(ldcp)				\
	mutex_exit(&((ldcp)->ldc_txlock));		\
	mutex_exit(&((ldcp)->ldc_rxlock));		\
	mutex_exit(&((ldcp)->ldc_cblock));
3421ae08745Sheppo 
3431ae08745Sheppo /* Driver soft state ptr  */
3441ae08745Sheppo static void	*vsw_state;
3451ae08745Sheppo 
3461ae08745Sheppo /*
3471ae08745Sheppo  * Linked list of "vsw_t" structures - one per instance.
3481ae08745Sheppo  */
3491ae08745Sheppo vsw_t		*vsw_head = NULL;
3501ae08745Sheppo krwlock_t	vsw_rw;
3511ae08745Sheppo 
/*
 * Names of the machine description (MD) properties and nodes used by vsw.
 */

/* Node names. */
static char vdev_propname[] = "virtual-device";
static char vsw_propname[] = "virtual-network-switch";
static char chan_propname[] = "channel-endpoint";

/* Physical device and switching mode. */
static char physdev_propname[] = "vsw-phys-dev";
static char smode_propname[] = "vsw-switch-mode";

/* MAC addresses. */
static char macaddr_propname[] = "local-mac-address";
static char remaddr_propname[] = "remote-mac-address";

/* Channel and node identification. */
static char ldcids_propname[] = "ldc-ids";
static char id_propname[] = "id";
static char reg_propname[] = "reg";

/* Priority ethertypes. */
static char pri_types_propname[] = "priority-ether-types";

/* VLAN ids of the switch itself and of its ports. */
static char vsw_pvid_propname[] = "port-vlan-id";
static char vsw_vid_propname[] = "vlan-id";
static char vsw_dvid_propname[] = "default-vlan-id";
static char port_pvid_propname[] = "remote-port-vlan-id";
static char port_vid_propname[] = "remote-vlan-id";

/* HybridIO and MTU. */
static char hybrid_propname[] = "hybrid";
static char vsw_mtu_propname[] = "mtu";
3731ae08745Sheppo 
3741ae08745Sheppo /*
3751ae08745Sheppo  * Matching criteria passed to the MDEG to register interest
3761ae08745Sheppo  * in changes to 'virtual-device-port' nodes identified by their
3771ae08745Sheppo  * 'id' property.
3781ae08745Sheppo  */
3791ae08745Sheppo static md_prop_match_t vport_prop_match[] = {
3801ae08745Sheppo 	{ MDET_PROP_VAL,    "id"   },
3811ae08745Sheppo 	{ MDET_LIST_END,    NULL    }
3821ae08745Sheppo };
3831ae08745Sheppo 
3841ae08745Sheppo static mdeg_node_match_t vport_match = { "virtual-device-port",
3851ae08745Sheppo 						vport_prop_match };
3861ae08745Sheppo 
3871ae08745Sheppo /*
38834683adeSsg70180  * Matching criteria passed to the MDEG to register interest
38934683adeSsg70180  * in changes to 'virtual-device' nodes (i.e. vsw nodes) identified
39034683adeSsg70180  * by their 'name' and 'cfg-handle' properties.
39134683adeSsg70180  */
39234683adeSsg70180 static md_prop_match_t vdev_prop_match[] = {
39334683adeSsg70180 	{ MDET_PROP_STR,    "name"   },
39434683adeSsg70180 	{ MDET_PROP_VAL,    "cfg-handle" },
39534683adeSsg70180 	{ MDET_LIST_END,    NULL    }
39634683adeSsg70180 };
39734683adeSsg70180 
39834683adeSsg70180 static mdeg_node_match_t vdev_match = { "virtual-device",
39934683adeSsg70180 						vdev_prop_match };
40034683adeSsg70180 
40134683adeSsg70180 
40234683adeSsg70180 /*
4031ae08745Sheppo  * Specification of an MD node passed to the MDEG to filter any
4041ae08745Sheppo  * 'vport' nodes that do not belong to the specified node. This
4051ae08745Sheppo  * template is copied for each vsw instance and filled in with
4061ae08745Sheppo  * the appropriate 'cfg-handle' value before being passed to the MDEG.
4071ae08745Sheppo  */
4081ae08745Sheppo static mdeg_prop_spec_t vsw_prop_template[] = {
4091ae08745Sheppo 	{ MDET_PROP_STR,    "name",		vsw_propname },
4101ae08745Sheppo 	{ MDET_PROP_VAL,    "cfg-handle",	NULL	},
4111ae08745Sheppo 	{ MDET_LIST_END,    NULL,		NULL	}
4121ae08745Sheppo };
4131ae08745Sheppo 
4141ae08745Sheppo #define	VSW_SET_MDEG_PROP_INST(specp, val)	(specp)[1].ps_val = (val);
4151ae08745Sheppo 
41606db247cSraghuram #ifdef	DEBUG
/*
 * Debug message mask; 0x0 silences everything, 0x1f enables all msgs.
 *
 * Bits (debug levels):
 *	0x01	Function entry/exit tracing
 *	0x02	Internal function messages
 *	0x04	Verbose internal messages
 *	0x08	Warning messages
 *	0x10	Error messages
 */
int vswdbg = 0x0;
4311ae08745Sheppo 
43206db247cSraghuram void
4331ae08745Sheppo vswdebug(vsw_t *vswp, const char *fmt, ...)
4341ae08745Sheppo {
4351ae08745Sheppo 	char buf[512];
4361ae08745Sheppo 	va_list ap;
4371ae08745Sheppo 
4381ae08745Sheppo 	va_start(ap, fmt);
4391ae08745Sheppo 	(void) vsprintf(buf, fmt, ap);
4401ae08745Sheppo 	va_end(ap);
4411ae08745Sheppo 
4421ae08745Sheppo 	if (vswp == NULL)
4431ae08745Sheppo 		cmn_err(CE_CONT, "%s\n", buf);
4441ae08745Sheppo 	else
4451ae08745Sheppo 		cmn_err(CE_CONT, "vsw%d: %s\n", vswp->instance, buf);
4461ae08745Sheppo }
4471ae08745Sheppo 
4481ae08745Sheppo #endif	/* DEBUG */
4491ae08745Sheppo 
4501ae08745Sheppo static struct modlinkage modlinkage = {
4511ae08745Sheppo 	MODREV_1,
4521ae08745Sheppo 	&vswmodldrv,
4531ae08745Sheppo 	NULL
4541ae08745Sheppo };
4551ae08745Sheppo 
4561ae08745Sheppo int
4571ae08745Sheppo _init(void)
4581ae08745Sheppo {
4591ae08745Sheppo 	int status;
4601ae08745Sheppo 
4611ae08745Sheppo 	rw_init(&vsw_rw, NULL, RW_DRIVER, NULL);
4621ae08745Sheppo 
4631ae08745Sheppo 	status = ddi_soft_state_init(&vsw_state, sizeof (vsw_t), 1);
4641ae08745Sheppo 	if (status != 0) {
4651ae08745Sheppo 		return (status);
4661ae08745Sheppo 	}
4671ae08745Sheppo 
46806db247cSraghuram 	mac_init_ops(&vsw_ops, DRV_NAME);
4691ae08745Sheppo 	status = mod_install(&modlinkage);
4701ae08745Sheppo 	if (status != 0) {
4711ae08745Sheppo 		ddi_soft_state_fini(&vsw_state);
4721ae08745Sheppo 	}
4731ae08745Sheppo 	return (status);
4741ae08745Sheppo }
4751ae08745Sheppo 
4761ae08745Sheppo int
4771ae08745Sheppo _fini(void)
4781ae08745Sheppo {
4791ae08745Sheppo 	int status;
4801ae08745Sheppo 
4811ae08745Sheppo 	status = mod_remove(&modlinkage);
4821ae08745Sheppo 	if (status != 0)
4831ae08745Sheppo 		return (status);
4841ae08745Sheppo 	mac_fini_ops(&vsw_ops);
4851ae08745Sheppo 	ddi_soft_state_fini(&vsw_state);
4861ae08745Sheppo 
4871ae08745Sheppo 	rw_destroy(&vsw_rw);
4881ae08745Sheppo 
4891ae08745Sheppo 	return (status);
4901ae08745Sheppo }
4911ae08745Sheppo 
4921ae08745Sheppo int
4931ae08745Sheppo _info(struct modinfo *modinfop)
4941ae08745Sheppo {
4951ae08745Sheppo 	return (mod_info(&modlinkage, modinfop));
4961ae08745Sheppo }
4971ae08745Sheppo 
4981ae08745Sheppo static int
4991ae08745Sheppo vsw_attach(dev_info_t *dip, ddi_attach_cmd_t cmd)
5001ae08745Sheppo {
5011ae08745Sheppo 	vsw_t		*vswp;
50234683adeSsg70180 	int		instance;
5031ae08745Sheppo 	char		hashname[MAXNAMELEN];
5041ae08745Sheppo 	char		qname[TASKQ_NAMELEN];
5057636cb21Slm66018 	enum		{ PROG_init = 0x00,
50619b65a69Ssb155480 				PROG_locks = 0x01,
50719b65a69Ssb155480 				PROG_readmd = 0x02,
50819b65a69Ssb155480 				PROG_fdb = 0x04,
50919b65a69Ssb155480 				PROG_mfdb = 0x08,
51019b65a69Ssb155480 				PROG_taskq = 0x10,
511f0ca1d9aSsb155480 				PROG_swmode = 0x20,
512f0ca1d9aSsb155480 				PROG_macreg = 0x40,
513f0ca1d9aSsb155480 				PROG_mdreg = 0x80}
5141ae08745Sheppo 			progress;
5151ae08745Sheppo 
5161ae08745Sheppo 	progress = PROG_init;
51719b65a69Ssb155480 	int		rv;
5181ae08745Sheppo 
5191ae08745Sheppo 	switch (cmd) {
5201ae08745Sheppo 	case DDI_ATTACH:
5211ae08745Sheppo 		break;
5221ae08745Sheppo 	case DDI_RESUME:
5231ae08745Sheppo 		/* nothing to do for this non-device */
5241ae08745Sheppo 		return (DDI_SUCCESS);
5251ae08745Sheppo 	case DDI_PM_RESUME:
5261ae08745Sheppo 	default:
5271ae08745Sheppo 		return (DDI_FAILURE);
5281ae08745Sheppo 	}
5291ae08745Sheppo 
5301ae08745Sheppo 	instance = ddi_get_instance(dip);
5311ae08745Sheppo 	if (ddi_soft_state_zalloc(vsw_state, instance) != DDI_SUCCESS) {
5321ae08745Sheppo 		DERR(NULL, "vsw%d: ddi_soft_state_zalloc failed", instance);
5331ae08745Sheppo 		return (DDI_FAILURE);
5341ae08745Sheppo 	}
5351ae08745Sheppo 	vswp = ddi_get_soft_state(vsw_state, instance);
5361ae08745Sheppo 
5371ae08745Sheppo 	if (vswp == NULL) {
5381ae08745Sheppo 		DERR(NULL, "vsw%d: ddi_get_soft_state failed", instance);
5391ae08745Sheppo 		goto vsw_attach_fail;
5401ae08745Sheppo 	}
5411ae08745Sheppo 
5421ae08745Sheppo 	vswp->dip = dip;
5431ae08745Sheppo 	vswp->instance = instance;
5441ae08745Sheppo 	ddi_set_driver_private(dip, (caddr_t)vswp);
5451ae08745Sheppo 
5465f94e909Ssg70180 	mutex_init(&vswp->hw_lock, NULL, MUTEX_DRIVER, NULL);
54719b65a69Ssb155480 	mutex_init(&vswp->mca_lock, NULL, MUTEX_DRIVER, NULL);
54819b65a69Ssb155480 	mutex_init(&vswp->swtmout_lock, NULL, MUTEX_DRIVER, NULL);
5491ae08745Sheppo 	rw_init(&vswp->if_lockrw, NULL, RW_DRIVER, NULL);
5503c1bce15Swentaoy 	rw_init(&vswp->mac_rwlock, NULL, RW_DRIVER, NULL);
55119b65a69Ssb155480 	rw_init(&vswp->mfdbrw, NULL, RW_DRIVER, NULL);
55219b65a69Ssb155480 	rw_init(&vswp->plist.lockrw, NULL, RW_DRIVER, NULL);
55319b65a69Ssb155480 
55419b65a69Ssb155480 	progress |= PROG_locks;
55519b65a69Ssb155480 
55619b65a69Ssb155480 	rv = vsw_read_mdprops(vswp);
55719b65a69Ssb155480 	if (rv != 0)
55819b65a69Ssb155480 		goto vsw_attach_fail;
55919b65a69Ssb155480 
56019b65a69Ssb155480 	progress |= PROG_readmd;
5611ae08745Sheppo 
5621ae08745Sheppo 	/* setup the unicast forwarding database  */
5631ae08745Sheppo 	(void) snprintf(hashname, MAXNAMELEN, "vsw_unicst_table-%d",
5641ae08745Sheppo 	    vswp->instance);
5651ae08745Sheppo 	D2(vswp, "creating unicast hash table (%s)...", hashname);
566c1c61f44Ssb155480 	vswp->fdb_nchains = vsw_fdb_nchains;
567c1c61f44Ssb155480 	vswp->fdb_hashp = mod_hash_create_ptrhash(hashname, vswp->fdb_nchains,
5681ae08745Sheppo 	    mod_hash_null_valdtor, sizeof (void *));
569c1c61f44Ssb155480 	vsw_create_vlans((void *)vswp, VSW_LOCALDEV);
5701ae08745Sheppo 	progress |= PROG_fdb;
5711ae08745Sheppo 
5721ae08745Sheppo 	/* setup the multicast fowarding database */
5731ae08745Sheppo 	(void) snprintf(hashname, MAXNAMELEN, "vsw_mcst_table-%d",
5741ae08745Sheppo 	    vswp->instance);
5751ae08745Sheppo 	D2(vswp, "creating multicast hash table %s)...", hashname);
576c1c61f44Ssb155480 	vswp->mfdb = mod_hash_create_ptrhash(hashname, vsw_fdb_nchains,
5771ae08745Sheppo 	    mod_hash_null_valdtor, sizeof (void *));
5781ae08745Sheppo 
5791ae08745Sheppo 	progress |= PROG_mfdb;
5801ae08745Sheppo 
5811ae08745Sheppo 	/*
5821ae08745Sheppo 	 * Create the taskq which will process all the VIO
5831ae08745Sheppo 	 * control messages.
5841ae08745Sheppo 	 */
5851ae08745Sheppo 	(void) snprintf(qname, TASKQ_NAMELEN, "vsw_taskq%d", vswp->instance);
5861ae08745Sheppo 	if ((vswp->taskq_p = ddi_taskq_create(vswp->dip, qname, 1,
5871ae08745Sheppo 	    TASKQ_DEFAULTPRI, 0)) == NULL) {
58834683adeSsg70180 		cmn_err(CE_WARN, "!vsw%d: Unable to create task queue",
58934683adeSsg70180 		    vswp->instance);
5901ae08745Sheppo 		goto vsw_attach_fail;
5911ae08745Sheppo 	}
5921ae08745Sheppo 
5931ae08745Sheppo 	progress |= PROG_taskq;
5941ae08745Sheppo 
595d10e4ef2Snarayan 	/* prevent auto-detaching */
596d10e4ef2Snarayan 	if (ddi_prop_update_int(DDI_DEV_T_NONE, vswp->dip,
597d10e4ef2Snarayan 	    DDI_NO_AUTODETACH, 1) != DDI_SUCCESS) {
59834683adeSsg70180 		cmn_err(CE_NOTE, "!Unable to set \"%s\" property for "
599d10e4ef2Snarayan 		    "instance %u", DDI_NO_AUTODETACH, instance);
600d10e4ef2Snarayan 	}
601d10e4ef2Snarayan 
6021ae08745Sheppo 	/*
6037a327842Swentaoy 	 * The null switching function is set to avoid panic until
6047a327842Swentaoy 	 * switch mode is setup.
6057a327842Swentaoy 	 */
6067a327842Swentaoy 	vswp->vsw_switch_frame = vsw_switch_frame_nop;
6077a327842Swentaoy 
6087a327842Swentaoy 	/*
60919b65a69Ssb155480 	 * Setup the required switching mode,
61019b65a69Ssb155480 	 * based on the mdprops that we read earlier.
6117a327842Swentaoy 	 * schedule a short timeout (0.1 sec) for the first time
6127a327842Swentaoy 	 * setup and avoid calling mac_open() directly here,
6137a327842Swentaoy 	 * others are regular timeout 3 secs.
61419b65a69Ssb155480 	 */
61519b65a69Ssb155480 	mutex_enter(&vswp->swtmout_lock);
61619b65a69Ssb155480 
61719b65a69Ssb155480 	vswp->swtmout_enabled = B_TRUE;
6187a327842Swentaoy 	vswp->swtmout_id = timeout(vsw_setup_switching_timeout, vswp,
6197a327842Swentaoy 	    drv_usectohz(vsw_setup_switching_boot_delay));
62019b65a69Ssb155480 
62119b65a69Ssb155480 	mutex_exit(&vswp->swtmout_lock);
62219b65a69Ssb155480 
62319b65a69Ssb155480 	progress |= PROG_swmode;
62419b65a69Ssb155480 
62519b65a69Ssb155480 	/* Register with mac layer as a provider */
62619b65a69Ssb155480 	rv = vsw_mac_register(vswp);
62719b65a69Ssb155480 	if (rv != 0)
62819b65a69Ssb155480 		goto vsw_attach_fail;
62919b65a69Ssb155480 
63019b65a69Ssb155480 	progress |= PROG_macreg;
63119b65a69Ssb155480 
63219b65a69Ssb155480 	/*
63334683adeSsg70180 	 * Now we have everything setup, register an interest in
63434683adeSsg70180 	 * specific MD nodes.
63534683adeSsg70180 	 *
63634683adeSsg70180 	 * The callback is invoked in 2 cases, firstly if upon mdeg
63734683adeSsg70180 	 * registration there are existing nodes which match our specified
63834683adeSsg70180 	 * criteria, and secondly if the MD is changed (and again, there
63934683adeSsg70180 	 * are nodes which we are interested in present within it. Note
64034683adeSsg70180 	 * that our callback will be invoked even if our specified nodes
64134683adeSsg70180 	 * have not actually changed).
64234683adeSsg70180 	 *
6431ae08745Sheppo 	 */
64419b65a69Ssb155480 	rv = vsw_mdeg_register(vswp);
64519b65a69Ssb155480 	if (rv != 0)
64634683adeSsg70180 		goto vsw_attach_fail;
6471ae08745Sheppo 
64819b65a69Ssb155480 	progress |= PROG_mdreg;
64919b65a69Ssb155480 
65019b65a69Ssb155480 	WRITE_ENTER(&vsw_rw);
65119b65a69Ssb155480 	vswp->next = vsw_head;
65219b65a69Ssb155480 	vsw_head = vswp;
65319b65a69Ssb155480 	RW_EXIT(&vsw_rw);
65419b65a69Ssb155480 
65519b65a69Ssb155480 	ddi_report_dev(vswp->dip);
6561ae08745Sheppo 	return (DDI_SUCCESS);
6571ae08745Sheppo 
6581ae08745Sheppo vsw_attach_fail:
6591ae08745Sheppo 	DERR(NULL, "vsw_attach: failed");
6601ae08745Sheppo 
66119b65a69Ssb155480 	if (progress & PROG_mdreg) {
66219b65a69Ssb155480 		vsw_mdeg_unregister(vswp);
66319b65a69Ssb155480 		(void) vsw_detach_ports(vswp);
66419b65a69Ssb155480 	}
66519b65a69Ssb155480 
66619b65a69Ssb155480 	if (progress & PROG_macreg)
66719b65a69Ssb155480 		(void) vsw_mac_unregister(vswp);
66819b65a69Ssb155480 
66919b65a69Ssb155480 	if (progress & PROG_swmode) {
67019b65a69Ssb155480 		vsw_stop_switching_timeout(vswp);
671678453a8Sspeer 		vsw_hio_cleanup(vswp);
6723c1bce15Swentaoy 		WRITE_ENTER(&vswp->mac_rwlock);
67319b65a69Ssb155480 		vsw_mac_detach(vswp);
67419b65a69Ssb155480 		vsw_mac_close(vswp);
6753c1bce15Swentaoy 		RW_EXIT(&vswp->mac_rwlock);
67619b65a69Ssb155480 	}
67719b65a69Ssb155480 
6781ae08745Sheppo 	if (progress & PROG_taskq)
6791ae08745Sheppo 		ddi_taskq_destroy(vswp->taskq_p);
6801ae08745Sheppo 
68119b65a69Ssb155480 	if (progress & PROG_mfdb)
6821ae08745Sheppo 		mod_hash_destroy_hash(vswp->mfdb);
6831ae08745Sheppo 
684c1c61f44Ssb155480 	if (progress & PROG_fdb) {
685c1c61f44Ssb155480 		vsw_destroy_vlans(vswp, VSW_LOCALDEV);
686c1c61f44Ssb155480 		mod_hash_destroy_hash(vswp->fdb_hashp);
687c1c61f44Ssb155480 	}
6881ae08745Sheppo 
689f0ca1d9aSsb155480 	if (progress & PROG_readmd) {
690f0ca1d9aSsb155480 		if (VSW_PRI_ETH_DEFINED(vswp)) {
691f0ca1d9aSsb155480 			kmem_free(vswp->pri_types,
692f0ca1d9aSsb155480 			    sizeof (uint16_t) * vswp->pri_num_types);
693f0ca1d9aSsb155480 		}
694f0ca1d9aSsb155480 		(void) vio_destroy_mblks(vswp->pri_tx_vmp);
695f0ca1d9aSsb155480 	}
696f0ca1d9aSsb155480 
69719b65a69Ssb155480 	if (progress & PROG_locks) {
69819b65a69Ssb155480 		rw_destroy(&vswp->plist.lockrw);
69919b65a69Ssb155480 		rw_destroy(&vswp->mfdbrw);
7003c1bce15Swentaoy 		rw_destroy(&vswp->mac_rwlock);
7011ae08745Sheppo 		rw_destroy(&vswp->if_lockrw);
70219b65a69Ssb155480 		mutex_destroy(&vswp->swtmout_lock);
70319b65a69Ssb155480 		mutex_destroy(&vswp->mca_lock);
7045f94e909Ssg70180 		mutex_destroy(&vswp->hw_lock);
70534683adeSsg70180 	}
7061ae08745Sheppo 
7071ae08745Sheppo 	ddi_soft_state_free(vsw_state, instance);
7081ae08745Sheppo 	return (DDI_FAILURE);
7091ae08745Sheppo }
7101ae08745Sheppo 
7111ae08745Sheppo static int
7121ae08745Sheppo vsw_detach(dev_info_t *dip, ddi_detach_cmd_t cmd)
7131ae08745Sheppo {
714d10e4ef2Snarayan 	vio_mblk_pool_t		*poolp, *npoolp;
7151ae08745Sheppo 	vsw_t			**vswpp, *vswp;
7161ae08745Sheppo 	int 			instance;
7171ae08745Sheppo 
7181ae08745Sheppo 	instance = ddi_get_instance(dip);
7191ae08745Sheppo 	vswp = ddi_get_soft_state(vsw_state, instance);
7201ae08745Sheppo 
7211ae08745Sheppo 	if (vswp == NULL) {
7221ae08745Sheppo 		return (DDI_FAILURE);
7231ae08745Sheppo 	}
7241ae08745Sheppo 
7251ae08745Sheppo 	switch (cmd) {
7261ae08745Sheppo 	case DDI_DETACH:
7271ae08745Sheppo 		break;
7281ae08745Sheppo 	case DDI_SUSPEND:
7291ae08745Sheppo 	case DDI_PM_SUSPEND:
7301ae08745Sheppo 	default:
7311ae08745Sheppo 		return (DDI_FAILURE);
7321ae08745Sheppo 	}
7331ae08745Sheppo 
7341ae08745Sheppo 	D2(vswp, "detaching instance %d", instance);
7351ae08745Sheppo 
73619b65a69Ssb155480 	/* Stop any pending timeout to setup switching mode. */
73719b65a69Ssb155480 	vsw_stop_switching_timeout(vswp);
73819b65a69Ssb155480 
73934683adeSsg70180 	if (vswp->if_state & VSW_IF_REG) {
7401ae08745Sheppo 		if (vsw_mac_unregister(vswp) != 0) {
74134683adeSsg70180 			cmn_err(CE_WARN, "!vsw%d: Unable to detach from "
74234683adeSsg70180 			    "MAC layer", vswp->instance);
7431ae08745Sheppo 			return (DDI_FAILURE);
7441ae08745Sheppo 		}
745d10e4ef2Snarayan 	}
7461ae08745Sheppo 
7471ae08745Sheppo 	vsw_mdeg_unregister(vswp);
7481ae08745Sheppo 
749e1ebb9ecSlm66018 	/* remove mac layer callback */
7503c1bce15Swentaoy 	WRITE_ENTER(&vswp->mac_rwlock);
751e1ebb9ecSlm66018 	if ((vswp->mh != NULL) && (vswp->mrh != NULL)) {
7521f8aaf0dSethindra 		mac_rx_remove(vswp->mh, vswp->mrh, B_TRUE);
753e1ebb9ecSlm66018 		vswp->mrh = NULL;
7541ae08745Sheppo 	}
7553c1bce15Swentaoy 	RW_EXIT(&vswp->mac_rwlock);
7561ae08745Sheppo 
7571ae08745Sheppo 	if (vsw_detach_ports(vswp) != 0) {
7581ef0bbb5Snarayan 		cmn_err(CE_WARN, "!vsw%d: Unable to unconfigure ports",
75934683adeSsg70180 		    vswp->instance);
7601ae08745Sheppo 		return (DDI_FAILURE);
7611ae08745Sheppo 	}
7621ae08745Sheppo 
76334683adeSsg70180 	rw_destroy(&vswp->if_lockrw);
76434683adeSsg70180 
765678453a8Sspeer 	/* cleanup HybridIO */
766678453a8Sspeer 	vsw_hio_cleanup(vswp);
767678453a8Sspeer 
7685f94e909Ssg70180 	mutex_destroy(&vswp->hw_lock);
7695f94e909Ssg70180 
7701ae08745Sheppo 	/*
771e1ebb9ecSlm66018 	 * Now that the ports have been deleted, stop and close
772e1ebb9ecSlm66018 	 * the physical device.
773e1ebb9ecSlm66018 	 */
7743c1bce15Swentaoy 	WRITE_ENTER(&vswp->mac_rwlock);
775e1ebb9ecSlm66018 
77619b65a69Ssb155480 	vsw_mac_detach(vswp);
77719b65a69Ssb155480 	vsw_mac_close(vswp);
77819b65a69Ssb155480 
7793c1bce15Swentaoy 	RW_EXIT(&vswp->mac_rwlock);
78019b65a69Ssb155480 
7813c1bce15Swentaoy 	rw_destroy(&vswp->mac_rwlock);
78219b65a69Ssb155480 	mutex_destroy(&vswp->swtmout_lock);
783e1ebb9ecSlm66018 
784e1ebb9ecSlm66018 	/*
785d10e4ef2Snarayan 	 * Destroy any free pools that may still exist.
786d10e4ef2Snarayan 	 */
787d10e4ef2Snarayan 	poolp = vswp->rxh;
788d10e4ef2Snarayan 	while (poolp != NULL) {
789d10e4ef2Snarayan 		npoolp = vswp->rxh = poolp->nextp;
790d10e4ef2Snarayan 		if (vio_destroy_mblks(poolp) != 0) {
791d10e4ef2Snarayan 			vswp->rxh = poolp;
792d10e4ef2Snarayan 			return (DDI_FAILURE);
793d10e4ef2Snarayan 		}
794d10e4ef2Snarayan 		poolp = npoolp;
795d10e4ef2Snarayan 	}
796d10e4ef2Snarayan 
797d10e4ef2Snarayan 	/*
7981ae08745Sheppo 	 * Remove this instance from any entries it may be on in
7991ae08745Sheppo 	 * the hash table by using the list of addresses maintained
8001ae08745Sheppo 	 * in the vsw_t structure.
8011ae08745Sheppo 	 */
8021ae08745Sheppo 	vsw_del_mcst_vsw(vswp);
8031ae08745Sheppo 
8041ae08745Sheppo 	vswp->mcap = NULL;
8051ae08745Sheppo 	mutex_destroy(&vswp->mca_lock);
8061ae08745Sheppo 
8071ae08745Sheppo 	/*
8081ae08745Sheppo 	 * By now any pending tasks have finished and the underlying
8091ae08745Sheppo 	 * ldc's have been destroyed, so its safe to delete the control
8101ae08745Sheppo 	 * message taskq.
8111ae08745Sheppo 	 */
8121ae08745Sheppo 	if (vswp->taskq_p != NULL)
8131ae08745Sheppo 		ddi_taskq_destroy(vswp->taskq_p);
8141ae08745Sheppo 
8151ae08745Sheppo 	/*
8161ae08745Sheppo 	 * At this stage all the data pointers in the hash table
8171ae08745Sheppo 	 * should be NULL, as all the ports have been removed and will
8181ae08745Sheppo 	 * have deleted themselves from the port lists which the data
8191ae08745Sheppo 	 * pointers point to. Hence we can destroy the table using the
8201ae08745Sheppo 	 * default destructors.
8211ae08745Sheppo 	 */
8221ae08745Sheppo 	D2(vswp, "vsw_detach: destroying hash tables..");
823c1c61f44Ssb155480 	vsw_destroy_vlans(vswp, VSW_LOCALDEV);
824c1c61f44Ssb155480 	mod_hash_destroy_hash(vswp->fdb_hashp);
825c1c61f44Ssb155480 	vswp->fdb_hashp = NULL;
8261ae08745Sheppo 
8271ae08745Sheppo 	WRITE_ENTER(&vswp->mfdbrw);
8281ae08745Sheppo 	mod_hash_destroy_hash(vswp->mfdb);
8291ae08745Sheppo 	vswp->mfdb = NULL;
8301ae08745Sheppo 	RW_EXIT(&vswp->mfdbrw);
8311ae08745Sheppo 	rw_destroy(&vswp->mfdbrw);
8321ae08745Sheppo 
833f0ca1d9aSsb155480 	/* free pri_types table */
834f0ca1d9aSsb155480 	if (VSW_PRI_ETH_DEFINED(vswp)) {
835f0ca1d9aSsb155480 		kmem_free(vswp->pri_types,
836f0ca1d9aSsb155480 		    sizeof (uint16_t) * vswp->pri_num_types);
837f0ca1d9aSsb155480 		(void) vio_destroy_mblks(vswp->pri_tx_vmp);
838f0ca1d9aSsb155480 	}
839f0ca1d9aSsb155480 
8401ae08745Sheppo 	ddi_remove_minor_node(dip, NULL);
8411ae08745Sheppo 
8421ae08745Sheppo 	rw_destroy(&vswp->plist.lockrw);
8431ae08745Sheppo 	WRITE_ENTER(&vsw_rw);
8441ae08745Sheppo 	for (vswpp = &vsw_head; *vswpp; vswpp = &(*vswpp)->next) {
8451ae08745Sheppo 		if (*vswpp == vswp) {
8461ae08745Sheppo 			*vswpp = vswp->next;
8471ae08745Sheppo 			break;
8481ae08745Sheppo 		}
8491ae08745Sheppo 	}
8501ae08745Sheppo 	RW_EXIT(&vsw_rw);
8511ae08745Sheppo 	ddi_soft_state_free(vsw_state, instance);
8521ae08745Sheppo 
8531ae08745Sheppo 	return (DDI_SUCCESS);
8541ae08745Sheppo }
8551ae08745Sheppo 
8561ae08745Sheppo /*
85734683adeSsg70180  * Get the value of the "vsw-phys-dev" property in the specified
85834683adeSsg70180  * node. This property is the name of the physical device that
85934683adeSsg70180  * the virtual switch will use to talk to the outside world.
86034683adeSsg70180  *
86134683adeSsg70180  * Note it is valid for this property to be NULL (but the property
86234683adeSsg70180  * itself must exist). Callers of this routine should verify that
86334683adeSsg70180  * the value returned is what they expected (i.e. either NULL or non NULL).
86434683adeSsg70180  *
86534683adeSsg70180  * On success returns value of the property in region pointed to by
86634683adeSsg70180  * the 'name' argument, and with return value of 0. Otherwise returns 1.
8671ae08745Sheppo  */
86834683adeSsg70180 static int
86934683adeSsg70180 vsw_get_md_physname(vsw_t *vswp, md_t *mdp, mde_cookie_t node, char *name)
8701ae08745Sheppo {
87134683adeSsg70180 	int		len = 0;
872f2b610cfSwentaoy 	int		instance;
8731ae08745Sheppo 	char		*physname = NULL;
8741ae08745Sheppo 	char		*dev;
875f2b610cfSwentaoy 	const char	*dev_name;
876f2b610cfSwentaoy 	char		myname[MAXNAMELEN];
877f2b610cfSwentaoy 
878f2b610cfSwentaoy 	dev_name = ddi_driver_name(vswp->dip);
879f2b610cfSwentaoy 	instance = ddi_get_instance(vswp->dip);
880f2b610cfSwentaoy 	(void) snprintf(myname, MAXNAMELEN, "%s%d", dev_name, instance);
8811ae08745Sheppo 
88234683adeSsg70180 	if (md_get_prop_data(mdp, node, physdev_propname,
8831ae08745Sheppo 	    (uint8_t **)(&physname), &len) != 0) {
88434683adeSsg70180 		cmn_err(CE_WARN, "!vsw%d: Unable to get name(s) of physical "
88534683adeSsg70180 		    "device(s) from MD", vswp->instance);
88634683adeSsg70180 		return (1);
8871ae08745Sheppo 	} else if ((strlen(physname) + 1) > LIFNAMSIZ) {
88834683adeSsg70180 		cmn_err(CE_WARN, "!vsw%d: %s is too long a device name",
88934683adeSsg70180 		    vswp->instance, physname);
89034683adeSsg70180 		return (1);
891f2b610cfSwentaoy 	} else if (strcmp(myname, physname) == 0) {
892f2b610cfSwentaoy 		/*
893f2b610cfSwentaoy 		 * Prevent the vswitch from opening itself as the
894f2b610cfSwentaoy 		 * network device.
895f2b610cfSwentaoy 		 */
896f2b610cfSwentaoy 		cmn_err(CE_WARN, "!vsw%d: %s is an invalid device name",
897f2b610cfSwentaoy 		    vswp->instance, physname);
898f2b610cfSwentaoy 		return (1);
8991ae08745Sheppo 	} else {
90034683adeSsg70180 		(void) strncpy(name, physname, strlen(physname) + 1);
9011ae08745Sheppo 		D2(vswp, "%s: using first device specified (%s)",
90234683adeSsg70180 		    __func__, physname);
9031ae08745Sheppo 	}
9041ae08745Sheppo 
9051ae08745Sheppo #ifdef DEBUG
9061ae08745Sheppo 	/*
9071ae08745Sheppo 	 * As a temporary measure to aid testing we check to see if there
9081ae08745Sheppo 	 * is a vsw.conf file present. If there is we use the value of the
9091ae08745Sheppo 	 * vsw_physname property in the file as the name of the physical
9101ae08745Sheppo 	 * device, overriding the value from the MD.
9111ae08745Sheppo 	 *
9121ae08745Sheppo 	 * There may be multiple devices listed, but for the moment
9131ae08745Sheppo 	 * we just use the first one.
9141ae08745Sheppo 	 */
9151ae08745Sheppo 	if (ddi_prop_lookup_string(DDI_DEV_T_ANY, vswp->dip, 0,
9161ae08745Sheppo 	    "vsw_physname", &dev) == DDI_PROP_SUCCESS) {
9171ae08745Sheppo 		if ((strlen(dev) + 1) > LIFNAMSIZ) {
91834683adeSsg70180 			cmn_err(CE_WARN, "vsw%d: %s is too long a device name",
91934683adeSsg70180 			    vswp->instance, dev);
92034683adeSsg70180 			ddi_prop_free(dev);
92134683adeSsg70180 			return (1);
9221ae08745Sheppo 		} else {
92334683adeSsg70180 			cmn_err(CE_NOTE, "vsw%d: Using device name (%s) from "
92434683adeSsg70180 			    "config file", vswp->instance, dev);
9251ae08745Sheppo 
92634683adeSsg70180 			(void) strncpy(name, dev, strlen(dev) + 1);
9271ae08745Sheppo 		}
9281ae08745Sheppo 
9291ae08745Sheppo 		ddi_prop_free(dev);
9301ae08745Sheppo 	}
9311ae08745Sheppo #endif
9321ae08745Sheppo 
93334683adeSsg70180 	return (0);
93434683adeSsg70180 }
935e1ebb9ecSlm66018 
936e1ebb9ecSlm66018 /*
93734683adeSsg70180  * Read the 'vsw-switch-mode' property from the specified MD node.
93834683adeSsg70180  *
93934683adeSsg70180  * Returns 0 on success and the number of modes found in 'found',
94034683adeSsg70180  * otherwise returns 1.
941e1ebb9ecSlm66018  */
94234683adeSsg70180 static int
94334683adeSsg70180 vsw_get_md_smodes(vsw_t *vswp, md_t *mdp, mde_cookie_t node,
94434683adeSsg70180 						uint8_t *modes, int *found)
94534683adeSsg70180 {
94634683adeSsg70180 	int		len = 0;
94734683adeSsg70180 	int		smode_num = 0;
94834683adeSsg70180 	char		*smode = NULL;
94934683adeSsg70180 	char		*curr_mode = NULL;
95034683adeSsg70180 
95134683adeSsg70180 	D1(vswp, "%s: enter", __func__);
9521ae08745Sheppo 
9531ae08745Sheppo 	/*
9541ae08745Sheppo 	 * Get the switch-mode property. The modes are listed in
9551ae08745Sheppo 	 * decreasing order of preference, i.e. prefered mode is
9561ae08745Sheppo 	 * first item in list.
9571ae08745Sheppo 	 */
9581ae08745Sheppo 	len = 0;
95934683adeSsg70180 	smode_num = 0;
96034683adeSsg70180 	if (md_get_prop_data(mdp, node, smode_propname,
9611ae08745Sheppo 	    (uint8_t **)(&smode), &len) != 0) {
9621ae08745Sheppo 		/*
963e1ebb9ecSlm66018 		 * Unable to get switch-mode property from MD, nothing
964e1ebb9ecSlm66018 		 * more we can do.
9651ae08745Sheppo 		 */
96634683adeSsg70180 		cmn_err(CE_WARN, "!vsw%d: Unable to get switch mode property"
96734683adeSsg70180 		    " from the MD", vswp->instance);
96834683adeSsg70180 		*found = 0;
96934683adeSsg70180 		return (1);
970e1ebb9ecSlm66018 	}
971e1ebb9ecSlm66018 
9721ae08745Sheppo 	curr_mode = smode;
9731ae08745Sheppo 	/*
9741ae08745Sheppo 	 * Modes of operation:
9751ae08745Sheppo 	 * 'switched'	 - layer 2 switching, underlying HW in
976e1ebb9ecSlm66018 	 *			programmed mode.
9771ae08745Sheppo 	 * 'promiscuous' - layer 2 switching, underlying HW in
9781ae08745Sheppo 	 *			promiscuous mode.
9791ae08745Sheppo 	 * 'routed'	 - layer 3 (i.e. IP) routing, underlying HW
9801ae08745Sheppo 	 *			in non-promiscuous mode.
9811ae08745Sheppo 	 */
98234683adeSsg70180 	while ((curr_mode < (smode + len)) && (smode_num < NUM_SMODES)) {
9831ae08745Sheppo 		D2(vswp, "%s: curr_mode = [%s]", __func__, curr_mode);
984e1ebb9ecSlm66018 		if (strcmp(curr_mode, "switched") == 0) {
98534683adeSsg70180 			modes[smode_num++] = VSW_LAYER2;
986e1ebb9ecSlm66018 		} else if (strcmp(curr_mode, "promiscuous") == 0) {
98734683adeSsg70180 			modes[smode_num++] = VSW_LAYER2_PROMISC;
988e1ebb9ecSlm66018 		} else if (strcmp(curr_mode, "routed") == 0) {
98934683adeSsg70180 			modes[smode_num++] = VSW_LAYER3;
990e1ebb9ecSlm66018 		} else {
9911ef0bbb5Snarayan 			DWARN(vswp, "%s: Unknown switch mode %s, "
9921ef0bbb5Snarayan 			    "setting to default 'switched' mode",
9931ef0bbb5Snarayan 			    __func__, curr_mode);
99434683adeSsg70180 			modes[smode_num++] = VSW_LAYER2;
9951ae08745Sheppo 		}
9961ae08745Sheppo 		curr_mode += strlen(curr_mode) + 1;
9971ae08745Sheppo 	}
99834683adeSsg70180 	*found = smode_num;
9991ae08745Sheppo 
100034683adeSsg70180 	D2(vswp, "%s: %d modes found", __func__, smode_num);
10011ae08745Sheppo 
10021ae08745Sheppo 	D1(vswp, "%s: exit", __func__);
100334683adeSsg70180 
100434683adeSsg70180 	return (0);
10051ae08745Sheppo }
10061ae08745Sheppo 
1007e1ebb9ecSlm66018 /*
10081ae08745Sheppo  * Register with the MAC layer as a network device, so we
10091ae08745Sheppo  * can be plumbed if necessary.
10101ae08745Sheppo  */
10111ae08745Sheppo static int
10121ae08745Sheppo vsw_mac_register(vsw_t *vswp)
10131ae08745Sheppo {
1014ba2e4443Sseb 	mac_register_t	*macp;
1015ba2e4443Sseb 	int		rv;
10161ae08745Sheppo 
10171ae08745Sheppo 	D1(vswp, "%s: enter", __func__);
10181ae08745Sheppo 
1019ba2e4443Sseb 	if ((macp = mac_alloc(MAC_VERSION)) == NULL)
1020ba2e4443Sseb 		return (EINVAL);
1021ba2e4443Sseb 	macp->m_type_ident = MAC_PLUGIN_IDENT_ETHER;
10221ae08745Sheppo 	macp->m_driver = vswp;
1023ba2e4443Sseb 	macp->m_dip = vswp->dip;
1024ba2e4443Sseb 	macp->m_src_addr = (uint8_t *)&vswp->if_addr;
1025ba2e4443Sseb 	macp->m_callbacks = &vsw_m_callbacks;
1026ba2e4443Sseb 	macp->m_min_sdu = 0;
10277b1f684aSSriharsha Basavapatna 	macp->m_max_sdu = vswp->mtu;
1028c1c61f44Ssb155480 	macp->m_margin = VLAN_TAGSZ;
1029ba2e4443Sseb 	rv = mac_register(macp, &vswp->if_mh);
1030ba2e4443Sseb 	mac_free(macp);
103119b65a69Ssb155480 	if (rv != 0) {
103219b65a69Ssb155480 		/*
103319b65a69Ssb155480 		 * Treat this as a non-fatal error as we may be
103419b65a69Ssb155480 		 * able to operate in some other mode.
103519b65a69Ssb155480 		 */
103619b65a69Ssb155480 		cmn_err(CE_NOTE, "!vsw%d: Unable to register as "
103719b65a69Ssb155480 		    "a provider with MAC layer", vswp->instance);
103819b65a69Ssb155480 		return (rv);
103919b65a69Ssb155480 	}
104019b65a69Ssb155480 
1041ba2e4443Sseb 	vswp->if_state |= VSW_IF_REG;
10421ae08745Sheppo 
10431ae08745Sheppo 	D1(vswp, "%s: exit", __func__);
10441ae08745Sheppo 
10451ae08745Sheppo 	return (rv);
10461ae08745Sheppo }
10471ae08745Sheppo 
10481ae08745Sheppo static int
10491ae08745Sheppo vsw_mac_unregister(vsw_t *vswp)
10501ae08745Sheppo {
10511ae08745Sheppo 	int		rv = 0;
10521ae08745Sheppo 
10531ae08745Sheppo 	D1(vswp, "%s: enter", __func__);
10541ae08745Sheppo 
10551ae08745Sheppo 	WRITE_ENTER(&vswp->if_lockrw);
10561ae08745Sheppo 
1057ba2e4443Sseb 	if (vswp->if_state & VSW_IF_REG) {
1058ba2e4443Sseb 		rv = mac_unregister(vswp->if_mh);
10591ae08745Sheppo 		if (rv != 0) {
10601ae08745Sheppo 			DWARN(vswp, "%s: unable to unregister from MAC "
10611ae08745Sheppo 			    "framework", __func__);
10621ae08745Sheppo 
10631ae08745Sheppo 			RW_EXIT(&vswp->if_lockrw);
10641ae08745Sheppo 			D1(vswp, "%s: fail exit", __func__);
10651ae08745Sheppo 			return (rv);
10661ae08745Sheppo 		}
10671ae08745Sheppo 
1068ba2e4443Sseb 		/* mark i/f as down and unregistered */
1069ba2e4443Sseb 		vswp->if_state &= ~(VSW_IF_UP | VSW_IF_REG);
10701ae08745Sheppo 	}
10711ae08745Sheppo 	RW_EXIT(&vswp->if_lockrw);
10721ae08745Sheppo 
10731ae08745Sheppo 	D1(vswp, "%s: exit", __func__);
10741ae08745Sheppo 
10751ae08745Sheppo 	return (rv);
10761ae08745Sheppo }
10771ae08745Sheppo 
1078ba2e4443Sseb static int
1079ba2e4443Sseb vsw_m_stat(void *arg, uint_t stat, uint64_t *val)
10801ae08745Sheppo {
10811ae08745Sheppo 	vsw_t			*vswp = (vsw_t *)arg;
10821ae08745Sheppo 
10831ae08745Sheppo 	D1(vswp, "%s: enter", __func__);
10841ae08745Sheppo 
10853c1bce15Swentaoy 	WRITE_ENTER(&vswp->mac_rwlock);
108634683adeSsg70180 	if (vswp->mh == NULL) {
10873c1bce15Swentaoy 		RW_EXIT(&vswp->mac_rwlock);
1088ba2e4443Sseb 		return (EINVAL);
108934683adeSsg70180 	}
10901ae08745Sheppo 
10911ae08745Sheppo 	/* return stats from underlying device */
1092ba2e4443Sseb 	*val = mac_stat_get(vswp->mh, stat);
109334683adeSsg70180 
10943c1bce15Swentaoy 	RW_EXIT(&vswp->mac_rwlock);
109534683adeSsg70180 
1096ba2e4443Sseb 	return (0);
10971ae08745Sheppo }
10981ae08745Sheppo 
10991ae08745Sheppo static void
11001ae08745Sheppo vsw_m_stop(void *arg)
11011ae08745Sheppo {
11021ae08745Sheppo 	vsw_t	*vswp = (vsw_t *)arg;
11031ae08745Sheppo 
11041ae08745Sheppo 	D1(vswp, "%s: enter", __func__);
11051ae08745Sheppo 
11061ae08745Sheppo 	WRITE_ENTER(&vswp->if_lockrw);
11071ae08745Sheppo 	vswp->if_state &= ~VSW_IF_UP;
11081ae08745Sheppo 	RW_EXIT(&vswp->if_lockrw);
11091ae08745Sheppo 
11105f94e909Ssg70180 	mutex_enter(&vswp->hw_lock);
11115f94e909Ssg70180 
11125f94e909Ssg70180 	(void) vsw_unset_hw(vswp, NULL, VSW_LOCALDEV);
11135f94e909Ssg70180 
11145f94e909Ssg70180 	if (vswp->recfg_reqd)
11155f94e909Ssg70180 		vsw_reconfig_hw(vswp);
11165f94e909Ssg70180 
11175f94e909Ssg70180 	mutex_exit(&vswp->hw_lock);
11185f94e909Ssg70180 
11191ae08745Sheppo 	D1(vswp, "%s: exit (state = %d)", __func__, vswp->if_state);
11201ae08745Sheppo }
11211ae08745Sheppo 
11221ae08745Sheppo static int
11231ae08745Sheppo vsw_m_start(void *arg)
11241ae08745Sheppo {
11251ae08745Sheppo 	vsw_t		*vswp = (vsw_t *)arg;
11261ae08745Sheppo 
11271ae08745Sheppo 	D1(vswp, "%s: enter", __func__);
11281ae08745Sheppo 
11291ae08745Sheppo 	WRITE_ENTER(&vswp->if_lockrw);
11301ae08745Sheppo 
113119b65a69Ssb155480 	vswp->if_state |= VSW_IF_UP;
113219b65a69Ssb155480 
113319b65a69Ssb155480 	if (vswp->switching_setup_done == B_FALSE) {
113419b65a69Ssb155480 		/*
113519b65a69Ssb155480 		 * If the switching mode has not been setup yet, just
113619b65a69Ssb155480 		 * return. The unicast address will be programmed
113719b65a69Ssb155480 		 * after the physical device is successfully setup by the
113819b65a69Ssb155480 		 * timeout handler.
113919b65a69Ssb155480 		 */
114019b65a69Ssb155480 		RW_EXIT(&vswp->if_lockrw);
114119b65a69Ssb155480 		return (0);
114219b65a69Ssb155480 	}
114319b65a69Ssb155480 
114419b65a69Ssb155480 	/* if in layer2 mode, program unicast address. */
114519b65a69Ssb155480 	if (vswp->mh != NULL) {
11465f94e909Ssg70180 		mutex_enter(&vswp->hw_lock);
11475f94e909Ssg70180 		(void) vsw_set_hw(vswp, NULL, VSW_LOCALDEV);
11485f94e909Ssg70180 		mutex_exit(&vswp->hw_lock);
114919b65a69Ssb155480 	}
115019b65a69Ssb155480 
115119b65a69Ssb155480 	RW_EXIT(&vswp->if_lockrw);
11525f94e909Ssg70180 
11531ae08745Sheppo 	D1(vswp, "%s: exit (state = %d)", __func__, vswp->if_state);
11541ae08745Sheppo 	return (0);
11551ae08745Sheppo }
11561ae08745Sheppo 
11571ae08745Sheppo /*
11581ae08745Sheppo  * Change the local interface address.
11595f94e909Ssg70180  *
11605f94e909Ssg70180  * Note: we don't support this entry point. The local
11615f94e909Ssg70180  * mac address of the switch can only be changed via its
11625f94e909Ssg70180  * MD node properties.
11631ae08745Sheppo  */
11641ae08745Sheppo static int
11651ae08745Sheppo vsw_m_unicst(void *arg, const uint8_t *macaddr)
11661ae08745Sheppo {
11675f94e909Ssg70180 	_NOTE(ARGUNUSED(arg, macaddr))
11681ae08745Sheppo 
11695f94e909Ssg70180 	return (DDI_FAILURE);
11701ae08745Sheppo }
11711ae08745Sheppo 
11721ae08745Sheppo static int
11731ae08745Sheppo vsw_m_multicst(void *arg, boolean_t add, const uint8_t *mca)
11741ae08745Sheppo {
11751ae08745Sheppo 	vsw_t		*vswp = (vsw_t *)arg;
11761ae08745Sheppo 	mcst_addr_t	*mcst_p = NULL;
11771ae08745Sheppo 	uint64_t	addr = 0x0;
1178e1ebb9ecSlm66018 	int		i, ret = 0;
11791ae08745Sheppo 
11801ae08745Sheppo 	D1(vswp, "%s: enter", __func__);
11811ae08745Sheppo 
11821ae08745Sheppo 	/*
11831ae08745Sheppo 	 * Convert address into form that can be used
11841ae08745Sheppo 	 * as hash table key.
11851ae08745Sheppo 	 */
11861ae08745Sheppo 	for (i = 0; i < ETHERADDRL; i++) {
11871ae08745Sheppo 		addr = (addr << 8) | mca[i];
11881ae08745Sheppo 	}
11891ae08745Sheppo 
11901ae08745Sheppo 	D2(vswp, "%s: addr = 0x%llx", __func__, addr);
11911ae08745Sheppo 
11921ae08745Sheppo 	if (add) {
11931ae08745Sheppo 		D2(vswp, "%s: adding multicast", __func__);
11941ae08745Sheppo 		if (vsw_add_mcst(vswp, VSW_LOCALDEV, addr, NULL) == 0) {
11951ae08745Sheppo 			/*
11961ae08745Sheppo 			 * Update the list of multicast addresses
11971ae08745Sheppo 			 * contained within the vsw_t structure to
11981ae08745Sheppo 			 * include this new one.
11991ae08745Sheppo 			 */
12001ae08745Sheppo 			mcst_p = kmem_zalloc(sizeof (mcst_addr_t), KM_NOSLEEP);
12011ae08745Sheppo 			if (mcst_p == NULL) {
12021ae08745Sheppo 				DERR(vswp, "%s unable to alloc mem", __func__);
120319b65a69Ssb155480 				(void) vsw_del_mcst(vswp,
120419b65a69Ssb155480 				    VSW_LOCALDEV, addr, NULL);
12051ae08745Sheppo 				return (1);
12061ae08745Sheppo 			}
12071ae08745Sheppo 			mcst_p->addr = addr;
120819b65a69Ssb155480 			ether_copy(mca, &mcst_p->mca);
12091ae08745Sheppo 
12101ae08745Sheppo 			/*
12111ae08745Sheppo 			 * Call into the underlying driver to program the
12121ae08745Sheppo 			 * address into HW.
12131ae08745Sheppo 			 */
12143c1bce15Swentaoy 			WRITE_ENTER(&vswp->mac_rwlock);
1215e1ebb9ecSlm66018 			if (vswp->mh != NULL) {
1216e1ebb9ecSlm66018 				ret = mac_multicst_add(vswp->mh, mca);
1217e1ebb9ecSlm66018 				if (ret != 0) {
12181ef0bbb5Snarayan 					cmn_err(CE_NOTE, "!vsw%d: unable to "
121934683adeSsg70180 					    "add multicast address",
122034683adeSsg70180 					    vswp->instance);
12213c1bce15Swentaoy 					RW_EXIT(&vswp->mac_rwlock);
122219b65a69Ssb155480 					(void) vsw_del_mcst(vswp,
122319b65a69Ssb155480 					    VSW_LOCALDEV, addr, NULL);
122419b65a69Ssb155480 					kmem_free(mcst_p, sizeof (*mcst_p));
122519b65a69Ssb155480 					return (ret);
1226e1ebb9ecSlm66018 				}
122719b65a69Ssb155480 				mcst_p->mac_added = B_TRUE;
12281ae08745Sheppo 			}
12293c1bce15Swentaoy 			RW_EXIT(&vswp->mac_rwlock);
123019b65a69Ssb155480 
123119b65a69Ssb155480 			mutex_enter(&vswp->mca_lock);
123219b65a69Ssb155480 			mcst_p->nextp = vswp->mcap;
123319b65a69Ssb155480 			vswp->mcap = mcst_p;
123419b65a69Ssb155480 			mutex_exit(&vswp->mca_lock);
12351ae08745Sheppo 		} else {
12361ef0bbb5Snarayan 			cmn_err(CE_NOTE, "!vsw%d: unable to add multicast "
123734683adeSsg70180 			    "address", vswp->instance);
1238e1ebb9ecSlm66018 		}
1239e1ebb9ecSlm66018 		return (ret);
1240e1ebb9ecSlm66018 	}
1241e1ebb9ecSlm66018 
12421ae08745Sheppo 	D2(vswp, "%s: removing multicast", __func__);
12431ae08745Sheppo 	/*
12441ae08745Sheppo 	 * Remove the address from the hash table..
12451ae08745Sheppo 	 */
12461ae08745Sheppo 	if (vsw_del_mcst(vswp, VSW_LOCALDEV, addr, NULL) == 0) {
12471ae08745Sheppo 
12481ae08745Sheppo 		/*
12491ae08745Sheppo 		 * ..and then from the list maintained in the
12501ae08745Sheppo 		 * vsw_t structure.
12511ae08745Sheppo 		 */
125219b65a69Ssb155480 		mcst_p = vsw_del_addr(VSW_LOCALDEV, vswp, addr);
125319b65a69Ssb155480 		ASSERT(mcst_p != NULL);
12541ae08745Sheppo 
12553c1bce15Swentaoy 		WRITE_ENTER(&vswp->mac_rwlock);
125619b65a69Ssb155480 		if (vswp->mh != NULL && mcst_p->mac_added) {
12571ae08745Sheppo 			(void) mac_multicst_remove(vswp->mh, mca);
125819b65a69Ssb155480 			mcst_p->mac_added = B_FALSE;
125919b65a69Ssb155480 		}
12603c1bce15Swentaoy 		RW_EXIT(&vswp->mac_rwlock);
126119b65a69Ssb155480 		kmem_free(mcst_p, sizeof (*mcst_p));
12621ae08745Sheppo 	}
12631ae08745Sheppo 
12641ae08745Sheppo 	D1(vswp, "%s: exit", __func__);
12651ae08745Sheppo 
12661ae08745Sheppo 	return (0);
12671ae08745Sheppo }
12681ae08745Sheppo 
12691ae08745Sheppo static int
12701ae08745Sheppo vsw_m_promisc(void *arg, boolean_t on)
12711ae08745Sheppo {
12721ae08745Sheppo 	vsw_t		*vswp = (vsw_t *)arg;
12731ae08745Sheppo 
12741ae08745Sheppo 	D1(vswp, "%s: enter", __func__);
12751ae08745Sheppo 
12761ae08745Sheppo 	WRITE_ENTER(&vswp->if_lockrw);
12771ae08745Sheppo 	if (on)
12781ae08745Sheppo 		vswp->if_state |= VSW_IF_PROMISC;
12791ae08745Sheppo 	else
12801ae08745Sheppo 		vswp->if_state &= ~VSW_IF_PROMISC;
12811ae08745Sheppo 	RW_EXIT(&vswp->if_lockrw);
12821ae08745Sheppo 
12831ae08745Sheppo 	D1(vswp, "%s: exit", __func__);
12841ae08745Sheppo 
12851ae08745Sheppo 	return (0);
12861ae08745Sheppo }
12871ae08745Sheppo 
12881ae08745Sheppo static mblk_t *
12891ae08745Sheppo vsw_m_tx(void *arg, mblk_t *mp)
12901ae08745Sheppo {
12911ae08745Sheppo 	vsw_t		*vswp = (vsw_t *)arg;
12921ae08745Sheppo 
12931ae08745Sheppo 	D1(vswp, "%s: enter", __func__);
12941ae08745Sheppo 
1295c1c61f44Ssb155480 	mp = vsw_vlan_frame_pretag(vswp, VSW_LOCALDEV, mp);
1296c1c61f44Ssb155480 
1297c1c61f44Ssb155480 	if (mp == NULL) {
1298c1c61f44Ssb155480 		return (NULL);
1299c1c61f44Ssb155480 	}
1300c1c61f44Ssb155480 
130134683adeSsg70180 	vswp->vsw_switch_frame(vswp, mp, VSW_LOCALDEV, NULL, NULL);
13021ae08745Sheppo 
13031ae08745Sheppo 	D1(vswp, "%s: exit", __func__);
13041ae08745Sheppo 
13051ae08745Sheppo 	return (NULL);
13061ae08745Sheppo }
13071ae08745Sheppo 
13081ae08745Sheppo /*
13091ae08745Sheppo  * Register for machine description (MD) updates.
131034683adeSsg70180  *
131134683adeSsg70180  * Returns 0 on success, 1 on failure.
13121ae08745Sheppo  */
131334683adeSsg70180 static int
13141ae08745Sheppo vsw_mdeg_register(vsw_t *vswp)
13151ae08745Sheppo {
13161ae08745Sheppo 	mdeg_prop_spec_t	*pspecp;
13171ae08745Sheppo 	mdeg_node_spec_t	*inst_specp;
131834683adeSsg70180 	mdeg_handle_t		mdeg_hdl, mdeg_port_hdl;
13191ae08745Sheppo 	size_t			templatesz;
132019b65a69Ssb155480 	int			rv;
13211ae08745Sheppo 
13221ae08745Sheppo 	D1(vswp, "%s: enter", __func__);
13231ae08745Sheppo 
132434683adeSsg70180 	/*
13251ae08745Sheppo 	 * Allocate and initialize a per-instance copy
13261ae08745Sheppo 	 * of the global property spec array that will
13271ae08745Sheppo 	 * uniquely identify this vsw instance.
13281ae08745Sheppo 	 */
13291ae08745Sheppo 	templatesz = sizeof (vsw_prop_template);
13301ae08745Sheppo 	pspecp = kmem_zalloc(templatesz, KM_SLEEP);
13311ae08745Sheppo 
13321ae08745Sheppo 	bcopy(vsw_prop_template, pspecp, templatesz);
13331ae08745Sheppo 
133419b65a69Ssb155480 	VSW_SET_MDEG_PROP_INST(pspecp, vswp->regprop);
13351ae08745Sheppo 
13361ae08745Sheppo 	/* initialize the complete prop spec structure */
13371ae08745Sheppo 	inst_specp = kmem_zalloc(sizeof (mdeg_node_spec_t), KM_SLEEP);
13381ae08745Sheppo 	inst_specp->namep = "virtual-device";
13391ae08745Sheppo 	inst_specp->specp = pspecp;
13401ae08745Sheppo 
134119b65a69Ssb155480 	D2(vswp, "%s: instance %d registering with mdeg", __func__,
134219b65a69Ssb155480 	    vswp->regprop);
134334683adeSsg70180 	/*
134434683adeSsg70180 	 * Register an interest in 'virtual-device' nodes with a
134534683adeSsg70180 	 * 'name' property of 'virtual-network-switch'
134634683adeSsg70180 	 */
134734683adeSsg70180 	rv = mdeg_register(inst_specp, &vdev_match, vsw_mdeg_cb,
13481ae08745Sheppo 	    (void *)vswp, &mdeg_hdl);
134934683adeSsg70180 	if (rv != MDEG_SUCCESS) {
135034683adeSsg70180 		DERR(vswp, "%s: mdeg_register failed (%d) for vsw node",
135134683adeSsg70180 		    __func__, rv);
135234683adeSsg70180 		goto mdeg_reg_fail;
135334683adeSsg70180 	}
13541ae08745Sheppo 
135534683adeSsg70180 	/*
135634683adeSsg70180 	 * Register an interest in 'vsw-port' nodes.
135734683adeSsg70180 	 */
135834683adeSsg70180 	rv = mdeg_register(inst_specp, &vport_match, vsw_port_mdeg_cb,
135934683adeSsg70180 	    (void *)vswp, &mdeg_port_hdl);
13601ae08745Sheppo 	if (rv != MDEG_SUCCESS) {
13611ae08745Sheppo 		DERR(vswp, "%s: mdeg_register failed (%d)\n", __func__, rv);
136234683adeSsg70180 		(void) mdeg_unregister(mdeg_hdl);
136334683adeSsg70180 		goto mdeg_reg_fail;
13641ae08745Sheppo 	}
13651ae08745Sheppo 
13661ae08745Sheppo 	/* save off data that will be needed later */
13671ae08745Sheppo 	vswp->inst_spec = inst_specp;
13681ae08745Sheppo 	vswp->mdeg_hdl = mdeg_hdl;
136934683adeSsg70180 	vswp->mdeg_port_hdl = mdeg_port_hdl;
13701ae08745Sheppo 
13711ae08745Sheppo 	D1(vswp, "%s: exit", __func__);
137234683adeSsg70180 	return (0);
137334683adeSsg70180 
137434683adeSsg70180 mdeg_reg_fail:
137534683adeSsg70180 	cmn_err(CE_WARN, "!vsw%d: Unable to register MDEG callbacks",
137634683adeSsg70180 	    vswp->instance);
137734683adeSsg70180 	kmem_free(pspecp, templatesz);
137834683adeSsg70180 	kmem_free(inst_specp, sizeof (mdeg_node_spec_t));
137934683adeSsg70180 
138034683adeSsg70180 	vswp->mdeg_hdl = NULL;
138134683adeSsg70180 	vswp->mdeg_port_hdl = NULL;
138234683adeSsg70180 
138334683adeSsg70180 	return (1);
13841ae08745Sheppo }
13851ae08745Sheppo 
13861ae08745Sheppo static void
13871ae08745Sheppo vsw_mdeg_unregister(vsw_t *vswp)
13881ae08745Sheppo {
13891ae08745Sheppo 	D1(vswp, "vsw_mdeg_unregister: enter");
13901ae08745Sheppo 
139134683adeSsg70180 	if (vswp->mdeg_hdl != NULL)
13921ae08745Sheppo 		(void) mdeg_unregister(vswp->mdeg_hdl);
13931ae08745Sheppo 
139434683adeSsg70180 	if (vswp->mdeg_port_hdl != NULL)
139534683adeSsg70180 		(void) mdeg_unregister(vswp->mdeg_port_hdl);
139634683adeSsg70180 
139734683adeSsg70180 	if (vswp->inst_spec != NULL) {
13981ae08745Sheppo 		if (vswp->inst_spec->specp != NULL) {
13991ae08745Sheppo 			(void) kmem_free(vswp->inst_spec->specp,
14001ae08745Sheppo 			    sizeof (vsw_prop_template));
14011ae08745Sheppo 			vswp->inst_spec->specp = NULL;
14021ae08745Sheppo 		}
14031ae08745Sheppo 
1404205eeb1aSlm66018 		(void) kmem_free(vswp->inst_spec, sizeof (mdeg_node_spec_t));
14051ae08745Sheppo 		vswp->inst_spec = NULL;
14061ae08745Sheppo 	}
14071ae08745Sheppo 
14081ae08745Sheppo 	D1(vswp, "vsw_mdeg_unregister: exit");
14091ae08745Sheppo }
14101ae08745Sheppo 
141134683adeSsg70180 /*
141234683adeSsg70180  * Mdeg callback invoked for the vsw node itself.
141334683adeSsg70180  */
14141ae08745Sheppo static int
14151ae08745Sheppo vsw_mdeg_cb(void *cb_argp, mdeg_result_t *resp)
14161ae08745Sheppo {
14171ae08745Sheppo 	vsw_t		*vswp;
14181ae08745Sheppo 	md_t		*mdp;
14191ae08745Sheppo 	mde_cookie_t	node;
14201ae08745Sheppo 	uint64_t	inst;
142134683adeSsg70180 	char		*node_name = NULL;
14221ae08745Sheppo 
14231ae08745Sheppo 	if (resp == NULL)
14241ae08745Sheppo 		return (MDEG_FAILURE);
14251ae08745Sheppo 
14261ae08745Sheppo 	vswp = (vsw_t *)cb_argp;
14271ae08745Sheppo 
142834683adeSsg70180 	D1(vswp, "%s: added %d : removed %d : curr matched %d"
142934683adeSsg70180 	    " : prev matched %d", __func__, resp->added.nelem,
143034683adeSsg70180 	    resp->removed.nelem, resp->match_curr.nelem,
143134683adeSsg70180 	    resp->match_prev.nelem);
143234683adeSsg70180 
143334683adeSsg70180 	/*
143419b65a69Ssb155480 	 * We get an initial callback for this node as 'added'
143519b65a69Ssb155480 	 * after registering with mdeg. Note that we would have
143619b65a69Ssb155480 	 * already gathered information about this vsw node by
143719b65a69Ssb155480 	 * walking MD earlier during attach (in vsw_read_mdprops()).
143819b65a69Ssb155480 	 * So, there is a window where the properties of this
143919b65a69Ssb155480 	 * node might have changed when we get this initial 'added'
144019b65a69Ssb155480 	 * callback. We handle this as if an update occured
144119b65a69Ssb155480 	 * and invoke the same function which handles updates to
144219b65a69Ssb155480 	 * the properties of this vsw-node if any.
144319b65a69Ssb155480 	 *
144434683adeSsg70180 	 * A non-zero 'match' value indicates that the MD has been
144519b65a69Ssb155480 	 * updated and that a virtual-network-switch node is
144619b65a69Ssb155480 	 * present which may or may not have been updated. It is
144719b65a69Ssb155480 	 * up to the clients to examine their own nodes and
144819b65a69Ssb155480 	 * determine if they have changed.
144934683adeSsg70180 	 */
145019b65a69Ssb155480 	if (resp->added.nelem != 0) {
145134683adeSsg70180 
145219b65a69Ssb155480 		if (resp->added.nelem != 1) {
145319b65a69Ssb155480 			cmn_err(CE_NOTE, "!vsw%d: number of nodes added "
145419b65a69Ssb155480 			    "invalid: %d\n", vswp->instance, resp->added.nelem);
145519b65a69Ssb155480 			return (MDEG_FAILURE);
145619b65a69Ssb155480 		}
145719b65a69Ssb155480 
145819b65a69Ssb155480 		mdp = resp->added.mdp;
145919b65a69Ssb155480 		node = resp->added.mdep[0];
146019b65a69Ssb155480 
146119b65a69Ssb155480 	} else if (resp->match_curr.nelem != 0) {
146219b65a69Ssb155480 
146319b65a69Ssb155480 		if (resp->match_curr.nelem != 1) {
146419b65a69Ssb155480 			cmn_err(CE_NOTE, "!vsw%d: number of nodes updated "
146519b65a69Ssb155480 			    "invalid: %d\n", vswp->instance,
146619b65a69Ssb155480 			    resp->match_curr.nelem);
146719b65a69Ssb155480 			return (MDEG_FAILURE);
146819b65a69Ssb155480 		}
146919b65a69Ssb155480 
147019b65a69Ssb155480 		mdp = resp->match_curr.mdp;
147119b65a69Ssb155480 		node = resp->match_curr.mdep[0];
147219b65a69Ssb155480 
147319b65a69Ssb155480 	} else {
147419b65a69Ssb155480 		return (MDEG_FAILURE);
147519b65a69Ssb155480 	}
147619b65a69Ssb155480 
147719b65a69Ssb155480 	/* Validate name and instance */
147834683adeSsg70180 	if (md_get_prop_str(mdp, node, "name", &node_name) != 0) {
147919b65a69Ssb155480 		DERR(vswp, "%s: unable to get node name\n",  __func__);
148019b65a69Ssb155480 		return (MDEG_FAILURE);
148119b65a69Ssb155480 	}
148219b65a69Ssb155480 
148319b65a69Ssb155480 	/* is this a virtual-network-switch? */
148419b65a69Ssb155480 	if (strcmp(node_name, vsw_propname) != 0) {
148519b65a69Ssb155480 		DERR(vswp, "%s: Invalid node name: %s\n",
148619b65a69Ssb155480 		    __func__, node_name);
148719b65a69Ssb155480 		return (MDEG_FAILURE);
148834683adeSsg70180 	}
148934683adeSsg70180 
149034683adeSsg70180 	if (md_get_prop_val(mdp, node, "cfg-handle", &inst)) {
149119b65a69Ssb155480 		DERR(vswp, "%s: prop(cfg-handle) not found\n",
149219b65a69Ssb155480 		    __func__);
149319b65a69Ssb155480 		return (MDEG_FAILURE);
149434683adeSsg70180 	}
149534683adeSsg70180 
149619b65a69Ssb155480 	/* is this the right instance of vsw? */
149719b65a69Ssb155480 	if (inst != vswp->regprop) {
149819b65a69Ssb155480 		DERR(vswp, "%s: Invalid cfg-handle: %lx\n",
149919b65a69Ssb155480 		    __func__, inst);
150019b65a69Ssb155480 		return (MDEG_FAILURE);
150119b65a69Ssb155480 	}
150234683adeSsg70180 
150334683adeSsg70180 	vsw_update_md_prop(vswp, mdp, node);
150434683adeSsg70180 
150534683adeSsg70180 	return (MDEG_SUCCESS);
150634683adeSsg70180 }
150734683adeSsg70180 
150834683adeSsg70180 /*
150934683adeSsg70180  * Mdeg callback invoked for changes to the vsw-port nodes
151034683adeSsg70180  * under the vsw node.
151134683adeSsg70180  */
151234683adeSsg70180 static int
151334683adeSsg70180 vsw_port_mdeg_cb(void *cb_argp, mdeg_result_t *resp)
151434683adeSsg70180 {
151534683adeSsg70180 	vsw_t		*vswp;
151634683adeSsg70180 	int		idx;
151734683adeSsg70180 	md_t		*mdp;
151834683adeSsg70180 	mde_cookie_t	node;
151934683adeSsg70180 	uint64_t	inst;
15201ef0bbb5Snarayan 	int		rv;
152134683adeSsg70180 
152234683adeSsg70180 	if ((resp == NULL) || (cb_argp == NULL))
152334683adeSsg70180 		return (MDEG_FAILURE);
152434683adeSsg70180 
152534683adeSsg70180 	vswp = (vsw_t *)cb_argp;
152634683adeSsg70180 
152734683adeSsg70180 	D2(vswp, "%s: added %d : removed %d : curr matched %d"
152834683adeSsg70180 	    " : prev matched %d", __func__, resp->added.nelem,
152934683adeSsg70180 	    resp->removed.nelem, resp->match_curr.nelem,
15301ae08745Sheppo 	    resp->match_prev.nelem);
15311ae08745Sheppo 
15321ae08745Sheppo 	/* process added ports */
15331ae08745Sheppo 	for (idx = 0; idx < resp->added.nelem; idx++) {
15341ae08745Sheppo 		mdp = resp->added.mdp;
15351ae08745Sheppo 		node = resp->added.mdep[idx];
15361ae08745Sheppo 
15371ae08745Sheppo 		D2(vswp, "%s: adding node(%d) 0x%lx", __func__, idx, node);
15381ae08745Sheppo 
15391ef0bbb5Snarayan 		if ((rv = vsw_port_add(vswp, mdp, &node)) != 0) {
154034683adeSsg70180 			cmn_err(CE_WARN, "!vsw%d: Unable to add new port "
15411ef0bbb5Snarayan 			    "(0x%lx), err=%d", vswp->instance, node, rv);
15421ae08745Sheppo 		}
15431ae08745Sheppo 	}
15441ae08745Sheppo 
15451ae08745Sheppo 	/* process removed ports */
15461ae08745Sheppo 	for (idx = 0; idx < resp->removed.nelem; idx++) {
15471ae08745Sheppo 		mdp = resp->removed.mdp;
15481ae08745Sheppo 		node = resp->removed.mdep[idx];
15491ae08745Sheppo 
15501ae08745Sheppo 		if (md_get_prop_val(mdp, node, id_propname, &inst)) {
155134683adeSsg70180 			DERR(vswp, "%s: prop(%s) not found in port(%d)",
15521ae08745Sheppo 			    __func__, id_propname, idx);
15531ae08745Sheppo 			continue;
15541ae08745Sheppo 		}
15551ae08745Sheppo 
15561ae08745Sheppo 		D2(vswp, "%s: removing node(%d) 0x%lx", __func__, idx, node);
15571ae08745Sheppo 
15581ae08745Sheppo 		if (vsw_port_detach(vswp, inst) != 0) {
155934683adeSsg70180 			cmn_err(CE_WARN, "!vsw%d: Unable to remove port %ld",
156034683adeSsg70180 			    vswp->instance, inst);
15611ae08745Sheppo 		}
15621ae08745Sheppo 	}
15631ae08745Sheppo 
1564c1c61f44Ssb155480 	for (idx = 0; idx < resp->match_curr.nelem; idx++) {
1565c1c61f44Ssb155480 		(void) vsw_port_update(vswp, resp->match_curr.mdp,
1566c1c61f44Ssb155480 		    resp->match_curr.mdep[idx],
1567c1c61f44Ssb155480 		    resp->match_prev.mdp,
1568c1c61f44Ssb155480 		    resp->match_prev.mdep[idx]);
1569c1c61f44Ssb155480 	}
15701ae08745Sheppo 
15711ae08745Sheppo 	D1(vswp, "%s: exit", __func__);
15721ae08745Sheppo 
15731ae08745Sheppo 	return (MDEG_SUCCESS);
15741ae08745Sheppo }
15751ae08745Sheppo 
15761ae08745Sheppo /*
157719b65a69Ssb155480  * Scan the machine description for this instance of vsw
157819b65a69Ssb155480  * and read its properties. Called only from vsw_attach().
157919b65a69Ssb155480  * Returns: 0 on success, 1 on failure.
158019b65a69Ssb155480  */
158119b65a69Ssb155480 static int
158219b65a69Ssb155480 vsw_read_mdprops(vsw_t *vswp)
158319b65a69Ssb155480 {
158419b65a69Ssb155480 	md_t		*mdp = NULL;
158519b65a69Ssb155480 	mde_cookie_t	rootnode;
158619b65a69Ssb155480 	mde_cookie_t	*listp = NULL;
158719b65a69Ssb155480 	uint64_t	inst;
158819b65a69Ssb155480 	uint64_t	cfgh;
158919b65a69Ssb155480 	char		*name;
159019b65a69Ssb155480 	int		rv = 1;
159119b65a69Ssb155480 	int		num_nodes = 0;
159219b65a69Ssb155480 	int		num_devs = 0;
159319b65a69Ssb155480 	int		listsz = 0;
159419b65a69Ssb155480 	int		i;
159519b65a69Ssb155480 
159619b65a69Ssb155480 	/*
159719b65a69Ssb155480 	 * In each 'virtual-device' node in the MD there is a
159819b65a69Ssb155480 	 * 'cfg-handle' property which is the MD's concept of
159919b65a69Ssb155480 	 * an instance number (this may be completely different from
160019b65a69Ssb155480 	 * the device drivers instance #). OBP reads that value and
160119b65a69Ssb155480 	 * stores it in the 'reg' property of the appropriate node in
160219b65a69Ssb155480 	 * the device tree. We first read this reg property and use this
160319b65a69Ssb155480 	 * to compare against the 'cfg-handle' property of vsw nodes
160419b65a69Ssb155480 	 * in MD to get to this specific vsw instance and then read
160519b65a69Ssb155480 	 * other properties that we are interested in.
160619b65a69Ssb155480 	 * We also cache the value of 'reg' property and use it later
160719b65a69Ssb155480 	 * to register callbacks with mdeg (see vsw_mdeg_register())
160819b65a69Ssb155480 	 */
160919b65a69Ssb155480 	inst = ddi_prop_get_int(DDI_DEV_T_ANY, vswp->dip,
161019b65a69Ssb155480 	    DDI_PROP_DONTPASS, reg_propname, -1);
161119b65a69Ssb155480 	if (inst == -1) {
161219b65a69Ssb155480 		cmn_err(CE_NOTE, "!vsw%d: Unable to read %s property from "
161319b65a69Ssb155480 		    "OBP device tree", vswp->instance, reg_propname);
161419b65a69Ssb155480 		return (rv);
161519b65a69Ssb155480 	}
161619b65a69Ssb155480 
161719b65a69Ssb155480 	vswp->regprop = inst;
161819b65a69Ssb155480 
161919b65a69Ssb155480 	if ((mdp = md_get_handle()) == NULL) {
162019b65a69Ssb155480 		DWARN(vswp, "%s: cannot init MD\n", __func__);
162119b65a69Ssb155480 		return (rv);
162219b65a69Ssb155480 	}
162319b65a69Ssb155480 
162419b65a69Ssb155480 	num_nodes = md_node_count(mdp);
162519b65a69Ssb155480 	ASSERT(num_nodes > 0);
162619b65a69Ssb155480 
162719b65a69Ssb155480 	listsz = num_nodes * sizeof (mde_cookie_t);
162819b65a69Ssb155480 	listp = (mde_cookie_t *)kmem_zalloc(listsz, KM_SLEEP);
162919b65a69Ssb155480 
163019b65a69Ssb155480 	rootnode = md_root_node(mdp);
163119b65a69Ssb155480 
163219b65a69Ssb155480 	/* search for all "virtual_device" nodes */
163319b65a69Ssb155480 	num_devs = md_scan_dag(mdp, rootnode,
163419b65a69Ssb155480 	    md_find_name(mdp, vdev_propname),
163519b65a69Ssb155480 	    md_find_name(mdp, "fwd"), listp);
163619b65a69Ssb155480 	if (num_devs <= 0) {
163719b65a69Ssb155480 		DWARN(vswp, "%s: invalid num_devs:%d\n", __func__, num_devs);
163819b65a69Ssb155480 		goto vsw_readmd_exit;
163919b65a69Ssb155480 	}
164019b65a69Ssb155480 
164119b65a69Ssb155480 	/*
164219b65a69Ssb155480 	 * Now loop through the list of virtual-devices looking for
164319b65a69Ssb155480 	 * devices with name "virtual-network-switch" and for each
164419b65a69Ssb155480 	 * such device compare its instance with what we have from
164519b65a69Ssb155480 	 * the 'reg' property to find the right node in MD and then
164619b65a69Ssb155480 	 * read all its properties.
164719b65a69Ssb155480 	 */
164819b65a69Ssb155480 	for (i = 0; i < num_devs; i++) {
164919b65a69Ssb155480 
165019b65a69Ssb155480 		if (md_get_prop_str(mdp, listp[i], "name", &name) != 0) {
165119b65a69Ssb155480 			DWARN(vswp, "%s: name property not found\n",
165219b65a69Ssb155480 			    __func__);
165319b65a69Ssb155480 			goto vsw_readmd_exit;
165419b65a69Ssb155480 		}
165519b65a69Ssb155480 
165619b65a69Ssb155480 		/* is this a virtual-network-switch? */
165719b65a69Ssb155480 		if (strcmp(name, vsw_propname) != 0)
165819b65a69Ssb155480 			continue;
165919b65a69Ssb155480 
166019b65a69Ssb155480 		if (md_get_prop_val(mdp, listp[i], "cfg-handle", &cfgh) != 0) {
166119b65a69Ssb155480 			DWARN(vswp, "%s: cfg-handle property not found\n",
166219b65a69Ssb155480 			    __func__);
166319b65a69Ssb155480 			goto vsw_readmd_exit;
166419b65a69Ssb155480 		}
166519b65a69Ssb155480 
166619b65a69Ssb155480 		/* is this the required instance of vsw? */
166719b65a69Ssb155480 		if (inst != cfgh)
166819b65a69Ssb155480 			continue;
166919b65a69Ssb155480 
167019b65a69Ssb155480 		/* now read all properties of this vsw instance */
167119b65a69Ssb155480 		rv = vsw_get_initial_md_properties(vswp, mdp, listp[i]);
167219b65a69Ssb155480 		break;
167319b65a69Ssb155480 	}
167419b65a69Ssb155480 
167519b65a69Ssb155480 vsw_readmd_exit:
167619b65a69Ssb155480 
167719b65a69Ssb155480 	kmem_free(listp, listsz);
167819b65a69Ssb155480 	(void) md_fini_handle(mdp);
167919b65a69Ssb155480 	return (rv);
168019b65a69Ssb155480 }
168119b65a69Ssb155480 
168219b65a69Ssb155480 /*
168334683adeSsg70180  * Read the initial start-of-day values from the specified MD node.
168434683adeSsg70180  */
168519b65a69Ssb155480 static int
168634683adeSsg70180 vsw_get_initial_md_properties(vsw_t *vswp, md_t *mdp, mde_cookie_t node)
168734683adeSsg70180 {
168834683adeSsg70180 	int		i;
168934683adeSsg70180 	uint64_t 	macaddr = 0;
169034683adeSsg70180 
169134683adeSsg70180 	D1(vswp, "%s: enter", __func__);
169234683adeSsg70180 
169319b65a69Ssb155480 	if (vsw_get_md_physname(vswp, mdp, node, vswp->physname) != 0) {
169419b65a69Ssb155480 		return (1);
169534683adeSsg70180 	}
169634683adeSsg70180 
169734683adeSsg70180 	/* mac address for vswitch device itself */
169834683adeSsg70180 	if (md_get_prop_val(mdp, node, macaddr_propname, &macaddr) != 0) {
169934683adeSsg70180 		cmn_err(CE_WARN, "!vsw%d: Unable to get MAC address from MD",
170034683adeSsg70180 		    vswp->instance);
170119b65a69Ssb155480 		return (1);
170219b65a69Ssb155480 	}
170334683adeSsg70180 
170419b65a69Ssb155480 	vsw_save_lmacaddr(vswp, macaddr);
170534683adeSsg70180 
1706205eeb1aSlm66018 	if (vsw_get_md_smodes(vswp, mdp, node, vswp->smode, &vswp->smode_num)) {
17071ef0bbb5Snarayan 		DWARN(vswp, "%s: Unable to read %s property from MD, "
17081ef0bbb5Snarayan 		    "defaulting to 'switched' mode",
17091ef0bbb5Snarayan 		    __func__, smode_propname);
171034683adeSsg70180 
171134683adeSsg70180 		for (i = 0; i < NUM_SMODES; i++)
171234683adeSsg70180 			vswp->smode[i] = VSW_LAYER2;
171334683adeSsg70180 
171434683adeSsg70180 		vswp->smode_num = NUM_SMODES;
171534683adeSsg70180 	} else {
171634683adeSsg70180 		ASSERT(vswp->smode_num != 0);
171734683adeSsg70180 	}
171834683adeSsg70180 
17197b1f684aSSriharsha Basavapatna 	/* read mtu */
17207b1f684aSSriharsha Basavapatna 	vsw_mtu_read(vswp, mdp, node, &vswp->mtu);
17217b1f684aSSriharsha Basavapatna 	if (vswp->mtu < ETHERMTU || vswp->mtu > VNET_MAX_MTU) {
17227b1f684aSSriharsha Basavapatna 		vswp->mtu = ETHERMTU;
17237b1f684aSSriharsha Basavapatna 	}
17247b1f684aSSriharsha Basavapatna 	vswp->max_frame_size = vswp->mtu + sizeof (struct ether_header) +
17257b1f684aSSriharsha Basavapatna 	    VLAN_TAGSZ;
17267b1f684aSSriharsha Basavapatna 
1727c1c61f44Ssb155480 	/* read vlan id properties of this vsw instance */
1728c1c61f44Ssb155480 	vsw_vlan_read_ids(vswp, VSW_LOCALDEV, mdp, node, &vswp->pvid,
1729c1c61f44Ssb155480 	    &vswp->vids, &vswp->nvids, &vswp->default_vlan_id);
1730c1c61f44Ssb155480 
1731c1c61f44Ssb155480 	/* read priority-ether-types */
1732f0ca1d9aSsb155480 	vsw_read_pri_eth_types(vswp, mdp, node);
1733f0ca1d9aSsb155480 
173434683adeSsg70180 	D1(vswp, "%s: exit", __func__);
173519b65a69Ssb155480 	return (0);
173634683adeSsg70180 }
173734683adeSsg70180 
173834683adeSsg70180 /*
1739c1c61f44Ssb155480  * Read vlan id properties of the given MD node.
1740c1c61f44Ssb155480  * Arguments:
1741c1c61f44Ssb155480  *   arg:          device argument(vsw device or a port)
1742c1c61f44Ssb155480  *   type:         type of arg; VSW_LOCALDEV(vsw device) or VSW_VNETPORT(port)
1743c1c61f44Ssb155480  *   mdp:          machine description
1744c1c61f44Ssb155480  *   node:         md node cookie
1745c1c61f44Ssb155480  *
1746c1c61f44Ssb155480  * Returns:
1747c1c61f44Ssb155480  *   pvidp:        port-vlan-id of the node
1748c1c61f44Ssb155480  *   vidspp:       list of vlan-ids of the node
1749c1c61f44Ssb155480  *   nvidsp:       # of vlan-ids in the list
1750c1c61f44Ssb155480  *   default_idp:  default-vlan-id of the node(if node is vsw device)
1751c1c61f44Ssb155480  */
1752c1c61f44Ssb155480 static void
1753c1c61f44Ssb155480 vsw_vlan_read_ids(void *arg, int type, md_t *mdp, mde_cookie_t node,
1754c1c61f44Ssb155480 	uint16_t *pvidp, uint16_t **vidspp, uint16_t *nvidsp,
1755c1c61f44Ssb155480 	uint16_t *default_idp)
1756c1c61f44Ssb155480 {
1757c1c61f44Ssb155480 	vsw_t		*vswp;
1758c1c61f44Ssb155480 	vsw_port_t	*portp;
1759c1c61f44Ssb155480 	char		*pvid_propname;
1760c1c61f44Ssb155480 	char		*vid_propname;
1761c1c61f44Ssb155480 	uint_t		nvids = 0;
1762c1c61f44Ssb155480 	uint32_t	vids_size;
1763c1c61f44Ssb155480 	int		rv;
1764c1c61f44Ssb155480 	int		i;
1765c1c61f44Ssb155480 	uint64_t	*data;
1766c1c61f44Ssb155480 	uint64_t	val;
1767c1c61f44Ssb155480 	int		size;
1768c1c61f44Ssb155480 	int		inst;
1769c1c61f44Ssb155480 
1770c1c61f44Ssb155480 	if (type == VSW_LOCALDEV) {
1771c1c61f44Ssb155480 
1772c1c61f44Ssb155480 		vswp = (vsw_t *)arg;
1773c1c61f44Ssb155480 		pvid_propname = vsw_pvid_propname;
1774c1c61f44Ssb155480 		vid_propname = vsw_vid_propname;
1775c1c61f44Ssb155480 		inst = vswp->instance;
1776c1c61f44Ssb155480 
1777c1c61f44Ssb155480 	} else if (type == VSW_VNETPORT) {
1778c1c61f44Ssb155480 
1779c1c61f44Ssb155480 		portp = (vsw_port_t *)arg;
1780c1c61f44Ssb155480 		vswp = portp->p_vswp;
1781c1c61f44Ssb155480 		pvid_propname = port_pvid_propname;
1782c1c61f44Ssb155480 		vid_propname = port_vid_propname;
1783c1c61f44Ssb155480 		inst = portp->p_instance;
1784c1c61f44Ssb155480 
1785c1c61f44Ssb155480 	} else {
1786c1c61f44Ssb155480 		return;
1787c1c61f44Ssb155480 	}
1788c1c61f44Ssb155480 
1789c1c61f44Ssb155480 	if (type == VSW_LOCALDEV && default_idp != NULL) {
1790c1c61f44Ssb155480 		rv = md_get_prop_val(mdp, node, vsw_dvid_propname, &val);
1791c1c61f44Ssb155480 		if (rv != 0) {
1792c1c61f44Ssb155480 			DWARN(vswp, "%s: prop(%s) not found", __func__,
1793c1c61f44Ssb155480 			    vsw_dvid_propname);
1794c1c61f44Ssb155480 
1795c1c61f44Ssb155480 			*default_idp = vsw_default_vlan_id;
1796c1c61f44Ssb155480 		} else {
1797c1c61f44Ssb155480 			*default_idp = val & 0xFFF;
1798c1c61f44Ssb155480 			D2(vswp, "%s: %s(%d): (%d)\n", __func__,
1799c1c61f44Ssb155480 			    vsw_dvid_propname, inst, *default_idp);
1800c1c61f44Ssb155480 		}
1801c1c61f44Ssb155480 	}
1802c1c61f44Ssb155480 
1803c1c61f44Ssb155480 	rv = md_get_prop_val(mdp, node, pvid_propname, &val);
1804c1c61f44Ssb155480 	if (rv != 0) {
1805c1c61f44Ssb155480 		DWARN(vswp, "%s: prop(%s) not found", __func__, pvid_propname);
1806c1c61f44Ssb155480 		*pvidp = vsw_default_vlan_id;
1807c1c61f44Ssb155480 	} else {
1808c1c61f44Ssb155480 
1809c1c61f44Ssb155480 		*pvidp = val & 0xFFF;
1810c1c61f44Ssb155480 		D2(vswp, "%s: %s(%d): (%d)\n", __func__,
1811c1c61f44Ssb155480 		    pvid_propname, inst, *pvidp);
1812c1c61f44Ssb155480 	}
1813c1c61f44Ssb155480 
1814c1c61f44Ssb155480 	rv = md_get_prop_data(mdp, node, vid_propname, (uint8_t **)&data,
1815c1c61f44Ssb155480 	    &size);
1816c1c61f44Ssb155480 	if (rv != 0) {
1817c1c61f44Ssb155480 		D2(vswp, "%s: prop(%s) not found", __func__, vid_propname);
1818c1c61f44Ssb155480 		size = 0;
1819c1c61f44Ssb155480 	} else {
1820c1c61f44Ssb155480 		size /= sizeof (uint64_t);
1821c1c61f44Ssb155480 	}
1822c1c61f44Ssb155480 	nvids = size;
1823c1c61f44Ssb155480 
1824c1c61f44Ssb155480 	if (nvids != 0) {
1825c1c61f44Ssb155480 		D2(vswp, "%s: %s(%d): ", __func__, vid_propname, inst);
1826c1c61f44Ssb155480 		vids_size = sizeof (uint16_t) * nvids;
1827c1c61f44Ssb155480 		*vidspp = kmem_zalloc(vids_size, KM_SLEEP);
1828c1c61f44Ssb155480 		for (i = 0; i < nvids; i++) {
1829c1c61f44Ssb155480 			(*vidspp)[i] = data[i] & 0xFFFF;
1830c1c61f44Ssb155480 			D2(vswp, " %d ", (*vidspp)[i]);
1831c1c61f44Ssb155480 		}
1832c1c61f44Ssb155480 		D2(vswp, "\n");
1833c1c61f44Ssb155480 	}
1834c1c61f44Ssb155480 
1835c1c61f44Ssb155480 	*nvidsp = nvids;
1836c1c61f44Ssb155480 }
1837c1c61f44Ssb155480 
1838c1c61f44Ssb155480 /*
1839f0ca1d9aSsb155480  * This function reads "priority-ether-types" property from md. This property
1840f0ca1d9aSsb155480  * is used to enable support for priority frames. Applications which need
1841f0ca1d9aSsb155480  * guaranteed and timely delivery of certain high priority frames to/from
1842f0ca1d9aSsb155480  * a vnet or vsw within ldoms, should configure this property by providing
1843f0ca1d9aSsb155480  * the ether type(s) for which the priority facility is needed.
1844f0ca1d9aSsb155480  * Normal data frames are delivered over a ldc channel using the descriptor
1845f0ca1d9aSsb155480  * ring mechanism which is constrained by factors such as descriptor ring size,
1846f0ca1d9aSsb155480  * the rate at which the ring is processed at the peer ldc end point, etc.
1847f0ca1d9aSsb155480  * The priority mechanism provides an Out-Of-Band path to send/receive frames
1848f0ca1d9aSsb155480  * as raw pkt data (VIO_PKT_DATA) messages over the channel, avoiding the
1849f0ca1d9aSsb155480  * descriptor ring path and enables a more reliable and timely delivery of
1850f0ca1d9aSsb155480  * frames to the peer.
1851f0ca1d9aSsb155480  */
1852f0ca1d9aSsb155480 static void
1853f0ca1d9aSsb155480 vsw_read_pri_eth_types(vsw_t *vswp, md_t *mdp, mde_cookie_t node)
1854f0ca1d9aSsb155480 {
1855f0ca1d9aSsb155480 	int		rv;
1856f0ca1d9aSsb155480 	uint16_t	*types;
1857f0ca1d9aSsb155480 	uint64_t	*data;
1858f0ca1d9aSsb155480 	int		size;
1859f0ca1d9aSsb155480 	int		i;
1860f0ca1d9aSsb155480 	size_t		mblk_sz;
1861f0ca1d9aSsb155480 
1862f0ca1d9aSsb155480 	rv = md_get_prop_data(mdp, node, pri_types_propname,
1863f0ca1d9aSsb155480 	    (uint8_t **)&data, &size);
1864f0ca1d9aSsb155480 	if (rv != 0) {
1865f0ca1d9aSsb155480 		/*
1866f0ca1d9aSsb155480 		 * Property may not exist if we are running pre-ldoms1.1 f/w.
1867f0ca1d9aSsb155480 		 * Check if 'vsw_pri_eth_type' has been set in that case.
1868f0ca1d9aSsb155480 		 */
1869f0ca1d9aSsb155480 		if (vsw_pri_eth_type != 0) {
1870f0ca1d9aSsb155480 			size = sizeof (vsw_pri_eth_type);
1871f0ca1d9aSsb155480 			data = &vsw_pri_eth_type;
1872f0ca1d9aSsb155480 		} else {
1873f0ca1d9aSsb155480 			D3(vswp, "%s: prop(%s) not found", __func__,
1874f0ca1d9aSsb155480 			    pri_types_propname);
1875f0ca1d9aSsb155480 			size = 0;
1876f0ca1d9aSsb155480 		}
1877f0ca1d9aSsb155480 	}
1878f0ca1d9aSsb155480 
1879f0ca1d9aSsb155480 	if (size == 0) {
1880f0ca1d9aSsb155480 		vswp->pri_num_types = 0;
1881f0ca1d9aSsb155480 		return;
1882f0ca1d9aSsb155480 	}
1883f0ca1d9aSsb155480 
1884f0ca1d9aSsb155480 	/*
1885f0ca1d9aSsb155480 	 * we have some priority-ether-types defined;
1886f0ca1d9aSsb155480 	 * allocate a table of these types and also
1887f0ca1d9aSsb155480 	 * allocate a pool of mblks to transmit these
1888f0ca1d9aSsb155480 	 * priority packets.
1889f0ca1d9aSsb155480 	 */
1890f0ca1d9aSsb155480 	size /= sizeof (uint64_t);
1891f0ca1d9aSsb155480 	vswp->pri_num_types = size;
1892f0ca1d9aSsb155480 	vswp->pri_types = kmem_zalloc(size * sizeof (uint16_t), KM_SLEEP);
1893f0ca1d9aSsb155480 	for (i = 0, types = vswp->pri_types; i < size; i++) {
1894f0ca1d9aSsb155480 		types[i] = data[i] & 0xFFFF;
1895f0ca1d9aSsb155480 	}
1896f0ca1d9aSsb155480 	mblk_sz = (VIO_PKT_DATA_HDRSIZE + ETHERMAX + 7) & ~7;
1897f0ca1d9aSsb155480 	(void) vio_create_mblks(vsw_pri_tx_nmblks, mblk_sz, &vswp->pri_tx_vmp);
1898f0ca1d9aSsb155480 }
1899f0ca1d9aSsb155480 
19007b1f684aSSriharsha Basavapatna static void
19017b1f684aSSriharsha Basavapatna vsw_mtu_read(vsw_t *vswp, md_t *mdp, mde_cookie_t node, uint32_t *mtu)
19027b1f684aSSriharsha Basavapatna {
19037b1f684aSSriharsha Basavapatna 	int		rv;
19047b1f684aSSriharsha Basavapatna 	int		inst;
19057b1f684aSSriharsha Basavapatna 	uint64_t	val;
19067b1f684aSSriharsha Basavapatna 	char		*mtu_propname;
19077b1f684aSSriharsha Basavapatna 
19087b1f684aSSriharsha Basavapatna 	mtu_propname = vsw_mtu_propname;
19097b1f684aSSriharsha Basavapatna 	inst = vswp->instance;
19107b1f684aSSriharsha Basavapatna 
19117b1f684aSSriharsha Basavapatna 	rv = md_get_prop_val(mdp, node, mtu_propname, &val);
19127b1f684aSSriharsha Basavapatna 	if (rv != 0) {
19137b1f684aSSriharsha Basavapatna 		D3(vswp, "%s: prop(%s) not found", __func__, mtu_propname);
19147b1f684aSSriharsha Basavapatna 		*mtu = vsw_ethermtu;
19157b1f684aSSriharsha Basavapatna 	} else {
19167b1f684aSSriharsha Basavapatna 
19177b1f684aSSriharsha Basavapatna 		*mtu = val & 0xFFFF;
19187b1f684aSSriharsha Basavapatna 		D2(vswp, "%s: %s(%d): (%d)\n", __func__,
19197b1f684aSSriharsha Basavapatna 		    mtu_propname, inst, *mtu);
19207b1f684aSSriharsha Basavapatna 	}
19217b1f684aSSriharsha Basavapatna }
19227b1f684aSSriharsha Basavapatna 
19237b1f684aSSriharsha Basavapatna /*
19247b1f684aSSriharsha Basavapatna  * Update the mtu of the vsw device. We first check if the device has been
19257b1f684aSSriharsha Basavapatna  * plumbed and if so fail the mtu update. Otherwise, we continue to update the
19267b1f684aSSriharsha Basavapatna  * new mtu and reset all ports to initiate handshake re-negotiation with peers
19277b1f684aSSriharsha Basavapatna  * using the new mtu.
19287b1f684aSSriharsha Basavapatna  */
19297b1f684aSSriharsha Basavapatna static int
19307b1f684aSSriharsha Basavapatna vsw_mtu_update(vsw_t *vswp, uint32_t mtu)
19317b1f684aSSriharsha Basavapatna {
19327b1f684aSSriharsha Basavapatna 	int	rv;
19337b1f684aSSriharsha Basavapatna 
19347b1f684aSSriharsha Basavapatna 	WRITE_ENTER(&vswp->if_lockrw);
19357b1f684aSSriharsha Basavapatna 
19367b1f684aSSriharsha Basavapatna 	if (vswp->if_state & VSW_IF_UP) {
19377b1f684aSSriharsha Basavapatna 
19387b1f684aSSriharsha Basavapatna 		RW_EXIT(&vswp->if_lockrw);
19397b1f684aSSriharsha Basavapatna 
19407b1f684aSSriharsha Basavapatna 		cmn_err(CE_NOTE, "!vsw%d: Unable to process mtu update"
19417b1f684aSSriharsha Basavapatna 		    " as the device is plumbed\n", vswp->instance);
19427b1f684aSSriharsha Basavapatna 		return (EBUSY);
19437b1f684aSSriharsha Basavapatna 
19447b1f684aSSriharsha Basavapatna 	} else {
19457b1f684aSSriharsha Basavapatna 
19467b1f684aSSriharsha Basavapatna 		D2(vswp, "%s: curr_mtu(%d) new_mtu(%d)\n",
19477b1f684aSSriharsha Basavapatna 		    __func__, vswp->mtu, mtu);
19487b1f684aSSriharsha Basavapatna 
19497b1f684aSSriharsha Basavapatna 		vswp->mtu = mtu;
19507b1f684aSSriharsha Basavapatna 		vswp->max_frame_size = vswp->mtu +
19517b1f684aSSriharsha Basavapatna 		    sizeof (struct ether_header) + VLAN_TAGSZ;
19527b1f684aSSriharsha Basavapatna 
19537b1f684aSSriharsha Basavapatna 		rv = mac_maxsdu_update(vswp->if_mh, mtu);
19547b1f684aSSriharsha Basavapatna 		if (rv != 0) {
19557b1f684aSSriharsha Basavapatna 			cmn_err(CE_NOTE,
19567b1f684aSSriharsha Basavapatna 			    "!vsw%d: Unable to update mtu with mac"
19577b1f684aSSriharsha Basavapatna 			    " layer\n", vswp->instance);
19587b1f684aSSriharsha Basavapatna 		}
19597b1f684aSSriharsha Basavapatna 
19607b1f684aSSriharsha Basavapatna 		RW_EXIT(&vswp->if_lockrw);
19617b1f684aSSriharsha Basavapatna 
19627b1f684aSSriharsha Basavapatna 		WRITE_ENTER(&vswp->mac_rwlock);
19637b1f684aSSriharsha Basavapatna 
19647b1f684aSSriharsha Basavapatna 		if (vswp->mh == 0) {
19657b1f684aSSriharsha Basavapatna 			/*
19667b1f684aSSriharsha Basavapatna 			 * Physical device is not available yet; mtu will be
19677b1f684aSSriharsha Basavapatna 			 * updated after we open it successfully, as we have
19687b1f684aSSriharsha Basavapatna 			 * saved the new mtu.
19697b1f684aSSriharsha Basavapatna 			 */
19707b1f684aSSriharsha Basavapatna 			D2(vswp, "%s: Physical device:%s is not "
19717b1f684aSSriharsha Basavapatna 			    "available yet; can't update its mtu\n",
19727b1f684aSSriharsha Basavapatna 			    __func__, vswp->physname);
19737b1f684aSSriharsha Basavapatna 
19747b1f684aSSriharsha Basavapatna 		} else {
19757b1f684aSSriharsha Basavapatna 
19767b1f684aSSriharsha Basavapatna 			/*
19777b1f684aSSriharsha Basavapatna 			 * Stop and restart to enable the
19787b1f684aSSriharsha Basavapatna 			 * new mtu in the physical device.
19797b1f684aSSriharsha Basavapatna 			 */
19807b1f684aSSriharsha Basavapatna 			vsw_mac_detach(vswp);
19817b1f684aSSriharsha Basavapatna 			rv = vsw_mac_attach(vswp);
19827b1f684aSSriharsha Basavapatna 			if (rv != 0) {
19837b1f684aSSriharsha Basavapatna 				RW_EXIT(&vswp->mac_rwlock);
19847b1f684aSSriharsha Basavapatna 				return (EIO);
19857b1f684aSSriharsha Basavapatna 			}
19867b1f684aSSriharsha Basavapatna 
19877b1f684aSSriharsha Basavapatna 		}
19887b1f684aSSriharsha Basavapatna 
19897b1f684aSSriharsha Basavapatna 		RW_EXIT(&vswp->mac_rwlock);
19907b1f684aSSriharsha Basavapatna 
19917b1f684aSSriharsha Basavapatna 		/* Reset ports to renegotiate with the new mtu */
19927b1f684aSSriharsha Basavapatna 		vsw_reset_ports(vswp);
19937b1f684aSSriharsha Basavapatna 
19947b1f684aSSriharsha Basavapatna 	}
19957b1f684aSSriharsha Basavapatna 
19967b1f684aSSriharsha Basavapatna 	return (0);
19977b1f684aSSriharsha Basavapatna }
19987b1f684aSSriharsha Basavapatna 
1999f0ca1d9aSsb155480 /*
200034683adeSsg70180  * Check to see if the relevant properties in the specified node have
200134683adeSsg70180  * changed, and if so take the appropriate action.
200234683adeSsg70180  *
200334683adeSsg70180  * If any of the properties are missing or invalid we don't take
200434683adeSsg70180  * any action, as this function should only be invoked when modifications
200534683adeSsg70180  * have been made to what we assume is a working configuration, which
200634683adeSsg70180  * we leave active.
200734683adeSsg70180  *
200834683adeSsg70180  * Note it is legal for this routine to be invoked even if none of the
200934683adeSsg70180  * properties in the port node within the MD have actually changed.
201034683adeSsg70180  */
201134683adeSsg70180 static void
201234683adeSsg70180 vsw_update_md_prop(vsw_t *vswp, md_t *mdp, mde_cookie_t node)
201334683adeSsg70180 {
201434683adeSsg70180 	char		physname[LIFNAMSIZ];
201534683adeSsg70180 	char		drv[LIFNAMSIZ];
201634683adeSsg70180 	uint_t		ddi_instance;
201734683adeSsg70180 	uint8_t		new_smode[NUM_SMODES];
201834683adeSsg70180 	int		i, smode_num = 0;
201934683adeSsg70180 	uint64_t 	macaddr = 0;
202034683adeSsg70180 	enum		{MD_init = 0x1,
202134683adeSsg70180 				MD_physname = 0x2,
202234683adeSsg70180 				MD_macaddr = 0x4,
2023c1c61f44Ssb155480 				MD_smode = 0x8,
20247b1f684aSSriharsha Basavapatna 				MD_vlans = 0x10,
20257b1f684aSSriharsha Basavapatna 				MD_mtu = 0x20} updated;
202619b65a69Ssb155480 	int		rv;
2027c1c61f44Ssb155480 	uint16_t	pvid;
2028c1c61f44Ssb155480 	uint16_t	*vids;
2029c1c61f44Ssb155480 	uint16_t	nvids;
20307b1f684aSSriharsha Basavapatna 	uint32_t	mtu;
203134683adeSsg70180 
203234683adeSsg70180 	updated = MD_init;
203334683adeSsg70180 
203434683adeSsg70180 	D1(vswp, "%s: enter", __func__);
203534683adeSsg70180 
203634683adeSsg70180 	/*
203734683adeSsg70180 	 * Check if name of physical device in MD has changed.
203834683adeSsg70180 	 */
203934683adeSsg70180 	if (vsw_get_md_physname(vswp, mdp, node, (char *)&physname) == 0) {
204034683adeSsg70180 		/*
204134683adeSsg70180 		 * Do basic sanity check on new device name/instance,
204234683adeSsg70180 		 * if its non NULL. It is valid for the device name to
204334683adeSsg70180 		 * have changed from a non NULL to a NULL value, i.e.
204434683adeSsg70180 		 * the vsw is being changed to 'routed' mode.
204534683adeSsg70180 		 */
204634683adeSsg70180 		if ((strlen(physname) != 0) &&
204719b65a69Ssb155480 		    (ddi_parse(physname, drv,
204819b65a69Ssb155480 		    &ddi_instance) != DDI_SUCCESS)) {
20491ef0bbb5Snarayan 			cmn_err(CE_WARN, "!vsw%d: physical device %s is not"
205034683adeSsg70180 			    " a valid device name/instance",
205134683adeSsg70180 			    vswp->instance, physname);
205234683adeSsg70180 			goto fail_reconf;
205334683adeSsg70180 		}
205434683adeSsg70180 
205534683adeSsg70180 		if (strcmp(physname, vswp->physname)) {
205634683adeSsg70180 			D2(vswp, "%s: device name changed from %s to %s",
205734683adeSsg70180 			    __func__, vswp->physname, physname);
205834683adeSsg70180 
205934683adeSsg70180 			updated |= MD_physname;
206034683adeSsg70180 		} else {
206134683adeSsg70180 			D2(vswp, "%s: device name unchanged at %s",
206234683adeSsg70180 			    __func__, vswp->physname);
206334683adeSsg70180 		}
206434683adeSsg70180 	} else {
206534683adeSsg70180 		cmn_err(CE_WARN, "!vsw%d: Unable to read name of physical "
206634683adeSsg70180 		    "device from updated MD.", vswp->instance);
206734683adeSsg70180 		goto fail_reconf;
206834683adeSsg70180 	}
206934683adeSsg70180 
207034683adeSsg70180 	/*
207134683adeSsg70180 	 * Check if MAC address has changed.
207234683adeSsg70180 	 */
207334683adeSsg70180 	if (md_get_prop_val(mdp, node, macaddr_propname, &macaddr) != 0) {
207434683adeSsg70180 		cmn_err(CE_WARN, "!vsw%d: Unable to get MAC address from MD",
207534683adeSsg70180 		    vswp->instance);
207634683adeSsg70180 		goto fail_reconf;
207734683adeSsg70180 	} else {
207819b65a69Ssb155480 		uint64_t maddr = macaddr;
207934683adeSsg70180 		READ_ENTER(&vswp->if_lockrw);
208034683adeSsg70180 		for (i = ETHERADDRL - 1; i >= 0; i--) {
208119b65a69Ssb155480 			if (vswp->if_addr.ether_addr_octet[i]
208219b65a69Ssb155480 			    != (macaddr & 0xFF)) {
208334683adeSsg70180 				D2(vswp, "%s: octet[%d] 0x%x != 0x%x",
208434683adeSsg70180 				    __func__, i,
208534683adeSsg70180 				    vswp->if_addr.ether_addr_octet[i],
208634683adeSsg70180 				    (macaddr & 0xFF));
208734683adeSsg70180 				updated |= MD_macaddr;
208819b65a69Ssb155480 				macaddr = maddr;
208934683adeSsg70180 				break;
209034683adeSsg70180 			}
209134683adeSsg70180 			macaddr >>= 8;
209234683adeSsg70180 		}
209334683adeSsg70180 		RW_EXIT(&vswp->if_lockrw);
209419b65a69Ssb155480 		if (updated & MD_macaddr) {
209519b65a69Ssb155480 			vsw_save_lmacaddr(vswp, macaddr);
209619b65a69Ssb155480 		}
209734683adeSsg70180 	}
209834683adeSsg70180 
209934683adeSsg70180 	/*
210034683adeSsg70180 	 * Check if switching modes have changed.
210134683adeSsg70180 	 */
210219b65a69Ssb155480 	if (vsw_get_md_smodes(vswp, mdp, node,
210319b65a69Ssb155480 	    new_smode, &smode_num)) {
210434683adeSsg70180 		cmn_err(CE_WARN, "!vsw%d: Unable to read %s property from MD",
210534683adeSsg70180 		    vswp->instance, smode_propname);
210634683adeSsg70180 		goto fail_reconf;
210734683adeSsg70180 	} else {
210834683adeSsg70180 		ASSERT(smode_num != 0);
210934683adeSsg70180 		if (smode_num != vswp->smode_num) {
211034683adeSsg70180 			D2(vswp, "%s: number of modes changed from %d to %d",
211134683adeSsg70180 			    __func__, vswp->smode_num, smode_num);
211234683adeSsg70180 		}
211334683adeSsg70180 
211434683adeSsg70180 		for (i = 0; i < smode_num; i++) {
211534683adeSsg70180 			if (new_smode[i] != vswp->smode[i]) {
211634683adeSsg70180 				D2(vswp, "%s: mode changed from %d to %d",
211734683adeSsg70180 				    __func__, vswp->smode[i], new_smode[i]);
211834683adeSsg70180 				updated |= MD_smode;
211934683adeSsg70180 				break;
212034683adeSsg70180 			}
212134683adeSsg70180 		}
212234683adeSsg70180 	}
212334683adeSsg70180 
2124c1c61f44Ssb155480 	/* Read the vlan ids */
2125c1c61f44Ssb155480 	vsw_vlan_read_ids(vswp, VSW_LOCALDEV, mdp, node, &pvid, &vids,
2126c1c61f44Ssb155480 	    &nvids, NULL);
2127c1c61f44Ssb155480 
2128c1c61f44Ssb155480 	/* Determine if there are any vlan id updates */
2129c1c61f44Ssb155480 	if ((pvid != vswp->pvid) ||		/* pvid changed? */
2130c1c61f44Ssb155480 	    (nvids != vswp->nvids) ||		/* # of vids changed? */
2131c1c61f44Ssb155480 	    ((nvids != 0) && (vswp->nvids != 0) &&	/* vids changed? */
2132c1c61f44Ssb155480 	    bcmp(vids, vswp->vids, sizeof (uint16_t) * nvids))) {
2133c1c61f44Ssb155480 		updated |= MD_vlans;
2134c1c61f44Ssb155480 	}
2135c1c61f44Ssb155480 
21367b1f684aSSriharsha Basavapatna 	/* Read mtu */
21377b1f684aSSriharsha Basavapatna 	vsw_mtu_read(vswp, mdp, node, &mtu);
21387b1f684aSSriharsha Basavapatna 	if (mtu != vswp->mtu) {
21397b1f684aSSriharsha Basavapatna 		if (mtu >= ETHERMTU && mtu <= VNET_MAX_MTU) {
21407b1f684aSSriharsha Basavapatna 			updated |= MD_mtu;
21417b1f684aSSriharsha Basavapatna 		} else {
21427b1f684aSSriharsha Basavapatna 			cmn_err(CE_NOTE, "!vsw%d: Unable to process mtu update"
21437b1f684aSSriharsha Basavapatna 			    " as the specified value:%d is invalid\n",
21447b1f684aSSriharsha Basavapatna 			    vswp->instance, mtu);
21457b1f684aSSriharsha Basavapatna 		}
21467b1f684aSSriharsha Basavapatna 	}
21477b1f684aSSriharsha Basavapatna 
214834683adeSsg70180 	/*
214934683adeSsg70180 	 * Now make any changes which are needed...
215034683adeSsg70180 	 */
215134683adeSsg70180 
215234683adeSsg70180 	if (updated & (MD_physname | MD_smode)) {
215334683adeSsg70180 
215434683adeSsg70180 		/*
215519b65a69Ssb155480 		 * Stop any pending timeout to setup switching mode.
215634683adeSsg70180 		 */
215719b65a69Ssb155480 		vsw_stop_switching_timeout(vswp);
215819b65a69Ssb155480 
2159678453a8Sspeer 		/* Cleanup HybridIO */
2160678453a8Sspeer 		vsw_hio_cleanup(vswp);
2161678453a8Sspeer 
216219b65a69Ssb155480 		/*
216319b65a69Ssb155480 		 * Remove unicst, mcst addrs of vsw interface
216419b65a69Ssb155480 		 * and ports from the physdev.
216519b65a69Ssb155480 		 */
216619b65a69Ssb155480 		vsw_unset_addrs(vswp);
216719b65a69Ssb155480 
216819b65a69Ssb155480 		/*
216919b65a69Ssb155480 		 * Stop, detach and close the old device..
217019b65a69Ssb155480 		 */
21713c1bce15Swentaoy 		WRITE_ENTER(&vswp->mac_rwlock);
217219b65a69Ssb155480 
217334683adeSsg70180 		vsw_mac_detach(vswp);
217419b65a69Ssb155480 		vsw_mac_close(vswp);
217519b65a69Ssb155480 
21763c1bce15Swentaoy 		RW_EXIT(&vswp->mac_rwlock);
217734683adeSsg70180 
217834683adeSsg70180 		/*
217934683adeSsg70180 		 * Update phys name.
218034683adeSsg70180 		 */
218134683adeSsg70180 		if (updated & MD_physname) {
218234683adeSsg70180 			cmn_err(CE_NOTE, "!vsw%d: changing from %s to %s",
218334683adeSsg70180 			    vswp->instance, vswp->physname, physname);
218434683adeSsg70180 			(void) strncpy(vswp->physname,
218534683adeSsg70180 			    physname, strlen(physname) + 1);
218634683adeSsg70180 		}
218734683adeSsg70180 
218834683adeSsg70180 		/*
218934683adeSsg70180 		 * Update array with the new switch mode values.
219034683adeSsg70180 		 */
219134683adeSsg70180 		if (updated & MD_smode) {
219234683adeSsg70180 			for (i = 0; i < smode_num; i++)
219334683adeSsg70180 				vswp->smode[i] = new_smode[i];
219434683adeSsg70180 
219534683adeSsg70180 			vswp->smode_num = smode_num;
219634683adeSsg70180 			vswp->smode_idx = 0;
219734683adeSsg70180 		}
219834683adeSsg70180 
219934683adeSsg70180 		/*
220034683adeSsg70180 		 * ..and attach, start the new device.
220134683adeSsg70180 		 */
220219b65a69Ssb155480 		rv = vsw_setup_switching(vswp);
220319b65a69Ssb155480 		if (rv == EAGAIN) {
220419b65a69Ssb155480 			/*
220519b65a69Ssb155480 			 * Unable to setup switching mode.
220619b65a69Ssb155480 			 * As the error is EAGAIN, schedule a timeout to retry
220719b65a69Ssb155480 			 * and return. Programming addresses of ports and
220819b65a69Ssb155480 			 * vsw interface will be done when the timeout handler
220919b65a69Ssb155480 			 * completes successfully.
221019b65a69Ssb155480 			 */
221119b65a69Ssb155480 			mutex_enter(&vswp->swtmout_lock);
221219b65a69Ssb155480 
221319b65a69Ssb155480 			vswp->swtmout_enabled = B_TRUE;
221419b65a69Ssb155480 			vswp->swtmout_id =
221519b65a69Ssb155480 			    timeout(vsw_setup_switching_timeout, vswp,
221619b65a69Ssb155480 			    (vsw_setup_switching_delay *
221719b65a69Ssb155480 			    drv_usectohz(MICROSEC)));
221819b65a69Ssb155480 
221919b65a69Ssb155480 			mutex_exit(&vswp->swtmout_lock);
222019b65a69Ssb155480 
222119b65a69Ssb155480 			return;
222219b65a69Ssb155480 
222319b65a69Ssb155480 		} else if (rv) {
222434683adeSsg70180 			goto fail_update;
222519b65a69Ssb155480 		}
222634683adeSsg70180 
2227*71bdf936SWENTAO YANG 		vsw_setup_layer2_post_process(vswp);
222819b65a69Ssb155480 	} else if (updated & MD_macaddr) {
222919b65a69Ssb155480 		/*
223019b65a69Ssb155480 		 * We enter here if only MD_macaddr is exclusively updated.
223119b65a69Ssb155480 		 * If MD_physname and/or MD_smode are also updated, then
223219b65a69Ssb155480 		 * as part of that, we would have implicitly processed
223319b65a69Ssb155480 		 * MD_macaddr update (above).
223419b65a69Ssb155480 		 */
223534683adeSsg70180 		cmn_err(CE_NOTE, "!vsw%d: changing mac address to 0x%lx",
223634683adeSsg70180 		    vswp->instance, macaddr);
223734683adeSsg70180 
223819b65a69Ssb155480 		READ_ENTER(&vswp->if_lockrw);
223919b65a69Ssb155480 		if (vswp->if_state & VSW_IF_UP) {
224034683adeSsg70180 
22415f94e909Ssg70180 			mutex_enter(&vswp->hw_lock);
224219b65a69Ssb155480 			/*
224319b65a69Ssb155480 			 * Remove old mac address of vsw interface
224419b65a69Ssb155480 			 * from the physdev
224519b65a69Ssb155480 			 */
22465f94e909Ssg70180 			(void) vsw_unset_hw(vswp, NULL, VSW_LOCALDEV);
224719b65a69Ssb155480 			/*
224819b65a69Ssb155480 			 * Program new mac address of vsw interface
224919b65a69Ssb155480 			 * in the physdev
225019b65a69Ssb155480 			 */
225119b65a69Ssb155480 			rv = vsw_set_hw(vswp, NULL, VSW_LOCALDEV);
22525f94e909Ssg70180 			mutex_exit(&vswp->hw_lock);
225319b65a69Ssb155480 			if (rv != 0) {
225419b65a69Ssb155480 				cmn_err(CE_NOTE,
225519b65a69Ssb155480 				    "!vsw%d: failed to program interface "
225619b65a69Ssb155480 				    "unicast address\n", vswp->instance);
225719b65a69Ssb155480 			}
22585f94e909Ssg70180 			/*
225934683adeSsg70180 			 * Notify the MAC layer of the changed address.
226034683adeSsg70180 			 */
226119b65a69Ssb155480 			mac_unicst_update(vswp->if_mh,
226219b65a69Ssb155480 			    (uint8_t *)&vswp->if_addr);
226319b65a69Ssb155480 
226419b65a69Ssb155480 		}
226519b65a69Ssb155480 		RW_EXIT(&vswp->if_lockrw);
226619b65a69Ssb155480 
226734683adeSsg70180 	}
226834683adeSsg70180 
2269c1c61f44Ssb155480 	if (updated & MD_vlans) {
2270c1c61f44Ssb155480 		/* Remove existing vlan ids from the hash table. */
2271c1c61f44Ssb155480 		vsw_vlan_remove_ids(vswp, VSW_LOCALDEV);
2272c1c61f44Ssb155480 
2273c1c61f44Ssb155480 		/* save the new vlan ids */
2274c1c61f44Ssb155480 		vswp->pvid = pvid;
2275c1c61f44Ssb155480 		if (vswp->nvids != 0) {
2276c1c61f44Ssb155480 			kmem_free(vswp->vids, sizeof (uint16_t) * vswp->nvids);
2277c1c61f44Ssb155480 			vswp->nvids = 0;
2278c1c61f44Ssb155480 		}
2279c1c61f44Ssb155480 		if (nvids != 0) {
2280c1c61f44Ssb155480 			vswp->nvids = nvids;
2281c1c61f44Ssb155480 			vswp->vids = vids;
2282c1c61f44Ssb155480 		}
2283c1c61f44Ssb155480 
2284c1c61f44Ssb155480 		/* add these new vlan ids into hash table */
2285c1c61f44Ssb155480 		vsw_vlan_add_ids(vswp, VSW_LOCALDEV);
2286c1c61f44Ssb155480 	} else {
2287c1c61f44Ssb155480 		if (nvids != 0) {
2288c1c61f44Ssb155480 			kmem_free(vids, sizeof (uint16_t) * nvids);
2289c1c61f44Ssb155480 		}
2290c1c61f44Ssb155480 	}
2291c1c61f44Ssb155480 
22927b1f684aSSriharsha Basavapatna 	if (updated & MD_mtu) {
22937b1f684aSSriharsha Basavapatna 
22947b1f684aSSriharsha Basavapatna 		rv = vsw_mtu_update(vswp, mtu);
22957b1f684aSSriharsha Basavapatna 		if (rv != 0) {
22967b1f684aSSriharsha Basavapatna 			goto fail_update;
22977b1f684aSSriharsha Basavapatna 		}
22987b1f684aSSriharsha Basavapatna 
22997b1f684aSSriharsha Basavapatna 	}
23007b1f684aSSriharsha Basavapatna 
230134683adeSsg70180 	return;
230234683adeSsg70180 
230334683adeSsg70180 fail_reconf:
230434683adeSsg70180 	cmn_err(CE_WARN, "!vsw%d: configuration unchanged", vswp->instance);
230534683adeSsg70180 	return;
230634683adeSsg70180 
230734683adeSsg70180 fail_update:
23081ef0bbb5Snarayan 	cmn_err(CE_WARN, "!vsw%d: re-configuration failed",
230934683adeSsg70180 	    vswp->instance);
231034683adeSsg70180 }
231134683adeSsg70180 
231234683adeSsg70180 /*
2313c1c61f44Ssb155480  * Read the port's md properties.
23141ae08745Sheppo  */
2315c1c61f44Ssb155480 static int
2316c1c61f44Ssb155480 vsw_port_read_props(vsw_port_t *portp, vsw_t *vswp,
2317c1c61f44Ssb155480 	md_t *mdp, mde_cookie_t *node)
23181ae08745Sheppo {
23191ae08745Sheppo 	uint64_t		ldc_id;
23201ae08745Sheppo 	uint8_t			*addrp;
23211ae08745Sheppo 	int			i, addrsz;
23221ae08745Sheppo 	int			num_nodes = 0, nchan = 0;
23231ae08745Sheppo 	int			listsz = 0;
23241ae08745Sheppo 	mde_cookie_t		*listp = NULL;
23251ae08745Sheppo 	struct ether_addr	ea;
23261ae08745Sheppo 	uint64_t		macaddr;
23271ae08745Sheppo 	uint64_t		inst = 0;
2328678453a8Sspeer 	uint64_t		val;
23291ae08745Sheppo 
23301ae08745Sheppo 	if (md_get_prop_val(mdp, *node, id_propname, &inst)) {
23311ae08745Sheppo 		DWARN(vswp, "%s: prop(%s) not found", __func__,
23321ae08745Sheppo 		    id_propname);
23331ae08745Sheppo 		return (1);
23341ae08745Sheppo 	}
23351ae08745Sheppo 
23361ae08745Sheppo 	/*
23371ae08745Sheppo 	 * Find the channel endpoint node(s) (which should be under this
23381ae08745Sheppo 	 * port node) which contain the channel id(s).
23391ae08745Sheppo 	 */
23401ae08745Sheppo 	if ((num_nodes = md_node_count(mdp)) <= 0) {
23411ae08745Sheppo 		DERR(vswp, "%s: invalid number of nodes found (%d)",
23421ae08745Sheppo 		    __func__, num_nodes);
23431ae08745Sheppo 		return (1);
23441ae08745Sheppo 	}
23451ae08745Sheppo 
234634683adeSsg70180 	D2(vswp, "%s: %d nodes found", __func__, num_nodes);
234734683adeSsg70180 
23481ae08745Sheppo 	/* allocate enough space for node list */
23491ae08745Sheppo 	listsz = num_nodes * sizeof (mde_cookie_t);
23501ae08745Sheppo 	listp = kmem_zalloc(listsz, KM_SLEEP);
23511ae08745Sheppo 
2352205eeb1aSlm66018 	nchan = md_scan_dag(mdp, *node, md_find_name(mdp, chan_propname),
23531ae08745Sheppo 	    md_find_name(mdp, "fwd"), listp);
23541ae08745Sheppo 
23551ae08745Sheppo 	if (nchan <= 0) {
23561ae08745Sheppo 		DWARN(vswp, "%s: no %s nodes found", __func__, chan_propname);
23571ae08745Sheppo 		kmem_free(listp, listsz);
23581ae08745Sheppo 		return (1);
23591ae08745Sheppo 	}
23601ae08745Sheppo 
23611ae08745Sheppo 	D2(vswp, "%s: %d %s nodes found", __func__, nchan, chan_propname);
23621ae08745Sheppo 
23631ae08745Sheppo 	/* use property from first node found */
23641ae08745Sheppo 	if (md_get_prop_val(mdp, listp[0], id_propname, &ldc_id)) {
23651ae08745Sheppo 		DWARN(vswp, "%s: prop(%s) not found\n", __func__,
23661ae08745Sheppo 		    id_propname);
23671ae08745Sheppo 		kmem_free(listp, listsz);
23681ae08745Sheppo 		return (1);
23691ae08745Sheppo 	}
23701ae08745Sheppo 
23711ae08745Sheppo 	/* don't need list any more */
23721ae08745Sheppo 	kmem_free(listp, listsz);
23731ae08745Sheppo 
23741ae08745Sheppo 	D2(vswp, "%s: ldc_id 0x%llx", __func__, ldc_id);
23751ae08745Sheppo 
23761ae08745Sheppo 	/* read mac-address property */
23771ae08745Sheppo 	if (md_get_prop_data(mdp, *node, remaddr_propname,
23781ae08745Sheppo 	    &addrp, &addrsz)) {
23791ae08745Sheppo 		DWARN(vswp, "%s: prop(%s) not found",
23801ae08745Sheppo 		    __func__, remaddr_propname);
23811ae08745Sheppo 		return (1);
23821ae08745Sheppo 	}
23831ae08745Sheppo 
23841ae08745Sheppo 	if (addrsz < ETHERADDRL) {
23851ae08745Sheppo 		DWARN(vswp, "%s: invalid address size", __func__);
23861ae08745Sheppo 		return (1);
23871ae08745Sheppo 	}
23881ae08745Sheppo 
23891ae08745Sheppo 	macaddr = *((uint64_t *)addrp);
23901ae08745Sheppo 	D2(vswp, "%s: remote mac address 0x%llx", __func__, macaddr);
23911ae08745Sheppo 
23921ae08745Sheppo 	for (i = ETHERADDRL - 1; i >= 0; i--) {
23931ae08745Sheppo 		ea.ether_addr_octet[i] = macaddr & 0xFF;
23941ae08745Sheppo 		macaddr >>= 8;
23951ae08745Sheppo 	}
23961ae08745Sheppo 
2397c1c61f44Ssb155480 	/* now update all properties into the port */
2398c1c61f44Ssb155480 	portp->p_vswp = vswp;
2399c1c61f44Ssb155480 	portp->p_instance = inst;
2400c1c61f44Ssb155480 	portp->addr_set = VSW_ADDR_UNSET;
2401c1c61f44Ssb155480 	ether_copy(&ea, &portp->p_macaddr);
2402c1c61f44Ssb155480 	if (nchan > VSW_PORT_MAX_LDCS) {
2403c1c61f44Ssb155480 		D2(vswp, "%s: using first of %d ldc ids",
2404c1c61f44Ssb155480 		    __func__, nchan);
2405c1c61f44Ssb155480 		nchan = VSW_PORT_MAX_LDCS;
2406c1c61f44Ssb155480 	}
2407c1c61f44Ssb155480 	portp->num_ldcs = nchan;
2408c1c61f44Ssb155480 	portp->ldc_ids =
2409c1c61f44Ssb155480 	    kmem_zalloc(sizeof (uint64_t) * nchan, KM_SLEEP);
2410c1c61f44Ssb155480 	bcopy(&ldc_id, (portp->ldc_ids), sizeof (uint64_t) * nchan);
2411c1c61f44Ssb155480 
2412c1c61f44Ssb155480 	/* read vlan id properties of this port node */
2413c1c61f44Ssb155480 	vsw_vlan_read_ids(portp, VSW_VNETPORT, mdp, *node, &portp->pvid,
2414c1c61f44Ssb155480 	    &portp->vids, &portp->nvids, NULL);
2415c1c61f44Ssb155480 
2416678453a8Sspeer 	/* Check if hybrid property is present */
2417678453a8Sspeer 	if (md_get_prop_val(mdp, *node, hybrid_propname, &val) == 0) {
2418678453a8Sspeer 		D1(vswp, "%s: prop(%s) found\n", __func__, hybrid_propname);
2419678453a8Sspeer 		portp->p_hio_enabled = B_TRUE;
2420678453a8Sspeer 	} else {
2421678453a8Sspeer 		portp->p_hio_enabled = B_FALSE;
2422678453a8Sspeer 	}
2423678453a8Sspeer 	/*
2424678453a8Sspeer 	 * Port hio capability determined after version
2425678453a8Sspeer 	 * negotiation, i.e., when we know the peer is HybridIO capable.
2426678453a8Sspeer 	 */
2427678453a8Sspeer 	portp->p_hio_capable = B_FALSE;
2428c1c61f44Ssb155480 	return (0);
2429c1c61f44Ssb155480 }
2430c1c61f44Ssb155480 
2431c1c61f44Ssb155480 /*
2432c1c61f44Ssb155480  * Add a new port to the system.
2433c1c61f44Ssb155480  *
2434c1c61f44Ssb155480  * Returns 0 on success, 1 on failure.
2435c1c61f44Ssb155480  */
2436c1c61f44Ssb155480 int
2437c1c61f44Ssb155480 vsw_port_add(vsw_t *vswp, md_t *mdp, mde_cookie_t *node)
2438c1c61f44Ssb155480 {
2439c1c61f44Ssb155480 	vsw_port_t	*portp;
2440c1c61f44Ssb155480 	int		rv;
2441c1c61f44Ssb155480 
2442c1c61f44Ssb155480 	portp = kmem_zalloc(sizeof (vsw_port_t), KM_SLEEP);
2443c1c61f44Ssb155480 
2444c1c61f44Ssb155480 	rv = vsw_port_read_props(portp, vswp, mdp, node);
2445c1c61f44Ssb155480 	if (rv != 0) {
2446c1c61f44Ssb155480 		kmem_free(portp, sizeof (*portp));
2447c1c61f44Ssb155480 		return (1);
2448c1c61f44Ssb155480 	}
2449c1c61f44Ssb155480 
2450c1c61f44Ssb155480 	rv = vsw_port_attach(portp);
2451c1c61f44Ssb155480 	if (rv != 0) {
24521ae08745Sheppo 		DERR(vswp, "%s: failed to attach port", __func__);
24531ae08745Sheppo 		return (1);
24541ae08745Sheppo 	}
24551ae08745Sheppo 
2456c1c61f44Ssb155480 	return (0);
2457c1c61f44Ssb155480 }
24581ae08745Sheppo 
2459c1c61f44Ssb155480 static int
2460c1c61f44Ssb155480 vsw_port_update(vsw_t *vswp, md_t *curr_mdp, mde_cookie_t curr_mdex,
2461c1c61f44Ssb155480 	md_t *prev_mdp, mde_cookie_t prev_mdex)
2462c1c61f44Ssb155480 {
2463c1c61f44Ssb155480 	uint64_t	cport_num;
2464c1c61f44Ssb155480 	uint64_t	pport_num;
2465c1c61f44Ssb155480 	vsw_port_list_t	*plistp;
2466c1c61f44Ssb155480 	vsw_port_t	*portp;
2467c1c61f44Ssb155480 	boolean_t	updated_vlans = B_FALSE;
2468c1c61f44Ssb155480 	uint16_t	pvid;
2469c1c61f44Ssb155480 	uint16_t	*vids;
2470c1c61f44Ssb155480 	uint16_t	nvids;
2471678453a8Sspeer 	uint64_t	val;
2472678453a8Sspeer 	boolean_t	hio_enabled = B_FALSE;
2473c1c61f44Ssb155480 
2474c1c61f44Ssb155480 	/*
2475c1c61f44Ssb155480 	 * For now, we get port updates only if vlan ids changed.
2476c1c61f44Ssb155480 	 * We read the port num and do some sanity check.
2477c1c61f44Ssb155480 	 */
2478c1c61f44Ssb155480 	if (md_get_prop_val(curr_mdp, curr_mdex, id_propname, &cport_num)) {
2479c1c61f44Ssb155480 		return (1);
2480c1c61f44Ssb155480 	}
2481c1c61f44Ssb155480 
2482c1c61f44Ssb155480 	if (md_get_prop_val(prev_mdp, prev_mdex, id_propname, &pport_num)) {
2483c1c61f44Ssb155480 		return (1);
2484c1c61f44Ssb155480 	}
2485c1c61f44Ssb155480 	if (cport_num != pport_num)
2486c1c61f44Ssb155480 		return (1);
2487c1c61f44Ssb155480 
2488c1c61f44Ssb155480 	plistp = &(vswp->plist);
2489c1c61f44Ssb155480 
2490c1c61f44Ssb155480 	READ_ENTER(&plistp->lockrw);
2491c1c61f44Ssb155480 
2492c1c61f44Ssb155480 	portp = vsw_lookup_port(vswp, cport_num);
2493c1c61f44Ssb155480 	if (portp == NULL) {
2494c1c61f44Ssb155480 		RW_EXIT(&plistp->lockrw);
2495c1c61f44Ssb155480 		return (1);
2496c1c61f44Ssb155480 	}
2497c1c61f44Ssb155480 
2498c1c61f44Ssb155480 	/* Read the vlan ids */
2499c1c61f44Ssb155480 	vsw_vlan_read_ids(portp, VSW_VNETPORT, curr_mdp, curr_mdex, &pvid,
2500c1c61f44Ssb155480 	    &vids, &nvids, NULL);
2501c1c61f44Ssb155480 
2502c1c61f44Ssb155480 	/* Determine if there are any vlan id updates */
2503c1c61f44Ssb155480 	if ((pvid != portp->pvid) ||		/* pvid changed? */
2504c1c61f44Ssb155480 	    (nvids != portp->nvids) ||		/* # of vids changed? */
2505c1c61f44Ssb155480 	    ((nvids != 0) && (portp->nvids != 0) &&	/* vids changed? */
2506c1c61f44Ssb155480 	    bcmp(vids, portp->vids, sizeof (uint16_t) * nvids))) {
2507c1c61f44Ssb155480 		updated_vlans = B_TRUE;
2508c1c61f44Ssb155480 	}
2509c1c61f44Ssb155480 
2510678453a8Sspeer 	if (updated_vlans == B_TRUE) {
2511c1c61f44Ssb155480 
2512c1c61f44Ssb155480 		/* Remove existing vlan ids from the hash table. */
2513c1c61f44Ssb155480 		vsw_vlan_remove_ids(portp, VSW_VNETPORT);
2514c1c61f44Ssb155480 
2515c1c61f44Ssb155480 		/* save the new vlan ids */
2516c1c61f44Ssb155480 		portp->pvid = pvid;
2517c1c61f44Ssb155480 		if (portp->nvids != 0) {
2518678453a8Sspeer 			kmem_free(portp->vids,
2519678453a8Sspeer 			    sizeof (uint16_t) * portp->nvids);
2520c1c61f44Ssb155480 			portp->nvids = 0;
2521c1c61f44Ssb155480 		}
2522c1c61f44Ssb155480 		if (nvids != 0) {
2523678453a8Sspeer 			portp->vids = kmem_zalloc(sizeof (uint16_t) *
2524678453a8Sspeer 			    nvids, KM_SLEEP);
2525c1c61f44Ssb155480 			bcopy(vids, portp->vids, sizeof (uint16_t) * nvids);
2526c1c61f44Ssb155480 			portp->nvids = nvids;
2527c1c61f44Ssb155480 			kmem_free(vids, sizeof (uint16_t) * nvids);
2528c1c61f44Ssb155480 		}
2529c1c61f44Ssb155480 
2530c1c61f44Ssb155480 		/* add these new vlan ids into hash table */
2531c1c61f44Ssb155480 		vsw_vlan_add_ids(portp, VSW_VNETPORT);
2532c1c61f44Ssb155480 
2533c1c61f44Ssb155480 		/* reset the port if it is vlan unaware (ver < 1.3) */
2534c1c61f44Ssb155480 		vsw_vlan_unaware_port_reset(portp);
2535678453a8Sspeer 	}
2536678453a8Sspeer 
2537678453a8Sspeer 	/* Check if hybrid property is present */
2538678453a8Sspeer 	if (md_get_prop_val(curr_mdp, curr_mdex, hybrid_propname, &val) == 0) {
2539678453a8Sspeer 		D1(vswp, "%s: prop(%s) found\n", __func__, hybrid_propname);
2540678453a8Sspeer 		hio_enabled = B_TRUE;
2541678453a8Sspeer 	}
2542678453a8Sspeer 
2543678453a8Sspeer 	if (portp->p_hio_enabled != hio_enabled) {
2544678453a8Sspeer 		vsw_hio_port_update(portp, hio_enabled);
2545678453a8Sspeer 	}
2546c1c61f44Ssb155480 
2547c1c61f44Ssb155480 	RW_EXIT(&plistp->lockrw);
25481ae08745Sheppo 
25491ae08745Sheppo 	return (0);
25501ae08745Sheppo }
25511ae08745Sheppo 
25521ae08745Sheppo /*
255306db247cSraghuram  * vsw_mac_rx -- A common function to send packets to the interface.
255406db247cSraghuram  * By default this function check if the interface is UP or not, the
255506db247cSraghuram  * rest of the behaviour depends on the flags as below:
25561ae08745Sheppo  *
255706db247cSraghuram  *	VSW_MACRX_PROMISC -- Check if the promisc mode set or not.
255806db247cSraghuram  *	VSW_MACRX_COPYMSG -- Make a copy of the message(s).
255906db247cSraghuram  *	VSW_MACRX_FREEMSG -- Free if the messages cannot be sent up the stack.
25601ae08745Sheppo  */
25611ae08745Sheppo void
2562f0ca1d9aSsb155480 vsw_mac_rx(vsw_t *vswp, mac_resource_handle_t mrh,
2563f0ca1d9aSsb155480     mblk_t *mp, vsw_macrx_flags_t flags)
25641ae08745Sheppo {
2565c1c61f44Ssb155480 	mblk_t		*mpt;
2566c1c61f44Ssb155480 
256706db247cSraghuram 	D1(vswp, "%s:enter\n", __func__);
25681ae08745Sheppo 	READ_ENTER(&vswp->if_lockrw);
256906db247cSraghuram 	/* Check if the interface is up */
257006db247cSraghuram 	if (!(vswp->if_state & VSW_IF_UP)) {
25711ae08745Sheppo 		RW_EXIT(&vswp->if_lockrw);
257206db247cSraghuram 		/* Free messages only if FREEMSG flag specified */
257306db247cSraghuram 		if (flags & VSW_MACRX_FREEMSG) {
257406db247cSraghuram 			freemsgchain(mp);
257506db247cSraghuram 		}
257606db247cSraghuram 		D1(vswp, "%s:exit\n", __func__);
257706db247cSraghuram 		return;
257806db247cSraghuram 	}
257906db247cSraghuram 	/*
258006db247cSraghuram 	 * If PROMISC flag is passed, then check if
258106db247cSraghuram 	 * the interface is in the PROMISC mode.
258206db247cSraghuram 	 * If not, drop the messages.
258306db247cSraghuram 	 */
258406db247cSraghuram 	if (flags & VSW_MACRX_PROMISC) {
258506db247cSraghuram 		if (!(vswp->if_state & VSW_IF_PROMISC)) {
258606db247cSraghuram 			RW_EXIT(&vswp->if_lockrw);
258706db247cSraghuram 			/* Free messages only if FREEMSG flag specified */
258806db247cSraghuram 			if (flags & VSW_MACRX_FREEMSG) {
258906db247cSraghuram 				freemsgchain(mp);
259006db247cSraghuram 			}
259106db247cSraghuram 			D1(vswp, "%s:exit\n", __func__);
259206db247cSraghuram 			return;
259306db247cSraghuram 		}
259406db247cSraghuram 	}
259506db247cSraghuram 	RW_EXIT(&vswp->if_lockrw);
259606db247cSraghuram 	/*
259706db247cSraghuram 	 * If COPYMSG flag is passed, then make a copy
259806db247cSraghuram 	 * of the message chain and send up the copy.
259906db247cSraghuram 	 */
260006db247cSraghuram 	if (flags & VSW_MACRX_COPYMSG) {
260106db247cSraghuram 		mp = copymsgchain(mp);
2602f0ca1d9aSsb155480 		if (mp == NULL) {
260306db247cSraghuram 			D1(vswp, "%s:exit\n", __func__);
260406db247cSraghuram 			return;
260506db247cSraghuram 		}
260606db247cSraghuram 	}
260706db247cSraghuram 
2608f0ca1d9aSsb155480 	D2(vswp, "%s: sending up stack", __func__);
2609c1c61f44Ssb155480 
2610c1c61f44Ssb155480 	mpt = NULL;
2611c1c61f44Ssb155480 	(void) vsw_vlan_frame_untag(vswp, VSW_LOCALDEV, &mp, &mpt);
2612c1c61f44Ssb155480 	if (mp != NULL) {
2613ba2e4443Sseb 		mac_rx(vswp->if_mh, mrh, mp);
2614c1c61f44Ssb155480 	}
261506db247cSraghuram 	D1(vswp, "%s:exit\n", __func__);
26161ae08745Sheppo }
26171ae08745Sheppo 
261806db247cSraghuram /* copy mac address of vsw into soft state structure */
26191ae08745Sheppo static void
262006db247cSraghuram vsw_save_lmacaddr(vsw_t *vswp, uint64_t macaddr)
26211ae08745Sheppo {
26221ae08745Sheppo 	int	i;
26231ae08745Sheppo 
262406db247cSraghuram 	WRITE_ENTER(&vswp->if_lockrw);
262506db247cSraghuram 	for (i = ETHERADDRL - 1; i >= 0; i--) {
262606db247cSraghuram 		vswp->if_addr.ether_addr_octet[i] = macaddr & 0xFF;
262706db247cSraghuram 		macaddr >>= 8;
26281ae08745Sheppo 	}
262906db247cSraghuram 	RW_EXIT(&vswp->if_lockrw);
26301ae08745Sheppo }
2631