11ae08745Sheppo /* 21ae08745Sheppo * CDDL HEADER START 31ae08745Sheppo * 41ae08745Sheppo * The contents of this file are subject to the terms of the 51ae08745Sheppo * Common Development and Distribution License (the "License"). 61ae08745Sheppo * You may not use this file except in compliance with the License. 71ae08745Sheppo * 81ae08745Sheppo * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 91ae08745Sheppo * or http://www.opensolaris.org/os/licensing. 101ae08745Sheppo * See the License for the specific language governing permissions 111ae08745Sheppo * and limitations under the License. 121ae08745Sheppo * 131ae08745Sheppo * When distributing Covered Code, include this CDDL HEADER in each 141ae08745Sheppo * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 151ae08745Sheppo * If applicable, add the following below this CDDL HEADER, with the 161ae08745Sheppo * fields enclosed by brackets "[]" replaced with your own identifying 171ae08745Sheppo * information: Portions Copyright [yyyy] [name of copyright owner] 181ae08745Sheppo * 191ae08745Sheppo * CDDL HEADER END 201ae08745Sheppo */ 211ae08745Sheppo 221ae08745Sheppo /* 23*6f09f0feSWENTAO YANG * Copyright 2009 Sun Microsystems, Inc. All rights reserved. 241ae08745Sheppo * Use is subject to license terms. 251ae08745Sheppo */ 261ae08745Sheppo 271ae08745Sheppo #include <sys/types.h> 281ae08745Sheppo #include <sys/errno.h> 291ae08745Sheppo #include <sys/debug.h> 301ae08745Sheppo #include <sys/time.h> 311ae08745Sheppo #include <sys/sysmacros.h> 321ae08745Sheppo #include <sys/systm.h> 331ae08745Sheppo #include <sys/user.h> 341ae08745Sheppo #include <sys/stropts.h> 351ae08745Sheppo #include <sys/stream.h> 361ae08745Sheppo #include <sys/strlog.h> 371ae08745Sheppo #include <sys/strsubr.h> 381ae08745Sheppo #include <sys/cmn_err.h> 391ae08745Sheppo #include <sys/cpu.h> 401ae08745Sheppo #include <sys/kmem.h> 411ae08745Sheppo #include <sys/conf.h> 421ae08745Sheppo #include <sys/ddi.h> 431ae08745Sheppo #include <sys/sunddi.h> 441ae08745Sheppo #include <sys/ksynch.h> 451ae08745Sheppo #include <sys/stat.h> 461ae08745Sheppo #include <sys/kstat.h> 471ae08745Sheppo #include <sys/vtrace.h> 481ae08745Sheppo #include <sys/strsun.h> 491ae08745Sheppo #include <sys/dlpi.h> 501ae08745Sheppo #include <sys/ethernet.h> 511ae08745Sheppo #include <net/if.h> 521ae08745Sheppo #include <sys/varargs.h> 531ae08745Sheppo #include <sys/machsystm.h> 541ae08745Sheppo #include <sys/modctl.h> 551ae08745Sheppo #include <sys/modhash.h> 56da14cebeSEric Cheng #include <sys/mac_provider.h> 57ba2e4443Sseb #include <sys/mac_ether.h> 581ae08745Sheppo #include <sys/taskq.h> 591ae08745Sheppo #include <sys/note.h> 601ae08745Sheppo #include <sys/mach_descrip.h> 61da14cebeSEric Cheng #include <sys/mac_provider.h> 621ae08745Sheppo #include <sys/mdeg.h> 631ae08745Sheppo #include <sys/ldc.h> 641ae08745Sheppo #include <sys/vsw_fdb.h> 651ae08745Sheppo #include <sys/vsw.h> 661ae08745Sheppo #include <sys/vio_mailbox.h> 671ae08745Sheppo #include <sys/vnet_mailbox.h> 681ae08745Sheppo #include <sys/vnet_common.h> 69d10e4ef2Snarayan #include <sys/vio_util.h> 70d10e4ef2Snarayan #include <sys/sdt.h> 7119b65a69Ssb155480 #include <sys/atomic.h> 7206db247cSraghuram #include <sys/callb.h> 73c1c61f44Ssb155480 #include <sys/vlan.h> 741ae08745Sheppo 751ae08745Sheppo /* 761ae08745Sheppo * Function prototypes. 771ae08745Sheppo */ 781ae08745Sheppo static int vsw_attach(dev_info_t *, ddi_attach_cmd_t); 791ae08745Sheppo static int vsw_detach(dev_info_t *, ddi_detach_cmd_t); 80*6f09f0feSWENTAO YANG static int vsw_unattach(vsw_t *vswp); 8134683adeSsg70180 static int vsw_get_md_physname(vsw_t *, md_t *, mde_cookie_t, char *); 82da14cebeSEric Cheng static int vsw_get_md_smodes(vsw_t *, md_t *, mde_cookie_t, uint8_t *); 83*6f09f0feSWENTAO YANG static int vsw_mod_cleanup(void); 841ae08745Sheppo 851ae08745Sheppo /* MDEG routines */ 8634683adeSsg70180 static int vsw_mdeg_register(vsw_t *vswp); 871ae08745Sheppo static void vsw_mdeg_unregister(vsw_t *vswp); 881ae08745Sheppo static int vsw_mdeg_cb(void *cb_argp, mdeg_result_t *); 8934683adeSsg70180 static int vsw_port_mdeg_cb(void *cb_argp, mdeg_result_t *); 9019b65a69Ssb155480 static int vsw_get_initial_md_properties(vsw_t *vswp, md_t *, mde_cookie_t); 91c1c61f44Ssb155480 static int vsw_read_mdprops(vsw_t *vswp); 92c1c61f44Ssb155480 static void vsw_vlan_read_ids(void *arg, int type, md_t *mdp, 93da14cebeSEric Cheng mde_cookie_t node, uint16_t *pvidp, vsw_vlanid_t **vidspp, 94c1c61f44Ssb155480 uint16_t *nvidsp, uint16_t *default_idp); 95c1c61f44Ssb155480 static int vsw_port_read_props(vsw_port_t *portp, vsw_t *vswp, 96c1c61f44Ssb155480 md_t *mdp, mde_cookie_t *node); 97f0ca1d9aSsb155480 static void vsw_read_pri_eth_types(vsw_t *vswp, md_t *mdp, 98f0ca1d9aSsb155480 mde_cookie_t node); 997b1f684aSSriharsha Basavapatna static void vsw_mtu_read(vsw_t *vswp, md_t *mdp, mde_cookie_t node, 1007b1f684aSSriharsha Basavapatna uint32_t *mtu); 1017b1f684aSSriharsha Basavapatna static int vsw_mtu_update(vsw_t *vswp, uint32_t mtu); 10234683adeSsg70180 static void vsw_update_md_prop(vsw_t *, md_t *, mde_cookie_t); 10319b65a69Ssb155480 static void vsw_save_lmacaddr(vsw_t *vswp, uint64_t macaddr); 104da14cebeSEric Cheng static boolean_t vsw_cmp_vids(vsw_vlanid_t *vids1, 105da14cebeSEric Cheng vsw_vlanid_t *vids2, int nvids); 1061ae08745Sheppo 10706db247cSraghuram /* Mac driver related routines */ 10806db247cSraghuram static int vsw_mac_register(vsw_t *); 10906db247cSraghuram static int vsw_mac_unregister(vsw_t *); 11006db247cSraghuram static int vsw_m_stat(void *, uint_t, uint64_t *); 11106db247cSraghuram static void vsw_m_stop(void *arg); 11206db247cSraghuram static int vsw_m_start(void *arg); 11306db247cSraghuram static int vsw_m_unicst(void *arg, const uint8_t *); 11406db247cSraghuram static int vsw_m_multicst(void *arg, boolean_t, const uint8_t *); 11506db247cSraghuram static int vsw_m_promisc(void *arg, boolean_t); 11606db247cSraghuram static mblk_t *vsw_m_tx(void *arg, mblk_t *); 117f0ca1d9aSsb155480 void vsw_mac_rx(vsw_t *vswp, mac_resource_handle_t mrh, 118f0ca1d9aSsb155480 mblk_t *mp, vsw_macrx_flags_t flags); 1191ae08745Sheppo 12006db247cSraghuram /* 12106db247cSraghuram * Functions imported from other files. 12206db247cSraghuram */ 123808f26a8SSriharsha Basavapatna extern void vsw_setup_switching_thread(void *arg); 124808f26a8SSriharsha Basavapatna extern int vsw_setup_switching_start(vsw_t *vswp); 125808f26a8SSriharsha Basavapatna extern void vsw_setup_switching_stop(vsw_t *vswp); 12606db247cSraghuram extern int vsw_setup_switching(vsw_t *); 1277a327842Swentaoy extern void vsw_switch_frame_nop(vsw_t *vswp, mblk_t *mp, int caller, 1287a327842Swentaoy vsw_port_t *port, mac_resource_handle_t mrh); 12906db247cSraghuram extern int vsw_add_mcst(vsw_t *, uint8_t, uint64_t, void *); 13006db247cSraghuram extern int vsw_del_mcst(vsw_t *, uint8_t, uint64_t, void *); 13106db247cSraghuram extern void vsw_del_mcst_vsw(vsw_t *); 13206db247cSraghuram extern mcst_addr_t *vsw_del_addr(uint8_t devtype, void *arg, uint64_t addr); 133*6f09f0feSWENTAO YANG extern void vsw_detach_ports(vsw_t *vswp); 13406db247cSraghuram extern int vsw_port_add(vsw_t *vswp, md_t *mdp, mde_cookie_t *node); 13506db247cSraghuram extern int vsw_port_detach(vsw_t *vswp, int p_instance); 136c1c61f44Ssb155480 static int vsw_port_update(vsw_t *vswp, md_t *curr_mdp, mde_cookie_t curr_mdex, 137c1c61f44Ssb155480 md_t *prev_mdp, mde_cookie_t prev_mdex); 138c1c61f44Ssb155480 extern int vsw_port_attach(vsw_port_t *port); 13906db247cSraghuram extern vsw_port_t *vsw_lookup_port(vsw_t *vswp, int p_instance); 14006db247cSraghuram extern int vsw_mac_open(vsw_t *vswp); 14106db247cSraghuram extern void vsw_mac_close(vsw_t *vswp); 142da14cebeSEric Cheng extern void vsw_mac_cleanup_ports(vsw_t *vswp); 14306db247cSraghuram extern void vsw_unset_addrs(vsw_t *vswp); 14471bdf936SWENTAO YANG extern void vsw_setup_layer2_post_process(vsw_t *vswp); 145c1c61f44Ssb155480 extern void vsw_create_vlans(void *arg, int type); 146c1c61f44Ssb155480 extern void vsw_destroy_vlans(void *arg, int type); 147c1c61f44Ssb155480 extern void vsw_vlan_add_ids(void *arg, int type); 148c1c61f44Ssb155480 extern void vsw_vlan_remove_ids(void *arg, int type); 149c1c61f44Ssb155480 extern void vsw_vlan_unaware_port_reset(vsw_port_t *portp); 150c1c61f44Ssb155480 extern uint32_t vsw_vlan_frame_untag(void *arg, int type, mblk_t **np, 151c1c61f44Ssb155480 mblk_t **npt); 152c1c61f44Ssb155480 extern mblk_t *vsw_vlan_frame_pretag(void *arg, int type, mblk_t *mp); 153678453a8Sspeer extern void vsw_hio_cleanup(vsw_t *vswp); 154da14cebeSEric Cheng extern void vsw_hio_start_ports(vsw_t *vswp); 155da14cebeSEric Cheng extern void vsw_hio_port_update(vsw_port_t *portp, boolean_t hio_enabled); 156da14cebeSEric Cheng extern int vsw_mac_multicast_add(vsw_t *, vsw_port_t *, mcst_addr_t *, int); 157da14cebeSEric Cheng extern void vsw_mac_multicast_remove(vsw_t *, vsw_port_t *, mcst_addr_t *, int); 158da14cebeSEric Cheng extern void vsw_mac_port_reconfig_vlans(vsw_port_t *portp, uint16_t new_pvid, 159da14cebeSEric Cheng vsw_vlanid_t *new_vids, int new_nvids); 160da14cebeSEric Cheng extern int vsw_mac_client_init(vsw_t *vswp, vsw_port_t *port, int type); 161da14cebeSEric Cheng extern void vsw_mac_client_cleanup(vsw_t *vswp, vsw_port_t *port, int type); 162da14cebeSEric Cheng extern void vsw_if_mac_reconfig(vsw_t *vswp, boolean_t update_vlans, 163da14cebeSEric Cheng uint16_t new_pvid, vsw_vlanid_t *new_vids, int new_nvids); 1647b1f684aSSriharsha Basavapatna extern void vsw_reset_ports(vsw_t *vswp); 1657b1f684aSSriharsha Basavapatna extern void vsw_port_reset(vsw_port_t *portp); 166678453a8Sspeer void vsw_hio_port_update(vsw_port_t *portp, boolean_t hio_enabled); 16706db247cSraghuram 16806db247cSraghuram /* 16906db247cSraghuram * Internal tunables. 17006db247cSraghuram */ 171445b4c2eSsb155480 int vsw_num_handshakes = VNET_NUM_HANDSHAKES; /* # of handshake attempts */ 1721ae08745Sheppo int vsw_wretries = 100; /* # of write attempts */ 173d10e4ef2Snarayan int vsw_desc_delay = 0; /* delay in us */ 174d10e4ef2Snarayan int vsw_read_attempts = 5; /* # of reads of descriptor */ 17519b65a69Ssb155480 int vsw_setup_switching_delay = 3; /* setup sw timeout interval in sec */ 1760e8b4070Ssb155480 int vsw_mac_open_retries = 300; /* max # of mac_open() retries */ 1770e8b4070Ssb155480 /* 300*3 = 900sec(15min) of max tmout */ 17806db247cSraghuram int vsw_ldc_tx_delay = 5; /* delay(ticks) for tx retries */ 17906db247cSraghuram int vsw_ldc_tx_retries = 10; /* # of ldc tx retries */ 180*6f09f0feSWENTAO YANG int vsw_ldc_retries = 5; /* # of ldc_close() retries */ 181*6f09f0feSWENTAO YANG int vsw_ldc_delay = 1000; /* 1 ms delay for ldc_close() */ 18206db247cSraghuram boolean_t vsw_ldc_rxthr_enabled = B_TRUE; /* LDC Rx thread enabled */ 18306db247cSraghuram boolean_t vsw_ldc_txthr_enabled = B_TRUE; /* LDC Tx thread enabled */ 184d10e4ef2Snarayan 185c1c61f44Ssb155480 uint32_t vsw_fdb_nchains = 8; /* # of chains in fdb hash table */ 186c1c61f44Ssb155480 uint32_t vsw_vlan_nchains = 4; /* # of chains in vlan id hash table */ 187c1c61f44Ssb155480 uint32_t vsw_ethermtu = 1500; /* mtu of the device */ 188c1c61f44Ssb155480 189c1c61f44Ssb155480 /* delay in usec to wait for all references on a fdb entry to be dropped */ 190c1c61f44Ssb155480 uint32_t vsw_fdbe_refcnt_delay = 10; 191c1c61f44Ssb155480 192c1c61f44Ssb155480 /* 193c1c61f44Ssb155480 * Default vlan id. This is only used internally when the "default-vlan-id" 194c1c61f44Ssb155480 * property is not present in the MD device node. Therefore, this should not be 195c1c61f44Ssb155480 * used as a tunable; if this value is changed, the corresponding variable 196c1c61f44Ssb155480 * should be updated to the same value in all vnets connected to this vsw. 197c1c61f44Ssb155480 */ 198c1c61f44Ssb155480 uint16_t vsw_default_vlan_id = 1; 199c1c61f44Ssb155480 200f0ca1d9aSsb155480 /* 201f0ca1d9aSsb155480 * Workaround for a version handshake bug in obp's vnet. 202f0ca1d9aSsb155480 * If vsw initiates version negotiation starting from the highest version, 203f0ca1d9aSsb155480 * obp sends a nack and terminates version handshake. To workaround 204f0ca1d9aSsb155480 * this, we do not initiate version handshake when the channel comes up. 205f0ca1d9aSsb155480 * Instead, we wait for the peer to send its version info msg and go through 206f0ca1d9aSsb155480 * the version protocol exchange. If we successfully negotiate a version, 207f0ca1d9aSsb155480 * before sending the ack, we send our version info msg to the peer 208f0ca1d9aSsb155480 * using the <major,minor> version that we are about to ack. 209f0ca1d9aSsb155480 */ 210f0ca1d9aSsb155480 boolean_t vsw_obp_ver_proto_workaround = B_TRUE; 211f0ca1d9aSsb155480 212f0ca1d9aSsb155480 /* 213f0ca1d9aSsb155480 * In the absence of "priority-ether-types" property in MD, the following 214f0ca1d9aSsb155480 * internal tunable can be set to specify a single priority ethertype. 215f0ca1d9aSsb155480 */ 216f0ca1d9aSsb155480 uint64_t vsw_pri_eth_type = 0; 217f0ca1d9aSsb155480 218f0ca1d9aSsb155480 /* 219f0ca1d9aSsb155480 * Number of transmit priority buffers that are preallocated per device. 220f0ca1d9aSsb155480 * This number is chosen to be a small value to throttle transmission 221f0ca1d9aSsb155480 * of priority packets. Note: Must be a power of 2 for vio_create_mblks(). 222f0ca1d9aSsb155480 */ 223f0ca1d9aSsb155480 uint32_t vsw_pri_tx_nmblks = 64; 224d10e4ef2Snarayan 22551aa9d07Ssb155480 /* 22651aa9d07Ssb155480 * Number of RARP packets sent to announce macaddr to the physical switch, 22751aa9d07Ssb155480 * after vsw's physical device is changed dynamically or after a guest (client 22851aa9d07Ssb155480 * vnet) is live migrated in. 22951aa9d07Ssb155480 */ 23051aa9d07Ssb155480 uint32_t vsw_publish_macaddr_count = 3; 23151aa9d07Ssb155480 232678453a8Sspeer boolean_t vsw_hio_enabled = B_TRUE; /* Enable/disable HybridIO */ 233678453a8Sspeer int vsw_hio_max_cleanup_retries = 10; /* Max retries for HybridIO cleanp */ 234678453a8Sspeer int vsw_hio_cleanup_delay = 10000; /* 10ms */ 235678453a8Sspeer 236f0ca1d9aSsb155480 /* Number of transmit descriptors - must be power of 2 */ 237f0ca1d9aSsb155480 uint32_t vsw_ntxds = VSW_RING_NUM_EL; 238f0ca1d9aSsb155480 23906db247cSraghuram /* 24006db247cSraghuram * Max number of mblks received in one receive operation. 24106db247cSraghuram */ 24206db247cSraghuram uint32_t vsw_chain_len = (VSW_NUM_MBLKS * 0.6); 24306db247cSraghuram 24406db247cSraghuram /* 2457b1f684aSSriharsha Basavapatna * Internal tunables for receive buffer pools, that is, the size and number of 2467b1f684aSSriharsha Basavapatna * mblks for each pool. At least 3 sizes must be specified if these are used. 2477b1f684aSSriharsha Basavapatna * The sizes must be specified in increasing order. Non-zero value of the first 2487b1f684aSSriharsha Basavapatna * size will be used as a hint to use these values instead of the algorithm 2497b1f684aSSriharsha Basavapatna * that determines the sizes based on MTU. 25006db247cSraghuram */ 2517b1f684aSSriharsha Basavapatna uint32_t vsw_mblk_size1 = 0; 2527b1f684aSSriharsha Basavapatna uint32_t vsw_mblk_size2 = 0; 2537b1f684aSSriharsha Basavapatna uint32_t vsw_mblk_size3 = 0; 2547b1f684aSSriharsha Basavapatna uint32_t vsw_mblk_size4 = 0; 25506db247cSraghuram uint32_t vsw_num_mblks1 = VSW_NUM_MBLKS; /* number of mblks for pool1 */ 25606db247cSraghuram uint32_t vsw_num_mblks2 = VSW_NUM_MBLKS; /* number of mblks for pool2 */ 25706db247cSraghuram uint32_t vsw_num_mblks3 = VSW_NUM_MBLKS; /* number of mblks for pool3 */ 2587b1f684aSSriharsha Basavapatna uint32_t vsw_num_mblks4 = VSW_NUM_MBLKS; /* number of mblks for pool4 */ 2597b1f684aSSriharsha Basavapatna 2607b1f684aSSriharsha Basavapatna /* 2617b1f684aSSriharsha Basavapatna * Set this to non-zero to enable additional internal receive buffer pools 2627b1f684aSSriharsha Basavapatna * based on the MTU of the device for better performance at the cost of more 2637b1f684aSSriharsha Basavapatna * memory consumption. This is turned off by default, to use allocb(9F) for 2647b1f684aSSriharsha Basavapatna * receive buffer allocations of sizes > 2K. 2657b1f684aSSriharsha Basavapatna */ 2667b1f684aSSriharsha Basavapatna boolean_t vsw_jumbo_rxpools = B_FALSE; 26706db247cSraghuram 26806db247cSraghuram /* 269f0ca1d9aSsb155480 * vsw_max_tx_qcount is the maximum # of packets that can be queued 270f0ca1d9aSsb155480 * before the tx worker thread begins processing the queue. Its value 271f0ca1d9aSsb155480 * is chosen to be 4x the default length of tx descriptor ring. 272f0ca1d9aSsb155480 */ 273f0ca1d9aSsb155480 uint32_t vsw_max_tx_qcount = 4 * VSW_RING_NUM_EL; 274f0ca1d9aSsb155480 275f0ca1d9aSsb155480 /* 27606db247cSraghuram * MAC callbacks 27706db247cSraghuram */ 278ba2e4443Sseb static mac_callbacks_t vsw_m_callbacks = { 279ba2e4443Sseb 0, 280ba2e4443Sseb vsw_m_stat, 281ba2e4443Sseb vsw_m_start, 282ba2e4443Sseb vsw_m_stop, 283ba2e4443Sseb vsw_m_promisc, 284ba2e4443Sseb vsw_m_multicst, 285ba2e4443Sseb vsw_m_unicst, 286ba2e4443Sseb vsw_m_tx, 287ba2e4443Sseb NULL, 288ba2e4443Sseb NULL, 289ba2e4443Sseb NULL 290ba2e4443Sseb }; 291ba2e4443Sseb 2921ae08745Sheppo static struct cb_ops vsw_cb_ops = { 2931ae08745Sheppo nulldev, /* cb_open */ 2941ae08745Sheppo nulldev, /* cb_close */ 2951ae08745Sheppo nodev, /* cb_strategy */ 2961ae08745Sheppo nodev, /* cb_print */ 2971ae08745Sheppo nodev, /* cb_dump */ 2981ae08745Sheppo nodev, /* cb_read */ 2991ae08745Sheppo nodev, /* cb_write */ 3001ae08745Sheppo nodev, /* cb_ioctl */ 3011ae08745Sheppo nodev, /* cb_devmap */ 3021ae08745Sheppo nodev, /* cb_mmap */ 3031ae08745Sheppo nodev, /* cb_segmap */ 3041ae08745Sheppo nochpoll, /* cb_chpoll */ 3051ae08745Sheppo ddi_prop_op, /* cb_prop_op */ 3061ae08745Sheppo NULL, /* cb_stream */ 3071ae08745Sheppo D_MP, /* cb_flag */ 3081ae08745Sheppo CB_REV, /* rev */ 3091ae08745Sheppo nodev, /* int (*cb_aread)() */ 3101ae08745Sheppo nodev /* int (*cb_awrite)() */ 3111ae08745Sheppo }; 3121ae08745Sheppo 3131ae08745Sheppo static struct dev_ops vsw_ops = { 3141ae08745Sheppo DEVO_REV, /* devo_rev */ 3151ae08745Sheppo 0, /* devo_refcnt */ 31671184a40SWENTAO YANG NULL, /* devo_getinfo */ 3171ae08745Sheppo nulldev, /* devo_identify */ 3181ae08745Sheppo nulldev, /* devo_probe */ 3191ae08745Sheppo vsw_attach, /* devo_attach */ 3201ae08745Sheppo vsw_detach, /* devo_detach */ 3211ae08745Sheppo nodev, /* devo_reset */ 3221ae08745Sheppo &vsw_cb_ops, /* devo_cb_ops */ 3231ae08745Sheppo (struct bus_ops *)NULL, /* devo_bus_ops */ 3241ae08745Sheppo ddi_power /* devo_power */ 3251ae08745Sheppo }; 3261ae08745Sheppo 3271ae08745Sheppo extern struct mod_ops mod_driverops; 3281ae08745Sheppo static struct modldrv vswmodldrv = { 3291ae08745Sheppo &mod_driverops, 330205eeb1aSlm66018 "sun4v Virtual Switch", 3311ae08745Sheppo &vsw_ops, 3321ae08745Sheppo }; 3331ae08745Sheppo 3341ae08745Sheppo #define LDC_ENTER_LOCK(ldcp) \ 3351ae08745Sheppo mutex_enter(&((ldcp)->ldc_cblock));\ 33606db247cSraghuram mutex_enter(&((ldcp)->ldc_rxlock));\ 3371ae08745Sheppo mutex_enter(&((ldcp)->ldc_txlock)); 3381ae08745Sheppo #define LDC_EXIT_LOCK(ldcp) \ 3391ae08745Sheppo mutex_exit(&((ldcp)->ldc_txlock));\ 34006db247cSraghuram mutex_exit(&((ldcp)->ldc_rxlock));\ 3411ae08745Sheppo mutex_exit(&((ldcp)->ldc_cblock)); 3421ae08745Sheppo 3431ae08745Sheppo /* Driver soft state ptr */ 3441ae08745Sheppo static void *vsw_state; 3451ae08745Sheppo 3461ae08745Sheppo /* 3471ae08745Sheppo * Linked list of "vsw_t" structures - one per instance. 3481ae08745Sheppo */ 3491ae08745Sheppo vsw_t *vsw_head = NULL; 350*6f09f0feSWENTAO YANG vio_mblk_pool_t *vsw_rx_poolp = NULL; 3511ae08745Sheppo krwlock_t vsw_rw; 3521ae08745Sheppo 3531ae08745Sheppo /* 3541ae08745Sheppo * Property names 3551ae08745Sheppo */ 3561ae08745Sheppo static char vdev_propname[] = "virtual-device"; 3571ae08745Sheppo static char vsw_propname[] = "virtual-network-switch"; 3581ae08745Sheppo static char physdev_propname[] = "vsw-phys-dev"; 3591ae08745Sheppo static char smode_propname[] = "vsw-switch-mode"; 3601ae08745Sheppo static char macaddr_propname[] = "local-mac-address"; 3611ae08745Sheppo static char remaddr_propname[] = "remote-mac-address"; 3621ae08745Sheppo static char ldcids_propname[] = "ldc-ids"; 3631ae08745Sheppo static char chan_propname[] = "channel-endpoint"; 3641ae08745Sheppo static char id_propname[] = "id"; 3651ae08745Sheppo static char reg_propname[] = "reg"; 366f0ca1d9aSsb155480 static char pri_types_propname[] = "priority-ether-types"; 367c1c61f44Ssb155480 static char vsw_pvid_propname[] = "port-vlan-id"; 368c1c61f44Ssb155480 static char vsw_vid_propname[] = "vlan-id"; 369c1c61f44Ssb155480 static char vsw_dvid_propname[] = "default-vlan-id"; 370c1c61f44Ssb155480 static char port_pvid_propname[] = "remote-port-vlan-id"; 371c1c61f44Ssb155480 static char port_vid_propname[] = "remote-vlan-id"; 372678453a8Sspeer static char hybrid_propname[] = "hybrid"; 3737b1f684aSSriharsha Basavapatna static char vsw_mtu_propname[] = "mtu"; 3741ae08745Sheppo 3751ae08745Sheppo /* 3761ae08745Sheppo * Matching criteria passed to the MDEG to register interest 3771ae08745Sheppo * in changes to 'virtual-device-port' nodes identified by their 3781ae08745Sheppo * 'id' property. 3791ae08745Sheppo */ 3801ae08745Sheppo static md_prop_match_t vport_prop_match[] = { 3811ae08745Sheppo { MDET_PROP_VAL, "id" }, 3821ae08745Sheppo { MDET_LIST_END, NULL } 3831ae08745Sheppo }; 3841ae08745Sheppo 3851ae08745Sheppo static mdeg_node_match_t vport_match = { "virtual-device-port", 3861ae08745Sheppo vport_prop_match }; 3871ae08745Sheppo 3881ae08745Sheppo /* 38934683adeSsg70180 * Matching criteria passed to the MDEG to register interest 39034683adeSsg70180 * in changes to 'virtual-device' nodes (i.e. vsw nodes) identified 39134683adeSsg70180 * by their 'name' and 'cfg-handle' properties. 39234683adeSsg70180 */ 39334683adeSsg70180 static md_prop_match_t vdev_prop_match[] = { 39434683adeSsg70180 { MDET_PROP_STR, "name" }, 39534683adeSsg70180 { MDET_PROP_VAL, "cfg-handle" }, 39634683adeSsg70180 { MDET_LIST_END, NULL } 39734683adeSsg70180 }; 39834683adeSsg70180 39934683adeSsg70180 static mdeg_node_match_t vdev_match = { "virtual-device", 40034683adeSsg70180 vdev_prop_match }; 40134683adeSsg70180 40234683adeSsg70180 40334683adeSsg70180 /* 4041ae08745Sheppo * Specification of an MD node passed to the MDEG to filter any 4051ae08745Sheppo * 'vport' nodes that do not belong to the specified node. This 4061ae08745Sheppo * template is copied for each vsw instance and filled in with 4071ae08745Sheppo * the appropriate 'cfg-handle' value before being passed to the MDEG. 4081ae08745Sheppo */ 4091ae08745Sheppo static mdeg_prop_spec_t vsw_prop_template[] = { 4101ae08745Sheppo { MDET_PROP_STR, "name", vsw_propname }, 4111ae08745Sheppo { MDET_PROP_VAL, "cfg-handle", NULL }, 4121ae08745Sheppo { MDET_LIST_END, NULL, NULL } 4131ae08745Sheppo }; 4141ae08745Sheppo 4151ae08745Sheppo #define VSW_SET_MDEG_PROP_INST(specp, val) (specp)[1].ps_val = (val); 4161ae08745Sheppo 41706db247cSraghuram #ifdef DEBUG 4187636cb21Slm66018 /* 4191ae08745Sheppo * Print debug messages - set to 0x1f to enable all msgs 4201ae08745Sheppo * or 0x0 to turn all off. 4211ae08745Sheppo */ 4221ae08745Sheppo int vswdbg = 0x0; 4231ae08745Sheppo 4241ae08745Sheppo /* 4251ae08745Sheppo * debug levels: 4261ae08745Sheppo * 0x01: Function entry/exit tracing 4271ae08745Sheppo * 0x02: Internal function messages 4281ae08745Sheppo * 0x04: Verbose internal messages 4291ae08745Sheppo * 0x08: Warning messages 4301ae08745Sheppo * 0x10: Error messages 4311ae08745Sheppo */ 4321ae08745Sheppo 43306db247cSraghuram void 4341ae08745Sheppo vswdebug(vsw_t *vswp, const char *fmt, ...) 4351ae08745Sheppo { 4361ae08745Sheppo char buf[512]; 4371ae08745Sheppo va_list ap; 4381ae08745Sheppo 4391ae08745Sheppo va_start(ap, fmt); 4401ae08745Sheppo (void) vsprintf(buf, fmt, ap); 4411ae08745Sheppo va_end(ap); 4421ae08745Sheppo 4431ae08745Sheppo if (vswp == NULL) 4441ae08745Sheppo cmn_err(CE_CONT, "%s\n", buf); 4451ae08745Sheppo else 4461ae08745Sheppo cmn_err(CE_CONT, "vsw%d: %s\n", vswp->instance, buf); 4471ae08745Sheppo } 4481ae08745Sheppo 4491ae08745Sheppo #endif /* DEBUG */ 4501ae08745Sheppo 4511ae08745Sheppo static struct modlinkage modlinkage = { 4521ae08745Sheppo MODREV_1, 4531ae08745Sheppo &vswmodldrv, 4541ae08745Sheppo NULL 4551ae08745Sheppo }; 4561ae08745Sheppo 4571ae08745Sheppo int 4581ae08745Sheppo _init(void) 4591ae08745Sheppo { 4601ae08745Sheppo int status; 4611ae08745Sheppo 4621ae08745Sheppo rw_init(&vsw_rw, NULL, RW_DRIVER, NULL); 4631ae08745Sheppo 4641ae08745Sheppo status = ddi_soft_state_init(&vsw_state, sizeof (vsw_t), 1); 4651ae08745Sheppo if (status != 0) { 4661ae08745Sheppo return (status); 4671ae08745Sheppo } 4681ae08745Sheppo 46906db247cSraghuram mac_init_ops(&vsw_ops, DRV_NAME); 4701ae08745Sheppo status = mod_install(&modlinkage); 4711ae08745Sheppo if (status != 0) { 4721ae08745Sheppo ddi_soft_state_fini(&vsw_state); 4731ae08745Sheppo } 4741ae08745Sheppo return (status); 4751ae08745Sheppo } 4761ae08745Sheppo 4771ae08745Sheppo int 4781ae08745Sheppo _fini(void) 4791ae08745Sheppo { 4801ae08745Sheppo int status; 4811ae08745Sheppo 482*6f09f0feSWENTAO YANG status = vsw_mod_cleanup(); 483*6f09f0feSWENTAO YANG if (status != 0) 484*6f09f0feSWENTAO YANG return (status); 485*6f09f0feSWENTAO YANG 4861ae08745Sheppo status = mod_remove(&modlinkage); 4871ae08745Sheppo if (status != 0) 4881ae08745Sheppo return (status); 4891ae08745Sheppo mac_fini_ops(&vsw_ops); 4901ae08745Sheppo ddi_soft_state_fini(&vsw_state); 4911ae08745Sheppo 4921ae08745Sheppo rw_destroy(&vsw_rw); 4931ae08745Sheppo 4941ae08745Sheppo return (status); 4951ae08745Sheppo } 4961ae08745Sheppo 4971ae08745Sheppo int 4981ae08745Sheppo _info(struct modinfo *modinfop) 4991ae08745Sheppo { 5001ae08745Sheppo return (mod_info(&modlinkage, modinfop)); 5011ae08745Sheppo } 5021ae08745Sheppo 5031ae08745Sheppo static int 5041ae08745Sheppo vsw_attach(dev_info_t *dip, ddi_attach_cmd_t cmd) 5051ae08745Sheppo { 5061ae08745Sheppo vsw_t *vswp; 50734683adeSsg70180 int instance; 5081ae08745Sheppo char hashname[MAXNAMELEN]; 5091ae08745Sheppo char qname[TASKQ_NAMELEN]; 510*6f09f0feSWENTAO YANG vsw_attach_progress_t progress = PROG_init; 51119b65a69Ssb155480 int rv; 5121ae08745Sheppo 5131ae08745Sheppo switch (cmd) { 5141ae08745Sheppo case DDI_ATTACH: 5151ae08745Sheppo break; 5161ae08745Sheppo case DDI_RESUME: 5171ae08745Sheppo /* nothing to do for this non-device */ 5181ae08745Sheppo return (DDI_SUCCESS); 5191ae08745Sheppo case DDI_PM_RESUME: 5201ae08745Sheppo default: 5211ae08745Sheppo return (DDI_FAILURE); 5221ae08745Sheppo } 5231ae08745Sheppo 5241ae08745Sheppo instance = ddi_get_instance(dip); 5251ae08745Sheppo if (ddi_soft_state_zalloc(vsw_state, instance) != DDI_SUCCESS) { 5261ae08745Sheppo DERR(NULL, "vsw%d: ddi_soft_state_zalloc failed", instance); 5271ae08745Sheppo return (DDI_FAILURE); 5281ae08745Sheppo } 5291ae08745Sheppo vswp = ddi_get_soft_state(vsw_state, instance); 5301ae08745Sheppo 5311ae08745Sheppo if (vswp == NULL) { 5321ae08745Sheppo DERR(NULL, "vsw%d: ddi_get_soft_state failed", instance); 5331ae08745Sheppo goto vsw_attach_fail; 5341ae08745Sheppo } 5351ae08745Sheppo 5361ae08745Sheppo vswp->dip = dip; 5371ae08745Sheppo vswp->instance = instance; 5381ae08745Sheppo ddi_set_driver_private(dip, (caddr_t)vswp); 5391ae08745Sheppo 540da14cebeSEric Cheng mutex_init(&vswp->mac_lock, NULL, MUTEX_DRIVER, NULL); 54119b65a69Ssb155480 mutex_init(&vswp->mca_lock, NULL, MUTEX_DRIVER, NULL); 542808f26a8SSriharsha Basavapatna mutex_init(&vswp->sw_thr_lock, NULL, MUTEX_DRIVER, NULL); 543808f26a8SSriharsha Basavapatna cv_init(&vswp->sw_thr_cv, NULL, CV_DRIVER, NULL); 544da14cebeSEric Cheng rw_init(&vswp->maccl_rwlock, NULL, RW_DRIVER, NULL); 5451ae08745Sheppo rw_init(&vswp->if_lockrw, NULL, RW_DRIVER, NULL); 54619b65a69Ssb155480 rw_init(&vswp->mfdbrw, NULL, RW_DRIVER, NULL); 54719b65a69Ssb155480 rw_init(&vswp->plist.lockrw, NULL, RW_DRIVER, NULL); 54819b65a69Ssb155480 54919b65a69Ssb155480 progress |= PROG_locks; 55019b65a69Ssb155480 55119b65a69Ssb155480 rv = vsw_read_mdprops(vswp); 55219b65a69Ssb155480 if (rv != 0) 55319b65a69Ssb155480 goto vsw_attach_fail; 55419b65a69Ssb155480 55519b65a69Ssb155480 progress |= PROG_readmd; 5561ae08745Sheppo 5571ae08745Sheppo /* setup the unicast forwarding database */ 5581ae08745Sheppo (void) snprintf(hashname, MAXNAMELEN, "vsw_unicst_table-%d", 5591ae08745Sheppo vswp->instance); 5601ae08745Sheppo D2(vswp, "creating unicast hash table (%s)...", hashname); 561c1c61f44Ssb155480 vswp->fdb_nchains = vsw_fdb_nchains; 562c1c61f44Ssb155480 vswp->fdb_hashp = mod_hash_create_ptrhash(hashname, vswp->fdb_nchains, 5631ae08745Sheppo mod_hash_null_valdtor, sizeof (void *)); 564c1c61f44Ssb155480 vsw_create_vlans((void *)vswp, VSW_LOCALDEV); 5651ae08745Sheppo progress |= PROG_fdb; 5661ae08745Sheppo 5671ae08745Sheppo /* setup the multicast fowarding database */ 5681ae08745Sheppo (void) snprintf(hashname, MAXNAMELEN, "vsw_mcst_table-%d", 5691ae08745Sheppo vswp->instance); 5701ae08745Sheppo D2(vswp, "creating multicast hash table %s)...", hashname); 571c1c61f44Ssb155480 vswp->mfdb = mod_hash_create_ptrhash(hashname, vsw_fdb_nchains, 5721ae08745Sheppo mod_hash_null_valdtor, sizeof (void *)); 5731ae08745Sheppo 5741ae08745Sheppo progress |= PROG_mfdb; 5751ae08745Sheppo 5761ae08745Sheppo /* 5771ae08745Sheppo * Create the taskq which will process all the VIO 5781ae08745Sheppo * control messages. 5791ae08745Sheppo */ 5801ae08745Sheppo (void) snprintf(qname, TASKQ_NAMELEN, "vsw_taskq%d", vswp->instance); 5811ae08745Sheppo if ((vswp->taskq_p = ddi_taskq_create(vswp->dip, qname, 1, 5821ae08745Sheppo TASKQ_DEFAULTPRI, 0)) == NULL) { 58334683adeSsg70180 cmn_err(CE_WARN, "!vsw%d: Unable to create task queue", 58434683adeSsg70180 vswp->instance); 5851ae08745Sheppo goto vsw_attach_fail; 5861ae08745Sheppo } 5871ae08745Sheppo 5881ae08745Sheppo progress |= PROG_taskq; 5891ae08745Sheppo 590d10e4ef2Snarayan /* prevent auto-detaching */ 591d10e4ef2Snarayan if (ddi_prop_update_int(DDI_DEV_T_NONE, vswp->dip, 592d10e4ef2Snarayan DDI_NO_AUTODETACH, 1) != DDI_SUCCESS) { 59334683adeSsg70180 cmn_err(CE_NOTE, "!Unable to set \"%s\" property for " 594d10e4ef2Snarayan "instance %u", DDI_NO_AUTODETACH, instance); 595d10e4ef2Snarayan } 596d10e4ef2Snarayan 5971ae08745Sheppo /* 5987a327842Swentaoy * The null switching function is set to avoid panic until 5997a327842Swentaoy * switch mode is setup. 6007a327842Swentaoy */ 6017a327842Swentaoy vswp->vsw_switch_frame = vsw_switch_frame_nop; 6027a327842Swentaoy 6037a327842Swentaoy /* 604808f26a8SSriharsha Basavapatna * Setup the required switching mode, based on the mdprops that we read 605808f26a8SSriharsha Basavapatna * earlier. We start a thread to do this, to avoid calling mac_open() 606808f26a8SSriharsha Basavapatna * directly from attach(). 60719b65a69Ssb155480 */ 608808f26a8SSriharsha Basavapatna rv = vsw_setup_switching_start(vswp); 609808f26a8SSriharsha Basavapatna if (rv != 0) { 610808f26a8SSriharsha Basavapatna goto vsw_attach_fail; 611808f26a8SSriharsha Basavapatna } 61219b65a69Ssb155480 61319b65a69Ssb155480 progress |= PROG_swmode; 61419b65a69Ssb155480 61519b65a69Ssb155480 /* Register with mac layer as a provider */ 61619b65a69Ssb155480 rv = vsw_mac_register(vswp); 61719b65a69Ssb155480 if (rv != 0) 61819b65a69Ssb155480 goto vsw_attach_fail; 61919b65a69Ssb155480 62019b65a69Ssb155480 progress |= PROG_macreg; 62119b65a69Ssb155480 62219b65a69Ssb155480 /* 62334683adeSsg70180 * Now we have everything setup, register an interest in 62434683adeSsg70180 * specific MD nodes. 62534683adeSsg70180 * 62634683adeSsg70180 * The callback is invoked in 2 cases, firstly if upon mdeg 62734683adeSsg70180 * registration there are existing nodes which match our specified 62834683adeSsg70180 * criteria, and secondly if the MD is changed (and again, there 62934683adeSsg70180 * are nodes which we are interested in present within it. Note 63034683adeSsg70180 * that our callback will be invoked even if our specified nodes 63134683adeSsg70180 * have not actually changed). 63234683adeSsg70180 * 6331ae08745Sheppo */ 63419b65a69Ssb155480 rv = vsw_mdeg_register(vswp); 63519b65a69Ssb155480 if (rv != 0) 63634683adeSsg70180 goto vsw_attach_fail; 6371ae08745Sheppo 63819b65a69Ssb155480 progress |= PROG_mdreg; 63919b65a69Ssb155480 640*6f09f0feSWENTAO YANG vswp->attach_progress = progress; 641*6f09f0feSWENTAO YANG 64219b65a69Ssb155480 WRITE_ENTER(&vsw_rw); 64319b65a69Ssb155480 vswp->next = vsw_head; 64419b65a69Ssb155480 vsw_head = vswp; 64519b65a69Ssb155480 RW_EXIT(&vsw_rw); 64619b65a69Ssb155480 64719b65a69Ssb155480 ddi_report_dev(vswp->dip); 6481ae08745Sheppo return (DDI_SUCCESS); 6491ae08745Sheppo 6501ae08745Sheppo vsw_attach_fail: 6511ae08745Sheppo DERR(NULL, "vsw_attach: failed"); 6521ae08745Sheppo 653*6f09f0feSWENTAO YANG vswp->attach_progress = progress; 654*6f09f0feSWENTAO YANG (void) vsw_unattach(vswp); 6551ae08745Sheppo ddi_soft_state_free(vsw_state, instance); 6561ae08745Sheppo return (DDI_FAILURE); 6571ae08745Sheppo } 6581ae08745Sheppo 6591ae08745Sheppo static int 6601ae08745Sheppo vsw_detach(dev_info_t *dip, ddi_detach_cmd_t cmd) 6611ae08745Sheppo { 6621ae08745Sheppo vsw_t **vswpp, *vswp; 6631ae08745Sheppo int instance; 6641ae08745Sheppo 6651ae08745Sheppo instance = ddi_get_instance(dip); 6661ae08745Sheppo vswp = ddi_get_soft_state(vsw_state, instance); 6671ae08745Sheppo 6681ae08745Sheppo if (vswp == NULL) { 6691ae08745Sheppo return (DDI_FAILURE); 6701ae08745Sheppo } 6711ae08745Sheppo 6721ae08745Sheppo switch (cmd) { 6731ae08745Sheppo case DDI_DETACH: 6741ae08745Sheppo break; 6751ae08745Sheppo case DDI_SUSPEND: 6761ae08745Sheppo case DDI_PM_SUSPEND: 6771ae08745Sheppo default: 6781ae08745Sheppo return (DDI_FAILURE); 6791ae08745Sheppo } 6801ae08745Sheppo 6811ae08745Sheppo D2(vswp, "detaching instance %d", instance); 6821ae08745Sheppo 683*6f09f0feSWENTAO YANG if (vsw_unattach(vswp) != 0) { 6841ae08745Sheppo return (DDI_FAILURE); 6851ae08745Sheppo } 686f0ca1d9aSsb155480 6871ae08745Sheppo ddi_remove_minor_node(dip, NULL); 6881ae08745Sheppo 6891ae08745Sheppo WRITE_ENTER(&vsw_rw); 6901ae08745Sheppo for (vswpp = &vsw_head; *vswpp; vswpp = &(*vswpp)->next) { 6911ae08745Sheppo if (*vswpp == vswp) { 6921ae08745Sheppo *vswpp = vswp->next; 6931ae08745Sheppo break; 6941ae08745Sheppo } 6951ae08745Sheppo } 6961ae08745Sheppo RW_EXIT(&vsw_rw); 697*6f09f0feSWENTAO YANG 6981ae08745Sheppo ddi_soft_state_free(vsw_state, instance); 6991ae08745Sheppo 7001ae08745Sheppo return (DDI_SUCCESS); 7011ae08745Sheppo } 7021ae08745Sheppo 7031ae08745Sheppo /* 704*6f09f0feSWENTAO YANG * Common routine to handle vsw_attach() failure and vsw_detach(). Note that 705*6f09f0feSWENTAO YANG * the only reason this function could fail is if mac_unregister() fails. 706*6f09f0feSWENTAO YANG * Otherwise, this function must ensure that all resources are freed and return 707*6f09f0feSWENTAO YANG * success. 708*6f09f0feSWENTAO YANG */ 709*6f09f0feSWENTAO YANG static int 710*6f09f0feSWENTAO YANG vsw_unattach(vsw_t *vswp) 711*6f09f0feSWENTAO YANG { 712*6f09f0feSWENTAO YANG vio_mblk_pool_t *poolp, *npoolp; 713*6f09f0feSWENTAO YANG vsw_attach_progress_t progress; 714*6f09f0feSWENTAO YANG 715*6f09f0feSWENTAO YANG progress = vswp->attach_progress; 716*6f09f0feSWENTAO YANG 717*6f09f0feSWENTAO YANG /* 718*6f09f0feSWENTAO YANG * Unregister from the gldv3 subsystem. This can fail, in particular 719*6f09f0feSWENTAO YANG * if there are still any open references to this mac device; in which 720*6f09f0feSWENTAO YANG * case we just return failure without continuing to detach further. 721*6f09f0feSWENTAO YANG */ 722*6f09f0feSWENTAO YANG if (progress & PROG_macreg) { 723*6f09f0feSWENTAO YANG if (vsw_mac_unregister(vswp) != 0) { 724*6f09f0feSWENTAO YANG cmn_err(CE_WARN, "!vsw%d: Unable to detach from " 725*6f09f0feSWENTAO YANG "MAC layer", vswp->instance); 726*6f09f0feSWENTAO YANG return (1); 727*6f09f0feSWENTAO YANG } 728*6f09f0feSWENTAO YANG progress &= ~PROG_macreg; 729*6f09f0feSWENTAO YANG } 730*6f09f0feSWENTAO YANG 731*6f09f0feSWENTAO YANG /* 732*6f09f0feSWENTAO YANG * Now that we have unregistered from gldv3, we must finish all other 733*6f09f0feSWENTAO YANG * steps and successfully return from this function; otherwise we will 734*6f09f0feSWENTAO YANG * end up leaving the device in a broken/unusable state. 735*6f09f0feSWENTAO YANG * 736*6f09f0feSWENTAO YANG * If we have registered with mdeg, unregister now to stop further 737*6f09f0feSWENTAO YANG * callbacks to this vsw device and/or its ports. Then, detach any 738*6f09f0feSWENTAO YANG * existing ports. 739*6f09f0feSWENTAO YANG */ 740*6f09f0feSWENTAO YANG if (progress & PROG_mdreg) { 741*6f09f0feSWENTAO YANG vsw_mdeg_unregister(vswp); 742*6f09f0feSWENTAO YANG vsw_detach_ports(vswp); 743*6f09f0feSWENTAO YANG 744*6f09f0feSWENTAO YANG /* 745*6f09f0feSWENTAO YANG * At this point, we attempt to free receive mblk pools that 746*6f09f0feSWENTAO YANG * couldn't be destroyed when the ports were detached; if this 747*6f09f0feSWENTAO YANG * attempt also fails, we hook up the pool(s) to the module so 748*6f09f0feSWENTAO YANG * they can be cleaned up in _fini(). 749*6f09f0feSWENTAO YANG */ 750*6f09f0feSWENTAO YANG poolp = vswp->rxh; 751*6f09f0feSWENTAO YANG while (poolp != NULL) { 752*6f09f0feSWENTAO YANG npoolp = vswp->rxh = poolp->nextp; 753*6f09f0feSWENTAO YANG if (vio_destroy_mblks(poolp) != 0) { 754*6f09f0feSWENTAO YANG WRITE_ENTER(&vsw_rw); 755*6f09f0feSWENTAO YANG poolp->nextp = vsw_rx_poolp; 756*6f09f0feSWENTAO YANG vsw_rx_poolp = poolp; 757*6f09f0feSWENTAO YANG RW_EXIT(&vsw_rw); 758*6f09f0feSWENTAO YANG } 759*6f09f0feSWENTAO YANG poolp = npoolp; 760*6f09f0feSWENTAO YANG } 761*6f09f0feSWENTAO YANG progress &= ~PROG_mdreg; 762*6f09f0feSWENTAO YANG } 763*6f09f0feSWENTAO YANG 764*6f09f0feSWENTAO YANG /* 765*6f09f0feSWENTAO YANG * If we have started a thread to setup the switching mode, stop it, if 766*6f09f0feSWENTAO YANG * it is still running. If it has finished setting up the switching 767*6f09f0feSWENTAO YANG * mode, then we need to clean up some additional things if we are 768*6f09f0feSWENTAO YANG * running in L2 mode: first free up any hybrid resources; then stop 769*6f09f0feSWENTAO YANG * and close the underlying physical device. Note that we would have 770*6f09f0feSWENTAO YANG * already released all per mac_client resources (ucast, mcast addrs, 771*6f09f0feSWENTAO YANG * hio-shares etc) as all the ports are detached and if the vsw device 772*6f09f0feSWENTAO YANG * itself was in use as an interface, it has been unplumbed (otherwise 773*6f09f0feSWENTAO YANG * mac_unregister() above would fail). 774*6f09f0feSWENTAO YANG */ 775*6f09f0feSWENTAO YANG if (progress & PROG_swmode) { 776*6f09f0feSWENTAO YANG 777*6f09f0feSWENTAO YANG vsw_setup_switching_stop(vswp); 778*6f09f0feSWENTAO YANG 779*6f09f0feSWENTAO YANG if (vswp->hio_capable == B_TRUE) { 780*6f09f0feSWENTAO YANG vsw_hio_cleanup(vswp); 781*6f09f0feSWENTAO YANG vswp->hio_capable = B_FALSE; 782*6f09f0feSWENTAO YANG } 783*6f09f0feSWENTAO YANG 784*6f09f0feSWENTAO YANG mutex_enter(&vswp->mac_lock); 785*6f09f0feSWENTAO YANG vsw_mac_close(vswp); 786*6f09f0feSWENTAO YANG mutex_exit(&vswp->mac_lock); 787*6f09f0feSWENTAO YANG 788*6f09f0feSWENTAO YANG progress &= ~PROG_swmode; 789*6f09f0feSWENTAO YANG } 790*6f09f0feSWENTAO YANG 791*6f09f0feSWENTAO YANG /* 792*6f09f0feSWENTAO YANG * By now any pending tasks have finished and the underlying 793*6f09f0feSWENTAO YANG * ldc's have been destroyed, so its safe to delete the control 794*6f09f0feSWENTAO YANG * message taskq. 795*6f09f0feSWENTAO YANG */ 796*6f09f0feSWENTAO YANG if (progress & PROG_taskq) { 797*6f09f0feSWENTAO YANG ddi_taskq_destroy(vswp->taskq_p); 798*6f09f0feSWENTAO YANG progress &= ~PROG_taskq; 799*6f09f0feSWENTAO YANG } 800*6f09f0feSWENTAO YANG 801*6f09f0feSWENTAO YANG /* Destroy the multicast hash table */ 802*6f09f0feSWENTAO YANG if (progress & PROG_mfdb) { 803*6f09f0feSWENTAO YANG mod_hash_destroy_hash(vswp->mfdb); 804*6f09f0feSWENTAO YANG progress &= ~PROG_mfdb; 805*6f09f0feSWENTAO YANG } 806*6f09f0feSWENTAO YANG 807*6f09f0feSWENTAO YANG /* Destroy the vlan hash table and fdb */ 808*6f09f0feSWENTAO YANG if (progress & PROG_fdb) { 809*6f09f0feSWENTAO YANG vsw_destroy_vlans(vswp, VSW_LOCALDEV); 810*6f09f0feSWENTAO YANG mod_hash_destroy_hash(vswp->fdb_hashp); 811*6f09f0feSWENTAO YANG progress &= ~PROG_fdb; 812*6f09f0feSWENTAO YANG } 813*6f09f0feSWENTAO YANG 814*6f09f0feSWENTAO YANG if (progress & PROG_readmd) { 815*6f09f0feSWENTAO YANG if (VSW_PRI_ETH_DEFINED(vswp)) { 816*6f09f0feSWENTAO YANG kmem_free(vswp->pri_types, 817*6f09f0feSWENTAO YANG sizeof (uint16_t) * vswp->pri_num_types); 818*6f09f0feSWENTAO YANG (void) vio_destroy_mblks(vswp->pri_tx_vmp); 819*6f09f0feSWENTAO YANG } 820*6f09f0feSWENTAO YANG progress &= ~PROG_readmd; 821*6f09f0feSWENTAO YANG } 822*6f09f0feSWENTAO YANG 823*6f09f0feSWENTAO YANG if (progress & PROG_locks) { 824*6f09f0feSWENTAO YANG rw_destroy(&vswp->plist.lockrw); 825*6f09f0feSWENTAO YANG rw_destroy(&vswp->mfdbrw); 826*6f09f0feSWENTAO YANG rw_destroy(&vswp->if_lockrw); 827*6f09f0feSWENTAO YANG rw_destroy(&vswp->maccl_rwlock); 828*6f09f0feSWENTAO YANG cv_destroy(&vswp->sw_thr_cv); 829*6f09f0feSWENTAO YANG mutex_destroy(&vswp->sw_thr_lock); 830*6f09f0feSWENTAO YANG mutex_destroy(&vswp->mca_lock); 831*6f09f0feSWENTAO YANG mutex_destroy(&vswp->mac_lock); 832*6f09f0feSWENTAO YANG progress &= ~PROG_locks; 833*6f09f0feSWENTAO YANG } 834*6f09f0feSWENTAO YANG 835*6f09f0feSWENTAO YANG vswp->attach_progress = progress; 836*6f09f0feSWENTAO YANG 837*6f09f0feSWENTAO YANG return (0); 838*6f09f0feSWENTAO YANG } 839*6f09f0feSWENTAO YANG 840*6f09f0feSWENTAO YANG /* 841*6f09f0feSWENTAO YANG * one time cleanup. 842*6f09f0feSWENTAO YANG */ 843*6f09f0feSWENTAO YANG static int 844*6f09f0feSWENTAO YANG vsw_mod_cleanup(void) 845*6f09f0feSWENTAO YANG { 846*6f09f0feSWENTAO YANG vio_mblk_pool_t *poolp, *npoolp; 847*6f09f0feSWENTAO YANG 848*6f09f0feSWENTAO YANG /* 849*6f09f0feSWENTAO YANG * If any rx mblk pools are still in use, return 850*6f09f0feSWENTAO YANG * error and stop the module from unloading. 851*6f09f0feSWENTAO YANG */ 852*6f09f0feSWENTAO YANG WRITE_ENTER(&vsw_rw); 853*6f09f0feSWENTAO YANG poolp = vsw_rx_poolp; 854*6f09f0feSWENTAO YANG while (poolp != NULL) { 855*6f09f0feSWENTAO YANG npoolp = vsw_rx_poolp = poolp->nextp; 856*6f09f0feSWENTAO YANG if (vio_destroy_mblks(poolp) != 0) { 857*6f09f0feSWENTAO YANG vsw_rx_poolp = poolp; 858*6f09f0feSWENTAO YANG RW_EXIT(&vsw_rw); 859*6f09f0feSWENTAO YANG return (EBUSY); 860*6f09f0feSWENTAO YANG } 861*6f09f0feSWENTAO YANG poolp = npoolp; 862*6f09f0feSWENTAO YANG } 863*6f09f0feSWENTAO YANG RW_EXIT(&vsw_rw); 864*6f09f0feSWENTAO YANG 865*6f09f0feSWENTAO YANG return (0); 866*6f09f0feSWENTAO YANG } 867*6f09f0feSWENTAO YANG 868*6f09f0feSWENTAO YANG /* 86934683adeSsg70180 * Get the value of the "vsw-phys-dev" property in the specified 87034683adeSsg70180 * node. This property is the name of the physical device that 87134683adeSsg70180 * the virtual switch will use to talk to the outside world. 87234683adeSsg70180 * 87334683adeSsg70180 * Note it is valid for this property to be NULL (but the property 87434683adeSsg70180 * itself must exist). Callers of this routine should verify that 87534683adeSsg70180 * the value returned is what they expected (i.e. either NULL or non NULL). 87634683adeSsg70180 * 87734683adeSsg70180 * On success returns value of the property in region pointed to by 87834683adeSsg70180 * the 'name' argument, and with return value of 0. Otherwise returns 1. 8791ae08745Sheppo */ 88034683adeSsg70180 static int 88134683adeSsg70180 vsw_get_md_physname(vsw_t *vswp, md_t *mdp, mde_cookie_t node, char *name) 8821ae08745Sheppo { 88334683adeSsg70180 int len = 0; 884f2b610cfSwentaoy int instance; 8851ae08745Sheppo char *physname = NULL; 8861ae08745Sheppo char *dev; 887f2b610cfSwentaoy const char *dev_name; 888f2b610cfSwentaoy char myname[MAXNAMELEN]; 889f2b610cfSwentaoy 890f2b610cfSwentaoy dev_name = ddi_driver_name(vswp->dip); 891f2b610cfSwentaoy instance = ddi_get_instance(vswp->dip); 892f2b610cfSwentaoy (void) snprintf(myname, MAXNAMELEN, "%s%d", dev_name, instance); 8931ae08745Sheppo 89434683adeSsg70180 if (md_get_prop_data(mdp, node, physdev_propname, 8951ae08745Sheppo (uint8_t **)(&physname), &len) != 0) { 89634683adeSsg70180 cmn_err(CE_WARN, "!vsw%d: Unable to get name(s) of physical " 89734683adeSsg70180 "device(s) from MD", vswp->instance); 89834683adeSsg70180 return (1); 8991ae08745Sheppo } else if ((strlen(physname) + 1) > LIFNAMSIZ) { 90034683adeSsg70180 cmn_err(CE_WARN, "!vsw%d: %s is too long a device name", 90134683adeSsg70180 vswp->instance, physname); 90234683adeSsg70180 return (1); 903f2b610cfSwentaoy } else if (strcmp(myname, physname) == 0) { 904f2b610cfSwentaoy /* 905f2b610cfSwentaoy * Prevent the vswitch from opening itself as the 906f2b610cfSwentaoy * network device. 907f2b610cfSwentaoy */ 908f2b610cfSwentaoy cmn_err(CE_WARN, "!vsw%d: %s is an invalid device name", 909f2b610cfSwentaoy vswp->instance, physname); 910f2b610cfSwentaoy return (1); 9111ae08745Sheppo } else { 91234683adeSsg70180 (void) strncpy(name, physname, strlen(physname) + 1); 9131ae08745Sheppo D2(vswp, "%s: using first device specified (%s)", 91434683adeSsg70180 __func__, physname); 9151ae08745Sheppo } 9161ae08745Sheppo 9171ae08745Sheppo #ifdef DEBUG 9181ae08745Sheppo /* 9191ae08745Sheppo * As a temporary measure to aid testing we check to see if there 9201ae08745Sheppo * is a vsw.conf file present. If there is we use the value of the 9211ae08745Sheppo * vsw_physname property in the file as the name of the physical 9221ae08745Sheppo * device, overriding the value from the MD. 9231ae08745Sheppo * 9241ae08745Sheppo * There may be multiple devices listed, but for the moment 9251ae08745Sheppo * we just use the first one. 9261ae08745Sheppo */ 9271ae08745Sheppo if (ddi_prop_lookup_string(DDI_DEV_T_ANY, vswp->dip, 0, 9281ae08745Sheppo "vsw_physname", &dev) == DDI_PROP_SUCCESS) { 9291ae08745Sheppo if ((strlen(dev) + 1) > LIFNAMSIZ) { 93034683adeSsg70180 cmn_err(CE_WARN, "vsw%d: %s is too long a device name", 93134683adeSsg70180 vswp->instance, dev); 93234683adeSsg70180 ddi_prop_free(dev); 93334683adeSsg70180 return (1); 9341ae08745Sheppo } else { 93534683adeSsg70180 cmn_err(CE_NOTE, "vsw%d: Using device name (%s) from " 93634683adeSsg70180 "config file", vswp->instance, dev); 9371ae08745Sheppo 93834683adeSsg70180 (void) strncpy(name, dev, strlen(dev) + 1); 9391ae08745Sheppo } 9401ae08745Sheppo 9411ae08745Sheppo ddi_prop_free(dev); 9421ae08745Sheppo } 9431ae08745Sheppo #endif 9441ae08745Sheppo 94534683adeSsg70180 return (0); 94634683adeSsg70180 } 947e1ebb9ecSlm66018 948e1ebb9ecSlm66018 /* 94934683adeSsg70180 * Read the 'vsw-switch-mode' property from the specified MD node. 95034683adeSsg70180 * 951da14cebeSEric Cheng * Returns 0 on success, otherwise returns 1. 952e1ebb9ecSlm66018 */ 95334683adeSsg70180 static int 954da14cebeSEric Cheng vsw_get_md_smodes(vsw_t *vswp, md_t *mdp, mde_cookie_t node, uint8_t *mode) 95534683adeSsg70180 { 95634683adeSsg70180 int len = 0; 95734683adeSsg70180 char *smode = NULL; 95834683adeSsg70180 char *curr_mode = NULL; 95934683adeSsg70180 96034683adeSsg70180 D1(vswp, "%s: enter", __func__); 9611ae08745Sheppo 9621ae08745Sheppo /* 9631ae08745Sheppo * Get the switch-mode property. The modes are listed in 9641ae08745Sheppo * decreasing order of preference, i.e. prefered mode is 9651ae08745Sheppo * first item in list. 9661ae08745Sheppo */ 9671ae08745Sheppo len = 0; 96834683adeSsg70180 if (md_get_prop_data(mdp, node, smode_propname, 9691ae08745Sheppo (uint8_t **)(&smode), &len) != 0) { 9701ae08745Sheppo /* 971e1ebb9ecSlm66018 * Unable to get switch-mode property from MD, nothing 972e1ebb9ecSlm66018 * more we can do. 9731ae08745Sheppo */ 97434683adeSsg70180 cmn_err(CE_WARN, "!vsw%d: Unable to get switch mode property" 97534683adeSsg70180 " from the MD", vswp->instance); 97634683adeSsg70180 return (1); 977e1ebb9ecSlm66018 } 978e1ebb9ecSlm66018 9791ae08745Sheppo curr_mode = smode; 9801ae08745Sheppo /* 9811ae08745Sheppo * Modes of operation: 9821ae08745Sheppo * 'switched' - layer 2 switching, underlying HW in 983e1ebb9ecSlm66018 * programmed mode. 9841ae08745Sheppo * 'promiscuous' - layer 2 switching, underlying HW in 9851ae08745Sheppo * promiscuous mode. 9861ae08745Sheppo * 'routed' - layer 3 (i.e. IP) routing, underlying HW 9871ae08745Sheppo * in non-promiscuous mode. 9881ae08745Sheppo */ 989da14cebeSEric Cheng while (curr_mode < (smode + len)) { 9901ae08745Sheppo D2(vswp, "%s: curr_mode = [%s]", __func__, curr_mode); 991e1ebb9ecSlm66018 if (strcmp(curr_mode, "switched") == 0) { 992da14cebeSEric Cheng *mode = VSW_LAYER2; 993e1ebb9ecSlm66018 } else if (strcmp(curr_mode, "promiscuous") == 0) { 994da14cebeSEric Cheng *mode = VSW_LAYER2 | VSW_LAYER2_PROMISC; 995e1ebb9ecSlm66018 } else if (strcmp(curr_mode, "routed") == 0) { 996da14cebeSEric Cheng *mode = VSW_LAYER3; 997e1ebb9ecSlm66018 } else { 998da14cebeSEric Cheng cmn_err(CE_WARN, "!vsw%d: Unknown switch mode %s, " 999da14cebeSEric Cheng "setting to default switched mode", 1000da14cebeSEric Cheng vswp->instance, curr_mode); 1001da14cebeSEric Cheng *mode = VSW_LAYER2; 10021ae08745Sheppo } 10031ae08745Sheppo curr_mode += strlen(curr_mode) + 1; 10041ae08745Sheppo } 10051ae08745Sheppo 1006da14cebeSEric Cheng D2(vswp, "%s: %d mode", __func__, *mode); 10071ae08745Sheppo 10081ae08745Sheppo D1(vswp, "%s: exit", __func__); 100934683adeSsg70180 101034683adeSsg70180 return (0); 10111ae08745Sheppo } 10121ae08745Sheppo 1013e1ebb9ecSlm66018 /* 10141ae08745Sheppo * Register with the MAC layer as a network device, so we 10151ae08745Sheppo * can be plumbed if necessary. 10161ae08745Sheppo */ 10171ae08745Sheppo static int 10181ae08745Sheppo vsw_mac_register(vsw_t *vswp) 10191ae08745Sheppo { 1020ba2e4443Sseb mac_register_t *macp; 1021ba2e4443Sseb int rv; 10221ae08745Sheppo 10231ae08745Sheppo D1(vswp, "%s: enter", __func__); 10241ae08745Sheppo 1025ba2e4443Sseb if ((macp = mac_alloc(MAC_VERSION)) == NULL) 1026ba2e4443Sseb return (EINVAL); 1027ba2e4443Sseb macp->m_type_ident = MAC_PLUGIN_IDENT_ETHER; 10281ae08745Sheppo macp->m_driver = vswp; 1029ba2e4443Sseb macp->m_dip = vswp->dip; 1030ba2e4443Sseb macp->m_src_addr = (uint8_t *)&vswp->if_addr; 1031ba2e4443Sseb macp->m_callbacks = &vsw_m_callbacks; 1032ba2e4443Sseb macp->m_min_sdu = 0; 10337b1f684aSSriharsha Basavapatna macp->m_max_sdu = vswp->mtu; 1034c1c61f44Ssb155480 macp->m_margin = VLAN_TAGSZ; 1035ba2e4443Sseb rv = mac_register(macp, &vswp->if_mh); 1036ba2e4443Sseb mac_free(macp); 103719b65a69Ssb155480 if (rv != 0) { 103819b65a69Ssb155480 /* 103919b65a69Ssb155480 * Treat this as a non-fatal error as we may be 104019b65a69Ssb155480 * able to operate in some other mode. 104119b65a69Ssb155480 */ 104219b65a69Ssb155480 cmn_err(CE_NOTE, "!vsw%d: Unable to register as " 104319b65a69Ssb155480 "a provider with MAC layer", vswp->instance); 104419b65a69Ssb155480 return (rv); 104519b65a69Ssb155480 } 104619b65a69Ssb155480 1047ba2e4443Sseb vswp->if_state |= VSW_IF_REG; 10481ae08745Sheppo 10491ae08745Sheppo D1(vswp, "%s: exit", __func__); 10501ae08745Sheppo 10511ae08745Sheppo return (rv); 10521ae08745Sheppo } 10531ae08745Sheppo 10541ae08745Sheppo static int 10551ae08745Sheppo vsw_mac_unregister(vsw_t *vswp) 10561ae08745Sheppo { 10571ae08745Sheppo int rv = 0; 10581ae08745Sheppo 10591ae08745Sheppo D1(vswp, "%s: enter", __func__); 10601ae08745Sheppo 10611ae08745Sheppo WRITE_ENTER(&vswp->if_lockrw); 10621ae08745Sheppo 1063ba2e4443Sseb if (vswp->if_state & VSW_IF_REG) { 1064ba2e4443Sseb rv = mac_unregister(vswp->if_mh); 10651ae08745Sheppo if (rv != 0) { 10661ae08745Sheppo DWARN(vswp, "%s: unable to unregister from MAC " 10671ae08745Sheppo "framework", __func__); 10681ae08745Sheppo 10691ae08745Sheppo RW_EXIT(&vswp->if_lockrw); 10701ae08745Sheppo D1(vswp, "%s: fail exit", __func__); 10711ae08745Sheppo return (rv); 10721ae08745Sheppo } 10731ae08745Sheppo 1074ba2e4443Sseb /* mark i/f as down and unregistered */ 1075ba2e4443Sseb vswp->if_state &= ~(VSW_IF_UP | VSW_IF_REG); 10761ae08745Sheppo } 10771ae08745Sheppo RW_EXIT(&vswp->if_lockrw); 10781ae08745Sheppo 10791ae08745Sheppo D1(vswp, "%s: exit", __func__); 10801ae08745Sheppo 10811ae08745Sheppo return (rv); 10821ae08745Sheppo } 10831ae08745Sheppo 1084ba2e4443Sseb static int 1085ba2e4443Sseb vsw_m_stat(void *arg, uint_t stat, uint64_t *val) 10861ae08745Sheppo { 10871ae08745Sheppo vsw_t *vswp = (vsw_t *)arg; 10881ae08745Sheppo 10891ae08745Sheppo D1(vswp, "%s: enter", __func__); 10901ae08745Sheppo 1091da14cebeSEric Cheng mutex_enter(&vswp->mac_lock); 109234683adeSsg70180 if (vswp->mh == NULL) { 1093da14cebeSEric Cheng mutex_exit(&vswp->mac_lock); 1094ba2e4443Sseb return (EINVAL); 109534683adeSsg70180 } 10961ae08745Sheppo 10971ae08745Sheppo /* return stats from underlying device */ 1098ba2e4443Sseb *val = mac_stat_get(vswp->mh, stat); 109934683adeSsg70180 1100da14cebeSEric Cheng mutex_exit(&vswp->mac_lock); 110134683adeSsg70180 1102ba2e4443Sseb return (0); 11031ae08745Sheppo } 11041ae08745Sheppo 11051ae08745Sheppo static void 11061ae08745Sheppo vsw_m_stop(void *arg) 11071ae08745Sheppo { 11081ae08745Sheppo vsw_t *vswp = (vsw_t *)arg; 11091ae08745Sheppo 11101ae08745Sheppo D1(vswp, "%s: enter", __func__); 11111ae08745Sheppo 11121ae08745Sheppo WRITE_ENTER(&vswp->if_lockrw); 11131ae08745Sheppo vswp->if_state &= ~VSW_IF_UP; 11141ae08745Sheppo RW_EXIT(&vswp->if_lockrw); 11151ae08745Sheppo 1116da14cebeSEric Cheng /* Cleanup and close the mac client */ 1117da14cebeSEric Cheng vsw_mac_client_cleanup(vswp, NULL, VSW_LOCALDEV); 11185f94e909Ssg70180 11191ae08745Sheppo D1(vswp, "%s: exit (state = %d)", __func__, vswp->if_state); 11201ae08745Sheppo } 11211ae08745Sheppo 11221ae08745Sheppo static int 11231ae08745Sheppo vsw_m_start(void *arg) 11241ae08745Sheppo { 1125da14cebeSEric Cheng int rv; 11261ae08745Sheppo vsw_t *vswp = (vsw_t *)arg; 11271ae08745Sheppo 11281ae08745Sheppo D1(vswp, "%s: enter", __func__); 11291ae08745Sheppo 11301ae08745Sheppo WRITE_ENTER(&vswp->if_lockrw); 11311ae08745Sheppo 113219b65a69Ssb155480 vswp->if_state |= VSW_IF_UP; 113319b65a69Ssb155480 113419b65a69Ssb155480 if (vswp->switching_setup_done == B_FALSE) { 113519b65a69Ssb155480 /* 113619b65a69Ssb155480 * If the switching mode has not been setup yet, just 113719b65a69Ssb155480 * return. The unicast address will be programmed 113819b65a69Ssb155480 * after the physical device is successfully setup by the 113919b65a69Ssb155480 * timeout handler. 114019b65a69Ssb155480 */ 114119b65a69Ssb155480 RW_EXIT(&vswp->if_lockrw); 114219b65a69Ssb155480 return (0); 114319b65a69Ssb155480 } 114419b65a69Ssb155480 114519b65a69Ssb155480 /* if in layer2 mode, program unicast address. */ 114619b65a69Ssb155480 if (vswp->mh != NULL) { 1147da14cebeSEric Cheng /* Init a mac client and program addresses */ 1148da14cebeSEric Cheng rv = vsw_mac_client_init(vswp, NULL, VSW_LOCALDEV); 1149da14cebeSEric Cheng if (rv != 0) { 1150da14cebeSEric Cheng cmn_err(CE_NOTE, 1151da14cebeSEric Cheng "!vsw%d: failed to program interface " 1152da14cebeSEric Cheng "unicast address\n", vswp->instance); 1153da14cebeSEric Cheng } 115419b65a69Ssb155480 } 115519b65a69Ssb155480 115619b65a69Ssb155480 RW_EXIT(&vswp->if_lockrw); 11575f94e909Ssg70180 11581ae08745Sheppo D1(vswp, "%s: exit (state = %d)", __func__, vswp->if_state); 11591ae08745Sheppo return (0); 11601ae08745Sheppo } 11611ae08745Sheppo 11621ae08745Sheppo /* 11631ae08745Sheppo * Change the local interface address. 11645f94e909Ssg70180 * 11655f94e909Ssg70180 * Note: we don't support this entry point. The local 11665f94e909Ssg70180 * mac address of the switch can only be changed via its 11675f94e909Ssg70180 * MD node properties. 11681ae08745Sheppo */ 11691ae08745Sheppo static int 11701ae08745Sheppo vsw_m_unicst(void *arg, const uint8_t *macaddr) 11711ae08745Sheppo { 11725f94e909Ssg70180 _NOTE(ARGUNUSED(arg, macaddr)) 11731ae08745Sheppo 11745f94e909Ssg70180 return (DDI_FAILURE); 11751ae08745Sheppo } 11761ae08745Sheppo 11771ae08745Sheppo static int 11781ae08745Sheppo vsw_m_multicst(void *arg, boolean_t add, const uint8_t *mca) 11791ae08745Sheppo { 11801ae08745Sheppo vsw_t *vswp = (vsw_t *)arg; 11811ae08745Sheppo mcst_addr_t *mcst_p = NULL; 11821ae08745Sheppo uint64_t addr = 0x0; 1183e1ebb9ecSlm66018 int i, ret = 0; 11841ae08745Sheppo 11851ae08745Sheppo D1(vswp, "%s: enter", __func__); 11861ae08745Sheppo 11871ae08745Sheppo /* 11881ae08745Sheppo * Convert address into form that can be used 11891ae08745Sheppo * as hash table key. 11901ae08745Sheppo */ 11911ae08745Sheppo for (i = 0; i < ETHERADDRL; i++) { 11921ae08745Sheppo addr = (addr << 8) | mca[i]; 11931ae08745Sheppo } 11941ae08745Sheppo 11951ae08745Sheppo D2(vswp, "%s: addr = 0x%llx", __func__, addr); 11961ae08745Sheppo 11971ae08745Sheppo if (add) { 11981ae08745Sheppo D2(vswp, "%s: adding multicast", __func__); 11991ae08745Sheppo if (vsw_add_mcst(vswp, VSW_LOCALDEV, addr, NULL) == 0) { 12001ae08745Sheppo /* 12011ae08745Sheppo * Update the list of multicast addresses 12021ae08745Sheppo * contained within the vsw_t structure to 12031ae08745Sheppo * include this new one. 12041ae08745Sheppo */ 12051ae08745Sheppo mcst_p = kmem_zalloc(sizeof (mcst_addr_t), KM_NOSLEEP); 12061ae08745Sheppo if (mcst_p == NULL) { 12071ae08745Sheppo DERR(vswp, "%s unable to alloc mem", __func__); 120819b65a69Ssb155480 (void) vsw_del_mcst(vswp, 120919b65a69Ssb155480 VSW_LOCALDEV, addr, NULL); 12101ae08745Sheppo return (1); 12111ae08745Sheppo } 12121ae08745Sheppo mcst_p->addr = addr; 121319b65a69Ssb155480 ether_copy(mca, &mcst_p->mca); 12141ae08745Sheppo 12151ae08745Sheppo /* 12161ae08745Sheppo * Call into the underlying driver to program the 12171ae08745Sheppo * address into HW. 12181ae08745Sheppo */ 1219da14cebeSEric Cheng ret = vsw_mac_multicast_add(vswp, NULL, mcst_p, 1220da14cebeSEric Cheng VSW_LOCALDEV); 1221e1ebb9ecSlm66018 if (ret != 0) { 122219b65a69Ssb155480 (void) vsw_del_mcst(vswp, 122319b65a69Ssb155480 VSW_LOCALDEV, addr, NULL); 122419b65a69Ssb155480 kmem_free(mcst_p, sizeof (*mcst_p)); 122519b65a69Ssb155480 return (ret); 1226e1ebb9ecSlm66018 } 122719b65a69Ssb155480 122819b65a69Ssb155480 mutex_enter(&vswp->mca_lock); 122919b65a69Ssb155480 mcst_p->nextp = vswp->mcap; 123019b65a69Ssb155480 vswp->mcap = mcst_p; 123119b65a69Ssb155480 mutex_exit(&vswp->mca_lock); 12321ae08745Sheppo } else { 1233da14cebeSEric Cheng cmn_err(CE_WARN, "!vsw%d: unable to add multicast " 123434683adeSsg70180 "address", vswp->instance); 1235e1ebb9ecSlm66018 } 1236e1ebb9ecSlm66018 return (ret); 1237e1ebb9ecSlm66018 } 1238e1ebb9ecSlm66018 12391ae08745Sheppo D2(vswp, "%s: removing multicast", __func__); 12401ae08745Sheppo /* 12411ae08745Sheppo * Remove the address from the hash table.. 12421ae08745Sheppo */ 12431ae08745Sheppo if (vsw_del_mcst(vswp, VSW_LOCALDEV, addr, NULL) == 0) { 12441ae08745Sheppo 12451ae08745Sheppo /* 12461ae08745Sheppo * ..and then from the list maintained in the 12471ae08745Sheppo * vsw_t structure. 12481ae08745Sheppo */ 124919b65a69Ssb155480 mcst_p = vsw_del_addr(VSW_LOCALDEV, vswp, addr); 125019b65a69Ssb155480 ASSERT(mcst_p != NULL); 12511ae08745Sheppo 1252da14cebeSEric Cheng vsw_mac_multicast_remove(vswp, NULL, mcst_p, VSW_LOCALDEV); 125319b65a69Ssb155480 kmem_free(mcst_p, sizeof (*mcst_p)); 12541ae08745Sheppo } 12551ae08745Sheppo 12561ae08745Sheppo D1(vswp, "%s: exit", __func__); 12571ae08745Sheppo 12581ae08745Sheppo return (0); 12591ae08745Sheppo } 12601ae08745Sheppo 12611ae08745Sheppo static int 12621ae08745Sheppo vsw_m_promisc(void *arg, boolean_t on) 12631ae08745Sheppo { 12641ae08745Sheppo vsw_t *vswp = (vsw_t *)arg; 12651ae08745Sheppo 12661ae08745Sheppo D1(vswp, "%s: enter", __func__); 12671ae08745Sheppo 12681ae08745Sheppo WRITE_ENTER(&vswp->if_lockrw); 12691ae08745Sheppo if (on) 12701ae08745Sheppo vswp->if_state |= VSW_IF_PROMISC; 12711ae08745Sheppo else 12721ae08745Sheppo vswp->if_state &= ~VSW_IF_PROMISC; 12731ae08745Sheppo RW_EXIT(&vswp->if_lockrw); 12741ae08745Sheppo 12751ae08745Sheppo D1(vswp, "%s: exit", __func__); 12761ae08745Sheppo 12771ae08745Sheppo return (0); 12781ae08745Sheppo } 12791ae08745Sheppo 12801ae08745Sheppo static mblk_t * 12811ae08745Sheppo vsw_m_tx(void *arg, mblk_t *mp) 12821ae08745Sheppo { 12831ae08745Sheppo vsw_t *vswp = (vsw_t *)arg; 12841ae08745Sheppo 12851ae08745Sheppo D1(vswp, "%s: enter", __func__); 12861ae08745Sheppo 1287c1c61f44Ssb155480 mp = vsw_vlan_frame_pretag(vswp, VSW_LOCALDEV, mp); 1288c1c61f44Ssb155480 1289c1c61f44Ssb155480 if (mp == NULL) { 1290c1c61f44Ssb155480 return (NULL); 1291c1c61f44Ssb155480 } 1292c1c61f44Ssb155480 129334683adeSsg70180 vswp->vsw_switch_frame(vswp, mp, VSW_LOCALDEV, NULL, NULL); 12941ae08745Sheppo 12951ae08745Sheppo D1(vswp, "%s: exit", __func__); 12961ae08745Sheppo 12971ae08745Sheppo return (NULL); 12981ae08745Sheppo } 12991ae08745Sheppo 13001ae08745Sheppo /* 13011ae08745Sheppo * Register for machine description (MD) updates. 130234683adeSsg70180 * 130334683adeSsg70180 * Returns 0 on success, 1 on failure. 13041ae08745Sheppo */ 130534683adeSsg70180 static int 13061ae08745Sheppo vsw_mdeg_register(vsw_t *vswp) 13071ae08745Sheppo { 13081ae08745Sheppo mdeg_prop_spec_t *pspecp; 13091ae08745Sheppo mdeg_node_spec_t *inst_specp; 131034683adeSsg70180 mdeg_handle_t mdeg_hdl, mdeg_port_hdl; 13111ae08745Sheppo size_t templatesz; 131219b65a69Ssb155480 int rv; 13131ae08745Sheppo 13141ae08745Sheppo D1(vswp, "%s: enter", __func__); 13151ae08745Sheppo 131634683adeSsg70180 /* 13171ae08745Sheppo * Allocate and initialize a per-instance copy 13181ae08745Sheppo * of the global property spec array that will 13191ae08745Sheppo * uniquely identify this vsw instance. 13201ae08745Sheppo */ 13211ae08745Sheppo templatesz = sizeof (vsw_prop_template); 13221ae08745Sheppo pspecp = kmem_zalloc(templatesz, KM_SLEEP); 13231ae08745Sheppo 13241ae08745Sheppo bcopy(vsw_prop_template, pspecp, templatesz); 13251ae08745Sheppo 132619b65a69Ssb155480 VSW_SET_MDEG_PROP_INST(pspecp, vswp->regprop); 13271ae08745Sheppo 13281ae08745Sheppo /* initialize the complete prop spec structure */ 13291ae08745Sheppo inst_specp = kmem_zalloc(sizeof (mdeg_node_spec_t), KM_SLEEP); 13301ae08745Sheppo inst_specp->namep = "virtual-device"; 13311ae08745Sheppo inst_specp->specp = pspecp; 13321ae08745Sheppo 133319b65a69Ssb155480 D2(vswp, "%s: instance %d registering with mdeg", __func__, 133419b65a69Ssb155480 vswp->regprop); 133534683adeSsg70180 /* 133634683adeSsg70180 * Register an interest in 'virtual-device' nodes with a 133734683adeSsg70180 * 'name' property of 'virtual-network-switch' 133834683adeSsg70180 */ 133934683adeSsg70180 rv = mdeg_register(inst_specp, &vdev_match, vsw_mdeg_cb, 13401ae08745Sheppo (void *)vswp, &mdeg_hdl); 134134683adeSsg70180 if (rv != MDEG_SUCCESS) { 134234683adeSsg70180 DERR(vswp, "%s: mdeg_register failed (%d) for vsw node", 134334683adeSsg70180 __func__, rv); 134434683adeSsg70180 goto mdeg_reg_fail; 134534683adeSsg70180 } 13461ae08745Sheppo 134734683adeSsg70180 /* 134834683adeSsg70180 * Register an interest in 'vsw-port' nodes. 134934683adeSsg70180 */ 135034683adeSsg70180 rv = mdeg_register(inst_specp, &vport_match, vsw_port_mdeg_cb, 135134683adeSsg70180 (void *)vswp, &mdeg_port_hdl); 13521ae08745Sheppo if (rv != MDEG_SUCCESS) { 13531ae08745Sheppo DERR(vswp, "%s: mdeg_register failed (%d)\n", __func__, rv); 135434683adeSsg70180 (void) mdeg_unregister(mdeg_hdl); 135534683adeSsg70180 goto mdeg_reg_fail; 13561ae08745Sheppo } 13571ae08745Sheppo 13581ae08745Sheppo /* save off data that will be needed later */ 13591ae08745Sheppo vswp->inst_spec = inst_specp; 13601ae08745Sheppo vswp->mdeg_hdl = mdeg_hdl; 136134683adeSsg70180 vswp->mdeg_port_hdl = mdeg_port_hdl; 13621ae08745Sheppo 13631ae08745Sheppo D1(vswp, "%s: exit", __func__); 136434683adeSsg70180 return (0); 136534683adeSsg70180 136634683adeSsg70180 mdeg_reg_fail: 136734683adeSsg70180 cmn_err(CE_WARN, "!vsw%d: Unable to register MDEG callbacks", 136834683adeSsg70180 vswp->instance); 136934683adeSsg70180 kmem_free(pspecp, templatesz); 137034683adeSsg70180 kmem_free(inst_specp, sizeof (mdeg_node_spec_t)); 137134683adeSsg70180 137234683adeSsg70180 vswp->mdeg_hdl = NULL; 137334683adeSsg70180 vswp->mdeg_port_hdl = NULL; 137434683adeSsg70180 137534683adeSsg70180 return (1); 13761ae08745Sheppo } 13771ae08745Sheppo 13781ae08745Sheppo static void 13791ae08745Sheppo vsw_mdeg_unregister(vsw_t *vswp) 13801ae08745Sheppo { 13811ae08745Sheppo D1(vswp, "vsw_mdeg_unregister: enter"); 13821ae08745Sheppo 138334683adeSsg70180 if (vswp->mdeg_hdl != NULL) 13841ae08745Sheppo (void) mdeg_unregister(vswp->mdeg_hdl); 13851ae08745Sheppo 138634683adeSsg70180 if (vswp->mdeg_port_hdl != NULL) 138734683adeSsg70180 (void) mdeg_unregister(vswp->mdeg_port_hdl); 138834683adeSsg70180 138934683adeSsg70180 if (vswp->inst_spec != NULL) { 13901ae08745Sheppo if (vswp->inst_spec->specp != NULL) { 13911ae08745Sheppo (void) kmem_free(vswp->inst_spec->specp, 13921ae08745Sheppo sizeof (vsw_prop_template)); 13931ae08745Sheppo vswp->inst_spec->specp = NULL; 13941ae08745Sheppo } 13951ae08745Sheppo 1396205eeb1aSlm66018 (void) kmem_free(vswp->inst_spec, sizeof (mdeg_node_spec_t)); 13971ae08745Sheppo vswp->inst_spec = NULL; 13981ae08745Sheppo } 13991ae08745Sheppo 14001ae08745Sheppo D1(vswp, "vsw_mdeg_unregister: exit"); 14011ae08745Sheppo } 14021ae08745Sheppo 140334683adeSsg70180 /* 140434683adeSsg70180 * Mdeg callback invoked for the vsw node itself. 140534683adeSsg70180 */ 14061ae08745Sheppo static int 14071ae08745Sheppo vsw_mdeg_cb(void *cb_argp, mdeg_result_t *resp) 14081ae08745Sheppo { 14091ae08745Sheppo vsw_t *vswp; 14101ae08745Sheppo md_t *mdp; 14111ae08745Sheppo mde_cookie_t node; 14121ae08745Sheppo uint64_t inst; 141334683adeSsg70180 char *node_name = NULL; 14141ae08745Sheppo 14151ae08745Sheppo if (resp == NULL) 14161ae08745Sheppo return (MDEG_FAILURE); 14171ae08745Sheppo 14181ae08745Sheppo vswp = (vsw_t *)cb_argp; 14191ae08745Sheppo 142034683adeSsg70180 D1(vswp, "%s: added %d : removed %d : curr matched %d" 142134683adeSsg70180 " : prev matched %d", __func__, resp->added.nelem, 142234683adeSsg70180 resp->removed.nelem, resp->match_curr.nelem, 142334683adeSsg70180 resp->match_prev.nelem); 142434683adeSsg70180 142534683adeSsg70180 /* 142619b65a69Ssb155480 * We get an initial callback for this node as 'added' 142719b65a69Ssb155480 * after registering with mdeg. Note that we would have 142819b65a69Ssb155480 * already gathered information about this vsw node by 142919b65a69Ssb155480 * walking MD earlier during attach (in vsw_read_mdprops()). 143019b65a69Ssb155480 * So, there is a window where the properties of this 143119b65a69Ssb155480 * node might have changed when we get this initial 'added' 143219b65a69Ssb155480 * callback. We handle this as if an update occured 143319b65a69Ssb155480 * and invoke the same function which handles updates to 143419b65a69Ssb155480 * the properties of this vsw-node if any. 143519b65a69Ssb155480 * 143634683adeSsg70180 * A non-zero 'match' value indicates that the MD has been 143719b65a69Ssb155480 * updated and that a virtual-network-switch node is 143819b65a69Ssb155480 * present which may or may not have been updated. It is 143919b65a69Ssb155480 * up to the clients to examine their own nodes and 144019b65a69Ssb155480 * determine if they have changed. 144134683adeSsg70180 */ 144219b65a69Ssb155480 if (resp->added.nelem != 0) { 144334683adeSsg70180 144419b65a69Ssb155480 if (resp->added.nelem != 1) { 144519b65a69Ssb155480 cmn_err(CE_NOTE, "!vsw%d: number of nodes added " 144619b65a69Ssb155480 "invalid: %d\n", vswp->instance, resp->added.nelem); 144719b65a69Ssb155480 return (MDEG_FAILURE); 144819b65a69Ssb155480 } 144919b65a69Ssb155480 145019b65a69Ssb155480 mdp = resp->added.mdp; 145119b65a69Ssb155480 node = resp->added.mdep[0]; 145219b65a69Ssb155480 145319b65a69Ssb155480 } else if (resp->match_curr.nelem != 0) { 145419b65a69Ssb155480 145519b65a69Ssb155480 if (resp->match_curr.nelem != 1) { 145619b65a69Ssb155480 cmn_err(CE_NOTE, "!vsw%d: number of nodes updated " 145719b65a69Ssb155480 "invalid: %d\n", vswp->instance, 145819b65a69Ssb155480 resp->match_curr.nelem); 145919b65a69Ssb155480 return (MDEG_FAILURE); 146019b65a69Ssb155480 } 146119b65a69Ssb155480 146219b65a69Ssb155480 mdp = resp->match_curr.mdp; 146319b65a69Ssb155480 node = resp->match_curr.mdep[0]; 146419b65a69Ssb155480 146519b65a69Ssb155480 } else { 146619b65a69Ssb155480 return (MDEG_FAILURE); 146719b65a69Ssb155480 } 146819b65a69Ssb155480 146919b65a69Ssb155480 /* Validate name and instance */ 147034683adeSsg70180 if (md_get_prop_str(mdp, node, "name", &node_name) != 0) { 147119b65a69Ssb155480 DERR(vswp, "%s: unable to get node name\n", __func__); 147219b65a69Ssb155480 return (MDEG_FAILURE); 147319b65a69Ssb155480 } 147419b65a69Ssb155480 147519b65a69Ssb155480 /* is this a virtual-network-switch? */ 147619b65a69Ssb155480 if (strcmp(node_name, vsw_propname) != 0) { 147719b65a69Ssb155480 DERR(vswp, "%s: Invalid node name: %s\n", 147819b65a69Ssb155480 __func__, node_name); 147919b65a69Ssb155480 return (MDEG_FAILURE); 148034683adeSsg70180 } 148134683adeSsg70180 148234683adeSsg70180 if (md_get_prop_val(mdp, node, "cfg-handle", &inst)) { 148319b65a69Ssb155480 DERR(vswp, "%s: prop(cfg-handle) not found\n", 148419b65a69Ssb155480 __func__); 148519b65a69Ssb155480 return (MDEG_FAILURE); 148634683adeSsg70180 } 148734683adeSsg70180 148819b65a69Ssb155480 /* is this the right instance of vsw? */ 148919b65a69Ssb155480 if (inst != vswp->regprop) { 149019b65a69Ssb155480 DERR(vswp, "%s: Invalid cfg-handle: %lx\n", 149119b65a69Ssb155480 __func__, inst); 149219b65a69Ssb155480 return (MDEG_FAILURE); 149319b65a69Ssb155480 } 149434683adeSsg70180 149534683adeSsg70180 vsw_update_md_prop(vswp, mdp, node); 149634683adeSsg70180 149734683adeSsg70180 return (MDEG_SUCCESS); 149834683adeSsg70180 } 149934683adeSsg70180 150034683adeSsg70180 /* 150134683adeSsg70180 * Mdeg callback invoked for changes to the vsw-port nodes 150234683adeSsg70180 * under the vsw node. 150334683adeSsg70180 */ 150434683adeSsg70180 static int 150534683adeSsg70180 vsw_port_mdeg_cb(void *cb_argp, mdeg_result_t *resp) 150634683adeSsg70180 { 150734683adeSsg70180 vsw_t *vswp; 150834683adeSsg70180 int idx; 150934683adeSsg70180 md_t *mdp; 151034683adeSsg70180 mde_cookie_t node; 151134683adeSsg70180 uint64_t inst; 15121ef0bbb5Snarayan int rv; 151334683adeSsg70180 151434683adeSsg70180 if ((resp == NULL) || (cb_argp == NULL)) 151534683adeSsg70180 return (MDEG_FAILURE); 151634683adeSsg70180 151734683adeSsg70180 vswp = (vsw_t *)cb_argp; 151834683adeSsg70180 151934683adeSsg70180 D2(vswp, "%s: added %d : removed %d : curr matched %d" 152034683adeSsg70180 " : prev matched %d", __func__, resp->added.nelem, 152134683adeSsg70180 resp->removed.nelem, resp->match_curr.nelem, 15221ae08745Sheppo resp->match_prev.nelem); 15231ae08745Sheppo 15241ae08745Sheppo /* process added ports */ 15251ae08745Sheppo for (idx = 0; idx < resp->added.nelem; idx++) { 15261ae08745Sheppo mdp = resp->added.mdp; 15271ae08745Sheppo node = resp->added.mdep[idx]; 15281ae08745Sheppo 15291ae08745Sheppo D2(vswp, "%s: adding node(%d) 0x%lx", __func__, idx, node); 15301ae08745Sheppo 15311ef0bbb5Snarayan if ((rv = vsw_port_add(vswp, mdp, &node)) != 0) { 153234683adeSsg70180 cmn_err(CE_WARN, "!vsw%d: Unable to add new port " 15331ef0bbb5Snarayan "(0x%lx), err=%d", vswp->instance, node, rv); 15341ae08745Sheppo } 15351ae08745Sheppo } 15361ae08745Sheppo 15371ae08745Sheppo /* process removed ports */ 15381ae08745Sheppo for (idx = 0; idx < resp->removed.nelem; idx++) { 15391ae08745Sheppo mdp = resp->removed.mdp; 15401ae08745Sheppo node = resp->removed.mdep[idx]; 15411ae08745Sheppo 15421ae08745Sheppo if (md_get_prop_val(mdp, node, id_propname, &inst)) { 154334683adeSsg70180 DERR(vswp, "%s: prop(%s) not found in port(%d)", 15441ae08745Sheppo __func__, id_propname, idx); 15451ae08745Sheppo continue; 15461ae08745Sheppo } 15471ae08745Sheppo 15481ae08745Sheppo D2(vswp, "%s: removing node(%d) 0x%lx", __func__, idx, node); 15491ae08745Sheppo 15501ae08745Sheppo if (vsw_port_detach(vswp, inst) != 0) { 155134683adeSsg70180 cmn_err(CE_WARN, "!vsw%d: Unable to remove port %ld", 155234683adeSsg70180 vswp->instance, inst); 15531ae08745Sheppo } 15541ae08745Sheppo } 15551ae08745Sheppo 1556c1c61f44Ssb155480 for (idx = 0; idx < resp->match_curr.nelem; idx++) { 1557c1c61f44Ssb155480 (void) vsw_port_update(vswp, resp->match_curr.mdp, 1558c1c61f44Ssb155480 resp->match_curr.mdep[idx], 1559c1c61f44Ssb155480 resp->match_prev.mdp, 1560c1c61f44Ssb155480 resp->match_prev.mdep[idx]); 1561c1c61f44Ssb155480 } 15621ae08745Sheppo 15631ae08745Sheppo D1(vswp, "%s: exit", __func__); 15641ae08745Sheppo 15651ae08745Sheppo return (MDEG_SUCCESS); 15661ae08745Sheppo } 15671ae08745Sheppo 15681ae08745Sheppo /* 156919b65a69Ssb155480 * Scan the machine description for this instance of vsw 157019b65a69Ssb155480 * and read its properties. Called only from vsw_attach(). 157119b65a69Ssb155480 * Returns: 0 on success, 1 on failure. 157219b65a69Ssb155480 */ 157319b65a69Ssb155480 static int 157419b65a69Ssb155480 vsw_read_mdprops(vsw_t *vswp) 157519b65a69Ssb155480 { 157619b65a69Ssb155480 md_t *mdp = NULL; 157719b65a69Ssb155480 mde_cookie_t rootnode; 157819b65a69Ssb155480 mde_cookie_t *listp = NULL; 157919b65a69Ssb155480 uint64_t inst; 158019b65a69Ssb155480 uint64_t cfgh; 158119b65a69Ssb155480 char *name; 158219b65a69Ssb155480 int rv = 1; 158319b65a69Ssb155480 int num_nodes = 0; 158419b65a69Ssb155480 int num_devs = 0; 158519b65a69Ssb155480 int listsz = 0; 158619b65a69Ssb155480 int i; 158719b65a69Ssb155480 158819b65a69Ssb155480 /* 158919b65a69Ssb155480 * In each 'virtual-device' node in the MD there is a 159019b65a69Ssb155480 * 'cfg-handle' property which is the MD's concept of 159119b65a69Ssb155480 * an instance number (this may be completely different from 159219b65a69Ssb155480 * the device drivers instance #). OBP reads that value and 159319b65a69Ssb155480 * stores it in the 'reg' property of the appropriate node in 159419b65a69Ssb155480 * the device tree. We first read this reg property and use this 159519b65a69Ssb155480 * to compare against the 'cfg-handle' property of vsw nodes 159619b65a69Ssb155480 * in MD to get to this specific vsw instance and then read 159719b65a69Ssb155480 * other properties that we are interested in. 159819b65a69Ssb155480 * We also cache the value of 'reg' property and use it later 159919b65a69Ssb155480 * to register callbacks with mdeg (see vsw_mdeg_register()) 160019b65a69Ssb155480 */ 160119b65a69Ssb155480 inst = ddi_prop_get_int(DDI_DEV_T_ANY, vswp->dip, 160219b65a69Ssb155480 DDI_PROP_DONTPASS, reg_propname, -1); 160319b65a69Ssb155480 if (inst == -1) { 160419b65a69Ssb155480 cmn_err(CE_NOTE, "!vsw%d: Unable to read %s property from " 160519b65a69Ssb155480 "OBP device tree", vswp->instance, reg_propname); 160619b65a69Ssb155480 return (rv); 160719b65a69Ssb155480 } 160819b65a69Ssb155480 160919b65a69Ssb155480 vswp->regprop = inst; 161019b65a69Ssb155480 161119b65a69Ssb155480 if ((mdp = md_get_handle()) == NULL) { 161219b65a69Ssb155480 DWARN(vswp, "%s: cannot init MD\n", __func__); 161319b65a69Ssb155480 return (rv); 161419b65a69Ssb155480 } 161519b65a69Ssb155480 161619b65a69Ssb155480 num_nodes = md_node_count(mdp); 161719b65a69Ssb155480 ASSERT(num_nodes > 0); 161819b65a69Ssb155480 161919b65a69Ssb155480 listsz = num_nodes * sizeof (mde_cookie_t); 162019b65a69Ssb155480 listp = (mde_cookie_t *)kmem_zalloc(listsz, KM_SLEEP); 162119b65a69Ssb155480 162219b65a69Ssb155480 rootnode = md_root_node(mdp); 162319b65a69Ssb155480 162419b65a69Ssb155480 /* search for all "virtual_device" nodes */ 162519b65a69Ssb155480 num_devs = md_scan_dag(mdp, rootnode, 162619b65a69Ssb155480 md_find_name(mdp, vdev_propname), 162719b65a69Ssb155480 md_find_name(mdp, "fwd"), listp); 162819b65a69Ssb155480 if (num_devs <= 0) { 162919b65a69Ssb155480 DWARN(vswp, "%s: invalid num_devs:%d\n", __func__, num_devs); 163019b65a69Ssb155480 goto vsw_readmd_exit; 163119b65a69Ssb155480 } 163219b65a69Ssb155480 163319b65a69Ssb155480 /* 163419b65a69Ssb155480 * Now loop through the list of virtual-devices looking for 163519b65a69Ssb155480 * devices with name "virtual-network-switch" and for each 163619b65a69Ssb155480 * such device compare its instance with what we have from 163719b65a69Ssb155480 * the 'reg' property to find the right node in MD and then 163819b65a69Ssb155480 * read all its properties. 163919b65a69Ssb155480 */ 164019b65a69Ssb155480 for (i = 0; i < num_devs; i++) { 164119b65a69Ssb155480 164219b65a69Ssb155480 if (md_get_prop_str(mdp, listp[i], "name", &name) != 0) { 164319b65a69Ssb155480 DWARN(vswp, "%s: name property not found\n", 164419b65a69Ssb155480 __func__); 164519b65a69Ssb155480 goto vsw_readmd_exit; 164619b65a69Ssb155480 } 164719b65a69Ssb155480 164819b65a69Ssb155480 /* is this a virtual-network-switch? */ 164919b65a69Ssb155480 if (strcmp(name, vsw_propname) != 0) 165019b65a69Ssb155480 continue; 165119b65a69Ssb155480 165219b65a69Ssb155480 if (md_get_prop_val(mdp, listp[i], "cfg-handle", &cfgh) != 0) { 165319b65a69Ssb155480 DWARN(vswp, "%s: cfg-handle property not found\n", 165419b65a69Ssb155480 __func__); 165519b65a69Ssb155480 goto vsw_readmd_exit; 165619b65a69Ssb155480 } 165719b65a69Ssb155480 165819b65a69Ssb155480 /* is this the required instance of vsw? */ 165919b65a69Ssb155480 if (inst != cfgh) 166019b65a69Ssb155480 continue; 166119b65a69Ssb155480 166219b65a69Ssb155480 /* now read all properties of this vsw instance */ 166319b65a69Ssb155480 rv = vsw_get_initial_md_properties(vswp, mdp, listp[i]); 166419b65a69Ssb155480 break; 166519b65a69Ssb155480 } 166619b65a69Ssb155480 166719b65a69Ssb155480 vsw_readmd_exit: 166819b65a69Ssb155480 166919b65a69Ssb155480 kmem_free(listp, listsz); 167019b65a69Ssb155480 (void) md_fini_handle(mdp); 167119b65a69Ssb155480 return (rv); 167219b65a69Ssb155480 } 167319b65a69Ssb155480 167419b65a69Ssb155480 /* 167534683adeSsg70180 * Read the initial start-of-day values from the specified MD node. 167634683adeSsg70180 */ 167719b65a69Ssb155480 static int 167834683adeSsg70180 vsw_get_initial_md_properties(vsw_t *vswp, md_t *mdp, mde_cookie_t node) 167934683adeSsg70180 { 168034683adeSsg70180 uint64_t macaddr = 0; 168134683adeSsg70180 168234683adeSsg70180 D1(vswp, "%s: enter", __func__); 168334683adeSsg70180 168419b65a69Ssb155480 if (vsw_get_md_physname(vswp, mdp, node, vswp->physname) != 0) { 168519b65a69Ssb155480 return (1); 168634683adeSsg70180 } 168734683adeSsg70180 168834683adeSsg70180 /* mac address for vswitch device itself */ 168934683adeSsg70180 if (md_get_prop_val(mdp, node, macaddr_propname, &macaddr) != 0) { 169034683adeSsg70180 cmn_err(CE_WARN, "!vsw%d: Unable to get MAC address from MD", 169134683adeSsg70180 vswp->instance); 169219b65a69Ssb155480 return (1); 169319b65a69Ssb155480 } 169434683adeSsg70180 169519b65a69Ssb155480 vsw_save_lmacaddr(vswp, macaddr); 169634683adeSsg70180 1697da14cebeSEric Cheng if (vsw_get_md_smodes(vswp, mdp, node, &vswp->smode)) { 16981ef0bbb5Snarayan DWARN(vswp, "%s: Unable to read %s property from MD, " 16991ef0bbb5Snarayan "defaulting to 'switched' mode", 17001ef0bbb5Snarayan __func__, smode_propname); 170134683adeSsg70180 1702da14cebeSEric Cheng vswp->smode = VSW_LAYER2; 170334683adeSsg70180 } 170434683adeSsg70180 17057b1f684aSSriharsha Basavapatna /* read mtu */ 17067b1f684aSSriharsha Basavapatna vsw_mtu_read(vswp, mdp, node, &vswp->mtu); 17077b1f684aSSriharsha Basavapatna if (vswp->mtu < ETHERMTU || vswp->mtu > VNET_MAX_MTU) { 17087b1f684aSSriharsha Basavapatna vswp->mtu = ETHERMTU; 17097b1f684aSSriharsha Basavapatna } 17107b1f684aSSriharsha Basavapatna vswp->max_frame_size = vswp->mtu + sizeof (struct ether_header) + 17117b1f684aSSriharsha Basavapatna VLAN_TAGSZ; 17127b1f684aSSriharsha Basavapatna 1713c1c61f44Ssb155480 /* read vlan id properties of this vsw instance */ 1714c1c61f44Ssb155480 vsw_vlan_read_ids(vswp, VSW_LOCALDEV, mdp, node, &vswp->pvid, 1715c1c61f44Ssb155480 &vswp->vids, &vswp->nvids, &vswp->default_vlan_id); 1716c1c61f44Ssb155480 1717c1c61f44Ssb155480 /* read priority-ether-types */ 1718f0ca1d9aSsb155480 vsw_read_pri_eth_types(vswp, mdp, node); 1719f0ca1d9aSsb155480 172034683adeSsg70180 D1(vswp, "%s: exit", __func__); 172119b65a69Ssb155480 return (0); 172234683adeSsg70180 } 172334683adeSsg70180 172434683adeSsg70180 /* 1725c1c61f44Ssb155480 * Read vlan id properties of the given MD node. 1726c1c61f44Ssb155480 * Arguments: 1727c1c61f44Ssb155480 * arg: device argument(vsw device or a port) 1728c1c61f44Ssb155480 * type: type of arg; VSW_LOCALDEV(vsw device) or VSW_VNETPORT(port) 1729c1c61f44Ssb155480 * mdp: machine description 1730c1c61f44Ssb155480 * node: md node cookie 1731c1c61f44Ssb155480 * 1732c1c61f44Ssb155480 * Returns: 1733c1c61f44Ssb155480 * pvidp: port-vlan-id of the node 1734c1c61f44Ssb155480 * vidspp: list of vlan-ids of the node 1735c1c61f44Ssb155480 * nvidsp: # of vlan-ids in the list 1736c1c61f44Ssb155480 * default_idp: default-vlan-id of the node(if node is vsw device) 1737c1c61f44Ssb155480 */ 1738c1c61f44Ssb155480 static void 1739c1c61f44Ssb155480 vsw_vlan_read_ids(void *arg, int type, md_t *mdp, mde_cookie_t node, 1740da14cebeSEric Cheng uint16_t *pvidp, vsw_vlanid_t **vidspp, uint16_t *nvidsp, 1741c1c61f44Ssb155480 uint16_t *default_idp) 1742c1c61f44Ssb155480 { 1743c1c61f44Ssb155480 vsw_t *vswp; 1744c1c61f44Ssb155480 vsw_port_t *portp; 1745c1c61f44Ssb155480 char *pvid_propname; 1746c1c61f44Ssb155480 char *vid_propname; 1747c1c61f44Ssb155480 uint_t nvids = 0; 1748c1c61f44Ssb155480 uint32_t vids_size; 1749c1c61f44Ssb155480 int rv; 1750c1c61f44Ssb155480 int i; 1751c1c61f44Ssb155480 uint64_t *data; 1752c1c61f44Ssb155480 uint64_t val; 1753c1c61f44Ssb155480 int size; 1754c1c61f44Ssb155480 int inst; 1755c1c61f44Ssb155480 1756c1c61f44Ssb155480 if (type == VSW_LOCALDEV) { 1757c1c61f44Ssb155480 1758c1c61f44Ssb155480 vswp = (vsw_t *)arg; 1759c1c61f44Ssb155480 pvid_propname = vsw_pvid_propname; 1760c1c61f44Ssb155480 vid_propname = vsw_vid_propname; 1761c1c61f44Ssb155480 inst = vswp->instance; 1762c1c61f44Ssb155480 1763c1c61f44Ssb155480 } else if (type == VSW_VNETPORT) { 1764c1c61f44Ssb155480 1765c1c61f44Ssb155480 portp = (vsw_port_t *)arg; 1766c1c61f44Ssb155480 vswp = portp->p_vswp; 1767c1c61f44Ssb155480 pvid_propname = port_pvid_propname; 1768c1c61f44Ssb155480 vid_propname = port_vid_propname; 1769c1c61f44Ssb155480 inst = portp->p_instance; 1770c1c61f44Ssb155480 1771c1c61f44Ssb155480 } else { 1772c1c61f44Ssb155480 return; 1773c1c61f44Ssb155480 } 1774c1c61f44Ssb155480 1775c1c61f44Ssb155480 if (type == VSW_LOCALDEV && default_idp != NULL) { 1776c1c61f44Ssb155480 rv = md_get_prop_val(mdp, node, vsw_dvid_propname, &val); 1777c1c61f44Ssb155480 if (rv != 0) { 1778c1c61f44Ssb155480 DWARN(vswp, "%s: prop(%s) not found", __func__, 1779c1c61f44Ssb155480 vsw_dvid_propname); 1780c1c61f44Ssb155480 1781c1c61f44Ssb155480 *default_idp = vsw_default_vlan_id; 1782c1c61f44Ssb155480 } else { 1783c1c61f44Ssb155480 *default_idp = val & 0xFFF; 1784c1c61f44Ssb155480 D2(vswp, "%s: %s(%d): (%d)\n", __func__, 1785c1c61f44Ssb155480 vsw_dvid_propname, inst, *default_idp); 1786c1c61f44Ssb155480 } 1787c1c61f44Ssb155480 } 1788c1c61f44Ssb155480 1789c1c61f44Ssb155480 rv = md_get_prop_val(mdp, node, pvid_propname, &val); 1790c1c61f44Ssb155480 if (rv != 0) { 1791c1c61f44Ssb155480 DWARN(vswp, "%s: prop(%s) not found", __func__, pvid_propname); 1792c1c61f44Ssb155480 *pvidp = vsw_default_vlan_id; 1793c1c61f44Ssb155480 } else { 1794c1c61f44Ssb155480 1795c1c61f44Ssb155480 *pvidp = val & 0xFFF; 1796c1c61f44Ssb155480 D2(vswp, "%s: %s(%d): (%d)\n", __func__, 1797c1c61f44Ssb155480 pvid_propname, inst, *pvidp); 1798c1c61f44Ssb155480 } 1799c1c61f44Ssb155480 1800c1c61f44Ssb155480 rv = md_get_prop_data(mdp, node, vid_propname, (uint8_t **)&data, 1801c1c61f44Ssb155480 &size); 1802c1c61f44Ssb155480 if (rv != 0) { 1803c1c61f44Ssb155480 D2(vswp, "%s: prop(%s) not found", __func__, vid_propname); 1804c1c61f44Ssb155480 size = 0; 1805c1c61f44Ssb155480 } else { 1806c1c61f44Ssb155480 size /= sizeof (uint64_t); 1807c1c61f44Ssb155480 } 1808c1c61f44Ssb155480 nvids = size; 1809c1c61f44Ssb155480 1810c1c61f44Ssb155480 if (nvids != 0) { 1811c1c61f44Ssb155480 D2(vswp, "%s: %s(%d): ", __func__, vid_propname, inst); 1812da14cebeSEric Cheng vids_size = sizeof (vsw_vlanid_t) * nvids; 1813c1c61f44Ssb155480 *vidspp = kmem_zalloc(vids_size, KM_SLEEP); 1814c1c61f44Ssb155480 for (i = 0; i < nvids; i++) { 1815da14cebeSEric Cheng (*vidspp)[i].vl_vid = data[i] & 0xFFFF; 1816da14cebeSEric Cheng (*vidspp)[i].vl_set = B_FALSE; 1817da14cebeSEric Cheng D2(vswp, " %d ", (*vidspp)[i].vl_vid); 1818c1c61f44Ssb155480 } 1819c1c61f44Ssb155480 D2(vswp, "\n"); 1820c1c61f44Ssb155480 } 1821c1c61f44Ssb155480 1822c1c61f44Ssb155480 *nvidsp = nvids; 1823c1c61f44Ssb155480 } 1824c1c61f44Ssb155480 1825c1c61f44Ssb155480 /* 1826f0ca1d9aSsb155480 * This function reads "priority-ether-types" property from md. This property 1827f0ca1d9aSsb155480 * is used to enable support for priority frames. Applications which need 1828f0ca1d9aSsb155480 * guaranteed and timely delivery of certain high priority frames to/from 1829f0ca1d9aSsb155480 * a vnet or vsw within ldoms, should configure this property by providing 1830f0ca1d9aSsb155480 * the ether type(s) for which the priority facility is needed. 1831f0ca1d9aSsb155480 * Normal data frames are delivered over a ldc channel using the descriptor 1832f0ca1d9aSsb155480 * ring mechanism which is constrained by factors such as descriptor ring size, 1833f0ca1d9aSsb155480 * the rate at which the ring is processed at the peer ldc end point, etc. 1834f0ca1d9aSsb155480 * The priority mechanism provides an Out-Of-Band path to send/receive frames 1835f0ca1d9aSsb155480 * as raw pkt data (VIO_PKT_DATA) messages over the channel, avoiding the 1836f0ca1d9aSsb155480 * descriptor ring path and enables a more reliable and timely delivery of 1837f0ca1d9aSsb155480 * frames to the peer. 1838f0ca1d9aSsb155480 */ 1839f0ca1d9aSsb155480 static void 1840f0ca1d9aSsb155480 vsw_read_pri_eth_types(vsw_t *vswp, md_t *mdp, mde_cookie_t node) 1841f0ca1d9aSsb155480 { 1842f0ca1d9aSsb155480 int rv; 1843f0ca1d9aSsb155480 uint16_t *types; 1844f0ca1d9aSsb155480 uint64_t *data; 1845f0ca1d9aSsb155480 int size; 1846f0ca1d9aSsb155480 int i; 1847f0ca1d9aSsb155480 size_t mblk_sz; 1848f0ca1d9aSsb155480 1849f0ca1d9aSsb155480 rv = md_get_prop_data(mdp, node, pri_types_propname, 1850f0ca1d9aSsb155480 (uint8_t **)&data, &size); 1851f0ca1d9aSsb155480 if (rv != 0) { 1852f0ca1d9aSsb155480 /* 1853f0ca1d9aSsb155480 * Property may not exist if we are running pre-ldoms1.1 f/w. 1854f0ca1d9aSsb155480 * Check if 'vsw_pri_eth_type' has been set in that case. 1855f0ca1d9aSsb155480 */ 1856f0ca1d9aSsb155480 if (vsw_pri_eth_type != 0) { 1857f0ca1d9aSsb155480 size = sizeof (vsw_pri_eth_type); 1858f0ca1d9aSsb155480 data = &vsw_pri_eth_type; 1859f0ca1d9aSsb155480 } else { 1860f0ca1d9aSsb155480 D3(vswp, "%s: prop(%s) not found", __func__, 1861f0ca1d9aSsb155480 pri_types_propname); 1862f0ca1d9aSsb155480 size = 0; 1863f0ca1d9aSsb155480 } 1864f0ca1d9aSsb155480 } 1865f0ca1d9aSsb155480 1866f0ca1d9aSsb155480 if (size == 0) { 1867f0ca1d9aSsb155480 vswp->pri_num_types = 0; 1868f0ca1d9aSsb155480 return; 1869f0ca1d9aSsb155480 } 1870f0ca1d9aSsb155480 1871f0ca1d9aSsb155480 /* 1872f0ca1d9aSsb155480 * we have some priority-ether-types defined; 1873f0ca1d9aSsb155480 * allocate a table of these types and also 1874f0ca1d9aSsb155480 * allocate a pool of mblks to transmit these 1875f0ca1d9aSsb155480 * priority packets. 1876f0ca1d9aSsb155480 */ 1877f0ca1d9aSsb155480 size /= sizeof (uint64_t); 1878f0ca1d9aSsb155480 vswp->pri_num_types = size; 1879f0ca1d9aSsb155480 vswp->pri_types = kmem_zalloc(size * sizeof (uint16_t), KM_SLEEP); 1880f0ca1d9aSsb155480 for (i = 0, types = vswp->pri_types; i < size; i++) { 1881f0ca1d9aSsb155480 types[i] = data[i] & 0xFFFF; 1882f0ca1d9aSsb155480 } 1883f0ca1d9aSsb155480 mblk_sz = (VIO_PKT_DATA_HDRSIZE + ETHERMAX + 7) & ~7; 1884f0ca1d9aSsb155480 (void) vio_create_mblks(vsw_pri_tx_nmblks, mblk_sz, &vswp->pri_tx_vmp); 1885f0ca1d9aSsb155480 } 1886f0ca1d9aSsb155480 18877b1f684aSSriharsha Basavapatna static void 18887b1f684aSSriharsha Basavapatna vsw_mtu_read(vsw_t *vswp, md_t *mdp, mde_cookie_t node, uint32_t *mtu) 18897b1f684aSSriharsha Basavapatna { 18907b1f684aSSriharsha Basavapatna int rv; 18917b1f684aSSriharsha Basavapatna int inst; 18927b1f684aSSriharsha Basavapatna uint64_t val; 18937b1f684aSSriharsha Basavapatna char *mtu_propname; 18947b1f684aSSriharsha Basavapatna 18957b1f684aSSriharsha Basavapatna mtu_propname = vsw_mtu_propname; 18967b1f684aSSriharsha Basavapatna inst = vswp->instance; 18977b1f684aSSriharsha Basavapatna 18987b1f684aSSriharsha Basavapatna rv = md_get_prop_val(mdp, node, mtu_propname, &val); 18997b1f684aSSriharsha Basavapatna if (rv != 0) { 19007b1f684aSSriharsha Basavapatna D3(vswp, "%s: prop(%s) not found", __func__, mtu_propname); 19017b1f684aSSriharsha Basavapatna *mtu = vsw_ethermtu; 19027b1f684aSSriharsha Basavapatna } else { 19037b1f684aSSriharsha Basavapatna 19047b1f684aSSriharsha Basavapatna *mtu = val & 0xFFFF; 19057b1f684aSSriharsha Basavapatna D2(vswp, "%s: %s(%d): (%d)\n", __func__, 19067b1f684aSSriharsha Basavapatna mtu_propname, inst, *mtu); 19077b1f684aSSriharsha Basavapatna } 19087b1f684aSSriharsha Basavapatna } 19097b1f684aSSriharsha Basavapatna 19107b1f684aSSriharsha Basavapatna /* 19117b1f684aSSriharsha Basavapatna * Update the mtu of the vsw device. We first check if the device has been 19127b1f684aSSriharsha Basavapatna * plumbed and if so fail the mtu update. Otherwise, we continue to update the 19137b1f684aSSriharsha Basavapatna * new mtu and reset all ports to initiate handshake re-negotiation with peers 19147b1f684aSSriharsha Basavapatna * using the new mtu. 19157b1f684aSSriharsha Basavapatna */ 19167b1f684aSSriharsha Basavapatna static int 19177b1f684aSSriharsha Basavapatna vsw_mtu_update(vsw_t *vswp, uint32_t mtu) 19187b1f684aSSriharsha Basavapatna { 19197b1f684aSSriharsha Basavapatna int rv; 19207b1f684aSSriharsha Basavapatna 19217b1f684aSSriharsha Basavapatna WRITE_ENTER(&vswp->if_lockrw); 19227b1f684aSSriharsha Basavapatna 19237b1f684aSSriharsha Basavapatna if (vswp->if_state & VSW_IF_UP) { 19247b1f684aSSriharsha Basavapatna 19257b1f684aSSriharsha Basavapatna RW_EXIT(&vswp->if_lockrw); 19267b1f684aSSriharsha Basavapatna 19277b1f684aSSriharsha Basavapatna cmn_err(CE_NOTE, "!vsw%d: Unable to process mtu update" 19287b1f684aSSriharsha Basavapatna " as the device is plumbed\n", vswp->instance); 19297b1f684aSSriharsha Basavapatna return (EBUSY); 19307b1f684aSSriharsha Basavapatna 19317b1f684aSSriharsha Basavapatna } else { 19327b1f684aSSriharsha Basavapatna 19337b1f684aSSriharsha Basavapatna D2(vswp, "%s: curr_mtu(%d) new_mtu(%d)\n", 19347b1f684aSSriharsha Basavapatna __func__, vswp->mtu, mtu); 19357b1f684aSSriharsha Basavapatna 19367b1f684aSSriharsha Basavapatna vswp->mtu = mtu; 19377b1f684aSSriharsha Basavapatna vswp->max_frame_size = vswp->mtu + 19387b1f684aSSriharsha Basavapatna sizeof (struct ether_header) + VLAN_TAGSZ; 19397b1f684aSSriharsha Basavapatna 19407b1f684aSSriharsha Basavapatna rv = mac_maxsdu_update(vswp->if_mh, mtu); 19417b1f684aSSriharsha Basavapatna if (rv != 0) { 19427b1f684aSSriharsha Basavapatna cmn_err(CE_NOTE, 19437b1f684aSSriharsha Basavapatna "!vsw%d: Unable to update mtu with mac" 19447b1f684aSSriharsha Basavapatna " layer\n", vswp->instance); 19457b1f684aSSriharsha Basavapatna } 19467b1f684aSSriharsha Basavapatna 19477b1f684aSSriharsha Basavapatna RW_EXIT(&vswp->if_lockrw); 19487b1f684aSSriharsha Basavapatna 19497b1f684aSSriharsha Basavapatna /* Reset ports to renegotiate with the new mtu */ 19507b1f684aSSriharsha Basavapatna vsw_reset_ports(vswp); 19517b1f684aSSriharsha Basavapatna 19527b1f684aSSriharsha Basavapatna } 19537b1f684aSSriharsha Basavapatna 19547b1f684aSSriharsha Basavapatna return (0); 19557b1f684aSSriharsha Basavapatna } 19567b1f684aSSriharsha Basavapatna 1957f0ca1d9aSsb155480 /* 195834683adeSsg70180 * Check to see if the relevant properties in the specified node have 195934683adeSsg70180 * changed, and if so take the appropriate action. 196034683adeSsg70180 * 196134683adeSsg70180 * If any of the properties are missing or invalid we don't take 196234683adeSsg70180 * any action, as this function should only be invoked when modifications 196334683adeSsg70180 * have been made to what we assume is a working configuration, which 196434683adeSsg70180 * we leave active. 196534683adeSsg70180 * 196634683adeSsg70180 * Note it is legal for this routine to be invoked even if none of the 196734683adeSsg70180 * properties in the port node within the MD have actually changed. 196834683adeSsg70180 */ 196934683adeSsg70180 static void 197034683adeSsg70180 vsw_update_md_prop(vsw_t *vswp, md_t *mdp, mde_cookie_t node) 197134683adeSsg70180 { 197234683adeSsg70180 char physname[LIFNAMSIZ]; 197334683adeSsg70180 char drv[LIFNAMSIZ]; 197434683adeSsg70180 uint_t ddi_instance; 1975da14cebeSEric Cheng uint8_t new_smode; 1976da14cebeSEric Cheng int i; 197734683adeSsg70180 uint64_t macaddr = 0; 197834683adeSsg70180 enum {MD_init = 0x1, 197934683adeSsg70180 MD_physname = 0x2, 198034683adeSsg70180 MD_macaddr = 0x4, 1981c1c61f44Ssb155480 MD_smode = 0x8, 19827b1f684aSSriharsha Basavapatna MD_vlans = 0x10, 19837b1f684aSSriharsha Basavapatna MD_mtu = 0x20} updated; 198419b65a69Ssb155480 int rv; 1985c1c61f44Ssb155480 uint16_t pvid; 1986da14cebeSEric Cheng vsw_vlanid_t *vids; 1987c1c61f44Ssb155480 uint16_t nvids; 19887b1f684aSSriharsha Basavapatna uint32_t mtu; 198934683adeSsg70180 199034683adeSsg70180 updated = MD_init; 199134683adeSsg70180 199234683adeSsg70180 D1(vswp, "%s: enter", __func__); 199334683adeSsg70180 199434683adeSsg70180 /* 199534683adeSsg70180 * Check if name of physical device in MD has changed. 199634683adeSsg70180 */ 199734683adeSsg70180 if (vsw_get_md_physname(vswp, mdp, node, (char *)&physname) == 0) { 199834683adeSsg70180 /* 199934683adeSsg70180 * Do basic sanity check on new device name/instance, 200034683adeSsg70180 * if its non NULL. It is valid for the device name to 200134683adeSsg70180 * have changed from a non NULL to a NULL value, i.e. 200234683adeSsg70180 * the vsw is being changed to 'routed' mode. 200334683adeSsg70180 */ 200434683adeSsg70180 if ((strlen(physname) != 0) && 200519b65a69Ssb155480 (ddi_parse(physname, drv, 200619b65a69Ssb155480 &ddi_instance) != DDI_SUCCESS)) { 20071ef0bbb5Snarayan cmn_err(CE_WARN, "!vsw%d: physical device %s is not" 200834683adeSsg70180 " a valid device name/instance", 200934683adeSsg70180 vswp->instance, physname); 201034683adeSsg70180 goto fail_reconf; 201134683adeSsg70180 } 201234683adeSsg70180 201334683adeSsg70180 if (strcmp(physname, vswp->physname)) { 201434683adeSsg70180 D2(vswp, "%s: device name changed from %s to %s", 201534683adeSsg70180 __func__, vswp->physname, physname); 201634683adeSsg70180 201734683adeSsg70180 updated |= MD_physname; 201834683adeSsg70180 } else { 201934683adeSsg70180 D2(vswp, "%s: device name unchanged at %s", 202034683adeSsg70180 __func__, vswp->physname); 202134683adeSsg70180 } 202234683adeSsg70180 } else { 202334683adeSsg70180 cmn_err(CE_WARN, "!vsw%d: Unable to read name of physical " 202434683adeSsg70180 "device from updated MD.", vswp->instance); 202534683adeSsg70180 goto fail_reconf; 202634683adeSsg70180 } 202734683adeSsg70180 202834683adeSsg70180 /* 202934683adeSsg70180 * Check if MAC address has changed. 203034683adeSsg70180 */ 203134683adeSsg70180 if (md_get_prop_val(mdp, node, macaddr_propname, &macaddr) != 0) { 203234683adeSsg70180 cmn_err(CE_WARN, "!vsw%d: Unable to get MAC address from MD", 203334683adeSsg70180 vswp->instance); 203434683adeSsg70180 goto fail_reconf; 203534683adeSsg70180 } else { 203619b65a69Ssb155480 uint64_t maddr = macaddr; 203734683adeSsg70180 READ_ENTER(&vswp->if_lockrw); 203834683adeSsg70180 for (i = ETHERADDRL - 1; i >= 0; i--) { 203919b65a69Ssb155480 if (vswp->if_addr.ether_addr_octet[i] 204019b65a69Ssb155480 != (macaddr & 0xFF)) { 204134683adeSsg70180 D2(vswp, "%s: octet[%d] 0x%x != 0x%x", 204234683adeSsg70180 __func__, i, 204334683adeSsg70180 vswp->if_addr.ether_addr_octet[i], 204434683adeSsg70180 (macaddr & 0xFF)); 204534683adeSsg70180 updated |= MD_macaddr; 204619b65a69Ssb155480 macaddr = maddr; 204734683adeSsg70180 break; 204834683adeSsg70180 } 204934683adeSsg70180 macaddr >>= 8; 205034683adeSsg70180 } 205134683adeSsg70180 RW_EXIT(&vswp->if_lockrw); 205219b65a69Ssb155480 if (updated & MD_macaddr) { 205319b65a69Ssb155480 vsw_save_lmacaddr(vswp, macaddr); 205419b65a69Ssb155480 } 205534683adeSsg70180 } 205634683adeSsg70180 205734683adeSsg70180 /* 205834683adeSsg70180 * Check if switching modes have changed. 205934683adeSsg70180 */ 2060da14cebeSEric Cheng if (vsw_get_md_smodes(vswp, mdp, node, &new_smode)) { 206134683adeSsg70180 cmn_err(CE_WARN, "!vsw%d: Unable to read %s property from MD", 206234683adeSsg70180 vswp->instance, smode_propname); 206334683adeSsg70180 goto fail_reconf; 206434683adeSsg70180 } else { 2065da14cebeSEric Cheng if (new_smode != vswp->smode) { 2066da14cebeSEric Cheng D2(vswp, "%s: switching mode changed from %d to %d", 2067da14cebeSEric Cheng __func__, vswp->smode, new_smode); 206834683adeSsg70180 206934683adeSsg70180 updated |= MD_smode; 207034683adeSsg70180 } 207134683adeSsg70180 } 207234683adeSsg70180 2073c1c61f44Ssb155480 /* Read the vlan ids */ 2074c1c61f44Ssb155480 vsw_vlan_read_ids(vswp, VSW_LOCALDEV, mdp, node, &pvid, &vids, 2075c1c61f44Ssb155480 &nvids, NULL); 2076c1c61f44Ssb155480 2077c1c61f44Ssb155480 /* Determine if there are any vlan id updates */ 2078c1c61f44Ssb155480 if ((pvid != vswp->pvid) || /* pvid changed? */ 2079c1c61f44Ssb155480 (nvids != vswp->nvids) || /* # of vids changed? */ 2080c1c61f44Ssb155480 ((nvids != 0) && (vswp->nvids != 0) && /* vids changed? */ 2081da14cebeSEric Cheng !vsw_cmp_vids(vids, vswp->vids, nvids))) { 2082c1c61f44Ssb155480 updated |= MD_vlans; 2083c1c61f44Ssb155480 } 2084c1c61f44Ssb155480 20857b1f684aSSriharsha Basavapatna /* Read mtu */ 20867b1f684aSSriharsha Basavapatna vsw_mtu_read(vswp, mdp, node, &mtu); 20877b1f684aSSriharsha Basavapatna if (mtu != vswp->mtu) { 20887b1f684aSSriharsha Basavapatna if (mtu >= ETHERMTU && mtu <= VNET_MAX_MTU) { 20897b1f684aSSriharsha Basavapatna updated |= MD_mtu; 20907b1f684aSSriharsha Basavapatna } else { 20917b1f684aSSriharsha Basavapatna cmn_err(CE_NOTE, "!vsw%d: Unable to process mtu update" 20927b1f684aSSriharsha Basavapatna " as the specified value:%d is invalid\n", 20937b1f684aSSriharsha Basavapatna vswp->instance, mtu); 20947b1f684aSSriharsha Basavapatna } 20957b1f684aSSriharsha Basavapatna } 20967b1f684aSSriharsha Basavapatna 209734683adeSsg70180 /* 209834683adeSsg70180 * Now make any changes which are needed... 209934683adeSsg70180 */ 210034683adeSsg70180 2101da14cebeSEric Cheng if (updated & (MD_physname | MD_smode | MD_mtu)) { 210234683adeSsg70180 210334683adeSsg70180 /* 2104808f26a8SSriharsha Basavapatna * Stop any pending thread to setup switching mode. 210534683adeSsg70180 */ 2106808f26a8SSriharsha Basavapatna vsw_setup_switching_stop(vswp); 210719b65a69Ssb155480 2108678453a8Sspeer /* Cleanup HybridIO */ 2109678453a8Sspeer vsw_hio_cleanup(vswp); 2110678453a8Sspeer 211119b65a69Ssb155480 /* 211219b65a69Ssb155480 * Remove unicst, mcst addrs of vsw interface 2113da14cebeSEric Cheng * and ports from the physdev. This also closes 2114da14cebeSEric Cheng * the corresponding mac clients. 211519b65a69Ssb155480 */ 211619b65a69Ssb155480 vsw_unset_addrs(vswp); 211719b65a69Ssb155480 211819b65a69Ssb155480 /* 211919b65a69Ssb155480 * Stop, detach and close the old device.. 212019b65a69Ssb155480 */ 2121da14cebeSEric Cheng mutex_enter(&vswp->mac_lock); 212219b65a69Ssb155480 vsw_mac_close(vswp); 2123da14cebeSEric Cheng mutex_exit(&vswp->mac_lock); 212434683adeSsg70180 212534683adeSsg70180 /* 212634683adeSsg70180 * Update phys name. 212734683adeSsg70180 */ 212834683adeSsg70180 if (updated & MD_physname) { 212934683adeSsg70180 cmn_err(CE_NOTE, "!vsw%d: changing from %s to %s", 213034683adeSsg70180 vswp->instance, vswp->physname, physname); 213134683adeSsg70180 (void) strncpy(vswp->physname, 213234683adeSsg70180 physname, strlen(physname) + 1); 213334683adeSsg70180 } 213434683adeSsg70180 213534683adeSsg70180 /* 213634683adeSsg70180 * Update array with the new switch mode values. 213734683adeSsg70180 */ 213834683adeSsg70180 if (updated & MD_smode) { 2139da14cebeSEric Cheng vswp->smode = new_smode; 2140da14cebeSEric Cheng } 214134683adeSsg70180 2142da14cebeSEric Cheng /* Update mtu */ 2143da14cebeSEric Cheng if (updated & MD_mtu) { 2144da14cebeSEric Cheng rv = vsw_mtu_update(vswp, mtu); 2145da14cebeSEric Cheng if (rv != 0) { 2146da14cebeSEric Cheng goto fail_update; 2147da14cebeSEric Cheng } 214834683adeSsg70180 } 214934683adeSsg70180 215034683adeSsg70180 /* 215134683adeSsg70180 * ..and attach, start the new device. 215234683adeSsg70180 */ 215319b65a69Ssb155480 rv = vsw_setup_switching(vswp); 215419b65a69Ssb155480 if (rv == EAGAIN) { 215519b65a69Ssb155480 /* 215619b65a69Ssb155480 * Unable to setup switching mode. 2157808f26a8SSriharsha Basavapatna * As the error is EAGAIN, schedule a thread to retry 215819b65a69Ssb155480 * and return. Programming addresses of ports and 2159808f26a8SSriharsha Basavapatna * vsw interface will be done by the thread when the 2160808f26a8SSriharsha Basavapatna * switching setup completes successfully. 216119b65a69Ssb155480 */ 2162808f26a8SSriharsha Basavapatna if (vsw_setup_switching_start(vswp) != 0) { 2163808f26a8SSriharsha Basavapatna goto fail_update; 2164808f26a8SSriharsha Basavapatna } 216519b65a69Ssb155480 return; 216619b65a69Ssb155480 216719b65a69Ssb155480 } else if (rv) { 216834683adeSsg70180 goto fail_update; 216919b65a69Ssb155480 } 217034683adeSsg70180 217171bdf936SWENTAO YANG vsw_setup_layer2_post_process(vswp); 217219b65a69Ssb155480 } else if (updated & MD_macaddr) { 217319b65a69Ssb155480 /* 217419b65a69Ssb155480 * We enter here if only MD_macaddr is exclusively updated. 217519b65a69Ssb155480 * If MD_physname and/or MD_smode are also updated, then 217619b65a69Ssb155480 * as part of that, we would have implicitly processed 217719b65a69Ssb155480 * MD_macaddr update (above). 217819b65a69Ssb155480 */ 217934683adeSsg70180 cmn_err(CE_NOTE, "!vsw%d: changing mac address to 0x%lx", 218034683adeSsg70180 vswp->instance, macaddr); 218134683adeSsg70180 218219b65a69Ssb155480 READ_ENTER(&vswp->if_lockrw); 218319b65a69Ssb155480 if (vswp->if_state & VSW_IF_UP) { 2184da14cebeSEric Cheng /* reconfigure with new address */ 2185da14cebeSEric Cheng vsw_if_mac_reconfig(vswp, B_FALSE, 0, NULL, 0); 218634683adeSsg70180 21875f94e909Ssg70180 /* 218834683adeSsg70180 * Notify the MAC layer of the changed address. 218934683adeSsg70180 */ 219019b65a69Ssb155480 mac_unicst_update(vswp->if_mh, 219119b65a69Ssb155480 (uint8_t *)&vswp->if_addr); 219219b65a69Ssb155480 219319b65a69Ssb155480 } 219419b65a69Ssb155480 RW_EXIT(&vswp->if_lockrw); 219519b65a69Ssb155480 219634683adeSsg70180 } 219734683adeSsg70180 2198c1c61f44Ssb155480 if (updated & MD_vlans) { 2199c1c61f44Ssb155480 /* Remove existing vlan ids from the hash table. */ 2200c1c61f44Ssb155480 vsw_vlan_remove_ids(vswp, VSW_LOCALDEV); 2201c1c61f44Ssb155480 2202da14cebeSEric Cheng if (vswp->if_state & VSW_IF_UP) { 2203da14cebeSEric Cheng vsw_if_mac_reconfig(vswp, B_TRUE, pvid, vids, nvids); 2204da14cebeSEric Cheng } else { 2205c1c61f44Ssb155480 if (vswp->nvids != 0) { 2206da14cebeSEric Cheng kmem_free(vswp->vids, 2207da14cebeSEric Cheng sizeof (vsw_vlanid_t) * vswp->nvids); 2208c1c61f44Ssb155480 } 2209c1c61f44Ssb155480 vswp->vids = vids; 2210da14cebeSEric Cheng vswp->nvids = nvids; 2211da14cebeSEric Cheng vswp->pvid = pvid; 2212c1c61f44Ssb155480 } 2213c1c61f44Ssb155480 2214c1c61f44Ssb155480 /* add these new vlan ids into hash table */ 2215c1c61f44Ssb155480 vsw_vlan_add_ids(vswp, VSW_LOCALDEV); 2216c1c61f44Ssb155480 } else { 2217c1c61f44Ssb155480 if (nvids != 0) { 2218da14cebeSEric Cheng kmem_free(vids, sizeof (vsw_vlanid_t) * nvids); 2219c1c61f44Ssb155480 } 2220c1c61f44Ssb155480 } 2221c1c61f44Ssb155480 222234683adeSsg70180 return; 222334683adeSsg70180 222434683adeSsg70180 fail_reconf: 222534683adeSsg70180 cmn_err(CE_WARN, "!vsw%d: configuration unchanged", vswp->instance); 222634683adeSsg70180 return; 222734683adeSsg70180 222834683adeSsg70180 fail_update: 22291ef0bbb5Snarayan cmn_err(CE_WARN, "!vsw%d: re-configuration failed", 223034683adeSsg70180 vswp->instance); 223134683adeSsg70180 } 223234683adeSsg70180 223334683adeSsg70180 /* 2234c1c61f44Ssb155480 * Read the port's md properties. 22351ae08745Sheppo */ 2236c1c61f44Ssb155480 static int 2237c1c61f44Ssb155480 vsw_port_read_props(vsw_port_t *portp, vsw_t *vswp, 2238c1c61f44Ssb155480 md_t *mdp, mde_cookie_t *node) 22391ae08745Sheppo { 22401ae08745Sheppo uint64_t ldc_id; 22411ae08745Sheppo uint8_t *addrp; 22421ae08745Sheppo int i, addrsz; 22431ae08745Sheppo int num_nodes = 0, nchan = 0; 22441ae08745Sheppo int listsz = 0; 22451ae08745Sheppo mde_cookie_t *listp = NULL; 22461ae08745Sheppo struct ether_addr ea; 22471ae08745Sheppo uint64_t macaddr; 22481ae08745Sheppo uint64_t inst = 0; 2249678453a8Sspeer uint64_t val; 22501ae08745Sheppo 22511ae08745Sheppo if (md_get_prop_val(mdp, *node, id_propname, &inst)) { 22521ae08745Sheppo DWARN(vswp, "%s: prop(%s) not found", __func__, 22531ae08745Sheppo id_propname); 22541ae08745Sheppo return (1); 22551ae08745Sheppo } 22561ae08745Sheppo 22571ae08745Sheppo /* 22581ae08745Sheppo * Find the channel endpoint node(s) (which should be under this 22591ae08745Sheppo * port node) which contain the channel id(s). 22601ae08745Sheppo */ 22611ae08745Sheppo if ((num_nodes = md_node_count(mdp)) <= 0) { 22621ae08745Sheppo DERR(vswp, "%s: invalid number of nodes found (%d)", 22631ae08745Sheppo __func__, num_nodes); 22641ae08745Sheppo return (1); 22651ae08745Sheppo } 22661ae08745Sheppo 226734683adeSsg70180 D2(vswp, "%s: %d nodes found", __func__, num_nodes); 226834683adeSsg70180 22691ae08745Sheppo /* allocate enough space for node list */ 22701ae08745Sheppo listsz = num_nodes * sizeof (mde_cookie_t); 22711ae08745Sheppo listp = kmem_zalloc(listsz, KM_SLEEP); 22721ae08745Sheppo 2273205eeb1aSlm66018 nchan = md_scan_dag(mdp, *node, md_find_name(mdp, chan_propname), 22741ae08745Sheppo md_find_name(mdp, "fwd"), listp); 22751ae08745Sheppo 22761ae08745Sheppo if (nchan <= 0) { 22771ae08745Sheppo DWARN(vswp, "%s: no %s nodes found", __func__, chan_propname); 22781ae08745Sheppo kmem_free(listp, listsz); 22791ae08745Sheppo return (1); 22801ae08745Sheppo } 22811ae08745Sheppo 22821ae08745Sheppo D2(vswp, "%s: %d %s nodes found", __func__, nchan, chan_propname); 22831ae08745Sheppo 22841ae08745Sheppo /* use property from first node found */ 22851ae08745Sheppo if (md_get_prop_val(mdp, listp[0], id_propname, &ldc_id)) { 22861ae08745Sheppo DWARN(vswp, "%s: prop(%s) not found\n", __func__, 22871ae08745Sheppo id_propname); 22881ae08745Sheppo kmem_free(listp, listsz); 22891ae08745Sheppo return (1); 22901ae08745Sheppo } 22911ae08745Sheppo 22921ae08745Sheppo /* don't need list any more */ 22931ae08745Sheppo kmem_free(listp, listsz); 22941ae08745Sheppo 22951ae08745Sheppo D2(vswp, "%s: ldc_id 0x%llx", __func__, ldc_id); 22961ae08745Sheppo 22971ae08745Sheppo /* read mac-address property */ 22981ae08745Sheppo if (md_get_prop_data(mdp, *node, remaddr_propname, 22991ae08745Sheppo &addrp, &addrsz)) { 23001ae08745Sheppo DWARN(vswp, "%s: prop(%s) not found", 23011ae08745Sheppo __func__, remaddr_propname); 23021ae08745Sheppo return (1); 23031ae08745Sheppo } 23041ae08745Sheppo 23051ae08745Sheppo if (addrsz < ETHERADDRL) { 23061ae08745Sheppo DWARN(vswp, "%s: invalid address size", __func__); 23071ae08745Sheppo return (1); 23081ae08745Sheppo } 23091ae08745Sheppo 23101ae08745Sheppo macaddr = *((uint64_t *)addrp); 23111ae08745Sheppo D2(vswp, "%s: remote mac address 0x%llx", __func__, macaddr); 23121ae08745Sheppo 23131ae08745Sheppo for (i = ETHERADDRL - 1; i >= 0; i--) { 23141ae08745Sheppo ea.ether_addr_octet[i] = macaddr & 0xFF; 23151ae08745Sheppo macaddr >>= 8; 23161ae08745Sheppo } 23171ae08745Sheppo 2318c1c61f44Ssb155480 /* now update all properties into the port */ 2319c1c61f44Ssb155480 portp->p_vswp = vswp; 2320c1c61f44Ssb155480 portp->p_instance = inst; 2321da14cebeSEric Cheng portp->addr_set = B_FALSE; 2322c1c61f44Ssb155480 ether_copy(&ea, &portp->p_macaddr); 2323c1c61f44Ssb155480 if (nchan > VSW_PORT_MAX_LDCS) { 2324c1c61f44Ssb155480 D2(vswp, "%s: using first of %d ldc ids", 2325c1c61f44Ssb155480 __func__, nchan); 2326c1c61f44Ssb155480 nchan = VSW_PORT_MAX_LDCS; 2327c1c61f44Ssb155480 } 2328c1c61f44Ssb155480 portp->num_ldcs = nchan; 2329c1c61f44Ssb155480 portp->ldc_ids = 2330c1c61f44Ssb155480 kmem_zalloc(sizeof (uint64_t) * nchan, KM_SLEEP); 2331c1c61f44Ssb155480 bcopy(&ldc_id, (portp->ldc_ids), sizeof (uint64_t) * nchan); 2332c1c61f44Ssb155480 2333c1c61f44Ssb155480 /* read vlan id properties of this port node */ 2334c1c61f44Ssb155480 vsw_vlan_read_ids(portp, VSW_VNETPORT, mdp, *node, &portp->pvid, 2335c1c61f44Ssb155480 &portp->vids, &portp->nvids, NULL); 2336c1c61f44Ssb155480 2337678453a8Sspeer /* Check if hybrid property is present */ 2338678453a8Sspeer if (md_get_prop_val(mdp, *node, hybrid_propname, &val) == 0) { 2339678453a8Sspeer D1(vswp, "%s: prop(%s) found\n", __func__, hybrid_propname); 2340678453a8Sspeer portp->p_hio_enabled = B_TRUE; 2341678453a8Sspeer } else { 2342678453a8Sspeer portp->p_hio_enabled = B_FALSE; 2343678453a8Sspeer } 2344678453a8Sspeer /* 2345678453a8Sspeer * Port hio capability determined after version 2346678453a8Sspeer * negotiation, i.e., when we know the peer is HybridIO capable. 2347678453a8Sspeer */ 2348678453a8Sspeer portp->p_hio_capable = B_FALSE; 2349c1c61f44Ssb155480 return (0); 2350c1c61f44Ssb155480 } 2351c1c61f44Ssb155480 2352c1c61f44Ssb155480 /* 2353c1c61f44Ssb155480 * Add a new port to the system. 2354c1c61f44Ssb155480 * 2355c1c61f44Ssb155480 * Returns 0 on success, 1 on failure. 2356c1c61f44Ssb155480 */ 2357c1c61f44Ssb155480 int 2358c1c61f44Ssb155480 vsw_port_add(vsw_t *vswp, md_t *mdp, mde_cookie_t *node) 2359c1c61f44Ssb155480 { 2360c1c61f44Ssb155480 vsw_port_t *portp; 2361c1c61f44Ssb155480 int rv; 2362c1c61f44Ssb155480 2363c1c61f44Ssb155480 portp = kmem_zalloc(sizeof (vsw_port_t), KM_SLEEP); 2364c1c61f44Ssb155480 2365c1c61f44Ssb155480 rv = vsw_port_read_props(portp, vswp, mdp, node); 2366c1c61f44Ssb155480 if (rv != 0) { 2367c1c61f44Ssb155480 kmem_free(portp, sizeof (*portp)); 2368c1c61f44Ssb155480 return (1); 2369c1c61f44Ssb155480 } 2370c1c61f44Ssb155480 2371c1c61f44Ssb155480 rv = vsw_port_attach(portp); 2372c1c61f44Ssb155480 if (rv != 0) { 23731ae08745Sheppo DERR(vswp, "%s: failed to attach port", __func__); 23741ae08745Sheppo return (1); 23751ae08745Sheppo } 23761ae08745Sheppo 2377c1c61f44Ssb155480 return (0); 2378c1c61f44Ssb155480 } 23791ae08745Sheppo 2380c1c61f44Ssb155480 static int 2381c1c61f44Ssb155480 vsw_port_update(vsw_t *vswp, md_t *curr_mdp, mde_cookie_t curr_mdex, 2382c1c61f44Ssb155480 md_t *prev_mdp, mde_cookie_t prev_mdex) 2383c1c61f44Ssb155480 { 2384c1c61f44Ssb155480 uint64_t cport_num; 2385c1c61f44Ssb155480 uint64_t pport_num; 2386c1c61f44Ssb155480 vsw_port_list_t *plistp; 2387c1c61f44Ssb155480 vsw_port_t *portp; 2388c1c61f44Ssb155480 boolean_t updated_vlans = B_FALSE; 2389c1c61f44Ssb155480 uint16_t pvid; 2390da14cebeSEric Cheng vsw_vlanid_t *vids; 2391c1c61f44Ssb155480 uint16_t nvids; 2392678453a8Sspeer uint64_t val; 2393678453a8Sspeer boolean_t hio_enabled = B_FALSE; 2394c1c61f44Ssb155480 2395c1c61f44Ssb155480 /* 2396c1c61f44Ssb155480 * For now, we get port updates only if vlan ids changed. 2397c1c61f44Ssb155480 * We read the port num and do some sanity check. 2398c1c61f44Ssb155480 */ 2399c1c61f44Ssb155480 if (md_get_prop_val(curr_mdp, curr_mdex, id_propname, &cport_num)) { 2400c1c61f44Ssb155480 return (1); 2401c1c61f44Ssb155480 } 2402c1c61f44Ssb155480 2403c1c61f44Ssb155480 if (md_get_prop_val(prev_mdp, prev_mdex, id_propname, &pport_num)) { 2404c1c61f44Ssb155480 return (1); 2405c1c61f44Ssb155480 } 2406c1c61f44Ssb155480 if (cport_num != pport_num) 2407c1c61f44Ssb155480 return (1); 2408c1c61f44Ssb155480 2409c1c61f44Ssb155480 plistp = &(vswp->plist); 2410c1c61f44Ssb155480 2411c1c61f44Ssb155480 READ_ENTER(&plistp->lockrw); 2412c1c61f44Ssb155480 2413c1c61f44Ssb155480 portp = vsw_lookup_port(vswp, cport_num); 2414c1c61f44Ssb155480 if (portp == NULL) { 2415c1c61f44Ssb155480 RW_EXIT(&plistp->lockrw); 2416c1c61f44Ssb155480 return (1); 2417c1c61f44Ssb155480 } 2418c1c61f44Ssb155480 2419c1c61f44Ssb155480 /* Read the vlan ids */ 2420c1c61f44Ssb155480 vsw_vlan_read_ids(portp, VSW_VNETPORT, curr_mdp, curr_mdex, &pvid, 2421c1c61f44Ssb155480 &vids, &nvids, NULL); 2422c1c61f44Ssb155480 2423c1c61f44Ssb155480 /* Determine if there are any vlan id updates */ 2424c1c61f44Ssb155480 if ((pvid != portp->pvid) || /* pvid changed? */ 2425c1c61f44Ssb155480 (nvids != portp->nvids) || /* # of vids changed? */ 2426c1c61f44Ssb155480 ((nvids != 0) && (portp->nvids != 0) && /* vids changed? */ 2427da14cebeSEric Cheng !vsw_cmp_vids(vids, portp->vids, nvids))) { 2428c1c61f44Ssb155480 updated_vlans = B_TRUE; 2429c1c61f44Ssb155480 } 2430c1c61f44Ssb155480 2431678453a8Sspeer if (updated_vlans == B_TRUE) { 2432c1c61f44Ssb155480 2433c1c61f44Ssb155480 /* Remove existing vlan ids from the hash table. */ 2434c1c61f44Ssb155480 vsw_vlan_remove_ids(portp, VSW_VNETPORT); 2435c1c61f44Ssb155480 2436da14cebeSEric Cheng /* Reconfigure vlans with network device */ 2437da14cebeSEric Cheng vsw_mac_port_reconfig_vlans(portp, pvid, vids, nvids); 2438c1c61f44Ssb155480 2439c1c61f44Ssb155480 /* add these new vlan ids into hash table */ 2440c1c61f44Ssb155480 vsw_vlan_add_ids(portp, VSW_VNETPORT); 2441c1c61f44Ssb155480 2442c1c61f44Ssb155480 /* reset the port if it is vlan unaware (ver < 1.3) */ 2443c1c61f44Ssb155480 vsw_vlan_unaware_port_reset(portp); 2444678453a8Sspeer } 2445678453a8Sspeer 2446678453a8Sspeer /* Check if hybrid property is present */ 2447678453a8Sspeer if (md_get_prop_val(curr_mdp, curr_mdex, hybrid_propname, &val) == 0) { 2448678453a8Sspeer D1(vswp, "%s: prop(%s) found\n", __func__, hybrid_propname); 2449678453a8Sspeer hio_enabled = B_TRUE; 2450678453a8Sspeer } 2451678453a8Sspeer 2452678453a8Sspeer if (portp->p_hio_enabled != hio_enabled) { 2453678453a8Sspeer vsw_hio_port_update(portp, hio_enabled); 2454678453a8Sspeer } 2455c1c61f44Ssb155480 2456c1c61f44Ssb155480 RW_EXIT(&plistp->lockrw); 24571ae08745Sheppo 24581ae08745Sheppo return (0); 24591ae08745Sheppo } 24601ae08745Sheppo 24611ae08745Sheppo /* 246206db247cSraghuram * vsw_mac_rx -- A common function to send packets to the interface. 246306db247cSraghuram * By default this function check if the interface is UP or not, the 246406db247cSraghuram * rest of the behaviour depends on the flags as below: 24651ae08745Sheppo * 246606db247cSraghuram * VSW_MACRX_PROMISC -- Check if the promisc mode set or not. 246706db247cSraghuram * VSW_MACRX_COPYMSG -- Make a copy of the message(s). 246806db247cSraghuram * VSW_MACRX_FREEMSG -- Free if the messages cannot be sent up the stack. 24691ae08745Sheppo */ 24701ae08745Sheppo void 2471f0ca1d9aSsb155480 vsw_mac_rx(vsw_t *vswp, mac_resource_handle_t mrh, 2472f0ca1d9aSsb155480 mblk_t *mp, vsw_macrx_flags_t flags) 24731ae08745Sheppo { 2474c1c61f44Ssb155480 mblk_t *mpt; 2475c1c61f44Ssb155480 247606db247cSraghuram D1(vswp, "%s:enter\n", __func__); 24771ae08745Sheppo READ_ENTER(&vswp->if_lockrw); 247806db247cSraghuram /* Check if the interface is up */ 247906db247cSraghuram if (!(vswp->if_state & VSW_IF_UP)) { 24801ae08745Sheppo RW_EXIT(&vswp->if_lockrw); 248106db247cSraghuram /* Free messages only if FREEMSG flag specified */ 248206db247cSraghuram if (flags & VSW_MACRX_FREEMSG) { 248306db247cSraghuram freemsgchain(mp); 248406db247cSraghuram } 248506db247cSraghuram D1(vswp, "%s:exit\n", __func__); 248606db247cSraghuram return; 248706db247cSraghuram } 248806db247cSraghuram /* 248906db247cSraghuram * If PROMISC flag is passed, then check if 249006db247cSraghuram * the interface is in the PROMISC mode. 249106db247cSraghuram * If not, drop the messages. 249206db247cSraghuram */ 249306db247cSraghuram if (flags & VSW_MACRX_PROMISC) { 249406db247cSraghuram if (!(vswp->if_state & VSW_IF_PROMISC)) { 249506db247cSraghuram RW_EXIT(&vswp->if_lockrw); 249606db247cSraghuram /* Free messages only if FREEMSG flag specified */ 249706db247cSraghuram if (flags & VSW_MACRX_FREEMSG) { 249806db247cSraghuram freemsgchain(mp); 249906db247cSraghuram } 250006db247cSraghuram D1(vswp, "%s:exit\n", __func__); 250106db247cSraghuram return; 250206db247cSraghuram } 250306db247cSraghuram } 250406db247cSraghuram RW_EXIT(&vswp->if_lockrw); 250506db247cSraghuram /* 250606db247cSraghuram * If COPYMSG flag is passed, then make a copy 250706db247cSraghuram * of the message chain and send up the copy. 250806db247cSraghuram */ 250906db247cSraghuram if (flags & VSW_MACRX_COPYMSG) { 251006db247cSraghuram mp = copymsgchain(mp); 2511f0ca1d9aSsb155480 if (mp == NULL) { 251206db247cSraghuram D1(vswp, "%s:exit\n", __func__); 251306db247cSraghuram return; 251406db247cSraghuram } 251506db247cSraghuram } 251606db247cSraghuram 2517f0ca1d9aSsb155480 D2(vswp, "%s: sending up stack", __func__); 2518c1c61f44Ssb155480 2519c1c61f44Ssb155480 mpt = NULL; 2520c1c61f44Ssb155480 (void) vsw_vlan_frame_untag(vswp, VSW_LOCALDEV, &mp, &mpt); 2521c1c61f44Ssb155480 if (mp != NULL) { 2522ba2e4443Sseb mac_rx(vswp->if_mh, mrh, mp); 2523c1c61f44Ssb155480 } 252406db247cSraghuram D1(vswp, "%s:exit\n", __func__); 25251ae08745Sheppo } 25261ae08745Sheppo 252706db247cSraghuram /* copy mac address of vsw into soft state structure */ 25281ae08745Sheppo static void 252906db247cSraghuram vsw_save_lmacaddr(vsw_t *vswp, uint64_t macaddr) 25301ae08745Sheppo { 25311ae08745Sheppo int i; 25321ae08745Sheppo 253306db247cSraghuram WRITE_ENTER(&vswp->if_lockrw); 253406db247cSraghuram for (i = ETHERADDRL - 1; i >= 0; i--) { 253506db247cSraghuram vswp->if_addr.ether_addr_octet[i] = macaddr & 0xFF; 253606db247cSraghuram macaddr >>= 8; 25371ae08745Sheppo } 253806db247cSraghuram RW_EXIT(&vswp->if_lockrw); 25391ae08745Sheppo } 2540da14cebeSEric Cheng 2541da14cebeSEric Cheng /* Compare VLAN ids, array size expected to be same. */ 2542da14cebeSEric Cheng static boolean_t 2543da14cebeSEric Cheng vsw_cmp_vids(vsw_vlanid_t *vids1, vsw_vlanid_t *vids2, int nvids) 2544da14cebeSEric Cheng { 2545da14cebeSEric Cheng int i, j; 2546da14cebeSEric Cheng uint16_t vid; 2547da14cebeSEric Cheng 2548da14cebeSEric Cheng for (i = 0; i < nvids; i++) { 2549da14cebeSEric Cheng vid = vids1[i].vl_vid; 2550da14cebeSEric Cheng for (j = 0; j < nvids; j++) { 2551da14cebeSEric Cheng if (vid == vids2[i].vl_vid) 2552da14cebeSEric Cheng break; 2553da14cebeSEric Cheng } 2554da14cebeSEric Cheng if (j == nvids) { 2555da14cebeSEric Cheng return (B_FALSE); 2556da14cebeSEric Cheng } 2557da14cebeSEric Cheng } 2558da14cebeSEric Cheng return (B_TRUE); 2559da14cebeSEric Cheng } 2560