xref: /illumos-gate/usr/src/uts/sun4v/io/vnet.c (revision bbf21555)
11ae08745Sheppo /*
21ae08745Sheppo  * CDDL HEADER START
31ae08745Sheppo  *
41ae08745Sheppo  * The contents of this file are subject to the terms of the
51ae08745Sheppo  * Common Development and Distribution License (the "License").
61ae08745Sheppo  * You may not use this file except in compliance with the License.
71ae08745Sheppo  *
81ae08745Sheppo  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
91ae08745Sheppo  * or http://www.opensolaris.org/os/licensing.
101ae08745Sheppo  * See the License for the specific language governing permissions
111ae08745Sheppo  * and limitations under the License.
121ae08745Sheppo  *
131ae08745Sheppo  * When distributing Covered Code, include this CDDL HEADER in each
141ae08745Sheppo  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
151ae08745Sheppo  * If applicable, add the following below this CDDL HEADER, with the
161ae08745Sheppo  * fields enclosed by brackets "[]" replaced with your own identifying
171ae08745Sheppo  * information: Portions Copyright [yyyy] [name of copyright owner]
181ae08745Sheppo  *
191ae08745Sheppo  * CDDL HEADER END
201ae08745Sheppo  */
211ae08745Sheppo 
221ae08745Sheppo /*
230c4606f0SWENTAO YANG  * Copyright 2010 Sun Microsystems, Inc.  All rights reserved.
241ae08745Sheppo  * Use is subject to license terms.
2545948e49SRyan Zezeski  * Copyright 2018 Joyent, Inc.
261ae08745Sheppo  */
271ae08745Sheppo 
281ae08745Sheppo #include <sys/types.h>
291ae08745Sheppo #include <sys/errno.h>
301ae08745Sheppo #include <sys/param.h>
310dc2366fSVenugopal Iyer #include <sys/callb.h>
321ae08745Sheppo #include <sys/stream.h>
331ae08745Sheppo #include <sys/kmem.h>
341ae08745Sheppo #include <sys/conf.h>
351ae08745Sheppo #include <sys/devops.h>
361ae08745Sheppo #include <sys/ksynch.h>
371ae08745Sheppo #include <sys/stat.h>
381ae08745Sheppo #include <sys/modctl.h>
39c1c61f44Ssb155480 #include <sys/modhash.h>
401ae08745Sheppo #include <sys/debug.h>
411ae08745Sheppo #include <sys/ethernet.h>
421ae08745Sheppo #include <sys/dlpi.h>
431ae08745Sheppo #include <net/if.h>
44da14cebeSEric Cheng #include <sys/mac_provider.h>
4563f531d1SSriharsha Basavapatna #include <sys/mac_client.h>
4663f531d1SSriharsha Basavapatna #include <sys/mac_client_priv.h>
47ba2e4443Sseb #include <sys/mac_ether.h>
481ae08745Sheppo #include <sys/ddi.h>
491ae08745Sheppo #include <sys/sunddi.h>
501ae08745Sheppo #include <sys/strsun.h>
511ae08745Sheppo #include <sys/note.h>
52c1c61f44Ssb155480 #include <sys/atomic.h>
531ae08745Sheppo #include <sys/vnet.h>
54c1c61f44Ssb155480 #include <sys/vlan.h>
55678453a8Sspeer #include <sys/vnet_mailbox.h>
56678453a8Sspeer #include <sys/vnet_common.h>
57678453a8Sspeer #include <sys/dds.h>
58678453a8Sspeer #include <sys/strsubr.h>
59678453a8Sspeer #include <sys/taskq.h>
601ae08745Sheppo 
611ae08745Sheppo /*
621ae08745Sheppo  * Function prototypes.
631ae08745Sheppo  */
641ae08745Sheppo 
651ae08745Sheppo /* DDI entrypoints */
661ae08745Sheppo static int vnetdevinfo(dev_info_t *, ddi_info_cmd_t, void *, void **);
671ae08745Sheppo static int vnetattach(dev_info_t *, ddi_attach_cmd_t);
681ae08745Sheppo static int vnetdetach(dev_info_t *, ddi_detach_cmd_t);
691ae08745Sheppo 
701ae08745Sheppo /* MAC entrypoints  */
71ba2e4443Sseb static int vnet_m_stat(void *, uint_t, uint64_t *);
721ae08745Sheppo static int vnet_m_start(void *);
731ae08745Sheppo static void vnet_m_stop(void *);
741ae08745Sheppo static int vnet_m_promisc(void *, boolean_t);
751ae08745Sheppo static int vnet_m_multicst(void *, boolean_t, const uint8_t *);
761ae08745Sheppo static int vnet_m_unicst(void *, const uint8_t *);
771ae08745Sheppo mblk_t *vnet_m_tx(void *, mblk_t *);
781107ea93SSriharsha Basavapatna static void vnet_m_ioctl(void *arg, queue_t *q, mblk_t *mp);
791107ea93SSriharsha Basavapatna #ifdef	VNET_IOC_DEBUG
801107ea93SSriharsha Basavapatna static void vnet_force_link_state(vnet_t *vnetp, queue_t *q, mblk_t *mp);
811107ea93SSriharsha Basavapatna #endif
8263f531d1SSriharsha Basavapatna static boolean_t vnet_m_capab(void *arg, mac_capab_t cap, void *cap_data);
8363f531d1SSriharsha Basavapatna static void vnet_get_ring(void *arg, mac_ring_type_t rtype, const int g_index,
8463f531d1SSriharsha Basavapatna 	const int r_index, mac_ring_info_t *infop, mac_ring_handle_t r_handle);
8563f531d1SSriharsha Basavapatna static void vnet_get_group(void *arg, mac_ring_type_t type, const int index,
8663f531d1SSriharsha Basavapatna 	mac_group_info_t *infop, mac_group_handle_t handle);
8763f531d1SSriharsha Basavapatna static int vnet_rx_ring_start(mac_ring_driver_t rdriver, uint64_t mr_gen_num);
8863f531d1SSriharsha Basavapatna static void vnet_rx_ring_stop(mac_ring_driver_t rdriver);
890dc2366fSVenugopal Iyer static int vnet_rx_ring_stat(mac_ring_driver_t rdriver, uint_t stat,
900dc2366fSVenugopal Iyer 	uint64_t *val);
9163f531d1SSriharsha Basavapatna static int vnet_tx_ring_start(mac_ring_driver_t rdriver, uint64_t mr_gen_num);
9263f531d1SSriharsha Basavapatna static void vnet_tx_ring_stop(mac_ring_driver_t rdriver);
930dc2366fSVenugopal Iyer static int vnet_tx_ring_stat(mac_ring_driver_t rdriver, uint_t stat,
940dc2366fSVenugopal Iyer 	uint64_t *val);
9563f531d1SSriharsha Basavapatna static int vnet_ring_enable_intr(void *arg);
9663f531d1SSriharsha Basavapatna static int vnet_ring_disable_intr(void *arg);
9763f531d1SSriharsha Basavapatna static mblk_t *vnet_rx_poll(void *arg, int bytes_to_pickup);
9863f531d1SSriharsha Basavapatna static int vnet_addmac(void *arg, const uint8_t *mac_addr);
9963f531d1SSriharsha Basavapatna static int vnet_remmac(void *arg, const uint8_t *mac_addr);
1001ae08745Sheppo 
1011ae08745Sheppo /* vnet internal functions */
1026f09f0feSWENTAO YANG static int vnet_unattach(vnet_t *vnetp);
10363f531d1SSriharsha Basavapatna static void vnet_ring_grp_init(vnet_t *vnetp);
10463f531d1SSriharsha Basavapatna static void vnet_ring_grp_uninit(vnet_t *vnetp);
1051ae08745Sheppo static int vnet_mac_register(vnet_t *);
1061ae08745Sheppo static int vnet_read_mac_address(vnet_t *vnetp);
10763f531d1SSriharsha Basavapatna static int vnet_bind_vgenring(vnet_res_t *vresp);
10863f531d1SSriharsha Basavapatna static void vnet_unbind_vgenring(vnet_res_t *vresp);
10963f531d1SSriharsha Basavapatna static int vnet_bind_hwrings(vnet_t *vnetp);
11063f531d1SSriharsha Basavapatna static void vnet_unbind_hwrings(vnet_t *vnetp);
11163f531d1SSriharsha Basavapatna static int vnet_bind_rings(vnet_res_t *vresp);
11263f531d1SSriharsha Basavapatna static void vnet_unbind_rings(vnet_res_t *vresp);
11363f531d1SSriharsha Basavapatna static int vnet_hio_stat(void *, uint_t, uint64_t *);
11463f531d1SSriharsha Basavapatna static int vnet_hio_start(void *);
11563f531d1SSriharsha Basavapatna static void vnet_hio_stop(void *);
11663f531d1SSriharsha Basavapatna mblk_t *vnet_hio_tx(void *, mblk_t *);
1171ae08745Sheppo 
118c1c61f44Ssb155480 /* Forwarding database (FDB) routines */
119c1c61f44Ssb155480 static void vnet_fdb_create(vnet_t *vnetp);
120c1c61f44Ssb155480 static void vnet_fdb_destroy(vnet_t *vnetp);
121678453a8Sspeer static vnet_res_t *vnet_fdbe_find(vnet_t *vnetp, struct ether_addr *addrp);
122c1c61f44Ssb155480 static void vnet_fdbe_find_cb(mod_hash_key_t key, mod_hash_val_t val);
123678453a8Sspeer void vnet_fdbe_add(vnet_t *vnetp, vnet_res_t *vresp);
124678453a8Sspeer static void vnet_fdbe_del(vnet_t *vnetp, vnet_res_t *vresp);
125c1c61f44Ssb155480 
1268c242ab0SSriharsha Basavapatna static void vnet_rx_frames_untag(uint16_t pvid, mblk_t **mp);
127678453a8Sspeer static void vnet_rx(vio_net_handle_t vrh, mblk_t *mp);
128678453a8Sspeer static void vnet_tx_update(vio_net_handle_t vrh);
129678453a8Sspeer static void vnet_res_start_task(void *arg);
130678453a8Sspeer static void vnet_start_resources(vnet_t *vnetp);
131678453a8Sspeer static void vnet_stop_resources(vnet_t *vnetp);
132678453a8Sspeer static void vnet_dispatch_res_task(vnet_t *vnetp);
133678453a8Sspeer static void vnet_res_start_task(void *arg);
134678453a8Sspeer static void vnet_handle_res_err(vio_net_handle_t vrh, vio_net_err_val_t err);
13563f531d1SSriharsha Basavapatna static void vnet_add_resource(vnet_t *vnetp, vnet_res_t *vresp);
13663f531d1SSriharsha Basavapatna static vnet_res_t *vnet_rem_resource(vnet_t *vnetp, vnet_res_t *vresp);
1370dc2366fSVenugopal Iyer static void vnet_tx_notify_thread(void *);
1381107ea93SSriharsha Basavapatna 
1391107ea93SSriharsha Basavapatna /* Exported to vnet_gen */
1407b1f684aSSriharsha Basavapatna int vnet_mtu_update(vnet_t *vnetp, uint32_t mtu);
1411107ea93SSriharsha Basavapatna void vnet_link_update(vnet_t *vnetp, link_state_t link_state);
1426d6de4eeSWENTAO YANG void vnet_dds_cleanup_hio(vnet_t *vnetp);
143678453a8Sspeer 
1446ab6cb20SWENTAO YANG static kstat_t *vnet_hio_setup_kstats(char *ks_mod, char *ks_name,
1456ab6cb20SWENTAO YANG     vnet_res_t *vresp);
1466ab6cb20SWENTAO YANG static int vnet_hio_update_kstats(kstat_t *ksp, int rw);
1476ab6cb20SWENTAO YANG static void vnet_hio_get_stats(vnet_res_t *vresp, vnet_hio_stats_t *statsp);
1486ab6cb20SWENTAO YANG static void vnet_hio_destroy_kstats(kstat_t *ksp);
1496ab6cb20SWENTAO YANG 
150678453a8Sspeer /* Exported to to vnet_dds */
151678453a8Sspeer int vnet_send_dds_msg(vnet_t *vnetp, void *dmsg);
15263f531d1SSriharsha Basavapatna int vnet_hio_mac_init(vnet_t *vnetp, char *ifname);
15363f531d1SSriharsha Basavapatna void vnet_hio_mac_cleanup(vnet_t *vnetp);
154678453a8Sspeer 
155678453a8Sspeer /* Externs that are imported from vnet_gen */
156678453a8Sspeer extern int vgen_init(void *vnetp, uint64_t regprop, dev_info_t *vnetdip,
157678453a8Sspeer     const uint8_t *macaddr, void **vgenhdl);
15863f531d1SSriharsha Basavapatna extern int vgen_init_mdeg(void *arg);
1593ab636deSWENTAO YANG extern void vgen_uninit(void *arg);
160678453a8Sspeer extern int vgen_dds_tx(void *arg, void *dmsg);
16163f531d1SSriharsha Basavapatna extern int vgen_enable_intr(void *arg);
16263f531d1SSriharsha Basavapatna extern int vgen_disable_intr(void *arg);
1637bd3a2e2SSriharsha Basavapatna extern mblk_t *vgen_rx_poll(void *arg, int bytes_to_pickup);
164678453a8Sspeer 
165678453a8Sspeer /* Externs that are imported from vnet_dds */
166678453a8Sspeer extern void vdds_mod_init(void);
167678453a8Sspeer extern void vdds_mod_fini(void);
168678453a8Sspeer extern int vdds_init(vnet_t *vnetp);
169678453a8Sspeer extern void vdds_cleanup(vnet_t *vnetp);
170678453a8Sspeer extern void vdds_process_dds_msg(vnet_t *vnetp, vio_dds_msg_t *dmsg);
171d0288fccSRaghuram Kothakota extern void vdds_cleanup_hybrid_res(void *arg);
1726d6de4eeSWENTAO YANG extern void vdds_cleanup_hio(vnet_t *vnetp);
1731ae08745Sheppo 
1740dc2366fSVenugopal Iyer extern pri_t	minclsyspri;
17563f531d1SSriharsha Basavapatna 
1766ab6cb20SWENTAO YANG #define	DRV_NAME	"vnet"
177c1c61f44Ssb155480 #define	VNET_FDBE_REFHOLD(p)						\
178c1c61f44Ssb155480 {									\
179c1c61f44Ssb155480 	atomic_inc_32(&(p)->refcnt);					\
180c1c61f44Ssb155480 	ASSERT((p)->refcnt != 0);					\
181c1c61f44Ssb155480 }
182c1c61f44Ssb155480 
183c1c61f44Ssb155480 #define	VNET_FDBE_REFRELE(p)						\
184c1c61f44Ssb155480 {									\
185c1c61f44Ssb155480 	ASSERT((p)->refcnt != 0);					\
186c1c61f44Ssb155480 	atomic_dec_32(&(p)->refcnt);					\
187c1c61f44Ssb155480 }
188c1c61f44Ssb155480 
1891107ea93SSriharsha Basavapatna #ifdef	VNET_IOC_DEBUG
19063f531d1SSriharsha Basavapatna #define	VNET_M_CALLBACK_FLAGS	(MC_IOCTL | MC_GETCAPAB)
1911107ea93SSriharsha Basavapatna #else
19263f531d1SSriharsha Basavapatna #define	VNET_M_CALLBACK_FLAGS	(MC_GETCAPAB)
1931107ea93SSriharsha Basavapatna #endif
1941107ea93SSriharsha Basavapatna 
195ba2e4443Sseb static mac_callbacks_t vnet_m_callbacks = {
1961107ea93SSriharsha Basavapatna 	VNET_M_CALLBACK_FLAGS,
197ba2e4443Sseb 	vnet_m_stat,
198ba2e4443Sseb 	vnet_m_start,
199ba2e4443Sseb 	vnet_m_stop,
200ba2e4443Sseb 	vnet_m_promisc,
201ba2e4443Sseb 	vnet_m_multicst,
20263f531d1SSriharsha Basavapatna 	NULL,	/* m_unicst entry must be NULL while rx rings are exposed */
20363f531d1SSriharsha Basavapatna 	NULL,	/* m_tx entry must be NULL while tx rings are exposed */
2040dc2366fSVenugopal Iyer 	NULL,
2051107ea93SSriharsha Basavapatna 	vnet_m_ioctl,
20663f531d1SSriharsha Basavapatna 	vnet_m_capab,
20763f531d1SSriharsha Basavapatna 	NULL
20863f531d1SSriharsha Basavapatna };
20963f531d1SSriharsha Basavapatna 
21063f531d1SSriharsha Basavapatna static mac_callbacks_t vnet_hio_res_callbacks = {
21163f531d1SSriharsha Basavapatna 	0,
21263f531d1SSriharsha Basavapatna 	vnet_hio_stat,
21363f531d1SSriharsha Basavapatna 	vnet_hio_start,
21463f531d1SSriharsha Basavapatna 	vnet_hio_stop,
21563f531d1SSriharsha Basavapatna 	NULL,
21663f531d1SSriharsha Basavapatna 	NULL,
21763f531d1SSriharsha Basavapatna 	NULL,
21863f531d1SSriharsha Basavapatna 	vnet_hio_tx,
21963f531d1SSriharsha Basavapatna 	NULL,
220ba2e4443Sseb 	NULL,
221ba2e4443Sseb 	NULL
222ba2e4443Sseb };
223ba2e4443Sseb 
2241ae08745Sheppo /*
2251ae08745Sheppo  * Linked list of "vnet_t" structures - one per instance.
2261ae08745Sheppo  */
2271ae08745Sheppo static vnet_t	*vnet_headp = NULL;
2281ae08745Sheppo static krwlock_t vnet_rw;
2291ae08745Sheppo 
2301ae08745Sheppo /* Tunables */
2317bd3a2e2SSriharsha Basavapatna uint32_t vnet_num_descriptors = VNET_NUM_DESCRIPTORS;
232c1c61f44Ssb155480 
2337bd3a2e2SSriharsha Basavapatna /*
2347bd3a2e2SSriharsha Basavapatna  * Configure tx serialization in mac layer for the vnet device. This tunable
2357bd3a2e2SSriharsha Basavapatna  * should be enabled to improve performance only if HybridIO is configured for
2367bd3a2e2SSriharsha Basavapatna  * the vnet device.
2377bd3a2e2SSriharsha Basavapatna  */
2387bd3a2e2SSriharsha Basavapatna boolean_t vnet_mac_tx_serialize = B_FALSE;
2397bd3a2e2SSriharsha Basavapatna 
2400dc2366fSVenugopal Iyer /* Configure enqueing at Rx soft rings in mac layer for the vnet device */
2410dc2366fSVenugopal Iyer boolean_t vnet_mac_rx_queuing = B_TRUE;
24263f531d1SSriharsha Basavapatna 
2437b1f684aSSriharsha Basavapatna /*
2447b1f684aSSriharsha Basavapatna  * Set this to non-zero to enable additional internal receive buffer pools
2457b1f684aSSriharsha Basavapatna  * based on the MTU of the device for better performance at the cost of more
2467b1f684aSSriharsha Basavapatna  * memory consumption. This is turned off by default, to use allocb(9F) for
2477b1f684aSSriharsha Basavapatna  * receive buffer allocations of sizes > 2K.
2487b1f684aSSriharsha Basavapatna  */
2497b1f684aSSriharsha Basavapatna boolean_t vnet_jumbo_rxpools = B_FALSE;
2507b1f684aSSriharsha Basavapatna 
251c1c61f44Ssb155480 /* # of chains in fdb hash table */
252c1c61f44Ssb155480 uint32_t	vnet_fdb_nchains = VNET_NFDB_HASH;
253c1c61f44Ssb155480 
254c1c61f44Ssb155480 /* Internal tunables */
255c1c61f44Ssb155480 uint32_t	vnet_ethermtu = 1500;	/* mtu of the device */
256c1c61f44Ssb155480 
257c1c61f44Ssb155480 /*
258c1c61f44Ssb155480  * Default vlan id. This is only used internally when the "default-vlan-id"
259c1c61f44Ssb155480  * property is not present in the MD device node. Therefore, this should not be
260c1c61f44Ssb155480  * used as a tunable; if this value is changed, the corresponding variable
261c1c61f44Ssb155480  * should be updated to the same value in vsw and also other vnets connected to
262c1c61f44Ssb155480  * the same vsw.
263c1c61f44Ssb155480  */
264c1c61f44Ssb155480 uint16_t	vnet_default_vlan_id = 1;
265c1c61f44Ssb155480 
266c1c61f44Ssb155480 /* delay in usec to wait for all references on a fdb entry to be dropped */
267c1c61f44Ssb155480 uint32_t vnet_fdbe_refcnt_delay = 10;
2681ae08745Sheppo 
269678453a8Sspeer static struct ether_addr etherbroadcastaddr = {
270678453a8Sspeer 	0xff, 0xff, 0xff, 0xff, 0xff, 0xff
271678453a8Sspeer };
272678453a8Sspeer 
27363f531d1SSriharsha Basavapatna /* mac_open() retry delay in usec */
27463f531d1SSriharsha Basavapatna uint32_t vnet_mac_open_delay = 100;	/* 0.1 ms */
27563f531d1SSriharsha Basavapatna 
27663f531d1SSriharsha Basavapatna /* max # of mac_open() retries */
27763f531d1SSriharsha Basavapatna uint32_t vnet_mac_open_retries = 100;
278678453a8Sspeer 
2791ae08745Sheppo /*
2801ae08745Sheppo  * Property names
2811ae08745Sheppo  */
2821ae08745Sheppo static char macaddr_propname[] = "local-mac-address";
2831ae08745Sheppo 
2841ae08745Sheppo /*
285*bbf21555SRichard Lowe  * This is the string displayed by modinfo(8).
2861ae08745Sheppo  */
2877b1f684aSSriharsha Basavapatna static char vnet_ident[] = "vnet driver";
2881ae08745Sheppo extern struct mod_ops mod_driverops;
2891ae08745Sheppo static struct cb_ops cb_vnetops = {
2901ae08745Sheppo 	nulldev,		/* cb_open */
2911ae08745Sheppo 	nulldev,		/* cb_close */
2921ae08745Sheppo 	nodev,			/* cb_strategy */
2931ae08745Sheppo 	nodev,			/* cb_print */
2941ae08745Sheppo 	nodev,			/* cb_dump */
2951ae08745Sheppo 	nodev,			/* cb_read */
2961ae08745Sheppo 	nodev,			/* cb_write */
2971ae08745Sheppo 	nodev,			/* cb_ioctl */
2981ae08745Sheppo 	nodev,			/* cb_devmap */
2991ae08745Sheppo 	nodev,			/* cb_mmap */
3001ae08745Sheppo 	nodev,			/* cb_segmap */
3011ae08745Sheppo 	nochpoll,		/* cb_chpoll */
3021ae08745Sheppo 	ddi_prop_op,		/* cb_prop_op */
3031ae08745Sheppo 	NULL,			/* cb_stream */
3041ae08745Sheppo 	(int)(D_MP)		/* cb_flag */
3051ae08745Sheppo };
3061ae08745Sheppo 
3071ae08745Sheppo static struct dev_ops vnetops = {
3081ae08745Sheppo 	DEVO_REV,		/* devo_rev */
3091ae08745Sheppo 	0,			/* devo_refcnt */
3101ae08745Sheppo 	NULL,			/* devo_getinfo */
3111ae08745Sheppo 	nulldev,		/* devo_identify */
3121ae08745Sheppo 	nulldev,		/* devo_probe */
3131ae08745Sheppo 	vnetattach,		/* devo_attach */
3141ae08745Sheppo 	vnetdetach,		/* devo_detach */
3151ae08745Sheppo 	nodev,			/* devo_reset */
3161ae08745Sheppo 	&cb_vnetops,		/* devo_cb_ops */
31719397407SSherry Moore 	(struct bus_ops *)NULL,	/* devo_bus_ops */
31819397407SSherry Moore 	NULL,			/* devo_power */
31919397407SSherry Moore 	ddi_quiesce_not_supported,	/* devo_quiesce */
3201ae08745Sheppo };
3211ae08745Sheppo 
3221ae08745Sheppo static struct modldrv modldrv = {
3231ae08745Sheppo 	&mod_driverops,		/* Type of module.  This one is a driver */
3241ae08745Sheppo 	vnet_ident,		/* ID string */
3251ae08745Sheppo 	&vnetops		/* driver specific ops */
3261ae08745Sheppo };
3271ae08745Sheppo 
3281ae08745Sheppo static struct modlinkage modlinkage = {
3291ae08745Sheppo 	MODREV_1, (void *)&modldrv, NULL
3301ae08745Sheppo };
3311ae08745Sheppo 
332844e62a3Sraghuram #ifdef DEBUG
3331ae08745Sheppo 
3347bd3a2e2SSriharsha Basavapatna #define	DEBUG_PRINTF	debug_printf
3357bd3a2e2SSriharsha Basavapatna 
3361ae08745Sheppo /*
3371ae08745Sheppo  * Print debug messages - set to 0xf to enable all msgs
3381ae08745Sheppo  */
339844e62a3Sraghuram int vnet_dbglevel = 0x8;
3401ae08745Sheppo 
341844e62a3Sraghuram static void
debug_printf(const char * fname,void * arg,const char * fmt,...)342844e62a3Sraghuram debug_printf(const char *fname, void *arg, const char *fmt, ...)
3431ae08745Sheppo {
3441ae08745Sheppo 	char    buf[512];
3451ae08745Sheppo 	va_list ap;
3461ae08745Sheppo 	vnet_t *vnetp = (vnet_t *)arg;
347844e62a3Sraghuram 	char    *bufp = buf;
3481ae08745Sheppo 
349844e62a3Sraghuram 	if (vnetp == NULL) {
350844e62a3Sraghuram 		(void) sprintf(bufp, "%s: ", fname);
351844e62a3Sraghuram 		bufp += strlen(bufp);
352844e62a3Sraghuram 	} else {
353844e62a3Sraghuram 		(void) sprintf(bufp, "vnet%d:%s: ", vnetp->instance, fname);
354844e62a3Sraghuram 		bufp += strlen(bufp);
3551ae08745Sheppo 	}
356844e62a3Sraghuram 	va_start(ap, fmt);
357844e62a3Sraghuram 	(void) vsprintf(bufp, fmt, ap);
358844e62a3Sraghuram 	va_end(ap);
359844e62a3Sraghuram 	cmn_err(CE_CONT, "%s\n", buf);
360844e62a3Sraghuram }
3611ae08745Sheppo 
3621ae08745Sheppo #endif
3631ae08745Sheppo 
3641ae08745Sheppo /* _init(9E): initialize the loadable module */
3651ae08745Sheppo int
_init(void)3661ae08745Sheppo _init(void)
3671ae08745Sheppo {
3681ae08745Sheppo 	int status;
3691ae08745Sheppo 
370844e62a3Sraghuram 	DBG1(NULL, "enter\n");
3711ae08745Sheppo 
3721ae08745Sheppo 	mac_init_ops(&vnetops, "vnet");
3731ae08745Sheppo 	status = mod_install(&modlinkage);
3741ae08745Sheppo 	if (status != 0) {
3751ae08745Sheppo 		mac_fini_ops(&vnetops);
3761ae08745Sheppo 	}
377678453a8Sspeer 	vdds_mod_init();
378844e62a3Sraghuram 	DBG1(NULL, "exit(%d)\n", status);
3791ae08745Sheppo 	return (status);
3801ae08745Sheppo }
3811ae08745Sheppo 
3821ae08745Sheppo /* _fini(9E): prepare the module for unloading. */
3831ae08745Sheppo int
_fini(void)3841ae08745Sheppo _fini(void)
3851ae08745Sheppo {
3861ae08745Sheppo 	int		status;
3871ae08745Sheppo 
388844e62a3Sraghuram 	DBG1(NULL, "enter\n");
3891ae08745Sheppo 
3901ae08745Sheppo 	status = mod_remove(&modlinkage);
3911ae08745Sheppo 	if (status != 0)
3921ae08745Sheppo 		return (status);
3931ae08745Sheppo 	mac_fini_ops(&vnetops);
394678453a8Sspeer 	vdds_mod_fini();
3951ae08745Sheppo 
396844e62a3Sraghuram 	DBG1(NULL, "exit(%d)\n", status);
3971ae08745Sheppo 	return (status);
3981ae08745Sheppo }
3991ae08745Sheppo 
4001ae08745Sheppo /* _info(9E): return information about the loadable module */
4011ae08745Sheppo int
_info(struct modinfo * modinfop)4021ae08745Sheppo _info(struct modinfo *modinfop)
4031ae08745Sheppo {
4041ae08745Sheppo 	return (mod_info(&modlinkage, modinfop));
4051ae08745Sheppo }
4061ae08745Sheppo 
4071ae08745Sheppo /*
4081ae08745Sheppo  * attach(9E): attach a device to the system.
4091ae08745Sheppo  * called once for each instance of the device on the system.
4101ae08745Sheppo  */
4111ae08745Sheppo static int
vnetattach(dev_info_t * dip,ddi_attach_cmd_t cmd)4121ae08745Sheppo vnetattach(dev_info_t *dip, ddi_attach_cmd_t cmd)
4131ae08745Sheppo {
4141ae08745Sheppo 	vnet_t			*vnetp;
4151ae08745Sheppo 	int			status;
416678453a8Sspeer 	int			instance;
417678453a8Sspeer 	uint64_t		reg;
418678453a8Sspeer 	char			qname[TASKQ_NAMELEN];
4196f09f0feSWENTAO YANG 	vnet_attach_progress_t	attach_progress;
4201ae08745Sheppo 
4216f09f0feSWENTAO YANG 	attach_progress = AST_init;
4221ae08745Sheppo 
4231ae08745Sheppo 	switch (cmd) {
4241ae08745Sheppo 	case DDI_ATTACH:
4251ae08745Sheppo 		break;
4261ae08745Sheppo 	case DDI_RESUME:
4271ae08745Sheppo 	case DDI_PM_RESUME:
4281ae08745Sheppo 	default:
4291ae08745Sheppo 		goto vnet_attach_fail;
4301ae08745Sheppo 	}
4311ae08745Sheppo 
4321ae08745Sheppo 	instance = ddi_get_instance(dip);
433844e62a3Sraghuram 	DBG1(NULL, "instance(%d) enter\n", instance);
4341ae08745Sheppo 
4351ae08745Sheppo 	/* allocate vnet_t and mac_t structures */
4361ae08745Sheppo 	vnetp = kmem_zalloc(sizeof (vnet_t), KM_SLEEP);
437678453a8Sspeer 	vnetp->dip = dip;
438678453a8Sspeer 	vnetp->instance = instance;
439678453a8Sspeer 	rw_init(&vnetp->vrwlock, NULL, RW_DRIVER, NULL);
440678453a8Sspeer 	rw_init(&vnetp->vsw_fp_rw, NULL, RW_DRIVER, NULL);
4416f09f0feSWENTAO YANG 	attach_progress |= AST_vnet_alloc;
4421ae08745Sheppo 
44363f531d1SSriharsha Basavapatna 	vnet_ring_grp_init(vnetp);
44463f531d1SSriharsha Basavapatna 	attach_progress |= AST_ring_init;
44563f531d1SSriharsha Basavapatna 
446678453a8Sspeer 	status = vdds_init(vnetp);
447678453a8Sspeer 	if (status != 0) {
448678453a8Sspeer 		goto vnet_attach_fail;
449678453a8Sspeer 	}
4506f09f0feSWENTAO YANG 	attach_progress |= AST_vdds_init;
451678453a8Sspeer 
4521ae08745Sheppo 	/* setup links to vnet_t from both devinfo and mac_t */
4531ae08745Sheppo 	ddi_set_driver_private(dip, (caddr_t)vnetp);
4541ae08745Sheppo 
4551ae08745Sheppo 	/* read the mac address */
4561ae08745Sheppo 	status = vnet_read_mac_address(vnetp);
4571ae08745Sheppo 	if (status != DDI_SUCCESS) {
4581ae08745Sheppo 		goto vnet_attach_fail;
4591ae08745Sheppo 	}
4606f09f0feSWENTAO YANG 	attach_progress |= AST_read_macaddr;
4611ae08745Sheppo 
462678453a8Sspeer 	reg = ddi_prop_get_int(DDI_DEV_T_ANY, dip,
463678453a8Sspeer 	    DDI_PROP_DONTPASS, "reg", -1);
464678453a8Sspeer 	if (reg == -1) {
4651ae08745Sheppo 		goto vnet_attach_fail;
4661ae08745Sheppo 	}
467678453a8Sspeer 	vnetp->reg = reg;
4681ae08745Sheppo 
469c1c61f44Ssb155480 	vnet_fdb_create(vnetp);
4706f09f0feSWENTAO YANG 	attach_progress |= AST_fdbh_alloc;
4711ae08745Sheppo 
4727bd3a2e2SSriharsha Basavapatna 	(void) snprintf(qname, TASKQ_NAMELEN, "vres_taskq%d", instance);
473678453a8Sspeer 	if ((vnetp->taskqp = ddi_taskq_create(dip, qname, 1,
474678453a8Sspeer 	    TASKQ_DEFAULTPRI, 0)) == NULL) {
475678453a8Sspeer 		cmn_err(CE_WARN, "!vnet%d: Unable to create task queue",
476678453a8Sspeer 		    instance);
4771ae08745Sheppo 		goto vnet_attach_fail;
4781ae08745Sheppo 	}
4796f09f0feSWENTAO YANG 	attach_progress |= AST_taskq_create;
4801ae08745Sheppo 
4811ae08745Sheppo 	/* add to the list of vnet devices */
4821ae08745Sheppo 	WRITE_ENTER(&vnet_rw);
4831ae08745Sheppo 	vnetp->nextp = vnet_headp;
4841ae08745Sheppo 	vnet_headp = vnetp;
4851ae08745Sheppo 	RW_EXIT(&vnet_rw);
4861ae08745Sheppo 
4876f09f0feSWENTAO YANG 	attach_progress |= AST_vnet_list;
488678453a8Sspeer 
489678453a8Sspeer 	/*
49063f531d1SSriharsha Basavapatna 	 * Initialize the generic vnet plugin which provides communication via
49163f531d1SSriharsha Basavapatna 	 * sun4v LDC (logical domain channel) based resources. This involves 2
49263f531d1SSriharsha Basavapatna 	 * steps; first, vgen_init() is invoked to read the various properties
49363f531d1SSriharsha Basavapatna 	 * of the vnet device from its MD node (including its mtu which is
49463f531d1SSriharsha Basavapatna 	 * needed to mac_register()) and obtain a handle to the vgen layer.
49563f531d1SSriharsha Basavapatna 	 * After mac_register() is done and we have a mac handle, we then
49663f531d1SSriharsha Basavapatna 	 * invoke vgen_init_mdeg() which registers with the the MD event
49763f531d1SSriharsha Basavapatna 	 * generator (mdeg) framework to allow LDC resource notifications.
49863f531d1SSriharsha Basavapatna 	 * Note: this sequence also allows us to report the correct default #
49963f531d1SSriharsha Basavapatna 	 * of pseudo rings (2TX and 3RX) in vnet_m_capab() which gets invoked
50063f531d1SSriharsha Basavapatna 	 * in the context of mac_register(); and avoids conflicting with
50163f531d1SSriharsha Basavapatna 	 * dynamic pseudo rx rings which get added/removed as a result of mdeg
50263f531d1SSriharsha Basavapatna 	 * events in vgen.
503678453a8Sspeer 	 */
504678453a8Sspeer 	status = vgen_init(vnetp, reg, vnetp->dip,
505678453a8Sspeer 	    (uint8_t *)vnetp->curr_macaddr, &vnetp->vgenhdl);
506678453a8Sspeer 	if (status != DDI_SUCCESS) {
507678453a8Sspeer 		DERR(vnetp, "vgen_init() failed\n");
508678453a8Sspeer 		goto vnet_attach_fail;
509678453a8Sspeer 	}
5106f09f0feSWENTAO YANG 	attach_progress |= AST_vgen_init;
511678453a8Sspeer 
512678453a8Sspeer 	status = vnet_mac_register(vnetp);
513678453a8Sspeer 	if (status != DDI_SUCCESS) {
514678453a8Sspeer 		goto vnet_attach_fail;
515678453a8Sspeer 	}
5161107ea93SSriharsha Basavapatna 	vnetp->link_state = LINK_STATE_UNKNOWN;
5176f09f0feSWENTAO YANG 	attach_progress |= AST_macreg;
5186f09f0feSWENTAO YANG 
51963f531d1SSriharsha Basavapatna 	status = vgen_init_mdeg(vnetp->vgenhdl);
52063f531d1SSriharsha Basavapatna 	if (status != DDI_SUCCESS) {
52163f531d1SSriharsha Basavapatna 		goto vnet_attach_fail;
52263f531d1SSriharsha Basavapatna 	}
52363f531d1SSriharsha Basavapatna 	attach_progress |= AST_init_mdeg;
52463f531d1SSriharsha Basavapatna 
5256f09f0feSWENTAO YANG 	vnetp->attach_progress = attach_progress;
5266f09f0feSWENTAO YANG 
527844e62a3Sraghuram 	DBG1(NULL, "instance(%d) exit\n", instance);
5281ae08745Sheppo 	return (DDI_SUCCESS);
5291ae08745Sheppo 
5301ae08745Sheppo vnet_attach_fail:
5316f09f0feSWENTAO YANG 	vnetp->attach_progress = attach_progress;
5323ab636deSWENTAO YANG 	status = vnet_unattach(vnetp);
5333ab636deSWENTAO YANG 	ASSERT(status == 0);
5341ae08745Sheppo 	return (DDI_FAILURE);
5351ae08745Sheppo }
5361ae08745Sheppo 
5371ae08745Sheppo /*
5381ae08745Sheppo  * detach(9E): detach a device from the system.
5391ae08745Sheppo  */
5401ae08745Sheppo static int
vnetdetach(dev_info_t * dip,ddi_detach_cmd_t cmd)5411ae08745Sheppo vnetdetach(dev_info_t *dip, ddi_detach_cmd_t cmd)
5421ae08745Sheppo {
5431ae08745Sheppo 	vnet_t		*vnetp;
5441ae08745Sheppo 	int		instance;
5451ae08745Sheppo 
5461ae08745Sheppo 	instance = ddi_get_instance(dip);
547844e62a3Sraghuram 	DBG1(NULL, "instance(%d) enter\n", instance);
5481ae08745Sheppo 
5491ae08745Sheppo 	vnetp = ddi_get_driver_private(dip);
5501ae08745Sheppo 	if (vnetp == NULL) {
5511ae08745Sheppo 		goto vnet_detach_fail;
5521ae08745Sheppo 	}
5531ae08745Sheppo 
5541ae08745Sheppo 	switch (cmd) {
5551ae08745Sheppo 	case DDI_DETACH:
5561ae08745Sheppo 		break;
5571ae08745Sheppo 	case DDI_SUSPEND:
5581ae08745Sheppo 	case DDI_PM_SUSPEND:
5591ae08745Sheppo 	default:
5601ae08745Sheppo 		goto vnet_detach_fail;
5611ae08745Sheppo 	}
5621ae08745Sheppo 
5636f09f0feSWENTAO YANG 	if (vnet_unattach(vnetp) != 0) {
564d10e4ef2Snarayan 		goto vnet_detach_fail;
565d10e4ef2Snarayan 	}
566d10e4ef2Snarayan 
5676f09f0feSWENTAO YANG 	return (DDI_SUCCESS);
5681ae08745Sheppo 
5696f09f0feSWENTAO YANG vnet_detach_fail:
5706f09f0feSWENTAO YANG 	return (DDI_FAILURE);
5716f09f0feSWENTAO YANG }
5726f09f0feSWENTAO YANG 
5736f09f0feSWENTAO YANG /*
5746f09f0feSWENTAO YANG  * Common routine to handle vnetattach() failure and vnetdetach(). Note that
5756f09f0feSWENTAO YANG  * the only reason this function could fail is if mac_unregister() fails.
5766f09f0feSWENTAO YANG  * Otherwise, this function must ensure that all resources are freed and return
5776f09f0feSWENTAO YANG  * success.
5786f09f0feSWENTAO YANG  */
5796f09f0feSWENTAO YANG static int
vnet_unattach(vnet_t * vnetp)5806f09f0feSWENTAO YANG vnet_unattach(vnet_t *vnetp)
5816f09f0feSWENTAO YANG {
5826f09f0feSWENTAO YANG 	vnet_attach_progress_t	attach_progress;
5836f09f0feSWENTAO YANG 
5846f09f0feSWENTAO YANG 	attach_progress = vnetp->attach_progress;
5856f09f0feSWENTAO YANG 
5866f09f0feSWENTAO YANG 	/*
58763f531d1SSriharsha Basavapatna 	 * Disable the mac device in the gldv3 subsystem. This can fail, in
58863f531d1SSriharsha Basavapatna 	 * particular if there are still any open references to this mac
58963f531d1SSriharsha Basavapatna 	 * device; in which case we just return failure without continuing to
59063f531d1SSriharsha Basavapatna 	 * detach further.
59163f531d1SSriharsha Basavapatna 	 * If it succeeds, we then invoke vgen_uninit() which should unregister
59263f531d1SSriharsha Basavapatna 	 * any pseudo rings registered with the mac layer. Note we keep the
59363f531d1SSriharsha Basavapatna 	 * AST_macreg flag on, so we can unregister with the mac layer at
59463f531d1SSriharsha Basavapatna 	 * the end of this routine.
5956f09f0feSWENTAO YANG 	 */
5966f09f0feSWENTAO YANG 	if (attach_progress & AST_macreg) {
59763f531d1SSriharsha Basavapatna 		if (mac_disable(vnetp->mh) != 0) {
5986f09f0feSWENTAO YANG 			return (1);
5996f09f0feSWENTAO YANG 		}
6006f09f0feSWENTAO YANG 	}
6016f09f0feSWENTAO YANG 
6026f09f0feSWENTAO YANG 	/*
60363f531d1SSriharsha Basavapatna 	 * Now that we have disabled the device, we must finish all other steps
60463f531d1SSriharsha Basavapatna 	 * and successfully return from this function; otherwise we will end up
60563f531d1SSriharsha Basavapatna 	 * leaving the device in a broken/unusable state.
6066f09f0feSWENTAO YANG 	 *
6076f09f0feSWENTAO YANG 	 * First, release any hybrid resources assigned to this vnet device.
6086f09f0feSWENTAO YANG 	 */
6096f09f0feSWENTAO YANG 	if (attach_progress & AST_vdds_init) {
6106f09f0feSWENTAO YANG 		vdds_cleanup(vnetp);
6116f09f0feSWENTAO YANG 		attach_progress &= ~AST_vdds_init;
6126f09f0feSWENTAO YANG 	}
6136f09f0feSWENTAO YANG 
6146f09f0feSWENTAO YANG 	/*
6156f09f0feSWENTAO YANG 	 * Uninit vgen. This stops further mdeg callbacks to this vnet
6166f09f0feSWENTAO YANG 	 * device and/or its ports; and detaches any existing ports.
6176f09f0feSWENTAO YANG 	 */
61863f531d1SSriharsha Basavapatna 	if (attach_progress & (AST_vgen_init|AST_init_mdeg)) {
6196f09f0feSWENTAO YANG 		vgen_uninit(vnetp->vgenhdl);
6206f09f0feSWENTAO YANG 		attach_progress &= ~AST_vgen_init;
62163f531d1SSriharsha Basavapatna 		attach_progress &= ~AST_init_mdeg;
6226f09f0feSWENTAO YANG 	}
6236f09f0feSWENTAO YANG 
6246f09f0feSWENTAO YANG 	/* Destroy the taskq. */
6256f09f0feSWENTAO YANG 	if (attach_progress & AST_taskq_create) {
6266f09f0feSWENTAO YANG 		ddi_taskq_destroy(vnetp->taskqp);
6276f09f0feSWENTAO YANG 		attach_progress &= ~AST_taskq_create;
6286f09f0feSWENTAO YANG 	}
6296f09f0feSWENTAO YANG 
6306f09f0feSWENTAO YANG 	/* Destroy fdb. */
6316f09f0feSWENTAO YANG 	if (attach_progress & AST_fdbh_alloc) {
6326f09f0feSWENTAO YANG 		vnet_fdb_destroy(vnetp);
6336f09f0feSWENTAO YANG 		attach_progress &= ~AST_fdbh_alloc;
6346f09f0feSWENTAO YANG 	}
6356f09f0feSWENTAO YANG 
6366f09f0feSWENTAO YANG 	/* Remove from the device list */
6376f09f0feSWENTAO YANG 	if (attach_progress & AST_vnet_list) {
6386f09f0feSWENTAO YANG 		vnet_t		**vnetpp;
6391ae08745Sheppo 		/* unlink from instance(vnet_t) list */
6401ae08745Sheppo 		WRITE_ENTER(&vnet_rw);
6416f09f0feSWENTAO YANG 		for (vnetpp = &vnet_headp; *vnetpp;
6426f09f0feSWENTAO YANG 		    vnetpp = &(*vnetpp)->nextp) {
6431ae08745Sheppo 			if (*vnetpp == vnetp) {
6441ae08745Sheppo 				*vnetpp = vnetp->nextp;
6451ae08745Sheppo 				break;
6461ae08745Sheppo 			}
6471ae08745Sheppo 		}
6481ae08745Sheppo 		RW_EXIT(&vnet_rw);
6496f09f0feSWENTAO YANG 		attach_progress &= ~AST_vnet_list;
6506f09f0feSWENTAO YANG 	}
6511ae08745Sheppo 
65263f531d1SSriharsha Basavapatna 	if (attach_progress & AST_ring_init) {
65363f531d1SSriharsha Basavapatna 		vnet_ring_grp_uninit(vnetp);
65463f531d1SSriharsha Basavapatna 		attach_progress &= ~AST_ring_init;
65563f531d1SSriharsha Basavapatna 	}
65663f531d1SSriharsha Basavapatna 
65763f531d1SSriharsha Basavapatna 	if (attach_progress & AST_macreg) {
65863f531d1SSriharsha Basavapatna 		VERIFY(mac_unregister(vnetp->mh) == 0);
65963f531d1SSriharsha Basavapatna 		vnetp->mh = NULL;
66063f531d1SSriharsha Basavapatna 		attach_progress &= ~AST_macreg;
66163f531d1SSriharsha Basavapatna 	}
66263f531d1SSriharsha Basavapatna 
6636f09f0feSWENTAO YANG 	if (attach_progress & AST_vnet_alloc) {
664678453a8Sspeer 		rw_destroy(&vnetp->vrwlock);
665678453a8Sspeer 		rw_destroy(&vnetp->vsw_fp_rw);
6666f09f0feSWENTAO YANG 		attach_progress &= ~AST_vnet_list;
6671ae08745Sheppo 		KMEM_FREE(vnetp);
6686f09f0feSWENTAO YANG 	}
6691ae08745Sheppo 
6706f09f0feSWENTAO YANG 	return (0);
6711ae08745Sheppo }
6721ae08745Sheppo 
6731ae08745Sheppo /* enable the device for transmit/receive */
6741ae08745Sheppo static int
vnet_m_start(void * arg)6751ae08745Sheppo vnet_m_start(void *arg)
6761ae08745Sheppo {
6771ae08745Sheppo 	vnet_t		*vnetp = arg;
6781ae08745Sheppo 
679844e62a3Sraghuram 	DBG1(vnetp, "enter\n");
6801ae08745Sheppo 
681678453a8Sspeer 	WRITE_ENTER(&vnetp->vrwlock);
682678453a8Sspeer 	vnetp->flags |= VNET_STARTED;
683678453a8Sspeer 	vnet_start_resources(vnetp);
684678453a8Sspeer 	RW_EXIT(&vnetp->vrwlock);
6851ae08745Sheppo 
686844e62a3Sraghuram 	DBG1(vnetp, "exit\n");
6871ae08745Sheppo 	return (VNET_SUCCESS);
6881ae08745Sheppo 
6891ae08745Sheppo }
6901ae08745Sheppo 
6911ae08745Sheppo /* stop transmit/receive for the device */
6921ae08745Sheppo static void
vnet_m_stop(void * arg)6931ae08745Sheppo vnet_m_stop(void *arg)
6941ae08745Sheppo {
6951ae08745Sheppo 	vnet_t		*vnetp = arg;
6961ae08745Sheppo 
697844e62a3Sraghuram 	DBG1(vnetp, "enter\n");
6981ae08745Sheppo 
699678453a8Sspeer 	WRITE_ENTER(&vnetp->vrwlock);
700678453a8Sspeer 	if (vnetp->flags & VNET_STARTED) {
7015460ddbdSSriharsha Basavapatna 		/*
7025460ddbdSSriharsha Basavapatna 		 * Set the flags appropriately; this should prevent starting of
7035460ddbdSSriharsha Basavapatna 		 * any new resources that are added(see vnet_res_start_task()),
7045460ddbdSSriharsha Basavapatna 		 * while we release the vrwlock in vnet_stop_resources() before
7055460ddbdSSriharsha Basavapatna 		 * stopping each resource.
7065460ddbdSSriharsha Basavapatna 		 */
707678453a8Sspeer 		vnetp->flags &= ~VNET_STARTED;
7085460ddbdSSriharsha Basavapatna 		vnetp->flags |= VNET_STOPPING;
7095460ddbdSSriharsha Basavapatna 		vnet_stop_resources(vnetp);
7105460ddbdSSriharsha Basavapatna 		vnetp->flags &= ~VNET_STOPPING;
7111ae08745Sheppo 	}
712678453a8Sspeer 	RW_EXIT(&vnetp->vrwlock);
7131ae08745Sheppo 
714844e62a3Sraghuram 	DBG1(vnetp, "exit\n");
7151ae08745Sheppo }
7161ae08745Sheppo 
7171ae08745Sheppo /* set the unicast mac address of the device */
7181ae08745Sheppo static int
vnet_m_unicst(void * arg,const uint8_t * macaddr)7191ae08745Sheppo vnet_m_unicst(void *arg, const uint8_t *macaddr)
7201ae08745Sheppo {
7211ae08745Sheppo 	_NOTE(ARGUNUSED(macaddr))
7221ae08745Sheppo 
7231ae08745Sheppo 	vnet_t *vnetp = arg;
7241ae08745Sheppo 
725844e62a3Sraghuram 	DBG1(vnetp, "enter\n");
7261ae08745Sheppo 	/*
7273af08d82Slm66018 	 * NOTE: setting mac address dynamically is not supported.
7281ae08745Sheppo 	 */
729844e62a3Sraghuram 	DBG1(vnetp, "exit\n");
7301ae08745Sheppo 
7318e6a2a04Slm66018 	return (VNET_FAILURE);
7321ae08745Sheppo }
7331ae08745Sheppo 
7341ae08745Sheppo /* enable/disable a multicast address */
7351ae08745Sheppo static int
vnet_m_multicst(void * arg,boolean_t add,const uint8_t * mca)7361ae08745Sheppo vnet_m_multicst(void *arg, boolean_t add, const uint8_t *mca)
7371ae08745Sheppo {
7381ae08745Sheppo 	_NOTE(ARGUNUSED(add, mca))
7391ae08745Sheppo 
7401ae08745Sheppo 	vnet_t		*vnetp = arg;
741678453a8Sspeer 	vnet_res_t	*vresp;
742678453a8Sspeer 	mac_register_t	*macp;
743ba2e4443Sseb 	mac_callbacks_t	*cbp;
7441ae08745Sheppo 	int		rv = VNET_SUCCESS;
7451ae08745Sheppo 
746844e62a3Sraghuram 	DBG1(vnetp, "enter\n");
747678453a8Sspeer 
7480c4606f0SWENTAO YANG 	READ_ENTER(&vnetp->vsw_fp_rw);
7490c4606f0SWENTAO YANG 	if (vnetp->vsw_fp == NULL) {
7500c4606f0SWENTAO YANG 		RW_EXIT(&vnetp->vsw_fp_rw);
7510c4606f0SWENTAO YANG 		return (EAGAIN);
7520c4606f0SWENTAO YANG 	}
7530c4606f0SWENTAO YANG 	VNET_FDBE_REFHOLD(vnetp->vsw_fp);
7540c4606f0SWENTAO YANG 	RW_EXIT(&vnetp->vsw_fp_rw);
7550c4606f0SWENTAO YANG 
7560c4606f0SWENTAO YANG 	vresp = vnetp->vsw_fp;
757678453a8Sspeer 	macp = &vresp->macreg;
758678453a8Sspeer 	cbp = macp->m_callbacks;
759678453a8Sspeer 	rv = cbp->mc_multicst(macp->m_driver, add, mca);
7600c4606f0SWENTAO YANG 
7610c4606f0SWENTAO YANG 	VNET_FDBE_REFRELE(vnetp->vsw_fp);
762678453a8Sspeer 
763844e62a3Sraghuram 	DBG1(vnetp, "exit(%d)\n", rv);
7641ae08745Sheppo 	return (rv);
7651ae08745Sheppo }
7661ae08745Sheppo 
7671ae08745Sheppo /* set or clear promiscuous mode on the device */
7681ae08745Sheppo static int
vnet_m_promisc(void * arg,boolean_t on)7691ae08745Sheppo vnet_m_promisc(void *arg, boolean_t on)
7701ae08745Sheppo {
7711ae08745Sheppo 	_NOTE(ARGUNUSED(on))
7721ae08745Sheppo 
7731ae08745Sheppo 	vnet_t *vnetp = arg;
774844e62a3Sraghuram 	DBG1(vnetp, "enter\n");
7751ae08745Sheppo 	/*
7763af08d82Slm66018 	 * NOTE: setting promiscuous mode is not supported, just return success.
7771ae08745Sheppo 	 */
778844e62a3Sraghuram 	DBG1(vnetp, "exit\n");
7791ae08745Sheppo 	return (VNET_SUCCESS);
7801ae08745Sheppo }
7811ae08745Sheppo 
7821ae08745Sheppo /*
7831ae08745Sheppo  * Transmit a chain of packets. This function provides switching functionality
7841ae08745Sheppo  * based on the destination mac address to reach other guests (within ldoms) or
7851ae08745Sheppo  * external hosts.
7861ae08745Sheppo  */
7871ae08745Sheppo mblk_t *
vnet_tx_ring_send(void * arg,mblk_t * mp)78863f531d1SSriharsha Basavapatna vnet_tx_ring_send(void *arg, mblk_t *mp)
7891ae08745Sheppo {
79063f531d1SSriharsha Basavapatna 	vnet_pseudo_tx_ring_t	*tx_ringp;
7910dc2366fSVenugopal Iyer 	vnet_tx_ring_stats_t	*statsp;
7921ae08745Sheppo 	vnet_t			*vnetp;
793678453a8Sspeer 	vnet_res_t		*vresp;
7941ae08745Sheppo 	mblk_t			*next;
7951ae08745Sheppo 	mblk_t			*resid_mp;
796678453a8Sspeer 	mac_register_t		*macp;
797c1c61f44Ssb155480 	struct ether_header	*ehp;
798678453a8Sspeer 	boolean_t		is_unicast;
7998c242ab0SSriharsha Basavapatna 	boolean_t		is_pvid;	/* non-default pvid ? */
8008c242ab0SSriharsha Basavapatna 	boolean_t		hres;		/* Hybrid resource ? */
80163f531d1SSriharsha Basavapatna 	void			*tx_arg;
8020dc2366fSVenugopal Iyer 	size_t			size;
8031ae08745Sheppo 
80463f531d1SSriharsha Basavapatna 	tx_ringp = (vnet_pseudo_tx_ring_t *)arg;
8050dc2366fSVenugopal Iyer 	statsp = &tx_ringp->tx_ring_stats;
80663f531d1SSriharsha Basavapatna 	vnetp = (vnet_t *)tx_ringp->vnetp;
807844e62a3Sraghuram 	DBG1(vnetp, "enter\n");
8081ae08745Sheppo 	ASSERT(mp != NULL);
8091ae08745Sheppo 
8108c242ab0SSriharsha Basavapatna 	is_pvid = (vnetp->pvid != vnetp->default_vlan_id) ? B_TRUE : B_FALSE;
8118c242ab0SSriharsha Basavapatna 
8121ae08745Sheppo 	while (mp != NULL) {
813c1c61f44Ssb155480 
8141ae08745Sheppo 		next = mp->b_next;
8151ae08745Sheppo 		mp->b_next = NULL;
8161ae08745Sheppo 
8170dc2366fSVenugopal Iyer 		/* update stats */
8180dc2366fSVenugopal Iyer 		size = msgsize(mp);
8190dc2366fSVenugopal Iyer 
8201ae08745Sheppo 		/*
821c1c61f44Ssb155480 		 * Find fdb entry for the destination
822c1c61f44Ssb155480 		 * and hold a reference to it.
8231ae08745Sheppo 		 */
824c1c61f44Ssb155480 		ehp = (struct ether_header *)mp->b_rptr;
825678453a8Sspeer 		vresp = vnet_fdbe_find(vnetp, &ehp->ether_dhost);
826678453a8Sspeer 		if (vresp != NULL) {
827c1c61f44Ssb155480 
828c1c61f44Ssb155480 			/*
829c1c61f44Ssb155480 			 * Destination found in FDB.
830c1c61f44Ssb155480 			 * The destination is a vnet device within ldoms
831c1c61f44Ssb155480 			 * and directly reachable, invoke the tx function
832c1c61f44Ssb155480 			 * in the fdb entry.
833c1c61f44Ssb155480 			 */
834678453a8Sspeer 			macp = &vresp->macreg;
835678453a8Sspeer 			resid_mp = macp->m_callbacks->mc_tx(macp->m_driver, mp);
836c1c61f44Ssb155480 
837c1c61f44Ssb155480 			/* tx done; now release ref on fdb entry */
838678453a8Sspeer 			VNET_FDBE_REFRELE(vresp);
839c1c61f44Ssb155480 
8401ae08745Sheppo 			if (resid_mp != NULL) {
8411ae08745Sheppo 				/* m_tx failed */
8421ae08745Sheppo 				mp->b_next = next;
8431ae08745Sheppo 				break;
8441ae08745Sheppo 			}
8451ae08745Sheppo 		} else {
846678453a8Sspeer 			is_unicast = !(IS_BROADCAST(ehp) ||
847678453a8Sspeer 			    (IS_MULTICAST(ehp)));
8481ae08745Sheppo 			/*
849c1c61f44Ssb155480 			 * Destination is not in FDB.
850678453a8Sspeer 			 * If the destination is broadcast or multicast,
851678453a8Sspeer 			 * then forward the packet to vswitch.
852678453a8Sspeer 			 * If a Hybrid resource avilable, then send the
853678453a8Sspeer 			 * unicast packet via hybrid resource, otherwise
854678453a8Sspeer 			 * forward it to vswitch.
8551ae08745Sheppo 			 */
856c1c61f44Ssb155480 			READ_ENTER(&vnetp->vsw_fp_rw);
857c1c61f44Ssb155480 
858678453a8Sspeer 			if ((is_unicast) && (vnetp->hio_fp != NULL)) {
859678453a8Sspeer 				vresp = vnetp->hio_fp;
8608c242ab0SSriharsha Basavapatna 				hres = B_TRUE;
861678453a8Sspeer 			} else {
862678453a8Sspeer 				vresp = vnetp->vsw_fp;
8638c242ab0SSriharsha Basavapatna 				hres = B_FALSE;
864678453a8Sspeer 			}
865678453a8Sspeer 			if (vresp == NULL) {
866c1c61f44Ssb155480 				/*
867c1c61f44Ssb155480 				 * no fdb entry to vsw? drop the packet.
868c1c61f44Ssb155480 				 */
869c1c61f44Ssb155480 				RW_EXIT(&vnetp->vsw_fp_rw);
870c1c61f44Ssb155480 				freemsg(mp);
871c1c61f44Ssb155480 				mp = next;
872c1c61f44Ssb155480 				continue;
873c1c61f44Ssb155480 			}
874c1c61f44Ssb155480 
875c1c61f44Ssb155480 			/* ref hold the fdb entry to vsw */
876678453a8Sspeer 			VNET_FDBE_REFHOLD(vresp);
877c1c61f44Ssb155480 
878c1c61f44Ssb155480 			RW_EXIT(&vnetp->vsw_fp_rw);
879c1c61f44Ssb155480 
8808c242ab0SSriharsha Basavapatna 			/*
8818c242ab0SSriharsha Basavapatna 			 * In the case of a hybrid resource we need to insert
8828c242ab0SSriharsha Basavapatna 			 * the tag for the pvid case here; unlike packets that
8838c242ab0SSriharsha Basavapatna 			 * are destined to a vnet/vsw in which case the vgen
8848c242ab0SSriharsha Basavapatna 			 * layer does the tagging before sending it over ldc.
8858c242ab0SSriharsha Basavapatna 			 */
8868c242ab0SSriharsha Basavapatna 			if (hres == B_TRUE) {
8878c242ab0SSriharsha Basavapatna 				/*
8888c242ab0SSriharsha Basavapatna 				 * Determine if the frame being transmitted
8898c242ab0SSriharsha Basavapatna 				 * over the hybrid resource is untagged. If so,
8908c242ab0SSriharsha Basavapatna 				 * insert the tag before transmitting.
8918c242ab0SSriharsha Basavapatna 				 */
8928c242ab0SSriharsha Basavapatna 				if (is_pvid == B_TRUE &&
8938c242ab0SSriharsha Basavapatna 				    ehp->ether_type != htons(ETHERTYPE_VLAN)) {
8948c242ab0SSriharsha Basavapatna 
8958c242ab0SSriharsha Basavapatna 					mp = vnet_vlan_insert_tag(mp,
8968c242ab0SSriharsha Basavapatna 					    vnetp->pvid);
8978c242ab0SSriharsha Basavapatna 					if (mp == NULL) {
8988c242ab0SSriharsha Basavapatna 						VNET_FDBE_REFRELE(vresp);
8998c242ab0SSriharsha Basavapatna 						mp = next;
9008c242ab0SSriharsha Basavapatna 						continue;
9018c242ab0SSriharsha Basavapatna 					}
9028c242ab0SSriharsha Basavapatna 
9038c242ab0SSriharsha Basavapatna 				}
9048c242ab0SSriharsha Basavapatna 
905678453a8Sspeer 				macp = &vresp->macreg;
90663f531d1SSriharsha Basavapatna 				tx_arg = tx_ringp;
90763f531d1SSriharsha Basavapatna 			} else {
90863f531d1SSriharsha Basavapatna 				macp = &vresp->macreg;
90963f531d1SSriharsha Basavapatna 				tx_arg = macp->m_driver;
91063f531d1SSriharsha Basavapatna 			}
91163f531d1SSriharsha Basavapatna 			resid_mp = macp->m_callbacks->mc_tx(tx_arg, mp);
912c1c61f44Ssb155480 
913c1c61f44Ssb155480 			/* tx done; now release ref on fdb entry */
914678453a8Sspeer 			VNET_FDBE_REFRELE(vresp);
915c1c61f44Ssb155480 
9161ae08745Sheppo 			if (resid_mp != NULL) {
9171ae08745Sheppo 				/* m_tx failed */
9181ae08745Sheppo 				mp->b_next = next;
9191ae08745Sheppo 				break;
9201ae08745Sheppo 			}
9211ae08745Sheppo 		}
9221ae08745Sheppo 
9230dc2366fSVenugopal Iyer 		statsp->obytes += size;
9240dc2366fSVenugopal Iyer 		statsp->opackets++;
9251ae08745Sheppo 		mp = next;
9261ae08745Sheppo 	}
9271ae08745Sheppo 
928844e62a3Sraghuram 	DBG1(vnetp, "exit\n");
9291ae08745Sheppo 	return (mp);
9301ae08745Sheppo }
9311ae08745Sheppo 
9321ae08745Sheppo /* get statistics from the device */
933ba2e4443Sseb int
vnet_m_stat(void * arg,uint_t stat,uint64_t * val)934ba2e4443Sseb vnet_m_stat(void *arg, uint_t stat, uint64_t *val)
9351ae08745Sheppo {
9361ae08745Sheppo 	vnet_t *vnetp = arg;
937678453a8Sspeer 	vnet_res_t	*vresp;
938678453a8Sspeer 	mac_register_t	*macp;
939ba2e4443Sseb 	mac_callbacks_t	*cbp;
940ba2e4443Sseb 	uint64_t val_total = 0;
9411ae08745Sheppo 
942844e62a3Sraghuram 	DBG1(vnetp, "enter\n");
9431ae08745Sheppo 
9441ae08745Sheppo 	/*
945ba2e4443Sseb 	 * get the specified statistic from each transport and return the
946ba2e4443Sseb 	 * aggregate val.  This obviously only works for counters.
9471ae08745Sheppo 	 */
948ba2e4443Sseb 	if ((IS_MAC_STAT(stat) && !MAC_STAT_ISACOUNTER(stat)) ||
949ba2e4443Sseb 	    (IS_MACTYPE_STAT(stat) && !ETHER_STAT_ISACOUNTER(stat))) {
950ba2e4443Sseb 		return (ENOTSUP);
951ba2e4443Sseb 	}
952678453a8Sspeer 
953678453a8Sspeer 	READ_ENTER(&vnetp->vrwlock);
954678453a8Sspeer 	for (vresp = vnetp->vres_list; vresp != NULL; vresp = vresp->nextp) {
955678453a8Sspeer 		macp = &vresp->macreg;
956678453a8Sspeer 		cbp = macp->m_callbacks;
957678453a8Sspeer 		if (cbp->mc_getstat(macp->m_driver, stat, val) == 0)
958ba2e4443Sseb 			val_total += *val;
9591ae08745Sheppo 	}
960678453a8Sspeer 	RW_EXIT(&vnetp->vrwlock);
9611ae08745Sheppo 
962ba2e4443Sseb 	*val = val_total;
963ba2e4443Sseb 
964844e62a3Sraghuram 	DBG1(vnetp, "exit\n");
965ba2e4443Sseb 	return (0);
9661ae08745Sheppo }
9671ae08745Sheppo 
96863f531d1SSriharsha Basavapatna static void
vnet_ring_grp_init(vnet_t * vnetp)96963f531d1SSriharsha Basavapatna vnet_ring_grp_init(vnet_t *vnetp)
97063f531d1SSriharsha Basavapatna {
97163f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_group_t	*rx_grp;
97263f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_ring_t	*rx_ringp;
97363f531d1SSriharsha Basavapatna 	vnet_pseudo_tx_group_t	*tx_grp;
97463f531d1SSriharsha Basavapatna 	vnet_pseudo_tx_ring_t	*tx_ringp;
97563f531d1SSriharsha Basavapatna 	int			i;
97663f531d1SSriharsha Basavapatna 
97763f531d1SSriharsha Basavapatna 	tx_grp = &vnetp->tx_grp[0];
97863f531d1SSriharsha Basavapatna 	tx_ringp = kmem_zalloc(sizeof (vnet_pseudo_tx_ring_t) *
97963f531d1SSriharsha Basavapatna 	    VNET_NUM_PSEUDO_TXRINGS, KM_SLEEP);
98063f531d1SSriharsha Basavapatna 	for (i = 0; i < VNET_NUM_PSEUDO_TXRINGS; i++) {
98163f531d1SSriharsha Basavapatna 		tx_ringp[i].state |= VNET_TXRING_SHARED;
98263f531d1SSriharsha Basavapatna 	}
98363f531d1SSriharsha Basavapatna 	tx_grp->rings = tx_ringp;
98463f531d1SSriharsha Basavapatna 	tx_grp->ring_cnt = VNET_NUM_PSEUDO_TXRINGS;
9850dc2366fSVenugopal Iyer 	mutex_init(&tx_grp->flowctl_lock, NULL, MUTEX_DRIVER, NULL);
9860dc2366fSVenugopal Iyer 	cv_init(&tx_grp->flowctl_cv, NULL, CV_DRIVER, NULL);
9870dc2366fSVenugopal Iyer 	tx_grp->flowctl_thread = thread_create(NULL, 0,
9880dc2366fSVenugopal Iyer 	    vnet_tx_notify_thread, tx_grp, 0, &p0, TS_RUN, minclsyspri);
98963f531d1SSriharsha Basavapatna 
99063f531d1SSriharsha Basavapatna 	rx_grp = &vnetp->rx_grp[0];
99163f531d1SSriharsha Basavapatna 	rx_grp->max_ring_cnt = MAX_RINGS_PER_GROUP;
99263f531d1SSriharsha Basavapatna 	rw_init(&rx_grp->lock, NULL, RW_DRIVER, NULL);
99363f531d1SSriharsha Basavapatna 	rx_ringp = kmem_zalloc(sizeof (vnet_pseudo_rx_ring_t) *
99463f531d1SSriharsha Basavapatna 	    rx_grp->max_ring_cnt, KM_SLEEP);
99563f531d1SSriharsha Basavapatna 
99663f531d1SSriharsha Basavapatna 	/*
99763f531d1SSriharsha Basavapatna 	 * Setup the first 3 Pseudo RX Rings that are reserved;
99863f531d1SSriharsha Basavapatna 	 * 1 for LDC resource to vswitch + 2 for RX rings of Hybrid resource.
99963f531d1SSriharsha Basavapatna 	 */
100063f531d1SSriharsha Basavapatna 	rx_ringp[0].state |= VNET_RXRING_INUSE|VNET_RXRING_LDC_SERVICE;
100163f531d1SSriharsha Basavapatna 	rx_ringp[0].index = 0;
100263f531d1SSriharsha Basavapatna 	rx_ringp[1].state |= VNET_RXRING_INUSE|VNET_RXRING_HYBRID;
100363f531d1SSriharsha Basavapatna 	rx_ringp[1].index = 1;
100463f531d1SSriharsha Basavapatna 	rx_ringp[2].state |= VNET_RXRING_INUSE|VNET_RXRING_HYBRID;
100563f531d1SSriharsha Basavapatna 	rx_ringp[2].index = 2;
100663f531d1SSriharsha Basavapatna 
100763f531d1SSriharsha Basavapatna 	rx_grp->ring_cnt = VNET_NUM_PSEUDO_RXRINGS_DEFAULT;
100863f531d1SSriharsha Basavapatna 	rx_grp->rings = rx_ringp;
100963f531d1SSriharsha Basavapatna 
101063f531d1SSriharsha Basavapatna 	for (i = VNET_NUM_PSEUDO_RXRINGS_DEFAULT;
101163f531d1SSriharsha Basavapatna 	    i < rx_grp->max_ring_cnt; i++) {
101263f531d1SSriharsha Basavapatna 		rx_ringp = &rx_grp->rings[i];
101363f531d1SSriharsha Basavapatna 		rx_ringp->state = VNET_RXRING_FREE;
101463f531d1SSriharsha Basavapatna 		rx_ringp->index = i;
101563f531d1SSriharsha Basavapatna 	}
101663f531d1SSriharsha Basavapatna }
101763f531d1SSriharsha Basavapatna 
101863f531d1SSriharsha Basavapatna static void
vnet_ring_grp_uninit(vnet_t * vnetp)101963f531d1SSriharsha Basavapatna vnet_ring_grp_uninit(vnet_t *vnetp)
102063f531d1SSriharsha Basavapatna {
102163f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_group_t	*rx_grp;
102263f531d1SSriharsha Basavapatna 	vnet_pseudo_tx_group_t	*tx_grp;
10230dc2366fSVenugopal Iyer 	kt_did_t		tid = 0;
102463f531d1SSriharsha Basavapatna 
102563f531d1SSriharsha Basavapatna 	tx_grp = &vnetp->tx_grp[0];
10260dc2366fSVenugopal Iyer 
10270dc2366fSVenugopal Iyer 	/* Inform tx_notify_thread to exit */
10280dc2366fSVenugopal Iyer 	mutex_enter(&tx_grp->flowctl_lock);
10290dc2366fSVenugopal Iyer 	if (tx_grp->flowctl_thread != NULL) {
10300dc2366fSVenugopal Iyer 		tid = tx_grp->flowctl_thread->t_did;
10310dc2366fSVenugopal Iyer 		tx_grp->flowctl_done = B_TRUE;
10320dc2366fSVenugopal Iyer 		cv_signal(&tx_grp->flowctl_cv);
10330dc2366fSVenugopal Iyer 	}
10340dc2366fSVenugopal Iyer 	mutex_exit(&tx_grp->flowctl_lock);
10350dc2366fSVenugopal Iyer 	if (tid != 0)
10360dc2366fSVenugopal Iyer 		thread_join(tid);
10370dc2366fSVenugopal Iyer 
103863f531d1SSriharsha Basavapatna 	if (tx_grp->rings != NULL) {
103963f531d1SSriharsha Basavapatna 		ASSERT(tx_grp->ring_cnt == VNET_NUM_PSEUDO_TXRINGS);
104063f531d1SSriharsha Basavapatna 		kmem_free(tx_grp->rings, sizeof (vnet_pseudo_tx_ring_t) *
104163f531d1SSriharsha Basavapatna 		    tx_grp->ring_cnt);
104263f531d1SSriharsha Basavapatna 		tx_grp->rings = NULL;
104363f531d1SSriharsha Basavapatna 	}
104463f531d1SSriharsha Basavapatna 
104563f531d1SSriharsha Basavapatna 	rx_grp = &vnetp->rx_grp[0];
104663f531d1SSriharsha Basavapatna 	if (rx_grp->rings != NULL) {
104763f531d1SSriharsha Basavapatna 		ASSERT(rx_grp->max_ring_cnt == MAX_RINGS_PER_GROUP);
104863f531d1SSriharsha Basavapatna 		ASSERT(rx_grp->ring_cnt == VNET_NUM_PSEUDO_RXRINGS_DEFAULT);
104963f531d1SSriharsha Basavapatna 		kmem_free(rx_grp->rings, sizeof (vnet_pseudo_rx_ring_t) *
105063f531d1SSriharsha Basavapatna 		    rx_grp->max_ring_cnt);
105163f531d1SSriharsha Basavapatna 		rx_grp->rings = NULL;
105263f531d1SSriharsha Basavapatna 	}
105363f531d1SSriharsha Basavapatna }
105463f531d1SSriharsha Basavapatna 
105563f531d1SSriharsha Basavapatna static vnet_pseudo_rx_ring_t *
vnet_alloc_pseudo_rx_ring(vnet_t * vnetp)105663f531d1SSriharsha Basavapatna vnet_alloc_pseudo_rx_ring(vnet_t *vnetp)
105763f531d1SSriharsha Basavapatna {
105863f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_group_t  *rx_grp;
105963f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_ring_t	*rx_ringp;
106063f531d1SSriharsha Basavapatna 	int			index;
106163f531d1SSriharsha Basavapatna 
106263f531d1SSriharsha Basavapatna 	rx_grp = &vnetp->rx_grp[0];
106363f531d1SSriharsha Basavapatna 	WRITE_ENTER(&rx_grp->lock);
106463f531d1SSriharsha Basavapatna 
106563f531d1SSriharsha Basavapatna 	if (rx_grp->ring_cnt == rx_grp->max_ring_cnt) {
106663f531d1SSriharsha Basavapatna 		/* no rings available */
106763f531d1SSriharsha Basavapatna 		RW_EXIT(&rx_grp->lock);
106863f531d1SSriharsha Basavapatna 		return (NULL);
106963f531d1SSriharsha Basavapatna 	}
107063f531d1SSriharsha Basavapatna 
107163f531d1SSriharsha Basavapatna 	for (index = VNET_NUM_PSEUDO_RXRINGS_DEFAULT;
107263f531d1SSriharsha Basavapatna 	    index < rx_grp->max_ring_cnt; index++) {
107363f531d1SSriharsha Basavapatna 		rx_ringp = &rx_grp->rings[index];
107463f531d1SSriharsha Basavapatna 		if (rx_ringp->state == VNET_RXRING_FREE) {
107563f531d1SSriharsha Basavapatna 			rx_ringp->state |= VNET_RXRING_INUSE;
107663f531d1SSriharsha Basavapatna 			rx_grp->ring_cnt++;
107763f531d1SSriharsha Basavapatna 			break;
107863f531d1SSriharsha Basavapatna 		}
107963f531d1SSriharsha Basavapatna 	}
108063f531d1SSriharsha Basavapatna 
108163f531d1SSriharsha Basavapatna 	RW_EXIT(&rx_grp->lock);
108263f531d1SSriharsha Basavapatna 	return (rx_ringp);
108363f531d1SSriharsha Basavapatna }
108463f531d1SSriharsha Basavapatna 
108563f531d1SSriharsha Basavapatna static void
vnet_free_pseudo_rx_ring(vnet_t * vnetp,vnet_pseudo_rx_ring_t * ringp)108663f531d1SSriharsha Basavapatna vnet_free_pseudo_rx_ring(vnet_t *vnetp, vnet_pseudo_rx_ring_t *ringp)
108763f531d1SSriharsha Basavapatna {
108863f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_group_t  *rx_grp;
108963f531d1SSriharsha Basavapatna 
109063f531d1SSriharsha Basavapatna 	ASSERT(ringp->index >= VNET_NUM_PSEUDO_RXRINGS_DEFAULT);
109163f531d1SSriharsha Basavapatna 	rx_grp = &vnetp->rx_grp[0];
109263f531d1SSriharsha Basavapatna 	WRITE_ENTER(&rx_grp->lock);
109363f531d1SSriharsha Basavapatna 
109463f531d1SSriharsha Basavapatna 	if (ringp->state != VNET_RXRING_FREE) {
109563f531d1SSriharsha Basavapatna 		ringp->state = VNET_RXRING_FREE;
109663f531d1SSriharsha Basavapatna 		ringp->handle = NULL;
109763f531d1SSriharsha Basavapatna 		rx_grp->ring_cnt--;
109863f531d1SSriharsha Basavapatna 	}
109963f531d1SSriharsha Basavapatna 
110063f531d1SSriharsha Basavapatna 	RW_EXIT(&rx_grp->lock);
110163f531d1SSriharsha Basavapatna }
110263f531d1SSriharsha Basavapatna 
11031ae08745Sheppo /* wrapper function for mac_register() */
11041ae08745Sheppo static int
vnet_mac_register(vnet_t * vnetp)11051ae08745Sheppo vnet_mac_register(vnet_t *vnetp)
11061ae08745Sheppo {
1107ba2e4443Sseb 	mac_register_t	*macp;
1108ba2e4443Sseb 	int		err;
11091ae08745Sheppo 
1110ba2e4443Sseb 	if ((macp = mac_alloc(MAC_VERSION)) == NULL)
1111ba2e4443Sseb 		return (DDI_FAILURE);
1112ba2e4443Sseb 	macp->m_type_ident = MAC_PLUGIN_IDENT_ETHER;
1113ba2e4443Sseb 	macp->m_driver = vnetp;
11141ae08745Sheppo 	macp->m_dip = vnetp->dip;
1115ba2e4443Sseb 	macp->m_src_addr = vnetp->curr_macaddr;
1116ba2e4443Sseb 	macp->m_callbacks = &vnet_m_callbacks;
1117ba2e4443Sseb 	macp->m_min_sdu = 0;
11187b1f684aSSriharsha Basavapatna 	macp->m_max_sdu = vnetp->mtu;
1119c1c61f44Ssb155480 	macp->m_margin = VLAN_TAGSZ;
11201ae08745Sheppo 
112163f531d1SSriharsha Basavapatna 	macp->m_v12n = MAC_VIRT_LEVEL1;
112263f531d1SSriharsha Basavapatna 
112363f531d1SSriharsha Basavapatna 	/*
11241ae08745Sheppo 	 * Finally, we're ready to register ourselves with the MAC layer
11251ae08745Sheppo 	 * interface; if this succeeds, we're all ready to start()
11261ae08745Sheppo 	 */
1127ba2e4443Sseb 	err = mac_register(macp, &vnetp->mh);
1128ba2e4443Sseb 	mac_free(macp);
1129ba2e4443Sseb 	return (err == 0 ? DDI_SUCCESS : DDI_FAILURE);
11301ae08745Sheppo }
11311ae08745Sheppo 
11321ae08745Sheppo /* read the mac address of the device */
11331ae08745Sheppo static int
vnet_read_mac_address(vnet_t * vnetp)11341ae08745Sheppo vnet_read_mac_address(vnet_t *vnetp)
11351ae08745Sheppo {
11361ae08745Sheppo 	uchar_t		*macaddr;
11371ae08745Sheppo 	uint32_t	size;
11381ae08745Sheppo 	int		rv;
11391ae08745Sheppo 
11401ae08745Sheppo 	rv = ddi_prop_lookup_byte_array(DDI_DEV_T_ANY, vnetp->dip,
11411ae08745Sheppo 	    DDI_PROP_DONTPASS, macaddr_propname, &macaddr, &size);
11421ae08745Sheppo 	if ((rv != DDI_PROP_SUCCESS) || (size != ETHERADDRL)) {
1143844e62a3Sraghuram 		DWARN(vnetp, "prop_lookup failed(%s) err(%d)\n",
1144844e62a3Sraghuram 		    macaddr_propname, rv);
11451ae08745Sheppo 		return (DDI_FAILURE);
11461ae08745Sheppo 	}
11471ae08745Sheppo 	bcopy(macaddr, (caddr_t)vnetp->vendor_addr, ETHERADDRL);
11481ae08745Sheppo 	bcopy(macaddr, (caddr_t)vnetp->curr_macaddr, ETHERADDRL);
11491ae08745Sheppo 	ddi_prop_free(macaddr);
11501ae08745Sheppo 
11511ae08745Sheppo 	return (DDI_SUCCESS);
11521ae08745Sheppo }
11531ae08745Sheppo 
115493b13a42Swentaoy static void
vnet_fdb_create(vnet_t * vnetp)1155c1c61f44Ssb155480 vnet_fdb_create(vnet_t *vnetp)
115693b13a42Swentaoy {
1157c1c61f44Ssb155480 	char		hashname[MAXNAMELEN];
115893b13a42Swentaoy 
1159c1c61f44Ssb155480 	(void) snprintf(hashname, MAXNAMELEN, "vnet%d-fdbhash",
1160c1c61f44Ssb155480 	    vnetp->instance);
1161c1c61f44Ssb155480 	vnetp->fdb_nchains = vnet_fdb_nchains;
1162c1c61f44Ssb155480 	vnetp->fdb_hashp = mod_hash_create_ptrhash(hashname, vnetp->fdb_nchains,
1163c1c61f44Ssb155480 	    mod_hash_null_valdtor, sizeof (void *));
116493b13a42Swentaoy }
116593b13a42Swentaoy 
116693b13a42Swentaoy static void
vnet_fdb_destroy(vnet_t * vnetp)1167c1c61f44Ssb155480 vnet_fdb_destroy(vnet_t *vnetp)
116893b13a42Swentaoy {
1169c1c61f44Ssb155480 	/* destroy fdb-hash-table */
1170c1c61f44Ssb155480 	if (vnetp->fdb_hashp != NULL) {
1171c1c61f44Ssb155480 		mod_hash_destroy_hash(vnetp->fdb_hashp);
1172c1c61f44Ssb155480 		vnetp->fdb_hashp = NULL;
1173c1c61f44Ssb155480 		vnetp->fdb_nchains = 0;
1174c1c61f44Ssb155480 	}
117593b13a42Swentaoy }
117693b13a42Swentaoy 
117793b13a42Swentaoy /*
1178c1c61f44Ssb155480  * Add an entry into the fdb.
117993b13a42Swentaoy  */
11801ae08745Sheppo void
vnet_fdbe_add(vnet_t * vnetp,vnet_res_t * vresp)1181678453a8Sspeer vnet_fdbe_add(vnet_t *vnetp, vnet_res_t *vresp)
11821ae08745Sheppo {
1183c1c61f44Ssb155480 	uint64_t	addr = 0;
1184c1c61f44Ssb155480 	int		rv;
1185c1c61f44Ssb155480 
1186678453a8Sspeer 	KEY_HASH(addr, vresp->rem_macaddr);
11871ae08745Sheppo 
11881ae08745Sheppo 	/*
1189678453a8Sspeer 	 * If the entry being added corresponds to LDC_SERVICE resource,
1190678453a8Sspeer 	 * that is, vswitch connection, it is added to the hash and also
1191678453a8Sspeer 	 * the entry is cached, an additional reference count reflects
1192678453a8Sspeer 	 * this. The HYBRID resource is not added to the hash, but only
1193678453a8Sspeer 	 * cached, as it is only used for sending out packets for unknown
1194678453a8Sspeer 	 * unicast destinations.
11951ae08745Sheppo 	 */
1196678453a8Sspeer 	(vresp->type == VIO_NET_RES_LDC_SERVICE) ?
1197678453a8Sspeer 	    (vresp->refcnt = 1) : (vresp->refcnt = 0);
11981ae08745Sheppo 
1199c1c61f44Ssb155480 	/*
1200c1c61f44Ssb155480 	 * Note: duplicate keys will be rejected by mod_hash.
1201c1c61f44Ssb155480 	 */
1202678453a8Sspeer 	if (vresp->type != VIO_NET_RES_HYBRID) {
1203c1c61f44Ssb155480 		rv = mod_hash_insert(vnetp->fdb_hashp, (mod_hash_key_t)addr,
1204678453a8Sspeer 		    (mod_hash_val_t)vresp);
1205c1c61f44Ssb155480 		if (rv != 0) {
1206c1c61f44Ssb155480 			DWARN(vnetp, "Duplicate macaddr key(%lx)\n", addr);
12071ae08745Sheppo 			return;
12081ae08745Sheppo 		}
1209678453a8Sspeer 	}
12101ae08745Sheppo 
1211678453a8Sspeer 	if (vresp->type == VIO_NET_RES_LDC_SERVICE) {
1212c1c61f44Ssb155480 		/* Cache the fdb entry to vsw-port */
1213c1c61f44Ssb155480 		WRITE_ENTER(&vnetp->vsw_fp_rw);
1214c1c61f44Ssb155480 		if (vnetp->vsw_fp == NULL)
1215678453a8Sspeer 			vnetp->vsw_fp = vresp;
1216678453a8Sspeer 		RW_EXIT(&vnetp->vsw_fp_rw);
1217678453a8Sspeer 	} else if (vresp->type == VIO_NET_RES_HYBRID) {
1218678453a8Sspeer 		/* Cache the fdb entry to hybrid resource */
1219678453a8Sspeer 		WRITE_ENTER(&vnetp->vsw_fp_rw);
1220678453a8Sspeer 		if (vnetp->hio_fp == NULL)
1221678453a8Sspeer 			vnetp->hio_fp = vresp;
1222c1c61f44Ssb155480 		RW_EXIT(&vnetp->vsw_fp_rw);
1223c1c61f44Ssb155480 	}
12241ae08745Sheppo }
12251ae08745Sheppo 
1226c1c61f44Ssb155480 /*
1227c1c61f44Ssb155480  * Remove an entry from fdb.
1228c1c61f44Ssb155480  */
1229678453a8Sspeer static void
vnet_fdbe_del(vnet_t * vnetp,vnet_res_t * vresp)1230678453a8Sspeer vnet_fdbe_del(vnet_t *vnetp, vnet_res_t *vresp)
12311ae08745Sheppo {
1232c1c61f44Ssb155480 	uint64_t	addr = 0;
1233c1c61f44Ssb155480 	int		rv;
1234c1c61f44Ssb155480 	uint32_t	refcnt;
1235678453a8Sspeer 	vnet_res_t	*tmp;
1236c1c61f44Ssb155480 
1237678453a8Sspeer 	KEY_HASH(addr, vresp->rem_macaddr);
12381ae08745Sheppo 
12391ae08745Sheppo 	/*
1240c1c61f44Ssb155480 	 * Remove the entry from fdb hash table.
1241c1c61f44Ssb155480 	 * This prevents further references to this fdb entry.
12421ae08745Sheppo 	 */
1243678453a8Sspeer 	if (vresp->type != VIO_NET_RES_HYBRID) {
1244c1c61f44Ssb155480 		rv = mod_hash_remove(vnetp->fdb_hashp, (mod_hash_key_t)addr,
1245678453a8Sspeer 		    (mod_hash_val_t *)&tmp);
1246678453a8Sspeer 		if (rv != 0) {
1247678453a8Sspeer 			/*
1248678453a8Sspeer 			 * As the resources are added to the hash only
1249678453a8Sspeer 			 * after they are started, this can occur if
1250678453a8Sspeer 			 * a resource unregisters before it is ever started.
1251678453a8Sspeer 			 */
1252678453a8Sspeer 			return;
1253678453a8Sspeer 		}
1254678453a8Sspeer 	}
12551ae08745Sheppo 
1256678453a8Sspeer 	if (vresp->type == VIO_NET_RES_LDC_SERVICE) {
1257c1c61f44Ssb155480 		WRITE_ENTER(&vnetp->vsw_fp_rw);
12581ae08745Sheppo 
1259678453a8Sspeer 		ASSERT(tmp == vnetp->vsw_fp);
1260c1c61f44Ssb155480 		vnetp->vsw_fp = NULL;
1261c1c61f44Ssb155480 
1262c1c61f44Ssb155480 		RW_EXIT(&vnetp->vsw_fp_rw);
1263678453a8Sspeer 	} else if (vresp->type == VIO_NET_RES_HYBRID) {
1264678453a8Sspeer 		WRITE_ENTER(&vnetp->vsw_fp_rw);
1265678453a8Sspeer 
1266678453a8Sspeer 		vnetp->hio_fp = NULL;
1267678453a8Sspeer 
1268678453a8Sspeer 		RW_EXIT(&vnetp->vsw_fp_rw);
12691ae08745Sheppo 	}
12701ae08745Sheppo 
1271c1c61f44Ssb155480 	/*
1272c1c61f44Ssb155480 	 * If there are threads already ref holding before the entry was
1273c1c61f44Ssb155480 	 * removed from hash table, then wait for ref count to drop to zero.
1274c1c61f44Ssb155480 	 */
1275678453a8Sspeer 	(vresp->type == VIO_NET_RES_LDC_SERVICE) ?
1276678453a8Sspeer 	    (refcnt = 1) : (refcnt = 0);
1277678453a8Sspeer 	while (vresp->refcnt > refcnt) {
1278c1c61f44Ssb155480 		delay(drv_usectohz(vnet_fdbe_refcnt_delay));
1279c1c61f44Ssb155480 	}
1280c1c61f44Ssb155480 }
1281c1c61f44Ssb155480 
1282c1c61f44Ssb155480 /*
1283c1c61f44Ssb155480  * Search fdb for a given mac address. If an entry is found, hold
1284c1c61f44Ssb155480  * a reference to it and return the entry; else returns NULL.
1285c1c61f44Ssb155480  */
1286678453a8Sspeer static vnet_res_t *
vnet_fdbe_find(vnet_t * vnetp,struct ether_addr * addrp)1287c1c61f44Ssb155480 vnet_fdbe_find(vnet_t *vnetp, struct ether_addr *addrp)
1288c1c61f44Ssb155480 {
1289c1c61f44Ssb155480 	uint64_t	key = 0;
1290678453a8Sspeer 	vnet_res_t	*vresp;
1291c1c61f44Ssb155480 	int		rv;
1292c1c61f44Ssb155480 
1293678453a8Sspeer 	KEY_HASH(key, addrp->ether_addr_octet);
1294c1c61f44Ssb155480 
1295c1c61f44Ssb155480 	rv = mod_hash_find_cb(vnetp->fdb_hashp, (mod_hash_key_t)key,
1296678453a8Sspeer 	    (mod_hash_val_t *)&vresp, vnet_fdbe_find_cb);
1297c1c61f44Ssb155480 
1298c1c61f44Ssb155480 	if (rv != 0)
1299c1c61f44Ssb155480 		return (NULL);
1300c1c61f44Ssb155480 
1301678453a8Sspeer 	return (vresp);
1302c1c61f44Ssb155480 }
1303c1c61f44Ssb155480 
1304c1c61f44Ssb155480 /*
1305c1c61f44Ssb155480  * Callback function provided to mod_hash_find_cb(). After finding the fdb
1306c1c61f44Ssb155480  * entry corresponding to the key (macaddr), this callback will be invoked by
1307c1c61f44Ssb155480  * mod_hash_find_cb() to atomically increment the reference count on the fdb
1308c1c61f44Ssb155480  * entry before returning the found entry.
1309c1c61f44Ssb155480  */
1310c1c61f44Ssb155480 static void
vnet_fdbe_find_cb(mod_hash_key_t key,mod_hash_val_t val)1311c1c61f44Ssb155480 vnet_fdbe_find_cb(mod_hash_key_t key, mod_hash_val_t val)
1312c1c61f44Ssb155480 {
1313c1c61f44Ssb155480 	_NOTE(ARGUNUSED(key))
1314678453a8Sspeer 	VNET_FDBE_REFHOLD((vnet_res_t *)val);
1315678453a8Sspeer }
1316678453a8Sspeer 
13178c242ab0SSriharsha Basavapatna /*
13188c242ab0SSriharsha Basavapatna  * Frames received that are tagged with the pvid of the vnet device must be
13198c242ab0SSriharsha Basavapatna  * untagged before sending up the stack. This function walks the chain of rx
13208c242ab0SSriharsha Basavapatna  * frames, untags any such frames and returns the updated chain.
13218c242ab0SSriharsha Basavapatna  *
13228c242ab0SSriharsha Basavapatna  * Arguments:
13238c242ab0SSriharsha Basavapatna  *    pvid:  pvid of the vnet device for which packets are being received
13248c242ab0SSriharsha Basavapatna  *    mp:    head of pkt chain to be validated and untagged
13258c242ab0SSriharsha Basavapatna  *
13268c242ab0SSriharsha Basavapatna  * Returns:
13278c242ab0SSriharsha Basavapatna  *    mp:    head of updated chain of packets
13288c242ab0SSriharsha Basavapatna  */
13298c242ab0SSriharsha Basavapatna static void
vnet_rx_frames_untag(uint16_t pvid,mblk_t ** mp)13308c242ab0SSriharsha Basavapatna vnet_rx_frames_untag(uint16_t pvid, mblk_t **mp)
13318c242ab0SSriharsha Basavapatna {
13328c242ab0SSriharsha Basavapatna 	struct ether_vlan_header	*evhp;
13338c242ab0SSriharsha Basavapatna 	mblk_t				*bp;
13348c242ab0SSriharsha Basavapatna 	mblk_t				*bpt;
13358c242ab0SSriharsha Basavapatna 	mblk_t				*bph;
13368c242ab0SSriharsha Basavapatna 	mblk_t				*bpn;
13378c242ab0SSriharsha Basavapatna 
13388c242ab0SSriharsha Basavapatna 	bpn = bph = bpt = NULL;
13398c242ab0SSriharsha Basavapatna 
13408c242ab0SSriharsha Basavapatna 	for (bp = *mp; bp != NULL; bp = bpn) {
13418c242ab0SSriharsha Basavapatna 
13428c242ab0SSriharsha Basavapatna 		bpn = bp->b_next;
13438c242ab0SSriharsha Basavapatna 		bp->b_next = bp->b_prev = NULL;
13448c242ab0SSriharsha Basavapatna 
13458c242ab0SSriharsha Basavapatna 		evhp = (struct ether_vlan_header *)bp->b_rptr;
13468c242ab0SSriharsha Basavapatna 
13478c242ab0SSriharsha Basavapatna 		if (ntohs(evhp->ether_tpid) == ETHERTYPE_VLAN &&
13488c242ab0SSriharsha Basavapatna 		    VLAN_ID(ntohs(evhp->ether_tci)) == pvid) {
13498c242ab0SSriharsha Basavapatna 
13508c242ab0SSriharsha Basavapatna 			bp = vnet_vlan_remove_tag(bp);
13518c242ab0SSriharsha Basavapatna 			if (bp == NULL) {
13528c242ab0SSriharsha Basavapatna 				continue;
13538c242ab0SSriharsha Basavapatna 			}
13548c242ab0SSriharsha Basavapatna 
13558c242ab0SSriharsha Basavapatna 		}
13568c242ab0SSriharsha Basavapatna 
13578c242ab0SSriharsha Basavapatna 		/* build a chain of processed packets */
13588c242ab0SSriharsha Basavapatna 		if (bph == NULL) {
13598c242ab0SSriharsha Basavapatna 			bph = bpt = bp;
13608c242ab0SSriharsha Basavapatna 		} else {
13618c242ab0SSriharsha Basavapatna 			bpt->b_next = bp;
13628c242ab0SSriharsha Basavapatna 			bpt = bp;
13638c242ab0SSriharsha Basavapatna 		}
13648c242ab0SSriharsha Basavapatna 
13658c242ab0SSriharsha Basavapatna 	}
13668c242ab0SSriharsha Basavapatna 
13678c242ab0SSriharsha Basavapatna 	*mp = bph;
13688c242ab0SSriharsha Basavapatna }
13698c242ab0SSriharsha Basavapatna 
1370678453a8Sspeer static void
vnet_rx(vio_net_handle_t vrh,mblk_t * mp)1371678453a8Sspeer vnet_rx(vio_net_handle_t vrh, mblk_t *mp)
1372678453a8Sspeer {
1373678453a8Sspeer 	vnet_res_t		*vresp = (vnet_res_t *)vrh;
1374678453a8Sspeer 	vnet_t			*vnetp = vresp->vnetp;
137563f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_ring_t	*ringp;
1376678453a8Sspeer 
13778c242ab0SSriharsha Basavapatna 	if ((vnetp == NULL) || (vnetp->mh == 0)) {
1378678453a8Sspeer 		freemsgchain(mp);
13798c242ab0SSriharsha Basavapatna 		return;
1380678453a8Sspeer 	}
13818c242ab0SSriharsha Basavapatna 
138263f531d1SSriharsha Basavapatna 	ringp = vresp->rx_ringp;
138363f531d1SSriharsha Basavapatna 	mac_rx_ring(vnetp->mh, ringp->handle, mp, ringp->gen_num);
13841ae08745Sheppo }
1385ba2e4443Sseb 
1386ba2e4443Sseb void
vnet_tx_update(vio_net_handle_t vrh)1387678453a8Sspeer vnet_tx_update(vio_net_handle_t vrh)
1388ba2e4443Sseb {
1389678453a8Sspeer 	vnet_res_t		*vresp = (vnet_res_t *)vrh;
1390678453a8Sspeer 	vnet_t			*vnetp = vresp->vnetp;
139163f531d1SSriharsha Basavapatna 	vnet_pseudo_tx_ring_t	*tx_ringp;
139263f531d1SSriharsha Basavapatna 	vnet_pseudo_tx_group_t	*tx_grp;
139363f531d1SSriharsha Basavapatna 	int			i;
1394ba2e4443Sseb 
139563f531d1SSriharsha Basavapatna 	if (vnetp == NULL || vnetp->mh == NULL) {
139663f531d1SSriharsha Basavapatna 		return;
139763f531d1SSriharsha Basavapatna 	}
139863f531d1SSriharsha Basavapatna 
139963f531d1SSriharsha Basavapatna 	/*
140063f531d1SSriharsha Basavapatna 	 * Currently, the tx hwring API (used to access rings that belong to
140163f531d1SSriharsha Basavapatna 	 * a Hybrid IO resource) does not provide us a per ring flow ctrl
140263f531d1SSriharsha Basavapatna 	 * update; also the pseudo rings are shared by the ports/ldcs in the
140363f531d1SSriharsha Basavapatna 	 * vgen layer. Thus we can't figure out which pseudo ring is being
140463f531d1SSriharsha Basavapatna 	 * re-enabled for transmits. To work around this, when we get a tx
140563f531d1SSriharsha Basavapatna 	 * restart notification from below, we simply propagate that to all
140663f531d1SSriharsha Basavapatna 	 * the tx pseudo rings registered with the mac layer above.
140763f531d1SSriharsha Basavapatna 	 *
140863f531d1SSriharsha Basavapatna 	 * There are a couple of side effects with this approach, but they are
140963f531d1SSriharsha Basavapatna 	 * not harmful, as outlined below:
141063f531d1SSriharsha Basavapatna 	 *
141163f531d1SSriharsha Basavapatna 	 * A) We might send an invalid ring_update() for a ring that is not
141263f531d1SSriharsha Basavapatna 	 * really flow controlled. This will not have any effect in the mac
141363f531d1SSriharsha Basavapatna 	 * layer and packets will continue to be transmitted on that ring.
141463f531d1SSriharsha Basavapatna 	 *
141563f531d1SSriharsha Basavapatna 	 * B) We might end up clearing the flow control in the mac layer for
141663f531d1SSriharsha Basavapatna 	 * a ring that is still flow controlled in the underlying resource.
141763f531d1SSriharsha Basavapatna 	 * This will result in the mac layer restarting	transmit, only to be
141863f531d1SSriharsha Basavapatna 	 * flow controlled again on that ring.
141963f531d1SSriharsha Basavapatna 	 */
142063f531d1SSriharsha Basavapatna 	tx_grp = &vnetp->tx_grp[0];
142163f531d1SSriharsha Basavapatna 	for (i = 0; i < tx_grp->ring_cnt; i++) {
142263f531d1SSriharsha Basavapatna 		tx_ringp = &tx_grp->rings[i];
142363f531d1SSriharsha Basavapatna 		mac_tx_ring_update(vnetp->mh, tx_ringp->handle);
1424ba2e4443Sseb 	}
1425678453a8Sspeer }
1426678453a8Sspeer 
1427678453a8Sspeer /*
14280dc2366fSVenugopal Iyer  * vnet_tx_notify_thread:
14290dc2366fSVenugopal Iyer  *
14300dc2366fSVenugopal Iyer  * vnet_tx_ring_update() callback function wakes up this thread when
14310dc2366fSVenugopal Iyer  * it gets called. This thread will call mac_tx_ring_update() to
14320dc2366fSVenugopal Iyer  * notify upper mac of flow control getting relieved. Note that
14330dc2366fSVenugopal Iyer  * vnet_tx_ring_update() cannot call mac_tx_ring_update() directly
14340dc2366fSVenugopal Iyer  * because vnet_tx_ring_update() is called from lower mac with
14350dc2366fSVenugopal Iyer  * mi_rw_lock held and mac_tx_ring_update() would also try to grab
14360dc2366fSVenugopal Iyer  * the same lock.
14370dc2366fSVenugopal Iyer  */
14380dc2366fSVenugopal Iyer static void
vnet_tx_notify_thread(void * arg)14390dc2366fSVenugopal Iyer vnet_tx_notify_thread(void *arg)
14400dc2366fSVenugopal Iyer {
14410dc2366fSVenugopal Iyer 	callb_cpr_t		cprinfo;
14420dc2366fSVenugopal Iyer 	vnet_pseudo_tx_group_t	*tx_grp = (vnet_pseudo_tx_group_t *)arg;
14430dc2366fSVenugopal Iyer 	vnet_pseudo_tx_ring_t	*tx_ringp;
14440dc2366fSVenugopal Iyer 	vnet_t			*vnetp;
14450dc2366fSVenugopal Iyer 	int			i;
14460dc2366fSVenugopal Iyer 
14470dc2366fSVenugopal Iyer 	CALLB_CPR_INIT(&cprinfo, &tx_grp->flowctl_lock, callb_generic_cpr,
14480dc2366fSVenugopal Iyer 	    "vnet_tx_notify_thread");
14490dc2366fSVenugopal Iyer 
14500dc2366fSVenugopal Iyer 	mutex_enter(&tx_grp->flowctl_lock);
14510dc2366fSVenugopal Iyer 	while (!tx_grp->flowctl_done) {
14520dc2366fSVenugopal Iyer 		CALLB_CPR_SAFE_BEGIN(&cprinfo);
14530dc2366fSVenugopal Iyer 		cv_wait(&tx_grp->flowctl_cv, &tx_grp->flowctl_lock);
14540dc2366fSVenugopal Iyer 		CALLB_CPR_SAFE_END(&cprinfo, &tx_grp->flowctl_lock);
14550dc2366fSVenugopal Iyer 
14560dc2366fSVenugopal Iyer 		for (i = 0; i < tx_grp->ring_cnt; i++) {
14570dc2366fSVenugopal Iyer 			tx_ringp = &tx_grp->rings[i];
14580dc2366fSVenugopal Iyer 			if (tx_ringp->woken_up) {
14590dc2366fSVenugopal Iyer 				tx_ringp->woken_up = B_FALSE;
14600dc2366fSVenugopal Iyer 				vnetp = tx_ringp->vnetp;
14610dc2366fSVenugopal Iyer 				mac_tx_ring_update(vnetp->mh, tx_ringp->handle);
14620dc2366fSVenugopal Iyer 			}
14630dc2366fSVenugopal Iyer 		}
14640dc2366fSVenugopal Iyer 	}
14650dc2366fSVenugopal Iyer 	/*
14660dc2366fSVenugopal Iyer 	 * The tx_grp is being destroyed, exit the thread.
14670dc2366fSVenugopal Iyer 	 */
14680dc2366fSVenugopal Iyer 	tx_grp->flowctl_thread = NULL;
14690dc2366fSVenugopal Iyer 	CALLB_CPR_EXIT(&cprinfo);
14700dc2366fSVenugopal Iyer 	thread_exit();
14710dc2366fSVenugopal Iyer }
14720dc2366fSVenugopal Iyer 
14730dc2366fSVenugopal Iyer void
vnet_tx_ring_update(void * arg1,uintptr_t arg2)14740dc2366fSVenugopal Iyer vnet_tx_ring_update(void *arg1, uintptr_t arg2)
14750dc2366fSVenugopal Iyer {
14760dc2366fSVenugopal Iyer 	vnet_t			*vnetp = (vnet_t *)arg1;
14770dc2366fSVenugopal Iyer 	vnet_pseudo_tx_group_t	*tx_grp;
14780dc2366fSVenugopal Iyer 	vnet_pseudo_tx_ring_t	*tx_ringp;
14790dc2366fSVenugopal Iyer 	int			i;
14800dc2366fSVenugopal Iyer 
14810dc2366fSVenugopal Iyer 	tx_grp = &vnetp->tx_grp[0];
14820dc2366fSVenugopal Iyer 	for (i = 0; i < tx_grp->ring_cnt; i++) {
14830dc2366fSVenugopal Iyer 		tx_ringp = &tx_grp->rings[i];
14840dc2366fSVenugopal Iyer 		if (tx_ringp->hw_rh == (mac_ring_handle_t)arg2) {
14850dc2366fSVenugopal Iyer 			mutex_enter(&tx_grp->flowctl_lock);
14860dc2366fSVenugopal Iyer 			tx_ringp->woken_up = B_TRUE;
14870dc2366fSVenugopal Iyer 			cv_signal(&tx_grp->flowctl_cv);
14880dc2366fSVenugopal Iyer 			mutex_exit(&tx_grp->flowctl_lock);
14890dc2366fSVenugopal Iyer 			break;
14900dc2366fSVenugopal Iyer 		}
14910dc2366fSVenugopal Iyer 	}
14920dc2366fSVenugopal Iyer }
14930dc2366fSVenugopal Iyer 
14940dc2366fSVenugopal Iyer /*
14957b1f684aSSriharsha Basavapatna  * Update the new mtu of vnet into the mac layer. First check if the device has
14967b1f684aSSriharsha Basavapatna  * been plumbed and if so fail the mtu update. Returns 0 on success.
14977b1f684aSSriharsha Basavapatna  */
14987b1f684aSSriharsha Basavapatna int
vnet_mtu_update(vnet_t * vnetp,uint32_t mtu)14997b1f684aSSriharsha Basavapatna vnet_mtu_update(vnet_t *vnetp, uint32_t mtu)
15007b1f684aSSriharsha Basavapatna {
15017b1f684aSSriharsha Basavapatna 	int	rv;
15027b1f684aSSriharsha Basavapatna 
15037b1f684aSSriharsha Basavapatna 	if (vnetp == NULL || vnetp->mh == NULL) {
15047b1f684aSSriharsha Basavapatna 		return (EINVAL);
15057b1f684aSSriharsha Basavapatna 	}
15067b1f684aSSriharsha Basavapatna 
15077b1f684aSSriharsha Basavapatna 	WRITE_ENTER(&vnetp->vrwlock);
15087b1f684aSSriharsha Basavapatna 
15097b1f684aSSriharsha Basavapatna 	if (vnetp->flags & VNET_STARTED) {
15107b1f684aSSriharsha Basavapatna 		RW_EXIT(&vnetp->vrwlock);
15117b1f684aSSriharsha Basavapatna 		cmn_err(CE_NOTE, "!vnet%d: Unable to process mtu "
15127b1f684aSSriharsha Basavapatna 		    "update as the device is plumbed\n",
15137b1f684aSSriharsha Basavapatna 		    vnetp->instance);
15147b1f684aSSriharsha Basavapatna 		return (EBUSY);
15157b1f684aSSriharsha Basavapatna 	}
15167b1f684aSSriharsha Basavapatna 
15177b1f684aSSriharsha Basavapatna 	/* update mtu in the mac layer */
15187b1f684aSSriharsha Basavapatna 	rv = mac_maxsdu_update(vnetp->mh, mtu);
15197b1f684aSSriharsha Basavapatna 	if (rv != 0) {
15207b1f684aSSriharsha Basavapatna 		RW_EXIT(&vnetp->vrwlock);
15217b1f684aSSriharsha Basavapatna 		cmn_err(CE_NOTE,
15227b1f684aSSriharsha Basavapatna 		    "!vnet%d: Unable to update mtu with mac layer\n",
15237b1f684aSSriharsha Basavapatna 		    vnetp->instance);
15247b1f684aSSriharsha Basavapatna 		return (EIO);
15257b1f684aSSriharsha Basavapatna 	}
15267b1f684aSSriharsha Basavapatna 
15277b1f684aSSriharsha Basavapatna 	vnetp->mtu = mtu;
15287b1f684aSSriharsha Basavapatna 
15297b1f684aSSriharsha Basavapatna 	RW_EXIT(&vnetp->vrwlock);
15307b1f684aSSriharsha Basavapatna 
15317b1f684aSSriharsha Basavapatna 	return (0);
15327b1f684aSSriharsha Basavapatna }
15337b1f684aSSriharsha Basavapatna 
15347b1f684aSSriharsha Basavapatna /*
15351107ea93SSriharsha Basavapatna  * Update the link state of vnet to the mac layer.
15361107ea93SSriharsha Basavapatna  */
15371107ea93SSriharsha Basavapatna void
vnet_link_update(vnet_t * vnetp,link_state_t link_state)15381107ea93SSriharsha Basavapatna vnet_link_update(vnet_t *vnetp, link_state_t link_state)
15391107ea93SSriharsha Basavapatna {
15401107ea93SSriharsha Basavapatna 	if (vnetp == NULL || vnetp->mh == NULL) {
15411107ea93SSriharsha Basavapatna 		return;
15421107ea93SSriharsha Basavapatna 	}
15431107ea93SSriharsha Basavapatna 
15441107ea93SSriharsha Basavapatna 	WRITE_ENTER(&vnetp->vrwlock);
15451107ea93SSriharsha Basavapatna 	if (vnetp->link_state == link_state) {
15461107ea93SSriharsha Basavapatna 		RW_EXIT(&vnetp->vrwlock);
15471107ea93SSriharsha Basavapatna 		return;
15481107ea93SSriharsha Basavapatna 	}
15491107ea93SSriharsha Basavapatna 	vnetp->link_state = link_state;
15501107ea93SSriharsha Basavapatna 	RW_EXIT(&vnetp->vrwlock);
15511107ea93SSriharsha Basavapatna 
15521107ea93SSriharsha Basavapatna 	mac_link_update(vnetp->mh, link_state);
15531107ea93SSriharsha Basavapatna }
15541107ea93SSriharsha Basavapatna 
15551107ea93SSriharsha Basavapatna /*
1556678453a8Sspeer  * vio_net_resource_reg -- An interface called to register a resource
1557678453a8Sspeer  *	with vnet.
1558678453a8Sspeer  *	macp -- a GLDv3 mac_register that has all the details of
1559678453a8Sspeer  *		a resource and its callbacks etc.
1560678453a8Sspeer  *	type -- resource type.
1561678453a8Sspeer  *	local_macaddr -- resource's MAC address. This is used to
1562678453a8Sspeer  *			 associate a resource with a corresponding vnet.
1563678453a8Sspeer  *	remote_macaddr -- remote side MAC address. This is ignored for
1564678453a8Sspeer  *			  the Hybrid resources.
1565678453a8Sspeer  *	vhp -- A handle returned to the caller.
1566678453a8Sspeer  *	vcb -- A set of callbacks provided to the callers.
1567678453a8Sspeer  */
vio_net_resource_reg(mac_register_t * macp,vio_net_res_type_t type,ether_addr_t local_macaddr,ether_addr_t rem_macaddr,vio_net_handle_t * vhp,vio_net_callbacks_t * vcb)1568678453a8Sspeer int vio_net_resource_reg(mac_register_t *macp, vio_net_res_type_t type,
1569678453a8Sspeer     ether_addr_t local_macaddr, ether_addr_t rem_macaddr, vio_net_handle_t *vhp,
1570678453a8Sspeer     vio_net_callbacks_t *vcb)
1571678453a8Sspeer {
1572678453a8Sspeer 	vnet_t		*vnetp;
1573678453a8Sspeer 	vnet_res_t	*vresp;
1574678453a8Sspeer 
1575678453a8Sspeer 	vresp = kmem_zalloc(sizeof (vnet_res_t), KM_SLEEP);
1576678453a8Sspeer 	ether_copy(local_macaddr, vresp->local_macaddr);
1577678453a8Sspeer 	ether_copy(rem_macaddr, vresp->rem_macaddr);
1578678453a8Sspeer 	vresp->type = type;
1579678453a8Sspeer 	bcopy(macp, &vresp->macreg, sizeof (mac_register_t));
1580678453a8Sspeer 
1581678453a8Sspeer 	DBG1(NULL, "Resource Registerig type=0%X\n", type);
1582678453a8Sspeer 
1583678453a8Sspeer 	READ_ENTER(&vnet_rw);
1584678453a8Sspeer 	vnetp = vnet_headp;
1585678453a8Sspeer 	while (vnetp != NULL) {
1586678453a8Sspeer 		if (VNET_MATCH_RES(vresp, vnetp)) {
1587678453a8Sspeer 			vresp->vnetp = vnetp;
15886b8fc343SWENTAO YANG 
15896b8fc343SWENTAO YANG 			/* Setup kstats for hio resource */
15906b8fc343SWENTAO YANG 			if (vresp->type == VIO_NET_RES_HYBRID) {
15916b8fc343SWENTAO YANG 				vresp->ksp = vnet_hio_setup_kstats(DRV_NAME,
15926b8fc343SWENTAO YANG 				    "hio", vresp);
15936b8fc343SWENTAO YANG 				if (vresp->ksp == NULL) {
15946b8fc343SWENTAO YANG 					cmn_err(CE_NOTE, "!vnet%d: Cannot "
15956b8fc343SWENTAO YANG 					    "create kstats for hio resource",
15966b8fc343SWENTAO YANG 					    vnetp->instance);
15976b8fc343SWENTAO YANG 				}
15986b8fc343SWENTAO YANG 			}
159963f531d1SSriharsha Basavapatna 			vnet_add_resource(vnetp, vresp);
1600678453a8Sspeer 			break;
1601678453a8Sspeer 		}
1602678453a8Sspeer 		vnetp = vnetp->nextp;
1603678453a8Sspeer 	}
1604678453a8Sspeer 	RW_EXIT(&vnet_rw);
1605678453a8Sspeer 	if (vresp->vnetp == NULL) {
1606678453a8Sspeer 		DWARN(NULL, "No vnet instance");
1607678453a8Sspeer 		kmem_free(vresp, sizeof (vnet_res_t));
1608678453a8Sspeer 		return (ENXIO);
1609678453a8Sspeer 	}
1610678453a8Sspeer 
1611678453a8Sspeer 	*vhp = vresp;
1612678453a8Sspeer 	vcb->vio_net_rx_cb = vnet_rx;
1613678453a8Sspeer 	vcb->vio_net_tx_update = vnet_tx_update;
1614678453a8Sspeer 	vcb->vio_net_report_err = vnet_handle_res_err;
1615678453a8Sspeer 
161663f531d1SSriharsha Basavapatna 	/* Bind the resource to pseudo ring(s) */
161763f531d1SSriharsha Basavapatna 	if (vnet_bind_rings(vresp) != 0) {
161863f531d1SSriharsha Basavapatna 		(void) vnet_rem_resource(vnetp, vresp);
161963f531d1SSriharsha Basavapatna 		vnet_hio_destroy_kstats(vresp->ksp);
162063f531d1SSriharsha Basavapatna 		KMEM_FREE(vresp);
162163f531d1SSriharsha Basavapatna 		return (1);
162263f531d1SSriharsha Basavapatna 	}
162363f531d1SSriharsha Basavapatna 
1624678453a8Sspeer 	/* Dispatch a task to start resources */
1625678453a8Sspeer 	vnet_dispatch_res_task(vnetp);
1626678453a8Sspeer 	return (0);
1627678453a8Sspeer }
1628678453a8Sspeer 
1629678453a8Sspeer /*
1630678453a8Sspeer  * vio_net_resource_unreg -- An interface to unregister a resource.
1631678453a8Sspeer  */
1632678453a8Sspeer void
vio_net_resource_unreg(vio_net_handle_t vhp)1633678453a8Sspeer vio_net_resource_unreg(vio_net_handle_t vhp)
1634678453a8Sspeer {
1635678453a8Sspeer 	vnet_res_t	*vresp = (vnet_res_t *)vhp;
1636678453a8Sspeer 	vnet_t		*vnetp = vresp->vnetp;
1637678453a8Sspeer 
1638678453a8Sspeer 	DBG1(NULL, "Resource Registerig hdl=0x%p", vhp);
1639678453a8Sspeer 
1640678453a8Sspeer 	ASSERT(vnetp != NULL);
16415460ddbdSSriharsha Basavapatna 	/*
16425460ddbdSSriharsha Basavapatna 	 * Remove the resource from fdb; this ensures
16435460ddbdSSriharsha Basavapatna 	 * there are no references to the resource.
16445460ddbdSSriharsha Basavapatna 	 */
1645678453a8Sspeer 	vnet_fdbe_del(vnetp, vresp);
1646678453a8Sspeer 
164763f531d1SSriharsha Basavapatna 	vnet_unbind_rings(vresp);
164863f531d1SSriharsha Basavapatna 
16495460ddbdSSriharsha Basavapatna 	/* Now remove the resource from the list */
165063f531d1SSriharsha Basavapatna 	(void) vnet_rem_resource(vnetp, vresp);
165163f531d1SSriharsha Basavapatna 
165263f531d1SSriharsha Basavapatna 	vnet_hio_destroy_kstats(vresp->ksp);
165363f531d1SSriharsha Basavapatna 	KMEM_FREE(vresp);
165463f531d1SSriharsha Basavapatna }
165563f531d1SSriharsha Basavapatna 
165663f531d1SSriharsha Basavapatna static void
vnet_add_resource(vnet_t * vnetp,vnet_res_t * vresp)165763f531d1SSriharsha Basavapatna vnet_add_resource(vnet_t *vnetp, vnet_res_t *vresp)
165863f531d1SSriharsha Basavapatna {
165963f531d1SSriharsha Basavapatna 	WRITE_ENTER(&vnetp->vrwlock);
166063f531d1SSriharsha Basavapatna 	vresp->nextp = vnetp->vres_list;
166163f531d1SSriharsha Basavapatna 	vnetp->vres_list = vresp;
166263f531d1SSriharsha Basavapatna 	RW_EXIT(&vnetp->vrwlock);
166363f531d1SSriharsha Basavapatna }
166463f531d1SSriharsha Basavapatna 
166563f531d1SSriharsha Basavapatna static vnet_res_t *
vnet_rem_resource(vnet_t * vnetp,vnet_res_t * vresp)166663f531d1SSriharsha Basavapatna vnet_rem_resource(vnet_t *vnetp, vnet_res_t *vresp)
166763f531d1SSriharsha Basavapatna {
166863f531d1SSriharsha Basavapatna 	vnet_res_t	*vrp;
166963f531d1SSriharsha Basavapatna 
1670678453a8Sspeer 	WRITE_ENTER(&vnetp->vrwlock);
1671678453a8Sspeer 	if (vresp == vnetp->vres_list) {
1672678453a8Sspeer 		vnetp->vres_list = vresp->nextp;
1673678453a8Sspeer 	} else {
1674678453a8Sspeer 		vrp = vnetp->vres_list;
1675678453a8Sspeer 		while (vrp->nextp != NULL) {
1676678453a8Sspeer 			if (vrp->nextp == vresp) {
1677678453a8Sspeer 				vrp->nextp = vresp->nextp;
1678678453a8Sspeer 				break;
1679678453a8Sspeer 			}
1680678453a8Sspeer 			vrp = vrp->nextp;
1681678453a8Sspeer 		}
1682678453a8Sspeer 	}
1683678453a8Sspeer 	vresp->vnetp = NULL;
1684678453a8Sspeer 	vresp->nextp = NULL;
168563f531d1SSriharsha Basavapatna 
1686678453a8Sspeer 	RW_EXIT(&vnetp->vrwlock);
168763f531d1SSriharsha Basavapatna 
168863f531d1SSriharsha Basavapatna 	return (vresp);
1689678453a8Sspeer }
1690678453a8Sspeer 
1691678453a8Sspeer /*
1692678453a8Sspeer  * vnet_dds_rx -- an interface called by vgen to DDS messages.
1693678453a8Sspeer  */
1694678453a8Sspeer void
vnet_dds_rx(void * arg,void * dmsg)1695678453a8Sspeer vnet_dds_rx(void *arg, void *dmsg)
1696678453a8Sspeer {
1697678453a8Sspeer 	vnet_t *vnetp = arg;
1698678453a8Sspeer 	vdds_process_dds_msg(vnetp, dmsg);
1699678453a8Sspeer }
1700678453a8Sspeer 
1701678453a8Sspeer /*
1702678453a8Sspeer  * vnet_send_dds_msg -- An interface provided to DDS to send
1703678453a8Sspeer  *	DDS messages. This simply sends meessages via vgen.
1704678453a8Sspeer  */
1705678453a8Sspeer int
vnet_send_dds_msg(vnet_t * vnetp,void * dmsg)1706678453a8Sspeer vnet_send_dds_msg(vnet_t *vnetp, void *dmsg)
1707678453a8Sspeer {
1708678453a8Sspeer 	int rv;
1709678453a8Sspeer 
1710678453a8Sspeer 	if (vnetp->vgenhdl != NULL) {
1711678453a8Sspeer 		rv = vgen_dds_tx(vnetp->vgenhdl, dmsg);
1712678453a8Sspeer 	}
1713678453a8Sspeer 	return (rv);
1714678453a8Sspeer }
1715678453a8Sspeer 
1716678453a8Sspeer /*
17176d6de4eeSWENTAO YANG  * vnet_cleanup_hio -- an interface called by vgen to cleanup hio resources.
17186d6de4eeSWENTAO YANG  */
17196d6de4eeSWENTAO YANG void
vnet_dds_cleanup_hio(vnet_t * vnetp)17206d6de4eeSWENTAO YANG vnet_dds_cleanup_hio(vnet_t *vnetp)
17216d6de4eeSWENTAO YANG {
17226d6de4eeSWENTAO YANG 	vdds_cleanup_hio(vnetp);
17236d6de4eeSWENTAO YANG }
17246d6de4eeSWENTAO YANG 
17256d6de4eeSWENTAO YANG /*
1726678453a8Sspeer  * vnet_handle_res_err -- A callback function called by a resource
1727678453a8Sspeer  *	to report an error. For example, vgen can call to report
1728678453a8Sspeer  *	an LDC down/reset event. This will trigger cleanup of associated
1729678453a8Sspeer  *	Hybrid resource.
1730678453a8Sspeer  */
1731678453a8Sspeer /* ARGSUSED */
1732678453a8Sspeer static void
vnet_handle_res_err(vio_net_handle_t vrh,vio_net_err_val_t err)1733678453a8Sspeer vnet_handle_res_err(vio_net_handle_t vrh, vio_net_err_val_t err)
1734678453a8Sspeer {
1735678453a8Sspeer 	vnet_res_t *vresp = (vnet_res_t *)vrh;
1736678453a8Sspeer 	vnet_t *vnetp = vresp->vnetp;
1737678453a8Sspeer 
1738678453a8Sspeer 	if (vnetp == NULL) {
1739678453a8Sspeer 		return;
1740678453a8Sspeer 	}
1741678453a8Sspeer 	if ((vresp->type != VIO_NET_RES_LDC_SERVICE) &&
1742678453a8Sspeer 	    (vresp->type != VIO_NET_RES_HYBRID)) {
1743678453a8Sspeer 		return;
1744678453a8Sspeer 	}
17456d6de4eeSWENTAO YANG 
17466d6de4eeSWENTAO YANG 	vdds_cleanup_hio(vnetp);
1747678453a8Sspeer }
1748678453a8Sspeer 
1749678453a8Sspeer /*
1750678453a8Sspeer  * vnet_dispatch_res_task -- A function to dispatch tasks start resources.
1751678453a8Sspeer  */
1752678453a8Sspeer static void
vnet_dispatch_res_task(vnet_t * vnetp)1753678453a8Sspeer vnet_dispatch_res_task(vnet_t *vnetp)
1754678453a8Sspeer {
1755678453a8Sspeer 	int rv;
1756678453a8Sspeer 
17578b923298SZach Kissel 	/*
17588b923298SZach Kissel 	 * Dispatch the task. It could be the case that vnetp->flags does
17598b923298SZach Kissel 	 * not have VNET_STARTED set. This is ok as vnet_rest_start_task()
17605460ddbdSSriharsha Basavapatna 	 * can abort the task when the task is started. See related comments
17615460ddbdSSriharsha Basavapatna 	 * in vnet_m_stop() and vnet_stop_resources().
17628b923298SZach Kissel 	 */
1763678453a8Sspeer 	rv = ddi_taskq_dispatch(vnetp->taskqp, vnet_res_start_task,
1764678453a8Sspeer 	    vnetp, DDI_NOSLEEP);
1765678453a8Sspeer 	if (rv != DDI_SUCCESS) {
1766678453a8Sspeer 		cmn_err(CE_WARN,
1767678453a8Sspeer 		    "vnet%d:Can't dispatch start resource task",
1768678453a8Sspeer 		    vnetp->instance);
1769678453a8Sspeer 	}
1770678453a8Sspeer }
1771678453a8Sspeer 
1772678453a8Sspeer /*
1773678453a8Sspeer  * vnet_res_start_task -- A taskq callback function that starts a resource.
1774678453a8Sspeer  */
1775678453a8Sspeer static void
vnet_res_start_task(void * arg)1776678453a8Sspeer vnet_res_start_task(void *arg)
1777678453a8Sspeer {
1778678453a8Sspeer 	vnet_t *vnetp = arg;
1779678453a8Sspeer 
1780678453a8Sspeer 	WRITE_ENTER(&vnetp->vrwlock);
1781678453a8Sspeer 	if (vnetp->flags & VNET_STARTED) {
1782678453a8Sspeer 		vnet_start_resources(vnetp);
1783678453a8Sspeer 	}
1784678453a8Sspeer 	RW_EXIT(&vnetp->vrwlock);
1785678453a8Sspeer }
1786678453a8Sspeer 
1787678453a8Sspeer /*
1788678453a8Sspeer  * vnet_start_resources -- starts all resources associated with
1789678453a8Sspeer  *	a vnet.
1790678453a8Sspeer  */
1791678453a8Sspeer static void
vnet_start_resources(vnet_t * vnetp)1792678453a8Sspeer vnet_start_resources(vnet_t *vnetp)
1793678453a8Sspeer {
1794678453a8Sspeer 	mac_register_t	*macp;
1795678453a8Sspeer 	mac_callbacks_t	*cbp;
1796678453a8Sspeer 	vnet_res_t	*vresp;
1797678453a8Sspeer 	int rv;
1798678453a8Sspeer 
1799678453a8Sspeer 	DBG1(vnetp, "enter\n");
1800678453a8Sspeer 
18015460ddbdSSriharsha Basavapatna 	ASSERT(RW_WRITE_HELD(&vnetp->vrwlock));
18025460ddbdSSriharsha Basavapatna 
1803678453a8Sspeer 	for (vresp = vnetp->vres_list; vresp != NULL; vresp = vresp->nextp) {
1804678453a8Sspeer 		/* skip if it is already started */
1805678453a8Sspeer 		if (vresp->flags & VNET_STARTED) {
1806678453a8Sspeer 			continue;
1807678453a8Sspeer 		}
1808678453a8Sspeer 		macp = &vresp->macreg;
1809678453a8Sspeer 		cbp = macp->m_callbacks;
1810678453a8Sspeer 		rv = cbp->mc_start(macp->m_driver);
1811678453a8Sspeer 		if (rv == 0) {
1812678453a8Sspeer 			/*
1813678453a8Sspeer 			 * Successfully started the resource, so now
1814678453a8Sspeer 			 * add it to the fdb.
1815678453a8Sspeer 			 */
1816678453a8Sspeer 			vresp->flags |= VNET_STARTED;
1817678453a8Sspeer 			vnet_fdbe_add(vnetp, vresp);
1818678453a8Sspeer 		}
1819678453a8Sspeer 	}
1820678453a8Sspeer 
1821678453a8Sspeer 	DBG1(vnetp, "exit\n");
1822678453a8Sspeer 
1823678453a8Sspeer }
1824678453a8Sspeer 
1825678453a8Sspeer /*
1826678453a8Sspeer  * vnet_stop_resources -- stop all resources associated with a vnet.
1827678453a8Sspeer  */
1828678453a8Sspeer static void
vnet_stop_resources(vnet_t * vnetp)1829678453a8Sspeer vnet_stop_resources(vnet_t *vnetp)
1830678453a8Sspeer {
1831678453a8Sspeer 	vnet_res_t	*vresp;
1832678453a8Sspeer 	mac_register_t	*macp;
1833678453a8Sspeer 	mac_callbacks_t	*cbp;
1834678453a8Sspeer 
1835678453a8Sspeer 	DBG1(vnetp, "enter\n");
1836678453a8Sspeer 
18375460ddbdSSriharsha Basavapatna 	ASSERT(RW_WRITE_HELD(&vnetp->vrwlock));
18385460ddbdSSriharsha Basavapatna 
1839678453a8Sspeer 	for (vresp = vnetp->vres_list; vresp != NULL; ) {
1840678453a8Sspeer 		if (vresp->flags & VNET_STARTED) {
18415460ddbdSSriharsha Basavapatna 			/*
18425460ddbdSSriharsha Basavapatna 			 * Release the lock while invoking mc_stop() of the
18435460ddbdSSriharsha Basavapatna 			 * underlying resource. We hold a reference to this
18445460ddbdSSriharsha Basavapatna 			 * resource to prevent being removed from the list in
18455460ddbdSSriharsha Basavapatna 			 * vio_net_resource_unreg(). Note that new resources
18465460ddbdSSriharsha Basavapatna 			 * can be added to the head of the list while the lock
18475460ddbdSSriharsha Basavapatna 			 * is released, but they won't be started, as
18485460ddbdSSriharsha Basavapatna 			 * VNET_STARTED flag has been cleared for the vnet
18495460ddbdSSriharsha Basavapatna 			 * device in vnet_m_stop(). Also, while the lock is
18505460ddbdSSriharsha Basavapatna 			 * released a resource could be removed from the list
18515460ddbdSSriharsha Basavapatna 			 * in vio_net_resource_unreg(); but that is ok, as we
18525460ddbdSSriharsha Basavapatna 			 * re-acquire the lock and only then access the forward
18535460ddbdSSriharsha Basavapatna 			 * link (vresp->nextp) to continue with the next
18545460ddbdSSriharsha Basavapatna 			 * resource.
18555460ddbdSSriharsha Basavapatna 			 */
18565460ddbdSSriharsha Basavapatna 			vresp->flags &= ~VNET_STARTED;
18575460ddbdSSriharsha Basavapatna 			vresp->flags |= VNET_STOPPING;
1858678453a8Sspeer 			macp = &vresp->macreg;
1859678453a8Sspeer 			cbp = macp->m_callbacks;
18605460ddbdSSriharsha Basavapatna 			VNET_FDBE_REFHOLD(vresp);
18615460ddbdSSriharsha Basavapatna 			RW_EXIT(&vnetp->vrwlock);
18625460ddbdSSriharsha Basavapatna 
1863678453a8Sspeer 			cbp->mc_stop(macp->m_driver);
18645460ddbdSSriharsha Basavapatna 
18655460ddbdSSriharsha Basavapatna 			WRITE_ENTER(&vnetp->vrwlock);
18665460ddbdSSriharsha Basavapatna 			vresp->flags &= ~VNET_STOPPING;
18675460ddbdSSriharsha Basavapatna 			VNET_FDBE_REFRELE(vresp);
1868678453a8Sspeer 		}
18695460ddbdSSriharsha Basavapatna 		vresp = vresp->nextp;
1870678453a8Sspeer 	}
1871678453a8Sspeer 	DBG1(vnetp, "exit\n");
1872678453a8Sspeer }
18736ab6cb20SWENTAO YANG 
18746ab6cb20SWENTAO YANG /*
18756ab6cb20SWENTAO YANG  * Setup kstats for the HIO statistics.
18766ab6cb20SWENTAO YANG  * NOTE: the synchronization for the statistics is the
18776ab6cb20SWENTAO YANG  * responsibility of the caller.
18786ab6cb20SWENTAO YANG  */
18796ab6cb20SWENTAO YANG kstat_t *
vnet_hio_setup_kstats(char * ks_mod,char * ks_name,vnet_res_t * vresp)18806ab6cb20SWENTAO YANG vnet_hio_setup_kstats(char *ks_mod, char *ks_name, vnet_res_t *vresp)
18816ab6cb20SWENTAO YANG {
18826ab6cb20SWENTAO YANG 	kstat_t *ksp;
18836ab6cb20SWENTAO YANG 	vnet_t *vnetp = vresp->vnetp;
18846ab6cb20SWENTAO YANG 	vnet_hio_kstats_t *hiokp;
18856ab6cb20SWENTAO YANG 	size_t size;
18866ab6cb20SWENTAO YANG 
18876ab6cb20SWENTAO YANG 	ASSERT(vnetp != NULL);
18886ab6cb20SWENTAO YANG 	size = sizeof (vnet_hio_kstats_t) / sizeof (kstat_named_t);
18896ab6cb20SWENTAO YANG 	ksp = kstat_create(ks_mod, vnetp->instance, ks_name, "net",
18906ab6cb20SWENTAO YANG 	    KSTAT_TYPE_NAMED, size, 0);
18916ab6cb20SWENTAO YANG 	if (ksp == NULL) {
18926ab6cb20SWENTAO YANG 		return (NULL);
18936ab6cb20SWENTAO YANG 	}
18946ab6cb20SWENTAO YANG 
18956ab6cb20SWENTAO YANG 	hiokp = (vnet_hio_kstats_t *)ksp->ks_data;
18966ab6cb20SWENTAO YANG 	kstat_named_init(&hiokp->ipackets,		"ipackets",
18976ab6cb20SWENTAO YANG 	    KSTAT_DATA_ULONG);
18986ab6cb20SWENTAO YANG 	kstat_named_init(&hiokp->ierrors,		"ierrors",
18996ab6cb20SWENTAO YANG 	    KSTAT_DATA_ULONG);
19006ab6cb20SWENTAO YANG 	kstat_named_init(&hiokp->opackets,		"opackets",
19016ab6cb20SWENTAO YANG 	    KSTAT_DATA_ULONG);
19026ab6cb20SWENTAO YANG 	kstat_named_init(&hiokp->oerrors,		"oerrors",
19036ab6cb20SWENTAO YANG 	    KSTAT_DATA_ULONG);
19046ab6cb20SWENTAO YANG 
19056ab6cb20SWENTAO YANG 
19066ab6cb20SWENTAO YANG 	/* MIB II kstat variables */
19076ab6cb20SWENTAO YANG 	kstat_named_init(&hiokp->rbytes,		"rbytes",
19086ab6cb20SWENTAO YANG 	    KSTAT_DATA_ULONG);
19096ab6cb20SWENTAO YANG 	kstat_named_init(&hiokp->obytes,		"obytes",
19106ab6cb20SWENTAO YANG 	    KSTAT_DATA_ULONG);
19116ab6cb20SWENTAO YANG 	kstat_named_init(&hiokp->multircv,		"multircv",
19126ab6cb20SWENTAO YANG 	    KSTAT_DATA_ULONG);
19136ab6cb20SWENTAO YANG 	kstat_named_init(&hiokp->multixmt,		"multixmt",
19146ab6cb20SWENTAO YANG 	    KSTAT_DATA_ULONG);
19156ab6cb20SWENTAO YANG 	kstat_named_init(&hiokp->brdcstrcv,		"brdcstrcv",
19166ab6cb20SWENTAO YANG 	    KSTAT_DATA_ULONG);
19176ab6cb20SWENTAO YANG 	kstat_named_init(&hiokp->brdcstxmt,		"brdcstxmt",
19186ab6cb20SWENTAO YANG 	    KSTAT_DATA_ULONG);
19196ab6cb20SWENTAO YANG 	kstat_named_init(&hiokp->norcvbuf,		"norcvbuf",
19206ab6cb20SWENTAO YANG 	    KSTAT_DATA_ULONG);
19216ab6cb20SWENTAO YANG 	kstat_named_init(&hiokp->noxmtbuf,		"noxmtbuf",
19226ab6cb20SWENTAO YANG 	    KSTAT_DATA_ULONG);
19236ab6cb20SWENTAO YANG 
19246ab6cb20SWENTAO YANG 	ksp->ks_update = vnet_hio_update_kstats;
19256ab6cb20SWENTAO YANG 	ksp->ks_private = (void *)vresp;
19266ab6cb20SWENTAO YANG 	kstat_install(ksp);
19276ab6cb20SWENTAO YANG 	return (ksp);
19286ab6cb20SWENTAO YANG }
19296ab6cb20SWENTAO YANG 
19306ab6cb20SWENTAO YANG /*
19316ab6cb20SWENTAO YANG  * Destroy kstats.
19326ab6cb20SWENTAO YANG  */
19336ab6cb20SWENTAO YANG static void
vnet_hio_destroy_kstats(kstat_t * ksp)19346ab6cb20SWENTAO YANG vnet_hio_destroy_kstats(kstat_t *ksp)
19356ab6cb20SWENTAO YANG {
19366ab6cb20SWENTAO YANG 	if (ksp != NULL)
19376ab6cb20SWENTAO YANG 		kstat_delete(ksp);
19386ab6cb20SWENTAO YANG }
19396ab6cb20SWENTAO YANG 
19406ab6cb20SWENTAO YANG /*
19416ab6cb20SWENTAO YANG  * Update the kstats.
19426ab6cb20SWENTAO YANG  */
19436ab6cb20SWENTAO YANG static int
vnet_hio_update_kstats(kstat_t * ksp,int rw)19446ab6cb20SWENTAO YANG vnet_hio_update_kstats(kstat_t *ksp, int rw)
19456ab6cb20SWENTAO YANG {
19466ab6cb20SWENTAO YANG 	vnet_t *vnetp;
19476ab6cb20SWENTAO YANG 	vnet_res_t *vresp;
19486ab6cb20SWENTAO YANG 	vnet_hio_stats_t statsp;
19496ab6cb20SWENTAO YANG 	vnet_hio_kstats_t *hiokp;
19506ab6cb20SWENTAO YANG 
19516ab6cb20SWENTAO YANG 	vresp = (vnet_res_t *)ksp->ks_private;
19526ab6cb20SWENTAO YANG 	vnetp = vresp->vnetp;
19536ab6cb20SWENTAO YANG 
19546ab6cb20SWENTAO YANG 	bzero(&statsp, sizeof (vnet_hio_stats_t));
19556ab6cb20SWENTAO YANG 
19566ab6cb20SWENTAO YANG 	READ_ENTER(&vnetp->vsw_fp_rw);
19576ab6cb20SWENTAO YANG 	if (vnetp->hio_fp == NULL) {
19586ab6cb20SWENTAO YANG 		/* not using hio resources, just return */
19596ab6cb20SWENTAO YANG 		RW_EXIT(&vnetp->vsw_fp_rw);
19606ab6cb20SWENTAO YANG 		return (0);
19616ab6cb20SWENTAO YANG 	}
19626ab6cb20SWENTAO YANG 	VNET_FDBE_REFHOLD(vnetp->hio_fp);
19636ab6cb20SWENTAO YANG 	RW_EXIT(&vnetp->vsw_fp_rw);
19646ab6cb20SWENTAO YANG 	vnet_hio_get_stats(vnetp->hio_fp, &statsp);
19656ab6cb20SWENTAO YANG 	VNET_FDBE_REFRELE(vnetp->hio_fp);
19666ab6cb20SWENTAO YANG 
19676ab6cb20SWENTAO YANG 	hiokp = (vnet_hio_kstats_t *)ksp->ks_data;
19686ab6cb20SWENTAO YANG 
19696ab6cb20SWENTAO YANG 	if (rw == KSTAT_READ) {
19706ab6cb20SWENTAO YANG 		/* Link Input/Output stats */
19716ab6cb20SWENTAO YANG 		hiokp->ipackets.value.ul	= (uint32_t)statsp.ipackets;
19726ab6cb20SWENTAO YANG 		hiokp->ipackets64.value.ull	= statsp.ipackets;
19736ab6cb20SWENTAO YANG 		hiokp->ierrors.value.ul		= statsp.ierrors;
19746ab6cb20SWENTAO YANG 		hiokp->opackets.value.ul	= (uint32_t)statsp.opackets;
19756ab6cb20SWENTAO YANG 		hiokp->opackets64.value.ull	= statsp.opackets;
19766ab6cb20SWENTAO YANG 		hiokp->oerrors.value.ul		= statsp.oerrors;
19776ab6cb20SWENTAO YANG 
19786ab6cb20SWENTAO YANG 		/* MIB II kstat variables */
19796ab6cb20SWENTAO YANG 		hiokp->rbytes.value.ul		= (uint32_t)statsp.rbytes;
19806ab6cb20SWENTAO YANG 		hiokp->rbytes64.value.ull	= statsp.rbytes;
19816ab6cb20SWENTAO YANG 		hiokp->obytes.value.ul		= (uint32_t)statsp.obytes;
19826ab6cb20SWENTAO YANG 		hiokp->obytes64.value.ull	= statsp.obytes;
19836ab6cb20SWENTAO YANG 		hiokp->multircv.value.ul	= statsp.multircv;
19846ab6cb20SWENTAO YANG 		hiokp->multixmt.value.ul	= statsp.multixmt;
19856ab6cb20SWENTAO YANG 		hiokp->brdcstrcv.value.ul	= statsp.brdcstrcv;
19866ab6cb20SWENTAO YANG 		hiokp->brdcstxmt.value.ul	= statsp.brdcstxmt;
19876ab6cb20SWENTAO YANG 		hiokp->norcvbuf.value.ul	= statsp.norcvbuf;
19886ab6cb20SWENTAO YANG 		hiokp->noxmtbuf.value.ul	= statsp.noxmtbuf;
19896ab6cb20SWENTAO YANG 	} else {
19906ab6cb20SWENTAO YANG 		return (EACCES);
19916ab6cb20SWENTAO YANG 	}
19926ab6cb20SWENTAO YANG 
19936ab6cb20SWENTAO YANG 	return (0);
19946ab6cb20SWENTAO YANG }
19956ab6cb20SWENTAO YANG 
19966ab6cb20SWENTAO YANG static void
vnet_hio_get_stats(vnet_res_t * vresp,vnet_hio_stats_t * statsp)19976ab6cb20SWENTAO YANG vnet_hio_get_stats(vnet_res_t *vresp, vnet_hio_stats_t *statsp)
19986ab6cb20SWENTAO YANG {
19996ab6cb20SWENTAO YANG 	mac_register_t		*macp;
20006ab6cb20SWENTAO YANG 	mac_callbacks_t		*cbp;
20016ab6cb20SWENTAO YANG 	uint64_t		val;
20026ab6cb20SWENTAO YANG 	int			stat;
20036ab6cb20SWENTAO YANG 
20046ab6cb20SWENTAO YANG 	/*
20056ab6cb20SWENTAO YANG 	 * get the specified statistics from the underlying nxge.
20066ab6cb20SWENTAO YANG 	 */
20076ab6cb20SWENTAO YANG 	macp = &vresp->macreg;
20086ab6cb20SWENTAO YANG 	cbp = macp->m_callbacks;
20096ab6cb20SWENTAO YANG 	for (stat = MAC_STAT_MIN; stat < MAC_STAT_OVERFLOWS; stat++) {
20106ab6cb20SWENTAO YANG 		if (cbp->mc_getstat(macp->m_driver, stat, &val) == 0) {
20116ab6cb20SWENTAO YANG 			switch (stat) {
20126ab6cb20SWENTAO YANG 			case MAC_STAT_IPACKETS:
20136ab6cb20SWENTAO YANG 				statsp->ipackets = val;
20146ab6cb20SWENTAO YANG 				break;
20156ab6cb20SWENTAO YANG 
20166ab6cb20SWENTAO YANG 			case MAC_STAT_IERRORS:
20176ab6cb20SWENTAO YANG 				statsp->ierrors = val;
20186ab6cb20SWENTAO YANG 				break;
20196ab6cb20SWENTAO YANG 
20206ab6cb20SWENTAO YANG 			case MAC_STAT_OPACKETS:
20216ab6cb20SWENTAO YANG 				statsp->opackets = val;
20226ab6cb20SWENTAO YANG 				break;
20236ab6cb20SWENTAO YANG 
20246ab6cb20SWENTAO YANG 			case MAC_STAT_OERRORS:
20256ab6cb20SWENTAO YANG 				statsp->oerrors = val;
20266ab6cb20SWENTAO YANG 				break;
20276ab6cb20SWENTAO YANG 
20286ab6cb20SWENTAO YANG 			case MAC_STAT_RBYTES:
20296ab6cb20SWENTAO YANG 				statsp->rbytes = val;
20306ab6cb20SWENTAO YANG 				break;
20316ab6cb20SWENTAO YANG 
20326ab6cb20SWENTAO YANG 			case MAC_STAT_OBYTES:
20336ab6cb20SWENTAO YANG 				statsp->obytes = val;
20346ab6cb20SWENTAO YANG 				break;
20356ab6cb20SWENTAO YANG 
20366ab6cb20SWENTAO YANG 			case MAC_STAT_MULTIRCV:
20376ab6cb20SWENTAO YANG 				statsp->multircv = val;
20386ab6cb20SWENTAO YANG 				break;
20396ab6cb20SWENTAO YANG 
20406ab6cb20SWENTAO YANG 			case MAC_STAT_MULTIXMT:
20416ab6cb20SWENTAO YANG 				statsp->multixmt = val;
20426ab6cb20SWENTAO YANG 				break;
20436ab6cb20SWENTAO YANG 
20446ab6cb20SWENTAO YANG 			case MAC_STAT_BRDCSTRCV:
20456ab6cb20SWENTAO YANG 				statsp->brdcstrcv = val;
20466ab6cb20SWENTAO YANG 				break;
20476ab6cb20SWENTAO YANG 
20486ab6cb20SWENTAO YANG 			case MAC_STAT_BRDCSTXMT:
20496ab6cb20SWENTAO YANG 				statsp->brdcstxmt = val;
20506ab6cb20SWENTAO YANG 				break;
20516ab6cb20SWENTAO YANG 
20526ab6cb20SWENTAO YANG 			case MAC_STAT_NOXMTBUF:
20536ab6cb20SWENTAO YANG 				statsp->noxmtbuf = val;
20546ab6cb20SWENTAO YANG 				break;
20556ab6cb20SWENTAO YANG 
20566ab6cb20SWENTAO YANG 			case MAC_STAT_NORCVBUF:
20576ab6cb20SWENTAO YANG 				statsp->norcvbuf = val;
20586ab6cb20SWENTAO YANG 				break;
20596ab6cb20SWENTAO YANG 
20606ab6cb20SWENTAO YANG 			default:
20616ab6cb20SWENTAO YANG 				/*
20626ab6cb20SWENTAO YANG 				 * parameters not interested.
20636ab6cb20SWENTAO YANG 				 */
20646ab6cb20SWENTAO YANG 				break;
20656ab6cb20SWENTAO YANG 			}
20666ab6cb20SWENTAO YANG 		}
20676ab6cb20SWENTAO YANG 	}
20686ab6cb20SWENTAO YANG }
20691107ea93SSriharsha Basavapatna 
207063f531d1SSriharsha Basavapatna static boolean_t
vnet_m_capab(void * arg,mac_capab_t cap,void * cap_data)207163f531d1SSriharsha Basavapatna vnet_m_capab(void *arg, mac_capab_t cap, void *cap_data)
207263f531d1SSriharsha Basavapatna {
207363f531d1SSriharsha Basavapatna 	vnet_t	*vnetp = (vnet_t *)arg;
207463f531d1SSriharsha Basavapatna 
207563f531d1SSriharsha Basavapatna 	if (vnetp == NULL) {
207663f531d1SSriharsha Basavapatna 		return (0);
207763f531d1SSriharsha Basavapatna 	}
207863f531d1SSriharsha Basavapatna 
207963f531d1SSriharsha Basavapatna 	switch (cap) {
208063f531d1SSriharsha Basavapatna 
208163f531d1SSriharsha Basavapatna 	case MAC_CAPAB_RINGS: {
208263f531d1SSriharsha Basavapatna 
208363f531d1SSriharsha Basavapatna 		mac_capab_rings_t *cap_rings = cap_data;
208463f531d1SSriharsha Basavapatna 		/*
208563f531d1SSriharsha Basavapatna 		 * Rings Capability Notes:
208663f531d1SSriharsha Basavapatna 		 * We advertise rings to make use of the rings framework in
208763f531d1SSriharsha Basavapatna 		 * gldv3 mac layer, to improve the performance. This is
208863f531d1SSriharsha Basavapatna 		 * specifically needed when a Hybrid resource (with multiple
208963f531d1SSriharsha Basavapatna 		 * tx/rx hardware rings) is assigned to a vnet device. We also
209063f531d1SSriharsha Basavapatna 		 * leverage this for the normal case when no Hybrid resource is
209163f531d1SSriharsha Basavapatna 		 * assigned.
209263f531d1SSriharsha Basavapatna 		 *
209363f531d1SSriharsha Basavapatna 		 * Ring Allocation:
209463f531d1SSriharsha Basavapatna 		 * - TX path:
209563f531d1SSriharsha Basavapatna 		 * We expose a pseudo ring group with 2 pseudo tx rings (as
209663f531d1SSriharsha Basavapatna 		 * currently HybridIO exports only 2 rings) In the normal case,
209763f531d1SSriharsha Basavapatna 		 * transmit traffic that comes down to the driver through the
209863f531d1SSriharsha Basavapatna 		 * mri_tx (vnet_tx_ring_send()) entry point goes through the
209963f531d1SSriharsha Basavapatna 		 * distributed switching algorithm in vnet and gets transmitted
210063f531d1SSriharsha Basavapatna 		 * over a port/LDC in the vgen layer to either the vswitch or a
210163f531d1SSriharsha Basavapatna 		 * peer vnet. If and when a Hybrid resource is assigned to the
210263f531d1SSriharsha Basavapatna 		 * vnet, we obtain the tx ring information of the Hybrid device
210363f531d1SSriharsha Basavapatna 		 * (nxge) and map the pseudo rings 1:1 to the 2 hw tx rings.
210463f531d1SSriharsha Basavapatna 		 * Traffic being sent over the Hybrid resource by the mac layer
210563f531d1SSriharsha Basavapatna 		 * gets spread across both hw rings, as they are mapped to the
210663f531d1SSriharsha Basavapatna 		 * 2 pseudo tx rings in vnet.
210763f531d1SSriharsha Basavapatna 		 *
210863f531d1SSriharsha Basavapatna 		 * - RX path:
210963f531d1SSriharsha Basavapatna 		 * We expose a pseudo ring group with 3 pseudo rx rings (static
211063f531d1SSriharsha Basavapatna 		 * rings) initially. The first (default) pseudo rx ring is
211163f531d1SSriharsha Basavapatna 		 * reserved for the resource that connects to the vswitch
211263f531d1SSriharsha Basavapatna 		 * service. The next 2 rings are reserved for a Hybrid resource
211363f531d1SSriharsha Basavapatna 		 * that may be assigned to the vnet device. If and when a
211463f531d1SSriharsha Basavapatna 		 * Hybrid resource is assigned to the vnet, we obtain the rx
211563f531d1SSriharsha Basavapatna 		 * ring information of the Hybrid device (nxge) and map these
211663f531d1SSriharsha Basavapatna 		 * pseudo rings 1:1 to the 2 hw rx rings. For each additional
211763f531d1SSriharsha Basavapatna 		 * resource that connects to a peer vnet, we dynamically
211863f531d1SSriharsha Basavapatna 		 * allocate a pseudo rx ring and map it to that resource, when
211963f531d1SSriharsha Basavapatna 		 * the resource gets added; and the pseudo rx ring is
212063f531d1SSriharsha Basavapatna 		 * dynamically registered with the upper mac layer. We do the
212163f531d1SSriharsha Basavapatna 		 * reverse and unregister the ring with the mac layer when
212263f531d1SSriharsha Basavapatna 		 * the resource gets removed.
212363f531d1SSriharsha Basavapatna 		 *
212463f531d1SSriharsha Basavapatna 		 * Synchronization notes:
212563f531d1SSriharsha Basavapatna 		 * We don't need any lock to protect members of ring structure,
212663f531d1SSriharsha Basavapatna 		 * specifically ringp->hw_rh, in either the TX or the RX ring,
212763f531d1SSriharsha Basavapatna 		 * as explained below.
212863f531d1SSriharsha Basavapatna 		 * - TX ring:
212963f531d1SSriharsha Basavapatna 		 * ring->hw_rh is initialized only when a Hybrid resource is
213063f531d1SSriharsha Basavapatna 		 * associated; and gets referenced only in vnet_hio_tx(). The
213163f531d1SSriharsha Basavapatna 		 * Hybrid resource itself is available in fdb only after tx
213263f531d1SSriharsha Basavapatna 		 * hwrings are found and mapped; i.e, in vio_net_resource_reg()
213363f531d1SSriharsha Basavapatna 		 * we call vnet_bind_rings() first and then call
213463f531d1SSriharsha Basavapatna 		 * vnet_start_resources() which adds an entry to fdb. For
213563f531d1SSriharsha Basavapatna 		 * traffic going over LDC resources, we don't reference
213663f531d1SSriharsha Basavapatna 		 * ring->hw_rh at all.
213763f531d1SSriharsha Basavapatna 		 * - RX ring:
213863f531d1SSriharsha Basavapatna 		 * For rings mapped to Hybrid resource ring->hw_rh is
213963f531d1SSriharsha Basavapatna 		 * initialized and only then do we add the rx callback for
214063f531d1SSriharsha Basavapatna 		 * the underlying Hybrid resource; we disable callbacks before
214163f531d1SSriharsha Basavapatna 		 * we unmap ring->hw_rh. For rings mapped to LDC resources, we
214263f531d1SSriharsha Basavapatna 		 * stop the rx callbacks (in vgen) before we remove ring->hw_rh
214363f531d1SSriharsha Basavapatna 		 * (vio_net_resource_unreg()).
21440dc2366fSVenugopal Iyer 		 * Also, we access ring->hw_rh in vnet_rx_ring_stat().
21450dc2366fSVenugopal Iyer 		 * Note that for rings mapped to Hybrid resource, though the
21460dc2366fSVenugopal Iyer 		 * rings are statically registered with the mac layer, its
21470dc2366fSVenugopal Iyer 		 * hardware ring mapping (ringp->hw_rh) can be torn down in
21480dc2366fSVenugopal Iyer 		 * vnet_unbind_hwrings() while the kstat operation is in
21490dc2366fSVenugopal Iyer 		 * progress. To protect against this, we hold a reference to
21500dc2366fSVenugopal Iyer 		 * the resource in FDB; this ensures that the thread in
21510dc2366fSVenugopal Iyer 		 * vio_net_resource_unreg() waits for the reference to be
21520dc2366fSVenugopal Iyer 		 * dropped before unbinding the ring.
21530dc2366fSVenugopal Iyer 		 *
21540dc2366fSVenugopal Iyer 		 * We don't need to do this for rings mapped to LDC resources.
21550dc2366fSVenugopal Iyer 		 * These rings are registered/unregistered dynamically with
21560dc2366fSVenugopal Iyer 		 * the mac layer and so any attempt to unregister the ring
21570dc2366fSVenugopal Iyer 		 * while kstat operation is in progress will block in
21580dc2366fSVenugopal Iyer 		 * mac_group_rem_ring(). Thus implicitly protects the
21590dc2366fSVenugopal Iyer 		 * resource (ringp->hw_rh) from disappearing.
216063f531d1SSriharsha Basavapatna 		 */
216163f531d1SSriharsha Basavapatna 
216263f531d1SSriharsha Basavapatna 		if (cap_rings->mr_type == MAC_RING_TYPE_RX) {
216363f531d1SSriharsha Basavapatna 			cap_rings->mr_group_type = MAC_GROUP_TYPE_STATIC;
216463f531d1SSriharsha Basavapatna 
216563f531d1SSriharsha Basavapatna 			/*
216663f531d1SSriharsha Basavapatna 			 * The ring_cnt for rx grp is initialized in
216763f531d1SSriharsha Basavapatna 			 * vnet_ring_grp_init(). Later, the ring_cnt gets
216863f531d1SSriharsha Basavapatna 			 * updated dynamically whenever LDC resources are added
216963f531d1SSriharsha Basavapatna 			 * or removed.
217063f531d1SSriharsha Basavapatna 			 */
217163f531d1SSriharsha Basavapatna 			cap_rings->mr_rnum = vnetp->rx_grp[0].ring_cnt;
217263f531d1SSriharsha Basavapatna 			cap_rings->mr_rget = vnet_get_ring;
217363f531d1SSriharsha Basavapatna 
217463f531d1SSriharsha Basavapatna 			cap_rings->mr_gnum = VNET_NUM_PSEUDO_GROUPS;
217563f531d1SSriharsha Basavapatna 			cap_rings->mr_gget = vnet_get_group;
217663f531d1SSriharsha Basavapatna 			cap_rings->mr_gaddring = NULL;
217763f531d1SSriharsha Basavapatna 			cap_rings->mr_gremring = NULL;
217863f531d1SSriharsha Basavapatna 		} else {
217963f531d1SSriharsha Basavapatna 			cap_rings->mr_group_type = MAC_GROUP_TYPE_STATIC;
218063f531d1SSriharsha Basavapatna 
218163f531d1SSriharsha Basavapatna 			/*
218263f531d1SSriharsha Basavapatna 			 * The ring_cnt for tx grp is initialized in
218363f531d1SSriharsha Basavapatna 			 * vnet_ring_grp_init() and remains constant, as we
218463f531d1SSriharsha Basavapatna 			 * do not support dymanic tx rings for now.
218563f531d1SSriharsha Basavapatna 			 */
218663f531d1SSriharsha Basavapatna 			cap_rings->mr_rnum = vnetp->tx_grp[0].ring_cnt;
218763f531d1SSriharsha Basavapatna 			cap_rings->mr_rget = vnet_get_ring;
218863f531d1SSriharsha Basavapatna 
218963f531d1SSriharsha Basavapatna 			/*
219063f531d1SSriharsha Basavapatna 			 * Transmit rings are not grouped; i.e, the number of
219163f531d1SSriharsha Basavapatna 			 * transmit ring groups advertised should be set to 0.
219263f531d1SSriharsha Basavapatna 			 */
219363f531d1SSriharsha Basavapatna 			cap_rings->mr_gnum = 0;
219463f531d1SSriharsha Basavapatna 
219563f531d1SSriharsha Basavapatna 			cap_rings->mr_gget = vnet_get_group;
219663f531d1SSriharsha Basavapatna 			cap_rings->mr_gaddring = NULL;
219763f531d1SSriharsha Basavapatna 			cap_rings->mr_gremring = NULL;
219863f531d1SSriharsha Basavapatna 		}
219963f531d1SSriharsha Basavapatna 		return (B_TRUE);
220063f531d1SSriharsha Basavapatna 
220163f531d1SSriharsha Basavapatna 	}
220263f531d1SSriharsha Basavapatna 
220363f531d1SSriharsha Basavapatna 	default:
220463f531d1SSriharsha Basavapatna 		break;
220563f531d1SSriharsha Basavapatna 
220663f531d1SSriharsha Basavapatna 	}
220763f531d1SSriharsha Basavapatna 
220863f531d1SSriharsha Basavapatna 	return (B_FALSE);
220963f531d1SSriharsha Basavapatna }
221063f531d1SSriharsha Basavapatna 
221163f531d1SSriharsha Basavapatna /*
221263f531d1SSriharsha Basavapatna  * Callback funtion for MAC layer to get ring information.
221363f531d1SSriharsha Basavapatna  */
221463f531d1SSriharsha Basavapatna static void
vnet_get_ring(void * arg,mac_ring_type_t rtype,const int g_index,const int r_index,mac_ring_info_t * infop,mac_ring_handle_t r_handle)221563f531d1SSriharsha Basavapatna vnet_get_ring(void *arg, mac_ring_type_t rtype, const int g_index,
221663f531d1SSriharsha Basavapatna     const int r_index, mac_ring_info_t *infop, mac_ring_handle_t r_handle)
221763f531d1SSriharsha Basavapatna {
221863f531d1SSriharsha Basavapatna 	vnet_t	*vnetp = arg;
221963f531d1SSriharsha Basavapatna 
222063f531d1SSriharsha Basavapatna 	switch (rtype) {
222163f531d1SSriharsha Basavapatna 
222263f531d1SSriharsha Basavapatna 	case MAC_RING_TYPE_RX: {
222363f531d1SSriharsha Basavapatna 
222463f531d1SSriharsha Basavapatna 		vnet_pseudo_rx_group_t	*rx_grp;
222563f531d1SSriharsha Basavapatna 		vnet_pseudo_rx_ring_t	*rx_ringp;
222663f531d1SSriharsha Basavapatna 		mac_intr_t		*mintr;
222763f531d1SSriharsha Basavapatna 
222863f531d1SSriharsha Basavapatna 		/* We advertised only one RX group */
222963f531d1SSriharsha Basavapatna 		ASSERT(g_index == 0);
223063f531d1SSriharsha Basavapatna 		rx_grp = &vnetp->rx_grp[g_index];
223163f531d1SSriharsha Basavapatna 
223263f531d1SSriharsha Basavapatna 		/* Check the current # of rings in the rx group */
223363f531d1SSriharsha Basavapatna 		ASSERT((r_index >= 0) && (r_index < rx_grp->max_ring_cnt));
223463f531d1SSriharsha Basavapatna 
223563f531d1SSriharsha Basavapatna 		/* Get the ring based on the index */
223663f531d1SSriharsha Basavapatna 		rx_ringp = &rx_grp->rings[r_index];
223763f531d1SSriharsha Basavapatna 
223863f531d1SSriharsha Basavapatna 		rx_ringp->handle = r_handle;
223963f531d1SSriharsha Basavapatna 		/*
224063f531d1SSriharsha Basavapatna 		 * Note: we don't need to save the incoming r_index in rx_ring,
224163f531d1SSriharsha Basavapatna 		 * as vnet_ring_grp_init() would have initialized the index for
224263f531d1SSriharsha Basavapatna 		 * each ring in the array.
224363f531d1SSriharsha Basavapatna 		 */
224463f531d1SSriharsha Basavapatna 		rx_ringp->grp = rx_grp;
224563f531d1SSriharsha Basavapatna 		rx_ringp->vnetp = vnetp;
224663f531d1SSriharsha Basavapatna 
224763f531d1SSriharsha Basavapatna 		mintr = &infop->mri_intr;
224863f531d1SSriharsha Basavapatna 		mintr->mi_handle = (mac_intr_handle_t)rx_ringp;
224963f531d1SSriharsha Basavapatna 		mintr->mi_enable = (mac_intr_enable_t)vnet_ring_enable_intr;
225063f531d1SSriharsha Basavapatna 		mintr->mi_disable = (mac_intr_disable_t)vnet_ring_disable_intr;
225163f531d1SSriharsha Basavapatna 
225263f531d1SSriharsha Basavapatna 		infop->mri_driver = (mac_ring_driver_t)rx_ringp;
225363f531d1SSriharsha Basavapatna 		infop->mri_start = vnet_rx_ring_start;
225463f531d1SSriharsha Basavapatna 		infop->mri_stop = vnet_rx_ring_stop;
22550dc2366fSVenugopal Iyer 		infop->mri_stat = vnet_rx_ring_stat;
225663f531d1SSriharsha Basavapatna 
225763f531d1SSriharsha Basavapatna 		/* Set the poll function, as this is an rx ring */
225863f531d1SSriharsha Basavapatna 		infop->mri_poll = vnet_rx_poll;
22590dc2366fSVenugopal Iyer 		/*
22600dc2366fSVenugopal Iyer 		 * MAC_RING_RX_ENQUEUE bit needed to be set for nxge
22610dc2366fSVenugopal Iyer 		 * which was not sending packet chains in interrupt
22620dc2366fSVenugopal Iyer 		 * context. For such drivers, packets are queued in
22630dc2366fSVenugopal Iyer 		 * Rx soft rings so that we get a chance to switch
22640dc2366fSVenugopal Iyer 		 * into a polling mode under backlog. This bug (not
22650dc2366fSVenugopal Iyer 		 * sending packet chains) has now been fixed. Once
22660dc2366fSVenugopal Iyer 		 * the performance impact is measured, this change
22670dc2366fSVenugopal Iyer 		 * will be removed.
22680dc2366fSVenugopal Iyer 		 */
22690dc2366fSVenugopal Iyer 		infop->mri_flags = (vnet_mac_rx_queuing ?
22700dc2366fSVenugopal Iyer 		    MAC_RING_RX_ENQUEUE : 0);
227163f531d1SSriharsha Basavapatna 		break;
227263f531d1SSriharsha Basavapatna 	}
227363f531d1SSriharsha Basavapatna 
227463f531d1SSriharsha Basavapatna 	case MAC_RING_TYPE_TX: {
227563f531d1SSriharsha Basavapatna 		vnet_pseudo_tx_group_t	*tx_grp;
227663f531d1SSriharsha Basavapatna 		vnet_pseudo_tx_ring_t	*tx_ringp;
227763f531d1SSriharsha Basavapatna 
227863f531d1SSriharsha Basavapatna 		/*
227963f531d1SSriharsha Basavapatna 		 * No need to check grp index; mac layer passes -1 for it.
228063f531d1SSriharsha Basavapatna 		 */
228163f531d1SSriharsha Basavapatna 		tx_grp = &vnetp->tx_grp[0];
228263f531d1SSriharsha Basavapatna 
228363f531d1SSriharsha Basavapatna 		/* Check the # of rings in the tx group */
228463f531d1SSriharsha Basavapatna 		ASSERT((r_index >= 0) && (r_index < tx_grp->ring_cnt));
228563f531d1SSriharsha Basavapatna 
228663f531d1SSriharsha Basavapatna 		/* Get the ring based on the index */
228763f531d1SSriharsha Basavapatna 		tx_ringp = &tx_grp->rings[r_index];
228863f531d1SSriharsha Basavapatna 
228963f531d1SSriharsha Basavapatna 		tx_ringp->handle = r_handle;
229063f531d1SSriharsha Basavapatna 		tx_ringp->index = r_index;
229163f531d1SSriharsha Basavapatna 		tx_ringp->grp = tx_grp;
229263f531d1SSriharsha Basavapatna 		tx_ringp->vnetp = vnetp;
229363f531d1SSriharsha Basavapatna 
229463f531d1SSriharsha Basavapatna 		infop->mri_driver = (mac_ring_driver_t)tx_ringp;
229563f531d1SSriharsha Basavapatna 		infop->mri_start = vnet_tx_ring_start;
229663f531d1SSriharsha Basavapatna 		infop->mri_stop = vnet_tx_ring_stop;
22970dc2366fSVenugopal Iyer 		infop->mri_stat = vnet_tx_ring_stat;
229863f531d1SSriharsha Basavapatna 
229963f531d1SSriharsha Basavapatna 		/* Set the transmit function, as this is a tx ring */
230063f531d1SSriharsha Basavapatna 		infop->mri_tx = vnet_tx_ring_send;
23010dc2366fSVenugopal Iyer 		/*
23020dc2366fSVenugopal Iyer 		 * MAC_RING_TX_SERIALIZE bit needs to be set while
23030dc2366fSVenugopal Iyer 		 * hybridIO is enabled to workaround tx lock
23040dc2366fSVenugopal Iyer 		 * contention issues in nxge.
23050dc2366fSVenugopal Iyer 		 */
23060dc2366fSVenugopal Iyer 		infop->mri_flags = (vnet_mac_tx_serialize ?
23070dc2366fSVenugopal Iyer 		    MAC_RING_TX_SERIALIZE : 0);
230863f531d1SSriharsha Basavapatna 		break;
230963f531d1SSriharsha Basavapatna 	}
231063f531d1SSriharsha Basavapatna 
231163f531d1SSriharsha Basavapatna 	default:
231263f531d1SSriharsha Basavapatna 		break;
231363f531d1SSriharsha Basavapatna 	}
231463f531d1SSriharsha Basavapatna }
231563f531d1SSriharsha Basavapatna 
231663f531d1SSriharsha Basavapatna /*
231763f531d1SSriharsha Basavapatna  * Callback funtion for MAC layer to get group information.
231863f531d1SSriharsha Basavapatna  */
231963f531d1SSriharsha Basavapatna static void
vnet_get_group(void * arg,mac_ring_type_t type,const int index,mac_group_info_t * infop,mac_group_handle_t handle)232063f531d1SSriharsha Basavapatna vnet_get_group(void *arg, mac_ring_type_t type, const int index,
232163f531d1SSriharsha Basavapatna     mac_group_info_t *infop, mac_group_handle_t handle)
232263f531d1SSriharsha Basavapatna {
232363f531d1SSriharsha Basavapatna 	vnet_t	*vnetp = (vnet_t *)arg;
232463f531d1SSriharsha Basavapatna 
232563f531d1SSriharsha Basavapatna 	switch (type) {
232663f531d1SSriharsha Basavapatna 
232763f531d1SSriharsha Basavapatna 	case MAC_RING_TYPE_RX:
232863f531d1SSriharsha Basavapatna 	{
232963f531d1SSriharsha Basavapatna 		vnet_pseudo_rx_group_t	*rx_grp;
233063f531d1SSriharsha Basavapatna 
233163f531d1SSriharsha Basavapatna 		/* We advertised only one RX group */
233263f531d1SSriharsha Basavapatna 		ASSERT(index == 0);
233363f531d1SSriharsha Basavapatna 
233463f531d1SSriharsha Basavapatna 		rx_grp = &vnetp->rx_grp[index];
233563f531d1SSriharsha Basavapatna 		rx_grp->handle = handle;
233663f531d1SSriharsha Basavapatna 		rx_grp->index = index;
233763f531d1SSriharsha Basavapatna 		rx_grp->vnetp = vnetp;
233863f531d1SSriharsha Basavapatna 
233963f531d1SSriharsha Basavapatna 		infop->mgi_driver = (mac_group_driver_t)rx_grp;
234063f531d1SSriharsha Basavapatna 		infop->mgi_start = NULL;
234163f531d1SSriharsha Basavapatna 		infop->mgi_stop = NULL;
234263f531d1SSriharsha Basavapatna 		infop->mgi_addmac = vnet_addmac;
234363f531d1SSriharsha Basavapatna 		infop->mgi_remmac = vnet_remmac;
234463f531d1SSriharsha Basavapatna 		infop->mgi_count = rx_grp->ring_cnt;
234563f531d1SSriharsha Basavapatna 
234663f531d1SSriharsha Basavapatna 		break;
234763f531d1SSriharsha Basavapatna 	}
234863f531d1SSriharsha Basavapatna 
234963f531d1SSriharsha Basavapatna 	case MAC_RING_TYPE_TX:
235063f531d1SSriharsha Basavapatna 	{
235163f531d1SSriharsha Basavapatna 		vnet_pseudo_tx_group_t	*tx_grp;
235263f531d1SSriharsha Basavapatna 
235363f531d1SSriharsha Basavapatna 		/* We advertised only one TX group */
235463f531d1SSriharsha Basavapatna 		ASSERT(index == 0);
235563f531d1SSriharsha Basavapatna 
235663f531d1SSriharsha Basavapatna 		tx_grp = &vnetp->tx_grp[index];
235763f531d1SSriharsha Basavapatna 		tx_grp->handle = handle;
235863f531d1SSriharsha Basavapatna 		tx_grp->index = index;
235963f531d1SSriharsha Basavapatna 		tx_grp->vnetp = vnetp;
236063f531d1SSriharsha Basavapatna 
236163f531d1SSriharsha Basavapatna 		infop->mgi_driver = (mac_group_driver_t)tx_grp;
236263f531d1SSriharsha Basavapatna 		infop->mgi_start = NULL;
236363f531d1SSriharsha Basavapatna 		infop->mgi_stop = NULL;
236463f531d1SSriharsha Basavapatna 		infop->mgi_addmac = NULL;
236563f531d1SSriharsha Basavapatna 		infop->mgi_remmac = NULL;
236663f531d1SSriharsha Basavapatna 		infop->mgi_count = VNET_NUM_PSEUDO_TXRINGS;
236763f531d1SSriharsha Basavapatna 
236863f531d1SSriharsha Basavapatna 		break;
236963f531d1SSriharsha Basavapatna 	}
237063f531d1SSriharsha Basavapatna 
237163f531d1SSriharsha Basavapatna 	default:
237263f531d1SSriharsha Basavapatna 		break;
237363f531d1SSriharsha Basavapatna 
237463f531d1SSriharsha Basavapatna 	}
237563f531d1SSriharsha Basavapatna }
237663f531d1SSriharsha Basavapatna 
237763f531d1SSriharsha Basavapatna static int
vnet_rx_ring_start(mac_ring_driver_t arg,uint64_t mr_gen_num)237863f531d1SSriharsha Basavapatna vnet_rx_ring_start(mac_ring_driver_t arg, uint64_t mr_gen_num)
237963f531d1SSriharsha Basavapatna {
238063f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_ring_t	*rx_ringp = (vnet_pseudo_rx_ring_t *)arg;
238163f531d1SSriharsha Basavapatna 	int			err;
238263f531d1SSriharsha Basavapatna 
238363f531d1SSriharsha Basavapatna 	/*
238463f531d1SSriharsha Basavapatna 	 * If this ring is mapped to a LDC resource, simply mark the state to
238563f531d1SSriharsha Basavapatna 	 * indicate the ring is started and return.
238663f531d1SSriharsha Basavapatna 	 */
238763f531d1SSriharsha Basavapatna 	if ((rx_ringp->state &
238863f531d1SSriharsha Basavapatna 	    (VNET_RXRING_LDC_SERVICE|VNET_RXRING_LDC_GUEST)) != 0) {
238963f531d1SSriharsha Basavapatna 		rx_ringp->gen_num = mr_gen_num;
239063f531d1SSriharsha Basavapatna 		rx_ringp->state |= VNET_RXRING_STARTED;
239163f531d1SSriharsha Basavapatna 		return (0);
239263f531d1SSriharsha Basavapatna 	}
239363f531d1SSriharsha Basavapatna 
239463f531d1SSriharsha Basavapatna 	ASSERT((rx_ringp->state & VNET_RXRING_HYBRID) != 0);
239563f531d1SSriharsha Basavapatna 
239663f531d1SSriharsha Basavapatna 	/*
239763f531d1SSriharsha Basavapatna 	 * This must be a ring reserved for a hwring. If the hwring is not
239863f531d1SSriharsha Basavapatna 	 * bound yet, simply mark the state to indicate the ring is started and
239963f531d1SSriharsha Basavapatna 	 * return. If and when a hybrid resource is activated for this vnet
240063f531d1SSriharsha Basavapatna 	 * device, we will bind the hwring and start it then. If a hwring is
240163f531d1SSriharsha Basavapatna 	 * already bound, start it now.
240263f531d1SSriharsha Basavapatna 	 */
240363f531d1SSriharsha Basavapatna 	if (rx_ringp->hw_rh == NULL) {
240463f531d1SSriharsha Basavapatna 		rx_ringp->gen_num = mr_gen_num;
240563f531d1SSriharsha Basavapatna 		rx_ringp->state |= VNET_RXRING_STARTED;
240663f531d1SSriharsha Basavapatna 		return (0);
240763f531d1SSriharsha Basavapatna 	}
240863f531d1SSriharsha Basavapatna 
240945948e49SRyan Zezeski 	err = mac_hwring_activate(rx_ringp->hw_rh);
241063f531d1SSriharsha Basavapatna 	if (err == 0) {
241163f531d1SSriharsha Basavapatna 		rx_ringp->gen_num = mr_gen_num;
241263f531d1SSriharsha Basavapatna 		rx_ringp->state |= VNET_RXRING_STARTED;
241363f531d1SSriharsha Basavapatna 	} else {
241463f531d1SSriharsha Basavapatna 		err = ENXIO;
241563f531d1SSriharsha Basavapatna 	}
241663f531d1SSriharsha Basavapatna 
241763f531d1SSriharsha Basavapatna 	return (err);
241863f531d1SSriharsha Basavapatna }
241963f531d1SSriharsha Basavapatna 
242063f531d1SSriharsha Basavapatna static void
vnet_rx_ring_stop(mac_ring_driver_t arg)242163f531d1SSriharsha Basavapatna vnet_rx_ring_stop(mac_ring_driver_t arg)
242263f531d1SSriharsha Basavapatna {
242363f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_ring_t	*rx_ringp = (vnet_pseudo_rx_ring_t *)arg;
242463f531d1SSriharsha Basavapatna 
242563f531d1SSriharsha Basavapatna 	/*
242663f531d1SSriharsha Basavapatna 	 * If this ring is mapped to a LDC resource, simply mark the state to
242763f531d1SSriharsha Basavapatna 	 * indicate the ring is now stopped and return.
242863f531d1SSriharsha Basavapatna 	 */
242963f531d1SSriharsha Basavapatna 	if ((rx_ringp->state &
243063f531d1SSriharsha Basavapatna 	    (VNET_RXRING_LDC_SERVICE|VNET_RXRING_LDC_GUEST)) != 0) {
243163f531d1SSriharsha Basavapatna 		rx_ringp->state &= ~VNET_RXRING_STARTED;
2432e8c4ecbbSWENTAO YANG 		return;
243363f531d1SSriharsha Basavapatna 	}
243463f531d1SSriharsha Basavapatna 
243563f531d1SSriharsha Basavapatna 	ASSERT((rx_ringp->state & VNET_RXRING_HYBRID) != 0);
243663f531d1SSriharsha Basavapatna 
243763f531d1SSriharsha Basavapatna 	/*
243863f531d1SSriharsha Basavapatna 	 * This must be a ring reserved for a hwring. If the hwring is not
243963f531d1SSriharsha Basavapatna 	 * bound yet, simply mark the state to indicate the ring is stopped and
244063f531d1SSriharsha Basavapatna 	 * return. If a hwring is already bound, stop it now.
244163f531d1SSriharsha Basavapatna 	 */
244263f531d1SSriharsha Basavapatna 	if (rx_ringp->hw_rh == NULL) {
244363f531d1SSriharsha Basavapatna 		rx_ringp->state &= ~VNET_RXRING_STARTED;
244463f531d1SSriharsha Basavapatna 		return;
244563f531d1SSriharsha Basavapatna 	}
244663f531d1SSriharsha Basavapatna 
244745948e49SRyan Zezeski 	mac_hwring_quiesce(rx_ringp->hw_rh);
244863f531d1SSriharsha Basavapatna 	rx_ringp->state &= ~VNET_RXRING_STARTED;
244963f531d1SSriharsha Basavapatna }
245063f531d1SSriharsha Basavapatna 
24510dc2366fSVenugopal Iyer static int
vnet_rx_ring_stat(mac_ring_driver_t rdriver,uint_t stat,uint64_t * val)24520dc2366fSVenugopal Iyer vnet_rx_ring_stat(mac_ring_driver_t rdriver, uint_t stat, uint64_t *val)
24530dc2366fSVenugopal Iyer {
24540dc2366fSVenugopal Iyer 	vnet_pseudo_rx_ring_t	*rx_ringp = (vnet_pseudo_rx_ring_t *)rdriver;
24550dc2366fSVenugopal Iyer 	vnet_t			*vnetp = (vnet_t *)rx_ringp->vnetp;
24560dc2366fSVenugopal Iyer 	vnet_res_t		*vresp;
24570dc2366fSVenugopal Iyer 	mac_register_t		*macp;
24580dc2366fSVenugopal Iyer 	mac_callbacks_t		*cbp;
24590dc2366fSVenugopal Iyer 
24600dc2366fSVenugopal Iyer 	/*
24610dc2366fSVenugopal Iyer 	 * Refer to vnet_m_capab() function for detailed comments on ring
24620dc2366fSVenugopal Iyer 	 * synchronization.
24630dc2366fSVenugopal Iyer 	 */
24640dc2366fSVenugopal Iyer 	if ((rx_ringp->state & VNET_RXRING_HYBRID) != 0) {
24650dc2366fSVenugopal Iyer 		READ_ENTER(&vnetp->vsw_fp_rw);
24660dc2366fSVenugopal Iyer 		if (vnetp->hio_fp == NULL) {
24670dc2366fSVenugopal Iyer 			RW_EXIT(&vnetp->vsw_fp_rw);
24680dc2366fSVenugopal Iyer 			return (0);
24690dc2366fSVenugopal Iyer 		}
24700dc2366fSVenugopal Iyer 
24710dc2366fSVenugopal Iyer 		VNET_FDBE_REFHOLD(vnetp->hio_fp);
24720dc2366fSVenugopal Iyer 		RW_EXIT(&vnetp->vsw_fp_rw);
24739f26b864SVenugopal Iyer 		(void) mac_hwring_getstat(rx_ringp->hw_rh, stat, val);
24740dc2366fSVenugopal Iyer 		VNET_FDBE_REFRELE(vnetp->hio_fp);
24750dc2366fSVenugopal Iyer 		return (0);
24760dc2366fSVenugopal Iyer 	}
24770dc2366fSVenugopal Iyer 
24780dc2366fSVenugopal Iyer 	ASSERT((rx_ringp->state &
24790dc2366fSVenugopal Iyer 	    (VNET_RXRING_LDC_SERVICE|VNET_RXRING_LDC_GUEST)) != 0);
24800dc2366fSVenugopal Iyer 	vresp = (vnet_res_t *)rx_ringp->hw_rh;
24810dc2366fSVenugopal Iyer 	macp = &vresp->macreg;
24820dc2366fSVenugopal Iyer 	cbp = macp->m_callbacks;
24830dc2366fSVenugopal Iyer 
2484b17aa18cSToomas Soome 	(void) cbp->mc_getstat(macp->m_driver, stat, val);
24850dc2366fSVenugopal Iyer 
24860dc2366fSVenugopal Iyer 	return (0);
24870dc2366fSVenugopal Iyer }
24880dc2366fSVenugopal Iyer 
248963f531d1SSriharsha Basavapatna /* ARGSUSED */
249063f531d1SSriharsha Basavapatna static int
vnet_tx_ring_start(mac_ring_driver_t arg,uint64_t mr_gen_num)249163f531d1SSriharsha Basavapatna vnet_tx_ring_start(mac_ring_driver_t arg, uint64_t mr_gen_num)
249263f531d1SSriharsha Basavapatna {
249363f531d1SSriharsha Basavapatna 	vnet_pseudo_tx_ring_t	*tx_ringp = (vnet_pseudo_tx_ring_t *)arg;
249463f531d1SSriharsha Basavapatna 
249563f531d1SSriharsha Basavapatna 	tx_ringp->state |= VNET_TXRING_STARTED;
249663f531d1SSriharsha Basavapatna 	return (0);
249763f531d1SSriharsha Basavapatna }
249863f531d1SSriharsha Basavapatna 
249963f531d1SSriharsha Basavapatna static void
vnet_tx_ring_stop(mac_ring_driver_t arg)250063f531d1SSriharsha Basavapatna vnet_tx_ring_stop(mac_ring_driver_t arg)
250163f531d1SSriharsha Basavapatna {
250263f531d1SSriharsha Basavapatna 	vnet_pseudo_tx_ring_t	*tx_ringp = (vnet_pseudo_tx_ring_t *)arg;
250363f531d1SSriharsha Basavapatna 
250463f531d1SSriharsha Basavapatna 	tx_ringp->state &= ~VNET_TXRING_STARTED;
250563f531d1SSriharsha Basavapatna }
250663f531d1SSriharsha Basavapatna 
25070dc2366fSVenugopal Iyer static int
vnet_tx_ring_stat(mac_ring_driver_t rdriver,uint_t stat,uint64_t * val)25080dc2366fSVenugopal Iyer vnet_tx_ring_stat(mac_ring_driver_t rdriver, uint_t stat, uint64_t *val)
25090dc2366fSVenugopal Iyer {
25100dc2366fSVenugopal Iyer 	vnet_pseudo_tx_ring_t	*tx_ringp = (vnet_pseudo_tx_ring_t *)rdriver;
25110dc2366fSVenugopal Iyer 	vnet_tx_ring_stats_t	*statsp;
25120dc2366fSVenugopal Iyer 
25130dc2366fSVenugopal Iyer 	statsp = &tx_ringp->tx_ring_stats;
25140dc2366fSVenugopal Iyer 
25150dc2366fSVenugopal Iyer 	switch (stat) {
25160dc2366fSVenugopal Iyer 	case MAC_STAT_OPACKETS:
25170dc2366fSVenugopal Iyer 		*val = statsp->opackets;
25180dc2366fSVenugopal Iyer 		break;
25190dc2366fSVenugopal Iyer 
25200dc2366fSVenugopal Iyer 	case MAC_STAT_OBYTES:
25210dc2366fSVenugopal Iyer 		*val = statsp->obytes;
25220dc2366fSVenugopal Iyer 		break;
25230dc2366fSVenugopal Iyer 
25240dc2366fSVenugopal Iyer 	default:
25250dc2366fSVenugopal Iyer 		*val = 0;
25260dc2366fSVenugopal Iyer 		return (ENOTSUP);
25270dc2366fSVenugopal Iyer 	}
25280dc2366fSVenugopal Iyer 
25290dc2366fSVenugopal Iyer 	return (0);
25300dc2366fSVenugopal Iyer }
25310dc2366fSVenugopal Iyer 
253263f531d1SSriharsha Basavapatna /*
253363f531d1SSriharsha Basavapatna  * Disable polling for a ring and enable its interrupt.
253463f531d1SSriharsha Basavapatna  */
253563f531d1SSriharsha Basavapatna static int
vnet_ring_enable_intr(void * arg)253663f531d1SSriharsha Basavapatna vnet_ring_enable_intr(void *arg)
253763f531d1SSriharsha Basavapatna {
253863f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_ring_t	*rx_ringp = (vnet_pseudo_rx_ring_t *)arg;
253963f531d1SSriharsha Basavapatna 	vnet_res_t		*vresp;
254063f531d1SSriharsha Basavapatna 
254163f531d1SSriharsha Basavapatna 	if (rx_ringp->hw_rh == NULL) {
254263f531d1SSriharsha Basavapatna 		/*
254363f531d1SSriharsha Basavapatna 		 * Ring enable intr func is being invoked, but the ring is
254463f531d1SSriharsha Basavapatna 		 * not bound to any underlying resource ? This must be a ring
254563f531d1SSriharsha Basavapatna 		 * reserved for Hybrid resource and no such resource has been
254663f531d1SSriharsha Basavapatna 		 * assigned to this vnet device yet. We simply return success.
254763f531d1SSriharsha Basavapatna 		 */
254863f531d1SSriharsha Basavapatna 		ASSERT((rx_ringp->state & VNET_RXRING_HYBRID) != 0);
254963f531d1SSriharsha Basavapatna 		return (0);
255063f531d1SSriharsha Basavapatna 	}
255163f531d1SSriharsha Basavapatna 
255263f531d1SSriharsha Basavapatna 	/*
255363f531d1SSriharsha Basavapatna 	 * The rx ring has been bound to either a LDC or a Hybrid resource.
255463f531d1SSriharsha Basavapatna 	 * Call the appropriate function to enable interrupts for the ring.
255563f531d1SSriharsha Basavapatna 	 */
255663f531d1SSriharsha Basavapatna 	if (rx_ringp->state & VNET_RXRING_HYBRID) {
255763f531d1SSriharsha Basavapatna 		return (mac_hwring_enable_intr(rx_ringp->hw_rh));
255863f531d1SSriharsha Basavapatna 	} else {
255963f531d1SSriharsha Basavapatna 		vresp = (vnet_res_t *)rx_ringp->hw_rh;
256063f531d1SSriharsha Basavapatna 		return (vgen_enable_intr(vresp->macreg.m_driver));
256163f531d1SSriharsha Basavapatna 	}
256263f531d1SSriharsha Basavapatna }
256363f531d1SSriharsha Basavapatna 
256463f531d1SSriharsha Basavapatna /*
256563f531d1SSriharsha Basavapatna  * Enable polling for a ring and disable its interrupt.
256663f531d1SSriharsha Basavapatna  */
256763f531d1SSriharsha Basavapatna static int
vnet_ring_disable_intr(void * arg)256863f531d1SSriharsha Basavapatna vnet_ring_disable_intr(void *arg)
256963f531d1SSriharsha Basavapatna {
257063f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_ring_t	*rx_ringp = (vnet_pseudo_rx_ring_t *)arg;
257163f531d1SSriharsha Basavapatna 	vnet_res_t		*vresp;
257263f531d1SSriharsha Basavapatna 
257363f531d1SSriharsha Basavapatna 	if (rx_ringp->hw_rh == NULL) {
257463f531d1SSriharsha Basavapatna 		/*
257563f531d1SSriharsha Basavapatna 		 * Ring disable intr func is being invoked, but the ring is
257663f531d1SSriharsha Basavapatna 		 * not bound to any underlying resource ? This must be a ring
257763f531d1SSriharsha Basavapatna 		 * reserved for Hybrid resource and no such resource has been
257863f531d1SSriharsha Basavapatna 		 * assigned to this vnet device yet. We simply return success.
257963f531d1SSriharsha Basavapatna 		 */
258063f531d1SSriharsha Basavapatna 		ASSERT((rx_ringp->state & VNET_RXRING_HYBRID) != 0);
258163f531d1SSriharsha Basavapatna 		return (0);
258263f531d1SSriharsha Basavapatna 	}
258363f531d1SSriharsha Basavapatna 
258463f531d1SSriharsha Basavapatna 	/*
258563f531d1SSriharsha Basavapatna 	 * The rx ring has been bound to either a LDC or a Hybrid resource.
258663f531d1SSriharsha Basavapatna 	 * Call the appropriate function to disable interrupts for the ring.
258763f531d1SSriharsha Basavapatna 	 */
258863f531d1SSriharsha Basavapatna 	if (rx_ringp->state & VNET_RXRING_HYBRID) {
258963f531d1SSriharsha Basavapatna 		return (mac_hwring_disable_intr(rx_ringp->hw_rh));
259063f531d1SSriharsha Basavapatna 	} else {
259163f531d1SSriharsha Basavapatna 		vresp = (vnet_res_t *)rx_ringp->hw_rh;
259263f531d1SSriharsha Basavapatna 		return (vgen_disable_intr(vresp->macreg.m_driver));
259363f531d1SSriharsha Basavapatna 	}
259463f531d1SSriharsha Basavapatna }
259563f531d1SSriharsha Basavapatna 
259663f531d1SSriharsha Basavapatna /*
259763f531d1SSriharsha Basavapatna  * Poll 'bytes_to_pickup' bytes of message from the rx ring.
259863f531d1SSriharsha Basavapatna  */
259963f531d1SSriharsha Basavapatna static mblk_t *
vnet_rx_poll(void * arg,int bytes_to_pickup)260063f531d1SSriharsha Basavapatna vnet_rx_poll(void *arg, int bytes_to_pickup)
260163f531d1SSriharsha Basavapatna {
260263f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_ring_t	*rx_ringp = (vnet_pseudo_rx_ring_t *)arg;
260363f531d1SSriharsha Basavapatna 	mblk_t			*mp = NULL;
260463f531d1SSriharsha Basavapatna 	vnet_res_t		*vresp;
260563f531d1SSriharsha Basavapatna 	vnet_t			*vnetp = rx_ringp->vnetp;
260663f531d1SSriharsha Basavapatna 
260763f531d1SSriharsha Basavapatna 	if (rx_ringp->hw_rh == NULL) {
260863f531d1SSriharsha Basavapatna 		return (NULL);
260963f531d1SSriharsha Basavapatna 	}
261063f531d1SSriharsha Basavapatna 
261163f531d1SSriharsha Basavapatna 	if (rx_ringp->state & VNET_RXRING_HYBRID) {
261263f531d1SSriharsha Basavapatna 		mp = mac_hwring_poll(rx_ringp->hw_rh, bytes_to_pickup);
261363f531d1SSriharsha Basavapatna 		/*
261463f531d1SSriharsha Basavapatna 		 * Packets received over a hybrid resource need additional
261563f531d1SSriharsha Basavapatna 		 * processing to remove the tag, for the pvid case. The
261663f531d1SSriharsha Basavapatna 		 * underlying resource is not aware of the vnet's pvid and thus
261763f531d1SSriharsha Basavapatna 		 * packets are received with the vlan tag in the header; unlike
261863f531d1SSriharsha Basavapatna 		 * packets that are received over a ldc channel in which case
261963f531d1SSriharsha Basavapatna 		 * the peer vnet/vsw would have already removed the tag.
262063f531d1SSriharsha Basavapatna 		 */
262163f531d1SSriharsha Basavapatna 		if (vnetp->pvid != vnetp->default_vlan_id) {
262263f531d1SSriharsha Basavapatna 			vnet_rx_frames_untag(vnetp->pvid, &mp);
262363f531d1SSriharsha Basavapatna 		}
262463f531d1SSriharsha Basavapatna 	} else {
262563f531d1SSriharsha Basavapatna 		vresp = (vnet_res_t *)rx_ringp->hw_rh;
26267bd3a2e2SSriharsha Basavapatna 		mp = vgen_rx_poll(vresp->macreg.m_driver, bytes_to_pickup);
262763f531d1SSriharsha Basavapatna 	}
262863f531d1SSriharsha Basavapatna 	return (mp);
262963f531d1SSriharsha Basavapatna }
263063f531d1SSriharsha Basavapatna 
263163f531d1SSriharsha Basavapatna /* ARGSUSED */
263263f531d1SSriharsha Basavapatna void
vnet_hio_rx_cb(void * arg,mac_resource_handle_t mrh,mblk_t * mp,boolean_t loopback)263363f531d1SSriharsha Basavapatna vnet_hio_rx_cb(void *arg, mac_resource_handle_t mrh, mblk_t *mp,
263463f531d1SSriharsha Basavapatna     boolean_t loopback)
263563f531d1SSriharsha Basavapatna {
263663f531d1SSriharsha Basavapatna 	vnet_t			*vnetp = (vnet_t *)arg;
263763f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_ring_t	*ringp = (vnet_pseudo_rx_ring_t *)mrh;
263863f531d1SSriharsha Basavapatna 
263963f531d1SSriharsha Basavapatna 	/*
264063f531d1SSriharsha Basavapatna 	 * Packets received over a hybrid resource need additional processing
264163f531d1SSriharsha Basavapatna 	 * to remove the tag, for the pvid case. The underlying resource is
264263f531d1SSriharsha Basavapatna 	 * not aware of the vnet's pvid and thus packets are received with the
264363f531d1SSriharsha Basavapatna 	 * vlan tag in the header; unlike packets that are received over a ldc
264463f531d1SSriharsha Basavapatna 	 * channel in which case the peer vnet/vsw would have already removed
264563f531d1SSriharsha Basavapatna 	 * the tag.
264663f531d1SSriharsha Basavapatna 	 */
264763f531d1SSriharsha Basavapatna 	if (vnetp->pvid != vnetp->default_vlan_id) {
264863f531d1SSriharsha Basavapatna 		vnet_rx_frames_untag(vnetp->pvid, &mp);
264963f531d1SSriharsha Basavapatna 		if (mp == NULL) {
265063f531d1SSriharsha Basavapatna 			return;
265163f531d1SSriharsha Basavapatna 		}
265263f531d1SSriharsha Basavapatna 	}
265363f531d1SSriharsha Basavapatna 	mac_rx_ring(vnetp->mh, ringp->handle, mp, ringp->gen_num);
265463f531d1SSriharsha Basavapatna }
265563f531d1SSriharsha Basavapatna 
265663f531d1SSriharsha Basavapatna static int
vnet_addmac(void * arg,const uint8_t * mac_addr)265763f531d1SSriharsha Basavapatna vnet_addmac(void *arg, const uint8_t *mac_addr)
265863f531d1SSriharsha Basavapatna {
265963f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_group_t  *rx_grp = (vnet_pseudo_rx_group_t *)arg;
266063f531d1SSriharsha Basavapatna 	vnet_t			*vnetp;
266163f531d1SSriharsha Basavapatna 
266263f531d1SSriharsha Basavapatna 	vnetp = rx_grp->vnetp;
266363f531d1SSriharsha Basavapatna 
266463f531d1SSriharsha Basavapatna 	if (bcmp(mac_addr, vnetp->curr_macaddr, ETHERADDRL) == 0) {
266563f531d1SSriharsha Basavapatna 		return (0);
266663f531d1SSriharsha Basavapatna 	}
266763f531d1SSriharsha Basavapatna 
266863f531d1SSriharsha Basavapatna 	cmn_err(CE_CONT, "!vnet%d: %s: Multiple macaddr unsupported\n",
266963f531d1SSriharsha Basavapatna 	    vnetp->instance, __func__);
267063f531d1SSriharsha Basavapatna 	return (EINVAL);
267163f531d1SSriharsha Basavapatna }
267263f531d1SSriharsha Basavapatna 
267363f531d1SSriharsha Basavapatna static int
vnet_remmac(void * arg,const uint8_t * mac_addr)267463f531d1SSriharsha Basavapatna vnet_remmac(void *arg, const uint8_t *mac_addr)
267563f531d1SSriharsha Basavapatna {
267663f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_group_t  *rx_grp = (vnet_pseudo_rx_group_t *)arg;
267763f531d1SSriharsha Basavapatna 	vnet_t			*vnetp;
267863f531d1SSriharsha Basavapatna 
267963f531d1SSriharsha Basavapatna 	vnetp = rx_grp->vnetp;
268063f531d1SSriharsha Basavapatna 
268163f531d1SSriharsha Basavapatna 	if (bcmp(mac_addr, vnetp->curr_macaddr, ETHERADDRL) == 0) {
268263f531d1SSriharsha Basavapatna 		return (0);
268363f531d1SSriharsha Basavapatna 	}
268463f531d1SSriharsha Basavapatna 
268563f531d1SSriharsha Basavapatna 	cmn_err(CE_CONT, "!vnet%d: %s: Invalid macaddr: %s\n",
268663f531d1SSriharsha Basavapatna 	    vnetp->instance, __func__, ether_sprintf((void *)mac_addr));
268763f531d1SSriharsha Basavapatna 	return (EINVAL);
268863f531d1SSriharsha Basavapatna }
268963f531d1SSriharsha Basavapatna 
269063f531d1SSriharsha Basavapatna int
vnet_hio_mac_init(vnet_t * vnetp,char * ifname)269163f531d1SSriharsha Basavapatna vnet_hio_mac_init(vnet_t *vnetp, char *ifname)
269263f531d1SSriharsha Basavapatna {
269363f531d1SSriharsha Basavapatna 	mac_handle_t		mh;
269463f531d1SSriharsha Basavapatna 	mac_client_handle_t	mch = NULL;
269563f531d1SSriharsha Basavapatna 	mac_unicast_handle_t	muh = NULL;
269663f531d1SSriharsha Basavapatna 	mac_diag_t		diag;
269763f531d1SSriharsha Basavapatna 	mac_register_t		*macp;
269863f531d1SSriharsha Basavapatna 	char			client_name[MAXNAMELEN];
269963f531d1SSriharsha Basavapatna 	int			rv;
270063f531d1SSriharsha Basavapatna 	uint16_t		mac_flags = MAC_UNICAST_TAG_DISABLE |
270163f531d1SSriharsha Basavapatna 	    MAC_UNICAST_STRIP_DISABLE | MAC_UNICAST_PRIMARY;
270263f531d1SSriharsha Basavapatna 	vio_net_callbacks_t	vcb;
270363f531d1SSriharsha Basavapatna 	ether_addr_t		rem_addr =
270463f531d1SSriharsha Basavapatna 		{ 0xff, 0xff, 0xff, 0xff, 0xff, 0xff };
270563f531d1SSriharsha Basavapatna 	uint32_t		retries = 0;
270663f531d1SSriharsha Basavapatna 
270763f531d1SSriharsha Basavapatna 	if ((macp = mac_alloc(MAC_VERSION)) == NULL) {
270863f531d1SSriharsha Basavapatna 		return (EAGAIN);
270963f531d1SSriharsha Basavapatna 	}
271063f531d1SSriharsha Basavapatna 
271163f531d1SSriharsha Basavapatna 	do {
271263f531d1SSriharsha Basavapatna 		rv = mac_open_by_linkname(ifname, &mh);
271363f531d1SSriharsha Basavapatna 		if (rv == 0) {
271463f531d1SSriharsha Basavapatna 			break;
271563f531d1SSriharsha Basavapatna 		}
271663f531d1SSriharsha Basavapatna 		if (rv != ENOENT || (retries++ >= vnet_mac_open_retries)) {
271763f531d1SSriharsha Basavapatna 			mac_free(macp);
271863f531d1SSriharsha Basavapatna 			return (rv);
271963f531d1SSriharsha Basavapatna 		}
272063f531d1SSriharsha Basavapatna 		drv_usecwait(vnet_mac_open_delay);
272163f531d1SSriharsha Basavapatna 	} while (rv == ENOENT);
272263f531d1SSriharsha Basavapatna 
272363f531d1SSriharsha Basavapatna 	vnetp->hio_mh = mh;
272463f531d1SSriharsha Basavapatna 
272563f531d1SSriharsha Basavapatna 	(void) snprintf(client_name, MAXNAMELEN, "vnet%d-%s", vnetp->instance,
272663f531d1SSriharsha Basavapatna 	    ifname);
272763f531d1SSriharsha Basavapatna 	rv = mac_client_open(mh, &mch, client_name, MAC_OPEN_FLAGS_EXCLUSIVE);
272863f531d1SSriharsha Basavapatna 	if (rv != 0) {
272963f531d1SSriharsha Basavapatna 		goto fail;
273063f531d1SSriharsha Basavapatna 	}
273163f531d1SSriharsha Basavapatna 	vnetp->hio_mch = mch;
273263f531d1SSriharsha Basavapatna 
273363f531d1SSriharsha Basavapatna 	rv = mac_unicast_add(mch, vnetp->curr_macaddr, mac_flags, &muh, 0,
273463f531d1SSriharsha Basavapatna 	    &diag);
273563f531d1SSriharsha Basavapatna 	if (rv != 0) {
273663f531d1SSriharsha Basavapatna 		goto fail;
273763f531d1SSriharsha Basavapatna 	}
273863f531d1SSriharsha Basavapatna 	vnetp->hio_muh = muh;
273963f531d1SSriharsha Basavapatna 
274063f531d1SSriharsha Basavapatna 	macp->m_type_ident = MAC_PLUGIN_IDENT_ETHER;
274163f531d1SSriharsha Basavapatna 	macp->m_driver = vnetp;
274263f531d1SSriharsha Basavapatna 	macp->m_dip = NULL;
274363f531d1SSriharsha Basavapatna 	macp->m_src_addr = NULL;
274463f531d1SSriharsha Basavapatna 	macp->m_callbacks = &vnet_hio_res_callbacks;
274563f531d1SSriharsha Basavapatna 	macp->m_min_sdu = 0;
274663f531d1SSriharsha Basavapatna 	macp->m_max_sdu = ETHERMTU;
274763f531d1SSriharsha Basavapatna 
274863f531d1SSriharsha Basavapatna 	rv = vio_net_resource_reg(macp, VIO_NET_RES_HYBRID,
274963f531d1SSriharsha Basavapatna 	    vnetp->curr_macaddr, rem_addr, &vnetp->hio_vhp, &vcb);
275063f531d1SSriharsha Basavapatna 	if (rv != 0) {
275163f531d1SSriharsha Basavapatna 		goto fail;
275263f531d1SSriharsha Basavapatna 	}
275363f531d1SSriharsha Basavapatna 	mac_free(macp);
275463f531d1SSriharsha Basavapatna 
275563f531d1SSriharsha Basavapatna 	/* add the recv callback */
275663f531d1SSriharsha Basavapatna 	mac_rx_set(vnetp->hio_mch, vnet_hio_rx_cb, vnetp);
275763f531d1SSriharsha Basavapatna 
275863f531d1SSriharsha Basavapatna 	return (0);
275963f531d1SSriharsha Basavapatna 
276063f531d1SSriharsha Basavapatna fail:
276163f531d1SSriharsha Basavapatna 	mac_free(macp);
276263f531d1SSriharsha Basavapatna 	vnet_hio_mac_cleanup(vnetp);
276363f531d1SSriharsha Basavapatna 	return (1);
276463f531d1SSriharsha Basavapatna }
276563f531d1SSriharsha Basavapatna 
276663f531d1SSriharsha Basavapatna void
vnet_hio_mac_cleanup(vnet_t * vnetp)276763f531d1SSriharsha Basavapatna vnet_hio_mac_cleanup(vnet_t *vnetp)
276863f531d1SSriharsha Basavapatna {
276963f531d1SSriharsha Basavapatna 	if (vnetp->hio_vhp != NULL) {
277063f531d1SSriharsha Basavapatna 		vio_net_resource_unreg(vnetp->hio_vhp);
277163f531d1SSriharsha Basavapatna 		vnetp->hio_vhp = NULL;
277263f531d1SSriharsha Basavapatna 	}
277363f531d1SSriharsha Basavapatna 
277463f531d1SSriharsha Basavapatna 	if (vnetp->hio_muh != NULL) {
277507d06da5SSurya Prakki 		(void) mac_unicast_remove(vnetp->hio_mch, vnetp->hio_muh);
277663f531d1SSriharsha Basavapatna 		vnetp->hio_muh = NULL;
277763f531d1SSriharsha Basavapatna 	}
277863f531d1SSriharsha Basavapatna 
277963f531d1SSriharsha Basavapatna 	if (vnetp->hio_mch != NULL) {
278063f531d1SSriharsha Basavapatna 		mac_client_close(vnetp->hio_mch, 0);
278163f531d1SSriharsha Basavapatna 		vnetp->hio_mch = NULL;
278263f531d1SSriharsha Basavapatna 	}
278363f531d1SSriharsha Basavapatna 
278463f531d1SSriharsha Basavapatna 	if (vnetp->hio_mh != NULL) {
278563f531d1SSriharsha Basavapatna 		mac_close(vnetp->hio_mh);
278663f531d1SSriharsha Basavapatna 		vnetp->hio_mh = NULL;
278763f531d1SSriharsha Basavapatna 	}
278863f531d1SSriharsha Basavapatna }
278963f531d1SSriharsha Basavapatna 
279063f531d1SSriharsha Basavapatna /* Bind pseudo rings to hwrings */
279163f531d1SSriharsha Basavapatna static int
vnet_bind_hwrings(vnet_t * vnetp)279263f531d1SSriharsha Basavapatna vnet_bind_hwrings(vnet_t *vnetp)
279363f531d1SSriharsha Basavapatna {
279463f531d1SSriharsha Basavapatna 	mac_ring_handle_t	hw_rh[VNET_NUM_HYBRID_RINGS];
279563f531d1SSriharsha Basavapatna 	mac_perim_handle_t	mph1;
279663f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_group_t	*rx_grp;
279763f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_ring_t	*rx_ringp;
279863f531d1SSriharsha Basavapatna 	vnet_pseudo_tx_group_t	*tx_grp;
279963f531d1SSriharsha Basavapatna 	vnet_pseudo_tx_ring_t	*tx_ringp;
280063f531d1SSriharsha Basavapatna 	int			hw_ring_cnt;
280163f531d1SSriharsha Basavapatna 	int			i;
280263f531d1SSriharsha Basavapatna 	int			rv;
280363f531d1SSriharsha Basavapatna 
280463f531d1SSriharsha Basavapatna 	mac_perim_enter_by_mh(vnetp->hio_mh, &mph1);
280563f531d1SSriharsha Basavapatna 
280663f531d1SSriharsha Basavapatna 	/* Get the list of the underlying RX rings. */
280763f531d1SSriharsha Basavapatna 	hw_ring_cnt = mac_hwrings_get(vnetp->hio_mch, &vnetp->rx_hwgh, hw_rh,
280863f531d1SSriharsha Basavapatna 	    MAC_RING_TYPE_RX);
280963f531d1SSriharsha Basavapatna 
281063f531d1SSriharsha Basavapatna 	/* We expect the the # of hw rx rings to match VNET_NUM_HYBRID_RINGS */
281163f531d1SSriharsha Basavapatna 	if (hw_ring_cnt != VNET_NUM_HYBRID_RINGS) {
281263f531d1SSriharsha Basavapatna 		cmn_err(CE_WARN,
281363f531d1SSriharsha Basavapatna 		    "!vnet%d: vnet_bind_hwrings: bad rx hw_ring_cnt(%d)\n",
281463f531d1SSriharsha Basavapatna 		    vnetp->instance, hw_ring_cnt);
281563f531d1SSriharsha Basavapatna 		goto fail;
281663f531d1SSriharsha Basavapatna 	}
281763f531d1SSriharsha Basavapatna 
281863f531d1SSriharsha Basavapatna 	if (vnetp->rx_hwgh != NULL) {
281963f531d1SSriharsha Basavapatna 		/*
282063f531d1SSriharsha Basavapatna 		 * Quiesce the HW ring and the mac srs on the ring. Note
282163f531d1SSriharsha Basavapatna 		 * that the HW ring will be restarted when the pseudo ring
282263f531d1SSriharsha Basavapatna 		 * is started. At that time all the packets will be
282363f531d1SSriharsha Basavapatna 		 * directly passed up to the pseudo RX ring and handled
282463f531d1SSriharsha Basavapatna 		 * by mac srs created over the pseudo RX ring.
282563f531d1SSriharsha Basavapatna 		 */
282663f531d1SSriharsha Basavapatna 		mac_rx_client_quiesce(vnetp->hio_mch);
282763f531d1SSriharsha Basavapatna 		mac_srs_perm_quiesce(vnetp->hio_mch, B_TRUE);
282863f531d1SSriharsha Basavapatna 	}
282963f531d1SSriharsha Basavapatna 
283063f531d1SSriharsha Basavapatna 	/*
283163f531d1SSriharsha Basavapatna 	 * Bind the pseudo rings to the hwrings and start the hwrings.
283263f531d1SSriharsha Basavapatna 	 * Note we don't need to register these with the upper mac, as we have
283363f531d1SSriharsha Basavapatna 	 * statically exported these pseudo rxrings which are reserved for
283463f531d1SSriharsha Basavapatna 	 * rxrings of Hybrid resource.
283563f531d1SSriharsha Basavapatna 	 */
283663f531d1SSriharsha Basavapatna 	rx_grp = &vnetp->rx_grp[0];
283763f531d1SSriharsha Basavapatna 	for (i = 0; i < VNET_NUM_HYBRID_RINGS; i++) {
283863f531d1SSriharsha Basavapatna 		/* Pick the rxrings reserved for Hybrid resource */
283963f531d1SSriharsha Basavapatna 		rx_ringp = &rx_grp->rings[i + VNET_HYBRID_RXRING_INDEX];
284063f531d1SSriharsha Basavapatna 
284163f531d1SSriharsha Basavapatna 		/* Store the hw ring handle */
284263f531d1SSriharsha Basavapatna 		rx_ringp->hw_rh = hw_rh[i];
284363f531d1SSriharsha Basavapatna 
284463f531d1SSriharsha Basavapatna 		/* Bind the pseudo ring to the underlying hwring */
284563f531d1SSriharsha Basavapatna 		mac_hwring_setup(rx_ringp->hw_rh,
28460dc2366fSVenugopal Iyer 		    (mac_resource_handle_t)rx_ringp, NULL);
284763f531d1SSriharsha Basavapatna 
284863f531d1SSriharsha Basavapatna 		/* Start the hwring if needed */
284963f531d1SSriharsha Basavapatna 		if (rx_ringp->state & VNET_RXRING_STARTED) {
285045948e49SRyan Zezeski 			rv = mac_hwring_activate(rx_ringp->hw_rh);
285163f531d1SSriharsha Basavapatna 			if (rv != 0) {
285263f531d1SSriharsha Basavapatna 				mac_hwring_teardown(rx_ringp->hw_rh);
285363f531d1SSriharsha Basavapatna 				rx_ringp->hw_rh = NULL;
285463f531d1SSriharsha Basavapatna 				goto fail;
285563f531d1SSriharsha Basavapatna 			}
285663f531d1SSriharsha Basavapatna 		}
285763f531d1SSriharsha Basavapatna 	}
285863f531d1SSriharsha Basavapatna 
285963f531d1SSriharsha Basavapatna 	/* Get the list of the underlying TX rings. */
286063f531d1SSriharsha Basavapatna 	hw_ring_cnt = mac_hwrings_get(vnetp->hio_mch, &vnetp->tx_hwgh, hw_rh,
286163f531d1SSriharsha Basavapatna 	    MAC_RING_TYPE_TX);
286263f531d1SSriharsha Basavapatna 
286363f531d1SSriharsha Basavapatna 	/* We expect the # of hw tx rings to match VNET_NUM_HYBRID_RINGS */
286463f531d1SSriharsha Basavapatna 	if (hw_ring_cnt != VNET_NUM_HYBRID_RINGS) {
286563f531d1SSriharsha Basavapatna 		cmn_err(CE_WARN,
286663f531d1SSriharsha Basavapatna 		    "!vnet%d: vnet_bind_hwrings: bad tx hw_ring_cnt(%d)\n",
286763f531d1SSriharsha Basavapatna 		    vnetp->instance, hw_ring_cnt);
286863f531d1SSriharsha Basavapatna 		goto fail;
286963f531d1SSriharsha Basavapatna 	}
287063f531d1SSriharsha Basavapatna 
287163f531d1SSriharsha Basavapatna 	/*
287263f531d1SSriharsha Basavapatna 	 * Now map the pseudo txrings to the hw txrings. Note we don't need
287363f531d1SSriharsha Basavapatna 	 * to register these with the upper mac, as we have statically exported
287463f531d1SSriharsha Basavapatna 	 * these rings. Note that these rings will continue to be used for LDC
287563f531d1SSriharsha Basavapatna 	 * resources to peer vnets and vswitch (shared ring).
287663f531d1SSriharsha Basavapatna 	 */
287763f531d1SSriharsha Basavapatna 	tx_grp = &vnetp->tx_grp[0];
287863f531d1SSriharsha Basavapatna 	for (i = 0; i < tx_grp->ring_cnt; i++) {
287963f531d1SSriharsha Basavapatna 		tx_ringp = &tx_grp->rings[i];
288063f531d1SSriharsha Basavapatna 		tx_ringp->hw_rh = hw_rh[i];
288163f531d1SSriharsha Basavapatna 		tx_ringp->state |= VNET_TXRING_HYBRID;
288263f531d1SSriharsha Basavapatna 	}
28830dc2366fSVenugopal Iyer 	tx_grp->tx_notify_handle =
28840dc2366fSVenugopal Iyer 	    mac_client_tx_notify(vnetp->hio_mch, vnet_tx_ring_update, vnetp);
288563f531d1SSriharsha Basavapatna 
288663f531d1SSriharsha Basavapatna 	mac_perim_exit(mph1);
288763f531d1SSriharsha Basavapatna 	return (0);
288863f531d1SSriharsha Basavapatna 
288963f531d1SSriharsha Basavapatna fail:
289063f531d1SSriharsha Basavapatna 	mac_perim_exit(mph1);
289163f531d1SSriharsha Basavapatna 	vnet_unbind_hwrings(vnetp);
289263f531d1SSriharsha Basavapatna 	return (1);
289363f531d1SSriharsha Basavapatna }
289463f531d1SSriharsha Basavapatna 
289563f531d1SSriharsha Basavapatna /* Unbind pseudo rings from hwrings */
289663f531d1SSriharsha Basavapatna static void
vnet_unbind_hwrings(vnet_t * vnetp)289763f531d1SSriharsha Basavapatna vnet_unbind_hwrings(vnet_t *vnetp)
289863f531d1SSriharsha Basavapatna {
289963f531d1SSriharsha Basavapatna 	mac_perim_handle_t	mph1;
290063f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_ring_t	*rx_ringp;
290163f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_group_t	*rx_grp;
290263f531d1SSriharsha Basavapatna 	vnet_pseudo_tx_group_t	*tx_grp;
290363f531d1SSriharsha Basavapatna 	vnet_pseudo_tx_ring_t	*tx_ringp;
290463f531d1SSriharsha Basavapatna 	int			i;
290563f531d1SSriharsha Basavapatna 
290663f531d1SSriharsha Basavapatna 	mac_perim_enter_by_mh(vnetp->hio_mh, &mph1);
290763f531d1SSriharsha Basavapatna 
290863f531d1SSriharsha Basavapatna 	tx_grp = &vnetp->tx_grp[0];
290963f531d1SSriharsha Basavapatna 	for (i = 0; i < VNET_NUM_HYBRID_RINGS; i++) {
291063f531d1SSriharsha Basavapatna 		tx_ringp = &tx_grp->rings[i];
291163f531d1SSriharsha Basavapatna 		if (tx_ringp->state & VNET_TXRING_HYBRID) {
291263f531d1SSriharsha Basavapatna 			tx_ringp->state &= ~VNET_TXRING_HYBRID;
291363f531d1SSriharsha Basavapatna 			tx_ringp->hw_rh = NULL;
291463f531d1SSriharsha Basavapatna 		}
291563f531d1SSriharsha Basavapatna 	}
29160dc2366fSVenugopal Iyer 	(void) mac_client_tx_notify(vnetp->hio_mch, NULL,
29170dc2366fSVenugopal Iyer 	    tx_grp->tx_notify_handle);
291863f531d1SSriharsha Basavapatna 
291963f531d1SSriharsha Basavapatna 	rx_grp = &vnetp->rx_grp[0];
292063f531d1SSriharsha Basavapatna 	for (i = 0; i < VNET_NUM_HYBRID_RINGS; i++) {
292163f531d1SSriharsha Basavapatna 		rx_ringp = &rx_grp->rings[i + VNET_HYBRID_RXRING_INDEX];
292263f531d1SSriharsha Basavapatna 		if (rx_ringp->hw_rh != NULL) {
292363f531d1SSriharsha Basavapatna 			/* Stop the hwring */
292445948e49SRyan Zezeski 			mac_hwring_quiesce(rx_ringp->hw_rh);
292563f531d1SSriharsha Basavapatna 
292663f531d1SSriharsha Basavapatna 			/* Teardown the hwring */
292763f531d1SSriharsha Basavapatna 			mac_hwring_teardown(rx_ringp->hw_rh);
292863f531d1SSriharsha Basavapatna 			rx_ringp->hw_rh = NULL;
292963f531d1SSriharsha Basavapatna 		}
293063f531d1SSriharsha Basavapatna 	}
293163f531d1SSriharsha Basavapatna 
293263f531d1SSriharsha Basavapatna 	if (vnetp->rx_hwgh != NULL) {
293363f531d1SSriharsha Basavapatna 		vnetp->rx_hwgh = NULL;
293463f531d1SSriharsha Basavapatna 		/*
293563f531d1SSriharsha Basavapatna 		 * First clear the permanent-quiesced flag of the RX srs then
293663f531d1SSriharsha Basavapatna 		 * restart the HW ring and the mac srs on the ring.
293763f531d1SSriharsha Basavapatna 		 */
293863f531d1SSriharsha Basavapatna 		mac_srs_perm_quiesce(vnetp->hio_mch, B_FALSE);
293963f531d1SSriharsha Basavapatna 		mac_rx_client_restart(vnetp->hio_mch);
294063f531d1SSriharsha Basavapatna 	}
294163f531d1SSriharsha Basavapatna 
294263f531d1SSriharsha Basavapatna 	mac_perim_exit(mph1);
294363f531d1SSriharsha Basavapatna }
294463f531d1SSriharsha Basavapatna 
294563f531d1SSriharsha Basavapatna /* Bind pseudo ring to a LDC resource */
294663f531d1SSriharsha Basavapatna static int
vnet_bind_vgenring(vnet_res_t * vresp)294763f531d1SSriharsha Basavapatna vnet_bind_vgenring(vnet_res_t *vresp)
294863f531d1SSriharsha Basavapatna {
294963f531d1SSriharsha Basavapatna 	vnet_t			*vnetp;
295063f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_group_t	*rx_grp;
295163f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_ring_t	*rx_ringp;
295263f531d1SSriharsha Basavapatna 	mac_perim_handle_t	mph1;
295363f531d1SSriharsha Basavapatna 	int			rv;
295463f531d1SSriharsha Basavapatna 	int			type;
295563f531d1SSriharsha Basavapatna 
295663f531d1SSriharsha Basavapatna 	vnetp = vresp->vnetp;
295763f531d1SSriharsha Basavapatna 	type = vresp->type;
295863f531d1SSriharsha Basavapatna 	rx_grp = &vnetp->rx_grp[0];
295963f531d1SSriharsha Basavapatna 
296063f531d1SSriharsha Basavapatna 	if (type == VIO_NET_RES_LDC_SERVICE) {
296163f531d1SSriharsha Basavapatna 		/*
296263f531d1SSriharsha Basavapatna 		 * Ring Index 0 is the default ring in the group and is
296363f531d1SSriharsha Basavapatna 		 * reserved for LDC_SERVICE in vnet_ring_grp_init(). This ring
296463f531d1SSriharsha Basavapatna 		 * is allocated statically and is reported to the mac layer
296563f531d1SSriharsha Basavapatna 		 * in vnet_m_capab(). So, all we need to do here, is save a
296663f531d1SSriharsha Basavapatna 		 * reference to the associated vresp.
296763f531d1SSriharsha Basavapatna 		 */
296863f531d1SSriharsha Basavapatna 		rx_ringp = &rx_grp->rings[0];
296963f531d1SSriharsha Basavapatna 		rx_ringp->hw_rh = (mac_ring_handle_t)vresp;
297063f531d1SSriharsha Basavapatna 		vresp->rx_ringp = (void *)rx_ringp;
297163f531d1SSriharsha Basavapatna 		return (0);
297263f531d1SSriharsha Basavapatna 	}
297363f531d1SSriharsha Basavapatna 	ASSERT(type == VIO_NET_RES_LDC_GUEST);
297463f531d1SSriharsha Basavapatna 
297563f531d1SSriharsha Basavapatna 	mac_perim_enter_by_mh(vnetp->mh, &mph1);
297663f531d1SSriharsha Basavapatna 
297763f531d1SSriharsha Basavapatna 	rx_ringp = vnet_alloc_pseudo_rx_ring(vnetp);
297863f531d1SSriharsha Basavapatna 	if (rx_ringp == NULL) {
297963f531d1SSriharsha Basavapatna 		cmn_err(CE_WARN, "!vnet%d: Failed to allocate pseudo rx ring",
298063f531d1SSriharsha Basavapatna 		    vnetp->instance);
298163f531d1SSriharsha Basavapatna 		goto fail;
298263f531d1SSriharsha Basavapatna 	}
298363f531d1SSriharsha Basavapatna 
298463f531d1SSriharsha Basavapatna 	/* Store the LDC resource itself as the ring handle */
298563f531d1SSriharsha Basavapatna 	rx_ringp->hw_rh = (mac_ring_handle_t)vresp;
298663f531d1SSriharsha Basavapatna 
298763f531d1SSriharsha Basavapatna 	/*
298863f531d1SSriharsha Basavapatna 	 * Save a reference to the ring in the resource for lookup during
298963f531d1SSriharsha Basavapatna 	 * unbind. Note this is only done for LDC resources. We don't need this
299063f531d1SSriharsha Basavapatna 	 * in the case of a Hybrid resource (see vnet_bind_hwrings()), as its
299163f531d1SSriharsha Basavapatna 	 * rx rings are mapped to reserved pseudo rx rings (index 1 and 2).
299263f531d1SSriharsha Basavapatna 	 */
299363f531d1SSriharsha Basavapatna 	vresp->rx_ringp = (void *)rx_ringp;
299463f531d1SSriharsha Basavapatna 	rx_ringp->state |= VNET_RXRING_LDC_GUEST;
299563f531d1SSriharsha Basavapatna 
299663f531d1SSriharsha Basavapatna 	/* Register the pseudo ring with upper-mac */
299763f531d1SSriharsha Basavapatna 	rv = mac_group_add_ring(rx_grp->handle, rx_ringp->index);
299863f531d1SSriharsha Basavapatna 	if (rv != 0) {
299963f531d1SSriharsha Basavapatna 		rx_ringp->state &= ~VNET_RXRING_LDC_GUEST;
300063f531d1SSriharsha Basavapatna 		rx_ringp->hw_rh = NULL;
300163f531d1SSriharsha Basavapatna 		vnet_free_pseudo_rx_ring(vnetp, rx_ringp);
300263f531d1SSriharsha Basavapatna 		goto fail;
300363f531d1SSriharsha Basavapatna 	}
300463f531d1SSriharsha Basavapatna 
300563f531d1SSriharsha Basavapatna 	mac_perim_exit(mph1);
300663f531d1SSriharsha Basavapatna 	return (0);
300763f531d1SSriharsha Basavapatna fail:
300863f531d1SSriharsha Basavapatna 	mac_perim_exit(mph1);
300963f531d1SSriharsha Basavapatna 	return (1);
301063f531d1SSriharsha Basavapatna }
301163f531d1SSriharsha Basavapatna 
301263f531d1SSriharsha Basavapatna /* Unbind pseudo ring from a LDC resource */
301363f531d1SSriharsha Basavapatna static void
vnet_unbind_vgenring(vnet_res_t * vresp)301463f531d1SSriharsha Basavapatna vnet_unbind_vgenring(vnet_res_t *vresp)
301563f531d1SSriharsha Basavapatna {
301663f531d1SSriharsha Basavapatna 	vnet_t			*vnetp;
301763f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_group_t	*rx_grp;
301863f531d1SSriharsha Basavapatna 	vnet_pseudo_rx_ring_t	*rx_ringp;
301963f531d1SSriharsha Basavapatna 	mac_perim_handle_t	mph1;
302063f531d1SSriharsha Basavapatna 	int			type;
302163f531d1SSriharsha Basavapatna 
302263f531d1SSriharsha Basavapatna 	vnetp = vresp->vnetp;
302363f531d1SSriharsha Basavapatna 	type = vresp->type;
302463f531d1SSriharsha Basavapatna 	rx_grp = &vnetp->rx_grp[0];
302563f531d1SSriharsha Basavapatna 
302663f531d1SSriharsha Basavapatna 	if (vresp->rx_ringp == NULL) {
302763f531d1SSriharsha Basavapatna 		return;
302863f531d1SSriharsha Basavapatna 	}
302963f531d1SSriharsha Basavapatna 
303063f531d1SSriharsha Basavapatna 	if (type == VIO_NET_RES_LDC_SERVICE) {
303163f531d1SSriharsha Basavapatna 		/*
303263f531d1SSriharsha Basavapatna 		 * Ring Index 0 is the default ring in the group and is
303363f531d1SSriharsha Basavapatna 		 * reserved for LDC_SERVICE in vnet_ring_grp_init(). This ring
303463f531d1SSriharsha Basavapatna 		 * is allocated statically and is reported to the mac layer
303563f531d1SSriharsha Basavapatna 		 * in vnet_m_capab(). So, all we need to do here, is remove its
303663f531d1SSriharsha Basavapatna 		 * reference to the associated vresp.
303763f531d1SSriharsha Basavapatna 		 */
303863f531d1SSriharsha Basavapatna 		rx_ringp = &rx_grp->rings[0];
303963f531d1SSriharsha Basavapatna 		rx_ringp->hw_rh = NULL;
304063f531d1SSriharsha Basavapatna 		vresp->rx_ringp = NULL;
304163f531d1SSriharsha Basavapatna 		return;
304263f531d1SSriharsha Basavapatna 	}
304363f531d1SSriharsha Basavapatna 	ASSERT(type == VIO_NET_RES_LDC_GUEST);
304463f531d1SSriharsha Basavapatna 
304563f531d1SSriharsha Basavapatna 	mac_perim_enter_by_mh(vnetp->mh, &mph1);
304663f531d1SSriharsha Basavapatna 
304763f531d1SSriharsha Basavapatna 	rx_ringp = (vnet_pseudo_rx_ring_t *)vresp->rx_ringp;
304863f531d1SSriharsha Basavapatna 	vresp->rx_ringp = NULL;
304963f531d1SSriharsha Basavapatna 
305063f531d1SSriharsha Basavapatna 	if (rx_ringp != NULL && (rx_ringp->state & VNET_RXRING_LDC_GUEST)) {
305163f531d1SSriharsha Basavapatna 		/* Unregister the pseudo ring with upper-mac */
305263f531d1SSriharsha Basavapatna 		mac_group_rem_ring(rx_grp->handle, rx_ringp->handle);
305363f531d1SSriharsha Basavapatna 
305463f531d1SSriharsha Basavapatna 		rx_ringp->hw_rh = NULL;
305563f531d1SSriharsha Basavapatna 		rx_ringp->state &= ~VNET_RXRING_LDC_GUEST;
305663f531d1SSriharsha Basavapatna 
305763f531d1SSriharsha Basavapatna 		/* Free the pseudo rx ring */
305863f531d1SSriharsha Basavapatna 		vnet_free_pseudo_rx_ring(vnetp, rx_ringp);
305963f531d1SSriharsha Basavapatna 	}
306063f531d1SSriharsha Basavapatna 
306163f531d1SSriharsha Basavapatna 	mac_perim_exit(mph1);
306263f531d1SSriharsha Basavapatna }
306363f531d1SSriharsha Basavapatna 
306463f531d1SSriharsha Basavapatna static void
vnet_unbind_rings(vnet_res_t * vresp)306563f531d1SSriharsha Basavapatna vnet_unbind_rings(vnet_res_t *vresp)
306663f531d1SSriharsha Basavapatna {
306763f531d1SSriharsha Basavapatna 	switch (vresp->type) {
306863f531d1SSriharsha Basavapatna 
306963f531d1SSriharsha Basavapatna 	case VIO_NET_RES_LDC_SERVICE:
307063f531d1SSriharsha Basavapatna 	case VIO_NET_RES_LDC_GUEST:
307163f531d1SSriharsha Basavapatna 		vnet_unbind_vgenring(vresp);
307263f531d1SSriharsha Basavapatna 		break;
307363f531d1SSriharsha Basavapatna 
307463f531d1SSriharsha Basavapatna 	case VIO_NET_RES_HYBRID:
307563f531d1SSriharsha Basavapatna 		vnet_unbind_hwrings(vresp->vnetp);
307663f531d1SSriharsha Basavapatna 		break;
307763f531d1SSriharsha Basavapatna 
307863f531d1SSriharsha Basavapatna 	default:
307963f531d1SSriharsha Basavapatna 		break;
308063f531d1SSriharsha Basavapatna 
308163f531d1SSriharsha Basavapatna 	}
308263f531d1SSriharsha Basavapatna }
308363f531d1SSriharsha Basavapatna 
308463f531d1SSriharsha Basavapatna static int
vnet_bind_rings(vnet_res_t * vresp)308563f531d1SSriharsha Basavapatna vnet_bind_rings(vnet_res_t *vresp)
308663f531d1SSriharsha Basavapatna {
308763f531d1SSriharsha Basavapatna 	int	rv;
308863f531d1SSriharsha Basavapatna 
308963f531d1SSriharsha Basavapatna 	switch (vresp->type) {
309063f531d1SSriharsha Basavapatna 
309163f531d1SSriharsha Basavapatna 	case VIO_NET_RES_LDC_SERVICE:
309263f531d1SSriharsha Basavapatna 	case VIO_NET_RES_LDC_GUEST:
309363f531d1SSriharsha Basavapatna 		rv = vnet_bind_vgenring(vresp);
309463f531d1SSriharsha Basavapatna 		break;
309563f531d1SSriharsha Basavapatna 
309663f531d1SSriharsha Basavapatna 	case VIO_NET_RES_HYBRID:
309763f531d1SSriharsha Basavapatna 		rv = vnet_bind_hwrings(vresp->vnetp);
309863f531d1SSriharsha Basavapatna 		break;
309963f531d1SSriharsha Basavapatna 
310063f531d1SSriharsha Basavapatna 	default:
310163f531d1SSriharsha Basavapatna 		rv = 1;
310263f531d1SSriharsha Basavapatna 		break;
310363f531d1SSriharsha Basavapatna 
310463f531d1SSriharsha Basavapatna 	}
310563f531d1SSriharsha Basavapatna 
310663f531d1SSriharsha Basavapatna 	return (rv);
310763f531d1SSriharsha Basavapatna }
310863f531d1SSriharsha Basavapatna 
310963f531d1SSriharsha Basavapatna /* ARGSUSED */
311063f531d1SSriharsha Basavapatna int
vnet_hio_stat(void * arg,uint_t stat,uint64_t * val)311163f531d1SSriharsha Basavapatna vnet_hio_stat(void *arg, uint_t stat, uint64_t *val)
311263f531d1SSriharsha Basavapatna {
311363f531d1SSriharsha Basavapatna 	vnet_t	*vnetp = (vnet_t *)arg;
311463f531d1SSriharsha Basavapatna 
311563f531d1SSriharsha Basavapatna 	*val = mac_stat_get(vnetp->hio_mh, stat);
311663f531d1SSriharsha Basavapatna 	return (0);
311763f531d1SSriharsha Basavapatna }
311863f531d1SSriharsha Basavapatna 
311963f531d1SSriharsha Basavapatna /*
312063f531d1SSriharsha Basavapatna  * The start() and stop() routines for the Hybrid resource below, are just
312163f531d1SSriharsha Basavapatna  * dummy functions. This is provided to avoid resource type specific code in
312263f531d1SSriharsha Basavapatna  * vnet_start_resources() and vnet_stop_resources(). The starting and stopping
312363f531d1SSriharsha Basavapatna  * of the Hybrid resource happens in the context of the mac_client interfaces
312463f531d1SSriharsha Basavapatna  * that are invoked in vnet_hio_mac_init() and vnet_hio_mac_cleanup().
312563f531d1SSriharsha Basavapatna  */
312663f531d1SSriharsha Basavapatna /* ARGSUSED */
312763f531d1SSriharsha Basavapatna static int
vnet_hio_start(void * arg)312863f531d1SSriharsha Basavapatna vnet_hio_start(void *arg)
312963f531d1SSriharsha Basavapatna {
313063f531d1SSriharsha Basavapatna 	return (0);
313163f531d1SSriharsha Basavapatna }
313263f531d1SSriharsha Basavapatna 
313363f531d1SSriharsha Basavapatna /* ARGSUSED */
313463f531d1SSriharsha Basavapatna static void
vnet_hio_stop(void * arg)313563f531d1SSriharsha Basavapatna vnet_hio_stop(void *arg)
313663f531d1SSriharsha Basavapatna {
313763f531d1SSriharsha Basavapatna }
313863f531d1SSriharsha Basavapatna 
313963f531d1SSriharsha Basavapatna mblk_t *
vnet_hio_tx(void * arg,mblk_t * mp)314063f531d1SSriharsha Basavapatna vnet_hio_tx(void *arg, mblk_t *mp)
314163f531d1SSriharsha Basavapatna {
314263f531d1SSriharsha Basavapatna 	vnet_pseudo_tx_ring_t	*tx_ringp;
314363f531d1SSriharsha Basavapatna 	mblk_t			*nextp;
314463f531d1SSriharsha Basavapatna 	mblk_t			*ret_mp;
314563f531d1SSriharsha Basavapatna 
314663f531d1SSriharsha Basavapatna 	tx_ringp = (vnet_pseudo_tx_ring_t *)arg;
314763f531d1SSriharsha Basavapatna 	for (;;) {
314863f531d1SSriharsha Basavapatna 		nextp = mp->b_next;
314963f531d1SSriharsha Basavapatna 		mp->b_next = NULL;
315063f531d1SSriharsha Basavapatna 
315163f531d1SSriharsha Basavapatna 		ret_mp = mac_hwring_tx(tx_ringp->hw_rh, mp);
315263f531d1SSriharsha Basavapatna 		if (ret_mp != NULL) {
315363f531d1SSriharsha Basavapatna 			ret_mp->b_next = nextp;
315463f531d1SSriharsha Basavapatna 			mp = ret_mp;
315563f531d1SSriharsha Basavapatna 			break;
315663f531d1SSriharsha Basavapatna 		}
315763f531d1SSriharsha Basavapatna 
315863f531d1SSriharsha Basavapatna 		if ((mp = nextp) == NULL)
315963f531d1SSriharsha Basavapatna 			break;
316063f531d1SSriharsha Basavapatna 	}
316163f531d1SSriharsha Basavapatna 	return (mp);
316263f531d1SSriharsha Basavapatna }
316363f531d1SSriharsha Basavapatna 
31641107ea93SSriharsha Basavapatna #ifdef	VNET_IOC_DEBUG
31651107ea93SSriharsha Basavapatna 
31661107ea93SSriharsha Basavapatna /*
31671107ea93SSriharsha Basavapatna  * The ioctl entry point is used only for debugging for now. The ioctl commands
31681107ea93SSriharsha Basavapatna  * can be used to force the link state of the channel connected to vsw.
31691107ea93SSriharsha Basavapatna  */
31701107ea93SSriharsha Basavapatna static void
vnet_m_ioctl(void * arg,queue_t * q,mblk_t * mp)31711107ea93SSriharsha Basavapatna vnet_m_ioctl(void *arg, queue_t *q, mblk_t *mp)
31721107ea93SSriharsha Basavapatna {
31731107ea93SSriharsha Basavapatna 	struct iocblk	*iocp;
31741107ea93SSriharsha Basavapatna 	vnet_t		*vnetp;
31751107ea93SSriharsha Basavapatna 
31761107ea93SSriharsha Basavapatna 	iocp = (struct iocblk *)(uintptr_t)mp->b_rptr;
31771107ea93SSriharsha Basavapatna 	iocp->ioc_error = 0;
31781107ea93SSriharsha Basavapatna 	vnetp = (vnet_t *)arg;
31791107ea93SSriharsha Basavapatna 
31801107ea93SSriharsha Basavapatna 	if (vnetp == NULL) {
31811107ea93SSriharsha Basavapatna 		miocnak(q, mp, 0, EINVAL);
31821107ea93SSriharsha Basavapatna 		return;
31831107ea93SSriharsha Basavapatna 	}
31841107ea93SSriharsha Basavapatna 
31851107ea93SSriharsha Basavapatna 	switch (iocp->ioc_cmd) {
31861107ea93SSriharsha Basavapatna 
31871107ea93SSriharsha Basavapatna 	case VNET_FORCE_LINK_DOWN:
31881107ea93SSriharsha Basavapatna 	case VNET_FORCE_LINK_UP:
31891107ea93SSriharsha Basavapatna 		vnet_force_link_state(vnetp, q, mp);
31901107ea93SSriharsha Basavapatna 		break;
31911107ea93SSriharsha Basavapatna 
31921107ea93SSriharsha Basavapatna 	default:
31931107ea93SSriharsha Basavapatna 		iocp->ioc_error = EINVAL;
31941107ea93SSriharsha Basavapatna 		miocnak(q, mp, 0, iocp->ioc_error);
31951107ea93SSriharsha Basavapatna 		break;
31961107ea93SSriharsha Basavapatna 
31971107ea93SSriharsha Basavapatna 	}
31981107ea93SSriharsha Basavapatna }
31991107ea93SSriharsha Basavapatna 
32001107ea93SSriharsha Basavapatna static void
vnet_force_link_state(vnet_t * vnetp,queue_t * q,mblk_t * mp)32011107ea93SSriharsha Basavapatna vnet_force_link_state(vnet_t *vnetp, queue_t *q, mblk_t *mp)
32021107ea93SSriharsha Basavapatna {
32031107ea93SSriharsha Basavapatna 	mac_register_t	*macp;
32041107ea93SSriharsha Basavapatna 	mac_callbacks_t	*cbp;
32051107ea93SSriharsha Basavapatna 	vnet_res_t	*vresp;
32061107ea93SSriharsha Basavapatna 
32071107ea93SSriharsha Basavapatna 	READ_ENTER(&vnetp->vsw_fp_rw);
32081107ea93SSriharsha Basavapatna 
32091107ea93SSriharsha Basavapatna 	vresp = vnetp->vsw_fp;
32101107ea93SSriharsha Basavapatna 	if (vresp == NULL) {
32111107ea93SSriharsha Basavapatna 		RW_EXIT(&vnetp->vsw_fp_rw);
32121107ea93SSriharsha Basavapatna 		return;
32131107ea93SSriharsha Basavapatna 	}
32141107ea93SSriharsha Basavapatna 
32151107ea93SSriharsha Basavapatna 	macp = &vresp->macreg;
32161107ea93SSriharsha Basavapatna 	cbp = macp->m_callbacks;
32171107ea93SSriharsha Basavapatna 	cbp->mc_ioctl(macp->m_driver, q, mp);
32181107ea93SSriharsha Basavapatna 
32191107ea93SSriharsha Basavapatna 	RW_EXIT(&vnetp->vsw_fp_rw);
32201107ea93SSriharsha Basavapatna }
32211107ea93SSriharsha Basavapatna 
32221107ea93SSriharsha Basavapatna #else
32231107ea93SSriharsha Basavapatna 
32241107ea93SSriharsha Basavapatna static void
vnet_m_ioctl(void * arg,queue_t * q,mblk_t * mp)32251107ea93SSriharsha Basavapatna vnet_m_ioctl(void *arg, queue_t *q, mblk_t *mp)
32261107ea93SSriharsha Basavapatna {
32271107ea93SSriharsha Basavapatna 	vnet_t		*vnetp;
32281107ea93SSriharsha Basavapatna 
32291107ea93SSriharsha Basavapatna 	vnetp = (vnet_t *)arg;
32301107ea93SSriharsha Basavapatna 
32311107ea93SSriharsha Basavapatna 	if (vnetp == NULL) {
32321107ea93SSriharsha Basavapatna 		miocnak(q, mp, 0, EINVAL);
32331107ea93SSriharsha Basavapatna 		return;
32341107ea93SSriharsha Basavapatna 	}
32351107ea93SSriharsha Basavapatna 
32361107ea93SSriharsha Basavapatna 	/* ioctl support only for debugging */
32371107ea93SSriharsha Basavapatna 	miocnak(q, mp, 0, ENOTSUP);
32381107ea93SSriharsha Basavapatna }
32391107ea93SSriharsha Basavapatna 
32401107ea93SSriharsha Basavapatna #endif
3241