xref: /freebsd/sys/dev/virtio/network/if_vtnetvar.h (revision c66ec88fed842fbaad62c30d510644ceb7bd2d71)
1 /*-
2  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
3  *
4  * Copyright (c) 2011, Bryan Venteicher <bryanv@FreeBSD.org>
5  * All rights reserved.
6  *
7  * Redistribution and use in source and binary forms, with or without
8  * modification, are permitted provided that the following conditions
9  * are met:
10  * 1. Redistributions of source code must retain the above copyright
11  *    notice unmodified, this list of conditions, and the following
12  *    disclaimer.
13  * 2. Redistributions in binary form must reproduce the above copyright
14  *    notice, this list of conditions and the following disclaimer in the
15  *    documentation and/or other materials provided with the distribution.
16  *
17  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
18  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
19  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
20  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
21  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
22  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
23  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
24  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
26  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27  *
28  * $FreeBSD$
29  */
30 
31 #ifndef _IF_VTNETVAR_H
32 #define _IF_VTNETVAR_H
33 
/*
 * Forward declaration: the per-queue structures below hold a pointer to the
 * softc, whose full definition appears later in this header.
 */
struct vtnet_softc;
35 
/*
 * Driver-wide counters, each 64 bits wide. The last six members are, per
 * the comment inside the structure, accumulated from each Rx/Tx queue.
 * NOTE(review): the meaning of the individual counters is only implied by
 * their names here; confirm against the code that increments them.
 */
struct vtnet_statistics {
	uint64_t	mbuf_alloc_failed;

	uint64_t	rx_frame_too_large;
	uint64_t	rx_enq_replacement_failed;
	uint64_t	rx_mergeable_failed;
	uint64_t	rx_csum_bad_ethtype;
	uint64_t	rx_csum_bad_ipproto;
	uint64_t	rx_csum_bad_offset;
	uint64_t	rx_csum_bad_proto;
	uint64_t	tx_csum_bad_ethtype;
	uint64_t	tx_tso_bad_ethtype;
	uint64_t	tx_tso_not_tcp;
	uint64_t	tx_defragged;
	uint64_t	tx_defrag_failed;

	/*
	 * These are accumulated from each Rx/Tx queue.
	 */
	uint64_t	rx_csum_failed;
	uint64_t	rx_csum_offloaded;
	uint64_t	rx_task_rescheduled;
	uint64_t	tx_csum_offloaded;
	uint64_t	tx_tso_offloaded;
	uint64_t	tx_task_rescheduled;
};
62 
/*
 * Counters kept per receive queue (embedded in struct vtnet_rxq as
 * vtnrx_stats). The trailing comments on the first four members name the
 * interface counter each one is associated with.
 * NOTE(review): the last three presumably feed rx_csum_offloaded,
 * rx_csum_failed and rx_task_rescheduled in struct vtnet_statistics;
 * confirm in the driver.
 */
struct vtnet_rxq_stats {
	uint64_t	vrxs_ipackets;	/* if_ipackets */
	uint64_t	vrxs_ibytes;	/* if_ibytes */
	uint64_t	vrxs_iqdrops;	/* if_iqdrops */
	uint64_t	vrxs_ierrors;	/* if_ierrors */
	uint64_t	vrxs_csum;
	uint64_t	vrxs_csum_failed;
	uint64_t	vrxs_rescheduled;
};
72 
/*
 * State for one receive queue. The structure is aligned to
 * CACHE_LINE_SIZE. vtnrx_mtx is the mutex the VTNET_RXQ_LOCK*() macros
 * operate on. The two netmap members exist only when DEV_NETMAP is defined.
 */
struct vtnet_rxq {
	struct mtx		 vtnrx_mtx;
	struct vtnet_softc	*vtnrx_sc;	/* presumably the owning softc */
	struct virtqueue	*vtnrx_vq;
	struct sglist		*vtnrx_sg;
	int			 vtnrx_id;
	struct vtnet_rxq_stats	 vtnrx_stats;	/* per-queue counters */
	struct taskqueue	*vtnrx_tq;
	struct task		 vtnrx_intrtask;
#ifdef DEV_NETMAP
	uint32_t		 vtnrx_nm_refill;
	struct virtio_net_hdr_mrg_rxbuf vtnrx_shrhdr;
#endif  /* DEV_NETMAP */
	char			 vtnrx_name[16];
} __aligned(CACHE_LINE_SIZE);
88 
/*
 * Receive queue locking helpers. Each macro takes a pointer to a
 * struct vtnet_rxq and applies the named mutex operation to its
 * vtnrx_mtx member.
 */
#define VTNET_RXQ_LOCK(_q)						\
    mtx_lock(&(_q)->vtnrx_mtx)
#define VTNET_RXQ_UNLOCK(_q)						\
    mtx_unlock(&(_q)->vtnrx_mtx)
#define VTNET_RXQ_LOCK_ASSERT(_q)					\
    mtx_assert(&(_q)->vtnrx_mtx, MA_OWNED)
#define VTNET_RXQ_LOCK_ASSERT_NOTOWNED(_q)				\
    mtx_assert(&(_q)->vtnrx_mtx, MA_NOTOWNED)
95 
/*
 * Counters kept per transmit queue (embedded in struct vtnet_txq as
 * vtntx_stats). The trailing comments on the first three members name the
 * interface counter each one is associated with.
 * NOTE(review): the last three presumably feed tx_csum_offloaded,
 * tx_tso_offloaded and tx_task_rescheduled in struct vtnet_statistics;
 * confirm in the driver.
 */
struct vtnet_txq_stats {
	uint64_t vtxs_opackets;	/* if_opackets */
	uint64_t vtxs_obytes;	/* if_obytes */
	uint64_t vtxs_omcasts;	/* if_omcasts */
	uint64_t vtxs_csum;
	uint64_t vtxs_tso;
	uint64_t vtxs_rescheduled;
};
104 
/*
 * State for one transmit queue. The structure is aligned to
 * CACHE_LINE_SIZE. vtntx_mtx is the mutex the VTNET_TXQ_*LOCK*() macros
 * operate on. vtntx_br and vtntx_defrtask are compiled out when
 * VTNET_LEGACY_TX is defined, and vtntx_shrhdr exists only when DEV_NETMAP
 * is defined.
 */
struct vtnet_txq {
	struct mtx		 vtntx_mtx;
	struct vtnet_softc	*vtntx_sc;	/* presumably the owning softc */
	struct virtqueue	*vtntx_vq;
	struct sglist		*vtntx_sg;
#ifndef VTNET_LEGACY_TX
	struct buf_ring		*vtntx_br;
#endif
	int			 vtntx_id;
	int			 vtntx_watchdog;
	struct vtnet_txq_stats	 vtntx_stats;	/* per-queue counters */
	struct taskqueue	*vtntx_tq;
	struct task		 vtntx_intrtask;
#ifndef VTNET_LEGACY_TX
	struct task		 vtntx_defrtask;
#endif
#ifdef DEV_NETMAP
	struct virtio_net_hdr_mrg_rxbuf vtntx_shrhdr;
#endif  /* DEV_NETMAP */
	char			 vtntx_name[16];
} __aligned(CACHE_LINE_SIZE);
126 
/*
 * Transmit queue locking helpers. Each macro takes a pointer to a
 * struct vtnet_txq and applies the named mutex operation to its
 * vtntx_mtx member. VTNET_TXQ_TRYLOCK() evaluates to the result of
 * mtx_trylock().
 */
#define VTNET_TXQ_LOCK(_q)						\
    mtx_lock(&(_q)->vtntx_mtx)
#define VTNET_TXQ_TRYLOCK(_q)						\
    mtx_trylock(&(_q)->vtntx_mtx)
#define VTNET_TXQ_UNLOCK(_q)						\
    mtx_unlock(&(_q)->vtntx_mtx)
#define VTNET_TXQ_LOCK_ASSERT(_q)					\
    mtx_assert(&(_q)->vtntx_mtx, MA_OWNED)
#define VTNET_TXQ_LOCK_ASSERT_NOTOWNED(_q)				\
    mtx_assert(&(_q)->vtntx_mtx, MA_NOTOWNED)
134 
/*
 * Per-device driver state.
 *
 * The VTNET_FLAG_* constants defined inline are the bit values stored in
 * vtnet_flags. vtnet_mtx is the mutex the VTNET_CORE_*() macros operate on,
 * and vtnet_mtx_name is the buffer VTNET_CORE_LOCK_INIT() formats the lock
 * name into.
 * NOTE(review): vtnet_rxqs/vtnet_txqs are presumably arrays of per-queue
 * state and vtnet_vlan_filter presumably points at a table of
 * VTNET_VLAN_FILTER_NWORDS words; confirm against the allocation code.
 */
struct vtnet_softc {
	device_t		 vtnet_dev;
	struct ifnet		*vtnet_ifp;
	struct vtnet_rxq	*vtnet_rxqs;
	struct vtnet_txq	*vtnet_txqs;
	pfil_head_t		 vtnet_pfil;

	uint32_t		 vtnet_flags;	/* VTNET_FLAG_* bits below */
#define VTNET_FLAG_SUSPENDED	 0x0001
#define VTNET_FLAG_MAC		 0x0002
#define VTNET_FLAG_CTRL_VQ	 0x0004
#define VTNET_FLAG_CTRL_RX	 0x0008
#define VTNET_FLAG_CTRL_MAC	 0x0010
#define VTNET_FLAG_VLAN_FILTER	 0x0020
#define VTNET_FLAG_TSO_ECN	 0x0040
#define VTNET_FLAG_MRG_RXBUFS	 0x0080
#define VTNET_FLAG_LRO_NOMRG	 0x0100
#define VTNET_FLAG_MULTIQ	 0x0200
#define VTNET_FLAG_INDIRECT	 0x0400
#define VTNET_FLAG_EVENT_IDX	 0x0800

	int			 vtnet_link_active;
	int			 vtnet_hdr_size;
	int			 vtnet_rx_process_limit;
	int			 vtnet_rx_nsegs;
	int			 vtnet_rx_nmbufs;
	int			 vtnet_rx_clsize;
	int			 vtnet_rx_new_clsize;
	int			 vtnet_tx_intr_thresh;
	int			 vtnet_tx_nsegs;
	int			 vtnet_if_flags;
	int			 vtnet_act_vq_pairs;
	int			 vtnet_max_vq_pairs;
	int			 vtnet_requested_vq_pairs;

	struct virtqueue	*vtnet_ctrl_vq;
	struct vtnet_mac_filter	*vtnet_mac_filter;
	uint32_t		*vtnet_vlan_filter;

	uint64_t		 vtnet_features;
	struct vtnet_statistics	 vtnet_stats;
	struct callout		 vtnet_tick_ch;
	struct ifmedia		 vtnet_media;
	eventhandler_tag	 vtnet_vlan_attach;
	eventhandler_tag	 vtnet_vlan_detach;

	struct mtx		 vtnet_mtx;	/* see VTNET_CORE_MTX() */
	char			 vtnet_mtx_name[16];
	char			 vtnet_hwaddr[ETHER_ADDR_LEN];
};
185 
/*
 * Upper bound on the number of Rx/Tx queue pairs the driver will
 * autoconfigure to.
 */
#define VTNET_MAX_QUEUE_PAIRS	8
190 
/*
 * Additional completed entries can appear in a virtqueue before we can
 * reenable interrupts. This is the number of times to retry before
 * scheduling the taskqueue to process the completed entries.
 */
#define VTNET_INTR_DISABLE_RETRIES	4
197 
/*
 * Similarly, additional completed entries can appear in a virtqueue
 * between when it was last checked and before notifying the host. This
 * is the number of times to retry before scheduling the taskqueue to
 * process the queue.
 */
#define VTNET_NOTIFY_RETRIES		4
205 
/*
 * Fake the media type. The host does not provide us with any real media
 * information, so a fixed combination of ifmedia flags (IFM_ETHER,
 * IFM_10G_T and IFM_FDX) is used instead.
 */
#define VTNET_MEDIATYPE		 (IFM_ETHER | IFM_10G_T | IFM_FDX)
211 
/*
 * Number of words to allocate for the VLAN shadow table. There is one
 * bit for each VLAN: 4096 bits packed into 32-bit words gives 128 words.
 */
#define VTNET_VLAN_FILTER_NWORDS	(4096 / 32)
217 
/*
 * When mergeable buffers are not negotiated, the vtnet_rx_header structure
 * below is placed at the beginning of the mbuf data. Use 4 bytes of pad to
 * both keep the VirtIO header and the data non-contiguous and to keep the
 * frame's payload 4 byte aligned. Note that non-legacy drivers still want
 * room for a full mergeable buffer header.
 *
 * When mergeable buffers are negotiated, the host puts the VirtIO header in
 * the beginning of the first mbuf's data.
 *
 * The structure is declared __packed, and the union gives both header
 * layouts the same storage, so the structure is sized for the larger one.
 */
#define VTNET_RX_HEADER_PAD	4
struct vtnet_rx_header {
	union {
		struct virtio_net_hdr		hdr;
		struct virtio_net_hdr_mrg_rxbuf	mhdr;
	} vrh_uhdr;

	char	vrh_pad[VTNET_RX_HEADER_PAD];	/* pad described above */
} __packed;
237 
/*
 * For each outgoing frame, the vtnet_tx_header below is allocated from
 * the vtnet_tx_header_zone. The union gives both VirtIO header layouts the
 * same storage.
 * NOTE(review): vth_mbuf is presumably the mbuf chain being transmitted
 * with this header; confirm in the transmit path.
 */
struct vtnet_tx_header {
	union {
		struct virtio_net_hdr		hdr;
		struct virtio_net_hdr_mrg_rxbuf	mhdr;
	} vth_uhdr;

	struct mbuf *vth_mbuf;
};
250 
/*
 * The VirtIO specification does not place a limit on the number of MAC
 * addresses the guest driver may request to be filtered. In practice,
 * the host is constrained by available resources. To simplify this driver,
 * impose a reasonably high limit of MAC addresses we will filter before
 * falling back to promiscuous or all-multicast modes.
 *
 * This value sizes the macs[] array in struct vtnet_mac_table.
 */
#define VTNET_MAX_MAC_ENTRIES	128
259 
/*
 * One MAC filter table: an entry count followed by room for
 * VTNET_MAX_MAC_ENTRIES addresses of ETHER_ADDR_LEN bytes each. Declared
 * __packed.
 * NOTE(review): nentries is presumably the number of valid rows in macs[];
 * confirm in the filter setup code.
 */
struct vtnet_mac_table {
	uint32_t	nentries;
	uint8_t		macs[VTNET_MAX_MAC_ENTRIES][ETHER_ADDR_LEN];
} __packed;
264 
/*
 * Pair of MAC tables, one for unicast and one for multicast addresses,
 * separated by a pad word so the two tables are not contiguous in memory.
 */
struct vtnet_mac_filter {
	struct vtnet_mac_table	vmf_unicast;
	uint32_t		vmf_pad; /* Make tables non-contiguous. */
	struct vtnet_mac_table	vmf_multicast;
};
270 
/*
 * The MAC filter table is malloc(9)'d when needed. Ensure at compile time
 * that it will always fit in one segment, i.e. that the whole structure is
 * no larger than PAGE_SIZE.
 */
CTASSERT(sizeof(struct vtnet_mac_filter) <= PAGE_SIZE);
276 
/*
 * NOTE(review): VTNET_TX_TIMEOUT is presumably the initial value of the
 * per-queue vtntx_watchdog countdown; its unit is not visible in this
 * header, so confirm in the driver.
 */
#define VTNET_TX_TIMEOUT	5
/* Checksum offload flags for TCP and UDP, without and with the _IPV6 suffix. */
#define VTNET_CSUM_OFFLOAD	(CSUM_TCP | CSUM_UDP)
#define VTNET_CSUM_OFFLOAD_IPV6	(CSUM_TCP_IPV6 | CSUM_UDP_IPV6)

/* Union of both checksum offload masks plus CSUM_TSO. */
#define VTNET_CSUM_ALL_OFFLOAD	\
    (VTNET_CSUM_OFFLOAD | VTNET_CSUM_OFFLOAD_IPV6 | CSUM_TSO)
283 
/*
 * Features desired/implemented by this driver. The mask is a plain
 * bitwise OR of feature bits, grouped here by name prefix for readability.
 */
#define VTNET_FEATURES (						\
    /* MAC, status and CTRL_* bits */					\
    VIRTIO_NET_F_MAC | VIRTIO_NET_F_STATUS |				\
    VIRTIO_NET_F_CTRL_VQ | VIRTIO_NET_F_CTRL_RX |			\
    VIRTIO_NET_F_CTRL_MAC_ADDR | VIRTIO_NET_F_CTRL_VLAN |		\
    /* CSUM, GSO and HOST_* bits */					\
    VIRTIO_NET_F_CSUM | VIRTIO_NET_F_GSO |				\
    VIRTIO_NET_F_HOST_TSO4 | VIRTIO_NET_F_HOST_TSO6 |			\
    VIRTIO_NET_F_HOST_ECN |						\
    /* GUEST_* bits */							\
    VIRTIO_NET_F_GUEST_CSUM | VIRTIO_NET_F_GUEST_TSO4 |			\
    VIRTIO_NET_F_GUEST_TSO6 | VIRTIO_NET_F_GUEST_ECN |			\
    /* Mergeable Rx buffers and multiqueue */				\
    VIRTIO_NET_F_MRG_RXBUF | VIRTIO_NET_F_MQ |				\
    /* VIRTIO_RING_F_* and VIRTIO_F_* bits */				\
    VIRTIO_RING_F_EVENT_IDX | VIRTIO_RING_F_INDIRECT_DESC |		\
    VIRTIO_F_VERSION_1)
306 
/*
 * The VIRTIO_NET_F_HOST_TSO[46] features permit us to send the host
 * frames larger than 1514 bytes. This mask collects those bits together
 * with the GSO and HOST_ECN bits.
 */
#define VTNET_TSO_FEATURES \
    (VIRTIO_NET_F_GSO			| \
     VIRTIO_NET_F_HOST_TSO4		| \
     VIRTIO_NET_F_HOST_TSO6		| \
     VIRTIO_NET_F_HOST_ECN)
313 
/*
 * The VIRTIO_NET_F_GUEST_TSO[46] features permit the host to send us
 * frames larger than 1514 bytes. We do not yet support software LRO
 * via tcp_lro_rx(). This mask collects those bits together with the
 * GUEST_ECN bit.
 */
#define VTNET_LRO_FEATURES \
    (VIRTIO_NET_F_GUEST_TSO4		| \
     VIRTIO_NET_F_GUEST_TSO6		| \
     VIRTIO_NET_F_GUEST_ECN)
321 
/*
 * Size limits checked by the CTASSERTs further down in this header.
 * NOTE(review): VTNET_MAX_RX_SIZE exceeds VTNET_MAX_MTU by 14 bytes,
 * presumably the Ethernet header; confirm the intent.
 */
#define VTNET_MAX_MTU		65536
#define VTNET_MAX_RX_SIZE	65550
324 
/*
 * Used to preallocate the Vq indirect descriptors. The first segment
 * is reserved for the header, except for mergeable buffers since the
 * header is placed inline with the data.
 *
 * These are segment counts for the receive (RX) and transmit (TX)
 * directions.
 */
#define VTNET_MRG_RX_SEGS	1
#define VTNET_MIN_RX_SEGS	2
#define VTNET_MAX_RX_SEGS	34
#define VTNET_MIN_TX_SEGS	32
#define VTNET_MAX_TX_SEGS	64
335 
/*
 * Assert we can receive and transmit the maximum with regular
 * size clusters. One segment is subtracted from each maximum before
 * multiplying by MCLBYTES.
 * NOTE(review): the subtracted segment is presumably the one reserved for
 * the header; confirm.
 */
CTASSERT(((VTNET_MAX_RX_SEGS - 1) * MCLBYTES) >= VTNET_MAX_RX_SIZE);
CTASSERT(((VTNET_MAX_TX_SEGS - 1) * MCLBYTES) >= VTNET_MAX_MTU);
342 
/*
 * Number of slots in the Tx bufrings. This value matches most other
 * multiqueue drivers.
 * NOTE(review): presumably only relevant when VTNET_LEGACY_TX is not
 * defined, since the vtntx_br member is compiled out otherwise; confirm.
 */
#define VTNET_DEFAULT_BUFRING_SIZE	4096
348 
/*
 * Determine how many mbufs are in each receive buffer. For LRO without
 * mergeable buffers, we must allocate an mbuf chain large enough to
 * hold both the vtnet_rx_header and the maximum receivable data.
 *
 * Evaluates to 1 unless VTNET_FLAG_LRO_NOMRG is set in (_sc)->vtnet_flags.
 * In that case it is howmany() applied to
 * sizeof(struct vtnet_rx_header) + VTNET_MAX_RX_SIZE and (_clsize), i.e.
 * the number of (_clsize)-byte clusters needed, rounded up.
 *
 * The whole expansion is parenthesized so that operators surrounding a
 * use of the macro cannot regroup the conditional expression.
 */
#define VTNET_NEEDED_RX_MBUFS(_sc, _clsize)				\
	(((_sc)->vtnet_flags & VTNET_FLAG_LRO_NOMRG) == 0 ? 1 :		\
	    howmany(sizeof(struct vtnet_rx_header) + VTNET_MAX_RX_SIZE,	\
	        (_clsize)))
358 
/*
 * Core lock helpers. VTNET_CORE_MTX() yields a pointer to the softc's
 * vtnet_mtx; the remaining macros apply the named mutex operation to it.
 * The pointer expression is fully parenthesized so it stays a single
 * operand when followed by a postfix operator such as "->".
 */
#define VTNET_CORE_MTX(_sc)		(&(_sc)->vtnet_mtx)
#define VTNET_CORE_LOCK(_sc)		mtx_lock(VTNET_CORE_MTX((_sc)))
#define VTNET_CORE_UNLOCK(_sc)		mtx_unlock(VTNET_CORE_MTX((_sc)))
#define VTNET_CORE_LOCK_DESTROY(_sc)	mtx_destroy(VTNET_CORE_MTX((_sc)))
#define VTNET_CORE_LOCK_ASSERT(_sc)		\
    mtx_assert(VTNET_CORE_MTX((_sc)), MA_OWNED)
#define VTNET_CORE_LOCK_ASSERT_NOTOWNED(_sc)	\
    mtx_assert(VTNET_CORE_MTX((_sc)), MA_NOTOWNED)
367 
/*
 * Initialize the core lock: format the device's name/unit string into
 * vtnet_mtx_name (bounded by the size of that buffer), then initialize
 * the mutex as an MTX_DEF mutex with that name and the type string
 * "VTNET Core Lock". The argument is evaluated more than once.
 */
#define VTNET_CORE_LOCK_INIT(_softc)					\
do {									\
	snprintf((_softc)->vtnet_mtx_name,				\
	    sizeof((_softc)->vtnet_mtx_name), "%s",			\
	    device_get_nameunit((_softc)->vtnet_dev));			\
	mtx_init(VTNET_CORE_MTX((_softc)),				\
	    (_softc)->vtnet_mtx_name, "VTNET Core Lock", MTX_DEF);	\
} while (0)
374 
/*
 * Values for the init_mode argument of vtnet_init_locked().
 * NOTE(review): a value of 0 is presumably the ordinary, non-netmap case;
 * confirm against vtnet_init_locked().
 */
#define VTNET_INIT_NETMAP_ENTER		1
#define VTNET_INIT_NETMAP_EXIT		2
380 
381 #endif /* _IF_VTNETVAR_H */
382