/*-
 * SPDX-License-Identifier: BSD-2-Clause
 *
 * Copyright (C) 2011-2014 Matteo Landi, Luigi Rizzo
 * Copyright (C) 2013-2016 Universita` di Pisa
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 *   1. Redistributions of source code must retain the above copyright
 *      notice, this list of conditions and the following disclaimer.
 *   2. Redistributions in binary form must reproduce the above copyright
 *      notice, this list of conditions and the following disclaimer in the
 *      documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */
2968b8534bSLuigi Rizzo
/*
 * This header contains the definitions of constants and function
 * prototypes used only in kernelspace.
 */
3568b8534bSLuigi Rizzo
3668b8534bSLuigi Rizzo #ifndef _NET_NETMAP_KERN_H_
3768b8534bSLuigi Rizzo #define _NET_NETMAP_KERN_H_
3868b8534bSLuigi Rizzo
/*
 * Compile-time selection of the optional netmap subsystems.
 *
 * On Linux each WITH_* switch is defined only when the matching
 * CONFIG_NETMAP_* option is defined. On Windows and on every other
 * platform a fixed set of switches is always defined.
 */
#if defined(linux)

#if defined(CONFIG_NETMAP_EXTMEM)
#define WITH_EXTMEM
#endif
#if defined(CONFIG_NETMAP_VALE)
#define WITH_VALE
#endif
#if defined(CONFIG_NETMAP_PIPE)
#define WITH_PIPES
#endif
#if defined(CONFIG_NETMAP_MONITOR)
#define WITH_MONITOR
#endif
#if defined(CONFIG_NETMAP_GENERIC)
#define WITH_GENERIC
#endif
#if defined(CONFIG_NETMAP_PTNETMAP)
#define WITH_PTNETMAP
#endif
#if defined(CONFIG_NETMAP_SINK)
#define WITH_SINK
#endif
#if defined(CONFIG_NETMAP_NULL)
#define WITH_NMNULL
#endif

#elif defined (_WIN32)
#define WITH_VALE	// comment out to disable VALE support
#define WITH_PIPES
#define WITH_MONITOR
#define WITH_GENERIC
#define WITH_NMNULL

#else	/* neither linux nor windows */
#define WITH_VALE	// comment out to disable VALE support
#define WITH_PIPES
#define WITH_MONITOR
#define WITH_GENERIC
#define WITH_EXTMEM
#define WITH_NMNULL
#endif
81847bf383SLuigi Rizzo
821a26580eSLuigi Rizzo #if defined(__FreeBSD__)
83225d33ffSSean Bruno #include <sys/selinfo.h>
84*1bae9dc5SMark Johnston #include <vm/vm.h>
85d4b42e08SLuigi Rizzo
/*
 * Branch-prediction hints built on __builtin_expect(). The condition is
 * normalized to 0/1 with !! before being handed to the builtin, so both
 * macros evaluate to the truth value of x.
 */
#define likely(x)	__builtin_expect((long)!!(x), 1L)
#define unlikely(x)	__builtin_expect((long)!!(x), 0L)
/* Expands to nothing in this branch. */
#define	__user
89f196ce38SLuigi Rizzo
#define	NM_LOCK_T	struct mtx	/* low level spinlock, used to protect queues */

/* Sleepable mutex, mapped onto the sx lock primitives. */
#define NM_MTX_T	struct sx	/* OS-specific mutex (sleepable) */
#define NM_MTX_INIT(m)		sx_init(&(m), #m)	/* lock name is the stringified argument */
#define NM_MTX_DESTROY(m)	sx_destroy(&(m))
#define NM_MTX_LOCK(m)		sx_xlock(&(m))
/*
 * Busy-waits until sx_try_xlock() succeeds.
 * NOTE(review): the expansion already ends with ';' and is not wrapped in
 * do { } while (0), so it is unsafe as the body of an unbraced if/else.
 * Left unchanged because callers are not visible from this header.
 */
#define NM_MTX_SPINLOCK(m)	while (!sx_try_xlock(&(m))) ;
#define NM_MTX_UNLOCK(m)	sx_xunlock(&(m))
#define NM_MTX_ASSERT(m)	sx_assert(&(m), SA_XLOCKED)

#define	NM_SELINFO_T	struct nm_selinfo
#define NM_SELRECORD_T	struct thread
/* Accessors for mbuf packet-header fields. */
#define	MBUF_LEN(m)	((m)->m_pkthdr.len)
#define MBUF_TXQ(m)	((m)->m_pkthdr.flowid)
/* Hands the mbuf to the if_transmit callback stored in the adapter. */
#define MBUF_TRANSMIT(na, ifp, m)	((na)->if_transmit(ifp, m))
#define	GEN_TX_MBUF_IFP(m)	((m)->m_pkthdr.rcvif)
#define	GEN_TX_MBUF_NA(m)	((struct netmap_adapter *)(m)->m_ext.ext_arg1)
107d4b42e08SLuigi Rizzo
1084f80b14cSVincenzo Maffione #define NM_ATOMIC_T volatile int /* required by atomic/bitops.h */
109f9790aebSLuigi Rizzo /* atomic operations */
110f9790aebSLuigi Rizzo #include <machine/atomic.h>
111f9790aebSLuigi Rizzo #define NM_ATOMIC_TEST_AND_SET(p) (!atomic_cmpset_acq_int((p), 0, 1))
112f9790aebSLuigi Rizzo #define NM_ATOMIC_CLEAR(p) atomic_store_rel_int((p), 0)
113f9790aebSLuigi Rizzo
11446aa1303SLuigi Rizzo struct netmap_adapter *netmap_getna(if_t ifp);
115f9790aebSLuigi Rizzo
/* Read and write the m_ext.ext_count field of an mbuf. */
#define MBUF_REFCNT(m)		((m)->m_ext.ext_count)
/*
 * Both the value and the whole assignment are parenthesized so that the
 * macro behaves as a single expression whatever is passed as x and
 * wherever the result is used.
 */
#define SET_MBUF_REFCNT(m, x)	((m)->m_ext.ext_count = (x))

/* Always evaluates to 1 in this branch; the argument is ignored. */
#define MBUF_QUEUED(m)		1
120f9790aebSLuigi Rizzo
1210e73f29aSLuigi Rizzo struct nm_selinfo {
12245100257SVincenzo Maffione /* Support for select(2) and poll(2). */
1230e73f29aSLuigi Rizzo struct selinfo si;
12445100257SVincenzo Maffione /* Support for kqueue(9). See comments in netmap_freebsd.c */
12519c4ec08SVincenzo Maffione struct taskqueue *ntfytq;
12619c4ec08SVincenzo Maffione struct task ntfytask;
1270e73f29aSLuigi Rizzo struct mtx m;
12819c4ec08SVincenzo Maffione char mtxname[32];
12945100257SVincenzo Maffione int kqueue_users;
1300e73f29aSLuigi Rizzo };
1310e73f29aSLuigi Rizzo
1320e73f29aSLuigi Rizzo
/* Placeholder type so that code referring to struct hrtimer still compiles. */
struct hrtimer {
	/* Not used in FreeBSD. */
};

/* Both macros expand to nothing in this branch. */
#define NM_BNS_GET(b)
#define NM_BNS_PUT(b)
139ce3ee1e7SLuigi Rizzo
14064ae02c3SLuigi Rizzo #elif defined (linux)
141d4b42e08SLuigi Rizzo
#define	NM_LOCK_T	safe_spinlock_t	// see bsd_glue.h
#define	NM_SELINFO_T	wait_queue_head_t
#define	MBUF_LEN(m)	((m)->len)
/*
 * Marks the buffer with NM_MAGIC_PRIORITY_TX, then calls ndo_start_xmit()
 * through the net_device_ops pointer stored in na->if_transmit.
 * The statement expression always evaluates to 0; the return value of
 * ndo_start_xmit() is discarded.
 */
#define MBUF_TRANSMIT(na, ifp, m)						\
	({									\
		/* Avoid infinite recursion with generic. */			\
		(m)->priority = NM_MAGIC_PRIORITY_TX;				\
		(((struct net_device_ops *)(na)->if_transmit)->ndo_start_xmit(m, ifp));	\
		0;								\
	})

/* See explanation in nm_os_generic_xmit_frame. */
#define	GEN_TX_MBUF_IFP(m)	((if_t)skb_shinfo(m)->destructor_arg)

#define NM_ATOMIC_T	volatile long unsigned int

#define NM_MTX_T	struct mutex	/* OS-specific sleepable lock */
#define NM_MTX_INIT(m)	mutex_init(&(m))
/* Nothing to release: only evaluates the argument. */
#define NM_MTX_DESTROY(m)	do { (void)(m); } while (0)
#define NM_MTX_LOCK(m)		mutex_lock(&(m))
#define NM_MTX_UNLOCK(m)	mutex_unlock(&(m))
/* NOTE(review): expands to a bare mutex_is_locked() call whose result is unused. */
#define NM_MTX_ASSERT(m)	mutex_is_locked(&(m))

#ifndef DEV_NETMAP
#define DEV_NETMAP
#endif /* DEV_NETMAP */
168f196ce38SLuigi Rizzo
169f196ce38SLuigi Rizzo #elif defined (__APPLE__)
170d4b42e08SLuigi Rizzo
#warning apple support is incomplete.
/* Branch-prediction hints; both evaluate to the truth value of x. */
#define likely(x)	__builtin_expect(!!(x), 1)
#define unlikely(x)	__builtin_expect(!!(x), 0)
#define	NM_LOCK_T	IOLock *
#define	NM_SELINFO_T	struct selinfo
#define	MBUF_LEN(m)	((m)->m_pkthdr.len)
17737e3a6d3SLuigi Rizzo
17837e3a6d3SLuigi Rizzo #elif defined (_WIN32)
17937e3a6d3SLuigi Rizzo #include "../../../WINDOWS/win_glue.h"
18037e3a6d3SLuigi Rizzo
#define NM_SELRECORD_T		IO_STACK_LOCATION
#define NM_SELINFO_T		win_SELINFO		// see win_glue.h
#define NM_LOCK_T		win_spinlock_t	// see win_glue.h
#define NM_MTX_T		KGUARDED_MUTEX	/* OS-specific mutex (sleepable) */

/*
 * No trailing ';' in the expansion: like the other NM_MTX_* macros this
 * one is meant to be followed by the caller's own semicolon, which keeps
 * it usable as the body of an unbraced if/else.
 */
#define NM_MTX_INIT(m)		KeInitializeGuardedMutex(&(m))
/* Nothing to release: only evaluates the argument. */
#define NM_MTX_DESTROY(m)	do { (void)(m); } while (0)
#define NM_MTX_LOCK(m)		KeAcquireGuardedMutex(&(m))
#define NM_MTX_UNLOCK(m)	KeReleaseGuardedMutex(&(m))
/*
 * NOTE(review): this compares the ADDRESS of the Count member with 0,
 * not its value. Semantics are kept as they were; confirm what the
 * assertion is supposed to check before changing it.
 */
#define NM_MTX_ASSERT(m)	assert(&(m).Count>0)

//These linknames are for the NDIS driver
#define NETMAP_NDIS_LINKNAME_STRING             L"\\DosDevices\\NMAPNDIS"
#define NETMAP_NDIS_NTDEVICE_STRING             L"\\Device\\NMAPNDIS"

//Definition of internal driver-to-driver ioctl codes
#define NETMAP_KERNEL_XCHANGE_POINTERS		_IO('i', 180)
#define NETMAP_KERNEL_SEND_SHUTDOWN_SIGNAL	_IO_direct('i', 195)
19937e3a6d3SLuigi Rizzo
20037e3a6d3SLuigi Rizzo typedef struct hrtimer{
20137e3a6d3SLuigi Rizzo KTIMER timer;
20237e3a6d3SLuigi Rizzo BOOLEAN active;
20337e3a6d3SLuigi Rizzo KDPC deferred_proc;
20437e3a6d3SLuigi Rizzo };
20537e3a6d3SLuigi Rizzo
/*
 * MSVC does not have likely/unlikely support: there the macros pass the
 * condition through unchanged. Other compilers get the
 * __builtin_expect() based hints.
 */
#ifdef _MSC_VER
#define likely(x)	(x)
#define unlikely(x)	(x)
#else
#define likely(x)	__builtin_expect((long)!!(x), 1L)
#define unlikely(x)	__builtin_expect((long)!!(x), 0L)
#endif //_MSC_VER
214f196ce38SLuigi Rizzo
2151a26580eSLuigi Rizzo #else
216d4b42e08SLuigi Rizzo
2171a26580eSLuigi Rizzo #error unsupported platform
218d4b42e08SLuigi Rizzo
219d4b42e08SLuigi Rizzo #endif /* end - platform-specific code */
2201a26580eSLuigi Rizzo
#ifndef _WIN32 /* support for emulated sysctl */
/* Outside Windows both markers expand to nothing. */
#define SYSBEGIN(x)
#define SYSEND
#endif /* !_WIN32 */

/* Accesses x through a volatile-qualified lvalue of its own type. */
#define NM_ACCESS_ONCE(x)	(*(volatile __typeof__(x) *)&(x))

/*
 * Wrappers that apply the platform NM_MTX_* operations to the single
 * global lock, netmap_global_lock.
 */
#define	NMG_LOCK_T		NM_MTX_T
#define	NMG_LOCK_INIT()		NM_MTX_INIT(netmap_global_lock)
#define	NMG_LOCK_DESTROY()	NM_MTX_DESTROY(netmap_global_lock)
#define	NMG_LOCK()		NM_MTX_LOCK(netmap_global_lock)
#define	NMG_UNLOCK()		NM_MTX_UNLOCK(netmap_global_lock)
#define	NMG_LOCK_ASSERT()	NM_MTX_ASSERT(netmap_global_lock)
234847bf383SLuigi Rizzo
/*
 * Platform back ends used by nm_prerr()/nm_prinf(): printf on FreeBSD,
 * DbgPrint on Windows, printk with KERN_ERR/KERN_INFO on Linux.
 * No back end is defined for any other platform.
 */
#if defined(__FreeBSD__)
#define nm_prerr_int	printf
#define nm_prinf_int	printf
#elif defined (_WIN32)
#define nm_prerr_int	DbgPrint
#define nm_prinf_int	DbgPrint
#elif defined(linux)
#define nm_prerr_int(fmt, arg...)	printk(KERN_ERR fmt, ##arg)
#define nm_prinf_int(fmt, arg...)	printk(KERN_INFO fmt, ##arg)
#endif
245c3e9b4dbSLuiz Otavio O Souza
/*
 * Informational message through nm_prinf_int(). Each line is prefixed
 * with the time read by microtime() (seconds modulo 1000, then
 * microseconds), the source line and the function name, and is
 * terminated by a newline.
 */
#define nm_prinf(format, ...)					\
	do {							\
		struct timeval __xxts;				\
		microtime(&__xxts);				\
		nm_prinf_int("%03d.%06d [%4d] %-25s " format "\n",\
		(int)__xxts.tv_sec % 1000, (int)__xxts.tv_usec,	\
		__LINE__, __FUNCTION__, ##__VA_ARGS__);		\
	} while (0)
25468b8534bSLuigi Rizzo
/*
 * Error message through nm_prerr_int(). Each line is prefixed with the
 * time read by microtime() (seconds modulo 1000, then microseconds),
 * the source line and the function name, and is terminated by a newline.
 */
#define nm_prerr(format, ...)					\
	do {							\
		struct timeval __xxts;				\
		microtime(&__xxts);				\
		nm_prerr_int("%03d.%06d [%4d] %-25s " format "\n",\
		(int)__xxts.tv_sec % 1000, (int)__xxts.tv_usec,	\
		__LINE__, __FUNCTION__, ##__VA_ARGS__);		\
	} while (0)
263b6e66be2SVincenzo Maffione
/* Disabled printf: expands to nothing, so its arguments are never evaluated. */
#define nm_prdis(format, ...)

/*
 * Rate limited, lps indicates how many per second.
 * Each expansion site has its own static counter, which is reset
 * whenever time_second changes. lps is parenthesized so that any
 * expression (e.g. a conditional) can be passed as the limit.
 */
#define nm_prlim(lps, format, ...)				\
	do {							\
		static int t0, __cnt;				\
		if (t0 != time_second) {			\
			t0 = time_second;			\
			__cnt = 0;				\
		}						\
		if (__cnt++ < (lps))				\
			nm_prinf(format, ##__VA_ARGS__);	\
	} while (0)
2788241616dSLuigi Rizzo
27968b8534bSLuigi Rizzo struct netmap_adapter;
280f18be576SLuigi Rizzo struct nm_bdg_fwd;
281f18be576SLuigi Rizzo struct nm_bridge;
282f18be576SLuigi Rizzo struct netmap_priv_d;
2832a7db7a6SVincenzo Maffione struct nm_bdg_args;
28468b8534bSLuigi Rizzo
28545c67e8fSVincenzo Maffione /* os-specific NM_SELINFO_T initialization/destruction functions */
28619c4ec08SVincenzo Maffione int nm_os_selinfo_init(NM_SELINFO_T *, const char *name);
28737e3a6d3SLuigi Rizzo void nm_os_selinfo_uninit(NM_SELINFO_T *);
28837e3a6d3SLuigi Rizzo
289ce3ee1e7SLuigi Rizzo const char *nm_dump_buf(char *p, int len, int lim, char *dst);
290ce3ee1e7SLuigi Rizzo
29137e3a6d3SLuigi Rizzo void nm_os_selwakeup(NM_SELINFO_T *si);
29237e3a6d3SLuigi Rizzo void nm_os_selrecord(NM_SELRECORD_T *sr, NM_SELINFO_T *si);
29337e3a6d3SLuigi Rizzo
29437e3a6d3SLuigi Rizzo int nm_os_ifnet_init(void);
29537e3a6d3SLuigi Rizzo void nm_os_ifnet_fini(void);
29637e3a6d3SLuigi Rizzo void nm_os_ifnet_lock(void);
29737e3a6d3SLuigi Rizzo void nm_os_ifnet_unlock(void);
29837e3a6d3SLuigi Rizzo
299e330262fSJustin Hibbits unsigned nm_os_ifnet_mtu(if_t ifp);
3004f80b14cSVincenzo Maffione
30137e3a6d3SLuigi Rizzo void nm_os_get_module(void);
30237e3a6d3SLuigi Rizzo void nm_os_put_module(void);
30337e3a6d3SLuigi Rizzo
304e330262fSJustin Hibbits void netmap_make_zombie(if_t);
305e330262fSJustin Hibbits void netmap_undo_zombie(if_t);
30637e3a6d3SLuigi Rizzo
307c3e9b4dbSLuiz Otavio O Souza /* os independent alloc/realloc/free */
308c3e9b4dbSLuiz Otavio O Souza void *nm_os_malloc(size_t);
3094f80b14cSVincenzo Maffione void *nm_os_vmalloc(size_t);
310c3e9b4dbSLuiz Otavio O Souza void *nm_os_realloc(void *, size_t new_size, size_t old_size);
311c3e9b4dbSLuiz Otavio O Souza void nm_os_free(void *);
3124f80b14cSVincenzo Maffione void nm_os_vfree(void *);
313c3e9b4dbSLuiz Otavio O Souza
3142a7db7a6SVincenzo Maffione /* os specific attach/detach enter/exit-netmap-mode routines */
315e330262fSJustin Hibbits void nm_os_onattach(if_t);
316e330262fSJustin Hibbits void nm_os_ondetach(if_t);
317e330262fSJustin Hibbits void nm_os_onenter(if_t);
318e330262fSJustin Hibbits void nm_os_onexit(if_t);
3192a7db7a6SVincenzo Maffione
32037e3a6d3SLuigi Rizzo /* passes a packet up to the host stack.
32137e3a6d3SLuigi Rizzo * If the packet is sent (or dropped) immediately it returns NULL,
32237e3a6d3SLuigi Rizzo * otherwise it links the packet to prev and returns m.
32337e3a6d3SLuigi Rizzo * In this case, a final call with m=NULL and prev != NULL will send up
32437e3a6d3SLuigi Rizzo * the entire chain to the host stack.
32537e3a6d3SLuigi Rizzo */
326e330262fSJustin Hibbits void *nm_os_send_up(if_t, struct mbuf *m, struct mbuf *prev);
32737e3a6d3SLuigi Rizzo
3282a7db7a6SVincenzo Maffione int nm_os_mbuf_has_seg_offld(struct mbuf *m);
3292a7db7a6SVincenzo Maffione int nm_os_mbuf_has_csum_offld(struct mbuf *m);
33037e3a6d3SLuigi Rizzo
331f9790aebSLuigi Rizzo #include "netmap_mbq.h"
332f9790aebSLuigi Rizzo
333f9790aebSLuigi Rizzo extern NMG_LOCK_T netmap_global_lock;
334f9790aebSLuigi Rizzo
/*
 * Ring direction. NR_TXRX is the number of directions and is used as an
 * array size and as the loop bound of for_rx_tx().
 */
enum txrx { NR_RX = 0, NR_TX = 1, NR_TXRX };

/*
 * Printable name of a direction: "RX" for NR_RX, "TX" for any other value.
 */
static __inline const char*
nm_txrx2str(enum txrx t)
{
	return (t == NR_RX ? "RX" : "TX");
}

/*
 * Opposite direction: NR_TX for NR_RX, NR_RX for any other value.
 */
static __inline enum txrx
nm_txrx_swap(enum txrx t)
{
	return (t == NR_RX ? NR_TX : NR_RX);
}

/* Iterates t over every direction, from 0 up to NR_TXRX - 1. */
#define for_rx_tx(t)	for ((t) = 0; (t) < NR_TXRX; (t)++)
350847bf383SLuigi Rizzo
#ifdef WITH_MONITOR
/* Pair of next/prev kring pointers, i.e. the links of a doubly linked list. */
struct netmap_zmon_list {
	struct netmap_kring *next;
	struct netmap_kring *prev;
};
#endif /* WITH_MONITOR */
357847bf383SLuigi Rizzo
/*
 * private, kernel view of a ring. Keeps track of the status of
 * a ring across system calls.
 *
 *	nr_hwcur	index of the next buffer to refill.
 *			It corresponds to ring->head
 *			at the time the system call returns.
 *
 *	nr_hwtail	index of the first buffer owned by the kernel.
 *			On RX, hwcur->hwtail are receive buffers
 *			not yet released. hwcur is advanced following
 *			ring->head, hwtail is advanced on incoming packets,
 *			and a wakeup is generated when hwtail passes ring->cur
 *			    On TX, hwcur->rcur have been filled by the sender
 *			but not sent yet to the NIC; rcur->hwtail are available
 *			for new transmissions, and hwtail->hwcur-1 are pending
 *			transmissions not yet acknowledged.
 *
 * The indexes in the NIC and netmap rings are offset by nkr_hwofs slots.
 * This is so that, on a reset, buffers owned by userspace are not
 * modified by the kernel. In particular:
 * RX rings: the next empty buffer (hwtail + hwofs) coincides with
 * 	the next empty buffer as known by the hardware (next_to_check or so).
 * TX rings: hwcur + hwofs coincides with next_to_send
 *
 * The following fields are used to implement lock-free copy of packets
 * from input to output ports in VALE switch:
 *	nkr_hwlease	buffer after the last one being copied.
 *			A writer in nm_bdg_flush reserves N buffers
 *			from nkr_hwlease, advances it, then does the
 *			copy outside the lock.
 *			In RX rings (used for VALE ports),
 *			nr_hwtail <= nkr_hwlease < nr_hwcur+N-1
 *			In TX rings (used for NIC or host stack ports)
 *			nr_hwcur <= nkr_hwlease < nr_hwtail
 *	nkr_leases	array of nkr_num_slots where writers can report
 *			completion of their block. NR_NOSLOT (~0) indicates
 *			that the writer has not finished yet
 *	nkr_lease_idx	index of next free slot in nkr_leases, to be assigned
 *
 * The kring is manipulated by txsync/rxsync and generic netmap function.
 *
 * Concurrent rxsync or txsync on the same ring are prevented
 * by nm_kr_(try)lock() which in turn uses nr_busy. This is all we need
 * for NIC rings, and for TX rings attached to the host stack.
 *
 * RX rings attached to the host stack use an mbq (rx_queue) on both
 * rxsync_from_host() and netmap_transmit(). The mbq is protected
 * by its internal lock.
 *
 * RX rings attached to the VALE switch are accessed by both senders
 * and receiver. They are protected through the q_lock on the RX ring.
 */
41168b8534bSLuigi Rizzo struct netmap_kring {
41268b8534bSLuigi Rizzo struct netmap_ring *ring;
41317885a7bSLuigi Rizzo
4142ff91c17SVincenzo Maffione uint32_t nr_hwcur; /* should be nr_hwhead */
41517885a7bSLuigi Rizzo uint32_t nr_hwtail;
41617885a7bSLuigi Rizzo
41717885a7bSLuigi Rizzo /*
41817885a7bSLuigi Rizzo * Copies of values in user rings, so we do not need to look
41917885a7bSLuigi Rizzo * at the ring (which could be modified). These are set in the
42017885a7bSLuigi Rizzo * *sync_prologue()/finalize() routines.
42117885a7bSLuigi Rizzo */
42217885a7bSLuigi Rizzo uint32_t rhead;
42317885a7bSLuigi Rizzo uint32_t rcur;
42417885a7bSLuigi Rizzo uint32_t rtail;
42517885a7bSLuigi Rizzo
426ce3ee1e7SLuigi Rizzo uint32_t nr_kflags; /* private driver flags */
4272157a17cSLuigi Rizzo #define NKR_PENDINTR 0x1 // Pending interrupt.
428847bf383SLuigi Rizzo #define NKR_EXCLUSIVE 0x2 /* exclusive binding */
42937e3a6d3SLuigi Rizzo #define NKR_FORWARD 0x4 /* (host ring only) there are
43037e3a6d3SLuigi Rizzo packets to forward
43137e3a6d3SLuigi Rizzo */
43237e3a6d3SLuigi Rizzo #define NKR_NEEDRING 0x8 /* ring needed even if users==0
43337e3a6d3SLuigi Rizzo * (used internally by pipes and
43437e3a6d3SLuigi Rizzo * by ptnetmap host ports)
43537e3a6d3SLuigi Rizzo */
4364f80b14cSVincenzo Maffione #define NKR_NOINTR 0x10 /* don't use interrupts on this ring */
4372ff91c17SVincenzo Maffione #define NKR_FAKERING 0x20 /* don't allocate/free buffers */
43837e3a6d3SLuigi Rizzo
43937e3a6d3SLuigi Rizzo uint32_t nr_mode;
44037e3a6d3SLuigi Rizzo uint32_t nr_pending_mode;
44137e3a6d3SLuigi Rizzo #define NKR_NETMAP_OFF 0x0
44237e3a6d3SLuigi Rizzo #define NKR_NETMAP_ON 0x1
44337e3a6d3SLuigi Rizzo
444ce3ee1e7SLuigi Rizzo uint32_t nkr_num_slots;
44517885a7bSLuigi Rizzo
44617885a7bSLuigi Rizzo /*
44717885a7bSLuigi Rizzo * On a NIC reset, the NIC ring indexes may be reset but the
44817885a7bSLuigi Rizzo * indexes in the netmap rings remain the same. nkr_hwofs
44917885a7bSLuigi Rizzo * keeps track of the offset between the two.
450a6d768d8SVincenzo Maffione *
451a6d768d8SVincenzo Maffione * Moreover, during reset, we can restore only the subset of
452a6d768d8SVincenzo Maffione * the NIC ring that corresponds to the kernel-owned part of
453a6d768d8SVincenzo Maffione * the netmap ring. The rest of the slots must be restored
454a6d768d8SVincenzo Maffione * by the *sync routines when the user releases more slots.
455a6d768d8SVincenzo Maffione * The nkr_to_refill field keeps track of the number of slots
456a6d768d8SVincenzo Maffione * that still need to be restored.
45717885a7bSLuigi Rizzo */
45817885a7bSLuigi Rizzo int32_t nkr_hwofs;
459a6d768d8SVincenzo Maffione int32_t nkr_to_refill;
46068b8534bSLuigi Rizzo
46117885a7bSLuigi Rizzo /* last_reclaim is opaque marker to help reduce the frequency
46217885a7bSLuigi Rizzo * of operations such as reclaiming tx buffers. A possible use
46317885a7bSLuigi Rizzo * is set it to ticks and do the reclaim only once per tick.
46417885a7bSLuigi Rizzo */
46517885a7bSLuigi Rizzo uint64_t last_reclaim;
46617885a7bSLuigi Rizzo
467ce3ee1e7SLuigi Rizzo
4681a26580eSLuigi Rizzo NM_SELINFO_T si; /* poll/select wait queue */
469ce3ee1e7SLuigi Rizzo NM_LOCK_T q_lock; /* protects kring and ring. */
470ce3ee1e7SLuigi Rizzo NM_ATOMIC_T nr_busy; /* prevent concurrent syscalls */
471ce3ee1e7SLuigi Rizzo
4722ff91c17SVincenzo Maffione /* the adapter the owns this kring */
47317885a7bSLuigi Rizzo struct netmap_adapter *na;
47417885a7bSLuigi Rizzo
4752ff91c17SVincenzo Maffione /* the adapter that wants to be notified when this kring has
47645c67e8fSVincenzo Maffione * new slots available. This is usually the same as the above,
4772ff91c17SVincenzo Maffione * but wrappers may let it point to themselves
4782ff91c17SVincenzo Maffione */
4792ff91c17SVincenzo Maffione struct netmap_adapter *notify_na;
4802ff91c17SVincenzo Maffione
4816435a0dcSLuigi Rizzo /* The following fields are for VALE switch support */
48217885a7bSLuigi Rizzo struct nm_bdg_fwd *nkr_ft;
48317885a7bSLuigi Rizzo uint32_t *nkr_leases;
48417885a7bSLuigi Rizzo #define NR_NOSLOT ((uint32_t)~0) /* used in nkr_*lease* */
48517885a7bSLuigi Rizzo uint32_t nkr_hwlease;
48617885a7bSLuigi Rizzo uint32_t nkr_lease_idx;
48717885a7bSLuigi Rizzo
4884bf50f18SLuigi Rizzo /* while nkr_stopped is set, no new [tr]xsync operations can
4894bf50f18SLuigi Rizzo * be started on this kring.
4904bf50f18SLuigi Rizzo * This is used by netmap_disable_all_rings()
4914bf50f18SLuigi Rizzo * to find a synchronization point where critical data
4924bf50f18SLuigi Rizzo * structures pointed to by the kring can be added or removed
4934bf50f18SLuigi Rizzo */
4944bf50f18SLuigi Rizzo volatile int nkr_stopped;
495f9790aebSLuigi Rizzo
496f0ea3689SLuigi Rizzo /* Support for adapters without native netmap support.
497f9790aebSLuigi Rizzo * On tx rings we preallocate an array of tx buffers
498f9790aebSLuigi Rizzo * (same size as the netmap ring), on rx rings we
499f0ea3689SLuigi Rizzo * store incoming mbufs in a queue that is drained by
500f0ea3689SLuigi Rizzo * a rxsync.
501f9790aebSLuigi Rizzo */
502f9790aebSLuigi Rizzo struct mbuf **tx_pool;
50337e3a6d3SLuigi Rizzo struct mbuf *tx_event; /* TX event used as a notification */
50437e3a6d3SLuigi Rizzo NM_LOCK_T tx_event_lock; /* protects the tx_event mbuf */
505ce12afaaSMark Johnston #ifdef __FreeBSD__
506ce12afaaSMark Johnston struct callout tx_event_callout;
507ce12afaaSMark Johnston #endif
50817885a7bSLuigi Rizzo struct mbq rx_queue; /* intercepted rx mbufs. */
50917885a7bSLuigi Rizzo
510847bf383SLuigi Rizzo uint32_t users; /* existing bindings for this ring */
511847bf383SLuigi Rizzo
51237e3a6d3SLuigi Rizzo uint32_t ring_id; /* kring identifier */
513847bf383SLuigi Rizzo enum txrx tx; /* kind of ring (tx or rx) */
51417885a7bSLuigi Rizzo char name[64]; /* diagnostic */
515f9790aebSLuigi Rizzo
5164bf50f18SLuigi Rizzo /* [tx]sync callback for this kring.
5174bf50f18SLuigi Rizzo * The default nm_kring_create callback (netmap_krings_create)
5184bf50f18SLuigi Rizzo * sets the nm_sync callback of each hardware tx(rx) kring to
5194bf50f18SLuigi Rizzo * the corresponding nm_txsync(nm_rxsync) taken from the
5204bf50f18SLuigi Rizzo * netmap_adapter; moreover, it sets the sync callback
5214bf50f18SLuigi Rizzo * of the host tx(rx) ring to netmap_txsync_to_host
5224bf50f18SLuigi Rizzo * (netmap_rxsync_from_host).
5234bf50f18SLuigi Rizzo *
5244bf50f18SLuigi Rizzo * Overrides: the above configuration is not changed by
5254bf50f18SLuigi Rizzo * any of the nm_krings_create callbacks.
5264bf50f18SLuigi Rizzo */
527f0ea3689SLuigi Rizzo int (*nm_sync)(struct netmap_kring *kring, int flags);
528847bf383SLuigi Rizzo int (*nm_notify)(struct netmap_kring *kring, int flags);
529f0ea3689SLuigi Rizzo
530f0ea3689SLuigi Rizzo #ifdef WITH_PIPES
5314bf50f18SLuigi Rizzo struct netmap_kring *pipe; /* if this is a pipe ring,
5324bf50f18SLuigi Rizzo * pointer to the other end
5334bf50f18SLuigi Rizzo */
5342a7db7a6SVincenzo Maffione uint32_t pipe_tail; /* hwtail updated by the other end */
535f0ea3689SLuigi Rizzo #endif /* WITH_PIPES */
536f0ea3689SLuigi Rizzo
537a6d768d8SVincenzo Maffione /* mask for the offset-related part of the ptr field in the slots */
538a6d768d8SVincenzo Maffione uint64_t offset_mask;
539a6d768d8SVincenzo Maffione /* maximum user-specified offset, as stipulated at bind time.
540a6d768d8SVincenzo Maffione * Larger offset requests will be silently capped to offset_max.
541a6d768d8SVincenzo Maffione */
542a6d768d8SVincenzo Maffione uint64_t offset_max;
543a6d768d8SVincenzo Maffione /* minimum gap between two consecutive offsets into the same
544a6d768d8SVincenzo Maffione * buffer, as stipulated at bind time. This is used to choose
545a6d768d8SVincenzo Maffione * the hwbuf_len, but is not otherwise checked for compliance
546a6d768d8SVincenzo Maffione * at runtime.
547a6d768d8SVincenzo Maffione */
548a6d768d8SVincenzo Maffione uint64_t offset_gap;
549a6d768d8SVincenzo Maffione
550a6d768d8SVincenzo Maffione /* size of hardware buffer. This may be less than the size of
551a6d768d8SVincenzo Maffione * the netmap buffers because of non-zero offsets, or because
552a6d768d8SVincenzo Maffione * the netmap buffer size exceeds the capability of the hardware.
553a6d768d8SVincenzo Maffione */
554a6d768d8SVincenzo Maffione uint64_t hwbuf_len;
555a6d768d8SVincenzo Maffione
55645c67e8fSVincenzo Maffione /* required alignment (in bytes) for the buffers used by this ring.
557a6d768d8SVincenzo Maffione * Netmap buffers are aligned to cachelines, which should suffice
558a6d768d8SVincenzo Maffione * for most NICs. If the user is passing offsets, though, we need
559a6d768d8SVincenzo Maffione * to check that the resulting buf address complies with any
560a6d768d8SVincenzo Maffione * alignment restriction.
561a6d768d8SVincenzo Maffione */
562a6d768d8SVincenzo Maffione uint64_t buf_align;
563a6d768d8SVincenzo Maffione
56445c67e8fSVincenzo Maffione /* hardware specific logic for the selection of the hwbuf_len */
565a6d768d8SVincenzo Maffione int (*nm_bufcfg)(struct netmap_kring *kring, uint64_t target);
566a6d768d8SVincenzo Maffione
567847bf383SLuigi Rizzo int (*save_notify)(struct netmap_kring *kring, int flags);
568847bf383SLuigi Rizzo
5694bf50f18SLuigi Rizzo #ifdef WITH_MONITOR
570847bf383SLuigi Rizzo /* array of krings that are monitoring this kring */
571847bf383SLuigi Rizzo struct netmap_kring **monitors;
572847bf383SLuigi Rizzo uint32_t max_monitors; /* current size of the monitors array */
573847bf383SLuigi Rizzo uint32_t n_monitors; /* next unused entry in the monitor array */
574c3e9b4dbSLuiz Otavio O Souza uint32_t mon_pos[NR_TXRX]; /* index of this ring in the monitored ring array */
575c3e9b4dbSLuiz Otavio O Souza uint32_t mon_tail; /* last seen slot on rx */
576c3e9b4dbSLuiz Otavio O Souza
577c3e9b4dbSLuiz Otavio O Souza /* circular list of zero-copy monitors */
578c3e9b4dbSLuiz Otavio O Souza struct netmap_zmon_list zmon_list[NR_TXRX];
579c3e9b4dbSLuiz Otavio O Souza
5804bf50f18SLuigi Rizzo /*
581847bf383SLuigi Rizzo * Monitors work by intercepting the sync and notify callbacks of the
582847bf383SLuigi Rizzo * monitored krings. This is implemented by replacing the pointers
583847bf383SLuigi Rizzo * above and saving the previous ones in mon_* pointers below
5844bf50f18SLuigi Rizzo */
585847bf383SLuigi Rizzo int (*mon_sync)(struct netmap_kring *kring, int flags);
586847bf383SLuigi Rizzo int (*mon_notify)(struct netmap_kring *kring, int flags);
587847bf383SLuigi Rizzo
5884bf50f18SLuigi Rizzo #endif
58937e3a6d3SLuigi Rizzo }
59037e3a6d3SLuigi Rizzo #ifdef _WIN32
59137e3a6d3SLuigi Rizzo __declspec(align(64));
59237e3a6d3SLuigi Rizzo #else
59337e3a6d3SLuigi Rizzo __attribute__((__aligned__(64)));
59437e3a6d3SLuigi Rizzo #endif
59568b8534bSLuigi Rizzo
59637e3a6d3SLuigi Rizzo /* return 1 iff the kring needs to be turned on */
59737e3a6d3SLuigi Rizzo static inline int
nm_kring_pending_on(struct netmap_kring * kring)59837e3a6d3SLuigi Rizzo nm_kring_pending_on(struct netmap_kring *kring)
59937e3a6d3SLuigi Rizzo {
60037e3a6d3SLuigi Rizzo return kring->nr_pending_mode == NKR_NETMAP_ON &&
60137e3a6d3SLuigi Rizzo kring->nr_mode == NKR_NETMAP_OFF;
60237e3a6d3SLuigi Rizzo }
60337e3a6d3SLuigi Rizzo
60437e3a6d3SLuigi Rizzo /* return 1 iff the kring needs to be turned off */
60537e3a6d3SLuigi Rizzo static inline int
nm_kring_pending_off(struct netmap_kring * kring)60637e3a6d3SLuigi Rizzo nm_kring_pending_off(struct netmap_kring *kring)
60737e3a6d3SLuigi Rizzo {
60837e3a6d3SLuigi Rizzo return kring->nr_pending_mode == NKR_NETMAP_OFF &&
60937e3a6d3SLuigi Rizzo kring->nr_mode == NKR_NETMAP_ON;
61037e3a6d3SLuigi Rizzo }
611ce3ee1e7SLuigi Rizzo
/*
 * Index following 'i' in a circular range whose last valid index is
 * 'lim': the successor of 'lim' is 0.
 */
static inline uint32_t
nm_next(uint32_t i, uint32_t lim)
{
	/* wrapping is hinted as the uncommon case */
	if (unlikely(i == lim))
		return 0;

	return i + 1;
}
618ce3ee1e7SLuigi Rizzo
61917885a7bSLuigi Rizzo
/*
 * Index preceding 'i' in a circular range whose last valid index is
 * 'lim': the predecessor of 0 is 'lim'.
 */
static inline uint32_t
nm_prev(uint32_t i, uint32_t lim)
{
	/* wrapping is hinted as the uncommon case */
	if (unlikely(i == 0))
		return lim;

	return i - 1;
}
62617885a7bSLuigi Rizzo
62717885a7bSLuigi Rizzo
628ce3ee1e7SLuigi Rizzo /*
629ce3ee1e7SLuigi Rizzo *
630ce3ee1e7SLuigi Rizzo * Here is the layout for the Rx and Tx rings.
631ce3ee1e7SLuigi Rizzo
632ce3ee1e7SLuigi Rizzo RxRING TxRING
633ce3ee1e7SLuigi Rizzo
634ce3ee1e7SLuigi Rizzo +-----------------+ +-----------------+
635ce3ee1e7SLuigi Rizzo | | | |
6364f80b14cSVincenzo Maffione | free | | free |
637ce3ee1e7SLuigi Rizzo +-----------------+ +-----------------+
63817885a7bSLuigi Rizzo head->| owned by user |<-hwcur | not sent to nic |<-hwcur
63917885a7bSLuigi Rizzo | | | yet |
64017885a7bSLuigi Rizzo +-----------------+ | |
64117885a7bSLuigi Rizzo cur->| available to | | |
64217885a7bSLuigi Rizzo | user, not read | +-----------------+
64317885a7bSLuigi Rizzo | yet | cur->| (being |
64417885a7bSLuigi Rizzo | | | prepared) |
645ce3ee1e7SLuigi Rizzo | | | |
64617885a7bSLuigi Rizzo +-----------------+ + ------ +
64717885a7bSLuigi Rizzo tail->| |<-hwtail | |<-hwlease
64817885a7bSLuigi Rizzo | (being | ... | | ...
64917885a7bSLuigi Rizzo | prepared) | ... | | ...
65017885a7bSLuigi Rizzo +-----------------+ ... | | ...
65117885a7bSLuigi Rizzo | |<-hwlease +-----------------+
65217885a7bSLuigi Rizzo | | tail->| |<-hwtail
653ce3ee1e7SLuigi Rizzo | | | |
654ce3ee1e7SLuigi Rizzo | | | |
655ce3ee1e7SLuigi Rizzo | | | |
656ce3ee1e7SLuigi Rizzo +-----------------+ +-----------------+
657ce3ee1e7SLuigi Rizzo
65817885a7bSLuigi Rizzo * The cur/tail (user view) and hwcur/hwtail (kernel view)
659ce3ee1e7SLuigi Rizzo * are used in the normal operation of the card.
660ce3ee1e7SLuigi Rizzo *
661ce3ee1e7SLuigi Rizzo * When a ring is the output of a switch port (Rx ring for
662ce3ee1e7SLuigi Rizzo * a VALE port, Tx ring for the host stack or NIC), slots
663ce3ee1e7SLuigi Rizzo * are reserved in blocks through 'hwlease' which points
664ce3ee1e7SLuigi Rizzo * to the next unused slot.
66517885a7bSLuigi Rizzo * On an Rx ring, hwlease is always after hwtail,
66617885a7bSLuigi Rizzo * and completions cause hwtail to advance.
66717885a7bSLuigi Rizzo * On a Tx ring, hwlease is always between cur and hwtail,
668ce3ee1e7SLuigi Rizzo * and completions cause cur to advance.
669ce3ee1e7SLuigi Rizzo *
670ce3ee1e7SLuigi Rizzo * nm_kr_space() returns the maximum number of slots that
671ce3ee1e7SLuigi Rizzo * can be assigned.
672ce3ee1e7SLuigi Rizzo * nm_kr_lease() reserves the required number of buffers,
673ce3ee1e7SLuigi Rizzo * advances nkr_hwlease and also returns an entry in
674ce3ee1e7SLuigi Rizzo * a circular array where completions should be reported.
675ce3ee1e7SLuigi Rizzo */
676ce3ee1e7SLuigi Rizzo
struct lut_entry;
#ifdef __FreeBSD__
/* on FreeBSD plut_entry is just another name for lut_entry */
#define plut_entry	lut_entry
#endif

/*
 * Lookup-table descriptor: the two entry arrays, plus the number
 * and the size of the buffers they describe.
 */
struct netmap_lut {
	struct lut_entry *lut;
	struct plut_entry *plut;
	uint32_t objtotal;	/* max buffer index */
	uint32_t objsize;	/* buffer size */
};
688ce3ee1e7SLuigi Rizzo
/* forward declarations */
struct netmap_vp_adapter;
struct nm_bridge;

/*
 * Configuration record that the nm_config callbacks fill in:
 * ring counts, descriptor counts and maximum RX buffer size.
 */
struct nm_config_info {
	unsigned int num_tx_rings;
	unsigned int num_rx_rings;
	unsigned int num_tx_descs;
	unsigned int num_rx_descs;
	unsigned int rx_buf_maxsize;
};
7002ff91c17SVincenzo Maffione
/*
 * Type of the 'magic' field of struct netmap_adapter.
 * This is only the default: OS glue code may define
 * NM_OS_MAGIC beforehand to override it.
 */
#if !defined(NM_OS_MAGIC)
#define NM_OS_MAGIC	uint32_t
#endif /* !NM_OS_MAGIC */
7082a7db7a6SVincenzo Maffione
7092a7db7a6SVincenzo Maffione /*
710f9790aebSLuigi Rizzo * The "struct netmap_adapter" extends the "struct adapter"
711f9790aebSLuigi Rizzo * (or equivalent) device descriptor.
712f9790aebSLuigi Rizzo * It contains all base fields needed to support netmap operation.
713f9790aebSLuigi Rizzo * There are in fact different types of netmap adapters
714f9790aebSLuigi Rizzo * (native, generic, VALE switch...) so a netmap_adapter is
715f9790aebSLuigi Rizzo * just the first field in the derived type.
71668b8534bSLuigi Rizzo */
71768b8534bSLuigi Rizzo struct netmap_adapter {
7188241616dSLuigi Rizzo /*
7198241616dSLuigi Rizzo * On linux we do not have a good way to tell if an interface
720f9790aebSLuigi Rizzo * is netmap-capable. So we always use the following trick:
7218241616dSLuigi Rizzo * NA(ifp) points here, and the first entry (which hopefully
7228241616dSLuigi Rizzo * always exists and is at least 32 bits) contains a magic
7238241616dSLuigi Rizzo * value which we can use to detect that the interface is good.
7248241616dSLuigi Rizzo */
7252a7db7a6SVincenzo Maffione NM_OS_MAGIC magic;
726f9790aebSLuigi Rizzo uint32_t na_flags; /* enabled, and other flags */
7278241616dSLuigi Rizzo #define NAF_SKIP_INTR 1 /* use the regular interrupt handler.
7288241616dSLuigi Rizzo * useful during initialization
7298241616dSLuigi Rizzo */
730f18be576SLuigi Rizzo #define NAF_SW_ONLY 2 /* forward packets only to sw adapter */
731ce3ee1e7SLuigi Rizzo #define NAF_BDG_MAYSLEEP 4 /* the bridge is allowed to sleep when
732ce3ee1e7SLuigi Rizzo * forwarding packets coming from this
733ce3ee1e7SLuigi Rizzo * interface
734ce3ee1e7SLuigi Rizzo */
735847bf383SLuigi Rizzo #define NAF_MEM_OWNER 8 /* the adapter uses its own memory area
736847bf383SLuigi Rizzo * that cannot be changed
737ce3ee1e7SLuigi Rizzo */
738847bf383SLuigi Rizzo #define NAF_NATIVE 16 /* the adapter is native.
73985fe4e7cSLuigi Rizzo * Virtual ports (non persistent vale ports,
74085fe4e7cSLuigi Rizzo * pipes, monitors...) should never use
74185fe4e7cSLuigi Rizzo * this flag.
742f9790aebSLuigi Rizzo */
743f9790aebSLuigi Rizzo #define NAF_NETMAP_ON 32 /* netmap is active (either native or
7444bf50f18SLuigi Rizzo * emulated). Where possible (e.g. FreeBSD)
745f9790aebSLuigi Rizzo * IFCAP_NETMAP also mirrors this flag.
746f9790aebSLuigi Rizzo */
747f0ea3689SLuigi Rizzo #define NAF_HOST_RINGS 64 /* the adapter supports the host rings */
7484bf50f18SLuigi Rizzo #define NAF_FORCE_NATIVE 128 /* the adapter is always NATIVE */
749b6e66be2SVincenzo Maffione /* free */
7504f80b14cSVincenzo Maffione #define NAF_MOREFRAG 512 /* the adapter supports NS_MOREFRAG */
751a6d768d8SVincenzo Maffione #define NAF_OFFSETS 1024 /* the adapter supports the slot offsets */
752a6d768d8SVincenzo Maffione #define NAF_HOST_ALL 2048 /* the adapter wants as many host rings as hw */
75337e3a6d3SLuigi Rizzo #define NAF_ZOMBIE (1U<<30) /* the nic driver has been unloaded */
7544bf50f18SLuigi Rizzo #define NAF_BUSY (1U<<31) /* the adapter is used internally and
7554bf50f18SLuigi Rizzo * cannot be registered from userspace
7564bf50f18SLuigi Rizzo */
757f9790aebSLuigi Rizzo int active_fds; /* number of user-space descriptors using this
75868b8534bSLuigi Rizzo interface, which is equal to the number of
75968b8534bSLuigi Rizzo struct netmap_if objs in the mapped region. */
76068b8534bSLuigi Rizzo
76124e57ec9SEd Maste u_int num_rx_rings; /* number of adapter receive rings */
76224e57ec9SEd Maste u_int num_tx_rings; /* number of adapter transmit rings */
7632a7db7a6SVincenzo Maffione u_int num_host_rx_rings; /* number of host receive rings */
7642a7db7a6SVincenzo Maffione u_int num_host_tx_rings; /* number of host transmit rings */
76568b8534bSLuigi Rizzo
76668b8534bSLuigi Rizzo u_int num_tx_desc; /* number of descriptor in each queue */
76768b8534bSLuigi Rizzo u_int num_rx_desc;
76868b8534bSLuigi Rizzo
769b6e66be2SVincenzo Maffione /* tx_rings and rx_rings are private but allocated as a
770b6e66be2SVincenzo Maffione * contiguous chunk of memory. Each array has N+K entries,
771b6e66be2SVincenzo Maffione * N for the hardware rings and K for the host rings.
77268b8534bSLuigi Rizzo */
7732ff91c17SVincenzo Maffione struct netmap_kring **tx_rings; /* array of TX rings. */
7742ff91c17SVincenzo Maffione struct netmap_kring **rx_rings; /* array of RX rings. */
77517885a7bSLuigi Rizzo
776f9790aebSLuigi Rizzo void *tailroom; /* space below the rings array */
777f9790aebSLuigi Rizzo /* (used for leases) */
778f9790aebSLuigi Rizzo
77968b8534bSLuigi Rizzo
780847bf383SLuigi Rizzo NM_SELINFO_T si[NR_TXRX]; /* global wait queues */
78164ae02c3SLuigi Rizzo
782f0ea3689SLuigi Rizzo /* count users of the global wait queues */
783847bf383SLuigi Rizzo int si_users[NR_TXRX];
784f0ea3689SLuigi Rizzo
7854bf50f18SLuigi Rizzo void *pdev; /* used to store pci device */
7864bf50f18SLuigi Rizzo
78768b8534bSLuigi Rizzo /* copy of if_qflush and if_transmit pointers, to intercept
78868b8534bSLuigi Rizzo * packets from the network stack when netmap is active.
78968b8534bSLuigi Rizzo */
790e330262fSJustin Hibbits int (*if_transmit)(if_t, struct mbuf *);
79168b8534bSLuigi Rizzo
79217885a7bSLuigi Rizzo /* copy of if_input for netmap_send_up() */
793e330262fSJustin Hibbits void (*if_input)(if_t, struct mbuf *);
79417885a7bSLuigi Rizzo
7954f80b14cSVincenzo Maffione /* Back reference to the parent ifnet struct. Used for
7964f80b14cSVincenzo Maffione * hardware ports (emulated netmap included). */
797e330262fSJustin Hibbits if_t ifp; /* adapter is if_getsoftc(ifp) */
79868b8534bSLuigi Rizzo
79917885a7bSLuigi Rizzo /*---- callbacks for this netmap adapter -----*/
80017885a7bSLuigi Rizzo /*
80117885a7bSLuigi Rizzo * nm_dtor() is the cleanup routine called when destroying
80217885a7bSLuigi Rizzo * the adapter.
80389cc2556SLuigi Rizzo * Called with NMG_LOCK held.
80417885a7bSLuigi Rizzo *
80517885a7bSLuigi Rizzo * nm_register() is called on NIOCREGIF and close() to enter
80617885a7bSLuigi Rizzo * or exit netmap mode on the NIC
8074bf50f18SLuigi Rizzo * Called with NNG_LOCK held.
80817885a7bSLuigi Rizzo *
80917885a7bSLuigi Rizzo * nm_txsync() pushes packets to the underlying hw/switch
81017885a7bSLuigi Rizzo *
81117885a7bSLuigi Rizzo * nm_rxsync() collects packets from the underlying hw/switch
81217885a7bSLuigi Rizzo *
81317885a7bSLuigi Rizzo * nm_config() returns configuration information from the OS
81489cc2556SLuigi Rizzo * Called with NMG_LOCK held.
81517885a7bSLuigi Rizzo *
816a6d768d8SVincenzo Maffione * nm_bufcfg()
817a6d768d8SVincenzo Maffione * the purpose of this callback is to fill the kring->hwbuf_len
818a6d768d8SVincenzo Maffione * (l) and kring->buf_align fields. The l value is most important
819a6d768d8SVincenzo Maffione * for RX rings, where we want to disallow writes outside of the
820a6d768d8SVincenzo Maffione * netmap buffer. The l value must be computed taking into account
82145c67e8fSVincenzo Maffione * the stipulated max_offset (o), possibly increased if there are
822a6d768d8SVincenzo Maffione * alignment constraints, the maxframe (m), if known, and the
823a6d768d8SVincenzo Maffione * current NETMAP_BUF_SIZE (b) of the memory region used by the
824a6d768d8SVincenzo Maffione * adapter. We want the largest supported l such that o + l <= b.
825a6d768d8SVincenzo Maffione * If m is known to be <= b - o, the callback may also choose the
82666671ae5SVincenzo Maffione * largest l <= m, ignoring the offset. The buf_align field is
827a6d768d8SVincenzo Maffione * most important for TX rings when there are offsets. The user
828a6d768d8SVincenzo Maffione * will see this value in the ring->buf_align field. Misaligned
829a6d768d8SVincenzo Maffione * offsets will cause the corresponding packets to be silently
830a6d768d8SVincenzo Maffione * dropped.
831a6d768d8SVincenzo Maffione *
8324bf50f18SLuigi Rizzo * nm_krings_create() create and init the tx_rings and
8334bf50f18SLuigi Rizzo * rx_rings arrays of kring structures. In particular,
8344bf50f18SLuigi Rizzo * set the nm_sync callbacks for each ring.
8354bf50f18SLuigi Rizzo * There is no need to also allocate the corresponding
8364bf50f18SLuigi Rizzo * netmap_rings, since netmap_mem_rings_create() will always
8374bf50f18SLuigi Rizzo * be called to provide the missing ones.
8384bf50f18SLuigi Rizzo * Called with NNG_LOCK held.
83917885a7bSLuigi Rizzo *
8404bf50f18SLuigi Rizzo * nm_krings_delete() cleanup and delete the tx_rings and rx_rings
8414bf50f18SLuigi Rizzo * arrays
8424bf50f18SLuigi Rizzo * Called with NMG_LOCK held.
84317885a7bSLuigi Rizzo *
84489cc2556SLuigi Rizzo * nm_notify() is used to act after data have become available
84589cc2556SLuigi Rizzo * (or the stopped state of the ring has changed)
84617885a7bSLuigi Rizzo * For hw devices this is typically a selwakeup(),
84717885a7bSLuigi Rizzo * but for NIC/host ports attached to a switch (or vice-versa)
84817885a7bSLuigi Rizzo * we also need to invoke the 'txsync' code downstream.
84937e3a6d3SLuigi Rizzo * This callback pointer is actually used only to initialize
85037e3a6d3SLuigi Rizzo * kring->nm_notify.
85137e3a6d3SLuigi Rizzo * Return values are the same as for netmap_rx_irq().
85217885a7bSLuigi Rizzo */
853f9790aebSLuigi Rizzo void (*nm_dtor)(struct netmap_adapter *);
8541a26580eSLuigi Rizzo
855f9790aebSLuigi Rizzo int (*nm_register)(struct netmap_adapter *, int onoff);
85637e3a6d3SLuigi Rizzo void (*nm_intr)(struct netmap_adapter *, int onoff);
857ce3ee1e7SLuigi Rizzo
8584bf50f18SLuigi Rizzo int (*nm_txsync)(struct netmap_kring *kring, int flags);
8594bf50f18SLuigi Rizzo int (*nm_rxsync)(struct netmap_kring *kring, int flags);
860847bf383SLuigi Rizzo int (*nm_notify)(struct netmap_kring *kring, int flags);
861a6d768d8SVincenzo Maffione int (*nm_bufcfg)(struct netmap_kring *kring, uint64_t target);
862ce3ee1e7SLuigi Rizzo #define NAF_FORCE_READ 1
863ce3ee1e7SLuigi Rizzo #define NAF_FORCE_RECLAIM 2
864c3e9b4dbSLuiz Otavio O Souza #define NAF_CAN_FORWARD_DOWN 4
865ae10d1afSLuigi Rizzo /* return configuration information */
8662ff91c17SVincenzo Maffione int (*nm_config)(struct netmap_adapter *, struct nm_config_info *info);
867f9790aebSLuigi Rizzo int (*nm_krings_create)(struct netmap_adapter *);
868f9790aebSLuigi Rizzo void (*nm_krings_delete)(struct netmap_adapter *);
8694bf50f18SLuigi Rizzo /*
8704bf50f18SLuigi Rizzo * nm_bdg_attach() initializes the na_vp field to point
8714bf50f18SLuigi Rizzo * to an adapter that can be attached to a VALE switch. If the
8724bf50f18SLuigi Rizzo * current adapter is already a VALE port, na_vp is simply a cast;
8734bf50f18SLuigi Rizzo * otherwise, na_vp points to a netmap_bwrap_adapter.
8744bf50f18SLuigi Rizzo * If applicable, this callback also initializes na_hostvp,
8754bf50f18SLuigi Rizzo * that can be used to connect the adapter host rings to the
8764bf50f18SLuigi Rizzo * switch.
8774bf50f18SLuigi Rizzo * Called with NMG_LOCK held.
8784bf50f18SLuigi Rizzo *
8794bf50f18SLuigi Rizzo * nm_bdg_ctl() is called on the actual attach/detach to/from
8804bf50f18SLuigi Rizzo * to/from the switch, to perform adapter-specific
8814bf50f18SLuigi Rizzo * initializations
8824bf50f18SLuigi Rizzo * Called with NMG_LOCK held.
8834bf50f18SLuigi Rizzo */
8842a7db7a6SVincenzo Maffione int (*nm_bdg_attach)(const char *bdg_name, struct netmap_adapter *,
8852a7db7a6SVincenzo Maffione struct nm_bridge *);
8862ff91c17SVincenzo Maffione int (*nm_bdg_ctl)(struct nmreq_header *, struct netmap_adapter *);
8874bf50f18SLuigi Rizzo
8884bf50f18SLuigi Rizzo /* adapter used to attach this adapter to a VALE switch (if any) */
8894bf50f18SLuigi Rizzo struct netmap_vp_adapter *na_vp;
8904bf50f18SLuigi Rizzo /* adapter used to attach the host rings of this adapter
8914bf50f18SLuigi Rizzo * to a VALE switch (if any) */
8924bf50f18SLuigi Rizzo struct netmap_vp_adapter *na_hostvp;
893f9790aebSLuigi Rizzo
894f9790aebSLuigi Rizzo /* standard refcount to control the lifetime of the adapter
895f9790aebSLuigi Rizzo * (it should be equal to the lifetime of the corresponding ifp)
896f9790aebSLuigi Rizzo */
897f9790aebSLuigi Rizzo int na_refcount;
898f9790aebSLuigi Rizzo
899f9790aebSLuigi Rizzo /* memory allocator (opaque)
900f9790aebSLuigi Rizzo * We also cache a pointer to the lut_entry for translating
90137e3a6d3SLuigi Rizzo * buffer addresses, the total number of buffers and the buffer size.
902f9790aebSLuigi Rizzo */
903f9790aebSLuigi Rizzo struct netmap_mem_d *nm_mem;
9044f80b14cSVincenzo Maffione struct netmap_mem_d *nm_mem_prev;
905847bf383SLuigi Rizzo struct netmap_lut na_lut;
906f9790aebSLuigi Rizzo
9074bf50f18SLuigi Rizzo /* additional information attached to this adapter
9084bf50f18SLuigi Rizzo * by other netmap subsystems. Currently used by
90937e3a6d3SLuigi Rizzo * bwrap, LINUX/v1000 and ptnetmap
910f9790aebSLuigi Rizzo */
911f9790aebSLuigi Rizzo void *na_private;
912f0ea3689SLuigi Rizzo
9134bf50f18SLuigi Rizzo /* array of pipes that have this adapter as a parent */
914f0ea3689SLuigi Rizzo struct netmap_pipe_adapter **na_pipes;
9154bf50f18SLuigi Rizzo int na_next_pipe; /* next free slot in the array */
9164bf50f18SLuigi Rizzo int na_max_pipes; /* size of the array */
9174bf50f18SLuigi Rizzo
91837e3a6d3SLuigi Rizzo /* Offset of ethernet header for each packet. */
91937e3a6d3SLuigi Rizzo u_int virt_hdr_len;
92037e3a6d3SLuigi Rizzo
9212ff91c17SVincenzo Maffione /* Max number of bytes that the NIC can store in the buffer
9222ff91c17SVincenzo Maffione * referenced by each RX descriptor. This translates to the maximum
9232ff91c17SVincenzo Maffione * bytes that a single netmap slot can reference. Larger packets
9242ff91c17SVincenzo Maffione * require NS_MOREFRAG support. */
9252ff91c17SVincenzo Maffione unsigned rx_buf_maxsize;
9262ff91c17SVincenzo Maffione
9272ff91c17SVincenzo Maffione char name[NETMAP_REQ_IFNAMSIZ]; /* used at least by pipes */
9282a7db7a6SVincenzo Maffione
9292a7db7a6SVincenzo Maffione #ifdef WITH_MONITOR
9302a7db7a6SVincenzo Maffione unsigned long monitor_id; /* debugging */
9312a7db7a6SVincenzo Maffione #endif
932f9790aebSLuigi Rizzo };
933f9790aebSLuigi Rizzo
934847bf383SLuigi Rizzo static __inline u_int
nma_get_ndesc(struct netmap_adapter * na,enum txrx t)935847bf383SLuigi Rizzo nma_get_ndesc(struct netmap_adapter *na, enum txrx t)
936847bf383SLuigi Rizzo {
937847bf383SLuigi Rizzo return (t == NR_TX ? na->num_tx_desc : na->num_rx_desc);
938847bf383SLuigi Rizzo }
939847bf383SLuigi Rizzo
940847bf383SLuigi Rizzo static __inline void
nma_set_ndesc(struct netmap_adapter * na,enum txrx t,u_int v)941847bf383SLuigi Rizzo nma_set_ndesc(struct netmap_adapter *na, enum txrx t, u_int v)
942847bf383SLuigi Rizzo {
943847bf383SLuigi Rizzo if (t == NR_TX)
944847bf383SLuigi Rizzo na->num_tx_desc = v;
945847bf383SLuigi Rizzo else
946847bf383SLuigi Rizzo na->num_rx_desc = v;
947847bf383SLuigi Rizzo }
948847bf383SLuigi Rizzo
949847bf383SLuigi Rizzo static __inline u_int
nma_get_nrings(struct netmap_adapter * na,enum txrx t)950847bf383SLuigi Rizzo nma_get_nrings(struct netmap_adapter *na, enum txrx t)
951847bf383SLuigi Rizzo {
952847bf383SLuigi Rizzo return (t == NR_TX ? na->num_tx_rings : na->num_rx_rings);
953847bf383SLuigi Rizzo }
954847bf383SLuigi Rizzo
9552a7db7a6SVincenzo Maffione static __inline u_int
nma_get_host_nrings(struct netmap_adapter * na,enum txrx t)9562a7db7a6SVincenzo Maffione nma_get_host_nrings(struct netmap_adapter *na, enum txrx t)
9572a7db7a6SVincenzo Maffione {
9582a7db7a6SVincenzo Maffione return (t == NR_TX ? na->num_host_tx_rings : na->num_host_rx_rings);
9592a7db7a6SVincenzo Maffione }
9602a7db7a6SVincenzo Maffione
961847bf383SLuigi Rizzo static __inline void
nma_set_nrings(struct netmap_adapter * na,enum txrx t,u_int v)962847bf383SLuigi Rizzo nma_set_nrings(struct netmap_adapter *na, enum txrx t, u_int v)
963847bf383SLuigi Rizzo {
964847bf383SLuigi Rizzo if (t == NR_TX)
965847bf383SLuigi Rizzo na->num_tx_rings = v;
966847bf383SLuigi Rizzo else
967847bf383SLuigi Rizzo na->num_rx_rings = v;
968847bf383SLuigi Rizzo }
969847bf383SLuigi Rizzo
9702a7db7a6SVincenzo Maffione static __inline void
nma_set_host_nrings(struct netmap_adapter * na,enum txrx t,u_int v)9712a7db7a6SVincenzo Maffione nma_set_host_nrings(struct netmap_adapter *na, enum txrx t, u_int v)
9722a7db7a6SVincenzo Maffione {
9732a7db7a6SVincenzo Maffione if (t == NR_TX)
9742a7db7a6SVincenzo Maffione na->num_host_tx_rings = v;
9752a7db7a6SVincenzo Maffione else
9762a7db7a6SVincenzo Maffione na->num_host_rx_rings = v;
9772a7db7a6SVincenzo Maffione }
9782a7db7a6SVincenzo Maffione
9792ff91c17SVincenzo Maffione static __inline struct netmap_kring**
NMR(struct netmap_adapter * na,enum txrx t)980847bf383SLuigi Rizzo NMR(struct netmap_adapter *na, enum txrx t)
981847bf383SLuigi Rizzo {
982847bf383SLuigi Rizzo return (t == NR_TX ? na->tx_rings : na->rx_rings);
983847bf383SLuigi Rizzo }
98417885a7bSLuigi Rizzo
9854f80b14cSVincenzo Maffione int nma_intr_enable(struct netmap_adapter *na, int onoff);
9864f80b14cSVincenzo Maffione
/*
 * Ownership checks, to be evaluated under NMG_LOCK().
 * If the NIC is owned by the kernel (i.e., a bridge), neither
 * another bridge nor a user can use it; if the NIC is owned by
 * a user, only users can share it.
 *
 * NETMAP_OWNED_BY_KERN() yields the raw NAF_BUSY bit of na_flags;
 * NETMAP_OWNED_BY_ANY() is also true when there are active file
 * descriptors on the adapter.
 */
#define NETMAP_OWNED_BY_KERN(na)	((na)->na_flags & NAF_BUSY)
#define NETMAP_OWNED_BY_ANY(na) \
	(NETMAP_OWNED_BY_KERN(na) || ((na)->active_fds > 0))
996f9790aebSLuigi Rizzo
997f9790aebSLuigi Rizzo /*
998f9790aebSLuigi Rizzo * derived netmap adapters for various types of ports
999f9790aebSLuigi Rizzo */
1000f9790aebSLuigi Rizzo struct netmap_vp_adapter { /* VALE software port */
1001f9790aebSLuigi Rizzo struct netmap_adapter up;
1002f196ce38SLuigi Rizzo
1003849bec0eSLuigi Rizzo /*
1004849bec0eSLuigi Rizzo * Bridge support:
1005849bec0eSLuigi Rizzo *
1006849bec0eSLuigi Rizzo * bdg_port is the port number used in the bridge;
1007f18be576SLuigi Rizzo * na_bdg points to the bridge this NA is attached to.
1008849bec0eSLuigi Rizzo */
1009f196ce38SLuigi Rizzo int bdg_port;
1010f18be576SLuigi Rizzo struct nm_bridge *na_bdg;
1011f9790aebSLuigi Rizzo int retry;
1012c3e9b4dbSLuiz Otavio O Souza int autodelete; /* remove the ifp on last reference */
1013f9790aebSLuigi Rizzo
1014f0ea3689SLuigi Rizzo /* Maximum Frame Size, used in bdg_mismatch_datapath() */
1015f0ea3689SLuigi Rizzo u_int mfs;
1016847bf383SLuigi Rizzo /* Last source MAC on this port */
1017847bf383SLuigi Rizzo uint64_t last_smac;
1018f9790aebSLuigi Rizzo };
1019f9790aebSLuigi Rizzo
102017885a7bSLuigi Rizzo
1021f9790aebSLuigi Rizzo struct netmap_hw_adapter { /* physical device */
1022f9790aebSLuigi Rizzo struct netmap_adapter up;
1023f9790aebSLuigi Rizzo
10244f80b14cSVincenzo Maffione #ifdef linux
10254f80b14cSVincenzo Maffione struct net_device_ops nm_ndo;
10264f80b14cSVincenzo Maffione struct ethtool_ops nm_eto;
10274f80b14cSVincenzo Maffione #endif
10284bf50f18SLuigi Rizzo const struct ethtool_ops* save_ethtool;
10294bf50f18SLuigi Rizzo
10304bf50f18SLuigi Rizzo int (*nm_hw_register)(struct netmap_adapter *, int onoff);
1031f9790aebSLuigi Rizzo };
1032f9790aebSLuigi Rizzo
1033039dd540SLuigi Rizzo #ifdef WITH_GENERIC
1034f0ea3689SLuigi Rizzo /* Mitigation support. */
1035f0ea3689SLuigi Rizzo struct nm_generic_mit {
1036f0ea3689SLuigi Rizzo struct hrtimer mit_timer;
1037f0ea3689SLuigi Rizzo int mit_pending;
10384bf50f18SLuigi Rizzo int mit_ring_idx; /* index of the ring being mitigated */
1039f0ea3689SLuigi Rizzo struct netmap_adapter *mit_na; /* backpointer */
1040f0ea3689SLuigi Rizzo };
104117885a7bSLuigi Rizzo
104217885a7bSLuigi Rizzo struct netmap_generic_adapter { /* emulated device */
1043f9790aebSLuigi Rizzo struct netmap_hw_adapter up;
1044f9790aebSLuigi Rizzo
1045f9790aebSLuigi Rizzo /* Pointer to a previously used netmap adapter. */
1046f9790aebSLuigi Rizzo struct netmap_adapter *prev;
1047f9790aebSLuigi Rizzo
10484f80b14cSVincenzo Maffione /* Emulated netmap adapters support:
10494f80b14cSVincenzo Maffione * - mit implements rx interrupt mitigation;
1050f9790aebSLuigi Rizzo */
1051f0ea3689SLuigi Rizzo struct nm_generic_mit *mit;
105217885a7bSLuigi Rizzo #ifdef linux
1053e330262fSJustin Hibbits netdev_tx_t (*save_start_xmit)(struct mbuf *, if_t);
105417885a7bSLuigi Rizzo #endif
105537e3a6d3SLuigi Rizzo /* Is the adapter able to use multiple RX slots to scatter
105637e3a6d3SLuigi Rizzo * each packet pushed up by the driver? */
105737e3a6d3SLuigi Rizzo int rxsg;
105837e3a6d3SLuigi Rizzo
105937e3a6d3SLuigi Rizzo /* Is the transmission path controlled by a netmap-aware
106037e3a6d3SLuigi Rizzo * device queue (i.e. qdisc on linux)? */
106137e3a6d3SLuigi Rizzo int txqdisc;
1062f9790aebSLuigi Rizzo };
1063039dd540SLuigi Rizzo #endif /* WITH_GENERIC */
1064f9790aebSLuigi Rizzo
10652a7db7a6SVincenzo Maffione static __inline u_int
netmap_real_rings(struct netmap_adapter * na,enum txrx t)1066847bf383SLuigi Rizzo netmap_real_rings(struct netmap_adapter *na, enum txrx t)
1067f0ea3689SLuigi Rizzo {
10682a7db7a6SVincenzo Maffione return nma_get_nrings(na, t) +
10692a7db7a6SVincenzo Maffione !!(na->na_flags & NAF_HOST_RINGS) * nma_get_host_nrings(na, t);
1070f0ea3689SLuigi Rizzo }
1071f0ea3689SLuigi Rizzo
10722a7db7a6SVincenzo Maffione /* account for fake rings */
10732a7db7a6SVincenzo Maffione static __inline u_int
netmap_all_rings(struct netmap_adapter * na,enum txrx t)10742a7db7a6SVincenzo Maffione netmap_all_rings(struct netmap_adapter *na, enum txrx t)
10752a7db7a6SVincenzo Maffione {
10762a7db7a6SVincenzo Maffione return max(nma_get_nrings(na, t) + 1, netmap_real_rings(na, t));
10772a7db7a6SVincenzo Maffione }
10782a7db7a6SVincenzo Maffione
10792a7db7a6SVincenzo Maffione int netmap_default_bdg_attach(const char *name, struct netmap_adapter *na,
10802a7db7a6SVincenzo Maffione struct nm_bridge *);
108137e3a6d3SLuigi Rizzo struct nm_bdg_polling_state;
108217885a7bSLuigi Rizzo /*
108317885a7bSLuigi Rizzo * Bridge wrapper for non VALE ports attached to a VALE switch.
1084f9790aebSLuigi Rizzo *
108517885a7bSLuigi Rizzo * The real device must already have its own netmap adapter (hwna).
108617885a7bSLuigi Rizzo * The bridge wrapper and the hwna adapter share the same set of
108717885a7bSLuigi Rizzo * netmap rings and buffers, but they have two separate sets of
108817885a7bSLuigi Rizzo * krings descriptors, with tx/rx meanings swapped:
1089f9790aebSLuigi Rizzo *
1090f9790aebSLuigi Rizzo * netmap
1091f9790aebSLuigi Rizzo * bwrap krings rings krings hwna
1092f9790aebSLuigi Rizzo * +------+ +------+ +-----+ +------+ +------+
1093f9790aebSLuigi Rizzo * |tx_rings->| |\ /| |----| |<-tx_rings|
1094f9790aebSLuigi Rizzo * | | +------+ \ / +-----+ +------+ | |
1095f9790aebSLuigi Rizzo * | | X | |
1096f9790aebSLuigi Rizzo * | | / \ | |
1097f9790aebSLuigi Rizzo * | | +------+/ \+-----+ +------+ | |
1098f9790aebSLuigi Rizzo * |rx_rings->| | | |----| |<-rx_rings|
1099f9790aebSLuigi Rizzo * | | +------+ +-----+ +------+ | |
1100f9790aebSLuigi Rizzo * +------+ +------+
1101f9790aebSLuigi Rizzo *
110217885a7bSLuigi Rizzo * - packets coming from the bridge go to the bwrap rx rings,
110317885a7bSLuigi Rizzo * which are also the hwna tx rings. The bwrap notify callback
110417885a7bSLuigi Rizzo * will then complete the hwna tx (see netmap_bwrap_notify).
1105f9790aebSLuigi Rizzo *
110617885a7bSLuigi Rizzo * - packets coming from the outside go to the hwna rx rings,
110717885a7bSLuigi Rizzo * which are also the bwrap tx rings. The (overwritten) hwna
110817885a7bSLuigi Rizzo * notify method will then complete the bridge tx
110917885a7bSLuigi Rizzo * (see netmap_bwrap_intr_notify).
1110f9790aebSLuigi Rizzo *
111117885a7bSLuigi Rizzo * The bridge wrapper may optionally connect the hwna 'host' rings
111217885a7bSLuigi Rizzo * to the bridge. This is done by using a second port in the
111317885a7bSLuigi Rizzo * bridge and connecting it to the 'host' netmap_vp_adapter
111417885a7bSLuigi Rizzo * contained in the netmap_bwrap_adapter. The bwrap host adapter
111517885a7bSLuigi Rizzo * cross-links the hwna host rings in the same way as shown above.
111617885a7bSLuigi Rizzo *
111717885a7bSLuigi Rizzo * - packets coming from the bridge and directed to the host stack
111817885a7bSLuigi Rizzo * are handled by the bwrap host notify callback
111917885a7bSLuigi Rizzo * (see netmap_bwrap_host_notify)
112017885a7bSLuigi Rizzo *
112117885a7bSLuigi Rizzo * - packets coming from the host stack are still handled by the
112217885a7bSLuigi Rizzo * overwritten hwna notify callback (netmap_bwrap_intr_notify),
112317885a7bSLuigi Rizzo * but are diverted to the host adapter depending on the ring number.
1124f9790aebSLuigi Rizzo *
1125f9790aebSLuigi Rizzo */
struct netmap_bwrap_adapter {
	/* VALE port adapters embedded in the wrapper; the block comment
	 * above describes how their rings are cross-linked with the
	 * rings of hwna.
	 */
	struct netmap_vp_adapter up;
	struct netmap_vp_adapter host;  /* for host rings */
	struct netmap_adapter *hwna;	/* the underlying device */

	/*
	 * When we attach a physical interface to the bridge, we
	 * allow the controlling process to terminate, so we need
	 * a place to store the netmap_priv_d data structure.
	 * This is only done when physical interfaces
	 * are attached to a bridge.
	 */
	struct netmap_priv_d *na_kpriv;
	/* NOTE(review): presumably the state used by nm_bdg_polling();
	 * not established by this header - confirm.
	 */
	struct nm_bdg_polling_state *na_polling_state;
	/* we overwrite the hwna->na_vp pointer, so we save
	 * here its original value, to be restored at detach
	 */
	struct netmap_vp_adapter *saved_na_vp;
	/* NOTE(review): looks like the slot for the hwna notify callback
	 * that the bwrap overwrites (see netmap_bwrap_intr_notify in the
	 * comment above) - confirm against the attach code.
	 */
	int (*nm_intr_notify)(struct netmap_kring *kring, int flags);
};
11464ad57c7aSVincenzo Maffione int nm_is_bwrap(struct netmap_adapter *na);
11472ff91c17SVincenzo Maffione int nm_bdg_polling(struct nmreq_header *hdr);
11482a7db7a6SVincenzo Maffione
1149a6d768d8SVincenzo Maffione int netmap_bdg_attach(struct nmreq_header *hdr, void *auth_token);
1150a6d768d8SVincenzo Maffione int netmap_bdg_detach(struct nmreq_header *hdr, void *auth_token);
11512a7db7a6SVincenzo Maffione #ifdef WITH_VALE
1152b6e66be2SVincenzo Maffione int netmap_vale_list(struct nmreq_header *hdr);
11532ff91c17SVincenzo Maffione int netmap_vi_create(struct nmreq_header *hdr, int);
11542ff91c17SVincenzo Maffione int nm_vi_create(struct nmreq_header *);
11552ff91c17SVincenzo Maffione int nm_vi_destroy(const char *name);
1156c3e9b4dbSLuiz Otavio O Souza #else /* !WITH_VALE */
11572ff91c17SVincenzo Maffione #define netmap_vi_create(hdr, a) (EOPNOTSUPP)
115817885a7bSLuigi Rizzo #endif /* WITH_VALE */
1159ce3ee1e7SLuigi Rizzo
1160f0ea3689SLuigi Rizzo #ifdef WITH_PIPES
1161f0ea3689SLuigi Rizzo
1162f0ea3689SLuigi Rizzo #define NM_MAXPIPES 64 /* max number of pipes per adapter */
1163f0ea3689SLuigi Rizzo
/*
 * Adapter describing one end of a netmap pipe. The two ends point at
 * each other through 'peer' and are distinguished by 'role'.
 */
struct netmap_pipe_adapter {
	/* pipe identifier is up.name */
	struct netmap_adapter up;

	/* values stored in 'role' below */
#define NM_PIPE_ROLE_MASTER	0x1
#define NM_PIPE_ROLE_SLAVE	0x2
	int role;	/* either NM_PIPE_ROLE_MASTER or NM_PIPE_ROLE_SLAVE */

	struct netmap_adapter *parent; /* adapter that owns the memory */
	struct netmap_pipe_adapter *peer; /* the other end of the pipe */
	int peer_ref;		/* 1 iff we are holding a ref to the peer */
	if_t parent_ifp;	/* maybe null */

	u_int parent_slot; /* index in the parent pipe array */
};
1179f0ea3689SLuigi Rizzo
1180f0ea3689SLuigi Rizzo #endif /* WITH_PIPES */
1181f0ea3689SLuigi Rizzo
1182b6e66be2SVincenzo Maffione #ifdef WITH_NMNULL
1183b6e66be2SVincenzo Maffione struct netmap_null_adapter {
1184b6e66be2SVincenzo Maffione struct netmap_adapter up;
1185b6e66be2SVincenzo Maffione };
1186b6e66be2SVincenzo Maffione #endif /* WITH_NMNULL */
1187b6e66be2SVincenzo Maffione
118817885a7bSLuigi Rizzo
118917885a7bSLuigi Rizzo /* return slots reserved to rx clients; used in drivers */
119017885a7bSLuigi Rizzo static inline uint32_t
nm_kr_rxspace(struct netmap_kring * k)119117885a7bSLuigi Rizzo nm_kr_rxspace(struct netmap_kring *k)
119217885a7bSLuigi Rizzo {
119317885a7bSLuigi Rizzo int space = k->nr_hwtail - k->nr_hwcur;
1194ce3ee1e7SLuigi Rizzo if (space < 0)
1195ce3ee1e7SLuigi Rizzo space += k->nkr_num_slots;
119675f4f3edSVincenzo Maffione nm_prdis("preserving %d rx slots %d -> %d", space, k->nr_hwcur, k->nr_hwtail);
119717885a7bSLuigi Rizzo
1198ce3ee1e7SLuigi Rizzo return space;
1199ce3ee1e7SLuigi Rizzo }
1200ce3ee1e7SLuigi Rizzo
120137e3a6d3SLuigi Rizzo /* return slots reserved to tx clients */
120237e3a6d3SLuigi Rizzo #define nm_kr_txspace(_k) nm_kr_rxspace(_k)
1203ce3ee1e7SLuigi Rizzo
120437e3a6d3SLuigi Rizzo
120537e3a6d3SLuigi Rizzo /* True if no space in the tx ring, only valid after txsync_prologue */
120617885a7bSLuigi Rizzo static inline int
nm_kr_txempty(struct netmap_kring * kring)120717885a7bSLuigi Rizzo nm_kr_txempty(struct netmap_kring *kring)
1208ce3ee1e7SLuigi Rizzo {
1209f79ba6d7SVincenzo Maffione return kring->rhead == kring->nr_hwtail;
1210f9790aebSLuigi Rizzo }
1211f9790aebSLuigi Rizzo
121237e3a6d3SLuigi Rizzo /* True if no more completed slots in the rx ring, only valid after
121337e3a6d3SLuigi Rizzo * rxsync_prologue */
121437e3a6d3SLuigi Rizzo #define nm_kr_rxempty(_k) nm_kr_txempty(_k)
1215ce3ee1e7SLuigi Rizzo
12165faab778SVincenzo Maffione /* True if the application needs to wait for more space on the ring
12175faab778SVincenzo Maffione * (more received packets or more free tx slots).
12185faab778SVincenzo Maffione * Only valid after *xsync_prologue. */
12195faab778SVincenzo Maffione static inline int
nm_kr_wouldblock(struct netmap_kring * kring)12205faab778SVincenzo Maffione nm_kr_wouldblock(struct netmap_kring *kring)
12215faab778SVincenzo Maffione {
12225faab778SVincenzo Maffione return kring->rcur == kring->nr_hwtail;
12235faab778SVincenzo Maffione }
12245faab778SVincenzo Maffione
1225ce3ee1e7SLuigi Rizzo /*
1226f9790aebSLuigi Rizzo * protect against multiple threads using the same ring.
122737e3a6d3SLuigi Rizzo * also check that the ring has not been stopped or locked
122868b8534bSLuigi Rizzo */
122937e3a6d3SLuigi Rizzo #define NM_KR_BUSY 1 /* some other thread is syncing the ring */
123037e3a6d3SLuigi Rizzo #define NM_KR_STOPPED 2 /* unbounded stop (ifconfig down or driver unload) */
123137e3a6d3SLuigi Rizzo #define NM_KR_LOCKED 3 /* bounded, brief stop for mutual exclusion */
123268b8534bSLuigi Rizzo
123317885a7bSLuigi Rizzo
/*
 * Release the previously acquired right to use the *sync() methods of
 * the ring by atomically clearing kr->nr_busy.
 * Must only be called by the context that currently owns nr_busy
 * (see nm_kr_tryget() and nm_kr_stop()).
 */
static __inline void nm_kr_put(struct netmap_kring *kr)
{
	NM_ATOMIC_CLEAR(&kr->nr_busy);
}
1239f9790aebSLuigi Rizzo
124017885a7bSLuigi Rizzo
124137e3a6d3SLuigi Rizzo /* true if the ifp that backed the adapter has disappeared (e.g., the
124237e3a6d3SLuigi Rizzo * driver has been unloaded)
124337e3a6d3SLuigi Rizzo */
124437e3a6d3SLuigi Rizzo static inline int nm_iszombie(struct netmap_adapter *na);
124537e3a6d3SLuigi Rizzo
124637e3a6d3SLuigi Rizzo /* try to obtain exclusive right to issue the *sync() operations on the ring.
124737e3a6d3SLuigi Rizzo * The right is obtained and must be later relinquished via nm_kr_put() if and
124837e3a6d3SLuigi Rizzo * only if nm_kr_tryget() returns 0.
124937e3a6d3SLuigi Rizzo * If can_sleep is 1 there are only two other possible outcomes:
125037e3a6d3SLuigi Rizzo * - the function returns NM_KR_BUSY
125137e3a6d3SLuigi Rizzo * - the function returns NM_KR_STOPPED and sets the POLLERR bit in *perr
125237e3a6d3SLuigi Rizzo * (if non-null)
125337e3a6d3SLuigi Rizzo * In both cases the caller will typically skip the ring, possibly collecting
125437e3a6d3SLuigi Rizzo * errors along the way.
125537e3a6d3SLuigi Rizzo * If the calling context does not allow sleeping, the caller must pass 0 in can_sleep.
125637e3a6d3SLuigi Rizzo * In the latter case, the function may also return NM_KR_LOCKED and leave *perr
125737e3a6d3SLuigi Rizzo * untouched: ideally, the caller should try again at a later time.
125837e3a6d3SLuigi Rizzo */
nm_kr_tryget(struct netmap_kring * kr,int can_sleep,int * perr)125937e3a6d3SLuigi Rizzo static __inline int nm_kr_tryget(struct netmap_kring *kr, int can_sleep, int *perr)
1260f9790aebSLuigi Rizzo {
126137e3a6d3SLuigi Rizzo int busy = 1, stopped;
1262f9790aebSLuigi Rizzo /* check a first time without taking the lock
1263f9790aebSLuigi Rizzo * to avoid starvation for nm_kr_get()
1264f9790aebSLuigi Rizzo */
126537e3a6d3SLuigi Rizzo retry:
126637e3a6d3SLuigi Rizzo stopped = kr->nkr_stopped;
126737e3a6d3SLuigi Rizzo if (unlikely(stopped)) {
126837e3a6d3SLuigi Rizzo goto stop;
1269f9790aebSLuigi Rizzo }
127037e3a6d3SLuigi Rizzo busy = NM_ATOMIC_TEST_AND_SET(&kr->nr_busy);
127137e3a6d3SLuigi Rizzo /* we should not return NM_KR_BUSY if the ring was
127237e3a6d3SLuigi Rizzo * actually stopped, so check another time after
127337e3a6d3SLuigi Rizzo * the barrier provided by the atomic operation
127437e3a6d3SLuigi Rizzo */
127537e3a6d3SLuigi Rizzo stopped = kr->nkr_stopped;
127637e3a6d3SLuigi Rizzo if (unlikely(stopped)) {
127737e3a6d3SLuigi Rizzo goto stop;
1278f9790aebSLuigi Rizzo }
127968b8534bSLuigi Rizzo
128037e3a6d3SLuigi Rizzo if (unlikely(nm_iszombie(kr->na))) {
128137e3a6d3SLuigi Rizzo stopped = NM_KR_STOPPED;
128237e3a6d3SLuigi Rizzo goto stop;
128337e3a6d3SLuigi Rizzo }
128437e3a6d3SLuigi Rizzo
128537e3a6d3SLuigi Rizzo return unlikely(busy) ? NM_KR_BUSY : 0;
128637e3a6d3SLuigi Rizzo
128737e3a6d3SLuigi Rizzo stop:
128837e3a6d3SLuigi Rizzo if (!busy)
128937e3a6d3SLuigi Rizzo nm_kr_put(kr);
129037e3a6d3SLuigi Rizzo if (stopped == NM_KR_STOPPED) {
129137e3a6d3SLuigi Rizzo /* if POLLERR is defined we want to use it to simplify netmap_poll().
129237e3a6d3SLuigi Rizzo * Otherwise, any non-zero value will do.
129337e3a6d3SLuigi Rizzo */
129437e3a6d3SLuigi Rizzo #ifdef POLLERR
129537e3a6d3SLuigi Rizzo #define NM_POLLERR POLLERR
129637e3a6d3SLuigi Rizzo #else
129737e3a6d3SLuigi Rizzo #define NM_POLLERR 1
129837e3a6d3SLuigi Rizzo #endif /* POLLERR */
129937e3a6d3SLuigi Rizzo if (perr)
130037e3a6d3SLuigi Rizzo *perr |= NM_POLLERR;
130137e3a6d3SLuigi Rizzo #undef NM_POLLERR
130237e3a6d3SLuigi Rizzo } else if (can_sleep) {
130337e3a6d3SLuigi Rizzo tsleep(kr, 0, "NM_KR_TRYGET", 4);
130437e3a6d3SLuigi Rizzo goto retry;
130537e3a6d3SLuigi Rizzo }
130637e3a6d3SLuigi Rizzo return stopped;
130737e3a6d3SLuigi Rizzo }
130837e3a6d3SLuigi Rizzo
/* put the ring in the 'stopped' state and wait for the current user (if any) to
 * notice. stopped must be either NM_KR_STOPPED or NM_KR_LOCKED
 *
 * The new state is published in kr->nkr_stopped first, so that
 * nm_kr_tryget() callers see it; then the function loops until it wins
 * the test-and-set on kr->nr_busy, sleeping between attempts. On return
 * nr_busy is therefore set on behalf of the caller; nm_kr_start() clears
 * it again.
 */
static __inline void nm_kr_stop(struct netmap_kring *kr, int stopped)
{
	kr->nkr_stopped = stopped;
	while (NM_ATOMIC_TEST_AND_SET(&kr->nr_busy))
		tsleep(kr, 0, "NM_KR_GET", 4);
}
1318847bf383SLuigi Rizzo
/* restart a ring after a stop: clear the stopped state in
 * kr->nkr_stopped, then release kr->nr_busy through nm_kr_put().
 */
static __inline void nm_kr_start(struct netmap_kring *kr)
{
	kr->nkr_stopped = 0;
	nm_kr_put(kr);
}
132537e3a6d3SLuigi Rizzo
1326847bf383SLuigi Rizzo
132768b8534bSLuigi Rizzo /*
132817885a7bSLuigi Rizzo * The following functions are used by individual drivers to
132968b8534bSLuigi Rizzo * support netmap operation.
133068b8534bSLuigi Rizzo *
133168b8534bSLuigi Rizzo * netmap_attach() initializes a struct netmap_adapter, allocating the
133268b8534bSLuigi Rizzo * struct netmap_ring's and the struct selinfo.
133368b8534bSLuigi Rizzo *
133468b8534bSLuigi Rizzo * netmap_detach() frees the memory allocated by netmap_attach().
133568b8534bSLuigi Rizzo *
1336ce3ee1e7SLuigi Rizzo * netmap_transmit() replaces the if_transmit routine of the interface,
133768b8534bSLuigi Rizzo * and is used to intercept packets coming from the stack.
133868b8534bSLuigi Rizzo *
133968b8534bSLuigi Rizzo * netmap_load_map/netmap_reload_map are helper routines to set/reset
134068b8534bSLuigi Rizzo * the dmamap for a packet buffer
134168b8534bSLuigi Rizzo *
13424bf50f18SLuigi Rizzo * netmap_reset() is a helper routine to be called in the hw driver
13434bf50f18SLuigi Rizzo * when reinitializing a ring. It should not be called by
13444bf50f18SLuigi Rizzo * virtual ports (vale, pipes, monitor)
134568b8534bSLuigi Rizzo */
1346f9790aebSLuigi Rizzo int netmap_attach(struct netmap_adapter *);
13474f80b14cSVincenzo Maffione int netmap_attach_ext(struct netmap_adapter *, size_t size, int override_reg);
1348e330262fSJustin Hibbits void netmap_detach(if_t);
1349e330262fSJustin Hibbits int netmap_transmit(if_t, struct mbuf *);
135068b8534bSLuigi Rizzo struct netmap_slot *netmap_reset(struct netmap_adapter *na,
1351ce3ee1e7SLuigi Rizzo enum txrx tx, u_int n, u_int new_cur);
135268b8534bSLuigi Rizzo int netmap_ring_reinit(struct netmap_kring *);
13532ff91c17SVincenzo Maffione int netmap_rings_config_get(struct netmap_adapter *, struct nm_config_info *);
135468b8534bSLuigi Rizzo
135537e3a6d3SLuigi Rizzo /* Return codes for netmap_*x_irq. */
135637e3a6d3SLuigi Rizzo enum {
135737e3a6d3SLuigi Rizzo /* Driver should do normal interrupt processing, e.g. because
135837e3a6d3SLuigi Rizzo * the interface is not in netmap mode. */
135937e3a6d3SLuigi Rizzo NM_IRQ_PASS = 0,
136037e3a6d3SLuigi Rizzo /* Port is in netmap mode, and the interrupt work has been
136137e3a6d3SLuigi Rizzo * completed. The driver does not have to notify netmap
136237e3a6d3SLuigi Rizzo * again before the next interrupt. */
136337e3a6d3SLuigi Rizzo NM_IRQ_COMPLETED = -1,
136437e3a6d3SLuigi Rizzo /* Port is in netmap mode, but the interrupt work has not been
136537e3a6d3SLuigi Rizzo * completed. The driver has to make sure netmap will be
136637e3a6d3SLuigi Rizzo * notified again soon, even if no more interrupts come (e.g.
136737e3a6d3SLuigi Rizzo * on Linux the driver should not call napi_complete()). */
136837e3a6d3SLuigi Rizzo NM_IRQ_RESCHED = -2,
136937e3a6d3SLuigi Rizzo };
137037e3a6d3SLuigi Rizzo
137117885a7bSLuigi Rizzo /* default functions to handle rx/tx interrupts */
1372e330262fSJustin Hibbits int netmap_rx_irq(if_t, u_int, u_int *);
137317885a7bSLuigi Rizzo #define netmap_tx_irq(_n, _q) netmap_rx_irq(_n, _q, NULL)
137437e3a6d3SLuigi Rizzo int netmap_common_irq(struct netmap_adapter *, u_int, u_int *work_done);
137517885a7bSLuigi Rizzo
137617885a7bSLuigi Rizzo
13774bf50f18SLuigi Rizzo #ifdef WITH_VALE
13784bf50f18SLuigi Rizzo /* functions used by external modules to interface with VALE */
13794bf50f18SLuigi Rizzo #define netmap_vp_to_ifp(_vp) ((_vp)->up.ifp)
13804bf50f18SLuigi Rizzo #define netmap_ifp_to_vp(_ifp) (NA(_ifp)->na_vp)
13814bf50f18SLuigi Rizzo #define netmap_ifp_to_host_vp(_ifp) (NA(_ifp)->na_hostvp)
13824bf50f18SLuigi Rizzo #define netmap_bdg_idx(_vp) ((_vp)->bdg_port)
13834bf50f18SLuigi Rizzo const char *netmap_bdg_name(struct netmap_vp_adapter *);
13844bf50f18SLuigi Rizzo #else /* !WITH_VALE */
13854bf50f18SLuigi Rizzo #define netmap_vp_to_ifp(_vp) NULL
13864bf50f18SLuigi Rizzo #define netmap_ifp_to_vp(_ifp) NULL
13874bf50f18SLuigi Rizzo #define netmap_ifp_to_host_vp(_ifp) NULL
13884bf50f18SLuigi Rizzo #define netmap_bdg_idx(_vp) -1
13894bf50f18SLuigi Rizzo #endif /* WITH_VALE */
13904bf50f18SLuigi Rizzo
13914bf50f18SLuigi Rizzo static inline int
nm_netmap_on(struct netmap_adapter * na)13924bf50f18SLuigi Rizzo nm_netmap_on(struct netmap_adapter *na)
13934bf50f18SLuigi Rizzo {
13944bf50f18SLuigi Rizzo return na && na->na_flags & NAF_NETMAP_ON;
13954bf50f18SLuigi Rizzo }
139617885a7bSLuigi Rizzo
1397847bf383SLuigi Rizzo static inline int
nm_native_on(struct netmap_adapter * na)1398847bf383SLuigi Rizzo nm_native_on(struct netmap_adapter *na)
1399847bf383SLuigi Rizzo {
1400847bf383SLuigi Rizzo return nm_netmap_on(na) && (na->na_flags & NAF_NATIVE);
1401847bf383SLuigi Rizzo }
1402847bf383SLuigi Rizzo
140366823237SVincenzo Maffione static inline struct netmap_kring *
netmap_kring_on(struct netmap_adapter * na,u_int q,enum txrx t)140466823237SVincenzo Maffione netmap_kring_on(struct netmap_adapter *na, u_int q, enum txrx t)
140566823237SVincenzo Maffione {
140666823237SVincenzo Maffione struct netmap_kring *kring = NULL;
140766823237SVincenzo Maffione
140866823237SVincenzo Maffione if (!nm_native_on(na))
140966823237SVincenzo Maffione return NULL;
141066823237SVincenzo Maffione
141166823237SVincenzo Maffione if (t == NR_RX && q < na->num_rx_rings)
141266823237SVincenzo Maffione kring = na->rx_rings[q];
141366823237SVincenzo Maffione else if (t == NR_TX && q < na->num_tx_rings)
141466823237SVincenzo Maffione kring = na->tx_rings[q];
141566823237SVincenzo Maffione else
141666823237SVincenzo Maffione return NULL;
141766823237SVincenzo Maffione
141866823237SVincenzo Maffione return (kring->nr_mode == NKR_NETMAP_ON) ? kring : NULL;
141966823237SVincenzo Maffione }
142066823237SVincenzo Maffione
142137e3a6d3SLuigi Rizzo static inline int
nm_iszombie(struct netmap_adapter * na)142237e3a6d3SLuigi Rizzo nm_iszombie(struct netmap_adapter *na)
142337e3a6d3SLuigi Rizzo {
142437e3a6d3SLuigi Rizzo return na == NULL || (na->na_flags & NAF_ZOMBIE);
142537e3a6d3SLuigi Rizzo }
142637e3a6d3SLuigi Rizzo
14272a7db7a6SVincenzo Maffione void nm_set_native_flags(struct netmap_adapter *);
14282a7db7a6SVincenzo Maffione void nm_clear_native_flags(struct netmap_adapter *);
14292ff91c17SVincenzo Maffione
143075f4f3edSVincenzo Maffione void netmap_krings_mode_commit(struct netmap_adapter *na, int onoff);
143175f4f3edSVincenzo Maffione
143237e3a6d3SLuigi Rizzo /*
143337e3a6d3SLuigi Rizzo * nm_*sync_prologue() functions are used in ioctl/poll and ptnetmap
143437e3a6d3SLuigi Rizzo * kthreads.
143537e3a6d3SLuigi Rizzo * We need netmap_ring* parameter, because in ptnetmap it is decoupled
143637e3a6d3SLuigi Rizzo * from host kring.
143737e3a6d3SLuigi Rizzo * The user-space ring pointers (head/cur/tail) are shared through
143837e3a6d3SLuigi Rizzo * CSB between host and guest.
143937e3a6d3SLuigi Rizzo */
144037e3a6d3SLuigi Rizzo
144137e3a6d3SLuigi Rizzo /*
144237e3a6d3SLuigi Rizzo * validates parameters in the ring/kring, returns a value for head
144337e3a6d3SLuigi Rizzo * If any error, returns ring_size to force a reinit.
144437e3a6d3SLuigi Rizzo */
144537e3a6d3SLuigi Rizzo uint32_t nm_txsync_prologue(struct netmap_kring *, struct netmap_ring *);
144637e3a6d3SLuigi Rizzo
144737e3a6d3SLuigi Rizzo
144837e3a6d3SLuigi Rizzo /*
144937e3a6d3SLuigi Rizzo * validates parameters in the ring/kring, returns a value for head
145037e3a6d3SLuigi Rizzo * If any error, returns ring_size lim to force a reinit.
145137e3a6d3SLuigi Rizzo */
145237e3a6d3SLuigi Rizzo uint32_t nm_rxsync_prologue(struct netmap_kring *, struct netmap_ring *);
145337e3a6d3SLuigi Rizzo
1454f9790aebSLuigi Rizzo
/*
 * check/fix address and len in tx rings
 *
 * NM_CHECK_ADDR_LEN(_na, _a, _l) clamps _l to NETMAP_BUF_SIZE(_na) when it
 * is larger; _l must therefore be a modifiable lvalue. The debug version
 * additionally logs (rate limited) when _a equals NETMAP_BUF_BASE(_na) or
 * _l is too large; its message uses the names kring, nm_i, slot and len,
 * which must exist in the scope where the macro is expanded.
 * _a and _l are parenthesized so that expression arguments (e.g. a
 * conditional expression) are compared as a whole.
 */
#if 1 /* debug version */
#define NM_CHECK_ADDR_LEN(_na, _a, _l)	do {				\
	if ((_a) == NETMAP_BUF_BASE(_na) || (_l) > NETMAP_BUF_SIZE(_na)) {	\
		nm_prlim(5, "bad addr/len ring %d slot %d idx %d len %d",	\
			kring->ring_id, nm_i, slot->buf_idx, len);	\
		if ((_l) > NETMAP_BUF_SIZE(_na))				\
			(_l) = NETMAP_BUF_SIZE(_na);			\
	} } while (0)
#else /* no debug version */
#define NM_CHECK_ADDR_LEN(_na, _a, _l)	do {				\
		if ((_l) > NETMAP_BUF_SIZE(_na))				\
			(_l) = NETMAP_BUF_SIZE(_na);			\
	} while (0)
#endif
1470f9790aebSLuigi Rizzo
1471a6d768d8SVincenzo Maffione #define NM_CHECK_ADDR_LEN_OFF(na_, l_, o_) do { \
1472a6d768d8SVincenzo Maffione if ((l_) + (o_) < (l_) || \
1473a6d768d8SVincenzo Maffione (l_) + (o_) > NETMAP_BUF_SIZE(na_)) { \
1474a6d768d8SVincenzo Maffione (l_) = NETMAP_BUF_SIZE(na_) - (o_); \
1475a6d768d8SVincenzo Maffione } } while (0)
1476a6d768d8SVincenzo Maffione
1477f9790aebSLuigi Rizzo
1478f9790aebSLuigi Rizzo /*---------------------------------------------------------------*/
1479f9790aebSLuigi Rizzo /*
14804bf50f18SLuigi Rizzo * Support routines used by netmap subsystems
14814bf50f18SLuigi Rizzo * (native drivers, VALE, generic, pipes, monitors, ...)
14824bf50f18SLuigi Rizzo */
14834bf50f18SLuigi Rizzo
14844bf50f18SLuigi Rizzo
14854bf50f18SLuigi Rizzo /* common routine for all functions that create a netmap adapter. It performs
14864bf50f18SLuigi Rizzo * two main tasks:
14874bf50f18SLuigi Rizzo * - if the na points to an ifp, mark the ifp as netmap capable
14884bf50f18SLuigi Rizzo * using na as its native adapter;
14894bf50f18SLuigi Rizzo * - provide defaults for the setup callbacks and the memory allocator
14904bf50f18SLuigi Rizzo */
14914bf50f18SLuigi Rizzo int netmap_attach_common(struct netmap_adapter *);
14924bf50f18SLuigi Rizzo /* fill priv->np_[tr]xq{first,last} using the ringid and flags information
14932ff91c17SVincenzo Maffione * coming from a struct nmreq_register
14944bf50f18SLuigi Rizzo */
1495ee0005f1SVincenzo Maffione int netmap_interp_ringid(struct netmap_priv_d *priv, struct nmreq_header *hdr);
14964bf50f18SLuigi Rizzo /* update the ring parameters (number and size of tx and rx rings).
14974bf50f18SLuigi Rizzo * It calls the nm_config callback, if available.
1498f9790aebSLuigi Rizzo */
1499f9790aebSLuigi Rizzo int netmap_update_config(struct netmap_adapter *na);
15004bf50f18SLuigi Rizzo /* create and initialize the common fields of the krings array.
15014bf50f18SLuigi Rizzo * using the information that must be already available in the na.
15024bf50f18SLuigi Rizzo * tailroom can be used to request the allocation of additional
15034bf50f18SLuigi Rizzo * tailroom bytes after the krings array. This is used by
15044bf50f18SLuigi Rizzo * netmap_vp_adapter's (i.e., VALE ports) to make room for
15054bf50f18SLuigi Rizzo * leasing-related data structures
15064bf50f18SLuigi Rizzo */
1507f0ea3689SLuigi Rizzo int netmap_krings_create(struct netmap_adapter *na, u_int tailroom);
15084bf50f18SLuigi Rizzo /* deletes the kring array of the adapter. The array must have
15094bf50f18SLuigi Rizzo * been created using netmap_krings_create
15104bf50f18SLuigi Rizzo */
1511f9790aebSLuigi Rizzo void netmap_krings_delete(struct netmap_adapter *na);
151217885a7bSLuigi Rizzo
151337e3a6d3SLuigi Rizzo int netmap_hw_krings_create(struct netmap_adapter *na);
151437e3a6d3SLuigi Rizzo void netmap_hw_krings_delete(struct netmap_adapter *na);
151537e3a6d3SLuigi Rizzo
15164bf50f18SLuigi Rizzo /* set the stopped/enabled status of ring
15174bf50f18SLuigi Rizzo * When stopping, they also wait for all current activity on the ring to
15184bf50f18SLuigi Rizzo * terminate. The status change is then notified using the na nm_notify
15194bf50f18SLuigi Rizzo * callback.
15204bf50f18SLuigi Rizzo */
1521847bf383SLuigi Rizzo void netmap_set_ring(struct netmap_adapter *, u_int ring_id, enum txrx, int stopped);
15224bf50f18SLuigi Rizzo /* set the stopped/enabled status of all rings of the adapter. */
15234bf50f18SLuigi Rizzo void netmap_set_all_rings(struct netmap_adapter *, int stopped);
152437e3a6d3SLuigi Rizzo /* convenience wrappers for netmap_set_all_rings */
1525e330262fSJustin Hibbits void netmap_disable_all_rings(if_t);
1526e330262fSJustin Hibbits void netmap_enable_all_rings(if_t);
15274bf50f18SLuigi Rizzo
152877a2baf5SVincenzo Maffione int netmap_buf_size_validate(const struct netmap_adapter *na, unsigned mtu);
15298fd44c93SLuigi Rizzo int netmap_do_regif(struct netmap_priv_d *priv, struct netmap_adapter *na,
1530ee0005f1SVincenzo Maffione struct nmreq_header *);
153137e3a6d3SLuigi Rizzo void netmap_do_unregif(struct netmap_priv_d *priv);
1532f9790aebSLuigi Rizzo
1533f9790aebSLuigi Rizzo u_int nm_bound_var(u_int *v, u_int dflt, u_int lo, u_int hi, const char *msg);
15342ff91c17SVincenzo Maffione int netmap_get_na(struct nmreq_header *hdr, struct netmap_adapter **na,
1535e330262fSJustin Hibbits if_t *ifp, struct netmap_mem_d *nmd, int create);
1536e330262fSJustin Hibbits void netmap_unget_na(struct netmap_adapter *na, if_t ifp);
1537e330262fSJustin Hibbits int netmap_get_hw_na(if_t ifp,
1538c3e9b4dbSLuiz Otavio O Souza struct netmap_mem_d *nmd, struct netmap_adapter **na);
1539a6d768d8SVincenzo Maffione void netmap_mem_restore(struct netmap_adapter *na);
1540f9790aebSLuigi Rizzo
/*
 * VALE entry points. With WITH_VALE they are real functions; without it
 * the #else branch provides constant-valued macro stubs.
 */
#ifdef WITH_VALE
uint32_t netmap_vale_learning(struct nm_bdg_fwd *ft, uint8_t *dst_ring,
		struct netmap_vp_adapter *, void *private_data);

/* these are redefined in case of no VALE support */
int netmap_get_vale_na(struct nmreq_header *hdr, struct netmap_adapter **na,
		struct netmap_mem_d *nmd, int create);
void *netmap_vale_create(const char *bdg_name, int *return_status);
int netmap_vale_destroy(const char *bdg_name, void *auth_token);

extern unsigned int vale_max_bridges;

#else /* !WITH_VALE */
/* NOTE(review): only netmap_get_vale_na and vale_max_bridges match the
 * names declared in the WITH_VALE branch. The netmap_bdg_learning,
 * netmap_bdg_create and netmap_bdg_destroy stubs have no netmap_bdg_*
 * counterpart there (the prototypes are netmap_vale_learning,
 * netmap_vale_create, netmap_vale_destroy) - they look stale; confirm
 * against the callers before renaming.
 */
#define netmap_bdg_learning(_1, _2, _3, _4)	0
#define netmap_get_vale_na(_1, _2, _3, _4)	0
#define netmap_bdg_create(_1, _2)	NULL
#define netmap_bdg_destroy(_1, _2)	0
#define vale_max_bridges		1
#endif /* !WITH_VALE */
1560f9790aebSLuigi Rizzo
1561f0ea3689SLuigi Rizzo #ifdef WITH_PIPES
1562f0ea3689SLuigi Rizzo /* max number of pipes per device */
15634f80b14cSVincenzo Maffione #define NM_MAXPIPES 64 /* XXX this should probably be a sysctl */
1564f0ea3689SLuigi Rizzo void netmap_pipe_dealloc(struct netmap_adapter *);
15652ff91c17SVincenzo Maffione int netmap_get_pipe_na(struct nmreq_header *hdr, struct netmap_adapter **na,
1566c3e9b4dbSLuiz Otavio O Souza struct netmap_mem_d *nmd, int create);
1567f0ea3689SLuigi Rizzo #else /* !WITH_PIPES */
1568f0ea3689SLuigi Rizzo #define NM_MAXPIPES 0
1569847bf383SLuigi Rizzo #define netmap_pipe_alloc(_1, _2) 0
1570f0ea3689SLuigi Rizzo #define netmap_pipe_dealloc(_1)
15712ff91c17SVincenzo Maffione #define netmap_get_pipe_na(hdr, _2, _3, _4) \
15722ff91c17SVincenzo Maffione ((strchr(hdr->nr_name, '{') != NULL || strchr(hdr->nr_name, '}') != NULL) ? EOPNOTSUPP : 0)
1573f0ea3689SLuigi Rizzo #endif
1574f0ea3689SLuigi Rizzo
15754bf50f18SLuigi Rizzo #ifdef WITH_MONITOR
15762ff91c17SVincenzo Maffione int netmap_get_monitor_na(struct nmreq_header *hdr, struct netmap_adapter **na,
1577c3e9b4dbSLuiz Otavio O Souza struct netmap_mem_d *nmd, int create);
1578847bf383SLuigi Rizzo void netmap_monitor_stop(struct netmap_adapter *na);
15794bf50f18SLuigi Rizzo #else
15802ff91c17SVincenzo Maffione #define netmap_get_monitor_na(hdr, _2, _3, _4) \
1581cfa866f6SMatt Macy (((struct nmreq_register *)(uintptr_t)hdr->nr_body)->nr_flags & (NR_MONITOR_TX | NR_MONITOR_RX) ? EOPNOTSUPP : 0)
1582847bf383SLuigi Rizzo #endif
1583847bf383SLuigi Rizzo
/*
 * Lookup of null adapters. With WITH_NMNULL this is a real function;
 * otherwise a macro stub that evaluates to EOPNOTSUPP or 0 depending on
 * the nr_flags of the struct nmreq_register found at hdr->nr_body.
 */
#ifdef WITH_NMNULL
int netmap_get_null_na(struct nmreq_header *hdr, struct netmap_adapter **na,
		struct netmap_mem_d *nmd, int create);
#else /* !WITH_NMNULL */
/* NOTE(review): the test below checks NR_MONITOR_TX | NR_MONITOR_RX,
 * exactly like the netmap_get_monitor_na() stub; this looks copy-pasted.
 * Confirm which request field identifies a null port and whether this
 * stub should test that instead.
 */
#define netmap_get_null_na(hdr, _2, _3, _4) \
	(((struct nmreq_register *)(uintptr_t)hdr->nr_body)->nr_flags & (NR_MONITOR_TX | NR_MONITOR_RX) ? EOPNOTSUPP : 0)
#endif /* WITH_NMNULL */
1591b6e66be2SVincenzo Maffione
1592847bf383SLuigi Rizzo #ifdef CONFIG_NET_NS
1593847bf383SLuigi Rizzo struct net *netmap_bns_get(void);
1594847bf383SLuigi Rizzo void netmap_bns_put(struct net *);
1595847bf383SLuigi Rizzo void netmap_bns_getbridges(struct nm_bridge **, u_int *);
1596847bf383SLuigi Rizzo #else
1597b6e66be2SVincenzo Maffione extern struct nm_bridge *nm_bridges;
1598847bf383SLuigi Rizzo #define netmap_bns_get()
1599847bf383SLuigi Rizzo #define netmap_bns_put(_1)
1600847bf383SLuigi Rizzo #define netmap_bns_getbridges(b, n) \
1601dd6ab49aSVincenzo Maffione do { *b = nm_bridges; *n = vale_max_bridges; } while (0)
16024bf50f18SLuigi Rizzo #endif
16034bf50f18SLuigi Rizzo
1604f9790aebSLuigi Rizzo /* Various prototypes */
160537e3a6d3SLuigi Rizzo int netmap_poll(struct netmap_priv_d *, int events, NM_SELRECORD_T *td);
1606f9790aebSLuigi Rizzo int netmap_init(void);
1607f9790aebSLuigi Rizzo void netmap_fini(void);
1608f9790aebSLuigi Rizzo int netmap_get_memory(struct netmap_priv_d* p);
1609f9790aebSLuigi Rizzo void netmap_dtor(void *data);
1610f9790aebSLuigi Rizzo
16112ff91c17SVincenzo Maffione int netmap_ioctl(struct netmap_priv_d *priv, u_long cmd, caddr_t data,
16122ff91c17SVincenzo Maffione struct thread *, int nr_body_is_user);
16132ff91c17SVincenzo Maffione int netmap_ioctl_legacy(struct netmap_priv_d *priv, u_long cmd, caddr_t data,
16142ff91c17SVincenzo Maffione struct thread *td);
16152ff91c17SVincenzo Maffione size_t nmreq_size_by_type(uint16_t nr_reqtype);
1616f9790aebSLuigi Rizzo
1617f9790aebSLuigi Rizzo /* netmap_adapter creation/destruction */
161817885a7bSLuigi Rizzo
161917885a7bSLuigi Rizzo // #define NM_DEBUG_PUTGET 1
1620f9790aebSLuigi Rizzo
1621f9790aebSLuigi Rizzo #ifdef NM_DEBUG_PUTGET
1622f9790aebSLuigi Rizzo
1623f9790aebSLuigi Rizzo #define NM_DBG(f) __##f
1624f9790aebSLuigi Rizzo
1625f9790aebSLuigi Rizzo void __netmap_adapter_get(struct netmap_adapter *na);
1626f9790aebSLuigi Rizzo
1627f9790aebSLuigi Rizzo #define netmap_adapter_get(na) \
1628f9790aebSLuigi Rizzo do { \
1629f9790aebSLuigi Rizzo struct netmap_adapter *__na = na; \
1630f9790aebSLuigi Rizzo __netmap_adapter_get(__na); \
163192e8b4a6SVincenzo Maffione nm_prinf("getting %p:%s -> %d", __na, (__na)->name, (__na)->na_refcount); \
1632f9790aebSLuigi Rizzo } while (0)
1633f9790aebSLuigi Rizzo
1634f9790aebSLuigi Rizzo int __netmap_adapter_put(struct netmap_adapter *na);
1635f9790aebSLuigi Rizzo
1636f9790aebSLuigi Rizzo #define netmap_adapter_put(na) \
1637fb25194fSLuigi Rizzo ({ \
1638f9790aebSLuigi Rizzo struct netmap_adapter *__na = na; \
163992e8b4a6SVincenzo Maffione if (__na == NULL) \
164092e8b4a6SVincenzo Maffione nm_prinf("putting NULL"); \
164192e8b4a6SVincenzo Maffione else \
164292e8b4a6SVincenzo Maffione nm_prinf("putting %p:%s -> %d", __na, (__na)->name, (__na)->na_refcount - 1); \
1643f9790aebSLuigi Rizzo __netmap_adapter_put(__na); \
1644fb25194fSLuigi Rizzo })
1645f9790aebSLuigi Rizzo
1646f9790aebSLuigi Rizzo #else /* !NM_DEBUG_PUTGET */
1647f9790aebSLuigi Rizzo
1648f9790aebSLuigi Rizzo #define NM_DBG(f) f
1649f9790aebSLuigi Rizzo void netmap_adapter_get(struct netmap_adapter *na);
1650f9790aebSLuigi Rizzo int netmap_adapter_put(struct netmap_adapter *na);
1651f9790aebSLuigi Rizzo
1652f9790aebSLuigi Rizzo #endif /* !NM_DEBUG_PUTGET */
1653f9790aebSLuigi Rizzo
1654f9790aebSLuigi Rizzo
165517885a7bSLuigi Rizzo /*
165617885a7bSLuigi Rizzo * module variables
165717885a7bSLuigi Rizzo */
165837e3a6d3SLuigi Rizzo #define NETMAP_BUF_BASE(_na) ((_na)->na_lut.lut[0].vaddr)
165937e3a6d3SLuigi Rizzo #define NETMAP_BUF_SIZE(_na) ((_na)->na_lut.objsize)
16605819da83SLuigi Rizzo extern int netmap_no_pendintr;
1661b6e66be2SVincenzo Maffione extern int netmap_verbose;
1662b6e66be2SVincenzo Maffione #ifdef CONFIG_NETMAP_DEBUG
1663b6e66be2SVincenzo Maffione extern int netmap_debug; /* for debugging */
1664b6e66be2SVincenzo Maffione #else /* !CONFIG_NETMAP_DEBUG */
1665b6e66be2SVincenzo Maffione #define netmap_debug (0)
1666b6e66be2SVincenzo Maffione #endif /* !CONFIG_NETMAP_DEBUG */
/* Bit values that can be combined in netmap_debug. */
enum {                                  /* debug flags */
	NM_DEBUG_ON = 1,		/* generic debug messages */
	NM_DEBUG_HOST = 0x2,            /* debug host stack */
	NM_DEBUG_RXSYNC = 0x10,         /* debug on rxsync/txsync */
	NM_DEBUG_TXSYNC = 0x20,
	NM_DEBUG_RXINTR = 0x100,        /* debug on rx/tx intr (driver) */
	NM_DEBUG_TXINTR = 0x200,
	/* NOTE(review): presumably debug on the NIC (driver) rxsync/txsync;
	 * the previous comment repeated the one on NM_DEBUG_RXINTR - confirm.
	 */
	NM_DEBUG_NIC_RXSYNC = 0x1000,
	NM_DEBUG_NIC_TXSYNC = 0x2000,
	NM_DEBUG_MEM = 0x4000,          /* verbose memory allocations/deallocations */
	/* NOTE(review): presumably debug messages from the VALE/bridge code;
	 * the previous comment mentioned memory allocators, which is what
	 * NM_DEBUG_MEM covers - confirm.
	 */
	NM_DEBUG_VALE = 0x8000,
	NM_DEBUG_BDG = NM_DEBUG_VALE,	/* alias of NM_DEBUG_VALE */
};
168068b8534bSLuigi Rizzo
/* Tunables defined elsewhere in the module. */
extern int netmap_txsync_retry;
extern int netmap_generic_hwcsum;
extern int netmap_generic_mit;
extern int netmap_generic_ringsize;
extern int netmap_generic_rings;
#if defined(linux)
extern int netmap_generic_txqdisc;	/* declared on linux only */
#endif /* linux */
1689f9790aebSLuigi Rizzo
/*
 * NA(ifp) yields the struct netmap_adapter pointer associated with ifp,
 * as returned by if_getnetmapadapter(). That getter and the matching
 * if_setnetmapadapter() setter are os-specific and must be provided by
 * the glue code.
 */
#define NA(_ifp)	(if_getnetmapadapter(_ifp))
169668b8534bSLuigi Rizzo
/*
 * we provide a default implementation of NM_ATTACH_NA/NM_DETACH_NA
 * based on the if_setnetmapadapter() setter function.
 * Glue code may override this by defining its own NM_ATTACH_NA
 */
#ifndef NM_ATTACH_NA
/*
 * On old versions of FreeBSD, NA(ifp) is a pspare. On linux we
 * overload another pointer in the netdev.
 *
 * We check if NA(ifp) is set and its first element has a related
 * magic value. The capenable is within the struct netmap_adapter.
 */
#define NETMAP_MAGIC	0x52697a7a

/*
 * True when NA(ifp) is non-NULL and the low 32 bits of that pointer,
 * XORed with the adapter's magic field, give NETMAP_MAGIC.
 * Note: ifp is evaluated more than once.
 */
#define NM_NA_VALID(ifp)	(NA(ifp) &&				\
	((uint32_t)(uintptr_t)NA(ifp) ^ NA(ifp)->magic) == NETMAP_MAGIC )

/*
 * Install na on ifp and, if an adapter is then present, stamp its magic
 * field so that NM_NA_VALID(ifp) holds. Note: ifp is evaluated more than
 * once.
 */
#define NM_ATTACH_NA(ifp, na) do {					\
	if_setnetmapadapter(ifp, na);					\
	if (NA(ifp))							\
		NA(ifp)->magic =					\
			((uint32_t)(uintptr_t)NA(ifp)) ^ NETMAP_MAGIC;	\
} while (0)

/*
 * Install na on ifp without touching the magic field.
 * The expansion deliberately carries no trailing semicolon (the caller
 * supplies it), so the macro is a single statement and can be used as
 * the body of an unbraced if/else, like NM_ATTACH_NA and NM_DETACH_NA.
 */
#define NM_RESTORE_NA(ifp, na) do { if_setnetmapadapter(ifp, na); } while (0)

/* Clear the adapter pointer stored in ifp. */
#define NM_DETACH_NA(ifp) do { if_setnetmapadapter(ifp, NULL); } while (0)

/* True when ifp carries a non-NULL pointer that fails the magic check. */
#define NM_NA_CLASH(ifp)	(NA(ifp) && !NM_NA_VALID(ifp))
#endif /* !NM_ATTACH_NA */
17262a7db7a6SVincenzo Maffione
17278241616dSLuigi Rizzo
/* True when ifp has a valid netmap adapter whose nm_dtor is netmap_hw_dtor. */
#define NM_IS_NATIVE(ifp)	\
	(NM_NA_VALID(ifp) && NA(ifp)->nm_dtor == netmap_hw_dtor)
172968b8534bSLuigi Rizzo
173037e3a6d3SLuigi Rizzo #if defined(__FreeBSD__)
1731*1bae9dc5SMark Johnston extern int netmap_port_numa_affinity;
1732f9790aebSLuigi Rizzo
/*
 * FreeBSD version: the adapter is not inspected and the result is
 * always -1.
 */
static inline int
nm_iommu_group_id(struct netmap_adapter *na)
{
	const int no_group = -1;

	return (no_group);
}
1738*1bae9dc5SMark Johnston
1739*1bae9dc5SMark Johnston static inline int
nm_numa_domain(struct netmap_adapter * na)1740*1bae9dc5SMark Johnston nm_numa_domain(struct netmap_adapter *na)
1741*1bae9dc5SMark Johnston {
1742*1bae9dc5SMark Johnston int domain;
1743*1bae9dc5SMark Johnston
1744*1bae9dc5SMark Johnston /*
1745*1bae9dc5SMark Johnston * If the system has only one NUMA domain, don't bother distinguishing
1746*1bae9dc5SMark Johnston * between IF_NODOM and domain 0.
1747*1bae9dc5SMark Johnston */
1748*1bae9dc5SMark Johnston if (vm_ndomains == 1 || netmap_port_numa_affinity == 0)
1749*1bae9dc5SMark Johnston return (-1);
1750*1bae9dc5SMark Johnston domain = if_getnumadomain(na->ifp);
1751*1bae9dc5SMark Johnston if (domain == IF_NODOM)
1752*1bae9dc5SMark Johnston domain = -1;
1753*1bae9dc5SMark Johnston return (domain);
1754*1bae9dc5SMark Johnston }
17554bf50f18SLuigi Rizzo
175617885a7bSLuigi Rizzo /* Callback invoked by the dma machinery after a successful dmamap_load */
netmap_dmamap_cb(__unused void * arg,__unused bus_dma_segment_t * segs,__unused int nseg,__unused int error)17576dba29a2SLuigi Rizzo static void netmap_dmamap_cb(__unused void *arg,
17586dba29a2SLuigi Rizzo __unused bus_dma_segment_t * segs, __unused int nseg, __unused int error)
17596dba29a2SLuigi Rizzo {
17606dba29a2SLuigi Rizzo }
17616dba29a2SLuigi Rizzo
17626dba29a2SLuigi Rizzo /* bus_dmamap_load wrapper: call aforementioned function if map != NULL.
17636dba29a2SLuigi Rizzo * XXX can we do it without a callback ?
17646dba29a2SLuigi Rizzo */
17654f80b14cSVincenzo Maffione static inline int
netmap_load_map(struct netmap_adapter * na,bus_dma_tag_t tag,bus_dmamap_t map,void * buf)17664bf50f18SLuigi Rizzo netmap_load_map(struct netmap_adapter *na,
17674bf50f18SLuigi Rizzo bus_dma_tag_t tag, bus_dmamap_t map, void *buf)
17686dba29a2SLuigi Rizzo {
17696dba29a2SLuigi Rizzo if (map)
17704bf50f18SLuigi Rizzo bus_dmamap_load(tag, map, buf, NETMAP_BUF_SIZE(na),
17716dba29a2SLuigi Rizzo netmap_dmamap_cb, NULL, BUS_DMA_NOWAIT);
17724f80b14cSVincenzo Maffione return 0;
17736dba29a2SLuigi Rizzo }
17746dba29a2SLuigi Rizzo
17754bf50f18SLuigi Rizzo static inline void
netmap_unload_map(struct netmap_adapter * na,bus_dma_tag_t tag,bus_dmamap_t map)17764bf50f18SLuigi Rizzo netmap_unload_map(struct netmap_adapter *na,
17774bf50f18SLuigi Rizzo bus_dma_tag_t tag, bus_dmamap_t map)
17784bf50f18SLuigi Rizzo {
17794bf50f18SLuigi Rizzo if (map)
17804bf50f18SLuigi Rizzo bus_dmamap_unload(tag, map);
17814bf50f18SLuigi Rizzo }
17824bf50f18SLuigi Rizzo
/* In the FreeBSD branch this expands to nothing; arguments are not evaluated. */
#define netmap_sync_map(na, tag, map, sz, t)
17844f80b14cSVincenzo Maffione
17856dba29a2SLuigi Rizzo /* update the map when a buffer changes. */
17866dba29a2SLuigi Rizzo static inline void
netmap_reload_map(struct netmap_adapter * na,bus_dma_tag_t tag,bus_dmamap_t map,void * buf)17874bf50f18SLuigi Rizzo netmap_reload_map(struct netmap_adapter *na,
17884bf50f18SLuigi Rizzo bus_dma_tag_t tag, bus_dmamap_t map, void *buf)
17896dba29a2SLuigi Rizzo {
17906dba29a2SLuigi Rizzo if (map) {
17916dba29a2SLuigi Rizzo bus_dmamap_unload(tag, map);
17924bf50f18SLuigi Rizzo bus_dmamap_load(tag, map, buf, NETMAP_BUF_SIZE(na),
17936dba29a2SLuigi Rizzo netmap_dmamap_cb, NULL, BUS_DMA_NOWAIT);
17946dba29a2SLuigi Rizzo }
17956dba29a2SLuigi Rizzo }
1796f9790aebSLuigi Rizzo
179737e3a6d3SLuigi Rizzo #elif defined(_WIN32)
179837e3a6d3SLuigi Rizzo
1799f196ce38SLuigi Rizzo #else /* linux */
1800f196ce38SLuigi Rizzo
18014bf50f18SLuigi Rizzo int nm_iommu_group_id(bus_dma_tag_t dev);
18024bf50f18SLuigi Rizzo #include <linux/dma-mapping.h>
18034bf50f18SLuigi Rizzo
1804f196ce38SLuigi Rizzo /*
1805f196ce38SLuigi Rizzo * on linux we need
1806f196ce38SLuigi Rizzo * dma_map_single(&pdev->dev, virt_addr, len, direction)
18074f80b14cSVincenzo Maffione * dma_unmap_single(&adapter->pdev->dev, phys_addr, len, direction)
1808f196ce38SLuigi Rizzo */
1809f196ce38SLuigi Rizzo #if 0
1810f196ce38SLuigi Rizzo struct e1000_buffer *buffer_info = &tx_ring->buffer_info[l];
1811f196ce38SLuigi Rizzo /* set time_stamp *before* dma to help avoid a possible race */
1812f196ce38SLuigi Rizzo buffer_info->time_stamp = jiffies;
1813f196ce38SLuigi Rizzo buffer_info->mapped_as_page = false;
1814f196ce38SLuigi Rizzo buffer_info->length = len;
1815f196ce38SLuigi Rizzo //buffer_info->next_to_watch = l;
1816f196ce38SLuigi Rizzo /* reload dma map */
1817f196ce38SLuigi Rizzo dma_unmap_single(&adapter->pdev->dev, buffer_info->dma,
1818f196ce38SLuigi Rizzo NETMAP_BUF_SIZE, DMA_TO_DEVICE);
1819f196ce38SLuigi Rizzo buffer_info->dma = dma_map_single(&adapter->pdev->dev,
1820f196ce38SLuigi Rizzo addr, NETMAP_BUF_SIZE, DMA_TO_DEVICE);
1821f196ce38SLuigi Rizzo
1822f196ce38SLuigi Rizzo if (dma_mapping_error(&adapter->pdev->dev, buffer_info->dma)) {
182375f4f3edSVincenzo Maffione nm_prerr("dma mapping error");
1824f196ce38SLuigi Rizzo /* goto dma_error; See e1000_put_txbuf() */
1825f196ce38SLuigi Rizzo /* XXX reset */
1826f196ce38SLuigi Rizzo }
1827f196ce38SLuigi Rizzo tx_desc->buffer_addr = htole64(buffer_info->dma); //XXX
1828f196ce38SLuigi Rizzo
1829f196ce38SLuigi Rizzo #endif
1830f196ce38SLuigi Rizzo
18314f80b14cSVincenzo Maffione static inline int
netmap_load_map(struct netmap_adapter * na,bus_dma_tag_t tag,bus_dmamap_t map,void * buf,u_int size)18324f80b14cSVincenzo Maffione netmap_load_map(struct netmap_adapter *na,
18334f80b14cSVincenzo Maffione bus_dma_tag_t tag, bus_dmamap_t map, void *buf, u_int size)
18344f80b14cSVincenzo Maffione {
18354f80b14cSVincenzo Maffione if (map) {
18364f80b14cSVincenzo Maffione *map = dma_map_single(na->pdev, buf, size,
18374f80b14cSVincenzo Maffione DMA_BIDIRECTIONAL);
18384f80b14cSVincenzo Maffione if (dma_mapping_error(na->pdev, *map)) {
18394f80b14cSVincenzo Maffione *map = 0;
18404f80b14cSVincenzo Maffione return ENOMEM;
18414f80b14cSVincenzo Maffione }
18424f80b14cSVincenzo Maffione }
18434f80b14cSVincenzo Maffione return 0;
18444f80b14cSVincenzo Maffione }
18454f80b14cSVincenzo Maffione
18464f80b14cSVincenzo Maffione static inline void
netmap_unload_map(struct netmap_adapter * na,bus_dma_tag_t tag,bus_dmamap_t map,u_int sz)18474f80b14cSVincenzo Maffione netmap_unload_map(struct netmap_adapter *na,
18484f80b14cSVincenzo Maffione bus_dma_tag_t tag, bus_dmamap_t map, u_int sz)
18494f80b14cSVincenzo Maffione {
18504f80b14cSVincenzo Maffione if (*map) {
18514f80b14cSVincenzo Maffione dma_unmap_single(na->pdev, *map, sz,
18524f80b14cSVincenzo Maffione DMA_BIDIRECTIONAL);
18534f80b14cSVincenzo Maffione }
18544f80b14cSVincenzo Maffione }
18554f80b14cSVincenzo Maffione
18562a7db7a6SVincenzo Maffione #ifdef NETMAP_LINUX_HAVE_DMASYNC
18574f80b14cSVincenzo Maffione static inline void
netmap_sync_map_cpu(struct netmap_adapter * na,bus_dma_tag_t tag,bus_dmamap_t map,u_int sz,enum txrx t)18582a7db7a6SVincenzo Maffione netmap_sync_map_cpu(struct netmap_adapter *na,
18594f80b14cSVincenzo Maffione bus_dma_tag_t tag, bus_dmamap_t map, u_int sz, enum txrx t)
18604f80b14cSVincenzo Maffione {
18614f80b14cSVincenzo Maffione if (*map) {
18624f80b14cSVincenzo Maffione dma_sync_single_for_cpu(na->pdev, *map, sz,
18632a7db7a6SVincenzo Maffione (t == NR_TX ? DMA_TO_DEVICE : DMA_FROM_DEVICE));
18642a7db7a6SVincenzo Maffione }
18652a7db7a6SVincenzo Maffione }
18662a7db7a6SVincenzo Maffione
18672a7db7a6SVincenzo Maffione static inline void
netmap_sync_map_dev(struct netmap_adapter * na,bus_dma_tag_t tag,bus_dmamap_t map,u_int sz,enum txrx t)18682a7db7a6SVincenzo Maffione netmap_sync_map_dev(struct netmap_adapter *na,
18692a7db7a6SVincenzo Maffione bus_dma_tag_t tag, bus_dmamap_t map, u_int sz, enum txrx t)
18702a7db7a6SVincenzo Maffione {
18712a7db7a6SVincenzo Maffione if (*map) {
18724f80b14cSVincenzo Maffione dma_sync_single_for_device(na->pdev, *map, sz,
18732a7db7a6SVincenzo Maffione (t == NR_TX ? DMA_TO_DEVICE : DMA_FROM_DEVICE));
18744f80b14cSVincenzo Maffione }
18754f80b14cSVincenzo Maffione }
18764f80b14cSVincenzo Maffione
18774f80b14cSVincenzo Maffione static inline void
netmap_reload_map(struct netmap_adapter * na,bus_dma_tag_t tag,bus_dmamap_t map,void * buf)18784f80b14cSVincenzo Maffione netmap_reload_map(struct netmap_adapter *na,
18794f80b14cSVincenzo Maffione bus_dma_tag_t tag, bus_dmamap_t map, void *buf)
18804f80b14cSVincenzo Maffione {
18814f80b14cSVincenzo Maffione u_int sz = NETMAP_BUF_SIZE(na);
18824f80b14cSVincenzo Maffione
18834f80b14cSVincenzo Maffione if (*map) {
18844f80b14cSVincenzo Maffione dma_unmap_single(na->pdev, *map, sz,
18854f80b14cSVincenzo Maffione DMA_BIDIRECTIONAL);
18864f80b14cSVincenzo Maffione }
18874f80b14cSVincenzo Maffione
18884f80b14cSVincenzo Maffione *map = dma_map_single(na->pdev, buf, sz,
18894f80b14cSVincenzo Maffione DMA_BIDIRECTIONAL);
18904f80b14cSVincenzo Maffione }
18912a7db7a6SVincenzo Maffione #else /* !NETMAP_LINUX_HAVE_DMASYNC */
/* Without NETMAP_LINUX_HAVE_DMASYNC both sync helpers expand to nothing. */
#define netmap_sync_map_cpu(na, tag, map, sz, t)
#define netmap_sync_map_dev(na, tag, map, sz, t)
18942a7db7a6SVincenzo Maffione #endif /* NETMAP_LINUX_HAVE_DMASYNC */
1895f196ce38SLuigi Rizzo
1896f196ce38SLuigi Rizzo #endif /* linux */
18976dba29a2SLuigi Rizzo
1898ce3ee1e7SLuigi Rizzo
18995644ccecSLuigi Rizzo /*
19005644ccecSLuigi Rizzo * functions to map NIC to KRING indexes (n2k) and vice versa (k2n)
19015644ccecSLuigi Rizzo */
19025644ccecSLuigi Rizzo static inline int
netmap_idx_n2k(struct netmap_kring * kr,int idx)190364ae02c3SLuigi Rizzo netmap_idx_n2k(struct netmap_kring *kr, int idx)
19045644ccecSLuigi Rizzo {
190564ae02c3SLuigi Rizzo int n = kr->nkr_num_slots;
1906b6e66be2SVincenzo Maffione
1907b6e66be2SVincenzo Maffione if (likely(kr->nkr_hwofs == 0)) {
1908b6e66be2SVincenzo Maffione return idx;
1909b6e66be2SVincenzo Maffione }
1910b6e66be2SVincenzo Maffione
191164ae02c3SLuigi Rizzo idx += kr->nkr_hwofs;
191264ae02c3SLuigi Rizzo if (idx < 0)
191364ae02c3SLuigi Rizzo return idx + n;
191464ae02c3SLuigi Rizzo else if (idx < n)
191564ae02c3SLuigi Rizzo return idx;
19165644ccecSLuigi Rizzo else
191764ae02c3SLuigi Rizzo return idx - n;
19185644ccecSLuigi Rizzo }
19195644ccecSLuigi Rizzo
19205644ccecSLuigi Rizzo
19215644ccecSLuigi Rizzo static inline int
netmap_idx_k2n(struct netmap_kring * kr,int idx)192264ae02c3SLuigi Rizzo netmap_idx_k2n(struct netmap_kring *kr, int idx)
19235644ccecSLuigi Rizzo {
192464ae02c3SLuigi Rizzo int n = kr->nkr_num_slots;
1925b6e66be2SVincenzo Maffione
1926b6e66be2SVincenzo Maffione if (likely(kr->nkr_hwofs == 0)) {
1927b6e66be2SVincenzo Maffione return idx;
1928b6e66be2SVincenzo Maffione }
1929b6e66be2SVincenzo Maffione
193064ae02c3SLuigi Rizzo idx -= kr->nkr_hwofs;
193164ae02c3SLuigi Rizzo if (idx < 0)
193264ae02c3SLuigi Rizzo return idx + n;
193364ae02c3SLuigi Rizzo else if (idx < n)
193464ae02c3SLuigi Rizzo return idx;
19355644ccecSLuigi Rizzo else
193664ae02c3SLuigi Rizzo return idx - n;
19375644ccecSLuigi Rizzo }
19385644ccecSLuigi Rizzo
19395644ccecSLuigi Rizzo
1940d76bf4ffSLuigi Rizzo /* Entries of the look-up table. */
19414f80b14cSVincenzo Maffione #ifdef __FreeBSD__
1942d76bf4ffSLuigi Rizzo struct lut_entry {
1943d76bf4ffSLuigi Rizzo void *vaddr; /* virtual address. */
1944849bec0eSLuigi Rizzo vm_paddr_t paddr; /* physical address. */
1945d76bf4ffSLuigi Rizzo };
19464f80b14cSVincenzo Maffione #else /* linux & _WIN32 */
19474f80b14cSVincenzo Maffione /* dma-mapping in linux can assign a buffer a different address
19484f80b14cSVincenzo Maffione * depending on the device, so we need to have a separate
19494f80b14cSVincenzo Maffione * physical-address look-up table for each na.
19504f80b14cSVincenzo Maffione * We can still share the vaddrs, though, therefore we split
19514f80b14cSVincenzo Maffione * the lut_entry structure.
19524f80b14cSVincenzo Maffione */
19534f80b14cSVincenzo Maffione struct lut_entry {
19544f80b14cSVincenzo Maffione void *vaddr; /* virtual address. */
19554f80b14cSVincenzo Maffione };
19564f80b14cSVincenzo Maffione
19574f80b14cSVincenzo Maffione struct plut_entry {
19584f80b14cSVincenzo Maffione vm_paddr_t paddr; /* physical address. */
19594f80b14cSVincenzo Maffione };
19604f80b14cSVincenzo Maffione #endif /* linux & _WIN32 */
1961d76bf4ffSLuigi Rizzo
1962d76bf4ffSLuigi Rizzo struct netmap_obj_pool;
1963d76bf4ffSLuigi Rizzo
/* Alignment used for netmap buffers. */
#define NM_BUF_ALIGN	64
1966a6d768d8SVincenzo Maffione
196768b8534bSLuigi Rizzo /*
19686e10c8b8SLuigi Rizzo * NMB return the virtual address of a buffer (buffer 0 on bad index)
19696e10c8b8SLuigi Rizzo * PNMB also fills the physical address
197068b8534bSLuigi Rizzo */
19716e10c8b8SLuigi Rizzo static inline void *
NMB(struct netmap_adapter * na,struct netmap_slot * slot)19724bf50f18SLuigi Rizzo NMB(struct netmap_adapter *na, struct netmap_slot *slot)
1973f9790aebSLuigi Rizzo {
1974847bf383SLuigi Rizzo struct lut_entry *lut = na->na_lut.lut;
1975f9790aebSLuigi Rizzo uint32_t i = slot->buf_idx;
1976847bf383SLuigi Rizzo return (unlikely(i >= na->na_lut.objtotal)) ?
1977f9790aebSLuigi Rizzo lut[0].vaddr : lut[i].vaddr;
1978f9790aebSLuigi Rizzo }
1979f9790aebSLuigi Rizzo
19804bf50f18SLuigi Rizzo static inline void *
PNMB(struct netmap_adapter * na,struct netmap_slot * slot,uint64_t * pp)19814bf50f18SLuigi Rizzo PNMB(struct netmap_adapter *na, struct netmap_slot *slot, uint64_t *pp)
19824bf50f18SLuigi Rizzo {
19834bf50f18SLuigi Rizzo uint32_t i = slot->buf_idx;
1984847bf383SLuigi Rizzo struct lut_entry *lut = na->na_lut.lut;
19854f80b14cSVincenzo Maffione struct plut_entry *plut = na->na_lut.plut;
1986847bf383SLuigi Rizzo void *ret = (i >= na->na_lut.objtotal) ? lut[0].vaddr : lut[i].vaddr;
19874bf50f18SLuigi Rizzo
19884f80b14cSVincenzo Maffione #ifdef _WIN32
19894f80b14cSVincenzo Maffione *pp = (i >= na->na_lut.objtotal) ? (uint64_t)plut[0].paddr.QuadPart : (uint64_t)plut[i].paddr.QuadPart;
199037e3a6d3SLuigi Rizzo #else
19914f80b14cSVincenzo Maffione *pp = (i >= na->na_lut.objtotal) ? plut[0].paddr : plut[i].paddr;
199237e3a6d3SLuigi Rizzo #endif
19934bf50f18SLuigi Rizzo return ret;
19944bf50f18SLuigi Rizzo }
19954bf50f18SLuigi Rizzo
1996a6d768d8SVincenzo Maffione static inline void
nm_write_offset(struct netmap_kring * kring,struct netmap_slot * slot,uint64_t offset)1997a6d768d8SVincenzo Maffione nm_write_offset(struct netmap_kring *kring,
1998a6d768d8SVincenzo Maffione struct netmap_slot *slot, uint64_t offset)
1999a6d768d8SVincenzo Maffione {
2000a6d768d8SVincenzo Maffione slot->ptr = (slot->ptr & ~kring->offset_mask) |
2001a6d768d8SVincenzo Maffione (offset & kring->offset_mask);
2002a6d768d8SVincenzo Maffione }
2003a6d768d8SVincenzo Maffione
2004a6d768d8SVincenzo Maffione static inline uint64_t
nm_get_offset(struct netmap_kring * kring,struct netmap_slot * slot)2005a6d768d8SVincenzo Maffione nm_get_offset(struct netmap_kring *kring, struct netmap_slot *slot)
2006a6d768d8SVincenzo Maffione {
2007a6d768d8SVincenzo Maffione uint64_t offset = (slot->ptr & kring->offset_mask);
2008a6d768d8SVincenzo Maffione if (unlikely(offset > kring->offset_max))
2009a6d768d8SVincenzo Maffione offset = kring->offset_max;
2010a6d768d8SVincenzo Maffione return offset;
2011a6d768d8SVincenzo Maffione }
2012a6d768d8SVincenzo Maffione
2013a6d768d8SVincenzo Maffione static inline void *
NMB_O(struct netmap_kring * kring,struct netmap_slot * slot)2014a6d768d8SVincenzo Maffione NMB_O(struct netmap_kring *kring, struct netmap_slot *slot)
2015a6d768d8SVincenzo Maffione {
2016a6d768d8SVincenzo Maffione void *addr = NMB(kring->na, slot);
2017a6d768d8SVincenzo Maffione return (char *)addr + nm_get_offset(kring, slot);
2018a6d768d8SVincenzo Maffione }
2019a6d768d8SVincenzo Maffione
2020a6d768d8SVincenzo Maffione static inline void *
PNMB_O(struct netmap_kring * kring,struct netmap_slot * slot,uint64_t * pp)2021a6d768d8SVincenzo Maffione PNMB_O(struct netmap_kring *kring, struct netmap_slot *slot, uint64_t *pp)
2022a6d768d8SVincenzo Maffione {
2023a6d768d8SVincenzo Maffione void *addr = PNMB(kring->na, slot, pp);
2024a6d768d8SVincenzo Maffione uint64_t offset = nm_get_offset(kring, slot);
2025a6d768d8SVincenzo Maffione addr = (char *)addr + offset;
2026a6d768d8SVincenzo Maffione *pp += offset;
2027a6d768d8SVincenzo Maffione return addr;
2028a6d768d8SVincenzo Maffione }
2029a6d768d8SVincenzo Maffione
2030f9790aebSLuigi Rizzo
203117885a7bSLuigi Rizzo /*
20328fd44c93SLuigi Rizzo * Structure associated to each netmap file descriptor.
20338fd44c93SLuigi Rizzo * It is created on open and left unbound (np_nifp == NULL).
20348fd44c93SLuigi Rizzo * A successful NIOCREGIF will set np_nifp and the first few fields;
20358fd44c93SLuigi Rizzo * this is protected by a global lock (NMG_LOCK) due to low contention.
2036f9790aebSLuigi Rizzo *
20378fd44c93SLuigi Rizzo * np_refs counts the number of references to the structure: one for the fd,
20388fd44c93SLuigi Rizzo * plus (on FreeBSD) one for each active mmap which we track ourselves
203985fe4e7cSLuigi Rizzo * (linux automatically tracks them, but FreeBSD does not).
20408fd44c93SLuigi Rizzo * np_refs is protected by NMG_LOCK.
204117885a7bSLuigi Rizzo *
 * Read access to the structure is lock free, because np_nifp, once set,
 * can only go back to NULL when nobody is using the entry anymore. Readers
 * must check that np_nifp != NULL before using the other fields.
2045f9790aebSLuigi Rizzo */
2046f9790aebSLuigi Rizzo struct netmap_priv_d {
2047f9790aebSLuigi Rizzo struct netmap_if * volatile np_nifp; /* netmap if descriptor. */
2048f9790aebSLuigi Rizzo
2049f9790aebSLuigi Rizzo struct netmap_adapter *np_na;
2050e330262fSJustin Hibbits if_t np_ifp;
2051f0ea3689SLuigi Rizzo uint32_t np_flags; /* from the ioctl */
2052847bf383SLuigi Rizzo u_int np_qfirst[NR_TXRX],
2053847bf383SLuigi Rizzo np_qlast[NR_TXRX]; /* range of tx/rx rings to scan */
20544f80b14cSVincenzo Maffione uint16_t np_txpoll;
2055b6e66be2SVincenzo Maffione uint16_t np_kloop_state; /* use with NMG_LOCK held */
2056b6e66be2SVincenzo Maffione #define NM_SYNC_KLOOP_RUNNING (1 << 0)
2057b6e66be2SVincenzo Maffione #define NM_SYNC_KLOOP_STOPPING (1 << 1)
2058c3e9b4dbSLuiz Otavio O Souza int np_sync_flags; /* to be passed to nm_sync */
2059f9790aebSLuigi Rizzo
20608fd44c93SLuigi Rizzo int np_refs; /* use with NMG_LOCK held */
2061f0ea3689SLuigi Rizzo
2062f0ea3689SLuigi Rizzo /* pointers to the selinfo to be used for selrecord.
2063f0ea3689SLuigi Rizzo * Either the local or the global one depending on the
2064f0ea3689SLuigi Rizzo * number of rings.
2065f0ea3689SLuigi Rizzo */
2066847bf383SLuigi Rizzo NM_SELINFO_T *np_si[NR_TXRX];
2067b6e66be2SVincenzo Maffione
2068b6e66be2SVincenzo Maffione /* In the optional CSB mode, the user must specify the start address
2069b6e66be2SVincenzo Maffione * of two arrays of Communication Status Block (CSB) entries, for the
2070b6e66be2SVincenzo Maffione * two directions (kernel read application write, and kernel write
2071b6e66be2SVincenzo Maffione * application read).
2072b6e66be2SVincenzo Maffione * The number of entries must agree with the number of rings bound to
2073b6e66be2SVincenzo Maffione * the netmap file descriptor. The entries corresponding to the TX
2074b6e66be2SVincenzo Maffione * rings are laid out before the ones corresponding to the RX rings.
2075b6e66be2SVincenzo Maffione *
2076b6e66be2SVincenzo Maffione * Array of CSB entries for application --> kernel communication
2077b6e66be2SVincenzo Maffione * (N entries). */
2078b6e66be2SVincenzo Maffione struct nm_csb_atok *np_csb_atok_base;
2079b6e66be2SVincenzo Maffione /* Array of CSB entries for kernel --> application communication
2080b6e66be2SVincenzo Maffione * (N entries). */
2081b6e66be2SVincenzo Maffione struct nm_csb_ktoa *np_csb_ktoa_base;
2082b6e66be2SVincenzo Maffione
2083b6e66be2SVincenzo Maffione #ifdef linux
2084b6e66be2SVincenzo Maffione struct file *np_filp; /* used by sync kloop */
2085b6e66be2SVincenzo Maffione #endif /* linux */
2086f9790aebSLuigi Rizzo };
2087f9790aebSLuigi Rizzo
/* Constructor/destructor pair for struct netmap_priv_d (defined elsewhere). */
struct netmap_priv_d	*netmap_priv_new(void);
void			 netmap_priv_delete(struct netmap_priv_d *);
209037e3a6d3SLuigi Rizzo
nm_kring_pending(struct netmap_priv_d * np)209137e3a6d3SLuigi Rizzo static inline int nm_kring_pending(struct netmap_priv_d *np)
209237e3a6d3SLuigi Rizzo {
209337e3a6d3SLuigi Rizzo struct netmap_adapter *na = np->np_na;
209437e3a6d3SLuigi Rizzo enum txrx t;
209537e3a6d3SLuigi Rizzo int i;
209637e3a6d3SLuigi Rizzo
209737e3a6d3SLuigi Rizzo for_rx_tx(t) {
209837e3a6d3SLuigi Rizzo for (i = np->np_qfirst[t]; i < np->np_qlast[t]; i++) {
20992ff91c17SVincenzo Maffione struct netmap_kring *kring = NMR(na, t)[i];
210037e3a6d3SLuigi Rizzo if (kring->nr_mode != kring->nr_pending_mode) {
210137e3a6d3SLuigi Rizzo return 1;
210237e3a6d3SLuigi Rizzo }
210337e3a6d3SLuigi Rizzo }
210437e3a6d3SLuigi Rizzo }
210537e3a6d3SLuigi Rizzo return 0;
210637e3a6d3SLuigi Rizzo }
210737e3a6d3SLuigi Rizzo
2108b6e66be2SVincenzo Maffione /* call with NMG_LOCK held */
2109b6e66be2SVincenzo Maffione static __inline int
nm_si_user(struct netmap_priv_d * priv,enum txrx t)2110b6e66be2SVincenzo Maffione nm_si_user(struct netmap_priv_d *priv, enum txrx t)
2111b6e66be2SVincenzo Maffione {
2112b6e66be2SVincenzo Maffione return (priv->np_na != NULL &&
2113b6e66be2SVincenzo Maffione (priv->np_qlast[t] - priv->np_qfirst[t] > 1));
2114b6e66be2SVincenzo Maffione }
2115b6e66be2SVincenzo Maffione
#if defined(WITH_PIPES)
/* Entry points of the pipe implementation, available with WITH_PIPES. */
int	netmap_pipe_txsync(struct netmap_kring *txkring, int flags);
int	netmap_pipe_rxsync(struct netmap_kring *rxkring, int flags);
int	netmap_pipe_krings_create_both(struct netmap_adapter *na,
	    struct netmap_adapter *ona);
void	netmap_pipe_krings_delete_both(struct netmap_adapter *na,
	    struct netmap_adapter *ona);
int	netmap_pipe_reg_both(struct netmap_adapter *na,
	    struct netmap_adapter *ona);
#endif /* WITH_PIPES */
2126c3e9b4dbSLuiz Otavio O Souza
#if defined(WITH_MONITOR)

/*
 * Adapter type for monitors: a netmap_adapter (first member) followed by
 * an embedded netmap_priv_d and a flags word.
 */
struct netmap_monitor_adapter {
	struct netmap_adapter	up;

	struct netmap_priv_d	priv;
	uint32_t		flags;
};

#endif /* WITH_MONITOR */
21374bf50f18SLuigi Rizzo
2138f9790aebSLuigi Rizzo
2139039dd540SLuigi Rizzo #ifdef WITH_GENERIC
2140f9790aebSLuigi Rizzo /*
2141f9790aebSLuigi Rizzo * generic netmap emulation for devices that do not have
2142f9790aebSLuigi Rizzo * native netmap support.
2143f9790aebSLuigi Rizzo */
2144e330262fSJustin Hibbits int generic_netmap_attach(if_t ifp);
2145e330262fSJustin Hibbits int generic_rx_handler(if_t ifp, struct mbuf *m);
2146f9790aebSLuigi Rizzo
214737e3a6d3SLuigi Rizzo int nm_os_catch_rx(struct netmap_generic_adapter *gna, int intercept);
214837e3a6d3SLuigi Rizzo int nm_os_catch_tx(struct netmap_generic_adapter *gna, int intercept);
214937e3a6d3SLuigi Rizzo
2150c3e9b4dbSLuiz Otavio O Souza int na_is_generic(struct netmap_adapter *na);
2151c3e9b4dbSLuiz Otavio O Souza
215237e3a6d3SLuigi Rizzo /*
215337e3a6d3SLuigi Rizzo * the generic transmit routine is passed a structure to optionally
215437e3a6d3SLuigi Rizzo * build a queue of descriptors, in an OS-specific way.
215537e3a6d3SLuigi Rizzo * The payload is at addr, if non-null, and the routine should send or queue
215637e3a6d3SLuigi Rizzo * the packet, returning 0 if successful, 1 on failure.
215737e3a6d3SLuigi Rizzo *
215837e3a6d3SLuigi Rizzo * At the end, if head is non-null, there will be an additional call
215937e3a6d3SLuigi Rizzo * to the function with addr = NULL; this should tell the OS-specific
216037e3a6d3SLuigi Rizzo * routine to send the queue and free any resources. Failure is ignored.
216137e3a6d3SLuigi Rizzo */
216237e3a6d3SLuigi Rizzo struct nm_os_gen_arg {
2163e330262fSJustin Hibbits if_t ifp;
216437e3a6d3SLuigi Rizzo void *m; /* os-specific mbuf-like object */
216537e3a6d3SLuigi Rizzo void *head, *tail; /* tailq, if the OS-specific routine needs to build one */
216637e3a6d3SLuigi Rizzo void *addr; /* payload of current packet */
216737e3a6d3SLuigi Rizzo u_int len; /* packet length */
2168854b2f30SMark Johnston u_int ring_nr; /* transmit ring index */
216937e3a6d3SLuigi Rizzo u_int qevent; /* in txqdisc mode, place an event on this mbuf */
217037e3a6d3SLuigi Rizzo };
217137e3a6d3SLuigi Rizzo
217237e3a6d3SLuigi Rizzo int nm_os_generic_xmit_frame(struct nm_os_gen_arg *);
2173e330262fSJustin Hibbits int nm_os_generic_find_num_desc(if_t ifp, u_int *tx, u_int *rx);
2174e330262fSJustin Hibbits void nm_os_generic_find_num_queues(if_t ifp, u_int *txq, u_int *rxq);
217537e3a6d3SLuigi Rizzo void nm_os_generic_set_features(struct netmap_generic_adapter *gna);
217637e3a6d3SLuigi Rizzo
2177e330262fSJustin Hibbits static inline if_t
netmap_generic_getifp(struct netmap_generic_adapter * gna)2178847bf383SLuigi Rizzo netmap_generic_getifp(struct netmap_generic_adapter *gna)
2179847bf383SLuigi Rizzo {
2180847bf383SLuigi Rizzo if (gna->prev)
2181847bf383SLuigi Rizzo return gna->prev->ifp;
2182847bf383SLuigi Rizzo
2183847bf383SLuigi Rizzo return gna->up.up.ifp;
2184847bf383SLuigi Rizzo }
2185f9790aebSLuigi Rizzo
218637e3a6d3SLuigi Rizzo void netmap_generic_irq(struct netmap_adapter *na, u_int q, u_int *work_done);
218737e3a6d3SLuigi Rizzo
21884bf50f18SLuigi Rizzo //#define RATE_GENERIC /* Enables communication statistics for generic. */
21894bf50f18SLuigi Rizzo #ifdef RATE_GENERIC
21904bf50f18SLuigi Rizzo void generic_rate(int txp, int txs, int txi, int rxp, int rxs, int rxi);
21914bf50f18SLuigi Rizzo #else
21924bf50f18SLuigi Rizzo #define generic_rate(txp, txs, txi, rxp, rxs, rxi)
21934bf50f18SLuigi Rizzo #endif
21944bf50f18SLuigi Rizzo
/*
 * netmap_mitigation API. This is used by the generic adapter
 * to reduce the number of interrupt requests/selwakeup
 * to clients on incoming packets.
 */
void	nm_os_mitigation_init(struct nm_generic_mit *mit, int idx,
	    struct netmap_adapter *na);
void	nm_os_mitigation_start(struct nm_generic_mit *mit);
void	nm_os_mitigation_restart(struct nm_generic_mit *mit);
int	nm_os_mitigation_active(struct nm_generic_mit *mit);
void	nm_os_mitigation_cleanup(struct nm_generic_mit *mit);
220637e3a6d3SLuigi Rizzo #else /* !WITH_GENERIC */
/* Without WITH_GENERIC: attaching is unsupported and no adapter is generic. */
#define generic_netmap_attach(ifp)	(EOPNOTSUPP)
#define na_is_generic(na)		(0)
2209039dd540SLuigi Rizzo #endif /* WITH_GENERIC */
2210f0ea3689SLuigi Rizzo
2211f0ea3689SLuigi Rizzo /* Shared declarations for the VALE switch. */
2212f0ea3689SLuigi Rizzo
/*
 * Each transmit queue accumulates a batch of packets into
 * a structure before forwarding. Packets to the same
 * destination are put in a list using ft_next as a link field.
 * ft_frags and ft_next are valid only on the first fragment.
 */
struct nm_bdg_fwd {	/* forwarding entry for a bridge */
	void		*ft_buf;	/* netmap or indirect buffer */
	uint8_t		 ft_frags;	/* how many fragments (only on 1st frag) */
	/*
	 * NOTE(review): the inherited comment read "dst port (unused)",
	 * which does not match the field name; presumably an offset
	 * relative to ft_buf -- confirm against the users of this field.
	 */
	uint16_t	 ft_offset;
	uint16_t	 ft_flags;	/* flags, e.g. indirect */
	uint16_t	 ft_len;	/* src fragment len */
	uint16_t	 ft_next;	/* next packet to same destination */
};
2227f0ea3689SLuigi Rizzo
/* Values for nm_vnet_hdr.flags. */
#define VIRTIO_NET_HDR_F_NEEDS_CSUM	1	/* Use csum_start, csum_offset */
#define VIRTIO_NET_HDR_F_DATA_VALID	2	/* Csum is valid */

/* Values for nm_vnet_hdr.gso_type. */
#define VIRTIO_NET_HDR_GSO_NONE		0	/* Not a GSO frame */
#define VIRTIO_NET_HDR_GSO_TCPV4	1	/* GSO frame, IPv4 TCP (TSO) */
#define VIRTIO_NET_HDR_GSO_UDP		3	/* GSO frame, IPv4 UDP (UFO) */
#define VIRTIO_NET_HDR_GSO_TCPV6	4	/* GSO frame, IPv6 TCP */
#define VIRTIO_NET_HDR_GSO_ECN		0x80	/* TCP has ECN set */

/* Private copy of struct 'virtio_net_hdr' from linux. */
struct nm_vnet_hdr {
	uint8_t		flags;		/* VIRTIO_NET_HDR_F_* */
	uint8_t		gso_type;	/* VIRTIO_NET_HDR_GSO_* */
	uint16_t	hdr_len;
	uint16_t	gso_size;
	uint16_t	csum_start;
	uint16_t	csum_offset;
};

/* Largest header prefix considered for GSO: 14 + IPv6 (40) + TCP (60). */
#define WORST_CASE_GSO_HEADER	(14+40+60)
2246f0ea3689SLuigi Rizzo
/* Private definitions for IPv4, IPv6, UDP and TCP headers. */

/* Fixed part of an IPv4 header; any options follow the structure. */
struct nm_iphdr {
	uint8_t		version_ihl;	/* version and header length, packed */
	uint8_t		tos;
	uint16_t	tot_len;
	uint16_t	id;
	uint16_t	frag_off;
	uint8_t		ttl;
	uint8_t		protocol;
	uint16_t	check;		/* header checksum */
	uint32_t	saddr;		/* source address */
	uint32_t	daddr;		/* destination address */
	/* The options start here. */
};
2262f0ea3689SLuigi Rizzo
/* Private definition of the fixed part of a TCP header. */
struct nm_tcphdr {
	uint16_t	source;		/* source port */
	uint16_t	dest;		/* destination port */
	uint32_t	seq;
	uint32_t	ack_seq;
	uint8_t		doff;		/* Data offset + Reserved */
	uint8_t		flags;
	uint16_t	window;
	uint16_t	check;		/* checksum */
	uint16_t	urg_ptr;
};
2274f0ea3689SLuigi Rizzo
/* Private definition of a UDP header. */
struct nm_udphdr {
	uint16_t	source;		/* source port */
	uint16_t	dest;		/* destination port */
	uint16_t	len;
	uint16_t	check;		/* checksum */
};
2281f0ea3689SLuigi Rizzo
/* Private definition of the fixed IPv6 header. */
struct nm_ipv6hdr {
	uint8_t		priority_version;	/* version and priority, packed */
	uint8_t		flow_lbl[3];

	uint16_t	payload_len;
	uint8_t		nexthdr;
	uint8_t		hop_limit;

	uint8_t		saddr[16];		/* source address */
	uint8_t		daddr[16];		/* destination address */
};
2293f0ea3689SLuigi Rizzo
/*
 * Type used to store a checksum (in host byte order) that hasn't been
 * folded yet.
 *
 * This is a real typedef rather than an object-like macro, so the name
 * obeys normal scoping rules and cannot be rewritten by the preprocessor
 * in unrelated contexts.
 */
typedef uint32_t rawsum_t;
2298f0ea3689SLuigi Rizzo
229937e3a6d3SLuigi Rizzo rawsum_t nm_os_csum_raw(uint8_t *data, size_t len, rawsum_t cur_sum);
230037e3a6d3SLuigi Rizzo uint16_t nm_os_csum_ipv4(struct nm_iphdr *iph);
230137e3a6d3SLuigi Rizzo void nm_os_csum_tcpudp_ipv4(struct nm_iphdr *iph, void *data,
2302f0ea3689SLuigi Rizzo size_t datalen, uint16_t *check);
230337e3a6d3SLuigi Rizzo void nm_os_csum_tcpudp_ipv6(struct nm_ipv6hdr *ip6h, void *data,
2304f0ea3689SLuigi Rizzo size_t datalen, uint16_t *check);
230537e3a6d3SLuigi Rizzo uint16_t nm_os_csum_fold(rawsum_t cur_sum);
2306f0ea3689SLuigi Rizzo
2307f0ea3689SLuigi Rizzo void bdg_mismatch_datapath(struct netmap_vp_adapter *na,
2308f0ea3689SLuigi Rizzo struct netmap_vp_adapter *dst_na,
230937e3a6d3SLuigi Rizzo const struct nm_bdg_fwd *ft_p,
231037e3a6d3SLuigi Rizzo struct netmap_ring *dst_ring,
2311f0ea3689SLuigi Rizzo u_int *j, u_int lim, u_int *howmany);
23124bf50f18SLuigi Rizzo
23134bf50f18SLuigi Rizzo /* persistent virtual port routines */
2314e330262fSJustin Hibbits int nm_os_vi_persist(const char *, if_t *);
2315e330262fSJustin Hibbits void nm_os_vi_detach(if_t);
231637e3a6d3SLuigi Rizzo void nm_os_vi_init_index(void);
231737e3a6d3SLuigi Rizzo
/*
 * kernel thread routines
 */

/* OS-specific kernel context - opaque */
struct nm_kctx;

/* Signature of the function executed by a kernel context worker. */
typedef void (*nm_kctx_worker_fn_t)(void *data);

/* kthread configuration */
struct nm_kctx_cfg {
	long			type;		/* kthread type/identifier */
	nm_kctx_worker_fn_t	worker_fn;	/* worker function */
	void			*worker_private; /* worker parameter */
	int			attach_user;	/* attach kthread to user process */
};
233137e3a6d3SLuigi Rizzo /* kthread configuration */
2332c3e9b4dbSLuiz Otavio O Souza struct nm_kctx *nm_os_kctx_create(struct nm_kctx_cfg *cfg,
2333844a6f0cSLuigi Rizzo void *opaque);
2334c3e9b4dbSLuiz Otavio O Souza int nm_os_kctx_worker_start(struct nm_kctx *);
2335c3e9b4dbSLuiz Otavio O Souza void nm_os_kctx_worker_stop(struct nm_kctx *);
2336c3e9b4dbSLuiz Otavio O Souza void nm_os_kctx_destroy(struct nm_kctx *);
2337c3e9b4dbSLuiz Otavio O Souza void nm_os_kctx_worker_setaff(struct nm_kctx *, int);
233837e3a6d3SLuigi Rizzo u_int nm_os_ncpus(void);
233937e3a6d3SLuigi Rizzo
/* Sync kloop entry points: run the loop for 'priv', or ask it to stop. */
int	netmap_sync_kloop(struct netmap_priv_d *priv,
	    struct nmreq_header *hdr);
int	netmap_sync_kloop_stop(struct netmap_priv_d *priv);
2343b6e66be2SVincenzo Maffione
2344b6e66be2SVincenzo Maffione #ifdef WITH_PTNETMAP
2345b6e66be2SVincenzo Maffione /* ptnetmap guest routines */
2346b6e66be2SVincenzo Maffione
234737e3a6d3SLuigi Rizzo /*
2348b6e66be2SVincenzo Maffione * ptnetmap_memdev routines used to talk with ptnetmap_memdev device driver
234937e3a6d3SLuigi Rizzo */
2350b6e66be2SVincenzo Maffione struct ptnetmap_memdev;
2351b6e66be2SVincenzo Maffione int nm_os_pt_memdev_iomap(struct ptnetmap_memdev *, vm_paddr_t *, void **,
2352b6e66be2SVincenzo Maffione uint64_t *);
2353b6e66be2SVincenzo Maffione void nm_os_pt_memdev_iounmap(struct ptnetmap_memdev *);
2354b6e66be2SVincenzo Maffione uint32_t nm_os_pt_memdev_ioread(struct ptnetmap_memdev *, unsigned int);
235537e3a6d3SLuigi Rizzo
235637e3a6d3SLuigi Rizzo /*
235737e3a6d3SLuigi Rizzo * netmap adapter for guest ptnetmap ports
235837e3a6d3SLuigi Rizzo */
235937e3a6d3SLuigi Rizzo struct netmap_pt_guest_adapter {
236037e3a6d3SLuigi Rizzo /* The netmap adapter to be used by netmap applications.
236137e3a6d3SLuigi Rizzo * This field must be the first, to allow upcast. */
236237e3a6d3SLuigi Rizzo struct netmap_hw_adapter hwup;
236337e3a6d3SLuigi Rizzo
236437e3a6d3SLuigi Rizzo /* The netmap adapter to be used by the driver. */
236537e3a6d3SLuigi Rizzo struct netmap_hw_adapter dr;
236637e3a6d3SLuigi Rizzo
236737e3a6d3SLuigi Rizzo /* Reference counter to track users of backend netmap port: the
236837e3a6d3SLuigi Rizzo * network stack and netmap clients.
236937e3a6d3SLuigi Rizzo * Used to decide when we need (de)allocate krings/rings and
237037e3a6d3SLuigi Rizzo * start (stop) ptnetmap kthreads. */
2371b6e66be2SVincenzo Maffione int backend_users;
237237e3a6d3SLuigi Rizzo
237337e3a6d3SLuigi Rizzo };
237437e3a6d3SLuigi Rizzo
/* Attach, per-kring sync and krings/dtor routines for guest ptnetmap ports. */
int	netmap_pt_guest_attach(struct netmap_adapter *na,
	    unsigned int nifp_offset, unsigned int memid);
bool	netmap_pt_guest_txsync(struct nm_csb_atok *atok,
	    struct nm_csb_ktoa *ktoa, struct netmap_kring *kring, int flags);
bool	netmap_pt_guest_rxsync(struct nm_csb_atok *atok,
	    struct nm_csb_ktoa *ktoa, struct netmap_kring *kring, int flags);
int	ptnet_nm_krings_create(struct netmap_adapter *na);
void	ptnet_nm_krings_delete(struct netmap_adapter *na);
void	ptnet_nm_dtor(struct netmap_adapter *na);
2387b6e66be2SVincenzo Maffione
2388f79ba6d7SVincenzo Maffione /* Helper function wrapping nm_sync_kloop_appl_read(). */
2389b6e66be2SVincenzo Maffione static inline void
ptnet_sync_tail(struct nm_csb_ktoa * ktoa,struct netmap_kring * kring)2390b6e66be2SVincenzo Maffione ptnet_sync_tail(struct nm_csb_ktoa *ktoa, struct netmap_kring *kring)
2391b6e66be2SVincenzo Maffione {
2392b6e66be2SVincenzo Maffione struct netmap_ring *ring = kring->ring;
2393b6e66be2SVincenzo Maffione
2394b6e66be2SVincenzo Maffione /* Update hwcur and hwtail as known by the host. */
2395f79ba6d7SVincenzo Maffione nm_sync_kloop_appl_read(ktoa, &kring->nr_hwtail, &kring->nr_hwcur);
2396b6e66be2SVincenzo Maffione
2397b6e66be2SVincenzo Maffione /* nm_sync_finalize */
2398b6e66be2SVincenzo Maffione ring->tail = kring->rtail = kring->nr_hwtail;
2399b6e66be2SVincenzo Maffione }
2400b6e66be2SVincenzo Maffione #endif /* WITH_PTNETMAP */
24014bf50f18SLuigi Rizzo
24022a7db7a6SVincenzo Maffione #ifdef __FreeBSD__
/*
 * FreeBSD mbuf allocator/deallocator in emulation mode:
 *
 * We allocate mbufs with m_gethdr(), since the mbuf header is needed
 * by the driver. We also attach custom external storage, which in this
 * case is an MCLBYTES-sized buffer allocated from zone_clust.
 *
 * The default dtor function returns that buffer to zone_clust. A dtor
 * is needed in any case, since mb_free_ext() has a KASSERT() checking
 * that the mbuf dtor function is not NULL.
 */
24132a7db7a6SVincenzo Maffione
2414ce12afaaSMark Johnston static inline void
nm_generic_mbuf_dtor(struct mbuf * m)2415ce12afaaSMark Johnston nm_generic_mbuf_dtor(struct mbuf *m)
2416ce12afaaSMark Johnston {
2417ce12afaaSMark Johnston uma_zfree(zone_clust, m->m_ext.ext_buf);
2418ce12afaaSMark Johnston }
24192a7db7a6SVincenzo Maffione
/*
 * Install the external-storage destructor of mbuf 'm'.
 *
 *   m   mbuf whose m_ext.ext_free / m_ext.ext_arg1 are written
 *   fn  destructor to install; when it compares equal to NULL,
 *       nm_generic_mbuf_dtor is installed instead
 *   na  value stored in m_ext.ext_arg1
 *
 * Every argument is parenthesized in the expansion, so arbitrary
 * expressions (e.g. a conditional) can be passed safely. Note that
 * 'm' and 'fn' are each evaluated twice: avoid side effects in them.
 */
#define SET_MBUF_DESTRUCTOR(m, fn, na)	do {			\
	(m)->m_ext.ext_free = ((fn) != NULL) ?			\
	    (void *)(fn) : (void *)nm_generic_mbuf_dtor;	\
	(m)->m_ext.ext_arg1 = (na);				\
} while (0)
24252a7db7a6SVincenzo Maffione
24262a7db7a6SVincenzo Maffione static inline struct mbuf *
nm_os_get_mbuf(if_t ifp __unused,int len)2427ce12afaaSMark Johnston nm_os_get_mbuf(if_t ifp __unused, int len)
24282a7db7a6SVincenzo Maffione {
24292a7db7a6SVincenzo Maffione struct mbuf *m;
2430ce12afaaSMark Johnston void *buf;
24312a7db7a6SVincenzo Maffione
2432ce12afaaSMark Johnston KASSERT(len <= MCLBYTES, ("%s: len %d", __func__, len));
24332a7db7a6SVincenzo Maffione
24342a7db7a6SVincenzo Maffione m = m_gethdr(M_NOWAIT, MT_DATA);
2435ce12afaaSMark Johnston if (__predict_false(m == NULL))
2436ce12afaaSMark Johnston return (NULL);
2437ce12afaaSMark Johnston buf = uma_zalloc(zone_clust, M_NOWAIT);
2438ce12afaaSMark Johnston if (__predict_false(buf == NULL)) {
2439ce12afaaSMark Johnston m_free(m);
2440ce12afaaSMark Johnston return (NULL);
2441ce12afaaSMark Johnston }
2442ce12afaaSMark Johnston m_extadd(m, buf, MCLBYTES, nm_generic_mbuf_dtor, NULL, NULL, 0,
2443ce12afaaSMark Johnston EXT_NET_DRV);
2444ce12afaaSMark Johnston return (m);
24452a7db7a6SVincenzo Maffione }
24462a7db7a6SVincenzo Maffione
2447ce12afaaSMark Johnston static inline void
nm_os_mbuf_reinit(struct mbuf * m)2448ce12afaaSMark Johnston nm_os_mbuf_reinit(struct mbuf *m)
2449ce12afaaSMark Johnston {
2450ce12afaaSMark Johnston void *buf;
24512a7db7a6SVincenzo Maffione
2452ce12afaaSMark Johnston KASSERT((m->m_flags & M_EXT) != 0,
2453ce12afaaSMark Johnston ("%s: mbuf %p has no external storage", __func__, m));
2454ce12afaaSMark Johnston KASSERT(m->m_ext.ext_size == MCLBYTES,
2455ce12afaaSMark Johnston ("%s: mbuf %p has wrong external storage size %u", __func__, m,
2456ce12afaaSMark Johnston m->m_ext.ext_size));
2457ce12afaaSMark Johnston
2458ce12afaaSMark Johnston buf = m->m_ext.ext_buf;
2459ce12afaaSMark Johnston m_init(m, M_NOWAIT, MT_DATA, M_PKTHDR);
2460ce12afaaSMark Johnston m_extadd(m, buf, MCLBYTES, nm_generic_mbuf_dtor, NULL, NULL, 0,
2461ce12afaaSMark Johnston EXT_NET_DRV);
24622a7db7a6SVincenzo Maffione }
24632a7db7a6SVincenzo Maffione
24642a7db7a6SVincenzo Maffione #endif /* __FreeBSD__ */
24652a7db7a6SVincenzo Maffione
/* Look up an option in a request header; the uint16_t selects the option. */
struct nmreq_option	*nmreq_getoption(struct nmreq_header *, uint16_t);

/* Setup and teardown of the bridges subsystem. */
int	netmap_init_bridges(void);
void	netmap_uninit_bridges(void);
2470b6e66be2SVincenzo Maffione
/*
 * Functions to read and write CSB fields from the kernel.
 *
 *   CSB_READ(csb, field, r)   load csb->field into the lvalue 'r'
 *   CSB_WRITE(csb, field, v)  store the value 'v' into csb->field
 *
 * 'csb' may be any pointer expression: it is parenthesized before the
 * member access. On non-linux builds the temporaries use names unlikely
 * to clash with the caller's variables, so passing a variable called
 * 'v' or 'error' as an argument works as expected.
 *
 * NOTE(review): on non-linux builds a failure is only caught by KASSERT,
 * and fuword32() reports failure as -1, which cannot be told apart from
 * a stored 0xffffffff -- confirm no CSB field can legitimately hold it.
 */
#if defined (linux)
#define CSB_READ(csb, field, r) (get_user(r, &(csb)->field))
#define CSB_WRITE(csb, field, v) (put_user(v, &(csb)->field))
#else  /* ! linux */
#define CSB_READ(csb, field, r) do {					\
	int32_t csb_rd_val_ __diagused;					\
									\
	csb_rd_val_ = fuword32(&(csb)->field);				\
	KASSERT(csb_rd_val_ != -1, ("%s: fuword32 failed", __func__));	\
	(r) = csb_rd_val_;						\
} while (0)
#define CSB_WRITE(csb, field, v) do {					\
	int csb_wr_err_ __diagused;					\
									\
	csb_wr_err_ = suword32(&(csb)->field, (v));			\
	KASSERT(csb_wr_err_ == 0, ("%s: suword32 failed", __func__));	\
} while (0)
#endif /* ! linux */
2490b6e66be2SVincenzo Maffione
/*
 * Fallback values for some macros that may not be defined by the
 * platform headers.
 */
#ifndef ETH_HLEN
/*
 * Ethernet header length: two 6-byte MAC addresses plus the 2-byte
 * EtherType. (6 is the length of a single MAC address, i.e. ETH_ALEN.)
 */
#define ETH_HLEN	14
#endif
#ifndef ETH_FCS_LEN
#define ETH_FCS_LEN	4	/* frame check sequence (CRC) */
#endif
#ifndef VLAN_HLEN
#define VLAN_HLEN	4	/* 802.1Q tag */
#endif
2501a6d768d8SVincenzo Maffione
250268b8534bSLuigi Rizzo #endif /* _NET_NETMAP_KERN_H_ */
2503