/*
 * Copyright (C) 2011-2012 Matteo Landi, Luigi Rizzo. All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 *   1. Redistributions of source code must retain the above copyright
 *      notice, this list of conditions and the following disclaimer.
 *   2. Redistributions in binary form must reproduce the above copyright
 *      notice, this list of conditions and the following disclaimer in the
 *      documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
2468b8534bSLuigi Rizzo */ 2568b8534bSLuigi Rizzo 2668b8534bSLuigi Rizzo /* 2768b8534bSLuigi Rizzo * $FreeBSD$ 28506cc70cSLuigi Rizzo * $Id: netmap_kern.h 9795 2011-12-02 11:39:08Z luigi $ 2968b8534bSLuigi Rizzo * 3068b8534bSLuigi Rizzo * The header contains the definitions of constants and function 3168b8534bSLuigi Rizzo * prototypes used only in kernelspace. 3268b8534bSLuigi Rizzo */ 3368b8534bSLuigi Rizzo 3468b8534bSLuigi Rizzo #ifndef _NET_NETMAP_KERN_H_ 3568b8534bSLuigi Rizzo #define _NET_NETMAP_KERN_H_ 3668b8534bSLuigi Rizzo 37*1a26580eSLuigi Rizzo #if defined(__FreeBSD__) 38*1a26580eSLuigi Rizzo #define NM_LOCK_T struct mtx 39*1a26580eSLuigi Rizzo #define NM_SELINFO_T struct selinfo 40*1a26580eSLuigi Rizzo #define MBUF_LEN(m) ((m)->m_pkthdr.len) 41*1a26580eSLuigi Rizzo #define NM_SEND_UP(ifp, m) ((ifp)->if_input)(ifp, m) 42*1a26580eSLuigi Rizzo #elif defined (__linux__) 43*1a26580eSLuigi Rizzo #define NM_LOCK_T spinlock_t 44*1a26580eSLuigi Rizzo #define NM_SELINFO_T wait_queue_head_t 45*1a26580eSLuigi Rizzo #define MBUF_LEN(m) ((m)->len) 46*1a26580eSLuigi Rizzo #define NM_SEND_UP(ifp, m) netif_rx(m) 47*1a26580eSLuigi Rizzo #else 48*1a26580eSLuigi Rizzo #error unsupported platform 49*1a26580eSLuigi Rizzo #endif 50*1a26580eSLuigi Rizzo 5168b8534bSLuigi Rizzo #ifdef MALLOC_DECLARE 5268b8534bSLuigi Rizzo MALLOC_DECLARE(M_NETMAP); 5368b8534bSLuigi Rizzo #endif 5468b8534bSLuigi Rizzo 5568b8534bSLuigi Rizzo #define ND(format, ...) 5668b8534bSLuigi Rizzo #define D(format, ...) 
\ 5768b8534bSLuigi Rizzo do { \ 5868b8534bSLuigi Rizzo struct timeval __xxts; \ 5968b8534bSLuigi Rizzo microtime(&__xxts); \ 6068b8534bSLuigi Rizzo printf("%03d.%06d %s [%d] " format "\n", \ 6168b8534bSLuigi Rizzo (int)__xxts.tv_sec % 1000, (int)__xxts.tv_usec, \ 6268b8534bSLuigi Rizzo __FUNCTION__, __LINE__, ##__VA_ARGS__); \ 6368b8534bSLuigi Rizzo } while (0) 6468b8534bSLuigi Rizzo 6568b8534bSLuigi Rizzo struct netmap_adapter; 6668b8534bSLuigi Rizzo 6768b8534bSLuigi Rizzo /* 6868b8534bSLuigi Rizzo * private, kernel view of a ring. 6968b8534bSLuigi Rizzo * 70*1a26580eSLuigi Rizzo * The indexes in the NIC and netmap rings are offset by nkr_hwofs slots. 7168b8534bSLuigi Rizzo * This is so that, on a reset, buffers owned by userspace are not 7268b8534bSLuigi Rizzo * modified by the kernel. In particular: 73*1a26580eSLuigi Rizzo * RX rings: the next empty buffer (hwcur + hwavail + hwofs) coincides with 7468b8534bSLuigi Rizzo * the next empty buffer as known by the hardware (next_to_check or so). 7568b8534bSLuigi Rizzo * TX rings: hwcur + hwofs coincides with next_to_send 7668b8534bSLuigi Rizzo */ 7768b8534bSLuigi Rizzo struct netmap_kring { 7868b8534bSLuigi Rizzo struct netmap_ring *ring; 7968b8534bSLuigi Rizzo u_int nr_hwcur; 8068b8534bSLuigi Rizzo int nr_hwavail; 812157a17cSLuigi Rizzo u_int nr_kflags; /* private driver flags */ 822157a17cSLuigi Rizzo #define NKR_PENDINTR 0x1 // Pending interrupt. 
8368b8534bSLuigi Rizzo u_int nkr_num_slots; 8468b8534bSLuigi Rizzo 85506cc70cSLuigi Rizzo int nkr_hwofs; /* offset between NIC and netmap ring */ 86*1a26580eSLuigi Rizzo struct netmap_adapter *na; 87*1a26580eSLuigi Rizzo NM_SELINFO_T si; /* poll/select wait queue */ 88*1a26580eSLuigi Rizzo NM_LOCK_T q_lock; /* used if no device lock available */ 892157a17cSLuigi Rizzo } __attribute__((__aligned__(64))); 9068b8534bSLuigi Rizzo 9168b8534bSLuigi Rizzo /* 92*1a26580eSLuigi Rizzo * This struct extends the 'struct adapter' (or 9368b8534bSLuigi Rizzo * equivalent) device descriptor. It contains all fields needed to 9468b8534bSLuigi Rizzo * support netmap operation. 9568b8534bSLuigi Rizzo */ 9668b8534bSLuigi Rizzo struct netmap_adapter { 9768b8534bSLuigi Rizzo int refcount; /* number of user-space descriptors using this 9868b8534bSLuigi Rizzo interface, which is equal to the number of 9968b8534bSLuigi Rizzo struct netmap_if objs in the mapped region. */ 10068b8534bSLuigi Rizzo 10168b8534bSLuigi Rizzo int separate_locks; /* set if the interface suports different 10268b8534bSLuigi Rizzo locks for rx, tx and core. */ 10368b8534bSLuigi Rizzo 10468b8534bSLuigi Rizzo u_int num_queues; /* number of tx/rx queue pairs: this is 10568b8534bSLuigi Rizzo a duplicate field needed to simplify the 10668b8534bSLuigi Rizzo signature of ``netmap_detach``. */ 10768b8534bSLuigi Rizzo 10868b8534bSLuigi Rizzo u_int num_tx_desc; /* number of descriptor in each queue */ 10968b8534bSLuigi Rizzo u_int num_rx_desc; 11068b8534bSLuigi Rizzo u_int buff_size; 11168b8534bSLuigi Rizzo 112*1a26580eSLuigi Rizzo //u_int flags; // XXX unused 11368b8534bSLuigi Rizzo /* tx_rings and rx_rings are private but allocated 11468b8534bSLuigi Rizzo * as a contiguous chunk of memory. Each array has 11568b8534bSLuigi Rizzo * N+1 entries, for the adapter queues and for the host queue. 11668b8534bSLuigi Rizzo */ 11768b8534bSLuigi Rizzo struct netmap_kring *tx_rings; /* array of TX rings. 
*/ 11868b8534bSLuigi Rizzo struct netmap_kring *rx_rings; /* array of RX rings. */ 11968b8534bSLuigi Rizzo 12068b8534bSLuigi Rizzo /* copy of if_qflush and if_transmit pointers, to intercept 12168b8534bSLuigi Rizzo * packets from the network stack when netmap is active. 12268b8534bSLuigi Rizzo * XXX probably if_qflush is not necessary. 12368b8534bSLuigi Rizzo */ 124*1a26580eSLuigi Rizzo //void (*if_qflush)(struct ifnet *); // XXX unused 12568b8534bSLuigi Rizzo int (*if_transmit)(struct ifnet *, struct mbuf *); 12668b8534bSLuigi Rizzo 12768b8534bSLuigi Rizzo /* references to the ifnet and device routines, used by 12868b8534bSLuigi Rizzo * the generic netmap functions. 12968b8534bSLuigi Rizzo */ 13068b8534bSLuigi Rizzo struct ifnet *ifp; /* adapter is ifp->if_softc */ 13168b8534bSLuigi Rizzo 132*1a26580eSLuigi Rizzo NM_LOCK_T core_lock; /* used if no device lock available */ 133*1a26580eSLuigi Rizzo 13468b8534bSLuigi Rizzo int (*nm_register)(struct ifnet *, int onoff); 135*1a26580eSLuigi Rizzo void (*nm_lock)(struct ifnet *, int what, u_int ringid); 136*1a26580eSLuigi Rizzo int (*nm_txsync)(struct ifnet *, u_int ring, int lock); 137*1a26580eSLuigi Rizzo int (*nm_rxsync)(struct ifnet *, u_int ring, int lock); 13868b8534bSLuigi Rizzo }; 13968b8534bSLuigi Rizzo 14068b8534bSLuigi Rizzo /* 14168b8534bSLuigi Rizzo * The combination of "enable" (ifp->if_capabilities &IFCAP_NETMAP) 14268b8534bSLuigi Rizzo * and refcount gives the status of the interface, namely: 14368b8534bSLuigi Rizzo * 14468b8534bSLuigi Rizzo * enable refcount Status 14568b8534bSLuigi Rizzo * 14668b8534bSLuigi Rizzo * FALSE 0 normal operation 14768b8534bSLuigi Rizzo * FALSE != 0 -- (impossible) 14868b8534bSLuigi Rizzo * TRUE 1 netmap mode 14968b8534bSLuigi Rizzo * TRUE 0 being deleted. 
15068b8534bSLuigi Rizzo */ 15168b8534bSLuigi Rizzo 15268b8534bSLuigi Rizzo #define NETMAP_DELETING(_na) ( ((_na)->refcount == 0) && \ 15368b8534bSLuigi Rizzo ( (_na)->ifp->if_capenable & IFCAP_NETMAP) ) 15468b8534bSLuigi Rizzo 15568b8534bSLuigi Rizzo /* 15668b8534bSLuigi Rizzo * parameters for (*nm_lock)(adapter, what, index) 15768b8534bSLuigi Rizzo */ 15868b8534bSLuigi Rizzo enum { 15968b8534bSLuigi Rizzo NETMAP_NO_LOCK = 0, 16068b8534bSLuigi Rizzo NETMAP_CORE_LOCK, NETMAP_CORE_UNLOCK, 16168b8534bSLuigi Rizzo NETMAP_TX_LOCK, NETMAP_TX_UNLOCK, 16268b8534bSLuigi Rizzo NETMAP_RX_LOCK, NETMAP_RX_UNLOCK, 163*1a26580eSLuigi Rizzo #ifdef __FreeBSD__ 164*1a26580eSLuigi Rizzo #define NETMAP_REG_LOCK NETMAP_CORE_LOCK 165*1a26580eSLuigi Rizzo #define NETMAP_REG_UNLOCK NETMAP_CORE_UNLOCK 166*1a26580eSLuigi Rizzo #else 167*1a26580eSLuigi Rizzo NETMAP_REG_LOCK, NETMAP_REG_UNLOCK 168*1a26580eSLuigi Rizzo #endif 16968b8534bSLuigi Rizzo }; 17068b8534bSLuigi Rizzo 17168b8534bSLuigi Rizzo /* 17268b8534bSLuigi Rizzo * The following are support routines used by individual drivers to 17368b8534bSLuigi Rizzo * support netmap operation. 17468b8534bSLuigi Rizzo * 17568b8534bSLuigi Rizzo * netmap_attach() initializes a struct netmap_adapter, allocating the 17668b8534bSLuigi Rizzo * struct netmap_ring's and the struct selinfo. 17768b8534bSLuigi Rizzo * 17868b8534bSLuigi Rizzo * netmap_detach() frees the memory allocated by netmap_attach(). 17968b8534bSLuigi Rizzo * 18068b8534bSLuigi Rizzo * netmap_start() replaces the if_transmit routine of the interface, 18168b8534bSLuigi Rizzo * and is used to intercept packets coming from the stack. 18268b8534bSLuigi Rizzo * 18368b8534bSLuigi Rizzo * netmap_load_map/netmap_reload_map are helper routines to set/reset 18468b8534bSLuigi Rizzo * the dmamap for a packet buffer 18568b8534bSLuigi Rizzo * 18668b8534bSLuigi Rizzo * netmap_reset() is a helper routine to be called in the driver 18768b8534bSLuigi Rizzo * when reinitializing a ring. 
18868b8534bSLuigi Rizzo */ 18968b8534bSLuigi Rizzo int netmap_attach(struct netmap_adapter *, int); 19068b8534bSLuigi Rizzo void netmap_detach(struct ifnet *); 19168b8534bSLuigi Rizzo int netmap_start(struct ifnet *, struct mbuf *); 19268b8534bSLuigi Rizzo enum txrx { NR_RX = 0, NR_TX = 1 }; 19368b8534bSLuigi Rizzo struct netmap_slot *netmap_reset(struct netmap_adapter *na, 19468b8534bSLuigi Rizzo enum txrx tx, int n, u_int new_cur); 19568b8534bSLuigi Rizzo int netmap_ring_reinit(struct netmap_kring *); 19668b8534bSLuigi Rizzo 1975819da83SLuigi Rizzo extern int netmap_buf_size; 1985819da83SLuigi Rizzo #define NETMAP_BUF_SIZE netmap_buf_size 1992157a17cSLuigi Rizzo extern int netmap_mitigate; 2005819da83SLuigi Rizzo extern int netmap_no_pendintr; 20168b8534bSLuigi Rizzo extern u_int netmap_total_buffers; 20268b8534bSLuigi Rizzo extern char *netmap_buffer_base; 20368b8534bSLuigi Rizzo extern int netmap_verbose; // XXX debugging 20468b8534bSLuigi Rizzo enum { /* verbose flags */ 20568b8534bSLuigi Rizzo NM_VERB_ON = 1, /* generic verbose */ 20668b8534bSLuigi Rizzo NM_VERB_HOST = 0x2, /* verbose host stack */ 20768b8534bSLuigi Rizzo NM_VERB_RXSYNC = 0x10, /* verbose on rxsync/txsync */ 20868b8534bSLuigi Rizzo NM_VERB_TXSYNC = 0x20, 20968b8534bSLuigi Rizzo NM_VERB_RXINTR = 0x100, /* verbose on rx/tx intr (driver) */ 21068b8534bSLuigi Rizzo NM_VERB_TXINTR = 0x200, 21168b8534bSLuigi Rizzo NM_VERB_NIC_RXSYNC = 0x1000, /* verbose on rx/tx intr (driver) */ 21268b8534bSLuigi Rizzo NM_VERB_NIC_TXSYNC = 0x2000, 21368b8534bSLuigi Rizzo }; 21468b8534bSLuigi Rizzo 21568b8534bSLuigi Rizzo /* 216d0c7b075SLuigi Rizzo * NA returns a pointer to the struct netmap adapter from the ifp, 217d0c7b075SLuigi Rizzo * WNA is used to write it. 
21868b8534bSLuigi Rizzo */ 219d0c7b075SLuigi Rizzo #ifndef WNA 220d0c7b075SLuigi Rizzo #define WNA(_ifp) (_ifp)->if_pspare[0] 221d0c7b075SLuigi Rizzo #endif 222d0c7b075SLuigi Rizzo #define NA(_ifp) ((struct netmap_adapter *)WNA(_ifp)) 22368b8534bSLuigi Rizzo 22468b8534bSLuigi Rizzo 2256dba29a2SLuigi Rizzo /* Callback invoked by the dma machinery after a successfull dmamap_load */ 2266dba29a2SLuigi Rizzo static void netmap_dmamap_cb(__unused void *arg, 2276dba29a2SLuigi Rizzo __unused bus_dma_segment_t * segs, __unused int nseg, __unused int error) 2286dba29a2SLuigi Rizzo { 2296dba29a2SLuigi Rizzo } 2306dba29a2SLuigi Rizzo 2316dba29a2SLuigi Rizzo /* bus_dmamap_load wrapper: call aforementioned function if map != NULL. 2326dba29a2SLuigi Rizzo * XXX can we do it without a callback ? 2336dba29a2SLuigi Rizzo */ 2346dba29a2SLuigi Rizzo static inline void 2356dba29a2SLuigi Rizzo netmap_load_map(bus_dma_tag_t tag, bus_dmamap_t map, void *buf) 2366dba29a2SLuigi Rizzo { 2376dba29a2SLuigi Rizzo if (map) 2386dba29a2SLuigi Rizzo bus_dmamap_load(tag, map, buf, NETMAP_BUF_SIZE, 2396dba29a2SLuigi Rizzo netmap_dmamap_cb, NULL, BUS_DMA_NOWAIT); 2406dba29a2SLuigi Rizzo } 2416dba29a2SLuigi Rizzo 2426dba29a2SLuigi Rizzo /* update the map when a buffer changes. 
*/ 2436dba29a2SLuigi Rizzo static inline void 2446dba29a2SLuigi Rizzo netmap_reload_map(bus_dma_tag_t tag, bus_dmamap_t map, void *buf) 2456dba29a2SLuigi Rizzo { 2466dba29a2SLuigi Rizzo if (map) { 2476dba29a2SLuigi Rizzo bus_dmamap_unload(tag, map); 2486dba29a2SLuigi Rizzo bus_dmamap_load(tag, map, buf, NETMAP_BUF_SIZE, 2496dba29a2SLuigi Rizzo netmap_dmamap_cb, NULL, BUS_DMA_NOWAIT); 2506dba29a2SLuigi Rizzo } 2516dba29a2SLuigi Rizzo } 2526dba29a2SLuigi Rizzo 2536dba29a2SLuigi Rizzo 25468b8534bSLuigi Rizzo /* 2556e10c8b8SLuigi Rizzo * NMB return the virtual address of a buffer (buffer 0 on bad index) 2566e10c8b8SLuigi Rizzo * PNMB also fills the physical address 25768b8534bSLuigi Rizzo */ 2586e10c8b8SLuigi Rizzo static inline void * 25968b8534bSLuigi Rizzo NMB(struct netmap_slot *slot) 26068b8534bSLuigi Rizzo { 26168b8534bSLuigi Rizzo uint32_t i = slot->buf_idx; 26268b8534bSLuigi Rizzo return (i >= netmap_total_buffers) ? netmap_buffer_base : 26368b8534bSLuigi Rizzo netmap_buffer_base + (i *NETMAP_BUF_SIZE); 26468b8534bSLuigi Rizzo } 26568b8534bSLuigi Rizzo 2666e10c8b8SLuigi Rizzo static inline void * 2676e10c8b8SLuigi Rizzo PNMB(struct netmap_slot *slot, uint64_t *pp) 2686e10c8b8SLuigi Rizzo { 2696e10c8b8SLuigi Rizzo uint32_t i = slot->buf_idx; 2706e10c8b8SLuigi Rizzo void *ret = (i >= netmap_total_buffers) ? netmap_buffer_base : 2716e10c8b8SLuigi Rizzo netmap_buffer_base + (i *NETMAP_BUF_SIZE); 2726e10c8b8SLuigi Rizzo *pp = vtophys(ret); 2736e10c8b8SLuigi Rizzo return ret; 2746e10c8b8SLuigi Rizzo } 2756e10c8b8SLuigi Rizzo 276*1a26580eSLuigi Rizzo /* default functions to handle rx/tx interrupts */ 277*1a26580eSLuigi Rizzo int netmap_rx_irq(struct ifnet *, int, int *); 278*1a26580eSLuigi Rizzo #define netmap_tx_irq(_n, _q) netmap_rx_irq(_n, _q, NULL) 279*1a26580eSLuigi Rizzo #ifdef __linux__ 280*1a26580eSLuigi Rizzo #define bus_dmamap_sync(_a, _b, _c) // wmb() or rmb() ? 
281*1a26580eSLuigi Rizzo netdev_tx_t netmap_start_linux(struct sk_buff *skb, struct net_device *dev); 282*1a26580eSLuigi Rizzo #endif 28368b8534bSLuigi Rizzo #endif /* _NET_NETMAP_KERN_H_ */ 284