1718cf2ccSPedro F. Giffuni /*- 24d846d26SWarner Losh * SPDX-License-Identifier: BSD-2-Clause 3718cf2ccSPedro F. Giffuni * 437e3a6d3SLuigi Rizzo * Copyright (C) 2012-2014 Matteo Landi 537e3a6d3SLuigi Rizzo * Copyright (C) 2012-2016 Luigi Rizzo 637e3a6d3SLuigi Rizzo * Copyright (C) 2012-2016 Giuseppe Lettieri 737e3a6d3SLuigi Rizzo * All rights reserved. 8ab1e2860SLuigi Rizzo * 9ab1e2860SLuigi Rizzo * Redistribution and use in source and binary forms, with or without 10ab1e2860SLuigi Rizzo * modification, are permitted provided that the following conditions 11ab1e2860SLuigi Rizzo * are met: 12ab1e2860SLuigi Rizzo * 1. Redistributions of source code must retain the above copyright 13ab1e2860SLuigi Rizzo * notice, this list of conditions and the following disclaimer. 14ab1e2860SLuigi Rizzo * 2. Redistributions in binary form must reproduce the above copyright 15ab1e2860SLuigi Rizzo * notice, this list of conditions and the following disclaimer in the 16ab1e2860SLuigi Rizzo * documentation and/or other materials provided with the distribution. 17ab1e2860SLuigi Rizzo * 18ab1e2860SLuigi Rizzo * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 19ab1e2860SLuigi Rizzo * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 20ab1e2860SLuigi Rizzo * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 21ab1e2860SLuigi Rizzo * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 22ab1e2860SLuigi Rizzo * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 23ab1e2860SLuigi Rizzo * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 24ab1e2860SLuigi Rizzo * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 25ab1e2860SLuigi Rizzo * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 26ab1e2860SLuigi Rizzo * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 27ab1e2860SLuigi Rizzo * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 28ab1e2860SLuigi Rizzo * SUCH DAMAGE. 29ab1e2860SLuigi Rizzo */ 30ab1e2860SLuigi Rizzo 31ab1e2860SLuigi Rizzo /* 32ab1e2860SLuigi Rizzo * 33ab1e2860SLuigi Rizzo * (New) memory allocator for netmap 34ab1e2860SLuigi Rizzo */ 35ab1e2860SLuigi Rizzo 36ab1e2860SLuigi Rizzo /* 37ab1e2860SLuigi Rizzo * This allocator creates three memory pools: 38ab1e2860SLuigi Rizzo * nm_if_pool for the struct netmap_if 39ab1e2860SLuigi Rizzo * nm_ring_pool for the struct netmap_ring 40ab1e2860SLuigi Rizzo * nm_buf_pool for the packet buffers. 41ab1e2860SLuigi Rizzo * 42ab1e2860SLuigi Rizzo * that contain netmap objects. Each pool is made of a number of clusters, 43ab1e2860SLuigi Rizzo * multiple of a page size, each containing an integer number of objects. 44ab1e2860SLuigi Rizzo * The clusters are contiguous in user space but not in the kernel. 45ab1e2860SLuigi Rizzo * Only nm_buf_pool needs to be dma-able, 46ab1e2860SLuigi Rizzo * but for convenience use the same type of allocator for all. 47ab1e2860SLuigi Rizzo * 48ab1e2860SLuigi Rizzo * Once mapped, the three pools are exported to userspace 49ab1e2860SLuigi Rizzo * as a contiguous block, starting from nm_if_pool. Each 50ab1e2860SLuigi Rizzo * cluster (and pool) is an integral number of pages. 51ab1e2860SLuigi Rizzo * [ . . . ][ . . . . . .][ . . . . . . . . . .] 52ab1e2860SLuigi Rizzo * nm_if nm_ring nm_buf 53ab1e2860SLuigi Rizzo * 54ab1e2860SLuigi Rizzo * The userspace areas contain offsets of the objects in userspace. 55ab1e2860SLuigi Rizzo * When (at init time) we write these offsets, we find out the index 56ab1e2860SLuigi Rizzo * of the object, and from there locate the offset from the beginning 57ab1e2860SLuigi Rizzo * of the region. 58ab1e2860SLuigi Rizzo * 5945c67e8fSVincenzo Maffione * The individual allocators manage a pool of memory for objects of 60ab1e2860SLuigi Rizzo * the same size. 61ab1e2860SLuigi Rizzo * The pool is split into smaller clusters, whose size is a 62ab1e2860SLuigi Rizzo * multiple of the page size. The cluster size is chosen 63ab1e2860SLuigi Rizzo * to minimize the waste for a given max cluster size 64ab1e2860SLuigi Rizzo * (we do it by brute force, as we have relatively few objects 65ab1e2860SLuigi Rizzo * per cluster). 66ab1e2860SLuigi Rizzo * 67ab1e2860SLuigi Rizzo * Objects are aligned to the cache line (64 bytes) rounding up object 68ab1e2860SLuigi Rizzo * sizes when needed. A bitmap contains the state of each object. 69ab1e2860SLuigi Rizzo * Allocation scans the bitmap; this is done only on attach, so we are not 70ab1e2860SLuigi Rizzo * too worried about performance 71ab1e2860SLuigi Rizzo * 7245c67e8fSVincenzo Maffione * For each allocator we can define (through sysctl) the size and 73ab1e2860SLuigi Rizzo * number of each object. Memory is allocated at the first use of a 74ab1e2860SLuigi Rizzo * netmap file descriptor, and can be freed when all such descriptors 75ab1e2860SLuigi Rizzo * have been released (including unmapping the memory). 76ab1e2860SLuigi Rizzo * If memory is scarce, the system tries to get as much as possible 77ab1e2860SLuigi Rizzo * and the sysctl values reflect the actual allocation. 78ab1e2860SLuigi Rizzo * Together with desired values, the sysctl export also absolute 79ab1e2860SLuigi Rizzo * min and maximum values that cannot be overridden. 80ab1e2860SLuigi Rizzo * 81ab1e2860SLuigi Rizzo * struct netmap_if: 82ab1e2860SLuigi Rizzo * variable size, max 16 bytes per ring pair plus some fixed amount. 83ab1e2860SLuigi Rizzo * 1024 bytes should be large enough in practice. 84ab1e2860SLuigi Rizzo * 85ab1e2860SLuigi Rizzo * In the worst case we have one netmap_if per ring in the system. 86ab1e2860SLuigi Rizzo * 87ab1e2860SLuigi Rizzo * struct netmap_ring 88ab1e2860SLuigi Rizzo * variable size, 8 byte per slot plus some fixed amount. 89ab1e2860SLuigi Rizzo * Rings can be large (e.g. 4k slots, or >32Kbytes). 90ab1e2860SLuigi Rizzo * We default to 36 KB (9 pages), and a few hundred rings. 91ab1e2860SLuigi Rizzo * 92ab1e2860SLuigi Rizzo * struct netmap_buffer 93ab1e2860SLuigi Rizzo * The more the better, both because fast interfaces tend to have 94ab1e2860SLuigi Rizzo * many slots, and because we may want to use buffers to store 95ab1e2860SLuigi Rizzo * packets in userspace avoiding copies. 96ab1e2860SLuigi Rizzo * Must contain a full frame (eg 1518, or more for vlans, jumbo 97ab1e2860SLuigi Rizzo * frames etc.) plus be nicely aligned, plus some NICs restrict 98ab1e2860SLuigi Rizzo * the size to multiple of 1K or so. Default to 2K 99ab1e2860SLuigi Rizzo */ 100ab1e2860SLuigi Rizzo #ifndef _NET_NETMAP_MEM2_H_ 101ab1e2860SLuigi Rizzo #define _NET_NETMAP_MEM2_H_ 102ab1e2860SLuigi Rizzo 103ab1e2860SLuigi Rizzo 104ab1e2860SLuigi Rizzo 105ab1e2860SLuigi Rizzo /* We implement two kinds of netmap_mem_d structures: 106ab1e2860SLuigi Rizzo * 107ab1e2860SLuigi Rizzo * - global: used by hardware NICS; 108ab1e2860SLuigi Rizzo * 109ab1e2860SLuigi Rizzo * - private: used by VALE ports. 110ab1e2860SLuigi Rizzo * 111ab1e2860SLuigi Rizzo * In both cases, the netmap_mem_d structure has the same lifetime as the 112ab1e2860SLuigi Rizzo * netmap_adapter of the corresponding NIC or port. It is the responsibility of 113ab1e2860SLuigi Rizzo * the client code to delete the private allocator when the associated 114ab1e2860SLuigi Rizzo * netmap_adapter is freed (this is implemented by the NAF_MEM_OWNER flag in 115ab1e2860SLuigi Rizzo * netmap.c). The 'refcount' field counts the number of active users of the 116ab1e2860SLuigi Rizzo * structure. The global allocator uses this information to prevent/allow 117ab1e2860SLuigi Rizzo * reconfiguration. The private allocators release all their memory when there 118ab1e2860SLuigi Rizzo * are no active users. By 'active user' we mean an existing netmap_priv 119ab1e2860SLuigi Rizzo * structure holding a reference to the allocator. 120ab1e2860SLuigi Rizzo */ 121ab1e2860SLuigi Rizzo 122ab1e2860SLuigi Rizzo extern struct netmap_mem_d nm_mem; 123c3e9b4dbSLuiz Otavio O Souza typedef uint16_t nm_memid_t; 124ab1e2860SLuigi Rizzo 12537e3a6d3SLuigi Rizzo int netmap_mem_get_lut(struct netmap_mem_d *, struct netmap_lut *); 126c3e9b4dbSLuiz Otavio O Souza nm_memid_t netmap_mem_get_id(struct netmap_mem_d *); 127ab1e2860SLuigi Rizzo vm_paddr_t netmap_mem_ofstophys(struct netmap_mem_d *, vm_ooffset_t); 12837e3a6d3SLuigi Rizzo #ifdef _WIN32 12937e3a6d3SLuigi Rizzo PMDL win32_build_user_vm_map(struct netmap_mem_d* nmd); 13037e3a6d3SLuigi Rizzo #endif 1314bf50f18SLuigi Rizzo int netmap_mem_finalize(struct netmap_mem_d *, struct netmap_adapter *); 132ab1e2860SLuigi Rizzo int netmap_mem_init(void); 133ab1e2860SLuigi Rizzo void netmap_mem_fini(void); 134c3e9b4dbSLuiz Otavio O Souza struct netmap_if * netmap_mem_if_new(struct netmap_adapter *, struct netmap_priv_d *); 135f9790aebSLuigi Rizzo void netmap_mem_if_delete(struct netmap_adapter *, struct netmap_if *); 136f9790aebSLuigi Rizzo int netmap_mem_rings_create(struct netmap_adapter *); 137f9790aebSLuigi Rizzo void netmap_mem_rings_delete(struct netmap_adapter *); 1384f80b14cSVincenzo Maffione int netmap_mem_deref(struct netmap_mem_d *, struct netmap_adapter *); 13937e3a6d3SLuigi Rizzo int netmap_mem2_get_pool_info(struct netmap_mem_d *, u_int, u_int *, u_int *); 1402ff91c17SVincenzo Maffione int netmap_mem_get_info(struct netmap_mem_d *, uint64_t *size, 1412ff91c17SVincenzo Maffione u_int *memflags, nm_memid_t *id); 142f9790aebSLuigi Rizzo ssize_t netmap_mem_if_offset(struct netmap_mem_d *, const void *vaddr); 143c3e9b4dbSLuiz Otavio O Souza struct netmap_mem_d* netmap_mem_private_new( u_int txr, u_int txd, u_int rxr, u_int rxd, 144c3e9b4dbSLuiz Otavio O Souza u_int extra_bufs, u_int npipes, int* error); 145847bf383SLuigi Rizzo 146c3e9b4dbSLuiz Otavio O Souza #define netmap_mem_get(d) __netmap_mem_get(d, __FUNCTION__, __LINE__) 147c3e9b4dbSLuiz Otavio O Souza #define netmap_mem_put(d) __netmap_mem_put(d, __FUNCTION__, __LINE__) 148c3e9b4dbSLuiz Otavio O Souza struct netmap_mem_d* __netmap_mem_get(struct netmap_mem_d *, const char *, int); 149*1bae9dc5SMark Johnston struct netmap_mem_d* netmap_mem_get_allocator(struct netmap_adapter *); 150847bf383SLuigi Rizzo void __netmap_mem_put(struct netmap_mem_d *, const char *, int); 151c3e9b4dbSLuiz Otavio O Souza struct netmap_mem_d* netmap_mem_find(nm_memid_t); 1524f80b14cSVincenzo Maffione unsigned netmap_mem_bufsize(struct netmap_mem_d *nmd); 1534f80b14cSVincenzo Maffione 1544f80b14cSVincenzo Maffione #ifdef WITH_EXTMEM 1552ff91c17SVincenzo Maffione struct netmap_mem_d* netmap_mem_ext_create(uint64_t, struct nmreq_pools_info *, int *); 1564f80b14cSVincenzo Maffione #else /* !WITH_EXTMEM */ 1574f80b14cSVincenzo Maffione #define netmap_mem_ext_create(nmr, _perr) \ 1584f80b14cSVincenzo Maffione ({ int *perr = _perr; if (perr) *(perr) = EOPNOTSUPP; NULL; }) 1594f80b14cSVincenzo Maffione #endif /* WITH_EXTMEM */ 160ab1e2860SLuigi Rizzo 161b6e66be2SVincenzo Maffione #ifdef WITH_PTNETMAP 162e330262fSJustin Hibbits struct netmap_mem_d* netmap_mem_pt_guest_new(if_t, 16337e3a6d3SLuigi Rizzo unsigned int nifp_offset, 164844a6f0cSLuigi Rizzo unsigned int memid); 16537e3a6d3SLuigi Rizzo struct ptnetmap_memdev; 16637e3a6d3SLuigi Rizzo struct netmap_mem_d* netmap_mem_pt_guest_attach(struct ptnetmap_memdev *, uint16_t); 167e330262fSJustin Hibbits int netmap_mem_pt_guest_ifp_del(struct netmap_mem_d *, if_t); 168b6e66be2SVincenzo Maffione #endif /* WITH_PTNETMAP */ 16937e3a6d3SLuigi Rizzo 1702ff91c17SVincenzo Maffione int netmap_mem_pools_info_get(struct nmreq_pools_info *, 1712ff91c17SVincenzo Maffione struct netmap_mem_d *); 172844a6f0cSLuigi Rizzo 1734bf50f18SLuigi Rizzo #define NETMAP_MEM_PRIVATE 0x2 /* allocator uses private address space */ 1744bf50f18SLuigi Rizzo #define NETMAP_MEM_IO 0x4 /* the underlying memory is mmapped I/O */ 175ab1e2860SLuigi Rizzo 176f0ea3689SLuigi Rizzo uint32_t netmap_extra_alloc(struct netmap_adapter *, uint32_t *, uint32_t n); 177ab1e2860SLuigi Rizzo 1782ff91c17SVincenzo Maffione #ifdef WITH_EXTMEM 1792ff91c17SVincenzo Maffione #include <net/netmap_virt.h> 1802ff91c17SVincenzo Maffione struct nm_os_extmem; /* opaque */ 1812ff91c17SVincenzo Maffione struct nm_os_extmem *nm_os_extmem_create(unsigned long, struct nmreq_pools_info *, int *perror); 1822ff91c17SVincenzo Maffione char *nm_os_extmem_nextpage(struct nm_os_extmem *); 1832ff91c17SVincenzo Maffione int nm_os_extmem_nr_pages(struct nm_os_extmem *); 1842ff91c17SVincenzo Maffione int nm_os_extmem_isequal(struct nm_os_extmem *, struct nm_os_extmem *); 1852ff91c17SVincenzo Maffione void nm_os_extmem_delete(struct nm_os_extmem *); 1862ff91c17SVincenzo Maffione #endif /* WITH_EXTMEM */ 1872ff91c17SVincenzo Maffione 188ab1e2860SLuigi Rizzo #endif 189