1c398230bSWarner Losh /*- 2df8bae1dSRodney W. Grimes * Copyright (c) 1990, 1991, 1993 3253a3814SLawrence Stewart * The Regents of the University of California. All rights reserved. 4df8bae1dSRodney W. Grimes * 5df8bae1dSRodney W. Grimes * This code is derived from the Stanford/CMU enet packet filter, 6df8bae1dSRodney W. Grimes * (net/enet.c) distributed as part of 4.3BSD, and code contributed 7df8bae1dSRodney W. Grimes * to Berkeley by Steven McCanne and Van Jacobson both of Lawrence 8df8bae1dSRodney W. Grimes * Berkeley Laboratory. 9df8bae1dSRodney W. Grimes * 10df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 11df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 12df8bae1dSRodney W. Grimes * are met: 13df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 14df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 15df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 16df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 17df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 18df8bae1dSRodney W. Grimes * 4. Neither the name of the University nor the names of its contributors 19df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 20df8bae1dSRodney W. Grimes * without specific prior written permission. 21df8bae1dSRodney W. Grimes * 22df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 23df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 24df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 25df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 26df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 27df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 28df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 29df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 30df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 31df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 32df8bae1dSRodney W. Grimes * SUCH DAMAGE. 33df8bae1dSRodney W. Grimes * 344f252c4dSRuslan Ermilov * @(#)bpf.c 8.4 (Berkeley) 1/9/95 35df8bae1dSRodney W. Grimes */ 36df8bae1dSRodney W. Grimes 37c7866007SRobert Watson #include <sys/cdefs.h> 38c7866007SRobert Watson __FBSDID("$FreeBSD$"); 39c7866007SRobert Watson 405bb5f2c9SPeter Wemm #include "opt_bpf.h" 41fc0a61a4SKonstantin Belousov #include "opt_compat.h" 425bb5f2c9SPeter Wemm #include "opt_netgraph.h" 43df8bae1dSRodney W. Grimes 4495aab9ccSJohn-Mark Gurney #include <sys/types.h> 45df8bae1dSRodney W. Grimes #include <sys/param.h> 46e4b3229aSAlexander V. Chernikov #include <sys/lock.h> 47e4b3229aSAlexander V. Chernikov #include <sys/rwlock.h> 48df8bae1dSRodney W. Grimes #include <sys/systm.h> 49ce7609a4SBruce Evans #include <sys/conf.h> 50e76eee55SPoul-Henning Kamp #include <sys/fcntl.h> 51ebd8672cSBjoern A. Zeeb #include <sys/jail.h> 524d1d4912SBruce Evans #include <sys/malloc.h> 53df8bae1dSRodney W. Grimes #include <sys/mbuf.h> 54df8bae1dSRodney W. Grimes #include <sys/time.h> 55acd3428bSRobert Watson #include <sys/priv.h> 56df8bae1dSRodney W. Grimes #include <sys/proc.h> 570310c19fSBruce Evans #include <sys/signalvar.h> 58528f627fSBruce Evans #include <sys/filio.h> 59528f627fSBruce Evans #include <sys/sockio.h> 60528f627fSBruce Evans #include <sys/ttycom.h> 61e76eee55SPoul-Henning Kamp #include <sys/uio.h> 62df8bae1dSRodney W. Grimes 6395aab9ccSJohn-Mark Gurney #include <sys/event.h> 6495aab9ccSJohn-Mark Gurney #include <sys/file.h> 65243ac7d8SPeter Wemm #include <sys/poll.h> 6695aab9ccSJohn-Mark Gurney #include <sys/proc.h> 67df8bae1dSRodney W. Grimes 68df8bae1dSRodney W. Grimes #include <sys/socket.h> 69df8bae1dSRodney W. Grimes 70fba9235dSBruce Evans #include <net/if.h> 71e4b3229aSAlexander V. Chernikov #define BPF_INTERNAL 72df8bae1dSRodney W. Grimes #include <net/bpf.h> 734d621040SChristian S.J. Peron #include <net/bpf_buffer.h> 74ae275efcSJung-uk Kim #ifdef BPF_JITTER 75ae275efcSJung-uk Kim #include <net/bpf_jitter.h> 76ae275efcSJung-uk Kim #endif 774d621040SChristian S.J. Peron #include <net/bpf_zerocopy.h> 78df8bae1dSRodney W. Grimes #include <net/bpfdesc.h> 79530c0060SRobert Watson #include <net/vnet.h> 80df8bae1dSRodney W. Grimes 81df8bae1dSRodney W. Grimes #include <netinet/in.h> 82df8bae1dSRodney W. Grimes #include <netinet/if_ether.h> 83df8bae1dSRodney W. Grimes #include <sys/kernel.h> 84f708ef1bSPoul-Henning Kamp #include <sys/sysctl.h> 857b778b5eSEivind Eklund 86246b5467SSam Leffler #include <net80211/ieee80211_freebsd.h> 87246b5467SSam Leffler 88aed55708SRobert Watson #include <security/mac/mac_framework.h> 89aed55708SRobert Watson 904d621040SChristian S.J. Peron MALLOC_DEFINE(M_BPF, "BPF", "BPF data"); 9187f6c662SJulian Elischer 925bb5f2c9SPeter Wemm #if defined(DEV_BPF) || defined(NETGRAPH_BPF) 9353ac6efbSJulian Elischer 94df8bae1dSRodney W. Grimes #define PRINET 26 /* interruptible */ 95df8bae1dSRodney W. Grimes 96547d94bdSJung-uk Kim #define SIZEOF_BPF_HDR(type) \ 97547d94bdSJung-uk Kim (offsetof(type, bh_hdrlen) + sizeof(((type *)0)->bh_hdrlen)) 98547d94bdSJung-uk Kim 99fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 100fc0a61a4SKonstantin Belousov #include <sys/mount.h> 101fc0a61a4SKonstantin Belousov #include <compat/freebsd32/freebsd32.h> 102fc0a61a4SKonstantin Belousov #define BPF_ALIGNMENT32 sizeof(int32_t) 103fc0a61a4SKonstantin Belousov #define BPF_WORDALIGN32(x) (((x)+(BPF_ALIGNMENT32-1))&~(BPF_ALIGNMENT32-1)) 104fc0a61a4SKonstantin Belousov 105547d94bdSJung-uk Kim #ifndef BURN_BRIDGES 106fc0a61a4SKonstantin Belousov /* 107fc0a61a4SKonstantin Belousov * 32-bit version of structure prepended to each packet. We use this header 108fc0a61a4SKonstantin Belousov * instead of the standard one for 32-bit streams. We mark the a stream as 109fc0a61a4SKonstantin Belousov * 32-bit the first time we see a 32-bit compat ioctl request. 110fc0a61a4SKonstantin Belousov */ 111fc0a61a4SKonstantin Belousov struct bpf_hdr32 { 112fc0a61a4SKonstantin Belousov struct timeval32 bh_tstamp; /* time stamp */ 113fc0a61a4SKonstantin Belousov uint32_t bh_caplen; /* length of captured portion */ 114fc0a61a4SKonstantin Belousov uint32_t bh_datalen; /* original length of packet */ 115fc0a61a4SKonstantin Belousov uint16_t bh_hdrlen; /* length of bpf header (this struct 116fc0a61a4SKonstantin Belousov plus alignment padding) */ 117fc0a61a4SKonstantin Belousov }; 118253a3814SLawrence Stewart #endif 119fc0a61a4SKonstantin Belousov 120fc0a61a4SKonstantin Belousov struct bpf_program32 { 121fc0a61a4SKonstantin Belousov u_int bf_len; 122fc0a61a4SKonstantin Belousov uint32_t bf_insns; 123fc0a61a4SKonstantin Belousov }; 124fc0a61a4SKonstantin Belousov 125fc0a61a4SKonstantin Belousov struct bpf_dltlist32 { 126fc0a61a4SKonstantin Belousov u_int bfl_len; 127fc0a61a4SKonstantin Belousov u_int bfl_list; 128fc0a61a4SKonstantin Belousov }; 129fc0a61a4SKonstantin Belousov 130fc0a61a4SKonstantin Belousov #define BIOCSETF32 _IOW('B', 103, struct bpf_program32) 131fc0a61a4SKonstantin Belousov #define BIOCSRTIMEOUT32 _IOW('B', 109, struct timeval32) 132fc0a61a4SKonstantin Belousov #define BIOCGRTIMEOUT32 _IOR('B', 110, struct timeval32) 133fc0a61a4SKonstantin Belousov #define BIOCGDLTLIST32 _IOWR('B', 121, struct bpf_dltlist32) 134fc0a61a4SKonstantin Belousov #define BIOCSETWF32 _IOW('B', 123, struct bpf_program32) 135fc0a61a4SKonstantin Belousov #define BIOCSETFNR32 _IOW('B', 130, struct bpf_program32) 136253a3814SLawrence Stewart #endif 137fc0a61a4SKonstantin Belousov 138df8bae1dSRodney W. Grimes /* 139d1a67300SRobert Watson * bpf_iflist is a list of BPF interface structures, each corresponding to a 140d1a67300SRobert Watson * specific DLT. The same network interface might have several BPF interface 141d1a67300SRobert Watson * structures registered by different layers in the stack (i.e., 802.11 142d1a67300SRobert Watson * frames, ethernet frames, etc). 143df8bae1dSRodney W. Grimes */ 1444a3feeaaSRobert Watson static LIST_HEAD(, bpf_if) bpf_iflist; 145e7bb21b3SJonathan Lemon static struct mtx bpf_mtx; /* bpf global lock */ 14669f7644bSChristian S.J. Peron static int bpf_bpfd_cnt; 147df8bae1dSRodney W. Grimes 14819ba8395SChristian S.J. Peron static void bpf_attachd(struct bpf_d *, struct bpf_if *); 14919ba8395SChristian S.J. Peron static void bpf_detachd(struct bpf_d *); 150*6c74ff0eSAlexander V. Chernikov static void bpf_detachd_locked(struct bpf_d *); 151929ddbbbSAlfred Perlstein static void bpf_freed(struct bpf_d *); 152cb44b6dfSAndrew Thompson static int bpf_movein(struct uio *, int, struct ifnet *, struct mbuf **, 153560a54e1SJung-uk Kim struct sockaddr *, int *, struct bpf_insn *); 154929ddbbbSAlfred Perlstein static int bpf_setif(struct bpf_d *, struct ifreq *); 155929ddbbbSAlfred Perlstein static void bpf_timed_out(void *); 156e7bb21b3SJonathan Lemon static __inline void 157929ddbbbSAlfred Perlstein bpf_wakeup(struct bpf_d *); 1584d621040SChristian S.J. Peron static void catchpacket(struct bpf_d *, u_char *, u_int, u_int, 1594d621040SChristian S.J. Peron void (*)(struct bpf_d *, caddr_t, u_int, void *, u_int), 160547d94bdSJung-uk Kim struct bintime *); 161929ddbbbSAlfred Perlstein static void reset_d(struct bpf_d *); 16293e39f0bSChristian S.J. Peron static int bpf_setf(struct bpf_d *, struct bpf_program *, u_long cmd); 1638eab61f3SSam Leffler static int bpf_getdltlist(struct bpf_d *, struct bpf_dltlist *); 1648eab61f3SSam Leffler static int bpf_setdlt(struct bpf_d *, u_int); 16595aab9ccSJohn-Mark Gurney static void filt_bpfdetach(struct knote *); 16695aab9ccSJohn-Mark Gurney static int filt_bpfread(struct knote *, long); 167a3272e3cSChristian S.J. Peron static void bpf_drvinit(void *); 16869f7644bSChristian S.J. Peron static int bpf_stats_sysctl(SYSCTL_HANDLER_ARGS); 16969f7644bSChristian S.J. Peron 17069f7644bSChristian S.J. Peron SYSCTL_NODE(_net, OID_AUTO, bpf, CTLFLAG_RW, 0, "bpf sysctl"); 17112dc9582SJung-uk Kim int bpf_maxinsns = BPF_MAXINSNS; 17269f7644bSChristian S.J. Peron SYSCTL_INT(_net_bpf, OID_AUTO, maxinsns, CTLFLAG_RW, 17369f7644bSChristian S.J. Peron &bpf_maxinsns, 0, "Maximum bpf program instructions"); 174ffeeb924SChristian S.J. Peron static int bpf_zerocopy_enable = 0; 1754d621040SChristian S.J. Peron SYSCTL_INT(_net_bpf, OID_AUTO, zerocopy_enable, CTLFLAG_RW, 1764d621040SChristian S.J. Peron &bpf_zerocopy_enable, 0, "Enable new zero-copy BPF buffer sessions"); 1776472ac3dSEd Schouten static SYSCTL_NODE(_net_bpf, OID_AUTO, stats, CTLFLAG_MPSAFE | CTLFLAG_RW, 17869f7644bSChristian S.J. Peron bpf_stats_sysctl, "bpf statistics portal"); 179df8bae1dSRodney W. Grimes 18051ec1eb7SAlexander V. Chernikov static VNET_DEFINE(int, bpf_optimize_writers) = 0; 18151ec1eb7SAlexander V. Chernikov #define V_bpf_optimize_writers VNET(bpf_optimize_writers) 18251ec1eb7SAlexander V. Chernikov SYSCTL_VNET_INT(_net_bpf, OID_AUTO, optimize_writers, 18351ec1eb7SAlexander V. Chernikov CTLFLAG_RW, &VNET_NAME(bpf_optimize_writers), 0, 18451ec1eb7SAlexander V. Chernikov "Do not send packets until BPF program is set"); 18551ec1eb7SAlexander V. Chernikov 18687f6c662SJulian Elischer static d_open_t bpfopen; 18787f6c662SJulian Elischer static d_read_t bpfread; 18887f6c662SJulian Elischer static d_write_t bpfwrite; 18987f6c662SJulian Elischer static d_ioctl_t bpfioctl; 190243ac7d8SPeter Wemm static d_poll_t bpfpoll; 19195aab9ccSJohn-Mark Gurney static d_kqfilter_t bpfkqfilter; 19287f6c662SJulian Elischer 1934e2f199eSPoul-Henning Kamp static struct cdevsw bpf_cdevsw = { 194dc08ffecSPoul-Henning Kamp .d_version = D_VERSION, 1957ac40f5fSPoul-Henning Kamp .d_open = bpfopen, 1967ac40f5fSPoul-Henning Kamp .d_read = bpfread, 1977ac40f5fSPoul-Henning Kamp .d_write = bpfwrite, 1987ac40f5fSPoul-Henning Kamp .d_ioctl = bpfioctl, 1997ac40f5fSPoul-Henning Kamp .d_poll = bpfpoll, 2007ac40f5fSPoul-Henning Kamp .d_name = "bpf", 20195aab9ccSJohn-Mark Gurney .d_kqfilter = bpfkqfilter, 2024e2f199eSPoul-Henning Kamp }; 20387f6c662SJulian Elischer 204e76d823bSRobert Watson static struct filterops bpfread_filtops = { 205e76d823bSRobert Watson .f_isfd = 1, 206e76d823bSRobert Watson .f_detach = filt_bpfdetach, 207e76d823bSRobert Watson .f_event = filt_bpfread, 208e76d823bSRobert Watson }; 20987f6c662SJulian Elischer 2104d621040SChristian S.J. Peron /* 211*6c74ff0eSAlexander V. Chernikov * LOCKING MODEL USED BY BPF: 212*6c74ff0eSAlexander V. Chernikov * Locks: 213*6c74ff0eSAlexander V. Chernikov * 1) global lock (BPF_LOCK). Mutex, used to protect interface addition/removal, 214*6c74ff0eSAlexander V. Chernikov * some global counters and every bpf_if reference. 215*6c74ff0eSAlexander V. Chernikov * 2) Interface lock. Rwlock, used to protect list of BPF descriptors and their filters. 216*6c74ff0eSAlexander V. Chernikov * 3) Descriptor lock. Rwlock, used to protect BPF buffers and various structure fields 217*6c74ff0eSAlexander V. Chernikov * used by bpf_mtap code. 218*6c74ff0eSAlexander V. Chernikov * 219*6c74ff0eSAlexander V. Chernikov * Lock order: 220*6c74ff0eSAlexander V. Chernikov * 221*6c74ff0eSAlexander V. Chernikov * Global lock, interface lock, descriptor lock 222*6c74ff0eSAlexander V. Chernikov * 223*6c74ff0eSAlexander V. Chernikov * We have to acquire interface lock before descriptor main lock due to BPF_MTAP[2] 224*6c74ff0eSAlexander V. Chernikov * working model. In many places (like bpf_detachd) we start with BPF descriptor 225*6c74ff0eSAlexander V. Chernikov * (and we need to at least rlock it to get reliable interface pointer). This 226*6c74ff0eSAlexander V. Chernikov * gives us potential LOR. As a result, we use global lock to protect from bpf_if 227*6c74ff0eSAlexander V. Chernikov * change in every such place. 228*6c74ff0eSAlexander V. Chernikov * 229*6c74ff0eSAlexander V. Chernikov * Changing d->bd_bif is protected by 1) global lock, 2) interface lock and 230*6c74ff0eSAlexander V. Chernikov * 3) descriptor main wlock. 231*6c74ff0eSAlexander V. Chernikov * Reading bd_bif can be protected by any of these locks, typically global lock. 232*6c74ff0eSAlexander V. Chernikov * 233*6c74ff0eSAlexander V. Chernikov * Changing read/write BPF filter is protected by the same three locks, 234*6c74ff0eSAlexander V. Chernikov * the same applies for reading. 235*6c74ff0eSAlexander V. Chernikov * 236*6c74ff0eSAlexander V. Chernikov * Sleeping in global lock is not allowed due to bpfdetach() using it. 237*6c74ff0eSAlexander V. Chernikov */ 238*6c74ff0eSAlexander V. Chernikov 239*6c74ff0eSAlexander V. Chernikov /* 2404d621040SChristian S.J. Peron * Wrapper functions for various buffering methods. If the set of buffer 2414d621040SChristian S.J. Peron * modes expands, we will probably want to introduce a switch data structure 2424d621040SChristian S.J. Peron * similar to protosw, et. 2434d621040SChristian S.J. Peron */ 2444d621040SChristian S.J. Peron static void 2454d621040SChristian S.J. Peron bpf_append_bytes(struct bpf_d *d, caddr_t buf, u_int offset, void *src, 2464d621040SChristian S.J. Peron u_int len) 2474d621040SChristian S.J. Peron { 2484d621040SChristian S.J. Peron 249e4b3229aSAlexander V. Chernikov BPFD_WLOCK_ASSERT(d); 2504d621040SChristian S.J. Peron 2514d621040SChristian S.J. Peron switch (d->bd_bufmode) { 2524d621040SChristian S.J. Peron case BPF_BUFMODE_BUFFER: 2534d621040SChristian S.J. Peron return (bpf_buffer_append_bytes(d, buf, offset, src, len)); 2544d621040SChristian S.J. Peron 2554d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 2564d621040SChristian S.J. Peron d->bd_zcopy++; 2574d621040SChristian S.J. Peron return (bpf_zerocopy_append_bytes(d, buf, offset, src, len)); 2584d621040SChristian S.J. Peron 2594d621040SChristian S.J. Peron default: 2604d621040SChristian S.J. Peron panic("bpf_buf_append_bytes"); 2614d621040SChristian S.J. Peron } 2624d621040SChristian S.J. Peron } 2634d621040SChristian S.J. Peron 2644d621040SChristian S.J. Peron static void 2654d621040SChristian S.J. Peron bpf_append_mbuf(struct bpf_d *d, caddr_t buf, u_int offset, void *src, 2664d621040SChristian S.J. Peron u_int len) 2674d621040SChristian S.J. Peron { 2684d621040SChristian S.J. Peron 269e4b3229aSAlexander V. Chernikov BPFD_WLOCK_ASSERT(d); 2704d621040SChristian S.J. Peron 2714d621040SChristian S.J. Peron switch (d->bd_bufmode) { 2724d621040SChristian S.J. Peron case BPF_BUFMODE_BUFFER: 2734d621040SChristian S.J. Peron return (bpf_buffer_append_mbuf(d, buf, offset, src, len)); 2744d621040SChristian S.J. Peron 2754d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 2764d621040SChristian S.J. Peron d->bd_zcopy++; 2774d621040SChristian S.J. Peron return (bpf_zerocopy_append_mbuf(d, buf, offset, src, len)); 2784d621040SChristian S.J. Peron 2794d621040SChristian S.J. Peron default: 2804d621040SChristian S.J. Peron panic("bpf_buf_append_mbuf"); 2814d621040SChristian S.J. Peron } 2824d621040SChristian S.J. Peron } 2834d621040SChristian S.J. Peron 2844d621040SChristian S.J. Peron /* 28529f612ecSChristian S.J. Peron * This function gets called when the free buffer is re-assigned. 28629f612ecSChristian S.J. Peron */ 28729f612ecSChristian S.J. Peron static void 28829f612ecSChristian S.J. Peron bpf_buf_reclaimed(struct bpf_d *d) 28929f612ecSChristian S.J. Peron { 29029f612ecSChristian S.J. Peron 291e4b3229aSAlexander V. Chernikov BPFD_WLOCK_ASSERT(d); 29229f612ecSChristian S.J. Peron 29329f612ecSChristian S.J. Peron switch (d->bd_bufmode) { 29429f612ecSChristian S.J. Peron case BPF_BUFMODE_BUFFER: 29529f612ecSChristian S.J. Peron return; 29629f612ecSChristian S.J. Peron 29729f612ecSChristian S.J. Peron case BPF_BUFMODE_ZBUF: 29829f612ecSChristian S.J. Peron bpf_zerocopy_buf_reclaimed(d); 29929f612ecSChristian S.J. Peron return; 30029f612ecSChristian S.J. Peron 30129f612ecSChristian S.J. Peron default: 30229f612ecSChristian S.J. Peron panic("bpf_buf_reclaimed"); 30329f612ecSChristian S.J. Peron } 30429f612ecSChristian S.J. Peron } 30529f612ecSChristian S.J. Peron 30629f612ecSChristian S.J. Peron /* 3074d621040SChristian S.J. Peron * If the buffer mechanism has a way to decide that a held buffer can be made 3084d621040SChristian S.J. Peron * free, then it is exposed via the bpf_canfreebuf() interface. (1) is 3094d621040SChristian S.J. Peron * returned if the buffer can be discarded, (0) is returned if it cannot. 3104d621040SChristian S.J. Peron */ 3114d621040SChristian S.J. Peron static int 3124d621040SChristian S.J. Peron bpf_canfreebuf(struct bpf_d *d) 3134d621040SChristian S.J. Peron { 3144d621040SChristian S.J. Peron 3154d621040SChristian S.J. Peron BPFD_LOCK_ASSERT(d); 3164d621040SChristian S.J. Peron 3174d621040SChristian S.J. Peron switch (d->bd_bufmode) { 3184d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 3194d621040SChristian S.J. Peron return (bpf_zerocopy_canfreebuf(d)); 3204d621040SChristian S.J. Peron } 3214d621040SChristian S.J. Peron return (0); 3224d621040SChristian S.J. Peron } 3234d621040SChristian S.J. Peron 324a7a91e65SRobert Watson /* 325a7a91e65SRobert Watson * Allow the buffer model to indicate that the current store buffer is 326a7a91e65SRobert Watson * immutable, regardless of the appearance of space. Return (1) if the 327a7a91e65SRobert Watson * buffer is writable, and (0) if not. 328a7a91e65SRobert Watson */ 329a7a91e65SRobert Watson static int 330a7a91e65SRobert Watson bpf_canwritebuf(struct bpf_d *d) 331a7a91e65SRobert Watson { 332a7a91e65SRobert Watson BPFD_LOCK_ASSERT(d); 333a7a91e65SRobert Watson 334a7a91e65SRobert Watson switch (d->bd_bufmode) { 335a7a91e65SRobert Watson case BPF_BUFMODE_ZBUF: 336a7a91e65SRobert Watson return (bpf_zerocopy_canwritebuf(d)); 337a7a91e65SRobert Watson } 338a7a91e65SRobert Watson return (1); 339a7a91e65SRobert Watson } 340a7a91e65SRobert Watson 341a7a91e65SRobert Watson /* 342a7a91e65SRobert Watson * Notify buffer model that an attempt to write to the store buffer has 343a7a91e65SRobert Watson * resulted in a dropped packet, in which case the buffer may be considered 344a7a91e65SRobert Watson * full. 345a7a91e65SRobert Watson */ 346a7a91e65SRobert Watson static void 347a7a91e65SRobert Watson bpf_buffull(struct bpf_d *d) 348a7a91e65SRobert Watson { 349a7a91e65SRobert Watson 350e4b3229aSAlexander V. Chernikov BPFD_WLOCK_ASSERT(d); 351a7a91e65SRobert Watson 352a7a91e65SRobert Watson switch (d->bd_bufmode) { 353a7a91e65SRobert Watson case BPF_BUFMODE_ZBUF: 354a7a91e65SRobert Watson bpf_zerocopy_buffull(d); 355a7a91e65SRobert Watson break; 356a7a91e65SRobert Watson } 357a7a91e65SRobert Watson } 358a7a91e65SRobert Watson 359a7a91e65SRobert Watson /* 360a7a91e65SRobert Watson * Notify the buffer model that a buffer has moved into the hold position. 361a7a91e65SRobert Watson */ 3624d621040SChristian S.J. Peron void 3634d621040SChristian S.J. Peron bpf_bufheld(struct bpf_d *d) 3644d621040SChristian S.J. Peron { 3654d621040SChristian S.J. Peron 366e4b3229aSAlexander V. Chernikov BPFD_WLOCK_ASSERT(d); 3674d621040SChristian S.J. Peron 3684d621040SChristian S.J. Peron switch (d->bd_bufmode) { 3694d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 3704d621040SChristian S.J. Peron bpf_zerocopy_bufheld(d); 3714d621040SChristian S.J. Peron break; 3724d621040SChristian S.J. Peron } 3734d621040SChristian S.J. Peron } 3744d621040SChristian S.J. Peron 3754d621040SChristian S.J. Peron static void 3764d621040SChristian S.J. Peron bpf_free(struct bpf_d *d) 3774d621040SChristian S.J. Peron { 3784d621040SChristian S.J. Peron 3794d621040SChristian S.J. Peron switch (d->bd_bufmode) { 3804d621040SChristian S.J. Peron case BPF_BUFMODE_BUFFER: 3814d621040SChristian S.J. Peron return (bpf_buffer_free(d)); 3824d621040SChristian S.J. Peron 3834d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 3844d621040SChristian S.J. Peron return (bpf_zerocopy_free(d)); 3854d621040SChristian S.J. Peron 3864d621040SChristian S.J. Peron default: 3874d621040SChristian S.J. Peron panic("bpf_buf_free"); 3884d621040SChristian S.J. Peron } 3894d621040SChristian S.J. Peron } 3904d621040SChristian S.J. Peron 3914d621040SChristian S.J. Peron static int 3924d621040SChristian S.J. Peron bpf_uiomove(struct bpf_d *d, caddr_t buf, u_int len, struct uio *uio) 3934d621040SChristian S.J. Peron { 3944d621040SChristian S.J. Peron 3954d621040SChristian S.J. Peron if (d->bd_bufmode != BPF_BUFMODE_BUFFER) 3964d621040SChristian S.J. Peron return (EOPNOTSUPP); 3974d621040SChristian S.J. Peron return (bpf_buffer_uiomove(d, buf, len, uio)); 3984d621040SChristian S.J. Peron } 3994d621040SChristian S.J. Peron 4004d621040SChristian S.J. Peron static int 4014d621040SChristian S.J. Peron bpf_ioctl_sblen(struct bpf_d *d, u_int *i) 4024d621040SChristian S.J. Peron { 4034d621040SChristian S.J. Peron 4044d621040SChristian S.J. Peron if (d->bd_bufmode != BPF_BUFMODE_BUFFER) 4054d621040SChristian S.J. Peron return (EOPNOTSUPP); 4064d621040SChristian S.J. Peron return (bpf_buffer_ioctl_sblen(d, i)); 4074d621040SChristian S.J. Peron } 4084d621040SChristian S.J. Peron 4094d621040SChristian S.J. Peron static int 4104d621040SChristian S.J. Peron bpf_ioctl_getzmax(struct thread *td, struct bpf_d *d, size_t *i) 4114d621040SChristian S.J. Peron { 4124d621040SChristian S.J. Peron 4134d621040SChristian S.J. Peron if (d->bd_bufmode != BPF_BUFMODE_ZBUF) 4144d621040SChristian S.J. Peron return (EOPNOTSUPP); 4154d621040SChristian S.J. Peron return (bpf_zerocopy_ioctl_getzmax(td, d, i)); 4164d621040SChristian S.J. Peron } 4174d621040SChristian S.J. Peron 4184d621040SChristian S.J. Peron static int 4194d621040SChristian S.J. Peron bpf_ioctl_rotzbuf(struct thread *td, struct bpf_d *d, struct bpf_zbuf *bz) 4204d621040SChristian S.J. Peron { 4214d621040SChristian S.J. Peron 4224d621040SChristian S.J. Peron if (d->bd_bufmode != BPF_BUFMODE_ZBUF) 4234d621040SChristian S.J. Peron return (EOPNOTSUPP); 4244d621040SChristian S.J. Peron return (bpf_zerocopy_ioctl_rotzbuf(td, d, bz)); 4254d621040SChristian S.J. Peron } 4264d621040SChristian S.J. Peron 4274d621040SChristian S.J. Peron static int 4284d621040SChristian S.J. Peron bpf_ioctl_setzbuf(struct thread *td, struct bpf_d *d, struct bpf_zbuf *bz) 4294d621040SChristian S.J. Peron { 4304d621040SChristian S.J. Peron 4314d621040SChristian S.J. Peron if (d->bd_bufmode != BPF_BUFMODE_ZBUF) 4324d621040SChristian S.J. Peron return (EOPNOTSUPP); 4334d621040SChristian S.J. Peron return (bpf_zerocopy_ioctl_setzbuf(td, d, bz)); 4344d621040SChristian S.J. Peron } 4354d621040SChristian S.J. Peron 4364d621040SChristian S.J. Peron /* 4374d621040SChristian S.J. Peron * General BPF functions. 4384d621040SChristian S.J. Peron */ 439df8bae1dSRodney W. Grimes static int 440cb44b6dfSAndrew Thompson bpf_movein(struct uio *uio, int linktype, struct ifnet *ifp, struct mbuf **mp, 441560a54e1SJung-uk Kim struct sockaddr *sockp, int *hdrlen, struct bpf_insn *wfilter) 442df8bae1dSRodney W. Grimes { 443246b5467SSam Leffler const struct ieee80211_bpf_params *p; 444cb44b6dfSAndrew Thompson struct ether_header *eh; 445df8bae1dSRodney W. Grimes struct mbuf *m; 446df8bae1dSRodney W. Grimes int error; 447df8bae1dSRodney W. Grimes int len; 448df8bae1dSRodney W. Grimes int hlen; 44993e39f0bSChristian S.J. Peron int slen; 450df8bae1dSRodney W. Grimes 451df8bae1dSRodney W. Grimes /* 452df8bae1dSRodney W. Grimes * Build a sockaddr based on the data link layer type. 453df8bae1dSRodney W. Grimes * We do this at this level because the ethernet header 454df8bae1dSRodney W. Grimes * is copied directly into the data field of the sockaddr. 455df8bae1dSRodney W. Grimes * In the case of SLIP, there is no header and the packet 456df8bae1dSRodney W. Grimes * is forwarded as is. 457df8bae1dSRodney W. Grimes * Also, we are careful to leave room at the front of the mbuf 458df8bae1dSRodney W. Grimes * for the link level header. 459df8bae1dSRodney W. Grimes */ 460df8bae1dSRodney W. Grimes switch (linktype) { 461df8bae1dSRodney W. Grimes 462df8bae1dSRodney W. Grimes case DLT_SLIP: 463df8bae1dSRodney W. Grimes sockp->sa_family = AF_INET; 464df8bae1dSRodney W. Grimes hlen = 0; 465df8bae1dSRodney W. Grimes break; 466df8bae1dSRodney W. Grimes 467df8bae1dSRodney W. Grimes case DLT_EN10MB: 468df8bae1dSRodney W. Grimes sockp->sa_family = AF_UNSPEC; 469df8bae1dSRodney W. Grimes /* XXX Would MAXLINKHDR be better? */ 470797f247bSMatthew N. Dodd hlen = ETHER_HDR_LEN; 471df8bae1dSRodney W. Grimes break; 472df8bae1dSRodney W. Grimes 473df8bae1dSRodney W. Grimes case DLT_FDDI: 474d41f24e7SDavid Greenman sockp->sa_family = AF_IMPLINK; 475d41f24e7SDavid Greenman hlen = 0; 476df8bae1dSRodney W. Grimes break; 477df8bae1dSRodney W. Grimes 47822f05c43SAndrey A. Chernov case DLT_RAW: 479df8bae1dSRodney W. Grimes sockp->sa_family = AF_UNSPEC; 480df8bae1dSRodney W. Grimes hlen = 0; 481df8bae1dSRodney W. Grimes break; 482df8bae1dSRodney W. Grimes 48301399f34SDavid Malone case DLT_NULL: 48401399f34SDavid Malone /* 48501399f34SDavid Malone * null interface types require a 4 byte pseudo header which 48601399f34SDavid Malone * corresponds to the address family of the packet. 48701399f34SDavid Malone */ 48801399f34SDavid Malone sockp->sa_family = AF_UNSPEC; 48901399f34SDavid Malone hlen = 4; 49001399f34SDavid Malone break; 49101399f34SDavid Malone 4924f53e3ccSKenjiro Cho case DLT_ATM_RFC1483: 4934f53e3ccSKenjiro Cho /* 4944f53e3ccSKenjiro Cho * en atm driver requires 4-byte atm pseudo header. 4954f53e3ccSKenjiro Cho * though it isn't standard, vpi:vci needs to be 4964f53e3ccSKenjiro Cho * specified anyway. 4974f53e3ccSKenjiro Cho */ 4984f53e3ccSKenjiro Cho sockp->sa_family = AF_UNSPEC; 4994f53e3ccSKenjiro Cho hlen = 12; /* XXX 4(ATM_PH) + 3(LLC) + 5(SNAP) */ 5004f53e3ccSKenjiro Cho break; 5014f53e3ccSKenjiro Cho 50230fa52a6SBrian Somers case DLT_PPP: 50330fa52a6SBrian Somers sockp->sa_family = AF_UNSPEC; 50430fa52a6SBrian Somers hlen = 4; /* This should match PPP_HDRLEN */ 50530fa52a6SBrian Somers break; 50630fa52a6SBrian Somers 507246b5467SSam Leffler case DLT_IEEE802_11: /* IEEE 802.11 wireless */ 508246b5467SSam Leffler sockp->sa_family = AF_IEEE80211; 509246b5467SSam Leffler hlen = 0; 510246b5467SSam Leffler break; 511246b5467SSam Leffler 512246b5467SSam Leffler case DLT_IEEE802_11_RADIO: /* IEEE 802.11 wireless w/ phy params */ 513246b5467SSam Leffler sockp->sa_family = AF_IEEE80211; 514246b5467SSam Leffler sockp->sa_len = 12; /* XXX != 0 */ 515246b5467SSam Leffler hlen = sizeof(struct ieee80211_bpf_params); 516246b5467SSam Leffler break; 517246b5467SSam Leffler 518df8bae1dSRodney W. Grimes default: 519df8bae1dSRodney W. Grimes return (EIO); 520df8bae1dSRodney W. Grimes } 521df8bae1dSRodney W. Grimes 522df8bae1dSRodney W. Grimes len = uio->uio_resid; 52301399f34SDavid Malone 524cb44b6dfSAndrew Thompson if (len - hlen > ifp->if_mtu) 52501399f34SDavid Malone return (EMSGSIZE); 52601399f34SDavid Malone 527968c88bcSJung-uk Kim if ((unsigned)len > MJUM16BYTES) 528df8bae1dSRodney W. Grimes return (EIO); 529df8bae1dSRodney W. Grimes 530968c88bcSJung-uk Kim if (len <= MHLEN) 531968c88bcSJung-uk Kim MGETHDR(m, M_WAIT, MT_DATA); 532968c88bcSJung-uk Kim else if (len <= MCLBYTES) 533ea26d587SRuslan Ermilov m = m_getcl(M_WAIT, MT_DATA, M_PKTHDR); 534ea26d587SRuslan Ermilov else 535968c88bcSJung-uk Kim m = m_getjcl(M_WAIT, MT_DATA, M_PKTHDR, 536968c88bcSJung-uk Kim #if (MJUMPAGESIZE > MCLBYTES) 537968c88bcSJung-uk Kim len <= MJUMPAGESIZE ? MJUMPAGESIZE : 538968c88bcSJung-uk Kim #endif 539968c88bcSJung-uk Kim (len <= MJUM9BYTES ? MJUM9BYTES : MJUM16BYTES)); 540963e4c2aSGarrett Wollman m->m_pkthdr.len = m->m_len = len; 541963e4c2aSGarrett Wollman m->m_pkthdr.rcvif = NULL; 542df8bae1dSRodney W. Grimes *mp = m; 54324a229f4SSam Leffler 54493e39f0bSChristian S.J. Peron if (m->m_len < hlen) { 54593e39f0bSChristian S.J. Peron error = EPERM; 54693e39f0bSChristian S.J. Peron goto bad; 54793e39f0bSChristian S.J. Peron } 54893e39f0bSChristian S.J. Peron 54993e39f0bSChristian S.J. Peron error = uiomove(mtod(m, u_char *), len, uio); 55093e39f0bSChristian S.J. Peron if (error) 55193e39f0bSChristian S.J. Peron goto bad; 55293e39f0bSChristian S.J. Peron 55393e39f0bSChristian S.J. Peron slen = bpf_filter(wfilter, mtod(m, u_char *), len, len); 55493e39f0bSChristian S.J. Peron if (slen == 0) { 55593e39f0bSChristian S.J. Peron error = EPERM; 55693e39f0bSChristian S.J. Peron goto bad; 55793e39f0bSChristian S.J. Peron } 55893e39f0bSChristian S.J. Peron 559cb44b6dfSAndrew Thompson /* Check for multicast destination */ 560cb44b6dfSAndrew Thompson switch (linktype) { 561cb44b6dfSAndrew Thompson case DLT_EN10MB: 562cb44b6dfSAndrew Thompson eh = mtod(m, struct ether_header *); 563cb44b6dfSAndrew Thompson if (ETHER_IS_MULTICAST(eh->ether_dhost)) { 564cb44b6dfSAndrew Thompson if (bcmp(ifp->if_broadcastaddr, eh->ether_dhost, 565cb44b6dfSAndrew Thompson ETHER_ADDR_LEN) == 0) 566cb44b6dfSAndrew Thompson m->m_flags |= M_BCAST; 567cb44b6dfSAndrew Thompson else 568cb44b6dfSAndrew Thompson m->m_flags |= M_MCAST; 569cb44b6dfSAndrew Thompson } 570cb44b6dfSAndrew Thompson break; 571cb44b6dfSAndrew Thompson } 572cb44b6dfSAndrew Thompson 573df8bae1dSRodney W. Grimes /* 57493e39f0bSChristian S.J. Peron * Make room for link header, and copy it to sockaddr 575df8bae1dSRodney W. Grimes */ 576df8bae1dSRodney W. Grimes if (hlen != 0) { 577246b5467SSam Leffler if (sockp->sa_family == AF_IEEE80211) { 578246b5467SSam Leffler /* 579246b5467SSam Leffler * Collect true length from the parameter header 580246b5467SSam Leffler * NB: sockp is known to be zero'd so if we do a 581246b5467SSam Leffler * short copy unspecified parameters will be 582246b5467SSam Leffler * zero. 583246b5467SSam Leffler * NB: packet may not be aligned after stripping 584246b5467SSam Leffler * bpf params 585246b5467SSam Leffler * XXX check ibp_vers 586246b5467SSam Leffler */ 587246b5467SSam Leffler p = mtod(m, const struct ieee80211_bpf_params *); 588246b5467SSam Leffler hlen = p->ibp_len; 589246b5467SSam Leffler if (hlen > sizeof(sockp->sa_data)) { 590246b5467SSam Leffler error = EINVAL; 591246b5467SSam Leffler goto bad; 592246b5467SSam Leffler } 593246b5467SSam Leffler } 59493e39f0bSChristian S.J. Peron bcopy(m->m_data, sockp->sa_data, hlen); 595df8bae1dSRodney W. Grimes } 596560a54e1SJung-uk Kim *hdrlen = hlen; 59793e39f0bSChristian S.J. Peron 598df8bae1dSRodney W. Grimes return (0); 599df8bae1dSRodney W. Grimes bad: 600df8bae1dSRodney W. Grimes m_freem(m); 601df8bae1dSRodney W. Grimes return (error); 602df8bae1dSRodney W. Grimes } 603df8bae1dSRodney W. Grimes 604df8bae1dSRodney W. Grimes /* 605df8bae1dSRodney W. Grimes * Attach file to the bpf interface, i.e. make d listen on bp. 606df8bae1dSRodney W. Grimes */ 607df8bae1dSRodney W. Grimes static void 60819ba8395SChristian S.J. Peron bpf_attachd(struct bpf_d *d, struct bpf_if *bp) 609df8bae1dSRodney W. Grimes { 610*6c74ff0eSAlexander V. Chernikov int op_w; 611*6c74ff0eSAlexander V. Chernikov 612*6c74ff0eSAlexander V. Chernikov BPF_LOCK_ASSERT(); 613*6c74ff0eSAlexander V. Chernikov 614*6c74ff0eSAlexander V. Chernikov /* 615*6c74ff0eSAlexander V. Chernikov * Save sysctl value to protect from sysctl change 616*6c74ff0eSAlexander V. Chernikov * between reads 617*6c74ff0eSAlexander V. Chernikov */ 618*6c74ff0eSAlexander V. Chernikov op_w = V_bpf_optimize_writers; 619*6c74ff0eSAlexander V. Chernikov 620*6c74ff0eSAlexander V. Chernikov if (d->bd_bif != NULL) 621*6c74ff0eSAlexander V. Chernikov bpf_detachd_locked(d); 622df8bae1dSRodney W. Grimes /* 62351ec1eb7SAlexander V. Chernikov * Point d at bp, and add d to the interface's list. 62451ec1eb7SAlexander V. Chernikov * Since there are many applicaiotns using BPF for 62551ec1eb7SAlexander V. Chernikov * sending raw packets only (dhcpd, cdpd are good examples) 62651ec1eb7SAlexander V. Chernikov * we can delay adding d to the list of active listeners until 62751ec1eb7SAlexander V. Chernikov * some filter is configured. 628df8bae1dSRodney W. Grimes */ 62951ec1eb7SAlexander V. Chernikov 63051ec1eb7SAlexander V. Chernikov BPFIF_WLOCK(bp); 631*6c74ff0eSAlexander V. Chernikov BPFD_WLOCK(d); 63251ec1eb7SAlexander V. Chernikov 633*6c74ff0eSAlexander V. Chernikov d->bd_bif = bp; 634*6c74ff0eSAlexander V. Chernikov 635*6c74ff0eSAlexander V. Chernikov if (op_w != 0) { 63651ec1eb7SAlexander V. Chernikov /* Add to writers-only list */ 63751ec1eb7SAlexander V. Chernikov LIST_INSERT_HEAD(&bp->bif_wlist, d, bd_next); 63851ec1eb7SAlexander V. Chernikov /* 63951ec1eb7SAlexander V. Chernikov * We decrement bd_writer on every filter set operation. 64051ec1eb7SAlexander V. Chernikov * First BIOCSETF is done by pcap_open_live() to set up 64151ec1eb7SAlexander V. Chernikov * snap length. After that appliation usually sets its own filter 64251ec1eb7SAlexander V. Chernikov */ 64351ec1eb7SAlexander V. Chernikov d->bd_writer = 2; 64451ec1eb7SAlexander V. Chernikov } else 6454a3feeaaSRobert Watson LIST_INSERT_HEAD(&bp->bif_dlist, d, bd_next); 646df8bae1dSRodney W. Grimes 647*6c74ff0eSAlexander V. Chernikov BPFD_WUNLOCK(d); 648e4b3229aSAlexander V. Chernikov BPFIF_WUNLOCK(bp); 649b743c310SSam Leffler 65051ec1eb7SAlexander V. Chernikov bpf_bpfd_cnt++; 65151ec1eb7SAlexander V. Chernikov 65251ec1eb7SAlexander V. Chernikov CTR3(KTR_NET, "%s: bpf_attach called by pid %d, adding to %s list", 65351ec1eb7SAlexander V. Chernikov __func__, d->bd_pid, d->bd_writer ? "writer" : "active"); 65451ec1eb7SAlexander V. Chernikov 655*6c74ff0eSAlexander V. Chernikov if (op_w == 0) 65651ec1eb7SAlexander V. Chernikov EVENTHANDLER_INVOKE(bpf_track, bp->bif_ifp, bp->bif_dlt, 1); 65751ec1eb7SAlexander V. Chernikov } 65851ec1eb7SAlexander V. Chernikov 65951ec1eb7SAlexander V. Chernikov /* 66051ec1eb7SAlexander V. Chernikov * Add d to the list of active bp filters. 66151ec1eb7SAlexander V. Chernikov * Reuqires bpf_attachd() to be called before 66251ec1eb7SAlexander V. Chernikov */ 66351ec1eb7SAlexander V. Chernikov static void 66451ec1eb7SAlexander V. Chernikov bpf_upgraded(struct bpf_d *d) 66551ec1eb7SAlexander V. Chernikov { 66651ec1eb7SAlexander V. Chernikov struct bpf_if *bp; 66751ec1eb7SAlexander V. Chernikov 668*6c74ff0eSAlexander V. Chernikov BPF_LOCK_ASSERT(); 669*6c74ff0eSAlexander V. Chernikov 67051ec1eb7SAlexander V. Chernikov bp = d->bd_bif; 67151ec1eb7SAlexander V. Chernikov 672*6c74ff0eSAlexander V. Chernikov /* 673*6c74ff0eSAlexander V. Chernikov * Filter can be set several times without specifying interface. 674*6c74ff0eSAlexander V. Chernikov * Mark d as reader and exit. 675*6c74ff0eSAlexander V. Chernikov */ 676*6c74ff0eSAlexander V. Chernikov if (bp == NULL) { 677*6c74ff0eSAlexander V. Chernikov BPFD_WLOCK(d); 678*6c74ff0eSAlexander V. Chernikov d->bd_writer = 0; 679*6c74ff0eSAlexander V. Chernikov BPFD_WUNLOCK(d); 680*6c74ff0eSAlexander V. Chernikov return; 681*6c74ff0eSAlexander V. Chernikov } 682*6c74ff0eSAlexander V. Chernikov 68351ec1eb7SAlexander V. Chernikov BPFIF_WLOCK(bp); 68451ec1eb7SAlexander V. Chernikov BPFD_WLOCK(d); 68551ec1eb7SAlexander V. Chernikov 68651ec1eb7SAlexander V. Chernikov /* Remove from writers-only list */ 68751ec1eb7SAlexander V. Chernikov LIST_REMOVE(d, bd_next); 68851ec1eb7SAlexander V. Chernikov LIST_INSERT_HEAD(&bp->bif_dlist, d, bd_next); 68951ec1eb7SAlexander V. Chernikov /* Mark d as reader */ 69051ec1eb7SAlexander V. Chernikov d->bd_writer = 0; 69151ec1eb7SAlexander V. Chernikov 69251ec1eb7SAlexander V. Chernikov BPFD_WUNLOCK(d); 69351ec1eb7SAlexander V. Chernikov BPFIF_WUNLOCK(bp); 69451ec1eb7SAlexander V. Chernikov 69551ec1eb7SAlexander V. Chernikov CTR2(KTR_NET, "%s: upgrade required by pid %d", __func__, d->bd_pid); 69651ec1eb7SAlexander V. Chernikov 6975ce8d970SSam Leffler EVENTHANDLER_INVOKE(bpf_track, bp->bif_ifp, bp->bif_dlt, 1); 698df8bae1dSRodney W. Grimes } 699df8bae1dSRodney W. Grimes 700df8bae1dSRodney W. Grimes /* 701df8bae1dSRodney W. Grimes * Detach a file from its interface. 702df8bae1dSRodney W. Grimes */ 703df8bae1dSRodney W. Grimes static void 70419ba8395SChristian S.J. Peron bpf_detachd(struct bpf_d *d) 705df8bae1dSRodney W. Grimes { 706*6c74ff0eSAlexander V. Chernikov BPF_LOCK(); 707*6c74ff0eSAlexander V. Chernikov bpf_detachd_locked(d); 708*6c74ff0eSAlexander V. Chernikov BPF_UNLOCK(); 709*6c74ff0eSAlexander V. Chernikov } 710*6c74ff0eSAlexander V. Chernikov 711*6c74ff0eSAlexander V. Chernikov static void 712*6c74ff0eSAlexander V. Chernikov bpf_detachd_locked(struct bpf_d *d) 713*6c74ff0eSAlexander V. Chernikov { 7146e891d64SPoul-Henning Kamp int error; 715df8bae1dSRodney W. Grimes struct bpf_if *bp; 71646448b5aSRobert Watson struct ifnet *ifp; 717df8bae1dSRodney W. Grimes 71851ec1eb7SAlexander V. Chernikov CTR2(KTR_NET, "%s: detach required by pid %d", __func__, d->bd_pid); 71951ec1eb7SAlexander V. Chernikov 720e4b3229aSAlexander V. Chernikov BPF_LOCK_ASSERT(); 721e4b3229aSAlexander V. Chernikov 722*6c74ff0eSAlexander V. Chernikov /* Check if descriptor is attached */ 723*6c74ff0eSAlexander V. Chernikov if ((bp = d->bd_bif) == NULL) 724*6c74ff0eSAlexander V. Chernikov return; 725*6c74ff0eSAlexander V. Chernikov 726e4b3229aSAlexander V. Chernikov BPFIF_WLOCK(bp); 727e4b3229aSAlexander V. Chernikov BPFD_WLOCK(d); 72846448b5aSRobert Watson 72951ec1eb7SAlexander V. Chernikov /* Save bd_writer value */ 73051ec1eb7SAlexander V. Chernikov error = d->bd_writer; 73151ec1eb7SAlexander V. Chernikov 73246448b5aSRobert Watson /* 73346448b5aSRobert Watson * Remove d from the interface's descriptor list. 73446448b5aSRobert Watson */ 73546448b5aSRobert Watson LIST_REMOVE(d, bd_next); 73646448b5aSRobert Watson 737e4b3229aSAlexander V. Chernikov ifp = bp->bif_ifp; 738572bde2aSRobert Watson d->bd_bif = NULL; 739e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 740e4b3229aSAlexander V. Chernikov BPFIF_WUNLOCK(bp); 741e4b3229aSAlexander V. Chernikov 742e4b3229aSAlexander V. Chernikov bpf_bpfd_cnt--; 74346448b5aSRobert Watson 74451ec1eb7SAlexander V. Chernikov /* Call event handler iff d is attached */ 74551ec1eb7SAlexander V. Chernikov if (error == 0) 7465ce8d970SSam Leffler EVENTHANDLER_INVOKE(bpf_track, ifp, bp->bif_dlt, 0); 747b743c310SSam Leffler 748df8bae1dSRodney W. Grimes /* 749df8bae1dSRodney W. Grimes * Check if this descriptor had requested promiscuous mode. 750df8bae1dSRodney W. Grimes * If so, turn it off. 751df8bae1dSRodney W. Grimes */ 752df8bae1dSRodney W. Grimes if (d->bd_promisc) { 753df8bae1dSRodney W. Grimes d->bd_promisc = 0; 75497021c24SMarko Zec CURVNET_SET(ifp->if_vnet); 75546448b5aSRobert Watson error = ifpromisc(ifp, 0); 75697021c24SMarko Zec CURVNET_RESTORE(); 7576e891d64SPoul-Henning Kamp if (error != 0 && error != ENXIO) { 758df8bae1dSRodney W. Grimes /* 7596e891d64SPoul-Henning Kamp * ENXIO can happen if a pccard is unplugged 760df8bae1dSRodney W. Grimes * Something is really wrong if we were able to put 761df8bae1dSRodney W. Grimes * the driver into promiscuous mode, but can't 762df8bae1dSRodney W. Grimes * take it out. 763df8bae1dSRodney W. Grimes */ 7648eab61f3SSam Leffler if_printf(bp->bif_ifp, 7658eab61f3SSam Leffler "bpf_detach: ifpromisc failed (%d)\n", error); 7666e891d64SPoul-Henning Kamp } 767df8bae1dSRodney W. Grimes } 768df8bae1dSRodney W. Grimes } 769df8bae1dSRodney W. Grimes 770df8bae1dSRodney W. Grimes /* 771136600feSEd Schouten * Close the descriptor by detaching it from its interface, 772136600feSEd Schouten * deallocating its buffers, and marking it free. 773136600feSEd Schouten */ 774136600feSEd Schouten static void 775136600feSEd Schouten bpf_dtor(void *data) 776136600feSEd Schouten { 777136600feSEd Schouten struct bpf_d *d = data; 778136600feSEd Schouten 779e4b3229aSAlexander V. Chernikov BPFD_WLOCK(d); 780136600feSEd Schouten if (d->bd_state == BPF_WAITING) 781136600feSEd Schouten callout_stop(&d->bd_callout); 782136600feSEd Schouten d->bd_state = BPF_IDLE; 783e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 784136600feSEd Schouten funsetown(&d->bd_sigio); 785136600feSEd Schouten bpf_detachd(d); 786136600feSEd Schouten #ifdef MAC 787136600feSEd Schouten mac_bpfdesc_destroy(d); 788136600feSEd Schouten #endif /* MAC */ 7896aba400aSAttilio Rao seldrain(&d->bd_sel); 790136600feSEd Schouten knlist_destroy(&d->bd_sel.si_note); 7919fee1bd1SJung-uk Kim callout_drain(&d->bd_callout); 792136600feSEd Schouten bpf_freed(d); 793136600feSEd Schouten free(d, M_BPF); 794136600feSEd Schouten } 795136600feSEd Schouten 796136600feSEd Schouten /* 797df8bae1dSRodney W. Grimes * Open ethernet device. Returns ENXIO for illegal minor device number, 798df8bae1dSRodney W. Grimes * EBUSY if file is open by another process. 799df8bae1dSRodney W. Grimes */ 800df8bae1dSRodney W. Grimes /* ARGSUSED */ 80187f6c662SJulian Elischer static int 80219ba8395SChristian S.J. Peron bpfopen(struct cdev *dev, int flags, int fmt, struct thread *td) 803df8bae1dSRodney W. Grimes { 804e7bb21b3SJonathan Lemon struct bpf_d *d; 805136600feSEd Schouten int error; 806df8bae1dSRodney W. Grimes 8071ede983cSDag-Erling Smørgrav d = malloc(sizeof(*d), M_BPF, M_WAITOK | M_ZERO); 808136600feSEd Schouten error = devfs_set_cdevpriv(d, bpf_dtor); 809136600feSEd Schouten if (error != 0) { 810136600feSEd Schouten free(d, M_BPF); 811136600feSEd Schouten return (error); 812136600feSEd Schouten } 8134d621040SChristian S.J. Peron 8144d621040SChristian S.J. Peron /* 8154d621040SChristian S.J. Peron * For historical reasons, perform a one-time initialization call to 8164d621040SChristian S.J. Peron * the buffer routines, even though we're not yet committed to a 8174d621040SChristian S.J. Peron * particular buffer method. 8184d621040SChristian S.J. Peron */ 8194d621040SChristian S.J. Peron bpf_buffer_init(d); 8204d621040SChristian S.J. Peron d->bd_bufmode = BPF_BUFMODE_BUFFER; 82100a83887SPaul Traina d->bd_sig = SIGIO; 822560a54e1SJung-uk Kim d->bd_direction = BPF_D_INOUT; 823e4b3229aSAlexander V. Chernikov BPF_PID_REFRESH(d, td); 82482f4445dSRobert Watson #ifdef MAC 82530d239bcSRobert Watson mac_bpfdesc_init(d); 82630d239bcSRobert Watson mac_bpfdesc_create(td->td_ucred, d); 82782f4445dSRobert Watson #endif 828e4b3229aSAlexander V. Chernikov rw_init(&d->bd_lock, "bpf cdev lock"); 829e4b3229aSAlexander V. Chernikov callout_init_rw(&d->bd_callout, &d->bd_lock, 0); 830e4b3229aSAlexander V. Chernikov knlist_init_rw_reader(&d->bd_sel.si_note, &d->bd_lock); 831df8bae1dSRodney W. Grimes 832df8bae1dSRodney W. Grimes return (0); 833df8bae1dSRodney W. Grimes } 834df8bae1dSRodney W. Grimes 835df8bae1dSRodney W. Grimes /* 836df8bae1dSRodney W. Grimes * bpfread - read next chunk of packets from buffers 837df8bae1dSRodney W. Grimes */ 83887f6c662SJulian Elischer static int 83919ba8395SChristian S.J. Peron bpfread(struct cdev *dev, struct uio *uio, int ioflag) 840df8bae1dSRodney W. Grimes { 841136600feSEd Schouten struct bpf_d *d; 842df8bae1dSRodney W. Grimes int error; 8438df67d77SJung-uk Kim int non_block; 8448df67d77SJung-uk Kim int timed_out; 845df8bae1dSRodney W. Grimes 846136600feSEd Schouten error = devfs_get_cdevpriv((void **)&d); 847136600feSEd Schouten if (error != 0) 848136600feSEd Schouten return (error); 849136600feSEd Schouten 850df8bae1dSRodney W. Grimes /* 851df8bae1dSRodney W. Grimes * Restrict application to use a buffer the same size as 852df8bae1dSRodney W. Grimes * as kernel buffers. 853df8bae1dSRodney W. Grimes */ 854df8bae1dSRodney W. Grimes if (uio->uio_resid != d->bd_bufsize) 855df8bae1dSRodney W. Grimes return (EINVAL); 856df8bae1dSRodney W. Grimes 8578df67d77SJung-uk Kim non_block = ((ioflag & O_NONBLOCK) != 0); 8588df67d77SJung-uk Kim 859e4b3229aSAlexander V. Chernikov BPFD_WLOCK(d); 860e4b3229aSAlexander V. Chernikov BPF_PID_REFRESH_CUR(d); 8614d621040SChristian S.J. Peron if (d->bd_bufmode != BPF_BUFMODE_BUFFER) { 862e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 8634d621040SChristian S.J. Peron return (EOPNOTSUPP); 8644d621040SChristian S.J. Peron } 86581bda851SJohn Polstra if (d->bd_state == BPF_WAITING) 86681bda851SJohn Polstra callout_stop(&d->bd_callout); 86781bda851SJohn Polstra timed_out = (d->bd_state == BPF_TIMED_OUT); 86881bda851SJohn Polstra d->bd_state = BPF_IDLE; 869df8bae1dSRodney W. Grimes /* 870df8bae1dSRodney W. Grimes * If the hold buffer is empty, then do a timed sleep, which 871df8bae1dSRodney W. Grimes * ends when the timeout expires or when enough packets 872df8bae1dSRodney W. Grimes * have arrived to fill the store buffer. 873df8bae1dSRodney W. Grimes */ 874572bde2aSRobert Watson while (d->bd_hbuf == NULL) { 8758df67d77SJung-uk Kim if (d->bd_slen != 0) { 876df8bae1dSRodney W. Grimes /* 877df8bae1dSRodney W. Grimes * A packet(s) either arrived since the previous 878df8bae1dSRodney W. Grimes * read or arrived while we were asleep. 8798df67d77SJung-uk Kim */ 8808df67d77SJung-uk Kim if (d->bd_immediate || non_block || timed_out) { 8818df67d77SJung-uk Kim /* 8828df67d77SJung-uk Kim * Rotate the buffers and return what's here 8838df67d77SJung-uk Kim * if we are in immediate mode, non-blocking 8848df67d77SJung-uk Kim * flag is set, or this descriptor timed out. 885df8bae1dSRodney W. Grimes */ 886df8bae1dSRodney W. Grimes ROTATE_BUFFERS(d); 887df8bae1dSRodney W. Grimes break; 888df8bae1dSRodney W. Grimes } 8898df67d77SJung-uk Kim } 890de5d9935SRobert Watson 891de5d9935SRobert Watson /* 892de5d9935SRobert Watson * No data is available, check to see if the bpf device 893de5d9935SRobert Watson * is still pointed at a real interface. If not, return 894de5d9935SRobert Watson * ENXIO so that the userland process knows to rebind 895de5d9935SRobert Watson * it before using it again. 896de5d9935SRobert Watson */ 897de5d9935SRobert Watson if (d->bd_bif == NULL) { 898e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 899de5d9935SRobert Watson return (ENXIO); 900de5d9935SRobert Watson } 901de5d9935SRobert Watson 9028df67d77SJung-uk Kim if (non_block) { 903e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 904fba3cfdeSJohn Polstra return (EWOULDBLOCK); 905fba3cfdeSJohn Polstra } 906e4b3229aSAlexander V. Chernikov error = rw_sleep(d, &d->bd_lock, PRINET|PCATCH, 907e7bb21b3SJonathan Lemon "bpf", d->bd_rtout); 908df8bae1dSRodney W. Grimes if (error == EINTR || error == ERESTART) { 909e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 910df8bae1dSRodney W. Grimes return (error); 911df8bae1dSRodney W. Grimes } 912df8bae1dSRodney W. Grimes if (error == EWOULDBLOCK) { 913df8bae1dSRodney W. Grimes /* 914df8bae1dSRodney W. Grimes * On a timeout, return what's in the buffer, 915df8bae1dSRodney W. Grimes * which may be nothing. If there is something 916df8bae1dSRodney W. Grimes * in the store buffer, we can rotate the buffers. 917df8bae1dSRodney W. Grimes */ 918df8bae1dSRodney W. Grimes if (d->bd_hbuf) 919df8bae1dSRodney W. Grimes /* 920df8bae1dSRodney W. Grimes * We filled up the buffer in between 921df8bae1dSRodney W. Grimes * getting the timeout and arriving 922df8bae1dSRodney W. Grimes * here, so we don't need to rotate. 923df8bae1dSRodney W. Grimes */ 924df8bae1dSRodney W. Grimes break; 925df8bae1dSRodney W. Grimes 926df8bae1dSRodney W. Grimes if (d->bd_slen == 0) { 927e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 928df8bae1dSRodney W. Grimes return (0); 929df8bae1dSRodney W. Grimes } 930df8bae1dSRodney W. Grimes ROTATE_BUFFERS(d); 931df8bae1dSRodney W. Grimes break; 932df8bae1dSRodney W. Grimes } 933df8bae1dSRodney W. Grimes } 934df8bae1dSRodney W. Grimes /* 935df8bae1dSRodney W. Grimes * At this point, we know we have something in the hold slot. 936df8bae1dSRodney W. Grimes */ 937e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 938df8bae1dSRodney W. Grimes 939df8bae1dSRodney W. Grimes /* 940df8bae1dSRodney W. Grimes * Move data from hold buffer into user space. 941df8bae1dSRodney W. Grimes * We know the entire buffer is transferred since 942df8bae1dSRodney W. Grimes * we checked above that the read buffer is bpf_bufsize bytes. 94331b32e6dSRobert Watson * 94431b32e6dSRobert Watson * XXXRW: More synchronization needed here: what if a second thread 94531b32e6dSRobert Watson * issues a read on the same fd at the same time? Don't want this 94631b32e6dSRobert Watson * getting invalidated. 947df8bae1dSRodney W. Grimes */ 9484d621040SChristian S.J. Peron error = bpf_uiomove(d, d->bd_hbuf, d->bd_hlen, uio); 949df8bae1dSRodney W. Grimes 950e4b3229aSAlexander V. Chernikov BPFD_WLOCK(d); 951df8bae1dSRodney W. Grimes d->bd_fbuf = d->bd_hbuf; 952572bde2aSRobert Watson d->bd_hbuf = NULL; 953df8bae1dSRodney W. Grimes d->bd_hlen = 0; 95429f612ecSChristian S.J. Peron bpf_buf_reclaimed(d); 955e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 956df8bae1dSRodney W. Grimes 957df8bae1dSRodney W. Grimes return (error); 958df8bae1dSRodney W. Grimes } 959df8bae1dSRodney W. Grimes 960df8bae1dSRodney W. Grimes /* 961df8bae1dSRodney W. Grimes * If there are processes sleeping on this descriptor, wake them up. 962df8bae1dSRodney W. Grimes */ 963e7bb21b3SJonathan Lemon static __inline void 96419ba8395SChristian S.J. Peron bpf_wakeup(struct bpf_d *d) 965df8bae1dSRodney W. Grimes { 966a3272e3cSChristian S.J. Peron 967e4b3229aSAlexander V. Chernikov BPFD_WLOCK_ASSERT(d); 96881bda851SJohn Polstra if (d->bd_state == BPF_WAITING) { 96981bda851SJohn Polstra callout_stop(&d->bd_callout); 97081bda851SJohn Polstra d->bd_state = BPF_IDLE; 97181bda851SJohn Polstra } 972521f364bSDag-Erling Smørgrav wakeup(d); 973831d27a9SDon Lewis if (d->bd_async && d->bd_sig && d->bd_sigio) 974f1320723SAlfred Perlstein pgsigio(&d->bd_sigio, d->bd_sig, 0); 97500a83887SPaul Traina 976512824f8SSeigo Tanimura selwakeuppri(&d->bd_sel, PRINET); 977ad3b9257SJohn-Mark Gurney KNOTE_LOCKED(&d->bd_sel.si_note, 0); 978df8bae1dSRodney W. Grimes } 979df8bae1dSRodney W. Grimes 98081bda851SJohn Polstra static void 98119ba8395SChristian S.J. Peron bpf_timed_out(void *arg) 98281bda851SJohn Polstra { 98381bda851SJohn Polstra struct bpf_d *d = (struct bpf_d *)arg; 98481bda851SJohn Polstra 985e4b3229aSAlexander V. Chernikov BPFD_WLOCK_ASSERT(d); 9869fee1bd1SJung-uk Kim 9879fee1bd1SJung-uk Kim if (callout_pending(&d->bd_callout) || !callout_active(&d->bd_callout)) 9889fee1bd1SJung-uk Kim return; 98981bda851SJohn Polstra if (d->bd_state == BPF_WAITING) { 99081bda851SJohn Polstra d->bd_state = BPF_TIMED_OUT; 99181bda851SJohn Polstra if (d->bd_slen != 0) 99281bda851SJohn Polstra bpf_wakeup(d); 99381bda851SJohn Polstra } 99481bda851SJohn Polstra } 99581bda851SJohn Polstra 99687f6c662SJulian Elischer static int 9974d621040SChristian S.J. Peron bpf_ready(struct bpf_d *d) 9984d621040SChristian S.J. Peron { 9994d621040SChristian S.J. Peron 1000e4b3229aSAlexander V. Chernikov BPFD_WLOCK_ASSERT(d); 10014d621040SChristian S.J. Peron 10024d621040SChristian S.J. Peron if (!bpf_canfreebuf(d) && d->bd_hlen != 0) 10034d621040SChristian S.J. Peron return (1); 10044d621040SChristian S.J. Peron if ((d->bd_immediate || d->bd_state == BPF_TIMED_OUT) && 10054d621040SChristian S.J. Peron d->bd_slen != 0) 10064d621040SChristian S.J. Peron return (1); 10074d621040SChristian S.J. Peron return (0); 10084d621040SChristian S.J. Peron } 10094d621040SChristian S.J. Peron 10104d621040SChristian S.J. Peron static int 101119ba8395SChristian S.J. Peron bpfwrite(struct cdev *dev, struct uio *uio, int ioflag) 1012df8bae1dSRodney W. Grimes { 1013136600feSEd Schouten struct bpf_d *d; 1014df8bae1dSRodney W. Grimes struct ifnet *ifp; 1015560a54e1SJung-uk Kim struct mbuf *m, *mc; 10168240bf1eSRobert Watson struct sockaddr dst; 1017560a54e1SJung-uk Kim int error, hlen; 1018df8bae1dSRodney W. Grimes 1019136600feSEd Schouten error = devfs_get_cdevpriv((void **)&d); 1020136600feSEd Schouten if (error != 0) 1021136600feSEd Schouten return (error); 1022136600feSEd Schouten 1023e4b3229aSAlexander V. Chernikov BPF_PID_REFRESH_CUR(d); 10244d621040SChristian S.J. Peron d->bd_wcount++; 1025*6c74ff0eSAlexander V. Chernikov /* XXX: locking required */ 10264d621040SChristian S.J. Peron if (d->bd_bif == NULL) { 10274d621040SChristian S.J. Peron d->bd_wdcount++; 1028df8bae1dSRodney W. Grimes return (ENXIO); 10294d621040SChristian S.J. Peron } 1030df8bae1dSRodney W. Grimes 1031df8bae1dSRodney W. Grimes ifp = d->bd_bif->bif_ifp; 1032df8bae1dSRodney W. Grimes 10334d621040SChristian S.J. Peron if ((ifp->if_flags & IFF_UP) == 0) { 10344d621040SChristian S.J. Peron d->bd_wdcount++; 10353518d220SSam Leffler return (ENETDOWN); 10364d621040SChristian S.J. Peron } 10373518d220SSam Leffler 10384d621040SChristian S.J. Peron if (uio->uio_resid == 0) { 10394d621040SChristian S.J. Peron d->bd_wdcount++; 1040df8bae1dSRodney W. Grimes return (0); 10414d621040SChristian S.J. Peron } 1042df8bae1dSRodney W. Grimes 10438240bf1eSRobert Watson bzero(&dst, sizeof(dst)); 1044d83e603aSChristian S.J. Peron m = NULL; 1045d83e603aSChristian S.J. Peron hlen = 0; 1046*6c74ff0eSAlexander V. Chernikov /* XXX: bpf_movein() can sleep */ 1047cb44b6dfSAndrew Thompson error = bpf_movein(uio, (int)d->bd_bif->bif_dlt, ifp, 1048560a54e1SJung-uk Kim &m, &dst, &hlen, d->bd_wfilter); 10494d621040SChristian S.J. Peron if (error) { 10504d621040SChristian S.J. Peron d->bd_wdcount++; 1051df8bae1dSRodney W. Grimes return (error); 10524d621040SChristian S.J. Peron } 10534d621040SChristian S.J. Peron d->bd_wfcount++; 1054114ae644SMike Smith if (d->bd_hdrcmplt) 1055114ae644SMike Smith dst.sa_family = pseudo_AF_HDRCMPLT; 1056114ae644SMike Smith 1057560a54e1SJung-uk Kim if (d->bd_feedback) { 1058560a54e1SJung-uk Kim mc = m_dup(m, M_DONTWAIT); 1059560a54e1SJung-uk Kim if (mc != NULL) 1060560a54e1SJung-uk Kim mc->m_pkthdr.rcvif = ifp; 10618cd892f7SJung-uk Kim /* Set M_PROMISC for outgoing packets to be discarded. */ 10628cd892f7SJung-uk Kim if (d->bd_direction == BPF_D_INOUT) 10638cd892f7SJung-uk Kim m->m_flags |= M_PROMISC; 1064560a54e1SJung-uk Kim } else 1065560a54e1SJung-uk Kim mc = NULL; 1066560a54e1SJung-uk Kim 1067560a54e1SJung-uk Kim m->m_pkthdr.len -= hlen; 1068560a54e1SJung-uk Kim m->m_len -= hlen; 1069560a54e1SJung-uk Kim m->m_data += hlen; /* XXX */ 1070560a54e1SJung-uk Kim 107121ca7b57SMarko Zec CURVNET_SET(ifp->if_vnet); 107282f4445dSRobert Watson #ifdef MAC 1073e4b3229aSAlexander V. Chernikov BPFD_WLOCK(d); 107430d239bcSRobert Watson mac_bpfdesc_create_mbuf(d, m); 1075560a54e1SJung-uk Kim if (mc != NULL) 107630d239bcSRobert Watson mac_bpfdesc_create_mbuf(d, mc); 1077e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 107882f4445dSRobert Watson #endif 1079560a54e1SJung-uk Kim 1080572bde2aSRobert Watson error = (*ifp->if_output)(ifp, m, &dst, NULL); 10814d621040SChristian S.J. Peron if (error) 10824d621040SChristian S.J. Peron d->bd_wdcount++; 1083560a54e1SJung-uk Kim 1084560a54e1SJung-uk Kim if (mc != NULL) { 10850bf686c1SRobert Watson if (error == 0) 1086560a54e1SJung-uk Kim (*ifp->if_input)(ifp, mc); 10870bf686c1SRobert Watson else 1088560a54e1SJung-uk Kim m_freem(mc); 1089560a54e1SJung-uk Kim } 109021ca7b57SMarko Zec CURVNET_RESTORE(); 1091560a54e1SJung-uk Kim 1092df8bae1dSRodney W. Grimes return (error); 1093df8bae1dSRodney W. Grimes } 1094df8bae1dSRodney W. Grimes 1095df8bae1dSRodney W. Grimes /* 1096e82669d9SRobert Watson * Reset a descriptor by flushing its packet buffer and clearing the receive 1097e82669d9SRobert Watson * and drop counts. This is doable for kernel-only buffers, but with 1098e82669d9SRobert Watson * zero-copy buffers, we can't write to (or rotate) buffers that are 1099e82669d9SRobert Watson * currently owned by userspace. It would be nice if we could encapsulate 1100e82669d9SRobert Watson * this logic in the buffer code rather than here. 1101df8bae1dSRodney W. Grimes */ 1102df8bae1dSRodney W. Grimes static void 110319ba8395SChristian S.J. Peron reset_d(struct bpf_d *d) 1104df8bae1dSRodney W. Grimes { 1105e7bb21b3SJonathan Lemon 1106e4b3229aSAlexander V. Chernikov BPFD_WLOCK_ASSERT(d); 1107e82669d9SRobert Watson 1108e82669d9SRobert Watson if ((d->bd_hbuf != NULL) && 1109e82669d9SRobert Watson (d->bd_bufmode != BPF_BUFMODE_ZBUF || bpf_canfreebuf(d))) { 1110df8bae1dSRodney W. Grimes /* Free the hold buffer. */ 1111df8bae1dSRodney W. Grimes d->bd_fbuf = d->bd_hbuf; 1112572bde2aSRobert Watson d->bd_hbuf = NULL; 1113e82669d9SRobert Watson d->bd_hlen = 0; 111429f612ecSChristian S.J. Peron bpf_buf_reclaimed(d); 1115df8bae1dSRodney W. Grimes } 1116e82669d9SRobert Watson if (bpf_canwritebuf(d)) 1117df8bae1dSRodney W. Grimes d->bd_slen = 0; 1118df8bae1dSRodney W. Grimes d->bd_rcount = 0; 1119df8bae1dSRodney W. Grimes d->bd_dcount = 0; 112069f7644bSChristian S.J. Peron d->bd_fcount = 0; 11214d621040SChristian S.J. Peron d->bd_wcount = 0; 11224d621040SChristian S.J. Peron d->bd_wfcount = 0; 11234d621040SChristian S.J. Peron d->bd_wdcount = 0; 11244d621040SChristian S.J. Peron d->bd_zcopy = 0; 1125df8bae1dSRodney W. Grimes } 1126df8bae1dSRodney W. Grimes 1127df8bae1dSRodney W. Grimes /* 1128df8bae1dSRodney W. Grimes * FIONREAD Check for read packet available. 1129df8bae1dSRodney W. Grimes * SIOCGIFADDR Get interface address - convenient hook to driver. 1130df8bae1dSRodney W. Grimes * BIOCGBLEN Get buffer len [for read()]. 1131f11c3508SDavid Malone * BIOCSETF Set read filter. 1132f11c3508SDavid Malone * BIOCSETFNR Set read filter without resetting descriptor. 1133f11c3508SDavid Malone * BIOCSETWF Set write filter. 1134df8bae1dSRodney W. Grimes * BIOCFLUSH Flush read packet buffer. 1135df8bae1dSRodney W. Grimes * BIOCPROMISC Put interface into promiscuous mode. 1136df8bae1dSRodney W. Grimes * BIOCGDLT Get link layer type. 1137df8bae1dSRodney W. Grimes * BIOCGETIF Get interface name. 1138df8bae1dSRodney W. Grimes * BIOCSETIF Set interface. 1139df8bae1dSRodney W. Grimes * BIOCSRTIMEOUT Set read timeout. 1140df8bae1dSRodney W. Grimes * BIOCGRTIMEOUT Get read timeout. 1141df8bae1dSRodney W. Grimes * BIOCGSTATS Get packet stats. 1142df8bae1dSRodney W. Grimes * BIOCIMMEDIATE Set immediate mode. 1143df8bae1dSRodney W. Grimes * BIOCVERSION Get filter language version. 1144114ae644SMike Smith * BIOCGHDRCMPLT Get "header already complete" flag 1145114ae644SMike Smith * BIOCSHDRCMPLT Set "header already complete" flag 1146560a54e1SJung-uk Kim * BIOCGDIRECTION Get packet direction flag 1147560a54e1SJung-uk Kim * BIOCSDIRECTION Set packet direction flag 1148547d94bdSJung-uk Kim * BIOCGTSTAMP Get time stamp format and resolution. 1149547d94bdSJung-uk Kim * BIOCSTSTAMP Set time stamp format and resolution. 115093e39f0bSChristian S.J. Peron * BIOCLOCK Set "locked" flag 1151560a54e1SJung-uk Kim * BIOCFEEDBACK Set packet feedback mode. 11524d621040SChristian S.J. Peron * BIOCSETZBUF Set current zero-copy buffer locations. 11534d621040SChristian S.J. Peron * BIOCGETZMAX Get maximum zero-copy buffer size. 11544d621040SChristian S.J. Peron * BIOCROTZBUF Force rotation of zero-copy buffer 11554d621040SChristian S.J. Peron * BIOCSETBUFMODE Set buffer mode. 11564d621040SChristian S.J. Peron * BIOCGETBUFMODE Get current buffer mode. 1157df8bae1dSRodney W. Grimes */ 1158df8bae1dSRodney W. Grimes /* ARGSUSED */ 115987f6c662SJulian Elischer static int 116019ba8395SChristian S.J. Peron bpfioctl(struct cdev *dev, u_long cmd, caddr_t addr, int flags, 116119ba8395SChristian S.J. Peron struct thread *td) 1162df8bae1dSRodney W. Grimes { 1163136600feSEd Schouten struct bpf_d *d; 1164136600feSEd Schouten int error; 1165136600feSEd Schouten 1166136600feSEd Schouten error = devfs_get_cdevpriv((void **)&d); 1167136600feSEd Schouten if (error != 0) 1168136600feSEd Schouten return (error); 1169df8bae1dSRodney W. Grimes 1170b75a24a0SChristian S.J. Peron /* 1171b75a24a0SChristian S.J. Peron * Refresh PID associated with this descriptor. 1172b75a24a0SChristian S.J. Peron */ 1173e4b3229aSAlexander V. Chernikov BPFD_WLOCK(d); 1174e4b3229aSAlexander V. Chernikov BPF_PID_REFRESH(d, td); 117581bda851SJohn Polstra if (d->bd_state == BPF_WAITING) 117681bda851SJohn Polstra callout_stop(&d->bd_callout); 117781bda851SJohn Polstra d->bd_state = BPF_IDLE; 1178e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 117981bda851SJohn Polstra 118093e39f0bSChristian S.J. Peron if (d->bd_locked == 1) { 118193e39f0bSChristian S.J. Peron switch (cmd) { 118293e39f0bSChristian S.J. Peron case BIOCGBLEN: 118393e39f0bSChristian S.J. Peron case BIOCFLUSH: 118493e39f0bSChristian S.J. Peron case BIOCGDLT: 118593e39f0bSChristian S.J. Peron case BIOCGDLTLIST: 1186fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 1187fc0a61a4SKonstantin Belousov case BIOCGDLTLIST32: 1188fc0a61a4SKonstantin Belousov #endif 118993e39f0bSChristian S.J. Peron case BIOCGETIF: 119093e39f0bSChristian S.J. Peron case BIOCGRTIMEOUT: 11919624d947SJuli Mallett #if defined(COMPAT_FREEBSD32) && !defined(__mips__) 1192fc0a61a4SKonstantin Belousov case BIOCGRTIMEOUT32: 1193fc0a61a4SKonstantin Belousov #endif 119493e39f0bSChristian S.J. Peron case BIOCGSTATS: 119593e39f0bSChristian S.J. Peron case BIOCVERSION: 119693e39f0bSChristian S.J. Peron case BIOCGRSIG: 119793e39f0bSChristian S.J. Peron case BIOCGHDRCMPLT: 1198547d94bdSJung-uk Kim case BIOCSTSTAMP: 1199560a54e1SJung-uk Kim case BIOCFEEDBACK: 120093e39f0bSChristian S.J. Peron case FIONREAD: 120193e39f0bSChristian S.J. Peron case BIOCLOCK: 120293e39f0bSChristian S.J. Peron case BIOCSRTIMEOUT: 12039624d947SJuli Mallett #if defined(COMPAT_FREEBSD32) && !defined(__mips__) 1204fc0a61a4SKonstantin Belousov case BIOCSRTIMEOUT32: 1205fc0a61a4SKonstantin Belousov #endif 120693e39f0bSChristian S.J. Peron case BIOCIMMEDIATE: 120793e39f0bSChristian S.J. Peron case TIOCGPGRP: 12084d621040SChristian S.J. Peron case BIOCROTZBUF: 120993e39f0bSChristian S.J. Peron break; 121093e39f0bSChristian S.J. Peron default: 121193e39f0bSChristian S.J. Peron return (EPERM); 121293e39f0bSChristian S.J. Peron } 121393e39f0bSChristian S.J. Peron } 1214fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 1215fc0a61a4SKonstantin Belousov /* 1216fc0a61a4SKonstantin Belousov * If we see a 32-bit compat ioctl, mark the stream as 32-bit so 1217fc0a61a4SKonstantin Belousov * that it will get 32-bit packet headers. 1218fc0a61a4SKonstantin Belousov */ 1219fc0a61a4SKonstantin Belousov switch (cmd) { 1220fc0a61a4SKonstantin Belousov case BIOCSETF32: 1221fc0a61a4SKonstantin Belousov case BIOCSETFNR32: 1222fc0a61a4SKonstantin Belousov case BIOCSETWF32: 1223fc0a61a4SKonstantin Belousov case BIOCGDLTLIST32: 1224fc0a61a4SKonstantin Belousov case BIOCGRTIMEOUT32: 1225fc0a61a4SKonstantin Belousov case BIOCSRTIMEOUT32: 1226fc0a61a4SKonstantin Belousov d->bd_compat32 = 1; 1227fc0a61a4SKonstantin Belousov } 1228fc0a61a4SKonstantin Belousov #endif 1229fc0a61a4SKonstantin Belousov 123097021c24SMarko Zec CURVNET_SET(TD_TO_VNET(td)); 1231df8bae1dSRodney W. Grimes switch (cmd) { 1232df8bae1dSRodney W. Grimes 1233df8bae1dSRodney W. Grimes default: 1234df8bae1dSRodney W. Grimes error = EINVAL; 1235df8bae1dSRodney W. Grimes break; 1236df8bae1dSRodney W. Grimes 1237df8bae1dSRodney W. Grimes /* 1238df8bae1dSRodney W. Grimes * Check for read packet available. 1239df8bae1dSRodney W. Grimes */ 1240df8bae1dSRodney W. Grimes case FIONREAD: 1241df8bae1dSRodney W. Grimes { 1242df8bae1dSRodney W. Grimes int n; 1243df8bae1dSRodney W. Grimes 1244e4b3229aSAlexander V. Chernikov BPFD_WLOCK(d); 1245df8bae1dSRodney W. Grimes n = d->bd_slen; 1246df8bae1dSRodney W. Grimes if (d->bd_hbuf) 1247df8bae1dSRodney W. Grimes n += d->bd_hlen; 1248e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 1249df8bae1dSRodney W. Grimes 1250df8bae1dSRodney W. Grimes *(int *)addr = n; 1251df8bae1dSRodney W. Grimes break; 1252df8bae1dSRodney W. Grimes } 1253df8bae1dSRodney W. Grimes 1254df8bae1dSRodney W. Grimes case SIOCGIFADDR: 1255df8bae1dSRodney W. Grimes { 1256df8bae1dSRodney W. Grimes struct ifnet *ifp; 1257df8bae1dSRodney W. Grimes 1258572bde2aSRobert Watson if (d->bd_bif == NULL) 1259df8bae1dSRodney W. Grimes error = EINVAL; 1260df8bae1dSRodney W. Grimes else { 1261df8bae1dSRodney W. Grimes ifp = d->bd_bif->bif_ifp; 1262df8bae1dSRodney W. Grimes error = (*ifp->if_ioctl)(ifp, cmd, addr); 1263df8bae1dSRodney W. Grimes } 1264df8bae1dSRodney W. Grimes break; 1265df8bae1dSRodney W. Grimes } 1266df8bae1dSRodney W. Grimes 1267df8bae1dSRodney W. Grimes /* 1268df8bae1dSRodney W. Grimes * Get buffer len [for read()]. 1269df8bae1dSRodney W. Grimes */ 1270df8bae1dSRodney W. Grimes case BIOCGBLEN: 1271df8bae1dSRodney W. Grimes *(u_int *)addr = d->bd_bufsize; 1272df8bae1dSRodney W. Grimes break; 1273df8bae1dSRodney W. Grimes 1274df8bae1dSRodney W. Grimes /* 1275df8bae1dSRodney W. Grimes * Set buffer length. 1276df8bae1dSRodney W. Grimes */ 1277df8bae1dSRodney W. Grimes case BIOCSBLEN: 12784d621040SChristian S.J. Peron error = bpf_ioctl_sblen(d, (u_int *)addr); 1279df8bae1dSRodney W. Grimes break; 1280df8bae1dSRodney W. Grimes 1281df8bae1dSRodney W. Grimes /* 1282df8bae1dSRodney W. Grimes * Set link layer read filter. 1283df8bae1dSRodney W. Grimes */ 1284df8bae1dSRodney W. Grimes case BIOCSETF: 1285f11c3508SDavid Malone case BIOCSETFNR: 128693e39f0bSChristian S.J. Peron case BIOCSETWF: 1287fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 1288fc0a61a4SKonstantin Belousov case BIOCSETF32: 1289fc0a61a4SKonstantin Belousov case BIOCSETFNR32: 1290fc0a61a4SKonstantin Belousov case BIOCSETWF32: 1291fc0a61a4SKonstantin Belousov #endif 129293e39f0bSChristian S.J. Peron error = bpf_setf(d, (struct bpf_program *)addr, cmd); 1293df8bae1dSRodney W. Grimes break; 1294df8bae1dSRodney W. Grimes 1295df8bae1dSRodney W. Grimes /* 1296df8bae1dSRodney W. Grimes * Flush read packet buffer. 1297df8bae1dSRodney W. Grimes */ 1298df8bae1dSRodney W. Grimes case BIOCFLUSH: 1299e4b3229aSAlexander V. Chernikov BPFD_WLOCK(d); 1300df8bae1dSRodney W. Grimes reset_d(d); 1301e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 1302df8bae1dSRodney W. Grimes break; 1303df8bae1dSRodney W. Grimes 1304df8bae1dSRodney W. Grimes /* 1305df8bae1dSRodney W. Grimes * Put interface into promiscuous mode. 1306df8bae1dSRodney W. Grimes */ 1307df8bae1dSRodney W. Grimes case BIOCPROMISC: 1308572bde2aSRobert Watson if (d->bd_bif == NULL) { 1309df8bae1dSRodney W. Grimes /* 1310df8bae1dSRodney W. Grimes * No interface attached yet. 1311df8bae1dSRodney W. Grimes */ 1312df8bae1dSRodney W. Grimes error = EINVAL; 1313df8bae1dSRodney W. Grimes break; 1314df8bae1dSRodney W. Grimes } 1315df8bae1dSRodney W. Grimes if (d->bd_promisc == 0) { 1316df8bae1dSRodney W. Grimes error = ifpromisc(d->bd_bif->bif_ifp, 1); 1317df8bae1dSRodney W. Grimes if (error == 0) 1318df8bae1dSRodney W. Grimes d->bd_promisc = 1; 1319df8bae1dSRodney W. Grimes } 1320df8bae1dSRodney W. Grimes break; 1321df8bae1dSRodney W. Grimes 1322df8bae1dSRodney W. Grimes /* 13238eab61f3SSam Leffler * Get current data link type. 1324df8bae1dSRodney W. Grimes */ 1325df8bae1dSRodney W. Grimes case BIOCGDLT: 1326572bde2aSRobert Watson if (d->bd_bif == NULL) 1327df8bae1dSRodney W. Grimes error = EINVAL; 1328df8bae1dSRodney W. Grimes else 1329df8bae1dSRodney W. Grimes *(u_int *)addr = d->bd_bif->bif_dlt; 1330df8bae1dSRodney W. Grimes break; 1331df8bae1dSRodney W. Grimes 1332df8bae1dSRodney W. Grimes /* 13338eab61f3SSam Leffler * Get a list of supported data link types. 13348eab61f3SSam Leffler */ 1335fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 1336fc0a61a4SKonstantin Belousov case BIOCGDLTLIST32: 1337fc0a61a4SKonstantin Belousov { 1338fc0a61a4SKonstantin Belousov struct bpf_dltlist32 *list32; 1339fc0a61a4SKonstantin Belousov struct bpf_dltlist dltlist; 1340fc0a61a4SKonstantin Belousov 1341fc0a61a4SKonstantin Belousov list32 = (struct bpf_dltlist32 *)addr; 1342fc0a61a4SKonstantin Belousov dltlist.bfl_len = list32->bfl_len; 1343fc0a61a4SKonstantin Belousov dltlist.bfl_list = PTRIN(list32->bfl_list); 1344fc0a61a4SKonstantin Belousov if (d->bd_bif == NULL) 1345fc0a61a4SKonstantin Belousov error = EINVAL; 1346fc0a61a4SKonstantin Belousov else { 1347fc0a61a4SKonstantin Belousov error = bpf_getdltlist(d, &dltlist); 1348fc0a61a4SKonstantin Belousov if (error == 0) 1349fc0a61a4SKonstantin Belousov list32->bfl_len = dltlist.bfl_len; 1350fc0a61a4SKonstantin Belousov } 1351fc0a61a4SKonstantin Belousov break; 1352fc0a61a4SKonstantin Belousov } 1353fc0a61a4SKonstantin Belousov #endif 1354fc0a61a4SKonstantin Belousov 13558eab61f3SSam Leffler case BIOCGDLTLIST: 1356572bde2aSRobert Watson if (d->bd_bif == NULL) 13578eab61f3SSam Leffler error = EINVAL; 13588eab61f3SSam Leffler else 13598eab61f3SSam Leffler error = bpf_getdltlist(d, (struct bpf_dltlist *)addr); 13608eab61f3SSam Leffler break; 13618eab61f3SSam Leffler 13628eab61f3SSam Leffler /* 13638eab61f3SSam Leffler * Set data link type. 13648eab61f3SSam Leffler */ 13658eab61f3SSam Leffler case BIOCSDLT: 1366*6c74ff0eSAlexander V. Chernikov BPF_LOCK(); 1367572bde2aSRobert Watson if (d->bd_bif == NULL) 13688eab61f3SSam Leffler error = EINVAL; 13698eab61f3SSam Leffler else 13708eab61f3SSam Leffler error = bpf_setdlt(d, *(u_int *)addr); 1371*6c74ff0eSAlexander V. Chernikov BPF_UNLOCK(); 13728eab61f3SSam Leffler break; 13738eab61f3SSam Leffler 13748eab61f3SSam Leffler /* 13751dd0feaaSArchie Cobbs * Get interface name. 1376df8bae1dSRodney W. Grimes */ 1377df8bae1dSRodney W. Grimes case BIOCGETIF: 1378572bde2aSRobert Watson if (d->bd_bif == NULL) 1379df8bae1dSRodney W. Grimes error = EINVAL; 13801dd0feaaSArchie Cobbs else { 13811dd0feaaSArchie Cobbs struct ifnet *const ifp = d->bd_bif->bif_ifp; 13821dd0feaaSArchie Cobbs struct ifreq *const ifr = (struct ifreq *)addr; 13831dd0feaaSArchie Cobbs 13849bf40edeSBrooks Davis strlcpy(ifr->ifr_name, ifp->if_xname, 13859bf40edeSBrooks Davis sizeof(ifr->ifr_name)); 13861dd0feaaSArchie Cobbs } 1387df8bae1dSRodney W. Grimes break; 1388df8bae1dSRodney W. Grimes 1389df8bae1dSRodney W. Grimes /* 1390df8bae1dSRodney W. Grimes * Set interface. 1391df8bae1dSRodney W. Grimes */ 1392df8bae1dSRodney W. Grimes case BIOCSETIF: 1393*6c74ff0eSAlexander V. Chernikov BPF_LOCK(); 1394df8bae1dSRodney W. Grimes error = bpf_setif(d, (struct ifreq *)addr); 1395*6c74ff0eSAlexander V. Chernikov BPF_UNLOCK(); 1396df8bae1dSRodney W. Grimes break; 1397df8bae1dSRodney W. Grimes 1398df8bae1dSRodney W. Grimes /* 1399df8bae1dSRodney W. Grimes * Set read timeout. 1400df8bae1dSRodney W. Grimes */ 1401df8bae1dSRodney W. Grimes case BIOCSRTIMEOUT: 14029624d947SJuli Mallett #if defined(COMPAT_FREEBSD32) && !defined(__mips__) 1403fc0a61a4SKonstantin Belousov case BIOCSRTIMEOUT32: 1404fc0a61a4SKonstantin Belousov #endif 1405df8bae1dSRodney W. Grimes { 1406df8bae1dSRodney W. Grimes struct timeval *tv = (struct timeval *)addr; 14079624d947SJuli Mallett #if defined(COMPAT_FREEBSD32) && !defined(__mips__) 1408fc0a61a4SKonstantin Belousov struct timeval32 *tv32; 1409fc0a61a4SKonstantin Belousov struct timeval tv64; 1410fc0a61a4SKonstantin Belousov 1411fc0a61a4SKonstantin Belousov if (cmd == BIOCSRTIMEOUT32) { 1412fc0a61a4SKonstantin Belousov tv32 = (struct timeval32 *)addr; 1413fc0a61a4SKonstantin Belousov tv = &tv64; 1414fc0a61a4SKonstantin Belousov tv->tv_sec = tv32->tv_sec; 1415fc0a61a4SKonstantin Belousov tv->tv_usec = tv32->tv_usec; 1416fc0a61a4SKonstantin Belousov } else 1417fc0a61a4SKonstantin Belousov #endif 1418fc0a61a4SKonstantin Belousov tv = (struct timeval *)addr; 1419df8bae1dSRodney W. Grimes 1420bdc2cdc5SAlexander Langer /* 1421bdc2cdc5SAlexander Langer * Subtract 1 tick from tvtohz() since this isn't 1422bdc2cdc5SAlexander Langer * a one-shot timer. 1423bdc2cdc5SAlexander Langer */ 1424bdc2cdc5SAlexander Langer if ((error = itimerfix(tv)) == 0) 1425bdc2cdc5SAlexander Langer d->bd_rtout = tvtohz(tv) - 1; 1426df8bae1dSRodney W. Grimes break; 1427df8bae1dSRodney W. Grimes } 1428df8bae1dSRodney W. Grimes 1429df8bae1dSRodney W. Grimes /* 1430df8bae1dSRodney W. Grimes * Get read timeout. 1431df8bae1dSRodney W. Grimes */ 1432df8bae1dSRodney W. Grimes case BIOCGRTIMEOUT: 14339624d947SJuli Mallett #if defined(COMPAT_FREEBSD32) && !defined(__mips__) 1434fc0a61a4SKonstantin Belousov case BIOCGRTIMEOUT32: 1435fc0a61a4SKonstantin Belousov #endif 1436df8bae1dSRodney W. Grimes { 1437fc0a61a4SKonstantin Belousov struct timeval *tv; 14389624d947SJuli Mallett #if defined(COMPAT_FREEBSD32) && !defined(__mips__) 1439fc0a61a4SKonstantin Belousov struct timeval32 *tv32; 1440fc0a61a4SKonstantin Belousov struct timeval tv64; 1441fc0a61a4SKonstantin Belousov 1442fc0a61a4SKonstantin Belousov if (cmd == BIOCGRTIMEOUT32) 1443fc0a61a4SKonstantin Belousov tv = &tv64; 1444fc0a61a4SKonstantin Belousov else 1445fc0a61a4SKonstantin Belousov #endif 1446fc0a61a4SKonstantin Belousov tv = (struct timeval *)addr; 1447df8bae1dSRodney W. Grimes 1448bdc2cdc5SAlexander Langer tv->tv_sec = d->bd_rtout / hz; 1449bdc2cdc5SAlexander Langer tv->tv_usec = (d->bd_rtout % hz) * tick; 14509624d947SJuli Mallett #if defined(COMPAT_FREEBSD32) && !defined(__mips__) 1451fc0a61a4SKonstantin Belousov if (cmd == BIOCGRTIMEOUT32) { 1452fc0a61a4SKonstantin Belousov tv32 = (struct timeval32 *)addr; 1453fc0a61a4SKonstantin Belousov tv32->tv_sec = tv->tv_sec; 1454fc0a61a4SKonstantin Belousov tv32->tv_usec = tv->tv_usec; 1455fc0a61a4SKonstantin Belousov } 1456fc0a61a4SKonstantin Belousov #endif 1457fc0a61a4SKonstantin Belousov 1458df8bae1dSRodney W. Grimes break; 1459df8bae1dSRodney W. Grimes } 1460df8bae1dSRodney W. Grimes 1461df8bae1dSRodney W. Grimes /* 1462df8bae1dSRodney W. Grimes * Get packet stats. 1463df8bae1dSRodney W. Grimes */ 1464df8bae1dSRodney W. Grimes case BIOCGSTATS: 1465df8bae1dSRodney W. Grimes { 1466df8bae1dSRodney W. Grimes struct bpf_stat *bs = (struct bpf_stat *)addr; 1467df8bae1dSRodney W. Grimes 14684d621040SChristian S.J. Peron /* XXXCSJP overflow */ 1469df8bae1dSRodney W. Grimes bs->bs_recv = d->bd_rcount; 1470df8bae1dSRodney W. Grimes bs->bs_drop = d->bd_dcount; 1471df8bae1dSRodney W. Grimes break; 1472df8bae1dSRodney W. Grimes } 1473df8bae1dSRodney W. Grimes 1474df8bae1dSRodney W. Grimes /* 1475df8bae1dSRodney W. Grimes * Set immediate mode. 1476df8bae1dSRodney W. Grimes */ 1477df8bae1dSRodney W. Grimes case BIOCIMMEDIATE: 1478df8bae1dSRodney W. Grimes d->bd_immediate = *(u_int *)addr; 1479df8bae1dSRodney W. Grimes break; 1480df8bae1dSRodney W. Grimes 1481df8bae1dSRodney W. Grimes case BIOCVERSION: 1482df8bae1dSRodney W. Grimes { 1483df8bae1dSRodney W. Grimes struct bpf_version *bv = (struct bpf_version *)addr; 1484df8bae1dSRodney W. Grimes 1485df8bae1dSRodney W. Grimes bv->bv_major = BPF_MAJOR_VERSION; 1486df8bae1dSRodney W. Grimes bv->bv_minor = BPF_MINOR_VERSION; 1487df8bae1dSRodney W. Grimes break; 1488df8bae1dSRodney W. Grimes } 148900a83887SPaul Traina 1490114ae644SMike Smith /* 1491114ae644SMike Smith * Get "header already complete" flag 1492114ae644SMike Smith */ 1493114ae644SMike Smith case BIOCGHDRCMPLT: 1494114ae644SMike Smith *(u_int *)addr = d->bd_hdrcmplt; 1495114ae644SMike Smith break; 1496114ae644SMike Smith 1497114ae644SMike Smith /* 1498114ae644SMike Smith * Set "header already complete" flag 1499114ae644SMike Smith */ 1500114ae644SMike Smith case BIOCSHDRCMPLT: 1501114ae644SMike Smith d->bd_hdrcmplt = *(u_int *)addr ? 1 : 0; 1502114ae644SMike Smith break; 1503114ae644SMike Smith 15048ed3828cSRobert Watson /* 1505560a54e1SJung-uk Kim * Get packet direction flag 15068ed3828cSRobert Watson */ 1507560a54e1SJung-uk Kim case BIOCGDIRECTION: 1508560a54e1SJung-uk Kim *(u_int *)addr = d->bd_direction; 15098ed3828cSRobert Watson break; 15108ed3828cSRobert Watson 15118ed3828cSRobert Watson /* 1512560a54e1SJung-uk Kim * Set packet direction flag 15138ed3828cSRobert Watson */ 1514560a54e1SJung-uk Kim case BIOCSDIRECTION: 1515560a54e1SJung-uk Kim { 1516560a54e1SJung-uk Kim u_int direction; 1517560a54e1SJung-uk Kim 1518560a54e1SJung-uk Kim direction = *(u_int *)addr; 1519560a54e1SJung-uk Kim switch (direction) { 1520560a54e1SJung-uk Kim case BPF_D_IN: 1521560a54e1SJung-uk Kim case BPF_D_INOUT: 1522560a54e1SJung-uk Kim case BPF_D_OUT: 1523560a54e1SJung-uk Kim d->bd_direction = direction; 1524560a54e1SJung-uk Kim break; 1525560a54e1SJung-uk Kim default: 1526560a54e1SJung-uk Kim error = EINVAL; 1527560a54e1SJung-uk Kim } 1528560a54e1SJung-uk Kim } 1529560a54e1SJung-uk Kim break; 1530560a54e1SJung-uk Kim 1531547d94bdSJung-uk Kim /* 1532d0d7bcdfSJung-uk Kim * Get packet timestamp format and resolution. 1533547d94bdSJung-uk Kim */ 1534547d94bdSJung-uk Kim case BIOCGTSTAMP: 1535547d94bdSJung-uk Kim *(u_int *)addr = d->bd_tstamp; 1536547d94bdSJung-uk Kim break; 1537547d94bdSJung-uk Kim 1538547d94bdSJung-uk Kim /* 1539547d94bdSJung-uk Kim * Set packet timestamp format and resolution. 1540547d94bdSJung-uk Kim */ 1541547d94bdSJung-uk Kim case BIOCSTSTAMP: 1542547d94bdSJung-uk Kim { 1543547d94bdSJung-uk Kim u_int func; 1544547d94bdSJung-uk Kim 1545547d94bdSJung-uk Kim func = *(u_int *)addr; 1546547d94bdSJung-uk Kim if (BPF_T_VALID(func)) 1547547d94bdSJung-uk Kim d->bd_tstamp = func; 1548547d94bdSJung-uk Kim else 1549547d94bdSJung-uk Kim error = EINVAL; 1550547d94bdSJung-uk Kim } 1551547d94bdSJung-uk Kim break; 1552547d94bdSJung-uk Kim 1553560a54e1SJung-uk Kim case BIOCFEEDBACK: 1554560a54e1SJung-uk Kim d->bd_feedback = *(u_int *)addr; 1555560a54e1SJung-uk Kim break; 1556560a54e1SJung-uk Kim 1557560a54e1SJung-uk Kim case BIOCLOCK: 1558560a54e1SJung-uk Kim d->bd_locked = 1; 15598ed3828cSRobert Watson break; 15608ed3828cSRobert Watson 156100a83887SPaul Traina case FIONBIO: /* Non-blocking I/O */ 156200a83887SPaul Traina break; 156300a83887SPaul Traina 156400a83887SPaul Traina case FIOASYNC: /* Send signal on receive packets */ 156500a83887SPaul Traina d->bd_async = *(int *)addr; 156600a83887SPaul Traina break; 156700a83887SPaul Traina 1568831d27a9SDon Lewis case FIOSETOWN: 1569831d27a9SDon Lewis error = fsetown(*(int *)addr, &d->bd_sigio); 157000a83887SPaul Traina break; 157100a83887SPaul Traina 1572831d27a9SDon Lewis case FIOGETOWN: 157391e97a82SDon Lewis *(int *)addr = fgetown(&d->bd_sigio); 1574831d27a9SDon Lewis break; 1575831d27a9SDon Lewis 1576831d27a9SDon Lewis /* This is deprecated, FIOSETOWN should be used instead. */ 1577831d27a9SDon Lewis case TIOCSPGRP: 1578831d27a9SDon Lewis error = fsetown(-(*(int *)addr), &d->bd_sigio); 1579831d27a9SDon Lewis break; 1580831d27a9SDon Lewis 1581831d27a9SDon Lewis /* This is deprecated, FIOGETOWN should be used instead. */ 158200a83887SPaul Traina case TIOCGPGRP: 158391e97a82SDon Lewis *(int *)addr = -fgetown(&d->bd_sigio); 158400a83887SPaul Traina break; 158500a83887SPaul Traina 158600a83887SPaul Traina case BIOCSRSIG: /* Set receive signal */ 158700a83887SPaul Traina { 158800a83887SPaul Traina u_int sig; 158900a83887SPaul Traina 159000a83887SPaul Traina sig = *(u_int *)addr; 159100a83887SPaul Traina 159200a83887SPaul Traina if (sig >= NSIG) 159300a83887SPaul Traina error = EINVAL; 159400a83887SPaul Traina else 159500a83887SPaul Traina d->bd_sig = sig; 159600a83887SPaul Traina break; 159700a83887SPaul Traina } 159800a83887SPaul Traina case BIOCGRSIG: 159900a83887SPaul Traina *(u_int *)addr = d->bd_sig; 160000a83887SPaul Traina break; 16014d621040SChristian S.J. Peron 16024d621040SChristian S.J. Peron case BIOCGETBUFMODE: 16034d621040SChristian S.J. Peron *(u_int *)addr = d->bd_bufmode; 16044d621040SChristian S.J. Peron break; 16054d621040SChristian S.J. Peron 16064d621040SChristian S.J. Peron case BIOCSETBUFMODE: 16074d621040SChristian S.J. Peron /* 16084d621040SChristian S.J. Peron * Allow the buffering mode to be changed as long as we 16094d621040SChristian S.J. Peron * haven't yet committed to a particular mode. Our 16104d621040SChristian S.J. Peron * definition of commitment, for now, is whether or not a 16114d621040SChristian S.J. Peron * buffer has been allocated or an interface attached, since 16124d621040SChristian S.J. Peron * that's the point where things get tricky. 16134d621040SChristian S.J. Peron */ 16144d621040SChristian S.J. Peron switch (*(u_int *)addr) { 16154d621040SChristian S.J. Peron case BPF_BUFMODE_BUFFER: 16164d621040SChristian S.J. Peron break; 16174d621040SChristian S.J. Peron 16184d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 16194d621040SChristian S.J. Peron if (bpf_zerocopy_enable) 16204d621040SChristian S.J. Peron break; 16214d621040SChristian S.J. Peron /* FALLSTHROUGH */ 16224d621040SChristian S.J. Peron 16234d621040SChristian S.J. Peron default: 16241b610a74SBjoern A. Zeeb CURVNET_RESTORE(); 16254d621040SChristian S.J. Peron return (EINVAL); 16264d621040SChristian S.J. Peron } 16274d621040SChristian S.J. Peron 1628e4b3229aSAlexander V. Chernikov BPFD_WLOCK(d); 16294d621040SChristian S.J. Peron if (d->bd_sbuf != NULL || d->bd_hbuf != NULL || 16304d621040SChristian S.J. Peron d->bd_fbuf != NULL || d->bd_bif != NULL) { 1631e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 16321b610a74SBjoern A. Zeeb CURVNET_RESTORE(); 16334d621040SChristian S.J. Peron return (EBUSY); 16344d621040SChristian S.J. Peron } 16354d621040SChristian S.J. Peron d->bd_bufmode = *(u_int *)addr; 1636e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 16374d621040SChristian S.J. Peron break; 16384d621040SChristian S.J. Peron 16394d621040SChristian S.J. Peron case BIOCGETZMAX: 16401b610a74SBjoern A. Zeeb error = bpf_ioctl_getzmax(td, d, (size_t *)addr); 16411b610a74SBjoern A. Zeeb break; 16424d621040SChristian S.J. Peron 16434d621040SChristian S.J. Peron case BIOCSETZBUF: 16441b610a74SBjoern A. Zeeb error = bpf_ioctl_setzbuf(td, d, (struct bpf_zbuf *)addr); 16451b610a74SBjoern A. Zeeb break; 16464d621040SChristian S.J. Peron 16474d621040SChristian S.J. Peron case BIOCROTZBUF: 16481b610a74SBjoern A. Zeeb error = bpf_ioctl_rotzbuf(td, d, (struct bpf_zbuf *)addr); 16491b610a74SBjoern A. Zeeb break; 1650df8bae1dSRodney W. Grimes } 165197021c24SMarko Zec CURVNET_RESTORE(); 1652df8bae1dSRodney W. Grimes return (error); 1653df8bae1dSRodney W. Grimes } 1654df8bae1dSRodney W. Grimes 1655df8bae1dSRodney W. Grimes /* 1656df8bae1dSRodney W. Grimes * Set d's packet filter program to fp. If this file already has a filter, 1657df8bae1dSRodney W. Grimes * free it and replace it. Returns EINVAL for bogus requests. 1658df8bae1dSRodney W. Grimes */ 1659f708ef1bSPoul-Henning Kamp static int 166019ba8395SChristian S.J. Peron bpf_setf(struct bpf_d *d, struct bpf_program *fp, u_long cmd) 1661df8bae1dSRodney W. Grimes { 1662df8bae1dSRodney W. Grimes struct bpf_insn *fcode, *old; 166393e39f0bSChristian S.J. Peron u_int wfilter, flen, size; 1664293c06a1SRuslan Ermilov #ifdef BPF_JITTER 1665ae275efcSJung-uk Kim bpf_jit_filter *ofunc; 1666ae275efcSJung-uk Kim #endif 16679431cc16SAlexander V. Chernikov int need_upgrade; 1668fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 1669fc0a61a4SKonstantin Belousov struct bpf_program32 *fp32; 1670fc0a61a4SKonstantin Belousov struct bpf_program fp_swab; 1671df8bae1dSRodney W. Grimes 1672fc0a61a4SKonstantin Belousov if (cmd == BIOCSETWF32 || cmd == BIOCSETF32 || cmd == BIOCSETFNR32) { 1673fc0a61a4SKonstantin Belousov fp32 = (struct bpf_program32 *)fp; 1674fc0a61a4SKonstantin Belousov fp_swab.bf_len = fp32->bf_len; 1675fc0a61a4SKonstantin Belousov fp_swab.bf_insns = (struct bpf_insn *)(uintptr_t)fp32->bf_insns; 1676fc0a61a4SKonstantin Belousov fp = &fp_swab; 1677fc0a61a4SKonstantin Belousov if (cmd == BIOCSETWF32) 1678fc0a61a4SKonstantin Belousov cmd = BIOCSETWF; 1679fc0a61a4SKonstantin Belousov } 1680fc0a61a4SKonstantin Belousov #endif 1681*6c74ff0eSAlexander V. Chernikov /* 1682*6c74ff0eSAlexander V. Chernikov * Check new filter validness before acquiring any locks. 1683*6c74ff0eSAlexander V. Chernikov * Allocate memory for new filter, if needed. 1684*6c74ff0eSAlexander V. Chernikov */ 1685*6c74ff0eSAlexander V. Chernikov flen = fp->bf_len; 1686*6c74ff0eSAlexander V. Chernikov if ((flen > bpf_maxinsns) || ((fp->bf_insns == NULL) && (flen != 0))) 1687*6c74ff0eSAlexander V. Chernikov return (EINVAL); 1688*6c74ff0eSAlexander V. Chernikov 1689*6c74ff0eSAlexander V. Chernikov need_upgrade = 0; 1690*6c74ff0eSAlexander V. Chernikov size = flen * sizeof(*fp->bf_insns); 1691*6c74ff0eSAlexander V. Chernikov if (size > 0) 1692*6c74ff0eSAlexander V. Chernikov fcode = (struct bpf_insn *)malloc(size, M_BPF, M_WAITOK); 1693*6c74ff0eSAlexander V. Chernikov else 1694*6c74ff0eSAlexander V. Chernikov fcode = NULL; /* Make compiler happy */ 1695*6c74ff0eSAlexander V. Chernikov 1696*6c74ff0eSAlexander V. Chernikov BPF_LOCK(); 1697*6c74ff0eSAlexander V. Chernikov 169893e39f0bSChristian S.J. Peron if (cmd == BIOCSETWF) { 169993e39f0bSChristian S.J. Peron old = d->bd_wfilter; 170093e39f0bSChristian S.J. Peron wfilter = 1; 1701293c06a1SRuslan Ermilov #ifdef BPF_JITTER 1702ae275efcSJung-uk Kim ofunc = NULL; 1703ae275efcSJung-uk Kim #endif 170493e39f0bSChristian S.J. Peron } else { 170593e39f0bSChristian S.J. Peron wfilter = 0; 170693e39f0bSChristian S.J. Peron old = d->bd_rfilter; 1707293c06a1SRuslan Ermilov #ifdef BPF_JITTER 1708ae275efcSJung-uk Kim ofunc = d->bd_bfilter; 1709ae275efcSJung-uk Kim #endif 171093e39f0bSChristian S.J. Peron } 1711572bde2aSRobert Watson if (fp->bf_insns == NULL) { 1712e4b3229aSAlexander V. Chernikov /* 1713*6c74ff0eSAlexander V. Chernikov * Protect filter removal by interface lock. 1714*6c74ff0eSAlexander V. Chernikov * Additionally, we are protected by global lock here. 1715e4b3229aSAlexander V. Chernikov */ 1716*6c74ff0eSAlexander V. Chernikov if (d->bd_bif != NULL) 1717e4b3229aSAlexander V. Chernikov BPFIF_WLOCK(d->bd_bif); 1718e4b3229aSAlexander V. Chernikov BPFD_WLOCK(d); 171993e39f0bSChristian S.J. Peron if (wfilter) 172093e39f0bSChristian S.J. Peron d->bd_wfilter = NULL; 1721ae275efcSJung-uk Kim else { 172293e39f0bSChristian S.J. Peron d->bd_rfilter = NULL; 1723293c06a1SRuslan Ermilov #ifdef BPF_JITTER 1724ae275efcSJung-uk Kim d->bd_bfilter = NULL; 1725ae275efcSJung-uk Kim #endif 1726f11c3508SDavid Malone if (cmd == BIOCSETF) 1727df8bae1dSRodney W. Grimes reset_d(d); 1728f11c3508SDavid Malone } 1729e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 1730*6c74ff0eSAlexander V. Chernikov if (d->bd_bif != NULL) 1731e4b3229aSAlexander V. Chernikov BPFIF_WUNLOCK(d->bd_bif); 1732572bde2aSRobert Watson if (old != NULL) 1733bd3a5320SPoul-Henning Kamp free((caddr_t)old, M_BPF); 1734293c06a1SRuslan Ermilov #ifdef BPF_JITTER 1735ae275efcSJung-uk Kim if (ofunc != NULL) 1736ae275efcSJung-uk Kim bpf_destroy_jit_filter(ofunc); 1737ae275efcSJung-uk Kim #endif 1738*6c74ff0eSAlexander V. Chernikov BPF_UNLOCK(); 1739df8bae1dSRodney W. Grimes return (0); 1740df8bae1dSRodney W. Grimes } 1741df8bae1dSRodney W. Grimes 1742df8bae1dSRodney W. Grimes if (copyin((caddr_t)fp->bf_insns, (caddr_t)fcode, size) == 0 && 1743df8bae1dSRodney W. Grimes bpf_validate(fcode, (int)flen)) { 1744e4b3229aSAlexander V. Chernikov /* 1745*6c74ff0eSAlexander V. Chernikov * Protect filter change by interface lock 1746*6c74ff0eSAlexander V. Chernikov * Additionally, we are protected by global lock here. 1747e4b3229aSAlexander V. Chernikov */ 1748*6c74ff0eSAlexander V. Chernikov if (d->bd_bif != NULL) 1749e4b3229aSAlexander V. Chernikov BPFIF_WLOCK(d->bd_bif); 1750e4b3229aSAlexander V. Chernikov BPFD_WLOCK(d); 175193e39f0bSChristian S.J. Peron if (wfilter) 175293e39f0bSChristian S.J. Peron d->bd_wfilter = fcode; 1753ae275efcSJung-uk Kim else { 175493e39f0bSChristian S.J. Peron d->bd_rfilter = fcode; 1755293c06a1SRuslan Ermilov #ifdef BPF_JITTER 1756ae275efcSJung-uk Kim d->bd_bfilter = bpf_jitter(fcode, flen); 1757ae275efcSJung-uk Kim #endif 1758f11c3508SDavid Malone if (cmd == BIOCSETF) 1759df8bae1dSRodney W. Grimes reset_d(d); 176051ec1eb7SAlexander V. Chernikov 176151ec1eb7SAlexander V. Chernikov /* 176251ec1eb7SAlexander V. Chernikov * Do not require upgrade by first BIOCSETF 176351ec1eb7SAlexander V. Chernikov * (used to set snaplen) by pcap_open_live() 176451ec1eb7SAlexander V. Chernikov */ 176551ec1eb7SAlexander V. Chernikov if ((d->bd_writer != 0) && (--d->bd_writer == 0)) 176651ec1eb7SAlexander V. Chernikov need_upgrade = 1; 176751ec1eb7SAlexander V. Chernikov CTR4(KTR_NET, "%s: filter function set by pid %d, " 176851ec1eb7SAlexander V. Chernikov "bd_writer counter %d, need_upgrade %d", 176951ec1eb7SAlexander V. Chernikov __func__, d->bd_pid, d->bd_writer, need_upgrade); 1770f11c3508SDavid Malone } 1771e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 1772*6c74ff0eSAlexander V. Chernikov if (d->bd_bif != NULL) 1773e4b3229aSAlexander V. Chernikov BPFIF_WUNLOCK(d->bd_bif); 1774572bde2aSRobert Watson if (old != NULL) 1775bd3a5320SPoul-Henning Kamp free((caddr_t)old, M_BPF); 1776293c06a1SRuslan Ermilov #ifdef BPF_JITTER 1777ae275efcSJung-uk Kim if (ofunc != NULL) 1778ae275efcSJung-uk Kim bpf_destroy_jit_filter(ofunc); 1779ae275efcSJung-uk Kim #endif 1780df8bae1dSRodney W. Grimes 178151ec1eb7SAlexander V. Chernikov /* Move d to active readers list */ 178251ec1eb7SAlexander V. Chernikov if (need_upgrade != 0) 178351ec1eb7SAlexander V. Chernikov bpf_upgraded(d); 178451ec1eb7SAlexander V. Chernikov 1785*6c74ff0eSAlexander V. Chernikov BPF_UNLOCK(); 1786df8bae1dSRodney W. Grimes return (0); 1787df8bae1dSRodney W. Grimes } 1788bd3a5320SPoul-Henning Kamp free((caddr_t)fcode, M_BPF); 1789*6c74ff0eSAlexander V. Chernikov BPF_UNLOCK(); 1790df8bae1dSRodney W. Grimes return (EINVAL); 1791df8bae1dSRodney W. Grimes } 1792df8bae1dSRodney W. Grimes 1793df8bae1dSRodney W. Grimes /* 1794df8bae1dSRodney W. Grimes * Detach a file from its current interface (if attached at all) and attach 1795df8bae1dSRodney W. Grimes * to the interface indicated by the name stored in ifr. 1796df8bae1dSRodney W. Grimes * Return an errno or 0. 1797df8bae1dSRodney W. Grimes */ 1798df8bae1dSRodney W. Grimes static int 179919ba8395SChristian S.J. Peron bpf_setif(struct bpf_d *d, struct ifreq *ifr) 1800df8bae1dSRodney W. Grimes { 1801df8bae1dSRodney W. Grimes struct bpf_if *bp; 18029b44ff22SGarrett Wollman struct ifnet *theywant; 1803df8bae1dSRodney W. Grimes 1804*6c74ff0eSAlexander V. Chernikov BPF_LOCK_ASSERT(); 1805*6c74ff0eSAlexander V. Chernikov 18069b44ff22SGarrett Wollman theywant = ifunit(ifr->ifr_name); 180716d878ccSChristian S.J. Peron if (theywant == NULL || theywant->if_bpf == NULL) 180816d878ccSChristian S.J. Peron return (ENXIO); 18099b44ff22SGarrett Wollman 181016d878ccSChristian S.J. Peron bp = theywant->if_bpf; 18114d621040SChristian S.J. Peron 1812df8bae1dSRodney W. Grimes /* 18134d621040SChristian S.J. Peron * Behavior here depends on the buffering model. If we're using 18144d621040SChristian S.J. Peron * kernel memory buffers, then we can allocate them here. If we're 18154d621040SChristian S.J. Peron * using zero-copy, then the user process must have registered 18164d621040SChristian S.J. Peron * buffers by the time we get here. If not, return an error. 18174d621040SChristian S.J. Peron * 18184d621040SChristian S.J. Peron * XXXRW: There are locking issues here with multi-threaded use: what 18194d621040SChristian S.J. Peron * if two threads try to set the interface at once? 1820df8bae1dSRodney W. Grimes */ 18214d621040SChristian S.J. Peron switch (d->bd_bufmode) { 18224d621040SChristian S.J. Peron case BPF_BUFMODE_BUFFER: 1823a3594432SRobert Watson if (d->bd_sbuf == NULL) 18244d621040SChristian S.J. Peron bpf_buffer_alloc(d); 18254d621040SChristian S.J. Peron KASSERT(d->bd_sbuf != NULL, ("bpf_setif: bd_sbuf NULL")); 18264d621040SChristian S.J. Peron break; 18274d621040SChristian S.J. Peron 18284d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 18294d621040SChristian S.J. Peron if (d->bd_sbuf == NULL) 18304d621040SChristian S.J. Peron return (EINVAL); 18314d621040SChristian S.J. Peron break; 18324d621040SChristian S.J. Peron 18334d621040SChristian S.J. Peron default: 18344d621040SChristian S.J. Peron panic("bpf_setif: bufmode %d", d->bd_bufmode); 18354d621040SChristian S.J. Peron } 1836*6c74ff0eSAlexander V. Chernikov if (bp != d->bd_bif) 1837df8bae1dSRodney W. Grimes bpf_attachd(d, bp); 1838e4b3229aSAlexander V. Chernikov BPFD_WLOCK(d); 1839df8bae1dSRodney W. Grimes reset_d(d); 1840e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 1841df8bae1dSRodney W. Grimes return (0); 1842df8bae1dSRodney W. Grimes } 1843df8bae1dSRodney W. Grimes 1844df8bae1dSRodney W. Grimes /* 1845243ac7d8SPeter Wemm * Support for select() and poll() system calls 1846df8bae1dSRodney W. Grimes * 1847df8bae1dSRodney W. Grimes * Return true iff the specific operation will not block indefinitely. 1848df8bae1dSRodney W. Grimes * Otherwise, return false but make a note that a selwakeup() must be done. 1849df8bae1dSRodney W. Grimes */ 185037c84183SPoul-Henning Kamp static int 185119ba8395SChristian S.J. Peron bpfpoll(struct cdev *dev, int events, struct thread *td) 1852df8bae1dSRodney W. Grimes { 1853e7bb21b3SJonathan Lemon struct bpf_d *d; 18540832fc64SGarance A Drosehn int revents; 1855df8bae1dSRodney W. Grimes 1856136600feSEd Schouten if (devfs_get_cdevpriv((void **)&d) != 0 || d->bd_bif == NULL) 1857136600feSEd Schouten return (events & 1858136600feSEd Schouten (POLLHUP|POLLIN|POLLRDNORM|POLLOUT|POLLWRNORM)); 1859de5d9935SRobert Watson 1860b75a24a0SChristian S.J. Peron /* 1861b75a24a0SChristian S.J. Peron * Refresh PID associated with this descriptor. 1862b75a24a0SChristian S.J. Peron */ 18630832fc64SGarance A Drosehn revents = events & (POLLOUT | POLLWRNORM); 1864e4b3229aSAlexander V. Chernikov BPFD_WLOCK(d); 1865e4b3229aSAlexander V. Chernikov BPF_PID_REFRESH(d, td); 186675c13541SPoul-Henning Kamp if (events & (POLLIN | POLLRDNORM)) { 186795aab9ccSJohn-Mark Gurney if (bpf_ready(d)) 1868243ac7d8SPeter Wemm revents |= events & (POLLIN | POLLRDNORM); 186981bda851SJohn Polstra else { 1870ed01445dSJohn Baldwin selrecord(td, &d->bd_sel); 187181bda851SJohn Polstra /* Start the read timeout if necessary. */ 187281bda851SJohn Polstra if (d->bd_rtout > 0 && d->bd_state == BPF_IDLE) { 187381bda851SJohn Polstra callout_reset(&d->bd_callout, d->bd_rtout, 187481bda851SJohn Polstra bpf_timed_out, d); 187581bda851SJohn Polstra d->bd_state = BPF_WAITING; 187681bda851SJohn Polstra } 187781bda851SJohn Polstra } 187875c13541SPoul-Henning Kamp } 1879e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 1880243ac7d8SPeter Wemm return (revents); 1881df8bae1dSRodney W. Grimes } 1882df8bae1dSRodney W. Grimes 1883df8bae1dSRodney W. Grimes /* 188495aab9ccSJohn-Mark Gurney * Support for kevent() system call. Register EVFILT_READ filters and 188595aab9ccSJohn-Mark Gurney * reject all others. 188695aab9ccSJohn-Mark Gurney */ 188795aab9ccSJohn-Mark Gurney int 188819ba8395SChristian S.J. Peron bpfkqfilter(struct cdev *dev, struct knote *kn) 188995aab9ccSJohn-Mark Gurney { 1890136600feSEd Schouten struct bpf_d *d; 189195aab9ccSJohn-Mark Gurney 1892136600feSEd Schouten if (devfs_get_cdevpriv((void **)&d) != 0 || 1893136600feSEd Schouten kn->kn_filter != EVFILT_READ) 189495aab9ccSJohn-Mark Gurney return (1); 189595aab9ccSJohn-Mark Gurney 1896b75a24a0SChristian S.J. Peron /* 1897b75a24a0SChristian S.J. Peron * Refresh PID associated with this descriptor. 1898b75a24a0SChristian S.J. Peron */ 1899e4b3229aSAlexander V. Chernikov BPFD_WLOCK(d); 1900e4b3229aSAlexander V. Chernikov BPF_PID_REFRESH_CUR(d); 190195aab9ccSJohn-Mark Gurney kn->kn_fop = &bpfread_filtops; 190295aab9ccSJohn-Mark Gurney kn->kn_hook = d; 19034b19419eSChristian S.J. Peron knlist_add(&d->bd_sel.si_note, kn, 1); 1904e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 190595aab9ccSJohn-Mark Gurney 190695aab9ccSJohn-Mark Gurney return (0); 190795aab9ccSJohn-Mark Gurney } 190895aab9ccSJohn-Mark Gurney 190995aab9ccSJohn-Mark Gurney static void 191019ba8395SChristian S.J. Peron filt_bpfdetach(struct knote *kn) 191195aab9ccSJohn-Mark Gurney { 191295aab9ccSJohn-Mark Gurney struct bpf_d *d = (struct bpf_d *)kn->kn_hook; 191395aab9ccSJohn-Mark Gurney 1914ad3b9257SJohn-Mark Gurney knlist_remove(&d->bd_sel.si_note, kn, 0); 191595aab9ccSJohn-Mark Gurney } 191695aab9ccSJohn-Mark Gurney 191795aab9ccSJohn-Mark Gurney static int 191819ba8395SChristian S.J. Peron filt_bpfread(struct knote *kn, long hint) 191995aab9ccSJohn-Mark Gurney { 192095aab9ccSJohn-Mark Gurney struct bpf_d *d = (struct bpf_d *)kn->kn_hook; 192195aab9ccSJohn-Mark Gurney int ready; 192295aab9ccSJohn-Mark Gurney 1923e4b3229aSAlexander V. Chernikov BPFD_WLOCK_ASSERT(d); 192495aab9ccSJohn-Mark Gurney ready = bpf_ready(d); 192595aab9ccSJohn-Mark Gurney if (ready) { 192695aab9ccSJohn-Mark Gurney kn->kn_data = d->bd_slen; 192795aab9ccSJohn-Mark Gurney if (d->bd_hbuf) 192895aab9ccSJohn-Mark Gurney kn->kn_data += d->bd_hlen; 19295d7af3a1SJung-uk Kim } else if (d->bd_rtout > 0 && d->bd_state == BPF_IDLE) { 193095aab9ccSJohn-Mark Gurney callout_reset(&d->bd_callout, d->bd_rtout, 193195aab9ccSJohn-Mark Gurney bpf_timed_out, d); 193295aab9ccSJohn-Mark Gurney d->bd_state = BPF_WAITING; 193395aab9ccSJohn-Mark Gurney } 193495aab9ccSJohn-Mark Gurney 193595aab9ccSJohn-Mark Gurney return (ready); 193695aab9ccSJohn-Mark Gurney } 193795aab9ccSJohn-Mark Gurney 1938253a3814SLawrence Stewart #define BPF_TSTAMP_NONE 0 1939253a3814SLawrence Stewart #define BPF_TSTAMP_FAST 1 1940253a3814SLawrence Stewart #define BPF_TSTAMP_NORMAL 2 1941253a3814SLawrence Stewart #define BPF_TSTAMP_EXTERN 3 1942253a3814SLawrence Stewart 1943253a3814SLawrence Stewart static int 1944253a3814SLawrence Stewart bpf_ts_quality(int tstype) 1945253a3814SLawrence Stewart { 1946253a3814SLawrence Stewart 1947253a3814SLawrence Stewart if (tstype == BPF_T_NONE) 1948253a3814SLawrence Stewart return (BPF_TSTAMP_NONE); 1949253a3814SLawrence Stewart if ((tstype & BPF_T_FAST) != 0) 1950253a3814SLawrence Stewart return (BPF_TSTAMP_FAST); 1951253a3814SLawrence Stewart 1952253a3814SLawrence Stewart return (BPF_TSTAMP_NORMAL); 1953253a3814SLawrence Stewart } 1954253a3814SLawrence Stewart 1955253a3814SLawrence Stewart static int 1956253a3814SLawrence Stewart bpf_gettime(struct bintime *bt, int tstype, struct mbuf *m) 1957253a3814SLawrence Stewart { 1958253a3814SLawrence Stewart struct m_tag *tag; 1959253a3814SLawrence Stewart int quality; 1960253a3814SLawrence Stewart 1961253a3814SLawrence Stewart quality = bpf_ts_quality(tstype); 1962253a3814SLawrence Stewart if (quality == BPF_TSTAMP_NONE) 1963253a3814SLawrence Stewart return (quality); 1964253a3814SLawrence Stewart 1965253a3814SLawrence Stewart if (m != NULL) { 1966253a3814SLawrence Stewart tag = m_tag_locate(m, MTAG_BPF, MTAG_BPF_TIMESTAMP, NULL); 1967253a3814SLawrence Stewart if (tag != NULL) { 1968253a3814SLawrence Stewart *bt = *(struct bintime *)(tag + 1); 1969253a3814SLawrence Stewart return (BPF_TSTAMP_EXTERN); 1970253a3814SLawrence Stewart } 1971253a3814SLawrence Stewart } 1972253a3814SLawrence Stewart if (quality == BPF_TSTAMP_NORMAL) 1973253a3814SLawrence Stewart binuptime(bt); 1974253a3814SLawrence Stewart else 1975253a3814SLawrence Stewart getbinuptime(bt); 1976253a3814SLawrence Stewart 1977253a3814SLawrence Stewart return (quality); 1978253a3814SLawrence Stewart } 1979253a3814SLawrence Stewart 198095aab9ccSJohn-Mark Gurney /* 1981df8bae1dSRodney W. Grimes * Incoming linkage from device drivers. Process the packet pkt, of length 1982df8bae1dSRodney W. Grimes * pktlen, which is stored in a contiguous buffer. The packet is parsed 1983df8bae1dSRodney W. Grimes * by each process' filter, and if accepted, stashed into the corresponding 1984df8bae1dSRodney W. Grimes * buffer. 1985df8bae1dSRodney W. Grimes */ 1986df8bae1dSRodney W. Grimes void 198719ba8395SChristian S.J. Peron bpf_tap(struct bpf_if *bp, u_char *pkt, u_int pktlen) 1988df8bae1dSRodney W. Grimes { 1989547d94bdSJung-uk Kim struct bintime bt; 19908994a245SDag-Erling Smørgrav struct bpf_d *d; 1991a36599ccSJung-uk Kim #ifdef BPF_JITTER 1992a36599ccSJung-uk Kim bpf_jit_filter *bf; 1993a36599ccSJung-uk Kim #endif 1994253a3814SLawrence Stewart u_int slen; 1995253a3814SLawrence Stewart int gottime; 1996e7bb21b3SJonathan Lemon 1997253a3814SLawrence Stewart gottime = BPF_TSTAMP_NONE; 1998e4b3229aSAlexander V. Chernikov 1999e4b3229aSAlexander V. Chernikov BPFIF_RLOCK(bp); 2000e4b3229aSAlexander V. Chernikov 20014a3feeaaSRobert Watson LIST_FOREACH(d, &bp->bif_dlist, bd_next) { 2002e4b3229aSAlexander V. Chernikov /* 2003e4b3229aSAlexander V. Chernikov * We are not using any locks for d here because: 2004e4b3229aSAlexander V. Chernikov * 1) any filter change is protected by interface 2005e4b3229aSAlexander V. Chernikov * write lock 2006e4b3229aSAlexander V. Chernikov * 2) destroying/detaching d is protected by interface 2007e4b3229aSAlexander V. Chernikov * write lock, too 2008e4b3229aSAlexander V. Chernikov */ 2009e4b3229aSAlexander V. Chernikov 2010e4b3229aSAlexander V. Chernikov /* XXX: Do not protect counter for the sake of performance. */ 2011df8bae1dSRodney W. Grimes ++d->bd_rcount; 2012a05cf8c6SChristian S.J. Peron /* 2013a05cf8c6SChristian S.J. Peron * NB: We dont call BPF_CHECK_DIRECTION() here since there is no 2014a05cf8c6SChristian S.J. Peron * way for the caller to indiciate to us whether this packet 2015a05cf8c6SChristian S.J. Peron * is inbound or outbound. In the bpf_mtap() routines, we use 2016a05cf8c6SChristian S.J. Peron * the interface pointers on the mbuf to figure it out. 2017a05cf8c6SChristian S.J. Peron */ 2018ae275efcSJung-uk Kim #ifdef BPF_JITTER 2019a36599ccSJung-uk Kim bf = bpf_jitter_enable != 0 ? d->bd_bfilter : NULL; 2020a36599ccSJung-uk Kim if (bf != NULL) 2021a36599ccSJung-uk Kim slen = (*(bf->func))(pkt, pktlen, pktlen); 2022ae275efcSJung-uk Kim else 2023ae275efcSJung-uk Kim #endif 202493e39f0bSChristian S.J. Peron slen = bpf_filter(d->bd_rfilter, pkt, pktlen, pktlen); 2025ec272d87SRobert Watson if (slen != 0) { 2026e4b3229aSAlexander V. Chernikov /* 2027e4b3229aSAlexander V. Chernikov * Filter matches. Let's to acquire write lock. 2028e4b3229aSAlexander V. Chernikov */ 2029e4b3229aSAlexander V. Chernikov BPFD_WLOCK(d); 2030e4b3229aSAlexander V. Chernikov 203169f7644bSChristian S.J. Peron d->bd_fcount++; 2032253a3814SLawrence Stewart if (gottime < bpf_ts_quality(d->bd_tstamp)) 2033253a3814SLawrence Stewart gottime = bpf_gettime(&bt, d->bd_tstamp, NULL); 2034ec272d87SRobert Watson #ifdef MAC 203530d239bcSRobert Watson if (mac_bpfdesc_check_receive(d, bp->bif_ifp) == 0) 2036ec272d87SRobert Watson #endif 20374d621040SChristian S.J. Peron catchpacket(d, pkt, pktlen, slen, 2038547d94bdSJung-uk Kim bpf_append_bytes, &bt); 2039e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 2040ec272d87SRobert Watson } 2041df8bae1dSRodney W. Grimes } 2042e4b3229aSAlexander V. Chernikov BPFIF_RUNLOCK(bp); 2043df8bae1dSRodney W. Grimes } 2044df8bae1dSRodney W. Grimes 2045f81a2a49SJung-uk Kim #define BPF_CHECK_DIRECTION(d, r, i) \ 2046f81a2a49SJung-uk Kim (((d)->bd_direction == BPF_D_IN && (r) != (i)) || \ 2047f81a2a49SJung-uk Kim ((d)->bd_direction == BPF_D_OUT && (r) == (i))) 2048560a54e1SJung-uk Kim 2049df8bae1dSRodney W. Grimes /* 2050df8bae1dSRodney W. Grimes * Incoming linkage from device drivers, when packet is in an mbuf chain. 2051e4b3229aSAlexander V. Chernikov * Locking model is explained in bpf_tap(). 2052df8bae1dSRodney W. Grimes */ 2053df8bae1dSRodney W. Grimes void 205419ba8395SChristian S.J. Peron bpf_mtap(struct bpf_if *bp, struct mbuf *m) 2055df8bae1dSRodney W. Grimes { 2056547d94bdSJung-uk Kim struct bintime bt; 2057df8bae1dSRodney W. Grimes struct bpf_d *d; 2058a36599ccSJung-uk Kim #ifdef BPF_JITTER 2059a36599ccSJung-uk Kim bpf_jit_filter *bf; 2060a36599ccSJung-uk Kim #endif 2061253a3814SLawrence Stewart u_int pktlen, slen; 2062253a3814SLawrence Stewart int gottime; 206391433904SDavid Malone 20648cd892f7SJung-uk Kim /* Skip outgoing duplicate packets. */ 20658cd892f7SJung-uk Kim if ((m->m_flags & M_PROMISC) != 0 && m->m_pkthdr.rcvif == NULL) { 20668cd892f7SJung-uk Kim m->m_flags &= ~M_PROMISC; 20678cd892f7SJung-uk Kim return; 20688cd892f7SJung-uk Kim } 20698cd892f7SJung-uk Kim 2070f0e2422bSPoul-Henning Kamp pktlen = m_length(m, NULL); 2071253a3814SLawrence Stewart gottime = BPF_TSTAMP_NONE; 2072e4b3229aSAlexander V. Chernikov 2073e4b3229aSAlexander V. Chernikov BPFIF_RLOCK(bp); 2074e4b3229aSAlexander V. Chernikov 20754a3feeaaSRobert Watson LIST_FOREACH(d, &bp->bif_dlist, bd_next) { 2076f81a2a49SJung-uk Kim if (BPF_CHECK_DIRECTION(d, m->m_pkthdr.rcvif, bp->bif_ifp)) 20778ed3828cSRobert Watson continue; 2078df8bae1dSRodney W. Grimes ++d->bd_rcount; 2079ae275efcSJung-uk Kim #ifdef BPF_JITTER 2080a36599ccSJung-uk Kim bf = bpf_jitter_enable != 0 ? d->bd_bfilter : NULL; 2081ae275efcSJung-uk Kim /* XXX We cannot handle multiple mbufs. */ 2082a36599ccSJung-uk Kim if (bf != NULL && m->m_next == NULL) 2083a36599ccSJung-uk Kim slen = (*(bf->func))(mtod(m, u_char *), pktlen, pktlen); 2084ae275efcSJung-uk Kim else 2085ae275efcSJung-uk Kim #endif 208693e39f0bSChristian S.J. Peron slen = bpf_filter(d->bd_rfilter, (u_char *)m, pktlen, 0); 20874ddfb531SChristian S.J. Peron if (slen != 0) { 2088e4b3229aSAlexander V. Chernikov BPFD_WLOCK(d); 2089e4b3229aSAlexander V. Chernikov 209069f7644bSChristian S.J. Peron d->bd_fcount++; 2091253a3814SLawrence Stewart if (gottime < bpf_ts_quality(d->bd_tstamp)) 2092253a3814SLawrence Stewart gottime = bpf_gettime(&bt, d->bd_tstamp, m); 20930c7fb534SRobert Watson #ifdef MAC 209430d239bcSRobert Watson if (mac_bpfdesc_check_receive(d, bp->bif_ifp) == 0) 20950c7fb534SRobert Watson #endif 20960c7fb534SRobert Watson catchpacket(d, (u_char *)m, pktlen, slen, 2097547d94bdSJung-uk Kim bpf_append_mbuf, &bt); 2098e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 20994ddfb531SChristian S.J. Peron } 2100df8bae1dSRodney W. Grimes } 2101e4b3229aSAlexander V. Chernikov BPFIF_RUNLOCK(bp); 2102df8bae1dSRodney W. Grimes } 2103df8bae1dSRodney W. Grimes 2104df8bae1dSRodney W. Grimes /* 2105437ffe18SSam Leffler * Incoming linkage from device drivers, when packet is in 2106437ffe18SSam Leffler * an mbuf chain and to be prepended by a contiguous header. 2107437ffe18SSam Leffler */ 2108437ffe18SSam Leffler void 210919ba8395SChristian S.J. Peron bpf_mtap2(struct bpf_if *bp, void *data, u_int dlen, struct mbuf *m) 2110437ffe18SSam Leffler { 2111547d94bdSJung-uk Kim struct bintime bt; 2112437ffe18SSam Leffler struct mbuf mb; 2113437ffe18SSam Leffler struct bpf_d *d; 2114253a3814SLawrence Stewart u_int pktlen, slen; 2115253a3814SLawrence Stewart int gottime; 211691433904SDavid Malone 21178cd892f7SJung-uk Kim /* Skip outgoing duplicate packets. */ 21188cd892f7SJung-uk Kim if ((m->m_flags & M_PROMISC) != 0 && m->m_pkthdr.rcvif == NULL) { 21198cd892f7SJung-uk Kim m->m_flags &= ~M_PROMISC; 21208cd892f7SJung-uk Kim return; 21218cd892f7SJung-uk Kim } 21228cd892f7SJung-uk Kim 2123437ffe18SSam Leffler pktlen = m_length(m, NULL); 2124437ffe18SSam Leffler /* 2125437ffe18SSam Leffler * Craft on-stack mbuf suitable for passing to bpf_filter. 2126437ffe18SSam Leffler * Note that we cut corners here; we only setup what's 2127437ffe18SSam Leffler * absolutely needed--this mbuf should never go anywhere else. 2128437ffe18SSam Leffler */ 2129437ffe18SSam Leffler mb.m_next = m; 2130437ffe18SSam Leffler mb.m_data = data; 2131437ffe18SSam Leffler mb.m_len = dlen; 2132437ffe18SSam Leffler pktlen += dlen; 2133437ffe18SSam Leffler 2134253a3814SLawrence Stewart gottime = BPF_TSTAMP_NONE; 2135e4b3229aSAlexander V. Chernikov 2136e4b3229aSAlexander V. Chernikov BPFIF_RLOCK(bp); 2137e4b3229aSAlexander V. Chernikov 21384a3feeaaSRobert Watson LIST_FOREACH(d, &bp->bif_dlist, bd_next) { 2139f81a2a49SJung-uk Kim if (BPF_CHECK_DIRECTION(d, m->m_pkthdr.rcvif, bp->bif_ifp)) 2140437ffe18SSam Leffler continue; 2141437ffe18SSam Leffler ++d->bd_rcount; 214293e39f0bSChristian S.J. Peron slen = bpf_filter(d->bd_rfilter, (u_char *)&mb, pktlen, 0); 21434ddfb531SChristian S.J. Peron if (slen != 0) { 2144e4b3229aSAlexander V. Chernikov BPFD_WLOCK(d); 2145e4b3229aSAlexander V. Chernikov 214669f7644bSChristian S.J. Peron d->bd_fcount++; 2147253a3814SLawrence Stewart if (gottime < bpf_ts_quality(d->bd_tstamp)) 2148253a3814SLawrence Stewart gottime = bpf_gettime(&bt, d->bd_tstamp, m); 2149437ffe18SSam Leffler #ifdef MAC 215030d239bcSRobert Watson if (mac_bpfdesc_check_receive(d, bp->bif_ifp) == 0) 2151437ffe18SSam Leffler #endif 2152437ffe18SSam Leffler catchpacket(d, (u_char *)&mb, pktlen, slen, 2153547d94bdSJung-uk Kim bpf_append_mbuf, &bt); 2154e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 21554ddfb531SChristian S.J. Peron } 2156437ffe18SSam Leffler } 2157e4b3229aSAlexander V. Chernikov BPFIF_RUNLOCK(bp); 2158437ffe18SSam Leffler } 2159437ffe18SSam Leffler 2160560a54e1SJung-uk Kim #undef BPF_CHECK_DIRECTION 2161560a54e1SJung-uk Kim 2162253a3814SLawrence Stewart #undef BPF_TSTAMP_NONE 2163253a3814SLawrence Stewart #undef BPF_TSTAMP_FAST 2164253a3814SLawrence Stewart #undef BPF_TSTAMP_NORMAL 2165253a3814SLawrence Stewart #undef BPF_TSTAMP_EXTERN 2166253a3814SLawrence Stewart 2167547d94bdSJung-uk Kim static int 2168547d94bdSJung-uk Kim bpf_hdrlen(struct bpf_d *d) 2169547d94bdSJung-uk Kim { 2170547d94bdSJung-uk Kim int hdrlen; 2171547d94bdSJung-uk Kim 2172547d94bdSJung-uk Kim hdrlen = d->bd_bif->bif_hdrlen; 2173547d94bdSJung-uk Kim #ifndef BURN_BRIDGES 2174547d94bdSJung-uk Kim if (d->bd_tstamp == BPF_T_NONE || 2175547d94bdSJung-uk Kim BPF_T_FORMAT(d->bd_tstamp) == BPF_T_MICROTIME) 2176547d94bdSJung-uk Kim #ifdef COMPAT_FREEBSD32 2177547d94bdSJung-uk Kim if (d->bd_compat32) 2178547d94bdSJung-uk Kim hdrlen += SIZEOF_BPF_HDR(struct bpf_hdr32); 2179547d94bdSJung-uk Kim else 2180547d94bdSJung-uk Kim #endif 2181547d94bdSJung-uk Kim hdrlen += SIZEOF_BPF_HDR(struct bpf_hdr); 2182547d94bdSJung-uk Kim else 2183547d94bdSJung-uk Kim #endif 2184547d94bdSJung-uk Kim hdrlen += SIZEOF_BPF_HDR(struct bpf_xhdr); 2185547d94bdSJung-uk Kim #ifdef COMPAT_FREEBSD32 2186547d94bdSJung-uk Kim if (d->bd_compat32) 2187547d94bdSJung-uk Kim hdrlen = BPF_WORDALIGN32(hdrlen); 2188547d94bdSJung-uk Kim else 2189547d94bdSJung-uk Kim #endif 2190547d94bdSJung-uk Kim hdrlen = BPF_WORDALIGN(hdrlen); 2191547d94bdSJung-uk Kim 2192547d94bdSJung-uk Kim return (hdrlen - d->bd_bif->bif_hdrlen); 2193547d94bdSJung-uk Kim } 2194547d94bdSJung-uk Kim 2195547d94bdSJung-uk Kim static void 2196547d94bdSJung-uk Kim bpf_bintime2ts(struct bintime *bt, struct bpf_ts *ts, int tstype) 2197547d94bdSJung-uk Kim { 2198253a3814SLawrence Stewart struct bintime bt2; 2199547d94bdSJung-uk Kim struct timeval tsm; 2200547d94bdSJung-uk Kim struct timespec tsn; 2201547d94bdSJung-uk Kim 2202253a3814SLawrence Stewart if ((tstype & BPF_T_MONOTONIC) == 0) { 2203253a3814SLawrence Stewart bt2 = *bt; 2204253a3814SLawrence Stewart bintime_add(&bt2, &boottimebin); 2205253a3814SLawrence Stewart bt = &bt2; 2206253a3814SLawrence Stewart } 2207547d94bdSJung-uk Kim switch (BPF_T_FORMAT(tstype)) { 2208547d94bdSJung-uk Kim case BPF_T_MICROTIME: 2209547d94bdSJung-uk Kim bintime2timeval(bt, &tsm); 2210547d94bdSJung-uk Kim ts->bt_sec = tsm.tv_sec; 2211547d94bdSJung-uk Kim ts->bt_frac = tsm.tv_usec; 2212547d94bdSJung-uk Kim break; 2213547d94bdSJung-uk Kim case BPF_T_NANOTIME: 2214547d94bdSJung-uk Kim bintime2timespec(bt, &tsn); 2215547d94bdSJung-uk Kim ts->bt_sec = tsn.tv_sec; 2216547d94bdSJung-uk Kim ts->bt_frac = tsn.tv_nsec; 2217547d94bdSJung-uk Kim break; 2218547d94bdSJung-uk Kim case BPF_T_BINTIME: 2219547d94bdSJung-uk Kim ts->bt_sec = bt->sec; 2220547d94bdSJung-uk Kim ts->bt_frac = bt->frac; 2221547d94bdSJung-uk Kim break; 2222547d94bdSJung-uk Kim } 2223547d94bdSJung-uk Kim } 2224547d94bdSJung-uk Kim 2225437ffe18SSam Leffler /* 2226df8bae1dSRodney W. Grimes * Move the packet data from interface memory (pkt) into the 22279e610888SDag-Erling Smørgrav * store buffer. "cpfn" is the routine called to do the actual data 2228df8bae1dSRodney W. Grimes * transfer. bcopy is passed in to copy contiguous chunks, while 22294d621040SChristian S.J. Peron * bpf_append_mbuf is passed in to copy mbuf chains. In the latter case, 2230df8bae1dSRodney W. Grimes * pkt is really an mbuf. 2231df8bae1dSRodney W. Grimes */ 2232df8bae1dSRodney W. Grimes static void 223319ba8395SChristian S.J. Peron catchpacket(struct bpf_d *d, u_char *pkt, u_int pktlen, u_int snaplen, 22344d621040SChristian S.J. Peron void (*cpfn)(struct bpf_d *, caddr_t, u_int, void *, u_int), 2235547d94bdSJung-uk Kim struct bintime *bt) 2236df8bae1dSRodney W. Grimes { 2237547d94bdSJung-uk Kim struct bpf_xhdr hdr; 2238547d94bdSJung-uk Kim #ifndef BURN_BRIDGES 2239547d94bdSJung-uk Kim struct bpf_hdr hdr_old; 2240fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 2241547d94bdSJung-uk Kim struct bpf_hdr32 hdr32_old; 2242fc0a61a4SKonstantin Belousov #endif 2243547d94bdSJung-uk Kim #endif 2244547d94bdSJung-uk Kim int caplen, curlen, hdrlen, totlen; 22457819da79SJohn-Mark Gurney int do_wakeup = 0; 2246547d94bdSJung-uk Kim int do_timestamp; 2247547d94bdSJung-uk Kim int tstype; 22489e610888SDag-Erling Smørgrav 2249e4b3229aSAlexander V. Chernikov BPFD_WLOCK_ASSERT(d); 22504d621040SChristian S.J. Peron 22514d621040SChristian S.J. Peron /* 22524d621040SChristian S.J. Peron * Detect whether user space has released a buffer back to us, and if 22534d621040SChristian S.J. Peron * so, move it from being a hold buffer to a free buffer. This may 22544d621040SChristian S.J. Peron * not be the best place to do it (for example, we might only want to 22554d621040SChristian S.J. Peron * run this check if we need the space), but for now it's a reliable 22564d621040SChristian S.J. Peron * spot to do it. 22574d621040SChristian S.J. Peron */ 2258fa0c2b34SRobert Watson if (d->bd_fbuf == NULL && bpf_canfreebuf(d)) { 22594d621040SChristian S.J. Peron d->bd_fbuf = d->bd_hbuf; 22604d621040SChristian S.J. Peron d->bd_hbuf = NULL; 22614d621040SChristian S.J. Peron d->bd_hlen = 0; 226229f612ecSChristian S.J. Peron bpf_buf_reclaimed(d); 22634d621040SChristian S.J. Peron } 22644d621040SChristian S.J. Peron 2265df8bae1dSRodney W. Grimes /* 2266df8bae1dSRodney W. Grimes * Figure out how many bytes to move. If the packet is 2267df8bae1dSRodney W. Grimes * greater or equal to the snapshot length, transfer that 2268df8bae1dSRodney W. Grimes * much. Otherwise, transfer the whole packet (unless 2269df8bae1dSRodney W. Grimes * we hit the buffer size limit). 2270df8bae1dSRodney W. Grimes */ 2271547d94bdSJung-uk Kim hdrlen = bpf_hdrlen(d); 2272df8bae1dSRodney W. Grimes totlen = hdrlen + min(snaplen, pktlen); 2273df8bae1dSRodney W. Grimes if (totlen > d->bd_bufsize) 2274df8bae1dSRodney W. Grimes totlen = d->bd_bufsize; 2275df8bae1dSRodney W. Grimes 2276df8bae1dSRodney W. Grimes /* 2277df8bae1dSRodney W. Grimes * Round up the end of the previous packet to the next longword. 2278a7a91e65SRobert Watson * 2279a7a91e65SRobert Watson * Drop the packet if there's no room and no hope of room 2280a7a91e65SRobert Watson * If the packet would overflow the storage buffer or the storage 2281a7a91e65SRobert Watson * buffer is considered immutable by the buffer model, try to rotate 2282a7a91e65SRobert Watson * the buffer and wakeup pending processes. 2283df8bae1dSRodney W. Grimes */ 2284fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 2285fc0a61a4SKonstantin Belousov if (d->bd_compat32) 2286fc0a61a4SKonstantin Belousov curlen = BPF_WORDALIGN32(d->bd_slen); 2287fc0a61a4SKonstantin Belousov else 2288fc0a61a4SKonstantin Belousov #endif 2289df8bae1dSRodney W. Grimes curlen = BPF_WORDALIGN(d->bd_slen); 2290a7a91e65SRobert Watson if (curlen + totlen > d->bd_bufsize || !bpf_canwritebuf(d)) { 2291572bde2aSRobert Watson if (d->bd_fbuf == NULL) { 2292df8bae1dSRodney W. Grimes /* 2293a7a91e65SRobert Watson * There's no room in the store buffer, and no 2294a7a91e65SRobert Watson * prospect of room, so drop the packet. Notify the 2295a7a91e65SRobert Watson * buffer model. 2296df8bae1dSRodney W. Grimes */ 2297a7a91e65SRobert Watson bpf_buffull(d); 2298df8bae1dSRodney W. Grimes ++d->bd_dcount; 2299df8bae1dSRodney W. Grimes return; 2300df8bae1dSRodney W. Grimes } 2301df8bae1dSRodney W. Grimes ROTATE_BUFFERS(d); 23027819da79SJohn-Mark Gurney do_wakeup = 1; 2303df8bae1dSRodney W. Grimes curlen = 0; 2304a7a91e65SRobert Watson } else if (d->bd_immediate || d->bd_state == BPF_TIMED_OUT) 2305df8bae1dSRodney W. Grimes /* 23064d621040SChristian S.J. Peron * Immediate mode is set, or the read timeout has already 23074d621040SChristian S.J. Peron * expired during a select call. A packet arrived, so the 23084d621040SChristian S.J. Peron * reader should be woken up. 2309df8bae1dSRodney W. Grimes */ 23107819da79SJohn-Mark Gurney do_wakeup = 1; 2311547d94bdSJung-uk Kim caplen = totlen - hdrlen; 2312547d94bdSJung-uk Kim tstype = d->bd_tstamp; 2313547d94bdSJung-uk Kim do_timestamp = tstype != BPF_T_NONE; 2314547d94bdSJung-uk Kim #ifndef BURN_BRIDGES 2315547d94bdSJung-uk Kim if (tstype == BPF_T_NONE || BPF_T_FORMAT(tstype) == BPF_T_MICROTIME) { 2316547d94bdSJung-uk Kim struct bpf_ts ts; 2317547d94bdSJung-uk Kim if (do_timestamp) 2318547d94bdSJung-uk Kim bpf_bintime2ts(bt, &ts, tstype); 2319fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 2320fc0a61a4SKonstantin Belousov if (d->bd_compat32) { 2321547d94bdSJung-uk Kim bzero(&hdr32_old, sizeof(hdr32_old)); 2322547d94bdSJung-uk Kim if (do_timestamp) { 2323547d94bdSJung-uk Kim hdr32_old.bh_tstamp.tv_sec = ts.bt_sec; 2324547d94bdSJung-uk Kim hdr32_old.bh_tstamp.tv_usec = ts.bt_frac; 2325547d94bdSJung-uk Kim } 2326547d94bdSJung-uk Kim hdr32_old.bh_datalen = pktlen; 2327547d94bdSJung-uk Kim hdr32_old.bh_hdrlen = hdrlen; 2328547d94bdSJung-uk Kim hdr32_old.bh_caplen = caplen; 2329547d94bdSJung-uk Kim bpf_append_bytes(d, d->bd_sbuf, curlen, &hdr32_old, 2330547d94bdSJung-uk Kim sizeof(hdr32_old)); 2331547d94bdSJung-uk Kim goto copy; 2332547d94bdSJung-uk Kim } 2333547d94bdSJung-uk Kim #endif 2334547d94bdSJung-uk Kim bzero(&hdr_old, sizeof(hdr_old)); 2335547d94bdSJung-uk Kim if (do_timestamp) { 2336547d94bdSJung-uk Kim hdr_old.bh_tstamp.tv_sec = ts.bt_sec; 2337547d94bdSJung-uk Kim hdr_old.bh_tstamp.tv_usec = ts.bt_frac; 2338547d94bdSJung-uk Kim } 2339547d94bdSJung-uk Kim hdr_old.bh_datalen = pktlen; 2340547d94bdSJung-uk Kim hdr_old.bh_hdrlen = hdrlen; 2341547d94bdSJung-uk Kim hdr_old.bh_caplen = caplen; 2342547d94bdSJung-uk Kim bpf_append_bytes(d, d->bd_sbuf, curlen, &hdr_old, 2343547d94bdSJung-uk Kim sizeof(hdr_old)); 2344fc0a61a4SKonstantin Belousov goto copy; 2345fc0a61a4SKonstantin Belousov } 2346fc0a61a4SKonstantin Belousov #endif 2347df8bae1dSRodney W. Grimes 2348df8bae1dSRodney W. Grimes /* 23494d621040SChristian S.J. Peron * Append the bpf header. Note we append the actual header size, but 23504d621040SChristian S.J. Peron * move forward the length of the header plus padding. 2351df8bae1dSRodney W. Grimes */ 23524d621040SChristian S.J. Peron bzero(&hdr, sizeof(hdr)); 2353547d94bdSJung-uk Kim if (do_timestamp) 2354547d94bdSJung-uk Kim bpf_bintime2ts(bt, &hdr.bh_tstamp, tstype); 23554d621040SChristian S.J. Peron hdr.bh_datalen = pktlen; 23564d621040SChristian S.J. Peron hdr.bh_hdrlen = hdrlen; 2357547d94bdSJung-uk Kim hdr.bh_caplen = caplen; 23584d621040SChristian S.J. Peron bpf_append_bytes(d, d->bd_sbuf, curlen, &hdr, sizeof(hdr)); 23594d621040SChristian S.J. Peron 2360df8bae1dSRodney W. Grimes /* 2361df8bae1dSRodney W. Grimes * Copy the packet data into the store buffer and update its length. 2362df8bae1dSRodney W. Grimes */ 2363547d94bdSJung-uk Kim #ifndef BURN_BRIDGES 2364fc0a61a4SKonstantin Belousov copy: 2365fc0a61a4SKonstantin Belousov #endif 2366547d94bdSJung-uk Kim (*cpfn)(d, d->bd_sbuf, curlen + hdrlen, pkt, caplen); 2367df8bae1dSRodney W. Grimes d->bd_slen = curlen + totlen; 23687819da79SJohn-Mark Gurney 23697819da79SJohn-Mark Gurney if (do_wakeup) 23707819da79SJohn-Mark Gurney bpf_wakeup(d); 2371df8bae1dSRodney W. Grimes } 2372df8bae1dSRodney W. Grimes 2373df8bae1dSRodney W. Grimes /* 2374df8bae1dSRodney W. Grimes * Free buffers currently in use by a descriptor. 2375df8bae1dSRodney W. Grimes * Called on close. 2376df8bae1dSRodney W. Grimes */ 2377df8bae1dSRodney W. Grimes static void 237819ba8395SChristian S.J. Peron bpf_freed(struct bpf_d *d) 2379df8bae1dSRodney W. Grimes { 23804d621040SChristian S.J. Peron 2381df8bae1dSRodney W. Grimes /* 2382df8bae1dSRodney W. Grimes * We don't need to lock out interrupts since this descriptor has 2383df8bae1dSRodney W. Grimes * been detached from its interface and it yet hasn't been marked 2384df8bae1dSRodney W. Grimes * free. 2385df8bae1dSRodney W. Grimes */ 23864d621040SChristian S.J. Peron bpf_free(d); 238770485847SJung-uk Kim if (d->bd_rfilter != NULL) { 238893e39f0bSChristian S.J. Peron free((caddr_t)d->bd_rfilter, M_BPF); 2389ae275efcSJung-uk Kim #ifdef BPF_JITTER 239070485847SJung-uk Kim if (d->bd_bfilter != NULL) 2391ae275efcSJung-uk Kim bpf_destroy_jit_filter(d->bd_bfilter); 2392ae275efcSJung-uk Kim #endif 2393ae275efcSJung-uk Kim } 239470485847SJung-uk Kim if (d->bd_wfilter != NULL) 239593e39f0bSChristian S.J. Peron free((caddr_t)d->bd_wfilter, M_BPF); 2396e4b3229aSAlexander V. Chernikov rw_destroy(&d->bd_lock); 2397df8bae1dSRodney W. Grimes } 2398df8bae1dSRodney W. Grimes 2399df8bae1dSRodney W. Grimes /* 240024a229f4SSam Leffler * Attach an interface to bpf. dlt is the link layer type; hdrlen is the 240124a229f4SSam Leffler * fixed size of the link header (variable length headers not yet supported). 2402df8bae1dSRodney W. Grimes */ 2403df8bae1dSRodney W. Grimes void 240419ba8395SChristian S.J. Peron bpfattach(struct ifnet *ifp, u_int dlt, u_int hdrlen) 2405df8bae1dSRodney W. Grimes { 240624a229f4SSam Leffler 240724a229f4SSam Leffler bpfattach2(ifp, dlt, hdrlen, &ifp->if_bpf); 240824a229f4SSam Leffler } 240924a229f4SSam Leffler 241024a229f4SSam Leffler /* 241124a229f4SSam Leffler * Attach an interface to bpf. ifp is a pointer to the structure 241224a229f4SSam Leffler * defining the interface to be attached, dlt is the link layer type, 241324a229f4SSam Leffler * and hdrlen is the fixed size of the link header (variable length 241424a229f4SSam Leffler * headers are not yet supporrted). 241524a229f4SSam Leffler */ 241624a229f4SSam Leffler void 241719ba8395SChristian S.J. Peron bpfattach2(struct ifnet *ifp, u_int dlt, u_int hdrlen, struct bpf_if **driverp) 241824a229f4SSam Leffler { 2419df8bae1dSRodney W. Grimes struct bpf_if *bp; 242019ba8395SChristian S.J. Peron 242119ba8395SChristian S.J. Peron bp = malloc(sizeof(*bp), M_BPF, M_NOWAIT | M_ZERO); 2422572bde2aSRobert Watson if (bp == NULL) 2423df8bae1dSRodney W. Grimes panic("bpfattach"); 2424df8bae1dSRodney W. Grimes 24254a3feeaaSRobert Watson LIST_INIT(&bp->bif_dlist); 242651ec1eb7SAlexander V. Chernikov LIST_INIT(&bp->bif_wlist); 2427df8bae1dSRodney W. Grimes bp->bif_ifp = ifp; 2428df8bae1dSRodney W. Grimes bp->bif_dlt = dlt; 2429e4b3229aSAlexander V. Chernikov rw_init(&bp->bif_lock, "bpf interface lock"); 243016d878ccSChristian S.J. Peron KASSERT(*driverp == NULL, ("bpfattach2: driverp already initialized")); 243116d878ccSChristian S.J. Peron *driverp = bp; 2432df8bae1dSRodney W. Grimes 2433e4b3229aSAlexander V. Chernikov BPF_LOCK(); 24344a3feeaaSRobert Watson LIST_INSERT_HEAD(&bpf_iflist, bp, bif_next); 2435e4b3229aSAlexander V. Chernikov BPF_UNLOCK(); 2436df8bae1dSRodney W. Grimes 2437547d94bdSJung-uk Kim bp->bif_hdrlen = hdrlen; 2438df8bae1dSRodney W. Grimes 24392eeab939SGarrett Wollman if (bootverbose) 244024a229f4SSam Leffler if_printf(ifp, "bpf attached\n"); 2441df8bae1dSRodney W. Grimes } 244253ac6efbSJulian Elischer 2443de5d9935SRobert Watson /* 2444de5d9935SRobert Watson * Detach bpf from an interface. This involves detaching each descriptor 2445*6c74ff0eSAlexander V. Chernikov * associated with the interface. Notify each descriptor as it's detached 2446*6c74ff0eSAlexander V. Chernikov * so that any sleepers wake up and get ENXIO. 2447de5d9935SRobert Watson */ 2448de5d9935SRobert Watson void 244919ba8395SChristian S.J. Peron bpfdetach(struct ifnet *ifp) 2450de5d9935SRobert Watson { 24514a3feeaaSRobert Watson struct bpf_if *bp; 2452de5d9935SRobert Watson struct bpf_d *d; 24539a7e6bacSLawrence Stewart #ifdef INVARIANTS 24549a7e6bacSLawrence Stewart int ndetached; 2455de5d9935SRobert Watson 24569a7e6bacSLawrence Stewart ndetached = 0; 24579a7e6bacSLawrence Stewart #endif 24589a7e6bacSLawrence Stewart 24599a7e6bacSLawrence Stewart /* Find all bpf_if struct's which reference ifp and detach them. */ 24609a7e6bacSLawrence Stewart do { 2461e4b3229aSAlexander V. Chernikov BPF_LOCK(); 24624a3feeaaSRobert Watson LIST_FOREACH(bp, &bpf_iflist, bif_next) { 2463de5d9935SRobert Watson if (ifp == bp->bif_ifp) 2464de5d9935SRobert Watson break; 2465de5d9935SRobert Watson } 24669a7e6bacSLawrence Stewart if (bp != NULL) 24674a3feeaaSRobert Watson LIST_REMOVE(bp, bif_next); 2468e4b3229aSAlexander V. Chernikov BPF_UNLOCK(); 2469de5d9935SRobert Watson 24709a7e6bacSLawrence Stewart if (bp != NULL) { 24719a7e6bacSLawrence Stewart #ifdef INVARIANTS 24729a7e6bacSLawrence Stewart ndetached++; 24739a7e6bacSLawrence Stewart #endif 24744a3feeaaSRobert Watson while ((d = LIST_FIRST(&bp->bif_dlist)) != NULL) { 2475e7bb21b3SJonathan Lemon bpf_detachd(d); 2476e4b3229aSAlexander V. Chernikov BPFD_WLOCK(d); 2477e7bb21b3SJonathan Lemon bpf_wakeup(d); 2478e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 2479e7bb21b3SJonathan Lemon } 2480*6c74ff0eSAlexander V. Chernikov /* Free writer-only descriptors */ 2481*6c74ff0eSAlexander V. Chernikov while ((d = LIST_FIRST(&bp->bif_wlist)) != NULL) { 2482*6c74ff0eSAlexander V. Chernikov bpf_detachd(d); 2483*6c74ff0eSAlexander V. Chernikov BPFD_WLOCK(d); 2484*6c74ff0eSAlexander V. Chernikov bpf_wakeup(d); 2485*6c74ff0eSAlexander V. Chernikov BPFD_WUNLOCK(d); 2486*6c74ff0eSAlexander V. Chernikov } 2487e4b3229aSAlexander V. Chernikov rw_destroy(&bp->bif_lock); 2488de5d9935SRobert Watson free(bp, M_BPF); 24898eab61f3SSam Leffler } 24909a7e6bacSLawrence Stewart } while (bp != NULL); 24919a7e6bacSLawrence Stewart 24929a7e6bacSLawrence Stewart #ifdef INVARIANTS 24939a7e6bacSLawrence Stewart if (ndetached == 0) 24949a7e6bacSLawrence Stewart printf("bpfdetach: %s was not attached\n", ifp->if_xname); 24959a7e6bacSLawrence Stewart #endif 24969a7e6bacSLawrence Stewart } 2497de5d9935SRobert Watson 24988eab61f3SSam Leffler /* 24998eab61f3SSam Leffler * Get a list of available data link type of the interface. 25008eab61f3SSam Leffler */ 25018eab61f3SSam Leffler static int 250219ba8395SChristian S.J. Peron bpf_getdltlist(struct bpf_d *d, struct bpf_dltlist *bfl) 25038eab61f3SSam Leffler { 25048eab61f3SSam Leffler int n, error; 25058eab61f3SSam Leffler struct ifnet *ifp; 25068eab61f3SSam Leffler struct bpf_if *bp; 25078eab61f3SSam Leffler 25088eab61f3SSam Leffler ifp = d->bd_bif->bif_ifp; 25098eab61f3SSam Leffler n = 0; 25108eab61f3SSam Leffler error = 0; 2511e4b3229aSAlexander V. Chernikov BPF_LOCK(); 25124a3feeaaSRobert Watson LIST_FOREACH(bp, &bpf_iflist, bif_next) { 25138eab61f3SSam Leffler if (bp->bif_ifp != ifp) 25148eab61f3SSam Leffler continue; 25158eab61f3SSam Leffler if (bfl->bfl_list != NULL) { 25168eab61f3SSam Leffler if (n >= bfl->bfl_len) { 2517e4b3229aSAlexander V. Chernikov BPF_UNLOCK(); 25188eab61f3SSam Leffler return (ENOMEM); 25198eab61f3SSam Leffler } 25208eab61f3SSam Leffler error = copyout(&bp->bif_dlt, 25218eab61f3SSam Leffler bfl->bfl_list + n, sizeof(u_int)); 25228eab61f3SSam Leffler } 25238eab61f3SSam Leffler n++; 25248eab61f3SSam Leffler } 2525e4b3229aSAlexander V. Chernikov BPF_UNLOCK(); 25268eab61f3SSam Leffler bfl->bfl_len = n; 25278eab61f3SSam Leffler return (error); 25288eab61f3SSam Leffler } 25298eab61f3SSam Leffler 25308eab61f3SSam Leffler /* 25318eab61f3SSam Leffler * Set the data link type of a BPF instance. 25328eab61f3SSam Leffler */ 25338eab61f3SSam Leffler static int 253419ba8395SChristian S.J. Peron bpf_setdlt(struct bpf_d *d, u_int dlt) 25358eab61f3SSam Leffler { 25368eab61f3SSam Leffler int error, opromisc; 25378eab61f3SSam Leffler struct ifnet *ifp; 25388eab61f3SSam Leffler struct bpf_if *bp; 25398eab61f3SSam Leffler 2540*6c74ff0eSAlexander V. Chernikov BPF_LOCK_ASSERT(); 2541*6c74ff0eSAlexander V. Chernikov 25428eab61f3SSam Leffler if (d->bd_bif->bif_dlt == dlt) 25438eab61f3SSam Leffler return (0); 25448eab61f3SSam Leffler ifp = d->bd_bif->bif_ifp; 2545*6c74ff0eSAlexander V. Chernikov 25464a3feeaaSRobert Watson LIST_FOREACH(bp, &bpf_iflist, bif_next) { 25478eab61f3SSam Leffler if (bp->bif_ifp == ifp && bp->bif_dlt == dlt) 25488eab61f3SSam Leffler break; 25498eab61f3SSam Leffler } 2550*6c74ff0eSAlexander V. Chernikov 25518eab61f3SSam Leffler if (bp != NULL) { 25528eab61f3SSam Leffler opromisc = d->bd_promisc; 25538eab61f3SSam Leffler bpf_attachd(d, bp); 2554e4b3229aSAlexander V. Chernikov BPFD_WLOCK(d); 25558eab61f3SSam Leffler reset_d(d); 2556e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(d); 25578eab61f3SSam Leffler if (opromisc) { 25588eab61f3SSam Leffler error = ifpromisc(bp->bif_ifp, 1); 25598eab61f3SSam Leffler if (error) 25608eab61f3SSam Leffler if_printf(bp->bif_ifp, 25618eab61f3SSam Leffler "bpf_setdlt: ifpromisc failed (%d)\n", 25628eab61f3SSam Leffler error); 25638eab61f3SSam Leffler else 25648eab61f3SSam Leffler d->bd_promisc = 1; 25658eab61f3SSam Leffler } 25668eab61f3SSam Leffler } 25678eab61f3SSam Leffler return (bp == NULL ? EINVAL : 0); 2568de5d9935SRobert Watson } 2569de5d9935SRobert Watson 25703f54a085SPoul-Henning Kamp static void 257119ba8395SChristian S.J. Peron bpf_drvinit(void *unused) 257253ac6efbSJulian Elischer { 2573136600feSEd Schouten struct cdev *dev; 257453ac6efbSJulian Elischer 25756008862bSJohn Baldwin mtx_init(&bpf_mtx, "bpf global lock", NULL, MTX_DEF); 25764a3feeaaSRobert Watson LIST_INIT(&bpf_iflist); 2577136600feSEd Schouten 2578136600feSEd Schouten dev = make_dev(&bpf_cdevsw, 0, UID_ROOT, GID_WHEEL, 0600, "bpf"); 2579136600feSEd Schouten /* For compatibility */ 2580136600feSEd Schouten make_dev_alias(dev, "bpf0"); 25817198bf47SJulian Elischer } 258253ac6efbSJulian Elischer 25830e37f3e1SChristian S.J. Peron /* 25840e37f3e1SChristian S.J. Peron * Zero out the various packet counters associated with all of the bpf 25850e37f3e1SChristian S.J. Peron * descriptors. At some point, we will probably want to get a bit more 25860e37f3e1SChristian S.J. Peron * granular and allow the user to specify descriptors to be zeroed. 25870e37f3e1SChristian S.J. Peron */ 25880e37f3e1SChristian S.J. Peron static void 25890e37f3e1SChristian S.J. Peron bpf_zero_counters(void) 25900e37f3e1SChristian S.J. Peron { 25910e37f3e1SChristian S.J. Peron struct bpf_if *bp; 25920e37f3e1SChristian S.J. Peron struct bpf_d *bd; 25930e37f3e1SChristian S.J. Peron 2594e4b3229aSAlexander V. Chernikov BPF_LOCK(); 25950e37f3e1SChristian S.J. Peron LIST_FOREACH(bp, &bpf_iflist, bif_next) { 2596e4b3229aSAlexander V. Chernikov BPFIF_RLOCK(bp); 25970e37f3e1SChristian S.J. Peron LIST_FOREACH(bd, &bp->bif_dlist, bd_next) { 2598e4b3229aSAlexander V. Chernikov BPFD_WLOCK(bd); 25990e37f3e1SChristian S.J. Peron bd->bd_rcount = 0; 26000e37f3e1SChristian S.J. Peron bd->bd_dcount = 0; 26010e37f3e1SChristian S.J. Peron bd->bd_fcount = 0; 26020e37f3e1SChristian S.J. Peron bd->bd_wcount = 0; 26030e37f3e1SChristian S.J. Peron bd->bd_wfcount = 0; 26040e37f3e1SChristian S.J. Peron bd->bd_zcopy = 0; 2605e4b3229aSAlexander V. Chernikov BPFD_WUNLOCK(bd); 26060e37f3e1SChristian S.J. Peron } 2607e4b3229aSAlexander V. Chernikov BPFIF_RUNLOCK(bp); 26080e37f3e1SChristian S.J. Peron } 2609e4b3229aSAlexander V. Chernikov BPF_UNLOCK(); 26100e37f3e1SChristian S.J. Peron } 26110e37f3e1SChristian S.J. Peron 2612*6c74ff0eSAlexander V. Chernikov /* 2613*6c74ff0eSAlexander V. Chernikov * Fill filter statistics 2614*6c74ff0eSAlexander V. Chernikov */ 261569f7644bSChristian S.J. Peron static void 261669f7644bSChristian S.J. Peron bpfstats_fill_xbpf(struct xbpf_d *d, struct bpf_d *bd) 261769f7644bSChristian S.J. Peron { 261869f7644bSChristian S.J. Peron 261969f7644bSChristian S.J. Peron bzero(d, sizeof(*d)); 262069f7644bSChristian S.J. Peron BPFD_LOCK_ASSERT(bd); 26214d621040SChristian S.J. Peron d->bd_structsize = sizeof(*d); 2622*6c74ff0eSAlexander V. Chernikov /* XXX: reading should be protected by global lock */ 262369f7644bSChristian S.J. Peron d->bd_immediate = bd->bd_immediate; 262469f7644bSChristian S.J. Peron d->bd_promisc = bd->bd_promisc; 262569f7644bSChristian S.J. Peron d->bd_hdrcmplt = bd->bd_hdrcmplt; 2626560a54e1SJung-uk Kim d->bd_direction = bd->bd_direction; 2627560a54e1SJung-uk Kim d->bd_feedback = bd->bd_feedback; 262869f7644bSChristian S.J. Peron d->bd_async = bd->bd_async; 262969f7644bSChristian S.J. Peron d->bd_rcount = bd->bd_rcount; 263069f7644bSChristian S.J. Peron d->bd_dcount = bd->bd_dcount; 263169f7644bSChristian S.J. Peron d->bd_fcount = bd->bd_fcount; 263269f7644bSChristian S.J. Peron d->bd_sig = bd->bd_sig; 263369f7644bSChristian S.J. Peron d->bd_slen = bd->bd_slen; 263469f7644bSChristian S.J. Peron d->bd_hlen = bd->bd_hlen; 263569f7644bSChristian S.J. Peron d->bd_bufsize = bd->bd_bufsize; 263669f7644bSChristian S.J. Peron d->bd_pid = bd->bd_pid; 263769f7644bSChristian S.J. Peron strlcpy(d->bd_ifname, 263869f7644bSChristian S.J. Peron bd->bd_bif->bif_ifp->if_xname, IFNAMSIZ); 263993e39f0bSChristian S.J. Peron d->bd_locked = bd->bd_locked; 26404d621040SChristian S.J. Peron d->bd_wcount = bd->bd_wcount; 26414d621040SChristian S.J. Peron d->bd_wdcount = bd->bd_wdcount; 26424d621040SChristian S.J. Peron d->bd_wfcount = bd->bd_wfcount; 26434d621040SChristian S.J. Peron d->bd_zcopy = bd->bd_zcopy; 26444d621040SChristian S.J. Peron d->bd_bufmode = bd->bd_bufmode; 264569f7644bSChristian S.J. Peron } 264669f7644bSChristian S.J. Peron 2647*6c74ff0eSAlexander V. Chernikov /* 2648*6c74ff0eSAlexander V. Chernikov * Handle `netstat -B' stats request 2649*6c74ff0eSAlexander V. Chernikov */ 265069f7644bSChristian S.J. Peron static int 265169f7644bSChristian S.J. Peron bpf_stats_sysctl(SYSCTL_HANDLER_ARGS) 265269f7644bSChristian S.J. Peron { 26530e37f3e1SChristian S.J. Peron struct xbpf_d *xbdbuf, *xbd, zerostats; 2654422a63daSChristian S.J. Peron int index, error; 265569f7644bSChristian S.J. Peron struct bpf_if *bp; 265669f7644bSChristian S.J. Peron struct bpf_d *bd; 265769f7644bSChristian S.J. Peron 265869f7644bSChristian S.J. Peron /* 265969f7644bSChristian S.J. Peron * XXX This is not technically correct. It is possible for non 266069f7644bSChristian S.J. Peron * privileged users to open bpf devices. It would make sense 266169f7644bSChristian S.J. Peron * if the users who opened the devices were able to retrieve 266269f7644bSChristian S.J. Peron * the statistics for them, too. 266369f7644bSChristian S.J. Peron */ 2664acd3428bSRobert Watson error = priv_check(req->td, PRIV_NET_BPF); 266569f7644bSChristian S.J. Peron if (error) 266669f7644bSChristian S.J. Peron return (error); 26670e37f3e1SChristian S.J. Peron /* 26680e37f3e1SChristian S.J. Peron * Check to see if the user is requesting that the counters be 26690e37f3e1SChristian S.J. Peron * zeroed out. Explicitly check that the supplied data is zeroed, 26700e37f3e1SChristian S.J. Peron * as we aren't allowing the user to set the counters currently. 26710e37f3e1SChristian S.J. Peron */ 26720e37f3e1SChristian S.J. Peron if (req->newptr != NULL) { 26730e37f3e1SChristian S.J. Peron if (req->newlen != sizeof(zerostats)) 26740e37f3e1SChristian S.J. Peron return (EINVAL); 26750e37f3e1SChristian S.J. Peron bzero(&zerostats, sizeof(zerostats)); 26760e37f3e1SChristian S.J. Peron xbd = req->newptr; 26770e37f3e1SChristian S.J. Peron if (bcmp(xbd, &zerostats, sizeof(*xbd)) != 0) 26780e37f3e1SChristian S.J. Peron return (EINVAL); 26790e37f3e1SChristian S.J. Peron bpf_zero_counters(); 26800e37f3e1SChristian S.J. Peron return (0); 26810e37f3e1SChristian S.J. Peron } 268269f7644bSChristian S.J. Peron if (req->oldptr == NULL) 2683422a63daSChristian S.J. Peron return (SYSCTL_OUT(req, 0, bpf_bpfd_cnt * sizeof(*xbd))); 268469f7644bSChristian S.J. Peron if (bpf_bpfd_cnt == 0) 268569f7644bSChristian S.J. Peron return (SYSCTL_OUT(req, 0, 0)); 2686422a63daSChristian S.J. Peron xbdbuf = malloc(req->oldlen, M_BPF, M_WAITOK); 2687e4b3229aSAlexander V. Chernikov BPF_LOCK(); 2688422a63daSChristian S.J. Peron if (req->oldlen < (bpf_bpfd_cnt * sizeof(*xbd))) { 2689e4b3229aSAlexander V. Chernikov BPF_UNLOCK(); 2690422a63daSChristian S.J. Peron free(xbdbuf, M_BPF); 2691422a63daSChristian S.J. Peron return (ENOMEM); 2692422a63daSChristian S.J. Peron } 2693422a63daSChristian S.J. Peron index = 0; 269469f7644bSChristian S.J. Peron LIST_FOREACH(bp, &bpf_iflist, bif_next) { 2695e4b3229aSAlexander V. Chernikov BPFIF_RLOCK(bp); 269651ec1eb7SAlexander V. Chernikov /* Send writers-only first */ 269751ec1eb7SAlexander V. Chernikov LIST_FOREACH(bd, &bp->bif_wlist, bd_next) { 269851ec1eb7SAlexander V. Chernikov xbd = &xbdbuf[index++]; 269951ec1eb7SAlexander V. Chernikov BPFD_RLOCK(bd); 270051ec1eb7SAlexander V. Chernikov bpfstats_fill_xbpf(xbd, bd); 270151ec1eb7SAlexander V. Chernikov BPFD_RUNLOCK(bd); 270251ec1eb7SAlexander V. Chernikov } 270369f7644bSChristian S.J. Peron LIST_FOREACH(bd, &bp->bif_dlist, bd_next) { 2704422a63daSChristian S.J. Peron xbd = &xbdbuf[index++]; 2705e4b3229aSAlexander V. Chernikov BPFD_RLOCK(bd); 2706422a63daSChristian S.J. Peron bpfstats_fill_xbpf(xbd, bd); 2707e4b3229aSAlexander V. Chernikov BPFD_RUNLOCK(bd); 270869f7644bSChristian S.J. Peron } 2709e4b3229aSAlexander V. Chernikov BPFIF_RUNLOCK(bp); 271069f7644bSChristian S.J. Peron } 2711e4b3229aSAlexander V. Chernikov BPF_UNLOCK(); 2712422a63daSChristian S.J. Peron error = SYSCTL_OUT(req, xbdbuf, index * sizeof(*xbd)); 2713422a63daSChristian S.J. Peron free(xbdbuf, M_BPF); 271469f7644bSChristian S.J. Peron return (error); 271569f7644bSChristian S.J. Peron } 271669f7644bSChristian S.J. Peron 2717237fdd78SRobert Watson SYSINIT(bpfdev,SI_SUB_DRIVERS,SI_ORDER_MIDDLE,bpf_drvinit,NULL); 271853ac6efbSJulian Elischer 27195bb5f2c9SPeter Wemm #else /* !DEV_BPF && !NETGRAPH_BPF */ 2720f8dc4716SMike Smith /* 2721f8dc4716SMike Smith * NOP stubs to allow bpf-using drivers to load and function. 2722f8dc4716SMike Smith * 2723f8dc4716SMike Smith * A 'better' implementation would allow the core bpf functionality 2724f8dc4716SMike Smith * to be loaded at runtime. 2725f8dc4716SMike Smith */ 27267eae78a4SChristian S.J. Peron static struct bpf_if bp_null; 2727f8dc4716SMike Smith 2728f8dc4716SMike Smith void 272919ba8395SChristian S.J. Peron bpf_tap(struct bpf_if *bp, u_char *pkt, u_int pktlen) 2730f8dc4716SMike Smith { 2731f8dc4716SMike Smith } 2732f8dc4716SMike Smith 2733f8dc4716SMike Smith void 273419ba8395SChristian S.J. Peron bpf_mtap(struct bpf_if *bp, struct mbuf *m) 2735f8dc4716SMike Smith { 2736f8dc4716SMike Smith } 2737f8dc4716SMike Smith 2738f8dc4716SMike Smith void 273919ba8395SChristian S.J. Peron bpf_mtap2(struct bpf_if *bp, void *d, u_int l, struct mbuf *m) 2740437ffe18SSam Leffler { 2741437ffe18SSam Leffler } 2742437ffe18SSam Leffler 2743437ffe18SSam Leffler void 274419ba8395SChristian S.J. Peron bpfattach(struct ifnet *ifp, u_int dlt, u_int hdrlen) 2745f8dc4716SMike Smith { 27467eae78a4SChristian S.J. Peron 27477eae78a4SChristian S.J. Peron bpfattach2(ifp, dlt, hdrlen, &ifp->if_bpf); 2748f8dc4716SMike Smith } 2749f8dc4716SMike Smith 2750da626c17SBill Paul void 275119ba8395SChristian S.J. Peron bpfattach2(struct ifnet *ifp, u_int dlt, u_int hdrlen, struct bpf_if **driverp) 27525f7a7923SSam Leffler { 27537eae78a4SChristian S.J. Peron 27547eae78a4SChristian S.J. Peron *driverp = &bp_null; 27555f7a7923SSam Leffler } 27565f7a7923SSam Leffler 27575f7a7923SSam Leffler void 275819ba8395SChristian S.J. Peron bpfdetach(struct ifnet *ifp) 2759da626c17SBill Paul { 2760da626c17SBill Paul } 2761da626c17SBill Paul 2762f8dc4716SMike Smith u_int 276319ba8395SChristian S.J. Peron bpf_filter(const struct bpf_insn *pc, u_char *p, u_int wirelen, u_int buflen) 2764f8dc4716SMike Smith { 2765f8dc4716SMike Smith return -1; /* "no filter" behaviour */ 2766f8dc4716SMike Smith } 2767f8dc4716SMike Smith 27685bb5f2c9SPeter Wemm int 276919ba8395SChristian S.J. Peron bpf_validate(const struct bpf_insn *f, int len) 27705bb5f2c9SPeter Wemm { 27715bb5f2c9SPeter Wemm return 0; /* false */ 27725bb5f2c9SPeter Wemm } 27735bb5f2c9SPeter Wemm 27745bb5f2c9SPeter Wemm #endif /* !DEV_BPF && !NETGRAPH_BPF */ 2775