1c398230bSWarner Losh /*- 2df8bae1dSRodney W. Grimes * Copyright (c) 1990, 1991, 1993 3253a3814SLawrence Stewart * The Regents of the University of California. All rights reserved. 4df8bae1dSRodney W. Grimes * 5df8bae1dSRodney W. Grimes * This code is derived from the Stanford/CMU enet packet filter, 6df8bae1dSRodney W. Grimes * (net/enet.c) distributed as part of 4.3BSD, and code contributed 7df8bae1dSRodney W. Grimes * to Berkeley by Steven McCanne and Van Jacobson both of Lawrence 8df8bae1dSRodney W. Grimes * Berkeley Laboratory. 9df8bae1dSRodney W. Grimes * 10df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 11df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 12df8bae1dSRodney W. Grimes * are met: 13df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 14df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 15df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 16df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 17df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 18fbbd9655SWarner Losh * 3. Neither the name of the University nor the names of its contributors 19df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 20df8bae1dSRodney W. Grimes * without specific prior written permission. 21df8bae1dSRodney W. Grimes * 22df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 23df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 24df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 25df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 26df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 27df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 28df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 29df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 30df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 31df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 32df8bae1dSRodney W. Grimes * SUCH DAMAGE. 33df8bae1dSRodney W. Grimes * 344f252c4dSRuslan Ermilov * @(#)bpf.c 8.4 (Berkeley) 1/9/95 35df8bae1dSRodney W. Grimes */ 36df8bae1dSRodney W. Grimes 37c7866007SRobert Watson #include <sys/cdefs.h> 38c7866007SRobert Watson __FBSDID("$FreeBSD$"); 39c7866007SRobert Watson 405bb5f2c9SPeter Wemm #include "opt_bpf.h" 41fc0a61a4SKonstantin Belousov #include "opt_compat.h" 4205fc4164SBjoern A. Zeeb #include "opt_ddb.h" 435bb5f2c9SPeter Wemm #include "opt_netgraph.h" 44df8bae1dSRodney W. Grimes 4595aab9ccSJohn-Mark Gurney #include <sys/types.h> 46df8bae1dSRodney W. Grimes #include <sys/param.h> 47e4b3229aSAlexander V. Chernikov #include <sys/lock.h> 48e4b3229aSAlexander V. Chernikov #include <sys/rwlock.h> 49df8bae1dSRodney W. Grimes #include <sys/systm.h> 50ce7609a4SBruce Evans #include <sys/conf.h> 51e76eee55SPoul-Henning Kamp #include <sys/fcntl.h> 52ebd8672cSBjoern A. Zeeb #include <sys/jail.h> 534d1d4912SBruce Evans #include <sys/malloc.h> 54df8bae1dSRodney W. Grimes #include <sys/mbuf.h> 55df8bae1dSRodney W. Grimes #include <sys/time.h> 56acd3428bSRobert Watson #include <sys/priv.h> 57df8bae1dSRodney W. Grimes #include <sys/proc.h> 580310c19fSBruce Evans #include <sys/signalvar.h> 59528f627fSBruce Evans #include <sys/filio.h> 60528f627fSBruce Evans #include <sys/sockio.h> 61528f627fSBruce Evans #include <sys/ttycom.h> 62e76eee55SPoul-Henning Kamp #include <sys/uio.h> 63df8bae1dSRodney W. Grimes 6495aab9ccSJohn-Mark Gurney #include <sys/event.h> 6595aab9ccSJohn-Mark Gurney #include <sys/file.h> 66243ac7d8SPeter Wemm #include <sys/poll.h> 6795aab9ccSJohn-Mark Gurney #include <sys/proc.h> 68df8bae1dSRodney W. Grimes 69df8bae1dSRodney W. Grimes #include <sys/socket.h> 70df8bae1dSRodney W. Grimes 7105fc4164SBjoern A. Zeeb #ifdef DDB 7205fc4164SBjoern A. Zeeb #include <ddb/ddb.h> 7305fc4164SBjoern A. Zeeb #endif 7405fc4164SBjoern A. Zeeb 75fba9235dSBruce Evans #include <net/if.h> 7676039bc8SGleb Smirnoff #include <net/if_var.h> 774fb3a820SAlexander V. Chernikov #include <net/if_dl.h> 78df8bae1dSRodney W. Grimes #include <net/bpf.h> 794d621040SChristian S.J. Peron #include <net/bpf_buffer.h> 80ae275efcSJung-uk Kim #ifdef BPF_JITTER 81ae275efcSJung-uk Kim #include <net/bpf_jitter.h> 82ae275efcSJung-uk Kim #endif 834d621040SChristian S.J. Peron #include <net/bpf_zerocopy.h> 84df8bae1dSRodney W. Grimes #include <net/bpfdesc.h> 854fb3a820SAlexander V. Chernikov #include <net/route.h> 86530c0060SRobert Watson #include <net/vnet.h> 87df8bae1dSRodney W. Grimes 88df8bae1dSRodney W. Grimes #include <netinet/in.h> 89df8bae1dSRodney W. Grimes #include <netinet/if_ether.h> 90df8bae1dSRodney W. Grimes #include <sys/kernel.h> 91f708ef1bSPoul-Henning Kamp #include <sys/sysctl.h> 927b778b5eSEivind Eklund 93246b5467SSam Leffler #include <net80211/ieee80211_freebsd.h> 94246b5467SSam Leffler 95aed55708SRobert Watson #include <security/mac/mac_framework.h> 96aed55708SRobert Watson 974d621040SChristian S.J. Peron MALLOC_DEFINE(M_BPF, "BPF", "BPF data"); 9887f6c662SJulian Elischer 99b23cbbe6SMark Johnston struct bpf_if { 100b23cbbe6SMark Johnston #define bif_next bif_ext.bif_next 101b23cbbe6SMark Johnston #define bif_dlist bif_ext.bif_dlist 102b23cbbe6SMark Johnston struct bpf_if_ext bif_ext; /* public members */ 103b23cbbe6SMark Johnston u_int bif_dlt; /* link layer type */ 104b23cbbe6SMark Johnston u_int bif_hdrlen; /* length of link header */ 105b23cbbe6SMark Johnston struct ifnet *bif_ifp; /* corresponding interface */ 106b23cbbe6SMark Johnston struct rwlock bif_lock; /* interface lock */ 107b23cbbe6SMark Johnston LIST_HEAD(, bpf_d) bif_wlist; /* writer-only list */ 108b23cbbe6SMark Johnston int bif_flags; /* Interface flags */ 109*9ce40d32SKristof Provost struct bpf_if **bif_bpf; /* Pointer to pointer to us */ 110b23cbbe6SMark Johnston }; 111b23cbbe6SMark Johnston 112b23cbbe6SMark Johnston CTASSERT(offsetof(struct bpf_if, bif_ext) == 0); 113b23cbbe6SMark Johnston 1145bb5f2c9SPeter Wemm #if defined(DEV_BPF) || defined(NETGRAPH_BPF) 11553ac6efbSJulian Elischer 116df8bae1dSRodney W. Grimes #define PRINET 26 /* interruptible */ 117df8bae1dSRodney W. Grimes 118547d94bdSJung-uk Kim #define SIZEOF_BPF_HDR(type) \ 119547d94bdSJung-uk Kim (offsetof(type, bh_hdrlen) + sizeof(((type *)0)->bh_hdrlen)) 120547d94bdSJung-uk Kim 121fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 122fc0a61a4SKonstantin Belousov #include <sys/mount.h> 123fc0a61a4SKonstantin Belousov #include <compat/freebsd32/freebsd32.h> 124fc0a61a4SKonstantin Belousov #define BPF_ALIGNMENT32 sizeof(int32_t) 125d9c9c81cSPedro F. Giffuni #define BPF_WORDALIGN32(x) roundup2(x, BPF_ALIGNMENT32) 126fc0a61a4SKonstantin Belousov 127547d94bdSJung-uk Kim #ifndef BURN_BRIDGES 128fc0a61a4SKonstantin Belousov /* 129fc0a61a4SKonstantin Belousov * 32-bit version of structure prepended to each packet. We use this header 130fc0a61a4SKonstantin Belousov * instead of the standard one for 32-bit streams. We mark the a stream as 131fc0a61a4SKonstantin Belousov * 32-bit the first time we see a 32-bit compat ioctl request. 132fc0a61a4SKonstantin Belousov */ 133fc0a61a4SKonstantin Belousov struct bpf_hdr32 { 134fc0a61a4SKonstantin Belousov struct timeval32 bh_tstamp; /* time stamp */ 135fc0a61a4SKonstantin Belousov uint32_t bh_caplen; /* length of captured portion */ 136fc0a61a4SKonstantin Belousov uint32_t bh_datalen; /* original length of packet */ 137fc0a61a4SKonstantin Belousov uint16_t bh_hdrlen; /* length of bpf header (this struct 138fc0a61a4SKonstantin Belousov plus alignment padding) */ 139fc0a61a4SKonstantin Belousov }; 140253a3814SLawrence Stewart #endif 141fc0a61a4SKonstantin Belousov 142fc0a61a4SKonstantin Belousov struct bpf_program32 { 143fc0a61a4SKonstantin Belousov u_int bf_len; 144fc0a61a4SKonstantin Belousov uint32_t bf_insns; 145fc0a61a4SKonstantin Belousov }; 146fc0a61a4SKonstantin Belousov 147fc0a61a4SKonstantin Belousov struct bpf_dltlist32 { 148fc0a61a4SKonstantin Belousov u_int bfl_len; 149fc0a61a4SKonstantin Belousov u_int bfl_list; 150fc0a61a4SKonstantin Belousov }; 151fc0a61a4SKonstantin Belousov 152fc0a61a4SKonstantin Belousov #define BIOCSETF32 _IOW('B', 103, struct bpf_program32) 153fc0a61a4SKonstantin Belousov #define BIOCSRTIMEOUT32 _IOW('B', 109, struct timeval32) 154fc0a61a4SKonstantin Belousov #define BIOCGRTIMEOUT32 _IOR('B', 110, struct timeval32) 155fc0a61a4SKonstantin Belousov #define BIOCGDLTLIST32 _IOWR('B', 121, struct bpf_dltlist32) 156fc0a61a4SKonstantin Belousov #define BIOCSETWF32 _IOW('B', 123, struct bpf_program32) 157fc0a61a4SKonstantin Belousov #define BIOCSETFNR32 _IOW('B', 130, struct bpf_program32) 158253a3814SLawrence Stewart #endif 159fc0a61a4SKonstantin Belousov 160df8bae1dSRodney W. Grimes /* 161d1a67300SRobert Watson * bpf_iflist is a list of BPF interface structures, each corresponding to a 162d1a67300SRobert Watson * specific DLT. The same network interface might have several BPF interface 163d1a67300SRobert Watson * structures registered by different layers in the stack (i.e., 802.11 164d1a67300SRobert Watson * frames, ethernet frames, etc). 165df8bae1dSRodney W. Grimes */ 166f079a0faSAlexander V. Chernikov static LIST_HEAD(, bpf_if) bpf_iflist, bpf_freelist; 167e7bb21b3SJonathan Lemon static struct mtx bpf_mtx; /* bpf global lock */ 16869f7644bSChristian S.J. Peron static int bpf_bpfd_cnt; 169df8bae1dSRodney W. Grimes 17019ba8395SChristian S.J. Peron static void bpf_attachd(struct bpf_d *, struct bpf_if *); 17119ba8395SChristian S.J. Peron static void bpf_detachd(struct bpf_d *); 1726c74ff0eSAlexander V. Chernikov static void bpf_detachd_locked(struct bpf_d *); 173929ddbbbSAlfred Perlstein static void bpf_freed(struct bpf_d *); 174cb44b6dfSAndrew Thompson static int bpf_movein(struct uio *, int, struct ifnet *, struct mbuf **, 1754fb3a820SAlexander V. Chernikov struct sockaddr *, int *, struct bpf_d *); 176929ddbbbSAlfred Perlstein static int bpf_setif(struct bpf_d *, struct ifreq *); 177929ddbbbSAlfred Perlstein static void bpf_timed_out(void *); 178e7bb21b3SJonathan Lemon static __inline void 179929ddbbbSAlfred Perlstein bpf_wakeup(struct bpf_d *); 1804d621040SChristian S.J. Peron static void catchpacket(struct bpf_d *, u_char *, u_int, u_int, 1814d621040SChristian S.J. Peron void (*)(struct bpf_d *, caddr_t, u_int, void *, u_int), 182547d94bdSJung-uk Kim struct bintime *); 183929ddbbbSAlfred Perlstein static void reset_d(struct bpf_d *); 18493e39f0bSChristian S.J. Peron static int bpf_setf(struct bpf_d *, struct bpf_program *, u_long cmd); 1858eab61f3SSam Leffler static int bpf_getdltlist(struct bpf_d *, struct bpf_dltlist *); 1868eab61f3SSam Leffler static int bpf_setdlt(struct bpf_d *, u_int); 18795aab9ccSJohn-Mark Gurney static void filt_bpfdetach(struct knote *); 18895aab9ccSJohn-Mark Gurney static int filt_bpfread(struct knote *, long); 189a3272e3cSChristian S.J. Peron static void bpf_drvinit(void *); 19069f7644bSChristian S.J. Peron static int bpf_stats_sysctl(SYSCTL_HANDLER_ARGS); 19169f7644bSChristian S.J. Peron 19269f7644bSChristian S.J. Peron SYSCTL_NODE(_net, OID_AUTO, bpf, CTLFLAG_RW, 0, "bpf sysctl"); 19312dc9582SJung-uk Kim int bpf_maxinsns = BPF_MAXINSNS; 19469f7644bSChristian S.J. Peron SYSCTL_INT(_net_bpf, OID_AUTO, maxinsns, CTLFLAG_RW, 19569f7644bSChristian S.J. Peron &bpf_maxinsns, 0, "Maximum bpf program instructions"); 196ffeeb924SChristian S.J. Peron static int bpf_zerocopy_enable = 0; 1974d621040SChristian S.J. Peron SYSCTL_INT(_net_bpf, OID_AUTO, zerocopy_enable, CTLFLAG_RW, 1984d621040SChristian S.J. Peron &bpf_zerocopy_enable, 0, "Enable new zero-copy BPF buffer sessions"); 1996472ac3dSEd Schouten static SYSCTL_NODE(_net_bpf, OID_AUTO, stats, CTLFLAG_MPSAFE | CTLFLAG_RW, 20069f7644bSChristian S.J. Peron bpf_stats_sysctl, "bpf statistics portal"); 201df8bae1dSRodney W. Grimes 20251ec1eb7SAlexander V. Chernikov static VNET_DEFINE(int, bpf_optimize_writers) = 0; 20351ec1eb7SAlexander V. Chernikov #define V_bpf_optimize_writers VNET(bpf_optimize_writers) 2046df8a710SGleb Smirnoff SYSCTL_INT(_net_bpf, OID_AUTO, optimize_writers, CTLFLAG_VNET | CTLFLAG_RW, 2056df8a710SGleb Smirnoff &VNET_NAME(bpf_optimize_writers), 0, 20651ec1eb7SAlexander V. Chernikov "Do not send packets until BPF program is set"); 20751ec1eb7SAlexander V. Chernikov 20887f6c662SJulian Elischer static d_open_t bpfopen; 20987f6c662SJulian Elischer static d_read_t bpfread; 21087f6c662SJulian Elischer static d_write_t bpfwrite; 21187f6c662SJulian Elischer static d_ioctl_t bpfioctl; 212243ac7d8SPeter Wemm static d_poll_t bpfpoll; 21395aab9ccSJohn-Mark Gurney static d_kqfilter_t bpfkqfilter; 21487f6c662SJulian Elischer 2154e2f199eSPoul-Henning Kamp static struct cdevsw bpf_cdevsw = { 216dc08ffecSPoul-Henning Kamp .d_version = D_VERSION, 2177ac40f5fSPoul-Henning Kamp .d_open = bpfopen, 2187ac40f5fSPoul-Henning Kamp .d_read = bpfread, 2197ac40f5fSPoul-Henning Kamp .d_write = bpfwrite, 2207ac40f5fSPoul-Henning Kamp .d_ioctl = bpfioctl, 2217ac40f5fSPoul-Henning Kamp .d_poll = bpfpoll, 2227ac40f5fSPoul-Henning Kamp .d_name = "bpf", 22395aab9ccSJohn-Mark Gurney .d_kqfilter = bpfkqfilter, 2244e2f199eSPoul-Henning Kamp }; 22587f6c662SJulian Elischer 226e76d823bSRobert Watson static struct filterops bpfread_filtops = { 227e76d823bSRobert Watson .f_isfd = 1, 228e76d823bSRobert Watson .f_detach = filt_bpfdetach, 229e76d823bSRobert Watson .f_event = filt_bpfread, 230e76d823bSRobert Watson }; 23187f6c662SJulian Elischer 232afa85850SAlexander V. Chernikov eventhandler_tag bpf_ifdetach_cookie = NULL; 233afa85850SAlexander V. Chernikov 2344d621040SChristian S.J. Peron /* 2356c74ff0eSAlexander V. Chernikov * LOCKING MODEL USED BY BPF: 2366c74ff0eSAlexander V. Chernikov * Locks: 2376c74ff0eSAlexander V. Chernikov * 1) global lock (BPF_LOCK). Mutex, used to protect interface addition/removal, 2386c74ff0eSAlexander V. Chernikov * some global counters and every bpf_if reference. 2396c74ff0eSAlexander V. Chernikov * 2) Interface lock. Rwlock, used to protect list of BPF descriptors and their filters. 240afa85850SAlexander V. Chernikov * 3) Descriptor lock. Mutex, used to protect BPF buffers and various structure fields 2416c74ff0eSAlexander V. Chernikov * used by bpf_mtap code. 2426c74ff0eSAlexander V. Chernikov * 2436c74ff0eSAlexander V. Chernikov * Lock order: 2446c74ff0eSAlexander V. Chernikov * 2456c74ff0eSAlexander V. Chernikov * Global lock, interface lock, descriptor lock 2466c74ff0eSAlexander V. Chernikov * 2476c74ff0eSAlexander V. Chernikov * We have to acquire interface lock before descriptor main lock due to BPF_MTAP[2] 2486c74ff0eSAlexander V. Chernikov * working model. In many places (like bpf_detachd) we start with BPF descriptor 2496c74ff0eSAlexander V. Chernikov * (and we need to at least rlock it to get reliable interface pointer). This 2506c74ff0eSAlexander V. Chernikov * gives us potential LOR. As a result, we use global lock to protect from bpf_if 2516c74ff0eSAlexander V. Chernikov * change in every such place. 2526c74ff0eSAlexander V. Chernikov * 2536c74ff0eSAlexander V. Chernikov * Changing d->bd_bif is protected by 1) global lock, 2) interface lock and 2546c74ff0eSAlexander V. Chernikov * 3) descriptor main wlock. 2556c74ff0eSAlexander V. Chernikov * Reading bd_bif can be protected by any of these locks, typically global lock. 2566c74ff0eSAlexander V. Chernikov * 2576c74ff0eSAlexander V. Chernikov * Changing read/write BPF filter is protected by the same three locks, 2586c74ff0eSAlexander V. Chernikov * the same applies for reading. 2596c74ff0eSAlexander V. Chernikov * 2606c74ff0eSAlexander V. Chernikov * Sleeping in global lock is not allowed due to bpfdetach() using it. 2616c74ff0eSAlexander V. Chernikov */ 2626c74ff0eSAlexander V. Chernikov 2636c74ff0eSAlexander V. Chernikov /* 2644d621040SChristian S.J. Peron * Wrapper functions for various buffering methods. If the set of buffer 2654d621040SChristian S.J. Peron * modes expands, we will probably want to introduce a switch data structure 2664d621040SChristian S.J. Peron * similar to protosw, et. 2674d621040SChristian S.J. Peron */ 2684d621040SChristian S.J. Peron static void 2694d621040SChristian S.J. Peron bpf_append_bytes(struct bpf_d *d, caddr_t buf, u_int offset, void *src, 2704d621040SChristian S.J. Peron u_int len) 2714d621040SChristian S.J. Peron { 2724d621040SChristian S.J. Peron 273afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 2744d621040SChristian S.J. Peron 2754d621040SChristian S.J. Peron switch (d->bd_bufmode) { 2764d621040SChristian S.J. Peron case BPF_BUFMODE_BUFFER: 2774d621040SChristian S.J. Peron return (bpf_buffer_append_bytes(d, buf, offset, src, len)); 2784d621040SChristian S.J. Peron 2794d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 2804d621040SChristian S.J. Peron d->bd_zcopy++; 2814d621040SChristian S.J. Peron return (bpf_zerocopy_append_bytes(d, buf, offset, src, len)); 2824d621040SChristian S.J. Peron 2834d621040SChristian S.J. Peron default: 2844d621040SChristian S.J. Peron panic("bpf_buf_append_bytes"); 2854d621040SChristian S.J. Peron } 2864d621040SChristian S.J. Peron } 2874d621040SChristian S.J. Peron 2884d621040SChristian S.J. Peron static void 2894d621040SChristian S.J. Peron bpf_append_mbuf(struct bpf_d *d, caddr_t buf, u_int offset, void *src, 2904d621040SChristian S.J. Peron u_int len) 2914d621040SChristian S.J. Peron { 2924d621040SChristian S.J. Peron 293afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 2944d621040SChristian S.J. Peron 2954d621040SChristian S.J. Peron switch (d->bd_bufmode) { 2964d621040SChristian S.J. Peron case BPF_BUFMODE_BUFFER: 2974d621040SChristian S.J. Peron return (bpf_buffer_append_mbuf(d, buf, offset, src, len)); 2984d621040SChristian S.J. Peron 2994d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 3004d621040SChristian S.J. Peron d->bd_zcopy++; 3014d621040SChristian S.J. Peron return (bpf_zerocopy_append_mbuf(d, buf, offset, src, len)); 3024d621040SChristian S.J. Peron 3034d621040SChristian S.J. Peron default: 3044d621040SChristian S.J. Peron panic("bpf_buf_append_mbuf"); 3054d621040SChristian S.J. Peron } 3064d621040SChristian S.J. Peron } 3074d621040SChristian S.J. Peron 3084d621040SChristian S.J. Peron /* 30929f612ecSChristian S.J. Peron * This function gets called when the free buffer is re-assigned. 31029f612ecSChristian S.J. Peron */ 31129f612ecSChristian S.J. Peron static void 31229f612ecSChristian S.J. Peron bpf_buf_reclaimed(struct bpf_d *d) 31329f612ecSChristian S.J. Peron { 31429f612ecSChristian S.J. Peron 315afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 31629f612ecSChristian S.J. Peron 31729f612ecSChristian S.J. Peron switch (d->bd_bufmode) { 31829f612ecSChristian S.J. Peron case BPF_BUFMODE_BUFFER: 31929f612ecSChristian S.J. Peron return; 32029f612ecSChristian S.J. Peron 32129f612ecSChristian S.J. Peron case BPF_BUFMODE_ZBUF: 32229f612ecSChristian S.J. Peron bpf_zerocopy_buf_reclaimed(d); 32329f612ecSChristian S.J. Peron return; 32429f612ecSChristian S.J. Peron 32529f612ecSChristian S.J. Peron default: 32629f612ecSChristian S.J. Peron panic("bpf_buf_reclaimed"); 32729f612ecSChristian S.J. Peron } 32829f612ecSChristian S.J. Peron } 32929f612ecSChristian S.J. Peron 33029f612ecSChristian S.J. Peron /* 3314d621040SChristian S.J. Peron * If the buffer mechanism has a way to decide that a held buffer can be made 3324d621040SChristian S.J. Peron * free, then it is exposed via the bpf_canfreebuf() interface. (1) is 3334d621040SChristian S.J. Peron * returned if the buffer can be discarded, (0) is returned if it cannot. 3344d621040SChristian S.J. Peron */ 3354d621040SChristian S.J. Peron static int 3364d621040SChristian S.J. Peron bpf_canfreebuf(struct bpf_d *d) 3374d621040SChristian S.J. Peron { 3384d621040SChristian S.J. Peron 3394d621040SChristian S.J. Peron BPFD_LOCK_ASSERT(d); 3404d621040SChristian S.J. Peron 3414d621040SChristian S.J. Peron switch (d->bd_bufmode) { 3424d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 3434d621040SChristian S.J. Peron return (bpf_zerocopy_canfreebuf(d)); 3444d621040SChristian S.J. Peron } 3454d621040SChristian S.J. Peron return (0); 3464d621040SChristian S.J. Peron } 3474d621040SChristian S.J. Peron 348a7a91e65SRobert Watson /* 349a7a91e65SRobert Watson * Allow the buffer model to indicate that the current store buffer is 350a7a91e65SRobert Watson * immutable, regardless of the appearance of space. Return (1) if the 351a7a91e65SRobert Watson * buffer is writable, and (0) if not. 352a7a91e65SRobert Watson */ 353a7a91e65SRobert Watson static int 354a7a91e65SRobert Watson bpf_canwritebuf(struct bpf_d *d) 355a7a91e65SRobert Watson { 356a7a91e65SRobert Watson BPFD_LOCK_ASSERT(d); 357a7a91e65SRobert Watson 358a7a91e65SRobert Watson switch (d->bd_bufmode) { 359a7a91e65SRobert Watson case BPF_BUFMODE_ZBUF: 360a7a91e65SRobert Watson return (bpf_zerocopy_canwritebuf(d)); 361a7a91e65SRobert Watson } 362a7a91e65SRobert Watson return (1); 363a7a91e65SRobert Watson } 364a7a91e65SRobert Watson 365a7a91e65SRobert Watson /* 366a7a91e65SRobert Watson * Notify buffer model that an attempt to write to the store buffer has 367a7a91e65SRobert Watson * resulted in a dropped packet, in which case the buffer may be considered 368a7a91e65SRobert Watson * full. 369a7a91e65SRobert Watson */ 370a7a91e65SRobert Watson static void 371a7a91e65SRobert Watson bpf_buffull(struct bpf_d *d) 372a7a91e65SRobert Watson { 373a7a91e65SRobert Watson 374afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 375a7a91e65SRobert Watson 376a7a91e65SRobert Watson switch (d->bd_bufmode) { 377a7a91e65SRobert Watson case BPF_BUFMODE_ZBUF: 378a7a91e65SRobert Watson bpf_zerocopy_buffull(d); 379a7a91e65SRobert Watson break; 380a7a91e65SRobert Watson } 381a7a91e65SRobert Watson } 382a7a91e65SRobert Watson 383a7a91e65SRobert Watson /* 384a7a91e65SRobert Watson * Notify the buffer model that a buffer has moved into the hold position. 385a7a91e65SRobert Watson */ 3864d621040SChristian S.J. Peron void 3874d621040SChristian S.J. Peron bpf_bufheld(struct bpf_d *d) 3884d621040SChristian S.J. Peron { 3894d621040SChristian S.J. Peron 390afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 3914d621040SChristian S.J. Peron 3924d621040SChristian S.J. Peron switch (d->bd_bufmode) { 3934d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 3944d621040SChristian S.J. Peron bpf_zerocopy_bufheld(d); 3954d621040SChristian S.J. Peron break; 3964d621040SChristian S.J. Peron } 3974d621040SChristian S.J. Peron } 3984d621040SChristian S.J. Peron 3994d621040SChristian S.J. Peron static void 4004d621040SChristian S.J. Peron bpf_free(struct bpf_d *d) 4014d621040SChristian S.J. Peron { 4024d621040SChristian S.J. Peron 4034d621040SChristian S.J. Peron switch (d->bd_bufmode) { 4044d621040SChristian S.J. Peron case BPF_BUFMODE_BUFFER: 4054d621040SChristian S.J. Peron return (bpf_buffer_free(d)); 4064d621040SChristian S.J. Peron 4074d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 4084d621040SChristian S.J. Peron return (bpf_zerocopy_free(d)); 4094d621040SChristian S.J. Peron 4104d621040SChristian S.J. Peron default: 4114d621040SChristian S.J. Peron panic("bpf_buf_free"); 4124d621040SChristian S.J. Peron } 4134d621040SChristian S.J. Peron } 4144d621040SChristian S.J. Peron 4154d621040SChristian S.J. Peron static int 4164d621040SChristian S.J. Peron bpf_uiomove(struct bpf_d *d, caddr_t buf, u_int len, struct uio *uio) 4174d621040SChristian S.J. Peron { 4184d621040SChristian S.J. Peron 4194d621040SChristian S.J. Peron if (d->bd_bufmode != BPF_BUFMODE_BUFFER) 4204d621040SChristian S.J. Peron return (EOPNOTSUPP); 4214d621040SChristian S.J. Peron return (bpf_buffer_uiomove(d, buf, len, uio)); 4224d621040SChristian S.J. Peron } 4234d621040SChristian S.J. Peron 4244d621040SChristian S.J. Peron static int 4254d621040SChristian S.J. Peron bpf_ioctl_sblen(struct bpf_d *d, u_int *i) 4264d621040SChristian S.J. Peron { 4274d621040SChristian S.J. Peron 4284d621040SChristian S.J. Peron if (d->bd_bufmode != BPF_BUFMODE_BUFFER) 4294d621040SChristian S.J. Peron return (EOPNOTSUPP); 4304d621040SChristian S.J. Peron return (bpf_buffer_ioctl_sblen(d, i)); 4314d621040SChristian S.J. Peron } 4324d621040SChristian S.J. Peron 4334d621040SChristian S.J. Peron static int 4344d621040SChristian S.J. Peron bpf_ioctl_getzmax(struct thread *td, struct bpf_d *d, size_t *i) 4354d621040SChristian S.J. Peron { 4364d621040SChristian S.J. Peron 4374d621040SChristian S.J. Peron if (d->bd_bufmode != BPF_BUFMODE_ZBUF) 4384d621040SChristian S.J. Peron return (EOPNOTSUPP); 4394d621040SChristian S.J. Peron return (bpf_zerocopy_ioctl_getzmax(td, d, i)); 4404d621040SChristian S.J. Peron } 4414d621040SChristian S.J. Peron 4424d621040SChristian S.J. Peron static int 4434d621040SChristian S.J. Peron bpf_ioctl_rotzbuf(struct thread *td, struct bpf_d *d, struct bpf_zbuf *bz) 4444d621040SChristian S.J. Peron { 4454d621040SChristian S.J. Peron 4464d621040SChristian S.J. Peron if (d->bd_bufmode != BPF_BUFMODE_ZBUF) 4474d621040SChristian S.J. Peron return (EOPNOTSUPP); 4484d621040SChristian S.J. Peron return (bpf_zerocopy_ioctl_rotzbuf(td, d, bz)); 4494d621040SChristian S.J. Peron } 4504d621040SChristian S.J. Peron 4514d621040SChristian S.J. Peron static int 4524d621040SChristian S.J. Peron bpf_ioctl_setzbuf(struct thread *td, struct bpf_d *d, struct bpf_zbuf *bz) 4534d621040SChristian S.J. Peron { 4544d621040SChristian S.J. Peron 4554d621040SChristian S.J. Peron if (d->bd_bufmode != BPF_BUFMODE_ZBUF) 4564d621040SChristian S.J. Peron return (EOPNOTSUPP); 4574d621040SChristian S.J. Peron return (bpf_zerocopy_ioctl_setzbuf(td, d, bz)); 4584d621040SChristian S.J. Peron } 4594d621040SChristian S.J. Peron 4604d621040SChristian S.J. Peron /* 4614d621040SChristian S.J. Peron * General BPF functions. 4624d621040SChristian S.J. Peron */ 463df8bae1dSRodney W. Grimes static int 464cb44b6dfSAndrew Thompson bpf_movein(struct uio *uio, int linktype, struct ifnet *ifp, struct mbuf **mp, 4654fb3a820SAlexander V. Chernikov struct sockaddr *sockp, int *hdrlen, struct bpf_d *d) 466df8bae1dSRodney W. Grimes { 467246b5467SSam Leffler const struct ieee80211_bpf_params *p; 468cb44b6dfSAndrew Thompson struct ether_header *eh; 469df8bae1dSRodney W. Grimes struct mbuf *m; 470df8bae1dSRodney W. Grimes int error; 471df8bae1dSRodney W. Grimes int len; 472df8bae1dSRodney W. Grimes int hlen; 47393e39f0bSChristian S.J. Peron int slen; 474df8bae1dSRodney W. Grimes 475df8bae1dSRodney W. Grimes /* 476df8bae1dSRodney W. Grimes * Build a sockaddr based on the data link layer type. 477df8bae1dSRodney W. Grimes * We do this at this level because the ethernet header 478df8bae1dSRodney W. Grimes * is copied directly into the data field of the sockaddr. 479df8bae1dSRodney W. Grimes * In the case of SLIP, there is no header and the packet 480df8bae1dSRodney W. Grimes * is forwarded as is. 481df8bae1dSRodney W. Grimes * Also, we are careful to leave room at the front of the mbuf 482df8bae1dSRodney W. Grimes * for the link level header. 483df8bae1dSRodney W. Grimes */ 484df8bae1dSRodney W. Grimes switch (linktype) { 485df8bae1dSRodney W. Grimes 486df8bae1dSRodney W. Grimes case DLT_SLIP: 487df8bae1dSRodney W. Grimes sockp->sa_family = AF_INET; 488df8bae1dSRodney W. Grimes hlen = 0; 489df8bae1dSRodney W. Grimes break; 490df8bae1dSRodney W. Grimes 491df8bae1dSRodney W. Grimes case DLT_EN10MB: 492df8bae1dSRodney W. Grimes sockp->sa_family = AF_UNSPEC; 493df8bae1dSRodney W. Grimes /* XXX Would MAXLINKHDR be better? */ 494797f247bSMatthew N. Dodd hlen = ETHER_HDR_LEN; 495df8bae1dSRodney W. Grimes break; 496df8bae1dSRodney W. Grimes 497df8bae1dSRodney W. Grimes case DLT_FDDI: 498d41f24e7SDavid Greenman sockp->sa_family = AF_IMPLINK; 499d41f24e7SDavid Greenman hlen = 0; 500df8bae1dSRodney W. Grimes break; 501df8bae1dSRodney W. Grimes 50222f05c43SAndrey A. Chernov case DLT_RAW: 503df8bae1dSRodney W. Grimes sockp->sa_family = AF_UNSPEC; 504df8bae1dSRodney W. Grimes hlen = 0; 505df8bae1dSRodney W. Grimes break; 506df8bae1dSRodney W. Grimes 50701399f34SDavid Malone case DLT_NULL: 50801399f34SDavid Malone /* 50901399f34SDavid Malone * null interface types require a 4 byte pseudo header which 51001399f34SDavid Malone * corresponds to the address family of the packet. 51101399f34SDavid Malone */ 51201399f34SDavid Malone sockp->sa_family = AF_UNSPEC; 51301399f34SDavid Malone hlen = 4; 51401399f34SDavid Malone break; 51501399f34SDavid Malone 5164f53e3ccSKenjiro Cho case DLT_ATM_RFC1483: 5174f53e3ccSKenjiro Cho /* 5184f53e3ccSKenjiro Cho * en atm driver requires 4-byte atm pseudo header. 5194f53e3ccSKenjiro Cho * though it isn't standard, vpi:vci needs to be 5204f53e3ccSKenjiro Cho * specified anyway. 5214f53e3ccSKenjiro Cho */ 5224f53e3ccSKenjiro Cho sockp->sa_family = AF_UNSPEC; 5234f53e3ccSKenjiro Cho hlen = 12; /* XXX 4(ATM_PH) + 3(LLC) + 5(SNAP) */ 5244f53e3ccSKenjiro Cho break; 5254f53e3ccSKenjiro Cho 52630fa52a6SBrian Somers case DLT_PPP: 52730fa52a6SBrian Somers sockp->sa_family = AF_UNSPEC; 52830fa52a6SBrian Somers hlen = 4; /* This should match PPP_HDRLEN */ 52930fa52a6SBrian Somers break; 53030fa52a6SBrian Somers 531246b5467SSam Leffler case DLT_IEEE802_11: /* IEEE 802.11 wireless */ 532246b5467SSam Leffler sockp->sa_family = AF_IEEE80211; 533246b5467SSam Leffler hlen = 0; 534246b5467SSam Leffler break; 535246b5467SSam Leffler 536246b5467SSam Leffler case DLT_IEEE802_11_RADIO: /* IEEE 802.11 wireless w/ phy params */ 537246b5467SSam Leffler sockp->sa_family = AF_IEEE80211; 538246b5467SSam Leffler sockp->sa_len = 12; /* XXX != 0 */ 539246b5467SSam Leffler hlen = sizeof(struct ieee80211_bpf_params); 540246b5467SSam Leffler break; 541246b5467SSam Leffler 542df8bae1dSRodney W. Grimes default: 543df8bae1dSRodney W. Grimes return (EIO); 544df8bae1dSRodney W. Grimes } 545df8bae1dSRodney W. Grimes 546df8bae1dSRodney W. Grimes len = uio->uio_resid; 547ed63043bSGleb Smirnoff if (len < hlen || len - hlen > ifp->if_mtu) 54801399f34SDavid Malone return (EMSGSIZE); 54901399f34SDavid Malone 55041a7572bSGleb Smirnoff m = m_get2(len, M_WAITOK, MT_DATA, M_PKTHDR); 551ed63043bSGleb Smirnoff if (m == NULL) 552df8bae1dSRodney W. Grimes return (EIO); 553963e4c2aSGarrett Wollman m->m_pkthdr.len = m->m_len = len; 554df8bae1dSRodney W. Grimes *mp = m; 55524a229f4SSam Leffler 55693e39f0bSChristian S.J. Peron error = uiomove(mtod(m, u_char *), len, uio); 55793e39f0bSChristian S.J. Peron if (error) 55893e39f0bSChristian S.J. Peron goto bad; 55993e39f0bSChristian S.J. Peron 5604fb3a820SAlexander V. Chernikov slen = bpf_filter(d->bd_wfilter, mtod(m, u_char *), len, len); 56193e39f0bSChristian S.J. Peron if (slen == 0) { 56293e39f0bSChristian S.J. Peron error = EPERM; 56393e39f0bSChristian S.J. Peron goto bad; 56493e39f0bSChristian S.J. Peron } 56593e39f0bSChristian S.J. Peron 566cb44b6dfSAndrew Thompson /* Check for multicast destination */ 567cb44b6dfSAndrew Thompson switch (linktype) { 568cb44b6dfSAndrew Thompson case DLT_EN10MB: 569cb44b6dfSAndrew Thompson eh = mtod(m, struct ether_header *); 570cb44b6dfSAndrew Thompson if (ETHER_IS_MULTICAST(eh->ether_dhost)) { 571cb44b6dfSAndrew Thompson if (bcmp(ifp->if_broadcastaddr, eh->ether_dhost, 572cb44b6dfSAndrew Thompson ETHER_ADDR_LEN) == 0) 573cb44b6dfSAndrew Thompson m->m_flags |= M_BCAST; 574cb44b6dfSAndrew Thompson else 575cb44b6dfSAndrew Thompson m->m_flags |= M_MCAST; 576cb44b6dfSAndrew Thompson } 5774fb3a820SAlexander V. Chernikov if (d->bd_hdrcmplt == 0) { 5784fb3a820SAlexander V. Chernikov memcpy(eh->ether_shost, IF_LLADDR(ifp), 5794fb3a820SAlexander V. Chernikov sizeof(eh->ether_shost)); 5804fb3a820SAlexander V. Chernikov } 581cb44b6dfSAndrew Thompson break; 582cb44b6dfSAndrew Thompson } 583cb44b6dfSAndrew Thompson 584df8bae1dSRodney W. Grimes /* 58593e39f0bSChristian S.J. Peron * Make room for link header, and copy it to sockaddr 586df8bae1dSRodney W. Grimes */ 587df8bae1dSRodney W. Grimes if (hlen != 0) { 588246b5467SSam Leffler if (sockp->sa_family == AF_IEEE80211) { 589246b5467SSam Leffler /* 590246b5467SSam Leffler * Collect true length from the parameter header 591246b5467SSam Leffler * NB: sockp is known to be zero'd so if we do a 592246b5467SSam Leffler * short copy unspecified parameters will be 593246b5467SSam Leffler * zero. 594246b5467SSam Leffler * NB: packet may not be aligned after stripping 595246b5467SSam Leffler * bpf params 596246b5467SSam Leffler * XXX check ibp_vers 597246b5467SSam Leffler */ 598246b5467SSam Leffler p = mtod(m, const struct ieee80211_bpf_params *); 599246b5467SSam Leffler hlen = p->ibp_len; 600246b5467SSam Leffler if (hlen > sizeof(sockp->sa_data)) { 601246b5467SSam Leffler error = EINVAL; 602246b5467SSam Leffler goto bad; 603246b5467SSam Leffler } 604246b5467SSam Leffler } 605a09968c4SAdrian Chadd bcopy(mtod(m, const void *), sockp->sa_data, hlen); 606df8bae1dSRodney W. Grimes } 607560a54e1SJung-uk Kim *hdrlen = hlen; 60893e39f0bSChristian S.J. Peron 609df8bae1dSRodney W. Grimes return (0); 610df8bae1dSRodney W. Grimes bad: 611df8bae1dSRodney W. Grimes m_freem(m); 612df8bae1dSRodney W. Grimes return (error); 613df8bae1dSRodney W. Grimes } 614df8bae1dSRodney W. Grimes 615df8bae1dSRodney W. Grimes /* 616df8bae1dSRodney W. Grimes * Attach file to the bpf interface, i.e. make d listen on bp. 617df8bae1dSRodney W. Grimes */ 618df8bae1dSRodney W. Grimes static void 61919ba8395SChristian S.J. Peron bpf_attachd(struct bpf_d *d, struct bpf_if *bp) 620df8bae1dSRodney W. Grimes { 6216c74ff0eSAlexander V. Chernikov int op_w; 6226c74ff0eSAlexander V. Chernikov 6236c74ff0eSAlexander V. Chernikov BPF_LOCK_ASSERT(); 6246c74ff0eSAlexander V. Chernikov 6256c74ff0eSAlexander V. Chernikov /* 6266c74ff0eSAlexander V. Chernikov * Save sysctl value to protect from sysctl change 6276c74ff0eSAlexander V. Chernikov * between reads 6286c74ff0eSAlexander V. Chernikov */ 62971448753SAlexander Motin op_w = V_bpf_optimize_writers || d->bd_writer; 6306c74ff0eSAlexander V. Chernikov 6316c74ff0eSAlexander V. Chernikov if (d->bd_bif != NULL) 6326c74ff0eSAlexander V. Chernikov bpf_detachd_locked(d); 633df8bae1dSRodney W. Grimes /* 63451ec1eb7SAlexander V. Chernikov * Point d at bp, and add d to the interface's list. 635f87e372eSLuiz Otavio O Souza * Since there are many applications using BPF for 63651ec1eb7SAlexander V. Chernikov * sending raw packets only (dhcpd, cdpd are good examples) 63751ec1eb7SAlexander V. Chernikov * we can delay adding d to the list of active listeners until 63851ec1eb7SAlexander V. Chernikov * some filter is configured. 639df8bae1dSRodney W. Grimes */ 64051ec1eb7SAlexander V. Chernikov 64151ec1eb7SAlexander V. Chernikov BPFIF_WLOCK(bp); 642afa85850SAlexander V. Chernikov BPFD_LOCK(d); 64351ec1eb7SAlexander V. Chernikov 6446c74ff0eSAlexander V. Chernikov d->bd_bif = bp; 6456c74ff0eSAlexander V. Chernikov 6466c74ff0eSAlexander V. Chernikov if (op_w != 0) { 64751ec1eb7SAlexander V. Chernikov /* Add to writers-only list */ 64851ec1eb7SAlexander V. Chernikov LIST_INSERT_HEAD(&bp->bif_wlist, d, bd_next); 64951ec1eb7SAlexander V. Chernikov /* 65051ec1eb7SAlexander V. Chernikov * We decrement bd_writer on every filter set operation. 65151ec1eb7SAlexander V. Chernikov * First BIOCSETF is done by pcap_open_live() to set up 65251ec1eb7SAlexander V. Chernikov * snap length. After that appliation usually sets its own filter 65351ec1eb7SAlexander V. Chernikov */ 65451ec1eb7SAlexander V. Chernikov d->bd_writer = 2; 65551ec1eb7SAlexander V. Chernikov } else 6564a3feeaaSRobert Watson LIST_INSERT_HEAD(&bp->bif_dlist, d, bd_next); 657df8bae1dSRodney W. Grimes 658afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 659e4b3229aSAlexander V. Chernikov BPFIF_WUNLOCK(bp); 660b743c310SSam Leffler 66151ec1eb7SAlexander V. Chernikov bpf_bpfd_cnt++; 66251ec1eb7SAlexander V. Chernikov 66351ec1eb7SAlexander V. Chernikov CTR3(KTR_NET, "%s: bpf_attach called by pid %d, adding to %s list", 66451ec1eb7SAlexander V. Chernikov __func__, d->bd_pid, d->bd_writer ? "writer" : "active"); 66551ec1eb7SAlexander V. Chernikov 6666c74ff0eSAlexander V. Chernikov if (op_w == 0) 66751ec1eb7SAlexander V. Chernikov EVENTHANDLER_INVOKE(bpf_track, bp->bif_ifp, bp->bif_dlt, 1); 66851ec1eb7SAlexander V. Chernikov } 66951ec1eb7SAlexander V. Chernikov 67051ec1eb7SAlexander V. Chernikov /* 671402000ffSAlexander V. Chernikov * Check if we need to upgrade our descriptor @d from write-only mode. 672402000ffSAlexander V. Chernikov */ 673402000ffSAlexander V. Chernikov static int 674402000ffSAlexander V. Chernikov bpf_check_upgrade(u_long cmd, struct bpf_d *d, struct bpf_insn *fcode, int flen) 675402000ffSAlexander V. Chernikov { 676402000ffSAlexander V. Chernikov int is_snap, need_upgrade; 677402000ffSAlexander V. Chernikov 678402000ffSAlexander V. Chernikov /* 679402000ffSAlexander V. Chernikov * Check if we've already upgraded or new filter is empty. 680402000ffSAlexander V. Chernikov */ 681402000ffSAlexander V. Chernikov if (d->bd_writer == 0 || fcode == NULL) 682402000ffSAlexander V. Chernikov return (0); 683402000ffSAlexander V. Chernikov 684402000ffSAlexander V. Chernikov need_upgrade = 0; 685402000ffSAlexander V. Chernikov 686402000ffSAlexander V. Chernikov /* 687402000ffSAlexander V. Chernikov * Check if cmd looks like snaplen setting from 688402000ffSAlexander V. Chernikov * pcap_bpf.c:pcap_open_live(). 689402000ffSAlexander V. Chernikov * Note we're not checking .k value here: 690402000ffSAlexander V. Chernikov * while pcap_open_live() definitely sets to to non-zero value, 691402000ffSAlexander V. Chernikov * we'd prefer to treat k=0 (deny ALL) case the same way: e.g. 692402000ffSAlexander V. Chernikov * do not consider upgrading immediately 693402000ffSAlexander V. Chernikov */ 694402000ffSAlexander V. Chernikov if (cmd == BIOCSETF && flen == 1 && fcode[0].code == (BPF_RET | BPF_K)) 695402000ffSAlexander V. Chernikov is_snap = 1; 696402000ffSAlexander V. Chernikov else 697402000ffSAlexander V. Chernikov is_snap = 0; 698402000ffSAlexander V. Chernikov 699402000ffSAlexander V. Chernikov if (is_snap == 0) { 700402000ffSAlexander V. Chernikov /* 701402000ffSAlexander V. Chernikov * We're setting first filter and it doesn't look like 702402000ffSAlexander V. Chernikov * setting snaplen. We're probably using bpf directly. 703402000ffSAlexander V. Chernikov * Upgrade immediately. 704402000ffSAlexander V. Chernikov */ 705402000ffSAlexander V. Chernikov need_upgrade = 1; 706402000ffSAlexander V. Chernikov } else { 707402000ffSAlexander V. Chernikov /* 708402000ffSAlexander V. Chernikov * Do not require upgrade by first BIOCSETF 709402000ffSAlexander V. Chernikov * (used to set snaplen) by pcap_open_live(). 710402000ffSAlexander V. Chernikov */ 711402000ffSAlexander V. Chernikov 712402000ffSAlexander V. Chernikov if (--d->bd_writer == 0) { 713402000ffSAlexander V. Chernikov /* 714402000ffSAlexander V. Chernikov * First snaplen filter has already 715402000ffSAlexander V. Chernikov * been set. This is probably catch-all 716402000ffSAlexander V. Chernikov * filter 717402000ffSAlexander V. Chernikov */ 718402000ffSAlexander V. Chernikov need_upgrade = 1; 719402000ffSAlexander V. Chernikov } 720402000ffSAlexander V. Chernikov } 721402000ffSAlexander V. Chernikov 722402000ffSAlexander V. Chernikov CTR5(KTR_NET, 723402000ffSAlexander V. Chernikov "%s: filter function set by pid %d, " 724402000ffSAlexander V. Chernikov "bd_writer counter %d, snap %d upgrade %d", 725402000ffSAlexander V. Chernikov __func__, d->bd_pid, d->bd_writer, 726402000ffSAlexander V. Chernikov is_snap, need_upgrade); 727402000ffSAlexander V. Chernikov 728402000ffSAlexander V. Chernikov return (need_upgrade); 729402000ffSAlexander V. Chernikov } 730402000ffSAlexander V. Chernikov 731402000ffSAlexander V. Chernikov /* 73251ec1eb7SAlexander V. Chernikov * Add d to the list of active bp filters. 733f87e372eSLuiz Otavio O Souza * Requires bpf_attachd() to be called before. 73451ec1eb7SAlexander V. Chernikov */ 73551ec1eb7SAlexander V. Chernikov static void 73651ec1eb7SAlexander V. Chernikov bpf_upgraded(struct bpf_d *d) 73751ec1eb7SAlexander V. Chernikov { 73851ec1eb7SAlexander V. Chernikov struct bpf_if *bp; 73951ec1eb7SAlexander V. Chernikov 7406c74ff0eSAlexander V. Chernikov BPF_LOCK_ASSERT(); 7416c74ff0eSAlexander V. Chernikov 74251ec1eb7SAlexander V. Chernikov bp = d->bd_bif; 74351ec1eb7SAlexander V. Chernikov 7446c74ff0eSAlexander V. Chernikov /* 7456c74ff0eSAlexander V. Chernikov * Filter can be set several times without specifying interface. 7466c74ff0eSAlexander V. Chernikov * Mark d as reader and exit. 7476c74ff0eSAlexander V. Chernikov */ 7486c74ff0eSAlexander V. Chernikov if (bp == NULL) { 749afa85850SAlexander V. Chernikov BPFD_LOCK(d); 7506c74ff0eSAlexander V. Chernikov d->bd_writer = 0; 751afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 7526c74ff0eSAlexander V. Chernikov return; 7536c74ff0eSAlexander V. Chernikov } 7546c74ff0eSAlexander V. Chernikov 75551ec1eb7SAlexander V. Chernikov BPFIF_WLOCK(bp); 756afa85850SAlexander V. Chernikov BPFD_LOCK(d); 75751ec1eb7SAlexander V. Chernikov 75851ec1eb7SAlexander V. Chernikov /* Remove from writers-only list */ 75951ec1eb7SAlexander V. Chernikov LIST_REMOVE(d, bd_next); 76051ec1eb7SAlexander V. Chernikov LIST_INSERT_HEAD(&bp->bif_dlist, d, bd_next); 76151ec1eb7SAlexander V. Chernikov /* Mark d as reader */ 76251ec1eb7SAlexander V. Chernikov d->bd_writer = 0; 76351ec1eb7SAlexander V. Chernikov 764afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 76551ec1eb7SAlexander V. Chernikov BPFIF_WUNLOCK(bp); 76651ec1eb7SAlexander V. Chernikov 76751ec1eb7SAlexander V. Chernikov CTR2(KTR_NET, "%s: upgrade required by pid %d", __func__, d->bd_pid); 76851ec1eb7SAlexander V. Chernikov 7695ce8d970SSam Leffler EVENTHANDLER_INVOKE(bpf_track, bp->bif_ifp, bp->bif_dlt, 1); 770df8bae1dSRodney W. Grimes } 771df8bae1dSRodney W. Grimes 772df8bae1dSRodney W. Grimes /* 773df8bae1dSRodney W. Grimes * Detach a file from its interface. 774df8bae1dSRodney W. Grimes */ 775df8bae1dSRodney W. Grimes static void 77619ba8395SChristian S.J. Peron bpf_detachd(struct bpf_d *d) 777df8bae1dSRodney W. Grimes { 7786c74ff0eSAlexander V. Chernikov BPF_LOCK(); 7796c74ff0eSAlexander V. Chernikov bpf_detachd_locked(d); 7806c74ff0eSAlexander V. Chernikov BPF_UNLOCK(); 7816c74ff0eSAlexander V. Chernikov } 7826c74ff0eSAlexander V. Chernikov 7836c74ff0eSAlexander V. Chernikov static void 7846c74ff0eSAlexander V. Chernikov bpf_detachd_locked(struct bpf_d *d) 7856c74ff0eSAlexander V. Chernikov { 7866e891d64SPoul-Henning Kamp int error; 787df8bae1dSRodney W. Grimes struct bpf_if *bp; 78846448b5aSRobert Watson struct ifnet *ifp; 789df8bae1dSRodney W. Grimes 79051ec1eb7SAlexander V. Chernikov CTR2(KTR_NET, "%s: detach required by pid %d", __func__, d->bd_pid); 79151ec1eb7SAlexander V. Chernikov 792e4b3229aSAlexander V. Chernikov BPF_LOCK_ASSERT(); 793e4b3229aSAlexander V. Chernikov 7946c74ff0eSAlexander V. Chernikov /* Check if descriptor is attached */ 7956c74ff0eSAlexander V. Chernikov if ((bp = d->bd_bif) == NULL) 7966c74ff0eSAlexander V. Chernikov return; 7976c74ff0eSAlexander V. Chernikov 798e4b3229aSAlexander V. Chernikov BPFIF_WLOCK(bp); 799afa85850SAlexander V. Chernikov BPFD_LOCK(d); 80046448b5aSRobert Watson 80151ec1eb7SAlexander V. Chernikov /* Save bd_writer value */ 80251ec1eb7SAlexander V. Chernikov error = d->bd_writer; 80351ec1eb7SAlexander V. Chernikov 80446448b5aSRobert Watson /* 80546448b5aSRobert Watson * Remove d from the interface's descriptor list. 80646448b5aSRobert Watson */ 80746448b5aSRobert Watson LIST_REMOVE(d, bd_next); 80846448b5aSRobert Watson 809e4b3229aSAlexander V. Chernikov ifp = bp->bif_ifp; 810572bde2aSRobert Watson d->bd_bif = NULL; 811afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 812e4b3229aSAlexander V. Chernikov BPFIF_WUNLOCK(bp); 813e4b3229aSAlexander V. Chernikov 814e4b3229aSAlexander V. Chernikov bpf_bpfd_cnt--; 81546448b5aSRobert Watson 81651ec1eb7SAlexander V. Chernikov /* Call event handler iff d is attached */ 81751ec1eb7SAlexander V. Chernikov if (error == 0) 8185ce8d970SSam Leffler EVENTHANDLER_INVOKE(bpf_track, ifp, bp->bif_dlt, 0); 819b743c310SSam Leffler 820df8bae1dSRodney W. Grimes /* 821df8bae1dSRodney W. Grimes * Check if this descriptor had requested promiscuous mode. 822df8bae1dSRodney W. Grimes * If so, turn it off. 823df8bae1dSRodney W. Grimes */ 824df8bae1dSRodney W. Grimes if (d->bd_promisc) { 825df8bae1dSRodney W. Grimes d->bd_promisc = 0; 82697021c24SMarko Zec CURVNET_SET(ifp->if_vnet); 82746448b5aSRobert Watson error = ifpromisc(ifp, 0); 82897021c24SMarko Zec CURVNET_RESTORE(); 8296e891d64SPoul-Henning Kamp if (error != 0 && error != ENXIO) { 830df8bae1dSRodney W. Grimes /* 8316e891d64SPoul-Henning Kamp * ENXIO can happen if a pccard is unplugged 832df8bae1dSRodney W. Grimes * Something is really wrong if we were able to put 833df8bae1dSRodney W. Grimes * the driver into promiscuous mode, but can't 834df8bae1dSRodney W. Grimes * take it out. 835df8bae1dSRodney W. Grimes */ 8368eab61f3SSam Leffler if_printf(bp->bif_ifp, 8378eab61f3SSam Leffler "bpf_detach: ifpromisc failed (%d)\n", error); 8386e891d64SPoul-Henning Kamp } 839df8bae1dSRodney W. Grimes } 840df8bae1dSRodney W. Grimes } 841df8bae1dSRodney W. Grimes 842df8bae1dSRodney W. Grimes /* 843136600feSEd Schouten * Close the descriptor by detaching it from its interface, 844136600feSEd Schouten * deallocating its buffers, and marking it free. 845136600feSEd Schouten */ 846136600feSEd Schouten static void 847136600feSEd Schouten bpf_dtor(void *data) 848136600feSEd Schouten { 849136600feSEd Schouten struct bpf_d *d = data; 850136600feSEd Schouten 851afa85850SAlexander V. Chernikov BPFD_LOCK(d); 852136600feSEd Schouten if (d->bd_state == BPF_WAITING) 853136600feSEd Schouten callout_stop(&d->bd_callout); 854136600feSEd Schouten d->bd_state = BPF_IDLE; 855afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 856136600feSEd Schouten funsetown(&d->bd_sigio); 857136600feSEd Schouten bpf_detachd(d); 858136600feSEd Schouten #ifdef MAC 859136600feSEd Schouten mac_bpfdesc_destroy(d); 860136600feSEd Schouten #endif /* MAC */ 8616aba400aSAttilio Rao seldrain(&d->bd_sel); 862136600feSEd Schouten knlist_destroy(&d->bd_sel.si_note); 8639fee1bd1SJung-uk Kim callout_drain(&d->bd_callout); 864136600feSEd Schouten bpf_freed(d); 865136600feSEd Schouten free(d, M_BPF); 866136600feSEd Schouten } 867136600feSEd Schouten 868136600feSEd Schouten /* 869df8bae1dSRodney W. Grimes * Open ethernet device. Returns ENXIO for illegal minor device number, 870df8bae1dSRodney W. Grimes * EBUSY if file is open by another process. 871df8bae1dSRodney W. Grimes */ 872df8bae1dSRodney W. Grimes /* ARGSUSED */ 87387f6c662SJulian Elischer static int 87419ba8395SChristian S.J. Peron bpfopen(struct cdev *dev, int flags, int fmt, struct thread *td) 875df8bae1dSRodney W. Grimes { 876e7bb21b3SJonathan Lemon struct bpf_d *d; 8774f42daa4SLuiz Otavio O Souza int error; 878df8bae1dSRodney W. Grimes 8791ede983cSDag-Erling Smørgrav d = malloc(sizeof(*d), M_BPF, M_WAITOK | M_ZERO); 880136600feSEd Schouten error = devfs_set_cdevpriv(d, bpf_dtor); 881136600feSEd Schouten if (error != 0) { 882136600feSEd Schouten free(d, M_BPF); 883136600feSEd Schouten return (error); 884136600feSEd Schouten } 8854d621040SChristian S.J. Peron 8864d621040SChristian S.J. Peron /* 8874d621040SChristian S.J. Peron * For historical reasons, perform a one-time initialization call to 8884d621040SChristian S.J. Peron * the buffer routines, even though we're not yet committed to a 8894d621040SChristian S.J. Peron * particular buffer method. 8904d621040SChristian S.J. Peron */ 8914d621040SChristian S.J. Peron bpf_buffer_init(d); 89271448753SAlexander Motin if ((flags & FREAD) == 0) 89371448753SAlexander Motin d->bd_writer = 2; 8943b3b91e7SGuy Helmer d->bd_hbuf_in_use = 0; 8954d621040SChristian S.J. Peron d->bd_bufmode = BPF_BUFMODE_BUFFER; 89600a83887SPaul Traina d->bd_sig = SIGIO; 897560a54e1SJung-uk Kim d->bd_direction = BPF_D_INOUT; 898e4b3229aSAlexander V. Chernikov BPF_PID_REFRESH(d, td); 89982f4445dSRobert Watson #ifdef MAC 90030d239bcSRobert Watson mac_bpfdesc_init(d); 90130d239bcSRobert Watson mac_bpfdesc_create(td->td_ucred, d); 90282f4445dSRobert Watson #endif 903afa85850SAlexander V. Chernikov mtx_init(&d->bd_lock, devtoname(dev), "bpf cdev lock", MTX_DEF); 904afa85850SAlexander V. Chernikov callout_init_mtx(&d->bd_callout, &d->bd_lock, 0); 905afa85850SAlexander V. Chernikov knlist_init_mtx(&d->bd_sel.si_note, &d->bd_lock); 906df8bae1dSRodney W. Grimes 907df8bae1dSRodney W. Grimes return (0); 908df8bae1dSRodney W. Grimes } 909df8bae1dSRodney W. Grimes 910df8bae1dSRodney W. Grimes /* 911df8bae1dSRodney W. Grimes * bpfread - read next chunk of packets from buffers 912df8bae1dSRodney W. Grimes */ 91387f6c662SJulian Elischer static int 91419ba8395SChristian S.J. Peron bpfread(struct cdev *dev, struct uio *uio, int ioflag) 915df8bae1dSRodney W. Grimes { 916136600feSEd Schouten struct bpf_d *d; 917df8bae1dSRodney W. Grimes int error; 9188df67d77SJung-uk Kim int non_block; 9198df67d77SJung-uk Kim int timed_out; 920df8bae1dSRodney W. Grimes 921136600feSEd Schouten error = devfs_get_cdevpriv((void **)&d); 922136600feSEd Schouten if (error != 0) 923136600feSEd Schouten return (error); 924136600feSEd Schouten 925df8bae1dSRodney W. Grimes /* 926df8bae1dSRodney W. Grimes * Restrict application to use a buffer the same size as 927df8bae1dSRodney W. Grimes * as kernel buffers. 928df8bae1dSRodney W. Grimes */ 929df8bae1dSRodney W. Grimes if (uio->uio_resid != d->bd_bufsize) 930df8bae1dSRodney W. Grimes return (EINVAL); 931df8bae1dSRodney W. Grimes 9328df67d77SJung-uk Kim non_block = ((ioflag & O_NONBLOCK) != 0); 9338df67d77SJung-uk Kim 934afa85850SAlexander V. Chernikov BPFD_LOCK(d); 935e4b3229aSAlexander V. Chernikov BPF_PID_REFRESH_CUR(d); 9364d621040SChristian S.J. Peron if (d->bd_bufmode != BPF_BUFMODE_BUFFER) { 937afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 9384d621040SChristian S.J. Peron return (EOPNOTSUPP); 9394d621040SChristian S.J. Peron } 94081bda851SJohn Polstra if (d->bd_state == BPF_WAITING) 94181bda851SJohn Polstra callout_stop(&d->bd_callout); 94281bda851SJohn Polstra timed_out = (d->bd_state == BPF_TIMED_OUT); 94381bda851SJohn Polstra d->bd_state = BPF_IDLE; 944d013d902SGuy Helmer while (d->bd_hbuf_in_use) { 945d013d902SGuy Helmer error = mtx_sleep(&d->bd_hbuf_in_use, &d->bd_lock, 9463b3b91e7SGuy Helmer PRINET|PCATCH, "bd_hbuf", 0); 947d013d902SGuy Helmer if (error != 0) { 948d013d902SGuy Helmer BPFD_UNLOCK(d); 949d013d902SGuy Helmer return (error); 950d013d902SGuy Helmer } 951d013d902SGuy Helmer } 952df8bae1dSRodney W. Grimes /* 953df8bae1dSRodney W. Grimes * If the hold buffer is empty, then do a timed sleep, which 954df8bae1dSRodney W. Grimes * ends when the timeout expires or when enough packets 955df8bae1dSRodney W. Grimes * have arrived to fill the store buffer. 956df8bae1dSRodney W. Grimes */ 957572bde2aSRobert Watson while (d->bd_hbuf == NULL) { 9588df67d77SJung-uk Kim if (d->bd_slen != 0) { 959df8bae1dSRodney W. Grimes /* 960df8bae1dSRodney W. Grimes * A packet(s) either arrived since the previous 961df8bae1dSRodney W. Grimes * read or arrived while we were asleep. 9628df67d77SJung-uk Kim */ 9638df67d77SJung-uk Kim if (d->bd_immediate || non_block || timed_out) { 9648df67d77SJung-uk Kim /* 9658df67d77SJung-uk Kim * Rotate the buffers and return what's here 9668df67d77SJung-uk Kim * if we are in immediate mode, non-blocking 9678df67d77SJung-uk Kim * flag is set, or this descriptor timed out. 968df8bae1dSRodney W. Grimes */ 969df8bae1dSRodney W. Grimes ROTATE_BUFFERS(d); 970df8bae1dSRodney W. Grimes break; 971df8bae1dSRodney W. Grimes } 9728df67d77SJung-uk Kim } 973de5d9935SRobert Watson 974de5d9935SRobert Watson /* 975de5d9935SRobert Watson * No data is available, check to see if the bpf device 976de5d9935SRobert Watson * is still pointed at a real interface. If not, return 977de5d9935SRobert Watson * ENXIO so that the userland process knows to rebind 978de5d9935SRobert Watson * it before using it again. 979de5d9935SRobert Watson */ 980de5d9935SRobert Watson if (d->bd_bif == NULL) { 981afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 982de5d9935SRobert Watson return (ENXIO); 983de5d9935SRobert Watson } 984de5d9935SRobert Watson 9858df67d77SJung-uk Kim if (non_block) { 986afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 987fba3cfdeSJohn Polstra return (EWOULDBLOCK); 988fba3cfdeSJohn Polstra } 989afa85850SAlexander V. Chernikov error = msleep(d, &d->bd_lock, PRINET|PCATCH, 990e7bb21b3SJonathan Lemon "bpf", d->bd_rtout); 991df8bae1dSRodney W. Grimes if (error == EINTR || error == ERESTART) { 992afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 993df8bae1dSRodney W. Grimes return (error); 994df8bae1dSRodney W. Grimes } 995df8bae1dSRodney W. Grimes if (error == EWOULDBLOCK) { 996df8bae1dSRodney W. Grimes /* 997df8bae1dSRodney W. Grimes * On a timeout, return what's in the buffer, 998df8bae1dSRodney W. Grimes * which may be nothing. If there is something 999df8bae1dSRodney W. Grimes * in the store buffer, we can rotate the buffers. 1000df8bae1dSRodney W. Grimes */ 1001df8bae1dSRodney W. Grimes if (d->bd_hbuf) 1002df8bae1dSRodney W. Grimes /* 1003df8bae1dSRodney W. Grimes * We filled up the buffer in between 1004df8bae1dSRodney W. Grimes * getting the timeout and arriving 1005df8bae1dSRodney W. Grimes * here, so we don't need to rotate. 1006df8bae1dSRodney W. Grimes */ 1007df8bae1dSRodney W. Grimes break; 1008df8bae1dSRodney W. Grimes 1009df8bae1dSRodney W. Grimes if (d->bd_slen == 0) { 1010afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 1011df8bae1dSRodney W. Grimes return (0); 1012df8bae1dSRodney W. Grimes } 1013df8bae1dSRodney W. Grimes ROTATE_BUFFERS(d); 1014df8bae1dSRodney W. Grimes break; 1015df8bae1dSRodney W. Grimes } 1016df8bae1dSRodney W. Grimes } 1017df8bae1dSRodney W. Grimes /* 1018df8bae1dSRodney W. Grimes * At this point, we know we have something in the hold slot. 1019df8bae1dSRodney W. Grimes */ 10203b3b91e7SGuy Helmer d->bd_hbuf_in_use = 1; 1021afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 1022df8bae1dSRodney W. Grimes 1023df8bae1dSRodney W. Grimes /* 1024df8bae1dSRodney W. Grimes * Move data from hold buffer into user space. 1025df8bae1dSRodney W. Grimes * We know the entire buffer is transferred since 1026df8bae1dSRodney W. Grimes * we checked above that the read buffer is bpf_bufsize bytes. 102731b32e6dSRobert Watson * 10283b3b91e7SGuy Helmer * We do not have to worry about simultaneous reads because 10293b3b91e7SGuy Helmer * we waited for sole access to the hold buffer above. 1030df8bae1dSRodney W. Grimes */ 10314d621040SChristian S.J. Peron error = bpf_uiomove(d, d->bd_hbuf, d->bd_hlen, uio); 1032df8bae1dSRodney W. Grimes 1033afa85850SAlexander V. Chernikov BPFD_LOCK(d); 10343b3b91e7SGuy Helmer KASSERT(d->bd_hbuf != NULL, ("bpfread: lost bd_hbuf")); 1035df8bae1dSRodney W. Grimes d->bd_fbuf = d->bd_hbuf; 1036572bde2aSRobert Watson d->bd_hbuf = NULL; 1037df8bae1dSRodney W. Grimes d->bd_hlen = 0; 103829f612ecSChristian S.J. Peron bpf_buf_reclaimed(d); 10393b3b91e7SGuy Helmer d->bd_hbuf_in_use = 0; 10403b3b91e7SGuy Helmer wakeup(&d->bd_hbuf_in_use); 1041afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 1042df8bae1dSRodney W. Grimes 1043df8bae1dSRodney W. Grimes return (error); 1044df8bae1dSRodney W. Grimes } 1045df8bae1dSRodney W. Grimes 1046df8bae1dSRodney W. Grimes /* 1047df8bae1dSRodney W. Grimes * If there are processes sleeping on this descriptor, wake them up. 1048df8bae1dSRodney W. Grimes */ 1049e7bb21b3SJonathan Lemon static __inline void 105019ba8395SChristian S.J. Peron bpf_wakeup(struct bpf_d *d) 1051df8bae1dSRodney W. Grimes { 1052a3272e3cSChristian S.J. Peron 1053afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 105481bda851SJohn Polstra if (d->bd_state == BPF_WAITING) { 105581bda851SJohn Polstra callout_stop(&d->bd_callout); 105681bda851SJohn Polstra d->bd_state = BPF_IDLE; 105781bda851SJohn Polstra } 1058521f364bSDag-Erling Smørgrav wakeup(d); 1059831d27a9SDon Lewis if (d->bd_async && d->bd_sig && d->bd_sigio) 1060f1320723SAlfred Perlstein pgsigio(&d->bd_sigio, d->bd_sig, 0); 106100a83887SPaul Traina 1062512824f8SSeigo Tanimura selwakeuppri(&d->bd_sel, PRINET); 1063ad3b9257SJohn-Mark Gurney KNOTE_LOCKED(&d->bd_sel.si_note, 0); 1064df8bae1dSRodney W. Grimes } 1065df8bae1dSRodney W. Grimes 106681bda851SJohn Polstra static void 106719ba8395SChristian S.J. Peron bpf_timed_out(void *arg) 106881bda851SJohn Polstra { 106981bda851SJohn Polstra struct bpf_d *d = (struct bpf_d *)arg; 107081bda851SJohn Polstra 1071afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 10729fee1bd1SJung-uk Kim 10739fee1bd1SJung-uk Kim if (callout_pending(&d->bd_callout) || !callout_active(&d->bd_callout)) 10749fee1bd1SJung-uk Kim return; 107581bda851SJohn Polstra if (d->bd_state == BPF_WAITING) { 107681bda851SJohn Polstra d->bd_state = BPF_TIMED_OUT; 107781bda851SJohn Polstra if (d->bd_slen != 0) 107881bda851SJohn Polstra bpf_wakeup(d); 107981bda851SJohn Polstra } 108081bda851SJohn Polstra } 108181bda851SJohn Polstra 108287f6c662SJulian Elischer static int 10834d621040SChristian S.J. Peron bpf_ready(struct bpf_d *d) 10844d621040SChristian S.J. Peron { 10854d621040SChristian S.J. Peron 1086afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 10874d621040SChristian S.J. Peron 10884d621040SChristian S.J. Peron if (!bpf_canfreebuf(d) && d->bd_hlen != 0) 10894d621040SChristian S.J. Peron return (1); 10904d621040SChristian S.J. Peron if ((d->bd_immediate || d->bd_state == BPF_TIMED_OUT) && 10914d621040SChristian S.J. Peron d->bd_slen != 0) 10924d621040SChristian S.J. Peron return (1); 10934d621040SChristian S.J. Peron return (0); 10944d621040SChristian S.J. Peron } 10954d621040SChristian S.J. Peron 10964d621040SChristian S.J. Peron static int 109719ba8395SChristian S.J. Peron bpfwrite(struct cdev *dev, struct uio *uio, int ioflag) 1098df8bae1dSRodney W. Grimes { 1099136600feSEd Schouten struct bpf_d *d; 1100df8bae1dSRodney W. Grimes struct ifnet *ifp; 1101560a54e1SJung-uk Kim struct mbuf *m, *mc; 11028240bf1eSRobert Watson struct sockaddr dst; 11034fb3a820SAlexander V. Chernikov struct route ro; 1104560a54e1SJung-uk Kim int error, hlen; 1105df8bae1dSRodney W. Grimes 1106136600feSEd Schouten error = devfs_get_cdevpriv((void **)&d); 1107136600feSEd Schouten if (error != 0) 1108136600feSEd Schouten return (error); 1109136600feSEd Schouten 1110e4b3229aSAlexander V. Chernikov BPF_PID_REFRESH_CUR(d); 11114d621040SChristian S.J. Peron d->bd_wcount++; 11126c74ff0eSAlexander V. Chernikov /* XXX: locking required */ 11134d621040SChristian S.J. Peron if (d->bd_bif == NULL) { 11144d621040SChristian S.J. Peron d->bd_wdcount++; 1115df8bae1dSRodney W. Grimes return (ENXIO); 11164d621040SChristian S.J. Peron } 1117df8bae1dSRodney W. Grimes 1118df8bae1dSRodney W. Grimes ifp = d->bd_bif->bif_ifp; 1119df8bae1dSRodney W. Grimes 11204d621040SChristian S.J. Peron if ((ifp->if_flags & IFF_UP) == 0) { 11214d621040SChristian S.J. Peron d->bd_wdcount++; 11223518d220SSam Leffler return (ENETDOWN); 11234d621040SChristian S.J. Peron } 11243518d220SSam Leffler 11254d621040SChristian S.J. Peron if (uio->uio_resid == 0) { 11264d621040SChristian S.J. Peron d->bd_wdcount++; 1127df8bae1dSRodney W. Grimes return (0); 11284d621040SChristian S.J. Peron } 1129df8bae1dSRodney W. Grimes 11308240bf1eSRobert Watson bzero(&dst, sizeof(dst)); 1131d83e603aSChristian S.J. Peron m = NULL; 1132d83e603aSChristian S.J. Peron hlen = 0; 11336c74ff0eSAlexander V. Chernikov /* XXX: bpf_movein() can sleep */ 1134cb44b6dfSAndrew Thompson error = bpf_movein(uio, (int)d->bd_bif->bif_dlt, ifp, 11354fb3a820SAlexander V. Chernikov &m, &dst, &hlen, d); 11364d621040SChristian S.J. Peron if (error) { 11374d621040SChristian S.J. Peron d->bd_wdcount++; 1138df8bae1dSRodney W. Grimes return (error); 11394d621040SChristian S.J. Peron } 11404d621040SChristian S.J. Peron d->bd_wfcount++; 1141114ae644SMike Smith if (d->bd_hdrcmplt) 1142114ae644SMike Smith dst.sa_family = pseudo_AF_HDRCMPLT; 1143114ae644SMike Smith 1144560a54e1SJung-uk Kim if (d->bd_feedback) { 1145eb1b1807SGleb Smirnoff mc = m_dup(m, M_NOWAIT); 1146560a54e1SJung-uk Kim if (mc != NULL) 1147560a54e1SJung-uk Kim mc->m_pkthdr.rcvif = ifp; 11488cd892f7SJung-uk Kim /* Set M_PROMISC for outgoing packets to be discarded. */ 11498cd892f7SJung-uk Kim if (d->bd_direction == BPF_D_INOUT) 11508cd892f7SJung-uk Kim m->m_flags |= M_PROMISC; 1151560a54e1SJung-uk Kim } else 1152560a54e1SJung-uk Kim mc = NULL; 1153560a54e1SJung-uk Kim 1154560a54e1SJung-uk Kim m->m_pkthdr.len -= hlen; 1155560a54e1SJung-uk Kim m->m_len -= hlen; 1156560a54e1SJung-uk Kim m->m_data += hlen; /* XXX */ 1157560a54e1SJung-uk Kim 115821ca7b57SMarko Zec CURVNET_SET(ifp->if_vnet); 115982f4445dSRobert Watson #ifdef MAC 1160afa85850SAlexander V. Chernikov BPFD_LOCK(d); 116130d239bcSRobert Watson mac_bpfdesc_create_mbuf(d, m); 1162560a54e1SJung-uk Kim if (mc != NULL) 116330d239bcSRobert Watson mac_bpfdesc_create_mbuf(d, mc); 1164afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 116582f4445dSRobert Watson #endif 1166560a54e1SJung-uk Kim 11674fb3a820SAlexander V. Chernikov bzero(&ro, sizeof(ro)); 11684fb3a820SAlexander V. Chernikov if (hlen != 0) { 11694fb3a820SAlexander V. Chernikov ro.ro_prepend = (u_char *)&dst.sa_data; 11704fb3a820SAlexander V. Chernikov ro.ro_plen = hlen; 11714fb3a820SAlexander V. Chernikov ro.ro_flags = RT_HAS_HEADER; 11724fb3a820SAlexander V. Chernikov } 11734fb3a820SAlexander V. Chernikov 11744fb3a820SAlexander V. Chernikov error = (*ifp->if_output)(ifp, m, &dst, &ro); 11754d621040SChristian S.J. Peron if (error) 11764d621040SChristian S.J. Peron d->bd_wdcount++; 1177560a54e1SJung-uk Kim 1178560a54e1SJung-uk Kim if (mc != NULL) { 11790bf686c1SRobert Watson if (error == 0) 1180560a54e1SJung-uk Kim (*ifp->if_input)(ifp, mc); 11810bf686c1SRobert Watson else 1182560a54e1SJung-uk Kim m_freem(mc); 1183560a54e1SJung-uk Kim } 118421ca7b57SMarko Zec CURVNET_RESTORE(); 1185560a54e1SJung-uk Kim 1186df8bae1dSRodney W. Grimes return (error); 1187df8bae1dSRodney W. Grimes } 1188df8bae1dSRodney W. Grimes 1189df8bae1dSRodney W. Grimes /* 1190e82669d9SRobert Watson * Reset a descriptor by flushing its packet buffer and clearing the receive 1191e82669d9SRobert Watson * and drop counts. This is doable for kernel-only buffers, but with 1192e82669d9SRobert Watson * zero-copy buffers, we can't write to (or rotate) buffers that are 1193e82669d9SRobert Watson * currently owned by userspace. It would be nice if we could encapsulate 1194e82669d9SRobert Watson * this logic in the buffer code rather than here. 1195df8bae1dSRodney W. Grimes */ 1196df8bae1dSRodney W. Grimes static void 119719ba8395SChristian S.J. Peron reset_d(struct bpf_d *d) 1198df8bae1dSRodney W. Grimes { 1199e7bb21b3SJonathan Lemon 1200afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 1201e82669d9SRobert Watson 12023b3b91e7SGuy Helmer while (d->bd_hbuf_in_use) 12033b3b91e7SGuy Helmer mtx_sleep(&d->bd_hbuf_in_use, &d->bd_lock, PRINET, 12043b3b91e7SGuy Helmer "bd_hbuf", 0); 1205e82669d9SRobert Watson if ((d->bd_hbuf != NULL) && 1206e82669d9SRobert Watson (d->bd_bufmode != BPF_BUFMODE_ZBUF || bpf_canfreebuf(d))) { 1207df8bae1dSRodney W. Grimes /* Free the hold buffer. */ 1208df8bae1dSRodney W. Grimes d->bd_fbuf = d->bd_hbuf; 1209572bde2aSRobert Watson d->bd_hbuf = NULL; 1210e82669d9SRobert Watson d->bd_hlen = 0; 121129f612ecSChristian S.J. Peron bpf_buf_reclaimed(d); 1212df8bae1dSRodney W. Grimes } 1213e82669d9SRobert Watson if (bpf_canwritebuf(d)) 1214df8bae1dSRodney W. Grimes d->bd_slen = 0; 1215df8bae1dSRodney W. Grimes d->bd_rcount = 0; 1216df8bae1dSRodney W. Grimes d->bd_dcount = 0; 121769f7644bSChristian S.J. Peron d->bd_fcount = 0; 12184d621040SChristian S.J. Peron d->bd_wcount = 0; 12194d621040SChristian S.J. Peron d->bd_wfcount = 0; 12204d621040SChristian S.J. Peron d->bd_wdcount = 0; 12214d621040SChristian S.J. Peron d->bd_zcopy = 0; 1222df8bae1dSRodney W. Grimes } 1223df8bae1dSRodney W. Grimes 1224df8bae1dSRodney W. Grimes /* 1225df8bae1dSRodney W. Grimes * FIONREAD Check for read packet available. 1226df8bae1dSRodney W. Grimes * BIOCGBLEN Get buffer len [for read()]. 1227f11c3508SDavid Malone * BIOCSETF Set read filter. 1228f11c3508SDavid Malone * BIOCSETFNR Set read filter without resetting descriptor. 1229f11c3508SDavid Malone * BIOCSETWF Set write filter. 1230df8bae1dSRodney W. Grimes * BIOCFLUSH Flush read packet buffer. 1231df8bae1dSRodney W. Grimes * BIOCPROMISC Put interface into promiscuous mode. 1232df8bae1dSRodney W. Grimes * BIOCGDLT Get link layer type. 1233df8bae1dSRodney W. Grimes * BIOCGETIF Get interface name. 1234df8bae1dSRodney W. Grimes * BIOCSETIF Set interface. 1235df8bae1dSRodney W. Grimes * BIOCSRTIMEOUT Set read timeout. 1236df8bae1dSRodney W. Grimes * BIOCGRTIMEOUT Get read timeout. 1237df8bae1dSRodney W. Grimes * BIOCGSTATS Get packet stats. 1238df8bae1dSRodney W. Grimes * BIOCIMMEDIATE Set immediate mode. 1239df8bae1dSRodney W. Grimes * BIOCVERSION Get filter language version. 1240114ae644SMike Smith * BIOCGHDRCMPLT Get "header already complete" flag 1241114ae644SMike Smith * BIOCSHDRCMPLT Set "header already complete" flag 1242560a54e1SJung-uk Kim * BIOCGDIRECTION Get packet direction flag 1243560a54e1SJung-uk Kim * BIOCSDIRECTION Set packet direction flag 1244547d94bdSJung-uk Kim * BIOCGTSTAMP Get time stamp format and resolution. 1245547d94bdSJung-uk Kim * BIOCSTSTAMP Set time stamp format and resolution. 124693e39f0bSChristian S.J. Peron * BIOCLOCK Set "locked" flag 1247560a54e1SJung-uk Kim * BIOCFEEDBACK Set packet feedback mode. 12484d621040SChristian S.J. Peron * BIOCSETZBUF Set current zero-copy buffer locations. 12494d621040SChristian S.J. Peron * BIOCGETZMAX Get maximum zero-copy buffer size. 12504d621040SChristian S.J. Peron * BIOCROTZBUF Force rotation of zero-copy buffer 12514d621040SChristian S.J. Peron * BIOCSETBUFMODE Set buffer mode. 12524d621040SChristian S.J. Peron * BIOCGETBUFMODE Get current buffer mode. 1253df8bae1dSRodney W. Grimes */ 1254df8bae1dSRodney W. Grimes /* ARGSUSED */ 125587f6c662SJulian Elischer static int 125619ba8395SChristian S.J. Peron bpfioctl(struct cdev *dev, u_long cmd, caddr_t addr, int flags, 125719ba8395SChristian S.J. Peron struct thread *td) 1258df8bae1dSRodney W. Grimes { 1259136600feSEd Schouten struct bpf_d *d; 1260136600feSEd Schouten int error; 1261136600feSEd Schouten 1262136600feSEd Schouten error = devfs_get_cdevpriv((void **)&d); 1263136600feSEd Schouten if (error != 0) 1264136600feSEd Schouten return (error); 1265df8bae1dSRodney W. Grimes 1266b75a24a0SChristian S.J. Peron /* 1267b75a24a0SChristian S.J. Peron * Refresh PID associated with this descriptor. 1268b75a24a0SChristian S.J. Peron */ 1269afa85850SAlexander V. Chernikov BPFD_LOCK(d); 1270e4b3229aSAlexander V. Chernikov BPF_PID_REFRESH(d, td); 127181bda851SJohn Polstra if (d->bd_state == BPF_WAITING) 127281bda851SJohn Polstra callout_stop(&d->bd_callout); 127381bda851SJohn Polstra d->bd_state = BPF_IDLE; 1274afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 127581bda851SJohn Polstra 127693e39f0bSChristian S.J. Peron if (d->bd_locked == 1) { 127793e39f0bSChristian S.J. Peron switch (cmd) { 127893e39f0bSChristian S.J. Peron case BIOCGBLEN: 127993e39f0bSChristian S.J. Peron case BIOCFLUSH: 128093e39f0bSChristian S.J. Peron case BIOCGDLT: 128193e39f0bSChristian S.J. Peron case BIOCGDLTLIST: 1282fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 1283fc0a61a4SKonstantin Belousov case BIOCGDLTLIST32: 1284fc0a61a4SKonstantin Belousov #endif 128593e39f0bSChristian S.J. Peron case BIOCGETIF: 128693e39f0bSChristian S.J. Peron case BIOCGRTIMEOUT: 1287b4366092SJustin Hibbits #if defined(COMPAT_FREEBSD32) && defined(__amd64__) 1288fc0a61a4SKonstantin Belousov case BIOCGRTIMEOUT32: 1289fc0a61a4SKonstantin Belousov #endif 129093e39f0bSChristian S.J. Peron case BIOCGSTATS: 129193e39f0bSChristian S.J. Peron case BIOCVERSION: 129293e39f0bSChristian S.J. Peron case BIOCGRSIG: 129393e39f0bSChristian S.J. Peron case BIOCGHDRCMPLT: 1294547d94bdSJung-uk Kim case BIOCSTSTAMP: 1295560a54e1SJung-uk Kim case BIOCFEEDBACK: 129693e39f0bSChristian S.J. Peron case FIONREAD: 129793e39f0bSChristian S.J. Peron case BIOCLOCK: 129893e39f0bSChristian S.J. Peron case BIOCSRTIMEOUT: 1299b4366092SJustin Hibbits #if defined(COMPAT_FREEBSD32) && defined(__amd64__) 1300fc0a61a4SKonstantin Belousov case BIOCSRTIMEOUT32: 1301fc0a61a4SKonstantin Belousov #endif 130293e39f0bSChristian S.J. Peron case BIOCIMMEDIATE: 130393e39f0bSChristian S.J. Peron case TIOCGPGRP: 13044d621040SChristian S.J. Peron case BIOCROTZBUF: 130593e39f0bSChristian S.J. Peron break; 130693e39f0bSChristian S.J. Peron default: 130793e39f0bSChristian S.J. Peron return (EPERM); 130893e39f0bSChristian S.J. Peron } 130993e39f0bSChristian S.J. Peron } 1310fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 1311fc0a61a4SKonstantin Belousov /* 1312fc0a61a4SKonstantin Belousov * If we see a 32-bit compat ioctl, mark the stream as 32-bit so 1313fc0a61a4SKonstantin Belousov * that it will get 32-bit packet headers. 1314fc0a61a4SKonstantin Belousov */ 1315fc0a61a4SKonstantin Belousov switch (cmd) { 1316fc0a61a4SKonstantin Belousov case BIOCSETF32: 1317fc0a61a4SKonstantin Belousov case BIOCSETFNR32: 1318fc0a61a4SKonstantin Belousov case BIOCSETWF32: 1319fc0a61a4SKonstantin Belousov case BIOCGDLTLIST32: 1320fc0a61a4SKonstantin Belousov case BIOCGRTIMEOUT32: 1321fc0a61a4SKonstantin Belousov case BIOCSRTIMEOUT32: 132297aacec6SAlexander V. Chernikov BPFD_LOCK(d); 1323fc0a61a4SKonstantin Belousov d->bd_compat32 = 1; 132497aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 1325fc0a61a4SKonstantin Belousov } 1326fc0a61a4SKonstantin Belousov #endif 1327fc0a61a4SKonstantin Belousov 132897021c24SMarko Zec CURVNET_SET(TD_TO_VNET(td)); 1329df8bae1dSRodney W. Grimes switch (cmd) { 1330df8bae1dSRodney W. Grimes 1331df8bae1dSRodney W. Grimes default: 1332df8bae1dSRodney W. Grimes error = EINVAL; 1333df8bae1dSRodney W. Grimes break; 1334df8bae1dSRodney W. Grimes 1335df8bae1dSRodney W. Grimes /* 1336df8bae1dSRodney W. Grimes * Check for read packet available. 1337df8bae1dSRodney W. Grimes */ 1338df8bae1dSRodney W. Grimes case FIONREAD: 1339df8bae1dSRodney W. Grimes { 1340df8bae1dSRodney W. Grimes int n; 1341df8bae1dSRodney W. Grimes 1342afa85850SAlexander V. Chernikov BPFD_LOCK(d); 1343df8bae1dSRodney W. Grimes n = d->bd_slen; 13443b3b91e7SGuy Helmer while (d->bd_hbuf_in_use) 13453b3b91e7SGuy Helmer mtx_sleep(&d->bd_hbuf_in_use, &d->bd_lock, 13463b3b91e7SGuy Helmer PRINET, "bd_hbuf", 0); 1347df8bae1dSRodney W. Grimes if (d->bd_hbuf) 1348df8bae1dSRodney W. Grimes n += d->bd_hlen; 1349afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 1350df8bae1dSRodney W. Grimes 1351df8bae1dSRodney W. Grimes *(int *)addr = n; 1352df8bae1dSRodney W. Grimes break; 1353df8bae1dSRodney W. Grimes } 1354df8bae1dSRodney W. Grimes 1355df8bae1dSRodney W. Grimes /* 1356df8bae1dSRodney W. Grimes * Get buffer len [for read()]. 1357df8bae1dSRodney W. Grimes */ 1358df8bae1dSRodney W. Grimes case BIOCGBLEN: 135997aacec6SAlexander V. Chernikov BPFD_LOCK(d); 1360df8bae1dSRodney W. Grimes *(u_int *)addr = d->bd_bufsize; 136197aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 1362df8bae1dSRodney W. Grimes break; 1363df8bae1dSRodney W. Grimes 1364df8bae1dSRodney W. Grimes /* 1365df8bae1dSRodney W. Grimes * Set buffer length. 1366df8bae1dSRodney W. Grimes */ 1367df8bae1dSRodney W. Grimes case BIOCSBLEN: 13684d621040SChristian S.J. Peron error = bpf_ioctl_sblen(d, (u_int *)addr); 1369df8bae1dSRodney W. Grimes break; 1370df8bae1dSRodney W. Grimes 1371df8bae1dSRodney W. Grimes /* 1372df8bae1dSRodney W. Grimes * Set link layer read filter. 1373df8bae1dSRodney W. Grimes */ 1374df8bae1dSRodney W. Grimes case BIOCSETF: 1375f11c3508SDavid Malone case BIOCSETFNR: 137693e39f0bSChristian S.J. Peron case BIOCSETWF: 1377fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 1378fc0a61a4SKonstantin Belousov case BIOCSETF32: 1379fc0a61a4SKonstantin Belousov case BIOCSETFNR32: 1380fc0a61a4SKonstantin Belousov case BIOCSETWF32: 1381fc0a61a4SKonstantin Belousov #endif 138293e39f0bSChristian S.J. Peron error = bpf_setf(d, (struct bpf_program *)addr, cmd); 1383df8bae1dSRodney W. Grimes break; 1384df8bae1dSRodney W. Grimes 1385df8bae1dSRodney W. Grimes /* 1386df8bae1dSRodney W. Grimes * Flush read packet buffer. 1387df8bae1dSRodney W. Grimes */ 1388df8bae1dSRodney W. Grimes case BIOCFLUSH: 1389afa85850SAlexander V. Chernikov BPFD_LOCK(d); 1390df8bae1dSRodney W. Grimes reset_d(d); 1391afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 1392df8bae1dSRodney W. Grimes break; 1393df8bae1dSRodney W. Grimes 1394df8bae1dSRodney W. Grimes /* 1395df8bae1dSRodney W. Grimes * Put interface into promiscuous mode. 1396df8bae1dSRodney W. Grimes */ 1397df8bae1dSRodney W. Grimes case BIOCPROMISC: 1398572bde2aSRobert Watson if (d->bd_bif == NULL) { 1399df8bae1dSRodney W. Grimes /* 1400df8bae1dSRodney W. Grimes * No interface attached yet. 1401df8bae1dSRodney W. Grimes */ 1402df8bae1dSRodney W. Grimes error = EINVAL; 1403df8bae1dSRodney W. Grimes break; 1404df8bae1dSRodney W. Grimes } 1405df8bae1dSRodney W. Grimes if (d->bd_promisc == 0) { 1406df8bae1dSRodney W. Grimes error = ifpromisc(d->bd_bif->bif_ifp, 1); 1407df8bae1dSRodney W. Grimes if (error == 0) 1408df8bae1dSRodney W. Grimes d->bd_promisc = 1; 1409df8bae1dSRodney W. Grimes } 1410df8bae1dSRodney W. Grimes break; 1411df8bae1dSRodney W. Grimes 1412df8bae1dSRodney W. Grimes /* 14138eab61f3SSam Leffler * Get current data link type. 1414df8bae1dSRodney W. Grimes */ 1415df8bae1dSRodney W. Grimes case BIOCGDLT: 141697aacec6SAlexander V. Chernikov BPF_LOCK(); 1417572bde2aSRobert Watson if (d->bd_bif == NULL) 1418df8bae1dSRodney W. Grimes error = EINVAL; 1419df8bae1dSRodney W. Grimes else 1420df8bae1dSRodney W. Grimes *(u_int *)addr = d->bd_bif->bif_dlt; 142197aacec6SAlexander V. Chernikov BPF_UNLOCK(); 1422df8bae1dSRodney W. Grimes break; 1423df8bae1dSRodney W. Grimes 1424df8bae1dSRodney W. Grimes /* 14258eab61f3SSam Leffler * Get a list of supported data link types. 14268eab61f3SSam Leffler */ 1427fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 1428fc0a61a4SKonstantin Belousov case BIOCGDLTLIST32: 1429fc0a61a4SKonstantin Belousov { 1430fc0a61a4SKonstantin Belousov struct bpf_dltlist32 *list32; 1431fc0a61a4SKonstantin Belousov struct bpf_dltlist dltlist; 1432fc0a61a4SKonstantin Belousov 1433fc0a61a4SKonstantin Belousov list32 = (struct bpf_dltlist32 *)addr; 1434fc0a61a4SKonstantin Belousov dltlist.bfl_len = list32->bfl_len; 1435fc0a61a4SKonstantin Belousov dltlist.bfl_list = PTRIN(list32->bfl_list); 143697aacec6SAlexander V. Chernikov BPF_LOCK(); 1437fc0a61a4SKonstantin Belousov if (d->bd_bif == NULL) 1438fc0a61a4SKonstantin Belousov error = EINVAL; 1439fc0a61a4SKonstantin Belousov else { 1440fc0a61a4SKonstantin Belousov error = bpf_getdltlist(d, &dltlist); 1441fc0a61a4SKonstantin Belousov if (error == 0) 1442fc0a61a4SKonstantin Belousov list32->bfl_len = dltlist.bfl_len; 1443fc0a61a4SKonstantin Belousov } 144497aacec6SAlexander V. Chernikov BPF_UNLOCK(); 1445fc0a61a4SKonstantin Belousov break; 1446fc0a61a4SKonstantin Belousov } 1447fc0a61a4SKonstantin Belousov #endif 1448fc0a61a4SKonstantin Belousov 14498eab61f3SSam Leffler case BIOCGDLTLIST: 145097aacec6SAlexander V. Chernikov BPF_LOCK(); 1451572bde2aSRobert Watson if (d->bd_bif == NULL) 14528eab61f3SSam Leffler error = EINVAL; 14538eab61f3SSam Leffler else 14548eab61f3SSam Leffler error = bpf_getdltlist(d, (struct bpf_dltlist *)addr); 145597aacec6SAlexander V. Chernikov BPF_UNLOCK(); 14568eab61f3SSam Leffler break; 14578eab61f3SSam Leffler 14588eab61f3SSam Leffler /* 14598eab61f3SSam Leffler * Set data link type. 14608eab61f3SSam Leffler */ 14618eab61f3SSam Leffler case BIOCSDLT: 14626c74ff0eSAlexander V. Chernikov BPF_LOCK(); 1463572bde2aSRobert Watson if (d->bd_bif == NULL) 14648eab61f3SSam Leffler error = EINVAL; 14658eab61f3SSam Leffler else 14668eab61f3SSam Leffler error = bpf_setdlt(d, *(u_int *)addr); 14676c74ff0eSAlexander V. Chernikov BPF_UNLOCK(); 14688eab61f3SSam Leffler break; 14698eab61f3SSam Leffler 14708eab61f3SSam Leffler /* 14711dd0feaaSArchie Cobbs * Get interface name. 1472df8bae1dSRodney W. Grimes */ 1473df8bae1dSRodney W. Grimes case BIOCGETIF: 147497aacec6SAlexander V. Chernikov BPF_LOCK(); 1475572bde2aSRobert Watson if (d->bd_bif == NULL) 1476df8bae1dSRodney W. Grimes error = EINVAL; 14771dd0feaaSArchie Cobbs else { 14781dd0feaaSArchie Cobbs struct ifnet *const ifp = d->bd_bif->bif_ifp; 14791dd0feaaSArchie Cobbs struct ifreq *const ifr = (struct ifreq *)addr; 14801dd0feaaSArchie Cobbs 14819bf40edeSBrooks Davis strlcpy(ifr->ifr_name, ifp->if_xname, 14829bf40edeSBrooks Davis sizeof(ifr->ifr_name)); 14831dd0feaaSArchie Cobbs } 148497aacec6SAlexander V. Chernikov BPF_UNLOCK(); 1485df8bae1dSRodney W. Grimes break; 1486df8bae1dSRodney W. Grimes 1487df8bae1dSRodney W. Grimes /* 1488df8bae1dSRodney W. Grimes * Set interface. 1489df8bae1dSRodney W. Grimes */ 1490df8bae1dSRodney W. Grimes case BIOCSETIF: 14914f42daa4SLuiz Otavio O Souza { 14924f42daa4SLuiz Otavio O Souza int alloc_buf, size; 14934f42daa4SLuiz Otavio O Souza 14944f42daa4SLuiz Otavio O Souza /* 14954f42daa4SLuiz Otavio O Souza * Behavior here depends on the buffering model. If 14964f42daa4SLuiz Otavio O Souza * we're using kernel memory buffers, then we can 14974f42daa4SLuiz Otavio O Souza * allocate them here. If we're using zero-copy, 14984f42daa4SLuiz Otavio O Souza * then the user process must have registered buffers 14994f42daa4SLuiz Otavio O Souza * by the time we get here. 15004f42daa4SLuiz Otavio O Souza */ 15014f42daa4SLuiz Otavio O Souza alloc_buf = 0; 15024f42daa4SLuiz Otavio O Souza BPFD_LOCK(d); 15034f42daa4SLuiz Otavio O Souza if (d->bd_bufmode == BPF_BUFMODE_BUFFER && 15044f42daa4SLuiz Otavio O Souza d->bd_sbuf == NULL) 15054f42daa4SLuiz Otavio O Souza alloc_buf = 1; 15064f42daa4SLuiz Otavio O Souza BPFD_UNLOCK(d); 15074f42daa4SLuiz Otavio O Souza if (alloc_buf) { 15084f42daa4SLuiz Otavio O Souza size = d->bd_bufsize; 15094f42daa4SLuiz Otavio O Souza error = bpf_buffer_ioctl_sblen(d, &size); 15104f42daa4SLuiz Otavio O Souza if (error != 0) 15114f42daa4SLuiz Otavio O Souza break; 15124f42daa4SLuiz Otavio O Souza } 15136c74ff0eSAlexander V. Chernikov BPF_LOCK(); 1514df8bae1dSRodney W. Grimes error = bpf_setif(d, (struct ifreq *)addr); 15156c74ff0eSAlexander V. Chernikov BPF_UNLOCK(); 1516df8bae1dSRodney W. Grimes break; 15174f42daa4SLuiz Otavio O Souza } 1518df8bae1dSRodney W. Grimes 1519df8bae1dSRodney W. Grimes /* 1520df8bae1dSRodney W. Grimes * Set read timeout. 1521df8bae1dSRodney W. Grimes */ 1522df8bae1dSRodney W. Grimes case BIOCSRTIMEOUT: 1523b4366092SJustin Hibbits #if defined(COMPAT_FREEBSD32) && defined(__amd64__) 1524fc0a61a4SKonstantin Belousov case BIOCSRTIMEOUT32: 1525fc0a61a4SKonstantin Belousov #endif 1526df8bae1dSRodney W. Grimes { 1527df8bae1dSRodney W. Grimes struct timeval *tv = (struct timeval *)addr; 15289624d947SJuli Mallett #if defined(COMPAT_FREEBSD32) && !defined(__mips__) 1529fc0a61a4SKonstantin Belousov struct timeval32 *tv32; 1530fc0a61a4SKonstantin Belousov struct timeval tv64; 1531fc0a61a4SKonstantin Belousov 1532fc0a61a4SKonstantin Belousov if (cmd == BIOCSRTIMEOUT32) { 1533fc0a61a4SKonstantin Belousov tv32 = (struct timeval32 *)addr; 1534fc0a61a4SKonstantin Belousov tv = &tv64; 1535fc0a61a4SKonstantin Belousov tv->tv_sec = tv32->tv_sec; 1536fc0a61a4SKonstantin Belousov tv->tv_usec = tv32->tv_usec; 1537fc0a61a4SKonstantin Belousov } else 1538fc0a61a4SKonstantin Belousov #endif 1539fc0a61a4SKonstantin Belousov tv = (struct timeval *)addr; 1540df8bae1dSRodney W. Grimes 1541bdc2cdc5SAlexander Langer /* 1542bdc2cdc5SAlexander Langer * Subtract 1 tick from tvtohz() since this isn't 1543bdc2cdc5SAlexander Langer * a one-shot timer. 1544bdc2cdc5SAlexander Langer */ 1545bdc2cdc5SAlexander Langer if ((error = itimerfix(tv)) == 0) 1546bdc2cdc5SAlexander Langer d->bd_rtout = tvtohz(tv) - 1; 1547df8bae1dSRodney W. Grimes break; 1548df8bae1dSRodney W. Grimes } 1549df8bae1dSRodney W. Grimes 1550df8bae1dSRodney W. Grimes /* 1551df8bae1dSRodney W. Grimes * Get read timeout. 1552df8bae1dSRodney W. Grimes */ 1553df8bae1dSRodney W. Grimes case BIOCGRTIMEOUT: 1554b4366092SJustin Hibbits #if defined(COMPAT_FREEBSD32) && defined(__amd64__) 1555fc0a61a4SKonstantin Belousov case BIOCGRTIMEOUT32: 1556fc0a61a4SKonstantin Belousov #endif 1557df8bae1dSRodney W. Grimes { 1558fc0a61a4SKonstantin Belousov struct timeval *tv; 1559b4366092SJustin Hibbits #if defined(COMPAT_FREEBSD32) && defined(__amd64__) 1560fc0a61a4SKonstantin Belousov struct timeval32 *tv32; 1561fc0a61a4SKonstantin Belousov struct timeval tv64; 1562fc0a61a4SKonstantin Belousov 1563fc0a61a4SKonstantin Belousov if (cmd == BIOCGRTIMEOUT32) 1564fc0a61a4SKonstantin Belousov tv = &tv64; 1565fc0a61a4SKonstantin Belousov else 1566fc0a61a4SKonstantin Belousov #endif 1567fc0a61a4SKonstantin Belousov tv = (struct timeval *)addr; 1568df8bae1dSRodney W. Grimes 1569bdc2cdc5SAlexander Langer tv->tv_sec = d->bd_rtout / hz; 1570bdc2cdc5SAlexander Langer tv->tv_usec = (d->bd_rtout % hz) * tick; 1571b4366092SJustin Hibbits #if defined(COMPAT_FREEBSD32) && defined(__amd64__) 1572fc0a61a4SKonstantin Belousov if (cmd == BIOCGRTIMEOUT32) { 1573fc0a61a4SKonstantin Belousov tv32 = (struct timeval32 *)addr; 1574fc0a61a4SKonstantin Belousov tv32->tv_sec = tv->tv_sec; 1575fc0a61a4SKonstantin Belousov tv32->tv_usec = tv->tv_usec; 1576fc0a61a4SKonstantin Belousov } 1577fc0a61a4SKonstantin Belousov #endif 1578fc0a61a4SKonstantin Belousov 1579df8bae1dSRodney W. Grimes break; 1580df8bae1dSRodney W. Grimes } 1581df8bae1dSRodney W. Grimes 1582df8bae1dSRodney W. Grimes /* 1583df8bae1dSRodney W. Grimes * Get packet stats. 1584df8bae1dSRodney W. Grimes */ 1585df8bae1dSRodney W. Grimes case BIOCGSTATS: 1586df8bae1dSRodney W. Grimes { 1587df8bae1dSRodney W. Grimes struct bpf_stat *bs = (struct bpf_stat *)addr; 1588df8bae1dSRodney W. Grimes 15894d621040SChristian S.J. Peron /* XXXCSJP overflow */ 1590df8bae1dSRodney W. Grimes bs->bs_recv = d->bd_rcount; 1591df8bae1dSRodney W. Grimes bs->bs_drop = d->bd_dcount; 1592df8bae1dSRodney W. Grimes break; 1593df8bae1dSRodney W. Grimes } 1594df8bae1dSRodney W. Grimes 1595df8bae1dSRodney W. Grimes /* 1596df8bae1dSRodney W. Grimes * Set immediate mode. 1597df8bae1dSRodney W. Grimes */ 1598df8bae1dSRodney W. Grimes case BIOCIMMEDIATE: 159997aacec6SAlexander V. Chernikov BPFD_LOCK(d); 1600df8bae1dSRodney W. Grimes d->bd_immediate = *(u_int *)addr; 160197aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 1602df8bae1dSRodney W. Grimes break; 1603df8bae1dSRodney W. Grimes 1604df8bae1dSRodney W. Grimes case BIOCVERSION: 1605df8bae1dSRodney W. Grimes { 1606df8bae1dSRodney W. Grimes struct bpf_version *bv = (struct bpf_version *)addr; 1607df8bae1dSRodney W. Grimes 1608df8bae1dSRodney W. Grimes bv->bv_major = BPF_MAJOR_VERSION; 1609df8bae1dSRodney W. Grimes bv->bv_minor = BPF_MINOR_VERSION; 1610df8bae1dSRodney W. Grimes break; 1611df8bae1dSRodney W. Grimes } 161200a83887SPaul Traina 1613114ae644SMike Smith /* 1614114ae644SMike Smith * Get "header already complete" flag 1615114ae644SMike Smith */ 1616114ae644SMike Smith case BIOCGHDRCMPLT: 161797aacec6SAlexander V. Chernikov BPFD_LOCK(d); 1618114ae644SMike Smith *(u_int *)addr = d->bd_hdrcmplt; 161997aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 1620114ae644SMike Smith break; 1621114ae644SMike Smith 1622114ae644SMike Smith /* 1623114ae644SMike Smith * Set "header already complete" flag 1624114ae644SMike Smith */ 1625114ae644SMike Smith case BIOCSHDRCMPLT: 162697aacec6SAlexander V. Chernikov BPFD_LOCK(d); 1627114ae644SMike Smith d->bd_hdrcmplt = *(u_int *)addr ? 1 : 0; 162897aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 1629114ae644SMike Smith break; 1630114ae644SMike Smith 16318ed3828cSRobert Watson /* 1632560a54e1SJung-uk Kim * Get packet direction flag 16338ed3828cSRobert Watson */ 1634560a54e1SJung-uk Kim case BIOCGDIRECTION: 163597aacec6SAlexander V. Chernikov BPFD_LOCK(d); 1636560a54e1SJung-uk Kim *(u_int *)addr = d->bd_direction; 163797aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 16388ed3828cSRobert Watson break; 16398ed3828cSRobert Watson 16408ed3828cSRobert Watson /* 1641560a54e1SJung-uk Kim * Set packet direction flag 16428ed3828cSRobert Watson */ 1643560a54e1SJung-uk Kim case BIOCSDIRECTION: 1644560a54e1SJung-uk Kim { 1645560a54e1SJung-uk Kim u_int direction; 1646560a54e1SJung-uk Kim 1647560a54e1SJung-uk Kim direction = *(u_int *)addr; 1648560a54e1SJung-uk Kim switch (direction) { 1649560a54e1SJung-uk Kim case BPF_D_IN: 1650560a54e1SJung-uk Kim case BPF_D_INOUT: 1651560a54e1SJung-uk Kim case BPF_D_OUT: 165297aacec6SAlexander V. Chernikov BPFD_LOCK(d); 1653560a54e1SJung-uk Kim d->bd_direction = direction; 165497aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 1655560a54e1SJung-uk Kim break; 1656560a54e1SJung-uk Kim default: 1657560a54e1SJung-uk Kim error = EINVAL; 1658560a54e1SJung-uk Kim } 1659560a54e1SJung-uk Kim } 1660560a54e1SJung-uk Kim break; 1661560a54e1SJung-uk Kim 1662547d94bdSJung-uk Kim /* 1663d0d7bcdfSJung-uk Kim * Get packet timestamp format and resolution. 1664547d94bdSJung-uk Kim */ 1665547d94bdSJung-uk Kim case BIOCGTSTAMP: 166697aacec6SAlexander V. Chernikov BPFD_LOCK(d); 1667547d94bdSJung-uk Kim *(u_int *)addr = d->bd_tstamp; 166897aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 1669547d94bdSJung-uk Kim break; 1670547d94bdSJung-uk Kim 1671547d94bdSJung-uk Kim /* 1672547d94bdSJung-uk Kim * Set packet timestamp format and resolution. 1673547d94bdSJung-uk Kim */ 1674547d94bdSJung-uk Kim case BIOCSTSTAMP: 1675547d94bdSJung-uk Kim { 1676547d94bdSJung-uk Kim u_int func; 1677547d94bdSJung-uk Kim 1678547d94bdSJung-uk Kim func = *(u_int *)addr; 1679547d94bdSJung-uk Kim if (BPF_T_VALID(func)) 1680547d94bdSJung-uk Kim d->bd_tstamp = func; 1681547d94bdSJung-uk Kim else 1682547d94bdSJung-uk Kim error = EINVAL; 1683547d94bdSJung-uk Kim } 1684547d94bdSJung-uk Kim break; 1685547d94bdSJung-uk Kim 1686560a54e1SJung-uk Kim case BIOCFEEDBACK: 168797aacec6SAlexander V. Chernikov BPFD_LOCK(d); 1688560a54e1SJung-uk Kim d->bd_feedback = *(u_int *)addr; 168997aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 1690560a54e1SJung-uk Kim break; 1691560a54e1SJung-uk Kim 1692560a54e1SJung-uk Kim case BIOCLOCK: 169397aacec6SAlexander V. Chernikov BPFD_LOCK(d); 1694560a54e1SJung-uk Kim d->bd_locked = 1; 169597aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 16968ed3828cSRobert Watson break; 16978ed3828cSRobert Watson 169800a83887SPaul Traina case FIONBIO: /* Non-blocking I/O */ 169900a83887SPaul Traina break; 170000a83887SPaul Traina 170100a83887SPaul Traina case FIOASYNC: /* Send signal on receive packets */ 170297aacec6SAlexander V. Chernikov BPFD_LOCK(d); 170300a83887SPaul Traina d->bd_async = *(int *)addr; 170497aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 170500a83887SPaul Traina break; 170600a83887SPaul Traina 1707831d27a9SDon Lewis case FIOSETOWN: 170897aacec6SAlexander V. Chernikov /* 170997aacec6SAlexander V. Chernikov * XXX: Add some sort of locking here? 171097aacec6SAlexander V. Chernikov * fsetown() can sleep. 171197aacec6SAlexander V. Chernikov */ 1712831d27a9SDon Lewis error = fsetown(*(int *)addr, &d->bd_sigio); 171300a83887SPaul Traina break; 171400a83887SPaul Traina 1715831d27a9SDon Lewis case FIOGETOWN: 171697aacec6SAlexander V. Chernikov BPFD_LOCK(d); 171791e97a82SDon Lewis *(int *)addr = fgetown(&d->bd_sigio); 171897aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 1719831d27a9SDon Lewis break; 1720831d27a9SDon Lewis 1721831d27a9SDon Lewis /* This is deprecated, FIOSETOWN should be used instead. */ 1722831d27a9SDon Lewis case TIOCSPGRP: 1723831d27a9SDon Lewis error = fsetown(-(*(int *)addr), &d->bd_sigio); 1724831d27a9SDon Lewis break; 1725831d27a9SDon Lewis 1726831d27a9SDon Lewis /* This is deprecated, FIOGETOWN should be used instead. */ 172700a83887SPaul Traina case TIOCGPGRP: 172891e97a82SDon Lewis *(int *)addr = -fgetown(&d->bd_sigio); 172900a83887SPaul Traina break; 173000a83887SPaul Traina 173100a83887SPaul Traina case BIOCSRSIG: /* Set receive signal */ 173200a83887SPaul Traina { 173300a83887SPaul Traina u_int sig; 173400a83887SPaul Traina 173500a83887SPaul Traina sig = *(u_int *)addr; 173600a83887SPaul Traina 173700a83887SPaul Traina if (sig >= NSIG) 173800a83887SPaul Traina error = EINVAL; 173997aacec6SAlexander V. Chernikov else { 174097aacec6SAlexander V. Chernikov BPFD_LOCK(d); 174100a83887SPaul Traina d->bd_sig = sig; 174297aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 174397aacec6SAlexander V. Chernikov } 174400a83887SPaul Traina break; 174500a83887SPaul Traina } 174600a83887SPaul Traina case BIOCGRSIG: 174797aacec6SAlexander V. Chernikov BPFD_LOCK(d); 174800a83887SPaul Traina *(u_int *)addr = d->bd_sig; 174997aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 175000a83887SPaul Traina break; 17514d621040SChristian S.J. Peron 17524d621040SChristian S.J. Peron case BIOCGETBUFMODE: 175397aacec6SAlexander V. Chernikov BPFD_LOCK(d); 17544d621040SChristian S.J. Peron *(u_int *)addr = d->bd_bufmode; 175597aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 17564d621040SChristian S.J. Peron break; 17574d621040SChristian S.J. Peron 17584d621040SChristian S.J. Peron case BIOCSETBUFMODE: 17594d621040SChristian S.J. Peron /* 17604d621040SChristian S.J. Peron * Allow the buffering mode to be changed as long as we 17614d621040SChristian S.J. Peron * haven't yet committed to a particular mode. Our 17624d621040SChristian S.J. Peron * definition of commitment, for now, is whether or not a 17634d621040SChristian S.J. Peron * buffer has been allocated or an interface attached, since 17644d621040SChristian S.J. Peron * that's the point where things get tricky. 17654d621040SChristian S.J. Peron */ 17664d621040SChristian S.J. Peron switch (*(u_int *)addr) { 17674d621040SChristian S.J. Peron case BPF_BUFMODE_BUFFER: 17684d621040SChristian S.J. Peron break; 17694d621040SChristian S.J. Peron 17704d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 17714d621040SChristian S.J. Peron if (bpf_zerocopy_enable) 17724d621040SChristian S.J. Peron break; 17734d621040SChristian S.J. Peron /* FALLSTHROUGH */ 17744d621040SChristian S.J. Peron 17754d621040SChristian S.J. Peron default: 17761b610a74SBjoern A. Zeeb CURVNET_RESTORE(); 17774d621040SChristian S.J. Peron return (EINVAL); 17784d621040SChristian S.J. Peron } 17794d621040SChristian S.J. Peron 1780afa85850SAlexander V. Chernikov BPFD_LOCK(d); 17814d621040SChristian S.J. Peron if (d->bd_sbuf != NULL || d->bd_hbuf != NULL || 17824d621040SChristian S.J. Peron d->bd_fbuf != NULL || d->bd_bif != NULL) { 1783afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 17841b610a74SBjoern A. Zeeb CURVNET_RESTORE(); 17854d621040SChristian S.J. Peron return (EBUSY); 17864d621040SChristian S.J. Peron } 17874d621040SChristian S.J. Peron d->bd_bufmode = *(u_int *)addr; 1788afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 17894d621040SChristian S.J. Peron break; 17904d621040SChristian S.J. Peron 17914d621040SChristian S.J. Peron case BIOCGETZMAX: 17921b610a74SBjoern A. Zeeb error = bpf_ioctl_getzmax(td, d, (size_t *)addr); 17931b610a74SBjoern A. Zeeb break; 17944d621040SChristian S.J. Peron 17954d621040SChristian S.J. Peron case BIOCSETZBUF: 17961b610a74SBjoern A. Zeeb error = bpf_ioctl_setzbuf(td, d, (struct bpf_zbuf *)addr); 17971b610a74SBjoern A. Zeeb break; 17984d621040SChristian S.J. Peron 17994d621040SChristian S.J. Peron case BIOCROTZBUF: 18001b610a74SBjoern A. Zeeb error = bpf_ioctl_rotzbuf(td, d, (struct bpf_zbuf *)addr); 18011b610a74SBjoern A. Zeeb break; 1802df8bae1dSRodney W. Grimes } 180397021c24SMarko Zec CURVNET_RESTORE(); 1804df8bae1dSRodney W. Grimes return (error); 1805df8bae1dSRodney W. Grimes } 1806df8bae1dSRodney W. Grimes 1807df8bae1dSRodney W. Grimes /* 1808df8bae1dSRodney W. Grimes * Set d's packet filter program to fp. If this file already has a filter, 1809df8bae1dSRodney W. Grimes * free it and replace it. Returns EINVAL for bogus requests. 1810784292f8SAlexander V. Chernikov * 1811784292f8SAlexander V. Chernikov * Note we need global lock here to serialize bpf_setf() and bpf_setif() calls 1812784292f8SAlexander V. Chernikov * since reading d->bd_bif can't be protected by d or interface lock due to 1813784292f8SAlexander V. Chernikov * lock order. 1814784292f8SAlexander V. Chernikov * 1815784292f8SAlexander V. Chernikov * Additionally, we have to acquire interface write lock due to bpf_mtap() uses 1816784292f8SAlexander V. Chernikov * interface read lock to read all filers. 1817784292f8SAlexander V. Chernikov * 1818df8bae1dSRodney W. Grimes */ 1819f708ef1bSPoul-Henning Kamp static int 182019ba8395SChristian S.J. Peron bpf_setf(struct bpf_d *d, struct bpf_program *fp, u_long cmd) 1821df8bae1dSRodney W. Grimes { 18229b7d4a7fSJung-uk Kim #ifdef COMPAT_FREEBSD32 18239b7d4a7fSJung-uk Kim struct bpf_program fp_swab; 18249b7d4a7fSJung-uk Kim struct bpf_program32 *fp32; 18259b7d4a7fSJung-uk Kim #endif 1826df8bae1dSRodney W. Grimes struct bpf_insn *fcode, *old; 1827293c06a1SRuslan Ermilov #ifdef BPF_JITTER 1828a86227d1SAlexander V. Chernikov bpf_jit_filter *jfunc, *ofunc; 1829ae275efcSJung-uk Kim #endif 18308b04b48aSJung-uk Kim size_t size; 18318b04b48aSJung-uk Kim u_int flen; 18329431cc16SAlexander V. Chernikov int need_upgrade; 1833df8bae1dSRodney W. Grimes 18349b7d4a7fSJung-uk Kim #ifdef COMPAT_FREEBSD32 18356f731135SJung-uk Kim switch (cmd) { 18366f731135SJung-uk Kim case BIOCSETF32: 18376f731135SJung-uk Kim case BIOCSETWF32: 18386f731135SJung-uk Kim case BIOCSETFNR32: 1839fc0a61a4SKonstantin Belousov fp32 = (struct bpf_program32 *)fp; 1840fc0a61a4SKonstantin Belousov fp_swab.bf_len = fp32->bf_len; 1841fc0a61a4SKonstantin Belousov fp_swab.bf_insns = (struct bpf_insn *)(uintptr_t)fp32->bf_insns; 1842fc0a61a4SKonstantin Belousov fp = &fp_swab; 18436f731135SJung-uk Kim switch (cmd) { 18446f731135SJung-uk Kim case BIOCSETF32: 18456f731135SJung-uk Kim cmd = BIOCSETF; 18466f731135SJung-uk Kim break; 18476f731135SJung-uk Kim case BIOCSETWF32: 1848fc0a61a4SKonstantin Belousov cmd = BIOCSETWF; 18496f731135SJung-uk Kim break; 18506f731135SJung-uk Kim } 18516f731135SJung-uk Kim break; 1852fc0a61a4SKonstantin Belousov } 1853fc0a61a4SKonstantin Belousov #endif 18548b04b48aSJung-uk Kim 18558b04b48aSJung-uk Kim fcode = NULL; 18568b04b48aSJung-uk Kim #ifdef BPF_JITTER 18578b04b48aSJung-uk Kim jfunc = ofunc = NULL; 18588b04b48aSJung-uk Kim #endif 18599b7d4a7fSJung-uk Kim need_upgrade = 0; 18608b04b48aSJung-uk Kim 18616c74ff0eSAlexander V. Chernikov /* 18626c74ff0eSAlexander V. Chernikov * Check new filter validness before acquiring any locks. 18636c74ff0eSAlexander V. Chernikov * Allocate memory for new filter, if needed. 18646c74ff0eSAlexander V. Chernikov */ 18656c74ff0eSAlexander V. Chernikov flen = fp->bf_len; 18669b7d4a7fSJung-uk Kim if (flen > bpf_maxinsns || (fp->bf_insns == NULL && flen != 0)) 18676c74ff0eSAlexander V. Chernikov return (EINVAL); 18686c74ff0eSAlexander V. Chernikov size = flen * sizeof(*fp->bf_insns); 1869a86227d1SAlexander V. Chernikov if (size > 0) { 18709b7d4a7fSJung-uk Kim /* We're setting up new filter. Copy and check actual data. */ 18719b7d4a7fSJung-uk Kim fcode = malloc(size, M_BPF, M_WAITOK); 18729b7d4a7fSJung-uk Kim if (copyin(fp->bf_insns, fcode, size) != 0 || 18739b7d4a7fSJung-uk Kim !bpf_validate(fcode, flen)) { 1874a86227d1SAlexander V. Chernikov free(fcode, M_BPF); 1875a86227d1SAlexander V. Chernikov return (EINVAL); 1876a86227d1SAlexander V. Chernikov } 1877c7b0200eSAlexander V. Chernikov #ifdef BPF_JITTER 18789b7d4a7fSJung-uk Kim /* Filter is copied inside fcode and is perfectly valid. */ 1879c7b0200eSAlexander V. Chernikov jfunc = bpf_jitter(fcode, flen); 1880c7b0200eSAlexander V. Chernikov #endif 18818b04b48aSJung-uk Kim } 1882c7b0200eSAlexander V. Chernikov 18836c74ff0eSAlexander V. Chernikov BPF_LOCK(); 18846c74ff0eSAlexander V. Chernikov 1885e4b3229aSAlexander V. Chernikov /* 1886a86227d1SAlexander V. Chernikov * Set up new filter. 18879b7d4a7fSJung-uk Kim * Protect filter change by interface lock. 18886c74ff0eSAlexander V. Chernikov * Additionally, we are protected by global lock here. 1889e4b3229aSAlexander V. Chernikov */ 18906c74ff0eSAlexander V. Chernikov if (d->bd_bif != NULL) 1891e4b3229aSAlexander V. Chernikov BPFIF_WLOCK(d->bd_bif); 1892afa85850SAlexander V. Chernikov BPFD_LOCK(d); 18938b04b48aSJung-uk Kim if (cmd == BIOCSETWF) { 18948b04b48aSJung-uk Kim old = d->bd_wfilter; 189593e39f0bSChristian S.J. Peron d->bd_wfilter = fcode; 18968b04b48aSJung-uk Kim } else { 18978b04b48aSJung-uk Kim old = d->bd_rfilter; 189893e39f0bSChristian S.J. Peron d->bd_rfilter = fcode; 1899293c06a1SRuslan Ermilov #ifdef BPF_JITTER 19008b04b48aSJung-uk Kim ofunc = d->bd_bfilter; 1901c7b0200eSAlexander V. Chernikov d->bd_bfilter = jfunc; 1902ae275efcSJung-uk Kim #endif 1903f11c3508SDavid Malone if (cmd == BIOCSETF) 1904df8bae1dSRodney W. Grimes reset_d(d); 190551ec1eb7SAlexander V. Chernikov 1906402000ffSAlexander V. Chernikov need_upgrade = bpf_check_upgrade(cmd, d, fcode, flen); 19078b04b48aSJung-uk Kim } 1908afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 19096c74ff0eSAlexander V. Chernikov if (d->bd_bif != NULL) 1910e4b3229aSAlexander V. Chernikov BPFIF_WUNLOCK(d->bd_bif); 1911572bde2aSRobert Watson if (old != NULL) 19129b7d4a7fSJung-uk Kim free(old, M_BPF); 1913293c06a1SRuslan Ermilov #ifdef BPF_JITTER 1914ae275efcSJung-uk Kim if (ofunc != NULL) 1915ae275efcSJung-uk Kim bpf_destroy_jit_filter(ofunc); 1916ae275efcSJung-uk Kim #endif 1917df8bae1dSRodney W. Grimes 19189b7d4a7fSJung-uk Kim /* Move d to active readers list. */ 1919402000ffSAlexander V. Chernikov if (need_upgrade != 0) 192051ec1eb7SAlexander V. Chernikov bpf_upgraded(d); 192151ec1eb7SAlexander V. Chernikov 19226c74ff0eSAlexander V. Chernikov BPF_UNLOCK(); 1923df8bae1dSRodney W. Grimes return (0); 1924df8bae1dSRodney W. Grimes } 1925df8bae1dSRodney W. Grimes 1926df8bae1dSRodney W. Grimes /* 1927df8bae1dSRodney W. Grimes * Detach a file from its current interface (if attached at all) and attach 1928df8bae1dSRodney W. Grimes * to the interface indicated by the name stored in ifr. 1929df8bae1dSRodney W. Grimes * Return an errno or 0. 1930df8bae1dSRodney W. Grimes */ 1931df8bae1dSRodney W. Grimes static int 193219ba8395SChristian S.J. Peron bpf_setif(struct bpf_d *d, struct ifreq *ifr) 1933df8bae1dSRodney W. Grimes { 1934df8bae1dSRodney W. Grimes struct bpf_if *bp; 19359b44ff22SGarrett Wollman struct ifnet *theywant; 1936df8bae1dSRodney W. Grimes 19376c74ff0eSAlexander V. Chernikov BPF_LOCK_ASSERT(); 19386c74ff0eSAlexander V. Chernikov 19399b44ff22SGarrett Wollman theywant = ifunit(ifr->ifr_name); 194016d878ccSChristian S.J. Peron if (theywant == NULL || theywant->if_bpf == NULL) 194116d878ccSChristian S.J. Peron return (ENXIO); 19429b44ff22SGarrett Wollman 194316d878ccSChristian S.J. Peron bp = theywant->if_bpf; 19444d621040SChristian S.J. Peron 1945afa85850SAlexander V. Chernikov /* Check if interface is not being detached from BPF */ 1946afa85850SAlexander V. Chernikov BPFIF_RLOCK(bp); 1947b23cbbe6SMark Johnston if (bp->bif_flags & BPFIF_FLAG_DYING) { 1948afa85850SAlexander V. Chernikov BPFIF_RUNLOCK(bp); 1949afa85850SAlexander V. Chernikov return (ENXIO); 1950afa85850SAlexander V. Chernikov } 1951afa85850SAlexander V. Chernikov BPFIF_RUNLOCK(bp); 1952afa85850SAlexander V. Chernikov 1953df8bae1dSRodney W. Grimes /* 19544f42daa4SLuiz Otavio O Souza * At this point, we expect the buffer is already allocated. If not, 19554f42daa4SLuiz Otavio O Souza * return an error. 1956df8bae1dSRodney W. Grimes */ 19574d621040SChristian S.J. Peron switch (d->bd_bufmode) { 19584d621040SChristian S.J. Peron case BPF_BUFMODE_BUFFER: 19594d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 19604d621040SChristian S.J. Peron if (d->bd_sbuf == NULL) 19614d621040SChristian S.J. Peron return (EINVAL); 19624d621040SChristian S.J. Peron break; 19634d621040SChristian S.J. Peron 19644d621040SChristian S.J. Peron default: 19654d621040SChristian S.J. Peron panic("bpf_setif: bufmode %d", d->bd_bufmode); 19664d621040SChristian S.J. Peron } 19676c74ff0eSAlexander V. Chernikov if (bp != d->bd_bif) 1968df8bae1dSRodney W. Grimes bpf_attachd(d, bp); 1969afa85850SAlexander V. Chernikov BPFD_LOCK(d); 1970df8bae1dSRodney W. Grimes reset_d(d); 1971afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 1972df8bae1dSRodney W. Grimes return (0); 1973df8bae1dSRodney W. Grimes } 1974df8bae1dSRodney W. Grimes 1975df8bae1dSRodney W. Grimes /* 1976243ac7d8SPeter Wemm * Support for select() and poll() system calls 1977df8bae1dSRodney W. Grimes * 1978df8bae1dSRodney W. Grimes * Return true iff the specific operation will not block indefinitely. 1979df8bae1dSRodney W. Grimes * Otherwise, return false but make a note that a selwakeup() must be done. 1980df8bae1dSRodney W. Grimes */ 198137c84183SPoul-Henning Kamp static int 198219ba8395SChristian S.J. Peron bpfpoll(struct cdev *dev, int events, struct thread *td) 1983df8bae1dSRodney W. Grimes { 1984e7bb21b3SJonathan Lemon struct bpf_d *d; 19850832fc64SGarance A Drosehn int revents; 1986df8bae1dSRodney W. Grimes 1987136600feSEd Schouten if (devfs_get_cdevpriv((void **)&d) != 0 || d->bd_bif == NULL) 1988136600feSEd Schouten return (events & 1989136600feSEd Schouten (POLLHUP|POLLIN|POLLRDNORM|POLLOUT|POLLWRNORM)); 1990de5d9935SRobert Watson 1991b75a24a0SChristian S.J. Peron /* 1992b75a24a0SChristian S.J. Peron * Refresh PID associated with this descriptor. 1993b75a24a0SChristian S.J. Peron */ 19940832fc64SGarance A Drosehn revents = events & (POLLOUT | POLLWRNORM); 1995afa85850SAlexander V. Chernikov BPFD_LOCK(d); 1996e4b3229aSAlexander V. Chernikov BPF_PID_REFRESH(d, td); 199775c13541SPoul-Henning Kamp if (events & (POLLIN | POLLRDNORM)) { 199895aab9ccSJohn-Mark Gurney if (bpf_ready(d)) 1999243ac7d8SPeter Wemm revents |= events & (POLLIN | POLLRDNORM); 200081bda851SJohn Polstra else { 2001ed01445dSJohn Baldwin selrecord(td, &d->bd_sel); 200281bda851SJohn Polstra /* Start the read timeout if necessary. */ 200381bda851SJohn Polstra if (d->bd_rtout > 0 && d->bd_state == BPF_IDLE) { 200481bda851SJohn Polstra callout_reset(&d->bd_callout, d->bd_rtout, 200581bda851SJohn Polstra bpf_timed_out, d); 200681bda851SJohn Polstra d->bd_state = BPF_WAITING; 200781bda851SJohn Polstra } 200881bda851SJohn Polstra } 200975c13541SPoul-Henning Kamp } 2010afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 2011243ac7d8SPeter Wemm return (revents); 2012df8bae1dSRodney W. Grimes } 2013df8bae1dSRodney W. Grimes 2014df8bae1dSRodney W. Grimes /* 201595aab9ccSJohn-Mark Gurney * Support for kevent() system call. Register EVFILT_READ filters and 201695aab9ccSJohn-Mark Gurney * reject all others. 201795aab9ccSJohn-Mark Gurney */ 201895aab9ccSJohn-Mark Gurney int 201919ba8395SChristian S.J. Peron bpfkqfilter(struct cdev *dev, struct knote *kn) 202095aab9ccSJohn-Mark Gurney { 2021136600feSEd Schouten struct bpf_d *d; 202295aab9ccSJohn-Mark Gurney 2023136600feSEd Schouten if (devfs_get_cdevpriv((void **)&d) != 0 || 2024136600feSEd Schouten kn->kn_filter != EVFILT_READ) 202595aab9ccSJohn-Mark Gurney return (1); 202695aab9ccSJohn-Mark Gurney 2027b75a24a0SChristian S.J. Peron /* 2028b75a24a0SChristian S.J. Peron * Refresh PID associated with this descriptor. 2029b75a24a0SChristian S.J. Peron */ 2030afa85850SAlexander V. Chernikov BPFD_LOCK(d); 2031e4b3229aSAlexander V. Chernikov BPF_PID_REFRESH_CUR(d); 203295aab9ccSJohn-Mark Gurney kn->kn_fop = &bpfread_filtops; 203395aab9ccSJohn-Mark Gurney kn->kn_hook = d; 20344b19419eSChristian S.J. Peron knlist_add(&d->bd_sel.si_note, kn, 1); 2035afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 203695aab9ccSJohn-Mark Gurney 203795aab9ccSJohn-Mark Gurney return (0); 203895aab9ccSJohn-Mark Gurney } 203995aab9ccSJohn-Mark Gurney 204095aab9ccSJohn-Mark Gurney static void 204119ba8395SChristian S.J. Peron filt_bpfdetach(struct knote *kn) 204295aab9ccSJohn-Mark Gurney { 204395aab9ccSJohn-Mark Gurney struct bpf_d *d = (struct bpf_d *)kn->kn_hook; 204495aab9ccSJohn-Mark Gurney 2045ad3b9257SJohn-Mark Gurney knlist_remove(&d->bd_sel.si_note, kn, 0); 204695aab9ccSJohn-Mark Gurney } 204795aab9ccSJohn-Mark Gurney 204895aab9ccSJohn-Mark Gurney static int 204919ba8395SChristian S.J. Peron filt_bpfread(struct knote *kn, long hint) 205095aab9ccSJohn-Mark Gurney { 205195aab9ccSJohn-Mark Gurney struct bpf_d *d = (struct bpf_d *)kn->kn_hook; 205295aab9ccSJohn-Mark Gurney int ready; 205395aab9ccSJohn-Mark Gurney 2054afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 205595aab9ccSJohn-Mark Gurney ready = bpf_ready(d); 205695aab9ccSJohn-Mark Gurney if (ready) { 205795aab9ccSJohn-Mark Gurney kn->kn_data = d->bd_slen; 205892242172SLuiz Otavio O Souza /* 205992242172SLuiz Otavio O Souza * Ignore the hold buffer if it is being copied to user space. 206092242172SLuiz Otavio O Souza */ 206192242172SLuiz Otavio O Souza if (!d->bd_hbuf_in_use && d->bd_hbuf) 206295aab9ccSJohn-Mark Gurney kn->kn_data += d->bd_hlen; 20635d7af3a1SJung-uk Kim } else if (d->bd_rtout > 0 && d->bd_state == BPF_IDLE) { 206495aab9ccSJohn-Mark Gurney callout_reset(&d->bd_callout, d->bd_rtout, 206595aab9ccSJohn-Mark Gurney bpf_timed_out, d); 206695aab9ccSJohn-Mark Gurney d->bd_state = BPF_WAITING; 206795aab9ccSJohn-Mark Gurney } 206895aab9ccSJohn-Mark Gurney 206995aab9ccSJohn-Mark Gurney return (ready); 207095aab9ccSJohn-Mark Gurney } 207195aab9ccSJohn-Mark Gurney 2072253a3814SLawrence Stewart #define BPF_TSTAMP_NONE 0 2073253a3814SLawrence Stewart #define BPF_TSTAMP_FAST 1 2074253a3814SLawrence Stewart #define BPF_TSTAMP_NORMAL 2 2075253a3814SLawrence Stewart #define BPF_TSTAMP_EXTERN 3 2076253a3814SLawrence Stewart 2077253a3814SLawrence Stewart static int 2078253a3814SLawrence Stewart bpf_ts_quality(int tstype) 2079253a3814SLawrence Stewart { 2080253a3814SLawrence Stewart 2081253a3814SLawrence Stewart if (tstype == BPF_T_NONE) 2082253a3814SLawrence Stewart return (BPF_TSTAMP_NONE); 2083253a3814SLawrence Stewart if ((tstype & BPF_T_FAST) != 0) 2084253a3814SLawrence Stewart return (BPF_TSTAMP_FAST); 2085253a3814SLawrence Stewart 2086253a3814SLawrence Stewart return (BPF_TSTAMP_NORMAL); 2087253a3814SLawrence Stewart } 2088253a3814SLawrence Stewart 2089253a3814SLawrence Stewart static int 2090253a3814SLawrence Stewart bpf_gettime(struct bintime *bt, int tstype, struct mbuf *m) 2091253a3814SLawrence Stewart { 2092253a3814SLawrence Stewart struct m_tag *tag; 2093253a3814SLawrence Stewart int quality; 2094253a3814SLawrence Stewart 2095253a3814SLawrence Stewart quality = bpf_ts_quality(tstype); 2096253a3814SLawrence Stewart if (quality == BPF_TSTAMP_NONE) 2097253a3814SLawrence Stewart return (quality); 2098253a3814SLawrence Stewart 2099253a3814SLawrence Stewart if (m != NULL) { 2100253a3814SLawrence Stewart tag = m_tag_locate(m, MTAG_BPF, MTAG_BPF_TIMESTAMP, NULL); 2101253a3814SLawrence Stewart if (tag != NULL) { 2102253a3814SLawrence Stewart *bt = *(struct bintime *)(tag + 1); 2103253a3814SLawrence Stewart return (BPF_TSTAMP_EXTERN); 2104253a3814SLawrence Stewart } 2105253a3814SLawrence Stewart } 2106253a3814SLawrence Stewart if (quality == BPF_TSTAMP_NORMAL) 2107253a3814SLawrence Stewart binuptime(bt); 2108253a3814SLawrence Stewart else 2109253a3814SLawrence Stewart getbinuptime(bt); 2110253a3814SLawrence Stewart 2111253a3814SLawrence Stewart return (quality); 2112253a3814SLawrence Stewart } 2113253a3814SLawrence Stewart 211495aab9ccSJohn-Mark Gurney /* 2115df8bae1dSRodney W. Grimes * Incoming linkage from device drivers. Process the packet pkt, of length 2116df8bae1dSRodney W. Grimes * pktlen, which is stored in a contiguous buffer. The packet is parsed 2117df8bae1dSRodney W. Grimes * by each process' filter, and if accepted, stashed into the corresponding 2118df8bae1dSRodney W. Grimes * buffer. 2119df8bae1dSRodney W. Grimes */ 2120df8bae1dSRodney W. Grimes void 212119ba8395SChristian S.J. Peron bpf_tap(struct bpf_if *bp, u_char *pkt, u_int pktlen) 2122df8bae1dSRodney W. Grimes { 2123547d94bdSJung-uk Kim struct bintime bt; 21248994a245SDag-Erling Smørgrav struct bpf_d *d; 2125a36599ccSJung-uk Kim #ifdef BPF_JITTER 2126a36599ccSJung-uk Kim bpf_jit_filter *bf; 2127a36599ccSJung-uk Kim #endif 2128253a3814SLawrence Stewart u_int slen; 2129253a3814SLawrence Stewart int gottime; 2130e7bb21b3SJonathan Lemon 2131253a3814SLawrence Stewart gottime = BPF_TSTAMP_NONE; 2132e4b3229aSAlexander V. Chernikov 2133e4b3229aSAlexander V. Chernikov BPFIF_RLOCK(bp); 2134e4b3229aSAlexander V. Chernikov 21354a3feeaaSRobert Watson LIST_FOREACH(d, &bp->bif_dlist, bd_next) { 2136e4b3229aSAlexander V. Chernikov /* 2137e4b3229aSAlexander V. Chernikov * We are not using any locks for d here because: 2138e4b3229aSAlexander V. Chernikov * 1) any filter change is protected by interface 2139e4b3229aSAlexander V. Chernikov * write lock 2140e4b3229aSAlexander V. Chernikov * 2) destroying/detaching d is protected by interface 2141e4b3229aSAlexander V. Chernikov * write lock, too 2142e4b3229aSAlexander V. Chernikov */ 2143e4b3229aSAlexander V. Chernikov 2144e4b3229aSAlexander V. Chernikov /* XXX: Do not protect counter for the sake of performance. */ 2145df8bae1dSRodney W. Grimes ++d->bd_rcount; 2146a05cf8c6SChristian S.J. Peron /* 2147a05cf8c6SChristian S.J. Peron * NB: We dont call BPF_CHECK_DIRECTION() here since there is no 2148a05cf8c6SChristian S.J. Peron * way for the caller to indiciate to us whether this packet 2149a05cf8c6SChristian S.J. Peron * is inbound or outbound. In the bpf_mtap() routines, we use 2150a05cf8c6SChristian S.J. Peron * the interface pointers on the mbuf to figure it out. 2151a05cf8c6SChristian S.J. Peron */ 2152ae275efcSJung-uk Kim #ifdef BPF_JITTER 2153a36599ccSJung-uk Kim bf = bpf_jitter_enable != 0 ? d->bd_bfilter : NULL; 2154a36599ccSJung-uk Kim if (bf != NULL) 2155a36599ccSJung-uk Kim slen = (*(bf->func))(pkt, pktlen, pktlen); 2156ae275efcSJung-uk Kim else 2157ae275efcSJung-uk Kim #endif 215893e39f0bSChristian S.J. Peron slen = bpf_filter(d->bd_rfilter, pkt, pktlen, pktlen); 2159ec272d87SRobert Watson if (slen != 0) { 2160e4b3229aSAlexander V. Chernikov /* 2161e4b3229aSAlexander V. Chernikov * Filter matches. Let's to acquire write lock. 2162e4b3229aSAlexander V. Chernikov */ 2163afa85850SAlexander V. Chernikov BPFD_LOCK(d); 2164e4b3229aSAlexander V. Chernikov 216569f7644bSChristian S.J. Peron d->bd_fcount++; 2166253a3814SLawrence Stewart if (gottime < bpf_ts_quality(d->bd_tstamp)) 2167253a3814SLawrence Stewart gottime = bpf_gettime(&bt, d->bd_tstamp, NULL); 2168ec272d87SRobert Watson #ifdef MAC 216930d239bcSRobert Watson if (mac_bpfdesc_check_receive(d, bp->bif_ifp) == 0) 2170ec272d87SRobert Watson #endif 21714d621040SChristian S.J. Peron catchpacket(d, pkt, pktlen, slen, 2172547d94bdSJung-uk Kim bpf_append_bytes, &bt); 2173afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 2174ec272d87SRobert Watson } 2175df8bae1dSRodney W. Grimes } 2176e4b3229aSAlexander V. Chernikov BPFIF_RUNLOCK(bp); 2177df8bae1dSRodney W. Grimes } 2178df8bae1dSRodney W. Grimes 2179f81a2a49SJung-uk Kim #define BPF_CHECK_DIRECTION(d, r, i) \ 2180f81a2a49SJung-uk Kim (((d)->bd_direction == BPF_D_IN && (r) != (i)) || \ 2181f81a2a49SJung-uk Kim ((d)->bd_direction == BPF_D_OUT && (r) == (i))) 2182560a54e1SJung-uk Kim 2183df8bae1dSRodney W. Grimes /* 2184df8bae1dSRodney W. Grimes * Incoming linkage from device drivers, when packet is in an mbuf chain. 2185e4b3229aSAlexander V. Chernikov * Locking model is explained in bpf_tap(). 2186df8bae1dSRodney W. Grimes */ 2187df8bae1dSRodney W. Grimes void 218819ba8395SChristian S.J. Peron bpf_mtap(struct bpf_if *bp, struct mbuf *m) 2189df8bae1dSRodney W. Grimes { 2190547d94bdSJung-uk Kim struct bintime bt; 2191df8bae1dSRodney W. Grimes struct bpf_d *d; 2192a36599ccSJung-uk Kim #ifdef BPF_JITTER 2193a36599ccSJung-uk Kim bpf_jit_filter *bf; 2194a36599ccSJung-uk Kim #endif 2195253a3814SLawrence Stewart u_int pktlen, slen; 2196253a3814SLawrence Stewart int gottime; 219791433904SDavid Malone 21988cd892f7SJung-uk Kim /* Skip outgoing duplicate packets. */ 21998cd892f7SJung-uk Kim if ((m->m_flags & M_PROMISC) != 0 && m->m_pkthdr.rcvif == NULL) { 22008cd892f7SJung-uk Kim m->m_flags &= ~M_PROMISC; 22018cd892f7SJung-uk Kim return; 22028cd892f7SJung-uk Kim } 22038cd892f7SJung-uk Kim 2204f0e2422bSPoul-Henning Kamp pktlen = m_length(m, NULL); 2205253a3814SLawrence Stewart gottime = BPF_TSTAMP_NONE; 2206e4b3229aSAlexander V. Chernikov 2207e4b3229aSAlexander V. Chernikov BPFIF_RLOCK(bp); 2208e4b3229aSAlexander V. Chernikov 22094a3feeaaSRobert Watson LIST_FOREACH(d, &bp->bif_dlist, bd_next) { 2210f81a2a49SJung-uk Kim if (BPF_CHECK_DIRECTION(d, m->m_pkthdr.rcvif, bp->bif_ifp)) 22118ed3828cSRobert Watson continue; 2212df8bae1dSRodney W. Grimes ++d->bd_rcount; 2213ae275efcSJung-uk Kim #ifdef BPF_JITTER 2214a36599ccSJung-uk Kim bf = bpf_jitter_enable != 0 ? d->bd_bfilter : NULL; 2215ae275efcSJung-uk Kim /* XXX We cannot handle multiple mbufs. */ 2216a36599ccSJung-uk Kim if (bf != NULL && m->m_next == NULL) 2217a36599ccSJung-uk Kim slen = (*(bf->func))(mtod(m, u_char *), pktlen, pktlen); 2218ae275efcSJung-uk Kim else 2219ae275efcSJung-uk Kim #endif 222093e39f0bSChristian S.J. Peron slen = bpf_filter(d->bd_rfilter, (u_char *)m, pktlen, 0); 22214ddfb531SChristian S.J. Peron if (slen != 0) { 2222afa85850SAlexander V. Chernikov BPFD_LOCK(d); 2223e4b3229aSAlexander V. Chernikov 222469f7644bSChristian S.J. Peron d->bd_fcount++; 2225253a3814SLawrence Stewart if (gottime < bpf_ts_quality(d->bd_tstamp)) 2226253a3814SLawrence Stewart gottime = bpf_gettime(&bt, d->bd_tstamp, m); 22270c7fb534SRobert Watson #ifdef MAC 222830d239bcSRobert Watson if (mac_bpfdesc_check_receive(d, bp->bif_ifp) == 0) 22290c7fb534SRobert Watson #endif 22300c7fb534SRobert Watson catchpacket(d, (u_char *)m, pktlen, slen, 2231547d94bdSJung-uk Kim bpf_append_mbuf, &bt); 2232afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 22334ddfb531SChristian S.J. Peron } 2234df8bae1dSRodney W. Grimes } 2235e4b3229aSAlexander V. Chernikov BPFIF_RUNLOCK(bp); 2236df8bae1dSRodney W. Grimes } 2237df8bae1dSRodney W. Grimes 2238df8bae1dSRodney W. Grimes /* 2239437ffe18SSam Leffler * Incoming linkage from device drivers, when packet is in 2240437ffe18SSam Leffler * an mbuf chain and to be prepended by a contiguous header. 2241437ffe18SSam Leffler */ 2242437ffe18SSam Leffler void 224319ba8395SChristian S.J. Peron bpf_mtap2(struct bpf_if *bp, void *data, u_int dlen, struct mbuf *m) 2244437ffe18SSam Leffler { 2245547d94bdSJung-uk Kim struct bintime bt; 2246437ffe18SSam Leffler struct mbuf mb; 2247437ffe18SSam Leffler struct bpf_d *d; 2248253a3814SLawrence Stewart u_int pktlen, slen; 2249253a3814SLawrence Stewart int gottime; 225091433904SDavid Malone 22518cd892f7SJung-uk Kim /* Skip outgoing duplicate packets. */ 22528cd892f7SJung-uk Kim if ((m->m_flags & M_PROMISC) != 0 && m->m_pkthdr.rcvif == NULL) { 22538cd892f7SJung-uk Kim m->m_flags &= ~M_PROMISC; 22548cd892f7SJung-uk Kim return; 22558cd892f7SJung-uk Kim } 22568cd892f7SJung-uk Kim 2257437ffe18SSam Leffler pktlen = m_length(m, NULL); 2258437ffe18SSam Leffler /* 2259437ffe18SSam Leffler * Craft on-stack mbuf suitable for passing to bpf_filter. 2260437ffe18SSam Leffler * Note that we cut corners here; we only setup what's 2261437ffe18SSam Leffler * absolutely needed--this mbuf should never go anywhere else. 2262437ffe18SSam Leffler */ 2263437ffe18SSam Leffler mb.m_next = m; 2264437ffe18SSam Leffler mb.m_data = data; 2265437ffe18SSam Leffler mb.m_len = dlen; 2266437ffe18SSam Leffler pktlen += dlen; 2267437ffe18SSam Leffler 2268253a3814SLawrence Stewart gottime = BPF_TSTAMP_NONE; 2269e4b3229aSAlexander V. Chernikov 2270e4b3229aSAlexander V. Chernikov BPFIF_RLOCK(bp); 2271e4b3229aSAlexander V. Chernikov 22724a3feeaaSRobert Watson LIST_FOREACH(d, &bp->bif_dlist, bd_next) { 2273f81a2a49SJung-uk Kim if (BPF_CHECK_DIRECTION(d, m->m_pkthdr.rcvif, bp->bif_ifp)) 2274437ffe18SSam Leffler continue; 2275437ffe18SSam Leffler ++d->bd_rcount; 227693e39f0bSChristian S.J. Peron slen = bpf_filter(d->bd_rfilter, (u_char *)&mb, pktlen, 0); 22774ddfb531SChristian S.J. Peron if (slen != 0) { 2278afa85850SAlexander V. Chernikov BPFD_LOCK(d); 2279e4b3229aSAlexander V. Chernikov 228069f7644bSChristian S.J. Peron d->bd_fcount++; 2281253a3814SLawrence Stewart if (gottime < bpf_ts_quality(d->bd_tstamp)) 2282253a3814SLawrence Stewart gottime = bpf_gettime(&bt, d->bd_tstamp, m); 2283437ffe18SSam Leffler #ifdef MAC 228430d239bcSRobert Watson if (mac_bpfdesc_check_receive(d, bp->bif_ifp) == 0) 2285437ffe18SSam Leffler #endif 2286437ffe18SSam Leffler catchpacket(d, (u_char *)&mb, pktlen, slen, 2287547d94bdSJung-uk Kim bpf_append_mbuf, &bt); 2288afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 22894ddfb531SChristian S.J. Peron } 2290437ffe18SSam Leffler } 2291e4b3229aSAlexander V. Chernikov BPFIF_RUNLOCK(bp); 2292437ffe18SSam Leffler } 2293437ffe18SSam Leffler 2294560a54e1SJung-uk Kim #undef BPF_CHECK_DIRECTION 2295560a54e1SJung-uk Kim 2296253a3814SLawrence Stewart #undef BPF_TSTAMP_NONE 2297253a3814SLawrence Stewart #undef BPF_TSTAMP_FAST 2298253a3814SLawrence Stewart #undef BPF_TSTAMP_NORMAL 2299253a3814SLawrence Stewart #undef BPF_TSTAMP_EXTERN 2300253a3814SLawrence Stewart 2301547d94bdSJung-uk Kim static int 2302547d94bdSJung-uk Kim bpf_hdrlen(struct bpf_d *d) 2303547d94bdSJung-uk Kim { 2304547d94bdSJung-uk Kim int hdrlen; 2305547d94bdSJung-uk Kim 2306547d94bdSJung-uk Kim hdrlen = d->bd_bif->bif_hdrlen; 2307547d94bdSJung-uk Kim #ifndef BURN_BRIDGES 2308547d94bdSJung-uk Kim if (d->bd_tstamp == BPF_T_NONE || 2309547d94bdSJung-uk Kim BPF_T_FORMAT(d->bd_tstamp) == BPF_T_MICROTIME) 2310547d94bdSJung-uk Kim #ifdef COMPAT_FREEBSD32 2311547d94bdSJung-uk Kim if (d->bd_compat32) 2312547d94bdSJung-uk Kim hdrlen += SIZEOF_BPF_HDR(struct bpf_hdr32); 2313547d94bdSJung-uk Kim else 2314547d94bdSJung-uk Kim #endif 2315547d94bdSJung-uk Kim hdrlen += SIZEOF_BPF_HDR(struct bpf_hdr); 2316547d94bdSJung-uk Kim else 2317547d94bdSJung-uk Kim #endif 2318547d94bdSJung-uk Kim hdrlen += SIZEOF_BPF_HDR(struct bpf_xhdr); 2319547d94bdSJung-uk Kim #ifdef COMPAT_FREEBSD32 2320547d94bdSJung-uk Kim if (d->bd_compat32) 2321547d94bdSJung-uk Kim hdrlen = BPF_WORDALIGN32(hdrlen); 2322547d94bdSJung-uk Kim else 2323547d94bdSJung-uk Kim #endif 2324547d94bdSJung-uk Kim hdrlen = BPF_WORDALIGN(hdrlen); 2325547d94bdSJung-uk Kim 2326547d94bdSJung-uk Kim return (hdrlen - d->bd_bif->bif_hdrlen); 2327547d94bdSJung-uk Kim } 2328547d94bdSJung-uk Kim 2329547d94bdSJung-uk Kim static void 2330547d94bdSJung-uk Kim bpf_bintime2ts(struct bintime *bt, struct bpf_ts *ts, int tstype) 2331547d94bdSJung-uk Kim { 2332584b675eSKonstantin Belousov struct bintime bt2, boottimebin; 2333547d94bdSJung-uk Kim struct timeval tsm; 2334547d94bdSJung-uk Kim struct timespec tsn; 2335547d94bdSJung-uk Kim 2336253a3814SLawrence Stewart if ((tstype & BPF_T_MONOTONIC) == 0) { 2337253a3814SLawrence Stewart bt2 = *bt; 2338584b675eSKonstantin Belousov getboottimebin(&boottimebin); 2339253a3814SLawrence Stewart bintime_add(&bt2, &boottimebin); 2340253a3814SLawrence Stewart bt = &bt2; 2341253a3814SLawrence Stewart } 2342547d94bdSJung-uk Kim switch (BPF_T_FORMAT(tstype)) { 2343547d94bdSJung-uk Kim case BPF_T_MICROTIME: 2344547d94bdSJung-uk Kim bintime2timeval(bt, &tsm); 2345547d94bdSJung-uk Kim ts->bt_sec = tsm.tv_sec; 2346547d94bdSJung-uk Kim ts->bt_frac = tsm.tv_usec; 2347547d94bdSJung-uk Kim break; 2348547d94bdSJung-uk Kim case BPF_T_NANOTIME: 2349547d94bdSJung-uk Kim bintime2timespec(bt, &tsn); 2350547d94bdSJung-uk Kim ts->bt_sec = tsn.tv_sec; 2351547d94bdSJung-uk Kim ts->bt_frac = tsn.tv_nsec; 2352547d94bdSJung-uk Kim break; 2353547d94bdSJung-uk Kim case BPF_T_BINTIME: 2354547d94bdSJung-uk Kim ts->bt_sec = bt->sec; 2355547d94bdSJung-uk Kim ts->bt_frac = bt->frac; 2356547d94bdSJung-uk Kim break; 2357547d94bdSJung-uk Kim } 2358547d94bdSJung-uk Kim } 2359547d94bdSJung-uk Kim 2360437ffe18SSam Leffler /* 2361df8bae1dSRodney W. Grimes * Move the packet data from interface memory (pkt) into the 23629e610888SDag-Erling Smørgrav * store buffer. "cpfn" is the routine called to do the actual data 2363df8bae1dSRodney W. Grimes * transfer. bcopy is passed in to copy contiguous chunks, while 23644d621040SChristian S.J. Peron * bpf_append_mbuf is passed in to copy mbuf chains. In the latter case, 2365df8bae1dSRodney W. Grimes * pkt is really an mbuf. 2366df8bae1dSRodney W. Grimes */ 2367df8bae1dSRodney W. Grimes static void 236819ba8395SChristian S.J. Peron catchpacket(struct bpf_d *d, u_char *pkt, u_int pktlen, u_int snaplen, 23694d621040SChristian S.J. Peron void (*cpfn)(struct bpf_d *, caddr_t, u_int, void *, u_int), 2370547d94bdSJung-uk Kim struct bintime *bt) 2371df8bae1dSRodney W. Grimes { 2372547d94bdSJung-uk Kim struct bpf_xhdr hdr; 2373547d94bdSJung-uk Kim #ifndef BURN_BRIDGES 2374547d94bdSJung-uk Kim struct bpf_hdr hdr_old; 2375fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 2376547d94bdSJung-uk Kim struct bpf_hdr32 hdr32_old; 2377fc0a61a4SKonstantin Belousov #endif 2378547d94bdSJung-uk Kim #endif 2379547d94bdSJung-uk Kim int caplen, curlen, hdrlen, totlen; 23807819da79SJohn-Mark Gurney int do_wakeup = 0; 2381547d94bdSJung-uk Kim int do_timestamp; 2382547d94bdSJung-uk Kim int tstype; 23839e610888SDag-Erling Smørgrav 2384afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 23854d621040SChristian S.J. Peron 23864d621040SChristian S.J. Peron /* 23874d621040SChristian S.J. Peron * Detect whether user space has released a buffer back to us, and if 23884d621040SChristian S.J. Peron * so, move it from being a hold buffer to a free buffer. This may 23894d621040SChristian S.J. Peron * not be the best place to do it (for example, we might only want to 23904d621040SChristian S.J. Peron * run this check if we need the space), but for now it's a reliable 23914d621040SChristian S.J. Peron * spot to do it. 23924d621040SChristian S.J. Peron */ 2393fa0c2b34SRobert Watson if (d->bd_fbuf == NULL && bpf_canfreebuf(d)) { 23944d621040SChristian S.J. Peron d->bd_fbuf = d->bd_hbuf; 23954d621040SChristian S.J. Peron d->bd_hbuf = NULL; 23964d621040SChristian S.J. Peron d->bd_hlen = 0; 239729f612ecSChristian S.J. Peron bpf_buf_reclaimed(d); 23984d621040SChristian S.J. Peron } 23994d621040SChristian S.J. Peron 2400df8bae1dSRodney W. Grimes /* 2401df8bae1dSRodney W. Grimes * Figure out how many bytes to move. If the packet is 2402df8bae1dSRodney W. Grimes * greater or equal to the snapshot length, transfer that 2403df8bae1dSRodney W. Grimes * much. Otherwise, transfer the whole packet (unless 2404df8bae1dSRodney W. Grimes * we hit the buffer size limit). 2405df8bae1dSRodney W. Grimes */ 2406547d94bdSJung-uk Kim hdrlen = bpf_hdrlen(d); 2407df8bae1dSRodney W. Grimes totlen = hdrlen + min(snaplen, pktlen); 2408df8bae1dSRodney W. Grimes if (totlen > d->bd_bufsize) 2409df8bae1dSRodney W. Grimes totlen = d->bd_bufsize; 2410df8bae1dSRodney W. Grimes 2411df8bae1dSRodney W. Grimes /* 2412df8bae1dSRodney W. Grimes * Round up the end of the previous packet to the next longword. 2413a7a91e65SRobert Watson * 2414a7a91e65SRobert Watson * Drop the packet if there's no room and no hope of room 2415a7a91e65SRobert Watson * If the packet would overflow the storage buffer or the storage 2416a7a91e65SRobert Watson * buffer is considered immutable by the buffer model, try to rotate 2417a7a91e65SRobert Watson * the buffer and wakeup pending processes. 2418df8bae1dSRodney W. Grimes */ 2419fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 2420fc0a61a4SKonstantin Belousov if (d->bd_compat32) 2421fc0a61a4SKonstantin Belousov curlen = BPF_WORDALIGN32(d->bd_slen); 2422fc0a61a4SKonstantin Belousov else 2423fc0a61a4SKonstantin Belousov #endif 2424df8bae1dSRodney W. Grimes curlen = BPF_WORDALIGN(d->bd_slen); 2425a7a91e65SRobert Watson if (curlen + totlen > d->bd_bufsize || !bpf_canwritebuf(d)) { 2426572bde2aSRobert Watson if (d->bd_fbuf == NULL) { 2427df8bae1dSRodney W. Grimes /* 2428a7a91e65SRobert Watson * There's no room in the store buffer, and no 2429a7a91e65SRobert Watson * prospect of room, so drop the packet. Notify the 2430a7a91e65SRobert Watson * buffer model. 2431df8bae1dSRodney W. Grimes */ 2432a7a91e65SRobert Watson bpf_buffull(d); 2433df8bae1dSRodney W. Grimes ++d->bd_dcount; 2434df8bae1dSRodney W. Grimes return; 2435df8bae1dSRodney W. Grimes } 243698fa5d85SLuiz Otavio O Souza KASSERT(!d->bd_hbuf_in_use, ("hold buffer is in use")); 2437df8bae1dSRodney W. Grimes ROTATE_BUFFERS(d); 24387819da79SJohn-Mark Gurney do_wakeup = 1; 2439df8bae1dSRodney W. Grimes curlen = 0; 2440a7a91e65SRobert Watson } else if (d->bd_immediate || d->bd_state == BPF_TIMED_OUT) 2441df8bae1dSRodney W. Grimes /* 24424d621040SChristian S.J. Peron * Immediate mode is set, or the read timeout has already 24434d621040SChristian S.J. Peron * expired during a select call. A packet arrived, so the 24444d621040SChristian S.J. Peron * reader should be woken up. 2445df8bae1dSRodney W. Grimes */ 24467819da79SJohn-Mark Gurney do_wakeup = 1; 2447547d94bdSJung-uk Kim caplen = totlen - hdrlen; 2448547d94bdSJung-uk Kim tstype = d->bd_tstamp; 2449547d94bdSJung-uk Kim do_timestamp = tstype != BPF_T_NONE; 2450547d94bdSJung-uk Kim #ifndef BURN_BRIDGES 2451547d94bdSJung-uk Kim if (tstype == BPF_T_NONE || BPF_T_FORMAT(tstype) == BPF_T_MICROTIME) { 2452547d94bdSJung-uk Kim struct bpf_ts ts; 2453547d94bdSJung-uk Kim if (do_timestamp) 2454547d94bdSJung-uk Kim bpf_bintime2ts(bt, &ts, tstype); 2455fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 2456fc0a61a4SKonstantin Belousov if (d->bd_compat32) { 2457547d94bdSJung-uk Kim bzero(&hdr32_old, sizeof(hdr32_old)); 2458547d94bdSJung-uk Kim if (do_timestamp) { 2459547d94bdSJung-uk Kim hdr32_old.bh_tstamp.tv_sec = ts.bt_sec; 2460547d94bdSJung-uk Kim hdr32_old.bh_tstamp.tv_usec = ts.bt_frac; 2461547d94bdSJung-uk Kim } 2462547d94bdSJung-uk Kim hdr32_old.bh_datalen = pktlen; 2463547d94bdSJung-uk Kim hdr32_old.bh_hdrlen = hdrlen; 2464547d94bdSJung-uk Kim hdr32_old.bh_caplen = caplen; 2465547d94bdSJung-uk Kim bpf_append_bytes(d, d->bd_sbuf, curlen, &hdr32_old, 2466547d94bdSJung-uk Kim sizeof(hdr32_old)); 2467547d94bdSJung-uk Kim goto copy; 2468547d94bdSJung-uk Kim } 2469547d94bdSJung-uk Kim #endif 2470547d94bdSJung-uk Kim bzero(&hdr_old, sizeof(hdr_old)); 2471547d94bdSJung-uk Kim if (do_timestamp) { 2472547d94bdSJung-uk Kim hdr_old.bh_tstamp.tv_sec = ts.bt_sec; 2473547d94bdSJung-uk Kim hdr_old.bh_tstamp.tv_usec = ts.bt_frac; 2474547d94bdSJung-uk Kim } 2475547d94bdSJung-uk Kim hdr_old.bh_datalen = pktlen; 2476547d94bdSJung-uk Kim hdr_old.bh_hdrlen = hdrlen; 2477547d94bdSJung-uk Kim hdr_old.bh_caplen = caplen; 2478547d94bdSJung-uk Kim bpf_append_bytes(d, d->bd_sbuf, curlen, &hdr_old, 2479547d94bdSJung-uk Kim sizeof(hdr_old)); 2480fc0a61a4SKonstantin Belousov goto copy; 2481fc0a61a4SKonstantin Belousov } 2482fc0a61a4SKonstantin Belousov #endif 2483df8bae1dSRodney W. Grimes 2484df8bae1dSRodney W. Grimes /* 24854d621040SChristian S.J. Peron * Append the bpf header. Note we append the actual header size, but 24864d621040SChristian S.J. Peron * move forward the length of the header plus padding. 2487df8bae1dSRodney W. Grimes */ 24884d621040SChristian S.J. Peron bzero(&hdr, sizeof(hdr)); 2489547d94bdSJung-uk Kim if (do_timestamp) 2490547d94bdSJung-uk Kim bpf_bintime2ts(bt, &hdr.bh_tstamp, tstype); 24914d621040SChristian S.J. Peron hdr.bh_datalen = pktlen; 24924d621040SChristian S.J. Peron hdr.bh_hdrlen = hdrlen; 2493547d94bdSJung-uk Kim hdr.bh_caplen = caplen; 24944d621040SChristian S.J. Peron bpf_append_bytes(d, d->bd_sbuf, curlen, &hdr, sizeof(hdr)); 24954d621040SChristian S.J. Peron 2496df8bae1dSRodney W. Grimes /* 2497df8bae1dSRodney W. Grimes * Copy the packet data into the store buffer and update its length. 2498df8bae1dSRodney W. Grimes */ 2499547d94bdSJung-uk Kim #ifndef BURN_BRIDGES 2500fc0a61a4SKonstantin Belousov copy: 2501fc0a61a4SKonstantin Belousov #endif 2502547d94bdSJung-uk Kim (*cpfn)(d, d->bd_sbuf, curlen + hdrlen, pkt, caplen); 2503df8bae1dSRodney W. Grimes d->bd_slen = curlen + totlen; 25047819da79SJohn-Mark Gurney 25057819da79SJohn-Mark Gurney if (do_wakeup) 25067819da79SJohn-Mark Gurney bpf_wakeup(d); 2507df8bae1dSRodney W. Grimes } 2508df8bae1dSRodney W. Grimes 2509df8bae1dSRodney W. Grimes /* 2510df8bae1dSRodney W. Grimes * Free buffers currently in use by a descriptor. 2511df8bae1dSRodney W. Grimes * Called on close. 2512df8bae1dSRodney W. Grimes */ 2513df8bae1dSRodney W. Grimes static void 251419ba8395SChristian S.J. Peron bpf_freed(struct bpf_d *d) 2515df8bae1dSRodney W. Grimes { 25164d621040SChristian S.J. Peron 2517df8bae1dSRodney W. Grimes /* 2518df8bae1dSRodney W. Grimes * We don't need to lock out interrupts since this descriptor has 2519df8bae1dSRodney W. Grimes * been detached from its interface and it yet hasn't been marked 2520df8bae1dSRodney W. Grimes * free. 2521df8bae1dSRodney W. Grimes */ 25224d621040SChristian S.J. Peron bpf_free(d); 252370485847SJung-uk Kim if (d->bd_rfilter != NULL) { 252493e39f0bSChristian S.J. Peron free((caddr_t)d->bd_rfilter, M_BPF); 2525ae275efcSJung-uk Kim #ifdef BPF_JITTER 252670485847SJung-uk Kim if (d->bd_bfilter != NULL) 2527ae275efcSJung-uk Kim bpf_destroy_jit_filter(d->bd_bfilter); 2528ae275efcSJung-uk Kim #endif 2529ae275efcSJung-uk Kim } 253070485847SJung-uk Kim if (d->bd_wfilter != NULL) 253193e39f0bSChristian S.J. Peron free((caddr_t)d->bd_wfilter, M_BPF); 2532afa85850SAlexander V. Chernikov mtx_destroy(&d->bd_lock); 2533df8bae1dSRodney W. Grimes } 2534df8bae1dSRodney W. Grimes 2535df8bae1dSRodney W. Grimes /* 253624a229f4SSam Leffler * Attach an interface to bpf. dlt is the link layer type; hdrlen is the 253724a229f4SSam Leffler * fixed size of the link header (variable length headers not yet supported). 2538df8bae1dSRodney W. Grimes */ 2539df8bae1dSRodney W. Grimes void 254019ba8395SChristian S.J. Peron bpfattach(struct ifnet *ifp, u_int dlt, u_int hdrlen) 2541df8bae1dSRodney W. Grimes { 254224a229f4SSam Leffler 254324a229f4SSam Leffler bpfattach2(ifp, dlt, hdrlen, &ifp->if_bpf); 254424a229f4SSam Leffler } 254524a229f4SSam Leffler 254624a229f4SSam Leffler /* 254724a229f4SSam Leffler * Attach an interface to bpf. ifp is a pointer to the structure 254824a229f4SSam Leffler * defining the interface to be attached, dlt is the link layer type, 254924a229f4SSam Leffler * and hdrlen is the fixed size of the link header (variable length 255024a229f4SSam Leffler * headers are not yet supporrted). 255124a229f4SSam Leffler */ 255224a229f4SSam Leffler void 255319ba8395SChristian S.J. Peron bpfattach2(struct ifnet *ifp, u_int dlt, u_int hdrlen, struct bpf_if **driverp) 255424a229f4SSam Leffler { 2555df8bae1dSRodney W. Grimes struct bpf_if *bp; 255619ba8395SChristian S.J. Peron 255719ba8395SChristian S.J. Peron bp = malloc(sizeof(*bp), M_BPF, M_NOWAIT | M_ZERO); 2558572bde2aSRobert Watson if (bp == NULL) 2559df8bae1dSRodney W. Grimes panic("bpfattach"); 2560df8bae1dSRodney W. Grimes 25614a3feeaaSRobert Watson LIST_INIT(&bp->bif_dlist); 256251ec1eb7SAlexander V. Chernikov LIST_INIT(&bp->bif_wlist); 2563df8bae1dSRodney W. Grimes bp->bif_ifp = ifp; 2564df8bae1dSRodney W. Grimes bp->bif_dlt = dlt; 2565e4b3229aSAlexander V. Chernikov rw_init(&bp->bif_lock, "bpf interface lock"); 256616d878ccSChristian S.J. Peron KASSERT(*driverp == NULL, ("bpfattach2: driverp already initialized")); 2567*9ce40d32SKristof Provost bp->bif_bpf = driverp; 256816d878ccSChristian S.J. Peron *driverp = bp; 2569df8bae1dSRodney W. Grimes 2570e4b3229aSAlexander V. Chernikov BPF_LOCK(); 25714a3feeaaSRobert Watson LIST_INSERT_HEAD(&bpf_iflist, bp, bif_next); 2572e4b3229aSAlexander V. Chernikov BPF_UNLOCK(); 2573df8bae1dSRodney W. Grimes 2574547d94bdSJung-uk Kim bp->bif_hdrlen = hdrlen; 2575df8bae1dSRodney W. Grimes 2576616bc4f4SBjoern A. Zeeb if (bootverbose && IS_DEFAULT_VNET(curvnet)) 257724a229f4SSam Leffler if_printf(ifp, "bpf attached\n"); 2578df8bae1dSRodney W. Grimes } 257953ac6efbSJulian Elischer 258005fc4164SBjoern A. Zeeb #ifdef VIMAGE 258105fc4164SBjoern A. Zeeb /* 258205fc4164SBjoern A. Zeeb * When moving interfaces between vnet instances we need a way to 258305fc4164SBjoern A. Zeeb * query the dlt and hdrlen before detach so we can re-attch the if_bpf 258405fc4164SBjoern A. Zeeb * after the vmove. We unfortunately have no device driver infrastructure 258505fc4164SBjoern A. Zeeb * to query the interface for these values after creation/attach, thus 258605fc4164SBjoern A. Zeeb * add this as a workaround. 258705fc4164SBjoern A. Zeeb */ 258805fc4164SBjoern A. Zeeb int 258905fc4164SBjoern A. Zeeb bpf_get_bp_params(struct bpf_if *bp, u_int *bif_dlt, u_int *bif_hdrlen) 259005fc4164SBjoern A. Zeeb { 259105fc4164SBjoern A. Zeeb 259205fc4164SBjoern A. Zeeb if (bp == NULL) 259305fc4164SBjoern A. Zeeb return (ENXIO); 259405fc4164SBjoern A. Zeeb if (bif_dlt == NULL && bif_hdrlen == NULL) 259505fc4164SBjoern A. Zeeb return (0); 259605fc4164SBjoern A. Zeeb 259705fc4164SBjoern A. Zeeb if (bif_dlt != NULL) 259805fc4164SBjoern A. Zeeb *bif_dlt = bp->bif_dlt; 259905fc4164SBjoern A. Zeeb if (bif_hdrlen != NULL) 260005fc4164SBjoern A. Zeeb *bif_hdrlen = bp->bif_hdrlen; 260105fc4164SBjoern A. Zeeb 260205fc4164SBjoern A. Zeeb return (0); 260305fc4164SBjoern A. Zeeb } 260405fc4164SBjoern A. Zeeb #endif 260505fc4164SBjoern A. Zeeb 2606de5d9935SRobert Watson /* 2607de5d9935SRobert Watson * Detach bpf from an interface. This involves detaching each descriptor 26086c74ff0eSAlexander V. Chernikov * associated with the interface. Notify each descriptor as it's detached 26096c74ff0eSAlexander V. Chernikov * so that any sleepers wake up and get ENXIO. 2610de5d9935SRobert Watson */ 2611de5d9935SRobert Watson void 261219ba8395SChristian S.J. Peron bpfdetach(struct ifnet *ifp) 2613de5d9935SRobert Watson { 2614f079a0faSAlexander V. Chernikov struct bpf_if *bp, *bp_temp; 2615de5d9935SRobert Watson struct bpf_d *d; 26169a7e6bacSLawrence Stewart int ndetached; 2617de5d9935SRobert Watson 26189a7e6bacSLawrence Stewart ndetached = 0; 26199a7e6bacSLawrence Stewart 2620afa85850SAlexander V. Chernikov BPF_LOCK(); 26219a7e6bacSLawrence Stewart /* Find all bpf_if struct's which reference ifp and detach them. */ 2622f079a0faSAlexander V. Chernikov LIST_FOREACH_SAFE(bp, &bpf_iflist, bif_next, bp_temp) { 2623f079a0faSAlexander V. Chernikov if (ifp != bp->bif_ifp) 2624f079a0faSAlexander V. Chernikov continue; 2625de5d9935SRobert Watson 2626f079a0faSAlexander V. Chernikov LIST_REMOVE(bp, bif_next); 2627f079a0faSAlexander V. Chernikov /* Add to to-be-freed list */ 2628f079a0faSAlexander V. Chernikov LIST_INSERT_HEAD(&bpf_freelist, bp, bif_next); 2629f079a0faSAlexander V. Chernikov 26309a7e6bacSLawrence Stewart ndetached++; 2631f079a0faSAlexander V. Chernikov /* 2632f079a0faSAlexander V. Chernikov * Delay freeing bp till interface is detached 2633f079a0faSAlexander V. Chernikov * and all routes through this interface are removed. 2634f079a0faSAlexander V. Chernikov * Mark bp as detached to restrict new consumers. 2635f079a0faSAlexander V. Chernikov */ 2636f079a0faSAlexander V. Chernikov BPFIF_WLOCK(bp); 2637b23cbbe6SMark Johnston bp->bif_flags |= BPFIF_FLAG_DYING; 2638*9ce40d32SKristof Provost *bp->bif_bpf = NULL; 2639f079a0faSAlexander V. Chernikov BPFIF_WUNLOCK(bp); 2640f079a0faSAlexander V. Chernikov 2641f079a0faSAlexander V. Chernikov CTR4(KTR_NET, "%s: sheduling free for encap %d (%p) for if %p", 2642f079a0faSAlexander V. Chernikov __func__, bp->bif_dlt, bp, ifp); 2643f079a0faSAlexander V. Chernikov 2644f079a0faSAlexander V. Chernikov /* Free common descriptors */ 26454a3feeaaSRobert Watson while ((d = LIST_FIRST(&bp->bif_dlist)) != NULL) { 2646afa85850SAlexander V. Chernikov bpf_detachd_locked(d); 2647afa85850SAlexander V. Chernikov BPFD_LOCK(d); 2648e7bb21b3SJonathan Lemon bpf_wakeup(d); 2649afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 2650e7bb21b3SJonathan Lemon } 2651f079a0faSAlexander V. Chernikov 26526c74ff0eSAlexander V. Chernikov /* Free writer-only descriptors */ 26536c74ff0eSAlexander V. Chernikov while ((d = LIST_FIRST(&bp->bif_wlist)) != NULL) { 2654afa85850SAlexander V. Chernikov bpf_detachd_locked(d); 2655afa85850SAlexander V. Chernikov BPFD_LOCK(d); 26566c74ff0eSAlexander V. Chernikov bpf_wakeup(d); 2657afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 26586c74ff0eSAlexander V. Chernikov } 26598eab61f3SSam Leffler } 2660afa85850SAlexander V. Chernikov BPF_UNLOCK(); 26619a7e6bacSLawrence Stewart 26629a7e6bacSLawrence Stewart #ifdef INVARIANTS 26639a7e6bacSLawrence Stewart if (ndetached == 0) 26649a7e6bacSLawrence Stewart printf("bpfdetach: %s was not attached\n", ifp->if_xname); 26659a7e6bacSLawrence Stewart #endif 26669a7e6bacSLawrence Stewart } 2667de5d9935SRobert Watson 26688eab61f3SSam Leffler /* 2669784292f8SAlexander V. Chernikov * Interface departure handler. 26704fe83b81SAlexander V. Chernikov * Note departure event does not guarantee interface is going down. 2671f079a0faSAlexander V. Chernikov * Interface renaming is currently done via departure/arrival event set. 2672f079a0faSAlexander V. Chernikov * 2673f079a0faSAlexander V. Chernikov * Departure handled is called after all routes pointing to 2674f079a0faSAlexander V. Chernikov * given interface are removed and interface is in down state 2675f079a0faSAlexander V. Chernikov * restricting any packets to be sent/received. We assume it is now safe 2676f079a0faSAlexander V. Chernikov * to free data allocated by BPF. 2677afa85850SAlexander V. Chernikov */ 2678afa85850SAlexander V. Chernikov static void 2679afa85850SAlexander V. Chernikov bpf_ifdetach(void *arg __unused, struct ifnet *ifp) 2680afa85850SAlexander V. Chernikov { 2681f079a0faSAlexander V. Chernikov struct bpf_if *bp, *bp_temp; 2682f079a0faSAlexander V. Chernikov int nmatched = 0; 2683afa85850SAlexander V. Chernikov 2684250a8e27SAndrey V. Elsukov /* Ignore ifnet renaming. */ 2685250a8e27SAndrey V. Elsukov if (ifp->if_flags & IFF_RENAMING) 2686250a8e27SAndrey V. Elsukov return; 2687250a8e27SAndrey V. Elsukov 2688784292f8SAlexander V. Chernikov BPF_LOCK(); 2689f079a0faSAlexander V. Chernikov /* 2690f079a0faSAlexander V. Chernikov * Find matching entries in free list. 2691f079a0faSAlexander V. Chernikov * Nothing should be found if bpfdetach() was not called. 2692f079a0faSAlexander V. Chernikov */ 2693f079a0faSAlexander V. Chernikov LIST_FOREACH_SAFE(bp, &bpf_freelist, bif_next, bp_temp) { 2694f079a0faSAlexander V. Chernikov if (ifp != bp->bif_ifp) 2695f079a0faSAlexander V. Chernikov continue; 2696784292f8SAlexander V. Chernikov 2697f079a0faSAlexander V. Chernikov CTR3(KTR_NET, "%s: freeing BPF instance %p for interface %p", 2698afa85850SAlexander V. Chernikov __func__, bp, ifp); 2699afa85850SAlexander V. Chernikov 2700f079a0faSAlexander V. Chernikov LIST_REMOVE(bp, bif_next); 2701784292f8SAlexander V. Chernikov 2702afa85850SAlexander V. Chernikov rw_destroy(&bp->bif_lock); 2703afa85850SAlexander V. Chernikov free(bp, M_BPF); 2704f079a0faSAlexander V. Chernikov 2705f079a0faSAlexander V. Chernikov nmatched++; 2706f079a0faSAlexander V. Chernikov } 2707f079a0faSAlexander V. Chernikov BPF_UNLOCK(); 2708afa85850SAlexander V. Chernikov } 2709afa85850SAlexander V. Chernikov 2710afa85850SAlexander V. Chernikov /* 27118eab61f3SSam Leffler * Get a list of available data link type of the interface. 27128eab61f3SSam Leffler */ 27138eab61f3SSam Leffler static int 271419ba8395SChristian S.J. Peron bpf_getdltlist(struct bpf_d *d, struct bpf_dltlist *bfl) 27158eab61f3SSam Leffler { 27168eab61f3SSam Leffler struct ifnet *ifp; 27178eab61f3SSam Leffler struct bpf_if *bp; 271870209acaSKonstantin Belousov u_int *lst; 271970209acaSKonstantin Belousov int error, n, n1; 27208eab61f3SSam Leffler 272197aacec6SAlexander V. Chernikov BPF_LOCK_ASSERT(); 272297aacec6SAlexander V. Chernikov 27238eab61f3SSam Leffler ifp = d->bd_bif->bif_ifp; 272470209acaSKonstantin Belousov again: 272570209acaSKonstantin Belousov n1 = 0; 272670209acaSKonstantin Belousov LIST_FOREACH(bp, &bpf_iflist, bif_next) { 272770209acaSKonstantin Belousov if (bp->bif_ifp == ifp) 272870209acaSKonstantin Belousov n1++; 272970209acaSKonstantin Belousov } 273070209acaSKonstantin Belousov if (bfl->bfl_list == NULL) { 273170209acaSKonstantin Belousov bfl->bfl_len = n1; 273270209acaSKonstantin Belousov return (0); 273370209acaSKonstantin Belousov } 273470209acaSKonstantin Belousov if (n1 > bfl->bfl_len) 273570209acaSKonstantin Belousov return (ENOMEM); 273670209acaSKonstantin Belousov BPF_UNLOCK(); 273770209acaSKonstantin Belousov lst = malloc(n1 * sizeof(u_int), M_TEMP, M_WAITOK); 27388eab61f3SSam Leffler n = 0; 273970209acaSKonstantin Belousov BPF_LOCK(); 27404a3feeaaSRobert Watson LIST_FOREACH(bp, &bpf_iflist, bif_next) { 27418eab61f3SSam Leffler if (bp->bif_ifp != ifp) 27428eab61f3SSam Leffler continue; 27435412ec6eSConrad Meyer if (n >= n1) { 274470209acaSKonstantin Belousov free(lst, M_TEMP); 274570209acaSKonstantin Belousov goto again; 27468eab61f3SSam Leffler } 274770209acaSKonstantin Belousov lst[n] = bp->bif_dlt; 27488eab61f3SSam Leffler n++; 27498eab61f3SSam Leffler } 275070209acaSKonstantin Belousov BPF_UNLOCK(); 275170209acaSKonstantin Belousov error = copyout(lst, bfl->bfl_list, sizeof(u_int) * n); 275270209acaSKonstantin Belousov free(lst, M_TEMP); 275370209acaSKonstantin Belousov BPF_LOCK(); 27548eab61f3SSam Leffler bfl->bfl_len = n; 27558eab61f3SSam Leffler return (error); 27568eab61f3SSam Leffler } 27578eab61f3SSam Leffler 27588eab61f3SSam Leffler /* 27598eab61f3SSam Leffler * Set the data link type of a BPF instance. 27608eab61f3SSam Leffler */ 27618eab61f3SSam Leffler static int 276219ba8395SChristian S.J. Peron bpf_setdlt(struct bpf_d *d, u_int dlt) 27638eab61f3SSam Leffler { 27648eab61f3SSam Leffler int error, opromisc; 27658eab61f3SSam Leffler struct ifnet *ifp; 27668eab61f3SSam Leffler struct bpf_if *bp; 27678eab61f3SSam Leffler 27686c74ff0eSAlexander V. Chernikov BPF_LOCK_ASSERT(); 27696c74ff0eSAlexander V. Chernikov 27708eab61f3SSam Leffler if (d->bd_bif->bif_dlt == dlt) 27718eab61f3SSam Leffler return (0); 27728eab61f3SSam Leffler ifp = d->bd_bif->bif_ifp; 27736c74ff0eSAlexander V. Chernikov 27744a3feeaaSRobert Watson LIST_FOREACH(bp, &bpf_iflist, bif_next) { 27758eab61f3SSam Leffler if (bp->bif_ifp == ifp && bp->bif_dlt == dlt) 27768eab61f3SSam Leffler break; 27778eab61f3SSam Leffler } 27786c74ff0eSAlexander V. Chernikov 27798eab61f3SSam Leffler if (bp != NULL) { 27808eab61f3SSam Leffler opromisc = d->bd_promisc; 27818eab61f3SSam Leffler bpf_attachd(d, bp); 2782afa85850SAlexander V. Chernikov BPFD_LOCK(d); 27838eab61f3SSam Leffler reset_d(d); 2784afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 27858eab61f3SSam Leffler if (opromisc) { 27868eab61f3SSam Leffler error = ifpromisc(bp->bif_ifp, 1); 27878eab61f3SSam Leffler if (error) 27888eab61f3SSam Leffler if_printf(bp->bif_ifp, 27898eab61f3SSam Leffler "bpf_setdlt: ifpromisc failed (%d)\n", 27908eab61f3SSam Leffler error); 27918eab61f3SSam Leffler else 27928eab61f3SSam Leffler d->bd_promisc = 1; 27938eab61f3SSam Leffler } 27948eab61f3SSam Leffler } 27958eab61f3SSam Leffler return (bp == NULL ? EINVAL : 0); 2796de5d9935SRobert Watson } 2797de5d9935SRobert Watson 27983f54a085SPoul-Henning Kamp static void 279919ba8395SChristian S.J. Peron bpf_drvinit(void *unused) 280053ac6efbSJulian Elischer { 2801136600feSEd Schouten struct cdev *dev; 280253ac6efbSJulian Elischer 28036008862bSJohn Baldwin mtx_init(&bpf_mtx, "bpf global lock", NULL, MTX_DEF); 28044a3feeaaSRobert Watson LIST_INIT(&bpf_iflist); 2805f079a0faSAlexander V. Chernikov LIST_INIT(&bpf_freelist); 2806136600feSEd Schouten 2807136600feSEd Schouten dev = make_dev(&bpf_cdevsw, 0, UID_ROOT, GID_WHEEL, 0600, "bpf"); 2808136600feSEd Schouten /* For compatibility */ 2809136600feSEd Schouten make_dev_alias(dev, "bpf0"); 2810afa85850SAlexander V. Chernikov 2811afa85850SAlexander V. Chernikov /* Register interface departure handler */ 2812afa85850SAlexander V. Chernikov bpf_ifdetach_cookie = EVENTHANDLER_REGISTER( 2813afa85850SAlexander V. Chernikov ifnet_departure_event, bpf_ifdetach, NULL, 2814afa85850SAlexander V. Chernikov EVENTHANDLER_PRI_ANY); 28157198bf47SJulian Elischer } 281653ac6efbSJulian Elischer 28170e37f3e1SChristian S.J. Peron /* 28180e37f3e1SChristian S.J. Peron * Zero out the various packet counters associated with all of the bpf 28190e37f3e1SChristian S.J. Peron * descriptors. At some point, we will probably want to get a bit more 28200e37f3e1SChristian S.J. Peron * granular and allow the user to specify descriptors to be zeroed. 28210e37f3e1SChristian S.J. Peron */ 28220e37f3e1SChristian S.J. Peron static void 28230e37f3e1SChristian S.J. Peron bpf_zero_counters(void) 28240e37f3e1SChristian S.J. Peron { 28250e37f3e1SChristian S.J. Peron struct bpf_if *bp; 28260e37f3e1SChristian S.J. Peron struct bpf_d *bd; 28270e37f3e1SChristian S.J. Peron 2828e4b3229aSAlexander V. Chernikov BPF_LOCK(); 28290e37f3e1SChristian S.J. Peron LIST_FOREACH(bp, &bpf_iflist, bif_next) { 2830e4b3229aSAlexander V. Chernikov BPFIF_RLOCK(bp); 28310e37f3e1SChristian S.J. Peron LIST_FOREACH(bd, &bp->bif_dlist, bd_next) { 2832afa85850SAlexander V. Chernikov BPFD_LOCK(bd); 28330e37f3e1SChristian S.J. Peron bd->bd_rcount = 0; 28340e37f3e1SChristian S.J. Peron bd->bd_dcount = 0; 28350e37f3e1SChristian S.J. Peron bd->bd_fcount = 0; 28360e37f3e1SChristian S.J. Peron bd->bd_wcount = 0; 28370e37f3e1SChristian S.J. Peron bd->bd_wfcount = 0; 28380e37f3e1SChristian S.J. Peron bd->bd_zcopy = 0; 2839afa85850SAlexander V. Chernikov BPFD_UNLOCK(bd); 28400e37f3e1SChristian S.J. Peron } 2841e4b3229aSAlexander V. Chernikov BPFIF_RUNLOCK(bp); 28420e37f3e1SChristian S.J. Peron } 2843e4b3229aSAlexander V. Chernikov BPF_UNLOCK(); 28440e37f3e1SChristian S.J. Peron } 28450e37f3e1SChristian S.J. Peron 28466c74ff0eSAlexander V. Chernikov /* 28476c74ff0eSAlexander V. Chernikov * Fill filter statistics 28486c74ff0eSAlexander V. Chernikov */ 284969f7644bSChristian S.J. Peron static void 285069f7644bSChristian S.J. Peron bpfstats_fill_xbpf(struct xbpf_d *d, struct bpf_d *bd) 285169f7644bSChristian S.J. Peron { 285269f7644bSChristian S.J. Peron 285369f7644bSChristian S.J. Peron bzero(d, sizeof(*d)); 285469f7644bSChristian S.J. Peron BPFD_LOCK_ASSERT(bd); 28554d621040SChristian S.J. Peron d->bd_structsize = sizeof(*d); 28566c74ff0eSAlexander V. Chernikov /* XXX: reading should be protected by global lock */ 285769f7644bSChristian S.J. Peron d->bd_immediate = bd->bd_immediate; 285869f7644bSChristian S.J. Peron d->bd_promisc = bd->bd_promisc; 285969f7644bSChristian S.J. Peron d->bd_hdrcmplt = bd->bd_hdrcmplt; 2860560a54e1SJung-uk Kim d->bd_direction = bd->bd_direction; 2861560a54e1SJung-uk Kim d->bd_feedback = bd->bd_feedback; 286269f7644bSChristian S.J. Peron d->bd_async = bd->bd_async; 286369f7644bSChristian S.J. Peron d->bd_rcount = bd->bd_rcount; 286469f7644bSChristian S.J. Peron d->bd_dcount = bd->bd_dcount; 286569f7644bSChristian S.J. Peron d->bd_fcount = bd->bd_fcount; 286669f7644bSChristian S.J. Peron d->bd_sig = bd->bd_sig; 286769f7644bSChristian S.J. Peron d->bd_slen = bd->bd_slen; 286869f7644bSChristian S.J. Peron d->bd_hlen = bd->bd_hlen; 286969f7644bSChristian S.J. Peron d->bd_bufsize = bd->bd_bufsize; 287069f7644bSChristian S.J. Peron d->bd_pid = bd->bd_pid; 287169f7644bSChristian S.J. Peron strlcpy(d->bd_ifname, 287269f7644bSChristian S.J. Peron bd->bd_bif->bif_ifp->if_xname, IFNAMSIZ); 287393e39f0bSChristian S.J. Peron d->bd_locked = bd->bd_locked; 28744d621040SChristian S.J. Peron d->bd_wcount = bd->bd_wcount; 28754d621040SChristian S.J. Peron d->bd_wdcount = bd->bd_wdcount; 28764d621040SChristian S.J. Peron d->bd_wfcount = bd->bd_wfcount; 28774d621040SChristian S.J. Peron d->bd_zcopy = bd->bd_zcopy; 28784d621040SChristian S.J. Peron d->bd_bufmode = bd->bd_bufmode; 287969f7644bSChristian S.J. Peron } 288069f7644bSChristian S.J. Peron 28816c74ff0eSAlexander V. Chernikov /* 28826c74ff0eSAlexander V. Chernikov * Handle `netstat -B' stats request 28836c74ff0eSAlexander V. Chernikov */ 288469f7644bSChristian S.J. Peron static int 288569f7644bSChristian S.J. Peron bpf_stats_sysctl(SYSCTL_HANDLER_ARGS) 288669f7644bSChristian S.J. Peron { 28870e1152fcSHans Petter Selasky static const struct xbpf_d zerostats; 28880e1152fcSHans Petter Selasky struct xbpf_d *xbdbuf, *xbd, tempstats; 2889422a63daSChristian S.J. Peron int index, error; 289069f7644bSChristian S.J. Peron struct bpf_if *bp; 289169f7644bSChristian S.J. Peron struct bpf_d *bd; 289269f7644bSChristian S.J. Peron 289369f7644bSChristian S.J. Peron /* 289469f7644bSChristian S.J. Peron * XXX This is not technically correct. It is possible for non 289569f7644bSChristian S.J. Peron * privileged users to open bpf devices. It would make sense 289669f7644bSChristian S.J. Peron * if the users who opened the devices were able to retrieve 289769f7644bSChristian S.J. Peron * the statistics for them, too. 289869f7644bSChristian S.J. Peron */ 2899acd3428bSRobert Watson error = priv_check(req->td, PRIV_NET_BPF); 290069f7644bSChristian S.J. Peron if (error) 290169f7644bSChristian S.J. Peron return (error); 29020e37f3e1SChristian S.J. Peron /* 29030e37f3e1SChristian S.J. Peron * Check to see if the user is requesting that the counters be 29040e37f3e1SChristian S.J. Peron * zeroed out. Explicitly check that the supplied data is zeroed, 29050e37f3e1SChristian S.J. Peron * as we aren't allowing the user to set the counters currently. 29060e37f3e1SChristian S.J. Peron */ 29070e37f3e1SChristian S.J. Peron if (req->newptr != NULL) { 29080e1152fcSHans Petter Selasky if (req->newlen != sizeof(tempstats)) 29090e37f3e1SChristian S.J. Peron return (EINVAL); 29100e1152fcSHans Petter Selasky memset(&tempstats, 0, sizeof(tempstats)); 29110e1152fcSHans Petter Selasky error = SYSCTL_IN(req, &tempstats, sizeof(tempstats)); 29120e1152fcSHans Petter Selasky if (error) 29130e1152fcSHans Petter Selasky return (error); 29140e1152fcSHans Petter Selasky if (bcmp(&tempstats, &zerostats, sizeof(tempstats)) != 0) 29150e37f3e1SChristian S.J. Peron return (EINVAL); 29160e37f3e1SChristian S.J. Peron bpf_zero_counters(); 29170e37f3e1SChristian S.J. Peron return (0); 29180e37f3e1SChristian S.J. Peron } 291969f7644bSChristian S.J. Peron if (req->oldptr == NULL) 2920422a63daSChristian S.J. Peron return (SYSCTL_OUT(req, 0, bpf_bpfd_cnt * sizeof(*xbd))); 292169f7644bSChristian S.J. Peron if (bpf_bpfd_cnt == 0) 292269f7644bSChristian S.J. Peron return (SYSCTL_OUT(req, 0, 0)); 2923422a63daSChristian S.J. Peron xbdbuf = malloc(req->oldlen, M_BPF, M_WAITOK); 2924e4b3229aSAlexander V. Chernikov BPF_LOCK(); 2925422a63daSChristian S.J. Peron if (req->oldlen < (bpf_bpfd_cnt * sizeof(*xbd))) { 2926e4b3229aSAlexander V. Chernikov BPF_UNLOCK(); 2927422a63daSChristian S.J. Peron free(xbdbuf, M_BPF); 2928422a63daSChristian S.J. Peron return (ENOMEM); 2929422a63daSChristian S.J. Peron } 2930422a63daSChristian S.J. Peron index = 0; 293169f7644bSChristian S.J. Peron LIST_FOREACH(bp, &bpf_iflist, bif_next) { 2932e4b3229aSAlexander V. Chernikov BPFIF_RLOCK(bp); 293351ec1eb7SAlexander V. Chernikov /* Send writers-only first */ 293451ec1eb7SAlexander V. Chernikov LIST_FOREACH(bd, &bp->bif_wlist, bd_next) { 293551ec1eb7SAlexander V. Chernikov xbd = &xbdbuf[index++]; 2936afa85850SAlexander V. Chernikov BPFD_LOCK(bd); 293751ec1eb7SAlexander V. Chernikov bpfstats_fill_xbpf(xbd, bd); 2938afa85850SAlexander V. Chernikov BPFD_UNLOCK(bd); 293951ec1eb7SAlexander V. Chernikov } 294069f7644bSChristian S.J. Peron LIST_FOREACH(bd, &bp->bif_dlist, bd_next) { 2941422a63daSChristian S.J. Peron xbd = &xbdbuf[index++]; 2942afa85850SAlexander V. Chernikov BPFD_LOCK(bd); 2943422a63daSChristian S.J. Peron bpfstats_fill_xbpf(xbd, bd); 2944afa85850SAlexander V. Chernikov BPFD_UNLOCK(bd); 294569f7644bSChristian S.J. Peron } 2946e4b3229aSAlexander V. Chernikov BPFIF_RUNLOCK(bp); 294769f7644bSChristian S.J. Peron } 2948e4b3229aSAlexander V. Chernikov BPF_UNLOCK(); 2949422a63daSChristian S.J. Peron error = SYSCTL_OUT(req, xbdbuf, index * sizeof(*xbd)); 2950422a63daSChristian S.J. Peron free(xbdbuf, M_BPF); 295169f7644bSChristian S.J. Peron return (error); 295269f7644bSChristian S.J. Peron } 295369f7644bSChristian S.J. Peron 2954237fdd78SRobert Watson SYSINIT(bpfdev,SI_SUB_DRIVERS,SI_ORDER_MIDDLE,bpf_drvinit,NULL); 295553ac6efbSJulian Elischer 29565bb5f2c9SPeter Wemm #else /* !DEV_BPF && !NETGRAPH_BPF */ 2957f8dc4716SMike Smith /* 2958f8dc4716SMike Smith * NOP stubs to allow bpf-using drivers to load and function. 2959f8dc4716SMike Smith * 2960f8dc4716SMike Smith * A 'better' implementation would allow the core bpf functionality 2961f8dc4716SMike Smith * to be loaded at runtime. 2962f8dc4716SMike Smith */ 29637eae78a4SChristian S.J. Peron static struct bpf_if bp_null; 2964f8dc4716SMike Smith 2965f8dc4716SMike Smith void 296619ba8395SChristian S.J. Peron bpf_tap(struct bpf_if *bp, u_char *pkt, u_int pktlen) 2967f8dc4716SMike Smith { 2968f8dc4716SMike Smith } 2969f8dc4716SMike Smith 2970f8dc4716SMike Smith void 297119ba8395SChristian S.J. Peron bpf_mtap(struct bpf_if *bp, struct mbuf *m) 2972f8dc4716SMike Smith { 2973f8dc4716SMike Smith } 2974f8dc4716SMike Smith 2975f8dc4716SMike Smith void 297619ba8395SChristian S.J. Peron bpf_mtap2(struct bpf_if *bp, void *d, u_int l, struct mbuf *m) 2977437ffe18SSam Leffler { 2978437ffe18SSam Leffler } 2979437ffe18SSam Leffler 2980437ffe18SSam Leffler void 298119ba8395SChristian S.J. Peron bpfattach(struct ifnet *ifp, u_int dlt, u_int hdrlen) 2982f8dc4716SMike Smith { 29837eae78a4SChristian S.J. Peron 29847eae78a4SChristian S.J. Peron bpfattach2(ifp, dlt, hdrlen, &ifp->if_bpf); 2985f8dc4716SMike Smith } 2986f8dc4716SMike Smith 2987da626c17SBill Paul void 298819ba8395SChristian S.J. Peron bpfattach2(struct ifnet *ifp, u_int dlt, u_int hdrlen, struct bpf_if **driverp) 29895f7a7923SSam Leffler { 29907eae78a4SChristian S.J. Peron 29917eae78a4SChristian S.J. Peron *driverp = &bp_null; 29925f7a7923SSam Leffler } 29935f7a7923SSam Leffler 29945f7a7923SSam Leffler void 299519ba8395SChristian S.J. Peron bpfdetach(struct ifnet *ifp) 2996da626c17SBill Paul { 2997da626c17SBill Paul } 2998da626c17SBill Paul 2999f8dc4716SMike Smith u_int 300019ba8395SChristian S.J. Peron bpf_filter(const struct bpf_insn *pc, u_char *p, u_int wirelen, u_int buflen) 3001f8dc4716SMike Smith { 3002f8dc4716SMike Smith return -1; /* "no filter" behaviour */ 3003f8dc4716SMike Smith } 3004f8dc4716SMike Smith 30055bb5f2c9SPeter Wemm int 300619ba8395SChristian S.J. Peron bpf_validate(const struct bpf_insn *f, int len) 30075bb5f2c9SPeter Wemm { 30085bb5f2c9SPeter Wemm return 0; /* false */ 30095bb5f2c9SPeter Wemm } 30105bb5f2c9SPeter Wemm 30115bb5f2c9SPeter Wemm #endif /* !DEV_BPF && !NETGRAPH_BPF */ 301205fc4164SBjoern A. Zeeb 301305fc4164SBjoern A. Zeeb #ifdef DDB 301405fc4164SBjoern A. Zeeb static void 301505fc4164SBjoern A. Zeeb bpf_show_bpf_if(struct bpf_if *bpf_if) 301605fc4164SBjoern A. Zeeb { 301705fc4164SBjoern A. Zeeb 301805fc4164SBjoern A. Zeeb if (bpf_if == NULL) 301905fc4164SBjoern A. Zeeb return; 302005fc4164SBjoern A. Zeeb db_printf("%p:\n", bpf_if); 302105fc4164SBjoern A. Zeeb #define BPF_DB_PRINTF(f, e) db_printf(" %s = " f "\n", #e, bpf_if->e); 302205fc4164SBjoern A. Zeeb /* bif_ext.bif_next */ 302305fc4164SBjoern A. Zeeb /* bif_ext.bif_dlist */ 302405fc4164SBjoern A. Zeeb BPF_DB_PRINTF("%#x", bif_dlt); 302505fc4164SBjoern A. Zeeb BPF_DB_PRINTF("%u", bif_hdrlen); 302605fc4164SBjoern A. Zeeb BPF_DB_PRINTF("%p", bif_ifp); 302705fc4164SBjoern A. Zeeb /* bif_lock */ 302805fc4164SBjoern A. Zeeb /* bif_wlist */ 302905fc4164SBjoern A. Zeeb BPF_DB_PRINTF("%#x", bif_flags); 303005fc4164SBjoern A. Zeeb } 303105fc4164SBjoern A. Zeeb 303205fc4164SBjoern A. Zeeb DB_SHOW_COMMAND(bpf_if, db_show_bpf_if) 303305fc4164SBjoern A. Zeeb { 303405fc4164SBjoern A. Zeeb 303505fc4164SBjoern A. Zeeb if (!have_addr) { 303605fc4164SBjoern A. Zeeb db_printf("usage: show bpf_if <struct bpf_if *>\n"); 303705fc4164SBjoern A. Zeeb return; 303805fc4164SBjoern A. Zeeb } 303905fc4164SBjoern A. Zeeb 304005fc4164SBjoern A. Zeeb bpf_show_bpf_if((struct bpf_if *)addr); 304105fc4164SBjoern A. Zeeb } 304205fc4164SBjoern A. Zeeb #endif 3043