1c398230bSWarner Losh /*- 251369649SPedro F. Giffuni * SPDX-License-Identifier: BSD-3-Clause 351369649SPedro F. Giffuni * 4df8bae1dSRodney W. Grimes * Copyright (c) 1990, 1991, 1993 5253a3814SLawrence Stewart * The Regents of the University of California. All rights reserved. 6df8bae1dSRodney W. Grimes * 7df8bae1dSRodney W. Grimes * This code is derived from the Stanford/CMU enet packet filter, 8df8bae1dSRodney W. Grimes * (net/enet.c) distributed as part of 4.3BSD, and code contributed 9df8bae1dSRodney W. Grimes * to Berkeley by Steven McCanne and Van Jacobson both of Lawrence 10df8bae1dSRodney W. Grimes * Berkeley Laboratory. 11df8bae1dSRodney W. Grimes * 12df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 13df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 14df8bae1dSRodney W. Grimes * are met: 15df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 16df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 17df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 18df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 19df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 20fbbd9655SWarner Losh * 3. Neither the name of the University nor the names of its contributors 21df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 22df8bae1dSRodney W. Grimes * without specific prior written permission. 23df8bae1dSRodney W. Grimes * 24df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 25df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 26df8bae1dSRodney W. 
Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 27df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 28df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 29df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 30df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 31df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 32df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 33df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 34df8bae1dSRodney W. Grimes * SUCH DAMAGE. 35df8bae1dSRodney W. Grimes * 364f252c4dSRuslan Ermilov * @(#)bpf.c 8.4 (Berkeley) 1/9/95 37df8bae1dSRodney W. Grimes */ 38df8bae1dSRodney W. Grimes 39c7866007SRobert Watson #include <sys/cdefs.h> 40c7866007SRobert Watson __FBSDID("$FreeBSD$"); 41c7866007SRobert Watson 425bb5f2c9SPeter Wemm #include "opt_bpf.h" 43fc0a61a4SKonstantin Belousov #include "opt_compat.h" 4405fc4164SBjoern A. Zeeb #include "opt_ddb.h" 455bb5f2c9SPeter Wemm #include "opt_netgraph.h" 46df8bae1dSRodney W. Grimes 4795aab9ccSJohn-Mark Gurney #include <sys/types.h> 48df8bae1dSRodney W. Grimes #include <sys/param.h> 49e4b3229aSAlexander V. Chernikov #include <sys/lock.h> 50e4b3229aSAlexander V. Chernikov #include <sys/rwlock.h> 51df8bae1dSRodney W. Grimes #include <sys/systm.h> 52ce7609a4SBruce Evans #include <sys/conf.h> 53e76eee55SPoul-Henning Kamp #include <sys/fcntl.h> 54ebd8672cSBjoern A. Zeeb #include <sys/jail.h> 554d1d4912SBruce Evans #include <sys/malloc.h> 56df8bae1dSRodney W. Grimes #include <sys/mbuf.h> 57df8bae1dSRodney W. Grimes #include <sys/time.h> 58acd3428bSRobert Watson #include <sys/priv.h> 59df8bae1dSRodney W. 
Grimes #include <sys/proc.h> 600310c19fSBruce Evans #include <sys/signalvar.h> 61528f627fSBruce Evans #include <sys/filio.h> 62528f627fSBruce Evans #include <sys/sockio.h> 63528f627fSBruce Evans #include <sys/ttycom.h> 64e76eee55SPoul-Henning Kamp #include <sys/uio.h> 6574549d4bSWojciech Macek #include <sys/sysent.h> 66df8bae1dSRodney W. Grimes 6795aab9ccSJohn-Mark Gurney #include <sys/event.h> 6895aab9ccSJohn-Mark Gurney #include <sys/file.h> 69243ac7d8SPeter Wemm #include <sys/poll.h> 7095aab9ccSJohn-Mark Gurney #include <sys/proc.h> 71df8bae1dSRodney W. Grimes 72df8bae1dSRodney W. Grimes #include <sys/socket.h> 73df8bae1dSRodney W. Grimes 7405fc4164SBjoern A. Zeeb #ifdef DDB 7505fc4164SBjoern A. Zeeb #include <ddb/ddb.h> 7605fc4164SBjoern A. Zeeb #endif 7705fc4164SBjoern A. Zeeb 78fba9235dSBruce Evans #include <net/if.h> 7976039bc8SGleb Smirnoff #include <net/if_var.h> 804fb3a820SAlexander V. Chernikov #include <net/if_dl.h> 81df8bae1dSRodney W. Grimes #include <net/bpf.h> 824d621040SChristian S.J. Peron #include <net/bpf_buffer.h> 83ae275efcSJung-uk Kim #ifdef BPF_JITTER 84ae275efcSJung-uk Kim #include <net/bpf_jitter.h> 85ae275efcSJung-uk Kim #endif 864d621040SChristian S.J. Peron #include <net/bpf_zerocopy.h> 87df8bae1dSRodney W. Grimes #include <net/bpfdesc.h> 884fb3a820SAlexander V. Chernikov #include <net/route.h> 89530c0060SRobert Watson #include <net/vnet.h> 90df8bae1dSRodney W. Grimes 91df8bae1dSRodney W. Grimes #include <netinet/in.h> 92df8bae1dSRodney W. Grimes #include <netinet/if_ether.h> 93df8bae1dSRodney W. Grimes #include <sys/kernel.h> 94f708ef1bSPoul-Henning Kamp #include <sys/sysctl.h> 957b778b5eSEivind Eklund 96246b5467SSam Leffler #include <net80211/ieee80211_freebsd.h> 97246b5467SSam Leffler 98aed55708SRobert Watson #include <security/mac/mac_framework.h> 99aed55708SRobert Watson 1004d621040SChristian S.J. 
MALLOC_DEFINE(M_BPF, "BPF", "BPF data");

/*
 * One BPF attachment record.  Per the bpf_iflist comment below, each record
 * corresponds to a specific DLT on a network interface.  bif_next and
 * bif_dlist are aliases for fields that live inside the embedded bif_ext.
 */
struct bpf_if {
#define	bif_next	bif_ext.bif_next
#define	bif_dlist	bif_ext.bif_dlist
	struct bpf_if_ext bif_ext;	/* public members */
	u_int		bif_dlt;	/* link layer type */
	u_int		bif_hdrlen;	/* length of link header */
	struct ifnet	*bif_ifp;	/* corresponding interface */
	struct rwlock	bif_lock;	/* interface lock */
	LIST_HEAD(, bpf_d) bif_wlist;	/* writer-only list */
	int		bif_flags;	/* Interface flags */
	struct bpf_if	**bif_bpf;	/* Pointer to pointer to us */
};

/*
 * The public part must be the first member of struct bpf_if.
 * NOTE(review): presumably so that a struct bpf_if pointer can be used as a
 * struct bpf_if_ext pointer by code that only sees the public part - confirm.
 */
CTASSERT(offsetof(struct bpf_if, bif_ext) == 0);

#if defined(DEV_BPF) || defined(NETGRAPH_BPF)

#define PRINET  26			/* interruptible */

/*
 * Number of bytes of a BPF header of the given type up to and including its
 * bh_hdrlen member, i.e. the header size without trailing padding.
 */
#define	SIZEOF_BPF_HDR(type)	\
    (offsetof(type, bh_hdrlen) + sizeof(((type *)0)->bh_hdrlen))

#ifdef COMPAT_FREEBSD32
#include <sys/mount.h>
#include <compat/freebsd32/freebsd32.h>
#define BPF_ALIGNMENT32 sizeof(int32_t)
#define	BPF_WORDALIGN32(x) roundup2(x, BPF_ALIGNMENT32)

#ifndef BURN_BRIDGES
/*
 * 32-bit version of structure prepended to each packet.  We use this header
 * instead of the standard one for 32-bit streams.  We mark a stream as
 * 32-bit the first time we see a 32-bit compat ioctl request.
 */
struct bpf_hdr32 {
	struct timeval32 bh_tstamp;	/* time stamp */
	uint32_t	bh_caplen;	/* length of captured portion */
	uint32_t	bh_datalen;	/* original length of packet */
	uint16_t	bh_hdrlen;	/* length of bpf header (this struct
					   plus alignment padding) */
};
#endif /* !BURN_BRIDGES */

/*
 * 32-bit layout of struct bpf_program: the instruction pointer is carried
 * as a 32-bit integer.
 */
struct bpf_program32 {
	u_int bf_len;
	uint32_t bf_insns;
};

/*
 * 32-bit layout of struct bpf_dltlist: the list pointer is carried as a
 * 32-bit integer.
 */
struct bpf_dltlist32 {
	u_int	bfl_len;
	u_int	bfl_list;
};

/* ioctl request codes as encoded with the 32-bit argument structures. */
#define	BIOCSETF32	_IOW('B', 103, struct bpf_program32)
#define	BIOCSRTIMEOUT32	_IOW('B', 109, struct timeval32)
#define	BIOCGRTIMEOUT32	_IOR('B', 110, struct timeval32)
#define	BIOCGDLTLIST32	_IOWR('B', 121, struct bpf_dltlist32)
#define	BIOCSETWF32	_IOW('B', 123, struct bpf_program32)
#define	BIOCSETFNR32	_IOW('B', 130, struct bpf_program32)
#endif /* COMPAT_FREEBSD32 */

/*
 * bpf_iflist is a list of BPF interface structures, each corresponding to a
 * specific DLT.  The same network interface might have several BPF interface
 * structures registered by different layers in the stack (e.g., 802.11
 * frames, ethernet frames, etc).
 */
static LIST_HEAD(, bpf_if)	bpf_iflist, bpf_freelist;
static struct mtx	bpf_mtx;		/* bpf global lock */
static int		bpf_bpfd_cnt;

/* Forward declarations for file-local functions. */
static void	bpf_attachd(struct bpf_d *, struct bpf_if *);
static void	bpf_detachd(struct bpf_d *);
static void	bpf_detachd_locked(struct bpf_d *);
static void	bpf_freed(struct bpf_d *);
static int	bpf_movein(struct uio *, int, struct ifnet *, struct mbuf **,
		    struct sockaddr *, int *, struct bpf_d *);
static int	bpf_setif(struct bpf_d *, struct ifreq *);
static void	bpf_timed_out(void *);
static __inline void
		bpf_wakeup(struct bpf_d *);
static void	catchpacket(struct bpf_d *, u_char *, u_int, u_int,
		    void (*)(struct bpf_d *, caddr_t, u_int, void *, u_int),
		    struct bintime *);
static void	reset_d(struct bpf_d *);
static int	bpf_setf(struct bpf_d *, struct bpf_program *, u_long cmd);
static int	bpf_getdltlist(struct bpf_d *, struct bpf_dltlist *);
static int	bpf_setdlt(struct bpf_d *, u_int);
static void	filt_bpfdetach(struct knote *);
static int	filt_bpfread(struct knote *, long);
static void	bpf_drvinit(void *);
static int	bpf_stats_sysctl(SYSCTL_HANDLER_ARGS);

/* net.bpf sysctl tree and its tunables. */
SYSCTL_NODE(_net, OID_AUTO, bpf, CTLFLAG_RW, 0, "bpf sysctl");
int bpf_maxinsns = BPF_MAXINSNS;
SYSCTL_INT(_net_bpf, OID_AUTO, maxinsns, CTLFLAG_RW,
    &bpf_maxinsns, 0, "Maximum bpf program instructions");
static int bpf_zerocopy_enable = 0;
SYSCTL_INT(_net_bpf, OID_AUTO, zerocopy_enable, CTLFLAG_RW,
    &bpf_zerocopy_enable, 0, "Enable new zero-copy BPF buffer sessions");
static SYSCTL_NODE(_net_bpf, OID_AUTO, stats, CTLFLAG_MPSAFE | CTLFLAG_RW,
    bpf_stats_sysctl, "bpf statistics portal");

/* Per-vnet knob, exported as net.bpf.optimize_writers. */
static VNET_DEFINE(int, bpf_optimize_writers) = 0;
#define	V_bpf_optimize_writers VNET(bpf_optimize_writers)
SYSCTL_INT(_net_bpf, OID_AUTO, optimize_writers, CTLFLAG_VNET | CTLFLAG_RW,
    &VNET_NAME(bpf_optimize_writers), 0,
    "Do not send packets until BPF program is set");

Chernikov 21187f6c662SJulian Elischer static d_open_t bpfopen; 21287f6c662SJulian Elischer static d_read_t bpfread; 21387f6c662SJulian Elischer static d_write_t bpfwrite; 21487f6c662SJulian Elischer static d_ioctl_t bpfioctl; 215243ac7d8SPeter Wemm static d_poll_t bpfpoll; 21695aab9ccSJohn-Mark Gurney static d_kqfilter_t bpfkqfilter; 21787f6c662SJulian Elischer 2184e2f199eSPoul-Henning Kamp static struct cdevsw bpf_cdevsw = { 219dc08ffecSPoul-Henning Kamp .d_version = D_VERSION, 2207ac40f5fSPoul-Henning Kamp .d_open = bpfopen, 2217ac40f5fSPoul-Henning Kamp .d_read = bpfread, 2227ac40f5fSPoul-Henning Kamp .d_write = bpfwrite, 2237ac40f5fSPoul-Henning Kamp .d_ioctl = bpfioctl, 2247ac40f5fSPoul-Henning Kamp .d_poll = bpfpoll, 2257ac40f5fSPoul-Henning Kamp .d_name = "bpf", 22695aab9ccSJohn-Mark Gurney .d_kqfilter = bpfkqfilter, 2274e2f199eSPoul-Henning Kamp }; 22887f6c662SJulian Elischer 229e76d823bSRobert Watson static struct filterops bpfread_filtops = { 230e76d823bSRobert Watson .f_isfd = 1, 231e76d823bSRobert Watson .f_detach = filt_bpfdetach, 232e76d823bSRobert Watson .f_event = filt_bpfread, 233e76d823bSRobert Watson }; 23487f6c662SJulian Elischer 235afa85850SAlexander V. Chernikov eventhandler_tag bpf_ifdetach_cookie = NULL; 236afa85850SAlexander V. Chernikov 2374d621040SChristian S.J. Peron /* 2386c74ff0eSAlexander V. Chernikov * LOCKING MODEL USED BY BPF: 2396c74ff0eSAlexander V. Chernikov * Locks: 2406c74ff0eSAlexander V. Chernikov * 1) global lock (BPF_LOCK). Mutex, used to protect interface addition/removal, 2416c74ff0eSAlexander V. Chernikov * some global counters and every bpf_if reference. 2426c74ff0eSAlexander V. Chernikov * 2) Interface lock. Rwlock, used to protect list of BPF descriptors and their filters. 243afa85850SAlexander V. Chernikov * 3) Descriptor lock. Mutex, used to protect BPF buffers and various structure fields 2446c74ff0eSAlexander V. Chernikov * used by bpf_mtap code. 2456c74ff0eSAlexander V. Chernikov * 2466c74ff0eSAlexander V. 
Chernikov * Lock order: 2476c74ff0eSAlexander V. Chernikov * 2486c74ff0eSAlexander V. Chernikov * Global lock, interface lock, descriptor lock 2496c74ff0eSAlexander V. Chernikov * 2506c74ff0eSAlexander V. Chernikov * We have to acquire interface lock before descriptor main lock due to BPF_MTAP[2] 2516c74ff0eSAlexander V. Chernikov * working model. In many places (like bpf_detachd) we start with BPF descriptor 2526c74ff0eSAlexander V. Chernikov * (and we need to at least rlock it to get reliable interface pointer). This 2536c74ff0eSAlexander V. Chernikov * gives us potential LOR. As a result, we use global lock to protect from bpf_if 2546c74ff0eSAlexander V. Chernikov * change in every such place. 2556c74ff0eSAlexander V. Chernikov * 2566c74ff0eSAlexander V. Chernikov * Changing d->bd_bif is protected by 1) global lock, 2) interface lock and 2576c74ff0eSAlexander V. Chernikov * 3) descriptor main wlock. 2586c74ff0eSAlexander V. Chernikov * Reading bd_bif can be protected by any of these locks, typically global lock. 2596c74ff0eSAlexander V. Chernikov * 2606c74ff0eSAlexander V. Chernikov * Changing read/write BPF filter is protected by the same three locks, 2616c74ff0eSAlexander V. Chernikov * the same applies for reading. 2626c74ff0eSAlexander V. Chernikov * 2636c74ff0eSAlexander V. Chernikov * Sleeping in global lock is not allowed due to bpfdetach() using it. 2646c74ff0eSAlexander V. Chernikov */ 2656c74ff0eSAlexander V. Chernikov 2666c74ff0eSAlexander V. Chernikov /* 2674d621040SChristian S.J. Peron * Wrapper functions for various buffering methods. If the set of buffer 2684d621040SChristian S.J. Peron * modes expands, we will probably want to introduce a switch data structure 2694d621040SChristian S.J. Peron * similar to protosw, et. 2704d621040SChristian S.J. Peron */ 2714d621040SChristian S.J. Peron static void 2724d621040SChristian S.J. Peron bpf_append_bytes(struct bpf_d *d, caddr_t buf, u_int offset, void *src, 2734d621040SChristian S.J. 
Peron u_int len) 2744d621040SChristian S.J. Peron { 2754d621040SChristian S.J. Peron 276afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 2774d621040SChristian S.J. Peron 2784d621040SChristian S.J. Peron switch (d->bd_bufmode) { 2794d621040SChristian S.J. Peron case BPF_BUFMODE_BUFFER: 2804d621040SChristian S.J. Peron return (bpf_buffer_append_bytes(d, buf, offset, src, len)); 2814d621040SChristian S.J. Peron 2824d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 283*b2b7ca49SAlexander V. Chernikov counter_u64_add(d->bd_zcopy, 1); 2844d621040SChristian S.J. Peron return (bpf_zerocopy_append_bytes(d, buf, offset, src, len)); 2854d621040SChristian S.J. Peron 2864d621040SChristian S.J. Peron default: 2874d621040SChristian S.J. Peron panic("bpf_buf_append_bytes"); 2884d621040SChristian S.J. Peron } 2894d621040SChristian S.J. Peron } 2904d621040SChristian S.J. Peron 2914d621040SChristian S.J. Peron static void 2924d621040SChristian S.J. Peron bpf_append_mbuf(struct bpf_d *d, caddr_t buf, u_int offset, void *src, 2934d621040SChristian S.J. Peron u_int len) 2944d621040SChristian S.J. Peron { 2954d621040SChristian S.J. Peron 296afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 2974d621040SChristian S.J. Peron 2984d621040SChristian S.J. Peron switch (d->bd_bufmode) { 2994d621040SChristian S.J. Peron case BPF_BUFMODE_BUFFER: 3004d621040SChristian S.J. Peron return (bpf_buffer_append_mbuf(d, buf, offset, src, len)); 3014d621040SChristian S.J. Peron 3024d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 303*b2b7ca49SAlexander V. Chernikov counter_u64_add(d->bd_zcopy, 1); 3044d621040SChristian S.J. Peron return (bpf_zerocopy_append_mbuf(d, buf, offset, src, len)); 3054d621040SChristian S.J. Peron 3064d621040SChristian S.J. Peron default: 3074d621040SChristian S.J. Peron panic("bpf_buf_append_mbuf"); 3084d621040SChristian S.J. Peron } 3094d621040SChristian S.J. Peron } 3104d621040SChristian S.J. Peron 3114d621040SChristian S.J. Peron /* 31229f612ecSChristian S.J. 
Peron * This function gets called when the free buffer is re-assigned. 31329f612ecSChristian S.J. Peron */ 31429f612ecSChristian S.J. Peron static void 31529f612ecSChristian S.J. Peron bpf_buf_reclaimed(struct bpf_d *d) 31629f612ecSChristian S.J. Peron { 31729f612ecSChristian S.J. Peron 318afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 31929f612ecSChristian S.J. Peron 32029f612ecSChristian S.J. Peron switch (d->bd_bufmode) { 32129f612ecSChristian S.J. Peron case BPF_BUFMODE_BUFFER: 32229f612ecSChristian S.J. Peron return; 32329f612ecSChristian S.J. Peron 32429f612ecSChristian S.J. Peron case BPF_BUFMODE_ZBUF: 32529f612ecSChristian S.J. Peron bpf_zerocopy_buf_reclaimed(d); 32629f612ecSChristian S.J. Peron return; 32729f612ecSChristian S.J. Peron 32829f612ecSChristian S.J. Peron default: 32929f612ecSChristian S.J. Peron panic("bpf_buf_reclaimed"); 33029f612ecSChristian S.J. Peron } 33129f612ecSChristian S.J. Peron } 33229f612ecSChristian S.J. Peron 33329f612ecSChristian S.J. Peron /* 3344d621040SChristian S.J. Peron * If the buffer mechanism has a way to decide that a held buffer can be made 3354d621040SChristian S.J. Peron * free, then it is exposed via the bpf_canfreebuf() interface. (1) is 3364d621040SChristian S.J. Peron * returned if the buffer can be discarded, (0) is returned if it cannot. 3374d621040SChristian S.J. Peron */ 3384d621040SChristian S.J. Peron static int 3394d621040SChristian S.J. Peron bpf_canfreebuf(struct bpf_d *d) 3404d621040SChristian S.J. Peron { 3414d621040SChristian S.J. Peron 3424d621040SChristian S.J. Peron BPFD_LOCK_ASSERT(d); 3434d621040SChristian S.J. Peron 3444d621040SChristian S.J. Peron switch (d->bd_bufmode) { 3454d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 3464d621040SChristian S.J. Peron return (bpf_zerocopy_canfreebuf(d)); 3474d621040SChristian S.J. Peron } 3484d621040SChristian S.J. Peron return (0); 3494d621040SChristian S.J. Peron } 3504d621040SChristian S.J. 
Peron 351a7a91e65SRobert Watson /* 352a7a91e65SRobert Watson * Allow the buffer model to indicate that the current store buffer is 353a7a91e65SRobert Watson * immutable, regardless of the appearance of space. Return (1) if the 354a7a91e65SRobert Watson * buffer is writable, and (0) if not. 355a7a91e65SRobert Watson */ 356a7a91e65SRobert Watson static int 357a7a91e65SRobert Watson bpf_canwritebuf(struct bpf_d *d) 358a7a91e65SRobert Watson { 359a7a91e65SRobert Watson BPFD_LOCK_ASSERT(d); 360a7a91e65SRobert Watson 361a7a91e65SRobert Watson switch (d->bd_bufmode) { 362a7a91e65SRobert Watson case BPF_BUFMODE_ZBUF: 363a7a91e65SRobert Watson return (bpf_zerocopy_canwritebuf(d)); 364a7a91e65SRobert Watson } 365a7a91e65SRobert Watson return (1); 366a7a91e65SRobert Watson } 367a7a91e65SRobert Watson 368a7a91e65SRobert Watson /* 369a7a91e65SRobert Watson * Notify buffer model that an attempt to write to the store buffer has 370a7a91e65SRobert Watson * resulted in a dropped packet, in which case the buffer may be considered 371a7a91e65SRobert Watson * full. 372a7a91e65SRobert Watson */ 373a7a91e65SRobert Watson static void 374a7a91e65SRobert Watson bpf_buffull(struct bpf_d *d) 375a7a91e65SRobert Watson { 376a7a91e65SRobert Watson 377afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 378a7a91e65SRobert Watson 379a7a91e65SRobert Watson switch (d->bd_bufmode) { 380a7a91e65SRobert Watson case BPF_BUFMODE_ZBUF: 381a7a91e65SRobert Watson bpf_zerocopy_buffull(d); 382a7a91e65SRobert Watson break; 383a7a91e65SRobert Watson } 384a7a91e65SRobert Watson } 385a7a91e65SRobert Watson 386a7a91e65SRobert Watson /* 387a7a91e65SRobert Watson * Notify the buffer model that a buffer has moved into the hold position. 388a7a91e65SRobert Watson */ 3894d621040SChristian S.J. Peron void 3904d621040SChristian S.J. Peron bpf_bufheld(struct bpf_d *d) 3914d621040SChristian S.J. Peron { 3924d621040SChristian S.J. Peron 393afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 3944d621040SChristian S.J. 
Peron 3954d621040SChristian S.J. Peron switch (d->bd_bufmode) { 3964d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 3974d621040SChristian S.J. Peron bpf_zerocopy_bufheld(d); 3984d621040SChristian S.J. Peron break; 3994d621040SChristian S.J. Peron } 4004d621040SChristian S.J. Peron } 4014d621040SChristian S.J. Peron 4024d621040SChristian S.J. Peron static void 4034d621040SChristian S.J. Peron bpf_free(struct bpf_d *d) 4044d621040SChristian S.J. Peron { 4054d621040SChristian S.J. Peron 4064d621040SChristian S.J. Peron switch (d->bd_bufmode) { 4074d621040SChristian S.J. Peron case BPF_BUFMODE_BUFFER: 4084d621040SChristian S.J. Peron return (bpf_buffer_free(d)); 4094d621040SChristian S.J. Peron 4104d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 4114d621040SChristian S.J. Peron return (bpf_zerocopy_free(d)); 4124d621040SChristian S.J. Peron 4134d621040SChristian S.J. Peron default: 4144d621040SChristian S.J. Peron panic("bpf_buf_free"); 4154d621040SChristian S.J. Peron } 4164d621040SChristian S.J. Peron } 4174d621040SChristian S.J. Peron 4184d621040SChristian S.J. Peron static int 4194d621040SChristian S.J. Peron bpf_uiomove(struct bpf_d *d, caddr_t buf, u_int len, struct uio *uio) 4204d621040SChristian S.J. Peron { 4214d621040SChristian S.J. Peron 4224d621040SChristian S.J. Peron if (d->bd_bufmode != BPF_BUFMODE_BUFFER) 4234d621040SChristian S.J. Peron return (EOPNOTSUPP); 4244d621040SChristian S.J. Peron return (bpf_buffer_uiomove(d, buf, len, uio)); 4254d621040SChristian S.J. Peron } 4264d621040SChristian S.J. Peron 4274d621040SChristian S.J. Peron static int 4284d621040SChristian S.J. Peron bpf_ioctl_sblen(struct bpf_d *d, u_int *i) 4294d621040SChristian S.J. Peron { 4304d621040SChristian S.J. Peron 4314d621040SChristian S.J. Peron if (d->bd_bufmode != BPF_BUFMODE_BUFFER) 4324d621040SChristian S.J. Peron return (EOPNOTSUPP); 4334d621040SChristian S.J. Peron return (bpf_buffer_ioctl_sblen(d, i)); 4344d621040SChristian S.J. Peron } 4354d621040SChristian S.J. 
Peron 4364d621040SChristian S.J. Peron static int 4374d621040SChristian S.J. Peron bpf_ioctl_getzmax(struct thread *td, struct bpf_d *d, size_t *i) 4384d621040SChristian S.J. Peron { 4394d621040SChristian S.J. Peron 4404d621040SChristian S.J. Peron if (d->bd_bufmode != BPF_BUFMODE_ZBUF) 4414d621040SChristian S.J. Peron return (EOPNOTSUPP); 4424d621040SChristian S.J. Peron return (bpf_zerocopy_ioctl_getzmax(td, d, i)); 4434d621040SChristian S.J. Peron } 4444d621040SChristian S.J. Peron 4454d621040SChristian S.J. Peron static int 4464d621040SChristian S.J. Peron bpf_ioctl_rotzbuf(struct thread *td, struct bpf_d *d, struct bpf_zbuf *bz) 4474d621040SChristian S.J. Peron { 4484d621040SChristian S.J. Peron 4494d621040SChristian S.J. Peron if (d->bd_bufmode != BPF_BUFMODE_ZBUF) 4504d621040SChristian S.J. Peron return (EOPNOTSUPP); 4514d621040SChristian S.J. Peron return (bpf_zerocopy_ioctl_rotzbuf(td, d, bz)); 4524d621040SChristian S.J. Peron } 4534d621040SChristian S.J. Peron 4544d621040SChristian S.J. Peron static int 4554d621040SChristian S.J. Peron bpf_ioctl_setzbuf(struct thread *td, struct bpf_d *d, struct bpf_zbuf *bz) 4564d621040SChristian S.J. Peron { 4574d621040SChristian S.J. Peron 4584d621040SChristian S.J. Peron if (d->bd_bufmode != BPF_BUFMODE_ZBUF) 4594d621040SChristian S.J. Peron return (EOPNOTSUPP); 4604d621040SChristian S.J. Peron return (bpf_zerocopy_ioctl_setzbuf(td, d, bz)); 4614d621040SChristian S.J. Peron } 4624d621040SChristian S.J. Peron 4634d621040SChristian S.J. Peron /* 4644d621040SChristian S.J. Peron * General BPF functions. 4654d621040SChristian S.J. Peron */ 466df8bae1dSRodney W. Grimes static int 467cb44b6dfSAndrew Thompson bpf_movein(struct uio *uio, int linktype, struct ifnet *ifp, struct mbuf **mp, 4684fb3a820SAlexander V. Chernikov struct sockaddr *sockp, int *hdrlen, struct bpf_d *d) 469df8bae1dSRodney W. 
Grimes { 470246b5467SSam Leffler const struct ieee80211_bpf_params *p; 471cb44b6dfSAndrew Thompson struct ether_header *eh; 472df8bae1dSRodney W. Grimes struct mbuf *m; 473df8bae1dSRodney W. Grimes int error; 474df8bae1dSRodney W. Grimes int len; 475df8bae1dSRodney W. Grimes int hlen; 47693e39f0bSChristian S.J. Peron int slen; 477df8bae1dSRodney W. Grimes 478df8bae1dSRodney W. Grimes /* 479df8bae1dSRodney W. Grimes * Build a sockaddr based on the data link layer type. 480df8bae1dSRodney W. Grimes * We do this at this level because the ethernet header 481df8bae1dSRodney W. Grimes * is copied directly into the data field of the sockaddr. 482df8bae1dSRodney W. Grimes * In the case of SLIP, there is no header and the packet 483df8bae1dSRodney W. Grimes * is forwarded as is. 484df8bae1dSRodney W. Grimes * Also, we are careful to leave room at the front of the mbuf 485df8bae1dSRodney W. Grimes * for the link level header. 486df8bae1dSRodney W. Grimes */ 487df8bae1dSRodney W. Grimes switch (linktype) { 488df8bae1dSRodney W. Grimes 489df8bae1dSRodney W. Grimes case DLT_SLIP: 490df8bae1dSRodney W. Grimes sockp->sa_family = AF_INET; 491df8bae1dSRodney W. Grimes hlen = 0; 492df8bae1dSRodney W. Grimes break; 493df8bae1dSRodney W. Grimes 494df8bae1dSRodney W. Grimes case DLT_EN10MB: 495df8bae1dSRodney W. Grimes sockp->sa_family = AF_UNSPEC; 496df8bae1dSRodney W. Grimes /* XXX Would MAXLINKHDR be better? */ 497797f247bSMatthew N. Dodd hlen = ETHER_HDR_LEN; 498df8bae1dSRodney W. Grimes break; 499df8bae1dSRodney W. Grimes 500df8bae1dSRodney W. Grimes case DLT_FDDI: 501d41f24e7SDavid Greenman sockp->sa_family = AF_IMPLINK; 502d41f24e7SDavid Greenman hlen = 0; 503df8bae1dSRodney W. Grimes break; 504df8bae1dSRodney W. Grimes 50522f05c43SAndrey A. Chernov case DLT_RAW: 506df8bae1dSRodney W. Grimes sockp->sa_family = AF_UNSPEC; 507df8bae1dSRodney W. Grimes hlen = 0; 508df8bae1dSRodney W. Grimes break; 509df8bae1dSRodney W. 
Grimes 51001399f34SDavid Malone case DLT_NULL: 51101399f34SDavid Malone /* 51201399f34SDavid Malone * null interface types require a 4 byte pseudo header which 51301399f34SDavid Malone * corresponds to the address family of the packet. 51401399f34SDavid Malone */ 51501399f34SDavid Malone sockp->sa_family = AF_UNSPEC; 51601399f34SDavid Malone hlen = 4; 51701399f34SDavid Malone break; 51801399f34SDavid Malone 5194f53e3ccSKenjiro Cho case DLT_ATM_RFC1483: 5204f53e3ccSKenjiro Cho /* 5214f53e3ccSKenjiro Cho * en atm driver requires 4-byte atm pseudo header. 5224f53e3ccSKenjiro Cho * though it isn't standard, vpi:vci needs to be 5234f53e3ccSKenjiro Cho * specified anyway. 5244f53e3ccSKenjiro Cho */ 5254f53e3ccSKenjiro Cho sockp->sa_family = AF_UNSPEC; 5264f53e3ccSKenjiro Cho hlen = 12; /* XXX 4(ATM_PH) + 3(LLC) + 5(SNAP) */ 5274f53e3ccSKenjiro Cho break; 5284f53e3ccSKenjiro Cho 52930fa52a6SBrian Somers case DLT_PPP: 53030fa52a6SBrian Somers sockp->sa_family = AF_UNSPEC; 53130fa52a6SBrian Somers hlen = 4; /* This should match PPP_HDRLEN */ 53230fa52a6SBrian Somers break; 53330fa52a6SBrian Somers 534246b5467SSam Leffler case DLT_IEEE802_11: /* IEEE 802.11 wireless */ 535246b5467SSam Leffler sockp->sa_family = AF_IEEE80211; 536246b5467SSam Leffler hlen = 0; 537246b5467SSam Leffler break; 538246b5467SSam Leffler 539246b5467SSam Leffler case DLT_IEEE802_11_RADIO: /* IEEE 802.11 wireless w/ phy params */ 540246b5467SSam Leffler sockp->sa_family = AF_IEEE80211; 541246b5467SSam Leffler sockp->sa_len = 12; /* XXX != 0 */ 542246b5467SSam Leffler hlen = sizeof(struct ieee80211_bpf_params); 543246b5467SSam Leffler break; 544246b5467SSam Leffler 545df8bae1dSRodney W. Grimes default: 546df8bae1dSRodney W. Grimes return (EIO); 547df8bae1dSRodney W. Grimes } 548df8bae1dSRodney W. Grimes 549df8bae1dSRodney W. 
Grimes len = uio->uio_resid; 550ed63043bSGleb Smirnoff if (len < hlen || len - hlen > ifp->if_mtu) 55101399f34SDavid Malone return (EMSGSIZE); 55201399f34SDavid Malone 55341a7572bSGleb Smirnoff m = m_get2(len, M_WAITOK, MT_DATA, M_PKTHDR); 554ed63043bSGleb Smirnoff if (m == NULL) 555df8bae1dSRodney W. Grimes return (EIO); 556963e4c2aSGarrett Wollman m->m_pkthdr.len = m->m_len = len; 557df8bae1dSRodney W. Grimes *mp = m; 55824a229f4SSam Leffler 55993e39f0bSChristian S.J. Peron error = uiomove(mtod(m, u_char *), len, uio); 56093e39f0bSChristian S.J. Peron if (error) 56193e39f0bSChristian S.J. Peron goto bad; 56293e39f0bSChristian S.J. Peron 5634fb3a820SAlexander V. Chernikov slen = bpf_filter(d->bd_wfilter, mtod(m, u_char *), len, len); 56493e39f0bSChristian S.J. Peron if (slen == 0) { 56593e39f0bSChristian S.J. Peron error = EPERM; 56693e39f0bSChristian S.J. Peron goto bad; 56793e39f0bSChristian S.J. Peron } 56893e39f0bSChristian S.J. Peron 569cb44b6dfSAndrew Thompson /* Check for multicast destination */ 570cb44b6dfSAndrew Thompson switch (linktype) { 571cb44b6dfSAndrew Thompson case DLT_EN10MB: 572cb44b6dfSAndrew Thompson eh = mtod(m, struct ether_header *); 573cb44b6dfSAndrew Thompson if (ETHER_IS_MULTICAST(eh->ether_dhost)) { 574cb44b6dfSAndrew Thompson if (bcmp(ifp->if_broadcastaddr, eh->ether_dhost, 575cb44b6dfSAndrew Thompson ETHER_ADDR_LEN) == 0) 576cb44b6dfSAndrew Thompson m->m_flags |= M_BCAST; 577cb44b6dfSAndrew Thompson else 578cb44b6dfSAndrew Thompson m->m_flags |= M_MCAST; 579cb44b6dfSAndrew Thompson } 5804fb3a820SAlexander V. Chernikov if (d->bd_hdrcmplt == 0) { 5814fb3a820SAlexander V. Chernikov memcpy(eh->ether_shost, IF_LLADDR(ifp), 5824fb3a820SAlexander V. Chernikov sizeof(eh->ether_shost)); 5834fb3a820SAlexander V. Chernikov } 584cb44b6dfSAndrew Thompson break; 585cb44b6dfSAndrew Thompson } 586cb44b6dfSAndrew Thompson 587df8bae1dSRodney W. Grimes /* 58893e39f0bSChristian S.J. 
Peron * Make room for link header, and copy it to sockaddr 589df8bae1dSRodney W. Grimes */ 590df8bae1dSRodney W. Grimes if (hlen != 0) { 591246b5467SSam Leffler if (sockp->sa_family == AF_IEEE80211) { 592246b5467SSam Leffler /* 593246b5467SSam Leffler * Collect true length from the parameter header 594246b5467SSam Leffler * NB: sockp is known to be zero'd so if we do a 595246b5467SSam Leffler * short copy unspecified parameters will be 596246b5467SSam Leffler * zero. 597246b5467SSam Leffler * NB: packet may not be aligned after stripping 598246b5467SSam Leffler * bpf params 599246b5467SSam Leffler * XXX check ibp_vers 600246b5467SSam Leffler */ 601246b5467SSam Leffler p = mtod(m, const struct ieee80211_bpf_params *); 602246b5467SSam Leffler hlen = p->ibp_len; 603246b5467SSam Leffler if (hlen > sizeof(sockp->sa_data)) { 604246b5467SSam Leffler error = EINVAL; 605246b5467SSam Leffler goto bad; 606246b5467SSam Leffler } 607246b5467SSam Leffler } 608a09968c4SAdrian Chadd bcopy(mtod(m, const void *), sockp->sa_data, hlen); 609df8bae1dSRodney W. Grimes } 610560a54e1SJung-uk Kim *hdrlen = hlen; 61193e39f0bSChristian S.J. Peron 612df8bae1dSRodney W. Grimes return (0); 613df8bae1dSRodney W. Grimes bad: 614df8bae1dSRodney W. Grimes m_freem(m); 615df8bae1dSRodney W. Grimes return (error); 616df8bae1dSRodney W. Grimes } 617df8bae1dSRodney W. Grimes 618df8bae1dSRodney W. Grimes /* 619df8bae1dSRodney W. Grimes * Attach file to the bpf interface, i.e. make d listen on bp. 620df8bae1dSRodney W. Grimes */ 621df8bae1dSRodney W. Grimes static void 62219ba8395SChristian S.J. Peron bpf_attachd(struct bpf_d *d, struct bpf_if *bp) 623df8bae1dSRodney W. Grimes { 6246c74ff0eSAlexander V. Chernikov int op_w; 6256c74ff0eSAlexander V. Chernikov 6266c74ff0eSAlexander V. Chernikov BPF_LOCK_ASSERT(); 6276c74ff0eSAlexander V. Chernikov 6286c74ff0eSAlexander V. Chernikov /* 6296c74ff0eSAlexander V. Chernikov * Save sysctl value to protect from sysctl change 6306c74ff0eSAlexander V. 
Chernikov * between reads 6316c74ff0eSAlexander V. Chernikov */ 63271448753SAlexander Motin op_w = V_bpf_optimize_writers || d->bd_writer; 6336c74ff0eSAlexander V. Chernikov 6346c74ff0eSAlexander V. Chernikov if (d->bd_bif != NULL) 6356c74ff0eSAlexander V. Chernikov bpf_detachd_locked(d); 636df8bae1dSRodney W. Grimes /* 63751ec1eb7SAlexander V. Chernikov * Point d at bp, and add d to the interface's list. 638f87e372eSLuiz Otavio O Souza * Since there are many applications using BPF for 63951ec1eb7SAlexander V. Chernikov * sending raw packets only (dhcpd, cdpd are good examples) 64051ec1eb7SAlexander V. Chernikov * we can delay adding d to the list of active listeners until 64151ec1eb7SAlexander V. Chernikov * some filter is configured. 642df8bae1dSRodney W. Grimes */ 64351ec1eb7SAlexander V. Chernikov 64451ec1eb7SAlexander V. Chernikov BPFIF_WLOCK(bp); 645afa85850SAlexander V. Chernikov BPFD_LOCK(d); 64651ec1eb7SAlexander V. Chernikov 6476c74ff0eSAlexander V. Chernikov d->bd_bif = bp; 6486c74ff0eSAlexander V. Chernikov 6496c74ff0eSAlexander V. Chernikov if (op_w != 0) { 65051ec1eb7SAlexander V. Chernikov /* Add to writers-only list */ 65151ec1eb7SAlexander V. Chernikov LIST_INSERT_HEAD(&bp->bif_wlist, d, bd_next); 65251ec1eb7SAlexander V. Chernikov /* 65351ec1eb7SAlexander V. Chernikov * We decrement bd_writer on every filter set operation. 65451ec1eb7SAlexander V. Chernikov * First BIOCSETF is done by pcap_open_live() to set up 65551ec1eb7SAlexander V. Chernikov * snap length. After that appliation usually sets its own filter 65651ec1eb7SAlexander V. Chernikov */ 65751ec1eb7SAlexander V. Chernikov d->bd_writer = 2; 65851ec1eb7SAlexander V. Chernikov } else 6594a3feeaaSRobert Watson LIST_INSERT_HEAD(&bp->bif_dlist, d, bd_next); 660df8bae1dSRodney W. Grimes 661afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 662e4b3229aSAlexander V. Chernikov BPFIF_WUNLOCK(bp); 663b743c310SSam Leffler 66451ec1eb7SAlexander V. Chernikov bpf_bpfd_cnt++; 66551ec1eb7SAlexander V. 
Chernikov 66651ec1eb7SAlexander V. Chernikov CTR3(KTR_NET, "%s: bpf_attach called by pid %d, adding to %s list", 66751ec1eb7SAlexander V. Chernikov __func__, d->bd_pid, d->bd_writer ? "writer" : "active"); 66851ec1eb7SAlexander V. Chernikov 6696c74ff0eSAlexander V. Chernikov if (op_w == 0) 67051ec1eb7SAlexander V. Chernikov EVENTHANDLER_INVOKE(bpf_track, bp->bif_ifp, bp->bif_dlt, 1); 67151ec1eb7SAlexander V. Chernikov } 67251ec1eb7SAlexander V. Chernikov 67351ec1eb7SAlexander V. Chernikov /* 674402000ffSAlexander V. Chernikov * Check if we need to upgrade our descriptor @d from write-only mode. 675402000ffSAlexander V. Chernikov */ 676402000ffSAlexander V. Chernikov static int 677402000ffSAlexander V. Chernikov bpf_check_upgrade(u_long cmd, struct bpf_d *d, struct bpf_insn *fcode, int flen) 678402000ffSAlexander V. Chernikov { 679402000ffSAlexander V. Chernikov int is_snap, need_upgrade; 680402000ffSAlexander V. Chernikov 681402000ffSAlexander V. Chernikov /* 682402000ffSAlexander V. Chernikov * Check if we've already upgraded or new filter is empty. 683402000ffSAlexander V. Chernikov */ 684402000ffSAlexander V. Chernikov if (d->bd_writer == 0 || fcode == NULL) 685402000ffSAlexander V. Chernikov return (0); 686402000ffSAlexander V. Chernikov 687402000ffSAlexander V. Chernikov need_upgrade = 0; 688402000ffSAlexander V. Chernikov 689402000ffSAlexander V. Chernikov /* 690402000ffSAlexander V. Chernikov * Check if cmd looks like snaplen setting from 691402000ffSAlexander V. Chernikov * pcap_bpf.c:pcap_open_live(). 692402000ffSAlexander V. Chernikov * Note we're not checking .k value here: 693caa7e52fSEitan Adler * while pcap_open_live() definitely sets to non-zero value, 694402000ffSAlexander V. Chernikov * we'd prefer to treat k=0 (deny ALL) case the same way: e.g. 695402000ffSAlexander V. Chernikov * do not consider upgrading immediately 696402000ffSAlexander V. Chernikov */ 697402000ffSAlexander V. 
Chernikov if (cmd == BIOCSETF && flen == 1 && fcode[0].code == (BPF_RET | BPF_K)) 698402000ffSAlexander V. Chernikov is_snap = 1; 699402000ffSAlexander V. Chernikov else 700402000ffSAlexander V. Chernikov is_snap = 0; 701402000ffSAlexander V. Chernikov 702402000ffSAlexander V. Chernikov if (is_snap == 0) { 703402000ffSAlexander V. Chernikov /* 704402000ffSAlexander V. Chernikov * We're setting first filter and it doesn't look like 705402000ffSAlexander V. Chernikov * setting snaplen. We're probably using bpf directly. 706402000ffSAlexander V. Chernikov * Upgrade immediately. 707402000ffSAlexander V. Chernikov */ 708402000ffSAlexander V. Chernikov need_upgrade = 1; 709402000ffSAlexander V. Chernikov } else { 710402000ffSAlexander V. Chernikov /* 711402000ffSAlexander V. Chernikov * Do not require upgrade by first BIOCSETF 712402000ffSAlexander V. Chernikov * (used to set snaplen) by pcap_open_live(). 713402000ffSAlexander V. Chernikov */ 714402000ffSAlexander V. Chernikov 715402000ffSAlexander V. Chernikov if (--d->bd_writer == 0) { 716402000ffSAlexander V. Chernikov /* 717402000ffSAlexander V. Chernikov * First snaplen filter has already 718402000ffSAlexander V. Chernikov * been set. This is probably catch-all 719402000ffSAlexander V. Chernikov * filter 720402000ffSAlexander V. Chernikov */ 721402000ffSAlexander V. Chernikov need_upgrade = 1; 722402000ffSAlexander V. Chernikov } 723402000ffSAlexander V. Chernikov } 724402000ffSAlexander V. Chernikov 725402000ffSAlexander V. Chernikov CTR5(KTR_NET, 726402000ffSAlexander V. Chernikov "%s: filter function set by pid %d, " 727402000ffSAlexander V. Chernikov "bd_writer counter %d, snap %d upgrade %d", 728402000ffSAlexander V. Chernikov __func__, d->bd_pid, d->bd_writer, 729402000ffSAlexander V. Chernikov is_snap, need_upgrade); 730402000ffSAlexander V. Chernikov 731402000ffSAlexander V. Chernikov return (need_upgrade); 732402000ffSAlexander V. Chernikov } 733402000ffSAlexander V. Chernikov 734402000ffSAlexander V. 
Chernikov /* 73551ec1eb7SAlexander V. Chernikov * Add d to the list of active bp filters. 736f87e372eSLuiz Otavio O Souza * Requires bpf_attachd() to be called before. 73751ec1eb7SAlexander V. Chernikov */ 73851ec1eb7SAlexander V. Chernikov static void 73951ec1eb7SAlexander V. Chernikov bpf_upgraded(struct bpf_d *d) 74051ec1eb7SAlexander V. Chernikov { 74151ec1eb7SAlexander V. Chernikov struct bpf_if *bp; 74251ec1eb7SAlexander V. Chernikov 7436c74ff0eSAlexander V. Chernikov BPF_LOCK_ASSERT(); 7446c74ff0eSAlexander V. Chernikov 74551ec1eb7SAlexander V. Chernikov bp = d->bd_bif; 74651ec1eb7SAlexander V. Chernikov 7476c74ff0eSAlexander V. Chernikov /* 7486c74ff0eSAlexander V. Chernikov * Filter can be set several times without specifying interface. 7496c74ff0eSAlexander V. Chernikov * Mark d as reader and exit. 7506c74ff0eSAlexander V. Chernikov */ 7516c74ff0eSAlexander V. Chernikov if (bp == NULL) { 752afa85850SAlexander V. Chernikov BPFD_LOCK(d); 7536c74ff0eSAlexander V. Chernikov d->bd_writer = 0; 754afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 7556c74ff0eSAlexander V. Chernikov return; 7566c74ff0eSAlexander V. Chernikov } 7576c74ff0eSAlexander V. Chernikov 75851ec1eb7SAlexander V. Chernikov BPFIF_WLOCK(bp); 759afa85850SAlexander V. Chernikov BPFD_LOCK(d); 76051ec1eb7SAlexander V. Chernikov 76151ec1eb7SAlexander V. Chernikov /* Remove from writers-only list */ 76251ec1eb7SAlexander V. Chernikov LIST_REMOVE(d, bd_next); 76351ec1eb7SAlexander V. Chernikov LIST_INSERT_HEAD(&bp->bif_dlist, d, bd_next); 76451ec1eb7SAlexander V. Chernikov /* Mark d as reader */ 76551ec1eb7SAlexander V. Chernikov d->bd_writer = 0; 76651ec1eb7SAlexander V. Chernikov 767afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 76851ec1eb7SAlexander V. Chernikov BPFIF_WUNLOCK(bp); 76951ec1eb7SAlexander V. Chernikov 77051ec1eb7SAlexander V. Chernikov CTR2(KTR_NET, "%s: upgrade required by pid %d", __func__, d->bd_pid); 77151ec1eb7SAlexander V. 
Chernikov 7725ce8d970SSam Leffler EVENTHANDLER_INVOKE(bpf_track, bp->bif_ifp, bp->bif_dlt, 1); 773df8bae1dSRodney W. Grimes } 774df8bae1dSRodney W. Grimes 775df8bae1dSRodney W. Grimes /* 776df8bae1dSRodney W. Grimes * Detach a file from its interface. 777df8bae1dSRodney W. Grimes */ 778df8bae1dSRodney W. Grimes static void 77919ba8395SChristian S.J. Peron bpf_detachd(struct bpf_d *d) 780df8bae1dSRodney W. Grimes { 7816c74ff0eSAlexander V. Chernikov BPF_LOCK(); 7826c74ff0eSAlexander V. Chernikov bpf_detachd_locked(d); 7836c74ff0eSAlexander V. Chernikov BPF_UNLOCK(); 7846c74ff0eSAlexander V. Chernikov } 7856c74ff0eSAlexander V. Chernikov 7866c74ff0eSAlexander V. Chernikov static void 7876c74ff0eSAlexander V. Chernikov bpf_detachd_locked(struct bpf_d *d) 7886c74ff0eSAlexander V. Chernikov { 7896e891d64SPoul-Henning Kamp int error; 790df8bae1dSRodney W. Grimes struct bpf_if *bp; 79146448b5aSRobert Watson struct ifnet *ifp; 792df8bae1dSRodney W. Grimes 79351ec1eb7SAlexander V. Chernikov CTR2(KTR_NET, "%s: detach required by pid %d", __func__, d->bd_pid); 79451ec1eb7SAlexander V. Chernikov 795e4b3229aSAlexander V. Chernikov BPF_LOCK_ASSERT(); 796e4b3229aSAlexander V. Chernikov 7976c74ff0eSAlexander V. Chernikov /* Check if descriptor is attached */ 7986c74ff0eSAlexander V. Chernikov if ((bp = d->bd_bif) == NULL) 7996c74ff0eSAlexander V. Chernikov return; 8006c74ff0eSAlexander V. Chernikov 801e4b3229aSAlexander V. Chernikov BPFIF_WLOCK(bp); 802afa85850SAlexander V. Chernikov BPFD_LOCK(d); 80346448b5aSRobert Watson 80451ec1eb7SAlexander V. Chernikov /* Save bd_writer value */ 80551ec1eb7SAlexander V. Chernikov error = d->bd_writer; 80651ec1eb7SAlexander V. Chernikov 80746448b5aSRobert Watson /* 80846448b5aSRobert Watson * Remove d from the interface's descriptor list. 80946448b5aSRobert Watson */ 81046448b5aSRobert Watson LIST_REMOVE(d, bd_next); 81146448b5aSRobert Watson 812e4b3229aSAlexander V. 
Chernikov ifp = bp->bif_ifp; 813572bde2aSRobert Watson d->bd_bif = NULL; 814afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 815e4b3229aSAlexander V. Chernikov BPFIF_WUNLOCK(bp); 816e4b3229aSAlexander V. Chernikov 817e4b3229aSAlexander V. Chernikov bpf_bpfd_cnt--; 81846448b5aSRobert Watson 81951ec1eb7SAlexander V. Chernikov /* Call event handler iff d is attached */ 82051ec1eb7SAlexander V. Chernikov if (error == 0) 8215ce8d970SSam Leffler EVENTHANDLER_INVOKE(bpf_track, ifp, bp->bif_dlt, 0); 822b743c310SSam Leffler 823df8bae1dSRodney W. Grimes /* 824df8bae1dSRodney W. Grimes * Check if this descriptor had requested promiscuous mode. 825df8bae1dSRodney W. Grimes * If so, turn it off. 826df8bae1dSRodney W. Grimes */ 827df8bae1dSRodney W. Grimes if (d->bd_promisc) { 828df8bae1dSRodney W. Grimes d->bd_promisc = 0; 82997021c24SMarko Zec CURVNET_SET(ifp->if_vnet); 83046448b5aSRobert Watson error = ifpromisc(ifp, 0); 83197021c24SMarko Zec CURVNET_RESTORE(); 8326e891d64SPoul-Henning Kamp if (error != 0 && error != ENXIO) { 833df8bae1dSRodney W. Grimes /* 8346e891d64SPoul-Henning Kamp * ENXIO can happen if a pccard is unplugged 835df8bae1dSRodney W. Grimes * Something is really wrong if we were able to put 836df8bae1dSRodney W. Grimes * the driver into promiscuous mode, but can't 837df8bae1dSRodney W. Grimes * take it out. 838df8bae1dSRodney W. Grimes */ 8398eab61f3SSam Leffler if_printf(bp->bif_ifp, 8408eab61f3SSam Leffler "bpf_detach: ifpromisc failed (%d)\n", error); 8416e891d64SPoul-Henning Kamp } 842df8bae1dSRodney W. Grimes } 843df8bae1dSRodney W. Grimes } 844df8bae1dSRodney W. Grimes 845df8bae1dSRodney W. Grimes /* 846136600feSEd Schouten * Close the descriptor by detaching it from its interface, 847136600feSEd Schouten * deallocating its buffers, and marking it free. 
848136600feSEd Schouten */ 849136600feSEd Schouten static void 850136600feSEd Schouten bpf_dtor(void *data) 851136600feSEd Schouten { 852136600feSEd Schouten struct bpf_d *d = data; 853136600feSEd Schouten 854afa85850SAlexander V. Chernikov BPFD_LOCK(d); 855136600feSEd Schouten if (d->bd_state == BPF_WAITING) 856136600feSEd Schouten callout_stop(&d->bd_callout); 857136600feSEd Schouten d->bd_state = BPF_IDLE; 858afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 859136600feSEd Schouten funsetown(&d->bd_sigio); 860136600feSEd Schouten bpf_detachd(d); 861136600feSEd Schouten #ifdef MAC 862136600feSEd Schouten mac_bpfdesc_destroy(d); 863136600feSEd Schouten #endif /* MAC */ 8646aba400aSAttilio Rao seldrain(&d->bd_sel); 865136600feSEd Schouten knlist_destroy(&d->bd_sel.si_note); 8669fee1bd1SJung-uk Kim callout_drain(&d->bd_callout); 867136600feSEd Schouten bpf_freed(d); 868136600feSEd Schouten free(d, M_BPF); 869136600feSEd Schouten } 870136600feSEd Schouten 871136600feSEd Schouten /* 872df8bae1dSRodney W. Grimes * Open ethernet device. Returns ENXIO for illegal minor device number, 873df8bae1dSRodney W. Grimes * EBUSY if file is open by another process. 874df8bae1dSRodney W. Grimes */ 875df8bae1dSRodney W. Grimes /* ARGSUSED */ 87687f6c662SJulian Elischer static int 87719ba8395SChristian S.J. Peron bpfopen(struct cdev *dev, int flags, int fmt, struct thread *td) 878df8bae1dSRodney W. Grimes { 879e7bb21b3SJonathan Lemon struct bpf_d *d; 8804f42daa4SLuiz Otavio O Souza int error; 881df8bae1dSRodney W. Grimes 8821ede983cSDag-Erling Smørgrav d = malloc(sizeof(*d), M_BPF, M_WAITOK | M_ZERO); 883136600feSEd Schouten error = devfs_set_cdevpriv(d, bpf_dtor); 884136600feSEd Schouten if (error != 0) { 885136600feSEd Schouten free(d, M_BPF); 886136600feSEd Schouten return (error); 887136600feSEd Schouten } 8884d621040SChristian S.J. Peron 889*b2b7ca49SAlexander V. Chernikov /* Setup counters */ 890*b2b7ca49SAlexander V. 
Chernikov d->bd_rcount = counter_u64_alloc(M_WAITOK); 891*b2b7ca49SAlexander V. Chernikov d->bd_dcount = counter_u64_alloc(M_WAITOK); 892*b2b7ca49SAlexander V. Chernikov d->bd_fcount = counter_u64_alloc(M_WAITOK); 893*b2b7ca49SAlexander V. Chernikov d->bd_wcount = counter_u64_alloc(M_WAITOK); 894*b2b7ca49SAlexander V. Chernikov d->bd_wfcount = counter_u64_alloc(M_WAITOK); 895*b2b7ca49SAlexander V. Chernikov d->bd_wdcount = counter_u64_alloc(M_WAITOK); 896*b2b7ca49SAlexander V. Chernikov d->bd_zcopy = counter_u64_alloc(M_WAITOK); 897*b2b7ca49SAlexander V. Chernikov 8984d621040SChristian S.J. Peron /* 8994d621040SChristian S.J. Peron * For historical reasons, perform a one-time initialization call to 9004d621040SChristian S.J. Peron * the buffer routines, even though we're not yet committed to a 9014d621040SChristian S.J. Peron * particular buffer method. 9024d621040SChristian S.J. Peron */ 9034d621040SChristian S.J. Peron bpf_buffer_init(d); 90471448753SAlexander Motin if ((flags & FREAD) == 0) 90571448753SAlexander Motin d->bd_writer = 2; 9063b3b91e7SGuy Helmer d->bd_hbuf_in_use = 0; 9074d621040SChristian S.J. Peron d->bd_bufmode = BPF_BUFMODE_BUFFER; 90800a83887SPaul Traina d->bd_sig = SIGIO; 909560a54e1SJung-uk Kim d->bd_direction = BPF_D_INOUT; 910e4b3229aSAlexander V. Chernikov BPF_PID_REFRESH(d, td); 91182f4445dSRobert Watson #ifdef MAC 91230d239bcSRobert Watson mac_bpfdesc_init(d); 91330d239bcSRobert Watson mac_bpfdesc_create(td->td_ucred, d); 91482f4445dSRobert Watson #endif 915afa85850SAlexander V. Chernikov mtx_init(&d->bd_lock, devtoname(dev), "bpf cdev lock", MTX_DEF); 916afa85850SAlexander V. Chernikov callout_init_mtx(&d->bd_callout, &d->bd_lock, 0); 917afa85850SAlexander V. Chernikov knlist_init_mtx(&d->bd_sel.si_note, &d->bd_lock); 918df8bae1dSRodney W. Grimes 919df8bae1dSRodney W. Grimes return (0); 920df8bae1dSRodney W. Grimes } 921df8bae1dSRodney W. Grimes 922df8bae1dSRodney W. Grimes /* 923df8bae1dSRodney W. 
Grimes * bpfread - read next chunk of packets from buffers 924df8bae1dSRodney W. Grimes */ 92587f6c662SJulian Elischer static int 92619ba8395SChristian S.J. Peron bpfread(struct cdev *dev, struct uio *uio, int ioflag) 927df8bae1dSRodney W. Grimes { 928136600feSEd Schouten struct bpf_d *d; 929df8bae1dSRodney W. Grimes int error; 9308df67d77SJung-uk Kim int non_block; 9318df67d77SJung-uk Kim int timed_out; 932df8bae1dSRodney W. Grimes 933136600feSEd Schouten error = devfs_get_cdevpriv((void **)&d); 934136600feSEd Schouten if (error != 0) 935136600feSEd Schouten return (error); 936136600feSEd Schouten 937df8bae1dSRodney W. Grimes /* 938df8bae1dSRodney W. Grimes * Restrict application to use a buffer the same size as 939df8bae1dSRodney W. Grimes * as kernel buffers. 940df8bae1dSRodney W. Grimes */ 941df8bae1dSRodney W. Grimes if (uio->uio_resid != d->bd_bufsize) 942df8bae1dSRodney W. Grimes return (EINVAL); 943df8bae1dSRodney W. Grimes 9448df67d77SJung-uk Kim non_block = ((ioflag & O_NONBLOCK) != 0); 9458df67d77SJung-uk Kim 946afa85850SAlexander V. Chernikov BPFD_LOCK(d); 947e4b3229aSAlexander V. Chernikov BPF_PID_REFRESH_CUR(d); 9484d621040SChristian S.J. Peron if (d->bd_bufmode != BPF_BUFMODE_BUFFER) { 949afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 9504d621040SChristian S.J. Peron return (EOPNOTSUPP); 9514d621040SChristian S.J. Peron } 95281bda851SJohn Polstra if (d->bd_state == BPF_WAITING) 95381bda851SJohn Polstra callout_stop(&d->bd_callout); 95481bda851SJohn Polstra timed_out = (d->bd_state == BPF_TIMED_OUT); 95581bda851SJohn Polstra d->bd_state = BPF_IDLE; 956d013d902SGuy Helmer while (d->bd_hbuf_in_use) { 957d013d902SGuy Helmer error = mtx_sleep(&d->bd_hbuf_in_use, &d->bd_lock, 9583b3b91e7SGuy Helmer PRINET|PCATCH, "bd_hbuf", 0); 959d013d902SGuy Helmer if (error != 0) { 960d013d902SGuy Helmer BPFD_UNLOCK(d); 961d013d902SGuy Helmer return (error); 962d013d902SGuy Helmer } 963d013d902SGuy Helmer } 964df8bae1dSRodney W. Grimes /* 965df8bae1dSRodney W. 
Grimes * If the hold buffer is empty, then do a timed sleep, which 966df8bae1dSRodney W. Grimes * ends when the timeout expires or when enough packets 967df8bae1dSRodney W. Grimes * have arrived to fill the store buffer. 968df8bae1dSRodney W. Grimes */ 969572bde2aSRobert Watson while (d->bd_hbuf == NULL) { 9708df67d77SJung-uk Kim if (d->bd_slen != 0) { 971df8bae1dSRodney W. Grimes /* 972df8bae1dSRodney W. Grimes * A packet(s) either arrived since the previous 973df8bae1dSRodney W. Grimes * read or arrived while we were asleep. 9748df67d77SJung-uk Kim */ 9758df67d77SJung-uk Kim if (d->bd_immediate || non_block || timed_out) { 9768df67d77SJung-uk Kim /* 9778df67d77SJung-uk Kim * Rotate the buffers and return what's here 9788df67d77SJung-uk Kim * if we are in immediate mode, non-blocking 9798df67d77SJung-uk Kim * flag is set, or this descriptor timed out. 980df8bae1dSRodney W. Grimes */ 981df8bae1dSRodney W. Grimes ROTATE_BUFFERS(d); 982df8bae1dSRodney W. Grimes break; 983df8bae1dSRodney W. Grimes } 9848df67d77SJung-uk Kim } 985de5d9935SRobert Watson 986de5d9935SRobert Watson /* 987de5d9935SRobert Watson * No data is available, check to see if the bpf device 988de5d9935SRobert Watson * is still pointed at a real interface. If not, return 989de5d9935SRobert Watson * ENXIO so that the userland process knows to rebind 990de5d9935SRobert Watson * it before using it again. 991de5d9935SRobert Watson */ 992de5d9935SRobert Watson if (d->bd_bif == NULL) { 993afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 994de5d9935SRobert Watson return (ENXIO); 995de5d9935SRobert Watson } 996de5d9935SRobert Watson 9978df67d77SJung-uk Kim if (non_block) { 998afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 999fba3cfdeSJohn Polstra return (EWOULDBLOCK); 1000fba3cfdeSJohn Polstra } 1001afa85850SAlexander V. Chernikov error = msleep(d, &d->bd_lock, PRINET|PCATCH, 1002e7bb21b3SJonathan Lemon "bpf", d->bd_rtout); 1003df8bae1dSRodney W. 
Grimes if (error == EINTR || error == ERESTART) { 1004afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 1005df8bae1dSRodney W. Grimes return (error); 1006df8bae1dSRodney W. Grimes } 1007df8bae1dSRodney W. Grimes if (error == EWOULDBLOCK) { 1008df8bae1dSRodney W. Grimes /* 1009df8bae1dSRodney W. Grimes * On a timeout, return what's in the buffer, 1010df8bae1dSRodney W. Grimes * which may be nothing. If there is something 1011df8bae1dSRodney W. Grimes * in the store buffer, we can rotate the buffers. 1012df8bae1dSRodney W. Grimes */ 1013df8bae1dSRodney W. Grimes if (d->bd_hbuf) 1014df8bae1dSRodney W. Grimes /* 1015df8bae1dSRodney W. Grimes * We filled up the buffer in between 1016df8bae1dSRodney W. Grimes * getting the timeout and arriving 1017df8bae1dSRodney W. Grimes * here, so we don't need to rotate. 1018df8bae1dSRodney W. Grimes */ 1019df8bae1dSRodney W. Grimes break; 1020df8bae1dSRodney W. Grimes 1021df8bae1dSRodney W. Grimes if (d->bd_slen == 0) { 1022afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 1023df8bae1dSRodney W. Grimes return (0); 1024df8bae1dSRodney W. Grimes } 1025df8bae1dSRodney W. Grimes ROTATE_BUFFERS(d); 1026df8bae1dSRodney W. Grimes break; 1027df8bae1dSRodney W. Grimes } 1028df8bae1dSRodney W. Grimes } 1029df8bae1dSRodney W. Grimes /* 1030df8bae1dSRodney W. Grimes * At this point, we know we have something in the hold slot. 1031df8bae1dSRodney W. Grimes */ 10323b3b91e7SGuy Helmer d->bd_hbuf_in_use = 1; 1033afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 1034df8bae1dSRodney W. Grimes 1035df8bae1dSRodney W. Grimes /* 1036df8bae1dSRodney W. Grimes * Move data from hold buffer into user space. 1037df8bae1dSRodney W. Grimes * We know the entire buffer is transferred since 1038df8bae1dSRodney W. Grimes * we checked above that the read buffer is bpf_bufsize bytes. 103931b32e6dSRobert Watson * 10403b3b91e7SGuy Helmer * We do not have to worry about simultaneous reads because 10413b3b91e7SGuy Helmer * we waited for sole access to the hold buffer above. 
1042df8bae1dSRodney W. Grimes */ 10434d621040SChristian S.J. Peron error = bpf_uiomove(d, d->bd_hbuf, d->bd_hlen, uio); 1044df8bae1dSRodney W. Grimes 1045afa85850SAlexander V. Chernikov BPFD_LOCK(d); 10463b3b91e7SGuy Helmer KASSERT(d->bd_hbuf != NULL, ("bpfread: lost bd_hbuf")); 1047df8bae1dSRodney W. Grimes d->bd_fbuf = d->bd_hbuf; 1048572bde2aSRobert Watson d->bd_hbuf = NULL; 1049df8bae1dSRodney W. Grimes d->bd_hlen = 0; 105029f612ecSChristian S.J. Peron bpf_buf_reclaimed(d); 10513b3b91e7SGuy Helmer d->bd_hbuf_in_use = 0; 10523b3b91e7SGuy Helmer wakeup(&d->bd_hbuf_in_use); 1053afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 1054df8bae1dSRodney W. Grimes 1055df8bae1dSRodney W. Grimes return (error); 1056df8bae1dSRodney W. Grimes } 1057df8bae1dSRodney W. Grimes 1058df8bae1dSRodney W. Grimes /* 1059df8bae1dSRodney W. Grimes * If there are processes sleeping on this descriptor, wake them up. 1060df8bae1dSRodney W. Grimes */ 1061e7bb21b3SJonathan Lemon static __inline void 106219ba8395SChristian S.J. Peron bpf_wakeup(struct bpf_d *d) 1063df8bae1dSRodney W. Grimes { 1064a3272e3cSChristian S.J. Peron 1065afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 106681bda851SJohn Polstra if (d->bd_state == BPF_WAITING) { 106781bda851SJohn Polstra callout_stop(&d->bd_callout); 106881bda851SJohn Polstra d->bd_state = BPF_IDLE; 106981bda851SJohn Polstra } 1070521f364bSDag-Erling Smørgrav wakeup(d); 1071831d27a9SDon Lewis if (d->bd_async && d->bd_sig && d->bd_sigio) 1072f1320723SAlfred Perlstein pgsigio(&d->bd_sigio, d->bd_sig, 0); 107300a83887SPaul Traina 1074512824f8SSeigo Tanimura selwakeuppri(&d->bd_sel, PRINET); 1075ad3b9257SJohn-Mark Gurney KNOTE_LOCKED(&d->bd_sel.si_note, 0); 1076df8bae1dSRodney W. Grimes } 1077df8bae1dSRodney W. Grimes 107881bda851SJohn Polstra static void 107919ba8395SChristian S.J. 
Peron bpf_timed_out(void *arg) 108081bda851SJohn Polstra { 108181bda851SJohn Polstra struct bpf_d *d = (struct bpf_d *)arg; 108281bda851SJohn Polstra 1083afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 10849fee1bd1SJung-uk Kim 10859fee1bd1SJung-uk Kim if (callout_pending(&d->bd_callout) || !callout_active(&d->bd_callout)) 10869fee1bd1SJung-uk Kim return; 108781bda851SJohn Polstra if (d->bd_state == BPF_WAITING) { 108881bda851SJohn Polstra d->bd_state = BPF_TIMED_OUT; 108981bda851SJohn Polstra if (d->bd_slen != 0) 109081bda851SJohn Polstra bpf_wakeup(d); 109181bda851SJohn Polstra } 109281bda851SJohn Polstra } 109381bda851SJohn Polstra 109487f6c662SJulian Elischer static int 10954d621040SChristian S.J. Peron bpf_ready(struct bpf_d *d) 10964d621040SChristian S.J. Peron { 10974d621040SChristian S.J. Peron 1098afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 10994d621040SChristian S.J. Peron 11004d621040SChristian S.J. Peron if (!bpf_canfreebuf(d) && d->bd_hlen != 0) 11014d621040SChristian S.J. Peron return (1); 11024d621040SChristian S.J. Peron if ((d->bd_immediate || d->bd_state == BPF_TIMED_OUT) && 11034d621040SChristian S.J. Peron d->bd_slen != 0) 11044d621040SChristian S.J. Peron return (1); 11054d621040SChristian S.J. Peron return (0); 11064d621040SChristian S.J. Peron } 11074d621040SChristian S.J. Peron 11084d621040SChristian S.J. Peron static int 110919ba8395SChristian S.J. Peron bpfwrite(struct cdev *dev, struct uio *uio, int ioflag) 1110df8bae1dSRodney W. Grimes { 1111136600feSEd Schouten struct bpf_d *d; 1112df8bae1dSRodney W. Grimes struct ifnet *ifp; 1113560a54e1SJung-uk Kim struct mbuf *m, *mc; 11148240bf1eSRobert Watson struct sockaddr dst; 11154fb3a820SAlexander V. Chernikov struct route ro; 1116560a54e1SJung-uk Kim int error, hlen; 1117df8bae1dSRodney W. 
Grimes 1118136600feSEd Schouten error = devfs_get_cdevpriv((void **)&d); 1119136600feSEd Schouten if (error != 0) 1120136600feSEd Schouten return (error); 1121136600feSEd Schouten 1122e4b3229aSAlexander V. Chernikov BPF_PID_REFRESH_CUR(d); 1123*b2b7ca49SAlexander V. Chernikov counter_u64_add(d->bd_wcount, 1); 11246c74ff0eSAlexander V. Chernikov /* XXX: locking required */ 11254d621040SChristian S.J. Peron if (d->bd_bif == NULL) { 1126*b2b7ca49SAlexander V. Chernikov counter_u64_add(d->bd_wdcount, 1); 1127df8bae1dSRodney W. Grimes return (ENXIO); 11284d621040SChristian S.J. Peron } 1129df8bae1dSRodney W. Grimes 1130df8bae1dSRodney W. Grimes ifp = d->bd_bif->bif_ifp; 1131df8bae1dSRodney W. Grimes 11324d621040SChristian S.J. Peron if ((ifp->if_flags & IFF_UP) == 0) { 1133*b2b7ca49SAlexander V. Chernikov counter_u64_add(d->bd_wdcount, 1); 11343518d220SSam Leffler return (ENETDOWN); 11354d621040SChristian S.J. Peron } 11363518d220SSam Leffler 11374d621040SChristian S.J. Peron if (uio->uio_resid == 0) { 1138*b2b7ca49SAlexander V. Chernikov counter_u64_add(d->bd_wdcount, 1); 1139df8bae1dSRodney W. Grimes return (0); 11404d621040SChristian S.J. Peron } 1141df8bae1dSRodney W. Grimes 11428240bf1eSRobert Watson bzero(&dst, sizeof(dst)); 1143d83e603aSChristian S.J. Peron m = NULL; 1144d83e603aSChristian S.J. Peron hlen = 0; 11456c74ff0eSAlexander V. Chernikov /* XXX: bpf_movein() can sleep */ 1146cb44b6dfSAndrew Thompson error = bpf_movein(uio, (int)d->bd_bif->bif_dlt, ifp, 11474fb3a820SAlexander V. Chernikov &m, &dst, &hlen, d); 11484d621040SChristian S.J. Peron if (error) { 1149*b2b7ca49SAlexander V. Chernikov counter_u64_add(d->bd_wdcount, 1); 1150df8bae1dSRodney W. Grimes return (error); 11514d621040SChristian S.J. Peron } 1152*b2b7ca49SAlexander V. 
Chernikov counter_u64_add(d->bd_wfcount, 1); 1153114ae644SMike Smith if (d->bd_hdrcmplt) 1154114ae644SMike Smith dst.sa_family = pseudo_AF_HDRCMPLT; 1155114ae644SMike Smith 1156560a54e1SJung-uk Kim if (d->bd_feedback) { 1157eb1b1807SGleb Smirnoff mc = m_dup(m, M_NOWAIT); 1158560a54e1SJung-uk Kim if (mc != NULL) 1159560a54e1SJung-uk Kim mc->m_pkthdr.rcvif = ifp; 11608cd892f7SJung-uk Kim /* Set M_PROMISC for outgoing packets to be discarded. */ 11618cd892f7SJung-uk Kim if (d->bd_direction == BPF_D_INOUT) 11628cd892f7SJung-uk Kim m->m_flags |= M_PROMISC; 1163560a54e1SJung-uk Kim } else 1164560a54e1SJung-uk Kim mc = NULL; 1165560a54e1SJung-uk Kim 1166560a54e1SJung-uk Kim m->m_pkthdr.len -= hlen; 1167560a54e1SJung-uk Kim m->m_len -= hlen; 1168560a54e1SJung-uk Kim m->m_data += hlen; /* XXX */ 1169560a54e1SJung-uk Kim 117021ca7b57SMarko Zec CURVNET_SET(ifp->if_vnet); 117182f4445dSRobert Watson #ifdef MAC 1172afa85850SAlexander V. Chernikov BPFD_LOCK(d); 117330d239bcSRobert Watson mac_bpfdesc_create_mbuf(d, m); 1174560a54e1SJung-uk Kim if (mc != NULL) 117530d239bcSRobert Watson mac_bpfdesc_create_mbuf(d, mc); 1176afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 117782f4445dSRobert Watson #endif 1178560a54e1SJung-uk Kim 11794fb3a820SAlexander V. Chernikov bzero(&ro, sizeof(ro)); 11804fb3a820SAlexander V. Chernikov if (hlen != 0) { 11814fb3a820SAlexander V. Chernikov ro.ro_prepend = (u_char *)&dst.sa_data; 11824fb3a820SAlexander V. Chernikov ro.ro_plen = hlen; 11834fb3a820SAlexander V. Chernikov ro.ro_flags = RT_HAS_HEADER; 11844fb3a820SAlexander V. Chernikov } 11854fb3a820SAlexander V. Chernikov 11864fb3a820SAlexander V. Chernikov error = (*ifp->if_output)(ifp, m, &dst, &ro); 11874d621040SChristian S.J. Peron if (error) 1188*b2b7ca49SAlexander V. 
Chernikov counter_u64_add(d->bd_wdcount, 1); 1189560a54e1SJung-uk Kim 1190560a54e1SJung-uk Kim if (mc != NULL) { 11910bf686c1SRobert Watson if (error == 0) 1192560a54e1SJung-uk Kim (*ifp->if_input)(ifp, mc); 11930bf686c1SRobert Watson else 1194560a54e1SJung-uk Kim m_freem(mc); 1195560a54e1SJung-uk Kim } 119621ca7b57SMarko Zec CURVNET_RESTORE(); 1197560a54e1SJung-uk Kim 1198df8bae1dSRodney W. Grimes return (error); 1199df8bae1dSRodney W. Grimes } 1200df8bae1dSRodney W. Grimes 1201df8bae1dSRodney W. Grimes /* 1202e82669d9SRobert Watson * Reset a descriptor by flushing its packet buffer and clearing the receive 1203e82669d9SRobert Watson * and drop counts. This is doable for kernel-only buffers, but with 1204e82669d9SRobert Watson * zero-copy buffers, we can't write to (or rotate) buffers that are 1205e82669d9SRobert Watson * currently owned by userspace. It would be nice if we could encapsulate 1206e82669d9SRobert Watson * this logic in the buffer code rather than here. 1207df8bae1dSRodney W. Grimes */ 1208df8bae1dSRodney W. Grimes static void 120919ba8395SChristian S.J. Peron reset_d(struct bpf_d *d) 1210df8bae1dSRodney W. Grimes { 1211e7bb21b3SJonathan Lemon 1212afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 1213e82669d9SRobert Watson 12143b3b91e7SGuy Helmer while (d->bd_hbuf_in_use) 12153b3b91e7SGuy Helmer mtx_sleep(&d->bd_hbuf_in_use, &d->bd_lock, PRINET, 12163b3b91e7SGuy Helmer "bd_hbuf", 0); 1217e82669d9SRobert Watson if ((d->bd_hbuf != NULL) && 1218e82669d9SRobert Watson (d->bd_bufmode != BPF_BUFMODE_ZBUF || bpf_canfreebuf(d))) { 1219df8bae1dSRodney W. Grimes /* Free the hold buffer. */ 1220df8bae1dSRodney W. Grimes d->bd_fbuf = d->bd_hbuf; 1221572bde2aSRobert Watson d->bd_hbuf = NULL; 1222e82669d9SRobert Watson d->bd_hlen = 0; 122329f612ecSChristian S.J. Peron bpf_buf_reclaimed(d); 1224df8bae1dSRodney W. Grimes } 1225e82669d9SRobert Watson if (bpf_canwritebuf(d)) 1226df8bae1dSRodney W. Grimes d->bd_slen = 0; 1227*b2b7ca49SAlexander V. 
Chernikov counter_u64_zero(d->bd_rcount); 1228*b2b7ca49SAlexander V. Chernikov counter_u64_zero(d->bd_dcount); 1229*b2b7ca49SAlexander V. Chernikov counter_u64_zero(d->bd_fcount); 1230*b2b7ca49SAlexander V. Chernikov counter_u64_zero(d->bd_wcount); 1231*b2b7ca49SAlexander V. Chernikov counter_u64_zero(d->bd_wfcount); 1232*b2b7ca49SAlexander V. Chernikov counter_u64_zero(d->bd_wdcount); 1233*b2b7ca49SAlexander V. Chernikov counter_u64_zero(d->bd_zcopy); 1234df8bae1dSRodney W. Grimes } 1235df8bae1dSRodney W. Grimes 1236df8bae1dSRodney W. Grimes /* 1237df8bae1dSRodney W. Grimes * FIONREAD Check for read packet available. 1238df8bae1dSRodney W. Grimes * BIOCGBLEN Get buffer len [for read()]. 1239f11c3508SDavid Malone * BIOCSETF Set read filter. 1240f11c3508SDavid Malone * BIOCSETFNR Set read filter without resetting descriptor. 1241f11c3508SDavid Malone * BIOCSETWF Set write filter. 1242df8bae1dSRodney W. Grimes * BIOCFLUSH Flush read packet buffer. 1243df8bae1dSRodney W. Grimes * BIOCPROMISC Put interface into promiscuous mode. 1244df8bae1dSRodney W. Grimes * BIOCGDLT Get link layer type. 1245df8bae1dSRodney W. Grimes * BIOCGETIF Get interface name. 1246df8bae1dSRodney W. Grimes * BIOCSETIF Set interface. 1247df8bae1dSRodney W. Grimes * BIOCSRTIMEOUT Set read timeout. 1248df8bae1dSRodney W. Grimes * BIOCGRTIMEOUT Get read timeout. 1249df8bae1dSRodney W. Grimes * BIOCGSTATS Get packet stats. 1250df8bae1dSRodney W. Grimes * BIOCIMMEDIATE Set immediate mode. 1251df8bae1dSRodney W. Grimes * BIOCVERSION Get filter language version. 1252114ae644SMike Smith * BIOCGHDRCMPLT Get "header already complete" flag 1253114ae644SMike Smith * BIOCSHDRCMPLT Set "header already complete" flag 1254560a54e1SJung-uk Kim * BIOCGDIRECTION Get packet direction flag 1255560a54e1SJung-uk Kim * BIOCSDIRECTION Set packet direction flag 1256547d94bdSJung-uk Kim * BIOCGTSTAMP Get time stamp format and resolution. 1257547d94bdSJung-uk Kim * BIOCSTSTAMP Set time stamp format and resolution. 
125893e39f0bSChristian S.J. Peron * BIOCLOCK Set "locked" flag 1259560a54e1SJung-uk Kim * BIOCFEEDBACK Set packet feedback mode. 12604d621040SChristian S.J. Peron * BIOCSETZBUF Set current zero-copy buffer locations. 12614d621040SChristian S.J. Peron * BIOCGETZMAX Get maximum zero-copy buffer size. 12624d621040SChristian S.J. Peron * BIOCROTZBUF Force rotation of zero-copy buffer 12634d621040SChristian S.J. Peron * BIOCSETBUFMODE Set buffer mode. 12644d621040SChristian S.J. Peron * BIOCGETBUFMODE Get current buffer mode. 1265df8bae1dSRodney W. Grimes */ 1266df8bae1dSRodney W. Grimes /* ARGSUSED */ 126787f6c662SJulian Elischer static int 126819ba8395SChristian S.J. Peron bpfioctl(struct cdev *dev, u_long cmd, caddr_t addr, int flags, 126919ba8395SChristian S.J. Peron struct thread *td) 1270df8bae1dSRodney W. Grimes { 1271136600feSEd Schouten struct bpf_d *d; 1272136600feSEd Schouten int error; 1273136600feSEd Schouten 1274136600feSEd Schouten error = devfs_get_cdevpriv((void **)&d); 1275136600feSEd Schouten if (error != 0) 1276136600feSEd Schouten return (error); 1277df8bae1dSRodney W. Grimes 1278b75a24a0SChristian S.J. Peron /* 1279b75a24a0SChristian S.J. Peron * Refresh PID associated with this descriptor. 1280b75a24a0SChristian S.J. Peron */ 1281afa85850SAlexander V. Chernikov BPFD_LOCK(d); 1282e4b3229aSAlexander V. Chernikov BPF_PID_REFRESH(d, td); 128381bda851SJohn Polstra if (d->bd_state == BPF_WAITING) 128481bda851SJohn Polstra callout_stop(&d->bd_callout); 128581bda851SJohn Polstra d->bd_state = BPF_IDLE; 1286afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 128781bda851SJohn Polstra 128893e39f0bSChristian S.J. Peron if (d->bd_locked == 1) { 128993e39f0bSChristian S.J. Peron switch (cmd) { 129093e39f0bSChristian S.J. Peron case BIOCGBLEN: 129193e39f0bSChristian S.J. Peron case BIOCFLUSH: 129293e39f0bSChristian S.J. Peron case BIOCGDLT: 129393e39f0bSChristian S.J. 
Peron case BIOCGDLTLIST: 1294fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 1295fc0a61a4SKonstantin Belousov case BIOCGDLTLIST32: 1296fc0a61a4SKonstantin Belousov #endif 129793e39f0bSChristian S.J. Peron case BIOCGETIF: 129893e39f0bSChristian S.J. Peron case BIOCGRTIMEOUT: 1299b4366092SJustin Hibbits #if defined(COMPAT_FREEBSD32) && defined(__amd64__) 1300fc0a61a4SKonstantin Belousov case BIOCGRTIMEOUT32: 1301fc0a61a4SKonstantin Belousov #endif 130293e39f0bSChristian S.J. Peron case BIOCGSTATS: 130393e39f0bSChristian S.J. Peron case BIOCVERSION: 130493e39f0bSChristian S.J. Peron case BIOCGRSIG: 130593e39f0bSChristian S.J. Peron case BIOCGHDRCMPLT: 1306547d94bdSJung-uk Kim case BIOCSTSTAMP: 1307560a54e1SJung-uk Kim case BIOCFEEDBACK: 130893e39f0bSChristian S.J. Peron case FIONREAD: 130993e39f0bSChristian S.J. Peron case BIOCLOCK: 131093e39f0bSChristian S.J. Peron case BIOCSRTIMEOUT: 1311b4366092SJustin Hibbits #if defined(COMPAT_FREEBSD32) && defined(__amd64__) 1312fc0a61a4SKonstantin Belousov case BIOCSRTIMEOUT32: 1313fc0a61a4SKonstantin Belousov #endif 131493e39f0bSChristian S.J. Peron case BIOCIMMEDIATE: 131593e39f0bSChristian S.J. Peron case TIOCGPGRP: 13164d621040SChristian S.J. Peron case BIOCROTZBUF: 131793e39f0bSChristian S.J. Peron break; 131893e39f0bSChristian S.J. Peron default: 131993e39f0bSChristian S.J. Peron return (EPERM); 132093e39f0bSChristian S.J. Peron } 132193e39f0bSChristian S.J. Peron } 1322fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 1323fc0a61a4SKonstantin Belousov /* 1324fc0a61a4SKonstantin Belousov * If we see a 32-bit compat ioctl, mark the stream as 32-bit so 1325fc0a61a4SKonstantin Belousov * that it will get 32-bit packet headers. 
1326fc0a61a4SKonstantin Belousov */ 1327fc0a61a4SKonstantin Belousov switch (cmd) { 1328fc0a61a4SKonstantin Belousov case BIOCSETF32: 1329fc0a61a4SKonstantin Belousov case BIOCSETFNR32: 1330fc0a61a4SKonstantin Belousov case BIOCSETWF32: 1331fc0a61a4SKonstantin Belousov case BIOCGDLTLIST32: 1332fc0a61a4SKonstantin Belousov case BIOCGRTIMEOUT32: 1333fc0a61a4SKonstantin Belousov case BIOCSRTIMEOUT32: 133474549d4bSWojciech Macek if (SV_PROC_FLAG(td->td_proc, SV_ILP32)) { 133597aacec6SAlexander V. Chernikov BPFD_LOCK(d); 1336fc0a61a4SKonstantin Belousov d->bd_compat32 = 1; 133797aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 1338fc0a61a4SKonstantin Belousov } 133974549d4bSWojciech Macek } 1340fc0a61a4SKonstantin Belousov #endif 1341fc0a61a4SKonstantin Belousov 134297021c24SMarko Zec CURVNET_SET(TD_TO_VNET(td)); 1343df8bae1dSRodney W. Grimes switch (cmd) { 1344df8bae1dSRodney W. Grimes 1345df8bae1dSRodney W. Grimes default: 1346df8bae1dSRodney W. Grimes error = EINVAL; 1347df8bae1dSRodney W. Grimes break; 1348df8bae1dSRodney W. Grimes 1349df8bae1dSRodney W. Grimes /* 1350df8bae1dSRodney W. Grimes * Check for read packet available. 1351df8bae1dSRodney W. Grimes */ 1352df8bae1dSRodney W. Grimes case FIONREAD: 1353df8bae1dSRodney W. Grimes { 1354df8bae1dSRodney W. Grimes int n; 1355df8bae1dSRodney W. Grimes 1356afa85850SAlexander V. Chernikov BPFD_LOCK(d); 1357df8bae1dSRodney W. Grimes n = d->bd_slen; 13583b3b91e7SGuy Helmer while (d->bd_hbuf_in_use) 13593b3b91e7SGuy Helmer mtx_sleep(&d->bd_hbuf_in_use, &d->bd_lock, 13603b3b91e7SGuy Helmer PRINET, "bd_hbuf", 0); 1361df8bae1dSRodney W. Grimes if (d->bd_hbuf) 1362df8bae1dSRodney W. Grimes n += d->bd_hlen; 1363afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 1364df8bae1dSRodney W. Grimes 1365df8bae1dSRodney W. Grimes *(int *)addr = n; 1366df8bae1dSRodney W. Grimes break; 1367df8bae1dSRodney W. Grimes } 1368df8bae1dSRodney W. Grimes 1369df8bae1dSRodney W. Grimes /* 1370df8bae1dSRodney W. Grimes * Get buffer len [for read()]. 
1371df8bae1dSRodney W. Grimes */ 1372df8bae1dSRodney W. Grimes case BIOCGBLEN: 137397aacec6SAlexander V. Chernikov BPFD_LOCK(d); 1374df8bae1dSRodney W. Grimes *(u_int *)addr = d->bd_bufsize; 137597aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 1376df8bae1dSRodney W. Grimes break; 1377df8bae1dSRodney W. Grimes 1378df8bae1dSRodney W. Grimes /* 1379df8bae1dSRodney W. Grimes * Set buffer length. 1380df8bae1dSRodney W. Grimes */ 1381df8bae1dSRodney W. Grimes case BIOCSBLEN: 13824d621040SChristian S.J. Peron error = bpf_ioctl_sblen(d, (u_int *)addr); 1383df8bae1dSRodney W. Grimes break; 1384df8bae1dSRodney W. Grimes 1385df8bae1dSRodney W. Grimes /* 1386df8bae1dSRodney W. Grimes * Set link layer read filter. 1387df8bae1dSRodney W. Grimes */ 1388df8bae1dSRodney W. Grimes case BIOCSETF: 1389f11c3508SDavid Malone case BIOCSETFNR: 139093e39f0bSChristian S.J. Peron case BIOCSETWF: 1391fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 1392fc0a61a4SKonstantin Belousov case BIOCSETF32: 1393fc0a61a4SKonstantin Belousov case BIOCSETFNR32: 1394fc0a61a4SKonstantin Belousov case BIOCSETWF32: 1395fc0a61a4SKonstantin Belousov #endif 139693e39f0bSChristian S.J. Peron error = bpf_setf(d, (struct bpf_program *)addr, cmd); 1397df8bae1dSRodney W. Grimes break; 1398df8bae1dSRodney W. Grimes 1399df8bae1dSRodney W. Grimes /* 1400df8bae1dSRodney W. Grimes * Flush read packet buffer. 1401df8bae1dSRodney W. Grimes */ 1402df8bae1dSRodney W. Grimes case BIOCFLUSH: 1403afa85850SAlexander V. Chernikov BPFD_LOCK(d); 1404df8bae1dSRodney W. Grimes reset_d(d); 1405afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 1406df8bae1dSRodney W. Grimes break; 1407df8bae1dSRodney W. Grimes 1408df8bae1dSRodney W. Grimes /* 1409df8bae1dSRodney W. Grimes * Put interface into promiscuous mode. 1410df8bae1dSRodney W. Grimes */ 1411df8bae1dSRodney W. Grimes case BIOCPROMISC: 1412572bde2aSRobert Watson if (d->bd_bif == NULL) { 1413df8bae1dSRodney W. Grimes /* 1414df8bae1dSRodney W. Grimes * No interface attached yet. 
1415df8bae1dSRodney W. Grimes */ 1416df8bae1dSRodney W. Grimes error = EINVAL; 1417df8bae1dSRodney W. Grimes break; 1418df8bae1dSRodney W. Grimes } 1419df8bae1dSRodney W. Grimes if (d->bd_promisc == 0) { 1420df8bae1dSRodney W. Grimes error = ifpromisc(d->bd_bif->bif_ifp, 1); 1421df8bae1dSRodney W. Grimes if (error == 0) 1422df8bae1dSRodney W. Grimes d->bd_promisc = 1; 1423df8bae1dSRodney W. Grimes } 1424df8bae1dSRodney W. Grimes break; 1425df8bae1dSRodney W. Grimes 1426df8bae1dSRodney W. Grimes /* 14278eab61f3SSam Leffler * Get current data link type. 1428df8bae1dSRodney W. Grimes */ 1429df8bae1dSRodney W. Grimes case BIOCGDLT: 143097aacec6SAlexander V. Chernikov BPF_LOCK(); 1431572bde2aSRobert Watson if (d->bd_bif == NULL) 1432df8bae1dSRodney W. Grimes error = EINVAL; 1433df8bae1dSRodney W. Grimes else 1434df8bae1dSRodney W. Grimes *(u_int *)addr = d->bd_bif->bif_dlt; 143597aacec6SAlexander V. Chernikov BPF_UNLOCK(); 1436df8bae1dSRodney W. Grimes break; 1437df8bae1dSRodney W. Grimes 1438df8bae1dSRodney W. Grimes /* 14398eab61f3SSam Leffler * Get a list of supported data link types. 14408eab61f3SSam Leffler */ 1441fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 1442fc0a61a4SKonstantin Belousov case BIOCGDLTLIST32: 1443fc0a61a4SKonstantin Belousov { 1444fc0a61a4SKonstantin Belousov struct bpf_dltlist32 *list32; 1445fc0a61a4SKonstantin Belousov struct bpf_dltlist dltlist; 1446fc0a61a4SKonstantin Belousov 1447fc0a61a4SKonstantin Belousov list32 = (struct bpf_dltlist32 *)addr; 1448fc0a61a4SKonstantin Belousov dltlist.bfl_len = list32->bfl_len; 1449fc0a61a4SKonstantin Belousov dltlist.bfl_list = PTRIN(list32->bfl_list); 145097aacec6SAlexander V. 
Chernikov BPF_LOCK(); 1451fc0a61a4SKonstantin Belousov if (d->bd_bif == NULL) 1452fc0a61a4SKonstantin Belousov error = EINVAL; 1453fc0a61a4SKonstantin Belousov else { 1454fc0a61a4SKonstantin Belousov error = bpf_getdltlist(d, &dltlist); 1455fc0a61a4SKonstantin Belousov if (error == 0) 1456fc0a61a4SKonstantin Belousov list32->bfl_len = dltlist.bfl_len; 1457fc0a61a4SKonstantin Belousov } 145897aacec6SAlexander V. Chernikov BPF_UNLOCK(); 1459fc0a61a4SKonstantin Belousov break; 1460fc0a61a4SKonstantin Belousov } 1461fc0a61a4SKonstantin Belousov #endif 1462fc0a61a4SKonstantin Belousov 14638eab61f3SSam Leffler case BIOCGDLTLIST: 146497aacec6SAlexander V. Chernikov BPF_LOCK(); 1465572bde2aSRobert Watson if (d->bd_bif == NULL) 14668eab61f3SSam Leffler error = EINVAL; 14678eab61f3SSam Leffler else 14688eab61f3SSam Leffler error = bpf_getdltlist(d, (struct bpf_dltlist *)addr); 146997aacec6SAlexander V. Chernikov BPF_UNLOCK(); 14708eab61f3SSam Leffler break; 14718eab61f3SSam Leffler 14728eab61f3SSam Leffler /* 14738eab61f3SSam Leffler * Set data link type. 14748eab61f3SSam Leffler */ 14758eab61f3SSam Leffler case BIOCSDLT: 14766c74ff0eSAlexander V. Chernikov BPF_LOCK(); 1477572bde2aSRobert Watson if (d->bd_bif == NULL) 14788eab61f3SSam Leffler error = EINVAL; 14798eab61f3SSam Leffler else 14808eab61f3SSam Leffler error = bpf_setdlt(d, *(u_int *)addr); 14816c74ff0eSAlexander V. Chernikov BPF_UNLOCK(); 14828eab61f3SSam Leffler break; 14838eab61f3SSam Leffler 14848eab61f3SSam Leffler /* 14851dd0feaaSArchie Cobbs * Get interface name. 1486df8bae1dSRodney W. Grimes */ 1487df8bae1dSRodney W. Grimes case BIOCGETIF: 148897aacec6SAlexander V. Chernikov BPF_LOCK(); 1489572bde2aSRobert Watson if (d->bd_bif == NULL) 1490df8bae1dSRodney W. 
Grimes error = EINVAL; 14911dd0feaaSArchie Cobbs else { 14921dd0feaaSArchie Cobbs struct ifnet *const ifp = d->bd_bif->bif_ifp; 14931dd0feaaSArchie Cobbs struct ifreq *const ifr = (struct ifreq *)addr; 14941dd0feaaSArchie Cobbs 14959bf40edeSBrooks Davis strlcpy(ifr->ifr_name, ifp->if_xname, 14969bf40edeSBrooks Davis sizeof(ifr->ifr_name)); 14971dd0feaaSArchie Cobbs } 149897aacec6SAlexander V. Chernikov BPF_UNLOCK(); 1499df8bae1dSRodney W. Grimes break; 1500df8bae1dSRodney W. Grimes 1501df8bae1dSRodney W. Grimes /* 1502df8bae1dSRodney W. Grimes * Set interface. 1503df8bae1dSRodney W. Grimes */ 1504df8bae1dSRodney W. Grimes case BIOCSETIF: 15054f42daa4SLuiz Otavio O Souza { 15064f42daa4SLuiz Otavio O Souza int alloc_buf, size; 15074f42daa4SLuiz Otavio O Souza 15084f42daa4SLuiz Otavio O Souza /* 15094f42daa4SLuiz Otavio O Souza * Behavior here depends on the buffering model. If 15104f42daa4SLuiz Otavio O Souza * we're using kernel memory buffers, then we can 15114f42daa4SLuiz Otavio O Souza * allocate them here. If we're using zero-copy, 15124f42daa4SLuiz Otavio O Souza * then the user process must have registered buffers 15134f42daa4SLuiz Otavio O Souza * by the time we get here. 15144f42daa4SLuiz Otavio O Souza */ 15154f42daa4SLuiz Otavio O Souza alloc_buf = 0; 15164f42daa4SLuiz Otavio O Souza BPFD_LOCK(d); 15174f42daa4SLuiz Otavio O Souza if (d->bd_bufmode == BPF_BUFMODE_BUFFER && 15184f42daa4SLuiz Otavio O Souza d->bd_sbuf == NULL) 15194f42daa4SLuiz Otavio O Souza alloc_buf = 1; 15204f42daa4SLuiz Otavio O Souza BPFD_UNLOCK(d); 15214f42daa4SLuiz Otavio O Souza if (alloc_buf) { 15224f42daa4SLuiz Otavio O Souza size = d->bd_bufsize; 15234f42daa4SLuiz Otavio O Souza error = bpf_buffer_ioctl_sblen(d, &size); 15244f42daa4SLuiz Otavio O Souza if (error != 0) 15254f42daa4SLuiz Otavio O Souza break; 15264f42daa4SLuiz Otavio O Souza } 15276c74ff0eSAlexander V. Chernikov BPF_LOCK(); 1528df8bae1dSRodney W. 
Grimes error = bpf_setif(d, (struct ifreq *)addr); 15296c74ff0eSAlexander V. Chernikov BPF_UNLOCK(); 1530df8bae1dSRodney W. Grimes break; 15314f42daa4SLuiz Otavio O Souza } 1532df8bae1dSRodney W. Grimes 1533df8bae1dSRodney W. Grimes /* 1534df8bae1dSRodney W. Grimes * Set read timeout. 1535df8bae1dSRodney W. Grimes */ 1536df8bae1dSRodney W. Grimes case BIOCSRTIMEOUT: 1537b4366092SJustin Hibbits #if defined(COMPAT_FREEBSD32) && defined(__amd64__) 1538fc0a61a4SKonstantin Belousov case BIOCSRTIMEOUT32: 1539fc0a61a4SKonstantin Belousov #endif 1540df8bae1dSRodney W. Grimes { 1541df8bae1dSRodney W. Grimes struct timeval *tv = (struct timeval *)addr; 15429624d947SJuli Mallett #if defined(COMPAT_FREEBSD32) && !defined(__mips__) 1543fc0a61a4SKonstantin Belousov struct timeval32 *tv32; 1544fc0a61a4SKonstantin Belousov struct timeval tv64; 1545fc0a61a4SKonstantin Belousov 1546fc0a61a4SKonstantin Belousov if (cmd == BIOCSRTIMEOUT32) { 1547fc0a61a4SKonstantin Belousov tv32 = (struct timeval32 *)addr; 1548fc0a61a4SKonstantin Belousov tv = &tv64; 1549fc0a61a4SKonstantin Belousov tv->tv_sec = tv32->tv_sec; 1550fc0a61a4SKonstantin Belousov tv->tv_usec = tv32->tv_usec; 1551fc0a61a4SKonstantin Belousov } else 1552fc0a61a4SKonstantin Belousov #endif 1553fc0a61a4SKonstantin Belousov tv = (struct timeval *)addr; 1554df8bae1dSRodney W. Grimes 1555bdc2cdc5SAlexander Langer /* 1556bdc2cdc5SAlexander Langer * Subtract 1 tick from tvtohz() since this isn't 1557bdc2cdc5SAlexander Langer * a one-shot timer. 1558bdc2cdc5SAlexander Langer */ 1559bdc2cdc5SAlexander Langer if ((error = itimerfix(tv)) == 0) 1560bdc2cdc5SAlexander Langer d->bd_rtout = tvtohz(tv) - 1; 1561df8bae1dSRodney W. Grimes break; 1562df8bae1dSRodney W. Grimes } 1563df8bae1dSRodney W. Grimes 1564df8bae1dSRodney W. Grimes /* 1565df8bae1dSRodney W. Grimes * Get read timeout. 1566df8bae1dSRodney W. Grimes */ 1567df8bae1dSRodney W. 
Grimes case BIOCGRTIMEOUT: 1568b4366092SJustin Hibbits #if defined(COMPAT_FREEBSD32) && defined(__amd64__) 1569fc0a61a4SKonstantin Belousov case BIOCGRTIMEOUT32: 1570fc0a61a4SKonstantin Belousov #endif 1571df8bae1dSRodney W. Grimes { 1572fc0a61a4SKonstantin Belousov struct timeval *tv; 1573b4366092SJustin Hibbits #if defined(COMPAT_FREEBSD32) && defined(__amd64__) 1574fc0a61a4SKonstantin Belousov struct timeval32 *tv32; 1575fc0a61a4SKonstantin Belousov struct timeval tv64; 1576fc0a61a4SKonstantin Belousov 1577fc0a61a4SKonstantin Belousov if (cmd == BIOCGRTIMEOUT32) 1578fc0a61a4SKonstantin Belousov tv = &tv64; 1579fc0a61a4SKonstantin Belousov else 1580fc0a61a4SKonstantin Belousov #endif 1581fc0a61a4SKonstantin Belousov tv = (struct timeval *)addr; 1582df8bae1dSRodney W. Grimes 1583bdc2cdc5SAlexander Langer tv->tv_sec = d->bd_rtout / hz; 1584bdc2cdc5SAlexander Langer tv->tv_usec = (d->bd_rtout % hz) * tick; 1585b4366092SJustin Hibbits #if defined(COMPAT_FREEBSD32) && defined(__amd64__) 1586fc0a61a4SKonstantin Belousov if (cmd == BIOCGRTIMEOUT32) { 1587fc0a61a4SKonstantin Belousov tv32 = (struct timeval32 *)addr; 1588fc0a61a4SKonstantin Belousov tv32->tv_sec = tv->tv_sec; 1589fc0a61a4SKonstantin Belousov tv32->tv_usec = tv->tv_usec; 1590fc0a61a4SKonstantin Belousov } 1591fc0a61a4SKonstantin Belousov #endif 1592fc0a61a4SKonstantin Belousov 1593df8bae1dSRodney W. Grimes break; 1594df8bae1dSRodney W. Grimes } 1595df8bae1dSRodney W. Grimes 1596df8bae1dSRodney W. Grimes /* 1597df8bae1dSRodney W. Grimes * Get packet stats. 1598df8bae1dSRodney W. Grimes */ 1599df8bae1dSRodney W. Grimes case BIOCGSTATS: 1600df8bae1dSRodney W. Grimes { 1601df8bae1dSRodney W. Grimes struct bpf_stat *bs = (struct bpf_stat *)addr; 1602df8bae1dSRodney W. Grimes 16034d621040SChristian S.J. Peron /* XXXCSJP overflow */ 1604*b2b7ca49SAlexander V. Chernikov bs->bs_recv = (u_int)counter_u64_fetch(d->bd_rcount); 1605*b2b7ca49SAlexander V. 
Chernikov bs->bs_drop = (u_int)counter_u64_fetch(d->bd_dcount); 1606df8bae1dSRodney W. Grimes break; 1607df8bae1dSRodney W. Grimes } 1608df8bae1dSRodney W. Grimes 1609df8bae1dSRodney W. Grimes /* 1610df8bae1dSRodney W. Grimes * Set immediate mode. 1611df8bae1dSRodney W. Grimes */ 1612df8bae1dSRodney W. Grimes case BIOCIMMEDIATE: 161397aacec6SAlexander V. Chernikov BPFD_LOCK(d); 1614df8bae1dSRodney W. Grimes d->bd_immediate = *(u_int *)addr; 161597aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 1616df8bae1dSRodney W. Grimes break; 1617df8bae1dSRodney W. Grimes 1618df8bae1dSRodney W. Grimes case BIOCVERSION: 1619df8bae1dSRodney W. Grimes { 1620df8bae1dSRodney W. Grimes struct bpf_version *bv = (struct bpf_version *)addr; 1621df8bae1dSRodney W. Grimes 1622df8bae1dSRodney W. Grimes bv->bv_major = BPF_MAJOR_VERSION; 1623df8bae1dSRodney W. Grimes bv->bv_minor = BPF_MINOR_VERSION; 1624df8bae1dSRodney W. Grimes break; 1625df8bae1dSRodney W. Grimes } 162600a83887SPaul Traina 1627114ae644SMike Smith /* 1628114ae644SMike Smith * Get "header already complete" flag 1629114ae644SMike Smith */ 1630114ae644SMike Smith case BIOCGHDRCMPLT: 163197aacec6SAlexander V. Chernikov BPFD_LOCK(d); 1632114ae644SMike Smith *(u_int *)addr = d->bd_hdrcmplt; 163397aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 1634114ae644SMike Smith break; 1635114ae644SMike Smith 1636114ae644SMike Smith /* 1637114ae644SMike Smith * Set "header already complete" flag 1638114ae644SMike Smith */ 1639114ae644SMike Smith case BIOCSHDRCMPLT: 164097aacec6SAlexander V. Chernikov BPFD_LOCK(d); 1641114ae644SMike Smith d->bd_hdrcmplt = *(u_int *)addr ? 1 : 0; 164297aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 1643114ae644SMike Smith break; 1644114ae644SMike Smith 16458ed3828cSRobert Watson /* 1646560a54e1SJung-uk Kim * Get packet direction flag 16478ed3828cSRobert Watson */ 1648560a54e1SJung-uk Kim case BIOCGDIRECTION: 164997aacec6SAlexander V. 
Chernikov BPFD_LOCK(d); 1650560a54e1SJung-uk Kim *(u_int *)addr = d->bd_direction; 165197aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 16528ed3828cSRobert Watson break; 16538ed3828cSRobert Watson 16548ed3828cSRobert Watson /* 1655560a54e1SJung-uk Kim * Set packet direction flag 16568ed3828cSRobert Watson */ 1657560a54e1SJung-uk Kim case BIOCSDIRECTION: 1658560a54e1SJung-uk Kim { 1659560a54e1SJung-uk Kim u_int direction; 1660560a54e1SJung-uk Kim 1661560a54e1SJung-uk Kim direction = *(u_int *)addr; 1662560a54e1SJung-uk Kim switch (direction) { 1663560a54e1SJung-uk Kim case BPF_D_IN: 1664560a54e1SJung-uk Kim case BPF_D_INOUT: 1665560a54e1SJung-uk Kim case BPF_D_OUT: 166697aacec6SAlexander V. Chernikov BPFD_LOCK(d); 1667560a54e1SJung-uk Kim d->bd_direction = direction; 166897aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 1669560a54e1SJung-uk Kim break; 1670560a54e1SJung-uk Kim default: 1671560a54e1SJung-uk Kim error = EINVAL; 1672560a54e1SJung-uk Kim } 1673560a54e1SJung-uk Kim } 1674560a54e1SJung-uk Kim break; 1675560a54e1SJung-uk Kim 1676547d94bdSJung-uk Kim /* 1677d0d7bcdfSJung-uk Kim * Get packet timestamp format and resolution. 1678547d94bdSJung-uk Kim */ 1679547d94bdSJung-uk Kim case BIOCGTSTAMP: 168097aacec6SAlexander V. Chernikov BPFD_LOCK(d); 1681547d94bdSJung-uk Kim *(u_int *)addr = d->bd_tstamp; 168297aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 1683547d94bdSJung-uk Kim break; 1684547d94bdSJung-uk Kim 1685547d94bdSJung-uk Kim /* 1686547d94bdSJung-uk Kim * Set packet timestamp format and resolution. 
1687547d94bdSJung-uk Kim */ 1688547d94bdSJung-uk Kim case BIOCSTSTAMP: 1689547d94bdSJung-uk Kim { 1690547d94bdSJung-uk Kim u_int func; 1691547d94bdSJung-uk Kim 1692547d94bdSJung-uk Kim func = *(u_int *)addr; 1693547d94bdSJung-uk Kim if (BPF_T_VALID(func)) 1694547d94bdSJung-uk Kim d->bd_tstamp = func; 1695547d94bdSJung-uk Kim else 1696547d94bdSJung-uk Kim error = EINVAL; 1697547d94bdSJung-uk Kim } 1698547d94bdSJung-uk Kim break; 1699547d94bdSJung-uk Kim 1700560a54e1SJung-uk Kim case BIOCFEEDBACK: 170197aacec6SAlexander V. Chernikov BPFD_LOCK(d); 1702560a54e1SJung-uk Kim d->bd_feedback = *(u_int *)addr; 170397aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 1704560a54e1SJung-uk Kim break; 1705560a54e1SJung-uk Kim 1706560a54e1SJung-uk Kim case BIOCLOCK: 170797aacec6SAlexander V. Chernikov BPFD_LOCK(d); 1708560a54e1SJung-uk Kim d->bd_locked = 1; 170997aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 17108ed3828cSRobert Watson break; 17118ed3828cSRobert Watson 171200a83887SPaul Traina case FIONBIO: /* Non-blocking I/O */ 171300a83887SPaul Traina break; 171400a83887SPaul Traina 171500a83887SPaul Traina case FIOASYNC: /* Send signal on receive packets */ 171697aacec6SAlexander V. Chernikov BPFD_LOCK(d); 171700a83887SPaul Traina d->bd_async = *(int *)addr; 171897aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 171900a83887SPaul Traina break; 172000a83887SPaul Traina 1721831d27a9SDon Lewis case FIOSETOWN: 172297aacec6SAlexander V. Chernikov /* 172397aacec6SAlexander V. Chernikov * XXX: Add some sort of locking here? 172497aacec6SAlexander V. Chernikov * fsetown() can sleep. 172597aacec6SAlexander V. Chernikov */ 1726831d27a9SDon Lewis error = fsetown(*(int *)addr, &d->bd_sigio); 172700a83887SPaul Traina break; 172800a83887SPaul Traina 1729831d27a9SDon Lewis case FIOGETOWN: 173097aacec6SAlexander V. Chernikov BPFD_LOCK(d); 173191e97a82SDon Lewis *(int *)addr = fgetown(&d->bd_sigio); 173297aacec6SAlexander V. 
Chernikov BPFD_UNLOCK(d); 1733831d27a9SDon Lewis break; 1734831d27a9SDon Lewis 1735831d27a9SDon Lewis /* This is deprecated, FIOSETOWN should be used instead. */ 1736831d27a9SDon Lewis case TIOCSPGRP: 1737831d27a9SDon Lewis error = fsetown(-(*(int *)addr), &d->bd_sigio); 1738831d27a9SDon Lewis break; 1739831d27a9SDon Lewis 1740831d27a9SDon Lewis /* This is deprecated, FIOGETOWN should be used instead. */ 174100a83887SPaul Traina case TIOCGPGRP: 174291e97a82SDon Lewis *(int *)addr = -fgetown(&d->bd_sigio); 174300a83887SPaul Traina break; 174400a83887SPaul Traina 174500a83887SPaul Traina case BIOCSRSIG: /* Set receive signal */ 174600a83887SPaul Traina { 174700a83887SPaul Traina u_int sig; 174800a83887SPaul Traina 174900a83887SPaul Traina sig = *(u_int *)addr; 175000a83887SPaul Traina 175100a83887SPaul Traina if (sig >= NSIG) 175200a83887SPaul Traina error = EINVAL; 175397aacec6SAlexander V. Chernikov else { 175497aacec6SAlexander V. Chernikov BPFD_LOCK(d); 175500a83887SPaul Traina d->bd_sig = sig; 175697aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 175797aacec6SAlexander V. Chernikov } 175800a83887SPaul Traina break; 175900a83887SPaul Traina } 176000a83887SPaul Traina case BIOCGRSIG: 176197aacec6SAlexander V. Chernikov BPFD_LOCK(d); 176200a83887SPaul Traina *(u_int *)addr = d->bd_sig; 176397aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 176400a83887SPaul Traina break; 17654d621040SChristian S.J. Peron 17664d621040SChristian S.J. Peron case BIOCGETBUFMODE: 176797aacec6SAlexander V. Chernikov BPFD_LOCK(d); 17684d621040SChristian S.J. Peron *(u_int *)addr = d->bd_bufmode; 176997aacec6SAlexander V. Chernikov BPFD_UNLOCK(d); 17704d621040SChristian S.J. Peron break; 17714d621040SChristian S.J. Peron 17724d621040SChristian S.J. Peron case BIOCSETBUFMODE: 17734d621040SChristian S.J. Peron /* 17744d621040SChristian S.J. Peron * Allow the buffering mode to be changed as long as we 17754d621040SChristian S.J. Peron * haven't yet committed to a particular mode. 
Our 17764d621040SChristian S.J. Peron * definition of commitment, for now, is whether or not a 17774d621040SChristian S.J. Peron * buffer has been allocated or an interface attached, since 17784d621040SChristian S.J. Peron * that's the point where things get tricky. 17794d621040SChristian S.J. Peron */ 17804d621040SChristian S.J. Peron switch (*(u_int *)addr) { 17814d621040SChristian S.J. Peron case BPF_BUFMODE_BUFFER: 17824d621040SChristian S.J. Peron break; 17834d621040SChristian S.J. Peron 17844d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 17854d621040SChristian S.J. Peron if (bpf_zerocopy_enable) 17864d621040SChristian S.J. Peron break; 17874d621040SChristian S.J. Peron /* FALLSTHROUGH */ 17884d621040SChristian S.J. Peron 17894d621040SChristian S.J. Peron default: 17901b610a74SBjoern A. Zeeb CURVNET_RESTORE(); 17914d621040SChristian S.J. Peron return (EINVAL); 17924d621040SChristian S.J. Peron } 17934d621040SChristian S.J. Peron 1794afa85850SAlexander V. Chernikov BPFD_LOCK(d); 17954d621040SChristian S.J. Peron if (d->bd_sbuf != NULL || d->bd_hbuf != NULL || 17964d621040SChristian S.J. Peron d->bd_fbuf != NULL || d->bd_bif != NULL) { 1797afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 17981b610a74SBjoern A. Zeeb CURVNET_RESTORE(); 17994d621040SChristian S.J. Peron return (EBUSY); 18004d621040SChristian S.J. Peron } 18014d621040SChristian S.J. Peron d->bd_bufmode = *(u_int *)addr; 1802afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 18034d621040SChristian S.J. Peron break; 18044d621040SChristian S.J. Peron 18054d621040SChristian S.J. Peron case BIOCGETZMAX: 18061b610a74SBjoern A. Zeeb error = bpf_ioctl_getzmax(td, d, (size_t *)addr); 18071b610a74SBjoern A. Zeeb break; 18084d621040SChristian S.J. Peron 18094d621040SChristian S.J. Peron case BIOCSETZBUF: 18101b610a74SBjoern A. Zeeb error = bpf_ioctl_setzbuf(td, d, (struct bpf_zbuf *)addr); 18111b610a74SBjoern A. Zeeb break; 18124d621040SChristian S.J. Peron 18134d621040SChristian S.J. 
Peron case BIOCROTZBUF: 18141b610a74SBjoern A. Zeeb error = bpf_ioctl_rotzbuf(td, d, (struct bpf_zbuf *)addr); 18151b610a74SBjoern A. Zeeb break; 1816df8bae1dSRodney W. Grimes } 181797021c24SMarko Zec CURVNET_RESTORE(); 1818df8bae1dSRodney W. Grimes return (error); 1819df8bae1dSRodney W. Grimes } 1820df8bae1dSRodney W. Grimes 1821df8bae1dSRodney W. Grimes /* 1822df8bae1dSRodney W. Grimes * Set d's packet filter program to fp. If this file already has a filter, 1823df8bae1dSRodney W. Grimes * free it and replace it. Returns EINVAL for bogus requests. 1824784292f8SAlexander V. Chernikov * 1825784292f8SAlexander V. Chernikov * Note we need global lock here to serialize bpf_setf() and bpf_setif() calls 1826784292f8SAlexander V. Chernikov * since reading d->bd_bif can't be protected by d or interface lock due to 1827784292f8SAlexander V. Chernikov * lock order. 1828784292f8SAlexander V. Chernikov * 1829784292f8SAlexander V. Chernikov * Additionally, we have to acquire interface write lock due to bpf_mtap() uses 1830784292f8SAlexander V. Chernikov * interface read lock to read all filers. 1831784292f8SAlexander V. Chernikov * 1832df8bae1dSRodney W. Grimes */ 1833f708ef1bSPoul-Henning Kamp static int 183419ba8395SChristian S.J. Peron bpf_setf(struct bpf_d *d, struct bpf_program *fp, u_long cmd) 1835df8bae1dSRodney W. Grimes { 18369b7d4a7fSJung-uk Kim #ifdef COMPAT_FREEBSD32 18379b7d4a7fSJung-uk Kim struct bpf_program fp_swab; 18389b7d4a7fSJung-uk Kim struct bpf_program32 *fp32; 18399b7d4a7fSJung-uk Kim #endif 1840df8bae1dSRodney W. Grimes struct bpf_insn *fcode, *old; 1841293c06a1SRuslan Ermilov #ifdef BPF_JITTER 1842a86227d1SAlexander V. Chernikov bpf_jit_filter *jfunc, *ofunc; 1843ae275efcSJung-uk Kim #endif 18448b04b48aSJung-uk Kim size_t size; 18458b04b48aSJung-uk Kim u_int flen; 18469431cc16SAlexander V. Chernikov int need_upgrade; 1847df8bae1dSRodney W. 
Grimes 18489b7d4a7fSJung-uk Kim #ifdef COMPAT_FREEBSD32 18496f731135SJung-uk Kim switch (cmd) { 18506f731135SJung-uk Kim case BIOCSETF32: 18516f731135SJung-uk Kim case BIOCSETWF32: 18526f731135SJung-uk Kim case BIOCSETFNR32: 1853fc0a61a4SKonstantin Belousov fp32 = (struct bpf_program32 *)fp; 1854fc0a61a4SKonstantin Belousov fp_swab.bf_len = fp32->bf_len; 1855fc0a61a4SKonstantin Belousov fp_swab.bf_insns = (struct bpf_insn *)(uintptr_t)fp32->bf_insns; 1856fc0a61a4SKonstantin Belousov fp = &fp_swab; 18576f731135SJung-uk Kim switch (cmd) { 18586f731135SJung-uk Kim case BIOCSETF32: 18596f731135SJung-uk Kim cmd = BIOCSETF; 18606f731135SJung-uk Kim break; 18616f731135SJung-uk Kim case BIOCSETWF32: 1862fc0a61a4SKonstantin Belousov cmd = BIOCSETWF; 18636f731135SJung-uk Kim break; 18646f731135SJung-uk Kim } 18656f731135SJung-uk Kim break; 1866fc0a61a4SKonstantin Belousov } 1867fc0a61a4SKonstantin Belousov #endif 18688b04b48aSJung-uk Kim 18698b04b48aSJung-uk Kim fcode = NULL; 18708b04b48aSJung-uk Kim #ifdef BPF_JITTER 18718b04b48aSJung-uk Kim jfunc = ofunc = NULL; 18728b04b48aSJung-uk Kim #endif 18739b7d4a7fSJung-uk Kim need_upgrade = 0; 18748b04b48aSJung-uk Kim 18756c74ff0eSAlexander V. Chernikov /* 18766c74ff0eSAlexander V. Chernikov * Check new filter validness before acquiring any locks. 18776c74ff0eSAlexander V. Chernikov * Allocate memory for new filter, if needed. 18786c74ff0eSAlexander V. Chernikov */ 18796c74ff0eSAlexander V. Chernikov flen = fp->bf_len; 18809b7d4a7fSJung-uk Kim if (flen > bpf_maxinsns || (fp->bf_insns == NULL && flen != 0)) 18816c74ff0eSAlexander V. Chernikov return (EINVAL); 18826c74ff0eSAlexander V. Chernikov size = flen * sizeof(*fp->bf_insns); 1883a86227d1SAlexander V. Chernikov if (size > 0) { 18849b7d4a7fSJung-uk Kim /* We're setting up new filter. Copy and check actual data. 
*/ 18859b7d4a7fSJung-uk Kim fcode = malloc(size, M_BPF, M_WAITOK); 18869b7d4a7fSJung-uk Kim if (copyin(fp->bf_insns, fcode, size) != 0 || 18879b7d4a7fSJung-uk Kim !bpf_validate(fcode, flen)) { 1888a86227d1SAlexander V. Chernikov free(fcode, M_BPF); 1889a86227d1SAlexander V. Chernikov return (EINVAL); 1890a86227d1SAlexander V. Chernikov } 1891c7b0200eSAlexander V. Chernikov #ifdef BPF_JITTER 18929b7d4a7fSJung-uk Kim /* Filter is copied inside fcode and is perfectly valid. */ 1893c7b0200eSAlexander V. Chernikov jfunc = bpf_jitter(fcode, flen); 1894c7b0200eSAlexander V. Chernikov #endif 18958b04b48aSJung-uk Kim } 1896c7b0200eSAlexander V. Chernikov 18976c74ff0eSAlexander V. Chernikov BPF_LOCK(); 18986c74ff0eSAlexander V. Chernikov 1899e4b3229aSAlexander V. Chernikov /* 1900a86227d1SAlexander V. Chernikov * Set up new filter. 19019b7d4a7fSJung-uk Kim * Protect filter change by interface lock. 19026c74ff0eSAlexander V. Chernikov * Additionally, we are protected by global lock here. 1903e4b3229aSAlexander V. Chernikov */ 19046c74ff0eSAlexander V. Chernikov if (d->bd_bif != NULL) 1905e4b3229aSAlexander V. Chernikov BPFIF_WLOCK(d->bd_bif); 1906afa85850SAlexander V. Chernikov BPFD_LOCK(d); 19078b04b48aSJung-uk Kim if (cmd == BIOCSETWF) { 19088b04b48aSJung-uk Kim old = d->bd_wfilter; 190993e39f0bSChristian S.J. Peron d->bd_wfilter = fcode; 19108b04b48aSJung-uk Kim } else { 19118b04b48aSJung-uk Kim old = d->bd_rfilter; 191293e39f0bSChristian S.J. Peron d->bd_rfilter = fcode; 1913293c06a1SRuslan Ermilov #ifdef BPF_JITTER 19148b04b48aSJung-uk Kim ofunc = d->bd_bfilter; 1915c7b0200eSAlexander V. Chernikov d->bd_bfilter = jfunc; 1916ae275efcSJung-uk Kim #endif 1917f11c3508SDavid Malone if (cmd == BIOCSETF) 1918df8bae1dSRodney W. Grimes reset_d(d); 191951ec1eb7SAlexander V. Chernikov 1920402000ffSAlexander V. Chernikov need_upgrade = bpf_check_upgrade(cmd, d, fcode, flen); 19218b04b48aSJung-uk Kim } 1922afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 19236c74ff0eSAlexander V. 
Chernikov if (d->bd_bif != NULL) 1924e4b3229aSAlexander V. Chernikov BPFIF_WUNLOCK(d->bd_bif); 1925572bde2aSRobert Watson if (old != NULL) 19269b7d4a7fSJung-uk Kim free(old, M_BPF); 1927293c06a1SRuslan Ermilov #ifdef BPF_JITTER 1928ae275efcSJung-uk Kim if (ofunc != NULL) 1929ae275efcSJung-uk Kim bpf_destroy_jit_filter(ofunc); 1930ae275efcSJung-uk Kim #endif 1931df8bae1dSRodney W. Grimes 19329b7d4a7fSJung-uk Kim /* Move d to active readers list. */ 1933402000ffSAlexander V. Chernikov if (need_upgrade != 0) 193451ec1eb7SAlexander V. Chernikov bpf_upgraded(d); 193551ec1eb7SAlexander V. Chernikov 19366c74ff0eSAlexander V. Chernikov BPF_UNLOCK(); 1937df8bae1dSRodney W. Grimes return (0); 1938df8bae1dSRodney W. Grimes } 1939df8bae1dSRodney W. Grimes 1940df8bae1dSRodney W. Grimes /* 1941df8bae1dSRodney W. Grimes * Detach a file from its current interface (if attached at all) and attach 1942df8bae1dSRodney W. Grimes * to the interface indicated by the name stored in ifr. 1943df8bae1dSRodney W. Grimes * Return an errno or 0. 1944df8bae1dSRodney W. Grimes */ 1945df8bae1dSRodney W. Grimes static int 194619ba8395SChristian S.J. Peron bpf_setif(struct bpf_d *d, struct ifreq *ifr) 1947df8bae1dSRodney W. Grimes { 1948df8bae1dSRodney W. Grimes struct bpf_if *bp; 19499b44ff22SGarrett Wollman struct ifnet *theywant; 1950df8bae1dSRodney W. Grimes 19516c74ff0eSAlexander V. Chernikov BPF_LOCK_ASSERT(); 19526c74ff0eSAlexander V. Chernikov 19539b44ff22SGarrett Wollman theywant = ifunit(ifr->ifr_name); 195416d878ccSChristian S.J. Peron if (theywant == NULL || theywant->if_bpf == NULL) 195516d878ccSChristian S.J. Peron return (ENXIO); 19569b44ff22SGarrett Wollman 195716d878ccSChristian S.J. Peron bp = theywant->if_bpf; 19584d621040SChristian S.J. Peron 1959afa85850SAlexander V. Chernikov /* Check if interface is not being detached from BPF */ 1960afa85850SAlexander V. Chernikov BPFIF_RLOCK(bp); 1961b23cbbe6SMark Johnston if (bp->bif_flags & BPFIF_FLAG_DYING) { 1962afa85850SAlexander V. 
Chernikov BPFIF_RUNLOCK(bp); 1963afa85850SAlexander V. Chernikov return (ENXIO); 1964afa85850SAlexander V. Chernikov } 1965afa85850SAlexander V. Chernikov BPFIF_RUNLOCK(bp); 1966afa85850SAlexander V. Chernikov 1967df8bae1dSRodney W. Grimes /* 19684f42daa4SLuiz Otavio O Souza * At this point, we expect the buffer is already allocated. If not, 19694f42daa4SLuiz Otavio O Souza * return an error. 1970df8bae1dSRodney W. Grimes */ 19714d621040SChristian S.J. Peron switch (d->bd_bufmode) { 19724d621040SChristian S.J. Peron case BPF_BUFMODE_BUFFER: 19734d621040SChristian S.J. Peron case BPF_BUFMODE_ZBUF: 19744d621040SChristian S.J. Peron if (d->bd_sbuf == NULL) 19754d621040SChristian S.J. Peron return (EINVAL); 19764d621040SChristian S.J. Peron break; 19774d621040SChristian S.J. Peron 19784d621040SChristian S.J. Peron default: 19794d621040SChristian S.J. Peron panic("bpf_setif: bufmode %d", d->bd_bufmode); 19804d621040SChristian S.J. Peron } 19816c74ff0eSAlexander V. Chernikov if (bp != d->bd_bif) 1982df8bae1dSRodney W. Grimes bpf_attachd(d, bp); 1983afa85850SAlexander V. Chernikov BPFD_LOCK(d); 1984df8bae1dSRodney W. Grimes reset_d(d); 1985afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 1986df8bae1dSRodney W. Grimes return (0); 1987df8bae1dSRodney W. Grimes } 1988df8bae1dSRodney W. Grimes 1989df8bae1dSRodney W. Grimes /* 1990243ac7d8SPeter Wemm * Support for select() and poll() system calls 1991df8bae1dSRodney W. Grimes * 1992df8bae1dSRodney W. Grimes * Return true iff the specific operation will not block indefinitely. 1993df8bae1dSRodney W. Grimes * Otherwise, return false but make a note that a selwakeup() must be done. 1994df8bae1dSRodney W. Grimes */ 199537c84183SPoul-Henning Kamp static int 199619ba8395SChristian S.J. Peron bpfpoll(struct cdev *dev, int events, struct thread *td) 1997df8bae1dSRodney W. Grimes { 1998e7bb21b3SJonathan Lemon struct bpf_d *d; 19990832fc64SGarance A Drosehn int revents; 2000df8bae1dSRodney W. 
Grimes 2001136600feSEd Schouten if (devfs_get_cdevpriv((void **)&d) != 0 || d->bd_bif == NULL) 2002136600feSEd Schouten return (events & 2003136600feSEd Schouten (POLLHUP|POLLIN|POLLRDNORM|POLLOUT|POLLWRNORM)); 2004de5d9935SRobert Watson 2005b75a24a0SChristian S.J. Peron /* 2006b75a24a0SChristian S.J. Peron * Refresh PID associated with this descriptor. 2007b75a24a0SChristian S.J. Peron */ 20080832fc64SGarance A Drosehn revents = events & (POLLOUT | POLLWRNORM); 2009afa85850SAlexander V. Chernikov BPFD_LOCK(d); 2010e4b3229aSAlexander V. Chernikov BPF_PID_REFRESH(d, td); 201175c13541SPoul-Henning Kamp if (events & (POLLIN | POLLRDNORM)) { 201295aab9ccSJohn-Mark Gurney if (bpf_ready(d)) 2013243ac7d8SPeter Wemm revents |= events & (POLLIN | POLLRDNORM); 201481bda851SJohn Polstra else { 2015ed01445dSJohn Baldwin selrecord(td, &d->bd_sel); 201681bda851SJohn Polstra /* Start the read timeout if necessary. */ 201781bda851SJohn Polstra if (d->bd_rtout > 0 && d->bd_state == BPF_IDLE) { 201881bda851SJohn Polstra callout_reset(&d->bd_callout, d->bd_rtout, 201981bda851SJohn Polstra bpf_timed_out, d); 202081bda851SJohn Polstra d->bd_state = BPF_WAITING; 202181bda851SJohn Polstra } 202281bda851SJohn Polstra } 202375c13541SPoul-Henning Kamp } 2024afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 2025243ac7d8SPeter Wemm return (revents); 2026df8bae1dSRodney W. Grimes } 2027df8bae1dSRodney W. Grimes 2028df8bae1dSRodney W. Grimes /* 202995aab9ccSJohn-Mark Gurney * Support for kevent() system call. Register EVFILT_READ filters and 203095aab9ccSJohn-Mark Gurney * reject all others. 203195aab9ccSJohn-Mark Gurney */ 203295aab9ccSJohn-Mark Gurney int 203319ba8395SChristian S.J. 
Peron bpfkqfilter(struct cdev *dev, struct knote *kn) 203495aab9ccSJohn-Mark Gurney { 2035136600feSEd Schouten struct bpf_d *d; 203695aab9ccSJohn-Mark Gurney 2037136600feSEd Schouten if (devfs_get_cdevpriv((void **)&d) != 0 || 2038136600feSEd Schouten kn->kn_filter != EVFILT_READ) 203995aab9ccSJohn-Mark Gurney return (1); 204095aab9ccSJohn-Mark Gurney 2041b75a24a0SChristian S.J. Peron /* 2042b75a24a0SChristian S.J. Peron * Refresh PID associated with this descriptor. 2043b75a24a0SChristian S.J. Peron */ 2044afa85850SAlexander V. Chernikov BPFD_LOCK(d); 2045e4b3229aSAlexander V. Chernikov BPF_PID_REFRESH_CUR(d); 204695aab9ccSJohn-Mark Gurney kn->kn_fop = &bpfread_filtops; 204795aab9ccSJohn-Mark Gurney kn->kn_hook = d; 20484b19419eSChristian S.J. Peron knlist_add(&d->bd_sel.si_note, kn, 1); 2049afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 205095aab9ccSJohn-Mark Gurney 205195aab9ccSJohn-Mark Gurney return (0); 205295aab9ccSJohn-Mark Gurney } 205395aab9ccSJohn-Mark Gurney 205495aab9ccSJohn-Mark Gurney static void 205519ba8395SChristian S.J. Peron filt_bpfdetach(struct knote *kn) 205695aab9ccSJohn-Mark Gurney { 205795aab9ccSJohn-Mark Gurney struct bpf_d *d = (struct bpf_d *)kn->kn_hook; 205895aab9ccSJohn-Mark Gurney 2059ad3b9257SJohn-Mark Gurney knlist_remove(&d->bd_sel.si_note, kn, 0); 206095aab9ccSJohn-Mark Gurney } 206195aab9ccSJohn-Mark Gurney 206295aab9ccSJohn-Mark Gurney static int 206319ba8395SChristian S.J. Peron filt_bpfread(struct knote *kn, long hint) 206495aab9ccSJohn-Mark Gurney { 206595aab9ccSJohn-Mark Gurney struct bpf_d *d = (struct bpf_d *)kn->kn_hook; 206695aab9ccSJohn-Mark Gurney int ready; 206795aab9ccSJohn-Mark Gurney 2068afa85850SAlexander V. 
Chernikov BPFD_LOCK_ASSERT(d); 206995aab9ccSJohn-Mark Gurney ready = bpf_ready(d); 207095aab9ccSJohn-Mark Gurney if (ready) { 207195aab9ccSJohn-Mark Gurney kn->kn_data = d->bd_slen; 207292242172SLuiz Otavio O Souza /* 207392242172SLuiz Otavio O Souza * Ignore the hold buffer if it is being copied to user space. 207492242172SLuiz Otavio O Souza */ 207592242172SLuiz Otavio O Souza if (!d->bd_hbuf_in_use && d->bd_hbuf) 207695aab9ccSJohn-Mark Gurney kn->kn_data += d->bd_hlen; 20775d7af3a1SJung-uk Kim } else if (d->bd_rtout > 0 && d->bd_state == BPF_IDLE) { 207895aab9ccSJohn-Mark Gurney callout_reset(&d->bd_callout, d->bd_rtout, 207995aab9ccSJohn-Mark Gurney bpf_timed_out, d); 208095aab9ccSJohn-Mark Gurney d->bd_state = BPF_WAITING; 208195aab9ccSJohn-Mark Gurney } 208295aab9ccSJohn-Mark Gurney 208395aab9ccSJohn-Mark Gurney return (ready); 208495aab9ccSJohn-Mark Gurney } 208595aab9ccSJohn-Mark Gurney 2086253a3814SLawrence Stewart #define BPF_TSTAMP_NONE 0 2087253a3814SLawrence Stewart #define BPF_TSTAMP_FAST 1 2088253a3814SLawrence Stewart #define BPF_TSTAMP_NORMAL 2 2089253a3814SLawrence Stewart #define BPF_TSTAMP_EXTERN 3 2090253a3814SLawrence Stewart 2091253a3814SLawrence Stewart static int 2092253a3814SLawrence Stewart bpf_ts_quality(int tstype) 2093253a3814SLawrence Stewart { 2094253a3814SLawrence Stewart 2095253a3814SLawrence Stewart if (tstype == BPF_T_NONE) 2096253a3814SLawrence Stewart return (BPF_TSTAMP_NONE); 2097253a3814SLawrence Stewart if ((tstype & BPF_T_FAST) != 0) 2098253a3814SLawrence Stewart return (BPF_TSTAMP_FAST); 2099253a3814SLawrence Stewart 2100253a3814SLawrence Stewart return (BPF_TSTAMP_NORMAL); 2101253a3814SLawrence Stewart } 2102253a3814SLawrence Stewart 2103253a3814SLawrence Stewart static int 2104253a3814SLawrence Stewart bpf_gettime(struct bintime *bt, int tstype, struct mbuf *m) 2105253a3814SLawrence Stewart { 2106253a3814SLawrence Stewart struct m_tag *tag; 2107253a3814SLawrence Stewart int quality; 2108253a3814SLawrence Stewart 
2109253a3814SLawrence Stewart quality = bpf_ts_quality(tstype); 2110253a3814SLawrence Stewart if (quality == BPF_TSTAMP_NONE) 2111253a3814SLawrence Stewart return (quality); 2112253a3814SLawrence Stewart 2113253a3814SLawrence Stewart if (m != NULL) { 2114253a3814SLawrence Stewart tag = m_tag_locate(m, MTAG_BPF, MTAG_BPF_TIMESTAMP, NULL); 2115253a3814SLawrence Stewart if (tag != NULL) { 2116253a3814SLawrence Stewart *bt = *(struct bintime *)(tag + 1); 2117253a3814SLawrence Stewart return (BPF_TSTAMP_EXTERN); 2118253a3814SLawrence Stewart } 2119253a3814SLawrence Stewart } 2120253a3814SLawrence Stewart if (quality == BPF_TSTAMP_NORMAL) 2121253a3814SLawrence Stewart binuptime(bt); 2122253a3814SLawrence Stewart else 2123253a3814SLawrence Stewart getbinuptime(bt); 2124253a3814SLawrence Stewart 2125253a3814SLawrence Stewart return (quality); 2126253a3814SLawrence Stewart } 2127253a3814SLawrence Stewart 212895aab9ccSJohn-Mark Gurney /* 2129df8bae1dSRodney W. Grimes * Incoming linkage from device drivers. Process the packet pkt, of length 2130df8bae1dSRodney W. Grimes * pktlen, which is stored in a contiguous buffer. The packet is parsed 2131df8bae1dSRodney W. Grimes * by each process' filter, and if accepted, stashed into the corresponding 2132df8bae1dSRodney W. Grimes * buffer. 2133df8bae1dSRodney W. Grimes */ 2134df8bae1dSRodney W. Grimes void 213519ba8395SChristian S.J. Peron bpf_tap(struct bpf_if *bp, u_char *pkt, u_int pktlen) 2136df8bae1dSRodney W. Grimes { 2137547d94bdSJung-uk Kim struct bintime bt; 21388994a245SDag-Erling Smørgrav struct bpf_d *d; 2139a36599ccSJung-uk Kim #ifdef BPF_JITTER 2140a36599ccSJung-uk Kim bpf_jit_filter *bf; 2141a36599ccSJung-uk Kim #endif 2142253a3814SLawrence Stewart u_int slen; 2143253a3814SLawrence Stewart int gottime; 2144e7bb21b3SJonathan Lemon 2145253a3814SLawrence Stewart gottime = BPF_TSTAMP_NONE; 2146e4b3229aSAlexander V. Chernikov 2147e4b3229aSAlexander V. Chernikov BPFIF_RLOCK(bp); 2148e4b3229aSAlexander V. 
Chernikov 21494a3feeaaSRobert Watson LIST_FOREACH(d, &bp->bif_dlist, bd_next) { 2150e4b3229aSAlexander V. Chernikov /* 2151e4b3229aSAlexander V. Chernikov * We are not using any locks for d here because: 2152e4b3229aSAlexander V. Chernikov * 1) any filter change is protected by interface 2153e4b3229aSAlexander V. Chernikov * write lock 2154e4b3229aSAlexander V. Chernikov * 2) destroying/detaching d is protected by interface 2155e4b3229aSAlexander V. Chernikov * write lock, too 2156e4b3229aSAlexander V. Chernikov */ 2157e4b3229aSAlexander V. Chernikov 2158*b2b7ca49SAlexander V. Chernikov counter_u64_add(d->bd_rcount, 1); 2159a05cf8c6SChristian S.J. Peron /* 2160a05cf8c6SChristian S.J. Peron * NB: We dont call BPF_CHECK_DIRECTION() here since there is no 2161a05cf8c6SChristian S.J. Peron * way for the caller to indiciate to us whether this packet 2162a05cf8c6SChristian S.J. Peron * is inbound or outbound. In the bpf_mtap() routines, we use 2163a05cf8c6SChristian S.J. Peron * the interface pointers on the mbuf to figure it out. 2164a05cf8c6SChristian S.J. Peron */ 2165ae275efcSJung-uk Kim #ifdef BPF_JITTER 2166a36599ccSJung-uk Kim bf = bpf_jitter_enable != 0 ? d->bd_bfilter : NULL; 2167a36599ccSJung-uk Kim if (bf != NULL) 2168a36599ccSJung-uk Kim slen = (*(bf->func))(pkt, pktlen, pktlen); 2169ae275efcSJung-uk Kim else 2170ae275efcSJung-uk Kim #endif 217193e39f0bSChristian S.J. Peron slen = bpf_filter(d->bd_rfilter, pkt, pktlen, pktlen); 2172ec272d87SRobert Watson if (slen != 0) { 2173e4b3229aSAlexander V. Chernikov /* 2174e4b3229aSAlexander V. Chernikov * Filter matches. Let's to acquire write lock. 2175e4b3229aSAlexander V. Chernikov */ 2176afa85850SAlexander V. Chernikov BPFD_LOCK(d); 2177e4b3229aSAlexander V. Chernikov 2178*b2b7ca49SAlexander V. 
Chernikov counter_u64_add(d->bd_fcount, 1); 2179253a3814SLawrence Stewart if (gottime < bpf_ts_quality(d->bd_tstamp)) 2180253a3814SLawrence Stewart gottime = bpf_gettime(&bt, d->bd_tstamp, NULL); 2181ec272d87SRobert Watson #ifdef MAC 218230d239bcSRobert Watson if (mac_bpfdesc_check_receive(d, bp->bif_ifp) == 0) 2183ec272d87SRobert Watson #endif 21844d621040SChristian S.J. Peron catchpacket(d, pkt, pktlen, slen, 2185547d94bdSJung-uk Kim bpf_append_bytes, &bt); 2186afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 2187ec272d87SRobert Watson } 2188df8bae1dSRodney W. Grimes } 2189e4b3229aSAlexander V. Chernikov BPFIF_RUNLOCK(bp); 2190df8bae1dSRodney W. Grimes } 2191df8bae1dSRodney W. Grimes 2192f81a2a49SJung-uk Kim #define BPF_CHECK_DIRECTION(d, r, i) \ 2193f81a2a49SJung-uk Kim (((d)->bd_direction == BPF_D_IN && (r) != (i)) || \ 2194f81a2a49SJung-uk Kim ((d)->bd_direction == BPF_D_OUT && (r) == (i))) 2195560a54e1SJung-uk Kim 2196df8bae1dSRodney W. Grimes /* 2197df8bae1dSRodney W. Grimes * Incoming linkage from device drivers, when packet is in an mbuf chain. 2198e4b3229aSAlexander V. Chernikov * Locking model is explained in bpf_tap(). 2199df8bae1dSRodney W. Grimes */ 2200df8bae1dSRodney W. Grimes void 220119ba8395SChristian S.J. Peron bpf_mtap(struct bpf_if *bp, struct mbuf *m) 2202df8bae1dSRodney W. Grimes { 2203547d94bdSJung-uk Kim struct bintime bt; 2204df8bae1dSRodney W. Grimes struct bpf_d *d; 2205a36599ccSJung-uk Kim #ifdef BPF_JITTER 2206a36599ccSJung-uk Kim bpf_jit_filter *bf; 2207a36599ccSJung-uk Kim #endif 2208253a3814SLawrence Stewart u_int pktlen, slen; 2209253a3814SLawrence Stewart int gottime; 221091433904SDavid Malone 22118cd892f7SJung-uk Kim /* Skip outgoing duplicate packets. 
*/ 22128cd892f7SJung-uk Kim if ((m->m_flags & M_PROMISC) != 0 && m->m_pkthdr.rcvif == NULL) { 22138cd892f7SJung-uk Kim m->m_flags &= ~M_PROMISC; 22148cd892f7SJung-uk Kim return; 22158cd892f7SJung-uk Kim } 22168cd892f7SJung-uk Kim 2217f0e2422bSPoul-Henning Kamp pktlen = m_length(m, NULL); 2218253a3814SLawrence Stewart gottime = BPF_TSTAMP_NONE; 2219e4b3229aSAlexander V. Chernikov 2220e4b3229aSAlexander V. Chernikov BPFIF_RLOCK(bp); 2221e4b3229aSAlexander V. Chernikov 22224a3feeaaSRobert Watson LIST_FOREACH(d, &bp->bif_dlist, bd_next) { 2223f81a2a49SJung-uk Kim if (BPF_CHECK_DIRECTION(d, m->m_pkthdr.rcvif, bp->bif_ifp)) 22248ed3828cSRobert Watson continue; 2225*b2b7ca49SAlexander V. Chernikov counter_u64_add(d->bd_rcount, 1); 2226ae275efcSJung-uk Kim #ifdef BPF_JITTER 2227a36599ccSJung-uk Kim bf = bpf_jitter_enable != 0 ? d->bd_bfilter : NULL; 2228ae275efcSJung-uk Kim /* XXX We cannot handle multiple mbufs. */ 2229a36599ccSJung-uk Kim if (bf != NULL && m->m_next == NULL) 2230a36599ccSJung-uk Kim slen = (*(bf->func))(mtod(m, u_char *), pktlen, pktlen); 2231ae275efcSJung-uk Kim else 2232ae275efcSJung-uk Kim #endif 223393e39f0bSChristian S.J. Peron slen = bpf_filter(d->bd_rfilter, (u_char *)m, pktlen, 0); 22344ddfb531SChristian S.J. Peron if (slen != 0) { 2235afa85850SAlexander V. Chernikov BPFD_LOCK(d); 2236e4b3229aSAlexander V. Chernikov 2237*b2b7ca49SAlexander V. Chernikov counter_u64_add(d->bd_fcount, 1); 2238253a3814SLawrence Stewart if (gottime < bpf_ts_quality(d->bd_tstamp)) 2239253a3814SLawrence Stewart gottime = bpf_gettime(&bt, d->bd_tstamp, m); 22400c7fb534SRobert Watson #ifdef MAC 224130d239bcSRobert Watson if (mac_bpfdesc_check_receive(d, bp->bif_ifp) == 0) 22420c7fb534SRobert Watson #endif 22430c7fb534SRobert Watson catchpacket(d, (u_char *)m, pktlen, slen, 2244547d94bdSJung-uk Kim bpf_append_mbuf, &bt); 2245afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 22464ddfb531SChristian S.J. Peron } 2247df8bae1dSRodney W. Grimes } 2248e4b3229aSAlexander V. 
Chernikov BPFIF_RUNLOCK(bp); 2249df8bae1dSRodney W. Grimes } 2250df8bae1dSRodney W. Grimes 2251df8bae1dSRodney W. Grimes /* 2252437ffe18SSam Leffler * Incoming linkage from device drivers, when packet is in 2253437ffe18SSam Leffler * an mbuf chain and to be prepended by a contiguous header. 2254437ffe18SSam Leffler */ 2255437ffe18SSam Leffler void 225619ba8395SChristian S.J. Peron bpf_mtap2(struct bpf_if *bp, void *data, u_int dlen, struct mbuf *m) 2257437ffe18SSam Leffler { 2258547d94bdSJung-uk Kim struct bintime bt; 2259437ffe18SSam Leffler struct mbuf mb; 2260437ffe18SSam Leffler struct bpf_d *d; 2261253a3814SLawrence Stewart u_int pktlen, slen; 2262253a3814SLawrence Stewart int gottime; 226391433904SDavid Malone 22648cd892f7SJung-uk Kim /* Skip outgoing duplicate packets. */ 22658cd892f7SJung-uk Kim if ((m->m_flags & M_PROMISC) != 0 && m->m_pkthdr.rcvif == NULL) { 22668cd892f7SJung-uk Kim m->m_flags &= ~M_PROMISC; 22678cd892f7SJung-uk Kim return; 22688cd892f7SJung-uk Kim } 22698cd892f7SJung-uk Kim 2270437ffe18SSam Leffler pktlen = m_length(m, NULL); 2271437ffe18SSam Leffler /* 2272437ffe18SSam Leffler * Craft on-stack mbuf suitable for passing to bpf_filter. 2273437ffe18SSam Leffler * Note that we cut corners here; we only setup what's 2274437ffe18SSam Leffler * absolutely needed--this mbuf should never go anywhere else. 2275437ffe18SSam Leffler */ 2276437ffe18SSam Leffler mb.m_next = m; 2277437ffe18SSam Leffler mb.m_data = data; 2278437ffe18SSam Leffler mb.m_len = dlen; 2279437ffe18SSam Leffler pktlen += dlen; 2280437ffe18SSam Leffler 2281253a3814SLawrence Stewart gottime = BPF_TSTAMP_NONE; 2282e4b3229aSAlexander V. Chernikov 2283e4b3229aSAlexander V. Chernikov BPFIF_RLOCK(bp); 2284e4b3229aSAlexander V. Chernikov 22854a3feeaaSRobert Watson LIST_FOREACH(d, &bp->bif_dlist, bd_next) { 2286f81a2a49SJung-uk Kim if (BPF_CHECK_DIRECTION(d, m->m_pkthdr.rcvif, bp->bif_ifp)) 2287437ffe18SSam Leffler continue; 2288*b2b7ca49SAlexander V. 
Chernikov counter_u64_add(d->bd_rcount, 1); 228993e39f0bSChristian S.J. Peron slen = bpf_filter(d->bd_rfilter, (u_char *)&mb, pktlen, 0); 22904ddfb531SChristian S.J. Peron if (slen != 0) { 2291afa85850SAlexander V. Chernikov BPFD_LOCK(d); 2292e4b3229aSAlexander V. Chernikov 2293*b2b7ca49SAlexander V. Chernikov counter_u64_add(d->bd_fcount, 1); 2294253a3814SLawrence Stewart if (gottime < bpf_ts_quality(d->bd_tstamp)) 2295253a3814SLawrence Stewart gottime = bpf_gettime(&bt, d->bd_tstamp, m); 2296437ffe18SSam Leffler #ifdef MAC 229730d239bcSRobert Watson if (mac_bpfdesc_check_receive(d, bp->bif_ifp) == 0) 2298437ffe18SSam Leffler #endif 2299437ffe18SSam Leffler catchpacket(d, (u_char *)&mb, pktlen, slen, 2300547d94bdSJung-uk Kim bpf_append_mbuf, &bt); 2301afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 23024ddfb531SChristian S.J. Peron } 2303437ffe18SSam Leffler } 2304e4b3229aSAlexander V. Chernikov BPFIF_RUNLOCK(bp); 2305437ffe18SSam Leffler } 2306437ffe18SSam Leffler 2307560a54e1SJung-uk Kim #undef BPF_CHECK_DIRECTION 2308560a54e1SJung-uk Kim 2309253a3814SLawrence Stewart #undef BPF_TSTAMP_NONE 2310253a3814SLawrence Stewart #undef BPF_TSTAMP_FAST 2311253a3814SLawrence Stewart #undef BPF_TSTAMP_NORMAL 2312253a3814SLawrence Stewart #undef BPF_TSTAMP_EXTERN 2313253a3814SLawrence Stewart 2314547d94bdSJung-uk Kim static int 2315547d94bdSJung-uk Kim bpf_hdrlen(struct bpf_d *d) 2316547d94bdSJung-uk Kim { 2317547d94bdSJung-uk Kim int hdrlen; 2318547d94bdSJung-uk Kim 2319547d94bdSJung-uk Kim hdrlen = d->bd_bif->bif_hdrlen; 2320547d94bdSJung-uk Kim #ifndef BURN_BRIDGES 2321547d94bdSJung-uk Kim if (d->bd_tstamp == BPF_T_NONE || 2322547d94bdSJung-uk Kim BPF_T_FORMAT(d->bd_tstamp) == BPF_T_MICROTIME) 2323547d94bdSJung-uk Kim #ifdef COMPAT_FREEBSD32 2324547d94bdSJung-uk Kim if (d->bd_compat32) 2325547d94bdSJung-uk Kim hdrlen += SIZEOF_BPF_HDR(struct bpf_hdr32); 2326547d94bdSJung-uk Kim else 2327547d94bdSJung-uk Kim #endif 2328547d94bdSJung-uk Kim hdrlen += SIZEOF_BPF_HDR(struct 
bpf_hdr); 2329547d94bdSJung-uk Kim else 2330547d94bdSJung-uk Kim #endif 2331547d94bdSJung-uk Kim hdrlen += SIZEOF_BPF_HDR(struct bpf_xhdr); 2332547d94bdSJung-uk Kim #ifdef COMPAT_FREEBSD32 2333547d94bdSJung-uk Kim if (d->bd_compat32) 2334547d94bdSJung-uk Kim hdrlen = BPF_WORDALIGN32(hdrlen); 2335547d94bdSJung-uk Kim else 2336547d94bdSJung-uk Kim #endif 2337547d94bdSJung-uk Kim hdrlen = BPF_WORDALIGN(hdrlen); 2338547d94bdSJung-uk Kim 2339547d94bdSJung-uk Kim return (hdrlen - d->bd_bif->bif_hdrlen); 2340547d94bdSJung-uk Kim } 2341547d94bdSJung-uk Kim 2342547d94bdSJung-uk Kim static void 2343547d94bdSJung-uk Kim bpf_bintime2ts(struct bintime *bt, struct bpf_ts *ts, int tstype) 2344547d94bdSJung-uk Kim { 2345584b675eSKonstantin Belousov struct bintime bt2, boottimebin; 2346547d94bdSJung-uk Kim struct timeval tsm; 2347547d94bdSJung-uk Kim struct timespec tsn; 2348547d94bdSJung-uk Kim 2349253a3814SLawrence Stewart if ((tstype & BPF_T_MONOTONIC) == 0) { 2350253a3814SLawrence Stewart bt2 = *bt; 2351584b675eSKonstantin Belousov getboottimebin(&boottimebin); 2352253a3814SLawrence Stewart bintime_add(&bt2, &boottimebin); 2353253a3814SLawrence Stewart bt = &bt2; 2354253a3814SLawrence Stewart } 2355547d94bdSJung-uk Kim switch (BPF_T_FORMAT(tstype)) { 2356547d94bdSJung-uk Kim case BPF_T_MICROTIME: 2357547d94bdSJung-uk Kim bintime2timeval(bt, &tsm); 2358547d94bdSJung-uk Kim ts->bt_sec = tsm.tv_sec; 2359547d94bdSJung-uk Kim ts->bt_frac = tsm.tv_usec; 2360547d94bdSJung-uk Kim break; 2361547d94bdSJung-uk Kim case BPF_T_NANOTIME: 2362547d94bdSJung-uk Kim bintime2timespec(bt, &tsn); 2363547d94bdSJung-uk Kim ts->bt_sec = tsn.tv_sec; 2364547d94bdSJung-uk Kim ts->bt_frac = tsn.tv_nsec; 2365547d94bdSJung-uk Kim break; 2366547d94bdSJung-uk Kim case BPF_T_BINTIME: 2367547d94bdSJung-uk Kim ts->bt_sec = bt->sec; 2368547d94bdSJung-uk Kim ts->bt_frac = bt->frac; 2369547d94bdSJung-uk Kim break; 2370547d94bdSJung-uk Kim } 2371547d94bdSJung-uk Kim } 2372547d94bdSJung-uk Kim 2373437ffe18SSam 
Leffler /* 2374df8bae1dSRodney W. Grimes * Move the packet data from interface memory (pkt) into the 23759e610888SDag-Erling Smørgrav * store buffer. "cpfn" is the routine called to do the actual data 2376df8bae1dSRodney W. Grimes * transfer. bcopy is passed in to copy contiguous chunks, while 23774d621040SChristian S.J. Peron * bpf_append_mbuf is passed in to copy mbuf chains. In the latter case, 2378df8bae1dSRodney W. Grimes * pkt is really an mbuf. 2379df8bae1dSRodney W. Grimes */ 2380df8bae1dSRodney W. Grimes static void 238119ba8395SChristian S.J. Peron catchpacket(struct bpf_d *d, u_char *pkt, u_int pktlen, u_int snaplen, 23824d621040SChristian S.J. Peron void (*cpfn)(struct bpf_d *, caddr_t, u_int, void *, u_int), 2383547d94bdSJung-uk Kim struct bintime *bt) 2384df8bae1dSRodney W. Grimes { 2385547d94bdSJung-uk Kim struct bpf_xhdr hdr; 2386547d94bdSJung-uk Kim #ifndef BURN_BRIDGES 2387547d94bdSJung-uk Kim struct bpf_hdr hdr_old; 2388fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 2389547d94bdSJung-uk Kim struct bpf_hdr32 hdr32_old; 2390fc0a61a4SKonstantin Belousov #endif 2391547d94bdSJung-uk Kim #endif 2392547d94bdSJung-uk Kim int caplen, curlen, hdrlen, totlen; 23937819da79SJohn-Mark Gurney int do_wakeup = 0; 2394547d94bdSJung-uk Kim int do_timestamp; 2395547d94bdSJung-uk Kim int tstype; 23969e610888SDag-Erling Smørgrav 2397afa85850SAlexander V. Chernikov BPFD_LOCK_ASSERT(d); 23984d621040SChristian S.J. Peron 23994d621040SChristian S.J. Peron /* 24004d621040SChristian S.J. Peron * Detect whether user space has released a buffer back to us, and if 24014d621040SChristian S.J. Peron * so, move it from being a hold buffer to a free buffer. This may 24024d621040SChristian S.J. Peron * not be the best place to do it (for example, we might only want to 24034d621040SChristian S.J. Peron * run this check if we need the space), but for now it's a reliable 24044d621040SChristian S.J. Peron * spot to do it. 24054d621040SChristian S.J. 
Peron */ 2406fa0c2b34SRobert Watson if (d->bd_fbuf == NULL && bpf_canfreebuf(d)) { 24074d621040SChristian S.J. Peron d->bd_fbuf = d->bd_hbuf; 24084d621040SChristian S.J. Peron d->bd_hbuf = NULL; 24094d621040SChristian S.J. Peron d->bd_hlen = 0; 241029f612ecSChristian S.J. Peron bpf_buf_reclaimed(d); 24114d621040SChristian S.J. Peron } 24124d621040SChristian S.J. Peron 2413df8bae1dSRodney W. Grimes /* 2414df8bae1dSRodney W. Grimes * Figure out how many bytes to move. If the packet is 2415df8bae1dSRodney W. Grimes * greater or equal to the snapshot length, transfer that 2416df8bae1dSRodney W. Grimes * much. Otherwise, transfer the whole packet (unless 2417df8bae1dSRodney W. Grimes * we hit the buffer size limit). 2418df8bae1dSRodney W. Grimes */ 2419547d94bdSJung-uk Kim hdrlen = bpf_hdrlen(d); 2420df8bae1dSRodney W. Grimes totlen = hdrlen + min(snaplen, pktlen); 2421df8bae1dSRodney W. Grimes if (totlen > d->bd_bufsize) 2422df8bae1dSRodney W. Grimes totlen = d->bd_bufsize; 2423df8bae1dSRodney W. Grimes 2424df8bae1dSRodney W. Grimes /* 2425df8bae1dSRodney W. Grimes * Round up the end of the previous packet to the next longword. 2426a7a91e65SRobert Watson * 2427a7a91e65SRobert Watson * Drop the packet if there's no room and no hope of room 2428a7a91e65SRobert Watson * If the packet would overflow the storage buffer or the storage 2429a7a91e65SRobert Watson * buffer is considered immutable by the buffer model, try to rotate 2430a7a91e65SRobert Watson * the buffer and wakeup pending processes. 2431df8bae1dSRodney W. Grimes */ 2432fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 2433fc0a61a4SKonstantin Belousov if (d->bd_compat32) 2434fc0a61a4SKonstantin Belousov curlen = BPF_WORDALIGN32(d->bd_slen); 2435fc0a61a4SKonstantin Belousov else 2436fc0a61a4SKonstantin Belousov #endif 2437df8bae1dSRodney W. 
Grimes curlen = BPF_WORDALIGN(d->bd_slen); 2438a7a91e65SRobert Watson if (curlen + totlen > d->bd_bufsize || !bpf_canwritebuf(d)) { 2439572bde2aSRobert Watson if (d->bd_fbuf == NULL) { 2440df8bae1dSRodney W. Grimes /* 2441a7a91e65SRobert Watson * There's no room in the store buffer, and no 2442a7a91e65SRobert Watson * prospect of room, so drop the packet. Notify the 2443a7a91e65SRobert Watson * buffer model. 2444df8bae1dSRodney W. Grimes */ 2445a7a91e65SRobert Watson bpf_buffull(d); 2446*b2b7ca49SAlexander V. Chernikov counter_u64_add(d->bd_dcount, 1); 2447df8bae1dSRodney W. Grimes return; 2448df8bae1dSRodney W. Grimes } 244998fa5d85SLuiz Otavio O Souza KASSERT(!d->bd_hbuf_in_use, ("hold buffer is in use")); 2450df8bae1dSRodney W. Grimes ROTATE_BUFFERS(d); 24517819da79SJohn-Mark Gurney do_wakeup = 1; 2452df8bae1dSRodney W. Grimes curlen = 0; 2453a7a91e65SRobert Watson } else if (d->bd_immediate || d->bd_state == BPF_TIMED_OUT) 2454df8bae1dSRodney W. Grimes /* 24554d621040SChristian S.J. Peron * Immediate mode is set, or the read timeout has already 24564d621040SChristian S.J. Peron * expired during a select call. A packet arrived, so the 24574d621040SChristian S.J. Peron * reader should be woken up. 2458df8bae1dSRodney W. 
Grimes */ 24597819da79SJohn-Mark Gurney do_wakeup = 1; 2460547d94bdSJung-uk Kim caplen = totlen - hdrlen; 2461547d94bdSJung-uk Kim tstype = d->bd_tstamp; 2462547d94bdSJung-uk Kim do_timestamp = tstype != BPF_T_NONE; 2463547d94bdSJung-uk Kim #ifndef BURN_BRIDGES 2464547d94bdSJung-uk Kim if (tstype == BPF_T_NONE || BPF_T_FORMAT(tstype) == BPF_T_MICROTIME) { 2465547d94bdSJung-uk Kim struct bpf_ts ts; 2466547d94bdSJung-uk Kim if (do_timestamp) 2467547d94bdSJung-uk Kim bpf_bintime2ts(bt, &ts, tstype); 2468fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32 2469fc0a61a4SKonstantin Belousov if (d->bd_compat32) { 2470547d94bdSJung-uk Kim bzero(&hdr32_old, sizeof(hdr32_old)); 2471547d94bdSJung-uk Kim if (do_timestamp) { 2472547d94bdSJung-uk Kim hdr32_old.bh_tstamp.tv_sec = ts.bt_sec; 2473547d94bdSJung-uk Kim hdr32_old.bh_tstamp.tv_usec = ts.bt_frac; 2474547d94bdSJung-uk Kim } 2475547d94bdSJung-uk Kim hdr32_old.bh_datalen = pktlen; 2476547d94bdSJung-uk Kim hdr32_old.bh_hdrlen = hdrlen; 2477547d94bdSJung-uk Kim hdr32_old.bh_caplen = caplen; 2478547d94bdSJung-uk Kim bpf_append_bytes(d, d->bd_sbuf, curlen, &hdr32_old, 2479547d94bdSJung-uk Kim sizeof(hdr32_old)); 2480547d94bdSJung-uk Kim goto copy; 2481547d94bdSJung-uk Kim } 2482547d94bdSJung-uk Kim #endif 2483547d94bdSJung-uk Kim bzero(&hdr_old, sizeof(hdr_old)); 2484547d94bdSJung-uk Kim if (do_timestamp) { 2485547d94bdSJung-uk Kim hdr_old.bh_tstamp.tv_sec = ts.bt_sec; 2486547d94bdSJung-uk Kim hdr_old.bh_tstamp.tv_usec = ts.bt_frac; 2487547d94bdSJung-uk Kim } 2488547d94bdSJung-uk Kim hdr_old.bh_datalen = pktlen; 2489547d94bdSJung-uk Kim hdr_old.bh_hdrlen = hdrlen; 2490547d94bdSJung-uk Kim hdr_old.bh_caplen = caplen; 2491547d94bdSJung-uk Kim bpf_append_bytes(d, d->bd_sbuf, curlen, &hdr_old, 2492547d94bdSJung-uk Kim sizeof(hdr_old)); 2493fc0a61a4SKonstantin Belousov goto copy; 2494fc0a61a4SKonstantin Belousov } 2495fc0a61a4SKonstantin Belousov #endif 2496df8bae1dSRodney W. Grimes 2497df8bae1dSRodney W. 
Grimes /* 24984d621040SChristian S.J. Peron * Append the bpf header. Note we append the actual header size, but 24994d621040SChristian S.J. Peron * move forward the length of the header plus padding. 2500df8bae1dSRodney W. Grimes */ 25014d621040SChristian S.J. Peron bzero(&hdr, sizeof(hdr)); 2502547d94bdSJung-uk Kim if (do_timestamp) 2503547d94bdSJung-uk Kim bpf_bintime2ts(bt, &hdr.bh_tstamp, tstype); 25044d621040SChristian S.J. Peron hdr.bh_datalen = pktlen; 25054d621040SChristian S.J. Peron hdr.bh_hdrlen = hdrlen; 2506547d94bdSJung-uk Kim hdr.bh_caplen = caplen; 25074d621040SChristian S.J. Peron bpf_append_bytes(d, d->bd_sbuf, curlen, &hdr, sizeof(hdr)); 25084d621040SChristian S.J. Peron 2509df8bae1dSRodney W. Grimes /* 2510df8bae1dSRodney W. Grimes * Copy the packet data into the store buffer and update its length. 2511df8bae1dSRodney W. Grimes */ 2512547d94bdSJung-uk Kim #ifndef BURN_BRIDGES 2513fc0a61a4SKonstantin Belousov copy: 2514fc0a61a4SKonstantin Belousov #endif 2515547d94bdSJung-uk Kim (*cpfn)(d, d->bd_sbuf, curlen + hdrlen, pkt, caplen); 2516df8bae1dSRodney W. Grimes d->bd_slen = curlen + totlen; 25177819da79SJohn-Mark Gurney 25187819da79SJohn-Mark Gurney if (do_wakeup) 25197819da79SJohn-Mark Gurney bpf_wakeup(d); 2520df8bae1dSRodney W. Grimes } 2521df8bae1dSRodney W. Grimes 2522df8bae1dSRodney W. Grimes /* 2523df8bae1dSRodney W. Grimes * Free buffers currently in use by a descriptor. 2524df8bae1dSRodney W. Grimes * Called on close. 2525df8bae1dSRodney W. Grimes */ 2526df8bae1dSRodney W. Grimes static void 252719ba8395SChristian S.J. Peron bpf_freed(struct bpf_d *d) 2528df8bae1dSRodney W. Grimes { 25294d621040SChristian S.J. Peron 2530df8bae1dSRodney W. Grimes /* 2531df8bae1dSRodney W. Grimes * We don't need to lock out interrupts since this descriptor has 2532df8bae1dSRodney W. Grimes * been detached from its interface and it yet hasn't been marked 2533df8bae1dSRodney W. Grimes * free. 2534df8bae1dSRodney W. Grimes */ 25354d621040SChristian S.J. 
Peron bpf_free(d); 253670485847SJung-uk Kim if (d->bd_rfilter != NULL) { 253793e39f0bSChristian S.J. Peron free((caddr_t)d->bd_rfilter, M_BPF); 2538ae275efcSJung-uk Kim #ifdef BPF_JITTER 253970485847SJung-uk Kim if (d->bd_bfilter != NULL) 2540ae275efcSJung-uk Kim bpf_destroy_jit_filter(d->bd_bfilter); 2541ae275efcSJung-uk Kim #endif 2542ae275efcSJung-uk Kim } 254370485847SJung-uk Kim if (d->bd_wfilter != NULL) 254493e39f0bSChristian S.J. Peron free((caddr_t)d->bd_wfilter, M_BPF); 2545afa85850SAlexander V. Chernikov mtx_destroy(&d->bd_lock); 2546*b2b7ca49SAlexander V. Chernikov 2547*b2b7ca49SAlexander V. Chernikov counter_u64_free(d->bd_rcount); 2548*b2b7ca49SAlexander V. Chernikov counter_u64_free(d->bd_dcount); 2549*b2b7ca49SAlexander V. Chernikov counter_u64_free(d->bd_fcount); 2550*b2b7ca49SAlexander V. Chernikov counter_u64_free(d->bd_wcount); 2551*b2b7ca49SAlexander V. Chernikov counter_u64_free(d->bd_wfcount); 2552*b2b7ca49SAlexander V. Chernikov counter_u64_free(d->bd_wdcount); 2553*b2b7ca49SAlexander V. Chernikov counter_u64_free(d->bd_zcopy); 2554*b2b7ca49SAlexander V. Chernikov 2555df8bae1dSRodney W. Grimes } 2556df8bae1dSRodney W. Grimes 2557df8bae1dSRodney W. Grimes /* 255824a229f4SSam Leffler * Attach an interface to bpf. dlt is the link layer type; hdrlen is the 255924a229f4SSam Leffler * fixed size of the link header (variable length headers not yet supported). 2560df8bae1dSRodney W. Grimes */ 2561df8bae1dSRodney W. Grimes void 256219ba8395SChristian S.J. Peron bpfattach(struct ifnet *ifp, u_int dlt, u_int hdrlen) 2563df8bae1dSRodney W. Grimes { 256424a229f4SSam Leffler 256524a229f4SSam Leffler bpfattach2(ifp, dlt, hdrlen, &ifp->if_bpf); 256624a229f4SSam Leffler } 256724a229f4SSam Leffler 256824a229f4SSam Leffler /* 256924a229f4SSam Leffler * Attach an interface to bpf. 
ifp is a pointer to the structure 257024a229f4SSam Leffler * defining the interface to be attached, dlt is the link layer type, 257124a229f4SSam Leffler * and hdrlen is the fixed size of the link header (variable length 257224a229f4SSam Leffler * headers are not yet supporrted). 257324a229f4SSam Leffler */ 257424a229f4SSam Leffler void 257519ba8395SChristian S.J. Peron bpfattach2(struct ifnet *ifp, u_int dlt, u_int hdrlen, struct bpf_if **driverp) 257624a229f4SSam Leffler { 2577df8bae1dSRodney W. Grimes struct bpf_if *bp; 257819ba8395SChristian S.J. Peron 257919ba8395SChristian S.J. Peron bp = malloc(sizeof(*bp), M_BPF, M_NOWAIT | M_ZERO); 2580572bde2aSRobert Watson if (bp == NULL) 2581df8bae1dSRodney W. Grimes panic("bpfattach"); 2582df8bae1dSRodney W. Grimes 25834a3feeaaSRobert Watson LIST_INIT(&bp->bif_dlist); 258451ec1eb7SAlexander V. Chernikov LIST_INIT(&bp->bif_wlist); 2585df8bae1dSRodney W. Grimes bp->bif_ifp = ifp; 2586df8bae1dSRodney W. Grimes bp->bif_dlt = dlt; 2587e4b3229aSAlexander V. Chernikov rw_init(&bp->bif_lock, "bpf interface lock"); 258816d878ccSChristian S.J. Peron KASSERT(*driverp == NULL, ("bpfattach2: driverp already initialized")); 25899ce40d32SKristof Provost bp->bif_bpf = driverp; 259016d878ccSChristian S.J. Peron *driverp = bp; 2591df8bae1dSRodney W. Grimes 2592e4b3229aSAlexander V. Chernikov BPF_LOCK(); 25934a3feeaaSRobert Watson LIST_INSERT_HEAD(&bpf_iflist, bp, bif_next); 2594e4b3229aSAlexander V. Chernikov BPF_UNLOCK(); 2595df8bae1dSRodney W. Grimes 2596547d94bdSJung-uk Kim bp->bif_hdrlen = hdrlen; 2597df8bae1dSRodney W. Grimes 2598616bc4f4SBjoern A. Zeeb if (bootverbose && IS_DEFAULT_VNET(curvnet)) 259924a229f4SSam Leffler if_printf(ifp, "bpf attached\n"); 2600df8bae1dSRodney W. Grimes } 260153ac6efbSJulian Elischer 260205fc4164SBjoern A. Zeeb #ifdef VIMAGE 260305fc4164SBjoern A. Zeeb /* 260405fc4164SBjoern A. Zeeb * When moving interfaces between vnet instances we need a way to 260505fc4164SBjoern A. 
Zeeb * query the dlt and hdrlen before detach so we can re-attch the if_bpf 260605fc4164SBjoern A. Zeeb * after the vmove. We unfortunately have no device driver infrastructure 260705fc4164SBjoern A. Zeeb * to query the interface for these values after creation/attach, thus 260805fc4164SBjoern A. Zeeb * add this as a workaround. 260905fc4164SBjoern A. Zeeb */ 261005fc4164SBjoern A. Zeeb int 261105fc4164SBjoern A. Zeeb bpf_get_bp_params(struct bpf_if *bp, u_int *bif_dlt, u_int *bif_hdrlen) 261205fc4164SBjoern A. Zeeb { 261305fc4164SBjoern A. Zeeb 261405fc4164SBjoern A. Zeeb if (bp == NULL) 261505fc4164SBjoern A. Zeeb return (ENXIO); 261605fc4164SBjoern A. Zeeb if (bif_dlt == NULL && bif_hdrlen == NULL) 261705fc4164SBjoern A. Zeeb return (0); 261805fc4164SBjoern A. Zeeb 261905fc4164SBjoern A. Zeeb if (bif_dlt != NULL) 262005fc4164SBjoern A. Zeeb *bif_dlt = bp->bif_dlt; 262105fc4164SBjoern A. Zeeb if (bif_hdrlen != NULL) 262205fc4164SBjoern A. Zeeb *bif_hdrlen = bp->bif_hdrlen; 262305fc4164SBjoern A. Zeeb 262405fc4164SBjoern A. Zeeb return (0); 262505fc4164SBjoern A. Zeeb } 262605fc4164SBjoern A. Zeeb #endif 262705fc4164SBjoern A. Zeeb 2628de5d9935SRobert Watson /* 2629de5d9935SRobert Watson * Detach bpf from an interface. This involves detaching each descriptor 26306c74ff0eSAlexander V. Chernikov * associated with the interface. Notify each descriptor as it's detached 26316c74ff0eSAlexander V. Chernikov * so that any sleepers wake up and get ENXIO. 2632de5d9935SRobert Watson */ 2633de5d9935SRobert Watson void 263419ba8395SChristian S.J. Peron bpfdetach(struct ifnet *ifp) 2635de5d9935SRobert Watson { 2636f079a0faSAlexander V. Chernikov struct bpf_if *bp, *bp_temp; 2637de5d9935SRobert Watson struct bpf_d *d; 26389a7e6bacSLawrence Stewart int ndetached; 2639de5d9935SRobert Watson 26409a7e6bacSLawrence Stewart ndetached = 0; 26419a7e6bacSLawrence Stewart 2642afa85850SAlexander V. 
Chernikov BPF_LOCK(); 26439a7e6bacSLawrence Stewart /* Find all bpf_if struct's which reference ifp and detach them. */ 2644f079a0faSAlexander V. Chernikov LIST_FOREACH_SAFE(bp, &bpf_iflist, bif_next, bp_temp) { 2645f079a0faSAlexander V. Chernikov if (ifp != bp->bif_ifp) 2646f079a0faSAlexander V. Chernikov continue; 2647de5d9935SRobert Watson 2648f079a0faSAlexander V. Chernikov LIST_REMOVE(bp, bif_next); 2649f079a0faSAlexander V. Chernikov /* Add to to-be-freed list */ 2650f079a0faSAlexander V. Chernikov LIST_INSERT_HEAD(&bpf_freelist, bp, bif_next); 2651f079a0faSAlexander V. Chernikov 26529a7e6bacSLawrence Stewart ndetached++; 2653f079a0faSAlexander V. Chernikov /* 2654f079a0faSAlexander V. Chernikov * Delay freeing bp till interface is detached 2655f079a0faSAlexander V. Chernikov * and all routes through this interface are removed. 2656f079a0faSAlexander V. Chernikov * Mark bp as detached to restrict new consumers. 2657f079a0faSAlexander V. Chernikov */ 2658f079a0faSAlexander V. Chernikov BPFIF_WLOCK(bp); 2659b23cbbe6SMark Johnston bp->bif_flags |= BPFIF_FLAG_DYING; 26609ce40d32SKristof Provost *bp->bif_bpf = NULL; 2661f079a0faSAlexander V. Chernikov BPFIF_WUNLOCK(bp); 2662f079a0faSAlexander V. Chernikov 2663f079a0faSAlexander V. Chernikov CTR4(KTR_NET, "%s: sheduling free for encap %d (%p) for if %p", 2664f079a0faSAlexander V. Chernikov __func__, bp->bif_dlt, bp, ifp); 2665f079a0faSAlexander V. Chernikov 2666f079a0faSAlexander V. Chernikov /* Free common descriptors */ 26674a3feeaaSRobert Watson while ((d = LIST_FIRST(&bp->bif_dlist)) != NULL) { 2668afa85850SAlexander V. Chernikov bpf_detachd_locked(d); 2669afa85850SAlexander V. Chernikov BPFD_LOCK(d); 2670e7bb21b3SJonathan Lemon bpf_wakeup(d); 2671afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 2672e7bb21b3SJonathan Lemon } 2673f079a0faSAlexander V. Chernikov 26746c74ff0eSAlexander V. Chernikov /* Free writer-only descriptors */ 26756c74ff0eSAlexander V. 
Chernikov while ((d = LIST_FIRST(&bp->bif_wlist)) != NULL) { 2676afa85850SAlexander V. Chernikov bpf_detachd_locked(d); 2677afa85850SAlexander V. Chernikov BPFD_LOCK(d); 26786c74ff0eSAlexander V. Chernikov bpf_wakeup(d); 2679afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 26806c74ff0eSAlexander V. Chernikov } 26818eab61f3SSam Leffler } 2682afa85850SAlexander V. Chernikov BPF_UNLOCK(); 26839a7e6bacSLawrence Stewart 26849a7e6bacSLawrence Stewart #ifdef INVARIANTS 26859a7e6bacSLawrence Stewart if (ndetached == 0) 26869a7e6bacSLawrence Stewart printf("bpfdetach: %s was not attached\n", ifp->if_xname); 26879a7e6bacSLawrence Stewart #endif 26889a7e6bacSLawrence Stewart } 2689de5d9935SRobert Watson 26908eab61f3SSam Leffler /* 2691784292f8SAlexander V. Chernikov * Interface departure handler. 26924fe83b81SAlexander V. Chernikov * Note departure event does not guarantee interface is going down. 2693f079a0faSAlexander V. Chernikov * Interface renaming is currently done via departure/arrival event set. 2694f079a0faSAlexander V. Chernikov * 2695f079a0faSAlexander V. Chernikov * Departure handled is called after all routes pointing to 2696f079a0faSAlexander V. Chernikov * given interface are removed and interface is in down state 2697f079a0faSAlexander V. Chernikov * restricting any packets to be sent/received. We assume it is now safe 2698f079a0faSAlexander V. Chernikov * to free data allocated by BPF. 2699afa85850SAlexander V. Chernikov */ 2700afa85850SAlexander V. Chernikov static void 2701afa85850SAlexander V. Chernikov bpf_ifdetach(void *arg __unused, struct ifnet *ifp) 2702afa85850SAlexander V. Chernikov { 2703f079a0faSAlexander V. Chernikov struct bpf_if *bp, *bp_temp; 2704f079a0faSAlexander V. Chernikov int nmatched = 0; 2705afa85850SAlexander V. Chernikov 2706250a8e27SAndrey V. Elsukov /* Ignore ifnet renaming. */ 2707250a8e27SAndrey V. Elsukov if (ifp->if_flags & IFF_RENAMING) 2708250a8e27SAndrey V. Elsukov return; 2709250a8e27SAndrey V. 
Elsukov 2710784292f8SAlexander V. Chernikov BPF_LOCK(); 2711f079a0faSAlexander V. Chernikov /* 2712f079a0faSAlexander V. Chernikov * Find matching entries in free list. 2713f079a0faSAlexander V. Chernikov * Nothing should be found if bpfdetach() was not called. 2714f079a0faSAlexander V. Chernikov */ 2715f079a0faSAlexander V. Chernikov LIST_FOREACH_SAFE(bp, &bpf_freelist, bif_next, bp_temp) { 2716f079a0faSAlexander V. Chernikov if (ifp != bp->bif_ifp) 2717f079a0faSAlexander V. Chernikov continue; 2718784292f8SAlexander V. Chernikov 2719f079a0faSAlexander V. Chernikov CTR3(KTR_NET, "%s: freeing BPF instance %p for interface %p", 2720afa85850SAlexander V. Chernikov __func__, bp, ifp); 2721afa85850SAlexander V. Chernikov 2722f079a0faSAlexander V. Chernikov LIST_REMOVE(bp, bif_next); 2723784292f8SAlexander V. Chernikov 2724afa85850SAlexander V. Chernikov rw_destroy(&bp->bif_lock); 2725afa85850SAlexander V. Chernikov free(bp, M_BPF); 2726f079a0faSAlexander V. Chernikov 2727f079a0faSAlexander V. Chernikov nmatched++; 2728f079a0faSAlexander V. Chernikov } 2729f079a0faSAlexander V. Chernikov BPF_UNLOCK(); 2730afa85850SAlexander V. Chernikov } 2731afa85850SAlexander V. Chernikov 2732afa85850SAlexander V. Chernikov /* 27338eab61f3SSam Leffler * Get a list of available data link type of the interface. 27348eab61f3SSam Leffler */ 27358eab61f3SSam Leffler static int 273619ba8395SChristian S.J. Peron bpf_getdltlist(struct bpf_d *d, struct bpf_dltlist *bfl) 27378eab61f3SSam Leffler { 27388eab61f3SSam Leffler struct ifnet *ifp; 27398eab61f3SSam Leffler struct bpf_if *bp; 274070209acaSKonstantin Belousov u_int *lst; 274170209acaSKonstantin Belousov int error, n, n1; 27428eab61f3SSam Leffler 274397aacec6SAlexander V. Chernikov BPF_LOCK_ASSERT(); 274497aacec6SAlexander V. 
Chernikov 27458eab61f3SSam Leffler ifp = d->bd_bif->bif_ifp; 274670209acaSKonstantin Belousov again: 274770209acaSKonstantin Belousov n1 = 0; 274870209acaSKonstantin Belousov LIST_FOREACH(bp, &bpf_iflist, bif_next) { 274970209acaSKonstantin Belousov if (bp->bif_ifp == ifp) 275070209acaSKonstantin Belousov n1++; 275170209acaSKonstantin Belousov } 275270209acaSKonstantin Belousov if (bfl->bfl_list == NULL) { 275370209acaSKonstantin Belousov bfl->bfl_len = n1; 275470209acaSKonstantin Belousov return (0); 275570209acaSKonstantin Belousov } 275670209acaSKonstantin Belousov if (n1 > bfl->bfl_len) 275770209acaSKonstantin Belousov return (ENOMEM); 275870209acaSKonstantin Belousov BPF_UNLOCK(); 275970209acaSKonstantin Belousov lst = malloc(n1 * sizeof(u_int), M_TEMP, M_WAITOK); 27608eab61f3SSam Leffler n = 0; 276170209acaSKonstantin Belousov BPF_LOCK(); 27624a3feeaaSRobert Watson LIST_FOREACH(bp, &bpf_iflist, bif_next) { 27638eab61f3SSam Leffler if (bp->bif_ifp != ifp) 27648eab61f3SSam Leffler continue; 27655412ec6eSConrad Meyer if (n >= n1) { 276670209acaSKonstantin Belousov free(lst, M_TEMP); 276770209acaSKonstantin Belousov goto again; 27688eab61f3SSam Leffler } 276970209acaSKonstantin Belousov lst[n] = bp->bif_dlt; 27708eab61f3SSam Leffler n++; 27718eab61f3SSam Leffler } 277270209acaSKonstantin Belousov BPF_UNLOCK(); 277370209acaSKonstantin Belousov error = copyout(lst, bfl->bfl_list, sizeof(u_int) * n); 277470209acaSKonstantin Belousov free(lst, M_TEMP); 277570209acaSKonstantin Belousov BPF_LOCK(); 27768eab61f3SSam Leffler bfl->bfl_len = n; 27778eab61f3SSam Leffler return (error); 27788eab61f3SSam Leffler } 27798eab61f3SSam Leffler 27808eab61f3SSam Leffler /* 27818eab61f3SSam Leffler * Set the data link type of a BPF instance. 27828eab61f3SSam Leffler */ 27838eab61f3SSam Leffler static int 278419ba8395SChristian S.J. 
Peron bpf_setdlt(struct bpf_d *d, u_int dlt) 27858eab61f3SSam Leffler { 27868eab61f3SSam Leffler int error, opromisc; 27878eab61f3SSam Leffler struct ifnet *ifp; 27888eab61f3SSam Leffler struct bpf_if *bp; 27898eab61f3SSam Leffler 27906c74ff0eSAlexander V. Chernikov BPF_LOCK_ASSERT(); 27916c74ff0eSAlexander V. Chernikov 27928eab61f3SSam Leffler if (d->bd_bif->bif_dlt == dlt) 27938eab61f3SSam Leffler return (0); 27948eab61f3SSam Leffler ifp = d->bd_bif->bif_ifp; 27956c74ff0eSAlexander V. Chernikov 27964a3feeaaSRobert Watson LIST_FOREACH(bp, &bpf_iflist, bif_next) { 27978eab61f3SSam Leffler if (bp->bif_ifp == ifp && bp->bif_dlt == dlt) 27988eab61f3SSam Leffler break; 27998eab61f3SSam Leffler } 28006c74ff0eSAlexander V. Chernikov 28018eab61f3SSam Leffler if (bp != NULL) { 28028eab61f3SSam Leffler opromisc = d->bd_promisc; 28038eab61f3SSam Leffler bpf_attachd(d, bp); 2804afa85850SAlexander V. Chernikov BPFD_LOCK(d); 28058eab61f3SSam Leffler reset_d(d); 2806afa85850SAlexander V. Chernikov BPFD_UNLOCK(d); 28078eab61f3SSam Leffler if (opromisc) { 28088eab61f3SSam Leffler error = ifpromisc(bp->bif_ifp, 1); 28098eab61f3SSam Leffler if (error) 28108eab61f3SSam Leffler if_printf(bp->bif_ifp, 28118eab61f3SSam Leffler "bpf_setdlt: ifpromisc failed (%d)\n", 28128eab61f3SSam Leffler error); 28138eab61f3SSam Leffler else 28148eab61f3SSam Leffler d->bd_promisc = 1; 28158eab61f3SSam Leffler } 28168eab61f3SSam Leffler } 28178eab61f3SSam Leffler return (bp == NULL ? EINVAL : 0); 2818de5d9935SRobert Watson } 2819de5d9935SRobert Watson 28203f54a085SPoul-Henning Kamp static void 282119ba8395SChristian S.J. Peron bpf_drvinit(void *unused) 282253ac6efbSJulian Elischer { 2823136600feSEd Schouten struct cdev *dev; 282453ac6efbSJulian Elischer 28256008862bSJohn Baldwin mtx_init(&bpf_mtx, "bpf global lock", NULL, MTX_DEF); 28264a3feeaaSRobert Watson LIST_INIT(&bpf_iflist); 2827f079a0faSAlexander V. 
Chernikov LIST_INIT(&bpf_freelist); 2828136600feSEd Schouten 2829136600feSEd Schouten dev = make_dev(&bpf_cdevsw, 0, UID_ROOT, GID_WHEEL, 0600, "bpf"); 2830136600feSEd Schouten /* For compatibility */ 2831136600feSEd Schouten make_dev_alias(dev, "bpf0"); 2832afa85850SAlexander V. Chernikov 2833afa85850SAlexander V. Chernikov /* Register interface departure handler */ 2834afa85850SAlexander V. Chernikov bpf_ifdetach_cookie = EVENTHANDLER_REGISTER( 2835afa85850SAlexander V. Chernikov ifnet_departure_event, bpf_ifdetach, NULL, 2836afa85850SAlexander V. Chernikov EVENTHANDLER_PRI_ANY); 28377198bf47SJulian Elischer } 283853ac6efbSJulian Elischer 28390e37f3e1SChristian S.J. Peron /* 28400e37f3e1SChristian S.J. Peron * Zero out the various packet counters associated with all of the bpf 28410e37f3e1SChristian S.J. Peron * descriptors. At some point, we will probably want to get a bit more 28420e37f3e1SChristian S.J. Peron * granular and allow the user to specify descriptors to be zeroed. 28430e37f3e1SChristian S.J. Peron */ 28440e37f3e1SChristian S.J. Peron static void 28450e37f3e1SChristian S.J. Peron bpf_zero_counters(void) 28460e37f3e1SChristian S.J. Peron { 28470e37f3e1SChristian S.J. Peron struct bpf_if *bp; 28480e37f3e1SChristian S.J. Peron struct bpf_d *bd; 28490e37f3e1SChristian S.J. Peron 2850e4b3229aSAlexander V. Chernikov BPF_LOCK(); 28510e37f3e1SChristian S.J. Peron LIST_FOREACH(bp, &bpf_iflist, bif_next) { 2852e4b3229aSAlexander V. Chernikov BPFIF_RLOCK(bp); 28530e37f3e1SChristian S.J. Peron LIST_FOREACH(bd, &bp->bif_dlist, bd_next) { 2854afa85850SAlexander V. Chernikov BPFD_LOCK(bd); 2855*b2b7ca49SAlexander V. Chernikov counter_u64_zero(bd->bd_rcount); 2856*b2b7ca49SAlexander V. Chernikov counter_u64_zero(bd->bd_dcount); 2857*b2b7ca49SAlexander V. Chernikov counter_u64_zero(bd->bd_fcount); 2858*b2b7ca49SAlexander V. Chernikov counter_u64_zero(bd->bd_wcount); 2859*b2b7ca49SAlexander V. Chernikov counter_u64_zero(bd->bd_wfcount); 2860*b2b7ca49SAlexander V. 
Chernikov counter_u64_zero(bd->bd_zcopy); 2861afa85850SAlexander V. Chernikov BPFD_UNLOCK(bd); 28620e37f3e1SChristian S.J. Peron } 2863e4b3229aSAlexander V. Chernikov BPFIF_RUNLOCK(bp); 28640e37f3e1SChristian S.J. Peron } 2865e4b3229aSAlexander V. Chernikov BPF_UNLOCK(); 28660e37f3e1SChristian S.J. Peron } 28670e37f3e1SChristian S.J. Peron 28686c74ff0eSAlexander V. Chernikov /* 28696c74ff0eSAlexander V. Chernikov * Fill filter statistics 28706c74ff0eSAlexander V. Chernikov */ 287169f7644bSChristian S.J. Peron static void 287269f7644bSChristian S.J. Peron bpfstats_fill_xbpf(struct xbpf_d *d, struct bpf_d *bd) 287369f7644bSChristian S.J. Peron { 287469f7644bSChristian S.J. Peron 287569f7644bSChristian S.J. Peron bzero(d, sizeof(*d)); 287669f7644bSChristian S.J. Peron BPFD_LOCK_ASSERT(bd); 28774d621040SChristian S.J. Peron d->bd_structsize = sizeof(*d); 28786c74ff0eSAlexander V. Chernikov /* XXX: reading should be protected by global lock */ 287969f7644bSChristian S.J. Peron d->bd_immediate = bd->bd_immediate; 288069f7644bSChristian S.J. Peron d->bd_promisc = bd->bd_promisc; 288169f7644bSChristian S.J. Peron d->bd_hdrcmplt = bd->bd_hdrcmplt; 2882560a54e1SJung-uk Kim d->bd_direction = bd->bd_direction; 2883560a54e1SJung-uk Kim d->bd_feedback = bd->bd_feedback; 288469f7644bSChristian S.J. Peron d->bd_async = bd->bd_async; 2885*b2b7ca49SAlexander V. Chernikov d->bd_rcount = counter_u64_fetch(bd->bd_rcount); 2886*b2b7ca49SAlexander V. Chernikov d->bd_dcount = counter_u64_fetch(bd->bd_dcount); 2887*b2b7ca49SAlexander V. Chernikov d->bd_fcount = counter_u64_fetch(bd->bd_fcount); 288869f7644bSChristian S.J. Peron d->bd_sig = bd->bd_sig; 288969f7644bSChristian S.J. Peron d->bd_slen = bd->bd_slen; 289069f7644bSChristian S.J. Peron d->bd_hlen = bd->bd_hlen; 289169f7644bSChristian S.J. Peron d->bd_bufsize = bd->bd_bufsize; 289269f7644bSChristian S.J. Peron d->bd_pid = bd->bd_pid; 289369f7644bSChristian S.J. Peron strlcpy(d->bd_ifname, 289469f7644bSChristian S.J. 
Peron bd->bd_bif->bif_ifp->if_xname, IFNAMSIZ); 289593e39f0bSChristian S.J. Peron d->bd_locked = bd->bd_locked; 2896*b2b7ca49SAlexander V. Chernikov d->bd_wcount = counter_u64_fetch(bd->bd_wcount); 2897*b2b7ca49SAlexander V. Chernikov d->bd_wdcount = counter_u64_fetch(bd->bd_wdcount); 2898*b2b7ca49SAlexander V. Chernikov d->bd_wfcount = counter_u64_fetch(bd->bd_wfcount); 2899*b2b7ca49SAlexander V. Chernikov d->bd_zcopy = counter_u64_fetch(bd->bd_zcopy); 29004d621040SChristian S.J. Peron d->bd_bufmode = bd->bd_bufmode; 290169f7644bSChristian S.J. Peron } 290269f7644bSChristian S.J. Peron 29036c74ff0eSAlexander V. Chernikov /* 29046c74ff0eSAlexander V. Chernikov * Handle `netstat -B' stats request 29056c74ff0eSAlexander V. Chernikov */ 290669f7644bSChristian S.J. Peron static int 290769f7644bSChristian S.J. Peron bpf_stats_sysctl(SYSCTL_HANDLER_ARGS) 290869f7644bSChristian S.J. Peron { 29090e1152fcSHans Petter Selasky static const struct xbpf_d zerostats; 29100e1152fcSHans Petter Selasky struct xbpf_d *xbdbuf, *xbd, tempstats; 2911422a63daSChristian S.J. Peron int index, error; 291269f7644bSChristian S.J. Peron struct bpf_if *bp; 291369f7644bSChristian S.J. Peron struct bpf_d *bd; 291469f7644bSChristian S.J. Peron 291569f7644bSChristian S.J. Peron /* 291669f7644bSChristian S.J. Peron * XXX This is not technically correct. It is possible for non 291769f7644bSChristian S.J. Peron * privileged users to open bpf devices. It would make sense 291869f7644bSChristian S.J. Peron * if the users who opened the devices were able to retrieve 291969f7644bSChristian S.J. Peron * the statistics for them, too. 292069f7644bSChristian S.J. Peron */ 2921acd3428bSRobert Watson error = priv_check(req->td, PRIV_NET_BPF); 292269f7644bSChristian S.J. Peron if (error) 292369f7644bSChristian S.J. Peron return (error); 29240e37f3e1SChristian S.J. Peron /* 29250e37f3e1SChristian S.J. Peron * Check to see if the user is requesting that the counters be 29260e37f3e1SChristian S.J. 
Peron * zeroed out. Explicitly check that the supplied data is zeroed, 29270e37f3e1SChristian S.J. Peron * as we aren't allowing the user to set the counters currently. 29280e37f3e1SChristian S.J. Peron */ 29290e37f3e1SChristian S.J. Peron if (req->newptr != NULL) { 29300e1152fcSHans Petter Selasky if (req->newlen != sizeof(tempstats)) 29310e37f3e1SChristian S.J. Peron return (EINVAL); 29320e1152fcSHans Petter Selasky memset(&tempstats, 0, sizeof(tempstats)); 29330e1152fcSHans Petter Selasky error = SYSCTL_IN(req, &tempstats, sizeof(tempstats)); 29340e1152fcSHans Petter Selasky if (error) 29350e1152fcSHans Petter Selasky return (error); 29360e1152fcSHans Petter Selasky if (bcmp(&tempstats, &zerostats, sizeof(tempstats)) != 0) 29370e37f3e1SChristian S.J. Peron return (EINVAL); 29380e37f3e1SChristian S.J. Peron bpf_zero_counters(); 29390e37f3e1SChristian S.J. Peron return (0); 29400e37f3e1SChristian S.J. Peron } 294169f7644bSChristian S.J. Peron if (req->oldptr == NULL) 2942422a63daSChristian S.J. Peron return (SYSCTL_OUT(req, 0, bpf_bpfd_cnt * sizeof(*xbd))); 294369f7644bSChristian S.J. Peron if (bpf_bpfd_cnt == 0) 294469f7644bSChristian S.J. Peron return (SYSCTL_OUT(req, 0, 0)); 2945422a63daSChristian S.J. Peron xbdbuf = malloc(req->oldlen, M_BPF, M_WAITOK); 2946e4b3229aSAlexander V. Chernikov BPF_LOCK(); 2947422a63daSChristian S.J. Peron if (req->oldlen < (bpf_bpfd_cnt * sizeof(*xbd))) { 2948e4b3229aSAlexander V. Chernikov BPF_UNLOCK(); 2949422a63daSChristian S.J. Peron free(xbdbuf, M_BPF); 2950422a63daSChristian S.J. Peron return (ENOMEM); 2951422a63daSChristian S.J. Peron } 2952422a63daSChristian S.J. Peron index = 0; 295369f7644bSChristian S.J. Peron LIST_FOREACH(bp, &bpf_iflist, bif_next) { 2954e4b3229aSAlexander V. Chernikov BPFIF_RLOCK(bp); 295551ec1eb7SAlexander V. Chernikov /* Send writers-only first */ 295651ec1eb7SAlexander V. Chernikov LIST_FOREACH(bd, &bp->bif_wlist, bd_next) { 295751ec1eb7SAlexander V. 
Chernikov xbd = &xbdbuf[index++]; 2958afa85850SAlexander V. Chernikov BPFD_LOCK(bd); 295951ec1eb7SAlexander V. Chernikov bpfstats_fill_xbpf(xbd, bd); 2960afa85850SAlexander V. Chernikov BPFD_UNLOCK(bd); 296151ec1eb7SAlexander V. Chernikov } 296269f7644bSChristian S.J. Peron LIST_FOREACH(bd, &bp->bif_dlist, bd_next) { 2963422a63daSChristian S.J. Peron xbd = &xbdbuf[index++]; 2964afa85850SAlexander V. Chernikov BPFD_LOCK(bd); 2965422a63daSChristian S.J. Peron bpfstats_fill_xbpf(xbd, bd); 2966afa85850SAlexander V. Chernikov BPFD_UNLOCK(bd); 296769f7644bSChristian S.J. Peron } 2968e4b3229aSAlexander V. Chernikov BPFIF_RUNLOCK(bp); 296969f7644bSChristian S.J. Peron } 2970e4b3229aSAlexander V. Chernikov BPF_UNLOCK(); 2971422a63daSChristian S.J. Peron error = SYSCTL_OUT(req, xbdbuf, index * sizeof(*xbd)); 2972422a63daSChristian S.J. Peron free(xbdbuf, M_BPF); 297369f7644bSChristian S.J. Peron return (error); 297469f7644bSChristian S.J. Peron } 297569f7644bSChristian S.J. Peron 2976237fdd78SRobert Watson SYSINIT(bpfdev,SI_SUB_DRIVERS,SI_ORDER_MIDDLE,bpf_drvinit,NULL); 297753ac6efbSJulian Elischer 29785bb5f2c9SPeter Wemm #else /* !DEV_BPF && !NETGRAPH_BPF */ 2979f8dc4716SMike Smith /* 2980f8dc4716SMike Smith * NOP stubs to allow bpf-using drivers to load and function. 2981f8dc4716SMike Smith * 2982f8dc4716SMike Smith * A 'better' implementation would allow the core bpf functionality 2983f8dc4716SMike Smith * to be loaded at runtime. 2984f8dc4716SMike Smith */ 29857eae78a4SChristian S.J. Peron static struct bpf_if bp_null; 2986f8dc4716SMike Smith 2987f8dc4716SMike Smith void 298819ba8395SChristian S.J. Peron bpf_tap(struct bpf_if *bp, u_char *pkt, u_int pktlen) 2989f8dc4716SMike Smith { 2990f8dc4716SMike Smith } 2991f8dc4716SMike Smith 2992f8dc4716SMike Smith void 299319ba8395SChristian S.J. Peron bpf_mtap(struct bpf_if *bp, struct mbuf *m) 2994f8dc4716SMike Smith { 2995f8dc4716SMike Smith } 2996f8dc4716SMike Smith 2997f8dc4716SMike Smith void 299819ba8395SChristian S.J. 
Peron bpf_mtap2(struct bpf_if *bp, void *d, u_int l, struct mbuf *m) 2999437ffe18SSam Leffler { 3000437ffe18SSam Leffler } 3001437ffe18SSam Leffler 3002437ffe18SSam Leffler void 300319ba8395SChristian S.J. Peron bpfattach(struct ifnet *ifp, u_int dlt, u_int hdrlen) 3004f8dc4716SMike Smith { 30057eae78a4SChristian S.J. Peron 30067eae78a4SChristian S.J. Peron bpfattach2(ifp, dlt, hdrlen, &ifp->if_bpf); 3007f8dc4716SMike Smith } 3008f8dc4716SMike Smith 3009da626c17SBill Paul void 301019ba8395SChristian S.J. Peron bpfattach2(struct ifnet *ifp, u_int dlt, u_int hdrlen, struct bpf_if **driverp) 30115f7a7923SSam Leffler { 30127eae78a4SChristian S.J. Peron 30137eae78a4SChristian S.J. Peron *driverp = &bp_null; 30145f7a7923SSam Leffler } 30155f7a7923SSam Leffler 30165f7a7923SSam Leffler void 301719ba8395SChristian S.J. Peron bpfdetach(struct ifnet *ifp) 3018da626c17SBill Paul { 3019da626c17SBill Paul } 3020da626c17SBill Paul 3021f8dc4716SMike Smith u_int 302219ba8395SChristian S.J. Peron bpf_filter(const struct bpf_insn *pc, u_char *p, u_int wirelen, u_int buflen) 3023f8dc4716SMike Smith { 3024f8dc4716SMike Smith return -1; /* "no filter" behaviour */ 3025f8dc4716SMike Smith } 3026f8dc4716SMike Smith 30275bb5f2c9SPeter Wemm int 302819ba8395SChristian S.J. Peron bpf_validate(const struct bpf_insn *f, int len) 30295bb5f2c9SPeter Wemm { 30305bb5f2c9SPeter Wemm return 0; /* false */ 30315bb5f2c9SPeter Wemm } 30325bb5f2c9SPeter Wemm 30335bb5f2c9SPeter Wemm #endif /* !DEV_BPF && !NETGRAPH_BPF */ 303405fc4164SBjoern A. Zeeb 303505fc4164SBjoern A. Zeeb #ifdef DDB 303605fc4164SBjoern A. Zeeb static void 303705fc4164SBjoern A. Zeeb bpf_show_bpf_if(struct bpf_if *bpf_if) 303805fc4164SBjoern A. Zeeb { 303905fc4164SBjoern A. Zeeb 304005fc4164SBjoern A. Zeeb if (bpf_if == NULL) 304105fc4164SBjoern A. Zeeb return; 304205fc4164SBjoern A. Zeeb db_printf("%p:\n", bpf_if); 304305fc4164SBjoern A. Zeeb #define BPF_DB_PRINTF(f, e) db_printf(" %s = " f "\n", #e, bpf_if->e); 304405fc4164SBjoern A. 
Zeeb /* bif_ext.bif_next */ 304505fc4164SBjoern A. Zeeb /* bif_ext.bif_dlist */ 304605fc4164SBjoern A. Zeeb BPF_DB_PRINTF("%#x", bif_dlt); 304705fc4164SBjoern A. Zeeb BPF_DB_PRINTF("%u", bif_hdrlen); 304805fc4164SBjoern A. Zeeb BPF_DB_PRINTF("%p", bif_ifp); 304905fc4164SBjoern A. Zeeb /* bif_lock */ 305005fc4164SBjoern A. Zeeb /* bif_wlist */ 305105fc4164SBjoern A. Zeeb BPF_DB_PRINTF("%#x", bif_flags); 305205fc4164SBjoern A. Zeeb } 305305fc4164SBjoern A. Zeeb 305405fc4164SBjoern A. Zeeb DB_SHOW_COMMAND(bpf_if, db_show_bpf_if) 305505fc4164SBjoern A. Zeeb { 305605fc4164SBjoern A. Zeeb 305705fc4164SBjoern A. Zeeb if (!have_addr) { 305805fc4164SBjoern A. Zeeb db_printf("usage: show bpf_if <struct bpf_if *>\n"); 305905fc4164SBjoern A. Zeeb return; 306005fc4164SBjoern A. Zeeb } 306105fc4164SBjoern A. Zeeb 306205fc4164SBjoern A. Zeeb bpf_show_bpf_if((struct bpf_if *)addr); 306305fc4164SBjoern A. Zeeb } 306405fc4164SBjoern A. Zeeb #endif 3065