xref: /freebsd/sys/net/bpf.c (revision 0e1152fcc2fe48dea2583ac89d30ba77b4ab78cc)
1c398230bSWarner Losh /*-
2df8bae1dSRodney W. Grimes  * Copyright (c) 1990, 1991, 1993
3253a3814SLawrence Stewart  *	The Regents of the University of California.  All rights reserved.
4df8bae1dSRodney W. Grimes  *
5df8bae1dSRodney W. Grimes  * This code is derived from the Stanford/CMU enet packet filter,
6df8bae1dSRodney W. Grimes  * (net/enet.c) distributed as part of 4.3BSD, and code contributed
7df8bae1dSRodney W. Grimes  * to Berkeley by Steven McCanne and Van Jacobson both of Lawrence
8df8bae1dSRodney W. Grimes  * Berkeley Laboratory.
9df8bae1dSRodney W. Grimes  *
10df8bae1dSRodney W. Grimes  * Redistribution and use in source and binary forms, with or without
11df8bae1dSRodney W. Grimes  * modification, are permitted provided that the following conditions
12df8bae1dSRodney W. Grimes  * are met:
13df8bae1dSRodney W. Grimes  * 1. Redistributions of source code must retain the above copyright
14df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer.
15df8bae1dSRodney W. Grimes  * 2. Redistributions in binary form must reproduce the above copyright
16df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer in the
17df8bae1dSRodney W. Grimes  *    documentation and/or other materials provided with the distribution.
18df8bae1dSRodney W. Grimes  * 4. Neither the name of the University nor the names of its contributors
19df8bae1dSRodney W. Grimes  *    may be used to endorse or promote products derived from this software
20df8bae1dSRodney W. Grimes  *    without specific prior written permission.
21df8bae1dSRodney W. Grimes  *
22df8bae1dSRodney W. Grimes  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23df8bae1dSRodney W. Grimes  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24df8bae1dSRodney W. Grimes  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25df8bae1dSRodney W. Grimes  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26df8bae1dSRodney W. Grimes  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27df8bae1dSRodney W. Grimes  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28df8bae1dSRodney W. Grimes  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29df8bae1dSRodney W. Grimes  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30df8bae1dSRodney W. Grimes  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31df8bae1dSRodney W. Grimes  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32df8bae1dSRodney W. Grimes  * SUCH DAMAGE.
33df8bae1dSRodney W. Grimes  *
344f252c4dSRuslan Ermilov  *      @(#)bpf.c	8.4 (Berkeley) 1/9/95
35df8bae1dSRodney W. Grimes  */
36df8bae1dSRodney W. Grimes 
37c7866007SRobert Watson #include <sys/cdefs.h>
38c7866007SRobert Watson __FBSDID("$FreeBSD$");
39c7866007SRobert Watson 
405bb5f2c9SPeter Wemm #include "opt_bpf.h"
41fc0a61a4SKonstantin Belousov #include "opt_compat.h"
425bb5f2c9SPeter Wemm #include "opt_netgraph.h"
43df8bae1dSRodney W. Grimes 
4495aab9ccSJohn-Mark Gurney #include <sys/types.h>
45df8bae1dSRodney W. Grimes #include <sys/param.h>
46e4b3229aSAlexander V. Chernikov #include <sys/lock.h>
47e4b3229aSAlexander V. Chernikov #include <sys/rwlock.h>
48df8bae1dSRodney W. Grimes #include <sys/systm.h>
49ce7609a4SBruce Evans #include <sys/conf.h>
50e76eee55SPoul-Henning Kamp #include <sys/fcntl.h>
51ebd8672cSBjoern A. Zeeb #include <sys/jail.h>
524d1d4912SBruce Evans #include <sys/malloc.h>
53df8bae1dSRodney W. Grimes #include <sys/mbuf.h>
54df8bae1dSRodney W. Grimes #include <sys/time.h>
55acd3428bSRobert Watson #include <sys/priv.h>
56df8bae1dSRodney W. Grimes #include <sys/proc.h>
570310c19fSBruce Evans #include <sys/signalvar.h>
58528f627fSBruce Evans #include <sys/filio.h>
59528f627fSBruce Evans #include <sys/sockio.h>
60528f627fSBruce Evans #include <sys/ttycom.h>
61e76eee55SPoul-Henning Kamp #include <sys/uio.h>
62df8bae1dSRodney W. Grimes 
6395aab9ccSJohn-Mark Gurney #include <sys/event.h>
6495aab9ccSJohn-Mark Gurney #include <sys/file.h>
65243ac7d8SPeter Wemm #include <sys/poll.h>
6695aab9ccSJohn-Mark Gurney #include <sys/proc.h>
67df8bae1dSRodney W. Grimes 
68df8bae1dSRodney W. Grimes #include <sys/socket.h>
69df8bae1dSRodney W. Grimes 
70fba9235dSBruce Evans #include <net/if.h>
7176039bc8SGleb Smirnoff #include <net/if_var.h>
72e4b3229aSAlexander V. Chernikov #define	BPF_INTERNAL
73df8bae1dSRodney W. Grimes #include <net/bpf.h>
744d621040SChristian S.J. Peron #include <net/bpf_buffer.h>
75ae275efcSJung-uk Kim #ifdef BPF_JITTER
76ae275efcSJung-uk Kim #include <net/bpf_jitter.h>
77ae275efcSJung-uk Kim #endif
784d621040SChristian S.J. Peron #include <net/bpf_zerocopy.h>
79df8bae1dSRodney W. Grimes #include <net/bpfdesc.h>
80530c0060SRobert Watson #include <net/vnet.h>
81df8bae1dSRodney W. Grimes 
82df8bae1dSRodney W. Grimes #include <netinet/in.h>
83df8bae1dSRodney W. Grimes #include <netinet/if_ether.h>
84df8bae1dSRodney W. Grimes #include <sys/kernel.h>
85f708ef1bSPoul-Henning Kamp #include <sys/sysctl.h>
867b778b5eSEivind Eklund 
87246b5467SSam Leffler #include <net80211/ieee80211_freebsd.h>
88246b5467SSam Leffler 
89aed55708SRobert Watson #include <security/mac/mac_framework.h>
90aed55708SRobert Watson 
914d621040SChristian S.J. Peron MALLOC_DEFINE(M_BPF, "BPF", "BPF data");
9287f6c662SJulian Elischer 
935bb5f2c9SPeter Wemm #if defined(DEV_BPF) || defined(NETGRAPH_BPF)
9453ac6efbSJulian Elischer 
/* Sleep priority value; the original annotation marks it "interruptible". */
#define PRINET  26

/*
 * Number of bytes from the start of a BPF header of the given struct type
 * up to and including its bh_hdrlen member.  Any padding the compiler places
 * after bh_hdrlen is not counted.
 */
#define	SIZEOF_BPF_HDR(type)	\
    (offsetof(type, bh_hdrlen) + sizeof(((type *)0)->bh_hdrlen))
99547d94bdSJung-uk Kim 
100fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32
101fc0a61a4SKonstantin Belousov #include <sys/mount.h>
102fc0a61a4SKonstantin Belousov #include <compat/freebsd32/freebsd32.h>
/* Alignment unit used for the 32-bit compat layout: the size of an int32_t. */
#define BPF_ALIGNMENT32 (sizeof(int32_t))
/* Round x up to the next multiple of BPF_ALIGNMENT32. */
#define BPF_WORDALIGN32(x) \
    (((x) + (BPF_ALIGNMENT32 - 1)) & ~(BPF_ALIGNMENT32 - 1))
105fc0a61a4SKonstantin Belousov 
106547d94bdSJung-uk Kim #ifndef BURN_BRIDGES
107fc0a61a4SKonstantin Belousov /*
108fc0a61a4SKonstantin Belousov  * 32-bit version of structure prepended to each packet.  We use this header
109fc0a61a4SKonstantin Belousov  * instead of the standard one for 32-bit streams.  We mark the a stream as
110fc0a61a4SKonstantin Belousov  * 32-bit the first time we see a 32-bit compat ioctl request.
111fc0a61a4SKonstantin Belousov  */
112fc0a61a4SKonstantin Belousov struct bpf_hdr32 {
113fc0a61a4SKonstantin Belousov 	struct timeval32 bh_tstamp;	/* time stamp */
114fc0a61a4SKonstantin Belousov 	uint32_t	bh_caplen;	/* length of captured portion */
115fc0a61a4SKonstantin Belousov 	uint32_t	bh_datalen;	/* original length of packet */
116fc0a61a4SKonstantin Belousov 	uint16_t	bh_hdrlen;	/* length of bpf header (this struct
117fc0a61a4SKonstantin Belousov 					   plus alignment padding) */
118fc0a61a4SKonstantin Belousov };
119253a3814SLawrence Stewart #endif
120fc0a61a4SKonstantin Belousov 
121fc0a61a4SKonstantin Belousov struct bpf_program32 {
122fc0a61a4SKonstantin Belousov 	u_int bf_len;
123fc0a61a4SKonstantin Belousov 	uint32_t bf_insns;
124fc0a61a4SKonstantin Belousov };
125fc0a61a4SKonstantin Belousov 
126fc0a61a4SKonstantin Belousov struct bpf_dltlist32 {
127fc0a61a4SKonstantin Belousov 	u_int	bfl_len;
128fc0a61a4SKonstantin Belousov 	u_int	bfl_list;
129fc0a61a4SKonstantin Belousov };
130fc0a61a4SKonstantin Belousov 
/*
 * ioctl request codes built on the 32-bit argument structures above
 * (struct bpf_program32, struct timeval32, struct bpf_dltlist32).
 */
#define	BIOCSETF32		_IOW('B', 103, struct bpf_program32)
#define	BIOCSRTIMEOUT32		_IOW('B', 109, struct timeval32)
#define	BIOCGRTIMEOUT32		_IOR('B', 110, struct timeval32)
#define	BIOCGDLTLIST32		_IOWR('B', 121, struct bpf_dltlist32)
#define	BIOCSETWF32		_IOW('B', 123, struct bpf_program32)
#define	BIOCSETFNR32		_IOW('B', 130, struct bpf_program32)
137253a3814SLawrence Stewart #endif
138fc0a61a4SKonstantin Belousov 
139df8bae1dSRodney W. Grimes /*
140d1a67300SRobert Watson  * bpf_iflist is a list of BPF interface structures, each corresponding to a
141d1a67300SRobert Watson  * specific DLT.  The same network interface might have several BPF interface
142d1a67300SRobert Watson  * structures registered by different layers in the stack (i.e., 802.11
143d1a67300SRobert Watson  * frames, ethernet frames, etc).
144df8bae1dSRodney W. Grimes  */
145f079a0faSAlexander V. Chernikov static LIST_HEAD(, bpf_if)	bpf_iflist, bpf_freelist;
146e7bb21b3SJonathan Lemon static struct mtx	bpf_mtx;		/* bpf global lock */
14769f7644bSChristian S.J. Peron static int		bpf_bpfd_cnt;
148df8bae1dSRodney W. Grimes 
14919ba8395SChristian S.J. Peron static void	bpf_attachd(struct bpf_d *, struct bpf_if *);
15019ba8395SChristian S.J. Peron static void	bpf_detachd(struct bpf_d *);
1516c74ff0eSAlexander V. Chernikov static void	bpf_detachd_locked(struct bpf_d *);
152929ddbbbSAlfred Perlstein static void	bpf_freed(struct bpf_d *);
153cb44b6dfSAndrew Thompson static int	bpf_movein(struct uio *, int, struct ifnet *, struct mbuf **,
154560a54e1SJung-uk Kim 		    struct sockaddr *, int *, struct bpf_insn *);
155929ddbbbSAlfred Perlstein static int	bpf_setif(struct bpf_d *, struct ifreq *);
156929ddbbbSAlfred Perlstein static void	bpf_timed_out(void *);
157e7bb21b3SJonathan Lemon static __inline void
158929ddbbbSAlfred Perlstein 		bpf_wakeup(struct bpf_d *);
1594d621040SChristian S.J. Peron static void	catchpacket(struct bpf_d *, u_char *, u_int, u_int,
1604d621040SChristian S.J. Peron 		    void (*)(struct bpf_d *, caddr_t, u_int, void *, u_int),
161547d94bdSJung-uk Kim 		    struct bintime *);
162929ddbbbSAlfred Perlstein static void	reset_d(struct bpf_d *);
16393e39f0bSChristian S.J. Peron static int	bpf_setf(struct bpf_d *, struct bpf_program *, u_long cmd);
1648eab61f3SSam Leffler static int	bpf_getdltlist(struct bpf_d *, struct bpf_dltlist *);
1658eab61f3SSam Leffler static int	bpf_setdlt(struct bpf_d *, u_int);
16695aab9ccSJohn-Mark Gurney static void	filt_bpfdetach(struct knote *);
16795aab9ccSJohn-Mark Gurney static int	filt_bpfread(struct knote *, long);
168a3272e3cSChristian S.J. Peron static void	bpf_drvinit(void *);
16969f7644bSChristian S.J. Peron static int	bpf_stats_sysctl(SYSCTL_HANDLER_ARGS);
17069f7644bSChristian S.J. Peron 
17169f7644bSChristian S.J. Peron SYSCTL_NODE(_net, OID_AUTO, bpf, CTLFLAG_RW, 0, "bpf sysctl");
17212dc9582SJung-uk Kim int bpf_maxinsns = BPF_MAXINSNS;
17369f7644bSChristian S.J. Peron SYSCTL_INT(_net_bpf, OID_AUTO, maxinsns, CTLFLAG_RW,
17469f7644bSChristian S.J. Peron     &bpf_maxinsns, 0, "Maximum bpf program instructions");
175ffeeb924SChristian S.J. Peron static int bpf_zerocopy_enable = 0;
1764d621040SChristian S.J. Peron SYSCTL_INT(_net_bpf, OID_AUTO, zerocopy_enable, CTLFLAG_RW,
1774d621040SChristian S.J. Peron     &bpf_zerocopy_enable, 0, "Enable new zero-copy BPF buffer sessions");
1786472ac3dSEd Schouten static SYSCTL_NODE(_net_bpf, OID_AUTO, stats, CTLFLAG_MPSAFE | CTLFLAG_RW,
17969f7644bSChristian S.J. Peron     bpf_stats_sysctl, "bpf statistics portal");
180df8bae1dSRodney W. Grimes 
18151ec1eb7SAlexander V. Chernikov static VNET_DEFINE(int, bpf_optimize_writers) = 0;
18251ec1eb7SAlexander V. Chernikov #define	V_bpf_optimize_writers VNET(bpf_optimize_writers)
18351ec1eb7SAlexander V. Chernikov SYSCTL_VNET_INT(_net_bpf, OID_AUTO, optimize_writers,
18451ec1eb7SAlexander V. Chernikov     CTLFLAG_RW, &VNET_NAME(bpf_optimize_writers), 0,
18551ec1eb7SAlexander V. Chernikov     "Do not send packets until BPF program is set");
18651ec1eb7SAlexander V. Chernikov 
18787f6c662SJulian Elischer static	d_open_t	bpfopen;
18887f6c662SJulian Elischer static	d_read_t	bpfread;
18987f6c662SJulian Elischer static	d_write_t	bpfwrite;
19087f6c662SJulian Elischer static	d_ioctl_t	bpfioctl;
191243ac7d8SPeter Wemm static	d_poll_t	bpfpoll;
19295aab9ccSJohn-Mark Gurney static	d_kqfilter_t	bpfkqfilter;
19387f6c662SJulian Elischer 
1944e2f199eSPoul-Henning Kamp static struct cdevsw bpf_cdevsw = {
195dc08ffecSPoul-Henning Kamp 	.d_version =	D_VERSION,
1967ac40f5fSPoul-Henning Kamp 	.d_open =	bpfopen,
1977ac40f5fSPoul-Henning Kamp 	.d_read =	bpfread,
1987ac40f5fSPoul-Henning Kamp 	.d_write =	bpfwrite,
1997ac40f5fSPoul-Henning Kamp 	.d_ioctl =	bpfioctl,
2007ac40f5fSPoul-Henning Kamp 	.d_poll =	bpfpoll,
2017ac40f5fSPoul-Henning Kamp 	.d_name =	"bpf",
20295aab9ccSJohn-Mark Gurney 	.d_kqfilter =	bpfkqfilter,
2034e2f199eSPoul-Henning Kamp };
20487f6c662SJulian Elischer 
205e76d823bSRobert Watson static struct filterops bpfread_filtops = {
206e76d823bSRobert Watson 	.f_isfd = 1,
207e76d823bSRobert Watson 	.f_detach = filt_bpfdetach,
208e76d823bSRobert Watson 	.f_event = filt_bpfread,
209e76d823bSRobert Watson };
21087f6c662SJulian Elischer 
211afa85850SAlexander V. Chernikov eventhandler_tag	bpf_ifdetach_cookie = NULL;
212afa85850SAlexander V. Chernikov 
2134d621040SChristian S.J. Peron /*
2146c74ff0eSAlexander V. Chernikov  * LOCKING MODEL USED BY BPF:
2156c74ff0eSAlexander V. Chernikov  * Locks:
2166c74ff0eSAlexander V. Chernikov  * 1) global lock (BPF_LOCK). Mutex, used to protect interface addition/removal,
2176c74ff0eSAlexander V. Chernikov  * some global counters and every bpf_if reference.
2186c74ff0eSAlexander V. Chernikov  * 2) Interface lock. Rwlock, used to protect list of BPF descriptors and their filters.
219afa85850SAlexander V. Chernikov  * 3) Descriptor lock. Mutex, used to protect BPF buffers and various structure fields
2206c74ff0eSAlexander V. Chernikov  *   used by bpf_mtap code.
2216c74ff0eSAlexander V. Chernikov  *
2226c74ff0eSAlexander V. Chernikov  * Lock order:
2236c74ff0eSAlexander V. Chernikov  *
2246c74ff0eSAlexander V. Chernikov  * Global lock, interface lock, descriptor lock
2256c74ff0eSAlexander V. Chernikov  *
2266c74ff0eSAlexander V. Chernikov  * We have to acquire interface lock before descriptor main lock due to BPF_MTAP[2]
2276c74ff0eSAlexander V. Chernikov  * working model. In many places (like bpf_detachd) we start with BPF descriptor
2286c74ff0eSAlexander V. Chernikov  * (and we need to at least rlock it to get reliable interface pointer). This
2296c74ff0eSAlexander V. Chernikov  * gives us potential LOR. As a result, we use global lock to protect from bpf_if
2306c74ff0eSAlexander V. Chernikov  * change in every such place.
2316c74ff0eSAlexander V. Chernikov  *
2326c74ff0eSAlexander V. Chernikov  * Changing d->bd_bif is protected by 1) global lock, 2) interface lock and
2336c74ff0eSAlexander V. Chernikov  * 3) descriptor main wlock.
2346c74ff0eSAlexander V. Chernikov  * Reading bd_bif can be protected by any of these locks, typically global lock.
2356c74ff0eSAlexander V. Chernikov  *
2366c74ff0eSAlexander V. Chernikov  * Changing read/write BPF filter is protected by the same three locks,
2376c74ff0eSAlexander V. Chernikov  * the same applies for reading.
2386c74ff0eSAlexander V. Chernikov  *
2396c74ff0eSAlexander V. Chernikov  * Sleeping in global lock is not allowed due to bpfdetach() using it.
2406c74ff0eSAlexander V. Chernikov  */
2416c74ff0eSAlexander V. Chernikov 
2426c74ff0eSAlexander V. Chernikov /*
2434d621040SChristian S.J. Peron  * Wrapper functions for various buffering methods.  If the set of buffer
2444d621040SChristian S.J. Peron  * modes expands, we will probably want to introduce a switch data structure
2454d621040SChristian S.J. Peron  * similar to protosw, etc.
2464d621040SChristian S.J. Peron  */
2474d621040SChristian S.J. Peron static void
2484d621040SChristian S.J. Peron bpf_append_bytes(struct bpf_d *d, caddr_t buf, u_int offset, void *src,
2494d621040SChristian S.J. Peron     u_int len)
2504d621040SChristian S.J. Peron {
2514d621040SChristian S.J. Peron 
252afa85850SAlexander V. Chernikov 	BPFD_LOCK_ASSERT(d);
2534d621040SChristian S.J. Peron 
2544d621040SChristian S.J. Peron 	switch (d->bd_bufmode) {
2554d621040SChristian S.J. Peron 	case BPF_BUFMODE_BUFFER:
2564d621040SChristian S.J. Peron 		return (bpf_buffer_append_bytes(d, buf, offset, src, len));
2574d621040SChristian S.J. Peron 
2584d621040SChristian S.J. Peron 	case BPF_BUFMODE_ZBUF:
2594d621040SChristian S.J. Peron 		d->bd_zcopy++;
2604d621040SChristian S.J. Peron 		return (bpf_zerocopy_append_bytes(d, buf, offset, src, len));
2614d621040SChristian S.J. Peron 
2624d621040SChristian S.J. Peron 	default:
2634d621040SChristian S.J. Peron 		panic("bpf_buf_append_bytes");
2644d621040SChristian S.J. Peron 	}
2654d621040SChristian S.J. Peron }
2664d621040SChristian S.J. Peron 
2674d621040SChristian S.J. Peron static void
2684d621040SChristian S.J. Peron bpf_append_mbuf(struct bpf_d *d, caddr_t buf, u_int offset, void *src,
2694d621040SChristian S.J. Peron     u_int len)
2704d621040SChristian S.J. Peron {
2714d621040SChristian S.J. Peron 
272afa85850SAlexander V. Chernikov 	BPFD_LOCK_ASSERT(d);
2734d621040SChristian S.J. Peron 
2744d621040SChristian S.J. Peron 	switch (d->bd_bufmode) {
2754d621040SChristian S.J. Peron 	case BPF_BUFMODE_BUFFER:
2764d621040SChristian S.J. Peron 		return (bpf_buffer_append_mbuf(d, buf, offset, src, len));
2774d621040SChristian S.J. Peron 
2784d621040SChristian S.J. Peron 	case BPF_BUFMODE_ZBUF:
2794d621040SChristian S.J. Peron 		d->bd_zcopy++;
2804d621040SChristian S.J. Peron 		return (bpf_zerocopy_append_mbuf(d, buf, offset, src, len));
2814d621040SChristian S.J. Peron 
2824d621040SChristian S.J. Peron 	default:
2834d621040SChristian S.J. Peron 		panic("bpf_buf_append_mbuf");
2844d621040SChristian S.J. Peron 	}
2854d621040SChristian S.J. Peron }
2864d621040SChristian S.J. Peron 
2874d621040SChristian S.J. Peron /*
28829f612ecSChristian S.J. Peron  * This function gets called when the free buffer is re-assigned.
28929f612ecSChristian S.J. Peron  */
29029f612ecSChristian S.J. Peron static void
29129f612ecSChristian S.J. Peron bpf_buf_reclaimed(struct bpf_d *d)
29229f612ecSChristian S.J. Peron {
29329f612ecSChristian S.J. Peron 
294afa85850SAlexander V. Chernikov 	BPFD_LOCK_ASSERT(d);
29529f612ecSChristian S.J. Peron 
29629f612ecSChristian S.J. Peron 	switch (d->bd_bufmode) {
29729f612ecSChristian S.J. Peron 	case BPF_BUFMODE_BUFFER:
29829f612ecSChristian S.J. Peron 		return;
29929f612ecSChristian S.J. Peron 
30029f612ecSChristian S.J. Peron 	case BPF_BUFMODE_ZBUF:
30129f612ecSChristian S.J. Peron 		bpf_zerocopy_buf_reclaimed(d);
30229f612ecSChristian S.J. Peron 		return;
30329f612ecSChristian S.J. Peron 
30429f612ecSChristian S.J. Peron 	default:
30529f612ecSChristian S.J. Peron 		panic("bpf_buf_reclaimed");
30629f612ecSChristian S.J. Peron 	}
30729f612ecSChristian S.J. Peron }
30829f612ecSChristian S.J. Peron 
30929f612ecSChristian S.J. Peron /*
3104d621040SChristian S.J. Peron  * If the buffer mechanism has a way to decide that a held buffer can be made
3114d621040SChristian S.J. Peron  * free, then it is exposed via the bpf_canfreebuf() interface.  (1) is
3124d621040SChristian S.J. Peron  * returned if the buffer can be discarded, (0) is returned if it cannot.
3134d621040SChristian S.J. Peron  */
3144d621040SChristian S.J. Peron static int
3154d621040SChristian S.J. Peron bpf_canfreebuf(struct bpf_d *d)
3164d621040SChristian S.J. Peron {
3174d621040SChristian S.J. Peron 
3184d621040SChristian S.J. Peron 	BPFD_LOCK_ASSERT(d);
3194d621040SChristian S.J. Peron 
3204d621040SChristian S.J. Peron 	switch (d->bd_bufmode) {
3214d621040SChristian S.J. Peron 	case BPF_BUFMODE_ZBUF:
3224d621040SChristian S.J. Peron 		return (bpf_zerocopy_canfreebuf(d));
3234d621040SChristian S.J. Peron 	}
3244d621040SChristian S.J. Peron 	return (0);
3254d621040SChristian S.J. Peron }
3264d621040SChristian S.J. Peron 
327a7a91e65SRobert Watson /*
328a7a91e65SRobert Watson  * Allow the buffer model to indicate that the current store buffer is
329a7a91e65SRobert Watson  * immutable, regardless of the appearance of space.  Return (1) if the
330a7a91e65SRobert Watson  * buffer is writable, and (0) if not.
331a7a91e65SRobert Watson  */
332a7a91e65SRobert Watson static int
333a7a91e65SRobert Watson bpf_canwritebuf(struct bpf_d *d)
334a7a91e65SRobert Watson {
335a7a91e65SRobert Watson 	BPFD_LOCK_ASSERT(d);
336a7a91e65SRobert Watson 
337a7a91e65SRobert Watson 	switch (d->bd_bufmode) {
338a7a91e65SRobert Watson 	case BPF_BUFMODE_ZBUF:
339a7a91e65SRobert Watson 		return (bpf_zerocopy_canwritebuf(d));
340a7a91e65SRobert Watson 	}
341a7a91e65SRobert Watson 	return (1);
342a7a91e65SRobert Watson }
343a7a91e65SRobert Watson 
344a7a91e65SRobert Watson /*
345a7a91e65SRobert Watson  * Notify buffer model that an attempt to write to the store buffer has
346a7a91e65SRobert Watson  * resulted in a dropped packet, in which case the buffer may be considered
347a7a91e65SRobert Watson  * full.
348a7a91e65SRobert Watson  */
349a7a91e65SRobert Watson static void
350a7a91e65SRobert Watson bpf_buffull(struct bpf_d *d)
351a7a91e65SRobert Watson {
352a7a91e65SRobert Watson 
353afa85850SAlexander V. Chernikov 	BPFD_LOCK_ASSERT(d);
354a7a91e65SRobert Watson 
355a7a91e65SRobert Watson 	switch (d->bd_bufmode) {
356a7a91e65SRobert Watson 	case BPF_BUFMODE_ZBUF:
357a7a91e65SRobert Watson 		bpf_zerocopy_buffull(d);
358a7a91e65SRobert Watson 		break;
359a7a91e65SRobert Watson 	}
360a7a91e65SRobert Watson }
361a7a91e65SRobert Watson 
362a7a91e65SRobert Watson /*
363a7a91e65SRobert Watson  * Notify the buffer model that a buffer has moved into the hold position.
364a7a91e65SRobert Watson  */
3654d621040SChristian S.J. Peron void
3664d621040SChristian S.J. Peron bpf_bufheld(struct bpf_d *d)
3674d621040SChristian S.J. Peron {
3684d621040SChristian S.J. Peron 
369afa85850SAlexander V. Chernikov 	BPFD_LOCK_ASSERT(d);
3704d621040SChristian S.J. Peron 
3714d621040SChristian S.J. Peron 	switch (d->bd_bufmode) {
3724d621040SChristian S.J. Peron 	case BPF_BUFMODE_ZBUF:
3734d621040SChristian S.J. Peron 		bpf_zerocopy_bufheld(d);
3744d621040SChristian S.J. Peron 		break;
3754d621040SChristian S.J. Peron 	}
3764d621040SChristian S.J. Peron }
3774d621040SChristian S.J. Peron 
3784d621040SChristian S.J. Peron static void
3794d621040SChristian S.J. Peron bpf_free(struct bpf_d *d)
3804d621040SChristian S.J. Peron {
3814d621040SChristian S.J. Peron 
3824d621040SChristian S.J. Peron 	switch (d->bd_bufmode) {
3834d621040SChristian S.J. Peron 	case BPF_BUFMODE_BUFFER:
3844d621040SChristian S.J. Peron 		return (bpf_buffer_free(d));
3854d621040SChristian S.J. Peron 
3864d621040SChristian S.J. Peron 	case BPF_BUFMODE_ZBUF:
3874d621040SChristian S.J. Peron 		return (bpf_zerocopy_free(d));
3884d621040SChristian S.J. Peron 
3894d621040SChristian S.J. Peron 	default:
3904d621040SChristian S.J. Peron 		panic("bpf_buf_free");
3914d621040SChristian S.J. Peron 	}
3924d621040SChristian S.J. Peron }
3934d621040SChristian S.J. Peron 
3944d621040SChristian S.J. Peron static int
3954d621040SChristian S.J. Peron bpf_uiomove(struct bpf_d *d, caddr_t buf, u_int len, struct uio *uio)
3964d621040SChristian S.J. Peron {
3974d621040SChristian S.J. Peron 
3984d621040SChristian S.J. Peron 	if (d->bd_bufmode != BPF_BUFMODE_BUFFER)
3994d621040SChristian S.J. Peron 		return (EOPNOTSUPP);
4004d621040SChristian S.J. Peron 	return (bpf_buffer_uiomove(d, buf, len, uio));
4014d621040SChristian S.J. Peron }
4024d621040SChristian S.J. Peron 
4034d621040SChristian S.J. Peron static int
4044d621040SChristian S.J. Peron bpf_ioctl_sblen(struct bpf_d *d, u_int *i)
4054d621040SChristian S.J. Peron {
4064d621040SChristian S.J. Peron 
4074d621040SChristian S.J. Peron 	if (d->bd_bufmode != BPF_BUFMODE_BUFFER)
4084d621040SChristian S.J. Peron 		return (EOPNOTSUPP);
4094d621040SChristian S.J. Peron 	return (bpf_buffer_ioctl_sblen(d, i));
4104d621040SChristian S.J. Peron }
4114d621040SChristian S.J. Peron 
4124d621040SChristian S.J. Peron static int
4134d621040SChristian S.J. Peron bpf_ioctl_getzmax(struct thread *td, struct bpf_d *d, size_t *i)
4144d621040SChristian S.J. Peron {
4154d621040SChristian S.J. Peron 
4164d621040SChristian S.J. Peron 	if (d->bd_bufmode != BPF_BUFMODE_ZBUF)
4174d621040SChristian S.J. Peron 		return (EOPNOTSUPP);
4184d621040SChristian S.J. Peron 	return (bpf_zerocopy_ioctl_getzmax(td, d, i));
4194d621040SChristian S.J. Peron }
4204d621040SChristian S.J. Peron 
4214d621040SChristian S.J. Peron static int
4224d621040SChristian S.J. Peron bpf_ioctl_rotzbuf(struct thread *td, struct bpf_d *d, struct bpf_zbuf *bz)
4234d621040SChristian S.J. Peron {
4244d621040SChristian S.J. Peron 
4254d621040SChristian S.J. Peron 	if (d->bd_bufmode != BPF_BUFMODE_ZBUF)
4264d621040SChristian S.J. Peron 		return (EOPNOTSUPP);
4274d621040SChristian S.J. Peron 	return (bpf_zerocopy_ioctl_rotzbuf(td, d, bz));
4284d621040SChristian S.J. Peron }
4294d621040SChristian S.J. Peron 
4304d621040SChristian S.J. Peron static int
4314d621040SChristian S.J. Peron bpf_ioctl_setzbuf(struct thread *td, struct bpf_d *d, struct bpf_zbuf *bz)
4324d621040SChristian S.J. Peron {
4334d621040SChristian S.J. Peron 
4344d621040SChristian S.J. Peron 	if (d->bd_bufmode != BPF_BUFMODE_ZBUF)
4354d621040SChristian S.J. Peron 		return (EOPNOTSUPP);
4364d621040SChristian S.J. Peron 	return (bpf_zerocopy_ioctl_setzbuf(td, d, bz));
4374d621040SChristian S.J. Peron }
4384d621040SChristian S.J. Peron 
4394d621040SChristian S.J. Peron /*
4404d621040SChristian S.J. Peron  * General BPF functions.
4414d621040SChristian S.J. Peron  */
442df8bae1dSRodney W. Grimes static int
443cb44b6dfSAndrew Thompson bpf_movein(struct uio *uio, int linktype, struct ifnet *ifp, struct mbuf **mp,
444560a54e1SJung-uk Kim     struct sockaddr *sockp, int *hdrlen, struct bpf_insn *wfilter)
445df8bae1dSRodney W. Grimes {
446246b5467SSam Leffler 	const struct ieee80211_bpf_params *p;
447cb44b6dfSAndrew Thompson 	struct ether_header *eh;
448df8bae1dSRodney W. Grimes 	struct mbuf *m;
449df8bae1dSRodney W. Grimes 	int error;
450df8bae1dSRodney W. Grimes 	int len;
451df8bae1dSRodney W. Grimes 	int hlen;
45293e39f0bSChristian S.J. Peron 	int slen;
453df8bae1dSRodney W. Grimes 
454df8bae1dSRodney W. Grimes 	/*
455df8bae1dSRodney W. Grimes 	 * Build a sockaddr based on the data link layer type.
456df8bae1dSRodney W. Grimes 	 * We do this at this level because the ethernet header
457df8bae1dSRodney W. Grimes 	 * is copied directly into the data field of the sockaddr.
458df8bae1dSRodney W. Grimes 	 * In the case of SLIP, there is no header and the packet
459df8bae1dSRodney W. Grimes 	 * is forwarded as is.
460df8bae1dSRodney W. Grimes 	 * Also, we are careful to leave room at the front of the mbuf
461df8bae1dSRodney W. Grimes 	 * for the link level header.
462df8bae1dSRodney W. Grimes 	 */
463df8bae1dSRodney W. Grimes 	switch (linktype) {
464df8bae1dSRodney W. Grimes 
465df8bae1dSRodney W. Grimes 	case DLT_SLIP:
466df8bae1dSRodney W. Grimes 		sockp->sa_family = AF_INET;
467df8bae1dSRodney W. Grimes 		hlen = 0;
468df8bae1dSRodney W. Grimes 		break;
469df8bae1dSRodney W. Grimes 
470df8bae1dSRodney W. Grimes 	case DLT_EN10MB:
471df8bae1dSRodney W. Grimes 		sockp->sa_family = AF_UNSPEC;
472df8bae1dSRodney W. Grimes 		/* XXX Would MAXLINKHDR be better? */
473797f247bSMatthew N. Dodd 		hlen = ETHER_HDR_LEN;
474df8bae1dSRodney W. Grimes 		break;
475df8bae1dSRodney W. Grimes 
476df8bae1dSRodney W. Grimes 	case DLT_FDDI:
477d41f24e7SDavid Greenman 		sockp->sa_family = AF_IMPLINK;
478d41f24e7SDavid Greenman 		hlen = 0;
479df8bae1dSRodney W. Grimes 		break;
480df8bae1dSRodney W. Grimes 
48122f05c43SAndrey A. Chernov 	case DLT_RAW:
482df8bae1dSRodney W. Grimes 		sockp->sa_family = AF_UNSPEC;
483df8bae1dSRodney W. Grimes 		hlen = 0;
484df8bae1dSRodney W. Grimes 		break;
485df8bae1dSRodney W. Grimes 
48601399f34SDavid Malone 	case DLT_NULL:
48701399f34SDavid Malone 		/*
48801399f34SDavid Malone 		 * null interface types require a 4 byte pseudo header which
48901399f34SDavid Malone 		 * corresponds to the address family of the packet.
49001399f34SDavid Malone 		 */
49101399f34SDavid Malone 		sockp->sa_family = AF_UNSPEC;
49201399f34SDavid Malone 		hlen = 4;
49301399f34SDavid Malone 		break;
49401399f34SDavid Malone 
4954f53e3ccSKenjiro Cho 	case DLT_ATM_RFC1483:
4964f53e3ccSKenjiro Cho 		/*
4974f53e3ccSKenjiro Cho 		 * en atm driver requires 4-byte atm pseudo header.
4984f53e3ccSKenjiro Cho 		 * though it isn't standard, vpi:vci needs to be
4994f53e3ccSKenjiro Cho 		 * specified anyway.
5004f53e3ccSKenjiro Cho 		 */
5014f53e3ccSKenjiro Cho 		sockp->sa_family = AF_UNSPEC;
5024f53e3ccSKenjiro Cho 		hlen = 12;	/* XXX 4(ATM_PH) + 3(LLC) + 5(SNAP) */
5034f53e3ccSKenjiro Cho 		break;
5044f53e3ccSKenjiro Cho 
50530fa52a6SBrian Somers 	case DLT_PPP:
50630fa52a6SBrian Somers 		sockp->sa_family = AF_UNSPEC;
50730fa52a6SBrian Somers 		hlen = 4;	/* This should match PPP_HDRLEN */
50830fa52a6SBrian Somers 		break;
50930fa52a6SBrian Somers 
510246b5467SSam Leffler 	case DLT_IEEE802_11:		/* IEEE 802.11 wireless */
511246b5467SSam Leffler 		sockp->sa_family = AF_IEEE80211;
512246b5467SSam Leffler 		hlen = 0;
513246b5467SSam Leffler 		break;
514246b5467SSam Leffler 
515246b5467SSam Leffler 	case DLT_IEEE802_11_RADIO:	/* IEEE 802.11 wireless w/ phy params */
516246b5467SSam Leffler 		sockp->sa_family = AF_IEEE80211;
517246b5467SSam Leffler 		sockp->sa_len = 12;	/* XXX != 0 */
518246b5467SSam Leffler 		hlen = sizeof(struct ieee80211_bpf_params);
519246b5467SSam Leffler 		break;
520246b5467SSam Leffler 
521df8bae1dSRodney W. Grimes 	default:
522df8bae1dSRodney W. Grimes 		return (EIO);
523df8bae1dSRodney W. Grimes 	}
524df8bae1dSRodney W. Grimes 
525df8bae1dSRodney W. Grimes 	len = uio->uio_resid;
526ed63043bSGleb Smirnoff 	if (len < hlen || len - hlen > ifp->if_mtu)
52701399f34SDavid Malone 		return (EMSGSIZE);
52801399f34SDavid Malone 
52941a7572bSGleb Smirnoff 	m = m_get2(len, M_WAITOK, MT_DATA, M_PKTHDR);
530ed63043bSGleb Smirnoff 	if (m == NULL)
531df8bae1dSRodney W. Grimes 		return (EIO);
532963e4c2aSGarrett Wollman 	m->m_pkthdr.len = m->m_len = len;
533df8bae1dSRodney W. Grimes 	*mp = m;
53424a229f4SSam Leffler 
53593e39f0bSChristian S.J. Peron 	error = uiomove(mtod(m, u_char *), len, uio);
53693e39f0bSChristian S.J. Peron 	if (error)
53793e39f0bSChristian S.J. Peron 		goto bad;
53893e39f0bSChristian S.J. Peron 
53993e39f0bSChristian S.J. Peron 	slen = bpf_filter(wfilter, mtod(m, u_char *), len, len);
54093e39f0bSChristian S.J. Peron 	if (slen == 0) {
54193e39f0bSChristian S.J. Peron 		error = EPERM;
54293e39f0bSChristian S.J. Peron 		goto bad;
54393e39f0bSChristian S.J. Peron 	}
54493e39f0bSChristian S.J. Peron 
545cb44b6dfSAndrew Thompson 	/* Check for multicast destination */
546cb44b6dfSAndrew Thompson 	switch (linktype) {
547cb44b6dfSAndrew Thompson 	case DLT_EN10MB:
548cb44b6dfSAndrew Thompson 		eh = mtod(m, struct ether_header *);
549cb44b6dfSAndrew Thompson 		if (ETHER_IS_MULTICAST(eh->ether_dhost)) {
550cb44b6dfSAndrew Thompson 			if (bcmp(ifp->if_broadcastaddr, eh->ether_dhost,
551cb44b6dfSAndrew Thompson 			    ETHER_ADDR_LEN) == 0)
552cb44b6dfSAndrew Thompson 				m->m_flags |= M_BCAST;
553cb44b6dfSAndrew Thompson 			else
554cb44b6dfSAndrew Thompson 				m->m_flags |= M_MCAST;
555cb44b6dfSAndrew Thompson 		}
556cb44b6dfSAndrew Thompson 		break;
557cb44b6dfSAndrew Thompson 	}
558cb44b6dfSAndrew Thompson 
559df8bae1dSRodney W. Grimes 	/*
56093e39f0bSChristian S.J. Peron 	 * Make room for link header, and copy it to sockaddr
561df8bae1dSRodney W. Grimes 	 */
562df8bae1dSRodney W. Grimes 	if (hlen != 0) {
563246b5467SSam Leffler 		if (sockp->sa_family == AF_IEEE80211) {
564246b5467SSam Leffler 			/*
565246b5467SSam Leffler 			 * Collect true length from the parameter header
566246b5467SSam Leffler 			 * NB: sockp is known to be zero'd so if we do a
567246b5467SSam Leffler 			 *     short copy unspecified parameters will be
568246b5467SSam Leffler 			 *     zero.
569246b5467SSam Leffler 			 * NB: packet may not be aligned after stripping
570246b5467SSam Leffler 			 *     bpf params
571246b5467SSam Leffler 			 * XXX check ibp_vers
572246b5467SSam Leffler 			 */
573246b5467SSam Leffler 			p = mtod(m, const struct ieee80211_bpf_params *);
574246b5467SSam Leffler 			hlen = p->ibp_len;
575246b5467SSam Leffler 			if (hlen > sizeof(sockp->sa_data)) {
576246b5467SSam Leffler 				error = EINVAL;
577246b5467SSam Leffler 				goto bad;
578246b5467SSam Leffler 			}
579246b5467SSam Leffler 		}
580a09968c4SAdrian Chadd 		bcopy(mtod(m, const void *), sockp->sa_data, hlen);
581df8bae1dSRodney W. Grimes 	}
582560a54e1SJung-uk Kim 	*hdrlen = hlen;
58393e39f0bSChristian S.J. Peron 
584df8bae1dSRodney W. Grimes 	return (0);
585df8bae1dSRodney W. Grimes bad:
586df8bae1dSRodney W. Grimes 	m_freem(m);
587df8bae1dSRodney W. Grimes 	return (error);
588df8bae1dSRodney W. Grimes }
589df8bae1dSRodney W. Grimes 
590df8bae1dSRodney W. Grimes /*
591df8bae1dSRodney W. Grimes  * Attach file to the bpf interface, i.e. make d listen on bp.
592df8bae1dSRodney W. Grimes  */
593df8bae1dSRodney W. Grimes static void
59419ba8395SChristian S.J. Peron bpf_attachd(struct bpf_d *d, struct bpf_if *bp)
595df8bae1dSRodney W. Grimes {
5966c74ff0eSAlexander V. Chernikov 	int op_w;
5976c74ff0eSAlexander V. Chernikov 
5986c74ff0eSAlexander V. Chernikov 	BPF_LOCK_ASSERT();
5996c74ff0eSAlexander V. Chernikov 
6006c74ff0eSAlexander V. Chernikov 	/*
6016c74ff0eSAlexander V. Chernikov 	 * Save sysctl value to protect from sysctl change
6026c74ff0eSAlexander V. Chernikov 	 * between reads
6036c74ff0eSAlexander V. Chernikov 	 */
6046c74ff0eSAlexander V. Chernikov 	op_w = V_bpf_optimize_writers;
6056c74ff0eSAlexander V. Chernikov 
6066c74ff0eSAlexander V. Chernikov 	if (d->bd_bif != NULL)
6076c74ff0eSAlexander V. Chernikov 		bpf_detachd_locked(d);
608df8bae1dSRodney W. Grimes 	/*
60951ec1eb7SAlexander V. Chernikov 	 * Point d at bp, and add d to the interface's list.
61051ec1eb7SAlexander V. Chernikov 	 * Since there are many applicaiotns using BPF for
61151ec1eb7SAlexander V. Chernikov 	 * sending raw packets only (dhcpd, cdpd are good examples)
61251ec1eb7SAlexander V. Chernikov 	 * we can delay adding d to the list of active listeners until
61351ec1eb7SAlexander V. Chernikov 	 * some filter is configured.
614df8bae1dSRodney W. Grimes 	 */
61551ec1eb7SAlexander V. Chernikov 
61651ec1eb7SAlexander V. Chernikov 	BPFIF_WLOCK(bp);
617afa85850SAlexander V. Chernikov 	BPFD_LOCK(d);
61851ec1eb7SAlexander V. Chernikov 
6196c74ff0eSAlexander V. Chernikov 	d->bd_bif = bp;
6206c74ff0eSAlexander V. Chernikov 
6216c74ff0eSAlexander V. Chernikov 	if (op_w != 0) {
62251ec1eb7SAlexander V. Chernikov 		/* Add to writers-only list */
62351ec1eb7SAlexander V. Chernikov 		LIST_INSERT_HEAD(&bp->bif_wlist, d, bd_next);
62451ec1eb7SAlexander V. Chernikov 		/*
62551ec1eb7SAlexander V. Chernikov 		 * We decrement bd_writer on every filter set operation.
62651ec1eb7SAlexander V. Chernikov 		 * First BIOCSETF is done by pcap_open_live() to set up
62751ec1eb7SAlexander V. Chernikov 		 * snap length. After that appliation usually sets its own filter
62851ec1eb7SAlexander V. Chernikov 		 */
62951ec1eb7SAlexander V. Chernikov 		d->bd_writer = 2;
63051ec1eb7SAlexander V. Chernikov 	} else
6314a3feeaaSRobert Watson 		LIST_INSERT_HEAD(&bp->bif_dlist, d, bd_next);
632df8bae1dSRodney W. Grimes 
633afa85850SAlexander V. Chernikov 	BPFD_UNLOCK(d);
634e4b3229aSAlexander V. Chernikov 	BPFIF_WUNLOCK(bp);
635b743c310SSam Leffler 
63651ec1eb7SAlexander V. Chernikov 	bpf_bpfd_cnt++;
63751ec1eb7SAlexander V. Chernikov 
63851ec1eb7SAlexander V. Chernikov 	CTR3(KTR_NET, "%s: bpf_attach called by pid %d, adding to %s list",
63951ec1eb7SAlexander V. Chernikov 	    __func__, d->bd_pid, d->bd_writer ? "writer" : "active");
64051ec1eb7SAlexander V. Chernikov 
6416c74ff0eSAlexander V. Chernikov 	if (op_w == 0)
64251ec1eb7SAlexander V. Chernikov 		EVENTHANDLER_INVOKE(bpf_track, bp->bif_ifp, bp->bif_dlt, 1);
64351ec1eb7SAlexander V. Chernikov }
64451ec1eb7SAlexander V. Chernikov 
64551ec1eb7SAlexander V. Chernikov /*
646402000ffSAlexander V. Chernikov  * Check if we need to upgrade our descriptor @d from write-only mode.
647402000ffSAlexander V. Chernikov  */
648402000ffSAlexander V. Chernikov static int
649402000ffSAlexander V. Chernikov bpf_check_upgrade(u_long cmd, struct bpf_d *d, struct bpf_insn *fcode, int flen)
650402000ffSAlexander V. Chernikov {
651402000ffSAlexander V. Chernikov 	int is_snap, need_upgrade;
652402000ffSAlexander V. Chernikov 
653402000ffSAlexander V. Chernikov 	/*
654402000ffSAlexander V. Chernikov 	 * Check if we've already upgraded or new filter is empty.
655402000ffSAlexander V. Chernikov 	 */
656402000ffSAlexander V. Chernikov 	if (d->bd_writer == 0 || fcode == NULL)
657402000ffSAlexander V. Chernikov 		return (0);
658402000ffSAlexander V. Chernikov 
659402000ffSAlexander V. Chernikov 	need_upgrade = 0;
660402000ffSAlexander V. Chernikov 
661402000ffSAlexander V. Chernikov 	/*
662402000ffSAlexander V. Chernikov 	 * Check if cmd looks like snaplen setting from
663402000ffSAlexander V. Chernikov 	 * pcap_bpf.c:pcap_open_live().
664402000ffSAlexander V. Chernikov 	 * Note we're not checking .k value here:
665402000ffSAlexander V. Chernikov 	 * while pcap_open_live() definitely sets to to non-zero value,
666402000ffSAlexander V. Chernikov 	 * we'd prefer to treat k=0 (deny ALL) case the same way: e.g.
667402000ffSAlexander V. Chernikov 	 * do not consider upgrading immediately
668402000ffSAlexander V. Chernikov 	 */
669402000ffSAlexander V. Chernikov 	if (cmd == BIOCSETF && flen == 1 && fcode[0].code == (BPF_RET | BPF_K))
670402000ffSAlexander V. Chernikov 		is_snap = 1;
671402000ffSAlexander V. Chernikov 	else
672402000ffSAlexander V. Chernikov 		is_snap = 0;
673402000ffSAlexander V. Chernikov 
674402000ffSAlexander V. Chernikov 	if (is_snap == 0) {
675402000ffSAlexander V. Chernikov 		/*
676402000ffSAlexander V. Chernikov 		 * We're setting first filter and it doesn't look like
677402000ffSAlexander V. Chernikov 		 * setting snaplen.  We're probably using bpf directly.
678402000ffSAlexander V. Chernikov 		 * Upgrade immediately.
679402000ffSAlexander V. Chernikov 		 */
680402000ffSAlexander V. Chernikov 		need_upgrade = 1;
681402000ffSAlexander V. Chernikov 	} else {
682402000ffSAlexander V. Chernikov 		/*
683402000ffSAlexander V. Chernikov 		 * Do not require upgrade by first BIOCSETF
684402000ffSAlexander V. Chernikov 		 * (used to set snaplen) by pcap_open_live().
685402000ffSAlexander V. Chernikov 		 */
686402000ffSAlexander V. Chernikov 
687402000ffSAlexander V. Chernikov 		if (--d->bd_writer == 0) {
688402000ffSAlexander V. Chernikov 			/*
689402000ffSAlexander V. Chernikov 			 * First snaplen filter has already
690402000ffSAlexander V. Chernikov 			 * been set. This is probably catch-all
691402000ffSAlexander V. Chernikov 			 * filter
692402000ffSAlexander V. Chernikov 			 */
693402000ffSAlexander V. Chernikov 			need_upgrade = 1;
694402000ffSAlexander V. Chernikov 		}
695402000ffSAlexander V. Chernikov 	}
696402000ffSAlexander V. Chernikov 
697402000ffSAlexander V. Chernikov 	CTR5(KTR_NET,
698402000ffSAlexander V. Chernikov 	    "%s: filter function set by pid %d, "
699402000ffSAlexander V. Chernikov 	    "bd_writer counter %d, snap %d upgrade %d",
700402000ffSAlexander V. Chernikov 	    __func__, d->bd_pid, d->bd_writer,
701402000ffSAlexander V. Chernikov 	    is_snap, need_upgrade);
702402000ffSAlexander V. Chernikov 
703402000ffSAlexander V. Chernikov 	return (need_upgrade);
704402000ffSAlexander V. Chernikov }
705402000ffSAlexander V. Chernikov 
706402000ffSAlexander V. Chernikov /*
70751ec1eb7SAlexander V. Chernikov  * Add d to the list of active bp filters.
70851ec1eb7SAlexander V. Chernikov  * Reuqires bpf_attachd() to be called before
70951ec1eb7SAlexander V. Chernikov  */
71051ec1eb7SAlexander V. Chernikov static void
71151ec1eb7SAlexander V. Chernikov bpf_upgraded(struct bpf_d *d)
71251ec1eb7SAlexander V. Chernikov {
71351ec1eb7SAlexander V. Chernikov 	struct bpf_if *bp;
71451ec1eb7SAlexander V. Chernikov 
7156c74ff0eSAlexander V. Chernikov 	BPF_LOCK_ASSERT();
7166c74ff0eSAlexander V. Chernikov 
71751ec1eb7SAlexander V. Chernikov 	bp = d->bd_bif;
71851ec1eb7SAlexander V. Chernikov 
7196c74ff0eSAlexander V. Chernikov 	/*
7206c74ff0eSAlexander V. Chernikov 	 * Filter can be set several times without specifying interface.
7216c74ff0eSAlexander V. Chernikov 	 * Mark d as reader and exit.
7226c74ff0eSAlexander V. Chernikov 	 */
7236c74ff0eSAlexander V. Chernikov 	if (bp == NULL) {
724afa85850SAlexander V. Chernikov 		BPFD_LOCK(d);
7256c74ff0eSAlexander V. Chernikov 		d->bd_writer = 0;
726afa85850SAlexander V. Chernikov 		BPFD_UNLOCK(d);
7276c74ff0eSAlexander V. Chernikov 		return;
7286c74ff0eSAlexander V. Chernikov 	}
7296c74ff0eSAlexander V. Chernikov 
73051ec1eb7SAlexander V. Chernikov 	BPFIF_WLOCK(bp);
731afa85850SAlexander V. Chernikov 	BPFD_LOCK(d);
73251ec1eb7SAlexander V. Chernikov 
73351ec1eb7SAlexander V. Chernikov 	/* Remove from writers-only list */
73451ec1eb7SAlexander V. Chernikov 	LIST_REMOVE(d, bd_next);
73551ec1eb7SAlexander V. Chernikov 	LIST_INSERT_HEAD(&bp->bif_dlist, d, bd_next);
73651ec1eb7SAlexander V. Chernikov 	/* Mark d as reader */
73751ec1eb7SAlexander V. Chernikov 	d->bd_writer = 0;
73851ec1eb7SAlexander V. Chernikov 
739afa85850SAlexander V. Chernikov 	BPFD_UNLOCK(d);
74051ec1eb7SAlexander V. Chernikov 	BPFIF_WUNLOCK(bp);
74151ec1eb7SAlexander V. Chernikov 
74251ec1eb7SAlexander V. Chernikov 	CTR2(KTR_NET, "%s: upgrade required by pid %d", __func__, d->bd_pid);
74351ec1eb7SAlexander V. Chernikov 
7445ce8d970SSam Leffler 	EVENTHANDLER_INVOKE(bpf_track, bp->bif_ifp, bp->bif_dlt, 1);
745df8bae1dSRodney W. Grimes }
746df8bae1dSRodney W. Grimes 
/*
 * Detach a file from its interface.
 *
 * Convenience wrapper that takes the global BPF lock around
 * bpf_detachd_locked().
 */
static void
bpf_detachd(struct bpf_d *d)
{

	BPF_LOCK();
	bpf_detachd_locked(d);
	BPF_UNLOCK();
}
7576c74ff0eSAlexander V. Chernikov 
7586c74ff0eSAlexander V. Chernikov static void
7596c74ff0eSAlexander V. Chernikov bpf_detachd_locked(struct bpf_d *d)
7606c74ff0eSAlexander V. Chernikov {
7616e891d64SPoul-Henning Kamp 	int error;
762df8bae1dSRodney W. Grimes 	struct bpf_if *bp;
76346448b5aSRobert Watson 	struct ifnet *ifp;
764df8bae1dSRodney W. Grimes 
76551ec1eb7SAlexander V. Chernikov 	CTR2(KTR_NET, "%s: detach required by pid %d", __func__, d->bd_pid);
76651ec1eb7SAlexander V. Chernikov 
767e4b3229aSAlexander V. Chernikov 	BPF_LOCK_ASSERT();
768e4b3229aSAlexander V. Chernikov 
7696c74ff0eSAlexander V. Chernikov 	/* Check if descriptor is attached */
7706c74ff0eSAlexander V. Chernikov 	if ((bp = d->bd_bif) == NULL)
7716c74ff0eSAlexander V. Chernikov 		return;
7726c74ff0eSAlexander V. Chernikov 
773e4b3229aSAlexander V. Chernikov 	BPFIF_WLOCK(bp);
774afa85850SAlexander V. Chernikov 	BPFD_LOCK(d);
77546448b5aSRobert Watson 
77651ec1eb7SAlexander V. Chernikov 	/* Save bd_writer value */
77751ec1eb7SAlexander V. Chernikov 	error = d->bd_writer;
77851ec1eb7SAlexander V. Chernikov 
77946448b5aSRobert Watson 	/*
78046448b5aSRobert Watson 	 * Remove d from the interface's descriptor list.
78146448b5aSRobert Watson 	 */
78246448b5aSRobert Watson 	LIST_REMOVE(d, bd_next);
78346448b5aSRobert Watson 
784e4b3229aSAlexander V. Chernikov 	ifp = bp->bif_ifp;
785572bde2aSRobert Watson 	d->bd_bif = NULL;
786afa85850SAlexander V. Chernikov 	BPFD_UNLOCK(d);
787e4b3229aSAlexander V. Chernikov 	BPFIF_WUNLOCK(bp);
788e4b3229aSAlexander V. Chernikov 
789e4b3229aSAlexander V. Chernikov 	bpf_bpfd_cnt--;
79046448b5aSRobert Watson 
79151ec1eb7SAlexander V. Chernikov 	/* Call event handler iff d is attached */
79251ec1eb7SAlexander V. Chernikov 	if (error == 0)
7935ce8d970SSam Leffler 		EVENTHANDLER_INVOKE(bpf_track, ifp, bp->bif_dlt, 0);
794b743c310SSam Leffler 
795df8bae1dSRodney W. Grimes 	/*
796df8bae1dSRodney W. Grimes 	 * Check if this descriptor had requested promiscuous mode.
797df8bae1dSRodney W. Grimes 	 * If so, turn it off.
798df8bae1dSRodney W. Grimes 	 */
799df8bae1dSRodney W. Grimes 	if (d->bd_promisc) {
800df8bae1dSRodney W. Grimes 		d->bd_promisc = 0;
80197021c24SMarko Zec 		CURVNET_SET(ifp->if_vnet);
80246448b5aSRobert Watson 		error = ifpromisc(ifp, 0);
80397021c24SMarko Zec 		CURVNET_RESTORE();
8046e891d64SPoul-Henning Kamp 		if (error != 0 && error != ENXIO) {
805df8bae1dSRodney W. Grimes 			/*
8066e891d64SPoul-Henning Kamp 			 * ENXIO can happen if a pccard is unplugged
807df8bae1dSRodney W. Grimes 			 * Something is really wrong if we were able to put
808df8bae1dSRodney W. Grimes 			 * the driver into promiscuous mode, but can't
809df8bae1dSRodney W. Grimes 			 * take it out.
810df8bae1dSRodney W. Grimes 			 */
8118eab61f3SSam Leffler 			if_printf(bp->bif_ifp,
8128eab61f3SSam Leffler 				"bpf_detach: ifpromisc failed (%d)\n", error);
8136e891d64SPoul-Henning Kamp 		}
814df8bae1dSRodney W. Grimes 	}
815df8bae1dSRodney W. Grimes }
816df8bae1dSRodney W. Grimes 
817df8bae1dSRodney W. Grimes /*
818136600feSEd Schouten  * Close the descriptor by detaching it from its interface,
819136600feSEd Schouten  * deallocating its buffers, and marking it free.
820136600feSEd Schouten  */
821136600feSEd Schouten static void
822136600feSEd Schouten bpf_dtor(void *data)
823136600feSEd Schouten {
824136600feSEd Schouten 	struct bpf_d *d = data;
825136600feSEd Schouten 
826afa85850SAlexander V. Chernikov 	BPFD_LOCK(d);
827136600feSEd Schouten 	if (d->bd_state == BPF_WAITING)
828136600feSEd Schouten 		callout_stop(&d->bd_callout);
829136600feSEd Schouten 	d->bd_state = BPF_IDLE;
830afa85850SAlexander V. Chernikov 	BPFD_UNLOCK(d);
831136600feSEd Schouten 	funsetown(&d->bd_sigio);
832136600feSEd Schouten 	bpf_detachd(d);
833136600feSEd Schouten #ifdef MAC
834136600feSEd Schouten 	mac_bpfdesc_destroy(d);
835136600feSEd Schouten #endif /* MAC */
8366aba400aSAttilio Rao 	seldrain(&d->bd_sel);
837136600feSEd Schouten 	knlist_destroy(&d->bd_sel.si_note);
8389fee1bd1SJung-uk Kim 	callout_drain(&d->bd_callout);
839136600feSEd Schouten 	bpf_freed(d);
840136600feSEd Schouten 	free(d, M_BPF);
841136600feSEd Schouten }
842136600feSEd Schouten 
843136600feSEd Schouten /*
844df8bae1dSRodney W. Grimes  * Open ethernet device.  Returns ENXIO for illegal minor device number,
845df8bae1dSRodney W. Grimes  * EBUSY if file is open by another process.
846df8bae1dSRodney W. Grimes  */
847df8bae1dSRodney W. Grimes /* ARGSUSED */
84887f6c662SJulian Elischer static	int
84919ba8395SChristian S.J. Peron bpfopen(struct cdev *dev, int flags, int fmt, struct thread *td)
850df8bae1dSRodney W. Grimes {
851e7bb21b3SJonathan Lemon 	struct bpf_d *d;
852c7b0200eSAlexander V. Chernikov 	int error, size;
853df8bae1dSRodney W. Grimes 
8541ede983cSDag-Erling Smørgrav 	d = malloc(sizeof(*d), M_BPF, M_WAITOK | M_ZERO);
855136600feSEd Schouten 	error = devfs_set_cdevpriv(d, bpf_dtor);
856136600feSEd Schouten 	if (error != 0) {
857136600feSEd Schouten 		free(d, M_BPF);
858136600feSEd Schouten 		return (error);
859136600feSEd Schouten 	}
8604d621040SChristian S.J. Peron 
8614d621040SChristian S.J. Peron 	/*
8624d621040SChristian S.J. Peron 	 * For historical reasons, perform a one-time initialization call to
8634d621040SChristian S.J. Peron 	 * the buffer routines, even though we're not yet committed to a
8644d621040SChristian S.J. Peron 	 * particular buffer method.
8654d621040SChristian S.J. Peron 	 */
8664d621040SChristian S.J. Peron 	bpf_buffer_init(d);
8673b3b91e7SGuy Helmer 	d->bd_hbuf_in_use = 0;
8684d621040SChristian S.J. Peron 	d->bd_bufmode = BPF_BUFMODE_BUFFER;
86900a83887SPaul Traina 	d->bd_sig = SIGIO;
870560a54e1SJung-uk Kim 	d->bd_direction = BPF_D_INOUT;
871e4b3229aSAlexander V. Chernikov 	BPF_PID_REFRESH(d, td);
87282f4445dSRobert Watson #ifdef MAC
87330d239bcSRobert Watson 	mac_bpfdesc_init(d);
87430d239bcSRobert Watson 	mac_bpfdesc_create(td->td_ucred, d);
87582f4445dSRobert Watson #endif
876afa85850SAlexander V. Chernikov 	mtx_init(&d->bd_lock, devtoname(dev), "bpf cdev lock", MTX_DEF);
877afa85850SAlexander V. Chernikov 	callout_init_mtx(&d->bd_callout, &d->bd_lock, 0);
878afa85850SAlexander V. Chernikov 	knlist_init_mtx(&d->bd_sel.si_note, &d->bd_lock);
879df8bae1dSRodney W. Grimes 
880c7b0200eSAlexander V. Chernikov 	/* Allocate default buffers */
881c7b0200eSAlexander V. Chernikov 	size = d->bd_bufsize;
882c7b0200eSAlexander V. Chernikov 	bpf_buffer_ioctl_sblen(d, &size);
883c7b0200eSAlexander V. Chernikov 
884df8bae1dSRodney W. Grimes 	return (0);
885df8bae1dSRodney W. Grimes }
886df8bae1dSRodney W. Grimes 
887df8bae1dSRodney W. Grimes /*
888df8bae1dSRodney W. Grimes  *  bpfread - read next chunk of packets from buffers
889df8bae1dSRodney W. Grimes  */
89087f6c662SJulian Elischer static	int
89119ba8395SChristian S.J. Peron bpfread(struct cdev *dev, struct uio *uio, int ioflag)
892df8bae1dSRodney W. Grimes {
893136600feSEd Schouten 	struct bpf_d *d;
894df8bae1dSRodney W. Grimes 	int error;
8958df67d77SJung-uk Kim 	int non_block;
8968df67d77SJung-uk Kim 	int timed_out;
897df8bae1dSRodney W. Grimes 
898136600feSEd Schouten 	error = devfs_get_cdevpriv((void **)&d);
899136600feSEd Schouten 	if (error != 0)
900136600feSEd Schouten 		return (error);
901136600feSEd Schouten 
902df8bae1dSRodney W. Grimes 	/*
903df8bae1dSRodney W. Grimes 	 * Restrict application to use a buffer the same size as
904df8bae1dSRodney W. Grimes 	 * as kernel buffers.
905df8bae1dSRodney W. Grimes 	 */
906df8bae1dSRodney W. Grimes 	if (uio->uio_resid != d->bd_bufsize)
907df8bae1dSRodney W. Grimes 		return (EINVAL);
908df8bae1dSRodney W. Grimes 
9098df67d77SJung-uk Kim 	non_block = ((ioflag & O_NONBLOCK) != 0);
9108df67d77SJung-uk Kim 
911afa85850SAlexander V. Chernikov 	BPFD_LOCK(d);
912e4b3229aSAlexander V. Chernikov 	BPF_PID_REFRESH_CUR(d);
9134d621040SChristian S.J. Peron 	if (d->bd_bufmode != BPF_BUFMODE_BUFFER) {
914afa85850SAlexander V. Chernikov 		BPFD_UNLOCK(d);
9154d621040SChristian S.J. Peron 		return (EOPNOTSUPP);
9164d621040SChristian S.J. Peron 	}
91781bda851SJohn Polstra 	if (d->bd_state == BPF_WAITING)
91881bda851SJohn Polstra 		callout_stop(&d->bd_callout);
91981bda851SJohn Polstra 	timed_out = (d->bd_state == BPF_TIMED_OUT);
92081bda851SJohn Polstra 	d->bd_state = BPF_IDLE;
921d013d902SGuy Helmer 	while (d->bd_hbuf_in_use) {
922d013d902SGuy Helmer 		error = mtx_sleep(&d->bd_hbuf_in_use, &d->bd_lock,
9233b3b91e7SGuy Helmer 		    PRINET|PCATCH, "bd_hbuf", 0);
924d013d902SGuy Helmer 		if (error != 0) {
925d013d902SGuy Helmer 			BPFD_UNLOCK(d);
926d013d902SGuy Helmer 			return (error);
927d013d902SGuy Helmer 		}
928d013d902SGuy Helmer 	}
929df8bae1dSRodney W. Grimes 	/*
930df8bae1dSRodney W. Grimes 	 * If the hold buffer is empty, then do a timed sleep, which
931df8bae1dSRodney W. Grimes 	 * ends when the timeout expires or when enough packets
932df8bae1dSRodney W. Grimes 	 * have arrived to fill the store buffer.
933df8bae1dSRodney W. Grimes 	 */
934572bde2aSRobert Watson 	while (d->bd_hbuf == NULL) {
9358df67d77SJung-uk Kim 		if (d->bd_slen != 0) {
936df8bae1dSRodney W. Grimes 			/*
937df8bae1dSRodney W. Grimes 			 * A packet(s) either arrived since the previous
938df8bae1dSRodney W. Grimes 			 * read or arrived while we were asleep.
9398df67d77SJung-uk Kim 			 */
9408df67d77SJung-uk Kim 			if (d->bd_immediate || non_block || timed_out) {
9418df67d77SJung-uk Kim 				/*
9428df67d77SJung-uk Kim 				 * Rotate the buffers and return what's here
9438df67d77SJung-uk Kim 				 * if we are in immediate mode, non-blocking
9448df67d77SJung-uk Kim 				 * flag is set, or this descriptor timed out.
945df8bae1dSRodney W. Grimes 				 */
946df8bae1dSRodney W. Grimes 				ROTATE_BUFFERS(d);
947df8bae1dSRodney W. Grimes 				break;
948df8bae1dSRodney W. Grimes 			}
9498df67d77SJung-uk Kim 		}
950de5d9935SRobert Watson 
951de5d9935SRobert Watson 		/*
952de5d9935SRobert Watson 		 * No data is available, check to see if the bpf device
953de5d9935SRobert Watson 		 * is still pointed at a real interface.  If not, return
954de5d9935SRobert Watson 		 * ENXIO so that the userland process knows to rebind
955de5d9935SRobert Watson 		 * it before using it again.
956de5d9935SRobert Watson 		 */
957de5d9935SRobert Watson 		if (d->bd_bif == NULL) {
958afa85850SAlexander V. Chernikov 			BPFD_UNLOCK(d);
959de5d9935SRobert Watson 			return (ENXIO);
960de5d9935SRobert Watson 		}
961de5d9935SRobert Watson 
9628df67d77SJung-uk Kim 		if (non_block) {
963afa85850SAlexander V. Chernikov 			BPFD_UNLOCK(d);
964fba3cfdeSJohn Polstra 			return (EWOULDBLOCK);
965fba3cfdeSJohn Polstra 		}
966afa85850SAlexander V. Chernikov 		error = msleep(d, &d->bd_lock, PRINET|PCATCH,
967e7bb21b3SJonathan Lemon 		     "bpf", d->bd_rtout);
968df8bae1dSRodney W. Grimes 		if (error == EINTR || error == ERESTART) {
969afa85850SAlexander V. Chernikov 			BPFD_UNLOCK(d);
970df8bae1dSRodney W. Grimes 			return (error);
971df8bae1dSRodney W. Grimes 		}
972df8bae1dSRodney W. Grimes 		if (error == EWOULDBLOCK) {
973df8bae1dSRodney W. Grimes 			/*
974df8bae1dSRodney W. Grimes 			 * On a timeout, return what's in the buffer,
975df8bae1dSRodney W. Grimes 			 * which may be nothing.  If there is something
976df8bae1dSRodney W. Grimes 			 * in the store buffer, we can rotate the buffers.
977df8bae1dSRodney W. Grimes 			 */
978df8bae1dSRodney W. Grimes 			if (d->bd_hbuf)
979df8bae1dSRodney W. Grimes 				/*
980df8bae1dSRodney W. Grimes 				 * We filled up the buffer in between
981df8bae1dSRodney W. Grimes 				 * getting the timeout and arriving
982df8bae1dSRodney W. Grimes 				 * here, so we don't need to rotate.
983df8bae1dSRodney W. Grimes 				 */
984df8bae1dSRodney W. Grimes 				break;
985df8bae1dSRodney W. Grimes 
986df8bae1dSRodney W. Grimes 			if (d->bd_slen == 0) {
987afa85850SAlexander V. Chernikov 				BPFD_UNLOCK(d);
988df8bae1dSRodney W. Grimes 				return (0);
989df8bae1dSRodney W. Grimes 			}
990df8bae1dSRodney W. Grimes 			ROTATE_BUFFERS(d);
991df8bae1dSRodney W. Grimes 			break;
992df8bae1dSRodney W. Grimes 		}
993df8bae1dSRodney W. Grimes 	}
994df8bae1dSRodney W. Grimes 	/*
995df8bae1dSRodney W. Grimes 	 * At this point, we know we have something in the hold slot.
996df8bae1dSRodney W. Grimes 	 */
9973b3b91e7SGuy Helmer 	d->bd_hbuf_in_use = 1;
998afa85850SAlexander V. Chernikov 	BPFD_UNLOCK(d);
999df8bae1dSRodney W. Grimes 
1000df8bae1dSRodney W. Grimes 	/*
1001df8bae1dSRodney W. Grimes 	 * Move data from hold buffer into user space.
1002df8bae1dSRodney W. Grimes 	 * We know the entire buffer is transferred since
1003df8bae1dSRodney W. Grimes 	 * we checked above that the read buffer is bpf_bufsize bytes.
100431b32e6dSRobert Watson   	 *
10053b3b91e7SGuy Helmer 	 * We do not have to worry about simultaneous reads because
10063b3b91e7SGuy Helmer 	 * we waited for sole access to the hold buffer above.
1007df8bae1dSRodney W. Grimes 	 */
10084d621040SChristian S.J. Peron 	error = bpf_uiomove(d, d->bd_hbuf, d->bd_hlen, uio);
1009df8bae1dSRodney W. Grimes 
1010afa85850SAlexander V. Chernikov 	BPFD_LOCK(d);
10113b3b91e7SGuy Helmer 	KASSERT(d->bd_hbuf != NULL, ("bpfread: lost bd_hbuf"));
1012df8bae1dSRodney W. Grimes 	d->bd_fbuf = d->bd_hbuf;
1013572bde2aSRobert Watson 	d->bd_hbuf = NULL;
1014df8bae1dSRodney W. Grimes 	d->bd_hlen = 0;
101529f612ecSChristian S.J. Peron 	bpf_buf_reclaimed(d);
10163b3b91e7SGuy Helmer 	d->bd_hbuf_in_use = 0;
10173b3b91e7SGuy Helmer 	wakeup(&d->bd_hbuf_in_use);
1018afa85850SAlexander V. Chernikov 	BPFD_UNLOCK(d);
1019df8bae1dSRodney W. Grimes 
1020df8bae1dSRodney W. Grimes 	return (error);
1021df8bae1dSRodney W. Grimes }
1022df8bae1dSRodney W. Grimes 
1023df8bae1dSRodney W. Grimes /*
1024df8bae1dSRodney W. Grimes  * If there are processes sleeping on this descriptor, wake them up.
1025df8bae1dSRodney W. Grimes  */
1026e7bb21b3SJonathan Lemon static __inline void
102719ba8395SChristian S.J. Peron bpf_wakeup(struct bpf_d *d)
1028df8bae1dSRodney W. Grimes {
1029a3272e3cSChristian S.J. Peron 
1030afa85850SAlexander V. Chernikov 	BPFD_LOCK_ASSERT(d);
103181bda851SJohn Polstra 	if (d->bd_state == BPF_WAITING) {
103281bda851SJohn Polstra 		callout_stop(&d->bd_callout);
103381bda851SJohn Polstra 		d->bd_state = BPF_IDLE;
103481bda851SJohn Polstra 	}
1035521f364bSDag-Erling Smørgrav 	wakeup(d);
1036831d27a9SDon Lewis 	if (d->bd_async && d->bd_sig && d->bd_sigio)
1037f1320723SAlfred Perlstein 		pgsigio(&d->bd_sigio, d->bd_sig, 0);
103800a83887SPaul Traina 
1039512824f8SSeigo Tanimura 	selwakeuppri(&d->bd_sel, PRINET);
1040ad3b9257SJohn-Mark Gurney 	KNOTE_LOCKED(&d->bd_sel.si_note, 0);
1041df8bae1dSRodney W. Grimes }
1042df8bae1dSRodney W. Grimes 
104381bda851SJohn Polstra static void
104419ba8395SChristian S.J. Peron bpf_timed_out(void *arg)
104581bda851SJohn Polstra {
104681bda851SJohn Polstra 	struct bpf_d *d = (struct bpf_d *)arg;
104781bda851SJohn Polstra 
1048afa85850SAlexander V. Chernikov 	BPFD_LOCK_ASSERT(d);
10499fee1bd1SJung-uk Kim 
10509fee1bd1SJung-uk Kim 	if (callout_pending(&d->bd_callout) || !callout_active(&d->bd_callout))
10519fee1bd1SJung-uk Kim 		return;
105281bda851SJohn Polstra 	if (d->bd_state == BPF_WAITING) {
105381bda851SJohn Polstra 		d->bd_state = BPF_TIMED_OUT;
105481bda851SJohn Polstra 		if (d->bd_slen != 0)
105581bda851SJohn Polstra 			bpf_wakeup(d);
105681bda851SJohn Polstra 	}
105781bda851SJohn Polstra }
105881bda851SJohn Polstra 
105987f6c662SJulian Elischer static int
10604d621040SChristian S.J. Peron bpf_ready(struct bpf_d *d)
10614d621040SChristian S.J. Peron {
10624d621040SChristian S.J. Peron 
1063afa85850SAlexander V. Chernikov 	BPFD_LOCK_ASSERT(d);
10644d621040SChristian S.J. Peron 
10654d621040SChristian S.J. Peron 	if (!bpf_canfreebuf(d) && d->bd_hlen != 0)
10664d621040SChristian S.J. Peron 		return (1);
10674d621040SChristian S.J. Peron 	if ((d->bd_immediate || d->bd_state == BPF_TIMED_OUT) &&
10684d621040SChristian S.J. Peron 	    d->bd_slen != 0)
10694d621040SChristian S.J. Peron 		return (1);
10704d621040SChristian S.J. Peron 	return (0);
10714d621040SChristian S.J. Peron }
10724d621040SChristian S.J. Peron 
10734d621040SChristian S.J. Peron static int
107419ba8395SChristian S.J. Peron bpfwrite(struct cdev *dev, struct uio *uio, int ioflag)
1075df8bae1dSRodney W. Grimes {
1076136600feSEd Schouten 	struct bpf_d *d;
1077df8bae1dSRodney W. Grimes 	struct ifnet *ifp;
1078560a54e1SJung-uk Kim 	struct mbuf *m, *mc;
10798240bf1eSRobert Watson 	struct sockaddr dst;
1080560a54e1SJung-uk Kim 	int error, hlen;
1081df8bae1dSRodney W. Grimes 
1082136600feSEd Schouten 	error = devfs_get_cdevpriv((void **)&d);
1083136600feSEd Schouten 	if (error != 0)
1084136600feSEd Schouten 		return (error);
1085136600feSEd Schouten 
1086e4b3229aSAlexander V. Chernikov 	BPF_PID_REFRESH_CUR(d);
10874d621040SChristian S.J. Peron 	d->bd_wcount++;
10886c74ff0eSAlexander V. Chernikov 	/* XXX: locking required */
10894d621040SChristian S.J. Peron 	if (d->bd_bif == NULL) {
10904d621040SChristian S.J. Peron 		d->bd_wdcount++;
1091df8bae1dSRodney W. Grimes 		return (ENXIO);
10924d621040SChristian S.J. Peron 	}
1093df8bae1dSRodney W. Grimes 
1094df8bae1dSRodney W. Grimes 	ifp = d->bd_bif->bif_ifp;
1095df8bae1dSRodney W. Grimes 
10964d621040SChristian S.J. Peron 	if ((ifp->if_flags & IFF_UP) == 0) {
10974d621040SChristian S.J. Peron 		d->bd_wdcount++;
10983518d220SSam Leffler 		return (ENETDOWN);
10994d621040SChristian S.J. Peron 	}
11003518d220SSam Leffler 
11014d621040SChristian S.J. Peron 	if (uio->uio_resid == 0) {
11024d621040SChristian S.J. Peron 		d->bd_wdcount++;
1103df8bae1dSRodney W. Grimes 		return (0);
11044d621040SChristian S.J. Peron 	}
1105df8bae1dSRodney W. Grimes 
11068240bf1eSRobert Watson 	bzero(&dst, sizeof(dst));
1107d83e603aSChristian S.J. Peron 	m = NULL;
1108d83e603aSChristian S.J. Peron 	hlen = 0;
11096c74ff0eSAlexander V. Chernikov 	/* XXX: bpf_movein() can sleep */
1110cb44b6dfSAndrew Thompson 	error = bpf_movein(uio, (int)d->bd_bif->bif_dlt, ifp,
1111560a54e1SJung-uk Kim 	    &m, &dst, &hlen, d->bd_wfilter);
11124d621040SChristian S.J. Peron 	if (error) {
11134d621040SChristian S.J. Peron 		d->bd_wdcount++;
1114df8bae1dSRodney W. Grimes 		return (error);
11154d621040SChristian S.J. Peron 	}
11164d621040SChristian S.J. Peron 	d->bd_wfcount++;
1117114ae644SMike Smith 	if (d->bd_hdrcmplt)
1118114ae644SMike Smith 		dst.sa_family = pseudo_AF_HDRCMPLT;
1119114ae644SMike Smith 
1120560a54e1SJung-uk Kim 	if (d->bd_feedback) {
1121eb1b1807SGleb Smirnoff 		mc = m_dup(m, M_NOWAIT);
1122560a54e1SJung-uk Kim 		if (mc != NULL)
1123560a54e1SJung-uk Kim 			mc->m_pkthdr.rcvif = ifp;
11248cd892f7SJung-uk Kim 		/* Set M_PROMISC for outgoing packets to be discarded. */
11258cd892f7SJung-uk Kim 		if (d->bd_direction == BPF_D_INOUT)
11268cd892f7SJung-uk Kim 			m->m_flags |= M_PROMISC;
1127560a54e1SJung-uk Kim 	} else
1128560a54e1SJung-uk Kim 		mc = NULL;
1129560a54e1SJung-uk Kim 
1130560a54e1SJung-uk Kim 	m->m_pkthdr.len -= hlen;
1131560a54e1SJung-uk Kim 	m->m_len -= hlen;
1132560a54e1SJung-uk Kim 	m->m_data += hlen;	/* XXX */
1133560a54e1SJung-uk Kim 
113421ca7b57SMarko Zec 	CURVNET_SET(ifp->if_vnet);
113582f4445dSRobert Watson #ifdef MAC
1136afa85850SAlexander V. Chernikov 	BPFD_LOCK(d);
113730d239bcSRobert Watson 	mac_bpfdesc_create_mbuf(d, m);
1138560a54e1SJung-uk Kim 	if (mc != NULL)
113930d239bcSRobert Watson 		mac_bpfdesc_create_mbuf(d, mc);
1140afa85850SAlexander V. Chernikov 	BPFD_UNLOCK(d);
114182f4445dSRobert Watson #endif
1142560a54e1SJung-uk Kim 
1143572bde2aSRobert Watson 	error = (*ifp->if_output)(ifp, m, &dst, NULL);
11444d621040SChristian S.J. Peron 	if (error)
11454d621040SChristian S.J. Peron 		d->bd_wdcount++;
1146560a54e1SJung-uk Kim 
1147560a54e1SJung-uk Kim 	if (mc != NULL) {
11480bf686c1SRobert Watson 		if (error == 0)
1149560a54e1SJung-uk Kim 			(*ifp->if_input)(ifp, mc);
11500bf686c1SRobert Watson 		else
1151560a54e1SJung-uk Kim 			m_freem(mc);
1152560a54e1SJung-uk Kim 	}
115321ca7b57SMarko Zec 	CURVNET_RESTORE();
1154560a54e1SJung-uk Kim 
1155df8bae1dSRodney W. Grimes 	return (error);
1156df8bae1dSRodney W. Grimes }
1157df8bae1dSRodney W. Grimes 
1158df8bae1dSRodney W. Grimes /*
1159e82669d9SRobert Watson  * Reset a descriptor by flushing its packet buffer and clearing the receive
1160e82669d9SRobert Watson  * and drop counts.  This is doable for kernel-only buffers, but with
1161e82669d9SRobert Watson  * zero-copy buffers, we can't write to (or rotate) buffers that are
1162e82669d9SRobert Watson  * currently owned by userspace.  It would be nice if we could encapsulate
1163e82669d9SRobert Watson  * this logic in the buffer code rather than here.
1164df8bae1dSRodney W. Grimes  */
1165df8bae1dSRodney W. Grimes static void
116619ba8395SChristian S.J. Peron reset_d(struct bpf_d *d)
1167df8bae1dSRodney W. Grimes {
1168e7bb21b3SJonathan Lemon 
1169afa85850SAlexander V. Chernikov 	BPFD_LOCK_ASSERT(d);
1170e82669d9SRobert Watson 
11713b3b91e7SGuy Helmer 	while (d->bd_hbuf_in_use)
11723b3b91e7SGuy Helmer 		mtx_sleep(&d->bd_hbuf_in_use, &d->bd_lock, PRINET,
11733b3b91e7SGuy Helmer 		    "bd_hbuf", 0);
1174e82669d9SRobert Watson 	if ((d->bd_hbuf != NULL) &&
1175e82669d9SRobert Watson 	    (d->bd_bufmode != BPF_BUFMODE_ZBUF || bpf_canfreebuf(d))) {
1176df8bae1dSRodney W. Grimes 		/* Free the hold buffer. */
1177df8bae1dSRodney W. Grimes 		d->bd_fbuf = d->bd_hbuf;
1178572bde2aSRobert Watson 		d->bd_hbuf = NULL;
1179e82669d9SRobert Watson 		d->bd_hlen = 0;
118029f612ecSChristian S.J. Peron 		bpf_buf_reclaimed(d);
1181df8bae1dSRodney W. Grimes 	}
1182e82669d9SRobert Watson 	if (bpf_canwritebuf(d))
1183df8bae1dSRodney W. Grimes 		d->bd_slen = 0;
1184df8bae1dSRodney W. Grimes 	d->bd_rcount = 0;
1185df8bae1dSRodney W. Grimes 	d->bd_dcount = 0;
118669f7644bSChristian S.J. Peron 	d->bd_fcount = 0;
11874d621040SChristian S.J. Peron 	d->bd_wcount = 0;
11884d621040SChristian S.J. Peron 	d->bd_wfcount = 0;
11894d621040SChristian S.J. Peron 	d->bd_wdcount = 0;
11904d621040SChristian S.J. Peron 	d->bd_zcopy = 0;
1191df8bae1dSRodney W. Grimes }
1192df8bae1dSRodney W. Grimes 
1193df8bae1dSRodney W. Grimes /*
1194df8bae1dSRodney W. Grimes  *  FIONREAD		Check for read packet available.
1195df8bae1dSRodney W. Grimes  *  SIOCGIFADDR		Get interface address - convenient hook to driver.
1196df8bae1dSRodney W. Grimes  *  BIOCGBLEN		Get buffer len [for read()].
1197f11c3508SDavid Malone  *  BIOCSETF		Set read filter.
1198f11c3508SDavid Malone  *  BIOCSETFNR		Set read filter without resetting descriptor.
1199f11c3508SDavid Malone  *  BIOCSETWF		Set write filter.
1200df8bae1dSRodney W. Grimes  *  BIOCFLUSH		Flush read packet buffer.
1201df8bae1dSRodney W. Grimes  *  BIOCPROMISC		Put interface into promiscuous mode.
1202df8bae1dSRodney W. Grimes  *  BIOCGDLT		Get link layer type.
1203df8bae1dSRodney W. Grimes  *  BIOCGETIF		Get interface name.
1204df8bae1dSRodney W. Grimes  *  BIOCSETIF		Set interface.
1205df8bae1dSRodney W. Grimes  *  BIOCSRTIMEOUT	Set read timeout.
1206df8bae1dSRodney W. Grimes  *  BIOCGRTIMEOUT	Get read timeout.
1207df8bae1dSRodney W. Grimes  *  BIOCGSTATS		Get packet stats.
1208df8bae1dSRodney W. Grimes  *  BIOCIMMEDIATE	Set immediate mode.
1209df8bae1dSRodney W. Grimes  *  BIOCVERSION		Get filter language version.
1210114ae644SMike Smith  *  BIOCGHDRCMPLT	Get "header already complete" flag
1211114ae644SMike Smith  *  BIOCSHDRCMPLT	Set "header already complete" flag
1212560a54e1SJung-uk Kim  *  BIOCGDIRECTION	Get packet direction flag
1213560a54e1SJung-uk Kim  *  BIOCSDIRECTION	Set packet direction flag
1214547d94bdSJung-uk Kim  *  BIOCGTSTAMP		Get time stamp format and resolution.
1215547d94bdSJung-uk Kim  *  BIOCSTSTAMP		Set time stamp format and resolution.
121693e39f0bSChristian S.J. Peron  *  BIOCLOCK		Set "locked" flag
1217560a54e1SJung-uk Kim  *  BIOCFEEDBACK	Set packet feedback mode.
12184d621040SChristian S.J. Peron  *  BIOCSETZBUF		Set current zero-copy buffer locations.
12194d621040SChristian S.J. Peron  *  BIOCGETZMAX		Get maximum zero-copy buffer size.
12204d621040SChristian S.J. Peron  *  BIOCROTZBUF		Force rotation of zero-copy buffer
12214d621040SChristian S.J. Peron  *  BIOCSETBUFMODE	Set buffer mode.
12224d621040SChristian S.J. Peron  *  BIOCGETBUFMODE	Get current buffer mode.
1223df8bae1dSRodney W. Grimes  */
1224df8bae1dSRodney W. Grimes /* ARGSUSED */
122587f6c662SJulian Elischer static	int
122619ba8395SChristian S.J. Peron bpfioctl(struct cdev *dev, u_long cmd, caddr_t addr, int flags,
122719ba8395SChristian S.J. Peron     struct thread *td)
1228df8bae1dSRodney W. Grimes {
1229136600feSEd Schouten 	struct bpf_d *d;
1230136600feSEd Schouten 	int error;
1231136600feSEd Schouten 
1232136600feSEd Schouten 	error = devfs_get_cdevpriv((void **)&d);
1233136600feSEd Schouten 	if (error != 0)
1234136600feSEd Schouten 		return (error);
1235df8bae1dSRodney W. Grimes 
1236b75a24a0SChristian S.J. Peron 	/*
1237b75a24a0SChristian S.J. Peron 	 * Refresh PID associated with this descriptor.
1238b75a24a0SChristian S.J. Peron 	 */
1239afa85850SAlexander V. Chernikov 	BPFD_LOCK(d);
1240e4b3229aSAlexander V. Chernikov 	BPF_PID_REFRESH(d, td);
124181bda851SJohn Polstra 	if (d->bd_state == BPF_WAITING)
124281bda851SJohn Polstra 		callout_stop(&d->bd_callout);
124381bda851SJohn Polstra 	d->bd_state = BPF_IDLE;
1244afa85850SAlexander V. Chernikov 	BPFD_UNLOCK(d);
124581bda851SJohn Polstra 
124693e39f0bSChristian S.J. Peron 	if (d->bd_locked == 1) {
124793e39f0bSChristian S.J. Peron 		switch (cmd) {
124893e39f0bSChristian S.J. Peron 		case BIOCGBLEN:
124993e39f0bSChristian S.J. Peron 		case BIOCFLUSH:
125093e39f0bSChristian S.J. Peron 		case BIOCGDLT:
125193e39f0bSChristian S.J. Peron 		case BIOCGDLTLIST:
1252fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32
1253fc0a61a4SKonstantin Belousov 		case BIOCGDLTLIST32:
1254fc0a61a4SKonstantin Belousov #endif
125593e39f0bSChristian S.J. Peron 		case BIOCGETIF:
125693e39f0bSChristian S.J. Peron 		case BIOCGRTIMEOUT:
12579624d947SJuli Mallett #if defined(COMPAT_FREEBSD32) && !defined(__mips__)
1258fc0a61a4SKonstantin Belousov 		case BIOCGRTIMEOUT32:
1259fc0a61a4SKonstantin Belousov #endif
126093e39f0bSChristian S.J. Peron 		case BIOCGSTATS:
126193e39f0bSChristian S.J. Peron 		case BIOCVERSION:
126293e39f0bSChristian S.J. Peron 		case BIOCGRSIG:
126393e39f0bSChristian S.J. Peron 		case BIOCGHDRCMPLT:
1264547d94bdSJung-uk Kim 		case BIOCSTSTAMP:
1265560a54e1SJung-uk Kim 		case BIOCFEEDBACK:
126693e39f0bSChristian S.J. Peron 		case FIONREAD:
126793e39f0bSChristian S.J. Peron 		case BIOCLOCK:
126893e39f0bSChristian S.J. Peron 		case BIOCSRTIMEOUT:
12699624d947SJuli Mallett #if defined(COMPAT_FREEBSD32) && !defined(__mips__)
1270fc0a61a4SKonstantin Belousov 		case BIOCSRTIMEOUT32:
1271fc0a61a4SKonstantin Belousov #endif
127293e39f0bSChristian S.J. Peron 		case BIOCIMMEDIATE:
127393e39f0bSChristian S.J. Peron 		case TIOCGPGRP:
12744d621040SChristian S.J. Peron 		case BIOCROTZBUF:
127593e39f0bSChristian S.J. Peron 			break;
127693e39f0bSChristian S.J. Peron 		default:
127793e39f0bSChristian S.J. Peron 			return (EPERM);
127893e39f0bSChristian S.J. Peron 		}
127993e39f0bSChristian S.J. Peron 	}
1280fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32
1281fc0a61a4SKonstantin Belousov 	/*
1282fc0a61a4SKonstantin Belousov 	 * If we see a 32-bit compat ioctl, mark the stream as 32-bit so
1283fc0a61a4SKonstantin Belousov 	 * that it will get 32-bit packet headers.
1284fc0a61a4SKonstantin Belousov 	 */
1285fc0a61a4SKonstantin Belousov 	switch (cmd) {
1286fc0a61a4SKonstantin Belousov 	case BIOCSETF32:
1287fc0a61a4SKonstantin Belousov 	case BIOCSETFNR32:
1288fc0a61a4SKonstantin Belousov 	case BIOCSETWF32:
1289fc0a61a4SKonstantin Belousov 	case BIOCGDLTLIST32:
1290fc0a61a4SKonstantin Belousov 	case BIOCGRTIMEOUT32:
1291fc0a61a4SKonstantin Belousov 	case BIOCSRTIMEOUT32:
129297aacec6SAlexander V. Chernikov 		BPFD_LOCK(d);
1293fc0a61a4SKonstantin Belousov 		d->bd_compat32 = 1;
129497aacec6SAlexander V. Chernikov 		BPFD_UNLOCK(d);
1295fc0a61a4SKonstantin Belousov 	}
1296fc0a61a4SKonstantin Belousov #endif
1297fc0a61a4SKonstantin Belousov 
129897021c24SMarko Zec 	CURVNET_SET(TD_TO_VNET(td));
1299df8bae1dSRodney W. Grimes 	switch (cmd) {
1300df8bae1dSRodney W. Grimes 
1301df8bae1dSRodney W. Grimes 	default:
1302df8bae1dSRodney W. Grimes 		error = EINVAL;
1303df8bae1dSRodney W. Grimes 		break;
1304df8bae1dSRodney W. Grimes 
1305df8bae1dSRodney W. Grimes 	/*
1306df8bae1dSRodney W. Grimes 	 * Check for read packet available.
1307df8bae1dSRodney W. Grimes 	 */
1308df8bae1dSRodney W. Grimes 	case FIONREAD:
1309df8bae1dSRodney W. Grimes 		{
1310df8bae1dSRodney W. Grimes 			int n;
1311df8bae1dSRodney W. Grimes 
1312afa85850SAlexander V. Chernikov 			BPFD_LOCK(d);
1313df8bae1dSRodney W. Grimes 			n = d->bd_slen;
13143b3b91e7SGuy Helmer 			while (d->bd_hbuf_in_use)
13153b3b91e7SGuy Helmer 				mtx_sleep(&d->bd_hbuf_in_use, &d->bd_lock,
13163b3b91e7SGuy Helmer 				    PRINET, "bd_hbuf", 0);
1317df8bae1dSRodney W. Grimes 			if (d->bd_hbuf)
1318df8bae1dSRodney W. Grimes 				n += d->bd_hlen;
1319afa85850SAlexander V. Chernikov 			BPFD_UNLOCK(d);
1320df8bae1dSRodney W. Grimes 
1321df8bae1dSRodney W. Grimes 			*(int *)addr = n;
1322df8bae1dSRodney W. Grimes 			break;
1323df8bae1dSRodney W. Grimes 		}
1324df8bae1dSRodney W. Grimes 
1325df8bae1dSRodney W. Grimes 	case SIOCGIFADDR:
1326df8bae1dSRodney W. Grimes 		{
1327df8bae1dSRodney W. Grimes 			struct ifnet *ifp;
1328df8bae1dSRodney W. Grimes 
1329572bde2aSRobert Watson 			if (d->bd_bif == NULL)
1330df8bae1dSRodney W. Grimes 				error = EINVAL;
1331df8bae1dSRodney W. Grimes 			else {
1332df8bae1dSRodney W. Grimes 				ifp = d->bd_bif->bif_ifp;
1333df8bae1dSRodney W. Grimes 				error = (*ifp->if_ioctl)(ifp, cmd, addr);
1334df8bae1dSRodney W. Grimes 			}
1335df8bae1dSRodney W. Grimes 			break;
1336df8bae1dSRodney W. Grimes 		}
1337df8bae1dSRodney W. Grimes 
1338df8bae1dSRodney W. Grimes 	/*
1339df8bae1dSRodney W. Grimes 	 * Get buffer len [for read()].
1340df8bae1dSRodney W. Grimes 	 */
1341df8bae1dSRodney W. Grimes 	case BIOCGBLEN:
134297aacec6SAlexander V. Chernikov 		BPFD_LOCK(d);
1343df8bae1dSRodney W. Grimes 		*(u_int *)addr = d->bd_bufsize;
134497aacec6SAlexander V. Chernikov 		BPFD_UNLOCK(d);
1345df8bae1dSRodney W. Grimes 		break;
1346df8bae1dSRodney W. Grimes 
1347df8bae1dSRodney W. Grimes 	/*
1348df8bae1dSRodney W. Grimes 	 * Set buffer length.
1349df8bae1dSRodney W. Grimes 	 */
1350df8bae1dSRodney W. Grimes 	case BIOCSBLEN:
13514d621040SChristian S.J. Peron 		error = bpf_ioctl_sblen(d, (u_int *)addr);
1352df8bae1dSRodney W. Grimes 		break;
1353df8bae1dSRodney W. Grimes 
1354df8bae1dSRodney W. Grimes 	/*
1355df8bae1dSRodney W. Grimes 	 * Set link layer read filter.
1356df8bae1dSRodney W. Grimes 	 */
1357df8bae1dSRodney W. Grimes 	case BIOCSETF:
1358f11c3508SDavid Malone 	case BIOCSETFNR:
135993e39f0bSChristian S.J. Peron 	case BIOCSETWF:
1360fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32
1361fc0a61a4SKonstantin Belousov 	case BIOCSETF32:
1362fc0a61a4SKonstantin Belousov 	case BIOCSETFNR32:
1363fc0a61a4SKonstantin Belousov 	case BIOCSETWF32:
1364fc0a61a4SKonstantin Belousov #endif
136593e39f0bSChristian S.J. Peron 		error = bpf_setf(d, (struct bpf_program *)addr, cmd);
1366df8bae1dSRodney W. Grimes 		break;
1367df8bae1dSRodney W. Grimes 
1368df8bae1dSRodney W. Grimes 	/*
1369df8bae1dSRodney W. Grimes 	 * Flush read packet buffer.
1370df8bae1dSRodney W. Grimes 	 */
1371df8bae1dSRodney W. Grimes 	case BIOCFLUSH:
1372afa85850SAlexander V. Chernikov 		BPFD_LOCK(d);
1373df8bae1dSRodney W. Grimes 		reset_d(d);
1374afa85850SAlexander V. Chernikov 		BPFD_UNLOCK(d);
1375df8bae1dSRodney W. Grimes 		break;
1376df8bae1dSRodney W. Grimes 
1377df8bae1dSRodney W. Grimes 	/*
1378df8bae1dSRodney W. Grimes 	 * Put interface into promiscuous mode.
1379df8bae1dSRodney W. Grimes 	 */
1380df8bae1dSRodney W. Grimes 	case BIOCPROMISC:
1381572bde2aSRobert Watson 		if (d->bd_bif == NULL) {
1382df8bae1dSRodney W. Grimes 			/*
1383df8bae1dSRodney W. Grimes 			 * No interface attached yet.
1384df8bae1dSRodney W. Grimes 			 */
1385df8bae1dSRodney W. Grimes 			error = EINVAL;
1386df8bae1dSRodney W. Grimes 			break;
1387df8bae1dSRodney W. Grimes 		}
1388df8bae1dSRodney W. Grimes 		if (d->bd_promisc == 0) {
1389df8bae1dSRodney W. Grimes 			error = ifpromisc(d->bd_bif->bif_ifp, 1);
1390df8bae1dSRodney W. Grimes 			if (error == 0)
1391df8bae1dSRodney W. Grimes 				d->bd_promisc = 1;
1392df8bae1dSRodney W. Grimes 		}
1393df8bae1dSRodney W. Grimes 		break;
1394df8bae1dSRodney W. Grimes 
1395df8bae1dSRodney W. Grimes 	/*
13968eab61f3SSam Leffler 	 * Get current data link type.
1397df8bae1dSRodney W. Grimes 	 */
1398df8bae1dSRodney W. Grimes 	case BIOCGDLT:
139997aacec6SAlexander V. Chernikov 		BPF_LOCK();
1400572bde2aSRobert Watson 		if (d->bd_bif == NULL)
1401df8bae1dSRodney W. Grimes 			error = EINVAL;
1402df8bae1dSRodney W. Grimes 		else
1403df8bae1dSRodney W. Grimes 			*(u_int *)addr = d->bd_bif->bif_dlt;
140497aacec6SAlexander V. Chernikov 		BPF_UNLOCK();
1405df8bae1dSRodney W. Grimes 		break;
1406df8bae1dSRodney W. Grimes 
1407df8bae1dSRodney W. Grimes 	/*
14088eab61f3SSam Leffler 	 * Get a list of supported data link types.
14098eab61f3SSam Leffler 	 */
1410fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32
1411fc0a61a4SKonstantin Belousov 	case BIOCGDLTLIST32:
1412fc0a61a4SKonstantin Belousov 		{
1413fc0a61a4SKonstantin Belousov 			struct bpf_dltlist32 *list32;
1414fc0a61a4SKonstantin Belousov 			struct bpf_dltlist dltlist;
1415fc0a61a4SKonstantin Belousov 
1416fc0a61a4SKonstantin Belousov 			list32 = (struct bpf_dltlist32 *)addr;
1417fc0a61a4SKonstantin Belousov 			dltlist.bfl_len = list32->bfl_len;
1418fc0a61a4SKonstantin Belousov 			dltlist.bfl_list = PTRIN(list32->bfl_list);
141997aacec6SAlexander V. Chernikov 			BPF_LOCK();
1420fc0a61a4SKonstantin Belousov 			if (d->bd_bif == NULL)
1421fc0a61a4SKonstantin Belousov 				error = EINVAL;
1422fc0a61a4SKonstantin Belousov 			else {
1423fc0a61a4SKonstantin Belousov 				error = bpf_getdltlist(d, &dltlist);
1424fc0a61a4SKonstantin Belousov 				if (error == 0)
1425fc0a61a4SKonstantin Belousov 					list32->bfl_len = dltlist.bfl_len;
1426fc0a61a4SKonstantin Belousov 			}
142797aacec6SAlexander V. Chernikov 			BPF_UNLOCK();
1428fc0a61a4SKonstantin Belousov 			break;
1429fc0a61a4SKonstantin Belousov 		}
1430fc0a61a4SKonstantin Belousov #endif
1431fc0a61a4SKonstantin Belousov 
14328eab61f3SSam Leffler 	case BIOCGDLTLIST:
143397aacec6SAlexander V. Chernikov 		BPF_LOCK();
1434572bde2aSRobert Watson 		if (d->bd_bif == NULL)
14358eab61f3SSam Leffler 			error = EINVAL;
14368eab61f3SSam Leffler 		else
14378eab61f3SSam Leffler 			error = bpf_getdltlist(d, (struct bpf_dltlist *)addr);
143897aacec6SAlexander V. Chernikov 		BPF_UNLOCK();
14398eab61f3SSam Leffler 		break;
14408eab61f3SSam Leffler 
14418eab61f3SSam Leffler 	/*
14428eab61f3SSam Leffler 	 * Set data link type.
14438eab61f3SSam Leffler 	 */
14448eab61f3SSam Leffler 	case BIOCSDLT:
14456c74ff0eSAlexander V. Chernikov 		BPF_LOCK();
1446572bde2aSRobert Watson 		if (d->bd_bif == NULL)
14478eab61f3SSam Leffler 			error = EINVAL;
14488eab61f3SSam Leffler 		else
14498eab61f3SSam Leffler 			error = bpf_setdlt(d, *(u_int *)addr);
14506c74ff0eSAlexander V. Chernikov 		BPF_UNLOCK();
14518eab61f3SSam Leffler 		break;
14528eab61f3SSam Leffler 
14538eab61f3SSam Leffler 	/*
14541dd0feaaSArchie Cobbs 	 * Get interface name.
1455df8bae1dSRodney W. Grimes 	 */
1456df8bae1dSRodney W. Grimes 	case BIOCGETIF:
145797aacec6SAlexander V. Chernikov 		BPF_LOCK();
1458572bde2aSRobert Watson 		if (d->bd_bif == NULL)
1459df8bae1dSRodney W. Grimes 			error = EINVAL;
14601dd0feaaSArchie Cobbs 		else {
14611dd0feaaSArchie Cobbs 			struct ifnet *const ifp = d->bd_bif->bif_ifp;
14621dd0feaaSArchie Cobbs 			struct ifreq *const ifr = (struct ifreq *)addr;
14631dd0feaaSArchie Cobbs 
14649bf40edeSBrooks Davis 			strlcpy(ifr->ifr_name, ifp->if_xname,
14659bf40edeSBrooks Davis 			    sizeof(ifr->ifr_name));
14661dd0feaaSArchie Cobbs 		}
146797aacec6SAlexander V. Chernikov 		BPF_UNLOCK();
1468df8bae1dSRodney W. Grimes 		break;
1469df8bae1dSRodney W. Grimes 
1470df8bae1dSRodney W. Grimes 	/*
1471df8bae1dSRodney W. Grimes 	 * Set interface.
1472df8bae1dSRodney W. Grimes 	 */
1473df8bae1dSRodney W. Grimes 	case BIOCSETIF:
14746c74ff0eSAlexander V. Chernikov 		BPF_LOCK();
1475df8bae1dSRodney W. Grimes 		error = bpf_setif(d, (struct ifreq *)addr);
14766c74ff0eSAlexander V. Chernikov 		BPF_UNLOCK();
1477df8bae1dSRodney W. Grimes 		break;
1478df8bae1dSRodney W. Grimes 
1479df8bae1dSRodney W. Grimes 	/*
1480df8bae1dSRodney W. Grimes 	 * Set read timeout.
1481df8bae1dSRodney W. Grimes 	 */
1482df8bae1dSRodney W. Grimes 	case BIOCSRTIMEOUT:
14839624d947SJuli Mallett #if defined(COMPAT_FREEBSD32) && !defined(__mips__)
1484fc0a61a4SKonstantin Belousov 	case BIOCSRTIMEOUT32:
1485fc0a61a4SKonstantin Belousov #endif
1486df8bae1dSRodney W. Grimes 		{
1487df8bae1dSRodney W. Grimes 			struct timeval *tv = (struct timeval *)addr;
14889624d947SJuli Mallett #if defined(COMPAT_FREEBSD32) && !defined(__mips__)
1489fc0a61a4SKonstantin Belousov 			struct timeval32 *tv32;
1490fc0a61a4SKonstantin Belousov 			struct timeval tv64;
1491fc0a61a4SKonstantin Belousov 
1492fc0a61a4SKonstantin Belousov 			if (cmd == BIOCSRTIMEOUT32) {
1493fc0a61a4SKonstantin Belousov 				tv32 = (struct timeval32 *)addr;
1494fc0a61a4SKonstantin Belousov 				tv = &tv64;
1495fc0a61a4SKonstantin Belousov 				tv->tv_sec = tv32->tv_sec;
1496fc0a61a4SKonstantin Belousov 				tv->tv_usec = tv32->tv_usec;
1497fc0a61a4SKonstantin Belousov 			} else
1498fc0a61a4SKonstantin Belousov #endif
1499fc0a61a4SKonstantin Belousov 				tv = (struct timeval *)addr;
1500df8bae1dSRodney W. Grimes 
1501bdc2cdc5SAlexander Langer 			/*
1502bdc2cdc5SAlexander Langer 			 * Subtract 1 tick from tvtohz() since this isn't
1503bdc2cdc5SAlexander Langer 			 * a one-shot timer.
1504bdc2cdc5SAlexander Langer 			 */
1505bdc2cdc5SAlexander Langer 			if ((error = itimerfix(tv)) == 0)
1506bdc2cdc5SAlexander Langer 				d->bd_rtout = tvtohz(tv) - 1;
1507df8bae1dSRodney W. Grimes 			break;
1508df8bae1dSRodney W. Grimes 		}
1509df8bae1dSRodney W. Grimes 
1510df8bae1dSRodney W. Grimes 	/*
1511df8bae1dSRodney W. Grimes 	 * Get read timeout.
1512df8bae1dSRodney W. Grimes 	 */
1513df8bae1dSRodney W. Grimes 	case BIOCGRTIMEOUT:
15149624d947SJuli Mallett #if defined(COMPAT_FREEBSD32) && !defined(__mips__)
1515fc0a61a4SKonstantin Belousov 	case BIOCGRTIMEOUT32:
1516fc0a61a4SKonstantin Belousov #endif
1517df8bae1dSRodney W. Grimes 		{
1518fc0a61a4SKonstantin Belousov 			struct timeval *tv;
15199624d947SJuli Mallett #if defined(COMPAT_FREEBSD32) && !defined(__mips__)
1520fc0a61a4SKonstantin Belousov 			struct timeval32 *tv32;
1521fc0a61a4SKonstantin Belousov 			struct timeval tv64;
1522fc0a61a4SKonstantin Belousov 
1523fc0a61a4SKonstantin Belousov 			if (cmd == BIOCGRTIMEOUT32)
1524fc0a61a4SKonstantin Belousov 				tv = &tv64;
1525fc0a61a4SKonstantin Belousov 			else
1526fc0a61a4SKonstantin Belousov #endif
1527fc0a61a4SKonstantin Belousov 				tv = (struct timeval *)addr;
1528df8bae1dSRodney W. Grimes 
1529bdc2cdc5SAlexander Langer 			tv->tv_sec = d->bd_rtout / hz;
1530bdc2cdc5SAlexander Langer 			tv->tv_usec = (d->bd_rtout % hz) * tick;
15319624d947SJuli Mallett #if defined(COMPAT_FREEBSD32) && !defined(__mips__)
1532fc0a61a4SKonstantin Belousov 			if (cmd == BIOCGRTIMEOUT32) {
1533fc0a61a4SKonstantin Belousov 				tv32 = (struct timeval32 *)addr;
1534fc0a61a4SKonstantin Belousov 				tv32->tv_sec = tv->tv_sec;
1535fc0a61a4SKonstantin Belousov 				tv32->tv_usec = tv->tv_usec;
1536fc0a61a4SKonstantin Belousov 			}
1537fc0a61a4SKonstantin Belousov #endif
1538fc0a61a4SKonstantin Belousov 
1539df8bae1dSRodney W. Grimes 			break;
1540df8bae1dSRodney W. Grimes 		}
1541df8bae1dSRodney W. Grimes 
1542df8bae1dSRodney W. Grimes 	/*
1543df8bae1dSRodney W. Grimes 	 * Get packet stats.
1544df8bae1dSRodney W. Grimes 	 */
1545df8bae1dSRodney W. Grimes 	case BIOCGSTATS:
1546df8bae1dSRodney W. Grimes 		{
1547df8bae1dSRodney W. Grimes 			struct bpf_stat *bs = (struct bpf_stat *)addr;
1548df8bae1dSRodney W. Grimes 
15494d621040SChristian S.J. Peron 			/* XXXCSJP overflow */
1550df8bae1dSRodney W. Grimes 			bs->bs_recv = d->bd_rcount;
1551df8bae1dSRodney W. Grimes 			bs->bs_drop = d->bd_dcount;
1552df8bae1dSRodney W. Grimes 			break;
1553df8bae1dSRodney W. Grimes 		}
1554df8bae1dSRodney W. Grimes 
1555df8bae1dSRodney W. Grimes 	/*
1556df8bae1dSRodney W. Grimes 	 * Set immediate mode.
1557df8bae1dSRodney W. Grimes 	 */
1558df8bae1dSRodney W. Grimes 	case BIOCIMMEDIATE:
155997aacec6SAlexander V. Chernikov 		BPFD_LOCK(d);
1560df8bae1dSRodney W. Grimes 		d->bd_immediate = *(u_int *)addr;
156197aacec6SAlexander V. Chernikov 		BPFD_UNLOCK(d);
1562df8bae1dSRodney W. Grimes 		break;
1563df8bae1dSRodney W. Grimes 
1564df8bae1dSRodney W. Grimes 	case BIOCVERSION:
1565df8bae1dSRodney W. Grimes 		{
1566df8bae1dSRodney W. Grimes 			struct bpf_version *bv = (struct bpf_version *)addr;
1567df8bae1dSRodney W. Grimes 
1568df8bae1dSRodney W. Grimes 			bv->bv_major = BPF_MAJOR_VERSION;
1569df8bae1dSRodney W. Grimes 			bv->bv_minor = BPF_MINOR_VERSION;
1570df8bae1dSRodney W. Grimes 			break;
1571df8bae1dSRodney W. Grimes 		}
157200a83887SPaul Traina 
1573114ae644SMike Smith 	/*
1574114ae644SMike Smith 	 * Get "header already complete" flag
1575114ae644SMike Smith 	 */
1576114ae644SMike Smith 	case BIOCGHDRCMPLT:
157797aacec6SAlexander V. Chernikov 		BPFD_LOCK(d);
1578114ae644SMike Smith 		*(u_int *)addr = d->bd_hdrcmplt;
157997aacec6SAlexander V. Chernikov 		BPFD_UNLOCK(d);
1580114ae644SMike Smith 		break;
1581114ae644SMike Smith 
1582114ae644SMike Smith 	/*
1583114ae644SMike Smith 	 * Set "header already complete" flag
1584114ae644SMike Smith 	 */
1585114ae644SMike Smith 	case BIOCSHDRCMPLT:
158697aacec6SAlexander V. Chernikov 		BPFD_LOCK(d);
1587114ae644SMike Smith 		d->bd_hdrcmplt = *(u_int *)addr ? 1 : 0;
158897aacec6SAlexander V. Chernikov 		BPFD_UNLOCK(d);
1589114ae644SMike Smith 		break;
1590114ae644SMike Smith 
15918ed3828cSRobert Watson 	/*
1592560a54e1SJung-uk Kim 	 * Get packet direction flag
15938ed3828cSRobert Watson 	 */
1594560a54e1SJung-uk Kim 	case BIOCGDIRECTION:
159597aacec6SAlexander V. Chernikov 		BPFD_LOCK(d);
1596560a54e1SJung-uk Kim 		*(u_int *)addr = d->bd_direction;
159797aacec6SAlexander V. Chernikov 		BPFD_UNLOCK(d);
15988ed3828cSRobert Watson 		break;
15998ed3828cSRobert Watson 
16008ed3828cSRobert Watson 	/*
1601560a54e1SJung-uk Kim 	 * Set packet direction flag
16028ed3828cSRobert Watson 	 */
1603560a54e1SJung-uk Kim 	case BIOCSDIRECTION:
1604560a54e1SJung-uk Kim 		{
1605560a54e1SJung-uk Kim 			u_int	direction;
1606560a54e1SJung-uk Kim 
1607560a54e1SJung-uk Kim 			direction = *(u_int *)addr;
1608560a54e1SJung-uk Kim 			switch (direction) {
1609560a54e1SJung-uk Kim 			case BPF_D_IN:
1610560a54e1SJung-uk Kim 			case BPF_D_INOUT:
1611560a54e1SJung-uk Kim 			case BPF_D_OUT:
161297aacec6SAlexander V. Chernikov 				BPFD_LOCK(d);
1613560a54e1SJung-uk Kim 				d->bd_direction = direction;
161497aacec6SAlexander V. Chernikov 				BPFD_UNLOCK(d);
1615560a54e1SJung-uk Kim 				break;
1616560a54e1SJung-uk Kim 			default:
1617560a54e1SJung-uk Kim 				error = EINVAL;
1618560a54e1SJung-uk Kim 			}
1619560a54e1SJung-uk Kim 		}
1620560a54e1SJung-uk Kim 		break;
1621560a54e1SJung-uk Kim 
1622547d94bdSJung-uk Kim 	/*
1623d0d7bcdfSJung-uk Kim 	 * Get packet timestamp format and resolution.
1624547d94bdSJung-uk Kim 	 */
1625547d94bdSJung-uk Kim 	case BIOCGTSTAMP:
162697aacec6SAlexander V. Chernikov 		BPFD_LOCK(d);
1627547d94bdSJung-uk Kim 		*(u_int *)addr = d->bd_tstamp;
162897aacec6SAlexander V. Chernikov 		BPFD_UNLOCK(d);
1629547d94bdSJung-uk Kim 		break;
1630547d94bdSJung-uk Kim 
1631547d94bdSJung-uk Kim 	/*
1632547d94bdSJung-uk Kim 	 * Set packet timestamp format and resolution.
1633547d94bdSJung-uk Kim 	 */
1634547d94bdSJung-uk Kim 	case BIOCSTSTAMP:
1635547d94bdSJung-uk Kim 		{
1636547d94bdSJung-uk Kim 			u_int	func;
1637547d94bdSJung-uk Kim 
1638547d94bdSJung-uk Kim 			func = *(u_int *)addr;
1639547d94bdSJung-uk Kim 			if (BPF_T_VALID(func))
1640547d94bdSJung-uk Kim 				d->bd_tstamp = func;
1641547d94bdSJung-uk Kim 			else
1642547d94bdSJung-uk Kim 				error = EINVAL;
1643547d94bdSJung-uk Kim 		}
1644547d94bdSJung-uk Kim 		break;
1645547d94bdSJung-uk Kim 
1646560a54e1SJung-uk Kim 	case BIOCFEEDBACK:
164797aacec6SAlexander V. Chernikov 		BPFD_LOCK(d);
1648560a54e1SJung-uk Kim 		d->bd_feedback = *(u_int *)addr;
164997aacec6SAlexander V. Chernikov 		BPFD_UNLOCK(d);
1650560a54e1SJung-uk Kim 		break;
1651560a54e1SJung-uk Kim 
1652560a54e1SJung-uk Kim 	case BIOCLOCK:
165397aacec6SAlexander V. Chernikov 		BPFD_LOCK(d);
1654560a54e1SJung-uk Kim 		d->bd_locked = 1;
165597aacec6SAlexander V. Chernikov 		BPFD_UNLOCK(d);
16568ed3828cSRobert Watson 		break;
16578ed3828cSRobert Watson 
165800a83887SPaul Traina 	case FIONBIO:		/* Non-blocking I/O */
165900a83887SPaul Traina 		break;
166000a83887SPaul Traina 
166100a83887SPaul Traina 	case FIOASYNC:		/* Send signal on receive packets */
166297aacec6SAlexander V. Chernikov 		BPFD_LOCK(d);
166300a83887SPaul Traina 		d->bd_async = *(int *)addr;
166497aacec6SAlexander V. Chernikov 		BPFD_UNLOCK(d);
166500a83887SPaul Traina 		break;
166600a83887SPaul Traina 
1667831d27a9SDon Lewis 	case FIOSETOWN:
166897aacec6SAlexander V. Chernikov 		/*
166997aacec6SAlexander V. Chernikov 		 * XXX: Add some sort of locking here?
167097aacec6SAlexander V. Chernikov 		 * fsetown() can sleep.
167197aacec6SAlexander V. Chernikov 		 */
1672831d27a9SDon Lewis 		error = fsetown(*(int *)addr, &d->bd_sigio);
167300a83887SPaul Traina 		break;
167400a83887SPaul Traina 
1675831d27a9SDon Lewis 	case FIOGETOWN:
167697aacec6SAlexander V. Chernikov 		BPFD_LOCK(d);
167791e97a82SDon Lewis 		*(int *)addr = fgetown(&d->bd_sigio);
167897aacec6SAlexander V. Chernikov 		BPFD_UNLOCK(d);
1679831d27a9SDon Lewis 		break;
1680831d27a9SDon Lewis 
1681831d27a9SDon Lewis 	/* This is deprecated, FIOSETOWN should be used instead. */
1682831d27a9SDon Lewis 	case TIOCSPGRP:
1683831d27a9SDon Lewis 		error = fsetown(-(*(int *)addr), &d->bd_sigio);
1684831d27a9SDon Lewis 		break;
1685831d27a9SDon Lewis 
1686831d27a9SDon Lewis 	/* This is deprecated, FIOGETOWN should be used instead. */
168700a83887SPaul Traina 	case TIOCGPGRP:
168891e97a82SDon Lewis 		*(int *)addr = -fgetown(&d->bd_sigio);
168900a83887SPaul Traina 		break;
169000a83887SPaul Traina 
169100a83887SPaul Traina 	case BIOCSRSIG:		/* Set receive signal */
169200a83887SPaul Traina 		{
169300a83887SPaul Traina 			u_int sig;
169400a83887SPaul Traina 
169500a83887SPaul Traina 			sig = *(u_int *)addr;
169600a83887SPaul Traina 
169700a83887SPaul Traina 			if (sig >= NSIG)
169800a83887SPaul Traina 				error = EINVAL;
169997aacec6SAlexander V. Chernikov 			else {
170097aacec6SAlexander V. Chernikov 				BPFD_LOCK(d);
170100a83887SPaul Traina 				d->bd_sig = sig;
170297aacec6SAlexander V. Chernikov 				BPFD_UNLOCK(d);
170397aacec6SAlexander V. Chernikov 			}
170400a83887SPaul Traina 			break;
170500a83887SPaul Traina 		}
170600a83887SPaul Traina 	case BIOCGRSIG:
170797aacec6SAlexander V. Chernikov 		BPFD_LOCK(d);
170800a83887SPaul Traina 		*(u_int *)addr = d->bd_sig;
170997aacec6SAlexander V. Chernikov 		BPFD_UNLOCK(d);
171000a83887SPaul Traina 		break;
17114d621040SChristian S.J. Peron 
17124d621040SChristian S.J. Peron 	case BIOCGETBUFMODE:
171397aacec6SAlexander V. Chernikov 		BPFD_LOCK(d);
17144d621040SChristian S.J. Peron 		*(u_int *)addr = d->bd_bufmode;
171597aacec6SAlexander V. Chernikov 		BPFD_UNLOCK(d);
17164d621040SChristian S.J. Peron 		break;
17174d621040SChristian S.J. Peron 
17184d621040SChristian S.J. Peron 	case BIOCSETBUFMODE:
17194d621040SChristian S.J. Peron 		/*
17204d621040SChristian S.J. Peron 		 * Allow the buffering mode to be changed as long as we
17214d621040SChristian S.J. Peron 		 * haven't yet committed to a particular mode.  Our
17224d621040SChristian S.J. Peron 		 * definition of commitment, for now, is whether or not a
17234d621040SChristian S.J. Peron 		 * buffer has been allocated or an interface attached, since
17244d621040SChristian S.J. Peron 		 * that's the point where things get tricky.
17254d621040SChristian S.J. Peron 		 */
17264d621040SChristian S.J. Peron 		switch (*(u_int *)addr) {
17274d621040SChristian S.J. Peron 		case BPF_BUFMODE_BUFFER:
17284d621040SChristian S.J. Peron 			break;
17294d621040SChristian S.J. Peron 
17304d621040SChristian S.J. Peron 		case BPF_BUFMODE_ZBUF:
17314d621040SChristian S.J. Peron 			if (bpf_zerocopy_enable)
17324d621040SChristian S.J. Peron 				break;
17334d621040SChristian S.J. Peron 			/* FALLSTHROUGH */
17344d621040SChristian S.J. Peron 
17354d621040SChristian S.J. Peron 		default:
17361b610a74SBjoern A. Zeeb 			CURVNET_RESTORE();
17374d621040SChristian S.J. Peron 			return (EINVAL);
17384d621040SChristian S.J. Peron 		}
17394d621040SChristian S.J. Peron 
1740afa85850SAlexander V. Chernikov 		BPFD_LOCK(d);
17414d621040SChristian S.J. Peron 		if (d->bd_sbuf != NULL || d->bd_hbuf != NULL ||
17424d621040SChristian S.J. Peron 		    d->bd_fbuf != NULL || d->bd_bif != NULL) {
1743afa85850SAlexander V. Chernikov 			BPFD_UNLOCK(d);
17441b610a74SBjoern A. Zeeb 			CURVNET_RESTORE();
17454d621040SChristian S.J. Peron 			return (EBUSY);
17464d621040SChristian S.J. Peron 		}
17474d621040SChristian S.J. Peron 		d->bd_bufmode = *(u_int *)addr;
1748afa85850SAlexander V. Chernikov 		BPFD_UNLOCK(d);
17494d621040SChristian S.J. Peron 		break;
17504d621040SChristian S.J. Peron 
17514d621040SChristian S.J. Peron 	case BIOCGETZMAX:
17521b610a74SBjoern A. Zeeb 		error = bpf_ioctl_getzmax(td, d, (size_t *)addr);
17531b610a74SBjoern A. Zeeb 		break;
17544d621040SChristian S.J. Peron 
17554d621040SChristian S.J. Peron 	case BIOCSETZBUF:
17561b610a74SBjoern A. Zeeb 		error = bpf_ioctl_setzbuf(td, d, (struct bpf_zbuf *)addr);
17571b610a74SBjoern A. Zeeb 		break;
17584d621040SChristian S.J. Peron 
17594d621040SChristian S.J. Peron 	case BIOCROTZBUF:
17601b610a74SBjoern A. Zeeb 		error = bpf_ioctl_rotzbuf(td, d, (struct bpf_zbuf *)addr);
17611b610a74SBjoern A. Zeeb 		break;
1762df8bae1dSRodney W. Grimes 	}
176397021c24SMarko Zec 	CURVNET_RESTORE();
1764df8bae1dSRodney W. Grimes 	return (error);
1765df8bae1dSRodney W. Grimes }
1766df8bae1dSRodney W. Grimes 
1767df8bae1dSRodney W. Grimes /*
1768df8bae1dSRodney W. Grimes  * Set d's packet filter program to fp.  If this file already has a filter,
1769df8bae1dSRodney W. Grimes  * free it and replace it.  Returns EINVAL for bogus requests.
1770784292f8SAlexander V. Chernikov  *
1771784292f8SAlexander V. Chernikov  * Note we need global lock here to serialize bpf_setf() and bpf_setif() calls
1772784292f8SAlexander V. Chernikov  * since reading d->bd_bif can't be protected by d or interface lock due to
1773784292f8SAlexander V. Chernikov  * lock order.
1774784292f8SAlexander V. Chernikov  *
1775784292f8SAlexander V. Chernikov  * Additionally, we have to acquire the interface write lock because bpf_mtap()
1776784292f8SAlexander V. Chernikov  * uses the interface read lock to read all filters.
1777784292f8SAlexander V. Chernikov  *
1778df8bae1dSRodney W. Grimes  */
1779f708ef1bSPoul-Henning Kamp static int
178019ba8395SChristian S.J. Peron bpf_setf(struct bpf_d *d, struct bpf_program *fp, u_long cmd)
1781df8bae1dSRodney W. Grimes {
17829b7d4a7fSJung-uk Kim #ifdef COMPAT_FREEBSD32
17839b7d4a7fSJung-uk Kim 	struct bpf_program fp_swab;
17849b7d4a7fSJung-uk Kim 	struct bpf_program32 *fp32;
17859b7d4a7fSJung-uk Kim #endif
1786df8bae1dSRodney W. Grimes 	struct bpf_insn *fcode, *old;
1787293c06a1SRuslan Ermilov #ifdef BPF_JITTER
1788a86227d1SAlexander V. Chernikov 	bpf_jit_filter *jfunc, *ofunc;
1789ae275efcSJung-uk Kim #endif
17908b04b48aSJung-uk Kim 	size_t size;
17918b04b48aSJung-uk Kim 	u_int flen;
17929431cc16SAlexander V. Chernikov 	int need_upgrade;
1793df8bae1dSRodney W. Grimes 
17949b7d4a7fSJung-uk Kim #ifdef COMPAT_FREEBSD32
17956f731135SJung-uk Kim 	switch (cmd) {
17966f731135SJung-uk Kim 	case BIOCSETF32:
17976f731135SJung-uk Kim 	case BIOCSETWF32:
17986f731135SJung-uk Kim 	case BIOCSETFNR32:
1799fc0a61a4SKonstantin Belousov 		fp32 = (struct bpf_program32 *)fp;
1800fc0a61a4SKonstantin Belousov 		fp_swab.bf_len = fp32->bf_len;
1801fc0a61a4SKonstantin Belousov 		fp_swab.bf_insns = (struct bpf_insn *)(uintptr_t)fp32->bf_insns;
1802fc0a61a4SKonstantin Belousov 		fp = &fp_swab;
18036f731135SJung-uk Kim 		switch (cmd) {
18046f731135SJung-uk Kim 		case BIOCSETF32:
18056f731135SJung-uk Kim 			cmd = BIOCSETF;
18066f731135SJung-uk Kim 			break;
18076f731135SJung-uk Kim 		case BIOCSETWF32:
1808fc0a61a4SKonstantin Belousov 			cmd = BIOCSETWF;
18096f731135SJung-uk Kim 			break;
18106f731135SJung-uk Kim 		}
18116f731135SJung-uk Kim 		break;
1812fc0a61a4SKonstantin Belousov 	}
1813fc0a61a4SKonstantin Belousov #endif
18148b04b48aSJung-uk Kim 
18158b04b48aSJung-uk Kim 	fcode = NULL;
18168b04b48aSJung-uk Kim #ifdef BPF_JITTER
18178b04b48aSJung-uk Kim 	jfunc = ofunc = NULL;
18188b04b48aSJung-uk Kim #endif
18199b7d4a7fSJung-uk Kim 	need_upgrade = 0;
18208b04b48aSJung-uk Kim 
18216c74ff0eSAlexander V. Chernikov 	/*
18226c74ff0eSAlexander V. Chernikov 	 * Check new filter validness before acquiring any locks.
18236c74ff0eSAlexander V. Chernikov 	 * Allocate memory for new filter, if needed.
18246c74ff0eSAlexander V. Chernikov 	 */
18256c74ff0eSAlexander V. Chernikov 	flen = fp->bf_len;
18269b7d4a7fSJung-uk Kim 	if (flen > bpf_maxinsns || (fp->bf_insns == NULL && flen != 0))
18276c74ff0eSAlexander V. Chernikov 		return (EINVAL);
18286c74ff0eSAlexander V. Chernikov 	size = flen * sizeof(*fp->bf_insns);
1829a86227d1SAlexander V. Chernikov 	if (size > 0) {
18309b7d4a7fSJung-uk Kim 		/* We're setting up new filter.  Copy and check actual data. */
18319b7d4a7fSJung-uk Kim 		fcode = malloc(size, M_BPF, M_WAITOK);
18329b7d4a7fSJung-uk Kim 		if (copyin(fp->bf_insns, fcode, size) != 0 ||
18339b7d4a7fSJung-uk Kim 		    !bpf_validate(fcode, flen)) {
1834a86227d1SAlexander V. Chernikov 			free(fcode, M_BPF);
1835a86227d1SAlexander V. Chernikov 			return (EINVAL);
1836a86227d1SAlexander V. Chernikov 		}
1837c7b0200eSAlexander V. Chernikov #ifdef BPF_JITTER
18389b7d4a7fSJung-uk Kim 		/* Filter is copied inside fcode and is perfectly valid. */
1839c7b0200eSAlexander V. Chernikov 		jfunc = bpf_jitter(fcode, flen);
1840c7b0200eSAlexander V. Chernikov #endif
18418b04b48aSJung-uk Kim 	}
1842c7b0200eSAlexander V. Chernikov 
18436c74ff0eSAlexander V. Chernikov 	BPF_LOCK();
18446c74ff0eSAlexander V. Chernikov 
1845e4b3229aSAlexander V. Chernikov 	/*
1846a86227d1SAlexander V. Chernikov 	 * Set up new filter.
18479b7d4a7fSJung-uk Kim 	 * Protect filter change by interface lock.
18486c74ff0eSAlexander V. Chernikov 	 * Additionally, we are protected by global lock here.
1849e4b3229aSAlexander V. Chernikov 	 */
18506c74ff0eSAlexander V. Chernikov 	if (d->bd_bif != NULL)
1851e4b3229aSAlexander V. Chernikov 		BPFIF_WLOCK(d->bd_bif);
1852afa85850SAlexander V. Chernikov 	BPFD_LOCK(d);
18538b04b48aSJung-uk Kim 	if (cmd == BIOCSETWF) {
18548b04b48aSJung-uk Kim 		old = d->bd_wfilter;
185593e39f0bSChristian S.J. Peron 		d->bd_wfilter = fcode;
18568b04b48aSJung-uk Kim 	} else {
18578b04b48aSJung-uk Kim 		old = d->bd_rfilter;
185893e39f0bSChristian S.J. Peron 		d->bd_rfilter = fcode;
1859293c06a1SRuslan Ermilov #ifdef BPF_JITTER
18608b04b48aSJung-uk Kim 		ofunc = d->bd_bfilter;
1861c7b0200eSAlexander V. Chernikov 		d->bd_bfilter = jfunc;
1862ae275efcSJung-uk Kim #endif
1863f11c3508SDavid Malone 		if (cmd == BIOCSETF)
1864df8bae1dSRodney W. Grimes 			reset_d(d);
186551ec1eb7SAlexander V. Chernikov 
1866402000ffSAlexander V. Chernikov 		need_upgrade = bpf_check_upgrade(cmd, d, fcode, flen);
18678b04b48aSJung-uk Kim 	}
1868afa85850SAlexander V. Chernikov 	BPFD_UNLOCK(d);
18696c74ff0eSAlexander V. Chernikov 	if (d->bd_bif != NULL)
1870e4b3229aSAlexander V. Chernikov 		BPFIF_WUNLOCK(d->bd_bif);
1871572bde2aSRobert Watson 	if (old != NULL)
18729b7d4a7fSJung-uk Kim 		free(old, M_BPF);
1873293c06a1SRuslan Ermilov #ifdef BPF_JITTER
1874ae275efcSJung-uk Kim 	if (ofunc != NULL)
1875ae275efcSJung-uk Kim 		bpf_destroy_jit_filter(ofunc);
1876ae275efcSJung-uk Kim #endif
1877df8bae1dSRodney W. Grimes 
18789b7d4a7fSJung-uk Kim 	/* Move d to active readers list. */
1879402000ffSAlexander V. Chernikov 	if (need_upgrade != 0)
188051ec1eb7SAlexander V. Chernikov 		bpf_upgraded(d);
188151ec1eb7SAlexander V. Chernikov 
18826c74ff0eSAlexander V. Chernikov 	BPF_UNLOCK();
1883df8bae1dSRodney W. Grimes 	return (0);
1884df8bae1dSRodney W. Grimes }
1885df8bae1dSRodney W. Grimes 
1886df8bae1dSRodney W. Grimes /*
1887df8bae1dSRodney W. Grimes  * Detach a file from its current interface (if attached at all) and attach
1888df8bae1dSRodney W. Grimes  * to the interface indicated by the name stored in ifr.
1889df8bae1dSRodney W. Grimes  * Return an errno or 0.
1890df8bae1dSRodney W. Grimes  */
1891df8bae1dSRodney W. Grimes static int
189219ba8395SChristian S.J. Peron bpf_setif(struct bpf_d *d, struct ifreq *ifr)
1893df8bae1dSRodney W. Grimes {
1894df8bae1dSRodney W. Grimes 	struct bpf_if *bp;
18959b44ff22SGarrett Wollman 	struct ifnet *theywant;
1896df8bae1dSRodney W. Grimes 
18976c74ff0eSAlexander V. Chernikov 	BPF_LOCK_ASSERT();
18986c74ff0eSAlexander V. Chernikov 
18999b44ff22SGarrett Wollman 	theywant = ifunit(ifr->ifr_name);
190016d878ccSChristian S.J. Peron 	if (theywant == NULL || theywant->if_bpf == NULL)
190116d878ccSChristian S.J. Peron 		return (ENXIO);
19029b44ff22SGarrett Wollman 
190316d878ccSChristian S.J. Peron 	bp = theywant->if_bpf;
19044d621040SChristian S.J. Peron 
1905afa85850SAlexander V. Chernikov 	/* Check if interface is not being detached from BPF */
1906afa85850SAlexander V. Chernikov 	BPFIF_RLOCK(bp);
1907afa85850SAlexander V. Chernikov 	if (bp->flags & BPFIF_FLAG_DYING) {
1908afa85850SAlexander V. Chernikov 		BPFIF_RUNLOCK(bp);
1909afa85850SAlexander V. Chernikov 		return (ENXIO);
1910afa85850SAlexander V. Chernikov 	}
1911afa85850SAlexander V. Chernikov 	BPFIF_RUNLOCK(bp);
1912afa85850SAlexander V. Chernikov 
1913df8bae1dSRodney W. Grimes 	/*
19144d621040SChristian S.J. Peron 	 * Behavior here depends on the buffering model.  If we're using
19154d621040SChristian S.J. Peron 	 * kernel memory buffers, then we can allocate them here.  If we're
19164d621040SChristian S.J. Peron 	 * using zero-copy, then the user process must have registered
19174d621040SChristian S.J. Peron 	 * buffers by the time we get here.  If not, return an error.
1918df8bae1dSRodney W. Grimes 	 */
19194d621040SChristian S.J. Peron 	switch (d->bd_bufmode) {
19204d621040SChristian S.J. Peron 	case BPF_BUFMODE_BUFFER:
19214d621040SChristian S.J. Peron 	case BPF_BUFMODE_ZBUF:
19224d621040SChristian S.J. Peron 		if (d->bd_sbuf == NULL)
19234d621040SChristian S.J. Peron 			return (EINVAL);
19244d621040SChristian S.J. Peron 		break;
19254d621040SChristian S.J. Peron 
19264d621040SChristian S.J. Peron 	default:
19274d621040SChristian S.J. Peron 		panic("bpf_setif: bufmode %d", d->bd_bufmode);
19284d621040SChristian S.J. Peron 	}
19296c74ff0eSAlexander V. Chernikov 	if (bp != d->bd_bif)
1930df8bae1dSRodney W. Grimes 		bpf_attachd(d, bp);
1931afa85850SAlexander V. Chernikov 	BPFD_LOCK(d);
1932df8bae1dSRodney W. Grimes 	reset_d(d);
1933afa85850SAlexander V. Chernikov 	BPFD_UNLOCK(d);
1934df8bae1dSRodney W. Grimes 	return (0);
1935df8bae1dSRodney W. Grimes }
1936df8bae1dSRodney W. Grimes 
1937df8bae1dSRodney W. Grimes /*
1938243ac7d8SPeter Wemm  * Support for select() and poll() system calls
1939df8bae1dSRodney W. Grimes  *
1940df8bae1dSRodney W. Grimes  * Return true iff the specific operation will not block indefinitely.
1941df8bae1dSRodney W. Grimes  * Otherwise, return false but make a note that a selwakeup() must be done.
1942df8bae1dSRodney W. Grimes  */
194337c84183SPoul-Henning Kamp static int
194419ba8395SChristian S.J. Peron bpfpoll(struct cdev *dev, int events, struct thread *td)
1945df8bae1dSRodney W. Grimes {
1946e7bb21b3SJonathan Lemon 	struct bpf_d *d;
19470832fc64SGarance A Drosehn 	int revents;
1948df8bae1dSRodney W. Grimes 
1949136600feSEd Schouten 	if (devfs_get_cdevpriv((void **)&d) != 0 || d->bd_bif == NULL)
1950136600feSEd Schouten 		return (events &
1951136600feSEd Schouten 		    (POLLHUP|POLLIN|POLLRDNORM|POLLOUT|POLLWRNORM));
1952de5d9935SRobert Watson 
1953b75a24a0SChristian S.J. Peron 	/*
1954b75a24a0SChristian S.J. Peron 	 * Refresh PID associated with this descriptor.
1955b75a24a0SChristian S.J. Peron 	 */
19560832fc64SGarance A Drosehn 	revents = events & (POLLOUT | POLLWRNORM);
1957afa85850SAlexander V. Chernikov 	BPFD_LOCK(d);
1958e4b3229aSAlexander V. Chernikov 	BPF_PID_REFRESH(d, td);
195975c13541SPoul-Henning Kamp 	if (events & (POLLIN | POLLRDNORM)) {
196095aab9ccSJohn-Mark Gurney 		if (bpf_ready(d))
1961243ac7d8SPeter Wemm 			revents |= events & (POLLIN | POLLRDNORM);
196281bda851SJohn Polstra 		else {
1963ed01445dSJohn Baldwin 			selrecord(td, &d->bd_sel);
196481bda851SJohn Polstra 			/* Start the read timeout if necessary. */
196581bda851SJohn Polstra 			if (d->bd_rtout > 0 && d->bd_state == BPF_IDLE) {
196681bda851SJohn Polstra 				callout_reset(&d->bd_callout, d->bd_rtout,
196781bda851SJohn Polstra 				    bpf_timed_out, d);
196881bda851SJohn Polstra 				d->bd_state = BPF_WAITING;
196981bda851SJohn Polstra 			}
197081bda851SJohn Polstra 		}
197175c13541SPoul-Henning Kamp 	}
1972afa85850SAlexander V. Chernikov 	BPFD_UNLOCK(d);
1973243ac7d8SPeter Wemm 	return (revents);
1974df8bae1dSRodney W. Grimes }
1975df8bae1dSRodney W. Grimes 
1976df8bae1dSRodney W. Grimes /*
197795aab9ccSJohn-Mark Gurney  * Support for kevent() system call.  Register EVFILT_READ filters and
197895aab9ccSJohn-Mark Gurney  * reject all others.
197995aab9ccSJohn-Mark Gurney  */
198095aab9ccSJohn-Mark Gurney int
198119ba8395SChristian S.J. Peron bpfkqfilter(struct cdev *dev, struct knote *kn)
198295aab9ccSJohn-Mark Gurney {
1983136600feSEd Schouten 	struct bpf_d *d;
198495aab9ccSJohn-Mark Gurney 
1985136600feSEd Schouten 	if (devfs_get_cdevpriv((void **)&d) != 0 ||
1986136600feSEd Schouten 	    kn->kn_filter != EVFILT_READ)
198795aab9ccSJohn-Mark Gurney 		return (1);
198895aab9ccSJohn-Mark Gurney 
1989b75a24a0SChristian S.J. Peron 	/*
1990b75a24a0SChristian S.J. Peron 	 * Refresh PID associated with this descriptor.
1991b75a24a0SChristian S.J. Peron 	 */
1992afa85850SAlexander V. Chernikov 	BPFD_LOCK(d);
1993e4b3229aSAlexander V. Chernikov 	BPF_PID_REFRESH_CUR(d);
199495aab9ccSJohn-Mark Gurney 	kn->kn_fop = &bpfread_filtops;
199595aab9ccSJohn-Mark Gurney 	kn->kn_hook = d;
19964b19419eSChristian S.J. Peron 	knlist_add(&d->bd_sel.si_note, kn, 1);
1997afa85850SAlexander V. Chernikov 	BPFD_UNLOCK(d);
199895aab9ccSJohn-Mark Gurney 
199995aab9ccSJohn-Mark Gurney 	return (0);
200095aab9ccSJohn-Mark Gurney }
200195aab9ccSJohn-Mark Gurney 
200295aab9ccSJohn-Mark Gurney static void
200319ba8395SChristian S.J. Peron filt_bpfdetach(struct knote *kn)
200495aab9ccSJohn-Mark Gurney {
200595aab9ccSJohn-Mark Gurney 	struct bpf_d *d = (struct bpf_d *)kn->kn_hook;
200695aab9ccSJohn-Mark Gurney 
2007ad3b9257SJohn-Mark Gurney 	knlist_remove(&d->bd_sel.si_note, kn, 0);
200895aab9ccSJohn-Mark Gurney }
200995aab9ccSJohn-Mark Gurney 
201095aab9ccSJohn-Mark Gurney static int
201119ba8395SChristian S.J. Peron filt_bpfread(struct knote *kn, long hint)
201295aab9ccSJohn-Mark Gurney {
201395aab9ccSJohn-Mark Gurney 	struct bpf_d *d = (struct bpf_d *)kn->kn_hook;
201495aab9ccSJohn-Mark Gurney 	int ready;
201595aab9ccSJohn-Mark Gurney 
2016afa85850SAlexander V. Chernikov 	BPFD_LOCK_ASSERT(d);
201795aab9ccSJohn-Mark Gurney 	ready = bpf_ready(d);
201895aab9ccSJohn-Mark Gurney 	if (ready) {
201995aab9ccSJohn-Mark Gurney 		kn->kn_data = d->bd_slen;
20203b3b91e7SGuy Helmer 		while (d->bd_hbuf_in_use)
20213b3b91e7SGuy Helmer 			mtx_sleep(&d->bd_hbuf_in_use, &d->bd_lock,
20223b3b91e7SGuy Helmer 			    PRINET, "bd_hbuf", 0);
202395aab9ccSJohn-Mark Gurney 		if (d->bd_hbuf)
202495aab9ccSJohn-Mark Gurney 			kn->kn_data += d->bd_hlen;
20255d7af3a1SJung-uk Kim 	} else if (d->bd_rtout > 0 && d->bd_state == BPF_IDLE) {
202695aab9ccSJohn-Mark Gurney 		callout_reset(&d->bd_callout, d->bd_rtout,
202795aab9ccSJohn-Mark Gurney 		    bpf_timed_out, d);
202895aab9ccSJohn-Mark Gurney 		d->bd_state = BPF_WAITING;
202995aab9ccSJohn-Mark Gurney 	}
203095aab9ccSJohn-Mark Gurney 
203195aab9ccSJohn-Mark Gurney 	return (ready);
203295aab9ccSJohn-Mark Gurney }
203395aab9ccSJohn-Mark Gurney 
2034253a3814SLawrence Stewart #define	BPF_TSTAMP_NONE		0
2035253a3814SLawrence Stewart #define	BPF_TSTAMP_FAST		1
2036253a3814SLawrence Stewart #define	BPF_TSTAMP_NORMAL	2
2037253a3814SLawrence Stewart #define	BPF_TSTAMP_EXTERN	3
2038253a3814SLawrence Stewart 
2039253a3814SLawrence Stewart static int
2040253a3814SLawrence Stewart bpf_ts_quality(int tstype)
2041253a3814SLawrence Stewart {
2042253a3814SLawrence Stewart 
2043253a3814SLawrence Stewart 	if (tstype == BPF_T_NONE)
2044253a3814SLawrence Stewart 		return (BPF_TSTAMP_NONE);
2045253a3814SLawrence Stewart 	if ((tstype & BPF_T_FAST) != 0)
2046253a3814SLawrence Stewart 		return (BPF_TSTAMP_FAST);
2047253a3814SLawrence Stewart 
2048253a3814SLawrence Stewart 	return (BPF_TSTAMP_NORMAL);
2049253a3814SLawrence Stewart }
2050253a3814SLawrence Stewart 
2051253a3814SLawrence Stewart static int
2052253a3814SLawrence Stewart bpf_gettime(struct bintime *bt, int tstype, struct mbuf *m)
2053253a3814SLawrence Stewart {
2054253a3814SLawrence Stewart 	struct m_tag *tag;
2055253a3814SLawrence Stewart 	int quality;
2056253a3814SLawrence Stewart 
2057253a3814SLawrence Stewart 	quality = bpf_ts_quality(tstype);
2058253a3814SLawrence Stewart 	if (quality == BPF_TSTAMP_NONE)
2059253a3814SLawrence Stewart 		return (quality);
2060253a3814SLawrence Stewart 
2061253a3814SLawrence Stewart 	if (m != NULL) {
2062253a3814SLawrence Stewart 		tag = m_tag_locate(m, MTAG_BPF, MTAG_BPF_TIMESTAMP, NULL);
2063253a3814SLawrence Stewart 		if (tag != NULL) {
2064253a3814SLawrence Stewart 			*bt = *(struct bintime *)(tag + 1);
2065253a3814SLawrence Stewart 			return (BPF_TSTAMP_EXTERN);
2066253a3814SLawrence Stewart 		}
2067253a3814SLawrence Stewart 	}
2068253a3814SLawrence Stewart 	if (quality == BPF_TSTAMP_NORMAL)
2069253a3814SLawrence Stewart 		binuptime(bt);
2070253a3814SLawrence Stewart 	else
2071253a3814SLawrence Stewart 		getbinuptime(bt);
2072253a3814SLawrence Stewart 
2073253a3814SLawrence Stewart 	return (quality);
2074253a3814SLawrence Stewart }
2075253a3814SLawrence Stewart 
207695aab9ccSJohn-Mark Gurney /*
2077df8bae1dSRodney W. Grimes  * Incoming linkage from device drivers.  Process the packet pkt, of length
2078df8bae1dSRodney W. Grimes  * pktlen, which is stored in a contiguous buffer.  The packet is parsed
2079df8bae1dSRodney W. Grimes  * by each process' filter, and if accepted, stashed into the corresponding
2080df8bae1dSRodney W. Grimes  * buffer.
2081df8bae1dSRodney W. Grimes  */
2082df8bae1dSRodney W. Grimes void
208319ba8395SChristian S.J. Peron bpf_tap(struct bpf_if *bp, u_char *pkt, u_int pktlen)
2084df8bae1dSRodney W. Grimes {
2085547d94bdSJung-uk Kim 	struct bintime bt;
20868994a245SDag-Erling Smørgrav 	struct bpf_d *d;
2087a36599ccSJung-uk Kim #ifdef BPF_JITTER
2088a36599ccSJung-uk Kim 	bpf_jit_filter *bf;
2089a36599ccSJung-uk Kim #endif
2090253a3814SLawrence Stewart 	u_int slen;
2091253a3814SLawrence Stewart 	int gottime;
2092e7bb21b3SJonathan Lemon 
2093253a3814SLawrence Stewart 	gottime = BPF_TSTAMP_NONE;
2094e4b3229aSAlexander V. Chernikov 
2095e4b3229aSAlexander V. Chernikov 	BPFIF_RLOCK(bp);
2096e4b3229aSAlexander V. Chernikov 
20974a3feeaaSRobert Watson 	LIST_FOREACH(d, &bp->bif_dlist, bd_next) {
2098e4b3229aSAlexander V. Chernikov 		/*
2099e4b3229aSAlexander V. Chernikov 		 * We are not using any locks for d here because:
2100e4b3229aSAlexander V. Chernikov 		 * 1) any filter change is protected by interface
2101e4b3229aSAlexander V. Chernikov 		 * write lock
2102e4b3229aSAlexander V. Chernikov 		 * 2) destroying/detaching d is protected by interface
2103e4b3229aSAlexander V. Chernikov 		 * write lock, too
2104e4b3229aSAlexander V. Chernikov 		 */
2105e4b3229aSAlexander V. Chernikov 
2106e4b3229aSAlexander V. Chernikov 		/* XXX: Do not protect counter for the sake of performance. */
2107df8bae1dSRodney W. Grimes 		++d->bd_rcount;
2108a05cf8c6SChristian S.J. Peron 		/*
2109a05cf8c6SChristian S.J. Peron 		 * NB: We dont call BPF_CHECK_DIRECTION() here since there is no
2110a05cf8c6SChristian S.J. Peron 		 * way for the caller to indiciate to us whether this packet
2111a05cf8c6SChristian S.J. Peron 		 * is inbound or outbound.  In the bpf_mtap() routines, we use
2112a05cf8c6SChristian S.J. Peron 		 * the interface pointers on the mbuf to figure it out.
2113a05cf8c6SChristian S.J. Peron 		 */
2114ae275efcSJung-uk Kim #ifdef BPF_JITTER
2115a36599ccSJung-uk Kim 		bf = bpf_jitter_enable != 0 ? d->bd_bfilter : NULL;
2116a36599ccSJung-uk Kim 		if (bf != NULL)
2117a36599ccSJung-uk Kim 			slen = (*(bf->func))(pkt, pktlen, pktlen);
2118ae275efcSJung-uk Kim 		else
2119ae275efcSJung-uk Kim #endif
212093e39f0bSChristian S.J. Peron 		slen = bpf_filter(d->bd_rfilter, pkt, pktlen, pktlen);
2121ec272d87SRobert Watson 		if (slen != 0) {
2122e4b3229aSAlexander V. Chernikov 			/*
2123e4b3229aSAlexander V. Chernikov 			 * Filter matches. Let's to acquire write lock.
2124e4b3229aSAlexander V. Chernikov 			 */
2125afa85850SAlexander V. Chernikov 			BPFD_LOCK(d);
2126e4b3229aSAlexander V. Chernikov 
212769f7644bSChristian S.J. Peron 			d->bd_fcount++;
2128253a3814SLawrence Stewart 			if (gottime < bpf_ts_quality(d->bd_tstamp))
2129253a3814SLawrence Stewart 				gottime = bpf_gettime(&bt, d->bd_tstamp, NULL);
2130ec272d87SRobert Watson #ifdef MAC
213130d239bcSRobert Watson 			if (mac_bpfdesc_check_receive(d, bp->bif_ifp) == 0)
2132ec272d87SRobert Watson #endif
21334d621040SChristian S.J. Peron 				catchpacket(d, pkt, pktlen, slen,
2134547d94bdSJung-uk Kim 				    bpf_append_bytes, &bt);
2135afa85850SAlexander V. Chernikov 			BPFD_UNLOCK(d);
2136ec272d87SRobert Watson 		}
2137df8bae1dSRodney W. Grimes 	}
2138e4b3229aSAlexander V. Chernikov 	BPFIF_RUNLOCK(bp);
2139df8bae1dSRodney W. Grimes }
2140df8bae1dSRodney W. Grimes 
2141f81a2a49SJung-uk Kim #define	BPF_CHECK_DIRECTION(d, r, i)				\
2142f81a2a49SJung-uk Kim 	    (((d)->bd_direction == BPF_D_IN && (r) != (i)) ||	\
2143f81a2a49SJung-uk Kim 	    ((d)->bd_direction == BPF_D_OUT && (r) == (i)))
2144560a54e1SJung-uk Kim 
2145df8bae1dSRodney W. Grimes /*
2146df8bae1dSRodney W. Grimes  * Incoming linkage from device drivers, when packet is in an mbuf chain.
2147e4b3229aSAlexander V. Chernikov  * Locking model is explained in bpf_tap().
2148df8bae1dSRodney W. Grimes  */
2149df8bae1dSRodney W. Grimes void
215019ba8395SChristian S.J. Peron bpf_mtap(struct bpf_if *bp, struct mbuf *m)
2151df8bae1dSRodney W. Grimes {
2152547d94bdSJung-uk Kim 	struct bintime bt;
2153df8bae1dSRodney W. Grimes 	struct bpf_d *d;
2154a36599ccSJung-uk Kim #ifdef BPF_JITTER
2155a36599ccSJung-uk Kim 	bpf_jit_filter *bf;
2156a36599ccSJung-uk Kim #endif
2157253a3814SLawrence Stewart 	u_int pktlen, slen;
2158253a3814SLawrence Stewart 	int gottime;
215991433904SDavid Malone 
21608cd892f7SJung-uk Kim 	/* Skip outgoing duplicate packets. */
21618cd892f7SJung-uk Kim 	if ((m->m_flags & M_PROMISC) != 0 && m->m_pkthdr.rcvif == NULL) {
21628cd892f7SJung-uk Kim 		m->m_flags &= ~M_PROMISC;
21638cd892f7SJung-uk Kim 		return;
21648cd892f7SJung-uk Kim 	}
21658cd892f7SJung-uk Kim 
2166f0e2422bSPoul-Henning Kamp 	pktlen = m_length(m, NULL);
2167253a3814SLawrence Stewart 	gottime = BPF_TSTAMP_NONE;
2168e4b3229aSAlexander V. Chernikov 
2169e4b3229aSAlexander V. Chernikov 	BPFIF_RLOCK(bp);
2170e4b3229aSAlexander V. Chernikov 
21714a3feeaaSRobert Watson 	LIST_FOREACH(d, &bp->bif_dlist, bd_next) {
2172f81a2a49SJung-uk Kim 		if (BPF_CHECK_DIRECTION(d, m->m_pkthdr.rcvif, bp->bif_ifp))
21738ed3828cSRobert Watson 			continue;
2174df8bae1dSRodney W. Grimes 		++d->bd_rcount;
2175ae275efcSJung-uk Kim #ifdef BPF_JITTER
2176a36599ccSJung-uk Kim 		bf = bpf_jitter_enable != 0 ? d->bd_bfilter : NULL;
2177ae275efcSJung-uk Kim 		/* XXX We cannot handle multiple mbufs. */
2178a36599ccSJung-uk Kim 		if (bf != NULL && m->m_next == NULL)
2179a36599ccSJung-uk Kim 			slen = (*(bf->func))(mtod(m, u_char *), pktlen, pktlen);
2180ae275efcSJung-uk Kim 		else
2181ae275efcSJung-uk Kim #endif
218293e39f0bSChristian S.J. Peron 		slen = bpf_filter(d->bd_rfilter, (u_char *)m, pktlen, 0);
21834ddfb531SChristian S.J. Peron 		if (slen != 0) {
2184afa85850SAlexander V. Chernikov 			BPFD_LOCK(d);
2185e4b3229aSAlexander V. Chernikov 
218669f7644bSChristian S.J. Peron 			d->bd_fcount++;
2187253a3814SLawrence Stewart 			if (gottime < bpf_ts_quality(d->bd_tstamp))
2188253a3814SLawrence Stewart 				gottime = bpf_gettime(&bt, d->bd_tstamp, m);
21890c7fb534SRobert Watson #ifdef MAC
219030d239bcSRobert Watson 			if (mac_bpfdesc_check_receive(d, bp->bif_ifp) == 0)
21910c7fb534SRobert Watson #endif
21920c7fb534SRobert Watson 				catchpacket(d, (u_char *)m, pktlen, slen,
2193547d94bdSJung-uk Kim 				    bpf_append_mbuf, &bt);
2194afa85850SAlexander V. Chernikov 			BPFD_UNLOCK(d);
21954ddfb531SChristian S.J. Peron 		}
2196df8bae1dSRodney W. Grimes 	}
2197e4b3229aSAlexander V. Chernikov 	BPFIF_RUNLOCK(bp);
2198df8bae1dSRodney W. Grimes }
2199df8bae1dSRodney W. Grimes 
2200df8bae1dSRodney W. Grimes /*
2201437ffe18SSam Leffler  * Incoming linkage from device drivers, when packet is in
2202437ffe18SSam Leffler  * an mbuf chain and to be prepended by a contiguous header.
2203437ffe18SSam Leffler  */
2204437ffe18SSam Leffler void
220519ba8395SChristian S.J. Peron bpf_mtap2(struct bpf_if *bp, void *data, u_int dlen, struct mbuf *m)
2206437ffe18SSam Leffler {
2207547d94bdSJung-uk Kim 	struct bintime bt;
2208437ffe18SSam Leffler 	struct mbuf mb;
2209437ffe18SSam Leffler 	struct bpf_d *d;
2210253a3814SLawrence Stewart 	u_int pktlen, slen;
2211253a3814SLawrence Stewart 	int gottime;
221291433904SDavid Malone 
22138cd892f7SJung-uk Kim 	/* Skip outgoing duplicate packets. */
22148cd892f7SJung-uk Kim 	if ((m->m_flags & M_PROMISC) != 0 && m->m_pkthdr.rcvif == NULL) {
22158cd892f7SJung-uk Kim 		m->m_flags &= ~M_PROMISC;
22168cd892f7SJung-uk Kim 		return;
22178cd892f7SJung-uk Kim 	}
22188cd892f7SJung-uk Kim 
2219437ffe18SSam Leffler 	pktlen = m_length(m, NULL);
2220437ffe18SSam Leffler 	/*
2221437ffe18SSam Leffler 	 * Craft on-stack mbuf suitable for passing to bpf_filter.
2222437ffe18SSam Leffler 	 * Note that we cut corners here; we only setup what's
2223437ffe18SSam Leffler 	 * absolutely needed--this mbuf should never go anywhere else.
2224437ffe18SSam Leffler 	 */
2225437ffe18SSam Leffler 	mb.m_next = m;
2226437ffe18SSam Leffler 	mb.m_data = data;
2227437ffe18SSam Leffler 	mb.m_len = dlen;
2228437ffe18SSam Leffler 	pktlen += dlen;
2229437ffe18SSam Leffler 
2230253a3814SLawrence Stewart 	gottime = BPF_TSTAMP_NONE;
2231e4b3229aSAlexander V. Chernikov 
2232e4b3229aSAlexander V. Chernikov 	BPFIF_RLOCK(bp);
2233e4b3229aSAlexander V. Chernikov 
22344a3feeaaSRobert Watson 	LIST_FOREACH(d, &bp->bif_dlist, bd_next) {
2235f81a2a49SJung-uk Kim 		if (BPF_CHECK_DIRECTION(d, m->m_pkthdr.rcvif, bp->bif_ifp))
2236437ffe18SSam Leffler 			continue;
2237437ffe18SSam Leffler 		++d->bd_rcount;
223893e39f0bSChristian S.J. Peron 		slen = bpf_filter(d->bd_rfilter, (u_char *)&mb, pktlen, 0);
22394ddfb531SChristian S.J. Peron 		if (slen != 0) {
2240afa85850SAlexander V. Chernikov 			BPFD_LOCK(d);
2241e4b3229aSAlexander V. Chernikov 
224269f7644bSChristian S.J. Peron 			d->bd_fcount++;
2243253a3814SLawrence Stewart 			if (gottime < bpf_ts_quality(d->bd_tstamp))
2244253a3814SLawrence Stewart 				gottime = bpf_gettime(&bt, d->bd_tstamp, m);
2245437ffe18SSam Leffler #ifdef MAC
224630d239bcSRobert Watson 			if (mac_bpfdesc_check_receive(d, bp->bif_ifp) == 0)
2247437ffe18SSam Leffler #endif
2248437ffe18SSam Leffler 				catchpacket(d, (u_char *)&mb, pktlen, slen,
2249547d94bdSJung-uk Kim 				    bpf_append_mbuf, &bt);
2250afa85850SAlexander V. Chernikov 			BPFD_UNLOCK(d);
22514ddfb531SChristian S.J. Peron 		}
2252437ffe18SSam Leffler 	}
2253e4b3229aSAlexander V. Chernikov 	BPFIF_RUNLOCK(bp);
2254437ffe18SSam Leffler }
2255437ffe18SSam Leffler 
2256560a54e1SJung-uk Kim #undef	BPF_CHECK_DIRECTION
2257560a54e1SJung-uk Kim 
2258253a3814SLawrence Stewart #undef	BPF_TSTAMP_NONE
2259253a3814SLawrence Stewart #undef	BPF_TSTAMP_FAST
2260253a3814SLawrence Stewart #undef	BPF_TSTAMP_NORMAL
2261253a3814SLawrence Stewart #undef	BPF_TSTAMP_EXTERN
2262253a3814SLawrence Stewart 
2263547d94bdSJung-uk Kim static int
2264547d94bdSJung-uk Kim bpf_hdrlen(struct bpf_d *d)
2265547d94bdSJung-uk Kim {
2266547d94bdSJung-uk Kim 	int hdrlen;
2267547d94bdSJung-uk Kim 
2268547d94bdSJung-uk Kim 	hdrlen = d->bd_bif->bif_hdrlen;
2269547d94bdSJung-uk Kim #ifndef BURN_BRIDGES
2270547d94bdSJung-uk Kim 	if (d->bd_tstamp == BPF_T_NONE ||
2271547d94bdSJung-uk Kim 	    BPF_T_FORMAT(d->bd_tstamp) == BPF_T_MICROTIME)
2272547d94bdSJung-uk Kim #ifdef COMPAT_FREEBSD32
2273547d94bdSJung-uk Kim 		if (d->bd_compat32)
2274547d94bdSJung-uk Kim 			hdrlen += SIZEOF_BPF_HDR(struct bpf_hdr32);
2275547d94bdSJung-uk Kim 		else
2276547d94bdSJung-uk Kim #endif
2277547d94bdSJung-uk Kim 			hdrlen += SIZEOF_BPF_HDR(struct bpf_hdr);
2278547d94bdSJung-uk Kim 	else
2279547d94bdSJung-uk Kim #endif
2280547d94bdSJung-uk Kim 		hdrlen += SIZEOF_BPF_HDR(struct bpf_xhdr);
2281547d94bdSJung-uk Kim #ifdef COMPAT_FREEBSD32
2282547d94bdSJung-uk Kim 	if (d->bd_compat32)
2283547d94bdSJung-uk Kim 		hdrlen = BPF_WORDALIGN32(hdrlen);
2284547d94bdSJung-uk Kim 	else
2285547d94bdSJung-uk Kim #endif
2286547d94bdSJung-uk Kim 		hdrlen = BPF_WORDALIGN(hdrlen);
2287547d94bdSJung-uk Kim 
2288547d94bdSJung-uk Kim 	return (hdrlen - d->bd_bif->bif_hdrlen);
2289547d94bdSJung-uk Kim }
2290547d94bdSJung-uk Kim 
2291547d94bdSJung-uk Kim static void
2292547d94bdSJung-uk Kim bpf_bintime2ts(struct bintime *bt, struct bpf_ts *ts, int tstype)
2293547d94bdSJung-uk Kim {
2294253a3814SLawrence Stewart 	struct bintime bt2;
2295547d94bdSJung-uk Kim 	struct timeval tsm;
2296547d94bdSJung-uk Kim 	struct timespec tsn;
2297547d94bdSJung-uk Kim 
2298253a3814SLawrence Stewart 	if ((tstype & BPF_T_MONOTONIC) == 0) {
2299253a3814SLawrence Stewart 		bt2 = *bt;
2300253a3814SLawrence Stewart 		bintime_add(&bt2, &boottimebin);
2301253a3814SLawrence Stewart 		bt = &bt2;
2302253a3814SLawrence Stewart 	}
2303547d94bdSJung-uk Kim 	switch (BPF_T_FORMAT(tstype)) {
2304547d94bdSJung-uk Kim 	case BPF_T_MICROTIME:
2305547d94bdSJung-uk Kim 		bintime2timeval(bt, &tsm);
2306547d94bdSJung-uk Kim 		ts->bt_sec = tsm.tv_sec;
2307547d94bdSJung-uk Kim 		ts->bt_frac = tsm.tv_usec;
2308547d94bdSJung-uk Kim 		break;
2309547d94bdSJung-uk Kim 	case BPF_T_NANOTIME:
2310547d94bdSJung-uk Kim 		bintime2timespec(bt, &tsn);
2311547d94bdSJung-uk Kim 		ts->bt_sec = tsn.tv_sec;
2312547d94bdSJung-uk Kim 		ts->bt_frac = tsn.tv_nsec;
2313547d94bdSJung-uk Kim 		break;
2314547d94bdSJung-uk Kim 	case BPF_T_BINTIME:
2315547d94bdSJung-uk Kim 		ts->bt_sec = bt->sec;
2316547d94bdSJung-uk Kim 		ts->bt_frac = bt->frac;
2317547d94bdSJung-uk Kim 		break;
2318547d94bdSJung-uk Kim 	}
2319547d94bdSJung-uk Kim }
2320547d94bdSJung-uk Kim 
2321437ffe18SSam Leffler /*
2322df8bae1dSRodney W. Grimes  * Move the packet data from interface memory (pkt) into the
23239e610888SDag-Erling Smørgrav  * store buffer.  "cpfn" is the routine called to do the actual data
2324df8bae1dSRodney W. Grimes  * transfer.  bcopy is passed in to copy contiguous chunks, while
23254d621040SChristian S.J. Peron  * bpf_append_mbuf is passed in to copy mbuf chains.  In the latter case,
2326df8bae1dSRodney W. Grimes  * pkt is really an mbuf.
2327df8bae1dSRodney W. Grimes  */
2328df8bae1dSRodney W. Grimes static void
232919ba8395SChristian S.J. Peron catchpacket(struct bpf_d *d, u_char *pkt, u_int pktlen, u_int snaplen,
23304d621040SChristian S.J. Peron     void (*cpfn)(struct bpf_d *, caddr_t, u_int, void *, u_int),
2331547d94bdSJung-uk Kim     struct bintime *bt)
2332df8bae1dSRodney W. Grimes {
2333547d94bdSJung-uk Kim 	struct bpf_xhdr hdr;
2334547d94bdSJung-uk Kim #ifndef BURN_BRIDGES
2335547d94bdSJung-uk Kim 	struct bpf_hdr hdr_old;
2336fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32
2337547d94bdSJung-uk Kim 	struct bpf_hdr32 hdr32_old;
2338fc0a61a4SKonstantin Belousov #endif
2339547d94bdSJung-uk Kim #endif
2340547d94bdSJung-uk Kim 	int caplen, curlen, hdrlen, totlen;
23417819da79SJohn-Mark Gurney 	int do_wakeup = 0;
2342547d94bdSJung-uk Kim 	int do_timestamp;
2343547d94bdSJung-uk Kim 	int tstype;
23449e610888SDag-Erling Smørgrav 
2345afa85850SAlexander V. Chernikov 	BPFD_LOCK_ASSERT(d);
23464d621040SChristian S.J. Peron 
23474d621040SChristian S.J. Peron 	/*
23484d621040SChristian S.J. Peron 	 * Detect whether user space has released a buffer back to us, and if
23494d621040SChristian S.J. Peron 	 * so, move it from being a hold buffer to a free buffer.  This may
23504d621040SChristian S.J. Peron 	 * not be the best place to do it (for example, we might only want to
23514d621040SChristian S.J. Peron 	 * run this check if we need the space), but for now it's a reliable
23524d621040SChristian S.J. Peron 	 * spot to do it.
23534d621040SChristian S.J. Peron 	 */
2354fa0c2b34SRobert Watson 	if (d->bd_fbuf == NULL && bpf_canfreebuf(d)) {
23553b3b91e7SGuy Helmer 		while (d->bd_hbuf_in_use)
23563b3b91e7SGuy Helmer 			mtx_sleep(&d->bd_hbuf_in_use, &d->bd_lock,
23573b3b91e7SGuy Helmer 			    PRINET, "bd_hbuf", 0);
23584d621040SChristian S.J. Peron 		d->bd_fbuf = d->bd_hbuf;
23594d621040SChristian S.J. Peron 		d->bd_hbuf = NULL;
23604d621040SChristian S.J. Peron 		d->bd_hlen = 0;
236129f612ecSChristian S.J. Peron 		bpf_buf_reclaimed(d);
23624d621040SChristian S.J. Peron 	}
23634d621040SChristian S.J. Peron 
2364df8bae1dSRodney W. Grimes 	/*
2365df8bae1dSRodney W. Grimes 	 * Figure out how many bytes to move.  If the packet is
2366df8bae1dSRodney W. Grimes 	 * greater or equal to the snapshot length, transfer that
2367df8bae1dSRodney W. Grimes 	 * much.  Otherwise, transfer the whole packet (unless
2368df8bae1dSRodney W. Grimes 	 * we hit the buffer size limit).
2369df8bae1dSRodney W. Grimes 	 */
2370547d94bdSJung-uk Kim 	hdrlen = bpf_hdrlen(d);
2371df8bae1dSRodney W. Grimes 	totlen = hdrlen + min(snaplen, pktlen);
2372df8bae1dSRodney W. Grimes 	if (totlen > d->bd_bufsize)
2373df8bae1dSRodney W. Grimes 		totlen = d->bd_bufsize;
2374df8bae1dSRodney W. Grimes 
2375df8bae1dSRodney W. Grimes 	/*
2376df8bae1dSRodney W. Grimes 	 * Round up the end of the previous packet to the next longword.
2377a7a91e65SRobert Watson 	 *
2378a7a91e65SRobert Watson 	 * Drop the packet if there's no room and no hope of room
2379a7a91e65SRobert Watson 	 * If the packet would overflow the storage buffer or the storage
2380a7a91e65SRobert Watson 	 * buffer is considered immutable by the buffer model, try to rotate
2381a7a91e65SRobert Watson 	 * the buffer and wakeup pending processes.
2382df8bae1dSRodney W. Grimes 	 */
2383fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32
2384fc0a61a4SKonstantin Belousov 	if (d->bd_compat32)
2385fc0a61a4SKonstantin Belousov 		curlen = BPF_WORDALIGN32(d->bd_slen);
2386fc0a61a4SKonstantin Belousov 	else
2387fc0a61a4SKonstantin Belousov #endif
2388df8bae1dSRodney W. Grimes 		curlen = BPF_WORDALIGN(d->bd_slen);
2389a7a91e65SRobert Watson 	if (curlen + totlen > d->bd_bufsize || !bpf_canwritebuf(d)) {
2390572bde2aSRobert Watson 		if (d->bd_fbuf == NULL) {
2391df8bae1dSRodney W. Grimes 			/*
2392a7a91e65SRobert Watson 			 * There's no room in the store buffer, and no
2393a7a91e65SRobert Watson 			 * prospect of room, so drop the packet.  Notify the
2394a7a91e65SRobert Watson 			 * buffer model.
2395df8bae1dSRodney W. Grimes 			 */
2396a7a91e65SRobert Watson 			bpf_buffull(d);
2397df8bae1dSRodney W. Grimes 			++d->bd_dcount;
2398df8bae1dSRodney W. Grimes 			return;
2399df8bae1dSRodney W. Grimes 		}
24003b3b91e7SGuy Helmer 		while (d->bd_hbuf_in_use)
24013b3b91e7SGuy Helmer 			mtx_sleep(&d->bd_hbuf_in_use, &d->bd_lock,
24023b3b91e7SGuy Helmer 			    PRINET, "bd_hbuf", 0);
2403df8bae1dSRodney W. Grimes 		ROTATE_BUFFERS(d);
24047819da79SJohn-Mark Gurney 		do_wakeup = 1;
2405df8bae1dSRodney W. Grimes 		curlen = 0;
2406a7a91e65SRobert Watson 	} else if (d->bd_immediate || d->bd_state == BPF_TIMED_OUT)
2407df8bae1dSRodney W. Grimes 		/*
24084d621040SChristian S.J. Peron 		 * Immediate mode is set, or the read timeout has already
24094d621040SChristian S.J. Peron 		 * expired during a select call.  A packet arrived, so the
24104d621040SChristian S.J. Peron 		 * reader should be woken up.
2411df8bae1dSRodney W. Grimes 		 */
24127819da79SJohn-Mark Gurney 		do_wakeup = 1;
2413547d94bdSJung-uk Kim 	caplen = totlen - hdrlen;
2414547d94bdSJung-uk Kim 	tstype = d->bd_tstamp;
2415547d94bdSJung-uk Kim 	do_timestamp = tstype != BPF_T_NONE;
2416547d94bdSJung-uk Kim #ifndef BURN_BRIDGES
2417547d94bdSJung-uk Kim 	if (tstype == BPF_T_NONE || BPF_T_FORMAT(tstype) == BPF_T_MICROTIME) {
2418547d94bdSJung-uk Kim 		struct bpf_ts ts;
2419547d94bdSJung-uk Kim 		if (do_timestamp)
2420547d94bdSJung-uk Kim 			bpf_bintime2ts(bt, &ts, tstype);
2421fc0a61a4SKonstantin Belousov #ifdef COMPAT_FREEBSD32
2422fc0a61a4SKonstantin Belousov 		if (d->bd_compat32) {
2423547d94bdSJung-uk Kim 			bzero(&hdr32_old, sizeof(hdr32_old));
2424547d94bdSJung-uk Kim 			if (do_timestamp) {
2425547d94bdSJung-uk Kim 				hdr32_old.bh_tstamp.tv_sec = ts.bt_sec;
2426547d94bdSJung-uk Kim 				hdr32_old.bh_tstamp.tv_usec = ts.bt_frac;
2427547d94bdSJung-uk Kim 			}
2428547d94bdSJung-uk Kim 			hdr32_old.bh_datalen = pktlen;
2429547d94bdSJung-uk Kim 			hdr32_old.bh_hdrlen = hdrlen;
2430547d94bdSJung-uk Kim 			hdr32_old.bh_caplen = caplen;
2431547d94bdSJung-uk Kim 			bpf_append_bytes(d, d->bd_sbuf, curlen, &hdr32_old,
2432547d94bdSJung-uk Kim 			    sizeof(hdr32_old));
2433547d94bdSJung-uk Kim 			goto copy;
2434547d94bdSJung-uk Kim 		}
2435547d94bdSJung-uk Kim #endif
2436547d94bdSJung-uk Kim 		bzero(&hdr_old, sizeof(hdr_old));
2437547d94bdSJung-uk Kim 		if (do_timestamp) {
2438547d94bdSJung-uk Kim 			hdr_old.bh_tstamp.tv_sec = ts.bt_sec;
2439547d94bdSJung-uk Kim 			hdr_old.bh_tstamp.tv_usec = ts.bt_frac;
2440547d94bdSJung-uk Kim 		}
2441547d94bdSJung-uk Kim 		hdr_old.bh_datalen = pktlen;
2442547d94bdSJung-uk Kim 		hdr_old.bh_hdrlen = hdrlen;
2443547d94bdSJung-uk Kim 		hdr_old.bh_caplen = caplen;
2444547d94bdSJung-uk Kim 		bpf_append_bytes(d, d->bd_sbuf, curlen, &hdr_old,
2445547d94bdSJung-uk Kim 		    sizeof(hdr_old));
2446fc0a61a4SKonstantin Belousov 		goto copy;
2447fc0a61a4SKonstantin Belousov 	}
2448fc0a61a4SKonstantin Belousov #endif
2449df8bae1dSRodney W. Grimes 
2450df8bae1dSRodney W. Grimes 	/*
24514d621040SChristian S.J. Peron 	 * Append the bpf header.  Note we append the actual header size, but
24524d621040SChristian S.J. Peron 	 * move forward the length of the header plus padding.
2453df8bae1dSRodney W. Grimes 	 */
24544d621040SChristian S.J. Peron 	bzero(&hdr, sizeof(hdr));
2455547d94bdSJung-uk Kim 	if (do_timestamp)
2456547d94bdSJung-uk Kim 		bpf_bintime2ts(bt, &hdr.bh_tstamp, tstype);
24574d621040SChristian S.J. Peron 	hdr.bh_datalen = pktlen;
24584d621040SChristian S.J. Peron 	hdr.bh_hdrlen = hdrlen;
2459547d94bdSJung-uk Kim 	hdr.bh_caplen = caplen;
24604d621040SChristian S.J. Peron 	bpf_append_bytes(d, d->bd_sbuf, curlen, &hdr, sizeof(hdr));
24614d621040SChristian S.J. Peron 
2462df8bae1dSRodney W. Grimes 	/*
2463df8bae1dSRodney W. Grimes 	 * Copy the packet data into the store buffer and update its length.
2464df8bae1dSRodney W. Grimes 	 */
2465547d94bdSJung-uk Kim #ifndef BURN_BRIDGES
2466fc0a61a4SKonstantin Belousov copy:
2467fc0a61a4SKonstantin Belousov #endif
2468547d94bdSJung-uk Kim 	(*cpfn)(d, d->bd_sbuf, curlen + hdrlen, pkt, caplen);
2469df8bae1dSRodney W. Grimes 	d->bd_slen = curlen + totlen;
24707819da79SJohn-Mark Gurney 
24717819da79SJohn-Mark Gurney 	if (do_wakeup)
24727819da79SJohn-Mark Gurney 		bpf_wakeup(d);
2473df8bae1dSRodney W. Grimes }
2474df8bae1dSRodney W. Grimes 
2475df8bae1dSRodney W. Grimes /*
2476df8bae1dSRodney W. Grimes  * Free buffers currently in use by a descriptor.
2477df8bae1dSRodney W. Grimes  * Called on close.
2478df8bae1dSRodney W. Grimes  */
2479df8bae1dSRodney W. Grimes static void
248019ba8395SChristian S.J. Peron bpf_freed(struct bpf_d *d)
2481df8bae1dSRodney W. Grimes {
24824d621040SChristian S.J. Peron 
2483df8bae1dSRodney W. Grimes 	/*
2484df8bae1dSRodney W. Grimes 	 * We don't need to lock out interrupts since this descriptor has
2485df8bae1dSRodney W. Grimes 	 * been detached from its interface and it yet hasn't been marked
2486df8bae1dSRodney W. Grimes 	 * free.
2487df8bae1dSRodney W. Grimes 	 */
24884d621040SChristian S.J. Peron 	bpf_free(d);
248970485847SJung-uk Kim 	if (d->bd_rfilter != NULL) {
249093e39f0bSChristian S.J. Peron 		free((caddr_t)d->bd_rfilter, M_BPF);
2491ae275efcSJung-uk Kim #ifdef BPF_JITTER
249270485847SJung-uk Kim 		if (d->bd_bfilter != NULL)
2493ae275efcSJung-uk Kim 			bpf_destroy_jit_filter(d->bd_bfilter);
2494ae275efcSJung-uk Kim #endif
2495ae275efcSJung-uk Kim 	}
249670485847SJung-uk Kim 	if (d->bd_wfilter != NULL)
249793e39f0bSChristian S.J. Peron 		free((caddr_t)d->bd_wfilter, M_BPF);
2498afa85850SAlexander V. Chernikov 	mtx_destroy(&d->bd_lock);
2499df8bae1dSRodney W. Grimes }
2500df8bae1dSRodney W. Grimes 
2501df8bae1dSRodney W. Grimes /*
250224a229f4SSam Leffler  * Attach an interface to bpf.  dlt is the link layer type; hdrlen is the
250324a229f4SSam Leffler  * fixed size of the link header (variable length headers not yet supported).
2504df8bae1dSRodney W. Grimes  */
2505df8bae1dSRodney W. Grimes void
250619ba8395SChristian S.J. Peron bpfattach(struct ifnet *ifp, u_int dlt, u_int hdrlen)
2507df8bae1dSRodney W. Grimes {
250824a229f4SSam Leffler 
250924a229f4SSam Leffler 	bpfattach2(ifp, dlt, hdrlen, &ifp->if_bpf);
251024a229f4SSam Leffler }
251124a229f4SSam Leffler 
251224a229f4SSam Leffler /*
251324a229f4SSam Leffler  * Attach an interface to bpf.  ifp is a pointer to the structure
251424a229f4SSam Leffler  * defining the interface to be attached, dlt is the link layer type,
251524a229f4SSam Leffler  * and hdrlen is the fixed size of the link header (variable length
251624a229f4SSam Leffler  * headers are not yet supporrted).
251724a229f4SSam Leffler  */
251824a229f4SSam Leffler void
251919ba8395SChristian S.J. Peron bpfattach2(struct ifnet *ifp, u_int dlt, u_int hdrlen, struct bpf_if **driverp)
252024a229f4SSam Leffler {
2521df8bae1dSRodney W. Grimes 	struct bpf_if *bp;
252219ba8395SChristian S.J. Peron 
252319ba8395SChristian S.J. Peron 	bp = malloc(sizeof(*bp), M_BPF, M_NOWAIT | M_ZERO);
2524572bde2aSRobert Watson 	if (bp == NULL)
2525df8bae1dSRodney W. Grimes 		panic("bpfattach");
2526df8bae1dSRodney W. Grimes 
25274a3feeaaSRobert Watson 	LIST_INIT(&bp->bif_dlist);
252851ec1eb7SAlexander V. Chernikov 	LIST_INIT(&bp->bif_wlist);
2529df8bae1dSRodney W. Grimes 	bp->bif_ifp = ifp;
2530df8bae1dSRodney W. Grimes 	bp->bif_dlt = dlt;
2531e4b3229aSAlexander V. Chernikov 	rw_init(&bp->bif_lock, "bpf interface lock");
253216d878ccSChristian S.J. Peron 	KASSERT(*driverp == NULL, ("bpfattach2: driverp already initialized"));
253316d878ccSChristian S.J. Peron 	*driverp = bp;
2534df8bae1dSRodney W. Grimes 
2535e4b3229aSAlexander V. Chernikov 	BPF_LOCK();
25364a3feeaaSRobert Watson 	LIST_INSERT_HEAD(&bpf_iflist, bp, bif_next);
2537e4b3229aSAlexander V. Chernikov 	BPF_UNLOCK();
2538df8bae1dSRodney W. Grimes 
2539547d94bdSJung-uk Kim 	bp->bif_hdrlen = hdrlen;
2540df8bae1dSRodney W. Grimes 
25412eeab939SGarrett Wollman 	if (bootverbose)
254224a229f4SSam Leffler 		if_printf(ifp, "bpf attached\n");
2543df8bae1dSRodney W. Grimes }
254453ac6efbSJulian Elischer 
2545de5d9935SRobert Watson /*
2546de5d9935SRobert Watson  * Detach bpf from an interface. This involves detaching each descriptor
25476c74ff0eSAlexander V. Chernikov  * associated with the interface. Notify each descriptor as it's detached
25486c74ff0eSAlexander V. Chernikov  * so that any sleepers wake up and get ENXIO.
2549de5d9935SRobert Watson  */
2550de5d9935SRobert Watson void
255119ba8395SChristian S.J. Peron bpfdetach(struct ifnet *ifp)
2552de5d9935SRobert Watson {
2553f079a0faSAlexander V. Chernikov 	struct bpf_if	*bp, *bp_temp;
2554de5d9935SRobert Watson 	struct bpf_d	*d;
25559a7e6bacSLawrence Stewart 	int ndetached;
2556de5d9935SRobert Watson 
25579a7e6bacSLawrence Stewart 	ndetached = 0;
25589a7e6bacSLawrence Stewart 
2559afa85850SAlexander V. Chernikov 	BPF_LOCK();
25609a7e6bacSLawrence Stewart 	/* Find all bpf_if struct's which reference ifp and detach them. */
2561f079a0faSAlexander V. Chernikov 	LIST_FOREACH_SAFE(bp, &bpf_iflist, bif_next, bp_temp) {
2562f079a0faSAlexander V. Chernikov 		if (ifp != bp->bif_ifp)
2563f079a0faSAlexander V. Chernikov 			continue;
2564de5d9935SRobert Watson 
2565f079a0faSAlexander V. Chernikov 		LIST_REMOVE(bp, bif_next);
2566f079a0faSAlexander V. Chernikov 		/* Add to to-be-freed list */
2567f079a0faSAlexander V. Chernikov 		LIST_INSERT_HEAD(&bpf_freelist, bp, bif_next);
2568f079a0faSAlexander V. Chernikov 
25699a7e6bacSLawrence Stewart 		ndetached++;
2570f079a0faSAlexander V. Chernikov 		/*
2571f079a0faSAlexander V. Chernikov 		 * Delay freeing bp till interface is detached
2572f079a0faSAlexander V. Chernikov 		 * and all routes through this interface are removed.
2573f079a0faSAlexander V. Chernikov 		 * Mark bp as detached to restrict new consumers.
2574f079a0faSAlexander V. Chernikov 		 */
2575f079a0faSAlexander V. Chernikov 		BPFIF_WLOCK(bp);
2576f079a0faSAlexander V. Chernikov 		bp->flags |= BPFIF_FLAG_DYING;
2577f079a0faSAlexander V. Chernikov 		BPFIF_WUNLOCK(bp);
2578f079a0faSAlexander V. Chernikov 
2579f079a0faSAlexander V. Chernikov 		CTR4(KTR_NET, "%s: sheduling free for encap %d (%p) for if %p",
2580f079a0faSAlexander V. Chernikov 		    __func__, bp->bif_dlt, bp, ifp);
2581f079a0faSAlexander V. Chernikov 
2582f079a0faSAlexander V. Chernikov 		/* Free common descriptors */
25834a3feeaaSRobert Watson 		while ((d = LIST_FIRST(&bp->bif_dlist)) != NULL) {
2584afa85850SAlexander V. Chernikov 			bpf_detachd_locked(d);
2585afa85850SAlexander V. Chernikov 			BPFD_LOCK(d);
2586e7bb21b3SJonathan Lemon 			bpf_wakeup(d);
2587afa85850SAlexander V. Chernikov 			BPFD_UNLOCK(d);
2588e7bb21b3SJonathan Lemon 		}
2589f079a0faSAlexander V. Chernikov 
25906c74ff0eSAlexander V. Chernikov 		/* Free writer-only descriptors */
25916c74ff0eSAlexander V. Chernikov 		while ((d = LIST_FIRST(&bp->bif_wlist)) != NULL) {
2592afa85850SAlexander V. Chernikov 			bpf_detachd_locked(d);
2593afa85850SAlexander V. Chernikov 			BPFD_LOCK(d);
25946c74ff0eSAlexander V. Chernikov 			bpf_wakeup(d);
2595afa85850SAlexander V. Chernikov 			BPFD_UNLOCK(d);
25966c74ff0eSAlexander V. Chernikov 		}
25978eab61f3SSam Leffler 	}
2598afa85850SAlexander V. Chernikov 	BPF_UNLOCK();
25999a7e6bacSLawrence Stewart 
26009a7e6bacSLawrence Stewart #ifdef INVARIANTS
26019a7e6bacSLawrence Stewart 	if (ndetached == 0)
26029a7e6bacSLawrence Stewart 		printf("bpfdetach: %s was not attached\n", ifp->if_xname);
26039a7e6bacSLawrence Stewart #endif
26049a7e6bacSLawrence Stewart }
2605de5d9935SRobert Watson 
26068eab61f3SSam Leffler /*
2607784292f8SAlexander V. Chernikov  * Interface departure handler.
26084fe83b81SAlexander V. Chernikov  * Note departure event does not guarantee interface is going down.
2609f079a0faSAlexander V. Chernikov  * Interface renaming is currently done via departure/arrival event set.
2610f079a0faSAlexander V. Chernikov  *
2611f079a0faSAlexander V. Chernikov  * Departure handled is called after all routes pointing to
2612f079a0faSAlexander V. Chernikov  * given interface are removed and interface is in down state
2613f079a0faSAlexander V. Chernikov  * restricting any packets to be sent/received. We assume it is now safe
2614f079a0faSAlexander V. Chernikov  * to free data allocated by BPF.
2615afa85850SAlexander V. Chernikov  */
2616afa85850SAlexander V. Chernikov static void
2617afa85850SAlexander V. Chernikov bpf_ifdetach(void *arg __unused, struct ifnet *ifp)
2618afa85850SAlexander V. Chernikov {
2619f079a0faSAlexander V. Chernikov 	struct bpf_if *bp, *bp_temp;
2620f079a0faSAlexander V. Chernikov 	int nmatched = 0;
2621afa85850SAlexander V. Chernikov 
2622784292f8SAlexander V. Chernikov 	BPF_LOCK();
2623f079a0faSAlexander V. Chernikov 	/*
2624f079a0faSAlexander V. Chernikov 	 * Find matching entries in free list.
2625f079a0faSAlexander V. Chernikov 	 * Nothing should be found if bpfdetach() was not called.
2626f079a0faSAlexander V. Chernikov 	 */
2627f079a0faSAlexander V. Chernikov 	LIST_FOREACH_SAFE(bp, &bpf_freelist, bif_next, bp_temp) {
2628f079a0faSAlexander V. Chernikov 		if (ifp != bp->bif_ifp)
2629f079a0faSAlexander V. Chernikov 			continue;
2630784292f8SAlexander V. Chernikov 
2631f079a0faSAlexander V. Chernikov 		CTR3(KTR_NET, "%s: freeing BPF instance %p for interface %p",
2632afa85850SAlexander V. Chernikov 		    __func__, bp, ifp);
2633afa85850SAlexander V. Chernikov 
2634f079a0faSAlexander V. Chernikov 		LIST_REMOVE(bp, bif_next);
2635784292f8SAlexander V. Chernikov 
2636afa85850SAlexander V. Chernikov 		rw_destroy(&bp->bif_lock);
2637afa85850SAlexander V. Chernikov 		free(bp, M_BPF);
2638f079a0faSAlexander V. Chernikov 
2639f079a0faSAlexander V. Chernikov 		nmatched++;
2640f079a0faSAlexander V. Chernikov 	}
2641f079a0faSAlexander V. Chernikov 	BPF_UNLOCK();
2642f079a0faSAlexander V. Chernikov 
2643f079a0faSAlexander V. Chernikov 	/*
2644f079a0faSAlexander V. Chernikov 	 * Note that we cannot zero other pointers to
2645f079a0faSAlexander V. Chernikov 	 * custom DLTs possibly used by given interface.
2646f079a0faSAlexander V. Chernikov 	 */
2647f079a0faSAlexander V. Chernikov 	if (nmatched != 0)
2648f079a0faSAlexander V. Chernikov 		ifp->if_bpf = NULL;
2649afa85850SAlexander V. Chernikov }
2650afa85850SAlexander V. Chernikov 
2651afa85850SAlexander V. Chernikov /*
26528eab61f3SSam Leffler  * Get a list of available data link type of the interface.
26538eab61f3SSam Leffler  */
26548eab61f3SSam Leffler static int
265519ba8395SChristian S.J. Peron bpf_getdltlist(struct bpf_d *d, struct bpf_dltlist *bfl)
26568eab61f3SSam Leffler {
26578eab61f3SSam Leffler 	int n, error;
26588eab61f3SSam Leffler 	struct ifnet *ifp;
26598eab61f3SSam Leffler 	struct bpf_if *bp;
26608eab61f3SSam Leffler 
266197aacec6SAlexander V. Chernikov 	BPF_LOCK_ASSERT();
266297aacec6SAlexander V. Chernikov 
26638eab61f3SSam Leffler 	ifp = d->bd_bif->bif_ifp;
26648eab61f3SSam Leffler 	n = 0;
26658eab61f3SSam Leffler 	error = 0;
26664a3feeaaSRobert Watson 	LIST_FOREACH(bp, &bpf_iflist, bif_next) {
26678eab61f3SSam Leffler 		if (bp->bif_ifp != ifp)
26688eab61f3SSam Leffler 			continue;
26698eab61f3SSam Leffler 		if (bfl->bfl_list != NULL) {
267097aacec6SAlexander V. Chernikov 			if (n >= bfl->bfl_len)
26718eab61f3SSam Leffler 				return (ENOMEM);
26728eab61f3SSam Leffler 			error = copyout(&bp->bif_dlt,
26738eab61f3SSam Leffler 			    bfl->bfl_list + n, sizeof(u_int));
26748eab61f3SSam Leffler 		}
26758eab61f3SSam Leffler 		n++;
26768eab61f3SSam Leffler 	}
26778eab61f3SSam Leffler 	bfl->bfl_len = n;
26788eab61f3SSam Leffler 	return (error);
26798eab61f3SSam Leffler }
26808eab61f3SSam Leffler 
26818eab61f3SSam Leffler /*
26828eab61f3SSam Leffler  * Set the data link type of a BPF instance.
26838eab61f3SSam Leffler  */
26848eab61f3SSam Leffler static int
268519ba8395SChristian S.J. Peron bpf_setdlt(struct bpf_d *d, u_int dlt)
26868eab61f3SSam Leffler {
26878eab61f3SSam Leffler 	int error, opromisc;
26888eab61f3SSam Leffler 	struct ifnet *ifp;
26898eab61f3SSam Leffler 	struct bpf_if *bp;
26908eab61f3SSam Leffler 
26916c74ff0eSAlexander V. Chernikov 	BPF_LOCK_ASSERT();
26926c74ff0eSAlexander V. Chernikov 
26938eab61f3SSam Leffler 	if (d->bd_bif->bif_dlt == dlt)
26948eab61f3SSam Leffler 		return (0);
26958eab61f3SSam Leffler 	ifp = d->bd_bif->bif_ifp;
26966c74ff0eSAlexander V. Chernikov 
26974a3feeaaSRobert Watson 	LIST_FOREACH(bp, &bpf_iflist, bif_next) {
26988eab61f3SSam Leffler 		if (bp->bif_ifp == ifp && bp->bif_dlt == dlt)
26998eab61f3SSam Leffler 			break;
27008eab61f3SSam Leffler 	}
27016c74ff0eSAlexander V. Chernikov 
27028eab61f3SSam Leffler 	if (bp != NULL) {
27038eab61f3SSam Leffler 		opromisc = d->bd_promisc;
27048eab61f3SSam Leffler 		bpf_attachd(d, bp);
2705afa85850SAlexander V. Chernikov 		BPFD_LOCK(d);
27068eab61f3SSam Leffler 		reset_d(d);
2707afa85850SAlexander V. Chernikov 		BPFD_UNLOCK(d);
27088eab61f3SSam Leffler 		if (opromisc) {
27098eab61f3SSam Leffler 			error = ifpromisc(bp->bif_ifp, 1);
27108eab61f3SSam Leffler 			if (error)
27118eab61f3SSam Leffler 				if_printf(bp->bif_ifp,
27128eab61f3SSam Leffler 					"bpf_setdlt: ifpromisc failed (%d)\n",
27138eab61f3SSam Leffler 					error);
27148eab61f3SSam Leffler 			else
27158eab61f3SSam Leffler 				d->bd_promisc = 1;
27168eab61f3SSam Leffler 		}
27178eab61f3SSam Leffler 	}
27188eab61f3SSam Leffler 	return (bp == NULL ? EINVAL : 0);
2719de5d9935SRobert Watson }
2720de5d9935SRobert Watson 
27213f54a085SPoul-Henning Kamp static void
272219ba8395SChristian S.J. Peron bpf_drvinit(void *unused)
272353ac6efbSJulian Elischer {
2724136600feSEd Schouten 	struct cdev *dev;
272553ac6efbSJulian Elischer 
27266008862bSJohn Baldwin 	mtx_init(&bpf_mtx, "bpf global lock", NULL, MTX_DEF);
27274a3feeaaSRobert Watson 	LIST_INIT(&bpf_iflist);
2728f079a0faSAlexander V. Chernikov 	LIST_INIT(&bpf_freelist);
2729136600feSEd Schouten 
2730136600feSEd Schouten 	dev = make_dev(&bpf_cdevsw, 0, UID_ROOT, GID_WHEEL, 0600, "bpf");
2731136600feSEd Schouten 	/* For compatibility */
2732136600feSEd Schouten 	make_dev_alias(dev, "bpf0");
2733afa85850SAlexander V. Chernikov 
2734afa85850SAlexander V. Chernikov 	/* Register interface departure handler */
2735afa85850SAlexander V. Chernikov 	bpf_ifdetach_cookie = EVENTHANDLER_REGISTER(
2736afa85850SAlexander V. Chernikov 		    ifnet_departure_event, bpf_ifdetach, NULL,
2737afa85850SAlexander V. Chernikov 		    EVENTHANDLER_PRI_ANY);
27387198bf47SJulian Elischer }
273953ac6efbSJulian Elischer 
27400e37f3e1SChristian S.J. Peron /*
27410e37f3e1SChristian S.J. Peron  * Zero out the various packet counters associated with all of the bpf
27420e37f3e1SChristian S.J. Peron  * descriptors.  At some point, we will probably want to get a bit more
27430e37f3e1SChristian S.J. Peron  * granular and allow the user to specify descriptors to be zeroed.
27440e37f3e1SChristian S.J. Peron  */
27450e37f3e1SChristian S.J. Peron static void
27460e37f3e1SChristian S.J. Peron bpf_zero_counters(void)
27470e37f3e1SChristian S.J. Peron {
27480e37f3e1SChristian S.J. Peron 	struct bpf_if *bp;
27490e37f3e1SChristian S.J. Peron 	struct bpf_d *bd;
27500e37f3e1SChristian S.J. Peron 
2751e4b3229aSAlexander V. Chernikov 	BPF_LOCK();
27520e37f3e1SChristian S.J. Peron 	LIST_FOREACH(bp, &bpf_iflist, bif_next) {
2753e4b3229aSAlexander V. Chernikov 		BPFIF_RLOCK(bp);
27540e37f3e1SChristian S.J. Peron 		LIST_FOREACH(bd, &bp->bif_dlist, bd_next) {
2755afa85850SAlexander V. Chernikov 			BPFD_LOCK(bd);
27560e37f3e1SChristian S.J. Peron 			bd->bd_rcount = 0;
27570e37f3e1SChristian S.J. Peron 			bd->bd_dcount = 0;
27580e37f3e1SChristian S.J. Peron 			bd->bd_fcount = 0;
27590e37f3e1SChristian S.J. Peron 			bd->bd_wcount = 0;
27600e37f3e1SChristian S.J. Peron 			bd->bd_wfcount = 0;
27610e37f3e1SChristian S.J. Peron 			bd->bd_zcopy = 0;
2762afa85850SAlexander V. Chernikov 			BPFD_UNLOCK(bd);
27630e37f3e1SChristian S.J. Peron 		}
2764e4b3229aSAlexander V. Chernikov 		BPFIF_RUNLOCK(bp);
27650e37f3e1SChristian S.J. Peron 	}
2766e4b3229aSAlexander V. Chernikov 	BPF_UNLOCK();
27670e37f3e1SChristian S.J. Peron }
27680e37f3e1SChristian S.J. Peron 
27696c74ff0eSAlexander V. Chernikov /*
27706c74ff0eSAlexander V. Chernikov  * Fill filter statistics
27716c74ff0eSAlexander V. Chernikov  */
277269f7644bSChristian S.J. Peron static void
277369f7644bSChristian S.J. Peron bpfstats_fill_xbpf(struct xbpf_d *d, struct bpf_d *bd)
277469f7644bSChristian S.J. Peron {
277569f7644bSChristian S.J. Peron 
277669f7644bSChristian S.J. Peron 	bzero(d, sizeof(*d));
277769f7644bSChristian S.J. Peron 	BPFD_LOCK_ASSERT(bd);
27784d621040SChristian S.J. Peron 	d->bd_structsize = sizeof(*d);
27796c74ff0eSAlexander V. Chernikov 	/* XXX: reading should be protected by global lock */
278069f7644bSChristian S.J. Peron 	d->bd_immediate = bd->bd_immediate;
278169f7644bSChristian S.J. Peron 	d->bd_promisc = bd->bd_promisc;
278269f7644bSChristian S.J. Peron 	d->bd_hdrcmplt = bd->bd_hdrcmplt;
2783560a54e1SJung-uk Kim 	d->bd_direction = bd->bd_direction;
2784560a54e1SJung-uk Kim 	d->bd_feedback = bd->bd_feedback;
278569f7644bSChristian S.J. Peron 	d->bd_async = bd->bd_async;
278669f7644bSChristian S.J. Peron 	d->bd_rcount = bd->bd_rcount;
278769f7644bSChristian S.J. Peron 	d->bd_dcount = bd->bd_dcount;
278869f7644bSChristian S.J. Peron 	d->bd_fcount = bd->bd_fcount;
278969f7644bSChristian S.J. Peron 	d->bd_sig = bd->bd_sig;
279069f7644bSChristian S.J. Peron 	d->bd_slen = bd->bd_slen;
279169f7644bSChristian S.J. Peron 	d->bd_hlen = bd->bd_hlen;
279269f7644bSChristian S.J. Peron 	d->bd_bufsize = bd->bd_bufsize;
279369f7644bSChristian S.J. Peron 	d->bd_pid = bd->bd_pid;
279469f7644bSChristian S.J. Peron 	strlcpy(d->bd_ifname,
279569f7644bSChristian S.J. Peron 	    bd->bd_bif->bif_ifp->if_xname, IFNAMSIZ);
279693e39f0bSChristian S.J. Peron 	d->bd_locked = bd->bd_locked;
27974d621040SChristian S.J. Peron 	d->bd_wcount = bd->bd_wcount;
27984d621040SChristian S.J. Peron 	d->bd_wdcount = bd->bd_wdcount;
27994d621040SChristian S.J. Peron 	d->bd_wfcount = bd->bd_wfcount;
28004d621040SChristian S.J. Peron 	d->bd_zcopy = bd->bd_zcopy;
28014d621040SChristian S.J. Peron 	d->bd_bufmode = bd->bd_bufmode;
280269f7644bSChristian S.J. Peron }
280369f7644bSChristian S.J. Peron 
28046c74ff0eSAlexander V. Chernikov /*
28056c74ff0eSAlexander V. Chernikov  * Handle `netstat -B' stats request
28066c74ff0eSAlexander V. Chernikov  */
280769f7644bSChristian S.J. Peron static int
280869f7644bSChristian S.J. Peron bpf_stats_sysctl(SYSCTL_HANDLER_ARGS)
280969f7644bSChristian S.J. Peron {
2810*0e1152fcSHans Petter Selasky 	static const struct xbpf_d zerostats;
2811*0e1152fcSHans Petter Selasky 	struct xbpf_d *xbdbuf, *xbd, tempstats;
2812422a63daSChristian S.J. Peron 	int index, error;
281369f7644bSChristian S.J. Peron 	struct bpf_if *bp;
281469f7644bSChristian S.J. Peron 	struct bpf_d *bd;
281569f7644bSChristian S.J. Peron 
281669f7644bSChristian S.J. Peron 	/*
281769f7644bSChristian S.J. Peron 	 * XXX This is not technically correct. It is possible for non
281869f7644bSChristian S.J. Peron 	 * privileged users to open bpf devices. It would make sense
281969f7644bSChristian S.J. Peron 	 * if the users who opened the devices were able to retrieve
282069f7644bSChristian S.J. Peron 	 * the statistics for them, too.
282169f7644bSChristian S.J. Peron 	 */
2822acd3428bSRobert Watson 	error = priv_check(req->td, PRIV_NET_BPF);
282369f7644bSChristian S.J. Peron 	if (error)
282469f7644bSChristian S.J. Peron 		return (error);
28250e37f3e1SChristian S.J. Peron 	/*
28260e37f3e1SChristian S.J. Peron 	 * Check to see if the user is requesting that the counters be
28270e37f3e1SChristian S.J. Peron 	 * zeroed out.  Explicitly check that the supplied data is zeroed,
28280e37f3e1SChristian S.J. Peron 	 * as we aren't allowing the user to set the counters currently.
28290e37f3e1SChristian S.J. Peron 	 */
28300e37f3e1SChristian S.J. Peron 	if (req->newptr != NULL) {
2831*0e1152fcSHans Petter Selasky 		if (req->newlen != sizeof(tempstats))
28320e37f3e1SChristian S.J. Peron 			return (EINVAL);
2833*0e1152fcSHans Petter Selasky 		memset(&tempstats, 0, sizeof(tempstats));
2834*0e1152fcSHans Petter Selasky 		error = SYSCTL_IN(req, &tempstats, sizeof(tempstats));
2835*0e1152fcSHans Petter Selasky 		if (error)
2836*0e1152fcSHans Petter Selasky 			return (error);
2837*0e1152fcSHans Petter Selasky 		if (bcmp(&tempstats, &zerostats, sizeof(tempstats)) != 0)
28380e37f3e1SChristian S.J. Peron 			return (EINVAL);
28390e37f3e1SChristian S.J. Peron 		bpf_zero_counters();
28400e37f3e1SChristian S.J. Peron 		return (0);
28410e37f3e1SChristian S.J. Peron 	}
284269f7644bSChristian S.J. Peron 	if (req->oldptr == NULL)
2843422a63daSChristian S.J. Peron 		return (SYSCTL_OUT(req, 0, bpf_bpfd_cnt * sizeof(*xbd)));
284469f7644bSChristian S.J. Peron 	if (bpf_bpfd_cnt == 0)
284569f7644bSChristian S.J. Peron 		return (SYSCTL_OUT(req, 0, 0));
2846422a63daSChristian S.J. Peron 	xbdbuf = malloc(req->oldlen, M_BPF, M_WAITOK);
2847e4b3229aSAlexander V. Chernikov 	BPF_LOCK();
2848422a63daSChristian S.J. Peron 	if (req->oldlen < (bpf_bpfd_cnt * sizeof(*xbd))) {
2849e4b3229aSAlexander V. Chernikov 		BPF_UNLOCK();
2850422a63daSChristian S.J. Peron 		free(xbdbuf, M_BPF);
2851422a63daSChristian S.J. Peron 		return (ENOMEM);
2852422a63daSChristian S.J. Peron 	}
2853422a63daSChristian S.J. Peron 	index = 0;
285469f7644bSChristian S.J. Peron 	LIST_FOREACH(bp, &bpf_iflist, bif_next) {
2855e4b3229aSAlexander V. Chernikov 		BPFIF_RLOCK(bp);
285651ec1eb7SAlexander V. Chernikov 		/* Send writers-only first */
285751ec1eb7SAlexander V. Chernikov 		LIST_FOREACH(bd, &bp->bif_wlist, bd_next) {
285851ec1eb7SAlexander V. Chernikov 			xbd = &xbdbuf[index++];
2859afa85850SAlexander V. Chernikov 			BPFD_LOCK(bd);
286051ec1eb7SAlexander V. Chernikov 			bpfstats_fill_xbpf(xbd, bd);
2861afa85850SAlexander V. Chernikov 			BPFD_UNLOCK(bd);
286251ec1eb7SAlexander V. Chernikov 		}
286369f7644bSChristian S.J. Peron 		LIST_FOREACH(bd, &bp->bif_dlist, bd_next) {
2864422a63daSChristian S.J. Peron 			xbd = &xbdbuf[index++];
2865afa85850SAlexander V. Chernikov 			BPFD_LOCK(bd);
2866422a63daSChristian S.J. Peron 			bpfstats_fill_xbpf(xbd, bd);
2867afa85850SAlexander V. Chernikov 			BPFD_UNLOCK(bd);
286869f7644bSChristian S.J. Peron 		}
2869e4b3229aSAlexander V. Chernikov 		BPFIF_RUNLOCK(bp);
287069f7644bSChristian S.J. Peron 	}
2871e4b3229aSAlexander V. Chernikov 	BPF_UNLOCK();
2872422a63daSChristian S.J. Peron 	error = SYSCTL_OUT(req, xbdbuf, index * sizeof(*xbd));
2873422a63daSChristian S.J. Peron 	free(xbdbuf, M_BPF);
287469f7644bSChristian S.J. Peron 	return (error);
287569f7644bSChristian S.J. Peron }
287669f7644bSChristian S.J. Peron 
/* Register bpf_drvinit() to run at SI_SUB_DRIVERS / SI_ORDER_MIDDLE. */
SYSINIT(bpfdev, SI_SUB_DRIVERS, SI_ORDER_MIDDLE, bpf_drvinit, NULL);
287853ac6efbSJulian Elischer 
28795bb5f2c9SPeter Wemm #else /* !DEV_BPF && !NETGRAPH_BPF */
2880f8dc4716SMike Smith /*
2881f8dc4716SMike Smith  * NOP stubs to allow bpf-using drivers to load and function.
2882f8dc4716SMike Smith  *
2883f8dc4716SMike Smith  * A 'better' implementation would allow the core bpf functionality
2884f8dc4716SMike Smith  * to be loaded at runtime.
2885f8dc4716SMike Smith  */
28867eae78a4SChristian S.J. Peron static struct bpf_if bp_null;
2887f8dc4716SMike Smith 
2888f8dc4716SMike Smith void
288919ba8395SChristian S.J. Peron bpf_tap(struct bpf_if *bp, u_char *pkt, u_int pktlen)
2890f8dc4716SMike Smith {
2891f8dc4716SMike Smith }
2892f8dc4716SMike Smith 
/* Stub: does nothing with the supplied mbuf. */
void
bpf_mtap(struct bpf_if *bp, struct mbuf *m)
{
}
2897f8dc4716SMike Smith 
2898f8dc4716SMike Smith void
289919ba8395SChristian S.J. Peron bpf_mtap2(struct bpf_if *bp, void *d, u_int l, struct mbuf *m)
2900437ffe18SSam Leffler {
2901437ffe18SSam Leffler }
2902437ffe18SSam Leffler 
2903437ffe18SSam Leffler void
290419ba8395SChristian S.J. Peron bpfattach(struct ifnet *ifp, u_int dlt, u_int hdrlen)
2905f8dc4716SMike Smith {
29067eae78a4SChristian S.J. Peron 
29077eae78a4SChristian S.J. Peron 	bpfattach2(ifp, dlt, hdrlen, &ifp->if_bpf);
2908f8dc4716SMike Smith }
2909f8dc4716SMike Smith 
2910da626c17SBill Paul void
291119ba8395SChristian S.J. Peron bpfattach2(struct ifnet *ifp, u_int dlt, u_int hdrlen, struct bpf_if **driverp)
29125f7a7923SSam Leffler {
29137eae78a4SChristian S.J. Peron 
29147eae78a4SChristian S.J. Peron 	*driverp = &bp_null;
29155f7a7923SSam Leffler }
29165f7a7923SSam Leffler 
/* Stub: nothing was allocated by the stub attach, so nothing to undo. */
void
bpfdetach(struct ifnet *ifp)
{
}
2921da626c17SBill Paul 
2922f8dc4716SMike Smith u_int
292319ba8395SChristian S.J. Peron bpf_filter(const struct bpf_insn *pc, u_char *p, u_int wirelen, u_int buflen)
2924f8dc4716SMike Smith {
2925f8dc4716SMike Smith 	return -1;	/* "no filter" behaviour */
2926f8dc4716SMike Smith }
2927f8dc4716SMike Smith 
/* Stub validator: reports every filter program as invalid. */
int
bpf_validate(const struct bpf_insn *f, int len)
{
	return (0);		/* false */
}
29335bb5f2c9SPeter Wemm 
29345bb5f2c9SPeter Wemm #endif /* !DEV_BPF && !NETGRAPH_BPF */
2935