xref: /freebsd/contrib/libpcap/pcap-pf.c (revision 1e413cf93298b5b97441a21d9a50fdcd0ee9945e)
1 /*
2  * Copyright (c) 1990, 1991, 1992, 1993, 1994, 1995, 1996
3  *	The Regents of the University of California.  All rights reserved.
4  *
5  * Redistribution and use in source and binary forms, with or without
6  * modification, are permitted provided that: (1) source code distributions
7  * retain the above copyright notice and this paragraph in its entirety, (2)
8  * distributions including binary code include the above copyright notice and
9  * this paragraph in its entirety in the documentation or other materials
10  * provided with the distribution, and (3) all advertising materials mentioning
11  * features or use of this software display the following acknowledgement:
12  * ``This product includes software developed by the University of California,
13  * Lawrence Berkeley Laboratory and its contributors.'' Neither the name of
14  * the University nor the names of its contributors may be used to endorse
15  * or promote products derived from this software without specific prior
16  * written permission.
17  * THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR IMPLIED
18  * WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED WARRANTIES OF
19  * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
20  *
21  * packet filter subroutines for tcpdump
22  *	Extraction/creation by Jeffrey Mogul, DECWRL
23  */
24 
25 #ifndef lint
26 static const char rcsid[] _U_ =
27     "@(#) $Header: /tcpdump/master/libpcap/pcap-pf.c,v 1.91.2.2 2005/05/03 18:54:37 guy Exp $ (LBL)";
28 #endif
29 
30 #ifdef HAVE_CONFIG_H
31 #include "config.h"
32 #endif
33 
34 #include <sys/types.h>
35 #include <sys/time.h>
36 #include <sys/timeb.h>
37 #include <sys/socket.h>
38 #include <sys/file.h>
39 #include <sys/ioctl.h>
40 #include <net/pfilt.h>
41 
42 struct mbuf;
43 struct rtentry;
44 #include <net/if.h>
45 
46 #include <netinet/in.h>
47 #include <netinet/in_systm.h>
48 #include <netinet/ip.h>
49 #include <netinet/if_ether.h>
50 #include <netinet/ip_var.h>
51 #include <netinet/udp.h>
52 #include <netinet/udp_var.h>
53 #include <netinet/tcp.h>
54 #include <netinet/tcpip.h>
55 
56 #include <ctype.h>
57 #include <errno.h>
58 #include <netdb.h>
59 #include <stdio.h>
60 #include <stdlib.h>
61 #include <string.h>
62 #include <unistd.h>
63 
64 /*
65  * Make "pcap.h" not include "pcap-bpf.h"; we are going to include the
66  * native OS version, as we need various BPF ioctls from it.
67  */
68 #define PCAP_DONT_INCLUDE_PCAP_BPF_H
69 #include <net/bpf.h>
70 
71 #include "pcap-int.h"
72 
73 #ifdef HAVE_OS_PROTO_H
74 #include "os-proto.h"
75 #endif
76 
77 static int pcap_setfilter_pf(pcap_t *, struct bpf_program *);
78 
79 /*
80  * BUFSPACE is the size in bytes of the packet read buffer.  Most tcpdump
81  * applications aren't going to need more than 200 bytes of packet header
82  * and the read shouldn't return more packets than packetfilter's internal
83  * queue limit (bounded at 256).
84  */
85 #define BUFSPACE (200 * 256)
86 
87 static int
88 pcap_read_pf(pcap_t *pc, int cnt, pcap_handler callback, u_char *user)
89 {
90 	register u_char *p, *bp;
91 	struct bpf_insn *fcode;
92 	register int cc, n, buflen, inc;
93 	register struct enstamp *sp;
94 #ifdef LBL_ALIGN
95 	struct enstamp stamp;
96 #endif
97 #ifdef PCAP_FDDIPAD
98 	register int pad;
99 #endif
100 
101 	fcode = pc->md.use_bpf ? NULL : pc->fcode.bf_insns;
102  again:
103 	cc = pc->cc;
104 	if (cc == 0) {
105 		cc = read(pc->fd, (char *)pc->buffer + pc->offset, pc->bufsize);
106 		if (cc < 0) {
107 			if (errno == EWOULDBLOCK)
108 				return (0);
109 			if (errno == EINVAL &&
110 			    lseek(pc->fd, 0L, SEEK_CUR) + pc->bufsize < 0) {
111 				/*
112 				 * Due to a kernel bug, after 2^31 bytes,
113 				 * the kernel file offset overflows and
114 				 * read fails with EINVAL. The lseek()
115 				 * to 0 will fix things.
116 				 */
117 				(void)lseek(pc->fd, 0L, SEEK_SET);
118 				goto again;
119 			}
120 			snprintf(pc->errbuf, sizeof(pc->errbuf), "pf read: %s",
121 				pcap_strerror(errno));
122 			return (-1);
123 		}
124 		bp = pc->buffer + pc->offset;
125 	} else
126 		bp = pc->bp;
127 	/*
128 	 * Loop through each packet.
129 	 */
130 	n = 0;
131 #ifdef PCAP_FDDIPAD
132 	pad = pc->fddipad;
133 #endif
134 	while (cc > 0) {
135 		/*
136 		 * Has "pcap_breakloop()" been called?
137 		 * If so, return immediately - if we haven't read any
138 		 * packets, clear the flag and return -2 to indicate
139 		 * that we were told to break out of the loop, otherwise
140 		 * leave the flag set, so that the *next* call will break
141 		 * out of the loop without having read any packets, and
142 		 * return the number of packets we've processed so far.
143 		 */
144 		if (pc->break_loop) {
145 			if (n == 0) {
146 				pc->break_loop = 0;
147 				return (-2);
148 			} else {
149 				pc->cc = cc;
150 				pc->bp = bp;
151 				return (n);
152 			}
153 		}
154 		if (cc < sizeof(*sp)) {
155 			snprintf(pc->errbuf, sizeof(pc->errbuf),
156 			    "pf short read (%d)", cc);
157 			return (-1);
158 		}
159 #ifdef LBL_ALIGN
160 		if ((long)bp & 3) {
161 			sp = &stamp;
162 			memcpy((char *)sp, (char *)bp, sizeof(*sp));
163 		} else
164 #endif
165 			sp = (struct enstamp *)bp;
166 		if (sp->ens_stamplen != sizeof(*sp)) {
167 			snprintf(pc->errbuf, sizeof(pc->errbuf),
168 			    "pf short stamplen (%d)",
169 			    sp->ens_stamplen);
170 			return (-1);
171 		}
172 
173 		p = bp + sp->ens_stamplen;
174 		buflen = sp->ens_count;
175 		if (buflen > pc->snapshot)
176 			buflen = pc->snapshot;
177 
178 		/* Calculate inc before possible pad update */
179 		inc = ENALIGN(buflen + sp->ens_stamplen);
180 		cc -= inc;
181 		bp += inc;
182 		pc->md.TotPkts++;
183 		pc->md.TotDrops += sp->ens_dropped;
184 		pc->md.TotMissed = sp->ens_ifoverflows;
185 		if (pc->md.OrigMissed < 0)
186 			pc->md.OrigMissed = pc->md.TotMissed;
187 
188 		/*
189 		 * Short-circuit evaluation: if using BPF filter
190 		 * in kernel, no need to do it now.
191 		 *
192 #ifdef PCAP_FDDIPAD
193 		 * Note: the filter code was generated assuming
194 		 * that pc->fddipad was the amount of padding
195 		 * before the header, as that's what's required
196 		 * in the kernel, so we run the filter before
197 		 * skipping that padding.
198 #endif
199 		 */
200 		if (fcode == NULL ||
201 		    bpf_filter(fcode, p, sp->ens_count, buflen)) {
202 			struct pcap_pkthdr h;
203 			pc->md.TotAccepted++;
204 			h.ts = sp->ens_tstamp;
205 #ifdef PCAP_FDDIPAD
206 			h.len = sp->ens_count - pad;
207 #else
208 			h.len = sp->ens_count;
209 #endif
210 #ifdef PCAP_FDDIPAD
211 			p += pad;
212 			buflen -= pad;
213 #endif
214 			h.caplen = buflen;
215 			(*callback)(user, &h, p);
216 			if (++n >= cnt && cnt > 0) {
217 				pc->cc = cc;
218 				pc->bp = bp;
219 				return (n);
220 			}
221 		}
222 	}
223 	pc->cc = 0;
224 	return (n);
225 }
226 
227 static int
228 pcap_inject_pf(pcap_t *p, const void *buf, size_t size)
229 {
230 	int ret;
231 
232 	ret = write(p->fd, buf, size);
233 	if (ret == -1) {
234 		snprintf(p->errbuf, PCAP_ERRBUF_SIZE, "send: %s",
235 		    pcap_strerror(errno));
236 		return (-1);
237 	}
238 	return (ret);
239 }
240 
241 static int
242 pcap_stats_pf(pcap_t *p, struct pcap_stat *ps)
243 {
244 
245 	/*
246 	 * If packet filtering is being done in the kernel:
247 	 *
248 	 *	"ps_recv" counts only packets that passed the filter.
249 	 *	This does not include packets dropped because we
250 	 *	ran out of buffer space.  (XXX - perhaps it should,
251 	 *	by adding "ps_drop" to "ps_recv", for compatibility
252 	 *	with some other platforms.  On the other hand, on
253 	 *	some platforms "ps_recv" counts only packets that
254 	 *	passed the filter, and on others it counts packets
255 	 *	that didn't pass the filter....)
256 	 *
257 	 *	"ps_drop" counts packets that passed the kernel filter
258 	 *	(if any) but were dropped because the input queue was
259 	 *	full.
260 	 *
261 	 *	"ps_ifdrop" counts packets dropped by the network
262 	 *	inteface (regardless of whether they would have passed
263 	 *	the input filter, of course).
264 	 *
265 	 * If packet filtering is not being done in the kernel:
266 	 *
267 	 *	"ps_recv" counts only packets that passed the filter.
268 	 *
269 	 *	"ps_drop" counts packets that were dropped because the
270 	 *	input queue was full, regardless of whether they passed
271 	 *	the userland filter.
272 	 *
273 	 *	"ps_ifdrop" counts packets dropped by the network
274 	 *	inteface (regardless of whether they would have passed
275 	 *	the input filter, of course).
276 	 *
277 	 * These statistics don't include packets not yet read from
278 	 * the kernel by libpcap, but they may include packets not
279 	 * yet read from libpcap by the application.
280 	 */
281 	ps->ps_recv = p->md.TotAccepted;
282 	ps->ps_drop = p->md.TotDrops;
283 	ps->ps_ifdrop = p->md.TotMissed - p->md.OrigMissed;
284 	return (0);
285 }
286 
287 /*
288  * We include the OS's <net/bpf.h>, not our "pcap-bpf.h", so we probably
289  * don't get DLT_DOCSIS defined.
290  */
291 #ifndef DLT_DOCSIS
292 #define DLT_DOCSIS	143
293 #endif
294 
295 pcap_t *
296 pcap_open_live(const char *device, int snaplen, int promisc, int to_ms,
297     char *ebuf)
298 {
299 	pcap_t *p;
300 	short enmode;
301 	int backlog = -1;	/* request the most */
302 	struct enfilter Filter;
303 	struct endevp devparams;
304 
305 	p = (pcap_t *)malloc(sizeof(*p));
306 	if (p == NULL) {
307 		snprintf(ebuf, PCAP_ERRBUF_SIZE,
308 		    "pcap_open_live: %s", pcap_strerror(errno));
309 		return (0);
310 	}
311 	memset(p, 0, sizeof(*p));
312 	/*
313 	 * Initially try a read/write open (to allow the inject
314 	 * method to work).  If that fails due to permission
315 	 * issues, fall back to read-only.  This allows a
316 	 * non-root user to be granted specific access to pcap
317 	 * capabilities via file permissions.
318 	 *
319 	 * XXX - we should have an API that has a flag that
320 	 * controls whether to open read-only or read-write,
321 	 * so that denial of permission to send (or inability
322 	 * to send, if sending packets isn't supported on
323 	 * the device in question) can be indicated at open
324 	 * time.
325 	 *
326 	 * XXX - we assume here that "pfopen()" does not, in fact, modify
327 	 * its argument, even though it takes a "char *" rather than a
328 	 * "const char *" as its first argument.  That appears to be
329 	 * the case, at least on Digital UNIX 4.0.
330 	 */
331 	p->fd = pfopen(device, O_RDWR);
332 	if (p->fd == -1 && errno == EACCES)
333 		p->fd = pfopen(device, O_RDONLY);
334 	if (p->fd < 0) {
335 		snprintf(ebuf, PCAP_ERRBUF_SIZE, "pf open: %s: %s\n\
336 your system may not be properly configured; see the packetfilter(4) man page\n",
337 			device, pcap_strerror(errno));
338 		goto bad;
339 	}
340 	p->md.OrigMissed = -1;
341 	enmode = ENTSTAMP|ENBATCH|ENNONEXCL;
342 	if (promisc)
343 		enmode |= ENPROMISC;
344 	if (ioctl(p->fd, EIOCMBIS, (caddr_t)&enmode) < 0) {
345 		snprintf(ebuf, PCAP_ERRBUF_SIZE, "EIOCMBIS: %s",
346 		    pcap_strerror(errno));
347 		goto bad;
348 	}
349 #ifdef	ENCOPYALL
350 	/* Try to set COPYALL mode so that we see packets to ourself */
351 	enmode = ENCOPYALL;
352 	(void)ioctl(p->fd, EIOCMBIS, (caddr_t)&enmode);/* OK if this fails */
353 #endif
354 	/* set the backlog */
355 	if (ioctl(p->fd, EIOCSETW, (caddr_t)&backlog) < 0) {
356 		snprintf(ebuf, PCAP_ERRBUF_SIZE, "EIOCSETW: %s",
357 		    pcap_strerror(errno));
358 		goto bad;
359 	}
360 	/* discover interface type */
361 	if (ioctl(p->fd, EIOCDEVP, (caddr_t)&devparams) < 0) {
362 		snprintf(ebuf, PCAP_ERRBUF_SIZE, "EIOCDEVP: %s",
363 		    pcap_strerror(errno));
364 		goto bad;
365 	}
366 	/* HACK: to compile prior to Ultrix 4.2 */
367 #ifndef	ENDT_FDDI
368 #define	ENDT_FDDI	4
369 #endif
370 	switch (devparams.end_dev_type) {
371 
372 	case ENDT_10MB:
373 		p->linktype = DLT_EN10MB;
374 		p->offset = 2;
375 		/*
376 		 * This is (presumably) a real Ethernet capture; give it a
377 		 * link-layer-type list with DLT_EN10MB and DLT_DOCSIS, so
378 		 * that an application can let you choose it, in case you're
379 		 * capturing DOCSIS traffic that a Cisco Cable Modem
380 		 * Termination System is putting out onto an Ethernet (it
381 		 * doesn't put an Ethernet header onto the wire, it puts raw
382 		 * DOCSIS frames out on the wire inside the low-level
383 		 * Ethernet framing).
384 		 */
385 		p->dlt_list = (u_int *) malloc(sizeof(u_int) * 2);
386 		/*
387 		 * If that fails, just leave the list empty.
388 		 */
389 		if (p->dlt_list != NULL) {
390 			p->dlt_list[0] = DLT_EN10MB;
391 			p->dlt_list[1] = DLT_DOCSIS;
392 			p->dlt_count = 2;
393 		}
394 		break;
395 
396 	case ENDT_FDDI:
397 		p->linktype = DLT_FDDI;
398 		break;
399 
400 #ifdef ENDT_SLIP
401 	case ENDT_SLIP:
402 		p->linktype = DLT_SLIP;
403 		break;
404 #endif
405 
406 #ifdef ENDT_PPP
407 	case ENDT_PPP:
408 		p->linktype = DLT_PPP;
409 		break;
410 #endif
411 
412 #ifdef ENDT_LOOPBACK
413 	case ENDT_LOOPBACK:
414 		/*
415 		 * It appears to use Ethernet framing, at least on
416 		 * Digital UNIX 4.0.
417 		 */
418 		p->linktype = DLT_EN10MB;
419 		p->offset = 2;
420 		break;
421 #endif
422 
423 #ifdef ENDT_TRN
424 	case ENDT_TRN:
425 		p->linktype = DLT_IEEE802;
426 		break;
427 #endif
428 
429 	default:
430 		/*
431 		 * XXX - what about ENDT_IEEE802?  The pfilt.h header
432 		 * file calls this "IEEE 802 networks (non-Ethernet)",
433 		 * but that doesn't specify a specific link layer type;
434 		 * it could be 802.4, or 802.5 (except that 802.5 is
435 		 * ENDT_TRN), or 802.6, or 802.11, or....  That's why
436 		 * DLT_IEEE802 was hijacked to mean Token Ring in various
437 		 * BSDs, and why we went along with that hijacking.
438 		 *
439 		 * XXX - what about ENDT_HDLC and ENDT_NULL?
440 		 * Presumably, as ENDT_OTHER is just "Miscellaneous
441 		 * framing", there's not much we can do, as that
442 		 * doesn't specify a particular type of header.
443 		 */
444 		snprintf(ebuf, PCAP_ERRBUF_SIZE, "unknown data-link type %u",
445 		    devparams.end_dev_type);
446 		goto bad;
447 	}
448 	/* set truncation */
449 #ifdef PCAP_FDDIPAD
450 	if (p->linktype == DLT_FDDI) {
451 		p->fddipad = PCAP_FDDIPAD;
452 
453 		/* packetfilter includes the padding in the snapshot */
454 		snaplen += PCAP_FDDIPAD;
455 	} else
456 		p->fddipad = 0;
457 #endif
458 	if (ioctl(p->fd, EIOCTRUNCATE, (caddr_t)&snaplen) < 0) {
459 		snprintf(ebuf, PCAP_ERRBUF_SIZE, "EIOCTRUNCATE: %s",
460 		    pcap_strerror(errno));
461 		goto bad;
462 	}
463 	p->snapshot = snaplen;
464 	/* accept all packets */
465 	memset(&Filter, 0, sizeof(Filter));
466 	Filter.enf_Priority = 37;	/* anything > 2 */
467 	Filter.enf_FilterLen = 0;	/* means "always true" */
468 	if (ioctl(p->fd, EIOCSETF, (caddr_t)&Filter) < 0) {
469 		snprintf(ebuf, PCAP_ERRBUF_SIZE, "EIOCSETF: %s",
470 		    pcap_strerror(errno));
471 		goto bad;
472 	}
473 
474 	if (to_ms != 0) {
475 		struct timeval timeout;
476 		timeout.tv_sec = to_ms / 1000;
477 		timeout.tv_usec = (to_ms * 1000) % 1000000;
478 		if (ioctl(p->fd, EIOCSRTIMEOUT, (caddr_t)&timeout) < 0) {
479 			snprintf(ebuf, PCAP_ERRBUF_SIZE, "EIOCSRTIMEOUT: %s",
480 				pcap_strerror(errno));
481 			goto bad;
482 		}
483 	}
484 
485 	p->bufsize = BUFSPACE;
486 	p->buffer = (u_char*)malloc(p->bufsize + p->offset);
487 	if (p->buffer == NULL) {
488 		strlcpy(ebuf, pcap_strerror(errno), PCAP_ERRBUF_SIZE);
489 		goto bad;
490 	}
491 
492 	/*
493 	 * "select()" and "poll()" work on packetfilter devices.
494 	 */
495 	p->selectable_fd = p->fd;
496 
497 	p->read_op = pcap_read_pf;
498 	p->inject_op = pcap_inject_pf;
499 	p->setfilter_op = pcap_setfilter_pf;
500 	p->setdirection_op = NULL;	/* Not implemented. */
501 	p->set_datalink_op = NULL;	/* can't change data link type */
502 	p->getnonblock_op = pcap_getnonblock_fd;
503 	p->setnonblock_op = pcap_setnonblock_fd;
504 	p->stats_op = pcap_stats_pf;
505 	p->close_op = pcap_close_common;
506 
507 	return (p);
508  bad:
509 	if (p->fd >= 0)
510 		close(p->fd);
511 	/*
512 	 * Get rid of any link-layer type list we allocated.
513 	 */
514 	if (p->dlt_list != NULL)
515 		free(p->dlt_list);
516 	free(p);
517 	return (NULL);
518 }
519 
520 int
521 pcap_platform_finddevs(pcap_if_t **alldevsp, char *errbuf)
522 {
523 	return (0);
524 }
525 
526 static int
527 pcap_setfilter_pf(pcap_t *p, struct bpf_program *fp)
528 {
529 	struct bpf_version bv;
530 
531 	/*
532 	 * See if BIOCVERSION works.  If not, we assume the kernel doesn't
533 	 * support BPF-style filters (it's not documented in the bpf(7)
534 	 * or packetfiler(7) man pages, but the code used to fail if
535 	 * BIOCSETF worked but BIOCVERSION didn't, and I've seen it do
536 	 * kernel filtering in DU 4.0, so presumably BIOCVERSION works
537 	 * there, at least).
538 	 */
539 	if (ioctl(p->fd, BIOCVERSION, (caddr_t)&bv) >= 0) {
540 		/*
541 		 * OK, we have the version of the BPF interpreter;
542 		 * is it the same major version as us, and the same
543 		 * or better minor version?
544 		 */
545 		if (bv.bv_major == BPF_MAJOR_VERSION &&
546 		    bv.bv_minor >= BPF_MINOR_VERSION) {
547 			/*
548 			 * Yes.  Try to install the filter.
549 			 */
550 			if (ioctl(p->fd, BIOCSETF, (caddr_t)fp) < 0) {
551 				snprintf(p->errbuf, sizeof(p->errbuf),
552 				    "BIOCSETF: %s", pcap_strerror(errno));
553 				return (-1);
554 			}
555 
556 			/*
557 			 * OK, that succeeded.  We're doing filtering in
558 			 * the kernel.  (We assume we don't have a
559 			 * userland filter installed - that'd require
560 			 * a previous version check to have failed but
561 			 * this one to succeed.)
562 			 *
563 			 * XXX - this message should be supplied to the
564 			 * application as a warning of some sort,
565 			 * except that if it's a GUI application, it's
566 			 * not clear that it should be displayed in
567 			 * a window to annoy the user.
568 			 */
569 			fprintf(stderr, "tcpdump: Using kernel BPF filter\n");
570 			p->md.use_bpf = 1;
571 
572 			/*
573 			 * Discard any previously-received packets,
574 			 * as they might have passed whatever filter
575 			 * was formerly in effect, but might not pass
576 			 * this filter (BIOCSETF discards packets buffered
577 			 * in the kernel, so you can lose packets in any
578 			 * case).
579 			 */
580 			p->cc = 0;
581 			return (0);
582 		}
583 
584 		/*
585 		 * We can't use the kernel's BPF interpreter; don't give
586 		 * up, just log a message and be inefficient.
587 		 *
588 		 * XXX - this should really be supplied to the application
589 		 * as a warning of some sort.
590 		 */
591 		fprintf(stderr,
592 	    "tcpdump: Requires BPF language %d.%d or higher; kernel is %d.%d\n",
593 		    BPF_MAJOR_VERSION, BPF_MINOR_VERSION,
594 		    bv.bv_major, bv.bv_minor);
595 	}
596 
597 	/*
598 	 * We couldn't do filtering in the kernel; do it in userland.
599 	 */
600 	if (install_bpf_program(p, fp) < 0)
601 		return (-1);
602 
603 	/*
604 	 * XXX - this message should be supplied by the application as
605 	 * a warning of some sort.
606 	 */
607 	fprintf(stderr, "tcpdump: Filtering in user process\n");
608 	p->md.use_bpf = 0;
609 	return (0);
610 }
611