The Tcpdump Group git mirrors - libpcap/blob - pcap-pf.c
Clean up the declaration of the packet-filtering routines.
[libpcap] / pcap-pf.c
1 /*
2 * Copyright (c) 1990, 1991, 1992, 1993, 1994, 1995, 1996
3 * The Regents of the University of California. All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that: (1) source code distributions
7 * retain the above copyright notice and this paragraph in its entirety, (2)
8 * distributions including binary code include the above copyright notice and
9 * this paragraph in its entirety in the documentation or other materials
10 * provided with the distribution, and (3) all advertising materials mentioning
11 * features or use of this software display the following acknowledgement:
12 * ``This product includes software developed by the University of California,
13 * Lawrence Berkeley Laboratory and its contributors.'' Neither the name of
14 * the University nor the names of its contributors may be used to endorse
15 * or promote products derived from this software without specific prior
16 * written permission.
17 * THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR IMPLIED
18 * WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED WARRANTIES OF
19 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
20 *
21 * packet filter subroutines for tcpdump
22 * Extraction/creation by Jeffrey Mogul, DECWRL
23 */
24
25 #ifdef HAVE_CONFIG_H
26 #include <config.h>
27 #endif
28
29 #include <sys/types.h>
30 #include <sys/time.h>
31 #include <sys/timeb.h>
32 #include <sys/socket.h>
33 #include <sys/file.h>
34 #include <sys/ioctl.h>
35 #include <net/pfilt.h>
36
37 struct mbuf;
38 struct rtentry;
39 #include <net/if.h>
40
41 #include <netinet/in.h>
42 #include <netinet/in_systm.h>
43 #include <netinet/ip.h>
44 #include <netinet/if_ether.h>
45 #include <netinet/ip_var.h>
46 #include <netinet/udp.h>
47 #include <netinet/udp_var.h>
48 #include <netinet/tcp.h>
49 #include <netinet/tcpip.h>
50
51 #include <ctype.h>
52 #include <errno.h>
53 #include <netdb.h>
54 #include <stdio.h>
55 #include <stdlib.h>
56 #include <string.h>
57 #include <unistd.h>
58
59 /*
60 * Make "pcap.h" not include "pcap/bpf.h"; we are going to include the
61 * native OS version, as we need various BPF ioctls from it.
62 */
63 #define PCAP_DONT_INCLUDE_PCAP_BPF_H
64 #include <net/bpf.h>
65
66 #include "pcap-int.h"
67
68 #ifdef HAVE_OS_PROTO_H
69 #include "os-proto.h"
70 #endif
71
/*
 * Number of pad bytes that precede each FDDI packet; the padding makes
 * everything line up on a nice boundary.
 */
#define	PCAP_FDDIPAD	3
76
77 /*
78 * Private data for capturing on Ultrix and DEC OSF/1^WDigital UNIX^W^W
79 * Tru64 UNIX packetfilter devices.
80 */
81 struct pcap_pf {
82 int filtering_in_kernel; /* using kernel filter */
83 u_long TotPkts; /* can't oflow for 79 hrs on ether */
84 u_long TotAccepted; /* count accepted by filter */
85 u_long TotDrops; /* count of dropped packets */
86 long TotMissed; /* missed by i/f during this run */
87 long OrigMissed; /* missed by i/f before this run */
88 };
89
90 static int pcap_setfilter_pf(pcap_t *, struct bpf_program *);
91
/*
 * Size, in bytes, of the packet read buffer (BUFSPACE).
 *
 * Most tcpdump applications aren't going to need more than 200 bytes of
 * packet header, and a single read shouldn't return more packets than
 * packetfilter's internal queue limit (bounded at 256).
 */
#define	BUFSPACE	(200 * 256)
99
100 static int
101 pcap_read_pf(pcap_t *pc, int cnt, pcap_handler callback, u_char *user)
102 {
103 struct pcap_pf *pf = pc->priv;
104 register u_char *p, *bp;
105 register int cc, n, buflen, inc;
106 register struct enstamp *sp;
107 struct enstamp stamp;
108 register u_int pad;
109
110 again:
111 cc = pc->cc;
112 if (cc == 0) {
113 cc = read(pc->fd, (char *)pc->buffer + pc->offset, pc->bufsize);
114 if (cc < 0) {
115 if (errno == EWOULDBLOCK)
116 return (0);
117 if (errno == EINVAL &&
118 lseek(pc->fd, 0L, SEEK_CUR) + pc->bufsize < 0) {
119 /*
120 * Due to a kernel bug, after 2^31 bytes,
121 * the kernel file offset overflows and
122 * read fails with EINVAL. The lseek()
123 * to 0 will fix things.
124 */
125 (void)lseek(pc->fd, 0L, SEEK_SET);
126 goto again;
127 }
128 pcap_fmt_errmsg_for_errno(pc->errbuf,
129 sizeof(pc->errbuf), errno, "pf read");
130 return (-1);
131 }
132 bp = (u_char *)pc->buffer + pc->offset;
133 } else
134 bp = pc->bp;
135 /*
136 * Loop through each packet.
137 */
138 n = 0;
139 pad = pc->fddipad;
140 while (cc > 0) {
141 /*
142 * Has "pcap_breakloop()" been called?
143 * If so, return immediately - if we haven't read any
144 * packets, clear the flag and return -2 to indicate
145 * that we were told to break out of the loop, otherwise
146 * leave the flag set, so that the *next* call will break
147 * out of the loop without having read any packets, and
148 * return the number of packets we've processed so far.
149 */
150 if (pc->break_loop) {
151 if (n == 0) {
152 pc->break_loop = 0;
153 return (-2);
154 } else {
155 pc->cc = cc;
156 pc->bp = bp;
157 return (n);
158 }
159 }
160 if (cc < sizeof(*sp)) {
161 pcap_snprintf(pc->errbuf, sizeof(pc->errbuf),
162 "pf short read (%d)", cc);
163 return (-1);
164 }
165 if ((long)bp & 3) {
166 sp = &stamp;
167 memcpy((char *)sp, (char *)bp, sizeof(*sp));
168 } else
169 sp = (struct enstamp *)bp;
170 if (sp->ens_stamplen != sizeof(*sp)) {
171 pcap_snprintf(pc->errbuf, sizeof(pc->errbuf),
172 "pf short stamplen (%d)",
173 sp->ens_stamplen);
174 return (-1);
175 }
176
177 p = bp + sp->ens_stamplen;
178 buflen = sp->ens_count;
179 if (buflen > pc->snapshot)
180 buflen = pc->snapshot;
181
182 /* Calculate inc before possible pad update */
183 inc = ENALIGN(buflen + sp->ens_stamplen);
184 cc -= inc;
185 bp += inc;
186 pf->TotPkts++;
187 pf->TotDrops += sp->ens_dropped;
188 pf->TotMissed = sp->ens_ifoverflows;
189 if (pf->OrigMissed < 0)
190 pf->OrigMissed = pf->TotMissed;
191
192 /*
193 * Short-circuit evaluation: if using BPF filter
194 * in kernel, no need to do it now - we already know
195 * the packet passed the filter.
196 *
197 * Note: the filter code was generated assuming
198 * that pc->fddipad was the amount of padding
199 * before the header, as that's what's required
200 * in the kernel, so we run the filter before
201 * skipping that padding.
202 */
203 if (pf->filtering_in_kernel ||
204 pcap_filter(pc->fcode.bf_insns, p, sp->ens_count, buflen)) {
205 struct pcap_pkthdr h;
206 pf->TotAccepted++;
207 h.ts = sp->ens_tstamp;
208 h.len = sp->ens_count - pad;
209 p += pad;
210 buflen -= pad;
211 h.caplen = buflen;
212 (*callback)(user, &h, p);
213 if (++n >= cnt && !PACKET_COUNT_IS_UNLIMITED(cnt)) {
214 pc->cc = cc;
215 pc->bp = bp;
216 return (n);
217 }
218 }
219 }
220 pc->cc = 0;
221 return (n);
222 }
223
224 static int
225 pcap_inject_pf(pcap_t *p, const void *buf, size_t size)
226 {
227 int ret;
228
229 ret = write(p->fd, buf, size);
230 if (ret == -1) {
231 pcap_fmt_errmsg_for_errno(p->errbuf, PCAP_ERRBUF_SIZE,
232 errno, "send");
233 return (-1);
234 }
235 return (ret);
236 }
237
238 static int
239 pcap_stats_pf(pcap_t *p, struct pcap_stat *ps)
240 {
241 struct pcap_pf *pf = p->priv;
242
243 /*
244 * If packet filtering is being done in the kernel:
245 *
246 * "ps_recv" counts only packets that passed the filter.
247 * This does not include packets dropped because we
248 * ran out of buffer space. (XXX - perhaps it should,
249 * by adding "ps_drop" to "ps_recv", for compatibility
250 * with some other platforms. On the other hand, on
251 * some platforms "ps_recv" counts only packets that
252 * passed the filter, and on others it counts packets
253 * that didn't pass the filter....)
254 *
255 * "ps_drop" counts packets that passed the kernel filter
256 * (if any) but were dropped because the input queue was
257 * full.
258 *
259 * "ps_ifdrop" counts packets dropped by the network
260 * inteface (regardless of whether they would have passed
261 * the input filter, of course).
262 *
263 * If packet filtering is not being done in the kernel:
264 *
265 * "ps_recv" counts only packets that passed the filter.
266 *
267 * "ps_drop" counts packets that were dropped because the
268 * input queue was full, regardless of whether they passed
269 * the userland filter.
270 *
271 * "ps_ifdrop" counts packets dropped by the network
272 * inteface (regardless of whether they would have passed
273 * the input filter, of course).
274 *
275 * These statistics don't include packets not yet read from
276 * the kernel by libpcap, but they may include packets not
277 * yet read from libpcap by the application.
278 */
279 ps->ps_recv = pf->TotAccepted;
280 ps->ps_drop = pf->TotDrops;
281 ps->ps_ifdrop = pf->TotMissed - pf->OrigMissed;
282 return (0);
283 }
284
/*
 * This file includes the OS's <net/bpf.h> rather than our "pcap/bpf.h",
 * so DLT_DOCSIS is probably not defined; supply it ourselves if so.
 */
#ifndef DLT_DOCSIS
#define	DLT_DOCSIS	143
#endif
292
293 static int
294 pcap_activate_pf(pcap_t *p)
295 {
296 struct pcap_pf *pf = p->priv;
297 short enmode;
298 int backlog = -1; /* request the most */
299 struct enfilter Filter;
300 struct endevp devparams;
301 int err;
302
303 /*
304 * Initially try a read/write open (to allow the inject
305 * method to work). If that fails due to permission
306 * issues, fall back to read-only. This allows a
307 * non-root user to be granted specific access to pcap
308 * capabilities via file permissions.
309 *
310 * XXX - we should have an API that has a flag that
311 * controls whether to open read-only or read-write,
312 * so that denial of permission to send (or inability
313 * to send, if sending packets isn't supported on
314 * the device in question) can be indicated at open
315 * time.
316 *
317 * XXX - we assume here that "pfopen()" does not, in fact, modify
318 * its argument, even though it takes a "char *" rather than a
319 * "const char *" as its first argument. That appears to be
320 * the case, at least on Digital UNIX 4.0.
321 *
322 * XXX - is there an error that means "no such device"? Is
323 * there one that means "that device doesn't support pf"?
324 */
325 p->fd = pfopen(p->opt.device, O_RDWR);
326 if (p->fd == -1 && errno == EACCES)
327 p->fd = pfopen(p->opt.device, O_RDONLY);
328 if (p->fd < 0) {
329 if (errno == EACCES) {
330 pcap_snprintf(p->errbuf, PCAP_ERRBUF_SIZE,
331 "pf open: %s: Permission denied\n"
332 "your system may not be properly configured; see the packetfilter(4) man page",
333 p->opt.device);
334 err = PCAP_ERROR_PERM_DENIED;
335 } else {
336 pcap_fmt_errmsg_for_errno(p->errbuf, PCAP_ERRBUF_SIZE,
337 errno, "pf open: %s", p->opt.device);
338 err = PCAP_ERROR;
339 }
340 goto bad;
341 }
342
343 /*
344 * Turn a negative snapshot value (invalid), a snapshot value of
345 * 0 (unspecified), or a value bigger than the normal maximum
346 * value, into the maximum allowed value.
347 *
348 * If some application really *needs* a bigger snapshot
349 * length, we should just increase MAXIMUM_SNAPLEN.
350 */
351 if (p->snapshot <= 0 || p->snapshot > MAXIMUM_SNAPLEN)
352 p->snapshot = MAXIMUM_SNAPLEN;
353
354 pf->OrigMissed = -1;
355 enmode = ENTSTAMP|ENNONEXCL;
356 if (!p->opt.immediate)
357 enmode |= ENBATCH;
358 if (p->opt.promisc)
359 enmode |= ENPROMISC;
360 if (ioctl(p->fd, EIOCMBIS, (caddr_t)&enmode) < 0) {
361 pcap_fmt_errmsg_for_errno(p->errbuf, PCAP_ERRBUF_SIZE,
362 errno, "EIOCMBIS");
363 err = PCAP_ERROR;
364 goto bad;
365 }
366 #ifdef ENCOPYALL
367 /* Try to set COPYALL mode so that we see packets to ourself */
368 enmode = ENCOPYALL;
369 (void)ioctl(p->fd, EIOCMBIS, (caddr_t)&enmode);/* OK if this fails */
370 #endif
371 /* set the backlog */
372 if (ioctl(p->fd, EIOCSETW, (caddr_t)&backlog) < 0) {
373 pcap_fmt_errmsg_for_errno(p->errbuf, PCAP_ERRBUF_SIZE,
374 errno, "EIOCSETW");
375 err = PCAP_ERROR;
376 goto bad;
377 }
378 /* discover interface type */
379 if (ioctl(p->fd, EIOCDEVP, (caddr_t)&devparams) < 0) {
380 pcap_fmt_errmsg_for_errno(p->errbuf, PCAP_ERRBUF_SIZE,
381 errno, "EIOCDEVP");
382 err = PCAP_ERROR;
383 goto bad;
384 }
385 /* HACK: to compile prior to Ultrix 4.2 */
386 #ifndef ENDT_FDDI
387 #define ENDT_FDDI 4
388 #endif
389 switch (devparams.end_dev_type) {
390
391 case ENDT_10MB:
392 p->linktype = DLT_EN10MB;
393 p->offset = 2;
394 /*
395 * This is (presumably) a real Ethernet capture; give it a
396 * link-layer-type list with DLT_EN10MB and DLT_DOCSIS, so
397 * that an application can let you choose it, in case you're
398 * capturing DOCSIS traffic that a Cisco Cable Modem
399 * Termination System is putting out onto an Ethernet (it
400 * doesn't put an Ethernet header onto the wire, it puts raw
401 * DOCSIS frames out on the wire inside the low-level
402 * Ethernet framing).
403 */
404 p->dlt_list = (u_int *) malloc(sizeof(u_int) * 2);
405 /*
406 * If that fails, just leave the list empty.
407 */
408 if (p->dlt_list != NULL) {
409 p->dlt_list[0] = DLT_EN10MB;
410 p->dlt_list[1] = DLT_DOCSIS;
411 p->dlt_count = 2;
412 }
413 break;
414
415 case ENDT_FDDI:
416 p->linktype = DLT_FDDI;
417 break;
418
419 #ifdef ENDT_SLIP
420 case ENDT_SLIP:
421 p->linktype = DLT_SLIP;
422 break;
423 #endif
424
425 #ifdef ENDT_PPP
426 case ENDT_PPP:
427 p->linktype = DLT_PPP;
428 break;
429 #endif
430
431 #ifdef ENDT_LOOPBACK
432 case ENDT_LOOPBACK:
433 /*
434 * It appears to use Ethernet framing, at least on
435 * Digital UNIX 4.0.
436 */
437 p->linktype = DLT_EN10MB;
438 p->offset = 2;
439 break;
440 #endif
441
442 #ifdef ENDT_TRN
443 case ENDT_TRN:
444 p->linktype = DLT_IEEE802;
445 break;
446 #endif
447
448 default:
449 /*
450 * XXX - what about ENDT_IEEE802? The pfilt.h header
451 * file calls this "IEEE 802 networks (non-Ethernet)",
452 * but that doesn't specify a specific link layer type;
453 * it could be 802.4, or 802.5 (except that 802.5 is
454 * ENDT_TRN), or 802.6, or 802.11, or.... That's why
455 * DLT_IEEE802 was hijacked to mean Token Ring in various
456 * BSDs, and why we went along with that hijacking.
457 *
458 * XXX - what about ENDT_HDLC and ENDT_NULL?
459 * Presumably, as ENDT_OTHER is just "Miscellaneous
460 * framing", there's not much we can do, as that
461 * doesn't specify a particular type of header.
462 */
463 pcap_snprintf(p->errbuf, PCAP_ERRBUF_SIZE,
464 "unknown data-link type %u", devparams.end_dev_type);
465 err = PCAP_ERROR;
466 goto bad;
467 }
468 /* set truncation */
469 if (p->linktype == DLT_FDDI) {
470 p->fddipad = PCAP_FDDIPAD;
471
472 /* packetfilter includes the padding in the snapshot */
473 p->snapshot += PCAP_FDDIPAD;
474 } else
475 p->fddipad = 0;
476 if (ioctl(p->fd, EIOCTRUNCATE, (caddr_t)&p->snapshot) < 0) {
477 pcap_fmt_errmsg_for_errno(p->errbuf, PCAP_ERRBUF_SIZE,
478 errno, "EIOCTRUNCATE");
479 err = PCAP_ERROR;
480 goto bad;
481 }
482 /* accept all packets */
483 memset(&Filter, 0, sizeof(Filter));
484 Filter.enf_Priority = 37; /* anything > 2 */
485 Filter.enf_FilterLen = 0; /* means "always true" */
486 if (ioctl(p->fd, EIOCSETF, (caddr_t)&Filter) < 0) {
487 pcap_fmt_errmsg_for_errno(p->errbuf, PCAP_ERRBUF_SIZE,
488 errno, "EIOCSETF");
489 err = PCAP_ERROR;
490 goto bad;
491 }
492
493 if (p->opt.timeout != 0) {
494 struct timeval timeout;
495 timeout.tv_sec = p->opt.timeout / 1000;
496 timeout.tv_usec = (p->opt.timeout * 1000) % 1000000;
497 if (ioctl(p->fd, EIOCSRTIMEOUT, (caddr_t)&timeout) < 0) {
498 pcap_fmt_errmsg_for_errno(p->errbuf, PCAP_ERRBUF_SIZE,
499 errno, "EIOCSRTIMEOUT");
500 err = PCAP_ERROR;
501 goto bad;
502 }
503 }
504
505 p->bufsize = BUFSPACE;
506 p->buffer = malloc(p->bufsize + p->offset);
507 if (p->buffer == NULL) {
508 pcap_fmt_errmsg_for_errno(p->errbuf, PCAP_ERRBUF_SIZE,
509 errno, "malloc");
510 err = PCAP_ERROR;
511 goto bad;
512 }
513
514 /*
515 * "select()" and "poll()" work on packetfilter devices.
516 */
517 p->selectable_fd = p->fd;
518
519 p->read_op = pcap_read_pf;
520 p->inject_op = pcap_inject_pf;
521 p->setfilter_op = pcap_setfilter_pf;
522 p->setdirection_op = NULL; /* Not implemented. */
523 p->set_datalink_op = NULL; /* can't change data link type */
524 p->getnonblock_op = pcap_getnonblock_fd;
525 p->setnonblock_op = pcap_setnonblock_fd;
526 p->stats_op = pcap_stats_pf;
527
528 return (0);
529 bad:
530 pcap_cleanup_live_common(p);
531 return (err);
532 }
533
534 pcap_t *
535 pcap_create_interface(const char *device _U_, char *ebuf)
536 {
537 pcap_t *p;
538
539 p = pcap_create_common(ebuf, sizeof (struct pcap_pf));
540 if (p == NULL)
541 return (NULL);
542
543 p->activate_op = pcap_activate_pf;
544 return (p);
545 }
546
547 /*
548 * XXX - is there an error from pfopen() that means "no such device"?
549 * Is there one that means "that device doesn't support pf"?
550 */
551 static int
552 can_be_bound(const char *name _U_)
553 {
554 return (1);
555 }
556
557 static int
558 get_if_flags(const char *name _U_, bpf_u_int32 *flags _U_, char *errbuf _U_)
559 {
560 /*
561 * Nothing we can do other than mark loopback devices as "the
562 * connected/disconnected status doesn't apply".
563 *
564 * XXX - is there a way to find out whether an adapter has
565 * something plugged into it?
566 */
567 if (*flags & PCAP_IF_LOOPBACK) {
568 /*
569 * Loopback devices aren't wireless, and "connected"/
570 * "disconnected" doesn't apply to them.
571 */
572 *flags |= PCAP_IF_CONNECTION_STATUS_NOT_APPLICABLE;
573 return (0);
574 }
575 return (0);
576 }
577
578 int
579 pcap_platform_finddevs(pcap_if_list_t *devlistp, char *errbuf)
580 {
581 return (pcap_findalldevs_interfaces(devlistp, errbuf, can_be_bound,
582 get_if_flags));
583 }
584
585 static int
586 pcap_setfilter_pf(pcap_t *p, struct bpf_program *fp)
587 {
588 struct pcap_pf *pf = p->priv;
589 struct bpf_version bv;
590
591 /*
592 * See if BIOCVERSION works. If not, we assume the kernel doesn't
593 * support BPF-style filters (it's not documented in the bpf(7)
594 * or packetfiler(7) man pages, but the code used to fail if
595 * BIOCSETF worked but BIOCVERSION didn't, and I've seen it do
596 * kernel filtering in DU 4.0, so presumably BIOCVERSION works
597 * there, at least).
598 */
599 if (ioctl(p->fd, BIOCVERSION, (caddr_t)&bv) >= 0) {
600 /*
601 * OK, we have the version of the BPF interpreter;
602 * is it the same major version as us, and the same
603 * or better minor version?
604 */
605 if (bv.bv_major == BPF_MAJOR_VERSION &&
606 bv.bv_minor >= BPF_MINOR_VERSION) {
607 /*
608 * Yes. Try to install the filter.
609 */
610 if (ioctl(p->fd, BIOCSETF, (caddr_t)fp) < 0) {
611 pcap_fmt_errmsg_for_errno(p->errbuf,
612 sizeof(p->errbuf), errno, "BIOCSETF");
613 return (-1);
614 }
615
616 /*
617 * OK, that succeeded. We're doing filtering in
618 * the kernel. (We assume we don't have a
619 * userland filter installed - that'd require
620 * a previous version check to have failed but
621 * this one to succeed.)
622 *
623 * XXX - this message should be supplied to the
624 * application as a warning of some sort,
625 * except that if it's a GUI application, it's
626 * not clear that it should be displayed in
627 * a window to annoy the user.
628 */
629 fprintf(stderr, "tcpdump: Using kernel BPF filter\n");
630 pf->filtering_in_kernel = 1;
631
632 /*
633 * Discard any previously-received packets,
634 * as they might have passed whatever filter
635 * was formerly in effect, but might not pass
636 * this filter (BIOCSETF discards packets buffered
637 * in the kernel, so you can lose packets in any
638 * case).
639 */
640 p->cc = 0;
641 return (0);
642 }
643
644 /*
645 * We can't use the kernel's BPF interpreter; don't give
646 * up, just log a message and be inefficient.
647 *
648 * XXX - this should really be supplied to the application
649 * as a warning of some sort.
650 */
651 fprintf(stderr,
652 "tcpdump: Requires BPF language %d.%d or higher; kernel is %d.%d\n",
653 BPF_MAJOR_VERSION, BPF_MINOR_VERSION,
654 bv.bv_major, bv.bv_minor);
655 }
656
657 /*
658 * We couldn't do filtering in the kernel; do it in userland.
659 */
660 if (install_bpf_program(p, fp) < 0)
661 return (-1);
662
663 /*
664 * XXX - this message should be supplied by the application as
665 * a warning of some sort.
666 */
667 fprintf(stderr, "tcpdump: Filtering in user process\n");
668 pf->filtering_in_kernel = 0;
669 return (0);
670 }
671
672 /*
673 * Libpcap version string.
674 */
675 const char *
676 pcap_lib_version(void)
677 {
678 return (PCAP_VERSION_STRING);
679 }