#include "bpf.h"
#ifndef __GNUC__
#define inline
#else
#define inline __inline
#endif
#include <sys/param.h>
#include <sys/systm.h>
#include <sys/conf.h>
#include <sys/malloc.h>
#include <sys/mbuf.h>
#include <sys/time.h>
#include <sys/proc.h>
#include <sys/signalvar.h>
#include <sys/filio.h>
#include <sys/sockio.h>
#include <sys/ttycom.h>
#include <sys/filedesc.h>
#include <sys/uio_internal.h>
#include <sys/file_internal.h>
#include <sys/event.h>
#include <sys/poll.h>
#include <sys/socket.h>
#include <sys/socketvar.h>
#include <sys/vnode.h>
#include <net/if.h>
#include <net/bpf.h>
#include <net/bpfdesc.h>
#include <netinet/in.h>
#include <netinet/in_pcb.h>
#include <netinet/in_var.h>
#include <netinet/ip_var.h>
#include <netinet/tcp.h>
#include <netinet/tcp_var.h>
#include <netinet/udp.h>
#include <netinet/udp_var.h>
#include <netinet/if_ether.h>
#include <sys/kernel.h>
#include <sys/sysctl.h>
#include <net/firewire.h>
#include <miscfs/devfs/devfs.h>
#include <net/dlil.h>
#include <net/pktap.h>
#include <kern/locks.h>
#include <kern/thread_call.h>
#include <libkern/section_keywords.h>
#if CONFIG_MACF_NET
#include <security/mac_framework.h>
#endif
extern int tvtohz(struct timeval *);
#define BPF_BUFSIZE 4096
#define UIOMOVE(cp, len, code, uio) uiomove(cp, len, uio)
#define PRINET 26
typedef void (*pktcopyfunc_t)(const void *, void *, size_t);
static unsigned int bpf_bufsize = BPF_BUFSIZE;
SYSCTL_INT(_debug, OID_AUTO, bpf_bufsize, CTLFLAG_RW | CTLFLAG_LOCKED,
&bpf_bufsize, 0, "");
__private_extern__ unsigned int bpf_maxbufsize = BPF_MAXBUFSIZE;
SYSCTL_INT(_debug, OID_AUTO, bpf_maxbufsize, CTLFLAG_RW | CTLFLAG_LOCKED,
&bpf_maxbufsize, 0, "");
static unsigned int bpf_maxdevices = 256;
SYSCTL_UINT(_debug, OID_AUTO, bpf_maxdevices, CTLFLAG_RW | CTLFLAG_LOCKED,
&bpf_maxdevices, 0, "");
#if CONFIG_EMBEDDED
static unsigned int bpf_wantpktap = 1;
#else
static unsigned int bpf_wantpktap = 0;
#endif
SYSCTL_UINT(_debug, OID_AUTO, bpf_wantpktap, CTLFLAG_RW | CTLFLAG_LOCKED,
&bpf_wantpktap, 0, "");
static int bpf_debug = 0;
SYSCTL_INT(_debug, OID_AUTO, bpf_debug, CTLFLAG_RW | CTLFLAG_LOCKED,
&bpf_debug, 0, "");
static struct bpf_if *bpf_iflist;
#ifdef __APPLE__
static struct bpf_d **bpf_dtab = NULL;
static unsigned int bpf_dtab_size = 0;
static unsigned int nbpfilter = 0;
decl_lck_mtx_data(static, bpf_mlock_data);
static lck_mtx_t *bpf_mlock = &bpf_mlock_data;
static lck_grp_t *bpf_mlock_grp;
static lck_grp_attr_t *bpf_mlock_grp_attr;
static lck_attr_t *bpf_mlock_attr;
#endif
static int bpf_allocbufs(struct bpf_d *);
static errno_t bpf_attachd(struct bpf_d *d, struct bpf_if *bp);
static int bpf_detachd(struct bpf_d *d, int);
static void bpf_freed(struct bpf_d *);
static int bpf_movein(struct uio *, int,
struct mbuf **, struct sockaddr *, int *);
static int bpf_setif(struct bpf_d *, ifnet_t ifp);
static void bpf_timed_out(void *, void *);
static void bpf_wakeup(struct bpf_d *);
static void catchpacket(struct bpf_d *, struct bpf_packet *, u_int, int);
static void reset_d(struct bpf_d *);
static int bpf_setf(struct bpf_d *, u_int, user_addr_t, u_long);
static int bpf_getdltlist(struct bpf_d *, caddr_t, struct proc *);
static int bpf_setdlt(struct bpf_d *, u_int);
static int bpf_set_traffic_class(struct bpf_d *, int);
static void bpf_set_packet_service_class(struct mbuf *, int);
static void bpf_acquire_d(struct bpf_d *);
static void bpf_release_d(struct bpf_d *);
static int bpf_devsw_installed;
void bpf_init(void *unused);
static int bpf_tap_callback(struct ifnet *ifp, struct mbuf *m);
d_open_t bpfopen;
d_close_t bpfclose;
d_read_t bpfread;
d_write_t bpfwrite;
ioctl_fcn_t bpfioctl;
select_fcn_t bpfselect;
#define CDEV_MAJOR 23
static struct cdevsw bpf_cdevsw = {
bpfopen,
bpfclose,
bpfread,
bpfwrite,
bpfioctl,
eno_stop,
eno_reset,
NULL,
bpfselect,
eno_mmap,
eno_strat,
eno_getc,
eno_putc,
0
};
#define SOCKADDR_HDR_LEN offsetof(struct sockaddr, sa_data)
static int
bpf_movein(struct uio *uio, int linktype, struct mbuf **mp, struct sockaddr *sockp, int *datlen)
{
struct mbuf *m;
int error;
int len;
uint8_t sa_family;
int hlen;
switch (linktype) {
#if SLIP
case DLT_SLIP:
sa_family = AF_INET;
hlen = 0;
break;
#endif
case DLT_EN10MB:
sa_family = AF_UNSPEC;
hlen = sizeof(struct ether_header);
break;
#if FDDI
case DLT_FDDI:
#if defined(__FreeBSD__) || defined(__bsdi__)
sa_family = AF_IMPLINK;
hlen = 0;
#else
sa_family = AF_UNSPEC;
hlen = 24;
#endif
break;
#endif
case DLT_RAW:
case DLT_NULL:
sa_family = AF_UNSPEC;
hlen = 0;
break;
#ifdef __FreeBSD__
case DLT_ATM_RFC1483:
sa_family = AF_UNSPEC;
hlen = 12;
break;
#endif
case DLT_PPP:
sa_family = AF_UNSPEC;
hlen = 4;
break;
case DLT_APPLE_IP_OVER_IEEE1394:
sa_family = AF_UNSPEC;
hlen = sizeof(struct firewire_header);
break;
case DLT_IEEE802_11:
sa_family = AF_IEEE80211;
hlen = 0;
break;
case DLT_IEEE802_11_RADIO:
sa_family = AF_IEEE80211;
hlen = 0;
break;
default:
return (EIO);
}
len = uio_resid(uio);
*datlen = len - hlen;
if ((unsigned)len > MCLBYTES)
return (EIO);
if (sockp) {
if ((hlen + SOCKADDR_HDR_LEN) > sockp->sa_len) {
return (EIO);
}
sockp->sa_family = sa_family;
} else {
hlen = 0;
}
MGETHDR(m, M_WAIT, MT_DATA);
if (m == 0)
return (ENOBUFS);
if ((unsigned)len > MHLEN) {
MCLGET(m, M_WAIT);
if ((m->m_flags & M_EXT) == 0) {
error = ENOBUFS;
goto bad;
}
}
m->m_pkthdr.len = m->m_len = len;
m->m_pkthdr.rcvif = NULL;
*mp = m;
if (hlen != 0) {
m->m_pkthdr.len -= hlen;
m->m_len -= hlen;
m->m_data += hlen;
error = UIOMOVE((caddr_t)sockp->sa_data, hlen, UIO_WRITE, uio);
if (error)
goto bad;
}
error = UIOMOVE(mtod(m, caddr_t), len - hlen, UIO_WRITE, uio);
if (error)
goto bad;
switch (linktype) {
case DLT_EN10MB: {
struct ether_header *eh = mtod(m, struct ether_header *);
if (ETHER_IS_MULTICAST(eh->ether_dhost)) {
if (_ether_cmp(etherbroadcastaddr, eh->ether_dhost) == 0)
m->m_flags |= M_BCAST;
else
m->m_flags |= M_MCAST;
}
break;
}
}
return 0;
bad:
m_freem(m);
return (error);
}
#ifdef __APPLE__
static void
bpf_make_dev_t(int maj)
{
static int bpf_growing = 0;
unsigned int cur_size = nbpfilter, i;
if (nbpfilter >= bpf_maxdevices)
return;
while (bpf_growing) {
(void)tsleep((caddr_t)&bpf_growing, PZERO, "bpf_growing", 0);
}
if (nbpfilter > cur_size) {
return;
}
bpf_growing = 1;
if (nbpfilter == bpf_dtab_size) {
int new_dtab_size;
struct bpf_d **new_dtab = NULL;
struct bpf_d **old_dtab = NULL;
new_dtab_size = bpf_dtab_size + NBPFILTER;
new_dtab = (struct bpf_d **)_MALLOC(sizeof(struct bpf_d *) * new_dtab_size, M_DEVBUF, M_WAIT);
if (new_dtab == 0) {
printf("bpf_make_dev_t: malloc bpf_dtab failed\n");
goto done;
}
if (bpf_dtab) {
bcopy(bpf_dtab, new_dtab,
sizeof(struct bpf_d *) * bpf_dtab_size);
}
bzero(new_dtab + bpf_dtab_size,
sizeof(struct bpf_d *) * NBPFILTER);
old_dtab = bpf_dtab;
bpf_dtab = new_dtab;
bpf_dtab_size = new_dtab_size;
if (old_dtab != NULL)
_FREE(old_dtab, M_DEVBUF);
}
i = nbpfilter++;
(void) devfs_make_node(makedev(maj, i),
DEVFS_CHAR, UID_ROOT, GID_WHEEL, 0600,
"bpf%d", i);
done:
bpf_growing = 0;
wakeup((caddr_t)&bpf_growing);
}
#endif
static errno_t
bpf_attachd(struct bpf_d *d, struct bpf_if *bp)
{
int first = bp->bif_dlist == NULL;
int error = 0;
d->bd_bif = bp;
d->bd_next = bp->bif_dlist;
bp->bif_dlist = d;
bpf_acquire_d(d);
if (first) {
if (bp->bif_ifp->if_bpf == NULL) {
struct bpf_if *tmp, *primary = NULL;
for (tmp = bpf_iflist; tmp; tmp = tmp->bif_next) {
if (tmp->bif_ifp == bp->bif_ifp) {
primary = tmp;
break;
}
}
bp->bif_ifp->if_bpf = primary;
}
if (bp->bif_ifp->if_bpf == bp)
dlil_set_bpf_tap(bp->bif_ifp, BPF_TAP_INPUT_OUTPUT, bpf_tap_callback);
if (bp->bif_tap != NULL)
error = bp->bif_tap(bp->bif_ifp, bp->bif_dlt, BPF_TAP_INPUT_OUTPUT);
}
d->bd_flags &= ~(BPF_DETACHING | BPF_DETACHED);
if (bp->bif_dlt == DLT_PKTAP) {
d->bd_flags |= BPF_FINALIZE_PKTAP;
} else {
d->bd_flags &= ~BPF_FINALIZE_PKTAP;
}
return error;
}
static int
bpf_detachd(struct bpf_d *d, int closing)
{
struct bpf_d **p;
struct bpf_if *bp;
struct ifnet *ifp;
int bpf_closed = d->bd_flags & BPF_CLOSING;
if ((d->bd_flags & (BPF_DETACHED | BPF_DETACHING)) != 0)
goto done;
d->bd_flags |= BPF_DETACHING;
ifp = d->bd_bif->bif_ifp;
bp = d->bd_bif;
if (bpf_debug != 0)
printf("%s: %llx %s%s\n",
__func__, (uint64_t)VM_KERNEL_ADDRPERM(d),
if_name(ifp), closing ? " closing" : "");
p = &bp->bif_dlist;
while (*p != d) {
p = &(*p)->bd_next;
if (*p == 0)
panic("bpf_detachd: descriptor not in list");
}
*p = (*p)->bd_next;
if (bp->bif_dlist == 0) {
if (bp->bif_ifp->if_bpf == bp)
dlil_set_bpf_tap(ifp, BPF_TAP_DISABLE, NULL);
if (bp->bif_tap)
bp->bif_tap(ifp, bp->bif_dlt, BPF_TAP_DISABLE);
for (bp = bpf_iflist; bp; bp = bp->bif_next)
if (bp->bif_ifp == ifp && bp->bif_dlist != 0)
break;
if (bp == NULL)
ifp->if_bpf = NULL;
}
d->bd_bif = NULL;
if (d->bd_promisc) {
d->bd_promisc = 0;
lck_mtx_unlock(bpf_mlock);
if (ifnet_set_promiscuous(ifp, 0)) {
printf("%s: ifnet_set_promiscuous failed\n", __func__);
}
lck_mtx_lock(bpf_mlock);
}
d->bd_flags &= ~BPF_DETACHING;
d->bd_flags |= BPF_DETACHED;
bpf_closed = d->bd_flags & BPF_CLOSING;
bpf_release_d(d);
done:
if (bpf_debug != 0)
printf("%s: %llx done\n",
__func__, (uint64_t)VM_KERNEL_ADDRPERM(d));
if (bpf_closed)
return (1);
else
return (0);
}
static void
bpf_start_timer(struct bpf_d *d)
{
uint64_t deadline;
struct timeval tv;
if (d->bd_rtout > 0 && d->bd_state == BPF_IDLE) {
tv.tv_sec = d->bd_rtout / hz;
tv.tv_usec = (d->bd_rtout % hz) * tick;
clock_interval_to_deadline(
(uint64_t)tv.tv_sec * USEC_PER_SEC + tv.tv_usec,
NSEC_PER_USEC, &deadline);
thread_call_enter_delayed(d->bd_thread_call, deadline);
d->bd_state = BPF_WAITING;
}
}
static boolean_t
bpf_stop_timer(struct bpf_d *d)
{
return (thread_call_cancel(d->bd_thread_call));
}
void
bpf_acquire_d(struct bpf_d *d)
{
void *lr_saved = __builtin_return_address(0);
LCK_MTX_ASSERT(bpf_mlock, LCK_MTX_ASSERT_OWNED);
d->bd_refcnt += 1;
d->bd_ref_lr[d->bd_next_ref_lr] = lr_saved;
d->bd_next_ref_lr = (d->bd_next_ref_lr + 1) % BPF_REF_HIST;
}
void
bpf_release_d(struct bpf_d *d)
{
void *lr_saved = __builtin_return_address(0);
LCK_MTX_ASSERT(bpf_mlock, LCK_MTX_ASSERT_OWNED);
if (d->bd_refcnt <= 0)
panic("%s: %p refcnt <= 0", __func__, d);
d->bd_refcnt -= 1;
d->bd_unref_lr[d->bd_next_unref_lr] = lr_saved;
d->bd_next_unref_lr = (d->bd_next_unref_lr + 1) % BPF_REF_HIST;
if (d->bd_refcnt == 0) {
if ((d->bd_flags & BPF_DETACHED) == 0)
panic("%s: %p BPF_DETACHED not set", __func__, d);
_FREE(d, M_DEVBUF);
}
}
int
bpfopen(dev_t dev, int flags, __unused int fmt,
__unused struct proc *p)
{
struct bpf_d *d;
lck_mtx_lock(bpf_mlock);
if ((unsigned int) minor(dev) >= nbpfilter) {
lck_mtx_unlock(bpf_mlock);
return (ENXIO);
}
if ((unsigned int) minor(dev) == (nbpfilter - 1))
bpf_make_dev_t(major(dev));
if (bpf_dtab[minor(dev)] == 0) {
bpf_dtab[minor(dev)] = (void *)1;
} else {
lck_mtx_unlock(bpf_mlock);
return (EBUSY);
}
d = (struct bpf_d *)_MALLOC(sizeof(struct bpf_d), M_DEVBUF,
M_WAIT | M_ZERO);
if (d == NULL) {
printf("bpfopen: malloc bpf_d failed\n");
bpf_dtab[minor(dev)] = NULL;
lck_mtx_unlock(bpf_mlock);
return ENOMEM;
}
bpf_acquire_d(d);
d->bd_bufsize = bpf_bufsize;
d->bd_sig = SIGIO;
d->bd_seesent = 1;
d->bd_oflags = flags;
d->bd_state = BPF_IDLE;
d->bd_traffic_class = SO_TC_BE;
d->bd_flags |= BPF_DETACHED;
if (bpf_wantpktap)
d->bd_flags |= BPF_WANT_PKTAP;
else
d->bd_flags &= ~BPF_WANT_PKTAP;
d->bd_thread_call = thread_call_allocate(bpf_timed_out, d);
if (d->bd_thread_call == NULL) {
printf("bpfopen: malloc thread call failed\n");
bpf_dtab[minor(dev)] = NULL;
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
return (ENOMEM);
}
#if CONFIG_MACF_NET
mac_bpfdesc_label_init(d);
mac_bpfdesc_label_associate(kauth_cred_get(), d);
#endif
bpf_dtab[minor(dev)] = d;
lck_mtx_unlock(bpf_mlock);
return (0);
}
int
bpfclose(dev_t dev, __unused int flags, __unused int fmt,
__unused struct proc *p)
{
struct bpf_d *d;
lck_mtx_lock(bpf_mlock);
d = bpf_dtab[minor(dev)];
if (d == 0 || d == (void *)1) {
lck_mtx_unlock(bpf_mlock);
return (ENXIO);
}
d->bd_flags |= BPF_CLOSING;
if (bpf_debug != 0)
printf("%s: %llx\n",
__func__, (uint64_t)VM_KERNEL_ADDRPERM(d));
bpf_dtab[minor(dev)] = (void *)1;
switch (d->bd_state) {
case BPF_IDLE:
break;
case BPF_WAITING:
if (!bpf_stop_timer(d)) {
d->bd_state = BPF_DRAINING;
while (d->bd_state == BPF_DRAINING)
msleep((caddr_t)d, bpf_mlock, PRINET,
"bpfdraining", NULL);
}
d->bd_state = BPF_IDLE;
break;
case BPF_TIMED_OUT:
d->bd_state = BPF_IDLE;
break;
case BPF_DRAINING:
panic("Two threads blocked in a BPF close");
break;
}
if (d->bd_bif)
bpf_detachd(d, 1);
selthreadclear(&d->bd_sel);
#if CONFIG_MACF_NET
mac_bpfdesc_label_destroy(d);
#endif
thread_call_free(d->bd_thread_call);
while (d->bd_hbuf_read)
msleep((caddr_t)d, bpf_mlock, PRINET, "bpf_reading", NULL);
bpf_freed(d);
bpf_dtab[minor(dev)] = NULL;
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
return (0);
}
#define BPF_SLEEP bpf_sleep
static int
bpf_sleep(struct bpf_d *d, int pri, const char *wmesg, int timo)
{
u_int64_t abstime = 0;
if(timo)
clock_interval_to_deadline(timo, NSEC_PER_SEC / hz, &abstime);
return msleep1((caddr_t)d, bpf_mlock, pri, wmesg, abstime);
}
#define ROTATE_BUFFERS(d) \
if (d->bd_hbuf_read) \
panic("rotating bpf buffers during read"); \
(d)->bd_hbuf = (d)->bd_sbuf; \
(d)->bd_hlen = (d)->bd_slen; \
(d)->bd_hcnt = (d)->bd_scnt; \
(d)->bd_sbuf = (d)->bd_fbuf; \
(d)->bd_slen = 0; \
(d)->bd_scnt = 0; \
(d)->bd_fbuf = NULL;
int
bpfread(dev_t dev, struct uio *uio, int ioflag)
{
struct bpf_d *d;
caddr_t hbuf;
int timed_out, hbuf_len;
int error;
int flags;
lck_mtx_lock(bpf_mlock);
d = bpf_dtab[minor(dev)];
if (d == 0 || d == (void *)1 || (d->bd_flags & BPF_CLOSING) != 0) {
lck_mtx_unlock(bpf_mlock);
return (ENXIO);
}
bpf_acquire_d(d);
if (uio_resid(uio) != d->bd_bufsize) {
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
return (EINVAL);
}
if (d->bd_state == BPF_WAITING)
bpf_stop_timer(d);
timed_out = (d->bd_state == BPF_TIMED_OUT);
d->bd_state = BPF_IDLE;
while (d->bd_hbuf_read)
msleep((caddr_t)d, bpf_mlock, PRINET, "bpf_reading", NULL);
if ((d->bd_flags & BPF_CLOSING) != 0) {
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
return (ENXIO);
}
while (d->bd_hbuf == 0) {
if ((d->bd_immediate || timed_out || (ioflag & IO_NDELAY))
&& d->bd_slen != 0) {
ROTATE_BUFFERS(d);
break;
}
if (d->bd_bif == NULL) {
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
return (ENXIO);
}
if (ioflag & IO_NDELAY) {
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
return (EWOULDBLOCK);
}
error = BPF_SLEEP(d, PRINET|PCATCH, "bpf",
d->bd_rtout);
if ((d->bd_flags & BPF_CLOSING) != 0) {
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
return (ENXIO);
}
while (d->bd_hbuf_read)
msleep((caddr_t)d, bpf_mlock, PRINET, "bpf_reading", NULL);
if ((d->bd_flags & BPF_CLOSING) != 0) {
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
return (ENXIO);
}
if (error == EINTR || error == ERESTART) {
if (d->bd_hbuf != NULL) {
break;
}
if (d->bd_slen != 0) {
ROTATE_BUFFERS(d);
break;
}
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
if (error == ERESTART) {
printf("%s: %llx ERESTART to EINTR\n",
__func__, (uint64_t)VM_KERNEL_ADDRPERM(d));
error = EINTR;
}
return (error);
}
if (error == EWOULDBLOCK) {
if (d->bd_hbuf)
break;
if (d->bd_slen == 0) {
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
return (0);
}
ROTATE_BUFFERS(d);
break;
}
}
d->bd_hbuf_read = 1;
hbuf = d->bd_hbuf;
hbuf_len = d->bd_hlen;
flags = d->bd_flags;
lck_mtx_unlock(bpf_mlock);
#ifdef __APPLE__
if (flags & BPF_EXTENDED_HDR) {
char *p;
p = hbuf;
while (p < hbuf + hbuf_len) {
struct bpf_hdr_ext *ehp;
uint32_t flowid;
struct so_procinfo soprocinfo;
int found = 0;
ehp = (struct bpf_hdr_ext *)(void *)p;
if ((flowid = ehp->bh_flowid)) {
if (ehp->bh_proto == IPPROTO_TCP)
found = inp_findinpcb_procinfo(&tcbinfo,
flowid, &soprocinfo);
else if (ehp->bh_proto == IPPROTO_UDP)
found = inp_findinpcb_procinfo(&udbinfo,
flowid, &soprocinfo);
if (found == 1) {
ehp->bh_pid = soprocinfo.spi_pid;
proc_name(ehp->bh_pid, ehp->bh_comm, MAXCOMLEN);
}
ehp->bh_flowid = 0;
}
if (flags & BPF_FINALIZE_PKTAP) {
struct pktap_header *pktaphdr;
pktaphdr = (struct pktap_header *)(void *)
(p + BPF_WORDALIGN(ehp->bh_hdrlen));
if (pktaphdr->pth_flags & PTH_FLAG_DELAY_PKTAP)
pktap_finalize_proc_info(pktaphdr);
if (pktaphdr->pth_flags & PTH_FLAG_TSTAMP) {
ehp->bh_tstamp.tv_sec =
pktaphdr->pth_tstamp.tv_sec;
ehp->bh_tstamp.tv_usec =
pktaphdr->pth_tstamp.tv_usec;
}
}
p += BPF_WORDALIGN(ehp->bh_hdrlen + ehp->bh_caplen);
}
} else if (flags & BPF_FINALIZE_PKTAP) {
char *p;
p = hbuf;
while (p < hbuf + hbuf_len) {
struct bpf_hdr *hp;
struct pktap_header *pktaphdr;
hp = (struct bpf_hdr *)(void *)p;
pktaphdr = (struct pktap_header *)(void *)
(p + BPF_WORDALIGN(hp->bh_hdrlen));
if (pktaphdr->pth_flags & PTH_FLAG_DELAY_PKTAP)
pktap_finalize_proc_info(pktaphdr);
if (pktaphdr->pth_flags & PTH_FLAG_TSTAMP) {
hp->bh_tstamp.tv_sec =
pktaphdr->pth_tstamp.tv_sec;
hp->bh_tstamp.tv_usec =
pktaphdr->pth_tstamp.tv_usec;
}
p += BPF_WORDALIGN(hp->bh_hdrlen + hp->bh_caplen);
}
}
#endif
error = UIOMOVE(hbuf, hbuf_len, UIO_READ, uio);
lck_mtx_lock(bpf_mlock);
if ((d->bd_flags & BPF_CLOSING) != 0) {
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
return (ENXIO);
}
d->bd_hbuf_read = 0;
d->bd_fbuf = d->bd_hbuf;
d->bd_hbuf = NULL;
d->bd_hlen = 0;
d->bd_hcnt = 0;
wakeup((caddr_t)d);
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
return (error);
}
static void
bpf_wakeup(struct bpf_d *d)
{
if (d->bd_state == BPF_WAITING) {
bpf_stop_timer(d);
d->bd_state = BPF_IDLE;
}
wakeup((caddr_t)d);
if (d->bd_async && d->bd_sig && d->bd_sigio)
pgsigio(d->bd_sigio, d->bd_sig);
selwakeup(&d->bd_sel);
if ((d->bd_flags & BPF_KNOTE))
KNOTE(&d->bd_sel.si_note, 1);
}
static void
bpf_timed_out(void *arg, __unused void *dummy)
{
struct bpf_d *d = (struct bpf_d *)arg;
lck_mtx_lock(bpf_mlock);
if (d->bd_state == BPF_WAITING) {
d->bd_state = BPF_TIMED_OUT;
if (d->bd_slen != 0)
bpf_wakeup(d);
} else if (d->bd_state == BPF_DRAINING) {
d->bd_state = BPF_IDLE;
bpf_wakeup(d);
}
lck_mtx_unlock(bpf_mlock);
}
#define MAX_DATALINK_HDR_LEN (sizeof(struct firewire_header))
int
bpfwrite(dev_t dev, struct uio *uio, __unused int ioflag)
{
struct bpf_d *d;
struct ifnet *ifp;
struct mbuf *m = NULL;
int error;
char dst_buf[SOCKADDR_HDR_LEN + MAX_DATALINK_HDR_LEN];
int datlen = 0;
int bif_dlt;
int bd_hdrcmplt;
lck_mtx_lock(bpf_mlock);
d = bpf_dtab[minor(dev)];
if (d == 0 || d == (void *)1 || (d->bd_flags & BPF_CLOSING) != 0) {
lck_mtx_unlock(bpf_mlock);
return (ENXIO);
}
bpf_acquire_d(d);
if (d->bd_bif == 0) {
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
return (ENXIO);
}
ifp = d->bd_bif->bif_ifp;
if ((ifp->if_flags & IFF_UP) == 0) {
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
return (ENETDOWN);
}
if (uio_resid(uio) == 0) {
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
return (0);
}
((struct sockaddr *)dst_buf)->sa_len = sizeof(dst_buf);
bif_dlt = (int)d->bd_bif->bif_dlt;
bd_hdrcmplt = d->bd_hdrcmplt;
lck_mtx_unlock(bpf_mlock);
error = bpf_movein(uio, bif_dlt, &m,
bd_hdrcmplt ? NULL : (struct sockaddr *)dst_buf,
&datlen);
lck_mtx_lock(bpf_mlock);
if (error) {
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
return (error);
}
if ((d->bd_flags & BPF_CLOSING) != 0) {
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
m_freem(m);
return (ENXIO);
}
if (d->bd_bif == NULL) {
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
m_free(m);
return (ENXIO);
}
if ((unsigned)datlen > ifp->if_mtu) {
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
m_freem(m);
return (EMSGSIZE);
}
#if CONFIG_MACF_NET
mac_mbuf_label_associate_bpfdesc(d, m);
#endif
bpf_set_packet_service_class(m, d->bd_traffic_class);
lck_mtx_unlock(bpf_mlock);
if (d->bd_hdrcmplt) {
if (d->bd_bif->bif_send)
error = d->bd_bif->bif_send(ifp, d->bd_bif->bif_dlt, m);
else
error = dlil_output(ifp, 0, m, NULL, NULL, 1, NULL);
} else {
error = dlil_output(ifp, PF_INET, m, NULL,
(struct sockaddr *)dst_buf, 0, NULL);
}
lck_mtx_lock(bpf_mlock);
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
return (error);
}
static void
reset_d(struct bpf_d *d)
{
if (d->bd_hbuf_read)
panic("resetting buffers during read");
if (d->bd_hbuf) {
d->bd_fbuf = d->bd_hbuf;
d->bd_hbuf = NULL;
}
d->bd_slen = 0;
d->bd_hlen = 0;
d->bd_scnt = 0;
d->bd_hcnt = 0;
d->bd_rcount = 0;
d->bd_dcount = 0;
}
int
bpfioctl(dev_t dev, u_long cmd, caddr_t addr, __unused int flags,
struct proc *p)
{
struct bpf_d *d;
int error = 0;
u_int int_arg;
struct ifreq ifr;
lck_mtx_lock(bpf_mlock);
d = bpf_dtab[minor(dev)];
if (d == 0 || d == (void *)1 || (d->bd_flags & BPF_CLOSING) != 0) {
lck_mtx_unlock(bpf_mlock);
return (ENXIO);
}
bpf_acquire_d(d);
if (d->bd_state == BPF_WAITING)
bpf_stop_timer(d);
d->bd_state = BPF_IDLE;
switch (cmd) {
default:
error = EINVAL;
break;
case FIONREAD:
{
int n;
n = d->bd_slen;
if (d->bd_hbuf && d->bd_hbuf_read == 0)
n += d->bd_hlen;
bcopy(&n, addr, sizeof (n));
break;
}
case SIOCGIFADDR:
{
struct ifnet *ifp;
if (d->bd_bif == 0)
error = EINVAL;
else {
ifp = d->bd_bif->bif_ifp;
error = ifnet_ioctl(ifp, 0, cmd, addr);
}
break;
}
case BIOCGBLEN:
bcopy(&d->bd_bufsize, addr, sizeof (u_int));
break;
case BIOCSBLEN:
if (d->bd_bif != 0 || (d->bd_flags & BPF_DETACHING))
error = EINVAL;
else {
u_int size;
bcopy(addr, &size, sizeof (size));
if (d->bd_headdrop != 0 && size > 2 * bpf_maxbufsize)
size = 2 * bpf_maxbufsize;
else if (size > bpf_maxbufsize)
size = bpf_maxbufsize;
else if (size < BPF_MINBUFSIZE)
size = BPF_MINBUFSIZE;
bcopy(&size, addr, sizeof (size));
d->bd_bufsize = size;
}
break;
case BIOCSETF32:
case BIOCSETFNR32: {
struct bpf_program32 prg32;
bcopy(addr, &prg32, sizeof (prg32));
error = bpf_setf(d, prg32.bf_len,
CAST_USER_ADDR_T(prg32.bf_insns), cmd);
break;
}
case BIOCSETF64:
case BIOCSETFNR64: {
struct bpf_program64 prg64;
bcopy(addr, &prg64, sizeof (prg64));
error = bpf_setf(d, prg64.bf_len, prg64.bf_insns, cmd);
break;
}
case BIOCFLUSH:
while (d->bd_hbuf_read) {
msleep((caddr_t)d, bpf_mlock, PRINET, "bpf_reading", NULL);
}
if ((d->bd_flags & BPF_CLOSING) != 0) {
error = ENXIO;
break;
}
reset_d(d);
break;
case BIOCPROMISC:
if (d->bd_bif == 0) {
error = EINVAL;
break;
}
if (d->bd_promisc == 0) {
lck_mtx_unlock(bpf_mlock);
error = ifnet_set_promiscuous(d->bd_bif->bif_ifp, 1);
lck_mtx_lock(bpf_mlock);
if (error == 0)
d->bd_promisc = 1;
}
break;
case BIOCGDLT:
if (d->bd_bif == 0)
error = EINVAL;
else
bcopy(&d->bd_bif->bif_dlt, addr, sizeof (u_int));
break;
case BIOCGDLTLIST:
if (d->bd_bif == NULL) {
error = EINVAL;
} else {
error = bpf_getdltlist(d, addr, p);
}
break;
case BIOCSDLT:
if (d->bd_bif == NULL) {
error = EINVAL;
} else {
u_int dlt;
bcopy(addr, &dlt, sizeof (dlt));
if (dlt == DLT_PKTAP && !(d->bd_flags & BPF_WANT_PKTAP)) {
printf("BIOCSDLT downgrade DLT_PKTAP to DLT_RAW\n");
dlt = DLT_RAW;
}
error = bpf_setdlt(d, dlt);
}
break;
case BIOCGETIF:
if (d->bd_bif == 0)
error = EINVAL;
else {
struct ifnet *const ifp = d->bd_bif->bif_ifp;
snprintf(((struct ifreq *)(void *)addr)->ifr_name,
sizeof (ifr.ifr_name), "%s", if_name(ifp));
}
break;
case BIOCSETIF: {
ifnet_t ifp;
bcopy(addr, &ifr, sizeof (ifr));
ifr.ifr_name[IFNAMSIZ - 1] = '\0';
ifp = ifunit(ifr.ifr_name);
if (ifp == NULL)
error = ENXIO;
else
error = bpf_setif(d, ifp);
break;
}
case BIOCSRTIMEOUT32: {
struct user32_timeval _tv;
struct timeval tv;
bcopy(addr, &_tv, sizeof (_tv));
tv.tv_sec = _tv.tv_sec;
tv.tv_usec = _tv.tv_usec;
if ((error = itimerfix(&tv)) == 0)
d->bd_rtout = tvtohz(&tv) - 1;
break;
}
case BIOCSRTIMEOUT64: {
struct user64_timeval _tv;
struct timeval tv;
bcopy(addr, &_tv, sizeof (_tv));
tv.tv_sec = _tv.tv_sec;
tv.tv_usec = _tv.tv_usec;
if ((error = itimerfix(&tv)) == 0)
d->bd_rtout = tvtohz(&tv) - 1;
break;
}
case BIOCGRTIMEOUT32: {
struct user32_timeval tv;
bzero(&tv, sizeof (tv));
tv.tv_sec = d->bd_rtout / hz;
tv.tv_usec = (d->bd_rtout % hz) * tick;
bcopy(&tv, addr, sizeof (tv));
break;
}
case BIOCGRTIMEOUT64: {
struct user64_timeval tv;
bzero(&tv, sizeof (tv));
tv.tv_sec = d->bd_rtout / hz;
tv.tv_usec = (d->bd_rtout % hz) * tick;
bcopy(&tv, addr, sizeof (tv));
break;
}
case BIOCGSTATS: {
struct bpf_stat bs;
bzero(&bs, sizeof (bs));
bs.bs_recv = d->bd_rcount;
bs.bs_drop = d->bd_dcount;
bcopy(&bs, addr, sizeof (bs));
break;
}
case BIOCIMMEDIATE:
d->bd_immediate = *(u_int *)(void *)addr;
break;
case BIOCVERSION: {
struct bpf_version bv;
bzero(&bv, sizeof (bv));
bv.bv_major = BPF_MAJOR_VERSION;
bv.bv_minor = BPF_MINOR_VERSION;
bcopy(&bv, addr, sizeof (bv));
break;
}
case BIOCGHDRCMPLT:
bcopy(&d->bd_hdrcmplt, addr, sizeof (u_int));
break;
case BIOCSHDRCMPLT:
bcopy(addr, &int_arg, sizeof (int_arg));
d->bd_hdrcmplt = int_arg ? 1 : 0;
break;
case BIOCGSEESENT:
bcopy(&d->bd_seesent, addr, sizeof (u_int));
break;
case BIOCSSEESENT:
bcopy(addr, &d->bd_seesent, sizeof (u_int));
break;
case BIOCSETTC: {
int tc;
bcopy(addr, &tc, sizeof (int));
error = bpf_set_traffic_class(d, tc);
break;
}
case BIOCGETTC:
bcopy(&d->bd_traffic_class, addr, sizeof (int));
break;
case FIONBIO:
break;
case FIOASYNC:
bcopy(addr, &d->bd_async, sizeof (int));
break;
#ifndef __APPLE__
case FIOSETOWN:
error = fsetown(*(int *)addr, &d->bd_sigio);
break;
case FIOGETOWN:
*(int *)addr = fgetown(d->bd_sigio);
break;
case TIOCSPGRP:
error = fsetown(-(*(int *)addr), &d->bd_sigio);
break;
case TIOCGPGRP:
*(int *)addr = -fgetown(d->bd_sigio);
break;
#endif
case BIOCSRSIG: {
u_int sig;
bcopy(addr, &sig, sizeof (u_int));
if (sig >= NSIG)
error = EINVAL;
else
d->bd_sig = sig;
break;
}
case BIOCGRSIG:
bcopy(&d->bd_sig, addr, sizeof (u_int));
break;
#ifdef __APPLE__
case BIOCSEXTHDR:
bcopy(addr, &int_arg, sizeof (int_arg));
if (int_arg)
d->bd_flags |= BPF_EXTENDED_HDR;
else
d->bd_flags &= ~BPF_EXTENDED_HDR;
break;
case BIOCGIFATTACHCOUNT: {
ifnet_t ifp;
struct bpf_if *bp;
bcopy(addr, &ifr, sizeof (ifr));
ifr.ifr_name[IFNAMSIZ - 1] = '\0';
ifp = ifunit(ifr.ifr_name);
if (ifp == NULL) {
error = ENXIO;
break;
}
ifr.ifr_intval = 0;
for (bp = bpf_iflist; bp != 0; bp = bp->bif_next) {
struct bpf_d *bpf_d;
if (bp->bif_ifp == NULL || bp->bif_ifp != ifp)
continue;
for (bpf_d = bp->bif_dlist; bpf_d; bpf_d = bpf_d->bd_next) {
ifr.ifr_intval += 1;
}
}
bcopy(&ifr, addr, sizeof (ifr));
break;
}
case BIOCGWANTPKTAP:
int_arg = d->bd_flags & BPF_WANT_PKTAP ? 1 : 0;
bcopy(&int_arg, addr, sizeof (int_arg));
break;
case BIOCSWANTPKTAP:
bcopy(addr, &int_arg, sizeof (int_arg));
if (int_arg)
d->bd_flags |= BPF_WANT_PKTAP;
else
d->bd_flags &= ~BPF_WANT_PKTAP;
break;
#endif
case BIOCSHEADDROP:
bcopy(addr, &int_arg, sizeof (int_arg));
d->bd_headdrop = int_arg ? 1 : 0;
break;
case BIOCGHEADDROP:
bcopy(&d->bd_headdrop, addr, sizeof (int));
break;
}
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
return (error);
}
static int
bpf_setf(struct bpf_d *d, u_int bf_len, user_addr_t bf_insns,
u_long cmd)
{
struct bpf_insn *fcode, *old;
u_int flen, size;
while (d->bd_hbuf_read)
msleep((caddr_t)d, bpf_mlock, PRINET, "bpf_reading", NULL);
if ((d->bd_flags & BPF_CLOSING) != 0)
return (ENXIO);
old = d->bd_filter;
if (bf_insns == USER_ADDR_NULL) {
if (bf_len != 0)
return (EINVAL);
d->bd_filter = NULL;
reset_d(d);
if (old != 0)
FREE((caddr_t)old, M_DEVBUF);
return (0);
}
flen = bf_len;
if (flen > BPF_MAXINSNS)
return (EINVAL);
size = flen * sizeof(struct bpf_insn);
fcode = (struct bpf_insn *) _MALLOC(size, M_DEVBUF, M_WAIT);
#ifdef __APPLE__
if (fcode == NULL)
return (ENOBUFS);
#endif
if (copyin(bf_insns, (caddr_t)fcode, size) == 0 &&
bpf_validate(fcode, (int)flen)) {
d->bd_filter = fcode;
if (cmd == BIOCSETF32 || cmd == BIOCSETF64)
reset_d(d);
if (old != 0)
FREE((caddr_t)old, M_DEVBUF);
return (0);
}
FREE((caddr_t)fcode, M_DEVBUF);
return (EINVAL);
}
static int
bpf_setif(struct bpf_d *d, ifnet_t theywant)
{
struct bpf_if *bp;
int error;
while (d->bd_hbuf_read)
msleep((caddr_t)d, bpf_mlock, PRINET, "bpf_reading", NULL);
if ((d->bd_flags & BPF_CLOSING) != 0)
return (ENXIO);
for (bp = bpf_iflist; bp != 0; bp = bp->bif_next) {
struct ifnet *ifp = bp->bif_ifp;
if (ifp == 0 || ifp != theywant)
continue;
if (bp->bif_dlt == DLT_PKTAP && !(d->bd_flags & BPF_WANT_PKTAP))
continue;
if (!intcoproc_unrestricted && IFNET_IS_INTCOPROC(ifp))
continue;
error = bpf_allocbufs(d);
if (error != 0)
return (error);
if (bp != d->bd_bif) {
if (d->bd_bif != NULL) {
if (bpf_detachd(d, 0) != 0)
return (ENXIO);
}
if (bpf_attachd(d, bp) != 0)
return (ENXIO);
}
reset_d(d);
return (0);
}
return (ENXIO);
}
static int
bpf_getdltlist(struct bpf_d *d, caddr_t addr, struct proc *p)
{
u_int n;
int error;
struct ifnet *ifp;
struct bpf_if *bp;
user_addr_t dlist;
struct bpf_dltlist bfl;
bcopy(addr, &bfl, sizeof (bfl));
if (proc_is64bit(p)) {
dlist = (user_addr_t)bfl.bfl_u.bflu_pad;
} else {
dlist = CAST_USER_ADDR_T(bfl.bfl_u.bflu_list);
}
ifp = d->bd_bif->bif_ifp;
n = 0;
error = 0;
for (bp = bpf_iflist; bp; bp = bp->bif_next) {
if (bp->bif_ifp != ifp)
continue;
if (bp->bif_dlt == DLT_PKTAP && !(d->bd_flags & BPF_WANT_PKTAP))
continue;
if (dlist != USER_ADDR_NULL) {
if (n >= bfl.bfl_len) {
return (ENOMEM);
}
error = copyout(&bp->bif_dlt, dlist,
sizeof (bp->bif_dlt));
if (error != 0)
break;
dlist += sizeof (bp->bif_dlt);
}
n++;
}
bfl.bfl_len = n;
bcopy(&bfl, addr, sizeof (bfl));
return (error);
}
static int
bpf_setdlt(struct bpf_d *d, uint32_t dlt)
{
int error, opromisc;
struct ifnet *ifp;
struct bpf_if *bp;
if (d->bd_bif->bif_dlt == dlt)
return (0);
while (d->bd_hbuf_read)
msleep((caddr_t)d, bpf_mlock, PRINET, "bpf_reading", NULL);
if ((d->bd_flags & BPF_CLOSING) != 0)
return (ENXIO);
ifp = d->bd_bif->bif_ifp;
for (bp = bpf_iflist; bp; bp = bp->bif_next) {
if (bp->bif_ifp == ifp && bp->bif_dlt == dlt) {
if (bp->bif_dlt == DLT_PKTAP && !(d->bd_flags & BPF_WANT_PKTAP)) {
continue;
}
break;
}
}
if (bp != NULL) {
opromisc = d->bd_promisc;
if (bpf_detachd(d, 0) != 0)
return (ENXIO);
error = bpf_attachd(d, bp);
if (error) {
printf("bpf_setdlt: bpf_attachd %s%d failed (%d)\n",
ifnet_name(bp->bif_ifp), ifnet_unit(bp->bif_ifp), error);
return error;
}
reset_d(d);
if (opromisc) {
lck_mtx_unlock(bpf_mlock);
error = ifnet_set_promiscuous(bp->bif_ifp, 1);
lck_mtx_lock(bpf_mlock);
if (error) {
printf("%s: ifpromisc %s%d failed (%d)\n",
__func__, ifnet_name(bp->bif_ifp),
ifnet_unit(bp->bif_ifp), error);
} else {
d->bd_promisc = 1;
}
}
}
return (bp == NULL ? EINVAL : 0);
}
static int
bpf_set_traffic_class(struct bpf_d *d, int tc)
{
int error = 0;
if (!SO_VALID_TC(tc))
error = EINVAL;
else
d->bd_traffic_class = tc;
return (error);
}
static void
bpf_set_packet_service_class(struct mbuf *m, int tc)
{
if (!(m->m_flags & M_PKTHDR))
return;
VERIFY(SO_VALID_TC(tc));
(void) m_set_service_class(m, so_tc2msc(tc));
}
int
bpfselect(dev_t dev, int which, void * wql, struct proc *p)
{
struct bpf_d *d;
int ret = 0;
lck_mtx_lock(bpf_mlock);
d = bpf_dtab[minor(dev)];
if (d == 0 || d == (void *)1 || (d->bd_flags & BPF_CLOSING) != 0) {
lck_mtx_unlock(bpf_mlock);
return (ENXIO);
}
bpf_acquire_d(d);
if (d->bd_bif == NULL) {
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
return (ENXIO);
}
while (d->bd_hbuf_read)
msleep((caddr_t)d, bpf_mlock, PRINET, "bpf_reading", NULL);
if ((d->bd_flags & BPF_CLOSING) != 0) {
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
return (ENXIO);
}
switch (which) {
case FREAD:
if (d->bd_hlen != 0 ||
((d->bd_immediate || d->bd_state == BPF_TIMED_OUT) &&
d->bd_slen != 0))
ret = 1;
else {
selrecord(p, &d->bd_sel, wql);
bpf_start_timer(d);
}
break;
case FWRITE:
ret = 1;
break;
}
bpf_release_d(d);
lck_mtx_unlock(bpf_mlock);
return (ret);
}
int bpfkqfilter(dev_t dev, struct knote *kn);
static void filt_bpfdetach(struct knote *);
static int filt_bpfread(struct knote *, long);
static int filt_bpftouch(struct knote *kn, struct kevent_internal_s *kev);
static int filt_bpfprocess(struct knote *kn, struct filt_process_s *data, struct kevent_internal_s *kev);
SECURITY_READ_ONLY_EARLY(struct filterops) bpfread_filtops = {
.f_isfd = 1,
.f_detach = filt_bpfdetach,
.f_event = filt_bpfread,
.f_touch = filt_bpftouch,
.f_process = filt_bpfprocess,
};
static int
filt_bpfread_common(struct knote *kn, struct bpf_d *d)
{
int ready = 0;
if (d->bd_immediate) {
kn->kn_data = ((d->bd_hlen == 0 || d->bd_hbuf_read)
? d->bd_slen : d->bd_hlen);
int64_t lowwat = 1;
if (kn->kn_sfflags & NOTE_LOWAT)
{
if (kn->kn_sdata > d->bd_bufsize)
lowwat = d->bd_bufsize;
else if (kn->kn_sdata > lowwat)
lowwat = kn->kn_sdata;
}
ready = (kn->kn_data >= lowwat);
} else {
kn->kn_data = ((d->bd_hlen == 0 || d->bd_hbuf_read) && d->bd_state == BPF_TIMED_OUT ?
d->bd_slen : d->bd_hlen);
ready = (kn->kn_data > 0);
}
if (!ready)
bpf_start_timer(d);
return (ready);
}
int
bpfkqfilter(dev_t dev, struct knote *kn)
{
struct bpf_d *d;
int res;
if (major(dev) != CDEV_MAJOR ||
kn->kn_filter != EVFILT_READ) {
kn->kn_flags = EV_ERROR;
kn->kn_data = EINVAL;
return 0;
}
lck_mtx_lock(bpf_mlock);
d = bpf_dtab[minor(dev)];
if (d == 0 ||
d == (void *)1 ||
d->bd_bif == NULL ||
(d->bd_flags & BPF_CLOSING) != 0) {
lck_mtx_unlock(bpf_mlock);
kn->kn_flags = EV_ERROR;
kn->kn_data = ENXIO;
return 0;
}
kn->kn_hook = d;
kn->kn_filtid = EVFILTID_BPFREAD;
KNOTE_ATTACH(&d->bd_sel.si_note, kn);
d->bd_flags |= BPF_KNOTE;
res = filt_bpfread_common(kn, d);
lck_mtx_unlock(bpf_mlock);
return (res);
}
static void
filt_bpfdetach(struct knote *kn)
{
struct bpf_d *d = (struct bpf_d *)kn->kn_hook;
lck_mtx_lock(bpf_mlock);
if (d->bd_flags & BPF_KNOTE) {
KNOTE_DETACH(&d->bd_sel.si_note, kn);
d->bd_flags &= ~BPF_KNOTE;
}
lck_mtx_unlock(bpf_mlock);
}
static int
filt_bpfread(struct knote *kn, long hint)
{
#pragma unused(hint)
struct bpf_d *d = (struct bpf_d *)kn->kn_hook;
return filt_bpfread_common(kn, d);
}
static int
filt_bpftouch(struct knote *kn, struct kevent_internal_s *kev)
{
struct bpf_d *d = (struct bpf_d *)kn->kn_hook;
int res;
lck_mtx_lock(bpf_mlock);
kn->kn_sdata = kev->data;
kn->kn_sfflags = kev->fflags;
if ((kn->kn_status & KN_UDATA_SPECIFIC) == 0)
kn->kn_udata = kev->udata;
res = filt_bpfread_common(kn, d);
lck_mtx_unlock(bpf_mlock);
return res;
}
static int
filt_bpfprocess(struct knote *kn, struct filt_process_s *data, struct kevent_internal_s *kev)
{
#pragma unused(data)
struct bpf_d *d = (struct bpf_d *)kn->kn_hook;
int res;
lck_mtx_lock(bpf_mlock);
res = filt_bpfread_common(kn, d);
if (res) {
*kev = kn->kn_kevent;
}
lck_mtx_unlock(bpf_mlock);
return res;
}
static void
bpf_mcopy(struct mbuf * m, void *dst_arg, size_t len)
{
u_int count;
u_char *dst;
dst = dst_arg;
while (len > 0) {
if (m == 0)
panic("bpf_mcopy");
count = min(m->m_len, len);
bcopy(mbuf_data(m), dst, count);
m = m->m_next;
dst += count;
len -= count;
}
}
static inline void
bpf_tap_imp(
ifnet_t ifp,
u_int32_t dlt,
struct bpf_packet *bpf_pkt,
int outbound)
{
struct bpf_d *d;
u_int slen;
struct bpf_if *bp;
lck_mtx_lock(bpf_mlock);
if (ifp->if_bpf == NULL) {
lck_mtx_unlock(bpf_mlock);
return;
}
for (bp = ifp->if_bpf; bp != NULL; bp = bp->bif_next) {
if (bp->bif_ifp != ifp) {
bp = NULL;
break;
}
if (dlt == 0 || bp->bif_dlt == dlt) {
break;
}
}
if (bp == NULL) {
goto done;
}
for (d = bp->bif_dlist; d; d = d->bd_next) {
if (outbound && !d->bd_seesent)
continue;
++d->bd_rcount;
slen = bpf_filter(d->bd_filter, (u_char *)bpf_pkt,
bpf_pkt->bpfp_total_length, 0);
if (slen != 0) {
#if CONFIG_MACF_NET
if (mac_bpfdesc_check_receive(d, bp->bif_ifp) != 0)
continue;
#endif
catchpacket(d, bpf_pkt, slen, outbound);
}
}
done:
lck_mtx_unlock(bpf_mlock);
}
static inline void
bpf_tap_mbuf(
ifnet_t ifp,
u_int32_t dlt,
mbuf_t m,
void* hdr,
size_t hlen,
int outbound)
{
struct bpf_packet bpf_pkt;
struct mbuf *m0;
if (ifp->if_bpf == NULL) {
return;
}
bpf_pkt.bpfp_type = BPF_PACKET_TYPE_MBUF;
bpf_pkt.bpfp_mbuf = m;
bpf_pkt.bpfp_total_length = 0;
for (m0 = m; m0 != NULL; m0 = m0->m_next)
bpf_pkt.bpfp_total_length += m0->m_len;
bpf_pkt.bpfp_header = hdr;
if (hdr != NULL) {
bpf_pkt.bpfp_total_length += hlen;
bpf_pkt.bpfp_header_length = hlen;
} else {
bpf_pkt.bpfp_header_length = 0;
}
bpf_tap_imp(ifp, dlt, &bpf_pkt, outbound);
}
void
bpf_tap_out(
ifnet_t ifp,
u_int32_t dlt,
mbuf_t m,
void* hdr,
size_t hlen)
{
bpf_tap_mbuf(ifp, dlt, m, hdr, hlen, 1);
}
void
bpf_tap_in(
ifnet_t ifp,
u_int32_t dlt,
mbuf_t m,
void* hdr,
size_t hlen)
{
bpf_tap_mbuf(ifp, dlt, m, hdr, hlen, 0);
}
static int bpf_tap_callback(struct ifnet *ifp, struct mbuf *m)
{
bpf_tap_mbuf(ifp, 0, m, NULL, 0, mbuf_pkthdr_rcvif(m) == NULL);
return 0;
}
static void
copy_bpf_packet(struct bpf_packet * pkt, void * dst, size_t len)
{
if (pkt->bpfp_header_length != 0) {
size_t count = min(len, pkt->bpfp_header_length);
bcopy(pkt->bpfp_header, dst, count);
len -= count;
dst += count;
}
if (len == 0) {
return;
}
switch (pkt->bpfp_type) {
case BPF_PACKET_TYPE_MBUF:
bpf_mcopy(pkt->bpfp_mbuf, dst, len);
break;
default:
break;
}
}
static void
catchpacket(struct bpf_d *d, struct bpf_packet * pkt,
u_int snaplen, int outbound)
{
struct bpf_hdr *hp;
struct bpf_hdr_ext *ehp;
int totlen, curlen;
int hdrlen, caplen;
int do_wakeup = 0;
u_char *payload;
struct timeval tv;
hdrlen = (d->bd_flags & BPF_EXTENDED_HDR) ? d->bd_bif->bif_exthdrlen :
d->bd_bif->bif_hdrlen;
totlen = hdrlen + min(snaplen, pkt->bpfp_total_length);
if (totlen > d->bd_bufsize)
totlen = d->bd_bufsize;
if (hdrlen > totlen)
return;
curlen = BPF_WORDALIGN(d->bd_slen);
if (curlen + totlen > d->bd_bufsize) {
if (d->bd_hbuf_read) {
++d->bd_dcount;
return;
}
if (d->bd_fbuf == NULL) {
if (d->bd_headdrop == 0) {
++d->bd_dcount;
return;
}
d->bd_dcount += d->bd_hcnt;
d->bd_fbuf = d->bd_hbuf;
ROTATE_BUFFERS(d);
} else {
ROTATE_BUFFERS(d);
}
do_wakeup = 1;
curlen = 0;
}
else if (d->bd_immediate || d->bd_state == BPF_TIMED_OUT)
do_wakeup = 1;
microtime(&tv);
if (d->bd_flags & BPF_EXTENDED_HDR) {
struct mbuf *m;
m = (pkt->bpfp_type == BPF_PACKET_TYPE_MBUF)
? pkt->bpfp_mbuf : NULL;
ehp = (struct bpf_hdr_ext *)(void *)(d->bd_sbuf + curlen);
memset(ehp, 0, sizeof(*ehp));
ehp->bh_tstamp.tv_sec = tv.tv_sec;
ehp->bh_tstamp.tv_usec = tv.tv_usec;
ehp->bh_datalen = pkt->bpfp_total_length;
ehp->bh_hdrlen = hdrlen;
caplen = ehp->bh_caplen = totlen - hdrlen;
if (m == NULL) {
if (outbound) {
ehp->bh_flags |= BPF_HDR_EXT_FLAGS_DIR_OUT;
} else {
ehp->bh_flags |= BPF_HDR_EXT_FLAGS_DIR_IN;
}
} else if (outbound) {
ehp->bh_flags |= BPF_HDR_EXT_FLAGS_DIR_OUT;
if ((m->m_pkthdr.pkt_flags & (PKTF_FLOW_ID|
PKTF_FLOW_LOCALSRC|PKTF_FLOW_RAWSOCK)) ==
(PKTF_FLOW_ID|PKTF_FLOW_LOCALSRC) &&
m->m_pkthdr.pkt_flowsrc == FLOWSRC_INPCB) {
ehp->bh_flowid = m->m_pkthdr.pkt_flowid;
ehp->bh_proto = m->m_pkthdr.pkt_proto;
}
ehp->bh_svc = so_svc2tc(m->m_pkthdr.pkt_svc);
if (m->m_pkthdr.pkt_flags & PKTF_TCP_REXMT)
ehp->bh_pktflags |= BPF_PKTFLAGS_TCP_REXMT;
if (m->m_pkthdr.pkt_flags & PKTF_START_SEQ)
ehp->bh_pktflags |= BPF_PKTFLAGS_START_SEQ;
if (m->m_pkthdr.pkt_flags & PKTF_LAST_PKT)
ehp->bh_pktflags |= BPF_PKTFLAGS_LAST_PKT;
if (m->m_pkthdr.pkt_flags & PKTF_VALID_UNSENT_DATA) {
ehp->bh_unsent_bytes =
m->m_pkthdr.bufstatus_if;
ehp->bh_unsent_snd =
m->m_pkthdr.bufstatus_sndbuf;
}
} else
ehp->bh_flags |= BPF_HDR_EXT_FLAGS_DIR_IN;
payload = (u_char *)ehp + hdrlen;
} else {
hp = (struct bpf_hdr *)(void *)(d->bd_sbuf + curlen);
hp->bh_tstamp.tv_sec = tv.tv_sec;
hp->bh_tstamp.tv_usec = tv.tv_usec;
hp->bh_datalen = pkt->bpfp_total_length;
hp->bh_hdrlen = hdrlen;
caplen = hp->bh_caplen = totlen - hdrlen;
payload = (u_char *)hp + hdrlen;
}
copy_bpf_packet(pkt, payload, caplen);
d->bd_slen = curlen + totlen;
d->bd_scnt += 1;
if (do_wakeup)
bpf_wakeup(d);
}
static int
bpf_allocbufs(struct bpf_d *d)
{
if (d->bd_sbuf != NULL) {
FREE(d->bd_sbuf, M_DEVBUF);
d->bd_sbuf = NULL;
}
if (d->bd_hbuf != NULL) {
FREE(d->bd_hbuf, M_DEVBUF);
d->bd_hbuf = NULL;
}
if (d->bd_fbuf != NULL) {
FREE(d->bd_fbuf, M_DEVBUF);
d->bd_fbuf = NULL;
}
d->bd_fbuf = (caddr_t) _MALLOC(d->bd_bufsize, M_DEVBUF, M_WAIT);
if (d->bd_fbuf == NULL)
return (ENOBUFS);
d->bd_sbuf = (caddr_t) _MALLOC(d->bd_bufsize, M_DEVBUF, M_WAIT);
if (d->bd_sbuf == NULL) {
FREE(d->bd_fbuf, M_DEVBUF);
d->bd_fbuf = NULL;
return (ENOBUFS);
}
d->bd_slen = 0;
d->bd_hlen = 0;
d->bd_scnt = 0;
d->bd_hcnt = 0;
return (0);
}
static void
bpf_freed(struct bpf_d *d)
{
if (d->bd_hbuf_read)
panic("bpf buffer freed during read");
if (d->bd_sbuf != 0) {
FREE(d->bd_sbuf, M_DEVBUF);
if (d->bd_hbuf != 0)
FREE(d->bd_hbuf, M_DEVBUF);
if (d->bd_fbuf != 0)
FREE(d->bd_fbuf, M_DEVBUF);
}
if (d->bd_filter)
FREE((caddr_t)d->bd_filter, M_DEVBUF);
}
void
bpfattach(struct ifnet *ifp, u_int dlt, u_int hdrlen)
{
bpf_attach(ifp, dlt, hdrlen, NULL, NULL);
}
errno_t
bpf_attach(
ifnet_t ifp,
u_int32_t dlt,
u_int32_t hdrlen,
bpf_send_func send,
bpf_tap_func tap)
{
struct bpf_if *bp;
struct bpf_if *bp_new;
struct bpf_if *bp_before_first = NULL;
struct bpf_if *bp_first = NULL;
struct bpf_if *bp_last = NULL;
boolean_t found;
bp_new = (struct bpf_if *) _MALLOC(sizeof(*bp_new), M_DEVBUF,
M_WAIT | M_ZERO);
if (bp_new == 0)
panic("bpfattach");
lck_mtx_lock(bpf_mlock);
found = FALSE;
for (bp = bpf_iflist; bp != NULL; bp = bp->bif_next) {
if (bp->bif_ifp != ifp) {
if (bp_first != NULL) {
break;
}
bp_before_first = bp;
} else {
if (bp->bif_dlt == dlt) {
found = TRUE;
break;
}
if (bp_first == NULL) {
bp_first = bp;
}
bp_last = bp;
}
}
if (found) {
lck_mtx_unlock(bpf_mlock);
printf("bpfattach - %s with dlt %d is already attached\n",
if_name(ifp), dlt);
FREE(bp_new, M_DEVBUF);
return EEXIST;
}
bp_new->bif_ifp = ifp;
bp_new->bif_dlt = dlt;
bp_new->bif_send = send;
bp_new->bif_tap = tap;
if (bp_first == NULL) {
bp_new->bif_next = bpf_iflist;
bpf_iflist = bp_new;
}
else {
if (ifnet_type(ifp) == IFT_ETHER && dlt == DLT_EN10MB) {
if (bp_before_first != NULL) {
bp_before_first->bif_next = bp_new;
} else {
bpf_iflist = bp_new;
}
bp_new->bif_next = bp_first;
} else {
bp_new->bif_next = bp_last->bif_next;
bp_last->bif_next = bp_new;
}
}
bp_new->bif_hdrlen = BPF_WORDALIGN(hdrlen + SIZEOF_BPF_HDR) - hdrlen;
bp_new->bif_exthdrlen = BPF_WORDALIGN(hdrlen +
sizeof(struct bpf_hdr_ext)) - hdrlen;
ifnet_reference(ifp);
lck_mtx_unlock(bpf_mlock);
#ifndef __APPLE__
if (bootverbose)
printf("bpf: %s attached\n", if_name(ifp));
#endif
return 0;
}
void
bpfdetach(struct ifnet *ifp)
{
struct bpf_if *bp, *bp_prev, *bp_next;
struct bpf_d *d;
if (bpf_debug != 0)
printf("%s: %s\n", __func__, if_name(ifp));
lck_mtx_lock(bpf_mlock);
bp_prev = NULL;
for (bp = bpf_iflist; bp != NULL; bp = bp_next) {
bp_next = bp->bif_next;
if (ifp != bp->bif_ifp) {
bp_prev = bp;
continue;
}
if (bp_prev)
bp_prev->bif_next = bp->bif_next;
else
bpf_iflist = bp->bif_next;
while ((d = bp->bif_dlist) != NULL) {
bpf_acquire_d(d);
bpf_detachd(d, 0);
bpf_wakeup(d);
bpf_release_d(d);
}
ifnet_release(ifp);
}
lck_mtx_unlock(bpf_mlock);
}
void
bpf_init(__unused void *unused)
{
#ifdef __APPLE__
int i;
int maj;
if (bpf_devsw_installed == 0) {
bpf_devsw_installed = 1;
bpf_mlock_grp_attr = lck_grp_attr_alloc_init();
bpf_mlock_grp = lck_grp_alloc_init("bpf", bpf_mlock_grp_attr);
bpf_mlock_attr = lck_attr_alloc_init();
lck_mtx_init(bpf_mlock, bpf_mlock_grp, bpf_mlock_attr);
maj = cdevsw_add(CDEV_MAJOR, &bpf_cdevsw);
if (maj == -1) {
if (bpf_mlock_attr)
lck_attr_free(bpf_mlock_attr);
if (bpf_mlock_grp)
lck_grp_free(bpf_mlock_grp);
if (bpf_mlock_grp_attr)
lck_grp_attr_free(bpf_mlock_grp_attr);
bpf_mlock = NULL;
bpf_mlock_attr = NULL;
bpf_mlock_grp = NULL;
bpf_mlock_grp_attr = NULL;
bpf_devsw_installed = 0;
printf("bpf_init: failed to allocate a major number!\n");
return;
}
for (i = 0 ; i < NBPFILTER; i++)
bpf_make_dev_t(maj);
}
#else
cdevsw_add(&bpf_cdevsw);
#endif
}
#ifndef __APPLE__
SYSINIT(bpfdev,SI_SUB_DRIVERS,SI_ORDER_MIDDLE+CDEV_MAJOR,bpf_drvinit,NULL)
#endif
#if CONFIG_MACF_NET
struct label *
mac_bpfdesc_label_get(struct bpf_d *d)
{
return (d->bd_label);
}
void
mac_bpfdesc_label_set(struct bpf_d *d, struct label *label)
{
d->bd_label = label;
}
#endif