1*f933b737SSascha Wildner /*
2*f933b737SSascha Wildner * Copyright (C) 2011 Matteo Landi, Luigi Rizzo. All rights reserved.
3*f933b737SSascha Wildner * Copyright (C) 2013 Universita` di Pisa
4*f933b737SSascha Wildner *
5*f933b737SSascha Wildner * Redistribution and use in source and binary forms, with or without
6*f933b737SSascha Wildner * modification, are permitted provided that the following conditions
7*f933b737SSascha Wildner * are met:
8*f933b737SSascha Wildner *
9*f933b737SSascha Wildner * 1. Redistributions of source code must retain the above copyright
10*f933b737SSascha Wildner * notice, this list of conditions and the following disclaimer.
11*f933b737SSascha Wildner * 2. Redistributions in binary form must reproduce the above copyright
12*f933b737SSascha Wildner * notice, this list of conditions and the following disclaimer in the
13*f933b737SSascha Wildner * documentation and/or other materials provided with the distribution.
14*f933b737SSascha Wildner *
15*f933b737SSascha Wildner * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
16*f933b737SSascha Wildner * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17*f933b737SSascha Wildner * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
18*f933b737SSascha Wildner * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
19*f933b737SSascha Wildner * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20*f933b737SSascha Wildner * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
21*f933b737SSascha Wildner * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22*f933b737SSascha Wildner * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23*f933b737SSascha Wildner * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24*f933b737SSascha Wildner * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25*f933b737SSascha Wildner * SUCH DAMAGE.
26*f933b737SSascha Wildner */
27*f933b737SSascha Wildner
28*f933b737SSascha Wildner /*
29*f933b737SSascha Wildner * $FreeBSD$
30*f933b737SSascha Wildner *
31*f933b737SSascha Wildner * This header contains the macros used to manipulate netmap structures
32*f933b737SSascha Wildner * and packets in userspace. See netmap(4) for more information.
33*f933b737SSascha Wildner *
 * The address of the struct netmap_if, say nifp, is computed from the
 * value returned from ioctl(.., NIOCREGIF, ...) and the mmap region:
 *	ioctl(fd, NIOCREGIF, &req);
 *	mem = mmap(0, ... );
 *	nifp = NETMAP_IF(mem, req.nr_offset);
 *		(so simple, we could just do it manually)
40*f933b737SSascha Wildner *
 * From there:
 *	struct netmap_ring *NETMAP_TXRING(nifp, index)
 *	struct netmap_ring *NETMAP_RXRING(nifp, index)
 *	we can access ring->cur, ring->avail, ring->flags
 *
 *	ring->slot[i] gives us the i-th slot (we can access
 *	directly len, flags, buf_idx)
48*f933b737SSascha Wildner *
49*f933b737SSascha Wildner * char *buf = NETMAP_BUF(ring, x) returns a pointer to
50*f933b737SSascha Wildner * the buffer numbered x
51*f933b737SSascha Wildner *
52*f933b737SSascha Wildner * Since rings are circular, we have macros to compute the next index
53*f933b737SSascha Wildner * i = NETMAP_RING_NEXT(ring, i);
54*f933b737SSascha Wildner *
 * To ease porting apps from pcap to netmap we supply a few functions
 * that can be called to open, close and read from netmap in a way
 * similar to libpcap.
 *
 * In order to use these, put
 *	#define NETMAP_WITH_LIBS
 * in the source file that invokes these functions, before including
 * this header.
61*f933b737SSascha Wildner */
62*f933b737SSascha Wildner
63*f933b737SSascha Wildner #ifndef _NET_NETMAP_USER_H_
64*f933b737SSascha Wildner #define _NET_NETMAP_USER_H_
65*f933b737SSascha Wildner
66*f933b737SSascha Wildner #include <stdint.h>
67*f933b737SSascha Wildner #include <net/if.h> /* IFNAMSIZ */
68*f933b737SSascha Wildner #include <net/netmap/netmap.h>
69*f933b737SSascha Wildner
/*
 * Yield, converted to "type", the address found "ofs" bytes away from
 * "base".  The arithmetic is done on a char pointer, so "ofs" is always
 * counted in bytes whatever "base" points to.
 */
#define _NETMAP_OFFSET(type, base, ofs) \
	((type)(void *)(&((char *)(base))[(ofs)]))
72*f933b737SSascha Wildner
/*
 * Locate the struct netmap_if that sits "ofs" bytes from the start of the
 * mapped region "base".
 */
#define NETMAP_IF(base, ofs) \
	_NETMAP_OFFSET(struct netmap_if *, base, ofs)
74*f933b737SSascha Wildner
/*
 * Address of the index-th TX ring of nifp.  nifp->ring_ofs[] holds the
 * byte offset of each ring relative to nifp itself.
 */
#define NETMAP_TXRING(nifp, index) \
	_NETMAP_OFFSET(struct netmap_ring *, nifp, \
	    (nifp)->ring_ofs[(index)])
77*f933b737SSascha Wildner
/*
 * Address of the index-th RX ring of nifp.  The RX entries of
 * nifp->ring_ofs[] start at position ni_tx_rings + 1, i.e. after all the
 * TX entries (the extra +1 presumably accounts for the host/software TX
 * ring -- confirm against netmap(4)).
 *
 * "index" is parenthesized so that any expression (e.g. a conditional)
 * can be passed without being torn apart by the addition.
 */
#define NETMAP_RXRING(nifp, index) \
	_NETMAP_OFFSET(struct netmap_ring *, nifp, \
	    (nifp)->ring_ofs[(index) + (nifp)->ni_tx_rings + 1])
80*f933b737SSascha Wildner
/*
 * Address of buffer number "index".  Buffers are nr_buf_size bytes each
 * and start buf_ofs bytes from the ring.
 *
 * The index is widened to size_t before the multiplication so that the
 * byte offset does not wrap around at 4 GB when both operands are 32-bit
 * (or narrower) integers.
 */
#define NETMAP_BUF(ring, index) \
	((char *)(ring) + (ring)->buf_ofs + \
	    ((size_t)(index) * (ring)->nr_buf_size))
83*f933b737SSascha Wildner
/*
 * Inverse of NETMAP_BUF(): number of the buffer that "buf" points into.
 * It is the byte distance of "buf" from the start of the buffer area
 * (ring + buf_ofs) divided by the buffer size.
 */
#define NETMAP_BUF_IDX(ring, buf) \
	(((char *)(buf) - ((char *)(ring) + (ring)->buf_ofs)) / \
	    (ring)->nr_buf_size)
87*f933b737SSascha Wildner
/*
 * Slot index following "i" in ring "r": i + 1, or 0 when i is the last
 * slot (rings are circular).  Note that "i" is evaluated more than once.
 */
#define NETMAP_RING_NEXT(r, i) \
	(((i) + 1 != (r)->num_slots) ? (i) + 1 : 0)
90*f933b737SSascha Wildner
/*
 * Index of the slot lying r->reserved positions before r->cur, wrapping
 * around the beginning of the ring when cur is smaller than reserved.
 */
#define NETMAP_RING_FIRST_RESERVED(r) \
	(((r)->cur >= (r)->reserved) ? \
	    (r)->cur - (r)->reserved : \
	    (r)->cur + (r)->num_slots - (r)->reserved)
95*f933b737SSascha Wildner
/*
 * Evaluate to 1 if the given tx ring is empty, 0 otherwise.  The ring is
 * considered empty when at least num_slots - 1 slots are available.
 */
#define NETMAP_TX_RING_EMPTY(r)	(!((r)->avail < (r)->num_slots - 1))
100*f933b737SSascha Wildner
101*f933b737SSascha Wildner #ifdef NETMAP_WITH_LIBS
102*f933b737SSascha Wildner /*
103*f933b737SSascha Wildner * Support for simple I/O libraries.
104*f933b737SSascha Wildner * Include other system headers required for compiling this.
105*f933b737SSascha Wildner */
106*f933b737SSascha Wildner
107*f933b737SSascha Wildner #ifndef HAVE_NETMAP_WITH_LIBS
108*f933b737SSascha Wildner #define HAVE_NETMAP_WITH_LIBS
109*f933b737SSascha Wildner
#include <sys/time.h>
#include <sys/mman.h>
#include <sys/ioctl.h>
#include <sys/errno.h>	/* EINVAL */
#include <fcntl.h>	/* O_RDWR */
#include <stdlib.h>
#include <string.h>	/* memset */
#include <unistd.h>	/* close */
117*f933b737SSascha Wildner
/*
 * Per-packet header handed to the application.  The layout is the same
 * as libpcap's struct pcap_pkthdr.
 */
struct nm_hdr_t {
	struct timeval	ts;	/* timestamp, copied from the ring's ts */
	uint32_t	caplen;	/* captured length, set equal to len */
	uint32_t	len;	/* packet length, from the slot's len */
};
123*f933b737SSascha Wildner
124*f933b737SSascha Wildner struct nm_desc_t {
125*f933b737SSascha Wildner struct nm_desc_t *self;
126*f933b737SSascha Wildner int fd;
127*f933b737SSascha Wildner void *mem;
128*f933b737SSascha Wildner int memsize;
129*f933b737SSascha Wildner struct netmap_if *nifp;
130*f933b737SSascha Wildner uint16_t first_ring, last_ring, cur_ring;
131*f933b737SSascha Wildner struct nmreq req;
132*f933b737SSascha Wildner struct nm_hdr_t hdr;
133*f933b737SSascha Wildner };
134*f933b737SSascha Wildner
/*
 * Helpers for code that only holds an untyped pointer to a descriptor.
 * A correctly opened descriptor is recognized by its self field pointing
 * back to the descriptor itself (d->self == d).
 */
#define P2NMD(p)		((struct nm_desc_t *)(p))
#define IS_NETMAP_DESC(d)	(P2NMD(d) == P2NMD(d)->self)
#define NETMAP_FD(d)		(P2NMD(d)->fd)
141*f933b737SSascha Wildner
142*f933b737SSascha Wildner /*
143*f933b737SSascha Wildner * The callback, invoked on each received packet. Same as libpcap
144*f933b737SSascha Wildner */
145*f933b737SSascha Wildner typedef void (*nm_cb_t)(u_char *, const struct nm_hdr_t *, const u_char *d);
146*f933b737SSascha Wildner
/*
 * The open routine accepts an ifname (netmap:foo or vale:foo) and
 * optionally a second argument, ring_name, indicating the ring number
 * to open: a numeric string, or the ring number itself cast to a
 * pointer when NETMAP_HW_RING is set in flags.  ring_flags is OR-ed
 * into the flags of every RX ring bound to the descriptor.
 * If successful, it opens the fd and maps the memory.
 */
static struct nm_desc_t *nm_open(const char *ifname,
    const char *ring_name, int flags, int ring_flags);
154*f933b737SSascha Wildner
155*f933b737SSascha Wildner /*
156*f933b737SSascha Wildner * nm_dispatch() is the same as pcap_dispatch()
157*f933b737SSascha Wildner * nm_next() is the same as pcap_next()
158*f933b737SSascha Wildner */
159*f933b737SSascha Wildner static int nm_dispatch(struct nm_desc_t *, int, nm_cb_t, u_char *);
160*f933b737SSascha Wildner static u_char *nm_next(struct nm_desc_t *, struct nm_hdr_t *);
161*f933b737SSascha Wildner
/*
 * Tear down a descriptor: unmap the memory, close the file descriptor
 * and free the descriptor itself.
 */
static int nm_close(struct nm_desc_t *d);
166*f933b737SSascha Wildner
167*f933b737SSascha Wildner
168*f933b737SSascha Wildner /*
169*f933b737SSascha Wildner * Try to open, return descriptor if successful, NULL otherwise.
170*f933b737SSascha Wildner * An invalid netmap name will return errno = 0;
171*f933b737SSascha Wildner */
172*f933b737SSascha Wildner static struct nm_desc_t *
nm_open(const char * ifname,const char * ring_name,int flags,int ring_flags)173*f933b737SSascha Wildner nm_open(const char *ifname, const char *ring_name, int flags, int ring_flags)
174*f933b737SSascha Wildner {
175*f933b737SSascha Wildner struct nm_desc_t *d;
176*f933b737SSascha Wildner u_int n;
177*f933b737SSascha Wildner
178*f933b737SSascha Wildner if (strncmp(ifname, "netmap:", 7) && strncmp(ifname, "vale", 4)) {
179*f933b737SSascha Wildner errno = 0; /* name not recognised */
180*f933b737SSascha Wildner return NULL;
181*f933b737SSascha Wildner }
182*f933b737SSascha Wildner if (ifname[0] == 'n')
183*f933b737SSascha Wildner ifname += 7;
184*f933b737SSascha Wildner d = (struct nm_desc_t *)calloc(1, sizeof(*d));
185*f933b737SSascha Wildner if (d == NULL) {
186*f933b737SSascha Wildner errno = ENOMEM;
187*f933b737SSascha Wildner return NULL;
188*f933b737SSascha Wildner }
189*f933b737SSascha Wildner d->self = d; /* set this early so nm_close() works */
190*f933b737SSascha Wildner d->fd = open("/dev/netmap", O_RDWR);
191*f933b737SSascha Wildner if (d->fd < 0)
192*f933b737SSascha Wildner goto fail;
193*f933b737SSascha Wildner
194*f933b737SSascha Wildner if (flags & NETMAP_SW_RING) {
195*f933b737SSascha Wildner d->req.nr_ringid = NETMAP_SW_RING;
196*f933b737SSascha Wildner } else {
197*f933b737SSascha Wildner u_int r;
198*f933b737SSascha Wildner if (flags & NETMAP_HW_RING) /* interpret ring as int */
199*f933b737SSascha Wildner r = (uintptr_t)ring_name;
200*f933b737SSascha Wildner else /* interpret ring as numeric string */
201*f933b737SSascha Wildner r = ring_name ? atoi(ring_name) : ~0;
202*f933b737SSascha Wildner r = (r < NETMAP_RING_MASK) ? (r | NETMAP_HW_RING) : 0;
203*f933b737SSascha Wildner d->req.nr_ringid = r; /* set the ring */
204*f933b737SSascha Wildner }
205*f933b737SSascha Wildner d->req.nr_ringid |= (flags & ~NETMAP_RING_MASK);
206*f933b737SSascha Wildner d->req.nr_version = NETMAP_API;
207*f933b737SSascha Wildner strncpy(d->req.nr_name, ifname, sizeof(d->req.nr_name));
208*f933b737SSascha Wildner if (ioctl(d->fd, NIOCREGIF, &d->req))
209*f933b737SSascha Wildner goto fail;
210*f933b737SSascha Wildner
211*f933b737SSascha Wildner d->memsize = d->req.nr_memsize;
212*f933b737SSascha Wildner d->mem = mmap(0, d->memsize, PROT_WRITE | PROT_READ, MAP_SHARED,
213*f933b737SSascha Wildner d->fd, 0);
214*f933b737SSascha Wildner if (d->mem == NULL)
215*f933b737SSascha Wildner goto fail;
216*f933b737SSascha Wildner d->nifp = NETMAP_IF(d->mem, d->req.nr_offset);
217*f933b737SSascha Wildner if (d->req.nr_ringid & NETMAP_SW_RING) {
218*f933b737SSascha Wildner d->first_ring = d->last_ring = d->req.nr_rx_rings;
219*f933b737SSascha Wildner } else if (d->req.nr_ringid & NETMAP_HW_RING) {
220*f933b737SSascha Wildner d->first_ring = d->last_ring =
221*f933b737SSascha Wildner d->req.nr_ringid & NETMAP_RING_MASK;
222*f933b737SSascha Wildner } else {
223*f933b737SSascha Wildner d->first_ring = 0;
224*f933b737SSascha Wildner d->last_ring = d->req.nr_rx_rings - 1;
225*f933b737SSascha Wildner }
226*f933b737SSascha Wildner d->cur_ring = d->first_ring;
227*f933b737SSascha Wildner for (n = d->first_ring; n <= d->last_ring; n++) {
228*f933b737SSascha Wildner struct netmap_ring *ring = NETMAP_RXRING(d->nifp, n);
229*f933b737SSascha Wildner ring->flags |= ring_flags;
230*f933b737SSascha Wildner }
231*f933b737SSascha Wildner return d;
232*f933b737SSascha Wildner
233*f933b737SSascha Wildner fail:
234*f933b737SSascha Wildner nm_close(d);
235*f933b737SSascha Wildner errno = EINVAL;
236*f933b737SSascha Wildner return NULL;
237*f933b737SSascha Wildner }
238*f933b737SSascha Wildner
239*f933b737SSascha Wildner
240*f933b737SSascha Wildner static int
nm_close(struct nm_desc_t * d)241*f933b737SSascha Wildner nm_close(struct nm_desc_t *d)
242*f933b737SSascha Wildner {
243*f933b737SSascha Wildner if (d == NULL || d->self != d)
244*f933b737SSascha Wildner return EINVAL;
245*f933b737SSascha Wildner if (d->mem)
246*f933b737SSascha Wildner munmap(d->mem, d->memsize);
247*f933b737SSascha Wildner if (d->fd)
248*f933b737SSascha Wildner close(d->fd);
249*f933b737SSascha Wildner bzero(d, sizeof(*d));
250*f933b737SSascha Wildner free(d);
251*f933b737SSascha Wildner return 0;
252*f933b737SSascha Wildner }
253*f933b737SSascha Wildner
254*f933b737SSascha Wildner
255*f933b737SSascha Wildner /*
256*f933b737SSascha Wildner * Same prototype as pcap_dispatch(), only need to cast.
257*f933b737SSascha Wildner */
258*f933b737SSascha Wildner inline /* not really, but disable unused warnings */
259*f933b737SSascha Wildner static int
nm_dispatch(struct nm_desc_t * d,int cnt,nm_cb_t cb,u_char * arg)260*f933b737SSascha Wildner nm_dispatch(struct nm_desc_t *d, int cnt, nm_cb_t cb, u_char *arg)
261*f933b737SSascha Wildner {
262*f933b737SSascha Wildner int n = d->last_ring - d->first_ring + 1;
263*f933b737SSascha Wildner int c, got = 0, ri = d->cur_ring;
264*f933b737SSascha Wildner
265*f933b737SSascha Wildner if (cnt == 0)
266*f933b737SSascha Wildner cnt = -1;
267*f933b737SSascha Wildner /* cnt == -1 means infinite, but rings have a finite amount
268*f933b737SSascha Wildner * of buffers and the int is large enough that we never wrap,
269*f933b737SSascha Wildner * so we can omit checking for -1
270*f933b737SSascha Wildner */
271*f933b737SSascha Wildner for (c=0; c < n && cnt != got; c++) {
272*f933b737SSascha Wildner /* compute current ring to use */
273*f933b737SSascha Wildner struct netmap_ring *ring;
274*f933b737SSascha Wildner
275*f933b737SSascha Wildner ri = d->cur_ring + c;
276*f933b737SSascha Wildner if (ri > d->last_ring)
277*f933b737SSascha Wildner ri = d->first_ring;
278*f933b737SSascha Wildner ring = NETMAP_RXRING(d->nifp, ri);
279*f933b737SSascha Wildner for ( ; ring->avail > 0 && cnt != got; got++) {
280*f933b737SSascha Wildner u_int i = ring->cur;
281*f933b737SSascha Wildner u_int idx = ring->slot[i].buf_idx;
282*f933b737SSascha Wildner u_char *buf = (u_char *)NETMAP_BUF(ring, idx);
283*f933b737SSascha Wildner // XXX should check valid buf
284*f933b737SSascha Wildner // prefetch(buf);
285*f933b737SSascha Wildner d->hdr.len = d->hdr.caplen = ring->slot[i].len;
286*f933b737SSascha Wildner d->hdr.ts = ring->ts;
287*f933b737SSascha Wildner cb(arg, &d->hdr, buf);
288*f933b737SSascha Wildner ring->cur = NETMAP_RING_NEXT(ring, i);
289*f933b737SSascha Wildner ring->avail--;
290*f933b737SSascha Wildner }
291*f933b737SSascha Wildner }
292*f933b737SSascha Wildner d->cur_ring = ri;
293*f933b737SSascha Wildner return got;
294*f933b737SSascha Wildner }
295*f933b737SSascha Wildner
296*f933b737SSascha Wildner inline /* not really, but disable unused warnings */
297*f933b737SSascha Wildner static u_char *
nm_next(struct nm_desc_t * d,struct nm_hdr_t * hdr)298*f933b737SSascha Wildner nm_next(struct nm_desc_t *d, struct nm_hdr_t *hdr)
299*f933b737SSascha Wildner {
300*f933b737SSascha Wildner int ri = d->cur_ring;
301*f933b737SSascha Wildner
302*f933b737SSascha Wildner do {
303*f933b737SSascha Wildner /* compute current ring to use */
304*f933b737SSascha Wildner struct netmap_ring *ring = NETMAP_RXRING(d->nifp, ri);
305*f933b737SSascha Wildner if (ring->avail > 0) {
306*f933b737SSascha Wildner u_int i = ring->cur;
307*f933b737SSascha Wildner u_int idx = ring->slot[i].buf_idx;
308*f933b737SSascha Wildner u_char *buf = (u_char *)NETMAP_BUF(ring, idx);
309*f933b737SSascha Wildner // XXX should check valid buf
310*f933b737SSascha Wildner // prefetch(buf);
311*f933b737SSascha Wildner hdr->ts = ring->ts;
312*f933b737SSascha Wildner hdr->len = hdr->caplen = ring->slot[i].len;
313*f933b737SSascha Wildner ring->cur = NETMAP_RING_NEXT(ring, i);
314*f933b737SSascha Wildner ring->avail--;
315*f933b737SSascha Wildner d->cur_ring = ri;
316*f933b737SSascha Wildner return buf;
317*f933b737SSascha Wildner }
318*f933b737SSascha Wildner ri++;
319*f933b737SSascha Wildner if (ri > d->last_ring)
320*f933b737SSascha Wildner ri = d->first_ring;
321*f933b737SSascha Wildner } while (ri != d->cur_ring);
322*f933b737SSascha Wildner return NULL; /* nothing found */
323*f933b737SSascha Wildner }
324*f933b737SSascha Wildner
325*f933b737SSascha Wildner #endif /* !HAVE_NETMAP_WITH_LIBS */
326*f933b737SSascha Wildner
327*f933b737SSascha Wildner #endif /* NETMAP_WITH_LIBS */
328*f933b737SSascha Wildner
329*f933b737SSascha Wildner #endif /* _NET_NETMAP_USER_H_ */
330