xref: /netbsd-src/sys/net/npf/npf_os.c (revision d90047b5d07facf36e6c01dcc0bded8997ce9cc2)
1 /*-
2  * Copyright (c) 2009-2016 The NetBSD Foundation, Inc.
3  * All rights reserved.
4  *
5  * This material is based upon work partially supported by The
6  * NetBSD Foundation under a contract with Mindaugas Rasiukevicius.
7  *
8  * Redistribution and use in source and binary forms, with or without
9  * modification, are permitted provided that the following conditions
10  * are met:
11  * 1. Redistributions of source code must retain the above copyright
12  *    notice, this list of conditions and the following disclaimer.
13  * 2. Redistributions in binary form must reproduce the above copyright
14  *    notice, this list of conditions and the following disclaimer in the
15  *    documentation and/or other materials provided with the distribution.
16  *
17  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
18  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
19  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
20  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
21  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
22  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
23  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
24  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
25  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
26  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
27  * POSSIBILITY OF SUCH DAMAGE.
28  */
29 
30 /*
31  * NPF main: dynamic load/initialisation and unload routines.
32  */
33 
34 #ifdef _KERNEL
35 #include <sys/cdefs.h>
36 __KERNEL_RCSID(0, "$NetBSD: npf_os.c,v 1.18 2020/05/30 14:16:56 rmind Exp $");
37 
38 #ifdef _KERNEL_OPT
39 #include "pf.h"
40 #if NPF > 0
41 #error "NPF and PF are mutually exclusive; please select one"
42 #endif
43 #endif
44 
45 #include <sys/param.h>
46 #include <sys/types.h>
47 
48 #include <sys/conf.h>
49 #include <sys/kauth.h>
50 #include <sys/kmem.h>
51 #include <sys/lwp.h>
52 #include <sys/module.h>
53 #include <sys/pserialize.h>
54 #include <sys/socketvar.h>
55 #include <sys/uio.h>
56 
57 #include <netinet/in.h>
58 #include <netinet6/in6_var.h>
59 #endif
60 
61 #include "npf_impl.h"
62 #include "npfkern.h"
63 
64 #ifdef _KERNEL
65 #ifndef _MODULE
66 #include "opt_modular.h"
67 #include "opt_net_mpsafe.h"
68 #endif
69 #include "ioconf.h"
70 #endif
71 
72 /*
73  * Module and device structures.
74  */
75 #ifndef _MODULE
76 /*
77  * Modular kernels load drivers too early, and we need percpu to be inited
78  * So we make this misc; a better way would be to have early boot and late
79  * boot drivers.
80  */
81 MODULE(MODULE_CLASS_MISC, npf, "bpf");
82 #else
83 /* This module autoloads via /dev/npf so it needs to be a driver */
84 MODULE(MODULE_CLASS_DRIVER, npf, "bpf");
85 #endif
86 
87 #define	NPF_IOCTL_DATA_LIMIT	(4 * 1024 * 1024)
88 
89 static int	npf_pfil_register(bool);
90 static void	npf_pfil_unregister(bool);
91 
92 static int	npf_dev_open(dev_t, int, int, lwp_t *);
93 static int	npf_dev_close(dev_t, int, int, lwp_t *);
94 static int	npf_dev_ioctl(dev_t, u_long, void *, int, lwp_t *);
95 static int	npf_dev_poll(dev_t, int, lwp_t *);
96 static int	npf_dev_read(dev_t, struct uio *, int);
97 
98 const struct cdevsw npf_cdevsw = {
99 	.d_open = npf_dev_open,
100 	.d_close = npf_dev_close,
101 	.d_read = npf_dev_read,
102 	.d_write = nowrite,
103 	.d_ioctl = npf_dev_ioctl,
104 	.d_stop = nostop,
105 	.d_tty = notty,
106 	.d_poll = npf_dev_poll,
107 	.d_mmap = nommap,
108 	.d_kqfilter = nokqfilter,
109 	.d_discard = nodiscard,
110 	.d_flag = D_OTHER | D_MPSAFE
111 };
112 
113 static const char *	npf_ifop_getname(npf_t *, ifnet_t *);
114 static ifnet_t *	npf_ifop_lookup(npf_t *, const char *);
115 static void		npf_ifop_flush(npf_t *, void *);
116 static void *		npf_ifop_getmeta(npf_t *, const ifnet_t *);
117 static void		npf_ifop_setmeta(npf_t *, ifnet_t *, void *);
118 
119 static const unsigned	nworkers = 1;
120 
121 static bool		pfil_registered = false;
122 static pfil_head_t *	npf_ph_if = NULL;
123 static pfil_head_t *	npf_ph_inet = NULL;
124 static pfil_head_t *	npf_ph_inet6 = NULL;
125 
126 static const npf_ifops_t kern_ifops = {
127 	.getname	= npf_ifop_getname,
128 	.lookup		= npf_ifop_lookup,
129 	.flush		= npf_ifop_flush,
130 	.getmeta	= npf_ifop_getmeta,
131 	.setmeta	= npf_ifop_setmeta,
132 };
133 
134 static int
135 npf_fini(void)
136 {
137 	npf_t *npf = npf_getkernctx();
138 
139 	/* At first, detach device and remove pfil hooks. */
140 #ifdef _MODULE
141 	devsw_detach(NULL, &npf_cdevsw);
142 #endif
143 	npf_pfil_unregister(true);
144 	npfk_destroy(npf);
145 	npfk_sysfini();
146 	return 0;
147 }
148 
149 static int
150 npf_init(void)
151 {
152 	npf_t *npf;
153 	int error = 0;
154 
155 	error = npfk_sysinit(nworkers);
156 	if (error)
157 		return error;
158 	npf = npfk_create(0, NULL, &kern_ifops, NULL);
159 	npf_setkernctx(npf);
160 	npf_pfil_register(true);
161 
162 #ifdef _MODULE
163 	devmajor_t bmajor = NODEVMAJOR, cmajor = NODEVMAJOR;
164 
165 	/* Attach /dev/npf device. */
166 	error = devsw_attach("npf", NULL, &bmajor, &npf_cdevsw, &cmajor);
167 	if (error) {
168 		/* It will call devsw_detach(), which is safe. */
169 		(void)npf_fini();
170 	}
171 #endif
172 	return error;
173 }
174 
175 
176 /*
177  * Module interface.
178  */
179 static int
180 npf_modcmd(modcmd_t cmd, void *arg)
181 {
182 	switch (cmd) {
183 	case MODULE_CMD_INIT:
184 		return npf_init();
185 	case MODULE_CMD_FINI:
186 		return npf_fini();
187 	case MODULE_CMD_AUTOUNLOAD:
188 		if (npf_autounload_p()) {
189 			return EBUSY;
190 		}
191 		break;
192 	default:
193 		return ENOTTY;
194 	}
195 	return 0;
196 }
197 
/*
 * npfattach: attach routine; intentionally does nothing.
 */
void
npfattach(int nunits)
{
	(void)nunits;
}
203 
204 static int
205 npf_dev_open(dev_t dev, int flag, int mode, lwp_t *l)
206 {
207 	/* Available only for super-user. */
208 	if (kauth_authorize_network(l->l_cred, KAUTH_NETWORK_FIREWALL,
209 	    KAUTH_REQ_NETWORK_FIREWALL_FW, NULL, NULL, NULL)) {
210 		return EPERM;
211 	}
212 	return 0;
213 }
214 
215 static int
216 npf_dev_close(dev_t dev, int flag, int mode, lwp_t *l)
217 {
218 	return 0;
219 }
220 
221 static int
222 npf_stats_export(npf_t *npf, void *data)
223 {
224 	uint64_t *fullst, *uptr = *(uint64_t **)data;
225 	int error;
226 
227 	fullst = kmem_alloc(NPF_STATS_SIZE, KM_SLEEP);
228 	npfk_stats(npf, fullst); /* will zero the buffer */
229 	error = copyout(fullst, uptr, NPF_STATS_SIZE);
230 	kmem_free(fullst, NPF_STATS_SIZE);
231 	return error;
232 }
233 
234 /*
235  * npfctl_switch: enable or disable packet inspection.
236  */
237 static int
238 npfctl_switch(void *data)
239 {
240 	const bool onoff = *(int *)data ? true : false;
241 	int error;
242 
243 	if (onoff) {
244 		/* Enable: add pfil hooks. */
245 		error = npf_pfil_register(false);
246 	} else {
247 		/* Disable: remove pfil hooks. */
248 		npf_pfil_unregister(false);
249 		error = 0;
250 	}
251 	return error;
252 }
253 
254 static int
255 npf_dev_ioctl(dev_t dev, u_long cmd, void *data, int flag, lwp_t *l)
256 {
257 	npf_t *npf = npf_getkernctx();
258 	nvlist_t *req, *resp;
259 	int error;
260 
261 	/* Available only for super-user. */
262 	if (kauth_authorize_network(l->l_cred, KAUTH_NETWORK_FIREWALL,
263 	    KAUTH_REQ_NETWORK_FIREWALL_FW, NULL, NULL, NULL)) {
264 		return EPERM;
265 	}
266 
267 	switch (cmd) {
268 	case IOC_NPF_VERSION:
269 		*(int *)data = NPF_VERSION;
270 		return 0;
271 
272 	case IOC_NPF_SWITCH:
273 		return npfctl_switch(data);
274 
275 	case IOC_NPF_TABLE:
276 		return npfctl_table(npf, data);
277 
278 	case IOC_NPF_STATS:
279 		return npf_stats_export(npf, data);
280 	}
281 
282 	error = nvlist_copyin(data, &req, NPF_IOCTL_DATA_LIMIT);
283 	if (__predict_false(error)) {
284 #ifdef __NetBSD__
285 		/* Until the version bump. */
286 		if (cmd != IOC_NPF_SAVE) {
287 			return error;
288 		}
289 		req = nvlist_create(0);
290 #else
291 		return error;
292 #endif
293 	}
294 	resp = nvlist_create(0);
295 	npfctl_run_op(npf, cmd, req, resp);
296 	error = nvlist_copyout(data, resp);
297 	nvlist_destroy(resp);
298 	nvlist_destroy(req);
299 
300 	return error;
301 }
302 
303 static int
304 npf_dev_poll(dev_t dev, int events, lwp_t *l)
305 {
306 	return ENOTSUP;
307 }
308 
309 static int
310 npf_dev_read(dev_t dev, struct uio *uio, int flag)
311 {
312 	return ENOTSUP;
313 }
314 
315 bool
316 npf_autounload_p(void)
317 {
318 	npf_t *npf = npf_getkernctx();
319 	return !npf_active_p() && npf_default_pass(npf);
320 }
321 
322 /*
323  * Interface operations.
324  */
325 
326 static const char *
327 npf_ifop_getname(npf_t *npf __unused, ifnet_t *ifp)
328 {
329 	return ifp->if_xname;
330 }
331 
332 static ifnet_t *
333 npf_ifop_lookup(npf_t *npf __unused, const char *name)
334 {
335 	return ifunit(name);
336 }
337 
338 static void
339 npf_ifop_flush(npf_t *npf __unused, void *arg)
340 {
341 	ifnet_t *ifp;
342 
343 	KERNEL_LOCK(1, NULL);
344 	IFNET_GLOBAL_LOCK();
345 	IFNET_WRITER_FOREACH(ifp) {
346 		ifp->if_npf_private = arg;
347 	}
348 	IFNET_GLOBAL_UNLOCK();
349 	KERNEL_UNLOCK_ONE(NULL);
350 }
351 
352 static void *
353 npf_ifop_getmeta(npf_t *npf __unused, const ifnet_t *ifp)
354 {
355 	return ifp->if_npf_private;
356 }
357 
358 static void
359 npf_ifop_setmeta(npf_t *npf __unused, ifnet_t *ifp, void *arg)
360 {
361 	ifp->if_npf_private = arg;
362 }
363 
364 #ifdef _KERNEL
365 
366 /*
367  * Wrapper of the main packet handler to pass the kernel NPF context.
368  */
369 static int
370 npfos_packet_handler(void *arg, struct mbuf **mp, ifnet_t *ifp, int di)
371 {
372 	npf_t *npf = npf_getkernctx();
373 	return npfk_packet_handler(npf, mp, ifp, di);
374 }
375 
376 /*
377  * npf_ifhook: hook handling interface changes.
378  */
379 static void
380 npf_ifhook(void *arg, unsigned long cmd, void *arg2)
381 {
382 	npf_t *npf = npf_getkernctx();
383 	ifnet_t *ifp = arg2;
384 
385 	switch (cmd) {
386 	case PFIL_IFNET_ATTACH:
387 		npfk_ifmap_attach(npf, ifp);
388 		npf_ifaddr_sync(npf, ifp);
389 		break;
390 	case PFIL_IFNET_DETACH:
391 		npfk_ifmap_detach(npf, ifp);
392 		npf_ifaddr_flush(npf, ifp);
393 		break;
394 	}
395 }
396 
397 static void
398 npf_ifaddrhook(void *arg, u_long cmd, void *arg2)
399 {
400 	npf_t *npf = npf_getkernctx();
401 	struct ifaddr *ifa = arg2;
402 
403 	switch (cmd) {
404 	case SIOCSIFADDR:
405 	case SIOCAIFADDR:
406 	case SIOCDIFADDR:
407 #ifdef INET6
408 	case SIOCSIFADDR_IN6:
409 	case SIOCAIFADDR_IN6:
410 	case SIOCDIFADDR_IN6:
411 #endif
412 		KASSERT(ifa != NULL);
413 		break;
414 	default:
415 		return;
416 	}
417 	npf_ifaddr_sync(npf, ifa->ifa_ifp);
418 }
419 
420 /*
421  * npf_pfil_register: register pfil(9) hooks.
422  */
423 static int
424 npf_pfil_register(bool init)
425 {
426 	npf_t *npf = npf_getkernctx();
427 	int error = 0;
428 
429 	SOFTNET_KERNEL_LOCK_UNLESS_NET_MPSAFE();
430 
431 	/* Init: interface re-config and attach/detach hook. */
432 	if (!npf_ph_if) {
433 		npf_ph_if = pfil_head_get(PFIL_TYPE_IFNET, 0);
434 		if (!npf_ph_if) {
435 			error = ENOENT;
436 			goto out;
437 		}
438 
439 		error = pfil_add_ihook(npf_ifhook, NULL,
440 		    PFIL_IFNET, npf_ph_if);
441 		KASSERT(error == 0);
442 
443 		error = pfil_add_ihook(npf_ifaddrhook, NULL,
444 		    PFIL_IFADDR, npf_ph_if);
445 		KASSERT(error == 0);
446 	}
447 	if (init) {
448 		goto out;
449 	}
450 
451 	/* Check if pfil hooks are not already registered. */
452 	if (pfil_registered) {
453 		error = EEXIST;
454 		goto out;
455 	}
456 
457 	/* Capture points of the activity in the IP layer. */
458 	npf_ph_inet = pfil_head_get(PFIL_TYPE_AF, (void *)AF_INET);
459 	npf_ph_inet6 = pfil_head_get(PFIL_TYPE_AF, (void *)AF_INET6);
460 	if (!npf_ph_inet && !npf_ph_inet6) {
461 		error = ENOENT;
462 		goto out;
463 	}
464 
465 	/* Packet IN/OUT handlers for IP layer. */
466 	if (npf_ph_inet) {
467 		error = pfil_add_hook(npfos_packet_handler, npf,
468 		    PFIL_ALL, npf_ph_inet);
469 		KASSERT(error == 0);
470 	}
471 	if (npf_ph_inet6) {
472 		error = pfil_add_hook(npfos_packet_handler, npf,
473 		    PFIL_ALL, npf_ph_inet6);
474 		KASSERT(error == 0);
475 	}
476 
477 	/*
478 	 * It is necessary to re-sync all/any interface address tables,
479 	 * since we did not listen for any changes.
480 	 */
481 	npf_ifaddr_syncall(npf);
482 	pfil_registered = true;
483 out:
484 	SOFTNET_KERNEL_UNLOCK_UNLESS_NET_MPSAFE();
485 
486 	return error;
487 }
488 
489 /*
490  * npf_pfil_unregister: unregister pfil(9) hooks.
491  */
492 static void
493 npf_pfil_unregister(bool fini)
494 {
495 	npf_t *npf = npf_getkernctx();
496 
497 	SOFTNET_KERNEL_LOCK_UNLESS_NET_MPSAFE();
498 
499 	if (fini && npf_ph_if) {
500 		(void)pfil_remove_ihook(npf_ifhook, NULL,
501 		    PFIL_IFNET, npf_ph_if);
502 		(void)pfil_remove_ihook(npf_ifaddrhook, NULL,
503 		    PFIL_IFADDR, npf_ph_if);
504 	}
505 	if (npf_ph_inet) {
506 		(void)pfil_remove_hook(npfos_packet_handler, npf,
507 		    PFIL_ALL, npf_ph_inet);
508 	}
509 	if (npf_ph_inet6) {
510 		(void)pfil_remove_hook(npfos_packet_handler, npf,
511 		    PFIL_ALL, npf_ph_inet6);
512 	}
513 	pfil_registered = false;
514 
515 	SOFTNET_KERNEL_UNLOCK_UNLESS_NET_MPSAFE();
516 }
517 
518 bool
519 npf_active_p(void)
520 {
521 	return pfil_registered;
522 }
523 
524 #endif
525 
526 #ifdef __NetBSD__
527 
528 /*
529  * Epoch-Based Reclamation (EBR) wrappers: in NetBSD, we rely on the
530  * passive serialization mechanism (see pserialize(9) manual page),
531  * which provides sufficient guarantees for NPF.
532  */
533 
534 ebr_t *
535 npf_ebr_create(void)
536 {
537 	return pserialize_create();
538 }
539 
540 void
541 npf_ebr_destroy(ebr_t *ebr)
542 {
543 	pserialize_destroy(ebr);
544 }
545 
546 void
547 npf_ebr_register(ebr_t *ebr)
548 {
549 	KASSERT(ebr != NULL); (void)ebr;
550 }
551 
552 void
553 npf_ebr_unregister(ebr_t *ebr)
554 {
555 	KASSERT(ebr != NULL); (void)ebr;
556 }
557 
558 int
559 npf_ebr_enter(ebr_t *ebr)
560 {
561 	KASSERT(ebr != NULL); (void)ebr;
562 	return pserialize_read_enter();
563 }
564 
565 void
566 npf_ebr_exit(ebr_t *ebr, int s)
567 {
568 	KASSERT(ebr != NULL); (void)ebr;
569 	pserialize_read_exit(s);
570 }
571 
572 void
573 npf_ebr_full_sync(ebr_t *ebr)
574 {
575 	pserialize_perform(ebr);
576 }
577 
578 bool
579 npf_ebr_incrit_p(ebr_t *ebr)
580 {
581 	KASSERT(ebr != NULL); (void)ebr;
582 	return pserialize_in_read_section();
583 }
584 
585 #endif
586