xref: /netbsd-src/sys/netinet6/in6_proto.c (revision 274254cdae52594c1aa480a736aef78313d15c9c)
1 /*	$NetBSD: in6_proto.c,v 1.84 2009/03/23 18:43:20 liamjfoy Exp $	*/
2 /*	$KAME: in6_proto.c,v 1.66 2000/10/10 15:35:47 itojun Exp $	*/
3 
4 /*
5  * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
6  * All rights reserved.
7  *
8  * Redistribution and use in source and binary forms, with or without
9  * modification, are permitted provided that the following conditions
10  * are met:
11  * 1. Redistributions of source code must retain the above copyright
12  *    notice, this list of conditions and the following disclaimer.
13  * 2. Redistributions in binary form must reproduce the above copyright
14  *    notice, this list of conditions and the following disclaimer in the
15  *    documentation and/or other materials provided with the distribution.
16  * 3. Neither the name of the project nor the names of its contributors
17  *    may be used to endorse or promote products derived from this software
18  *    without specific prior written permission.
19  *
20  * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND
21  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
22  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
23  * ARE DISCLAIMED.  IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE
24  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
25  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
26  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
28  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
29  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
30  * SUCH DAMAGE.
31  */
32 
33 /*
34  * Copyright (c) 1982, 1986, 1993
35  *	The Regents of the University of California.  All rights reserved.
36  *
37  * Redistribution and use in source and binary forms, with or without
38  * modification, are permitted provided that the following conditions
39  * are met:
40  * 1. Redistributions of source code must retain the above copyright
41  *    notice, this list of conditions and the following disclaimer.
42  * 2. Redistributions in binary form must reproduce the above copyright
43  *    notice, this list of conditions and the following disclaimer in the
44  *    documentation and/or other materials provided with the distribution.
45  * 3. Neither the name of the University nor the names of its contributors
46  *    may be used to endorse or promote products derived from this software
47  *    without specific prior written permission.
48  *
49  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
50  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
51  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
52  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
53  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
54  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
55  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
56  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
57  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
58  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
59  * SUCH DAMAGE.
60  *
61  *	@(#)in_proto.c	8.1 (Berkeley) 6/10/93
62  */
63 
64 #include <sys/cdefs.h>
65 __KERNEL_RCSID(0, "$NetBSD: in6_proto.c,v 1.84 2009/03/23 18:43:20 liamjfoy Exp $");
66 
67 #include "opt_inet.h"
68 #include "opt_ipsec.h"
69 #include "opt_iso.h"
70 
71 #include <sys/param.h>
72 #include <sys/socket.h>
73 #include <sys/protosw.h>
74 #include <sys/kernel.h>
75 #include <sys/domain.h>
76 #include <sys/mbuf.h>
77 
78 #include <net/if.h>
79 #include <net/radix.h>
80 #include <net/route.h>
81 
82 #include <netinet/in.h>
83 #include <netinet/in_systm.h>
84 #include <netinet/in_var.h>
85 #include <netinet/ip_encap.h>
86 #include <netinet/ip.h>
87 #include <netinet/ip_var.h>
88 #include <netinet/in_pcb.h>
89 #include <netinet/ip6.h>
90 #include <netinet6/ip6_var.h>
91 #include <netinet/icmp6.h>
92 #include <netinet6/in6_pcb.h>
93 
94 #include <netinet/tcp.h>
95 #include <netinet/tcp_fsm.h>
96 #include <netinet/tcp_seq.h>
97 #include <netinet/tcp_timer.h>
98 #include <netinet/tcp_var.h>
99 #include <netinet/tcpip.h>
100 #include <netinet/tcp_debug.h>
101 
102 #include <netinet6/udp6.h>
103 #include <netinet6/udp6_var.h>
104 
105 #include <netinet6/pim6_var.h>
106 
107 #include <netinet6/nd6.h>
108 
109 #ifdef IPSEC
110 #include <netinet6/ipsec.h>
111 #include <netinet6/ah.h>
112 #ifdef IPSEC_ESP
113 #include <netinet6/esp.h>
114 #endif
115 #include <netinet6/ipcomp.h>
116 #endif /* IPSEC */
117 
118 #ifdef FAST_IPSEC
119 #include <netipsec/ipsec.h>
120 #include <netipsec/ipsec6.h>
121 #include <netipsec/key.h>
122 #endif /* FAST_IPSEC */
123 
124 
125 #include "carp.h"
126 #if NCARP > 0
127 #include <netinet/ip_carp.h>
128 #endif
129 
#include "etherip.h"
#if NETHERIP > 0
#include <netinet6/ip6_etherip.h>
#endif
134 
135 #include <netinet6/ip6protosw.h>
136 
137 #include <net/net_osdep.h>
138 
/*
 * XXX: fallback for environments whose headers did not already provide
 * offsetof().  Yields the byte offset of `field' inside `aggr' by taking
 * the member's address relative to a null `aggr' pointer.
 */
#if !defined(offsetof)
#define	offsetof(aggr, field)	((size_t)(&((aggr *)0)->field))
#endif
142 
143 /*
144  * TCP/IP protocol family: IP6, ICMP6, UDP, TCP.
145  */
146 
147 DOMAIN_DEFINE(inet6domain);	/* forward declare and add to link set */
148 
149 /* Wrappers to acquire kernel_lock. */
150 
151 PR_WRAP_USRREQ(rip6_usrreq)
152 PR_WRAP_USRREQ(udp6_usrreq)
153 PR_WRAP_USRREQ(tcp_usrreq)
154 
155 #define	rip6_usrreq 	rip6_usrreq_wrapper
156 #define	udp6_usrreq 	udp6_usrreq_wrapper
157 #define	tcp_usrreq 	tcp_usrreq_wrapper
158 
159 PR_WRAP_CTLINPUT(rip6_ctlinput)
160 PR_WRAP_CTLINPUT(encap6_ctlinput)
161 PR_WRAP_CTLINPUT(udp6_ctlinput)
162 PR_WRAP_CTLINPUT(tcp6_ctlinput)
163 
164 #define	rip6_ctlinput	rip6_ctlinput_wrapper
165 #define	encap6_ctlinput	encap6_ctlinput_wrapper
166 #define	udp6_ctlinput	udp6_ctlinput_wrapper
167 #define	tcp6_ctlinput	tcp6_ctlinput_wrapper
168 
169 PR_WRAP_CTLOUTPUT(rip6_ctloutput)
170 PR_WRAP_CTLOUTPUT(ip6_ctloutput)
171 PR_WRAP_CTLOUTPUT(tcp_ctloutput)
172 PR_WRAP_CTLOUTPUT(icmp6_ctloutput)
173 
174 #define	rip6_ctloutput	rip6_ctloutput_wrapper
175 #define	ip6_ctloutput	ip6_ctloutput_wrapper
176 #define	tcp_ctloutput	tcp_ctloutput_wrapper
177 #define	icmp6_ctloutput	icmp6_ctloutput_wrapper
178 
/*
 * IPsec ctlinput wrappers, redirected to <name>_wrapper like the
 * handlers above.
 *
 * The two wrappers are guarded separately so that each one is only
 * generated in configurations where the protocol table in this file
 * actually references it:
 *  - ah6_ctlinput is used by the AH entry under IPSEC and FAST_IPSEC;
 *  - esp6_ctlinput is used by the ESP entry only under
 *    IPSEC + IPSEC_ESP or under FAST_IPSEC, and <netinet6/esp.h> is
 *    only included when IPSEC_ESP is set.
 * NOTE(review): with a single combined guard, an IPSEC kernel without
 * IPSEC_ESP would still emit an esp6_ctlinput wrapper that nothing in
 * this file uses; confirm against the PR_WRAP_CTLINPUT definition.
 */
#if defined(IPSEC) || defined(FAST_IPSEC)
PR_WRAP_CTLINPUT(ah6_ctlinput)

#define	ah6_ctlinput	ah6_ctlinput_wrapper
#endif

#if (defined(IPSEC) && defined(IPSEC_ESP)) || defined(FAST_IPSEC)
PR_WRAP_CTLINPUT(esp6_ctlinput)

#define	esp6_ctlinput	esp6_ctlinput_wrapper
#endif
186 
187 const struct ip6protosw inet6sw[] = {
188 {	.pr_domain = &inet6domain,
189 	.pr_protocol = IPPROTO_IPV6,
190 	.pr_init = ip6_init,
191 	.pr_slowtimo = frag6_slowtimo,
192 	.pr_drain = frag6_drain,
193 },
194 {	.pr_type = SOCK_DGRAM,
195 	.pr_domain = &inet6domain,
196 	.pr_protocol = IPPROTO_UDP,
197 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_PURGEIF,
198 	.pr_input = udp6_input,
199 	.pr_ctlinput = udp6_ctlinput,
200 	.pr_ctloutput = ip6_ctloutput,
201 	.pr_usrreq = udp6_usrreq,
202 	.pr_init = udp6_init,
203 },
204 {	.pr_type = SOCK_STREAM,
205 	.pr_domain = &inet6domain,
206 	.pr_protocol = IPPROTO_TCP,
207 	.pr_flags = PR_CONNREQUIRED|PR_WANTRCVD|PR_LISTEN|PR_ABRTACPTDIS|PR_PURGEIF,
208 	.pr_input = tcp6_input,
209 	.pr_ctlinput = tcp6_ctlinput,
210 	.pr_ctloutput = tcp_ctloutput,
211 	.pr_usrreq = tcp_usrreq,
212 #ifndef INET	/* don't call initialization and timeout routines twice */
213 	.pr_init = tcp_init,
214 	.pr_slowtimo = tcp_slowtimo,
215 	.pr_drain = tcp_drain,
216 #endif
217 },
218 {	.pr_type = SOCK_RAW,
219 	.pr_domain = &inet6domain,
220 	.pr_protocol = IPPROTO_RAW,
221 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_PURGEIF,
222 	.pr_input = rip6_input,
223 	.pr_output = rip6_output,
224 	.pr_ctlinput = rip6_ctlinput,
225 	.pr_ctloutput = rip6_ctloutput,
226 	.pr_usrreq = rip6_usrreq,
227 },
228 #ifdef GATEWAY
229 {	.pr_domain = &inet6domain,
230 	.pr_protocol = IPPROTO_IPV6,
231 	.pr_slowtimo = ip6flow_slowtimo,
232 	.pr_init = ip6flow_poolinit,
233 },
234 #endif /* GATEWAY */
235 {	.pr_type = SOCK_RAW,
236 	.pr_domain = &inet6domain,
237 	.pr_protocol = IPPROTO_ICMPV6,
238 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
239 	.pr_input = icmp6_input,
240 	.pr_output = rip6_output,
241 	.pr_ctlinput = rip6_ctlinput,
242 	.pr_ctloutput = icmp6_ctloutput,
243 	.pr_usrreq = rip6_usrreq,
244 	.pr_init = icmp6_init,
245 },
246 {	.pr_type = SOCK_RAW,
247 	.pr_domain = &inet6domain,
248 	.pr_protocol = IPPROTO_DSTOPTS,
249 	.pr_flags = PR_ATOMIC|PR_ADDR,
250 	.pr_input = dest6_input,
251 },
252 {	.pr_type = SOCK_RAW,
253 	.pr_domain = &inet6domain,
254 	.pr_protocol = IPPROTO_ROUTING,
255 	.pr_flags = PR_ATOMIC|PR_ADDR,
256 	.pr_input = route6_input,
257 },
258 {	.pr_type = SOCK_RAW,
259 	.pr_domain = &inet6domain,
260 	.pr_protocol = IPPROTO_FRAGMENT,
261 	.pr_flags = PR_ATOMIC|PR_ADDR,
262 	.pr_input = frag6_input,
263 },
264 #ifdef IPSEC
265 {	.pr_type = SOCK_RAW,
266 	.pr_domain = &inet6domain,
267 	.pr_protocol = IPPROTO_AH,
268 	.pr_flags = PR_ATOMIC|PR_ADDR,
269 	.pr_input = ah6_input,
270 	.pr_ctlinput = ah6_ctlinput,
271 	.pr_init = ah6_init,
272 },
273 #ifdef IPSEC_ESP
274 {	.pr_type = SOCK_RAW,
275 	.pr_domain = &inet6domain,
276 	.pr_protocol = IPPROTO_ESP,
277 	.pr_flags = PR_ATOMIC|PR_ADDR,
278 	.pr_input = esp6_input,
279 	.pr_ctlinput = esp6_ctlinput,
280 	.pr_init = esp6_init,
281 },
282 #endif
283 {	.pr_type = SOCK_RAW,
284 	.pr_domain = &inet6domain,
285 	.pr_protocol = IPPROTO_IPCOMP,
286 	.pr_flags = PR_ATOMIC|PR_ADDR,
287 	.pr_input = ipcomp6_input,
288 	.pr_init = ipcomp6_init,
289 },
290 #endif /* IPSEC */
291 #ifdef FAST_IPSEC
292 {	.pr_type = SOCK_RAW,
293 	.pr_domain = &inet6domain,
294 	.pr_protocol = IPPROTO_AH,
295 	.pr_flags = PR_ATOMIC|PR_ADDR,
296 	.pr_input = ipsec6_common_input,
297 	.pr_ctlinput = ah6_ctlinput,
298 },
299 {	.pr_type = SOCK_RAW,
300 	.pr_domain = &inet6domain,
301 	.pr_protocol = IPPROTO_ESP,
302 	.pr_flags = PR_ATOMIC|PR_ADDR,
303 	.pr_input = ipsec6_common_input,
304 	.pr_ctlinput = esp6_ctlinput,
305 },
306 {	.pr_type = SOCK_RAW,
307 	.pr_domain = &inet6domain,
308 	.pr_protocol = IPPROTO_IPCOMP,
309 	.pr_flags = PR_ATOMIC|PR_ADDR,
310 	.pr_input = ipsec6_common_input,
311 },
312 #endif /* FAST_IPSEC */
313 #ifdef INET
314 {	.pr_type = SOCK_RAW,
315 	.pr_domain = &inet6domain,
316 	.pr_protocol = IPPROTO_IPV4,
317 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
318 	.pr_input = encap6_input,
319 	.pr_output = rip6_output,
320 	.pr_ctlinput = encap6_ctlinput,
321 	.pr_ctloutput = rip6_ctloutput,
322 	.pr_usrreq = rip6_usrreq,
323 	.pr_init = encap_init,
324 },
325 #endif
326 {	.pr_type = SOCK_RAW,
327 	.pr_domain = &inet6domain,
328 	.pr_protocol = IPPROTO_IPV6,
329 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
330 	.pr_input = encap6_input,
331 	.pr_output = rip6_output,
332 	.pr_ctlinput = encap6_ctlinput,
333 	.pr_ctloutput = rip6_ctloutput,
334 	.pr_usrreq = rip6_usrreq,
335 	.pr_init = encap_init,
336 },
337 #if NETHERIP > 1
338 {	.pr_type = SOCK_RAW,
339 	.pr_domain = &inet6domain,
340 	.pr_protocol = IPPROTO_ETHERIP,
341 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
342 	.pr_input = ip6_etherip_input,
343 	.pr_output = rip6_output,
344 	.pr_ctlinput = rip6_ctlinput,
345 	.pr_ctloutput = rip6_ctloutput,
346 	.pr_usrreq = rip6_usrreq,
347 },
348 #endif
349 #if NCARP > 0
350 {	.pr_type = SOCK_RAW,
351 	.pr_domain = &inet6domain,
352 	.pr_protocol = IPPROTO_CARP,
353 	.pr_flags = PR_ATOMIC|PR_ADDR,
354 	.pr_input = carp6_proto_input,
355 	.pr_output = rip6_output,
356 	.pr_ctloutput = rip6_ctloutput,
357 	.pr_usrreq = rip6_usrreq,
358 },
359 #endif /* NCARP */
360 #ifdef ISO
361 {	.pr_type = SOCK_RAW,
362 	.pr_domain = &inet6domain,
363 	.pr_protocol = IPPROTO_EON,
364 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
365 	.pr_input = encap6_input,
366 	.pr_output = rip6_output,
367 	.pr_ctlinput = encap6_ctlinput,
368 	.pr_ctloutput = rip6_ctloutput,
369 	.pr_usrreq = rip6_usrreq,
370 	/*XXX*/
371 	.pr_init = encap_init,
372 },
373 #endif
374 {	.pr_type = SOCK_RAW,
375 	.pr_domain = &inet6domain,
376 	.pr_protocol = IPPROTO_PIM,
377 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
378 	.pr_input = pim6_input,
379 	.pr_output = rip6_output,
380 	.pr_ctloutput = rip6_ctloutput,
381 	.pr_usrreq = rip6_usrreq,
382 	.pr_init = pim6_init,
383 },
384 /* raw wildcard */
385 {	.pr_type = SOCK_RAW,
386 	.pr_domain = &inet6domain,
387 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
388 	.pr_input = rip6_input,
389 	.pr_output = rip6_output,
390 	.pr_ctloutput = rip6_ctloutput,
391 	.pr_usrreq = rip6_usrreq,
392 	.pr_init = rip6_init,
393 },
394 };
395 
396 static const struct sockaddr_in6 in6_any = {
397 	  .sin6_len = sizeof(in6_any)
398 	, .sin6_family = AF_INET6
399 	, .sin6_port = 0
400 	, .sin6_flowinfo = 0
401 	, .sin6_addr = IN6ADDR_ANY_INIT
402 	, .sin6_scope_id = 0
403 };
404 
405 struct domain inet6domain = {
406 	.dom_family = AF_INET6, .dom_name = "internet6",
407 	.dom_init = NULL, .dom_externalize = NULL, .dom_dispose = NULL,
408 	.dom_protosw = (const struct protosw *)inet6sw,
409 	.dom_protoswNPROTOSW = (const struct protosw *)&inet6sw[sizeof(inet6sw)/sizeof(inet6sw[0])],
410 	.dom_rtattach = rn_inithead,
411 	.dom_rtoffset = offsetof(struct sockaddr_in6, sin6_addr) << 3,
412 	.dom_maxrtkey = sizeof(struct ip_pack6),
413 	.dom_ifattach = in6_domifattach, .dom_ifdetach = in6_domifdetach,
414 	.dom_ifqueues = { &ip6intrq, NULL },
415 	.dom_link = { NULL },
416 	.dom_mowner = MOWNER_INIT("",""),
417 	.dom_sa_cmpofs = offsetof(struct sockaddr_in6, sin6_addr),
418 	.dom_sa_cmplen = sizeof(struct in6_addr),
419 	.dom_sa_any = (const struct sockaddr *)&in6_any,
420 	.dom_rtcache = LIST_HEAD_INITIALIZER(inet6domain.dom_rtcache)
421 };
422 
423 int
424 sockaddr_in6_cmp(const struct sockaddr *lsa, const struct sockaddr *rsa)
425 {
426 	uint_fast8_t len;
427 	const uint_fast8_t addrofs = offsetof(struct sockaddr_in6, sin6_addr),
428 			   addrend = addrofs + sizeof(struct in6_addr);
429 	int rc;
430 	const struct sockaddr_in6 *lsin6, *rsin6;
431 
432 	lsin6 = satocsin6(lsa);
433 	rsin6 = satocsin6(rsa);
434 
435 	len = MIN(addrend, MIN(lsin6->sin6_len, rsin6->sin6_len));
436 
437 	if (len > addrofs &&
438 	    (rc = memcmp(&lsin6->sin6_addr, &rsin6->sin6_addr,
439 	                  len - addrofs)) != 0)
440 		return rc;
441 
442 	return lsin6->sin6_len - rsin6->sin6_len;
443 }
444 
445 /*
446  * Internet configuration info
447  */
/*
 * Default for IPV6FORWARDING when the configuration did not set it:
 * 1 (forward IP6 packets not for us) if GATEWAY6 is defined,
 * 0 (don't forward IP6 packets not for us) otherwise.
 */
#if !defined(IPV6FORWARDING)
# if defined(GATEWAY6)
#  define IPV6FORWARDING	1
# else
#  define IPV6FORWARDING	0
# endif /* GATEWAY6 */
#endif /* !IPV6FORWARDING */
455 
456 int	ip6_forwarding = IPV6FORWARDING;	/* act as router? */
457 int	ip6_sendredirects = 1;
458 int	ip6_defhlim = IPV6_DEFHLIM;
459 int	ip6_defmcasthlim = IPV6_DEFAULT_MULTICAST_HOPS;
460 int	ip6_accept_rtadv = 0;	/* "IPV6FORWARDING ? 0 : 1" is dangerous */
461 int	ip6_maxfragpackets = 200;
462 int	ip6_maxfrags = 200;
463 int	ip6_log_interval = 5;
464 int	ip6_hdrnestlimit = 50;	/* appropriate? */
465 int	ip6_dad_count = 1;	/* DupAddrDetectionTransmits */
466 int	ip6_auto_flowlabel = 1;
467 int	ip6_use_deprecated = 1;	/* allow deprecated addr (RFC2462 5.5.4) */
468 int	ip6_rr_prune = 5;	/* router renumbering prefix
469 				 * walk list every 5 sec. */
470 int	ip6_mcast_pmtu = 0;	/* enable pMTU discovery for multicast? */
471 int	ip6_v6only = 1;
472 
473 int	ip6_keepfaith = 0;
474 time_t	ip6_log_time = (time_t)0L;
475 
/*
 * icmp6
 *
 * BSDI4 defines these variables in in_proto.c...
 * XXX: what if we don't define INET? Should we define pmtu6_expire
 * or so? (jinmei@kame.net 19990310)
 */
int pmtu_expire = 10 * 60;	/* 600 */
483 
484 /* raw IP6 parameters */
485 /*
486  * Nominal space allocated to a raw ip socket.
487  */
488 #define	RIPV6SNDQ	8192
489 #define	RIPV6RCVQ	8192
490 
491 u_long	rip6_sendspace = RIPV6SNDQ;
492 u_long	rip6_recvspace = RIPV6RCVQ;
493 
/* ICMPV6 parameters */
/* accept and process redirects */
int	icmp6_rediraccept = 1;
/* 10 minutes */
int	icmp6_redirtimeout = 60 * 10;
/* 100pps */
int	icmp6errppslim = 100;
/* enable/disable NI response */
int	icmp6_nodeinfo = 1;
499 
/* UDP on IP6 parameters */
/* really max datagram size */
int	udp6_sendspace = 9216;
/* 40 1K datagrams, each with room for a struct sockaddr_in6 */
int	udp6_recvspace = (1024 + sizeof(struct sockaddr_in6)) * 40;
503 					/* 40 1K datagrams */
504