xref: /netbsd-src/sys/netinet6/in6_proto.c (revision 6d322f2f4598f0d8a138f10ea648ec4fabe41f8b)
1 /*	$NetBSD: in6_proto.c,v 1.100 2014/01/02 18:29:01 pooka Exp $	*/
2 /*	$KAME: in6_proto.c,v 1.66 2000/10/10 15:35:47 itojun Exp $	*/
3 
4 /*
5  * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
6  * All rights reserved.
7  *
8  * Redistribution and use in source and binary forms, with or without
9  * modification, are permitted provided that the following conditions
10  * are met:
11  * 1. Redistributions of source code must retain the above copyright
12  *    notice, this list of conditions and the following disclaimer.
13  * 2. Redistributions in binary form must reproduce the above copyright
14  *    notice, this list of conditions and the following disclaimer in the
15  *    documentation and/or other materials provided with the distribution.
16  * 3. Neither the name of the project nor the names of its contributors
17  *    may be used to endorse or promote products derived from this software
18  *    without specific prior written permission.
19  *
20  * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND
21  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
22  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
23  * ARE DISCLAIMED.  IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE
24  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
25  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
26  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
28  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
29  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
30  * SUCH DAMAGE.
31  */
32 
33 /*
34  * Copyright (c) 1982, 1986, 1993
35  *	The Regents of the University of California.  All rights reserved.
36  *
37  * Redistribution and use in source and binary forms, with or without
38  * modification, are permitted provided that the following conditions
39  * are met:
40  * 1. Redistributions of source code must retain the above copyright
41  *    notice, this list of conditions and the following disclaimer.
42  * 2. Redistributions in binary form must reproduce the above copyright
43  *    notice, this list of conditions and the following disclaimer in the
44  *    documentation and/or other materials provided with the distribution.
45  * 3. Neither the name of the University nor the names of its contributors
46  *    may be used to endorse or promote products derived from this software
47  *    without specific prior written permission.
48  *
49  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
50  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
51  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
52  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
53  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
54  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
55  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
56  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
57  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
58  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
59  * SUCH DAMAGE.
60  *
61  *	@(#)in_proto.c	8.1 (Berkeley) 6/10/93
62  */
63 
64 #include <sys/cdefs.h>
65 __KERNEL_RCSID(0, "$NetBSD: in6_proto.c,v 1.100 2014/01/02 18:29:01 pooka Exp $");
66 
67 #include "opt_gateway.h"
68 #include "opt_inet.h"
69 #include "opt_ipsec.h"
70 
71 #include <sys/param.h>
72 #include <sys/socket.h>
73 #include <sys/protosw.h>
74 #include <sys/kernel.h>
75 #include <sys/domain.h>
76 #include <sys/mbuf.h>
77 
78 #include <net/if.h>
79 #include <net/radix.h>
80 #include <net/route.h>
81 
82 #include <netinet/in.h>
83 #include <netinet/in_systm.h>
84 #include <netinet/in_var.h>
85 #include <netinet/ip_encap.h>
86 #include <netinet/ip.h>
87 #include <netinet/ip_var.h>
88 #include <netinet/in_pcb.h>
89 #include <netinet/ip6.h>
90 #include <netinet6/ip6_var.h>
91 #include <netinet/icmp6.h>
92 #include <netinet6/in6_pcb.h>
93 
94 #include <netinet/tcp.h>
95 #include <netinet/tcp_fsm.h>
96 #include <netinet/tcp_seq.h>
97 #include <netinet/tcp_timer.h>
98 #include <netinet/tcp_var.h>
99 #include <netinet/tcpip.h>
100 #include <netinet/tcp_debug.h>
101 
102 #include <netinet6/udp6.h>
103 #include <netinet6/udp6_var.h>
104 
105 #include <netinet6/pim6_var.h>
106 
107 #include <netinet6/nd6.h>
108 
109 #ifdef IPSEC
110 #include <netipsec/ipsec.h>
111 #include <netipsec/ipsec6.h>
112 #include <netipsec/key.h>
113 #endif /* IPSEC */
114 
115 
116 #include "carp.h"
117 #if NCARP > 0
118 #include <netinet/ip_carp.h>
119 #endif
120 
121 #include "etherip.h"
122 #if NETHERIP > 0
123 #include <netinet6/ip6_etherip.h>
124 #endif
125 
126 #include <netinet6/ip6protosw.h>
127 
128 #include <net/net_osdep.h>
129 
130 /*
131  * TCP/IP protocol family: IP6, ICMP6, UDP, TCP.
132  */
133 
134 DOMAIN_DEFINE(inet6domain);	/* forward declare and add to link set */
135 
136 /* Wrappers to acquire kernel_lock. */
/*
 * Every PR_WRAP_*() invocation below is paired with a #define that
 * redirects the plain handler name to <name>_wrapper.  Because the
 * #defines precede inet6sw[], the handler names used in that table's
 * initializers resolve to the wrapper variants.
 * NOTE(review): the PR_WRAP_* macros are defined outside this file
 * (presumably <sys/protosw.h>); confirm there exactly what they emit.
 */
137 
138 PR_WRAP_USRREQ(rip6_usrreq)
139 PR_WRAP_USRREQ(udp6_usrreq)
140 PR_WRAP_USRREQ(tcp_usrreq)
141 
142 #define	rip6_usrreq 	rip6_usrreq_wrapper
143 #define	udp6_usrreq 	udp6_usrreq_wrapper
144 #define	tcp_usrreq 	tcp_usrreq_wrapper
145 
146 PR_WRAP_CTLINPUT(rip6_ctlinput)
147 PR_WRAP_CTLINPUT(encap6_ctlinput)
148 PR_WRAP_CTLINPUT(udp6_ctlinput)
149 PR_WRAP_CTLINPUT(tcp6_ctlinput)
150 
151 #define	rip6_ctlinput	rip6_ctlinput_wrapper
152 #define	encap6_ctlinput	encap6_ctlinput_wrapper
153 #define	udp6_ctlinput	udp6_ctlinput_wrapper
154 #define	tcp6_ctlinput	tcp6_ctlinput_wrapper
155 
156 PR_WRAP_CTLOUTPUT(rip6_ctloutput)
157 PR_WRAP_CTLOUTPUT(tcp_ctloutput)
158 PR_WRAP_CTLOUTPUT(udp6_ctloutput)
159 PR_WRAP_CTLOUTPUT(icmp6_ctloutput)
160 
161 #define	rip6_ctloutput	rip6_ctloutput_wrapper
162 #define	tcp_ctloutput	tcp_ctloutput_wrapper
163 #define	udp6_ctloutput	udp6_ctloutput_wrapper
164 #define	icmp6_ctloutput	icmp6_ctloutput_wrapper
165 
/*
 * The AH and ESP control-input handlers are wrapped only when IPSEC is
 * configured.  The two identical "#if defined(IPSEC)" guards are kept
 * separate, one per protocol.
 */
166 #if defined(IPSEC)
167 PR_WRAP_CTLINPUT(ah6_ctlinput)
168 
169 #define	ah6_ctlinput	ah6_ctlinput_wrapper
170 #endif
171 
172 #if defined(IPSEC)
173 PR_WRAP_CTLINPUT(esp6_ctlinput)
174 
175 #define	esp6_ctlinput	esp6_ctlinput_wrapper
176 #endif
177 
/*
 * tcp6_init: pr_init hook of the IPPROTO_TCP entry in inet6sw[].
 *
 * Hands tcp6_mtudisc_callback to icmp6_mtudisc_callback_register() and
 * then calls tcp_init_common() with the size of struct ip6_hdr.
 * NOTE(review): the size argument is presumably the base IP header
 * length the shared TCP initialization should assume; confirm against
 * tcp_init_common().
 */
178 static void
179 tcp6_init(void)
180 {
181 
182 	icmp6_mtudisc_callback_register(tcp6_mtudisc_callback);
183 
184 	tcp_init_common(sizeof(struct ip6_hdr));
185 }
186 
/*
 * inet6sw: protocol switch table of the inet6 domain.
 *
 * Each element describes one protocol: its socket type (if any), protocol
 * number, flags and the handlers to call.  inet6domain.dom_protosw and
 * inet6domain.dom_protoswNPROTOSW point at the first element and one past
 * the last element of this array.
 *
 * Entries guarded by GATEWAY, IPSEC, INET, NETHERIP and NCARP exist only
 * when the corresponding option is configured.  Handler names that have a
 * PR_WRAP_* / #define pair earlier in this file resolve to their
 * *_wrapper variants here.
 */
187 const struct ip6protosw inet6sw[] = {
/* IPv6 itself: no socket type; init plus the frag6 timers and drain hook. */
188 {	.pr_domain = &inet6domain,
189 	.pr_protocol = IPPROTO_IPV6,
190 	.pr_init = ip6_init,
191 	.pr_fasttimo = frag6_fasttimo,
192 	.pr_slowtimo = frag6_slowtimo,
193 	.pr_drain = frag6_drainstub,
194 },
/* UDP over IPv6 (datagram sockets). */
195 {	.pr_type = SOCK_DGRAM,
196 	.pr_domain = &inet6domain,
197 	.pr_protocol = IPPROTO_UDP,
198 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_PURGEIF,
199 	.pr_input = udp6_input,
200 	.pr_ctlinput = udp6_ctlinput,
201 	.pr_ctloutput = udp6_ctloutput,
202 	.pr_usrreq = udp6_usrreq,
203 	.pr_init = udp6_init,
204 },
/* TCP over IPv6 (stream sockets); initialized through tcp6_init(). */
205 {	.pr_type = SOCK_STREAM,
206 	.pr_domain = &inet6domain,
207 	.pr_protocol = IPPROTO_TCP,
208 	.pr_flags = PR_CONNREQUIRED|PR_WANTRCVD|PR_LISTEN|PR_ABRTACPTDIS|PR_PURGEIF,
209 	.pr_input = tcp6_input,
210 	.pr_ctlinput = tcp6_ctlinput,
211 	.pr_ctloutput = tcp_ctloutput,
212 	.pr_usrreq = tcp_usrreq,
213 	.pr_init = tcp6_init,
214 	.pr_fasttimo = tcp_fasttimo,
215 	.pr_drain = tcp_drainstub,
216 },
/* Raw IPv6 sockets for IPPROTO_RAW. */
217 {	.pr_type = SOCK_RAW,
218 	.pr_domain = &inet6domain,
219 	.pr_protocol = IPPROTO_RAW,
220 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_PURGEIF,
221 	.pr_input = rip6_input,
222 	.pr_output = rip6_output,
223 	.pr_ctlinput = rip6_ctlinput,
224 	.pr_ctloutput = rip6_ctloutput,
225 	.pr_usrreq = rip6_usrreq,
226 },
/*
 * With GATEWAY: a second IPPROTO_IPV6 entry that carries only the ip6flow
 * pool init and slow timer.
 */
227 #ifdef GATEWAY
228 {	.pr_domain = &inet6domain,
229 	.pr_protocol = IPPROTO_IPV6,
230 	.pr_slowtimo = ip6flow_slowtimo,
231 	.pr_init = ip6flow_poolinit,
232 },
233 #endif /* GATEWAY */
/* ICMPv6: input via icmp6_input, user requests via the raw (rip6) code. */
234 {	.pr_type = SOCK_RAW,
235 	.pr_domain = &inet6domain,
236 	.pr_protocol = IPPROTO_ICMPV6,
237 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
238 	.pr_input = icmp6_input,
239 	.pr_output = rip6_output,
240 	.pr_ctlinput = rip6_ctlinput,
241 	.pr_ctloutput = icmp6_ctloutput,
242 	.pr_usrreq = rip6_usrreq,
243 	.pr_init = icmp6_init,
244 },
/*
 * Destination options, routing and fragment headers: input handlers only,
 * and none of them carries PR_LASTHDR.
 */
245 {	.pr_type = SOCK_RAW,
246 	.pr_domain = &inet6domain,
247 	.pr_protocol = IPPROTO_DSTOPTS,
248 	.pr_flags = PR_ATOMIC|PR_ADDR,
249 	.pr_input = dest6_input,
250 },
251 {	.pr_type = SOCK_RAW,
252 	.pr_domain = &inet6domain,
253 	.pr_protocol = IPPROTO_ROUTING,
254 	.pr_flags = PR_ATOMIC|PR_ADDR,
255 	.pr_input = route6_input,
256 },
257 {	.pr_type = SOCK_RAW,
258 	.pr_domain = &inet6domain,
259 	.pr_protocol = IPPROTO_FRAGMENT,
260 	.pr_flags = PR_ATOMIC|PR_ADDR,
261 	.pr_input = frag6_input,
262 },
/*
 * With IPSEC: AH, ESP and IPCOMP all use ipsec6_common_input; only AH and
 * ESP have a control-input handler.
 */
263 #ifdef IPSEC
264 {	.pr_type = SOCK_RAW,
265 	.pr_domain = &inet6domain,
266 	.pr_protocol = IPPROTO_AH,
267 	.pr_flags = PR_ATOMIC|PR_ADDR,
268 	.pr_input = ipsec6_common_input,
269 	.pr_ctlinput = ah6_ctlinput,
270 },
271 {	.pr_type = SOCK_RAW,
272 	.pr_domain = &inet6domain,
273 	.pr_protocol = IPPROTO_ESP,
274 	.pr_flags = PR_ATOMIC|PR_ADDR,
275 	.pr_input = ipsec6_common_input,
276 	.pr_ctlinput = esp6_ctlinput,
277 },
278 {	.pr_type = SOCK_RAW,
279 	.pr_domain = &inet6domain,
280 	.pr_protocol = IPPROTO_IPCOMP,
281 	.pr_flags = PR_ATOMIC|PR_ADDR,
282 	.pr_input = ipsec6_common_input,
283 },
284 #endif /* IPSEC */
/*
 * Encapsulated payloads (IPPROTO_IPV4 only with INET, IPPROTO_IPV6
 * always): both entries use encap6_input and name encap_init as pr_init.
 * NOTE(review): with INET defined encap_init is listed twice; confirm it
 * tolerates being called more than once.
 */
285 #ifdef INET
286 {	.pr_type = SOCK_RAW,
287 	.pr_domain = &inet6domain,
288 	.pr_protocol = IPPROTO_IPV4,
289 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
290 	.pr_input = encap6_input,
291 	.pr_output = rip6_output,
292 	.pr_ctlinput = encap6_ctlinput,
293 	.pr_ctloutput = rip6_ctloutput,
294 	.pr_usrreq = rip6_usrreq,
295 	.pr_init = encap_init,
296 },
297 #endif
298 {	.pr_type = SOCK_RAW,
299 	.pr_domain = &inet6domain,
300 	.pr_protocol = IPPROTO_IPV6,
301 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
302 	.pr_input = encap6_input,
303 	.pr_output = rip6_output,
304 	.pr_ctlinput = encap6_ctlinput,
305 	.pr_ctloutput = rip6_ctloutput,
306 	.pr_usrreq = rip6_usrreq,
307 	.pr_init = encap_init,
308 },
/* EtherIP, only when at least one etherip device is configured. */
309 #if NETHERIP > 0
310 {	.pr_type = SOCK_RAW,
311 	.pr_domain = &inet6domain,
312 	.pr_protocol = IPPROTO_ETHERIP,
313 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
314 	.pr_input = ip6_etherip_input,
315 	.pr_output = rip6_output,
316 	.pr_ctlinput = rip6_ctlinput,
317 	.pr_ctloutput = rip6_ctloutput,
318 	.pr_usrreq = rip6_usrreq,
319 },
320 #endif
/* CARP, only when at least one carp device is configured. */
321 #if NCARP > 0
322 {	.pr_type = SOCK_RAW,
323 	.pr_domain = &inet6domain,
324 	.pr_protocol = IPPROTO_CARP,
325 	.pr_flags = PR_ATOMIC|PR_ADDR,
326 	.pr_input = carp6_proto_input,
327 	.pr_output = rip6_output,
328 	.pr_ctloutput = rip6_ctloutput,
329 	.pr_usrreq = rip6_usrreq,
330 },
331 #endif /* NCARP */
/* PIM: input via pim6_input, everything else via the raw (rip6) code. */
332 {	.pr_type = SOCK_RAW,
333 	.pr_domain = &inet6domain,
334 	.pr_protocol = IPPROTO_PIM,
335 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
336 	.pr_input = pim6_input,
337 	.pr_output = rip6_output,
338 	.pr_ctloutput = rip6_ctloutput,
339 	.pr_usrreq = rip6_usrreq,
340 	.pr_init = pim6_init,
341 },
/*
 * The wildcard entry sets no .pr_protocol (so it is zero-initialized) and
 * is the only entry that names rip6_init as pr_init.
 */
342 /* raw wildcard */
343 {	.pr_type = SOCK_RAW,
344 	.pr_domain = &inet6domain,
345 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
346 	.pr_input = rip6_input,
347 	.pr_output = rip6_output,
348 	.pr_ctloutput = rip6_ctloutput,
349 	.pr_usrreq = rip6_usrreq,
350 	.pr_init = rip6_init,
351 },
352 };
353 
/*
 * in6_any: constant AF_INET6 socket address holding IN6ADDR_ANY_INIT with
 * port, flow info and scope id all zero.  inet6domain.dom_sa_any points
 * at it.
 */
354 static const struct sockaddr_in6 in6_any = {
355 	  .sin6_len = sizeof(in6_any)
356 	, .sin6_family = AF_INET6
357 	, .sin6_port = 0
358 	, .sin6_flowinfo = 0
359 	, .sin6_addr = IN6ADDR_ANY_INIT
360 	, .sin6_scope_id = 0
361 };
362 
/* False until in6_init() has run; in6_init() sets it to true. */
363 bool in6_present = false;
/*
 * in6_init: dom_init hook of inet6domain.  Its only effect is to set
 * in6_present to true.
 */
364 static void
365 in6_init(void)
366 {
367 
368 	in6_present = true;
369 }
370 
/*
 * inet6domain: domain descriptor for AF_INET6 ("internet6").
 *
 * Ties together the protocol switch table (inet6sw[]), the routing
 * parameters, the per-interface attach/detach hooks, the ip6intrq input
 * queue and the sockaddr comparison/externalization parameters of this
 * address family.
 */
371 struct domain inet6domain = {
372 	.dom_family = AF_INET6, .dom_name = "internet6",
373 	.dom_init = in6_init, .dom_externalize = NULL, .dom_dispose = NULL,
	/* [dom_protosw, dom_protoswNPROTOSW) spans all of inet6sw[]. */
374 	.dom_protosw = (const struct protosw *)inet6sw,
375 	.dom_protoswNPROTOSW = (const struct protosw *)&inet6sw[sizeof(inet6sw)/sizeof(inet6sw[0])],
376 	.dom_rtattach = rt_inithead,
	/* Byte offset of sin6_addr times 8 (<< 3), i.e. its offset in bits. */
377 	.dom_rtoffset = offsetof(struct sockaddr_in6, sin6_addr) << 3,
378 	.dom_maxrtkey = sizeof(struct ip_pack6),
379 	.dom_ifattach = in6_domifattach, .dom_ifdetach = in6_domifdetach,
380 	.dom_ifqueues = { &ip6intrq, NULL },
381 	.dom_link = { NULL },
382 	.dom_mowner = MOWNER_INIT("",""),
	/* Comparison window: exactly the sin6_addr field of a sockaddr_in6. */
383 	.dom_sa_cmpofs = offsetof(struct sockaddr_in6, sin6_addr),
384 	.dom_sa_cmplen = sizeof(struct in6_addr),
385 	.dom_sa_any = (const struct sockaddr *)&in6_any,
386 	.dom_sockaddr_externalize = sockaddr_in6_externalize,
387 	.dom_rtcache = LIST_HEAD_INITIALIZER(inet6domain.dom_rtcache)
388 };
389 
390 #if 0
/*
 * sockaddr_in6_cmp (compiled out by the surrounding #if 0).
 *
 * Compares two IPv6 socket addresses on the part of sin6_addr that both
 * of them actually contain, as bounded by their sin6_len fields.
 *
 * lsa, rsa: socket addresses, converted with satocsin6().
 * Returns the memcmp() result when the compared address bytes differ;
 * otherwise lsa's sin6_len minus rsa's sin6_len, which is 0 only when
 * the two lengths are also equal.
 */
391 int
392 sockaddr_in6_cmp(const struct sockaddr *lsa, const struct sockaddr *rsa)
393 {
394 	uint_fast8_t len;
395 	const uint_fast8_t addrofs = offsetof(struct sockaddr_in6, sin6_addr),
396 			   addrend = addrofs + sizeof(struct in6_addr);
397 	int rc;
398 	const struct sockaddr_in6 *lsin6, *rsin6;
399 
400 	lsin6 = satocsin6(lsa);
401 	rsin6 = satocsin6(rsa);
402 
	/* Never look past the end of sin6_addr or past the shorter sockaddr. */
403 	len = MIN(addrend, MIN(lsin6->sin6_len, rsin6->sin6_len));
404 
	/* Skip the memcmp() when either sockaddr ends at or before sin6_addr. */
405 	if (len > addrofs &&
406 	    (rc = memcmp(&lsin6->sin6_addr, &rsin6->sin6_addr,
407 	                  len - addrofs)) != 0)
408 		return rc;
409 
410 	return lsin6->sin6_len - rsin6->sin6_len;
411 }
412 #endif
413 
414 /*
415  * Internet configuration info
416  */
/*
 * Compile-time default for ip6_forwarding: an IPV6FORWARDING value that
 * is already defined wins; otherwise it is 1 when GATEWAY6 is defined and
 * 0 when it is not.
 * NOTE(review): this tests GATEWAY6, while the ip6flow entry in inet6sw[]
 * tests GATEWAY; confirm that both option names are intended.
 */
417 #ifndef	IPV6FORWARDING
418 #ifdef GATEWAY6
419 #define	IPV6FORWARDING	1	/* forward IP6 packets not for us */
420 #else
421 #define	IPV6FORWARDING	0	/* don't forward IP6 packets not for us */
422 #endif /* GATEWAY6 */
423 #endif /* !IPV6FORWARDING */
424 
/*
 * Initial values of the IPv6 tunables.  They are only defined here; the
 * code that reads or changes them lives outside this file.
 */
425 int	ip6_forwarding = IPV6FORWARDING;	/* act as router? */
426 int	ip6_sendredirects = 1;
/* Default hop limits come from IPV6_DEFHLIM and IPV6_DEFAULT_MULTICAST_HOPS. */
427 int	ip6_defhlim = IPV6_DEFHLIM;
428 int	ip6_defmcasthlim = IPV6_DEFAULT_MULTICAST_HOPS;
429 int	ip6_accept_rtadv = 0;	/* "IPV6FORWARDING ? 0 : 1" is dangerous */
/* NOTE(review): presumably limits on the fragment reassembly queue; confirm in frag6. */
430 int	ip6_maxfragpackets = 200;
431 int	ip6_maxfrags = 200;
432 int	ip6_log_interval = 5;
433 int	ip6_hdrnestlimit = 50;	/* appropriate? */
434 int	ip6_dad_count = 1;	/* DupAddrDetectionTransmits */
435 int	ip6_auto_flowlabel = 1;
436 int	ip6_use_deprecated = 1;	/* allow deprecated addr (RFC2462 5.5.4) */
437 int	ip6_rr_prune = 5;	/* router renumbering prefix
438 				 * walk list every 5 sec. */
439 int	ip6_mcast_pmtu = 0;	/* enable pMTU discovery for multicast? */
440 int	ip6_v6only = 1;
441 int     ip6_neighborgcthresh = 2048; /* Threshold # of NDP entries for GC */
442 int     ip6_maxifprefixes = 16; /* Max acceptable prefixes via RA per IF */
443 int     ip6_maxifdefrouters = 16; /* Max acceptable def routers via RA */
444 int     ip6_maxdynroutes = 4096; /* Max # of routes created via redirect */
445 
446 int	ip6_keepfaith = 0;
447 time_t	ip6_log_time = 0;
448 int	ip6_rtadv_maxroutes = 100; /* (arbitrary) initial maximum number of
449                                     * routes via rtadv expected to be
450                                     * significantly larger than common use.
451                                     * if you need to count: 3 extra initial
452                                     * routes, plus 1 per interface after the
453                                     * first one, then one per non-linklocal
454                                     * prefix */
455 
456 /* icmp6 */
457 /*
458  * BSDI4 defines these variables in in_proto.c...
459  * XXX: what if we don't define INET? Should we define pmtu6_expire
460  * or so? (jinmei@kame.net 19990310)
461  */
/*
 * 60*10 = 600.
 * NOTE(review): presumably seconds (10 minutes), like icmp6_redirtimeout
 * further down; confirm at the point of use.
 */
462 int pmtu_expire = 60*10;
463 
464 /* raw IP6 parameters */
465 /*
466  * Nominal space allocated to a raw ip socket.
467  */
468 #define	RIPV6SNDQ	8192
469 #define	RIPV6RCVQ	8192
470 
/* Send and receive defaults for raw IPv6 sockets, both 8192. */
471 u_long	rip6_sendspace = RIPV6SNDQ;
472 u_long	rip6_recvspace = RIPV6RCVQ;
473 
474 /* ICMPV6 parameters */
475 int	icmp6_rediraccept = 1;		/* accept and process redirects */
476 int	icmp6_redirtimeout = 10 * 60;	/* 10 minutes */
477 int	icmp6errppslim = 100;		/* 100pps */
478 int	icmp6_nodeinfo = 1;		/* enable/disable NI response */
479 
480 /* UDP on IP6 parameters */
481 int	udp6_sendspace = 9216;		/* really max datagram size */
/* Each of the 40 slots is 1024 bytes plus the size of one sockaddr_in6. */
482 int	udp6_recvspace = 40 * (1024 + sizeof(struct sockaddr_in6));
483 					/* 40 1K datagrams */
484