xref: /netbsd-src/sys/netinet6/in6_proto.c (revision 8b0f9554ff8762542c4defc4f70e1eb76fb508fa)
1 /*	$NetBSD: in6_proto.c,v 1.79 2007/09/19 04:33:44 dyoung Exp $	*/
2 /*	$KAME: in6_proto.c,v 1.66 2000/10/10 15:35:47 itojun Exp $	*/
3 
4 /*
5  * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
6  * All rights reserved.
7  *
8  * Redistribution and use in source and binary forms, with or without
9  * modification, are permitted provided that the following conditions
10  * are met:
11  * 1. Redistributions of source code must retain the above copyright
12  *    notice, this list of conditions and the following disclaimer.
13  * 2. Redistributions in binary form must reproduce the above copyright
14  *    notice, this list of conditions and the following disclaimer in the
15  *    documentation and/or other materials provided with the distribution.
16  * 3. Neither the name of the project nor the names of its contributors
17  *    may be used to endorse or promote products derived from this software
18  *    without specific prior written permission.
19  *
20  * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND
21  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
22  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
23  * ARE DISCLAIMED.  IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE
24  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
25  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
26  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
28  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
29  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
30  * SUCH DAMAGE.
31  */
32 
33 /*
34  * Copyright (c) 1982, 1986, 1993
35  *	The Regents of the University of California.  All rights reserved.
36  *
37  * Redistribution and use in source and binary forms, with or without
38  * modification, are permitted provided that the following conditions
39  * are met:
40  * 1. Redistributions of source code must retain the above copyright
41  *    notice, this list of conditions and the following disclaimer.
42  * 2. Redistributions in binary form must reproduce the above copyright
43  *    notice, this list of conditions and the following disclaimer in the
44  *    documentation and/or other materials provided with the distribution.
45  * 3. Neither the name of the University nor the names of its contributors
46  *    may be used to endorse or promote products derived from this software
47  *    without specific prior written permission.
48  *
49  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
50  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
51  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
52  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
53  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
54  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
55  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
56  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
57  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
58  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
59  * SUCH DAMAGE.
60  *
61  *	@(#)in_proto.c	8.1 (Berkeley) 6/10/93
62  */
63 
64 #include <sys/cdefs.h>
65 __KERNEL_RCSID(0, "$NetBSD: in6_proto.c,v 1.79 2007/09/19 04:33:44 dyoung Exp $");
66 
67 #include "opt_inet.h"
68 #include "opt_ipsec.h"
69 #include "opt_iso.h"
70 
71 #include <sys/param.h>
72 #include <sys/socket.h>
73 #include <sys/protosw.h>
74 #include <sys/kernel.h>
75 #include <sys/domain.h>
76 #include <sys/mbuf.h>
77 
78 #include <net/if.h>
79 #include <net/radix.h>
80 #include <net/route.h>
81 
82 #include <netinet/in.h>
83 #include <netinet/in_systm.h>
84 #include <netinet/in_var.h>
85 #include <netinet/ip_encap.h>
86 #include <netinet/ip.h>
87 #include <netinet/ip_var.h>
88 #include <netinet/in_pcb.h>
89 #include <netinet/ip6.h>
90 #include <netinet6/ip6_var.h>
91 #include <netinet/icmp6.h>
92 #include <netinet6/in6_pcb.h>
93 
94 #include <netinet/tcp.h>
95 #include <netinet/tcp_fsm.h>
96 #include <netinet/tcp_seq.h>
97 #include <netinet/tcp_timer.h>
98 #include <netinet/tcp_var.h>
99 #include <netinet/tcpip.h>
100 #include <netinet/tcp_debug.h>
101 
102 #include <netinet6/udp6.h>
103 #include <netinet6/udp6_var.h>
104 
105 #include <netinet6/pim6_var.h>
106 
107 #include <netinet6/nd6.h>
108 
109 #ifdef IPSEC
110 #include <netinet6/ipsec.h>
111 #include <netinet6/ah.h>
112 #ifdef IPSEC_ESP
113 #include <netinet6/esp.h>
114 #endif
115 #include <netinet6/ipcomp.h>
116 #endif /* IPSEC */
117 
118 #ifdef FAST_IPSEC
119 #include <netipsec/ipsec.h>
120 #include <netipsec/ipsec6.h>
121 #include <netipsec/key.h>
122 #endif /* FAST_IPSEC */
123 
124 
125 #include "carp.h"
126 #if NCARP > 0
127 #include <netinet/ip_carp.h>
128 #endif
129 
#include "etherip.h"
#if NETHERIP > 0
#include <netinet6/ip6_etherip.h>
#endif
134 
135 #include <netinet6/ip6protosw.h>
136 
137 #include <net/net_osdep.h>
138 
/*
 * Fallback offsetof() for environments whose headers have not already
 * provided one: yields the byte offset of `member' within `type' by
 * taking the member's address relative to a null `type' pointer.
 */
#if !defined(offsetof)		/* XXX */
#define	offsetof(type, member)	((size_t)&(((type *)0)->member))
#endif
142 
143 /*
144  * TCP/IP protocol family: IP6, ICMP6, UDP, TCP.
145  */
146 
147 DOMAIN_DEFINE(inet6domain);	/* forward declare and add to link set */
148 
149 const struct ip6protosw inet6sw[] = {
150 {	.pr_domain = &inet6domain,
151 	.pr_protocol = IPPROTO_IPV6,
152 	.pr_init = ip6_init,
153 	.pr_slowtimo = frag6_slowtimo,
154 	.pr_drain = frag6_drain,
155 },
156 {	.pr_type = SOCK_DGRAM,
157 	.pr_domain = &inet6domain,
158 	.pr_protocol = IPPROTO_UDP,
159 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_PURGEIF,
160 	.pr_input = udp6_input,
161 	.pr_ctlinput = udp6_ctlinput,
162 	.pr_ctloutput = ip6_ctloutput,
163 	.pr_usrreq = udp6_usrreq,
164 	.pr_init = udp6_init,
165 },
166 {	.pr_type = SOCK_STREAM,
167 	.pr_domain = &inet6domain,
168 	.pr_protocol = IPPROTO_TCP,
169 	.pr_flags = PR_CONNREQUIRED|PR_WANTRCVD|PR_LISTEN|PR_ABRTACPTDIS|PR_PURGEIF,
170 	.pr_input = tcp6_input,
171 	.pr_ctlinput = tcp6_ctlinput,
172 	.pr_ctloutput = tcp_ctloutput,
173 	.pr_usrreq = tcp_usrreq,
174 #ifndef INET	/* don't call initialization and timeout routines twice */
175 	.pr_init = tcp_init,
176 	.pr_slowtimo = tcp_slowtimo,
177 	.pr_drain = tcp_drain,
178 #endif
179 },
180 {	.pr_type = SOCK_RAW,
181 	.pr_domain = &inet6domain,
182 	.pr_protocol = IPPROTO_RAW,
183 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_PURGEIF,
184 	.pr_input = rip6_input,
185 	.pr_output = rip6_output,
186 	.pr_ctlinput = rip6_ctlinput,
187 	.pr_ctloutput = rip6_ctloutput,
188 	.pr_usrreq = rip6_usrreq,
189 },
190 #ifdef GATEWAY
191 {	.pr_domain = &inet6domain,
192 	.pr_protocol = IPPROTO_IPV6,
193 	.pr_slowtimo = ip6flow_slowtimo,
194 },
195 #endif /* GATEWAY */
196 {	.pr_type = SOCK_RAW,
197 	.pr_domain = &inet6domain,
198 	.pr_protocol = IPPROTO_ICMPV6,
199 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
200 	.pr_input = icmp6_input,
201 	.pr_output = rip6_output,
202 	.pr_ctlinput = rip6_ctlinput,
203 	.pr_ctloutput = icmp6_ctloutput,
204 	.pr_usrreq = rip6_usrreq,
205 	.pr_init = icmp6_init,
206 },
207 {	.pr_type = SOCK_RAW,
208 	.pr_domain = &inet6domain,
209 	.pr_protocol = IPPROTO_DSTOPTS,
210 	.pr_flags = PR_ATOMIC|PR_ADDR,
211 	.pr_input = dest6_input,
212 },
213 {	.pr_type = SOCK_RAW,
214 	.pr_domain = &inet6domain,
215 	.pr_protocol = IPPROTO_ROUTING,
216 	.pr_flags = PR_ATOMIC|PR_ADDR,
217 	.pr_input = route6_input,
218 },
219 {	.pr_type = SOCK_RAW,
220 	.pr_domain = &inet6domain,
221 	.pr_protocol = IPPROTO_FRAGMENT,
222 	.pr_flags = PR_ATOMIC|PR_ADDR,
223 	.pr_input = frag6_input,
224 },
225 #ifdef IPSEC
226 {	.pr_type = SOCK_RAW,
227 	.pr_domain = &inet6domain,
228 	.pr_protocol = IPPROTO_AH,
229 	.pr_flags = PR_ATOMIC|PR_ADDR,
230 	.pr_input = ah6_input,
231 	.pr_ctlinput = ah6_ctlinput,
232 },
233 #ifdef IPSEC_ESP
234 {	.pr_type = SOCK_RAW,
235 	.pr_domain = &inet6domain,
236 	.pr_protocol = IPPROTO_ESP,
237 	.pr_flags = PR_ATOMIC|PR_ADDR,
238 	.pr_input = esp6_input,
239 	.pr_ctlinput = esp6_ctlinput,
240 },
241 #endif
242 {	.pr_type = SOCK_RAW,
243 	.pr_domain = &inet6domain,
244 	.pr_protocol = IPPROTO_IPCOMP,
245 	.pr_flags = PR_ATOMIC|PR_ADDR,
246 	.pr_input = ipcomp6_input,
247 },
248 #endif /* IPSEC */
249 #ifdef FAST_IPSEC
250 {	.pr_type = SOCK_RAW,
251 	.pr_domain = &inet6domain,
252 	.pr_protocol = IPPROTO_AH,
253 	.pr_flags = PR_ATOMIC|PR_ADDR,
254 	.pr_input = ipsec6_common_input,
255 	.pr_ctlinput = ah6_ctlinput,
256 },
257 {	.pr_type = SOCK_RAW,
258 	.pr_domain = &inet6domain,
259 	.pr_protocol = IPPROTO_ESP,
260 	.pr_flags = PR_ATOMIC|PR_ADDR,
261 	.pr_input = ipsec6_common_input,
262 	.pr_ctlinput = esp6_ctlinput,
263 },
264 {	.pr_type = SOCK_RAW,
265 	.pr_domain = &inet6domain,
266 	.pr_protocol = IPPROTO_IPCOMP,
267 	.pr_flags = PR_ATOMIC|PR_ADDR,
268 	.pr_input = ipsec6_common_input,
269 },
270 #endif /* FAST_IPSEC */
271 #ifdef INET
272 {	.pr_type = SOCK_RAW,
273 	.pr_domain = &inet6domain,
274 	.pr_protocol = IPPROTO_IPV4,
275 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
276 	.pr_input = encap6_input,
277 	.pr_output = rip6_output,
278 	.pr_ctlinput = encap6_ctlinput,
279 	.pr_ctloutput = rip6_ctloutput,
280 	.pr_usrreq = rip6_usrreq,
281 	.pr_init = encap_init,
282 },
283 #endif
284 {	.pr_type = SOCK_RAW,
285 	.pr_domain = &inet6domain,
286 	.pr_protocol = IPPROTO_IPV6,
287 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
288 	.pr_input = encap6_input,
289 	.pr_output = rip6_output,
290 	.pr_ctlinput = encap6_ctlinput,
291 	.pr_ctloutput = rip6_ctloutput,
292 	.pr_usrreq = rip6_usrreq,
293 	.pr_init = encap_init,
294 },
295 #if NETHERIP > 1
296 {	.pr_type = SOCK_RAW,
297 	.pr_domain = &inet6domain,
298 	.pr_protocol = IPPROTO_ETHERIP,
299 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
300 	.pr_input = ip6_etherip_input,
301 	.pr_output = rip6_output,
302 	.pr_ctlinput = rip6_ctlinput,
303 	.pr_ctloutput = rip6_ctloutput,
304 	.pr_usrreq = rip6_usrreq,
305 },
306 #endif
307 #if NCARP > 0
308 {	.pr_type = SOCK_RAW,
309 	.pr_domain = &inet6domain,
310 	.pr_protocol = IPPROTO_CARP,
311 	.pr_flags = PR_ATOMIC|PR_ADDR,
312 	.pr_input = carp6_proto_input,
313 	.pr_output = rip6_output,
314 	.pr_ctloutput = rip6_ctloutput,
315 	.pr_usrreq = rip6_usrreq,
316 },
317 #endif /* NCARP */
318 #ifdef ISO
319 {	.pr_type = SOCK_RAW,
320 	.pr_domain = &inet6domain,
321 	.pr_protocol = IPPROTO_EON,
322 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
323 	.pr_input = encap6_input,
324 	.pr_output = rip6_output,
325 	.pr_ctlinput = encap6_ctlinput,
326 	.pr_ctloutput = rip6_ctloutput,
327 	.pr_usrreq = rip6_usrreq,
328 	/*XXX*/
329 	.pr_init = encap_init,
330 },
331 #endif
332 {	.pr_type = SOCK_RAW,
333 	.pr_domain = &inet6domain,
334 	.pr_protocol = IPPROTO_PIM,
335 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
336 	.pr_input = pim6_input,
337 	.pr_output = rip6_output,
338 	.pr_ctloutput = rip6_ctloutput,
339 	.pr_usrreq = rip6_usrreq,
340 },
341 /* raw wildcard */
342 {	.pr_type = SOCK_RAW,
343 	.pr_domain = &inet6domain,
344 	.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
345 	.pr_input = rip6_input,
346 	.pr_output = rip6_output,
347 	.pr_ctloutput = rip6_ctloutput,
348 	.pr_usrreq = rip6_usrreq,
349 	.pr_init = rip6_init,
350 },
351 };
352 
353 static const struct sockaddr_in6 in6_any = {
354 	  .sin6_len = sizeof(in6_any)
355 	, .sin6_family = AF_INET6
356 	, .sin6_port = 0
357 	, .sin6_flowinfo = 0
358 	, .sin6_addr = IN6ADDR_ANY_INIT
359 	, .sin6_scope_id = 0
360 };
361 
362 struct domain inet6domain = {
363 	.dom_family = AF_INET6, .dom_name = "internet6",
364 	.dom_init = NULL, .dom_externalize = NULL, .dom_dispose = NULL,
365 	.dom_protosw = (const struct protosw *)inet6sw,
366 	.dom_protoswNPROTOSW = (const struct protosw *)&inet6sw[sizeof(inet6sw)/sizeof(inet6sw[0])],
367 	.dom_rtattach = rn_inithead,
368 	.dom_rtoffset = offsetof(struct sockaddr_in6, sin6_addr) << 3,
369 	.dom_maxrtkey = sizeof(struct sockaddr_in6),
370 	.dom_ifattach = in6_domifattach, .dom_ifdetach = in6_domifdetach,
371 	.dom_ifqueues = { &ip6intrq, NULL },
372 	.dom_link = { NULL },
373 	.dom_mowner = MOWNER_INIT("",""),
374 	.dom_sa_cmpofs = offsetof(struct sockaddr_in6, sin6_addr),
375 	.dom_sa_cmplen = sizeof(struct in6_addr),
376 	.dom_sa_any = (const struct sockaddr *)&in6_any,
377 	.dom_rtcache = LIST_HEAD_INITIALIZER(inet6domain.dom_rtcache)
378 };
379 
380 int
381 sockaddr_in6_cmp(const struct sockaddr *lsa, const struct sockaddr *rsa)
382 {
383 	uint_fast8_t len;
384 	const uint_fast8_t addrofs = offsetof(struct sockaddr_in6, sin6_addr),
385 			   addrend = addrofs + sizeof(struct in6_addr);
386 	int rc;
387 	const struct sockaddr_in6 *lsin6, *rsin6;
388 
389 	lsin6 = satocsin6(lsa);
390 	rsin6 = satocsin6(rsa);
391 
392 	len = MIN(addrend, MIN(lsin6->sin6_len, rsin6->sin6_len));
393 
394 	if (len > addrofs &&
395 	    (rc = memcmp(&lsin6->sin6_addr, &rsin6->sin6_addr,
396 	                  len - addrofs)) != 0)
397 		return rc;
398 
399 	return lsin6->sin6_len - rsin6->sin6_len;
400 }
401 
402 /*
403  * Internet configuration info
404  */
405 #ifndef	IPV6FORWARDING
406 #ifdef GATEWAY6
407 #define	IPV6FORWARDING	1	/* forward IP6 packets not for us */
408 #else
409 #define	IPV6FORWARDING	0	/* don't forward IP6 packets not for us */
410 #endif /* GATEWAY6 */
411 #endif /* !IPV6FORWARDING */
412 
413 int	ip6_forwarding = IPV6FORWARDING;	/* act as router? */
414 int	ip6_sendredirects = 1;
415 int	ip6_defhlim = IPV6_DEFHLIM;
416 int	ip6_defmcasthlim = IPV6_DEFAULT_MULTICAST_HOPS;
417 int	ip6_accept_rtadv = 0;	/* "IPV6FORWARDING ? 0 : 1" is dangerous */
418 int	ip6_maxfragpackets = 200;
419 int	ip6_maxfrags = 200;
420 int	ip6_log_interval = 5;
421 int	ip6_hdrnestlimit = 50;	/* appropriate? */
422 int	ip6_dad_count = 1;	/* DupAddrDetectionTransmits */
423 int	ip6_auto_flowlabel = 1;
424 int	ip6_use_deprecated = 1;	/* allow deprecated addr (RFC2462 5.5.4) */
425 int	ip6_rr_prune = 5;	/* router renumbering prefix
426 				 * walk list every 5 sec. */
427 int	ip6_mcast_pmtu = 0;	/* enable pMTU discovery for multicast? */
428 int	ip6_v6only = 1;
429 
430 int	ip6_keepfaith = 0;
431 time_t	ip6_log_time = (time_t)0L;
432 
/* icmp6 */
/*
 * pmtu_expire is initialized to ten minutes' worth of seconds.
 *
 * BSDI4 defines these variables in in_proto.c...
 * XXX: what if we don't define INET? Should we define pmtu6_expire
 * or so? (jinmei@kame.net 19990310)
 */
int pmtu_expire = 10 * 60;
440 
441 /* raw IP6 parameters */
442 /*
443  * Nominal space allocated to a raw ip socket.
444  */
445 #define	RIPV6SNDQ	8192
446 #define	RIPV6RCVQ	8192
447 
448 u_long	rip6_sendspace = RIPV6SNDQ;
449 u_long	rip6_recvspace = RIPV6RCVQ;
450 
/* ICMPV6 parameters */
/* accept and process redirects */
int	icmp6_rediraccept = 1;
/* 10 minutes */
int	icmp6_redirtimeout = 10 * 60;
/* 100pps */
int	icmp6errppslim = 100;
/* enable/disable NI response */
int	icmp6_nodeinfo = 1;
456 
/* UDP on IP6 parameters */
/* really max datagram size */
int	udp6_sendspace = 9216;
/* 40 1K datagrams, each with room for a struct sockaddr_in6 */
int	udp6_recvspace = 40 * (1024 + sizeof(struct sockaddr_in6));
461