1caf43b02SWarner Losh /*- 251369649SPedro F. Giffuni * SPDX-License-Identifier: BSD-3-Clause 351369649SPedro F. Giffuni * 482cd038dSYoshinobu Inoue * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project. 5fa046d87SRobert Watson * Copyright (c) 2010-2011 Juniper Networks, Inc. 682cd038dSYoshinobu Inoue * All rights reserved. 782cd038dSYoshinobu Inoue * 8fa046d87SRobert Watson * Portions of this software were developed by Robert N. M. Watson under 9fa046d87SRobert Watson * contract to Juniper Networks, Inc. 10fa046d87SRobert Watson * 1182cd038dSYoshinobu Inoue * Redistribution and use in source and binary forms, with or without 1282cd038dSYoshinobu Inoue * modification, are permitted provided that the following conditions 1382cd038dSYoshinobu Inoue * are met: 1482cd038dSYoshinobu Inoue * 1. Redistributions of source code must retain the above copyright 1582cd038dSYoshinobu Inoue * notice, this list of conditions and the following disclaimer. 1682cd038dSYoshinobu Inoue * 2. Redistributions in binary form must reproduce the above copyright 1782cd038dSYoshinobu Inoue * notice, this list of conditions and the following disclaimer in the 1882cd038dSYoshinobu Inoue * documentation and/or other materials provided with the distribution. 1982cd038dSYoshinobu Inoue * 3. Neither the name of the project nor the names of its contributors 2082cd038dSYoshinobu Inoue * may be used to endorse or promote products derived from this software 2182cd038dSYoshinobu Inoue * without specific prior written permission. 2282cd038dSYoshinobu Inoue * 2382cd038dSYoshinobu Inoue * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND 2482cd038dSYoshinobu Inoue * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 2582cd038dSYoshinobu Inoue * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 2682cd038dSYoshinobu Inoue * ARE DISCLAIMED. IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE 2782cd038dSYoshinobu Inoue * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 2882cd038dSYoshinobu Inoue * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 2982cd038dSYoshinobu Inoue * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 3082cd038dSYoshinobu Inoue * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 3182cd038dSYoshinobu Inoue * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 3282cd038dSYoshinobu Inoue * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 3382cd038dSYoshinobu Inoue * SUCH DAMAGE. 3482cd038dSYoshinobu Inoue * 35b48287a3SDavid E. O'Brien * $KAME: in6_pcb.c,v 1.31 2001/05/21 05:45:10 jinmei Exp $ 3682cd038dSYoshinobu Inoue */ 3782cd038dSYoshinobu Inoue 38caf43b02SWarner Losh /*- 3982cd038dSYoshinobu Inoue * Copyright (c) 1982, 1986, 1991, 1993 4082cd038dSYoshinobu Inoue * The Regents of the University of California. All rights reserved. 4182cd038dSYoshinobu Inoue * 4282cd038dSYoshinobu Inoue * Redistribution and use in source and binary forms, with or without 4382cd038dSYoshinobu Inoue * modification, are permitted provided that the following conditions 4482cd038dSYoshinobu Inoue * are met: 4582cd038dSYoshinobu Inoue * 1. Redistributions of source code must retain the above copyright 4682cd038dSYoshinobu Inoue * notice, this list of conditions and the following disclaimer. 4782cd038dSYoshinobu Inoue * 2. Redistributions in binary form must reproduce the above copyright 4882cd038dSYoshinobu Inoue * notice, this list of conditions and the following disclaimer in the 4982cd038dSYoshinobu Inoue * documentation and/or other materials provided with the distribution. 50fbbd9655SWarner Losh * 3. Neither the name of the University nor the names of its contributors 5182cd038dSYoshinobu Inoue * may be used to endorse or promote products derived from this software 5282cd038dSYoshinobu Inoue * without specific prior written permission. 5382cd038dSYoshinobu Inoue * 5482cd038dSYoshinobu Inoue * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 5582cd038dSYoshinobu Inoue * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 5682cd038dSYoshinobu Inoue * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 5782cd038dSYoshinobu Inoue * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 5882cd038dSYoshinobu Inoue * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 5982cd038dSYoshinobu Inoue * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 6082cd038dSYoshinobu Inoue * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 6182cd038dSYoshinobu Inoue * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 6282cd038dSYoshinobu Inoue * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 6382cd038dSYoshinobu Inoue * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 6482cd038dSYoshinobu Inoue * SUCH DAMAGE. 6582cd038dSYoshinobu Inoue */ 6682cd038dSYoshinobu Inoue 67b48287a3SDavid E. O'Brien #include <sys/cdefs.h> 6833841545SHajimu UMEMOTO #include "opt_inet.h" 6933841545SHajimu UMEMOTO #include "opt_inet6.h" 706a800098SYoshinobu Inoue #include "opt_ipsec.h" 710c325f53SAlexander V. Chernikov #include "opt_route.h" 727527624eSRobert Watson #include "opt_rss.h" 7382cd038dSYoshinobu Inoue 74a0577692SGleb Smirnoff #include <sys/hash.h> 7582cd038dSYoshinobu Inoue #include <sys/param.h> 7682cd038dSYoshinobu Inoue #include <sys/systm.h> 7782cd038dSYoshinobu Inoue #include <sys/malloc.h> 7882cd038dSYoshinobu Inoue #include <sys/mbuf.h> 79fb59c426SYoshinobu Inoue #include <sys/domain.h> 80fdb987beSMark Johnston #include <sys/proc.h> 8182cd038dSYoshinobu Inoue #include <sys/protosw.h> 82fdb987beSMark Johnston #include <sys/smr.h> 8382cd038dSYoshinobu Inoue #include <sys/socket.h> 8482cd038dSYoshinobu Inoue #include <sys/socketvar.h> 8582cd038dSYoshinobu Inoue #include <sys/sockio.h> 86417b35a9SMark Johnston #include <sys/sysctl.h> 8782cd038dSYoshinobu Inoue #include <sys/errno.h> 8882cd038dSYoshinobu Inoue #include <sys/time.h> 89acd3428bSRobert Watson #include <sys/priv.h> 9082cd038dSYoshinobu Inoue #include <sys/proc.h> 9182cd038dSYoshinobu Inoue #include <sys/jail.h> 9282cd038dSYoshinobu Inoue 9394540027SJeff Roberson #include <vm/uma.h> 9482cd038dSYoshinobu Inoue 9582cd038dSYoshinobu Inoue #include <net/if.h> 9676039bc8SGleb Smirnoff #include <net/if_var.h> 976d768226SGeorge V. Neville-Neil #include <net/if_llatbl.h> 9882cd038dSYoshinobu Inoue #include <net/if_types.h> 9982cd038dSYoshinobu Inoue #include <net/route.h> 100983066f0SAlexander V. Chernikov #include <net/route/nhop.h> 101417b35a9SMark Johnston #include <net/vnet.h> 10282cd038dSYoshinobu Inoue 10382cd038dSYoshinobu Inoue #include <netinet/in.h> 10482cd038dSYoshinobu Inoue #include <netinet/in_var.h> 10582cd038dSYoshinobu Inoue #include <netinet/in_systm.h> 106686cdd19SJun-ichiro itojun Hagino #include <netinet/ip6.h> 107fb59c426SYoshinobu Inoue #include <netinet/ip_var.h> 108ac957cd2SJulian Elischer 10982cd038dSYoshinobu Inoue #include <netinet6/ip6_var.h> 11082cd038dSYoshinobu Inoue #include <netinet6/nd6.h> 11182cd038dSYoshinobu Inoue #include <netinet/in_pcb.h> 1120f617ae4SGleb Smirnoff #include <netinet/in_pcb_var.h> 11382cd038dSYoshinobu Inoue #include <netinet6/in6_pcb.h> 114983066f0SAlexander V. Chernikov #include <netinet6/in6_fib.h> 115a1f7e5f8SHajimu UMEMOTO #include <netinet6/scope6_var.h> 11682cd038dSYoshinobu Inoue 117417b35a9SMark Johnston SYSCTL_DECL(_net_inet6); 118417b35a9SMark Johnston SYSCTL_DECL(_net_inet6_ip6); 119417b35a9SMark Johnston VNET_DEFINE_STATIC(int, connect_in6addr_wild) = 1; 120417b35a9SMark Johnston #define V_connect_in6addr_wild VNET(connect_in6addr_wild) 121417b35a9SMark Johnston SYSCTL_INT(_net_inet6_ip6, OID_AUTO, connect_in6addr_wild, 122417b35a9SMark Johnston CTLFLAG_VNET | CTLFLAG_RW, &VNET_NAME(connect_in6addr_wild), 0, 123417b35a9SMark Johnston "Allow connecting to the unspecified address for connect(2)"); 124417b35a9SMark Johnston 12582cd038dSYoshinobu Inoue int 126147f018aSGleb Smirnoff in6_pcbsetport(struct in6_addr *laddr, struct inpcb *inp, struct ucred *cred) 127147f018aSGleb Smirnoff { 128147f018aSGleb Smirnoff struct socket *so = inp->inp_socket; 129147f018aSGleb Smirnoff u_int16_t lport = 0; 130147f018aSGleb Smirnoff int error, lookupflags = 0; 131147f018aSGleb Smirnoff #ifdef INVARIANTS 132147f018aSGleb Smirnoff struct inpcbinfo *pcbinfo = inp->inp_pcbinfo; 133147f018aSGleb Smirnoff #endif 134147f018aSGleb Smirnoff 135147f018aSGleb Smirnoff INP_WLOCK_ASSERT(inp); 136147f018aSGleb Smirnoff INP_HASH_WLOCK_ASSERT(pcbinfo); 137147f018aSGleb Smirnoff 138147f018aSGleb Smirnoff error = prison_local_ip6(cred, laddr, 139147f018aSGleb Smirnoff ((inp->inp_flags & IN6P_IPV6_V6ONLY) != 0)); 140147f018aSGleb Smirnoff if (error) 141147f018aSGleb Smirnoff return(error); 142147f018aSGleb Smirnoff 143147f018aSGleb Smirnoff /* XXX: this is redundant when called from in6_pcbbind */ 144147f018aSGleb Smirnoff if ((so->so_options & (SO_REUSEADDR|SO_REUSEPORT|SO_REUSEPORT_LB)) == 0) 145147f018aSGleb Smirnoff lookupflags = INPLOOKUP_WILDCARD; 146147f018aSGleb Smirnoff 147147f018aSGleb Smirnoff inp->inp_flags |= INP_ANONPORT; 148147f018aSGleb Smirnoff 149147f018aSGleb Smirnoff error = in_pcb_lport(inp, NULL, &lport, cred, lookupflags); 150147f018aSGleb Smirnoff if (error != 0) 151147f018aSGleb Smirnoff return (error); 152147f018aSGleb Smirnoff 153147f018aSGleb Smirnoff inp->inp_lport = lport; 154147f018aSGleb Smirnoff if (in_pcbinshash(inp) != 0) { 155147f018aSGleb Smirnoff inp->in6p_laddr = in6addr_any; 156147f018aSGleb Smirnoff inp->inp_lport = 0; 157147f018aSGleb Smirnoff return (EAGAIN); 158147f018aSGleb Smirnoff } 159147f018aSGleb Smirnoff 160147f018aSGleb Smirnoff return (0); 161147f018aSGleb Smirnoff } 162147f018aSGleb Smirnoff 1631a43cff9SSean Bruno /* 16401f8ce83SMark Johnston * Determine whether the inpcb can be bound to the specified address/port tuple. 1651a43cff9SSean Bruno */ 16601f8ce83SMark Johnston static int 16701f8ce83SMark Johnston in6_pcbbind_avail(struct inpcb *inp, const struct sockaddr_in6 *sin6, 16801f8ce83SMark Johnston int sooptions, int lookupflags, struct ucred *cred) 16901f8ce83SMark Johnston { 17001f8ce83SMark Johnston const struct in6_addr *laddr; 17101f8ce83SMark Johnston int reuseport, reuseport_lb; 17201f8ce83SMark Johnston u_short lport; 1731a43cff9SSean Bruno 17401f8ce83SMark Johnston INP_LOCK_ASSERT(inp); 17501f8ce83SMark Johnston INP_HASH_LOCK_ASSERT(inp->inp_pcbinfo); 17607385abdSRobert Watson 17701f8ce83SMark Johnston laddr = &sin6->sin6_addr; 17882cd038dSYoshinobu Inoue lport = sin6->sin6_port; 17901f8ce83SMark Johnston 18001f8ce83SMark Johnston reuseport = (sooptions & SO_REUSEPORT); 18101f8ce83SMark Johnston reuseport_lb = (sooptions & SO_REUSEPORT_LB); 18201f8ce83SMark Johnston 18301f8ce83SMark Johnston if (IN6_IS_ADDR_MULTICAST(laddr)) { 18482cd038dSYoshinobu Inoue /* 18582cd038dSYoshinobu Inoue * Treat SO_REUSEADDR as SO_REUSEPORT for multicast; 18682cd038dSYoshinobu Inoue * allow compepte duplication of binding if 18782cd038dSYoshinobu Inoue * SO_REUSEPORT is set, or if SO_REUSEADDR is set 18882cd038dSYoshinobu Inoue * and a multicast address is bound on both 18982cd038dSYoshinobu Inoue * new and duplicated sockets. 19082cd038dSYoshinobu Inoue */ 19101f8ce83SMark Johnston if ((sooptions & (SO_REUSEADDR | SO_REUSEPORT)) != 0) 19282cd038dSYoshinobu Inoue reuseport = SO_REUSEADDR | SO_REUSEPORT; 1931a43cff9SSean Bruno /* 1941a43cff9SSean Bruno * XXX: How to deal with SO_REUSEPORT_LB here? 1951a43cff9SSean Bruno * Treat same as SO_REUSEPORT for now. 1961a43cff9SSean Bruno */ 19701f8ce83SMark Johnston if ((sooptions & (SO_REUSEADDR | SO_REUSEPORT_LB)) != 0) 1981a43cff9SSean Bruno reuseport_lb = SO_REUSEADDR | SO_REUSEPORT_LB; 19901f8ce83SMark Johnston } else if (!IN6_IS_ADDR_UNSPECIFIED(laddr)) { 20001f8ce83SMark Johnston struct sockaddr_in6 sin6; 201a68cc388SGleb Smirnoff struct epoch_tracker et; 2028c0fec80SRobert Watson struct ifaddr *ifa; 20382cd038dSYoshinobu Inoue 20401f8ce83SMark Johnston memset(&sin6, 0, sizeof(sin6)); 20501f8ce83SMark Johnston sin6.sin6_family = AF_INET6; 20601f8ce83SMark Johnston sin6.sin6_len = sizeof(sin6); 20701f8ce83SMark Johnston sin6.sin6_addr = *laddr; 20801f8ce83SMark Johnston 209a68cc388SGleb Smirnoff NET_EPOCH_ENTER(et); 21001f8ce83SMark Johnston if ((ifa = ifa_ifwithaddr((const struct sockaddr *)&sin6)) == 21101f8ce83SMark Johnston NULL && (inp->inp_flags & INP_BINDANY) == 0) { 212a68cc388SGleb Smirnoff NET_EPOCH_EXIT(et); 21382cd038dSYoshinobu Inoue return (EADDRNOTAVAIL); 214f44270e7SPawel Jakub Dawidek } 21582cd038dSYoshinobu Inoue 21682cd038dSYoshinobu Inoue /* 21782cd038dSYoshinobu Inoue * XXX: bind to an anycast address might accidentally 21882cd038dSYoshinobu Inoue * cause sending a packet with anycast source address. 21933841545SHajimu UMEMOTO * We should allow to bind to a deprecated address, since 2207efe5d92SHajimu UMEMOTO * the application dares to use it. 22182cd038dSYoshinobu Inoue */ 2228c0fec80SRobert Watson if (ifa != NULL && 2238c0fec80SRobert Watson ((struct in6_ifaddr *)ifa)->ia6_flags & 22433841545SHajimu UMEMOTO (IN6_IFF_ANYCAST | IN6_IFF_NOTREADY | IN6_IFF_DETACHED)) { 225a68cc388SGleb Smirnoff NET_EPOCH_EXIT(et); 22682cd038dSYoshinobu Inoue return (EADDRNOTAVAIL); 22782cd038dSYoshinobu Inoue } 228a68cc388SGleb Smirnoff NET_EPOCH_EXIT(et); 22982cd038dSYoshinobu Inoue } 23001f8ce83SMark Johnston 23101f8ce83SMark Johnston if (lport != 0) { 23282cd038dSYoshinobu Inoue struct inpcb *t; 23382cd038dSYoshinobu Inoue 234603724d3SBjoern A. Zeeb if (ntohs(lport) <= V_ipport_reservedhigh && 235603724d3SBjoern A. Zeeb ntohs(lport) >= V_ipport_reservedlow && 236cc426dd3SMateusz Guzik priv_check_cred(cred, PRIV_NETINET_RESERVEDPORT)) 23782cd038dSYoshinobu Inoue return (EACCES); 23845a77bf2SMark Johnston 23901f8ce83SMark Johnston if (!IN6_IS_ADDR_MULTICAST(laddr) && 24001f8ce83SMark Johnston priv_check_cred(inp->inp_cred, PRIV_NETINET_REUSEPORT) != 24101f8ce83SMark Johnston 0) { 242*c9756953SMark Johnston /* 243*c9756953SMark Johnston * If a socket owned by a different user is already 244*c9756953SMark Johnston * bound to this port, fail. In particular, SO_REUSE* 245*c9756953SMark Johnston * can only be used to share a port among sockets owned 246*c9756953SMark Johnston * by the same user. 247*c9756953SMark Johnston * 248*c9756953SMark Johnston * However, we can share a port with a connected socket 249*c9756953SMark Johnston * which has a unique 4-tuple. 250*c9756953SMark Johnston */ 25101f8ce83SMark Johnston t = in6_pcblookup_local(inp->inp_pcbinfo, laddr, lport, 252078b7042SBjoern A. Zeeb INPLOOKUP_WILDCARD, cred); 2533aff4ccdSMark Johnston if (t != NULL && 25401f8ce83SMark Johnston (inp->inp_socket->so_type != SOCK_STREAM || 255f66145c6SYaroslav Tykhiy IN6_IS_ADDR_UNSPECIFIED(&t->in6p_faddr)) && 25601f8ce83SMark Johnston (inp->inp_cred->cr_uid != t->inp_cred->cr_uid)) 25782cd038dSYoshinobu Inoue return (EADDRINUSE); 258c7c0d948SAdrian Chadd 25967107f45SBjoern A. Zeeb #ifdef INET 26033841545SHajimu UMEMOTO if ((inp->inp_flags & IN6P_IPV6_V6ONLY) == 0 && 26101f8ce83SMark Johnston IN6_IS_ADDR_UNSPECIFIED(laddr)) { 262fb59c426SYoshinobu Inoue struct sockaddr_in sin; 263fb59c426SYoshinobu Inoue 264fb59c426SYoshinobu Inoue in6_sin6_2_sin(&sin, sin6); 26501f8ce83SMark Johnston t = in_pcblookup_local(inp->inp_pcbinfo, 26601f8ce83SMark Johnston sin.sin_addr, lport, INPLOOKUP_WILDCARD, 26701f8ce83SMark Johnston cred); 2683aff4ccdSMark Johnston if (t != NULL && 26901f8ce83SMark Johnston (inp->inp_socket->so_type != SOCK_STREAM || 27045a77bf2SMark Johnston in_nullhost(t->inp_faddr)) && 27186d02c5cSBjoern A. Zeeb (inp->inp_cred->cr_uid != 27286d02c5cSBjoern A. Zeeb t->inp_cred->cr_uid)) 273fb59c426SYoshinobu Inoue return (EADDRINUSE); 274fb59c426SYoshinobu Inoue } 27567107f45SBjoern A. Zeeb #endif 27682cd038dSYoshinobu Inoue } 27701f8ce83SMark Johnston t = in6_pcblookup_local(inp->inp_pcbinfo, laddr, lport, 27801f8ce83SMark Johnston lookupflags, cred); 27945a77bf2SMark Johnston if (t != NULL && ((reuseport | reuseport_lb) & 28045a77bf2SMark Johnston t->inp_socket->so_options) == 0) 28129381b36SMikolaj Golub return (EADDRINUSE); 28267107f45SBjoern A. Zeeb #ifdef INET 28333841545SHajimu UMEMOTO if ((inp->inp_flags & IN6P_IPV6_V6ONLY) == 0 && 28401f8ce83SMark Johnston IN6_IS_ADDR_UNSPECIFIED(laddr)) { 285fb59c426SYoshinobu Inoue struct sockaddr_in sin; 286fb59c426SYoshinobu Inoue 287fb59c426SYoshinobu Inoue in6_sin6_2_sin(&sin, sin6); 28801f8ce83SMark Johnston t = in_pcblookup_local(inp->inp_pcbinfo, sin.sin_addr, 28968e0d7e0SRobert Watson lport, lookupflags, cred); 29045a77bf2SMark Johnston if (t != NULL && ((reuseport | reuseport_lb) & 29145a77bf2SMark Johnston t->inp_socket->so_options) == 0 && 29245a77bf2SMark Johnston (!in_nullhost(t->inp_laddr) || 2931a43cff9SSean Bruno (t->inp_vflag & INP_IPV6PROTO) != 0)) { 294fb59c426SYoshinobu Inoue return (EADDRINUSE); 295fb59c426SYoshinobu Inoue } 2961a43cff9SSean Bruno } 29767107f45SBjoern A. Zeeb #endif 29882cd038dSYoshinobu Inoue } 29901f8ce83SMark Johnston return (0); 30001f8ce83SMark Johnston } 30101f8ce83SMark Johnston 30201f8ce83SMark Johnston int 30301f8ce83SMark Johnston in6_pcbbind(struct inpcb *inp, struct sockaddr_in6 *sin6, struct ucred *cred) 30401f8ce83SMark Johnston { 30501f8ce83SMark Johnston struct socket *so = inp->inp_socket; 30601f8ce83SMark Johnston u_short lport = 0; 30701f8ce83SMark Johnston int error, lookupflags, sooptions; 30801f8ce83SMark Johnston 30901f8ce83SMark Johnston INP_WLOCK_ASSERT(inp); 310ffb3d384SMark Johnston INP_HASH_WLOCK_ASSERT(inp->inp_pcbinfo); 31101f8ce83SMark Johnston 31201f8ce83SMark Johnston if (inp->inp_lport || !IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr)) 31301f8ce83SMark Johnston return (EINVAL); 31401f8ce83SMark Johnston 31501f8ce83SMark Johnston lookupflags = 0; 31601f8ce83SMark Johnston sooptions = atomic_load_int(&so->so_options); 31701f8ce83SMark Johnston if ((sooptions & (SO_REUSEADDR | SO_REUSEPORT | SO_REUSEPORT_LB)) == 0) 31801f8ce83SMark Johnston lookupflags = INPLOOKUP_WILDCARD; 31901f8ce83SMark Johnston if (sin6 == NULL) { 32001f8ce83SMark Johnston if ((error = prison_local_ip6(cred, &inp->in6p_laddr, 32101f8ce83SMark Johnston ((inp->inp_flags & IN6P_IPV6_V6ONLY) != 0))) != 0) 32201f8ce83SMark Johnston return (error); 32301f8ce83SMark Johnston } else { 32401f8ce83SMark Johnston KASSERT(sin6->sin6_family == AF_INET6, 32501f8ce83SMark Johnston ("%s: invalid address family for %p", __func__, sin6)); 32601f8ce83SMark Johnston KASSERT(sin6->sin6_len == sizeof(*sin6), 32701f8ce83SMark Johnston ("%s: invalid address length for %p", __func__, sin6)); 32801f8ce83SMark Johnston 32901f8ce83SMark Johnston if ((error = sa6_embedscope(sin6, V_ip6_use_defzone)) != 0) 33001f8ce83SMark Johnston return(error); 33101f8ce83SMark Johnston 33201f8ce83SMark Johnston if ((error = prison_local_ip6(cred, &sin6->sin6_addr, 33301f8ce83SMark Johnston ((inp->inp_flags & IN6P_IPV6_V6ONLY) != 0))) != 0) 33401f8ce83SMark Johnston return (error); 33501f8ce83SMark Johnston 33601f8ce83SMark Johnston /* See if this address/port combo is available. */ 33701f8ce83SMark Johnston error = in6_pcbbind_avail(inp, sin6, sooptions, lookupflags, 33801f8ce83SMark Johnston cred); 33901f8ce83SMark Johnston if (error != 0) 34001f8ce83SMark Johnston return (error); 34101f8ce83SMark Johnston 34201f8ce83SMark Johnston lport = sin6->sin6_port; 34382cd038dSYoshinobu Inoue inp->in6p_laddr = sin6->sin6_addr; 34482cd038dSYoshinobu Inoue } 34582cd038dSYoshinobu Inoue if (lport == 0) { 3464616026fSErmal Luçi if ((error = in6_pcbsetport(&inp->in6p_laddr, inp, cred)) != 0) { 3474a2b2562SBjoern A. Zeeb /* Undo an address bind that may have occurred. */ 3484a2b2562SBjoern A. Zeeb inp->in6p_laddr = in6addr_any; 349b89e82ddSJamie Gritton return (error); 3504a2b2562SBjoern A. Zeeb } 35155fd3bafSBjoern A. Zeeb } else { 35282cd038dSYoshinobu Inoue inp->inp_lport = lport; 35382cd038dSYoshinobu Inoue if (in_pcbinshash(inp) != 0) { 35482cd038dSYoshinobu Inoue inp->in6p_laddr = in6addr_any; 35582cd038dSYoshinobu Inoue inp->inp_lport = 0; 35682cd038dSYoshinobu Inoue return (EAGAIN); 35782cd038dSYoshinobu Inoue } 358686cdd19SJun-ichiro itojun Hagino } 35982cd038dSYoshinobu Inoue return (0); 36082cd038dSYoshinobu Inoue } 36182cd038dSYoshinobu Inoue 36282cd038dSYoshinobu Inoue /* 36382cd038dSYoshinobu Inoue * Transform old in6_pcbconnect() into an inner subroutine for new 36482cd038dSYoshinobu Inoue * in6_pcbconnect(): Do some validity-checking on the remote 36582cd038dSYoshinobu Inoue * address (in mbuf 'nam') and then determine local host address 36682cd038dSYoshinobu Inoue * (i.e., which interface) to use to access that remote host. 36782cd038dSYoshinobu Inoue * 36882cd038dSYoshinobu Inoue * This preserves definition of in6_pcbconnect(), while supporting a 36982cd038dSYoshinobu Inoue * slightly different version for T/TCP. (This is more than 37082cd038dSYoshinobu Inoue * a bit of a kludge, but cleaning up the internal interfaces would 37182cd038dSYoshinobu Inoue * have forced minor changes in every protocol). 37282cd038dSYoshinobu Inoue */ 373a7e201bbSAndrey V. Elsukov static int 374f161d294SMark Johnston in6_pcbladdr(struct inpcb *inp, struct sockaddr_in6 *sin6, 3750bf5377bSAndrey V. Elsukov struct in6_addr *plocal_addr6, bool sas_required) 37682cd038dSYoshinobu Inoue { 37782cd038dSYoshinobu Inoue int error = 0; 378a1f7e5f8SHajimu UMEMOTO int scope_ambiguous = 0; 37988d166bfSBjoern A. Zeeb struct in6_addr in6a; 38082cd038dSYoshinobu Inoue 3813d76be28SGleb Smirnoff NET_EPOCH_ASSERT(); 3828501a69cSRobert Watson INP_WLOCK_ASSERT(inp); 383fa046d87SRobert Watson INP_HASH_WLOCK_ASSERT(inp->inp_pcbinfo); /* XXXRW: why? */ 3848deea4a8SRobert Watson 38582cd038dSYoshinobu Inoue if (sin6->sin6_port == 0) 38682cd038dSYoshinobu Inoue return (EADDRNOTAVAIL); 38782cd038dSYoshinobu Inoue 388603724d3SBjoern A. Zeeb if (sin6->sin6_scope_id == 0 && !V_ip6_use_defzone) 389a1f7e5f8SHajimu UMEMOTO scope_ambiguous = 1; 390603724d3SBjoern A. Zeeb if ((error = sa6_embedscope(sin6, V_ip6_use_defzone)) != 0) 391a1f7e5f8SHajimu UMEMOTO return(error); 392a1f7e5f8SHajimu UMEMOTO 393417b35a9SMark Johnston if (V_connect_in6addr_wild && !CK_STAILQ_EMPTY(&V_in6_ifaddrhead)) { 39482cd038dSYoshinobu Inoue /* 39582cd038dSYoshinobu Inoue * If the destination address is UNSPECIFIED addr, 39682cd038dSYoshinobu Inoue * use the loopback addr, e.g ::1. 39782cd038dSYoshinobu Inoue */ 39882cd038dSYoshinobu Inoue if (IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr)) 39982cd038dSYoshinobu Inoue sin6->sin6_addr = in6addr_loopback; 4000c605af3SMark Johnston } else if (IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr)) { 4010c605af3SMark Johnston return (ENETUNREACH); 40282cd038dSYoshinobu Inoue } 4030c605af3SMark Johnston 404b89e82ddSJamie Gritton if ((error = prison_remote_ip6(inp->inp_cred, &sin6->sin6_addr)) != 0) 405b89e82ddSJamie Gritton return (error); 406a1f7e5f8SHajimu UMEMOTO 4070bf5377bSAndrey V. Elsukov if (sas_required) { 408601c0b8bSAlexander V. Chernikov error = in6_selectsrc_socket(sin6, inp->in6p_outputopts, 409601c0b8bSAlexander V. Chernikov inp, inp->inp_cred, scope_ambiguous, &in6a, NULL); 41088d166bfSBjoern A. Zeeb if (error) 41188d166bfSBjoern A. Zeeb return (error); 4120bf5377bSAndrey V. Elsukov } else { 4130bf5377bSAndrey V. Elsukov /* 4140bf5377bSAndrey V. Elsukov * Source address selection isn't required when syncache 4150bf5377bSAndrey V. Elsukov * has already established connection and both source and 4160bf5377bSAndrey V. Elsukov * destination addresses was chosen. 4170bf5377bSAndrey V. Elsukov * 4180bf5377bSAndrey V. Elsukov * This also includes the case when fwd_tag was used to 4190bf5377bSAndrey V. Elsukov * select source address in tcp_input(). 4200bf5377bSAndrey V. Elsukov */ 4210bf5377bSAndrey V. Elsukov in6a = inp->in6p_laddr; 4220bf5377bSAndrey V. Elsukov } 4230bf5377bSAndrey V. Elsukov 424713264f6SMark Johnston if (IN6_IS_ADDR_UNSPECIFIED(&in6a)) 425713264f6SMark Johnston return (EHOSTUNREACH); 42688d166bfSBjoern A. Zeeb /* 42788d166bfSBjoern A. Zeeb * Do not update this earlier, in case we return with an error. 42888d166bfSBjoern A. Zeeb * 429601c0b8bSAlexander V. Chernikov * XXX: this in6_selectsrc_socket result might replace the bound local 430681ffdf9SBjoern A. Zeeb * address with the address specified by setsockopt(IPV6_PKTINFO). 43188d166bfSBjoern A. Zeeb * Is it the intended behavior? 43288d166bfSBjoern A. Zeeb */ 43388d166bfSBjoern A. Zeeb *plocal_addr6 = in6a; 43488d166bfSBjoern A. Zeeb 43582cd038dSYoshinobu Inoue /* 43682cd038dSYoshinobu Inoue * Don't do pcblookup call here; return interface in 43782cd038dSYoshinobu Inoue * plocal_addr6 43882cd038dSYoshinobu Inoue * and exit to caller, that will do the lookup. 43982cd038dSYoshinobu Inoue */ 440a1f7e5f8SHajimu UMEMOTO 44182cd038dSYoshinobu Inoue return (0); 44282cd038dSYoshinobu Inoue } 44382cd038dSYoshinobu Inoue 44482cd038dSYoshinobu Inoue /* 44582cd038dSYoshinobu Inoue * Outer subroutine: 44682cd038dSYoshinobu Inoue * Connect from a socket to a specified address. 44782cd038dSYoshinobu Inoue * Both address and port must be specified in argument sin. 44882cd038dSYoshinobu Inoue * If don't have a local address for this socket yet, 44982cd038dSYoshinobu Inoue * then pick one. 45082cd038dSYoshinobu Inoue */ 45182cd038dSYoshinobu Inoue int 452a9d22cceSGleb Smirnoff in6_pcbconnect(struct inpcb *inp, struct sockaddr_in6 *sin6, struct ucred *cred, 4530bf5377bSAndrey V. Elsukov bool sas_required) 45482cd038dSYoshinobu Inoue { 455fa046d87SRobert Watson struct inpcbinfo *pcbinfo = inp->inp_pcbinfo; 45625102351SMike Karels struct sockaddr_in6 laddr6; 45782cd038dSYoshinobu Inoue int error; 45882cd038dSYoshinobu Inoue 4593d76be28SGleb Smirnoff NET_EPOCH_ASSERT(); 4603d76be28SGleb Smirnoff INP_WLOCK_ASSERT(inp); 4613d76be28SGleb Smirnoff INP_HASH_WLOCK_ASSERT(pcbinfo); 462f161d294SMark Johnston KASSERT(sin6->sin6_family == AF_INET6, 463f161d294SMark Johnston ("%s: invalid address family for %p", __func__, sin6)); 464f161d294SMark Johnston KASSERT(sin6->sin6_len == sizeof(*sin6), 465f161d294SMark Johnston ("%s: invalid address length for %p", __func__, sin6)); 466fdb987beSMark Johnston KASSERT(IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr), 467fdb987beSMark Johnston ("%s: inp is already connected", __func__)); 468f161d294SMark Johnston 46925102351SMike Karels bzero(&laddr6, sizeof(laddr6)); 47025102351SMike Karels laddr6.sin6_family = AF_INET6; 47125102351SMike Karels 4720c325f53SAlexander V. Chernikov #ifdef ROUTE_MPATH 4730c325f53SAlexander V. Chernikov if (CALC_FLOWID_OUTBOUND) { 4740c325f53SAlexander V. Chernikov uint32_t hash_type, hash_val; 4750c325f53SAlexander V. Chernikov 4760c325f53SAlexander V. Chernikov hash_val = fib6_calc_software_hash(&inp->in6p_laddr, 4770c325f53SAlexander V. Chernikov &sin6->sin6_addr, 0, sin6->sin6_port, 4780c325f53SAlexander V. Chernikov inp->inp_socket->so_proto->pr_protocol, &hash_type); 4790c325f53SAlexander V. Chernikov inp->inp_flowid = hash_val; 4800c325f53SAlexander V. Chernikov inp->inp_flowtype = hash_type; 4810c325f53SAlexander V. Chernikov } 4820c325f53SAlexander V. Chernikov #endif 48382cd038dSYoshinobu Inoue /* 48482cd038dSYoshinobu Inoue * Call inner routine, to assign local interface address. 48588ff5695SSUZUKI Shinsuke * in6_pcbladdr() may automatically fill in sin6_scope_id. 48682cd038dSYoshinobu Inoue */ 4870bf5377bSAndrey V. Elsukov if ((error = in6_pcbladdr(inp, sin6, &laddr6.sin6_addr, 4880bf5377bSAndrey V. Elsukov sas_required)) != 0) 48982cd038dSYoshinobu Inoue return (error); 49082cd038dSYoshinobu Inoue 491fa046d87SRobert Watson if (in6_pcblookup_hash_locked(pcbinfo, &sin6->sin6_addr, 4924130ea61SMark Johnston sin6->sin6_port, IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr) ? 4934130ea61SMark Johnston &laddr6.sin6_addr : &inp->in6p_laddr, inp->inp_lport, 0, 4944130ea61SMark Johnston M_NODOM) != NULL) 49582cd038dSYoshinobu Inoue return (EADDRINUSE); 49682cd038dSYoshinobu Inoue if (IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr)) { 49782cd038dSYoshinobu Inoue if (inp->inp_lport == 0) { 49825102351SMike Karels error = in_pcb_lport_dest(inp, 49925102351SMike Karels (struct sockaddr *) &laddr6, &inp->inp_lport, 500440598ddSJonathan T. Looney (struct sockaddr *) sin6, sin6->sin6_port, cred, 501440598ddSJonathan T. Looney INPLOOKUP_WILDCARD); 5024616026fSErmal Luçi if (error) 50382cd038dSYoshinobu Inoue return (error); 50482cd038dSYoshinobu Inoue } 50525102351SMike Karels inp->in6p_laddr = laddr6.sin6_addr; 50682cd038dSYoshinobu Inoue } 50782cd038dSYoshinobu Inoue inp->in6p_faddr = sin6->sin6_addr; 50882cd038dSYoshinobu Inoue inp->inp_fport = sin6->sin6_port; 50933841545SHajimu UMEMOTO /* update flowinfo - draft-itojun-ipv6-flowlabel-api-00 */ 510fc384fa5SBjoern A. Zeeb inp->inp_flow &= ~IPV6_FLOWLABEL_MASK; 511fc384fa5SBjoern A. Zeeb if (inp->inp_flags & IN6P_AUTOFLOWLABEL) 512fc384fa5SBjoern A. Zeeb inp->inp_flow |= 513b79274baSHajimu UMEMOTO (htonl(ip6_randomflowlabel()) & IPV6_FLOWLABEL_MASK); 51482cd038dSYoshinobu Inoue 515fdb987beSMark Johnston if ((inp->inp_flags & INP_INHASHLIST) != 0) { 516db0ac6deSCy Schubert in_pcbrehash(inp); 517fe1274eeSMichael Tuexen } else { 518db0ac6deSCy Schubert in_pcbinshash(inp); 519fe1274eeSMichael Tuexen } 5202cb64cb2SGeorge V. Neville-Neil 52182cd038dSYoshinobu Inoue return (0); 52282cd038dSYoshinobu Inoue } 52382cd038dSYoshinobu Inoue 52482cd038dSYoshinobu Inoue void 5251272577eSXin LI in6_pcbdisconnect(struct inpcb *inp) 52682cd038dSYoshinobu Inoue { 52707385abdSRobert Watson 5288501a69cSRobert Watson INP_WLOCK_ASSERT(inp); 529fa046d87SRobert Watson INP_HASH_WLOCK_ASSERT(inp->inp_pcbinfo); 530fdb987beSMark Johnston KASSERT(inp->inp_smr == SMR_SEQ_INVALID, 531fdb987beSMark Johnston ("%s: inp %p was already disconnected", __func__, inp)); 53207385abdSRobert Watson 533fdb987beSMark Johnston in_pcbremhash_locked(inp); 534fdb987beSMark Johnston 535fdb987beSMark Johnston /* See the comment in in_pcbinshash(). */ 536fdb987beSMark Johnston inp->inp_smr = smr_advance(inp->inp_pcbinfo->ipi_smr); 537fdb987beSMark Johnston 538fdb987beSMark Johnston /* XXX-MJ torn writes are visible to SMR lookup */ 5392589ec0fSMark Johnston memset(&inp->in6p_laddr, 0, sizeof(inp->in6p_laddr)); 5402589ec0fSMark Johnston memset(&inp->in6p_faddr, 0, sizeof(inp->in6p_faddr)); 54182cd038dSYoshinobu Inoue inp->inp_fport = 0; 54233841545SHajimu UMEMOTO /* clear flowinfo - draft-itojun-ipv6-flowlabel-api-00 */ 543fc384fa5SBjoern A. Zeeb inp->inp_flow &= ~IPV6_FLOWLABEL_MASK; 54482cd038dSYoshinobu Inoue } 54582cd038dSYoshinobu Inoue 54682cd038dSYoshinobu Inoue int 5470fac350cSGleb Smirnoff in6_getsockaddr(struct socket *so, struct sockaddr *sa) 54882cd038dSYoshinobu Inoue { 5493e85b721SEd Maste struct inpcb *inp; 55082cd038dSYoshinobu Inoue 55182cd038dSYoshinobu Inoue inp = sotoinpcb(so); 55254d642bbSRobert Watson KASSERT(inp != NULL, ("in6_getsockaddr: inp == NULL")); 55348477723SRobert Watson 5540fac350cSGleb Smirnoff *(struct sockaddr_in6 *)sa = (struct sockaddr_in6 ){ 5550fac350cSGleb Smirnoff .sin6_len = sizeof(struct sockaddr_in6), 5560fac350cSGleb Smirnoff .sin6_family = AF_INET6, 5570fac350cSGleb Smirnoff .sin6_port = inp->inp_lport, 5580fac350cSGleb Smirnoff .sin6_addr = inp->in6p_laddr, 5590fac350cSGleb Smirnoff }; 5600fac350cSGleb Smirnoff /* XXX: should catch errors */ 5610fac350cSGleb Smirnoff (void)sa6_recoverscope((struct sockaddr_in6 *)sa); 56282cd038dSYoshinobu Inoue 5630fac350cSGleb Smirnoff return (0); 56482cd038dSYoshinobu Inoue } 56582cd038dSYoshinobu Inoue 56682cd038dSYoshinobu Inoue int 5670fac350cSGleb Smirnoff in6_getpeeraddr(struct socket *so, struct sockaddr *sa) 56882cd038dSYoshinobu Inoue { 56982cd038dSYoshinobu Inoue struct inpcb *inp; 57082cd038dSYoshinobu Inoue 57182cd038dSYoshinobu Inoue inp = sotoinpcb(so); 57254d642bbSRobert Watson KASSERT(inp != NULL, ("in6_getpeeraddr: inp == NULL")); 57348477723SRobert Watson 5740fac350cSGleb Smirnoff *(struct sockaddr_in6 *)sa = (struct sockaddr_in6 ){ 5750fac350cSGleb Smirnoff .sin6_len = sizeof(struct sockaddr_in6), 5760fac350cSGleb Smirnoff .sin6_family = AF_INET6, 5770fac350cSGleb Smirnoff .sin6_port = inp->inp_fport, 5780fac350cSGleb Smirnoff .sin6_addr = inp->in6p_faddr, 5790fac350cSGleb Smirnoff }; 5800fac350cSGleb Smirnoff /* XXX: should catch errors */ 5810fac350cSGleb Smirnoff (void)sa6_recoverscope((struct sockaddr_in6 *)sa); 58282cd038dSYoshinobu Inoue 5830fac350cSGleb Smirnoff return (0); 58482cd038dSYoshinobu Inoue } 58582cd038dSYoshinobu Inoue 58682cd038dSYoshinobu Inoue int 5870fac350cSGleb Smirnoff in6_mapped_sockaddr(struct socket *so, struct sockaddr *sa) 58882cd038dSYoshinobu Inoue { 58982cd038dSYoshinobu Inoue int error; 590042fb58dSLexi Winter #ifdef INET 591042fb58dSLexi Winter struct inpcb *inp; 59282cd038dSYoshinobu Inoue 59348477723SRobert Watson inp = sotoinpcb(so); 59448477723SRobert Watson KASSERT(inp != NULL, ("in6_mapped_sockaddr: inp == NULL")); 59548477723SRobert Watson 5965fac4178SHajimu UMEMOTO if ((inp->inp_vflag & (INP_IPV4 | INP_IPV6)) == INP_IPV4) { 5970fac350cSGleb Smirnoff struct sockaddr_in sin; 5980fac350cSGleb Smirnoff 5990fac350cSGleb Smirnoff error = in_getsockaddr(so, (struct sockaddr *)&sin); 600369dc8ceSEivind Eklund if (error == 0) 6010fac350cSGleb Smirnoff in6_sin_2_v4mapsin6(&sin, (struct sockaddr_in6 *)sa); 60267107f45SBjoern A. Zeeb } else 60367107f45SBjoern A. Zeeb #endif 60467107f45SBjoern A. Zeeb { 60554d642bbSRobert Watson /* scope issues will be handled in in6_getsockaddr(). */ 6060fac350cSGleb Smirnoff error = in6_getsockaddr(so, sa); 6077efe5d92SHajimu UMEMOTO } 60882cd038dSYoshinobu Inoue 60982cd038dSYoshinobu Inoue return error; 61082cd038dSYoshinobu Inoue } 61182cd038dSYoshinobu Inoue 61282cd038dSYoshinobu Inoue int 6130fac350cSGleb Smirnoff in6_mapped_peeraddr(struct socket *so, struct sockaddr *sa) 61482cd038dSYoshinobu Inoue { 61582cd038dSYoshinobu Inoue int error; 616042fb58dSLexi Winter #ifdef INET 617042fb58dSLexi Winter struct inpcb *inp; 61882cd038dSYoshinobu Inoue 61948477723SRobert Watson inp = sotoinpcb(so); 62048477723SRobert Watson KASSERT(inp != NULL, ("in6_mapped_peeraddr: inp == NULL")); 62148477723SRobert Watson 6225fac4178SHajimu UMEMOTO if ((inp->inp_vflag & (INP_IPV4 | INP_IPV6)) == INP_IPV4) { 6230fac350cSGleb Smirnoff struct sockaddr_in sin; 6240fac350cSGleb Smirnoff 6250fac350cSGleb Smirnoff error = in_getpeeraddr(so, (struct sockaddr *)&sin); 626369dc8ceSEivind Eklund if (error == 0) 6270fac350cSGleb Smirnoff in6_sin_2_v4mapsin6(&sin, (struct sockaddr_in6 *)sa); 62882cd038dSYoshinobu Inoue } else 62967107f45SBjoern A. Zeeb #endif 630042fb58dSLexi Winter { 63154d642bbSRobert Watson /* scope issues will be handled in in6_getpeeraddr(). */ 6320fac350cSGleb Smirnoff error = in6_getpeeraddr(so, sa); 633042fb58dSLexi Winter } 63482cd038dSYoshinobu Inoue 63582cd038dSYoshinobu Inoue return error; 63682cd038dSYoshinobu Inoue } 63782cd038dSYoshinobu Inoue 63882cd038dSYoshinobu Inoue /* 63982cd038dSYoshinobu Inoue * Pass some notification to all connections of a protocol 64082cd038dSYoshinobu Inoue * associated with address dst. The local address and/or port numbers 64182cd038dSYoshinobu Inoue * may be specified to limit the search. The "usual action" will be 64282cd038dSYoshinobu Inoue * taken, depending on the ctlinput cmd. The caller must filter any 64382cd038dSYoshinobu Inoue * cmds that are uninteresting (e.g., no error in the map). 64482cd038dSYoshinobu Inoue * Call the protocol specific routine (if any) to report 64582cd038dSYoshinobu Inoue * any errors for each matching socket. 64682cd038dSYoshinobu Inoue */ 647db0ac6deSCy Schubert static bool 648db0ac6deSCy Schubert inp_match6(const struct inpcb *inp, void *v __unused) 649db0ac6deSCy Schubert { 650db0ac6deSCy Schubert 651db0ac6deSCy Schubert return ((inp->inp_vflag & INP_IPV6) != 0); 652db0ac6deSCy Schubert } 653fcb3f813SGleb Smirnoff 65482cd038dSYoshinobu Inoue void 65543d39ca7SGleb Smirnoff in6_pcbnotify(struct inpcbinfo *pcbinfo, struct sockaddr_in6 *sa6_dst, 65643d39ca7SGleb Smirnoff u_int fport_arg, const struct sockaddr_in6 *src, u_int lport_arg, 657fcb3f813SGleb Smirnoff int errno, void *cmdarg, 6589233d8f3SDavid E. O'Brien struct inpcb *(*notify)(struct inpcb *, int)) 65982cd038dSYoshinobu Inoue { 660db0ac6deSCy Schubert struct inpcb_iterator inpi = INP_ITERATOR(pcbinfo, INPLOOKUP_WLOCKPCB, 661db0ac6deSCy Schubert inp_match6, NULL); 662db0ac6deSCy Schubert struct inpcb *inp; 66343d39ca7SGleb Smirnoff struct sockaddr_in6 sa6_src; 66482cd038dSYoshinobu Inoue u_short fport = fport_arg, lport = lport_arg; 66533841545SHajimu UMEMOTO u_int32_t flowinfo; 66633841545SHajimu UMEMOTO 66733841545SHajimu UMEMOTO if (IN6_IS_ADDR_UNSPECIFIED(&sa6_dst->sin6_addr)) 66882cd038dSYoshinobu Inoue return; 66982cd038dSYoshinobu Inoue 67082cd038dSYoshinobu Inoue /* 67133841545SHajimu UMEMOTO * note that src can be NULL when we get notify by local fragmentation. 67233841545SHajimu UMEMOTO */ 67343d39ca7SGleb Smirnoff sa6_src = (src == NULL) ? sa6_any : *src; 67433841545SHajimu UMEMOTO flowinfo = sa6_src.sin6_flowinfo; 67533841545SHajimu UMEMOTO 676db0ac6deSCy Schubert while ((inp = inp_next(&inpi)) != NULL) { 677db0ac6deSCy Schubert INP_WLOCK_ASSERT(inp); 678686cdd19SJun-ichiro itojun Hagino /* 679efddf5c6SHajimu UMEMOTO * If the error designates a new path MTU for a destination 680efddf5c6SHajimu UMEMOTO * and the application (associated with this socket) wanted to 6818f1beb88SAndrey V. Elsukov * know the value, notify. 682efddf5c6SHajimu UMEMOTO * XXX: should we avoid to notify the value to TCP sockets? 683efddf5c6SHajimu UMEMOTO */ 684fcb3f813SGleb Smirnoff if (errno == EMSGSIZE && cmdarg != NULL) 68543d39ca7SGleb Smirnoff ip6_notify_pmtu(inp, sa6_dst, *(uint32_t *)cmdarg); 686efddf5c6SHajimu UMEMOTO 687efddf5c6SHajimu UMEMOTO /* 68833841545SHajimu UMEMOTO * Detect if we should notify the error. If no source and 68904389c85SGordon Bergling * destination ports are specified, but non-zero flowinfo and 69033841545SHajimu UMEMOTO * local address match, notify the error. This is the case 69133841545SHajimu UMEMOTO * when the error is delivered with an encrypted buffer 69233841545SHajimu UMEMOTO * by ESP. Otherwise, just compare addresses and ports 69333841545SHajimu UMEMOTO * as usual. 694686cdd19SJun-ichiro itojun Hagino */ 69533841545SHajimu UMEMOTO if (lport == 0 && fport == 0 && flowinfo && 69633841545SHajimu UMEMOTO inp->inp_socket != NULL && 697fc384fa5SBjoern A. Zeeb flowinfo == (inp->inp_flow & IPV6_FLOWLABEL_MASK) && 69833841545SHajimu UMEMOTO IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, &sa6_src.sin6_addr)) 69933841545SHajimu UMEMOTO goto do_notify; 70033841545SHajimu UMEMOTO else if (!IN6_ARE_ADDR_EQUAL(&inp->in6p_faddr, 70133841545SHajimu UMEMOTO &sa6_dst->sin6_addr) || 70282cd038dSYoshinobu Inoue inp->inp_socket == 0 || 70382cd038dSYoshinobu Inoue (lport && inp->inp_lport != lport) || 70433841545SHajimu UMEMOTO (!IN6_IS_ADDR_UNSPECIFIED(&sa6_src.sin6_addr) && 70533841545SHajimu UMEMOTO !IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, 70633841545SHajimu UMEMOTO &sa6_src.sin6_addr)) || 707f31f65a7SRobert Watson (fport && inp->inp_fport != fport)) { 70882cd038dSYoshinobu Inoue continue; 709f31f65a7SRobert Watson } 710686cdd19SJun-ichiro itojun Hagino 71133841545SHajimu UMEMOTO do_notify: 712db0ac6deSCy Schubert if (notify) 713db0ac6deSCy Schubert (*notify)(inp, errno); 71482cd038dSYoshinobu Inoue } 71582cd038dSYoshinobu Inoue } 71682cd038dSYoshinobu Inoue 71782cd038dSYoshinobu Inoue /* 718fa046d87SRobert Watson * Lookup a PCB based on the local address and port. Caller must hold the 719fa046d87SRobert Watson * hash lock. No inpcb locks or references are acquired. 72082cd038dSYoshinobu Inoue */ 72182cd038dSYoshinobu Inoue struct inpcb * 72252ef944bSMark Johnston in6_pcblookup_local(struct inpcbinfo *pcbinfo, const struct in6_addr *laddr, 72368e0d7e0SRobert Watson u_short lport, int lookupflags, struct ucred *cred) 72482cd038dSYoshinobu Inoue { 7253e85b721SEd Maste struct inpcb *inp; 72682cd038dSYoshinobu Inoue int matchwild = 3, wildcard; 72782cd038dSYoshinobu Inoue 72868e0d7e0SRobert Watson KASSERT((lookupflags & ~(INPLOOKUP_WILDCARD)) == 0, 72968e0d7e0SRobert Watson ("%s: invalid lookup flags %d", __func__, lookupflags)); 73068e0d7e0SRobert Watson 731c17cd08fSGleb Smirnoff INP_HASH_LOCK_ASSERT(pcbinfo); 7328deea4a8SRobert Watson 73368e0d7e0SRobert Watson if ((lookupflags & INPLOOKUP_WILDCARD) == 0) { 73482cd038dSYoshinobu Inoue struct inpcbhead *head; 73582cd038dSYoshinobu Inoue /* 73682cd038dSYoshinobu Inoue * Look for an unconnected (wildcard foreign addr) PCB that 73782cd038dSYoshinobu Inoue * matches the local address and port we're looking for. 73882cd038dSYoshinobu Inoue */ 739fdb987beSMark Johnston head = &pcbinfo->ipi_hash_wild[INP_PCBHASH_WILD(lport, 7401b44e5ffSAndrey V. Elsukov pcbinfo->ipi_hashmask)]; 741fdb987beSMark Johnston CK_LIST_FOREACH(inp, head, inp_hash_wild) { 742413628a7SBjoern A. Zeeb /* XXX inp locking */ 743369dc8ceSEivind Eklund if ((inp->inp_vflag & INP_IPV6) == 0) 74482cd038dSYoshinobu Inoue continue; 74582cd038dSYoshinobu Inoue if (IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr) && 74682cd038dSYoshinobu Inoue IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, laddr) && 74782cd038dSYoshinobu Inoue inp->inp_lport == lport) { 748413628a7SBjoern A. Zeeb /* Found. */ 749ac1750ddSMark Johnston if (prison_equal_ip6(cred->cr_prison, 7500304c731SJamie Gritton inp->inp_cred->cr_prison)) 75182cd038dSYoshinobu Inoue return (inp); 75282cd038dSYoshinobu Inoue } 75382cd038dSYoshinobu Inoue } 75482cd038dSYoshinobu Inoue /* 75582cd038dSYoshinobu Inoue * Not found. 75682cd038dSYoshinobu Inoue */ 75782cd038dSYoshinobu Inoue return (NULL); 75882cd038dSYoshinobu Inoue } else { 75982cd038dSYoshinobu Inoue struct inpcbporthead *porthash; 76082cd038dSYoshinobu Inoue struct inpcbport *phd; 76182cd038dSYoshinobu Inoue struct inpcb *match = NULL; 76282cd038dSYoshinobu Inoue /* 76382cd038dSYoshinobu Inoue * Best fit PCB lookup. 76482cd038dSYoshinobu Inoue * 76582cd038dSYoshinobu Inoue * First see if this local port is in use by looking on the 76682cd038dSYoshinobu Inoue * port hash list. 76782cd038dSYoshinobu Inoue */ 768712fc218SRobert Watson porthash = &pcbinfo->ipi_porthashbase[INP_PCBPORTHASH(lport, 769712fc218SRobert Watson pcbinfo->ipi_porthashmask)]; 770b872626dSMatt Macy CK_LIST_FOREACH(phd, porthash, phd_hash) { 77182cd038dSYoshinobu Inoue if (phd->phd_port == lport) 77282cd038dSYoshinobu Inoue break; 77382cd038dSYoshinobu Inoue } 77482cd038dSYoshinobu Inoue if (phd != NULL) { 77582cd038dSYoshinobu Inoue /* 77682cd038dSYoshinobu Inoue * Port is in use by one or more PCBs. Look for best 77782cd038dSYoshinobu Inoue * fit. 77882cd038dSYoshinobu Inoue */ 779b872626dSMatt Macy CK_LIST_FOREACH(inp, &phd->phd_pcblist, inp_portlist) { 78082cd038dSYoshinobu Inoue wildcard = 0; 781ac1750ddSMark Johnston if (!prison_equal_ip6(cred->cr_prison, 7820304c731SJamie Gritton inp->inp_cred->cr_prison)) 783413628a7SBjoern A. Zeeb continue; 784413628a7SBjoern A. Zeeb /* XXX inp locking */ 785369dc8ceSEivind Eklund if ((inp->inp_vflag & INP_IPV6) == 0) 78682cd038dSYoshinobu Inoue continue; 78782cd038dSYoshinobu Inoue if (!IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr)) 78882cd038dSYoshinobu Inoue wildcard++; 78982cd038dSYoshinobu Inoue if (!IN6_IS_ADDR_UNSPECIFIED( 79082cd038dSYoshinobu Inoue &inp->in6p_laddr)) { 79182cd038dSYoshinobu Inoue if (IN6_IS_ADDR_UNSPECIFIED(laddr)) 79282cd038dSYoshinobu Inoue wildcard++; 79382cd038dSYoshinobu Inoue else if (!IN6_ARE_ADDR_EQUAL( 79482cd038dSYoshinobu Inoue &inp->in6p_laddr, laddr)) 79582cd038dSYoshinobu Inoue continue; 79682cd038dSYoshinobu Inoue } else { 79782cd038dSYoshinobu Inoue if (!IN6_IS_ADDR_UNSPECIFIED(laddr)) 79882cd038dSYoshinobu Inoue wildcard++; 79982cd038dSYoshinobu Inoue } 80082cd038dSYoshinobu Inoue if (wildcard < matchwild) { 80182cd038dSYoshinobu Inoue match = inp; 80282cd038dSYoshinobu Inoue matchwild = wildcard; 803413628a7SBjoern A. Zeeb if (matchwild == 0) 80482cd038dSYoshinobu Inoue break; 80582cd038dSYoshinobu Inoue } 80682cd038dSYoshinobu Inoue } 80782cd038dSYoshinobu Inoue } 80882cd038dSYoshinobu Inoue return (match); 80982cd038dSYoshinobu Inoue } 81082cd038dSYoshinobu Inoue } 81182cd038dSYoshinobu Inoue 812db0ac6deSCy Schubert static bool 813db0ac6deSCy Schubert in6_multi_match(const struct inpcb *inp, void *v __unused) 814db0ac6deSCy Schubert { 815db0ac6deSCy Schubert 816db0ac6deSCy Schubert if ((inp->inp_vflag & INP_IPV6) && inp->in6p_moptions != NULL) 817db0ac6deSCy Schubert return (true); 818db0ac6deSCy Schubert else 819db0ac6deSCy Schubert return (false); 820db0ac6deSCy Schubert } 821db0ac6deSCy Schubert 822e43cc4aeSHajimu UMEMOTO void 8231272577eSXin LI in6_pcbpurgeif0(struct inpcbinfo *pcbinfo, struct ifnet *ifp) 824e43cc4aeSHajimu UMEMOTO { 825db0ac6deSCy Schubert struct inpcb_iterator inpi = INP_ITERATOR(pcbinfo, INPLOOKUP_RLOCKPCB, 826db0ac6deSCy Schubert in6_multi_match, NULL); 8270ecd976eSBjoern A. Zeeb struct inpcb *inp; 82859854ecfSHans Petter Selasky struct in6_multi *inm; 82959854ecfSHans Petter Selasky struct in6_mfilter *imf; 830e43cc4aeSHajimu UMEMOTO struct ip6_moptions *im6o; 831e43cc4aeSHajimu UMEMOTO 832db0ac6deSCy Schubert IN6_MULTI_LOCK_ASSERT(); 833db0ac6deSCy Schubert 834db0ac6deSCy Schubert while ((inp = inp_next(&inpi)) != NULL) { 835db0ac6deSCy Schubert INP_RLOCK_ASSERT(inp); 836db0ac6deSCy Schubert 8370ecd976eSBjoern A. Zeeb im6o = inp->in6p_moptions; 838e43cc4aeSHajimu UMEMOTO /* 83933cde130SBruce M Simpson * Unselect the outgoing ifp for multicast if it 84033cde130SBruce M Simpson * is being detached. 841e43cc4aeSHajimu UMEMOTO */ 842e43cc4aeSHajimu UMEMOTO if (im6o->im6o_multicast_ifp == ifp) 843e43cc4aeSHajimu UMEMOTO im6o->im6o_multicast_ifp = NULL; 844e43cc4aeSHajimu UMEMOTO /* 845e43cc4aeSHajimu UMEMOTO * Drop multicast group membership if we joined 846e43cc4aeSHajimu UMEMOTO * through the interface being detached. 847e43cc4aeSHajimu UMEMOTO */ 84859854ecfSHans Petter Selasky restart: 84959854ecfSHans Petter Selasky IP6_MFILTER_FOREACH(imf, &im6o->im6o_head) { 85059854ecfSHans Petter Selasky if ((inm = imf->im6f_in6m) == NULL) 85159854ecfSHans Petter Selasky continue; 85259854ecfSHans Petter Selasky if (inm->in6m_ifp != ifp) 85359854ecfSHans Petter Selasky continue; 85459854ecfSHans Petter Selasky ip6_mfilter_remove(&im6o->im6o_head, imf); 85559854ecfSHans Petter Selasky in6_leavegroup_locked(inm, NULL); 85659854ecfSHans Petter Selasky ip6_mfilter_free(imf); 85759854ecfSHans Petter Selasky goto restart; 858e43cc4aeSHajimu UMEMOTO } 859e43cc4aeSHajimu UMEMOTO } 860e43cc4aeSHajimu UMEMOTO } 861e43cc4aeSHajimu UMEMOTO 86282cd038dSYoshinobu Inoue /* 86382cd038dSYoshinobu Inoue * Check for alternatives when higher level complains 86482cd038dSYoshinobu Inoue * about service problems. For now, invalidate cached 86582cd038dSYoshinobu Inoue * routing information. If the route was created dynamically 86682cd038dSYoshinobu Inoue * (by a redirect), time to try a default gateway again. 86782cd038dSYoshinobu Inoue */ 86882cd038dSYoshinobu Inoue void 869ec86402eSBjoern A. Zeeb in6_losing(struct inpcb *inp) 87082cd038dSYoshinobu Inoue { 8711272577eSXin LI 872ec86402eSBjoern A. Zeeb RO_INVALIDATE_CACHE(&inp->inp_route6); 87382cd038dSYoshinobu Inoue } 87482cd038dSYoshinobu Inoue 87582cd038dSYoshinobu Inoue /* 87682cd038dSYoshinobu Inoue * After a routing change, flush old routing 87782cd038dSYoshinobu Inoue * and allocate a (hopefully) better one. 87882cd038dSYoshinobu Inoue */ 8793ce144eaSJeffrey Hsu struct inpcb * 880ec86402eSBjoern A. Zeeb in6_rtchange(struct inpcb *inp, int errno __unused) 88182cd038dSYoshinobu Inoue { 88284cc0778SGeorge V. Neville-Neil 883ec86402eSBjoern A. Zeeb RO_INVALIDATE_CACHE(&inp->inp_route6); 8843ce144eaSJeffrey Hsu return inp; 88582cd038dSYoshinobu Inoue } 88682cd038dSYoshinobu Inoue 887d93ec8cbSMark Johnston static bool 888d93ec8cbSMark Johnston in6_pcblookup_lb_numa_match(const struct inpcblbgroup *grp, int domain) 889d93ec8cbSMark Johnston { 890d93ec8cbSMark Johnston return (domain == M_NODOM || domain == grp->il_numa_domain); 891d93ec8cbSMark Johnston } 892d93ec8cbSMark Johnston 8931a43cff9SSean Bruno static struct inpcb * 8941a43cff9SSean Bruno in6_pcblookup_lbgroup(const struct inpcbinfo *pcbinfo, 8954130ea61SMark Johnston const struct in6_addr *faddr, uint16_t fport, const struct in6_addr *laddr, 8964130ea61SMark Johnston uint16_t lport, uint8_t domain) 8971a43cff9SSean Bruno { 8981a43cff9SSean Bruno const struct inpcblbgrouphead *hdr; 8991a43cff9SSean Bruno struct inpcblbgroup *grp; 900d93ec8cbSMark Johnston struct inpcblbgroup *jail_exact, *jail_wild, *local_exact, *local_wild; 901a600aabeSMark Johnston struct inpcb *inp; 902a600aabeSMark Johnston u_int count; 9031a43cff9SSean Bruno 9041a43cff9SSean Bruno INP_HASH_LOCK_ASSERT(pcbinfo); 9051a43cff9SSean Bruno 9069d2877fcSMark Johnston hdr = &pcbinfo->ipi_lbgrouphashbase[ 9079d2877fcSMark Johnston INP_PCBPORTHASH(lport, pcbinfo->ipi_lbgrouphashmask)]; 9081a43cff9SSean Bruno 9091a43cff9SSean Bruno /* 910d93ec8cbSMark Johnston * Search for an LB group match based on the following criteria: 911d93ec8cbSMark Johnston * - prefer jailed groups to non-jailed groups 912d93ec8cbSMark Johnston * - prefer exact source address matches to wildcard matches 913d93ec8cbSMark Johnston * - prefer groups bound to the specified NUMA domain 9141a43cff9SSean Bruno */ 915d93ec8cbSMark Johnston jail_exact = jail_wild = local_exact = local_wild = NULL; 91654af3d0dSMark Johnston CK_LIST_FOREACH(grp, hdr, il_list) { 917d93ec8cbSMark Johnston bool injail; 918d93ec8cbSMark Johnston 9194b82a7b6SAndrew Gallatin #ifdef INET 9204b82a7b6SAndrew Gallatin if (!(grp->il_vflag & INP_IPV6)) 9214b82a7b6SAndrew Gallatin continue; 9224b82a7b6SAndrew Gallatin #endif 923d3a4b0daSMark Johnston if (grp->il_lport != lport) 924d3a4b0daSMark Johnston continue; 9251a43cff9SSean Bruno 926d93ec8cbSMark Johnston injail = prison_flag(grp->il_cred, PR_IP6) != 0; 927d93ec8cbSMark Johnston if (injail && prison_check_ip6_locked(grp->il_cred->cr_prison, 928d93ec8cbSMark Johnston laddr) != 0) 929d93ec8cbSMark Johnston continue; 930d93ec8cbSMark Johnston 931a034518aSAndrew Gallatin if (IN6_ARE_ADDR_EQUAL(&grp->il6_laddr, laddr)) { 932d93ec8cbSMark Johnston if (injail) { 933d93ec8cbSMark Johnston jail_exact = grp; 934d93ec8cbSMark Johnston if (in6_pcblookup_lb_numa_match(grp, domain)) 935d93ec8cbSMark Johnston /* This is a perfect match. */ 936d93ec8cbSMark Johnston goto out; 937d93ec8cbSMark Johnston } else if (local_exact == NULL || 938d93ec8cbSMark Johnston in6_pcblookup_lb_numa_match(grp, domain)) { 939d93ec8cbSMark Johnston local_exact = grp; 940a034518aSAndrew Gallatin } 9414130ea61SMark Johnston } else if (IN6_IS_ADDR_UNSPECIFIED(&grp->il6_laddr)) { 942d93ec8cbSMark Johnston if (injail) { 943d93ec8cbSMark Johnston if (jail_wild == NULL || 944d93ec8cbSMark Johnston in6_pcblookup_lb_numa_match(grp, domain)) 945d93ec8cbSMark Johnston jail_wild = grp; 946d93ec8cbSMark Johnston } else if (local_wild == NULL || 947d93ec8cbSMark Johnston in6_pcblookup_lb_numa_match(grp, domain)) { 948d93ec8cbSMark Johnston local_wild = grp; 949d93ec8cbSMark Johnston } 950d93ec8cbSMark Johnston } 951d93ec8cbSMark Johnston } 952d93ec8cbSMark Johnston 953d93ec8cbSMark Johnston if (jail_exact != NULL) 954d93ec8cbSMark Johnston grp = jail_exact; 955d93ec8cbSMark Johnston else if (jail_wild != NULL) 956d93ec8cbSMark Johnston grp = jail_wild; 957d93ec8cbSMark Johnston else if (local_exact != NULL) 958d93ec8cbSMark Johnston grp = local_exact; 959a034518aSAndrew Gallatin else 960d93ec8cbSMark Johnston grp = local_wild; 961d93ec8cbSMark Johnston if (grp == NULL) 962d93ec8cbSMark Johnston return (NULL); 963d93ec8cbSMark Johnston out: 964a600aabeSMark Johnston /* 965a600aabeSMark Johnston * Synchronize with in_pcblbgroup_insert(). 966a600aabeSMark Johnston */ 967a600aabeSMark Johnston count = atomic_load_acq_int(&grp->il_inpcnt); 968a600aabeSMark Johnston if (count == 0) 969a600aabeSMark Johnston return (NULL); 970a600aabeSMark Johnston inp = grp->il_inp[INP6_PCBLBGROUP_PKTHASH(faddr, lport, fport) % count]; 971a600aabeSMark Johnston KASSERT(inp != NULL, ("%s: inp == NULL", __func__)); 972a600aabeSMark Johnston return (inp); 9731a43cff9SSean Bruno } 9741a43cff9SSean Bruno 9753e98dcb3SMark Johnston static bool 9763e98dcb3SMark Johnston in6_pcblookup_exact_match(const struct inpcb *inp, const struct in6_addr *faddr, 9773e98dcb3SMark Johnston u_short fport, const struct in6_addr *laddr, u_short lport) 9783e98dcb3SMark Johnston { 9793e98dcb3SMark Johnston /* XXX inp locking */ 9803e98dcb3SMark Johnston if ((inp->inp_vflag & INP_IPV6) == 0) 9813e98dcb3SMark Johnston return (false); 9823e98dcb3SMark Johnston if (IN6_ARE_ADDR_EQUAL(&inp->in6p_faddr, faddr) && 9833e98dcb3SMark Johnston IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, laddr) && 9843e98dcb3SMark Johnston inp->inp_fport == fport && inp->inp_lport == lport) 9853e98dcb3SMark Johnston return (true); 9863e98dcb3SMark Johnston return (false); 9873e98dcb3SMark Johnston } 9883e98dcb3SMark Johnston 9894130ea61SMark Johnston static struct inpcb * 9907b92493aSMark Johnston in6_pcblookup_hash_exact(struct inpcbinfo *pcbinfo, 9917b92493aSMark Johnston const struct in6_addr *faddr, u_short fport, 9927b92493aSMark Johnston const struct in6_addr *laddr, u_short lport) 99382cd038dSYoshinobu Inoue { 99482cd038dSYoshinobu Inoue struct inpcbhead *head; 9953e98dcb3SMark Johnston struct inpcb *inp; 99668e0d7e0SRobert Watson 997fa046d87SRobert Watson INP_HASH_LOCK_ASSERT(pcbinfo); 9988deea4a8SRobert Watson 99982cd038dSYoshinobu Inoue /* 100082cd038dSYoshinobu Inoue * First look for an exact match. 100182cd038dSYoshinobu Inoue */ 1002fdb987beSMark Johnston head = &pcbinfo->ipi_hash_exact[INP6_PCBHASH(faddr, lport, fport, 1003a0577692SGleb Smirnoff pcbinfo->ipi_hashmask)]; 1004fdb987beSMark Johnston CK_LIST_FOREACH(inp, head, inp_hash_exact) { 10053e98dcb3SMark Johnston if (in6_pcblookup_exact_match(inp, faddr, fport, laddr, lport)) 100682cd038dSYoshinobu Inoue return (inp); 100782cd038dSYoshinobu Inoue } 10083e98dcb3SMark Johnston return (NULL); 10093e98dcb3SMark Johnston } 10103e98dcb3SMark Johnston 10113e98dcb3SMark Johnston typedef enum { 10123e98dcb3SMark Johnston INPLOOKUP_MATCH_NONE = 0, 10133e98dcb3SMark Johnston INPLOOKUP_MATCH_WILD = 1, 10143e98dcb3SMark Johnston INPLOOKUP_MATCH_LADDR = 2, 10153e98dcb3SMark Johnston } inp_lookup_match_t; 10163e98dcb3SMark Johnston 10173e98dcb3SMark Johnston static inp_lookup_match_t 10183e98dcb3SMark Johnston in6_pcblookup_wild_match(const struct inpcb *inp, const struct in6_addr *laddr, 10193e98dcb3SMark Johnston u_short lport) 10203e98dcb3SMark Johnston { 10213e98dcb3SMark Johnston /* XXX inp locking */ 10223e98dcb3SMark Johnston if ((inp->inp_vflag & INP_IPV6) == 0) 10233e98dcb3SMark Johnston return (INPLOOKUP_MATCH_NONE); 10243e98dcb3SMark Johnston if (!IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr) || 10253e98dcb3SMark Johnston inp->inp_lport != lport) 10263e98dcb3SMark Johnston return (INPLOOKUP_MATCH_NONE); 10273e98dcb3SMark Johnston if (IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr)) 10283e98dcb3SMark Johnston return (INPLOOKUP_MATCH_WILD); 10293e98dcb3SMark Johnston if (IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, laddr)) 10303e98dcb3SMark Johnston return (INPLOOKUP_MATCH_LADDR); 10313e98dcb3SMark Johnston return (INPLOOKUP_MATCH_NONE); 10324130ea61SMark Johnston } 103382cd038dSYoshinobu Inoue 10347b92493aSMark Johnston #define INP_LOOKUP_AGAIN ((struct inpcb *)(uintptr_t)-1) 10357b92493aSMark Johnston 10367b92493aSMark Johnston static struct inpcb * 10377b92493aSMark Johnston in6_pcblookup_hash_wild_smr(struct inpcbinfo *pcbinfo, 103821d7ac8cSMark Johnston const struct in6_addr *laddr, u_short lport, const inp_lookup_t lockflags) 10397b92493aSMark Johnston { 10407b92493aSMark Johnston struct inpcbhead *head; 10417b92493aSMark Johnston struct inpcb *inp; 10427b92493aSMark Johnston 10437b92493aSMark Johnston KASSERT(SMR_ENTERED(pcbinfo->ipi_smr), 10447b92493aSMark Johnston ("%s: not in SMR read section", __func__)); 10457b92493aSMark Johnston 10467b92493aSMark Johnston head = &pcbinfo->ipi_hash_wild[INP_PCBHASH_WILD(lport, 10477b92493aSMark Johnston pcbinfo->ipi_hashmask)]; 10487b92493aSMark Johnston CK_LIST_FOREACH(inp, head, inp_hash_wild) { 10497b92493aSMark Johnston inp_lookup_match_t match; 10507b92493aSMark Johnston 10517b92493aSMark Johnston match = in6_pcblookup_wild_match(inp, laddr, lport); 10527b92493aSMark Johnston if (match == INPLOOKUP_MATCH_NONE) 10537b92493aSMark Johnston continue; 10547b92493aSMark Johnston 10557b92493aSMark Johnston if (__predict_true(inp_smr_lock(inp, lockflags))) { 1056a306ed50SMark Johnston match = in6_pcblookup_wild_match(inp, laddr, lport); 1057a306ed50SMark Johnston if (match != INPLOOKUP_MATCH_NONE && 1058a306ed50SMark Johnston prison_check_ip6_locked(inp->inp_cred->cr_prison, 1059a306ed50SMark Johnston laddr) == 0) 10607b92493aSMark Johnston return (inp); 10617b92493aSMark Johnston inp_unlock(inp, lockflags); 10627b92493aSMark Johnston } 10637b92493aSMark Johnston 10647b92493aSMark Johnston /* 10657b92493aSMark Johnston * The matching socket disappeared out from under us. Fall back 10667b92493aSMark Johnston * to a serialized lookup. 10677b92493aSMark Johnston */ 10687b92493aSMark Johnston return (INP_LOOKUP_AGAIN); 10697b92493aSMark Johnston } 10707b92493aSMark Johnston return (NULL); 10717b92493aSMark Johnston } 10727b92493aSMark Johnston 10734130ea61SMark Johnston static struct inpcb * 10744130ea61SMark Johnston in6_pcblookup_hash_wild_locked(struct inpcbinfo *pcbinfo, 107521d7ac8cSMark Johnston const struct in6_addr *laddr, u_short lport) 10764130ea61SMark Johnston { 10774130ea61SMark Johnston struct inpcbhead *head; 10784130ea61SMark Johnston struct inpcb *inp, *jail_wild, *local_exact, *local_wild; 1079d93ec8cbSMark Johnston 10803e98dcb3SMark Johnston INP_HASH_LOCK_ASSERT(pcbinfo); 10813e98dcb3SMark Johnston 1082d93ec8cbSMark Johnston /* 1083413628a7SBjoern A. Zeeb * Order of socket selection - we always prefer jails. 1084413628a7SBjoern A. Zeeb * 1. jailed, non-wild. 1085413628a7SBjoern A. Zeeb * 2. jailed, wild. 1086413628a7SBjoern A. Zeeb * 3. non-jailed, non-wild. 1087413628a7SBjoern A. Zeeb * 4. non-jailed, wild. 1088413628a7SBjoern A. Zeeb */ 1089fdb987beSMark Johnston head = &pcbinfo->ipi_hash_wild[INP_PCBHASH_WILD(lport, 10901b44e5ffSAndrey V. Elsukov pcbinfo->ipi_hashmask)]; 10914130ea61SMark Johnston local_wild = local_exact = jail_wild = NULL; 1092fdb987beSMark Johnston CK_LIST_FOREACH(inp, head, inp_hash_wild) { 10933e98dcb3SMark Johnston inp_lookup_match_t match; 10944130ea61SMark Johnston bool injail; 10954130ea61SMark Johnston 10963e98dcb3SMark Johnston match = in6_pcblookup_wild_match(inp, laddr, lport); 10973e98dcb3SMark Johnston if (match == INPLOOKUP_MATCH_NONE) 109882cd038dSYoshinobu Inoue continue; 1099413628a7SBjoern A. Zeeb 11004130ea61SMark Johnston injail = prison_flag(inp->inp_cred, PR_IP6) != 0; 1101413628a7SBjoern A. Zeeb if (injail) { 1102185e659cSGleb Smirnoff if (prison_check_ip6_locked( 1103185e659cSGleb Smirnoff inp->inp_cred->cr_prison, laddr) != 0) 1104413628a7SBjoern A. Zeeb continue; 1105413628a7SBjoern A. Zeeb } else { 1106413628a7SBjoern A. Zeeb if (local_exact != NULL) 1107413628a7SBjoern A. Zeeb continue; 1108413628a7SBjoern A. Zeeb } 1109413628a7SBjoern A. Zeeb 11103e98dcb3SMark Johnston if (match == INPLOOKUP_MATCH_LADDR) { 1111413628a7SBjoern A. Zeeb if (injail) 111282cd038dSYoshinobu Inoue return (inp); 1113413628a7SBjoern A. Zeeb else 1114413628a7SBjoern A. Zeeb local_exact = inp; 11153e98dcb3SMark Johnston } else { 1116413628a7SBjoern A. Zeeb if (injail) 1117413628a7SBjoern A. Zeeb jail_wild = inp; 1118413628a7SBjoern A. Zeeb else 111982cd038dSYoshinobu Inoue local_wild = inp; 112082cd038dSYoshinobu Inoue } 11214130ea61SMark Johnston } 1122413628a7SBjoern A. Zeeb 1123413628a7SBjoern A. Zeeb if (jail_wild != NULL) 1124413628a7SBjoern A. Zeeb return (jail_wild); 1125413628a7SBjoern A. Zeeb if (local_exact != NULL) 1126413628a7SBjoern A. Zeeb return (local_exact); 1127413628a7SBjoern A. Zeeb if (local_wild != NULL) 112882cd038dSYoshinobu Inoue return (local_wild); 112982cd038dSYoshinobu Inoue return (NULL); 113082cd038dSYoshinobu Inoue } 113182cd038dSYoshinobu Inoue 11324130ea61SMark Johnston struct inpcb * 11337b92493aSMark Johnston in6_pcblookup_hash_locked(struct inpcbinfo *pcbinfo, 11347b92493aSMark Johnston const struct in6_addr *faddr, u_int fport_arg, 11357b92493aSMark Johnston const struct in6_addr *laddr, u_int lport_arg, 11364130ea61SMark Johnston int lookupflags, uint8_t numa_domain) 11374130ea61SMark Johnston { 11384130ea61SMark Johnston struct inpcb *inp; 11394130ea61SMark Johnston u_short fport = fport_arg, lport = lport_arg; 11404130ea61SMark Johnston 11414130ea61SMark Johnston KASSERT((lookupflags & ~INPLOOKUP_WILDCARD) == 0, 11424130ea61SMark Johnston ("%s: invalid lookup flags %d", __func__, lookupflags)); 11434130ea61SMark Johnston KASSERT(!IN6_IS_ADDR_UNSPECIFIED(faddr), 11444130ea61SMark Johnston ("%s: invalid foreign address", __func__)); 11454130ea61SMark Johnston KASSERT(!IN6_IS_ADDR_UNSPECIFIED(laddr), 11464130ea61SMark Johnston ("%s: invalid local address", __func__)); 11474130ea61SMark Johnston INP_HASH_LOCK_ASSERT(pcbinfo); 11484130ea61SMark Johnston 11494130ea61SMark Johnston inp = in6_pcblookup_hash_exact(pcbinfo, faddr, fport, laddr, lport); 11504130ea61SMark Johnston if (inp != NULL) 11514130ea61SMark Johnston return (inp); 11524130ea61SMark Johnston 11534130ea61SMark Johnston if ((lookupflags & INPLOOKUP_WILDCARD) != 0) { 11544130ea61SMark Johnston inp = in6_pcblookup_lbgroup(pcbinfo, faddr, fport, laddr, 11554130ea61SMark Johnston lport, numa_domain); 11564130ea61SMark Johnston if (inp == NULL) { 115721d7ac8cSMark Johnston inp = in6_pcblookup_hash_wild_locked(pcbinfo, 115821d7ac8cSMark Johnston laddr, lport); 11594130ea61SMark Johnston } 11604130ea61SMark Johnston } 11614130ea61SMark Johnston return (inp); 11624130ea61SMark Johnston } 11634130ea61SMark Johnston 1164fa046d87SRobert Watson static struct inpcb * 11657b92493aSMark Johnston in6_pcblookup_hash(struct inpcbinfo *pcbinfo, const struct in6_addr *faddr, 11667b92493aSMark Johnston u_int fport, const struct in6_addr *laddr, u_int lport, int lookupflags, 11674130ea61SMark Johnston uint8_t numa_domain) 1168fa046d87SRobert Watson { 1169fa046d87SRobert Watson struct inpcb *inp; 11707b92493aSMark Johnston const inp_lookup_t lockflags = lookupflags & INPLOOKUP_LOCKMASK; 11717b92493aSMark Johnston 11727b92493aSMark Johnston KASSERT((lookupflags & (INPLOOKUP_RLOCKPCB | INPLOOKUP_WLOCKPCB)) != 0, 11737b92493aSMark Johnston ("%s: LOCKPCB not set", __func__)); 11747b92493aSMark Johnston 11757b92493aSMark Johnston INP_HASH_WLOCK(pcbinfo); 11767b92493aSMark Johnston inp = in6_pcblookup_hash_locked(pcbinfo, faddr, fport, laddr, lport, 11777b92493aSMark Johnston lookupflags & ~INPLOOKUP_LOCKMASK, numa_domain); 11787b92493aSMark Johnston if (inp != NULL && !inp_trylock(inp, lockflags)) { 11797b92493aSMark Johnston in_pcbref(inp); 11807b92493aSMark Johnston INP_HASH_WUNLOCK(pcbinfo); 11817b92493aSMark Johnston inp_lock(inp, lockflags); 11827b92493aSMark Johnston if (in_pcbrele(inp, lockflags)) 11837b92493aSMark Johnston /* XXX-MJ or retry until we get a negative match? */ 11847b92493aSMark Johnston inp = NULL; 11857b92493aSMark Johnston } else { 11867b92493aSMark Johnston INP_HASH_WUNLOCK(pcbinfo); 11877b92493aSMark Johnston } 11887b92493aSMark Johnston return (inp); 11897b92493aSMark Johnston } 11907b92493aSMark Johnston 11917b92493aSMark Johnston static struct inpcb * 119252ef944bSMark Johnston in6_pcblookup_hash_smr(struct inpcbinfo *pcbinfo, const struct in6_addr *faddr, 119352ef944bSMark Johnston u_int fport_arg, const struct in6_addr *laddr, u_int lport_arg, 119452ef944bSMark Johnston int lookupflags, uint8_t numa_domain) 11957b92493aSMark Johnston { 11967b92493aSMark Johnston struct inpcb *inp; 11977b92493aSMark Johnston const inp_lookup_t lockflags = lookupflags & INPLOOKUP_LOCKMASK; 11987b92493aSMark Johnston const u_short fport = fport_arg, lport = lport_arg; 1199fa046d87SRobert Watson 1200675e2618SMark Johnston KASSERT((lookupflags & ~INPLOOKUP_MASK) == 0, 1201675e2618SMark Johnston ("%s: invalid lookup flags %d", __func__, lookupflags)); 1202675e2618SMark Johnston KASSERT((lookupflags & (INPLOOKUP_RLOCKPCB | INPLOOKUP_WLOCKPCB)) != 0, 1203675e2618SMark Johnston ("%s: LOCKPCB not set", __func__)); 1204675e2618SMark Johnston 1205db0ac6deSCy Schubert smr_enter(pcbinfo->ipi_smr); 12067b92493aSMark Johnston inp = in6_pcblookup_hash_exact(pcbinfo, faddr, fport, laddr, lport); 1207fa046d87SRobert Watson if (inp != NULL) { 12087b92493aSMark Johnston if (__predict_true(inp_smr_lock(inp, lockflags))) { 12097b92493aSMark Johnston if (__predict_true(in6_pcblookup_exact_match(inp, 12107b92493aSMark Johnston faddr, fport, laddr, lport))) 12117b92493aSMark Johnston return (inp); 12127b92493aSMark Johnston inp_unlock(inp, lockflags); 12137b92493aSMark Johnston } 12147b92493aSMark Johnston /* 12157b92493aSMark Johnston * We failed to lock the inpcb, or its connection state changed 12167b92493aSMark Johnston * out from under us. Fall back to a precise search. 12177b92493aSMark Johnston */ 12187b92493aSMark Johnston return (in6_pcblookup_hash(pcbinfo, faddr, fport, laddr, lport, 12197b92493aSMark Johnston lookupflags, numa_domain)); 12207b92493aSMark Johnston } 12217b92493aSMark Johnston 12227b92493aSMark Johnston if ((lookupflags & INPLOOKUP_WILDCARD) != 0) { 12237b92493aSMark Johnston inp = in6_pcblookup_lbgroup(pcbinfo, faddr, fport, 12247b92493aSMark Johnston laddr, lport, numa_domain); 12257b92493aSMark Johnston if (inp != NULL) { 12267b92493aSMark Johnston if (__predict_true(inp_smr_lock(inp, lockflags))) { 12277b92493aSMark Johnston if (__predict_true(in6_pcblookup_wild_match(inp, 12287b92493aSMark Johnston laddr, lport) != INPLOOKUP_MATCH_NONE)) 12297b92493aSMark Johnston return (inp); 12307b92493aSMark Johnston inp_unlock(inp, lockflags); 12317b92493aSMark Johnston } 12327b92493aSMark Johnston inp = INP_LOOKUP_AGAIN; 12337b92493aSMark Johnston } else { 123421d7ac8cSMark Johnston inp = in6_pcblookup_hash_wild_smr(pcbinfo, laddr, lport, 123521d7ac8cSMark Johnston lockflags); 12367b92493aSMark Johnston } 12377b92493aSMark Johnston if (inp == INP_LOOKUP_AGAIN) { 12387b92493aSMark Johnston return (in6_pcblookup_hash(pcbinfo, faddr, fport, laddr, 12397b92493aSMark Johnston lport, lookupflags, numa_domain)); 12407b92493aSMark Johnston } 12417b92493aSMark Johnston } 12427b92493aSMark Johnston 12437b92493aSMark Johnston if (inp == NULL) 1244db0ac6deSCy Schubert smr_exit(pcbinfo->ipi_smr); 1245db0ac6deSCy Schubert 1246fa046d87SRobert Watson return (inp); 1247fa046d87SRobert Watson } 1248fa046d87SRobert Watson 1249fa046d87SRobert Watson /* 1250d3c1f003SRobert Watson * Public inpcb lookup routines, accepting a 4-tuple, and optionally, an mbuf 1251d3c1f003SRobert Watson * from which a pre-calculated hash value may be extracted. 1252fa046d87SRobert Watson */ 1253fa046d87SRobert Watson struct inpcb * 125452ef944bSMark Johnston in6_pcblookup(struct inpcbinfo *pcbinfo, const struct in6_addr *faddr, 125552ef944bSMark Johnston u_int fport, const struct in6_addr *laddr, u_int lport, int lookupflags, 12564130ea61SMark Johnston struct ifnet *ifp __unused) 1257fa046d87SRobert Watson { 12584130ea61SMark Johnston return (in6_pcblookup_hash_smr(pcbinfo, faddr, fport, laddr, lport, 12594130ea61SMark Johnston lookupflags, M_NODOM)); 1260d3c1f003SRobert Watson } 1261d3c1f003SRobert Watson 1262d3c1f003SRobert Watson struct inpcb * 126352ef944bSMark Johnston in6_pcblookup_mbuf(struct inpcbinfo *pcbinfo, const struct in6_addr *faddr, 126452ef944bSMark Johnston u_int fport, const struct in6_addr *laddr, u_int lport, int lookupflags, 12654130ea61SMark Johnston struct ifnet *ifp __unused, struct mbuf *m) 1266d3c1f003SRobert Watson { 12674130ea61SMark Johnston return (in6_pcblookup_hash_smr(pcbinfo, faddr, fport, laddr, lport, 12684130ea61SMark Johnston lookupflags, m->m_pkthdr.numa_domain)); 1269fa046d87SRobert Watson } 1270fa046d87SRobert Watson 127182cd038dSYoshinobu Inoue void 1272dce33a45SErmal Luçi init_sin6(struct sockaddr_in6 *sin6, struct mbuf *m, int srcordst) 127382cd038dSYoshinobu Inoue { 127482cd038dSYoshinobu Inoue struct ip6_hdr *ip; 127582cd038dSYoshinobu Inoue 127682cd038dSYoshinobu Inoue ip = mtod(m, struct ip6_hdr *); 127782cd038dSYoshinobu Inoue bzero(sin6, sizeof(*sin6)); 127882cd038dSYoshinobu Inoue sin6->sin6_len = sizeof(*sin6); 127982cd038dSYoshinobu Inoue sin6->sin6_family = AF_INET6; 1280dce33a45SErmal Luçi sin6->sin6_addr = srcordst ? ip->ip6_dst : ip->ip6_src; 1281a1f7e5f8SHajimu UMEMOTO 1282a1f7e5f8SHajimu UMEMOTO (void)sa6_recoverscope(sin6); /* XXX: should catch errors... */ 128382cd038dSYoshinobu Inoue 128482cd038dSYoshinobu Inoue return; 128582cd038dSYoshinobu Inoue } 1286