xref: /csrg-svn/sys/netinet/in_pcb.c (revision 58998)
123177Smckusick /*
248464Skarels  * Copyright (c) 1982, 1986, 1991 Regents of the University of California.
332787Sbostic  * All rights reserved.
423177Smckusick  *
544475Sbostic  * %sccs.include.redist.c%
632787Sbostic  *
7*58998Ssklower  *	@(#)in_pcb.c	7.26 (Berkeley) 04/07/93
823177Smckusick  */
94905Swnj 
1056531Sbostic #include <sys/param.h>
1156531Sbostic #include <sys/systm.h>
1256531Sbostic #include <sys/malloc.h>
1356531Sbostic #include <sys/mbuf.h>
1456531Sbostic #include <sys/protosw.h>
1556531Sbostic #include <sys/socket.h>
1656531Sbostic #include <sys/socketvar.h>
1756531Sbostic #include <sys/ioctl.h>
1856531Sbostic #include <sys/errno.h>
1948464Skarels 
2056531Sbostic #include <net/if.h>
2156531Sbostic #include <net/route.h>
2248464Skarels 
2356531Sbostic #include <netinet/in.h>
2456531Sbostic #include <netinet/in_systm.h>
2556531Sbostic #include <netinet/ip.h>
2656531Sbostic #include <netinet/in_pcb.h>
2756531Sbostic #include <netinet/in_var.h>
284905Swnj 
2956531Sbostic #include <netinet/ip_var.h>
3054716Ssklower 
/*
 * Internet address with no initializer, so it has static storage and
 * starts out all-zero.  in_pcbbind() below passes it to in_pcblookup()
 * as the foreign address, i.e. as "no foreign address specified".
 * Nothing in this file assigns to it.
 */
315240Sroot struct	in_addr zeroin_addr;
325161Swnj 
337506Sroot in_pcballoc(so, head)
347506Sroot 	struct socket *so;
357506Sroot 	struct inpcb *head;
367506Sroot {
377506Sroot 	struct mbuf *m;
387506Sroot 	register struct inpcb *inp;
397506Sroot 
4054716Ssklower 	MALLOC(inp, struct inpcb *, sizeof(*inp), M_PCB, M_WAITOK);
4154716Ssklower 	if (inp == NULL)
427506Sroot 		return (ENOBUFS);
4354716Ssklower 	bzero((caddr_t)inp, sizeof(*inp));
447506Sroot 	inp->inp_head = head;
457506Sroot 	inp->inp_socket = so;
467506Sroot 	insque(inp, head);
477506Sroot 	so->so_pcb = (caddr_t)inp;
487506Sroot 	return (0);
497506Sroot }
507506Sroot 
518270Sroot in_pcbbind(inp, nam)
527506Sroot 	register struct inpcb *inp;
538270Sroot 	struct mbuf *nam;
547506Sroot {
557506Sroot 	register struct socket *so = inp->inp_socket;
567506Sroot 	register struct inpcb *head = inp->inp_head;
578270Sroot 	register struct sockaddr_in *sin;
587506Sroot 	u_short lport = 0;
5958373Smckusick 	int wild = 0;
607506Sroot 
6118374Skarels 	if (in_ifaddr == 0)
627506Sroot 		return (EADDRNOTAVAIL);
6310141Ssam 	if (inp->inp_lport || inp->inp_laddr.s_addr != INADDR_ANY)
648270Sroot 		return (EINVAL);
6558373Smckusick 	if ((so->so_options & SO_REUSEADDR) == 0 &&
6658373Smckusick 	    ((so->so_proto->pr_flags & PR_CONNREQUIRED) == 0 ||
6758373Smckusick 	     (so->so_options & SO_ACCEPTCONN) == 0))
6858373Smckusick 		wild = INPLOOKUP_WILDCARD;
698270Sroot 	if (nam == 0)
708270Sroot 		goto noname;
718270Sroot 	sin = mtod(nam, struct sockaddr_in *);
728270Sroot 	if (nam->m_len != sizeof (*sin))
738270Sroot 		return (EINVAL);
7410141Ssam 	if (sin->sin_addr.s_addr != INADDR_ANY) {
758270Sroot 		int tport = sin->sin_port;
767506Sroot 
778270Sroot 		sin->sin_port = 0;		/* yech... */
7818374Skarels 		if (ifa_ifwithaddr((struct sockaddr *)sin) == 0)
798270Sroot 			return (EADDRNOTAVAIL);
808270Sroot 		sin->sin_port = tport;
817506Sroot 	}
828270Sroot 	lport = sin->sin_port;
838270Sroot 	if (lport) {
8455347Ssklower 		struct inpcb *t;
8517429Skarels 		u_short aport = ntohs(lport);
867506Sroot 
878270Sroot 		/* GROSS */
8848464Skarels 		if (aport < IPPORT_RESERVED && (so->so_state & SS_PRIV) == 0)
898270Sroot 			return (EACCES);
9055347Ssklower 		t = in_pcblookup(head, zeroin_addr, 0,
9155352Ssklower 				sin->sin_addr, lport, wild);
9255347Ssklower 		if (t && !((so->so_options & t->inp_socket->so_options) &
9355347Ssklower 		    SO_REUSEPORT))
948270Sroot 			return (EADDRINUSE);
954951Swnj 	}
968270Sroot 	inp->inp_laddr = sin->sin_addr;
978270Sroot noname:
985172Swnj 	if (lport == 0)
995172Swnj 		do {
10026025Skarels 			if (head->inp_lport++ < IPPORT_RESERVED ||
10126025Skarels 			    head->inp_lport > IPPORT_USERRESERVED)
1025994Swnj 				head->inp_lport = IPPORT_RESERVED;
1035172Swnj 			lport = htons(head->inp_lport);
1045994Swnj 		} while (in_pcblookup(head,
10558373Smckusick 			    zeroin_addr, 0, inp->inp_laddr, lport, wild));
1065172Swnj 	inp->inp_lport = lport;
1074951Swnj 	return (0);
1084905Swnj }
1094905Swnj 
1106116Swnj /*
1116116Swnj  * Connect from a socket to a specified address.
1126116Swnj  * Both address and port must be specified in argument sin.
1136116Swnj  * If don't have a local address for this socket yet,
1146116Swnj  * then pick one.
1156116Swnj  */
1168270Sroot in_pcbconnect(inp, nam)
11731976Skarels 	register struct inpcb *inp;
1188270Sroot 	struct mbuf *nam;
1194923Swnj {
12018374Skarels 	struct in_ifaddr *ia;
1216338Ssam 	struct sockaddr_in *ifaddr;
1228270Sroot 	register struct sockaddr_in *sin = mtod(nam, struct sockaddr_in *);
1234923Swnj 
1248270Sroot 	if (nam->m_len != sizeof (*sin))
1258270Sroot 		return (EINVAL);
1264951Swnj 	if (sin->sin_family != AF_INET)
1274951Swnj 		return (EAFNOSUPPORT);
12818374Skarels 	if (sin->sin_port == 0)
1294951Swnj 		return (EADDRNOTAVAIL);
13018374Skarels 	if (in_ifaddr) {
13118655Skarels 		/*
13218655Skarels 		 * If the destination address is INADDR_ANY,
13318655Skarels 		 * use the primary local address.
13418655Skarels 		 * If the supplied address is INADDR_BROADCAST,
13518655Skarels 		 * and the primary interface supports broadcast,
13618655Skarels 		 * choose the broadcast address for that interface.
13718655Skarels 		 */
13818374Skarels #define	satosin(sa)	((struct sockaddr_in *)(sa))
139*58998Ssklower #define sintosa(sin)	((struct sockaddr *)(sin))
140*58998Ssklower #define ifatoia(ifa)	((struct in_ifaddr *)(ifa))
14118374Skarels 		if (sin->sin_addr.s_addr == INADDR_ANY)
14218655Skarels 		    sin->sin_addr = IA_SIN(in_ifaddr)->sin_addr;
14324807Skarels 		else if (sin->sin_addr.s_addr == (u_long)INADDR_BROADCAST &&
14418655Skarels 		  (in_ifaddr->ia_ifp->if_flags & IFF_BROADCAST))
14518655Skarels 		    sin->sin_addr = satosin(&in_ifaddr->ia_broadaddr)->sin_addr;
14618374Skarels 	}
14710141Ssam 	if (inp->inp_laddr.s_addr == INADDR_ANY) {
14827262Skarels 		register struct route *ro;
14917271Skarels 
15027262Skarels 		ia = (struct in_ifaddr *)0;
15127262Skarels 		/*
15227262Skarels 		 * If route is known or can be allocated now,
15327262Skarels 		 * our src addr is taken from the i/f, else punt.
15427262Skarels 		 */
15527262Skarels 		ro = &inp->inp_route;
15627262Skarels 		if (ro->ro_rt &&
15730336Skarels 		    (satosin(&ro->ro_dst)->sin_addr.s_addr !=
15830336Skarels 			sin->sin_addr.s_addr ||
15930336Skarels 		    inp->inp_socket->so_options & SO_DONTROUTE)) {
16027262Skarels 			RTFREE(ro->ro_rt);
16127262Skarels 			ro->ro_rt = (struct rtentry *)0;
1626338Ssam 		}
16328847Skarels 		if ((inp->inp_socket->so_options & SO_DONTROUTE) == 0 && /*XXX*/
16428847Skarels 		    (ro->ro_rt == (struct rtentry *)0 ||
16529826Skarels 		    ro->ro_rt->rt_ifp == (struct ifnet *)0)) {
16627262Skarels 			/* No route yet, so try to acquire one */
16727262Skarels 			ro->ro_dst.sa_family = AF_INET;
16837471Ssklower 			ro->ro_dst.sa_len = sizeof(struct sockaddr_in);
16927262Skarels 			((struct sockaddr_in *) &ro->ro_dst)->sin_addr =
17027262Skarels 				sin->sin_addr;
17127262Skarels 			rtalloc(ro);
17227262Skarels 		}
17329826Skarels 		/*
17429826Skarels 		 * If we found a route, use the address
17529826Skarels 		 * corresponding to the outgoing interface
17629826Skarels 		 * unless it is the loopback (in case a route
17729826Skarels 		 * to our address on another net goes to loopback).
17829826Skarels 		 */
179*58998Ssklower 		if (ro->ro_rt && !(ro->ro_rt->rt_ifp->if_flags & IFF_LOOPBACK))
180*58998Ssklower 			ia = ifatoia(ro->ro_rt->rt_ifa);
18128847Skarels 		if (ia == 0) {
18230336Skarels 			int fport = sin->sin_port;
18330336Skarels 
18430336Skarels 			sin->sin_port = 0;
185*58998Ssklower 			ia = ifatoia(ifa_ifwithdstaddr(sintosa(sin)));
186*58998Ssklower 			if (ia == 0)
187*58998Ssklower 				ia = ifatoia(ifa_ifwithnet(sintosa(sin)));
18830336Skarels 			sin->sin_port = fport;
18928847Skarels 			if (ia == 0)
19028847Skarels 				ia = in_ifaddr;
19128847Skarels 			if (ia == 0)
19228847Skarels 				return (EADDRNOTAVAIL);
19327262Skarels 		}
19454716Ssklower 		/*
19554716Ssklower 		 * If the destination address is multicast and an outgoing
19654716Ssklower 		 * interface has been set as a multicast option, use the
19754716Ssklower 		 * address of that interface as our source address.
19854716Ssklower 		 */
19954716Ssklower 		if (IN_MULTICAST(ntohl(sin->sin_addr.s_addr)) &&
20054716Ssklower 		    inp->inp_moptions != NULL) {
20154716Ssklower 			struct ip_moptions *imo;
202*58998Ssklower 			struct ifnet *ifp;
20354716Ssklower 
20454716Ssklower 			imo = inp->inp_moptions;
20554716Ssklower 			if (imo->imo_multicast_ifp != NULL) {
20654716Ssklower 				ifp = imo->imo_multicast_ifp;
20754716Ssklower 				for (ia = in_ifaddr; ia; ia = ia->ia_next)
20854716Ssklower 					if (ia->ia_ifp == ifp)
20954716Ssklower 						break;
21054716Ssklower 				if (ia == 0)
21154716Ssklower 					return (EADDRNOTAVAIL);
21254716Ssklower 			}
21354716Ssklower 		}
21418374Skarels 		ifaddr = (struct sockaddr_in *)&ia->ia_addr;
2155994Swnj 	}
2165994Swnj 	if (in_pcblookup(inp->inp_head,
2176116Swnj 	    sin->sin_addr,
2186116Swnj 	    sin->sin_port,
2196338Ssam 	    inp->inp_laddr.s_addr ? inp->inp_laddr : ifaddr->sin_addr,
2206116Swnj 	    inp->inp_lport,
2216116Swnj 	    0))
2225172Swnj 		return (EADDRINUSE);
22314146Ssam 	if (inp->inp_laddr.s_addr == INADDR_ANY) {
22414146Ssam 		if (inp->inp_lport == 0)
22526382Skarels 			(void)in_pcbbind(inp, (struct mbuf *)0);
2266338Ssam 		inp->inp_laddr = ifaddr->sin_addr;
22714146Ssam 	}
2284951Swnj 	inp->inp_faddr = sin->sin_addr;
2294951Swnj 	inp->inp_fport = sin->sin_port;
2304923Swnj 	return (0);
2314923Swnj }
2324923Swnj 
2335161Swnj in_pcbdisconnect(inp)
2344905Swnj 	struct inpcb *inp;
2354905Swnj {
2365161Swnj 
23710141Ssam 	inp->inp_faddr.s_addr = INADDR_ANY;
2386028Sroot 	inp->inp_fport = 0;
2397506Sroot 	if (inp->inp_socket->so_state & SS_NOFDREF)
2405161Swnj 		in_pcbdetach(inp);
2415161Swnj }
2425161Swnj 
2435161Swnj in_pcbdetach(inp)
2445161Swnj 	struct inpcb *inp;
2455161Swnj {
2464905Swnj 	struct socket *so = inp->inp_socket;
2474905Swnj 
2485009Swnj 	so->so_pcb = 0;
2495009Swnj 	sofree(so);
25024807Skarels 	if (inp->inp_options)
25126382Skarels 		(void)m_free(inp->inp_options);
2526350Ssam 	if (inp->inp_route.ro_rt)
2536367Ssam 		rtfree(inp->inp_route.ro_rt);
25454716Ssklower 	ip_freemoptions(inp->inp_moptions);
2554983Swnj 	remque(inp);
25654716Ssklower 	FREE(inp, M_PCB);
2574905Swnj }
2584905Swnj 
2598270Sroot in_setsockaddr(inp, nam)
2606509Ssam 	register struct inpcb *inp;
2618270Sroot 	struct mbuf *nam;
2626509Ssam {
26332071Skarels 	register struct sockaddr_in *sin;
2648270Sroot 
2658270Sroot 	nam->m_len = sizeof (*sin);
2668270Sroot 	sin = mtod(nam, struct sockaddr_in *);
2676509Ssam 	bzero((caddr_t)sin, sizeof (*sin));
2686509Ssam 	sin->sin_family = AF_INET;
26937471Ssklower 	sin->sin_len = sizeof(*sin);
2706509Ssam 	sin->sin_port = inp->inp_lport;
2716509Ssam 	sin->sin_addr = inp->inp_laddr;
2726509Ssam }
2736509Ssam 
27414123Ssam in_setpeeraddr(inp, nam)
27531976Skarels 	struct inpcb *inp;
27614123Ssam 	struct mbuf *nam;
27714123Ssam {
27832071Skarels 	register struct sockaddr_in *sin;
27914123Ssam 
28014123Ssam 	nam->m_len = sizeof (*sin);
28114123Ssam 	sin = mtod(nam, struct sockaddr_in *);
28214123Ssam 	bzero((caddr_t)sin, sizeof (*sin));
28314123Ssam 	sin->sin_family = AF_INET;
28437471Ssklower 	sin->sin_len = sizeof(*sin);
28514123Ssam 	sin->sin_port = inp->inp_fport;
28614123Ssam 	sin->sin_addr = inp->inp_faddr;
28714123Ssam }
28814123Ssam 
2895161Swnj /*
29017357Skarels  * Pass some notification to all connections of a protocol
29140692Skarels  * associated with address dst.  The local address and/or port numbers
29240692Skarels  * may be specified to limit the search.  The "usual action" will be
29340692Skarels  * taken, depending on the ctlinput cmd.  The caller must filter any
29440692Skarels  * cmds that are uninteresting (e.g., no error in the map).
29540692Skarels  * Call the protocol specific routine (if any) to report
29640692Skarels  * any errors for each matching socket.
29740692Skarels  *
29840692Skarels  * Must be called at splnet.
2996583Ssam  */
30040692Skarels in_pcbnotify(head, dst, fport, laddr, lport, cmd, notify)
3016583Ssam 	struct inpcb *head;
30240692Skarels 	struct sockaddr *dst;
30340692Skarels 	u_short fport, lport;
30440692Skarels 	struct in_addr laddr;
30540692Skarels 	int cmd, (*notify)();
3066583Ssam {
3076583Ssam 	register struct inpcb *inp, *oinp;
30840692Skarels 	struct in_addr faddr;
30940692Skarels 	int errno;
31040692Skarels 	int in_rtchange();
31140692Skarels 	extern u_char inetctlerrmap[];
3126583Ssam 
31340692Skarels 	if ((unsigned)cmd > PRC_NCMDS || dst->sa_family != AF_INET)
31440692Skarels 		return;
31540692Skarels 	faddr = ((struct sockaddr_in *)dst)->sin_addr;
31640692Skarels 	if (faddr.s_addr == INADDR_ANY)
31740692Skarels 		return;
31840692Skarels 
31940692Skarels 	/*
32040692Skarels 	 * Redirects go to all references to the destination,
32140692Skarels 	 * and use in_rtchange to invalidate the route cache.
32240692Skarels 	 * Dead host indications: notify all references to the destination.
32340692Skarels 	 * Otherwise, if we have knowledge of the local port and address,
32440692Skarels 	 * deliver only to that socket.
32540692Skarels 	 */
32640692Skarels 	if (PRC_IS_REDIRECT(cmd) || cmd == PRC_HOSTDEAD) {
32740692Skarels 		fport = 0;
32840692Skarels 		lport = 0;
32940692Skarels 		laddr.s_addr = 0;
33040692Skarels 		if (cmd != PRC_HOSTDEAD)
33140692Skarels 			notify = in_rtchange;
33240692Skarels 	}
33340692Skarels 	errno = inetctlerrmap[cmd];
3346583Ssam 	for (inp = head->inp_next; inp != head;) {
33540692Skarels 		if (inp->inp_faddr.s_addr != faddr.s_addr ||
33640692Skarels 		    inp->inp_socket == 0 ||
33740692Skarels 		    (lport && inp->inp_lport != lport) ||
33840692Skarels 		    (laddr.s_addr && inp->inp_laddr.s_addr != laddr.s_addr) ||
33940692Skarels 		    (fport && inp->inp_fport != fport)) {
3406583Ssam 			inp = inp->inp_next;
3416583Ssam 			continue;
3426583Ssam 		}
3436583Ssam 		oinp = inp;
3446583Ssam 		inp = inp->inp_next;
34524807Skarels 		if (notify)
34644381Skarels 			(*notify)(oinp, errno);
3476583Ssam 	}
3486583Ssam }
3496583Ssam 
35017357Skarels /*
35125508Skarels  * Check for alternatives when higher level complains
35225508Skarels  * about service problems.  For now, invalidate cached
35325508Skarels  * routing information.  If the route was created dynamically
35425508Skarels  * (by a redirect), time to try a default gateway again.
35525508Skarels  */
35625508Skarels in_losing(inp)
35725508Skarels 	struct inpcb *inp;
35825508Skarels {
35925508Skarels 	register struct rtentry *rt;
36052555Ssklower 	struct rt_addrinfo info;
36125508Skarels 
36225508Skarels 	if ((rt = inp->inp_route.ro_rt)) {
36355543Ssklower 		inp->inp_route.ro_rt = 0;
36452555Ssklower 		bzero((caddr_t)&info, sizeof(info));
36552555Ssklower 		info.rti_info[RTAX_DST] =
36652555Ssklower 			(struct sockaddr *)&inp->inp_route.ro_dst;
36752555Ssklower 		info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
36852555Ssklower 		info.rti_info[RTAX_NETMASK] = rt_mask(rt);
36952555Ssklower 		rt_missmsg(RTM_LOSING, &info, rt->rt_flags, 0);
37025508Skarels 		if (rt->rt_flags & RTF_DYNAMIC)
37137471Ssklower 			(void) rtrequest(RTM_DELETE, rt_key(rt),
37237471Ssklower 				rt->rt_gateway, rt_mask(rt), rt->rt_flags,
37337471Ssklower 				(struct rtentry **)0);
37455543Ssklower 		else
37525508Skarels 		/*
37625508Skarels 		 * A new route can be allocated
37725508Skarels 		 * the next time output is attempted.
37825508Skarels 		 */
37955543Ssklower 			rtfree(rt);
38025508Skarels 	}
38125508Skarels }
38225508Skarels 
38325508Skarels /*
38417357Skarels  * After a routing change, flush old routing
38517357Skarels  * and allocate a (hopefully) better one.
38617357Skarels  */
38717357Skarels in_rtchange(inp)
38825508Skarels 	register struct inpcb *inp;
38917357Skarels {
39017357Skarels 	if (inp->inp_route.ro_rt) {
39117357Skarels 		rtfree(inp->inp_route.ro_rt);
39217357Skarels 		inp->inp_route.ro_rt = 0;
39317357Skarels 		/*
39417357Skarels 		 * A new route can be allocated the next time
39517357Skarels 		 * output is attempted.
39617357Skarels 		 */
39717357Skarels 	}
39817357Skarels }
39917357Skarels 
4004907Swnj struct inpcb *
4016028Sroot in_pcblookup(head, faddr, fport, laddr, lport, flags)
4024905Swnj 	struct inpcb *head;
4034951Swnj 	struct in_addr faddr, laddr;
4044905Swnj 	u_short fport, lport;
4056028Sroot 	int flags;
4064905Swnj {
4075994Swnj 	register struct inpcb *inp, *match = 0;
4085994Swnj 	int matchwild = 3, wildcard;
4094905Swnj 
4105161Swnj 	for (inp = head->inp_next; inp != head; inp = inp->inp_next) {
4115994Swnj 		if (inp->inp_lport != lport)
4125161Swnj 			continue;
4135994Swnj 		wildcard = 0;
41410141Ssam 		if (inp->inp_laddr.s_addr != INADDR_ANY) {
41510141Ssam 			if (laddr.s_addr == INADDR_ANY)
4166116Swnj 				wildcard++;
4176116Swnj 			else if (inp->inp_laddr.s_addr != laddr.s_addr)
4185994Swnj 				continue;
4195994Swnj 		} else {
42010141Ssam 			if (laddr.s_addr != INADDR_ANY)
4215994Swnj 				wildcard++;
4225994Swnj 		}
42310141Ssam 		if (inp->inp_faddr.s_addr != INADDR_ANY) {
42410141Ssam 			if (faddr.s_addr == INADDR_ANY)
4256116Swnj 				wildcard++;
4266116Swnj 			else if (inp->inp_faddr.s_addr != faddr.s_addr ||
4276028Sroot 			    inp->inp_fport != fport)
4285994Swnj 				continue;
4295994Swnj 		} else {
43010141Ssam 			if (faddr.s_addr != INADDR_ANY)
4315994Swnj 				wildcard++;
4325994Swnj 		}
4336028Sroot 		if (wildcard && (flags & INPLOOKUP_WILDCARD) == 0)
4345994Swnj 			continue;
4355994Swnj 		if (wildcard < matchwild) {
4365161Swnj 			match = inp;
4375994Swnj 			matchwild = wildcard;
4385994Swnj 			if (matchwild == 0)
4395994Swnj 				break;
4405161Swnj 		}
4415161Swnj 	}
4425161Swnj 	return (match);
4434905Swnj }
444