xref: /csrg-svn/sys/netinet/in_pcb.c (revision 55543)
123177Smckusick /*
248464Skarels  * Copyright (c) 1982, 1986, 1991 Regents of the University of California.
332787Sbostic  * All rights reserved.
423177Smckusick  *
544475Sbostic  * %sccs.include.redist.c%
632787Sbostic  *
7*55543Ssklower  *	@(#)in_pcb.c	7.22 (Berkeley) 07/22/92
823177Smckusick  */
94905Swnj 
1017058Sbloom #include "param.h"
1117058Sbloom #include "systm.h"
1235794Skarels #include "malloc.h"
1317058Sbloom #include "mbuf.h"
1448464Skarels #include "protosw.h"
1517058Sbloom #include "socket.h"
1617058Sbloom #include "socketvar.h"
1725508Skarels #include "ioctl.h"
1851270Ssklower #include "errno.h"
1948464Skarels 
2040692Skarels #include "../net/if.h"
2140692Skarels #include "../net/route.h"
2248464Skarels 
2317058Sbloom #include "in.h"
2417058Sbloom #include "in_systm.h"
2540692Skarels #include "ip.h"
2617058Sbloom #include "in_pcb.h"
2718374Skarels #include "in_var.h"
284905Swnj 
2954716Ssklower #ifdef MULTICAST
3054716Ssklower #include "ip_var.h"
3154716Ssklower #endif
3254716Ssklower 
/*
 * File-scope Internet address with no initializer.  It is passed to
 * in_pcblookup() as the foreign address by in_pcbbind(), together with a
 * foreign port of 0, when only the local address/port are being matched.
 */
335240Sroot struct	in_addr zeroin_addr;
345161Swnj 
357506Sroot in_pcballoc(so, head)
367506Sroot 	struct socket *so;
377506Sroot 	struct inpcb *head;
387506Sroot {
397506Sroot 	struct mbuf *m;
407506Sroot 	register struct inpcb *inp;
417506Sroot 
4254716Ssklower 	MALLOC(inp, struct inpcb *, sizeof(*inp), M_PCB, M_WAITOK);
4354716Ssklower 	if (inp == NULL)
447506Sroot 		return (ENOBUFS);
4554716Ssklower 	bzero((caddr_t)inp, sizeof(*inp));
467506Sroot 	inp->inp_head = head;
477506Sroot 	inp->inp_socket = so;
487506Sroot 	insque(inp, head);
497506Sroot 	so->so_pcb = (caddr_t)inp;
507506Sroot 	return (0);
517506Sroot }
527506Sroot 
538270Sroot in_pcbbind(inp, nam)
547506Sroot 	register struct inpcb *inp;
558270Sroot 	struct mbuf *nam;
567506Sroot {
577506Sroot 	register struct socket *so = inp->inp_socket;
587506Sroot 	register struct inpcb *head = inp->inp_head;
598270Sroot 	register struct sockaddr_in *sin;
607506Sroot 	u_short lport = 0;
617506Sroot 
6218374Skarels 	if (in_ifaddr == 0)
637506Sroot 		return (EADDRNOTAVAIL);
6410141Ssam 	if (inp->inp_lport || inp->inp_laddr.s_addr != INADDR_ANY)
658270Sroot 		return (EINVAL);
668270Sroot 	if (nam == 0)
678270Sroot 		goto noname;
688270Sroot 	sin = mtod(nam, struct sockaddr_in *);
698270Sroot 	if (nam->m_len != sizeof (*sin))
708270Sroot 		return (EINVAL);
7110141Ssam 	if (sin->sin_addr.s_addr != INADDR_ANY) {
728270Sroot 		int tport = sin->sin_port;
737506Sroot 
748270Sroot 		sin->sin_port = 0;		/* yech... */
7518374Skarels 		if (ifa_ifwithaddr((struct sockaddr *)sin) == 0)
768270Sroot 			return (EADDRNOTAVAIL);
778270Sroot 		sin->sin_port = tport;
787506Sroot 	}
798270Sroot 	lport = sin->sin_port;
808270Sroot 	if (lport) {
8155347Ssklower 		struct inpcb *t;
8217429Skarels 		u_short aport = ntohs(lport);
838270Sroot 		int wild = 0;
847506Sroot 
858270Sroot 		/* GROSS */
8648464Skarels 		if (aport < IPPORT_RESERVED && (so->so_state & SS_PRIV) == 0)
878270Sroot 			return (EACCES);
8810598Ssam 		/* even GROSSER, but this is the Internet */
8910598Ssam 		if ((so->so_options & SO_REUSEADDR) == 0 &&
9010598Ssam 		    ((so->so_proto->pr_flags & PR_CONNREQUIRED) == 0 ||
9110598Ssam 		     (so->so_options & SO_ACCEPTCONN) == 0))
928270Sroot 			wild = INPLOOKUP_WILDCARD;
9355347Ssklower 		t = in_pcblookup(head, zeroin_addr, 0,
9455352Ssklower 				sin->sin_addr, lport, wild);
9555347Ssklower 		if (t && !((so->so_options & t->inp_socket->so_options) &
9655347Ssklower 		    SO_REUSEPORT))
978270Sroot 			return (EADDRINUSE);
984951Swnj 	}
998270Sroot 	inp->inp_laddr = sin->sin_addr;
1008270Sroot noname:
1015172Swnj 	if (lport == 0)
1025172Swnj 		do {
10326025Skarels 			if (head->inp_lport++ < IPPORT_RESERVED ||
10426025Skarels 			    head->inp_lport > IPPORT_USERRESERVED)
1055994Swnj 				head->inp_lport = IPPORT_RESERVED;
1065172Swnj 			lport = htons(head->inp_lport);
1075994Swnj 		} while (in_pcblookup(head,
1085994Swnj 			    zeroin_addr, 0, inp->inp_laddr, lport, 0));
1095172Swnj 	inp->inp_lport = lport;
1104951Swnj 	return (0);
1114905Swnj }
1124905Swnj 
1136116Swnj /*
1146116Swnj  * Connect from a socket to a specified address.
1156116Swnj  * Both address and port must be specified in argument sin.
1166116Swnj  * If don't have a local address for this socket yet,
1176116Swnj  * then pick one.
1186116Swnj  */
1198270Sroot in_pcbconnect(inp, nam)
12031976Skarels 	register struct inpcb *inp;
1218270Sroot 	struct mbuf *nam;
1224923Swnj {
12318374Skarels 	struct in_ifaddr *ia;
1246338Ssam 	struct sockaddr_in *ifaddr;
1258270Sroot 	register struct sockaddr_in *sin = mtod(nam, struct sockaddr_in *);
1264923Swnj 
1278270Sroot 	if (nam->m_len != sizeof (*sin))
1288270Sroot 		return (EINVAL);
1294951Swnj 	if (sin->sin_family != AF_INET)
1304951Swnj 		return (EAFNOSUPPORT);
13118374Skarels 	if (sin->sin_port == 0)
1324951Swnj 		return (EADDRNOTAVAIL);
13318374Skarels 	if (in_ifaddr) {
13418655Skarels 		/*
13518655Skarels 		 * If the destination address is INADDR_ANY,
13618655Skarels 		 * use the primary local address.
13718655Skarels 		 * If the supplied address is INADDR_BROADCAST,
13818655Skarels 		 * and the primary interface supports broadcast,
13918655Skarels 		 * choose the broadcast address for that interface.
14018655Skarels 		 */
14118374Skarels #define	satosin(sa)	((struct sockaddr_in *)(sa))
14218374Skarels 		if (sin->sin_addr.s_addr == INADDR_ANY)
14318655Skarels 		    sin->sin_addr = IA_SIN(in_ifaddr)->sin_addr;
14424807Skarels 		else if (sin->sin_addr.s_addr == (u_long)INADDR_BROADCAST &&
14518655Skarels 		  (in_ifaddr->ia_ifp->if_flags & IFF_BROADCAST))
14618655Skarels 		    sin->sin_addr = satosin(&in_ifaddr->ia_broadaddr)->sin_addr;
14718374Skarels 	}
14810141Ssam 	if (inp->inp_laddr.s_addr == INADDR_ANY) {
14927262Skarels 		register struct route *ro;
15027262Skarels 		struct ifnet *ifp;
15117271Skarels 
15227262Skarels 		ia = (struct in_ifaddr *)0;
15327262Skarels 		/*
15427262Skarels 		 * If route is known or can be allocated now,
15527262Skarels 		 * our src addr is taken from the i/f, else punt.
15627262Skarels 		 */
15727262Skarels 		ro = &inp->inp_route;
15827262Skarels 		if (ro->ro_rt &&
15930336Skarels 		    (satosin(&ro->ro_dst)->sin_addr.s_addr !=
16030336Skarels 			sin->sin_addr.s_addr ||
16130336Skarels 		    inp->inp_socket->so_options & SO_DONTROUTE)) {
16227262Skarels 			RTFREE(ro->ro_rt);
16327262Skarels 			ro->ro_rt = (struct rtentry *)0;
1646338Ssam 		}
16528847Skarels 		if ((inp->inp_socket->so_options & SO_DONTROUTE) == 0 && /*XXX*/
16628847Skarels 		    (ro->ro_rt == (struct rtentry *)0 ||
16729826Skarels 		    ro->ro_rt->rt_ifp == (struct ifnet *)0)) {
16827262Skarels 			/* No route yet, so try to acquire one */
16927262Skarels 			ro->ro_dst.sa_family = AF_INET;
17037471Ssklower 			ro->ro_dst.sa_len = sizeof(struct sockaddr_in);
17127262Skarels 			((struct sockaddr_in *) &ro->ro_dst)->sin_addr =
17227262Skarels 				sin->sin_addr;
17327262Skarels 			rtalloc(ro);
17427262Skarels 		}
17529826Skarels 		/*
17629826Skarels 		 * If we found a route, use the address
17729826Skarels 		 * corresponding to the outgoing interface
17829826Skarels 		 * unless it is the loopback (in case a route
17929826Skarels 		 * to our address on another net goes to loopback).
18029826Skarels 		 */
18129826Skarels 		if (ro->ro_rt && (ifp = ro->ro_rt->rt_ifp) &&
18253042Ssklower 		    (ifp->if_flags & IFF_LOOPBACK) == 0 &&
18353042Ssklower 		    (ia = (struct in_ifaddr *)ro->ro_rt->rt_ifa) == 0)
18429826Skarels 			for (ia = in_ifaddr; ia; ia = ia->ia_next)
18529826Skarels 				if (ia->ia_ifp == ifp)
18629826Skarels 					break;
18728847Skarels 		if (ia == 0) {
18830336Skarels 			int fport = sin->sin_port;
18930336Skarels 
19030336Skarels 			sin->sin_port = 0;
19128847Skarels 			ia = (struct in_ifaddr *)
19228847Skarels 			    ifa_ifwithdstaddr((struct sockaddr *)sin);
19330336Skarels 			sin->sin_port = fport;
19428847Skarels 			if (ia == 0)
19528847Skarels 				ia = in_iaonnetof(in_netof(sin->sin_addr));
19628847Skarels 			if (ia == 0)
19728847Skarels 				ia = in_ifaddr;
19828847Skarels 			if (ia == 0)
19928847Skarels 				return (EADDRNOTAVAIL);
20027262Skarels 		}
20154716Ssklower #ifdef MULTICAST
20254716Ssklower 		/*
20354716Ssklower 		 * If the destination address is multicast and an outgoing
20454716Ssklower 		 * interface has been set as a multicast option, use the
20554716Ssklower 		 * address of that interface as our source address.
20654716Ssklower 		 */
20754716Ssklower 		if (IN_MULTICAST(ntohl(sin->sin_addr.s_addr)) &&
20854716Ssklower 		    inp->inp_moptions != NULL) {
20954716Ssklower 			struct ip_moptions *imo;
21054716Ssklower 
21154716Ssklower 			imo = inp->inp_moptions;
21254716Ssklower 			if (imo->imo_multicast_ifp != NULL) {
21354716Ssklower 				ifp = imo->imo_multicast_ifp;
21454716Ssklower 				for (ia = in_ifaddr; ia; ia = ia->ia_next)
21554716Ssklower 					if (ia->ia_ifp == ifp)
21654716Ssklower 						break;
21754716Ssklower 				if (ia == 0)
21854716Ssklower 					return (EADDRNOTAVAIL);
21954716Ssklower 			}
22054716Ssklower 		}
22154716Ssklower #endif
22218374Skarels 		ifaddr = (struct sockaddr_in *)&ia->ia_addr;
2235994Swnj 	}
2245994Swnj 	if (in_pcblookup(inp->inp_head,
2256116Swnj 	    sin->sin_addr,
2266116Swnj 	    sin->sin_port,
2276338Ssam 	    inp->inp_laddr.s_addr ? inp->inp_laddr : ifaddr->sin_addr,
2286116Swnj 	    inp->inp_lport,
2296116Swnj 	    0))
2305172Swnj 		return (EADDRINUSE);
23114146Ssam 	if (inp->inp_laddr.s_addr == INADDR_ANY) {
23214146Ssam 		if (inp->inp_lport == 0)
23326382Skarels 			(void)in_pcbbind(inp, (struct mbuf *)0);
2346338Ssam 		inp->inp_laddr = ifaddr->sin_addr;
23514146Ssam 	}
2364951Swnj 	inp->inp_faddr = sin->sin_addr;
2374951Swnj 	inp->inp_fport = sin->sin_port;
2384923Swnj 	return (0);
2394923Swnj }
2404923Swnj 
2415161Swnj in_pcbdisconnect(inp)
2424905Swnj 	struct inpcb *inp;
2434905Swnj {
2445161Swnj 
24510141Ssam 	inp->inp_faddr.s_addr = INADDR_ANY;
2466028Sroot 	inp->inp_fport = 0;
2477506Sroot 	if (inp->inp_socket->so_state & SS_NOFDREF)
2485161Swnj 		in_pcbdetach(inp);
2495161Swnj }
2505161Swnj 
2515161Swnj in_pcbdetach(inp)
2525161Swnj 	struct inpcb *inp;
2535161Swnj {
2544905Swnj 	struct socket *so = inp->inp_socket;
2554905Swnj 
2565009Swnj 	so->so_pcb = 0;
2575009Swnj 	sofree(so);
25824807Skarels 	if (inp->inp_options)
25926382Skarels 		(void)m_free(inp->inp_options);
2606350Ssam 	if (inp->inp_route.ro_rt)
2616367Ssam 		rtfree(inp->inp_route.ro_rt);
26254716Ssklower #ifdef MULTICAST
26354716Ssklower 	ip_freemoptions(inp->inp_moptions);
26454716Ssklower #endif
2654983Swnj 	remque(inp);
26654716Ssklower 	FREE(inp, M_PCB);
2674905Swnj }
2684905Swnj 
2698270Sroot in_setsockaddr(inp, nam)
2706509Ssam 	register struct inpcb *inp;
2718270Sroot 	struct mbuf *nam;
2726509Ssam {
27332071Skarels 	register struct sockaddr_in *sin;
2748270Sroot 
2758270Sroot 	nam->m_len = sizeof (*sin);
2768270Sroot 	sin = mtod(nam, struct sockaddr_in *);
2776509Ssam 	bzero((caddr_t)sin, sizeof (*sin));
2786509Ssam 	sin->sin_family = AF_INET;
27937471Ssklower 	sin->sin_len = sizeof(*sin);
2806509Ssam 	sin->sin_port = inp->inp_lport;
2816509Ssam 	sin->sin_addr = inp->inp_laddr;
2826509Ssam }
2836509Ssam 
28414123Ssam in_setpeeraddr(inp, nam)
28531976Skarels 	struct inpcb *inp;
28614123Ssam 	struct mbuf *nam;
28714123Ssam {
28832071Skarels 	register struct sockaddr_in *sin;
28914123Ssam 
29014123Ssam 	nam->m_len = sizeof (*sin);
29114123Ssam 	sin = mtod(nam, struct sockaddr_in *);
29214123Ssam 	bzero((caddr_t)sin, sizeof (*sin));
29314123Ssam 	sin->sin_family = AF_INET;
29437471Ssklower 	sin->sin_len = sizeof(*sin);
29514123Ssam 	sin->sin_port = inp->inp_fport;
29614123Ssam 	sin->sin_addr = inp->inp_faddr;
29714123Ssam }
29814123Ssam 
2995161Swnj /*
30017357Skarels  * Pass some notification to all connections of a protocol
30140692Skarels  * associated with address dst.  The local address and/or port numbers
30240692Skarels  * may be specified to limit the search.  The "usual action" will be
30340692Skarels  * taken, depending on the ctlinput cmd.  The caller must filter any
30440692Skarels  * cmds that are uninteresting (e.g., no error in the map).
30540692Skarels  * Call the protocol specific routine (if any) to report
30640692Skarels  * any errors for each matching socket.
30740692Skarels  *
30840692Skarels  * Must be called at splnet.
3096583Ssam  */
31040692Skarels in_pcbnotify(head, dst, fport, laddr, lport, cmd, notify)
3116583Ssam 	struct inpcb *head;
31240692Skarels 	struct sockaddr *dst;
31340692Skarels 	u_short fport, lport;
31440692Skarels 	struct in_addr laddr;
31540692Skarels 	int cmd, (*notify)();
3166583Ssam {
3176583Ssam 	register struct inpcb *inp, *oinp;
31840692Skarels 	struct in_addr faddr;
31940692Skarels 	int errno;
32040692Skarels 	int in_rtchange();
32140692Skarels 	extern u_char inetctlerrmap[];
3226583Ssam 
32340692Skarels 	if ((unsigned)cmd > PRC_NCMDS || dst->sa_family != AF_INET)
32440692Skarels 		return;
32540692Skarels 	faddr = ((struct sockaddr_in *)dst)->sin_addr;
32640692Skarels 	if (faddr.s_addr == INADDR_ANY)
32740692Skarels 		return;
32840692Skarels 
32940692Skarels 	/*
33040692Skarels 	 * Redirects go to all references to the destination,
33140692Skarels 	 * and use in_rtchange to invalidate the route cache.
33240692Skarels 	 * Dead host indications: notify all references to the destination.
33340692Skarels 	 * Otherwise, if we have knowledge of the local port and address,
33440692Skarels 	 * deliver only to that socket.
33540692Skarels 	 */
33640692Skarels 	if (PRC_IS_REDIRECT(cmd) || cmd == PRC_HOSTDEAD) {
33740692Skarels 		fport = 0;
33840692Skarels 		lport = 0;
33940692Skarels 		laddr.s_addr = 0;
34040692Skarels 		if (cmd != PRC_HOSTDEAD)
34140692Skarels 			notify = in_rtchange;
34240692Skarels 	}
34340692Skarels 	errno = inetctlerrmap[cmd];
3446583Ssam 	for (inp = head->inp_next; inp != head;) {
34540692Skarels 		if (inp->inp_faddr.s_addr != faddr.s_addr ||
34640692Skarels 		    inp->inp_socket == 0 ||
34740692Skarels 		    (lport && inp->inp_lport != lport) ||
34840692Skarels 		    (laddr.s_addr && inp->inp_laddr.s_addr != laddr.s_addr) ||
34940692Skarels 		    (fport && inp->inp_fport != fport)) {
3506583Ssam 			inp = inp->inp_next;
3516583Ssam 			continue;
3526583Ssam 		}
3536583Ssam 		oinp = inp;
3546583Ssam 		inp = inp->inp_next;
35524807Skarels 		if (notify)
35644381Skarels 			(*notify)(oinp, errno);
3576583Ssam 	}
3586583Ssam }
3596583Ssam 
36017357Skarels /*
36125508Skarels  * Check for alternatives when higher level complains
36225508Skarels  * about service problems.  For now, invalidate cached
36325508Skarels  * routing information.  If the route was created dynamically
36425508Skarels  * (by a redirect), time to try a default gateway again.
36525508Skarels  */
36625508Skarels in_losing(inp)
36725508Skarels 	struct inpcb *inp;
36825508Skarels {
36925508Skarels 	register struct rtentry *rt;
37052555Ssklower 	struct rt_addrinfo info;
37125508Skarels 
37225508Skarels 	if ((rt = inp->inp_route.ro_rt)) {
373*55543Ssklower 		inp->inp_route.ro_rt = 0;
37452555Ssklower 		bzero((caddr_t)&info, sizeof(info));
37552555Ssklower 		info.rti_info[RTAX_DST] =
37652555Ssklower 			(struct sockaddr *)&inp->inp_route.ro_dst;
37752555Ssklower 		info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
37852555Ssklower 		info.rti_info[RTAX_NETMASK] = rt_mask(rt);
37952555Ssklower 		rt_missmsg(RTM_LOSING, &info, rt->rt_flags, 0);
38025508Skarels 		if (rt->rt_flags & RTF_DYNAMIC)
38137471Ssklower 			(void) rtrequest(RTM_DELETE, rt_key(rt),
38237471Ssklower 				rt->rt_gateway, rt_mask(rt), rt->rt_flags,
38337471Ssklower 				(struct rtentry **)0);
384*55543Ssklower 		else
38525508Skarels 		/*
38625508Skarels 		 * A new route can be allocated
38725508Skarels 		 * the next time output is attempted.
38825508Skarels 		 */
389*55543Ssklower 			rtfree(rt);
39025508Skarels 	}
39125508Skarels }
39225508Skarels 
39325508Skarels /*
39417357Skarels  * After a routing change, flush old routing
39517357Skarels  * and allocate a (hopefully) better one.
39617357Skarels  */
39717357Skarels in_rtchange(inp)
39825508Skarels 	register struct inpcb *inp;
39917357Skarels {
40017357Skarels 	if (inp->inp_route.ro_rt) {
40117357Skarels 		rtfree(inp->inp_route.ro_rt);
40217357Skarels 		inp->inp_route.ro_rt = 0;
40317357Skarels 		/*
40417357Skarels 		 * A new route can be allocated the next time
40517357Skarels 		 * output is attempted.
40617357Skarels 		 */
40717357Skarels 	}
40817357Skarels }
40917357Skarels 
4104907Swnj struct inpcb *
4116028Sroot in_pcblookup(head, faddr, fport, laddr, lport, flags)
4124905Swnj 	struct inpcb *head;
4134951Swnj 	struct in_addr faddr, laddr;
4144905Swnj 	u_short fport, lport;
4156028Sroot 	int flags;
4164905Swnj {
4175994Swnj 	register struct inpcb *inp, *match = 0;
4185994Swnj 	int matchwild = 3, wildcard;
4194905Swnj 
4205161Swnj 	for (inp = head->inp_next; inp != head; inp = inp->inp_next) {
4215994Swnj 		if (inp->inp_lport != lport)
4225161Swnj 			continue;
4235994Swnj 		wildcard = 0;
42410141Ssam 		if (inp->inp_laddr.s_addr != INADDR_ANY) {
42510141Ssam 			if (laddr.s_addr == INADDR_ANY)
4266116Swnj 				wildcard++;
4276116Swnj 			else if (inp->inp_laddr.s_addr != laddr.s_addr)
4285994Swnj 				continue;
4295994Swnj 		} else {
43010141Ssam 			if (laddr.s_addr != INADDR_ANY)
4315994Swnj 				wildcard++;
4325994Swnj 		}
43310141Ssam 		if (inp->inp_faddr.s_addr != INADDR_ANY) {
43410141Ssam 			if (faddr.s_addr == INADDR_ANY)
4356116Swnj 				wildcard++;
4366116Swnj 			else if (inp->inp_faddr.s_addr != faddr.s_addr ||
4376028Sroot 			    inp->inp_fport != fport)
4385994Swnj 				continue;
4395994Swnj 		} else {
44010141Ssam 			if (faddr.s_addr != INADDR_ANY)
4415994Swnj 				wildcard++;
4425994Swnj 		}
4436028Sroot 		if (wildcard && (flags & INPLOOKUP_WILDCARD) == 0)
4445994Swnj 			continue;
4455994Swnj 		if (wildcard < matchwild) {
4465161Swnj 			match = inp;
4475994Swnj 			matchwild = wildcard;
4485994Swnj 			if (matchwild == 0)
4495994Swnj 				break;
4505161Swnj 		}
4515161Swnj 	}
4525161Swnj 	return (match);
4534905Swnj }
454