/*
 * Copyright (c) 1982, 1986, 1991, 1993, 1995
 *	The Regents of the University of California.  All rights reserved.
 *
 * %sccs.include.redist.c%
 *
 *	@(#)in_pcb.c	8.4 (Berkeley) 05/24/95
 */
94905Swnj
1056531Sbostic #include <sys/param.h>
1156531Sbostic #include <sys/systm.h>
1256531Sbostic #include <sys/malloc.h>
1356531Sbostic #include <sys/mbuf.h>
1456531Sbostic #include <sys/protosw.h>
1556531Sbostic #include <sys/socket.h>
1656531Sbostic #include <sys/socketvar.h>
1756531Sbostic #include <sys/ioctl.h>
1856531Sbostic #include <sys/errno.h>
1960847Skarels #include <sys/time.h>
2060847Skarels #include <sys/proc.h>
2148464Skarels
2256531Sbostic #include <net/if.h>
2356531Sbostic #include <net/route.h>
2448464Skarels
2556531Sbostic #include <netinet/in.h>
2656531Sbostic #include <netinet/in_systm.h>
2756531Sbostic #include <netinet/ip.h>
2856531Sbostic #include <netinet/in_pcb.h>
2956531Sbostic #include <netinet/in_var.h>
3056531Sbostic #include <netinet/ip_var.h>
3154716Ssklower
325240Sroot struct in_addr zeroin_addr;
335161Swnj
3461313Sbostic int
in_pcballoc(so,head)357506Sroot in_pcballoc(so, head)
367506Sroot struct socket *so;
377506Sroot struct inpcb *head;
387506Sroot {
397506Sroot register struct inpcb *inp;
407506Sroot
41*69639Skarels MALLOC(inp, struct inpcb *, sizeof(*inp), M_PCB, M_NOWAIT);
4254716Ssklower if (inp == NULL)
437506Sroot return (ENOBUFS);
4454716Ssklower bzero((caddr_t)inp, sizeof(*inp));
457506Sroot inp->inp_head = head;
467506Sroot inp->inp_socket = so;
477506Sroot insque(inp, head);
487506Sroot so->so_pcb = (caddr_t)inp;
497506Sroot return (0);
507506Sroot }
5161313Sbostic
5261313Sbostic int
in_pcbbind(inp,nam)538270Sroot in_pcbbind(inp, nam)
547506Sroot register struct inpcb *inp;
558270Sroot struct mbuf *nam;
567506Sroot {
577506Sroot register struct socket *so = inp->inp_socket;
587506Sroot register struct inpcb *head = inp->inp_head;
598270Sroot register struct sockaddr_in *sin;
6060847Skarels struct proc *p = curproc; /* XXX */
617506Sroot u_short lport = 0;
6260847Skarels int wild = 0, reuseport = (so->so_options & SO_REUSEPORT);
6360847Skarels int error;
647506Sroot
6518374Skarels if (in_ifaddr == 0)
667506Sroot return (EADDRNOTAVAIL);
6710141Ssam if (inp->inp_lport || inp->inp_laddr.s_addr != INADDR_ANY)
688270Sroot return (EINVAL);
6960847Skarels if ((so->so_options & (SO_REUSEADDR|SO_REUSEPORT)) == 0 &&
7058373Smckusick ((so->so_proto->pr_flags & PR_CONNREQUIRED) == 0 ||
7158373Smckusick (so->so_options & SO_ACCEPTCONN) == 0))
7258373Smckusick wild = INPLOOKUP_WILDCARD;
7360847Skarels if (nam) {
7460847Skarels sin = mtod(nam, struct sockaddr_in *);
7560847Skarels if (nam->m_len != sizeof (*sin))
7660847Skarels return (EINVAL);
7760847Skarels #ifdef notdef
7860847Skarels /*
7960847Skarels * We should check the family, but old programs
8060847Skarels * incorrectly fail to initialize it.
8160847Skarels */
8260847Skarels if (sin->sin_family != AF_INET)
8360847Skarels return (EAFNOSUPPORT);
8460847Skarels #endif
8560847Skarels lport = sin->sin_port;
8660847Skarels if (IN_MULTICAST(ntohl(sin->sin_addr.s_addr))) {
8760847Skarels /*
8860847Skarels * Treat SO_REUSEADDR as SO_REUSEPORT for multicast;
8960847Skarels * allow complete duplication of binding if
9060847Skarels * SO_REUSEPORT is set, or if SO_REUSEADDR is set
9160847Skarels * and a multicast address is bound on both
9260847Skarels * new and duplicated sockets.
9360847Skarels */
9460847Skarels if (so->so_options & SO_REUSEADDR)
9560847Skarels reuseport = SO_REUSEADDR|SO_REUSEPORT;
9660847Skarels } else if (sin->sin_addr.s_addr != INADDR_ANY) {
9760847Skarels sin->sin_port = 0; /* yech... */
9860847Skarels if (ifa_ifwithaddr((struct sockaddr *)sin) == 0)
9960847Skarels return (EADDRNOTAVAIL);
10060847Skarels }
10160847Skarels if (lport) {
10260847Skarels struct inpcb *t;
1037506Sroot
10460847Skarels /* GROSS */
10560847Skarels if (ntohs(lport) < IPPORT_RESERVED &&
10660847Skarels (error = suser(p->p_ucred, &p->p_acflag)))
10767884Smckusick return (EACCES);
10860847Skarels t = in_pcblookup(head, zeroin_addr, 0,
10960847Skarels sin->sin_addr, lport, wild);
11060847Skarels if (t && (reuseport & t->inp_socket->so_options) == 0)
11160847Skarels return (EADDRINUSE);
11260847Skarels }
11360847Skarels inp->inp_laddr = sin->sin_addr;
1147506Sroot }
1155172Swnj if (lport == 0)
1165172Swnj do {
11726025Skarels if (head->inp_lport++ < IPPORT_RESERVED ||
11826025Skarels head->inp_lport > IPPORT_USERRESERVED)
1195994Swnj head->inp_lport = IPPORT_RESERVED;
1205172Swnj lport = htons(head->inp_lport);
1215994Swnj } while (in_pcblookup(head,
12258373Smckusick zeroin_addr, 0, inp->inp_laddr, lport, wild));
1235172Swnj inp->inp_lport = lport;
1244951Swnj return (0);
1254905Swnj }
1264905Swnj
1276116Swnj /*
1286116Swnj * Connect from a socket to a specified address.
1296116Swnj * Both address and port must be specified in argument sin.
1306116Swnj * If don't have a local address for this socket yet,
1316116Swnj * then pick one.
1326116Swnj */
13361313Sbostic int
in_pcbconnect(inp,nam)1348270Sroot in_pcbconnect(inp, nam)
13531976Skarels register struct inpcb *inp;
1368270Sroot struct mbuf *nam;
1374923Swnj {
13818374Skarels struct in_ifaddr *ia;
1396338Ssam struct sockaddr_in *ifaddr;
1408270Sroot register struct sockaddr_in *sin = mtod(nam, struct sockaddr_in *);
1414923Swnj
1428270Sroot if (nam->m_len != sizeof (*sin))
1438270Sroot return (EINVAL);
1444951Swnj if (sin->sin_family != AF_INET)
1454951Swnj return (EAFNOSUPPORT);
14618374Skarels if (sin->sin_port == 0)
1474951Swnj return (EADDRNOTAVAIL);
14818374Skarels if (in_ifaddr) {
14918655Skarels /*
15018655Skarels * If the destination address is INADDR_ANY,
15118655Skarels * use the primary local address.
15218655Skarels * If the supplied address is INADDR_BROADCAST,
15318655Skarels * and the primary interface supports broadcast,
15418655Skarels * choose the broadcast address for that interface.
15518655Skarels */
15618374Skarels #define satosin(sa) ((struct sockaddr_in *)(sa))
15758998Ssklower #define sintosa(sin) ((struct sockaddr *)(sin))
15858998Ssklower #define ifatoia(ifa) ((struct in_ifaddr *)(ifa))
15918374Skarels if (sin->sin_addr.s_addr == INADDR_ANY)
16018655Skarels sin->sin_addr = IA_SIN(in_ifaddr)->sin_addr;
16124807Skarels else if (sin->sin_addr.s_addr == (u_long)INADDR_BROADCAST &&
16218655Skarels (in_ifaddr->ia_ifp->if_flags & IFF_BROADCAST))
16318655Skarels sin->sin_addr = satosin(&in_ifaddr->ia_broadaddr)->sin_addr;
16418374Skarels }
16510141Ssam if (inp->inp_laddr.s_addr == INADDR_ANY) {
16627262Skarels register struct route *ro;
16717271Skarels
16827262Skarels ia = (struct in_ifaddr *)0;
16927262Skarels /*
17027262Skarels * If route is known or can be allocated now,
17127262Skarels * our src addr is taken from the i/f, else punt.
17227262Skarels */
17327262Skarels ro = &inp->inp_route;
17427262Skarels if (ro->ro_rt &&
17530336Skarels (satosin(&ro->ro_dst)->sin_addr.s_addr !=
17630336Skarels sin->sin_addr.s_addr ||
17730336Skarels inp->inp_socket->so_options & SO_DONTROUTE)) {
17827262Skarels RTFREE(ro->ro_rt);
17927262Skarels ro->ro_rt = (struct rtentry *)0;
1806338Ssam }
18128847Skarels if ((inp->inp_socket->so_options & SO_DONTROUTE) == 0 && /*XXX*/
18228847Skarels (ro->ro_rt == (struct rtentry *)0 ||
18329826Skarels ro->ro_rt->rt_ifp == (struct ifnet *)0)) {
18427262Skarels /* No route yet, so try to acquire one */
18527262Skarels ro->ro_dst.sa_family = AF_INET;
18637471Ssklower ro->ro_dst.sa_len = sizeof(struct sockaddr_in);
18727262Skarels ((struct sockaddr_in *) &ro->ro_dst)->sin_addr =
18827262Skarels sin->sin_addr;
18927262Skarels rtalloc(ro);
19027262Skarels }
19129826Skarels /*
19229826Skarels * If we found a route, use the address
19329826Skarels * corresponding to the outgoing interface
19429826Skarels * unless it is the loopback (in case a route
19529826Skarels * to our address on another net goes to loopback).
19629826Skarels */
19758998Ssklower if (ro->ro_rt && !(ro->ro_rt->rt_ifp->if_flags & IFF_LOOPBACK))
19858998Ssklower ia = ifatoia(ro->ro_rt->rt_ifa);
19928847Skarels if (ia == 0) {
20061313Sbostic u_short fport = sin->sin_port;
20130336Skarels
20230336Skarels sin->sin_port = 0;
20358998Ssklower ia = ifatoia(ifa_ifwithdstaddr(sintosa(sin)));
20458998Ssklower if (ia == 0)
20558998Ssklower ia = ifatoia(ifa_ifwithnet(sintosa(sin)));
20630336Skarels sin->sin_port = fport;
20728847Skarels if (ia == 0)
20828847Skarels ia = in_ifaddr;
20928847Skarels if (ia == 0)
21028847Skarels return (EADDRNOTAVAIL);
21127262Skarels }
21254716Ssklower /*
21354716Ssklower * If the destination address is multicast and an outgoing
21454716Ssklower * interface has been set as a multicast option, use the
21554716Ssklower * address of that interface as our source address.
21654716Ssklower */
21754716Ssklower if (IN_MULTICAST(ntohl(sin->sin_addr.s_addr)) &&
21854716Ssklower inp->inp_moptions != NULL) {
21954716Ssklower struct ip_moptions *imo;
22058998Ssklower struct ifnet *ifp;
22154716Ssklower
22254716Ssklower imo = inp->inp_moptions;
22354716Ssklower if (imo->imo_multicast_ifp != NULL) {
22454716Ssklower ifp = imo->imo_multicast_ifp;
22554716Ssklower for (ia = in_ifaddr; ia; ia = ia->ia_next)
22654716Ssklower if (ia->ia_ifp == ifp)
22754716Ssklower break;
22854716Ssklower if (ia == 0)
22954716Ssklower return (EADDRNOTAVAIL);
23054716Ssklower }
23154716Ssklower }
23218374Skarels ifaddr = (struct sockaddr_in *)&ia->ia_addr;
2335994Swnj }
2345994Swnj if (in_pcblookup(inp->inp_head,
2356116Swnj sin->sin_addr,
2366116Swnj sin->sin_port,
2376338Ssam inp->inp_laddr.s_addr ? inp->inp_laddr : ifaddr->sin_addr,
2386116Swnj inp->inp_lport,
2396116Swnj 0))
2405172Swnj return (EADDRINUSE);
24114146Ssam if (inp->inp_laddr.s_addr == INADDR_ANY) {
24214146Ssam if (inp->inp_lport == 0)
24326382Skarels (void)in_pcbbind(inp, (struct mbuf *)0);
2446338Ssam inp->inp_laddr = ifaddr->sin_addr;
24514146Ssam }
2464951Swnj inp->inp_faddr = sin->sin_addr;
2474951Swnj inp->inp_fport = sin->sin_port;
2484923Swnj return (0);
2494923Swnj }
2504923Swnj
25161313Sbostic int
in_pcbdisconnect(inp)2525161Swnj in_pcbdisconnect(inp)
2534905Swnj struct inpcb *inp;
2544905Swnj {
2555161Swnj
25610141Ssam inp->inp_faddr.s_addr = INADDR_ANY;
2576028Sroot inp->inp_fport = 0;
2587506Sroot if (inp->inp_socket->so_state & SS_NOFDREF)
2595161Swnj in_pcbdetach(inp);
2605161Swnj }
2615161Swnj
26261313Sbostic int
in_pcbdetach(inp)2635161Swnj in_pcbdetach(inp)
2645161Swnj struct inpcb *inp;
2655161Swnj {
2664905Swnj struct socket *so = inp->inp_socket;
2674905Swnj
2685009Swnj so->so_pcb = 0;
2695009Swnj sofree(so);
27024807Skarels if (inp->inp_options)
27126382Skarels (void)m_free(inp->inp_options);
2726350Ssam if (inp->inp_route.ro_rt)
2736367Ssam rtfree(inp->inp_route.ro_rt);
27454716Ssklower ip_freemoptions(inp->inp_moptions);
2754983Swnj remque(inp);
27654716Ssklower FREE(inp, M_PCB);
2774905Swnj }
2784905Swnj
27961313Sbostic int
in_setsockaddr(inp,nam)2808270Sroot in_setsockaddr(inp, nam)
2816509Ssam register struct inpcb *inp;
2828270Sroot struct mbuf *nam;
2836509Ssam {
28432071Skarels register struct sockaddr_in *sin;
2858270Sroot
2868270Sroot nam->m_len = sizeof (*sin);
2878270Sroot sin = mtod(nam, struct sockaddr_in *);
2886509Ssam bzero((caddr_t)sin, sizeof (*sin));
2896509Ssam sin->sin_family = AF_INET;
29037471Ssklower sin->sin_len = sizeof(*sin);
2916509Ssam sin->sin_port = inp->inp_lport;
2926509Ssam sin->sin_addr = inp->inp_laddr;
2936509Ssam }
2946509Ssam
29561313Sbostic int
in_setpeeraddr(inp,nam)29614123Ssam in_setpeeraddr(inp, nam)
29731976Skarels struct inpcb *inp;
29814123Ssam struct mbuf *nam;
29914123Ssam {
30032071Skarels register struct sockaddr_in *sin;
30114123Ssam
30214123Ssam nam->m_len = sizeof (*sin);
30314123Ssam sin = mtod(nam, struct sockaddr_in *);
30414123Ssam bzero((caddr_t)sin, sizeof (*sin));
30514123Ssam sin->sin_family = AF_INET;
30637471Ssklower sin->sin_len = sizeof(*sin);
30714123Ssam sin->sin_port = inp->inp_fport;
30814123Ssam sin->sin_addr = inp->inp_faddr;
30914123Ssam }
31014123Ssam
3115161Swnj /*
31217357Skarels * Pass some notification to all connections of a protocol
31340692Skarels * associated with address dst. The local address and/or port numbers
31440692Skarels * may be specified to limit the search. The "usual action" will be
31540692Skarels * taken, depending on the ctlinput cmd. The caller must filter any
31640692Skarels * cmds that are uninteresting (e.g., no error in the map).
31740692Skarels * Call the protocol specific routine (if any) to report
31840692Skarels * any errors for each matching socket.
31940692Skarels *
32040692Skarels * Must be called at splnet.
3216583Ssam */
32261313Sbostic int
in_pcbnotify(head,dst,fport_arg,laddr,lport_arg,cmd,notify)32361313Sbostic in_pcbnotify(head, dst, fport_arg, laddr, lport_arg, cmd, notify)
3246583Ssam struct inpcb *head;
32540692Skarels struct sockaddr *dst;
32661313Sbostic u_int fport_arg, lport_arg;
32740692Skarels struct in_addr laddr;
32861313Sbostic int cmd;
32961313Sbostic void (*notify) __P((struct inpcb *, int));
3306583Ssam {
33161313Sbostic extern u_char inetctlerrmap[];
3326583Ssam register struct inpcb *inp, *oinp;
33340692Skarels struct in_addr faddr;
33461313Sbostic u_short fport = fport_arg, lport = lport_arg;
33540692Skarels int errno;
3366583Ssam
33740692Skarels if ((unsigned)cmd > PRC_NCMDS || dst->sa_family != AF_INET)
33840692Skarels return;
33940692Skarels faddr = ((struct sockaddr_in *)dst)->sin_addr;
34040692Skarels if (faddr.s_addr == INADDR_ANY)
34140692Skarels return;
34240692Skarels
34340692Skarels /*
34440692Skarels * Redirects go to all references to the destination,
34540692Skarels * and use in_rtchange to invalidate the route cache.
34640692Skarels * Dead host indications: notify all references to the destination.
34740692Skarels * Otherwise, if we have knowledge of the local port and address,
34840692Skarels * deliver only to that socket.
34940692Skarels */
35040692Skarels if (PRC_IS_REDIRECT(cmd) || cmd == PRC_HOSTDEAD) {
35140692Skarels fport = 0;
35240692Skarels lport = 0;
35340692Skarels laddr.s_addr = 0;
35440692Skarels if (cmd != PRC_HOSTDEAD)
35540692Skarels notify = in_rtchange;
35640692Skarels }
35740692Skarels errno = inetctlerrmap[cmd];
3586583Ssam for (inp = head->inp_next; inp != head;) {
35940692Skarels if (inp->inp_faddr.s_addr != faddr.s_addr ||
36040692Skarels inp->inp_socket == 0 ||
36140692Skarels (lport && inp->inp_lport != lport) ||
36240692Skarels (laddr.s_addr && inp->inp_laddr.s_addr != laddr.s_addr) ||
36340692Skarels (fport && inp->inp_fport != fport)) {
3646583Ssam inp = inp->inp_next;
3656583Ssam continue;
3666583Ssam }
3676583Ssam oinp = inp;
3686583Ssam inp = inp->inp_next;
36924807Skarels if (notify)
37044381Skarels (*notify)(oinp, errno);
3716583Ssam }
3726583Ssam }
3736583Ssam
37417357Skarels /*
37525508Skarels * Check for alternatives when higher level complains
37625508Skarels * about service problems. For now, invalidate cached
37725508Skarels * routing information. If the route was created dynamically
37825508Skarels * (by a redirect), time to try a default gateway again.
37925508Skarels */
38061313Sbostic int
in_losing(inp)38125508Skarels in_losing(inp)
38225508Skarels struct inpcb *inp;
38325508Skarels {
38425508Skarels register struct rtentry *rt;
38552555Ssklower struct rt_addrinfo info;
38625508Skarels
38725508Skarels if ((rt = inp->inp_route.ro_rt)) {
38855543Ssklower inp->inp_route.ro_rt = 0;
38952555Ssklower bzero((caddr_t)&info, sizeof(info));
39052555Ssklower info.rti_info[RTAX_DST] =
39152555Ssklower (struct sockaddr *)&inp->inp_route.ro_dst;
39252555Ssklower info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
39352555Ssklower info.rti_info[RTAX_NETMASK] = rt_mask(rt);
39452555Ssklower rt_missmsg(RTM_LOSING, &info, rt->rt_flags, 0);
39525508Skarels if (rt->rt_flags & RTF_DYNAMIC)
39637471Ssklower (void) rtrequest(RTM_DELETE, rt_key(rt),
39737471Ssklower rt->rt_gateway, rt_mask(rt), rt->rt_flags,
39837471Ssklower (struct rtentry **)0);
39955543Ssklower else
40025508Skarels /*
40125508Skarels * A new route can be allocated
40225508Skarels * the next time output is attempted.
40325508Skarels */
40455543Ssklower rtfree(rt);
40525508Skarels }
40625508Skarels }
40725508Skarels
40825508Skarels /*
40917357Skarels * After a routing change, flush old routing
41017357Skarels * and allocate a (hopefully) better one.
41117357Skarels */
41261313Sbostic void
in_rtchange(inp,errno)41361313Sbostic in_rtchange(inp, errno)
41425508Skarels register struct inpcb *inp;
41561313Sbostic int errno;
41617357Skarels {
41717357Skarels if (inp->inp_route.ro_rt) {
41817357Skarels rtfree(inp->inp_route.ro_rt);
41917357Skarels inp->inp_route.ro_rt = 0;
42017357Skarels /*
42117357Skarels * A new route can be allocated the next time
42217357Skarels * output is attempted.
42317357Skarels */
42417357Skarels }
42517357Skarels }
42617357Skarels
4274907Swnj struct inpcb *
in_pcblookup(head,faddr,fport_arg,laddr,lport_arg,flags)42861313Sbostic in_pcblookup(head, faddr, fport_arg, laddr, lport_arg, flags)
4294905Swnj struct inpcb *head;
4304951Swnj struct in_addr faddr, laddr;
43161313Sbostic u_int fport_arg, lport_arg;
4326028Sroot int flags;
4334905Swnj {
4345994Swnj register struct inpcb *inp, *match = 0;
4355994Swnj int matchwild = 3, wildcard;
43661313Sbostic u_short fport = fport_arg, lport = lport_arg;
4374905Swnj
4385161Swnj for (inp = head->inp_next; inp != head; inp = inp->inp_next) {
4395994Swnj if (inp->inp_lport != lport)
4405161Swnj continue;
4415994Swnj wildcard = 0;
44210141Ssam if (inp->inp_laddr.s_addr != INADDR_ANY) {
44310141Ssam if (laddr.s_addr == INADDR_ANY)
4446116Swnj wildcard++;
4456116Swnj else if (inp->inp_laddr.s_addr != laddr.s_addr)
4465994Swnj continue;
4475994Swnj } else {
44810141Ssam if (laddr.s_addr != INADDR_ANY)
4495994Swnj wildcard++;
4505994Swnj }
45110141Ssam if (inp->inp_faddr.s_addr != INADDR_ANY) {
45210141Ssam if (faddr.s_addr == INADDR_ANY)
4536116Swnj wildcard++;
4546116Swnj else if (inp->inp_faddr.s_addr != faddr.s_addr ||
4556028Sroot inp->inp_fport != fport)
4565994Swnj continue;
4575994Swnj } else {
45810141Ssam if (faddr.s_addr != INADDR_ANY)
4595994Swnj wildcard++;
4605994Swnj }
4616028Sroot if (wildcard && (flags & INPLOOKUP_WILDCARD) == 0)
4625994Swnj continue;
4635994Swnj if (wildcard < matchwild) {
4645161Swnj match = inp;
4655994Swnj matchwild = wildcard;
4665994Swnj if (matchwild == 0)
4675994Swnj break;
4685161Swnj }
4695161Swnj }
4705161Swnj return (match);
4714905Swnj }
472