1 /* 2 * Copyright (c) 2004 Jeffrey Hsu. All rights reserved. 3 * Copyright (c) 1982, 1986, 1988, 1990, 1993, 1995 4 * The Regents of the University of California. All rights reserved. 5 * 6 * Redistribution and use in source and binary forms, with or without 7 * modification, are permitted provided that the following conditions 8 * are met: 9 * 1. Redistributions of source code must retain the above copyright 10 * notice, this list of conditions and the following disclaimer. 11 * 2. Redistributions in binary form must reproduce the above copyright 12 * notice, this list of conditions and the following disclaimer in the 13 * documentation and/or other materials provided with the distribution. 14 * 3. All advertising materials mentioning features or use of this software 15 * must display the following acknowledgement: 16 * This product includes software developed by the University of 17 * California, Berkeley and its contributors. 18 * 4. Neither the name of the University nor the names of its contributors 19 * may be used to endorse or promote products derived from this software 20 * without specific prior written permission. 21 * 22 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 23 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 24 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 25 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 26 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 27 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 28 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 29 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 30 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 31 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 32 * SUCH DAMAGE. 33 * 34 * @(#)udp_usrreq.c 8.6 (Berkeley) 5/23/95 35 * $FreeBSD: src/sys/netinet/udp_usrreq.c,v 1.64.2.18 2003/01/24 05:11:34 sam Exp $ 36 * $DragonFly: src/sys/netinet/udp_usrreq.c,v 1.17 2004/03/22 06:38:17 hsu Exp $ 37 */ 38 39 #include "opt_ipsec.h" 40 #include "opt_inet6.h" 41 42 #include <sys/param.h> 43 #include <sys/systm.h> 44 #include <sys/kernel.h> 45 #include <sys/malloc.h> 46 #include <sys/mbuf.h> 47 #include <sys/domain.h> 48 #include <sys/proc.h> 49 #include <sys/protosw.h> 50 #include <sys/socket.h> 51 #include <sys/socketvar.h> 52 #include <sys/sysctl.h> 53 #include <sys/syslog.h> 54 #include <sys/in_cksum.h> 55 56 #include <vm/vm_zone.h> 57 58 #include <net/if.h> 59 #include <net/route.h> 60 61 #include <netinet/in.h> 62 #include <netinet/in_systm.h> 63 #include <netinet/ip.h> 64 #ifdef INET6 65 #include <netinet/ip6.h> 66 #endif 67 #include <netinet/in_pcb.h> 68 #include <netinet/in_var.h> 69 #include <netinet/ip_var.h> 70 #ifdef INET6 71 #include <netinet6/ip6_var.h> 72 #endif 73 #include <netinet/ip_icmp.h> 74 #include <netinet/icmp_var.h> 75 #include <netinet/udp.h> 76 #include <netinet/udp_var.h> 77 78 #ifdef FAST_IPSEC 79 #include <netipsec/ipsec.h> 80 #endif /*FAST_IPSEC*/ 81 82 #ifdef IPSEC 83 #include <netinet6/ipsec.h> 84 #endif /*IPSEC*/ 85 86 /* 87 * UDP protocol implementation. 88 * Per RFC 768, August, 1980. 89 */ 90 #ifndef COMPAT_42 91 static int udpcksum = 1; 92 #else 93 static int udpcksum = 0; /* XXX */ 94 #endif 95 SYSCTL_INT(_net_inet_udp, UDPCTL_CHECKSUM, checksum, CTLFLAG_RW, 96 &udpcksum, 0, ""); 97 98 int log_in_vain = 0; 99 SYSCTL_INT(_net_inet_udp, OID_AUTO, log_in_vain, CTLFLAG_RW, 100 &log_in_vain, 0, "Log all incoming UDP packets"); 101 102 static int blackhole = 0; 103 SYSCTL_INT(_net_inet_udp, OID_AUTO, blackhole, CTLFLAG_RW, 104 &blackhole, 0, "Do not send port unreachables for refused connects"); 105 106 static int strict_mcast_mship = 1; 107 SYSCTL_INT(_net_inet_udp, OID_AUTO, strict_mcast_mship, CTLFLAG_RW, 108 &strict_mcast_mship, 0, "Only send multicast to member sockets"); 109 110 struct inpcbinfo udbinfo; 111 112 #ifndef UDBHASHSIZE 113 #define UDBHASHSIZE 16 114 #endif 115 116 struct udpstat udpstat; /* from udp_var.h */ 117 SYSCTL_STRUCT(_net_inet_udp, UDPCTL_STATS, stats, CTLFLAG_RW, 118 &udpstat, udpstat, "UDP statistics (struct udpstat, netinet/udp_var.h)"); 119 120 static struct sockaddr_in udp_in = { sizeof(udp_in), AF_INET }; 121 #ifdef INET6 122 struct udp_in6 { 123 struct sockaddr_in6 uin6_sin; 124 u_char uin6_init_done : 1; 125 } udp_in6 = { 126 { sizeof(udp_in6.uin6_sin), AF_INET6 }, 127 0 128 }; 129 struct udp_ip6 { 130 struct ip6_hdr uip6_ip6; 131 u_char uip6_init_done : 1; 132 } udp_ip6; 133 #endif /* INET6 */ 134 135 static void udp_append (struct inpcb *last, struct ip *ip, 136 struct mbuf *n, int off); 137 #ifdef INET6 138 static void ip_2_ip6_hdr (struct ip6_hdr *ip6, struct ip *ip); 139 #endif 140 141 static int udp_detach (struct socket *so); 142 static int udp_output (struct inpcb *, struct mbuf *, struct sockaddr *, 143 struct mbuf *, struct thread *); 144 145 void 146 udp_init() 147 { 148 LIST_INIT(&udbinfo.listhead); 149 udbinfo.hashbase = hashinit(UDBHASHSIZE, M_PCB, &udbinfo.hashmask); 150 udbinfo.porthashbase = hashinit(UDBHASHSIZE, M_PCB, 151 &udbinfo.porthashmask); 152 udbinfo.bindhashbase = hashinit(UDBHASHSIZE, M_PCB, 153 &udbinfo.bindhashmask); 154 udbinfo.ipi_zone = zinit("udpcb", sizeof(struct inpcb), maxsockets, 155 ZONE_INTERRUPT, 0); 156 udp_thread_init(); 157 } 158 159 /* 160 * Check multicast packets to make sure they are only sent to sockets with 161 * multicast memberships for the packet's destination address and arrival 162 * interface. Multicast packets to multicast-unaware sockets are also 163 * disallowed. 164 * 165 * Returns 0 if the packet is acceptable, -1 if it is not. 166 */ 167 static __inline 168 int 169 check_multicast_membership(struct ip *ip, struct inpcb *inp, struct mbuf *m) 170 { 171 int mshipno; 172 struct ip_moptions *mopt; 173 174 if (strict_mcast_mship == 0 || 175 !IN_MULTICAST(ntohl(ip->ip_dst.s_addr))) { 176 return(0); 177 } 178 mopt = inp->inp_moptions; 179 if (mopt == NULL) 180 return(-1); 181 for (mshipno = 0; mshipno <= mopt->imo_num_memberships; ++mshipno) { 182 if (ip->ip_dst.s_addr == mopt->imo_membership[mshipno]->inm_addr.s_addr && 183 m->m_pkthdr.rcvif == mopt->imo_membership[mshipno]->inm_ifp) { 184 return(0); 185 } 186 } 187 return(-1); 188 } 189 190 void 191 udp_input(m, off, proto) 192 struct mbuf *m; 193 int off, proto; 194 { 195 int iphlen = off; 196 struct ip *ip; 197 struct udphdr *uh; 198 struct inpcb *inp; 199 struct mbuf *opts = 0; 200 int len; 201 struct ip save_ip; 202 struct sockaddr *append_sa; 203 204 udpstat.udps_ipackets++; 205 206 /* 207 * Strip IP options, if any; should skip this, 208 * make available to user, and use on returned packets, 209 * but we don't yet have a way to check the checksum 210 * with options still present. 211 */ 212 if (iphlen > sizeof (struct ip)) { 213 ip_stripoptions(m); 214 iphlen = sizeof(struct ip); 215 } 216 217 /* 218 * IP and UDP headers are together in first mbuf. 219 * Already checked and pulled up in ip_demux(). 220 */ 221 KASSERT(m->m_len >= iphlen + sizeof(struct udphdr), 222 ("UDP header not in one mbuf")); 223 224 ip = mtod(m, struct ip *); 225 uh = (struct udphdr *)((caddr_t)ip + iphlen); 226 227 /* destination port of 0 is illegal, based on RFC768. */ 228 if (uh->uh_dport == 0) 229 goto bad; 230 231 /* 232 * Make mbuf data length reflect UDP length. 233 * If not enough data to reflect UDP length, drop. 234 */ 235 len = ntohs((u_short)uh->uh_ulen); 236 if (ip->ip_len != len) { 237 if (len > ip->ip_len || len < sizeof(struct udphdr)) { 238 udpstat.udps_badlen++; 239 goto bad; 240 } 241 m_adj(m, len - ip->ip_len); 242 /* ip->ip_len = len; */ 243 } 244 /* 245 * Save a copy of the IP header in case we want restore it 246 * for sending an ICMP error message in response. 247 */ 248 save_ip = *ip; 249 250 /* 251 * Checksum extended UDP header and data. 252 */ 253 if (uh->uh_sum) { 254 if (m->m_pkthdr.csum_flags & CSUM_DATA_VALID) { 255 if (m->m_pkthdr.csum_flags & CSUM_PSEUDO_HDR) 256 uh->uh_sum = m->m_pkthdr.csum_data; 257 else 258 uh->uh_sum = in_pseudo(ip->ip_src.s_addr, 259 ip->ip_dst.s_addr, htonl((u_short)len + 260 m->m_pkthdr.csum_data + IPPROTO_UDP)); 261 uh->uh_sum ^= 0xffff; 262 } else { 263 char b[9]; 264 bcopy(((struct ipovly *)ip)->ih_x1, b, 9); 265 bzero(((struct ipovly *)ip)->ih_x1, 9); 266 ((struct ipovly *)ip)->ih_len = uh->uh_ulen; 267 uh->uh_sum = in_cksum(m, len + sizeof (struct ip)); 268 bcopy(b, ((struct ipovly *)ip)->ih_x1, 9); 269 } 270 if (uh->uh_sum) { 271 udpstat.udps_badsum++; 272 m_freem(m); 273 return; 274 } 275 } else 276 udpstat.udps_nosum++; 277 278 if (IN_MULTICAST(ntohl(ip->ip_dst.s_addr)) || 279 in_broadcast(ip->ip_dst, m->m_pkthdr.rcvif)) { 280 struct inpcb *last; 281 /* 282 * Deliver a multicast or broadcast datagram to *all* sockets 283 * for which the local and remote addresses and ports match 284 * those of the incoming datagram. This allows more than 285 * one process to receive multi/broadcasts on the same port. 286 * (This really ought to be done for unicast datagrams as 287 * well, but that would cause problems with existing 288 * applications that open both address-specific sockets and 289 * a wildcard socket listening to the same port -- they would 290 * end up receiving duplicates of every unicast datagram. 291 * Those applications open the multiple sockets to overcome an 292 * inadequacy of the UDP socket interface, but for backwards 293 * compatibility we avoid the problem here rather than 294 * fixing the interface. Maybe 4.5BSD will remedy this?) 295 */ 296 297 /* 298 * Construct sockaddr format source address. 299 */ 300 udp_in.sin_port = uh->uh_sport; 301 udp_in.sin_addr = ip->ip_src; 302 /* 303 * Locate pcb(s) for datagram. 304 * (Algorithm copied from raw_intr().) 305 */ 306 last = NULL; 307 #ifdef INET6 308 udp_in6.uin6_init_done = udp_ip6.uip6_init_done = 0; 309 #endif 310 LIST_FOREACH(inp, &udbinfo.listhead, inp_list) { 311 #ifdef INET6 312 if ((inp->inp_vflag & INP_IPV4) == 0) 313 continue; 314 #endif 315 if (inp->inp_lport != uh->uh_dport) 316 continue; 317 if (inp->inp_laddr.s_addr != INADDR_ANY) { 318 if (inp->inp_laddr.s_addr != 319 ip->ip_dst.s_addr) 320 continue; 321 } 322 if (inp->inp_faddr.s_addr != INADDR_ANY) { 323 if (inp->inp_faddr.s_addr != 324 ip->ip_src.s_addr || 325 inp->inp_fport != uh->uh_sport) 326 continue; 327 } 328 329 if (check_multicast_membership(ip, inp, m) < 0) 330 continue; 331 332 if (last != NULL) { 333 struct mbuf *n; 334 335 #ifdef IPSEC 336 /* check AH/ESP integrity. */ 337 if (ipsec4_in_reject_so(m, last->inp_socket)) 338 ipsecstat.in_polvio++; 339 /* do not inject data to pcb */ 340 else 341 #endif /*IPSEC*/ 342 #ifdef FAST_IPSEC 343 /* check AH/ESP integrity. */ 344 if (ipsec4_in_reject(m, last)) 345 ; 346 else 347 #endif /*FAST_IPSEC*/ 348 if ((n = m_copy(m, 0, M_COPYALL)) != NULL) 349 udp_append(last, ip, n, 350 iphlen + 351 sizeof(struct udphdr)); 352 } 353 last = inp; 354 /* 355 * Don't look for additional matches if this one does 356 * not have either the SO_REUSEPORT or SO_REUSEADDR 357 * socket options set. This heuristic avoids searching 358 * through all pcbs in the common case of a non-shared 359 * port. It * assumes that an application will never 360 * clear these options after setting them. 361 */ 362 if ((last->inp_socket->so_options&(SO_REUSEPORT|SO_REUSEADDR)) == 0) 363 break; 364 } 365 366 if (last == NULL) { 367 /* 368 * No matching pcb found; discard datagram. 369 * (No need to send an ICMP Port Unreachable 370 * for a broadcast or multicast datgram.) 371 */ 372 udpstat.udps_noportbcast++; 373 goto bad; 374 } 375 #ifdef IPSEC 376 /* check AH/ESP integrity. */ 377 if (ipsec4_in_reject_so(m, last->inp_socket)) { 378 ipsecstat.in_polvio++; 379 goto bad; 380 } 381 #endif /*IPSEC*/ 382 #ifdef FAST_IPSEC 383 /* check AH/ESP integrity. */ 384 if (ipsec4_in_reject(m, last)) 385 goto bad; 386 #endif /*FAST_IPSEC*/ 387 udp_append(last, ip, m, iphlen + sizeof(struct udphdr)); 388 return; 389 } 390 /* 391 * Locate pcb for datagram. 392 */ 393 inp = in_pcblookup_hash(&udbinfo, ip->ip_src, uh->uh_sport, 394 ip->ip_dst, uh->uh_dport, 1, m->m_pkthdr.rcvif); 395 if (inp == NULL) { 396 if (log_in_vain) { 397 char buf[4*sizeof "123"]; 398 399 strcpy(buf, inet_ntoa(ip->ip_dst)); 400 log(LOG_INFO, 401 "Connection attempt to UDP %s:%d from %s:%d\n", 402 buf, ntohs(uh->uh_dport), inet_ntoa(ip->ip_src), 403 ntohs(uh->uh_sport)); 404 } 405 udpstat.udps_noport++; 406 if (m->m_flags & (M_BCAST | M_MCAST)) { 407 udpstat.udps_noportbcast++; 408 goto bad; 409 } 410 if (blackhole) 411 goto bad; 412 #ifdef ICMP_BANDLIM 413 if (badport_bandlim(BANDLIM_ICMP_UNREACH) < 0) 414 goto bad; 415 #endif 416 *ip = save_ip; 417 ip->ip_len += iphlen; 418 icmp_error(m, ICMP_UNREACH, ICMP_UNREACH_PORT, 0, 0); 419 return; 420 } 421 #ifdef IPSEC 422 if (ipsec4_in_reject_so(m, inp->inp_socket)) { 423 ipsecstat.in_polvio++; 424 goto bad; 425 } 426 #endif /*IPSEC*/ 427 #ifdef FAST_IPSEC 428 if (ipsec4_in_reject(m, inp)) 429 goto bad; 430 #endif /*FAST_IPSEC*/ 431 432 /* 433 * Construct sockaddr format source address. 434 * Stuff source address and datagram in user buffer. 435 */ 436 udp_in.sin_port = uh->uh_sport; 437 udp_in.sin_addr = ip->ip_src; 438 if (inp->inp_flags & INP_CONTROLOPTS 439 || inp->inp_socket->so_options & SO_TIMESTAMP) { 440 #ifdef INET6 441 if (inp->inp_vflag & INP_IPV6) { 442 int savedflags; 443 444 ip_2_ip6_hdr(&udp_ip6.uip6_ip6, ip); 445 savedflags = inp->inp_flags; 446 inp->inp_flags &= ~INP_UNMAPPABLEOPTS; 447 ip6_savecontrol(inp, &opts, &udp_ip6.uip6_ip6, m); 448 inp->inp_flags = savedflags; 449 } else 450 #endif 451 ip_savecontrol(inp, &opts, ip, m); 452 } 453 m_adj(m, iphlen + sizeof(struct udphdr)); 454 #ifdef INET6 455 if (inp->inp_vflag & INP_IPV6) { 456 in6_sin_2_v4mapsin6(&udp_in, &udp_in6.uin6_sin); 457 append_sa = (struct sockaddr *)&udp_in6; 458 } else 459 #endif 460 append_sa = (struct sockaddr *)&udp_in; 461 if (sbappendaddr(&inp->inp_socket->so_rcv, append_sa, m, opts) == 0) { 462 udpstat.udps_fullsock++; 463 goto bad; 464 } 465 sorwakeup(inp->inp_socket); 466 return; 467 bad: 468 m_freem(m); 469 if (opts) 470 m_freem(opts); 471 return; 472 } 473 474 #ifdef INET6 475 static void 476 ip_2_ip6_hdr(ip6, ip) 477 struct ip6_hdr *ip6; 478 struct ip *ip; 479 { 480 bzero(ip6, sizeof(*ip6)); 481 482 ip6->ip6_vfc = IPV6_VERSION; 483 ip6->ip6_plen = ip->ip_len; 484 ip6->ip6_nxt = ip->ip_p; 485 ip6->ip6_hlim = ip->ip_ttl; 486 ip6->ip6_src.s6_addr32[2] = ip6->ip6_dst.s6_addr32[2] = 487 IPV6_ADDR_INT32_SMP; 488 ip6->ip6_src.s6_addr32[3] = ip->ip_src.s_addr; 489 ip6->ip6_dst.s6_addr32[3] = ip->ip_dst.s_addr; 490 } 491 #endif 492 493 /* 494 * subroutine of udp_input(), mainly for source code readability. 495 * caller must properly init udp_ip6 and udp_in6 beforehand. 496 */ 497 static void 498 udp_append(last, ip, n, off) 499 struct inpcb *last; 500 struct ip *ip; 501 struct mbuf *n; 502 int off; 503 { 504 struct sockaddr *append_sa; 505 struct mbuf *opts = 0; 506 507 if (last->inp_flags & INP_CONTROLOPTS || 508 last->inp_socket->so_options & SO_TIMESTAMP) { 509 #ifdef INET6 510 if (last->inp_vflag & INP_IPV6) { 511 int savedflags; 512 513 if (udp_ip6.uip6_init_done == 0) { 514 ip_2_ip6_hdr(&udp_ip6.uip6_ip6, ip); 515 udp_ip6.uip6_init_done = 1; 516 } 517 savedflags = last->inp_flags; 518 last->inp_flags &= ~INP_UNMAPPABLEOPTS; 519 ip6_savecontrol(last, &opts, &udp_ip6.uip6_ip6, n); 520 last->inp_flags = savedflags; 521 } else 522 #endif 523 ip_savecontrol(last, &opts, ip, n); 524 } 525 #ifdef INET6 526 if (last->inp_vflag & INP_IPV6) { 527 if (udp_in6.uin6_init_done == 0) { 528 in6_sin_2_v4mapsin6(&udp_in, &udp_in6.uin6_sin); 529 udp_in6.uin6_init_done = 1; 530 } 531 append_sa = (struct sockaddr *)&udp_in6.uin6_sin; 532 } else 533 #endif 534 append_sa = (struct sockaddr *)&udp_in; 535 m_adj(n, off); 536 if (sbappendaddr(&last->inp_socket->so_rcv, append_sa, n, opts) == 0) { 537 m_freem(n); 538 if (opts) 539 m_freem(opts); 540 udpstat.udps_fullsock++; 541 } else 542 sorwakeup(last->inp_socket); 543 } 544 545 /* 546 * Notify a udp user of an asynchronous error; 547 * just wake up so that he can collect error status. 548 */ 549 void 550 udp_notify(inp, errno) 551 struct inpcb *inp; 552 int errno; 553 { 554 inp->inp_socket->so_error = errno; 555 sorwakeup(inp->inp_socket); 556 sowwakeup(inp->inp_socket); 557 } 558 559 void 560 udp_ctlinput(cmd, sa, vip) 561 int cmd; 562 struct sockaddr *sa; 563 void *vip; 564 { 565 struct ip *ip = vip; 566 struct udphdr *uh; 567 void (*notify) (struct inpcb *, int) = udp_notify; 568 struct in_addr faddr; 569 struct inpcb *inp; 570 int s; 571 572 faddr = ((struct sockaddr_in *)sa)->sin_addr; 573 if (sa->sa_family != AF_INET || faddr.s_addr == INADDR_ANY) 574 return; 575 576 if (PRC_IS_REDIRECT(cmd)) { 577 ip = 0; 578 notify = in_rtchange; 579 } else if (cmd == PRC_HOSTDEAD) 580 ip = 0; 581 else if ((unsigned)cmd >= PRC_NCMDS || inetctlerrmap[cmd] == 0) 582 return; 583 if (ip) { 584 s = splnet(); 585 uh = (struct udphdr *)((caddr_t)ip + (ip->ip_hl << 2)); 586 inp = in_pcblookup_hash(&udbinfo, faddr, uh->uh_dport, 587 ip->ip_src, uh->uh_sport, 0, NULL); 588 if (inp != NULL && inp->inp_socket != NULL) 589 (*notify)(inp, inetctlerrmap[cmd]); 590 splx(s); 591 } else 592 in_pcbnotifyall(&udbinfo.listhead, faddr, inetctlerrmap[cmd], 593 notify); 594 } 595 596 static int 597 udp_pcblist(SYSCTL_HANDLER_ARGS) 598 { 599 int error, i, n, s; 600 struct inpcb *inp, **inp_list; 601 inp_gen_t gencnt; 602 struct xinpgen xig; 603 604 /* 605 * The process of preparing the TCB list is too time-consuming and 606 * resource-intensive to repeat twice on every request. 607 */ 608 if (req->oldptr == 0) { 609 n = udbinfo.ipi_count; 610 req->oldidx = 2 * (sizeof xig) 611 + (n + n/8) * sizeof(struct xinpcb); 612 return 0; 613 } 614 615 if (req->newptr != 0) 616 return EPERM; 617 618 /* 619 * OK, now we're committed to doing something. 620 */ 621 s = splnet(); 622 gencnt = udbinfo.ipi_gencnt; 623 n = udbinfo.ipi_count; 624 splx(s); 625 626 xig.xig_len = sizeof xig; 627 xig.xig_count = n; 628 xig.xig_gen = gencnt; 629 xig.xig_sogen = so_gencnt; 630 error = SYSCTL_OUT(req, &xig, sizeof xig); 631 if (error) 632 return error; 633 634 inp_list = malloc(n * sizeof *inp_list, M_TEMP, M_WAITOK); 635 if (inp_list == 0) 636 return ENOMEM; 637 638 s = splnet(); 639 for (inp = LIST_FIRST(&udbinfo.listhead), i = 0; inp && i < n; 640 inp = LIST_NEXT(inp, inp_list)) { 641 if (inp->inp_gencnt <= gencnt && !prison_xinpcb(req->td, inp)) 642 inp_list[i++] = inp; 643 } 644 splx(s); 645 n = i; 646 647 error = 0; 648 for (i = 0; i < n; i++) { 649 inp = inp_list[i]; 650 if (inp->inp_gencnt <= gencnt) { 651 struct xinpcb xi; 652 xi.xi_len = sizeof xi; 653 /* XXX should avoid extra copy */ 654 bcopy(inp, &xi.xi_inp, sizeof *inp); 655 if (inp->inp_socket) 656 sotoxsocket(inp->inp_socket, &xi.xi_socket); 657 error = SYSCTL_OUT(req, &xi, sizeof xi); 658 } 659 } 660 if (!error) { 661 /* 662 * Give the user an updated idea of our state. 663 * If the generation differs from what we told 664 * her before, she knows that something happened 665 * while we were processing this request, and it 666 * might be necessary to retry. 667 */ 668 s = splnet(); 669 xig.xig_gen = udbinfo.ipi_gencnt; 670 xig.xig_sogen = so_gencnt; 671 xig.xig_count = udbinfo.ipi_count; 672 splx(s); 673 error = SYSCTL_OUT(req, &xig, sizeof xig); 674 } 675 free(inp_list, M_TEMP); 676 return error; 677 } 678 679 SYSCTL_PROC(_net_inet_udp, UDPCTL_PCBLIST, pcblist, CTLFLAG_RD, 0, 0, 680 udp_pcblist, "S,xinpcb", "List of active UDP sockets"); 681 682 static int 683 udp_getcred(SYSCTL_HANDLER_ARGS) 684 { 685 struct sockaddr_in addrs[2]; 686 struct inpcb *inp; 687 int error, s; 688 689 error = suser(req->td); 690 if (error) 691 return (error); 692 error = SYSCTL_IN(req, addrs, sizeof(addrs)); 693 if (error) 694 return (error); 695 s = splnet(); 696 inp = in_pcblookup_hash(&udbinfo, addrs[1].sin_addr, addrs[1].sin_port, 697 addrs[0].sin_addr, addrs[0].sin_port, 1, NULL); 698 if (inp == NULL || inp->inp_socket == NULL) { 699 error = ENOENT; 700 goto out; 701 } 702 error = SYSCTL_OUT(req, inp->inp_socket->so_cred, sizeof(struct ucred)); 703 out: 704 splx(s); 705 return (error); 706 } 707 708 SYSCTL_PROC(_net_inet_udp, OID_AUTO, getcred, CTLTYPE_OPAQUE|CTLFLAG_RW, 709 0, 0, udp_getcred, "S,ucred", "Get the ucred of a UDP connection"); 710 711 static int 712 udp_output(inp, m, dstaddr, control, td) 713 struct inpcb *inp; 714 struct mbuf *m; 715 struct sockaddr *dstaddr; 716 struct mbuf *control; 717 struct thread *td; 718 { 719 struct udpiphdr *ui; 720 int len = m->m_pkthdr.len; 721 struct sockaddr_in *sin; /* really is initialized before use */ 722 int error = 0; 723 724 if (control) 725 m_freem(control); /* XXX */ 726 727 if (len + sizeof(struct udpiphdr) > IP_MAXPACKET) { 728 error = EMSGSIZE; 729 goto release; 730 } 731 732 if (inp->inp_lport == 0) { /* unbound socket */ 733 error = in_pcbbind(inp, (struct sockaddr *)NULL, td); 734 if (error) 735 goto release; 736 } 737 738 if (dstaddr != NULL) { /* destination address specified */ 739 if (inp->inp_faddr.s_addr != INADDR_ANY) { 740 /* already connected */ 741 error = EISCONN; 742 goto release; 743 } 744 sin = (struct sockaddr_in *)dstaddr; 745 prison_remote_ip(td, 0, &sin->sin_addr.s_addr); 746 } else { 747 if (inp->inp_faddr.s_addr == INADDR_ANY) { 748 /* no destination specified and not already connected */ 749 error = ENOTCONN; 750 goto release; 751 } 752 sin = NULL; 753 } 754 755 /* 756 * Calculate data length and get a mbuf 757 * for UDP and IP headers. 758 */ 759 M_PREPEND(m, sizeof(struct udpiphdr), M_DONTWAIT); 760 if (m == 0) { 761 error = ENOBUFS; 762 goto release; 763 } 764 765 /* 766 * Fill in mbuf with extended UDP header 767 * and addresses and length put into network format. 768 */ 769 ui = mtod(m, struct udpiphdr *); 770 bzero(ui->ui_x1, sizeof(ui->ui_x1)); /* XXX still needed? */ 771 ui->ui_pr = IPPROTO_UDP; 772 773 /* 774 * Set destination address. 775 */ 776 if (dstaddr != NULL) { /* use specified destination */ 777 ui->ui_dst = sin->sin_addr; 778 ui->ui_dport = sin->sin_port; 779 } else { /* use connected destination */ 780 ui->ui_dst = inp->inp_faddr; 781 ui->ui_dport = inp->inp_fport; 782 } 783 784 /* 785 * Set source address. If the source address is INADDR_ANY we 786 * have to lookup the outgoing interface based on the target address 787 * and assign the source address from that. 788 * 789 * If dstaddr is NULL the socket is connected and we have to use the 790 * connected target (in_faddr) as the target address, otherwise we 791 * just use dstaddr. 792 */ 793 if (inp->inp_laddr.s_addr == INADDR_ANY) { /* need to pick an address */ 794 struct sockaddr_in *if_sin; 795 struct sockaddr_in sin_tmp; 796 797 if (dstaddr == NULL) { 798 sin_tmp.sin_len = sizeof(sin_tmp); 799 sin_tmp.sin_family = AF_INET; 800 sin_tmp.sin_port = inp->inp_fport; 801 sin_tmp.sin_addr = inp->inp_faddr; 802 error = in_pcbladdr(inp, (void *)&sin_tmp, &if_sin); 803 } else { 804 error = in_pcbladdr(inp, dstaddr, &if_sin); 805 } 806 if (error) 807 goto release; 808 ui->ui_src = if_sin->sin_addr; 809 } else { /* use bound non-null address */ 810 ui->ui_src = inp->inp_laddr; 811 } 812 ui->ui_sport = inp->inp_lport; 813 KASSERT(inp->inp_lport != 0, ("inp lport should have been bound")); 814 815 ui->ui_ulen = htons((u_short)len + sizeof(struct udphdr)); 816 817 /* 818 * Set up checksum and output datagram. 819 */ 820 if (udpcksum) { 821 ui->ui_sum = in_pseudo(ui->ui_src.s_addr, ui->ui_dst.s_addr, 822 htons((u_short)len + sizeof(struct udphdr) + IPPROTO_UDP)); 823 m->m_pkthdr.csum_flags = CSUM_UDP; 824 m->m_pkthdr.csum_data = offsetof(struct udphdr, uh_sum); 825 } else { 826 ui->ui_sum = 0; 827 } 828 ((struct ip *)ui)->ip_len = sizeof (struct udpiphdr) + len; 829 ((struct ip *)ui)->ip_ttl = inp->inp_ip_ttl; /* XXX */ 830 ((struct ip *)ui)->ip_tos = inp->inp_ip_tos; /* XXX */ 831 udpstat.udps_opackets++; 832 833 error = ip_output(m, inp->inp_options, &inp->inp_route, 834 (inp->inp_socket->so_options & (SO_DONTROUTE | SO_BROADCAST)), 835 inp->inp_moptions, inp); 836 837 return (error); 838 839 release: 840 m_freem(m); 841 return (error); 842 } 843 844 u_long udp_sendspace = 9216; /* really max datagram size */ 845 /* 40 1K datagrams */ 846 SYSCTL_INT(_net_inet_udp, UDPCTL_MAXDGRAM, maxdgram, CTLFLAG_RW, 847 &udp_sendspace, 0, "Maximum outgoing UDP datagram size"); 848 849 u_long udp_recvspace = 40 * (1024 + 850 #ifdef INET6 851 sizeof(struct sockaddr_in6) 852 #else 853 sizeof(struct sockaddr_in) 854 #endif 855 ); 856 SYSCTL_INT(_net_inet_udp, UDPCTL_RECVSPACE, recvspace, CTLFLAG_RW, 857 &udp_recvspace, 0, "Maximum incoming UDP datagram size"); 858 859 static int 860 udp_abort(struct socket *so) 861 { 862 struct inpcb *inp; 863 int s; 864 865 inp = sotoinpcb(so); 866 if (inp == 0) 867 return EINVAL; /* ??? possible? panic instead? */ 868 soisdisconnected(so); 869 s = splnet(); 870 in_pcbdetach(inp); 871 splx(s); 872 return 0; 873 } 874 875 static int 876 udp_attach(struct socket *so, int proto, struct pru_attach_info *ai) 877 { 878 struct inpcb *inp; 879 int s, error; 880 881 inp = sotoinpcb(so); 882 if (inp != 0) 883 return EINVAL; 884 885 error = soreserve(so, udp_sendspace, udp_recvspace, ai->sb_rlimit); 886 if (error) 887 return error; 888 s = splnet(); 889 error = in_pcballoc(so, &udbinfo); 890 splx(s); 891 if (error) 892 return error; 893 894 inp = (struct inpcb *)so->so_pcb; 895 inp->inp_vflag |= INP_IPV4; 896 inp->inp_ip_ttl = ip_defttl; 897 return 0; 898 } 899 900 static int 901 udp_bind(struct socket *so, struct sockaddr *nam, struct thread *td) 902 { 903 struct inpcb *inp; 904 int s, error; 905 906 inp = sotoinpcb(so); 907 if (inp == 0) 908 return EINVAL; 909 s = splnet(); 910 error = in_pcbbind(inp, nam, td); 911 splx(s); 912 return error; 913 } 914 915 static int 916 udp_connect(struct socket *so, struct sockaddr *nam, struct thread *td) 917 { 918 struct inpcb *inp; 919 int s, error; 920 struct sockaddr_in *sin; 921 922 inp = sotoinpcb(so); 923 if (inp == 0) 924 return EINVAL; 925 if (inp->inp_faddr.s_addr != INADDR_ANY) 926 return EISCONN; 927 error = 0; 928 s = splnet(); 929 if (inp->inp_laddr.s_addr == INADDR_ANY && 930 td->td_proc && 931 td->td_proc->p_ucred->cr_prison != NULL) { 932 error = in_pcbbind(inp, NULL, td); 933 } 934 if (error == 0) { 935 sin = (struct sockaddr_in *)nam; 936 prison_remote_ip(td, 0, &sin->sin_addr.s_addr); 937 error = in_pcbconnect(inp, nam, td); 938 } 939 splx(s); 940 if (error == 0) 941 soisconnected(so); 942 return error; 943 } 944 945 static int 946 udp_detach(struct socket *so) 947 { 948 struct inpcb *inp; 949 int s; 950 951 inp = sotoinpcb(so); 952 if (inp == 0) 953 return EINVAL; 954 s = splnet(); 955 in_pcbdetach(inp); 956 splx(s); 957 return 0; 958 } 959 960 static int 961 udp_disconnect(struct socket *so) 962 { 963 struct inpcb *inp; 964 int s; 965 966 inp = sotoinpcb(so); 967 if (inp == 0) 968 return EINVAL; 969 if (inp->inp_faddr.s_addr == INADDR_ANY) 970 return ENOTCONN; 971 972 s = splnet(); 973 in_pcbdisconnect(inp); 974 inp->inp_laddr.s_addr = INADDR_ANY; 975 in_pcbinsbindhash(inp); 976 splx(s); 977 so->so_state &= ~SS_ISCONNECTED; /* XXX */ 978 return 0; 979 } 980 981 static int 982 udp_send(struct socket *so, int flags, struct mbuf *m, struct sockaddr *addr, 983 struct mbuf *control, struct thread *td) 984 { 985 struct inpcb *inp; 986 987 inp = sotoinpcb(so); 988 if (inp == 0) { 989 m_freem(m); 990 return EINVAL; 991 } 992 return udp_output(inp, m, addr, control, td); 993 } 994 995 int 996 udp_shutdown(struct socket *so) 997 { 998 struct inpcb *inp; 999 1000 inp = sotoinpcb(so); 1001 if (inp == 0) 1002 return EINVAL; 1003 socantsendmore(so); 1004 return 0; 1005 } 1006 1007 struct pr_usrreqs udp_usrreqs = { 1008 udp_abort, pru_accept_notsupp, udp_attach, udp_bind, udp_connect, 1009 pru_connect2_notsupp, in_control, udp_detach, udp_disconnect, 1010 pru_listen_notsupp, in_setpeeraddr, pru_rcvd_notsupp, 1011 pru_rcvoob_notsupp, udp_send, pru_sense_null, udp_shutdown, 1012 in_setsockaddr, sosend, soreceive, sopoll 1013 }; 1014 1015