/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */

/*
 * Copyright 2008 Sun Microsystems, Inc.  All rights reserved.
 * Use is subject to license terms.
250Sstevel@tonic-gate */ 260Sstevel@tonic-gate 270Sstevel@tonic-gate #include <sys/types.h> 280Sstevel@tonic-gate #include <sys/systm.h> 290Sstevel@tonic-gate #include <sys/stream.h> 301676Sjpk #include <sys/strsubr.h> 310Sstevel@tonic-gate #include <sys/ddi.h> 320Sstevel@tonic-gate #include <sys/sunddi.h> 330Sstevel@tonic-gate #include <sys/kmem.h> 340Sstevel@tonic-gate #include <sys/socket.h> 350Sstevel@tonic-gate #include <sys/random.h> 361676Sjpk #include <sys/tsol/tndb.h> 371676Sjpk #include <sys/tsol/tnet.h> 380Sstevel@tonic-gate 390Sstevel@tonic-gate #include <netinet/in.h> 400Sstevel@tonic-gate #include <netinet/ip6.h> 410Sstevel@tonic-gate #include <netinet/sctp.h> 420Sstevel@tonic-gate 430Sstevel@tonic-gate #include <inet/common.h> 440Sstevel@tonic-gate #include <inet/ip.h> 450Sstevel@tonic-gate #include <inet/ip6.h> 460Sstevel@tonic-gate #include <inet/ip_ire.h> 470Sstevel@tonic-gate #include <inet/mib2.h> 480Sstevel@tonic-gate #include <inet/nd.h> 490Sstevel@tonic-gate #include <inet/optcom.h> 500Sstevel@tonic-gate #include <inet/sctp_ip.h> 510Sstevel@tonic-gate #include <inet/ipclassifier.h> 521676Sjpk 530Sstevel@tonic-gate #include "sctp_impl.h" 540Sstevel@tonic-gate #include "sctp_addr.h" 551932Svi117747 #include "sctp_asconf.h" 560Sstevel@tonic-gate 570Sstevel@tonic-gate static struct kmem_cache *sctp_kmem_faddr_cache; 581735Skcpoon static void sctp_init_faddr(sctp_t *, sctp_faddr_t *, in6_addr_t *, mblk_t *); 590Sstevel@tonic-gate 601735Skcpoon /* Set the source address. Refer to comments in sctp_get_ire(). */ 611932Svi117747 void 621932Svi117747 sctp_set_saddr(sctp_t *sctp, sctp_faddr_t *fp) 630Sstevel@tonic-gate { 641719Sjarrett boolean_t v6 = !fp->isv4; 654818Skcpoon boolean_t addr_set; 661719Sjarrett 674818Skcpoon fp->saddr = sctp_get_valid_addr(sctp, v6, &addr_set); 684818Skcpoon /* 694818Skcpoon * If there is no source address avaialble, mark this peer address 704818Skcpoon * as unreachable for now. 
When the heartbeat timer fires, it will 714818Skcpoon * call sctp_get_ire() to re-check if there is any source address 724818Skcpoon * available. 734818Skcpoon */ 744818Skcpoon if (!addr_set) 754818Skcpoon fp->state = SCTP_FADDRS_UNREACH; 760Sstevel@tonic-gate } 770Sstevel@tonic-gate 780Sstevel@tonic-gate /* 790Sstevel@tonic-gate * Call this function to update the cached IRE of a peer addr fp. 800Sstevel@tonic-gate */ 810Sstevel@tonic-gate void 821735Skcpoon sctp_get_ire(sctp_t *sctp, sctp_faddr_t *fp) 830Sstevel@tonic-gate { 841735Skcpoon ire_t *ire; 851735Skcpoon ipaddr_t addr4; 861735Skcpoon in6_addr_t laddr; 870Sstevel@tonic-gate sctp_saddr_ipif_t *sp; 881735Skcpoon int hdrlen; 891735Skcpoon ts_label_t *tsl; 903448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 913448Sdh155122 ip_stack_t *ipst = sctps->sctps_netstack->netstack_ip; 920Sstevel@tonic-gate 930Sstevel@tonic-gate /* Remove the previous cache IRE */ 940Sstevel@tonic-gate if ((ire = fp->ire) != NULL) { 950Sstevel@tonic-gate IRE_REFRELE_NOTR(ire); 960Sstevel@tonic-gate fp->ire = NULL; 970Sstevel@tonic-gate } 980Sstevel@tonic-gate 990Sstevel@tonic-gate /* 1000Sstevel@tonic-gate * If this addr is not reachable, mark it as unconfirmed for now, the 1010Sstevel@tonic-gate * state will be changed back to unreachable later in this function 1020Sstevel@tonic-gate * if it is still the case. 
1030Sstevel@tonic-gate */ 1040Sstevel@tonic-gate if (fp->state == SCTP_FADDRS_UNREACH) { 1050Sstevel@tonic-gate fp->state = SCTP_FADDRS_UNCONFIRMED; 1060Sstevel@tonic-gate } 1070Sstevel@tonic-gate 1081676Sjpk tsl = crgetlabel(CONN_CRED(sctp->sctp_connp)); 1091676Sjpk 1100Sstevel@tonic-gate if (fp->isv4) { 1110Sstevel@tonic-gate IN6_V4MAPPED_TO_IPADDR(&fp->faddr, addr4); 1123448Sdh155122 ire = ire_cache_lookup(addr4, sctp->sctp_zoneid, tsl, ipst); 1131676Sjpk if (ire != NULL) 1141676Sjpk IN6_IPADDR_TO_V4MAPPED(ire->ire_src_addr, &laddr); 1151676Sjpk } else { 1163448Sdh155122 ire = ire_cache_lookup_v6(&fp->faddr, sctp->sctp_zoneid, tsl, 1173448Sdh155122 ipst); 1181676Sjpk if (ire != NULL) 1191676Sjpk laddr = ire->ire_src_addr_v6; 1201676Sjpk } 1210Sstevel@tonic-gate 1221676Sjpk if (ire == NULL) { 1231676Sjpk dprint(3, ("ire2faddr: no ire for %x:%x:%x:%x\n", 1241676Sjpk SCTP_PRINTADDR(fp->faddr))); 1251676Sjpk /* 1261676Sjpk * It is tempting to just leave the src addr 1271676Sjpk * unspecified and let IP figure it out, but we 1281676Sjpk * *cannot* do this, since IP may choose a src addr 1291676Sjpk * that is not part of this association... unless 1301676Sjpk * this sctp has bound to all addrs. So if the ire 1311676Sjpk * lookup fails, try to find one in our src addr 1321676Sjpk * list, unless the sctp has bound to all addrs, in 1331676Sjpk * which case we change the src addr to unspec. 1341676Sjpk * 1351676Sjpk * Note that if this is a v6 endpoint but it does 1361676Sjpk * not have any v4 address at this point (e.g. may 1371676Sjpk * have been deleted), sctp_get_valid_addr() will 1381676Sjpk * return mapped INADDR_ANY. In this case, this 1391676Sjpk * address should be marked not reachable so that 1401676Sjpk * it won't be used to send data. 
1411676Sjpk */ 1421932Svi117747 sctp_set_saddr(sctp, fp); 1431735Skcpoon if (fp->state == SCTP_FADDRS_UNREACH) 1441735Skcpoon return; 1451735Skcpoon goto check_current; 1461676Sjpk } 1471676Sjpk 1481735Skcpoon /* Make sure the laddr is part of this association */ 1493510Svi117747 if ((sp = sctp_saddr_lookup(sctp, &ire->ire_ipif->ipif_v6lcl_addr, 1503510Svi117747 0)) != NULL && !sp->saddr_ipif_dontsrc) { 1511676Sjpk if (sp->saddr_ipif_unconfirmed == 1) 1521676Sjpk sp->saddr_ipif_unconfirmed = 0; 1531676Sjpk fp->saddr = laddr; 1541676Sjpk } else { 1551676Sjpk dprint(2, ("ire2faddr: src addr is not part of assc\n")); 1561735Skcpoon 1571735Skcpoon /* 1581735Skcpoon * Set the src to the first saddr and hope for the best. 1591735Skcpoon * Note that we will still do the ire caching below. 1601735Skcpoon * Otherwise, whenever we send a packet, we need to do 1611735Skcpoon * the ire lookup again and still may not get the correct 1621735Skcpoon * source address. Note that this case should very seldomly 1631735Skcpoon * happen. One scenario this can happen is an app 1641735Skcpoon * explicitly bind() to an address. But that address is 1651735Skcpoon * not the preferred source address to send to the peer. 1661735Skcpoon */ 1671932Svi117747 sctp_set_saddr(sctp, fp); 1681735Skcpoon if (fp->state == SCTP_FADDRS_UNREACH) { 1691735Skcpoon IRE_REFRELE(ire); 1701735Skcpoon return; 1711735Skcpoon } 1720Sstevel@tonic-gate } 1730Sstevel@tonic-gate 1741735Skcpoon /* 1751735Skcpoon * Note that ire_cache_lookup_*() returns an ire with the tracing 1761735Skcpoon * bits enabled. This requires the thread holding the ire also 1771735Skcpoon * do the IRE_REFRELE(). Thus we need to do IRE_REFHOLD_NOTR() 1781735Skcpoon * and then IRE_REFRELE() the ire here to make the tracing bits 1791735Skcpoon * work. 
1801735Skcpoon */ 1811735Skcpoon IRE_REFHOLD_NOTR(ire); 1821735Skcpoon IRE_REFRELE(ire); 1831735Skcpoon 1840Sstevel@tonic-gate /* Cache the IRE */ 1850Sstevel@tonic-gate fp->ire = ire; 1860Sstevel@tonic-gate if (fp->ire->ire_type == IRE_LOOPBACK && !sctp->sctp_loopback) 1870Sstevel@tonic-gate sctp->sctp_loopback = 1; 1880Sstevel@tonic-gate 1890Sstevel@tonic-gate /* 1900Sstevel@tonic-gate * Pull out RTO information for this faddr and use it if we don't 1910Sstevel@tonic-gate * have any yet. 1920Sstevel@tonic-gate */ 1930Sstevel@tonic-gate if (fp->srtt == -1 && ire->ire_uinfo.iulp_rtt != 0) { 194116Skcpoon /* The cached value is in ms. */ 195116Skcpoon fp->srtt = MSEC_TO_TICK(ire->ire_uinfo.iulp_rtt); 196116Skcpoon fp->rttvar = MSEC_TO_TICK(ire->ire_uinfo.iulp_rtt_sd); 1970Sstevel@tonic-gate fp->rto = 3 * fp->srtt; 1980Sstevel@tonic-gate 1990Sstevel@tonic-gate /* Bound the RTO by configured min and max values */ 2000Sstevel@tonic-gate if (fp->rto < sctp->sctp_rto_min) { 2010Sstevel@tonic-gate fp->rto = sctp->sctp_rto_min; 2020Sstevel@tonic-gate } 2030Sstevel@tonic-gate if (fp->rto > sctp->sctp_rto_max) { 2040Sstevel@tonic-gate fp->rto = sctp->sctp_rto_max; 2050Sstevel@tonic-gate } 2060Sstevel@tonic-gate } 2070Sstevel@tonic-gate 2080Sstevel@tonic-gate /* 2090Sstevel@tonic-gate * Record the MTU for this faddr. If the MTU for this faddr has 2100Sstevel@tonic-gate * changed, check if the assc MTU will also change. 2110Sstevel@tonic-gate */ 2120Sstevel@tonic-gate if (fp->isv4) { 2130Sstevel@tonic-gate hdrlen = sctp->sctp_hdr_len; 2140Sstevel@tonic-gate } else { 2150Sstevel@tonic-gate hdrlen = sctp->sctp_hdr6_len; 2160Sstevel@tonic-gate } 2170Sstevel@tonic-gate if ((fp->sfa_pmss + hdrlen) != ire->ire_max_frag) { 2180Sstevel@tonic-gate /* Make sure that sfa_pmss is a multiple of SCTP_ALIGN. 
*/ 2190Sstevel@tonic-gate fp->sfa_pmss = (ire->ire_max_frag - hdrlen) & ~(SCTP_ALIGN - 1); 2200Sstevel@tonic-gate if (fp->cwnd < (fp->sfa_pmss * 2)) { 2213795Skcpoon SET_CWND(fp, fp->sfa_pmss, 2223795Skcpoon sctps->sctps_slow_start_initial); 2230Sstevel@tonic-gate } 2240Sstevel@tonic-gate } 2250Sstevel@tonic-gate 2261735Skcpoon check_current: 2271735Skcpoon if (fp == sctp->sctp_current) 2281735Skcpoon sctp_set_faddr_current(sctp, fp); 2290Sstevel@tonic-gate } 2300Sstevel@tonic-gate 2310Sstevel@tonic-gate void 2321735Skcpoon sctp_update_ire(sctp_t *sctp) 2330Sstevel@tonic-gate { 2341735Skcpoon ire_t *ire; 2351735Skcpoon sctp_faddr_t *fp; 2363448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 2370Sstevel@tonic-gate 2381735Skcpoon for (fp = sctp->sctp_faddrs; fp != NULL; fp = fp->next) { 2391735Skcpoon if ((ire = fp->ire) == NULL) 2401735Skcpoon continue; 2411735Skcpoon mutex_enter(&ire->ire_lock); 2420Sstevel@tonic-gate 2431735Skcpoon /* 2441735Skcpoon * If the cached IRE is going away, there is no point to 2451735Skcpoon * update it. 2461735Skcpoon */ 2471735Skcpoon if (ire->ire_marks & IRE_MARK_CONDEMNED) { 2481735Skcpoon mutex_exit(&ire->ire_lock); 2491735Skcpoon IRE_REFRELE_NOTR(ire); 2501735Skcpoon fp->ire = NULL; 2511735Skcpoon continue; 2520Sstevel@tonic-gate } 2530Sstevel@tonic-gate 2540Sstevel@tonic-gate /* 2551735Skcpoon * Only record the PMTU for this faddr if we actually have 2561735Skcpoon * done discovery. This prevents initialized default from 2571735Skcpoon * clobbering any real info that IP may have. 
2580Sstevel@tonic-gate */ 2591735Skcpoon if (fp->pmtu_discovered) { 2601735Skcpoon if (fp->isv4) { 2611735Skcpoon ire->ire_max_frag = fp->sfa_pmss + 2621735Skcpoon sctp->sctp_hdr_len; 2631735Skcpoon } else { 2641735Skcpoon ire->ire_max_frag = fp->sfa_pmss + 2651735Skcpoon sctp->sctp_hdr6_len; 2661735Skcpoon } 2670Sstevel@tonic-gate } 2681735Skcpoon 2693448Sdh155122 if (sctps->sctps_rtt_updates != 0 && 2703448Sdh155122 fp->rtt_updates >= sctps->sctps_rtt_updates) { 2711735Skcpoon /* 2721735Skcpoon * If there is no old cached values, initialize them 2731735Skcpoon * conservatively. Set them to be (1.5 * new value). 2741735Skcpoon * This code copied from ip_ire_advise(). The cached 2751735Skcpoon * value is in ms. 2761735Skcpoon */ 2771735Skcpoon if (ire->ire_uinfo.iulp_rtt != 0) { 2781735Skcpoon ire->ire_uinfo.iulp_rtt = 2791735Skcpoon (ire->ire_uinfo.iulp_rtt + 2801735Skcpoon TICK_TO_MSEC(fp->srtt)) >> 1; 2811735Skcpoon } else { 2821735Skcpoon ire->ire_uinfo.iulp_rtt = 2831735Skcpoon TICK_TO_MSEC(fp->srtt + (fp->srtt >> 1)); 2841735Skcpoon } 2851735Skcpoon if (ire->ire_uinfo.iulp_rtt_sd != 0) { 2861735Skcpoon ire->ire_uinfo.iulp_rtt_sd = 2874691Skcpoon (ire->ire_uinfo.iulp_rtt_sd + 2884691Skcpoon TICK_TO_MSEC(fp->rttvar)) >> 1; 2891735Skcpoon } else { 2901735Skcpoon ire->ire_uinfo.iulp_rtt_sd = 2911735Skcpoon TICK_TO_MSEC(fp->rttvar + 2921735Skcpoon (fp->rttvar >> 1)); 2931735Skcpoon } 2941735Skcpoon fp->rtt_updates = 0; 2950Sstevel@tonic-gate } 2961735Skcpoon mutex_exit(&ire->ire_lock); 2970Sstevel@tonic-gate } 2980Sstevel@tonic-gate } 2990Sstevel@tonic-gate 3000Sstevel@tonic-gate /* 3010Sstevel@tonic-gate * The sender must set the total length in the IP header. 3020Sstevel@tonic-gate * If sendto == NULL, the current will be used. 
3030Sstevel@tonic-gate */ 3040Sstevel@tonic-gate mblk_t * 3050Sstevel@tonic-gate sctp_make_mp(sctp_t *sctp, sctp_faddr_t *sendto, int trailer) 3060Sstevel@tonic-gate { 3070Sstevel@tonic-gate mblk_t *mp; 3080Sstevel@tonic-gate size_t ipsctplen; 3090Sstevel@tonic-gate int isv4; 3100Sstevel@tonic-gate sctp_faddr_t *fp; 3113448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 3124818Skcpoon boolean_t src_changed = B_FALSE; 3130Sstevel@tonic-gate 3140Sstevel@tonic-gate ASSERT(sctp->sctp_current != NULL || sendto != NULL); 3150Sstevel@tonic-gate if (sendto == NULL) { 3160Sstevel@tonic-gate fp = sctp->sctp_current; 3170Sstevel@tonic-gate } else { 3180Sstevel@tonic-gate fp = sendto; 3190Sstevel@tonic-gate } 3200Sstevel@tonic-gate isv4 = fp->isv4; 3210Sstevel@tonic-gate 3220Sstevel@tonic-gate /* Try to look for another IRE again. */ 3234818Skcpoon if (fp->ire == NULL) { 3241735Skcpoon sctp_get_ire(sctp, fp); 3254818Skcpoon /* 3264818Skcpoon * Although we still may not get an IRE, the source address 3274818Skcpoon * may be changed in sctp_get_ire(). Set src_changed to 3284818Skcpoon * true so that the source address is copied again. 3294818Skcpoon */ 3304818Skcpoon src_changed = B_TRUE; 3314818Skcpoon } 3320Sstevel@tonic-gate 3330Sstevel@tonic-gate /* There is no suitable source address to use, return. 
*/ 3340Sstevel@tonic-gate if (fp->state == SCTP_FADDRS_UNREACH) 3350Sstevel@tonic-gate return (NULL); 3364818Skcpoon ASSERT(!IN6_IS_ADDR_V4MAPPED_ANY(&fp->saddr)); 3370Sstevel@tonic-gate 3380Sstevel@tonic-gate if (isv4) { 3390Sstevel@tonic-gate ipsctplen = sctp->sctp_hdr_len; 3400Sstevel@tonic-gate } else { 3410Sstevel@tonic-gate ipsctplen = sctp->sctp_hdr6_len; 3420Sstevel@tonic-gate } 3430Sstevel@tonic-gate 3443448Sdh155122 mp = allocb_cred(ipsctplen + sctps->sctps_wroff_xtra + trailer, 3451676Sjpk CONN_CRED(sctp->sctp_connp)); 3460Sstevel@tonic-gate if (mp == NULL) { 3471676Sjpk ip1dbg(("sctp_make_mp: error making mp..\n")); 3480Sstevel@tonic-gate return (NULL); 3490Sstevel@tonic-gate } 3503448Sdh155122 mp->b_rptr += sctps->sctps_wroff_xtra; 3510Sstevel@tonic-gate mp->b_wptr = mp->b_rptr + ipsctplen; 3520Sstevel@tonic-gate 3530Sstevel@tonic-gate ASSERT(OK_32PTR(mp->b_wptr)); 3540Sstevel@tonic-gate 3550Sstevel@tonic-gate if (isv4) { 3560Sstevel@tonic-gate ipha_t *iph = (ipha_t *)mp->b_rptr; 3570Sstevel@tonic-gate 3580Sstevel@tonic-gate bcopy(sctp->sctp_iphc, mp->b_rptr, ipsctplen); 3594818Skcpoon if (fp != sctp->sctp_current || src_changed) { 3604818Skcpoon /* Fix the source and destination addresses. */ 3610Sstevel@tonic-gate IN6_V4MAPPED_TO_IPADDR(&fp->faddr, iph->ipha_dst); 3624818Skcpoon IN6_V4MAPPED_TO_IPADDR(&fp->saddr, iph->ipha_src); 3630Sstevel@tonic-gate } 3640Sstevel@tonic-gate /* set or clear the don't fragment bit */ 3650Sstevel@tonic-gate if (fp->df) { 3660Sstevel@tonic-gate iph->ipha_fragment_offset_and_flags = htons(IPH_DF); 3670Sstevel@tonic-gate } else { 3680Sstevel@tonic-gate iph->ipha_fragment_offset_and_flags = 0; 3690Sstevel@tonic-gate } 3700Sstevel@tonic-gate } else { 3710Sstevel@tonic-gate bcopy(sctp->sctp_iphc6, mp->b_rptr, ipsctplen); 3724818Skcpoon if (fp != sctp->sctp_current || src_changed) { 3734818Skcpoon /* Fix the source and destination addresses. 
*/ 3740Sstevel@tonic-gate ((ip6_t *)(mp->b_rptr))->ip6_dst = fp->faddr; 3754818Skcpoon ((ip6_t *)(mp->b_rptr))->ip6_src = fp->saddr; 3760Sstevel@tonic-gate } 3770Sstevel@tonic-gate } 3780Sstevel@tonic-gate ASSERT(sctp->sctp_connp != NULL); 3790Sstevel@tonic-gate 3800Sstevel@tonic-gate /* 3810Sstevel@tonic-gate * IP will not free this IRE if it is condemned. SCTP needs to 3820Sstevel@tonic-gate * free it. 3830Sstevel@tonic-gate */ 3840Sstevel@tonic-gate if ((fp->ire != NULL) && (fp->ire->ire_marks & IRE_MARK_CONDEMNED)) { 3850Sstevel@tonic-gate IRE_REFRELE_NOTR(fp->ire); 3860Sstevel@tonic-gate fp->ire = NULL; 3870Sstevel@tonic-gate } 3880Sstevel@tonic-gate /* Stash the conn and ire ptr info. for IP */ 3890Sstevel@tonic-gate SCTP_STASH_IPINFO(mp, fp->ire); 3900Sstevel@tonic-gate 3910Sstevel@tonic-gate return (mp); 3920Sstevel@tonic-gate } 3930Sstevel@tonic-gate 3940Sstevel@tonic-gate /* 3950Sstevel@tonic-gate * Notify upper layers about preferred write offset, write size. 3960Sstevel@tonic-gate */ 3970Sstevel@tonic-gate void 3980Sstevel@tonic-gate sctp_set_ulp_prop(sctp_t *sctp) 3990Sstevel@tonic-gate { 4000Sstevel@tonic-gate int hdrlen; 4013448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 4020Sstevel@tonic-gate 4030Sstevel@tonic-gate if (sctp->sctp_current->isv4) { 4040Sstevel@tonic-gate hdrlen = sctp->sctp_hdr_len; 4050Sstevel@tonic-gate } else { 4060Sstevel@tonic-gate hdrlen = sctp->sctp_hdr6_len; 4070Sstevel@tonic-gate } 4080Sstevel@tonic-gate ASSERT(sctp->sctp_ulpd); 4090Sstevel@tonic-gate 4100Sstevel@tonic-gate ASSERT(sctp->sctp_current->sfa_pmss == sctp->sctp_mss); 4110Sstevel@tonic-gate sctp->sctp_ulp_prop(sctp->sctp_ulpd, 4123448Sdh155122 sctps->sctps_wroff_xtra + hdrlen + sizeof (sctp_data_hdr_t), 4130Sstevel@tonic-gate sctp->sctp_mss - sizeof (sctp_data_hdr_t)); 4140Sstevel@tonic-gate } 4150Sstevel@tonic-gate 4160Sstevel@tonic-gate void 4170Sstevel@tonic-gate sctp_set_iplen(sctp_t *sctp, mblk_t *mp) 4180Sstevel@tonic-gate { 4190Sstevel@tonic-gate 
uint16_t sum = 0; 4200Sstevel@tonic-gate ipha_t *iph; 4210Sstevel@tonic-gate ip6_t *ip6h; 4220Sstevel@tonic-gate mblk_t *pmp = mp; 4230Sstevel@tonic-gate boolean_t isv4; 4240Sstevel@tonic-gate 4250Sstevel@tonic-gate isv4 = (IPH_HDR_VERSION(mp->b_rptr) == IPV4_VERSION); 4260Sstevel@tonic-gate for (; pmp; pmp = pmp->b_cont) 4270Sstevel@tonic-gate sum += pmp->b_wptr - pmp->b_rptr; 4280Sstevel@tonic-gate 4290Sstevel@tonic-gate if (isv4) { 4300Sstevel@tonic-gate iph = (ipha_t *)mp->b_rptr; 4310Sstevel@tonic-gate iph->ipha_length = htons(sum); 4320Sstevel@tonic-gate } else { 4330Sstevel@tonic-gate ip6h = (ip6_t *)mp->b_rptr; 434679Sseb /* 435679Sseb * If an ip6i_t is present, the real IPv6 header 436679Sseb * immediately follows. 437679Sseb */ 438679Sseb if (ip6h->ip6_nxt == IPPROTO_RAW) 439679Sseb ip6h = (ip6_t *)&ip6h[1]; 4400Sstevel@tonic-gate ip6h->ip6_plen = htons(sum - ((char *)&sctp->sctp_ip6h[1] - 4410Sstevel@tonic-gate sctp->sctp_iphc6)); 4420Sstevel@tonic-gate } 4430Sstevel@tonic-gate } 4440Sstevel@tonic-gate 4450Sstevel@tonic-gate int 4460Sstevel@tonic-gate sctp_compare_faddrsets(sctp_faddr_t *a1, sctp_faddr_t *a2) 4470Sstevel@tonic-gate { 4480Sstevel@tonic-gate int na1 = 0; 4490Sstevel@tonic-gate int overlap = 0; 4500Sstevel@tonic-gate int equal = 1; 4510Sstevel@tonic-gate int onematch; 4520Sstevel@tonic-gate sctp_faddr_t *fp1, *fp2; 4530Sstevel@tonic-gate 4540Sstevel@tonic-gate for (fp1 = a1; fp1; fp1 = fp1->next) { 4550Sstevel@tonic-gate onematch = 0; 4560Sstevel@tonic-gate for (fp2 = a2; fp2; fp2 = fp2->next) { 4570Sstevel@tonic-gate if (IN6_ARE_ADDR_EQUAL(&fp1->faddr, &fp2->faddr)) { 4580Sstevel@tonic-gate overlap++; 4590Sstevel@tonic-gate onematch = 1; 4600Sstevel@tonic-gate break; 4610Sstevel@tonic-gate } 4620Sstevel@tonic-gate if (!onematch) { 4630Sstevel@tonic-gate equal = 0; 4640Sstevel@tonic-gate } 4650Sstevel@tonic-gate } 4660Sstevel@tonic-gate na1++; 4670Sstevel@tonic-gate } 4680Sstevel@tonic-gate 4690Sstevel@tonic-gate if (equal) { 
4700Sstevel@tonic-gate return (SCTP_ADDR_EQUAL); 4710Sstevel@tonic-gate } 4720Sstevel@tonic-gate if (overlap == na1) { 4730Sstevel@tonic-gate return (SCTP_ADDR_SUBSET); 4740Sstevel@tonic-gate } 4750Sstevel@tonic-gate if (overlap) { 4760Sstevel@tonic-gate return (SCTP_ADDR_OVERLAP); 4770Sstevel@tonic-gate } 4780Sstevel@tonic-gate return (SCTP_ADDR_DISJOINT); 4790Sstevel@tonic-gate } 4800Sstevel@tonic-gate 4810Sstevel@tonic-gate /* 4821735Skcpoon * Returns 0 on success, -1 on memory allocation failure. If sleep 4831735Skcpoon * is true, this function should never fail. The boolean parameter 4841735Skcpoon * first decides whether the newly created faddr structure should be 4851735Skcpoon * added at the beginning of the list or at the end. 4861735Skcpoon * 4871735Skcpoon * Note: caller must hold conn fanout lock. 4880Sstevel@tonic-gate */ 4891735Skcpoon int 4901735Skcpoon sctp_add_faddr(sctp_t *sctp, in6_addr_t *addr, int sleep, boolean_t first) 4910Sstevel@tonic-gate { 4921735Skcpoon sctp_faddr_t *faddr; 4931735Skcpoon mblk_t *timer_mp; 4940Sstevel@tonic-gate 4951676Sjpk if (is_system_labeled()) { 4961676Sjpk ts_label_t *tsl; 4971676Sjpk tsol_tpc_t *rhtp; 4981676Sjpk int retv; 4991676Sjpk 5001676Sjpk tsl = crgetlabel(CONN_CRED(sctp->sctp_connp)); 5011676Sjpk ASSERT(tsl != NULL); 5021676Sjpk 5031676Sjpk /* find_tpc automatically does the right thing with IPv4 */ 5041676Sjpk rhtp = find_tpc(addr, IPV6_VERSION, B_FALSE); 5051676Sjpk if (rhtp == NULL) 5061676Sjpk return (EACCES); 5070Sstevel@tonic-gate 5081676Sjpk retv = EACCES; 5091676Sjpk if (tsl->tsl_doi == rhtp->tpc_tp.tp_doi) { 5101676Sjpk switch (rhtp->tpc_tp.host_type) { 5111676Sjpk case UNLABELED: 5121676Sjpk /* 5131676Sjpk * Can talk to unlabeled hosts if any of the 5141676Sjpk * following are true: 5151676Sjpk * 1. zone's label matches the remote host's 5161676Sjpk * default label, 5171676Sjpk * 2. mac_exempt is on and the zone dominates 5181676Sjpk * the remote host's label, or 5191676Sjpk * 3. 
mac_exempt is on and the socket is from 5201676Sjpk * the global zone. 5211676Sjpk */ 5221676Sjpk if (blequal(&rhtp->tpc_tp.tp_def_label, 5231676Sjpk &tsl->tsl_label) || 5241676Sjpk (sctp->sctp_mac_exempt && 5251676Sjpk (sctp->sctp_zoneid == GLOBAL_ZONEID || 5261676Sjpk bldominates(&tsl->tsl_label, 5271676Sjpk &rhtp->tpc_tp.tp_def_label)))) 5281676Sjpk retv = 0; 5291676Sjpk break; 5301676Sjpk case SUN_CIPSO: 5311676Sjpk if (_blinrange(&tsl->tsl_label, 5321676Sjpk &rhtp->tpc_tp.tp_sl_range_cipso) || 5331676Sjpk blinlset(&tsl->tsl_label, 5341676Sjpk rhtp->tpc_tp.tp_sl_set_cipso)) 5351676Sjpk retv = 0; 5361676Sjpk break; 5371676Sjpk } 5381676Sjpk } 5391676Sjpk TPC_RELE(rhtp); 5401676Sjpk if (retv != 0) 5411676Sjpk return (retv); 5420Sstevel@tonic-gate } 5430Sstevel@tonic-gate 5441676Sjpk if ((faddr = kmem_cache_alloc(sctp_kmem_faddr_cache, sleep)) == NULL) 5451676Sjpk return (ENOMEM); 5464691Skcpoon timer_mp = sctp_timer_alloc((sctp), sctp_rexmit_timer, sleep); 5471735Skcpoon if (timer_mp == NULL) { 5481735Skcpoon kmem_cache_free(sctp_kmem_faddr_cache, faddr); 5491735Skcpoon return (ENOMEM); 5501735Skcpoon } 5511735Skcpoon ((sctpt_t *)(timer_mp->b_rptr))->sctpt_faddr = faddr; 5521676Sjpk 5531735Skcpoon sctp_init_faddr(sctp, faddr, addr, timer_mp); 5544818Skcpoon 5554818Skcpoon /* Check for subnet broadcast. 
*/ 5564818Skcpoon if (faddr->ire != NULL && faddr->ire->ire_type & IRE_BROADCAST) { 5574818Skcpoon IRE_REFRELE_NOTR(faddr->ire); 5584818Skcpoon sctp_timer_free(timer_mp); 5595240Snordmark faddr->timer_mp = NULL; 5604818Skcpoon kmem_cache_free(sctp_kmem_faddr_cache, faddr); 5614818Skcpoon return (EADDRNOTAVAIL); 5624818Skcpoon } 5630Sstevel@tonic-gate ASSERT(faddr->next == NULL); 5640Sstevel@tonic-gate 5651676Sjpk if (sctp->sctp_faddrs == NULL) { 5661676Sjpk ASSERT(sctp->sctp_lastfaddr == NULL); 5671676Sjpk /* only element on list; first and last are same */ 5681676Sjpk sctp->sctp_faddrs = sctp->sctp_lastfaddr = faddr; 5691676Sjpk } else if (first) { 5701676Sjpk ASSERT(sctp->sctp_lastfaddr != NULL); 5711676Sjpk faddr->next = sctp->sctp_faddrs; 5721676Sjpk sctp->sctp_faddrs = faddr; 5730Sstevel@tonic-gate } else { 5741676Sjpk sctp->sctp_lastfaddr->next = faddr; 5751676Sjpk sctp->sctp_lastfaddr = faddr; 5760Sstevel@tonic-gate } 577852Svi117747 sctp->sctp_nfaddrs++; 5780Sstevel@tonic-gate 5790Sstevel@tonic-gate return (0); 5800Sstevel@tonic-gate } 5810Sstevel@tonic-gate 5820Sstevel@tonic-gate sctp_faddr_t * 5830Sstevel@tonic-gate sctp_lookup_faddr(sctp_t *sctp, in6_addr_t *addr) 5840Sstevel@tonic-gate { 5850Sstevel@tonic-gate sctp_faddr_t *fp; 5860Sstevel@tonic-gate 5870Sstevel@tonic-gate for (fp = sctp->sctp_faddrs; fp != NULL; fp = fp->next) { 5880Sstevel@tonic-gate if (IN6_ARE_ADDR_EQUAL(&fp->faddr, addr)) 5890Sstevel@tonic-gate break; 5900Sstevel@tonic-gate } 5910Sstevel@tonic-gate 5920Sstevel@tonic-gate return (fp); 5930Sstevel@tonic-gate } 5940Sstevel@tonic-gate 5950Sstevel@tonic-gate sctp_faddr_t * 5960Sstevel@tonic-gate sctp_lookup_faddr_nosctp(sctp_faddr_t *fp, in6_addr_t *addr) 5970Sstevel@tonic-gate { 5980Sstevel@tonic-gate for (; fp; fp = fp->next) { 5990Sstevel@tonic-gate if (IN6_ARE_ADDR_EQUAL(&fp->faddr, addr)) { 6000Sstevel@tonic-gate break; 6010Sstevel@tonic-gate } 6020Sstevel@tonic-gate } 6030Sstevel@tonic-gate 6040Sstevel@tonic-gate return (fp); 
6050Sstevel@tonic-gate } 6060Sstevel@tonic-gate 6071735Skcpoon /* 6081735Skcpoon * To change the currently used peer address to the specified one. 6091735Skcpoon */ 6100Sstevel@tonic-gate void 6111735Skcpoon sctp_set_faddr_current(sctp_t *sctp, sctp_faddr_t *fp) 6120Sstevel@tonic-gate { 6131735Skcpoon /* Now setup the composite header. */ 6140Sstevel@tonic-gate if (fp->isv4) { 6150Sstevel@tonic-gate IN6_V4MAPPED_TO_IPADDR(&fp->faddr, 6160Sstevel@tonic-gate sctp->sctp_ipha->ipha_dst); 6170Sstevel@tonic-gate IN6_V4MAPPED_TO_IPADDR(&fp->saddr, sctp->sctp_ipha->ipha_src); 6180Sstevel@tonic-gate /* update don't fragment bit */ 6190Sstevel@tonic-gate if (fp->df) { 6200Sstevel@tonic-gate sctp->sctp_ipha->ipha_fragment_offset_and_flags = 6210Sstevel@tonic-gate htons(IPH_DF); 6220Sstevel@tonic-gate } else { 6230Sstevel@tonic-gate sctp->sctp_ipha->ipha_fragment_offset_and_flags = 0; 6240Sstevel@tonic-gate } 6250Sstevel@tonic-gate } else { 6260Sstevel@tonic-gate sctp->sctp_ip6h->ip6_dst = fp->faddr; 6270Sstevel@tonic-gate sctp->sctp_ip6h->ip6_src = fp->saddr; 6280Sstevel@tonic-gate } 6291735Skcpoon 6301735Skcpoon sctp->sctp_current = fp; 6311735Skcpoon sctp->sctp_mss = fp->sfa_pmss; 6321735Skcpoon 6331735Skcpoon /* Update the uppper layer for the change. 
*/ 6341735Skcpoon if (!SCTP_IS_DETACHED(sctp)) 6351735Skcpoon sctp_set_ulp_prop(sctp); 6360Sstevel@tonic-gate } 6370Sstevel@tonic-gate 6380Sstevel@tonic-gate void 6390Sstevel@tonic-gate sctp_redo_faddr_srcs(sctp_t *sctp) 6400Sstevel@tonic-gate { 6410Sstevel@tonic-gate sctp_faddr_t *fp; 6420Sstevel@tonic-gate 6430Sstevel@tonic-gate for (fp = sctp->sctp_faddrs; fp != NULL; fp = fp->next) { 6441735Skcpoon sctp_get_ire(sctp, fp); 6450Sstevel@tonic-gate } 6460Sstevel@tonic-gate } 6470Sstevel@tonic-gate 6480Sstevel@tonic-gate void 6490Sstevel@tonic-gate sctp_faddr_alive(sctp_t *sctp, sctp_faddr_t *fp) 6500Sstevel@tonic-gate { 6510Sstevel@tonic-gate int64_t now = lbolt64; 6520Sstevel@tonic-gate 6530Sstevel@tonic-gate fp->strikes = 0; 6540Sstevel@tonic-gate sctp->sctp_strikes = 0; 6550Sstevel@tonic-gate fp->lastactive = now; 6560Sstevel@tonic-gate fp->hb_expiry = now + SET_HB_INTVL(fp); 6570Sstevel@tonic-gate fp->hb_pending = B_FALSE; 6580Sstevel@tonic-gate if (fp->state != SCTP_FADDRS_ALIVE) { 6590Sstevel@tonic-gate fp->state = SCTP_FADDRS_ALIVE; 6600Sstevel@tonic-gate sctp_intf_event(sctp, fp->faddr, SCTP_ADDR_AVAILABLE, 0); 6614818Skcpoon /* Should have a full IRE now */ 6624818Skcpoon sctp_get_ire(sctp, fp); 6630Sstevel@tonic-gate 6641735Skcpoon /* 6651735Skcpoon * If this is the primary, switch back to it now. And 6661735Skcpoon * we probably want to reset the source addr used to reach 6671735Skcpoon * it. 
6681735Skcpoon */ 6690Sstevel@tonic-gate if (fp == sctp->sctp_primary) { 6704818Skcpoon ASSERT(fp->state != SCTP_FADDRS_UNREACH); 6711735Skcpoon sctp_set_faddr_current(sctp, fp); 6721735Skcpoon return; 6730Sstevel@tonic-gate } 6740Sstevel@tonic-gate } 6750Sstevel@tonic-gate } 6760Sstevel@tonic-gate 6770Sstevel@tonic-gate int 6780Sstevel@tonic-gate sctp_is_a_faddr_clean(sctp_t *sctp) 6790Sstevel@tonic-gate { 6800Sstevel@tonic-gate sctp_faddr_t *fp; 6810Sstevel@tonic-gate 6820Sstevel@tonic-gate for (fp = sctp->sctp_faddrs; fp; fp = fp->next) { 6830Sstevel@tonic-gate if (fp->state == SCTP_FADDRS_ALIVE && fp->strikes == 0) { 6840Sstevel@tonic-gate return (1); 6850Sstevel@tonic-gate } 6860Sstevel@tonic-gate } 6870Sstevel@tonic-gate 6880Sstevel@tonic-gate return (0); 6890Sstevel@tonic-gate } 6900Sstevel@tonic-gate 6910Sstevel@tonic-gate /* 6920Sstevel@tonic-gate * Returns 0 if there is at leave one other active faddr, -1 if there 6930Sstevel@tonic-gate * are none. If there are none left, faddr_dead() will start killing the 6940Sstevel@tonic-gate * association. 6950Sstevel@tonic-gate * If the downed faddr was the current faddr, a new current faddr 6960Sstevel@tonic-gate * will be chosen. 
6970Sstevel@tonic-gate */ 6980Sstevel@tonic-gate int 6990Sstevel@tonic-gate sctp_faddr_dead(sctp_t *sctp, sctp_faddr_t *fp, int newstate) 7000Sstevel@tonic-gate { 7010Sstevel@tonic-gate sctp_faddr_t *ofp; 7023448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 7030Sstevel@tonic-gate 7040Sstevel@tonic-gate if (fp->state == SCTP_FADDRS_ALIVE) { 7050Sstevel@tonic-gate sctp_intf_event(sctp, fp->faddr, SCTP_ADDR_UNREACHABLE, 0); 7060Sstevel@tonic-gate } 7070Sstevel@tonic-gate fp->state = newstate; 7080Sstevel@tonic-gate 7090Sstevel@tonic-gate dprint(1, ("sctp_faddr_dead: %x:%x:%x:%x down (state=%d)\n", 7100Sstevel@tonic-gate SCTP_PRINTADDR(fp->faddr), newstate)); 7110Sstevel@tonic-gate 7120Sstevel@tonic-gate if (fp == sctp->sctp_current) { 7130Sstevel@tonic-gate /* Current faddr down; need to switch it */ 7140Sstevel@tonic-gate sctp->sctp_current = NULL; 7150Sstevel@tonic-gate } 7160Sstevel@tonic-gate 7170Sstevel@tonic-gate /* Find next alive faddr */ 7180Sstevel@tonic-gate ofp = fp; 7191735Skcpoon for (fp = fp->next; fp != NULL; fp = fp->next) { 7200Sstevel@tonic-gate if (fp->state == SCTP_FADDRS_ALIVE) { 7210Sstevel@tonic-gate break; 7220Sstevel@tonic-gate } 7230Sstevel@tonic-gate } 7240Sstevel@tonic-gate 7250Sstevel@tonic-gate if (fp == NULL) { 7260Sstevel@tonic-gate /* Continue from beginning of list */ 7270Sstevel@tonic-gate for (fp = sctp->sctp_faddrs; fp != ofp; fp = fp->next) { 7280Sstevel@tonic-gate if (fp->state == SCTP_FADDRS_ALIVE) { 7290Sstevel@tonic-gate break; 7300Sstevel@tonic-gate } 7310Sstevel@tonic-gate } 7320Sstevel@tonic-gate } 7330Sstevel@tonic-gate 7341735Skcpoon /* 7351735Skcpoon * Find a new fp, so if the current faddr is dead, use the new fp 7361735Skcpoon * as the current one. 
7371735Skcpoon */ 7380Sstevel@tonic-gate if (fp != ofp) { 7390Sstevel@tonic-gate if (sctp->sctp_current == NULL) { 7400Sstevel@tonic-gate dprint(1, ("sctp_faddr_dead: failover->%x:%x:%x:%x\n", 7410Sstevel@tonic-gate SCTP_PRINTADDR(fp->faddr))); 7421735Skcpoon /* 7431735Skcpoon * Note that we don't need to reset the source addr 7441735Skcpoon * of the new fp. 7451735Skcpoon */ 7461735Skcpoon sctp_set_faddr_current(sctp, fp); 7470Sstevel@tonic-gate } 7480Sstevel@tonic-gate return (0); 7490Sstevel@tonic-gate } 7500Sstevel@tonic-gate 7510Sstevel@tonic-gate 7520Sstevel@tonic-gate /* All faddrs are down; kill the association */ 7530Sstevel@tonic-gate dprint(1, ("sctp_faddr_dead: all faddrs down, killing assoc\n")); 7543448Sdh155122 BUMP_MIB(&sctps->sctps_mib, sctpAborted); 7550Sstevel@tonic-gate sctp_assoc_event(sctp, sctp->sctp_state < SCTPS_ESTABLISHED ? 7560Sstevel@tonic-gate SCTP_CANT_STR_ASSOC : SCTP_COMM_LOST, 0, NULL); 7570Sstevel@tonic-gate sctp_clean_death(sctp, sctp->sctp_client_errno ? 
7580Sstevel@tonic-gate sctp->sctp_client_errno : ETIMEDOUT); 7590Sstevel@tonic-gate 7600Sstevel@tonic-gate return (-1); 7610Sstevel@tonic-gate } 7620Sstevel@tonic-gate 7630Sstevel@tonic-gate sctp_faddr_t * 7640Sstevel@tonic-gate sctp_rotate_faddr(sctp_t *sctp, sctp_faddr_t *ofp) 7650Sstevel@tonic-gate { 7660Sstevel@tonic-gate sctp_faddr_t *nfp = NULL; 7670Sstevel@tonic-gate 7680Sstevel@tonic-gate if (ofp == NULL) { 7690Sstevel@tonic-gate ofp = sctp->sctp_current; 7700Sstevel@tonic-gate } 7710Sstevel@tonic-gate 7720Sstevel@tonic-gate /* Find the next live one */ 7730Sstevel@tonic-gate for (nfp = ofp->next; nfp != NULL; nfp = nfp->next) { 7740Sstevel@tonic-gate if (nfp->state == SCTP_FADDRS_ALIVE) { 7750Sstevel@tonic-gate break; 7760Sstevel@tonic-gate } 7770Sstevel@tonic-gate } 7780Sstevel@tonic-gate 7790Sstevel@tonic-gate if (nfp == NULL) { 7800Sstevel@tonic-gate /* Continue from beginning of list */ 7810Sstevel@tonic-gate for (nfp = sctp->sctp_faddrs; nfp != ofp; nfp = nfp->next) { 7820Sstevel@tonic-gate if (nfp->state == SCTP_FADDRS_ALIVE) { 7830Sstevel@tonic-gate break; 7840Sstevel@tonic-gate } 7850Sstevel@tonic-gate } 7860Sstevel@tonic-gate } 7870Sstevel@tonic-gate 7880Sstevel@tonic-gate /* 7890Sstevel@tonic-gate * nfp could only be NULL if all faddrs are down, and when 7900Sstevel@tonic-gate * this happens, faddr_dead() should have killed the 7910Sstevel@tonic-gate * association. Hence this assertion... 
7920Sstevel@tonic-gate */ 7930Sstevel@tonic-gate ASSERT(nfp != NULL); 7940Sstevel@tonic-gate return (nfp); 7950Sstevel@tonic-gate } 7960Sstevel@tonic-gate 7970Sstevel@tonic-gate void 7980Sstevel@tonic-gate sctp_unlink_faddr(sctp_t *sctp, sctp_faddr_t *fp) 7990Sstevel@tonic-gate { 8000Sstevel@tonic-gate sctp_faddr_t *fpp; 8010Sstevel@tonic-gate 8020Sstevel@tonic-gate if (!sctp->sctp_faddrs) { 8030Sstevel@tonic-gate return; 8040Sstevel@tonic-gate } 8050Sstevel@tonic-gate 8060Sstevel@tonic-gate if (fp->timer_mp != NULL) { 8070Sstevel@tonic-gate sctp_timer_free(fp->timer_mp); 8080Sstevel@tonic-gate fp->timer_mp = NULL; 8090Sstevel@tonic-gate fp->timer_running = 0; 8100Sstevel@tonic-gate } 8110Sstevel@tonic-gate if (fp->rc_timer_mp != NULL) { 8120Sstevel@tonic-gate sctp_timer_free(fp->rc_timer_mp); 8130Sstevel@tonic-gate fp->rc_timer_mp = NULL; 8140Sstevel@tonic-gate fp->rc_timer_running = 0; 8150Sstevel@tonic-gate } 8160Sstevel@tonic-gate if (fp->ire != NULL) { 8170Sstevel@tonic-gate IRE_REFRELE_NOTR(fp->ire); 8180Sstevel@tonic-gate fp->ire = NULL; 8190Sstevel@tonic-gate } 8200Sstevel@tonic-gate 8210Sstevel@tonic-gate if (fp == sctp->sctp_faddrs) { 8220Sstevel@tonic-gate goto gotit; 8230Sstevel@tonic-gate } 8240Sstevel@tonic-gate 8250Sstevel@tonic-gate for (fpp = sctp->sctp_faddrs; fpp->next != fp; fpp = fpp->next) 8260Sstevel@tonic-gate ; 8270Sstevel@tonic-gate 8280Sstevel@tonic-gate gotit: 8290Sstevel@tonic-gate ASSERT(sctp->sctp_conn_tfp != NULL); 8300Sstevel@tonic-gate mutex_enter(&sctp->sctp_conn_tfp->tf_lock); 8310Sstevel@tonic-gate if (fp == sctp->sctp_faddrs) { 8320Sstevel@tonic-gate sctp->sctp_faddrs = fp->next; 8330Sstevel@tonic-gate } else { 8340Sstevel@tonic-gate fpp->next = fp->next; 8350Sstevel@tonic-gate } 8360Sstevel@tonic-gate mutex_exit(&sctp->sctp_conn_tfp->tf_lock); 8370Sstevel@tonic-gate /* XXX faddr2ire? 
*/ 8380Sstevel@tonic-gate kmem_cache_free(sctp_kmem_faddr_cache, fp); 839852Svi117747 sctp->sctp_nfaddrs--; 8400Sstevel@tonic-gate } 8410Sstevel@tonic-gate 8420Sstevel@tonic-gate void 8430Sstevel@tonic-gate sctp_zap_faddrs(sctp_t *sctp, int caller_holds_lock) 8440Sstevel@tonic-gate { 8450Sstevel@tonic-gate sctp_faddr_t *fp, *fpn; 8460Sstevel@tonic-gate 8470Sstevel@tonic-gate if (sctp->sctp_faddrs == NULL) { 8480Sstevel@tonic-gate ASSERT(sctp->sctp_lastfaddr == NULL); 8490Sstevel@tonic-gate return; 8500Sstevel@tonic-gate } 8510Sstevel@tonic-gate 8520Sstevel@tonic-gate ASSERT(sctp->sctp_lastfaddr != NULL); 8530Sstevel@tonic-gate sctp->sctp_lastfaddr = NULL; 8540Sstevel@tonic-gate sctp->sctp_current = NULL; 8550Sstevel@tonic-gate sctp->sctp_primary = NULL; 8560Sstevel@tonic-gate 8570Sstevel@tonic-gate sctp_free_faddr_timers(sctp); 8580Sstevel@tonic-gate 8590Sstevel@tonic-gate if (sctp->sctp_conn_tfp != NULL && !caller_holds_lock) { 8600Sstevel@tonic-gate /* in conn fanout; need to hold lock */ 8610Sstevel@tonic-gate mutex_enter(&sctp->sctp_conn_tfp->tf_lock); 8620Sstevel@tonic-gate } 8630Sstevel@tonic-gate 8640Sstevel@tonic-gate for (fp = sctp->sctp_faddrs; fp; fp = fpn) { 8650Sstevel@tonic-gate fpn = fp->next; 8660Sstevel@tonic-gate if (fp->ire != NULL) 8670Sstevel@tonic-gate IRE_REFRELE_NOTR(fp->ire); 8680Sstevel@tonic-gate kmem_cache_free(sctp_kmem_faddr_cache, fp); 869852Svi117747 sctp->sctp_nfaddrs--; 8700Sstevel@tonic-gate } 8710Sstevel@tonic-gate 8720Sstevel@tonic-gate sctp->sctp_faddrs = NULL; 873852Svi117747 ASSERT(sctp->sctp_nfaddrs == 0); 8740Sstevel@tonic-gate if (sctp->sctp_conn_tfp != NULL && !caller_holds_lock) { 8750Sstevel@tonic-gate mutex_exit(&sctp->sctp_conn_tfp->tf_lock); 8760Sstevel@tonic-gate } 8770Sstevel@tonic-gate 8780Sstevel@tonic-gate } 8790Sstevel@tonic-gate 8800Sstevel@tonic-gate void 8810Sstevel@tonic-gate sctp_zap_addrs(sctp_t *sctp) 8820Sstevel@tonic-gate { 8830Sstevel@tonic-gate sctp_zap_faddrs(sctp, 0); 8840Sstevel@tonic-gate 
sctp_free_saddrs(sctp); 8850Sstevel@tonic-gate } 8860Sstevel@tonic-gate 8870Sstevel@tonic-gate /* 8880Sstevel@tonic-gate * Initialize the IPv4 header. Loses any record of any IP options. 8890Sstevel@tonic-gate */ 8900Sstevel@tonic-gate int 8910Sstevel@tonic-gate sctp_header_init_ipv4(sctp_t *sctp, int sleep) 8920Sstevel@tonic-gate { 8930Sstevel@tonic-gate sctp_hdr_t *sctph; 8943448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 8950Sstevel@tonic-gate 8960Sstevel@tonic-gate /* 8970Sstevel@tonic-gate * This is a simple initialization. If there's 8980Sstevel@tonic-gate * already a template, it should never be too small, 8990Sstevel@tonic-gate * so reuse it. Otherwise, allocate space for the new one. 9000Sstevel@tonic-gate */ 9010Sstevel@tonic-gate if (sctp->sctp_iphc != NULL) { 9020Sstevel@tonic-gate ASSERT(sctp->sctp_iphc_len >= SCTP_MAX_COMBINED_HEADER_LENGTH); 9030Sstevel@tonic-gate bzero(sctp->sctp_iphc, sctp->sctp_iphc_len); 9040Sstevel@tonic-gate } else { 9050Sstevel@tonic-gate sctp->sctp_iphc_len = SCTP_MAX_COMBINED_HEADER_LENGTH; 9060Sstevel@tonic-gate sctp->sctp_iphc = kmem_zalloc(sctp->sctp_iphc_len, sleep); 9070Sstevel@tonic-gate if (sctp->sctp_iphc == NULL) { 9080Sstevel@tonic-gate sctp->sctp_iphc_len = 0; 9090Sstevel@tonic-gate return (ENOMEM); 9100Sstevel@tonic-gate } 9110Sstevel@tonic-gate } 9120Sstevel@tonic-gate 9130Sstevel@tonic-gate sctp->sctp_ipha = (ipha_t *)sctp->sctp_iphc; 9140Sstevel@tonic-gate 9150Sstevel@tonic-gate sctp->sctp_hdr_len = sizeof (ipha_t) + sizeof (sctp_hdr_t); 9160Sstevel@tonic-gate sctp->sctp_ip_hdr_len = sizeof (ipha_t); 9170Sstevel@tonic-gate sctp->sctp_ipha->ipha_length = htons(sizeof (ipha_t) + 9180Sstevel@tonic-gate sizeof (sctp_hdr_t)); 9194691Skcpoon sctp->sctp_ipha->ipha_version_and_hdr_length = 9204691Skcpoon (IP_VERSION << 4) | IP_SIMPLE_HDR_LENGTH_IN_WORDS; 9210Sstevel@tonic-gate 9220Sstevel@tonic-gate /* 9230Sstevel@tonic-gate * These two fields should be zero, and are already set above. 
9240Sstevel@tonic-gate * 9250Sstevel@tonic-gate * sctp->sctp_ipha->ipha_ident, 9260Sstevel@tonic-gate * sctp->sctp_ipha->ipha_fragment_offset_and_flags. 9270Sstevel@tonic-gate */ 9280Sstevel@tonic-gate 9293448Sdh155122 sctp->sctp_ipha->ipha_ttl = sctps->sctps_ipv4_ttl; 9300Sstevel@tonic-gate sctp->sctp_ipha->ipha_protocol = IPPROTO_SCTP; 9310Sstevel@tonic-gate 9320Sstevel@tonic-gate sctph = (sctp_hdr_t *)(sctp->sctp_iphc + sizeof (ipha_t)); 9330Sstevel@tonic-gate sctp->sctp_sctph = sctph; 9340Sstevel@tonic-gate 9350Sstevel@tonic-gate return (0); 9360Sstevel@tonic-gate } 9370Sstevel@tonic-gate 9380Sstevel@tonic-gate /* 9390Sstevel@tonic-gate * Update sctp_sticky_hdrs based on sctp_sticky_ipp. 9400Sstevel@tonic-gate * The headers include ip6i_t (if needed), ip6_t, any sticky extension 9410Sstevel@tonic-gate * headers, and the maximum size sctp header (to avoid reallocation 9420Sstevel@tonic-gate * on the fly for additional sctp options). 9430Sstevel@tonic-gate * Returns failure if can't allocate memory. 
9440Sstevel@tonic-gate */ 9450Sstevel@tonic-gate int 9460Sstevel@tonic-gate sctp_build_hdrs(sctp_t *sctp) 9470Sstevel@tonic-gate { 9480Sstevel@tonic-gate char *hdrs; 9490Sstevel@tonic-gate uint_t hdrs_len; 9500Sstevel@tonic-gate ip6i_t *ip6i; 9510Sstevel@tonic-gate char buf[SCTP_MAX_HDR_LENGTH]; 9520Sstevel@tonic-gate ip6_pkt_t *ipp = &sctp->sctp_sticky_ipp; 9530Sstevel@tonic-gate in6_addr_t src; 9540Sstevel@tonic-gate in6_addr_t dst; 9553448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 9561676Sjpk 9570Sstevel@tonic-gate /* 9580Sstevel@tonic-gate * save the existing sctp header and source/dest IP addresses 9590Sstevel@tonic-gate */ 9600Sstevel@tonic-gate bcopy(sctp->sctp_sctph6, buf, sizeof (sctp_hdr_t)); 9610Sstevel@tonic-gate src = sctp->sctp_ip6h->ip6_src; 9620Sstevel@tonic-gate dst = sctp->sctp_ip6h->ip6_dst; 9630Sstevel@tonic-gate hdrs_len = ip_total_hdrs_len_v6(ipp) + SCTP_MAX_HDR_LENGTH; 9640Sstevel@tonic-gate ASSERT(hdrs_len != 0); 9650Sstevel@tonic-gate if (hdrs_len > sctp->sctp_iphc6_len) { 9660Sstevel@tonic-gate /* Need to reallocate */ 9670Sstevel@tonic-gate hdrs = kmem_zalloc(hdrs_len, KM_NOSLEEP); 9680Sstevel@tonic-gate if (hdrs == NULL) 9690Sstevel@tonic-gate return (ENOMEM); 9700Sstevel@tonic-gate 9710Sstevel@tonic-gate if (sctp->sctp_iphc6_len != 0) 9720Sstevel@tonic-gate kmem_free(sctp->sctp_iphc6, sctp->sctp_iphc6_len); 9730Sstevel@tonic-gate sctp->sctp_iphc6 = hdrs; 9740Sstevel@tonic-gate sctp->sctp_iphc6_len = hdrs_len; 9750Sstevel@tonic-gate } 9760Sstevel@tonic-gate ip_build_hdrs_v6((uchar_t *)sctp->sctp_iphc6, 9770Sstevel@tonic-gate hdrs_len - SCTP_MAX_HDR_LENGTH, ipp, IPPROTO_SCTP); 9780Sstevel@tonic-gate 9790Sstevel@tonic-gate /* Set header fields not in ipp */ 9800Sstevel@tonic-gate if (ipp->ipp_fields & IPPF_HAS_IP6I) { 9810Sstevel@tonic-gate ip6i = (ip6i_t *)sctp->sctp_iphc6; 9820Sstevel@tonic-gate sctp->sctp_ip6h = (ip6_t *)&ip6i[1]; 9830Sstevel@tonic-gate } else { 9840Sstevel@tonic-gate sctp->sctp_ip6h = (ip6_t *)sctp->sctp_iphc6; 
9850Sstevel@tonic-gate } 9860Sstevel@tonic-gate /* 9870Sstevel@tonic-gate * sctp->sctp_ip_hdr_len will include ip6i_t if there is one. 9880Sstevel@tonic-gate */ 9890Sstevel@tonic-gate sctp->sctp_ip_hdr6_len = hdrs_len - SCTP_MAX_HDR_LENGTH; 9900Sstevel@tonic-gate sctp->sctp_sctph6 = (sctp_hdr_t *)(sctp->sctp_iphc6 + 9910Sstevel@tonic-gate sctp->sctp_ip_hdr6_len); 9920Sstevel@tonic-gate sctp->sctp_hdr6_len = sctp->sctp_ip_hdr6_len + sizeof (sctp_hdr_t); 9930Sstevel@tonic-gate 9940Sstevel@tonic-gate bcopy(buf, sctp->sctp_sctph6, sizeof (sctp_hdr_t)); 9950Sstevel@tonic-gate 9960Sstevel@tonic-gate sctp->sctp_ip6h->ip6_src = src; 9970Sstevel@tonic-gate sctp->sctp_ip6h->ip6_dst = dst; 9980Sstevel@tonic-gate /* 999679Sseb * If the hoplimit was not set by ip_build_hdrs_v6(), we need to 1000679Sseb * set it to the default value for SCTP. 10010Sstevel@tonic-gate */ 1002679Sseb if (!(ipp->ipp_fields & IPPF_UNICAST_HOPS)) 10033448Sdh155122 sctp->sctp_ip6h->ip6_hops = sctps->sctps_ipv6_hoplimit; 10040Sstevel@tonic-gate /* 10050Sstevel@tonic-gate * If we're setting extension headers after a connection 10060Sstevel@tonic-gate * has been established, and if we have a routing header 10070Sstevel@tonic-gate * among the extension headers, call ip_massage_options_v6 to 10080Sstevel@tonic-gate * manipulate the routing header/ip6_dst set the checksum 10090Sstevel@tonic-gate * difference in the sctp header template. 10100Sstevel@tonic-gate * (This happens in sctp_connect_ipv6 if the routing header 10110Sstevel@tonic-gate * is set prior to the connect.) 
10120Sstevel@tonic-gate */ 10130Sstevel@tonic-gate 10140Sstevel@tonic-gate if ((sctp->sctp_state >= SCTPS_COOKIE_WAIT) && 10150Sstevel@tonic-gate (sctp->sctp_sticky_ipp.ipp_fields & IPPF_RTHDR)) { 10160Sstevel@tonic-gate ip6_rthdr_t *rth; 10170Sstevel@tonic-gate 10180Sstevel@tonic-gate rth = ip_find_rthdr_v6(sctp->sctp_ip6h, 10190Sstevel@tonic-gate (uint8_t *)sctp->sctp_sctph6); 10203448Sdh155122 if (rth != NULL) { 10213448Sdh155122 (void) ip_massage_options_v6(sctp->sctp_ip6h, rth, 10223448Sdh155122 sctps->sctps_netstack); 10233448Sdh155122 } 10240Sstevel@tonic-gate } 10250Sstevel@tonic-gate return (0); 10260Sstevel@tonic-gate } 10270Sstevel@tonic-gate 10280Sstevel@tonic-gate /* 10290Sstevel@tonic-gate * Initialize the IPv6 header. Loses any record of any IPv6 extension headers. 10300Sstevel@tonic-gate */ 10310Sstevel@tonic-gate int 10320Sstevel@tonic-gate sctp_header_init_ipv6(sctp_t *sctp, int sleep) 10330Sstevel@tonic-gate { 10340Sstevel@tonic-gate sctp_hdr_t *sctph; 10353448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 10360Sstevel@tonic-gate 10370Sstevel@tonic-gate /* 10380Sstevel@tonic-gate * This is a simple initialization. If there's 10390Sstevel@tonic-gate * already a template, it should never be too small, 10400Sstevel@tonic-gate * so reuse it. Otherwise, allocate space for the new one. 10410Sstevel@tonic-gate * Ensure that there is enough space to "downgrade" the sctp_t 10420Sstevel@tonic-gate * to an IPv4 sctp_t. 
This requires having space for a full load 10430Sstevel@tonic-gate * of IPv4 options 10440Sstevel@tonic-gate */ 10450Sstevel@tonic-gate if (sctp->sctp_iphc6 != NULL) { 10460Sstevel@tonic-gate ASSERT(sctp->sctp_iphc6_len >= 10470Sstevel@tonic-gate SCTP_MAX_COMBINED_HEADER_LENGTH); 10480Sstevel@tonic-gate bzero(sctp->sctp_iphc6, sctp->sctp_iphc6_len); 10490Sstevel@tonic-gate } else { 10500Sstevel@tonic-gate sctp->sctp_iphc6_len = SCTP_MAX_COMBINED_HEADER_LENGTH; 10510Sstevel@tonic-gate sctp->sctp_iphc6 = kmem_zalloc(sctp->sctp_iphc_len, sleep); 10520Sstevel@tonic-gate if (sctp->sctp_iphc6 == NULL) { 10530Sstevel@tonic-gate sctp->sctp_iphc6_len = 0; 10540Sstevel@tonic-gate return (ENOMEM); 10550Sstevel@tonic-gate } 10560Sstevel@tonic-gate } 10570Sstevel@tonic-gate sctp->sctp_hdr6_len = IPV6_HDR_LEN + sizeof (sctp_hdr_t); 10580Sstevel@tonic-gate sctp->sctp_ip_hdr6_len = IPV6_HDR_LEN; 10590Sstevel@tonic-gate sctp->sctp_ip6h = (ip6_t *)sctp->sctp_iphc6; 10600Sstevel@tonic-gate 10610Sstevel@tonic-gate /* Initialize the header template */ 10620Sstevel@tonic-gate 10630Sstevel@tonic-gate sctp->sctp_ip6h->ip6_vcf = IPV6_DEFAULT_VERS_AND_FLOW; 10640Sstevel@tonic-gate sctp->sctp_ip6h->ip6_plen = ntohs(sizeof (sctp_hdr_t)); 10650Sstevel@tonic-gate sctp->sctp_ip6h->ip6_nxt = IPPROTO_SCTP; 10663448Sdh155122 sctp->sctp_ip6h->ip6_hops = sctps->sctps_ipv6_hoplimit; 10670Sstevel@tonic-gate 10680Sstevel@tonic-gate sctph = (sctp_hdr_t *)(sctp->sctp_iphc6 + IPV6_HDR_LEN); 10690Sstevel@tonic-gate sctp->sctp_sctph6 = sctph; 10700Sstevel@tonic-gate 10710Sstevel@tonic-gate return (0); 10720Sstevel@tonic-gate } 10730Sstevel@tonic-gate 10741676Sjpk static int 10751676Sjpk sctp_v4_label(sctp_t *sctp) 10761676Sjpk { 10771676Sjpk uchar_t optbuf[IP_MAX_OPT_LENGTH]; 10781676Sjpk const cred_t *cr = CONN_CRED(sctp->sctp_connp); 10791676Sjpk int added; 10801676Sjpk 10811676Sjpk if (tsol_compute_label(cr, sctp->sctp_ipha->ipha_dst, optbuf, 10823448Sdh155122 sctp->sctp_mac_exempt, 10833448Sdh155122 
sctp->sctp_sctps->sctps_netstack->netstack_ip) != 0) 10841676Sjpk return (EACCES); 10851676Sjpk 10861676Sjpk added = tsol_remove_secopt(sctp->sctp_ipha, sctp->sctp_hdr_len); 10871676Sjpk if (added == -1) 10881676Sjpk return (EACCES); 10891676Sjpk sctp->sctp_hdr_len += added; 10901676Sjpk sctp->sctp_sctph = (sctp_hdr_t *)((uchar_t *)sctp->sctp_sctph + added); 10911676Sjpk sctp->sctp_ip_hdr_len += added; 10921676Sjpk if ((sctp->sctp_v4label_len = optbuf[IPOPT_OLEN]) != 0) { 10931676Sjpk sctp->sctp_v4label_len = (sctp->sctp_v4label_len + 3) & ~3; 10941676Sjpk added = tsol_prepend_option(optbuf, sctp->sctp_ipha, 10951676Sjpk sctp->sctp_hdr_len); 10961676Sjpk if (added == -1) 10971676Sjpk return (EACCES); 10981676Sjpk sctp->sctp_hdr_len += added; 10991676Sjpk sctp->sctp_sctph = (sctp_hdr_t *)((uchar_t *)sctp->sctp_sctph + 11001676Sjpk added); 11011676Sjpk sctp->sctp_ip_hdr_len += added; 11021676Sjpk } 11031676Sjpk return (0); 11041676Sjpk } 11051676Sjpk 11061676Sjpk static int 11071676Sjpk sctp_v6_label(sctp_t *sctp) 11081676Sjpk { 11091676Sjpk uchar_t optbuf[TSOL_MAX_IPV6_OPTION]; 11101676Sjpk const cred_t *cr = CONN_CRED(sctp->sctp_connp); 11111676Sjpk 11121676Sjpk if (tsol_compute_label_v6(cr, &sctp->sctp_ip6h->ip6_dst, optbuf, 11133448Sdh155122 sctp->sctp_mac_exempt, 11143448Sdh155122 sctp->sctp_sctps->sctps_netstack->netstack_ip) != 0) 11151676Sjpk return (EACCES); 11161676Sjpk if (tsol_update_sticky(&sctp->sctp_sticky_ipp, &sctp->sctp_v6label_len, 11171676Sjpk optbuf) != 0) 11181676Sjpk return (EACCES); 11191676Sjpk if (sctp_build_hdrs(sctp) != 0) 11201676Sjpk return (EACCES); 11211676Sjpk return (0); 11221676Sjpk } 11231676Sjpk 11240Sstevel@tonic-gate /* 11250Sstevel@tonic-gate * XXX implement more sophisticated logic 11260Sstevel@tonic-gate */ 11271676Sjpk int 11281735Skcpoon sctp_set_hdraddrs(sctp_t *sctp) 11290Sstevel@tonic-gate { 11300Sstevel@tonic-gate sctp_faddr_t *fp; 11310Sstevel@tonic-gate int gotv4 = 0; 11320Sstevel@tonic-gate int gotv6 = 0; 
11330Sstevel@tonic-gate 11340Sstevel@tonic-gate ASSERT(sctp->sctp_faddrs != NULL); 11350Sstevel@tonic-gate ASSERT(sctp->sctp_nsaddrs > 0); 11360Sstevel@tonic-gate 11370Sstevel@tonic-gate /* Set up using the primary first */ 11380Sstevel@tonic-gate if (IN6_IS_ADDR_V4MAPPED(&sctp->sctp_primary->faddr)) { 11390Sstevel@tonic-gate IN6_V4MAPPED_TO_IPADDR(&sctp->sctp_primary->faddr, 11400Sstevel@tonic-gate sctp->sctp_ipha->ipha_dst); 11410Sstevel@tonic-gate /* saddr may be unspec; make_mp() will handle this */ 11420Sstevel@tonic-gate IN6_V4MAPPED_TO_IPADDR(&sctp->sctp_primary->saddr, 11430Sstevel@tonic-gate sctp->sctp_ipha->ipha_src); 11441676Sjpk if (!is_system_labeled() || sctp_v4_label(sctp) == 0) { 11451676Sjpk gotv4 = 1; 11461676Sjpk if (sctp->sctp_ipversion == IPV4_VERSION) { 11471676Sjpk goto copyports; 11481676Sjpk } 11490Sstevel@tonic-gate } 11500Sstevel@tonic-gate } else { 11510Sstevel@tonic-gate sctp->sctp_ip6h->ip6_dst = sctp->sctp_primary->faddr; 11520Sstevel@tonic-gate /* saddr may be unspec; make_mp() will handle this */ 11530Sstevel@tonic-gate sctp->sctp_ip6h->ip6_src = sctp->sctp_primary->saddr; 11541676Sjpk if (!is_system_labeled() || sctp_v6_label(sctp) == 0) 11551676Sjpk gotv6 = 1; 11560Sstevel@tonic-gate } 11570Sstevel@tonic-gate 11580Sstevel@tonic-gate for (fp = sctp->sctp_faddrs; fp; fp = fp->next) { 11590Sstevel@tonic-gate if (!gotv4 && IN6_IS_ADDR_V4MAPPED(&fp->faddr)) { 11600Sstevel@tonic-gate IN6_V4MAPPED_TO_IPADDR(&fp->faddr, 11610Sstevel@tonic-gate sctp->sctp_ipha->ipha_dst); 11620Sstevel@tonic-gate /* copy in the faddr_t's saddr */ 11630Sstevel@tonic-gate IN6_V4MAPPED_TO_IPADDR(&fp->saddr, 11640Sstevel@tonic-gate sctp->sctp_ipha->ipha_src); 11651676Sjpk if (!is_system_labeled() || sctp_v4_label(sctp) == 0) { 11661676Sjpk gotv4 = 1; 11671676Sjpk if (sctp->sctp_ipversion == IPV4_VERSION || 11681676Sjpk gotv6) { 11691676Sjpk break; 11701676Sjpk } 11710Sstevel@tonic-gate } 11722283Skp158701 } else if (!gotv6 && !IN6_IS_ADDR_V4MAPPED(&fp->faddr)) 
{ 11730Sstevel@tonic-gate sctp->sctp_ip6h->ip6_dst = fp->faddr; 11740Sstevel@tonic-gate /* copy in the faddr_t's saddr */ 11750Sstevel@tonic-gate sctp->sctp_ip6h->ip6_src = fp->saddr; 11761676Sjpk if (!is_system_labeled() || sctp_v6_label(sctp) == 0) { 11771676Sjpk gotv6 = 1; 11781676Sjpk if (gotv4) 11791676Sjpk break; 11800Sstevel@tonic-gate } 11810Sstevel@tonic-gate } 11820Sstevel@tonic-gate } 11830Sstevel@tonic-gate 11840Sstevel@tonic-gate copyports: 11851676Sjpk if (!gotv4 && !gotv6) 11861676Sjpk return (EACCES); 11871676Sjpk 11880Sstevel@tonic-gate /* copy in the ports for good measure */ 11890Sstevel@tonic-gate sctp->sctp_sctph->sh_sport = sctp->sctp_lport; 11900Sstevel@tonic-gate sctp->sctp_sctph->sh_dport = sctp->sctp_fport; 11910Sstevel@tonic-gate 11920Sstevel@tonic-gate sctp->sctp_sctph6->sh_sport = sctp->sctp_lport; 11930Sstevel@tonic-gate sctp->sctp_sctph6->sh_dport = sctp->sctp_fport; 11941676Sjpk return (0); 11950Sstevel@tonic-gate } 11960Sstevel@tonic-gate 11970Sstevel@tonic-gate void 11980Sstevel@tonic-gate sctp_add_unrec_parm(sctp_parm_hdr_t *uph, mblk_t **errmp) 11990Sstevel@tonic-gate { 12000Sstevel@tonic-gate mblk_t *mp; 12010Sstevel@tonic-gate sctp_parm_hdr_t *ph; 12020Sstevel@tonic-gate size_t len; 12030Sstevel@tonic-gate int pad; 1204*8153SGeorge.Shepherd@Sun.COM sctp_chunk_hdr_t *ecp; 12050Sstevel@tonic-gate 12060Sstevel@tonic-gate len = sizeof (*ph) + ntohs(uph->sph_len); 1207*8153SGeorge.Shepherd@Sun.COM if ((pad = len % SCTP_ALIGN) != 0) { 1208*8153SGeorge.Shepherd@Sun.COM pad = SCTP_ALIGN - pad; 12090Sstevel@tonic-gate len += pad; 12100Sstevel@tonic-gate } 12110Sstevel@tonic-gate mp = allocb(len, BPRI_MED); 12120Sstevel@tonic-gate if (mp == NULL) { 12130Sstevel@tonic-gate return; 12140Sstevel@tonic-gate } 12150Sstevel@tonic-gate 12160Sstevel@tonic-gate ph = (sctp_parm_hdr_t *)(mp->b_rptr); 12170Sstevel@tonic-gate ph->sph_type = htons(PARM_UNRECOGNIZED); 12180Sstevel@tonic-gate ph->sph_len = htons(len - pad); 12190Sstevel@tonic-gate 
12200Sstevel@tonic-gate /* copy in the unrecognized parameter */ 12210Sstevel@tonic-gate bcopy(uph, ph + 1, ntohs(uph->sph_len)); 12220Sstevel@tonic-gate 1223*8153SGeorge.Shepherd@Sun.COM if (pad != 0) 1224*8153SGeorge.Shepherd@Sun.COM bzero((mp->b_rptr + len - pad), pad); 1225*8153SGeorge.Shepherd@Sun.COM 12260Sstevel@tonic-gate mp->b_wptr = mp->b_rptr + len; 12270Sstevel@tonic-gate if (*errmp != NULL) { 1228*8153SGeorge.Shepherd@Sun.COM /* 1229*8153SGeorge.Shepherd@Sun.COM * Update total length of the ERROR chunk, then link this 1230*8153SGeorge.Shepherd@Sun.COM * cause block to the possible chain of cause blocks 1231*8153SGeorge.Shepherd@Sun.COM * attached to the ERROR chunk. 1232*8153SGeorge.Shepherd@Sun.COM */ 1233*8153SGeorge.Shepherd@Sun.COM ecp = (sctp_chunk_hdr_t *)((*errmp)->b_rptr); 1234*8153SGeorge.Shepherd@Sun.COM ecp->sch_len = htons(ntohs(ecp->sch_len) + len); 12350Sstevel@tonic-gate linkb(*errmp, mp); 12360Sstevel@tonic-gate } else { 12370Sstevel@tonic-gate *errmp = mp; 12380Sstevel@tonic-gate } 12390Sstevel@tonic-gate } 12400Sstevel@tonic-gate 12410Sstevel@tonic-gate /* 12420Sstevel@tonic-gate * o Bounds checking 12430Sstevel@tonic-gate * o Updates remaining 12440Sstevel@tonic-gate * o Checks alignment 12450Sstevel@tonic-gate */ 12460Sstevel@tonic-gate sctp_parm_hdr_t * 12470Sstevel@tonic-gate sctp_next_parm(sctp_parm_hdr_t *current, ssize_t *remaining) 12480Sstevel@tonic-gate { 12490Sstevel@tonic-gate int pad; 12500Sstevel@tonic-gate uint16_t len; 12510Sstevel@tonic-gate 12520Sstevel@tonic-gate len = ntohs(current->sph_len); 12530Sstevel@tonic-gate *remaining -= len; 12540Sstevel@tonic-gate if (*remaining < sizeof (*current) || len < sizeof (*current)) { 12550Sstevel@tonic-gate return (NULL); 12560Sstevel@tonic-gate } 12570Sstevel@tonic-gate if ((pad = len & (SCTP_ALIGN - 1)) != 0) { 12580Sstevel@tonic-gate pad = SCTP_ALIGN - pad; 12590Sstevel@tonic-gate *remaining -= pad; 12600Sstevel@tonic-gate } 12610Sstevel@tonic-gate /*LINTED pointer cast may 
result in improper alignment*/ 12620Sstevel@tonic-gate current = (sctp_parm_hdr_t *)((char *)current + len + pad); 12630Sstevel@tonic-gate return (current); 12640Sstevel@tonic-gate } 12650Sstevel@tonic-gate 12660Sstevel@tonic-gate /* 12670Sstevel@tonic-gate * Sets the address parameters given in the INIT chunk into sctp's 12680Sstevel@tonic-gate * faddrs; if psctp is non-NULL, copies psctp's saddrs. If there are 12690Sstevel@tonic-gate * no address parameters in the INIT chunk, a single faddr is created 12700Sstevel@tonic-gate * from the ip hdr at the beginning of pkt. 12710Sstevel@tonic-gate * If there already are existing addresses hanging from sctp, merge 12720Sstevel@tonic-gate * them in, if the old info contains addresses which are not present 12730Sstevel@tonic-gate * in this new info, get rid of them, and clean the pointers if there's 12740Sstevel@tonic-gate * messages which have this as their target address. 12750Sstevel@tonic-gate * 1276432Svi117747 * We also re-adjust the source address list here since the list may 1277432Svi117747 * contain more than what is actually part of the association. If 1278432Svi117747 * we get here from sctp_send_cookie_echo(), we are on the active 1279432Svi117747 * side and psctp will be NULL and ich will be the INIT-ACK chunk. 1280432Svi117747 * If we get here from sctp_accept_comm(), ich will be the INIT chunk 1281432Svi117747 * and psctp will the listening endpoint. 1282432Svi117747 * 1283432Svi117747 * INIT processing: When processing the INIT we inherit the src address 1284432Svi117747 * list from the listener. For a loopback or linklocal association, we 1285432Svi117747 * delete the list and just take the address from the IP header (since 1286432Svi117747 * that's how we created the INIT-ACK). Additionally, for loopback we 1287432Svi117747 * ignore the address params in the INIT. 
For determining which address 1288432Svi117747 * types were sent in the INIT-ACK we follow the same logic as in 1289432Svi117747 * creating the INIT-ACK. We delete addresses of the type that are not 1290432Svi117747 * supported by the peer. 1291432Svi117747 * 1292432Svi117747 * INIT-ACK processing: When processing the INIT-ACK since we had not 1293432Svi117747 * included addr params for loopback or linklocal addresses when creating 1294432Svi117747 * the INIT, we just use the address from the IP header. Further, for 1295432Svi117747 * loopback we ignore the addr param list. We mark addresses of the 1296432Svi117747 * type not supported by the peer as unconfirmed. 1297432Svi117747 * 1298432Svi117747 * In case of INIT processing we look for supported address types in the 1299432Svi117747 * supported address param, if present. In both cases the address type in 1300432Svi117747 * the IP header is supported as well as types for addresses in the param 1301432Svi117747 * list, if any. 1302432Svi117747 * 1303432Svi117747 * Once we have the supported address types sctp_check_saddr() runs through 1304432Svi117747 * the source address list and deletes or marks as unconfirmed address of 1305432Svi117747 * types not supported by the peer. 
1306432Svi117747 * 13070Sstevel@tonic-gate * Returns 0 on success, sys errno on failure 13080Sstevel@tonic-gate */ 13090Sstevel@tonic-gate int 13100Sstevel@tonic-gate sctp_get_addrparams(sctp_t *sctp, sctp_t *psctp, mblk_t *pkt, 13110Sstevel@tonic-gate sctp_chunk_hdr_t *ich, uint_t *sctp_options) 13120Sstevel@tonic-gate { 13130Sstevel@tonic-gate sctp_init_chunk_t *init; 13140Sstevel@tonic-gate ipha_t *iph; 13150Sstevel@tonic-gate ip6_t *ip6h; 1316432Svi117747 in6_addr_t hdrsaddr[1]; 1317432Svi117747 in6_addr_t hdrdaddr[1]; 13180Sstevel@tonic-gate sctp_parm_hdr_t *ph; 13190Sstevel@tonic-gate ssize_t remaining; 13200Sstevel@tonic-gate int isv4; 13210Sstevel@tonic-gate int err; 13220Sstevel@tonic-gate sctp_faddr_t *fp; 1323432Svi117747 int supp_af = 0; 1324432Svi117747 boolean_t check_saddr = B_TRUE; 1325852Svi117747 in6_addr_t curaddr; 13263448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 13270Sstevel@tonic-gate 13280Sstevel@tonic-gate if (sctp_options != NULL) 13290Sstevel@tonic-gate *sctp_options = 0; 13300Sstevel@tonic-gate 1331432Svi117747 /* extract the address from the IP header */ 1332432Svi117747 isv4 = (IPH_HDR_VERSION(pkt->b_rptr) == IPV4_VERSION); 1333432Svi117747 if (isv4) { 1334432Svi117747 iph = (ipha_t *)pkt->b_rptr; 1335432Svi117747 IN6_IPADDR_TO_V4MAPPED(iph->ipha_src, hdrsaddr); 1336432Svi117747 IN6_IPADDR_TO_V4MAPPED(iph->ipha_dst, hdrdaddr); 1337432Svi117747 supp_af |= PARM_SUPP_V4; 1338432Svi117747 } else { 1339432Svi117747 ip6h = (ip6_t *)pkt->b_rptr; 1340432Svi117747 hdrsaddr[0] = ip6h->ip6_src; 1341432Svi117747 hdrdaddr[0] = ip6h->ip6_dst; 1342432Svi117747 supp_af |= PARM_SUPP_V6; 1343432Svi117747 } 1344432Svi117747 1345432Svi117747 /* 1346432Svi117747 * Unfortunately, we can't delay this because adding an faddr 1347432Svi117747 * looks for the presence of the source address (from the ire 1348432Svi117747 * for the faddr) in the source address list. 
We could have 1349432Svi117747 * delayed this if, say, this was a loopback/linklocal connection. 1350432Svi117747 * Now, we just end up nuking this list and taking the addr from 1351432Svi117747 * the IP header for loopback/linklocal. 1352432Svi117747 */ 13530Sstevel@tonic-gate if (psctp != NULL && psctp->sctp_nsaddrs > 0) { 13540Sstevel@tonic-gate ASSERT(sctp->sctp_nsaddrs == 0); 13550Sstevel@tonic-gate 13560Sstevel@tonic-gate err = sctp_dup_saddrs(psctp, sctp, KM_NOSLEEP); 13570Sstevel@tonic-gate if (err != 0) 13580Sstevel@tonic-gate return (err); 13590Sstevel@tonic-gate } 1360432Svi117747 /* 1361432Svi117747 * We will add the faddr before parsing the address list as this 1362432Svi117747 * might be a loopback connection and we would not have to 1363432Svi117747 * go through the list. 1364432Svi117747 * 1365432Svi117747 * Make sure the header's addr is in the list 1366432Svi117747 */ 1367432Svi117747 fp = sctp_lookup_faddr(sctp, hdrsaddr); 1368432Svi117747 if (fp == NULL) { 1369432Svi117747 /* not included; add it now */ 13701735Skcpoon err = sctp_add_faddr(sctp, hdrsaddr, KM_NOSLEEP, B_TRUE); 13711676Sjpk if (err != 0) 13721676Sjpk return (err); 13730Sstevel@tonic-gate 1374432Svi117747 /* sctp_faddrs will be the hdr addr */ 1375432Svi117747 fp = sctp->sctp_faddrs; 13760Sstevel@tonic-gate } 1377432Svi117747 /* make the header addr the primary */ 1378852Svi117747 1379852Svi117747 if (cl_sctp_assoc_change != NULL && psctp == NULL) 1380852Svi117747 curaddr = sctp->sctp_current->faddr; 1381852Svi117747 1382432Svi117747 sctp->sctp_primary = fp; 1383432Svi117747 sctp->sctp_current = fp; 1384432Svi117747 sctp->sctp_mss = fp->sfa_pmss; 13850Sstevel@tonic-gate 1386432Svi117747 /* For loopback connections & linklocal get address from the header */ 1387432Svi117747 if (sctp->sctp_loopback || sctp->sctp_linklocal) { 1388432Svi117747 if (sctp->sctp_nsaddrs != 0) 1389432Svi117747 sctp_free_saddrs(sctp); 1390852Svi117747 if ((err = sctp_saddr_add_addr(sctp, hdrdaddr, 0)) != 0) 
1391432Svi117747 return (err); 1392432Svi117747 /* For loopback ignore address list */ 1393432Svi117747 if (sctp->sctp_loopback) 1394432Svi117747 return (0); 1395432Svi117747 check_saddr = B_FALSE; 1396432Svi117747 } 13970Sstevel@tonic-gate 13980Sstevel@tonic-gate /* Walk the params in the INIT [ACK], pulling out addr params */ 13990Sstevel@tonic-gate remaining = ntohs(ich->sch_len) - sizeof (*ich) - 14000Sstevel@tonic-gate sizeof (sctp_init_chunk_t); 14010Sstevel@tonic-gate if (remaining < sizeof (*ph)) { 1402432Svi117747 if (check_saddr) { 1403432Svi117747 sctp_check_saddr(sctp, supp_af, psctp == NULL ? 14044818Skcpoon B_FALSE : B_TRUE, hdrdaddr); 1405432Svi117747 } 1406852Svi117747 ASSERT(sctp_saddr_lookup(sctp, hdrdaddr, 0) != NULL); 1407432Svi117747 return (0); 14080Sstevel@tonic-gate } 1409432Svi117747 14100Sstevel@tonic-gate init = (sctp_init_chunk_t *)(ich + 1); 14110Sstevel@tonic-gate ph = (sctp_parm_hdr_t *)(init + 1); 14120Sstevel@tonic-gate 1413432Svi117747 /* params will have already been byteordered when validating */ 14140Sstevel@tonic-gate while (ph != NULL) { 1415432Svi117747 if (ph->sph_type == htons(PARM_SUPP_ADDRS)) { 1416432Svi117747 int plen; 1417432Svi117747 uint16_t *p; 1418432Svi117747 uint16_t addrtype; 1419432Svi117747 1420432Svi117747 ASSERT(psctp != NULL); 1421432Svi117747 plen = ntohs(ph->sph_len); 1422432Svi117747 p = (uint16_t *)(ph + 1); 1423432Svi117747 while (plen > 0) { 1424432Svi117747 addrtype = ntohs(*p); 1425432Svi117747 switch (addrtype) { 1426432Svi117747 case PARM_ADDR6: 1427432Svi117747 supp_af |= PARM_SUPP_V6; 1428432Svi117747 break; 1429432Svi117747 case PARM_ADDR4: 1430432Svi117747 supp_af |= PARM_SUPP_V4; 1431432Svi117747 break; 1432432Svi117747 default: 1433432Svi117747 break; 1434432Svi117747 } 1435432Svi117747 p++; 1436432Svi117747 plen -= sizeof (*p); 1437432Svi117747 } 1438432Svi117747 } else if (ph->sph_type == htons(PARM_ADDR4)) { 14390Sstevel@tonic-gate if (remaining >= PARM_ADDR4_LEN) { 
14400Sstevel@tonic-gate in6_addr_t addr; 14410Sstevel@tonic-gate ipaddr_t ta; 14420Sstevel@tonic-gate 1443432Svi117747 supp_af |= PARM_SUPP_V4; 14440Sstevel@tonic-gate /* 14450Sstevel@tonic-gate * Screen out broad/multicasts & loopback. 14460Sstevel@tonic-gate * If the endpoint only accepts v6 address, 14470Sstevel@tonic-gate * go to the next one. 14484818Skcpoon * 14494818Skcpoon * Subnet broadcast check is done in 14504818Skcpoon * sctp_add_faddr(). If the address is 14514818Skcpoon * a broadcast address, it won't be added. 14520Sstevel@tonic-gate */ 14530Sstevel@tonic-gate bcopy(ph + 1, &ta, sizeof (ta)); 14540Sstevel@tonic-gate if (ta == 0 || 14550Sstevel@tonic-gate ta == INADDR_BROADCAST || 14560Sstevel@tonic-gate ta == htonl(INADDR_LOOPBACK) || 14575215Skcpoon CLASSD(ta) || 14580Sstevel@tonic-gate sctp->sctp_connp->conn_ipv6_v6only) { 14590Sstevel@tonic-gate goto next; 14600Sstevel@tonic-gate } 14610Sstevel@tonic-gate IN6_INADDR_TO_V4MAPPED((struct in_addr *) 14620Sstevel@tonic-gate (ph + 1), &addr); 14634818Skcpoon 14640Sstevel@tonic-gate /* Check for duplicate. */ 14650Sstevel@tonic-gate if (sctp_lookup_faddr(sctp, &addr) != NULL) 14660Sstevel@tonic-gate goto next; 14670Sstevel@tonic-gate 14680Sstevel@tonic-gate /* OK, add it to the faddr set */ 14691735Skcpoon err = sctp_add_faddr(sctp, &addr, KM_NOSLEEP, 14701735Skcpoon B_FALSE); 14714818Skcpoon /* Something is wrong... Try the next one. */ 14721676Sjpk if (err != 0) 14734818Skcpoon goto next; 14740Sstevel@tonic-gate } 14750Sstevel@tonic-gate } else if (ph->sph_type == htons(PARM_ADDR6) && 14760Sstevel@tonic-gate sctp->sctp_family == AF_INET6) { 14770Sstevel@tonic-gate /* An v4 socket should not take v6 addresses. 
*/ 14780Sstevel@tonic-gate if (remaining >= PARM_ADDR6_LEN) { 14790Sstevel@tonic-gate in6_addr_t *addr6; 14800Sstevel@tonic-gate 1481432Svi117747 supp_af |= PARM_SUPP_V6; 14820Sstevel@tonic-gate addr6 = (in6_addr_t *)(ph + 1); 14830Sstevel@tonic-gate /* 14840Sstevel@tonic-gate * Screen out link locals, mcast, loopback 14850Sstevel@tonic-gate * and bogus v6 address. 14860Sstevel@tonic-gate */ 14870Sstevel@tonic-gate if (IN6_IS_ADDR_LINKLOCAL(addr6) || 14880Sstevel@tonic-gate IN6_IS_ADDR_MULTICAST(addr6) || 14890Sstevel@tonic-gate IN6_IS_ADDR_LOOPBACK(addr6) || 14900Sstevel@tonic-gate IN6_IS_ADDR_V4MAPPED(addr6)) { 14910Sstevel@tonic-gate goto next; 14920Sstevel@tonic-gate } 14930Sstevel@tonic-gate /* Check for duplicate. */ 14940Sstevel@tonic-gate if (sctp_lookup_faddr(sctp, addr6) != NULL) 14950Sstevel@tonic-gate goto next; 14960Sstevel@tonic-gate 14971676Sjpk err = sctp_add_faddr(sctp, 14981735Skcpoon (in6_addr_t *)(ph + 1), KM_NOSLEEP, 14991735Skcpoon B_FALSE); 15004818Skcpoon /* Something is wrong... Try the next one. */ 15011676Sjpk if (err != 0) 15024818Skcpoon goto next; 15030Sstevel@tonic-gate } 15040Sstevel@tonic-gate } else if (ph->sph_type == htons(PARM_FORWARD_TSN)) { 15050Sstevel@tonic-gate if (sctp_options != NULL) 15060Sstevel@tonic-gate *sctp_options |= SCTP_PRSCTP_OPTION; 15070Sstevel@tonic-gate } /* else; skip */ 15080Sstevel@tonic-gate 15090Sstevel@tonic-gate next: 15100Sstevel@tonic-gate ph = sctp_next_parm(ph, &remaining); 15110Sstevel@tonic-gate } 1512432Svi117747 if (check_saddr) { 1513432Svi117747 sctp_check_saddr(sctp, supp_af, psctp == NULL ? B_FALSE : 15144818Skcpoon B_TRUE, hdrdaddr); 15150Sstevel@tonic-gate } 1516852Svi117747 ASSERT(sctp_saddr_lookup(sctp, hdrdaddr, 0) != NULL); 1517852Svi117747 /* 1518852Svi117747 * We have the right address list now, update clustering's 1519852Svi117747 * knowledge because when we sent the INIT we had just added 1520852Svi117747 * the address the INIT was sent to. 
1521852Svi117747 */ 1522852Svi117747 if (psctp == NULL && cl_sctp_assoc_change != NULL) { 1523852Svi117747 uchar_t *alist; 1524852Svi117747 size_t asize; 1525852Svi117747 uchar_t *dlist; 1526852Svi117747 size_t dsize; 1527852Svi117747 1528852Svi117747 asize = sizeof (in6_addr_t) * sctp->sctp_nfaddrs; 1529852Svi117747 alist = kmem_alloc(asize, KM_NOSLEEP); 15301735Skcpoon if (alist == NULL) { 15313448Sdh155122 SCTP_KSTAT(sctps, sctp_cl_assoc_change); 1532852Svi117747 return (ENOMEM); 15331735Skcpoon } 1534852Svi117747 /* 1535852Svi117747 * Just include the address the INIT was sent to in the 1536852Svi117747 * delete list and send the entire faddr list. We could 1537852Svi117747 * do it differently (i.e include all the addresses in the 1538852Svi117747 * add list even if it contains the original address OR 1539852Svi117747 * remove the original address from the add list etc.), but 1540852Svi117747 * this seems reasonable enough. 1541852Svi117747 */ 1542852Svi117747 dsize = sizeof (in6_addr_t); 1543852Svi117747 dlist = kmem_alloc(dsize, KM_NOSLEEP); 1544852Svi117747 if (dlist == NULL) { 1545852Svi117747 kmem_free(alist, asize); 15463448Sdh155122 SCTP_KSTAT(sctps, sctp_cl_assoc_change); 1547852Svi117747 return (ENOMEM); 1548852Svi117747 } 1549852Svi117747 bcopy(&curaddr, dlist, sizeof (curaddr)); 1550852Svi117747 sctp_get_faddr_list(sctp, alist, asize); 1551852Svi117747 (*cl_sctp_assoc_change)(sctp->sctp_family, alist, asize, 1552852Svi117747 sctp->sctp_nfaddrs, dlist, dsize, 1, SCTP_CL_PADDR, 1553852Svi117747 (cl_sctp_handle_t)sctp); 1554852Svi117747 /* alist and dlist will be freed by the clustering module */ 1555852Svi117747 } 15560Sstevel@tonic-gate return (0); 15570Sstevel@tonic-gate } 15580Sstevel@tonic-gate 15590Sstevel@tonic-gate /* 15600Sstevel@tonic-gate * Returns 0 if the check failed and the restart should be refused, 15610Sstevel@tonic-gate * 1 if the check succeeded. 
15620Sstevel@tonic-gate */ 15630Sstevel@tonic-gate int 15640Sstevel@tonic-gate sctp_secure_restart_check(mblk_t *pkt, sctp_chunk_hdr_t *ich, uint32_t ports, 15653448Sdh155122 int sleep, sctp_stack_t *sctps) 15660Sstevel@tonic-gate { 15674964Skcpoon sctp_faddr_t *fp, *fphead = NULL; 15680Sstevel@tonic-gate sctp_parm_hdr_t *ph; 15690Sstevel@tonic-gate ssize_t remaining; 15700Sstevel@tonic-gate int isv4; 15710Sstevel@tonic-gate ipha_t *iph; 15720Sstevel@tonic-gate ip6_t *ip6h; 15730Sstevel@tonic-gate in6_addr_t hdraddr[1]; 15740Sstevel@tonic-gate int retval = 0; 15750Sstevel@tonic-gate sctp_tf_t *tf; 15760Sstevel@tonic-gate sctp_t *sctp; 15770Sstevel@tonic-gate int compres; 15780Sstevel@tonic-gate sctp_init_chunk_t *init; 15790Sstevel@tonic-gate int nadded = 0; 15800Sstevel@tonic-gate 15810Sstevel@tonic-gate /* extract the address from the IP header */ 15820Sstevel@tonic-gate isv4 = (IPH_HDR_VERSION(pkt->b_rptr) == IPV4_VERSION); 15830Sstevel@tonic-gate if (isv4) { 15840Sstevel@tonic-gate iph = (ipha_t *)pkt->b_rptr; 15850Sstevel@tonic-gate IN6_IPADDR_TO_V4MAPPED(iph->ipha_src, hdraddr); 15860Sstevel@tonic-gate } else { 15870Sstevel@tonic-gate ip6h = (ip6_t *)pkt->b_rptr; 15880Sstevel@tonic-gate hdraddr[0] = ip6h->ip6_src; 15890Sstevel@tonic-gate } 15900Sstevel@tonic-gate 15910Sstevel@tonic-gate /* Walk the params in the INIT [ACK], pulling out addr params */ 15920Sstevel@tonic-gate remaining = ntohs(ich->sch_len) - sizeof (*ich) - 15930Sstevel@tonic-gate sizeof (sctp_init_chunk_t); 15940Sstevel@tonic-gate if (remaining < sizeof (*ph)) { 15950Sstevel@tonic-gate /* no parameters; restart OK */ 15960Sstevel@tonic-gate return (1); 15970Sstevel@tonic-gate } 15980Sstevel@tonic-gate init = (sctp_init_chunk_t *)(ich + 1); 15990Sstevel@tonic-gate ph = (sctp_parm_hdr_t *)(init + 1); 16000Sstevel@tonic-gate 16010Sstevel@tonic-gate while (ph != NULL) { 16024964Skcpoon sctp_faddr_t *fpa = NULL; 16034964Skcpoon 16040Sstevel@tonic-gate /* params will have already been byteordered 
when validating */ 16050Sstevel@tonic-gate if (ph->sph_type == htons(PARM_ADDR4)) { 16060Sstevel@tonic-gate if (remaining >= PARM_ADDR4_LEN) { 16070Sstevel@tonic-gate in6_addr_t addr; 16080Sstevel@tonic-gate IN6_INADDR_TO_V4MAPPED((struct in_addr *) 16090Sstevel@tonic-gate (ph + 1), &addr); 16100Sstevel@tonic-gate fpa = kmem_cache_alloc(sctp_kmem_faddr_cache, 16110Sstevel@tonic-gate sleep); 16124964Skcpoon if (fpa == NULL) { 16130Sstevel@tonic-gate goto done; 16140Sstevel@tonic-gate } 16150Sstevel@tonic-gate bzero(fpa, sizeof (*fpa)); 16160Sstevel@tonic-gate fpa->faddr = addr; 16170Sstevel@tonic-gate fpa->next = NULL; 16180Sstevel@tonic-gate } 16190Sstevel@tonic-gate } else if (ph->sph_type == htons(PARM_ADDR6)) { 16200Sstevel@tonic-gate if (remaining >= PARM_ADDR6_LEN) { 16210Sstevel@tonic-gate fpa = kmem_cache_alloc(sctp_kmem_faddr_cache, 16220Sstevel@tonic-gate sleep); 16234964Skcpoon if (fpa == NULL) { 16240Sstevel@tonic-gate goto done; 16250Sstevel@tonic-gate } 16260Sstevel@tonic-gate bzero(fpa, sizeof (*fpa)); 16270Sstevel@tonic-gate bcopy(ph + 1, &fpa->faddr, 16280Sstevel@tonic-gate sizeof (fpa->faddr)); 16290Sstevel@tonic-gate fpa->next = NULL; 16300Sstevel@tonic-gate } 16310Sstevel@tonic-gate } 16320Sstevel@tonic-gate /* link in the new addr, if it was an addr param */ 16334964Skcpoon if (fpa != NULL) { 16344964Skcpoon if (fphead == NULL) { 16350Sstevel@tonic-gate fphead = fpa; 16360Sstevel@tonic-gate } else { 16374964Skcpoon fpa->next = fphead; 16384964Skcpoon fphead = fpa; 16390Sstevel@tonic-gate } 16400Sstevel@tonic-gate } 16410Sstevel@tonic-gate 16420Sstevel@tonic-gate ph = sctp_next_parm(ph, &remaining); 16430Sstevel@tonic-gate } 16440Sstevel@tonic-gate 16450Sstevel@tonic-gate if (fphead == NULL) { 16460Sstevel@tonic-gate /* no addr parameters; restart OK */ 16470Sstevel@tonic-gate return (1); 16480Sstevel@tonic-gate } 16490Sstevel@tonic-gate 16500Sstevel@tonic-gate /* 16510Sstevel@tonic-gate * got at least one; make sure the header's addr is 
16520Sstevel@tonic-gate * in the list 16530Sstevel@tonic-gate */ 16540Sstevel@tonic-gate fp = sctp_lookup_faddr_nosctp(fphead, hdraddr); 16554964Skcpoon if (fp == NULL) { 16560Sstevel@tonic-gate /* not included; add it now */ 16570Sstevel@tonic-gate fp = kmem_cache_alloc(sctp_kmem_faddr_cache, sleep); 16584964Skcpoon if (fp == NULL) { 16590Sstevel@tonic-gate goto done; 16600Sstevel@tonic-gate } 16610Sstevel@tonic-gate bzero(fp, sizeof (*fp)); 16620Sstevel@tonic-gate fp->faddr = *hdraddr; 16630Sstevel@tonic-gate fp->next = fphead; 16640Sstevel@tonic-gate fphead = fp; 16650Sstevel@tonic-gate } 16660Sstevel@tonic-gate 16670Sstevel@tonic-gate /* 16680Sstevel@tonic-gate * Now, we can finally do the check: For each sctp instance 16690Sstevel@tonic-gate * on the hash line for ports, compare its faddr set against 16700Sstevel@tonic-gate * the new one. If the new one is a strict subset of any 16710Sstevel@tonic-gate * existing sctp's faddrs, the restart is OK. However, if there 16720Sstevel@tonic-gate * is an overlap, this could be an attack, so return failure. 16730Sstevel@tonic-gate * If all sctp's faddrs are disjoint, this is a legitimate new 16740Sstevel@tonic-gate * association. 
16750Sstevel@tonic-gate */ 16763448Sdh155122 tf = &(sctps->sctps_conn_fanout[SCTP_CONN_HASH(sctps, ports)]); 16770Sstevel@tonic-gate mutex_enter(&tf->tf_lock); 16780Sstevel@tonic-gate 16790Sstevel@tonic-gate for (sctp = tf->tf_sctp; sctp; sctp = sctp->sctp_conn_hash_next) { 16800Sstevel@tonic-gate if (ports != sctp->sctp_ports) { 16810Sstevel@tonic-gate continue; 16820Sstevel@tonic-gate } 16830Sstevel@tonic-gate compres = sctp_compare_faddrsets(fphead, sctp->sctp_faddrs); 16840Sstevel@tonic-gate if (compres <= SCTP_ADDR_SUBSET) { 16850Sstevel@tonic-gate retval = 1; 16860Sstevel@tonic-gate mutex_exit(&tf->tf_lock); 16870Sstevel@tonic-gate goto done; 16880Sstevel@tonic-gate } 16890Sstevel@tonic-gate if (compres == SCTP_ADDR_OVERLAP) { 16900Sstevel@tonic-gate dprint(1, 16910Sstevel@tonic-gate ("new assoc from %x:%x:%x:%x overlaps with %p\n", 16921676Sjpk SCTP_PRINTADDR(*hdraddr), (void *)sctp)); 16930Sstevel@tonic-gate /* 16940Sstevel@tonic-gate * While we still hold the lock, we need to 16950Sstevel@tonic-gate * figure out which addresses have been 16960Sstevel@tonic-gate * added so we can include them in the abort 16970Sstevel@tonic-gate * we will send back. Since these faddrs will 16980Sstevel@tonic-gate * never be used, we overload the rto field 16990Sstevel@tonic-gate * here, setting it to 0 if the address was 17000Sstevel@tonic-gate * not added, 1 if it was added. 
17010Sstevel@tonic-gate */ 17020Sstevel@tonic-gate for (fp = fphead; fp; fp = fp->next) { 17030Sstevel@tonic-gate if (sctp_lookup_faddr(sctp, &fp->faddr)) { 17040Sstevel@tonic-gate fp->rto = 0; 17050Sstevel@tonic-gate } else { 17060Sstevel@tonic-gate fp->rto = 1; 17070Sstevel@tonic-gate nadded++; 17080Sstevel@tonic-gate } 17090Sstevel@tonic-gate } 17100Sstevel@tonic-gate mutex_exit(&tf->tf_lock); 17110Sstevel@tonic-gate goto done; 17120Sstevel@tonic-gate } 17130Sstevel@tonic-gate } 17140Sstevel@tonic-gate mutex_exit(&tf->tf_lock); 17150Sstevel@tonic-gate 17160Sstevel@tonic-gate /* All faddrs are disjoint; legit new association */ 17170Sstevel@tonic-gate retval = 1; 17180Sstevel@tonic-gate 17190Sstevel@tonic-gate done: 17200Sstevel@tonic-gate /* If are attempted adds, send back an abort listing the addrs */ 17210Sstevel@tonic-gate if (nadded > 0) { 17220Sstevel@tonic-gate void *dtail; 17230Sstevel@tonic-gate size_t dlen; 17240Sstevel@tonic-gate 17250Sstevel@tonic-gate dtail = kmem_alloc(PARM_ADDR6_LEN * nadded, KM_NOSLEEP); 17260Sstevel@tonic-gate if (dtail == NULL) { 17270Sstevel@tonic-gate goto cleanup; 17280Sstevel@tonic-gate } 17290Sstevel@tonic-gate 17300Sstevel@tonic-gate ph = dtail; 17310Sstevel@tonic-gate dlen = 0; 17320Sstevel@tonic-gate for (fp = fphead; fp; fp = fp->next) { 17330Sstevel@tonic-gate if (fp->rto == 0) { 17340Sstevel@tonic-gate continue; 17350Sstevel@tonic-gate } 17360Sstevel@tonic-gate if (IN6_IS_ADDR_V4MAPPED(&fp->faddr)) { 17370Sstevel@tonic-gate ipaddr_t addr4; 17380Sstevel@tonic-gate 17390Sstevel@tonic-gate ph->sph_type = htons(PARM_ADDR4); 17400Sstevel@tonic-gate ph->sph_len = htons(PARM_ADDR4_LEN); 17410Sstevel@tonic-gate IN6_V4MAPPED_TO_IPADDR(&fp->faddr, addr4); 17420Sstevel@tonic-gate ph++; 17430Sstevel@tonic-gate bcopy(&addr4, ph, sizeof (addr4)); 17440Sstevel@tonic-gate ph = (sctp_parm_hdr_t *) 17450Sstevel@tonic-gate ((char *)ph + sizeof (addr4)); 17460Sstevel@tonic-gate dlen += PARM_ADDR4_LEN; 17470Sstevel@tonic-gate } else { 
17480Sstevel@tonic-gate ph->sph_type = htons(PARM_ADDR6); 17490Sstevel@tonic-gate ph->sph_len = htons(PARM_ADDR6_LEN); 17500Sstevel@tonic-gate ph++; 17510Sstevel@tonic-gate bcopy(&fp->faddr, ph, sizeof (fp->faddr)); 17520Sstevel@tonic-gate ph = (sctp_parm_hdr_t *) 17530Sstevel@tonic-gate ((char *)ph + sizeof (fp->faddr)); 17540Sstevel@tonic-gate dlen += PARM_ADDR6_LEN; 17550Sstevel@tonic-gate } 17560Sstevel@tonic-gate } 17570Sstevel@tonic-gate 17580Sstevel@tonic-gate /* Send off the abort */ 17590Sstevel@tonic-gate sctp_send_abort(sctp, sctp_init2vtag(ich), 17600Sstevel@tonic-gate SCTP_ERR_RESTART_NEW_ADDRS, dtail, dlen, pkt, 0, B_TRUE); 17610Sstevel@tonic-gate 17620Sstevel@tonic-gate kmem_free(dtail, PARM_ADDR6_LEN * nadded); 17630Sstevel@tonic-gate } 17640Sstevel@tonic-gate 17650Sstevel@tonic-gate cleanup: 17660Sstevel@tonic-gate /* Clean up */ 17670Sstevel@tonic-gate if (fphead) { 17680Sstevel@tonic-gate sctp_faddr_t *fpn; 17690Sstevel@tonic-gate for (fp = fphead; fp; fp = fpn) { 17700Sstevel@tonic-gate fpn = fp->next; 17710Sstevel@tonic-gate kmem_cache_free(sctp_kmem_faddr_cache, fp); 17720Sstevel@tonic-gate } 17730Sstevel@tonic-gate } 17740Sstevel@tonic-gate 17750Sstevel@tonic-gate return (retval); 17760Sstevel@tonic-gate } 17770Sstevel@tonic-gate 17781932Svi117747 /* 17791932Svi117747 * Reset any state related to transmitted chunks. 
17801932Svi117747 */ 17810Sstevel@tonic-gate void 17820Sstevel@tonic-gate sctp_congest_reset(sctp_t *sctp) 17830Sstevel@tonic-gate { 17841932Svi117747 sctp_faddr_t *fp; 17853448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 17861932Svi117747 mblk_t *mp; 17870Sstevel@tonic-gate 17881932Svi117747 for (fp = sctp->sctp_faddrs; fp != NULL; fp = fp->next) { 17893448Sdh155122 fp->ssthresh = sctps->sctps_initial_mtu; 17903795Skcpoon SET_CWND(fp, fp->sfa_pmss, sctps->sctps_slow_start_initial); 17910Sstevel@tonic-gate fp->suna = 0; 17920Sstevel@tonic-gate fp->pba = 0; 17930Sstevel@tonic-gate } 17941932Svi117747 /* 17951932Svi117747 * Clean up the transmit list as well since we have reset accounting 17961932Svi117747 * on all the fps. Send event upstream, if required. 17971932Svi117747 */ 17981932Svi117747 while ((mp = sctp->sctp_xmit_head) != NULL) { 17991932Svi117747 sctp->sctp_xmit_head = mp->b_next; 18001932Svi117747 mp->b_next = NULL; 18011932Svi117747 if (sctp->sctp_xmit_head != NULL) 18021932Svi117747 sctp->sctp_xmit_head->b_prev = NULL; 18031932Svi117747 sctp_sendfail_event(sctp, mp, 0, B_TRUE); 18041932Svi117747 } 18051932Svi117747 sctp->sctp_xmit_head = NULL; 18061932Svi117747 sctp->sctp_xmit_tail = NULL; 18071932Svi117747 sctp->sctp_xmit_unacked = NULL; 18081932Svi117747 18091932Svi117747 sctp->sctp_unacked = 0; 18101932Svi117747 /* 18111932Svi117747 * Any control message as well. We will clean-up this list as well. 18121932Svi117747 * This contains any pending ASCONF request that we have queued/sent. 18131932Svi117747 * If we do get an ACK we will just drop it. However, given that 18141932Svi117747 * we are restarting chances are we aren't going to get any. 
18151932Svi117747 */ 18161932Svi117747 if (sctp->sctp_cxmit_list != NULL) 18171932Svi117747 sctp_asconf_free_cxmit(sctp, NULL); 18181932Svi117747 sctp->sctp_cxmit_list = NULL; 18191932Svi117747 sctp->sctp_cchunk_pend = 0; 18201932Svi117747 18211932Svi117747 sctp->sctp_rexmitting = B_FALSE; 18221932Svi117747 sctp->sctp_rxt_nxttsn = 0; 18231932Svi117747 sctp->sctp_rxt_maxtsn = 0; 18241932Svi117747 18251932Svi117747 sctp->sctp_zero_win_probe = B_FALSE; 18260Sstevel@tonic-gate } 18270Sstevel@tonic-gate 18280Sstevel@tonic-gate static void 18291735Skcpoon sctp_init_faddr(sctp_t *sctp, sctp_faddr_t *fp, in6_addr_t *addr, 18301735Skcpoon mblk_t *timer_mp) 18310Sstevel@tonic-gate { 18323448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 18333448Sdh155122 18340Sstevel@tonic-gate bcopy(addr, &fp->faddr, sizeof (*addr)); 18350Sstevel@tonic-gate if (IN6_IS_ADDR_V4MAPPED(addr)) { 18360Sstevel@tonic-gate fp->isv4 = 1; 18370Sstevel@tonic-gate /* Make sure that sfa_pmss is a multiple of SCTP_ALIGN. */ 18384691Skcpoon fp->sfa_pmss = 18394691Skcpoon (sctps->sctps_initial_mtu - sctp->sctp_hdr_len) & 18404691Skcpoon ~(SCTP_ALIGN - 1); 18410Sstevel@tonic-gate } else { 18420Sstevel@tonic-gate fp->isv4 = 0; 18433448Sdh155122 fp->sfa_pmss = 18443448Sdh155122 (sctps->sctps_initial_mtu - sctp->sctp_hdr6_len) & 18453448Sdh155122 ~(SCTP_ALIGN - 1); 18460Sstevel@tonic-gate } 18473448Sdh155122 fp->cwnd = sctps->sctps_slow_start_initial * fp->sfa_pmss; 18480Sstevel@tonic-gate fp->rto = MIN(sctp->sctp_rto_initial, sctp->sctp_init_rto_max); 18490Sstevel@tonic-gate fp->srtt = -1; 18500Sstevel@tonic-gate fp->rtt_updates = 0; 18510Sstevel@tonic-gate fp->strikes = 0; 18520Sstevel@tonic-gate fp->max_retr = sctp->sctp_pp_max_rxt; 18530Sstevel@tonic-gate /* Mark it as not confirmed. 
*/ 18540Sstevel@tonic-gate fp->state = SCTP_FADDRS_UNCONFIRMED; 18550Sstevel@tonic-gate fp->hb_interval = sctp->sctp_hb_interval; 18563448Sdh155122 fp->ssthresh = sctps->sctps_initial_ssthresh; 18570Sstevel@tonic-gate fp->suna = 0; 18580Sstevel@tonic-gate fp->pba = 0; 18590Sstevel@tonic-gate fp->acked = 0; 18600Sstevel@tonic-gate fp->lastactive = lbolt64; 18611735Skcpoon fp->timer_mp = timer_mp; 18620Sstevel@tonic-gate fp->hb_pending = B_FALSE; 18634818Skcpoon fp->hb_enabled = B_TRUE; 18640Sstevel@tonic-gate fp->df = 1; 18650Sstevel@tonic-gate fp->pmtu_discovered = 0; 18660Sstevel@tonic-gate fp->next = NULL; 18670Sstevel@tonic-gate fp->ire = NULL; 18680Sstevel@tonic-gate fp->T3expire = 0; 18690Sstevel@tonic-gate (void) random_get_pseudo_bytes((uint8_t *)&fp->hb_secret, 18700Sstevel@tonic-gate sizeof (fp->hb_secret)); 18710Sstevel@tonic-gate fp->hb_expiry = lbolt64; 18723795Skcpoon fp->rxt_unacked = 0; 18730Sstevel@tonic-gate 18741735Skcpoon sctp_get_ire(sctp, fp); 18750Sstevel@tonic-gate } 18760Sstevel@tonic-gate 18770Sstevel@tonic-gate /*ARGSUSED*/ 18786712Stomee static int 18796712Stomee faddr_constructor(void *buf, void *arg, int flags) 18806712Stomee { 18816712Stomee sctp_faddr_t *fp = buf; 18826712Stomee 18836712Stomee fp->timer_mp = NULL; 18846712Stomee fp->timer_running = 0; 18856712Stomee 18866712Stomee fp->rc_timer_mp = NULL; 18876712Stomee fp->rc_timer_running = 0; 18886712Stomee 18896712Stomee return (0); 18906712Stomee } 18916712Stomee 18926712Stomee /*ARGSUSED*/ 18930Sstevel@tonic-gate static void 18946712Stomee faddr_destructor(void *buf, void *arg) 18950Sstevel@tonic-gate { 18960Sstevel@tonic-gate sctp_faddr_t *fp = buf; 18970Sstevel@tonic-gate 18980Sstevel@tonic-gate ASSERT(fp->timer_mp == NULL); 18990Sstevel@tonic-gate ASSERT(fp->timer_running == 0); 19000Sstevel@tonic-gate 19010Sstevel@tonic-gate ASSERT(fp->rc_timer_mp == NULL); 19020Sstevel@tonic-gate ASSERT(fp->rc_timer_running == 0); 19030Sstevel@tonic-gate } 19040Sstevel@tonic-gate 
19050Sstevel@tonic-gate void 19061676Sjpk sctp_faddr_init(void) 19070Sstevel@tonic-gate { 19080Sstevel@tonic-gate sctp_kmem_faddr_cache = kmem_cache_create("sctp_faddr_cache", 19096712Stomee sizeof (sctp_faddr_t), 0, faddr_constructor, faddr_destructor, 19100Sstevel@tonic-gate NULL, NULL, NULL, 0); 19110Sstevel@tonic-gate } 19120Sstevel@tonic-gate 19130Sstevel@tonic-gate void 19141676Sjpk sctp_faddr_fini(void) 19150Sstevel@tonic-gate { 19160Sstevel@tonic-gate kmem_cache_destroy(sctp_kmem_faddr_cache); 19170Sstevel@tonic-gate } 1918