10Sstevel@tonic-gate /* 20Sstevel@tonic-gate * CDDL HEADER START 30Sstevel@tonic-gate * 40Sstevel@tonic-gate * The contents of this file are subject to the terms of the 51676Sjpk * Common Development and Distribution License (the "License"). 61676Sjpk * You may not use this file except in compliance with the License. 70Sstevel@tonic-gate * 80Sstevel@tonic-gate * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 90Sstevel@tonic-gate * or http://www.opensolaris.org/os/licensing. 100Sstevel@tonic-gate * See the License for the specific language governing permissions 110Sstevel@tonic-gate * and limitations under the License. 120Sstevel@tonic-gate * 130Sstevel@tonic-gate * When distributing Covered Code, include this CDDL HEADER in each 140Sstevel@tonic-gate * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 150Sstevel@tonic-gate * If applicable, add the following below this CDDL HEADER, with the 160Sstevel@tonic-gate * fields enclosed by brackets "[]" replaced with your own identifying 170Sstevel@tonic-gate * information: Portions Copyright [yyyy] [name of copyright owner] 180Sstevel@tonic-gate * 190Sstevel@tonic-gate * CDDL HEADER END 200Sstevel@tonic-gate */ 211735Skcpoon 220Sstevel@tonic-gate /* 233448Sdh155122 * Copyright 2007 Sun Microsystems, Inc. All rights reserved. 240Sstevel@tonic-gate * Use is subject to license terms. 
250Sstevel@tonic-gate */ 260Sstevel@tonic-gate 270Sstevel@tonic-gate #pragma ident "%Z%%M% %I% %E% SMI" 280Sstevel@tonic-gate 290Sstevel@tonic-gate #include <sys/types.h> 300Sstevel@tonic-gate #include <sys/systm.h> 310Sstevel@tonic-gate #include <sys/stream.h> 321676Sjpk #include <sys/strsubr.h> 330Sstevel@tonic-gate #include <sys/ddi.h> 340Sstevel@tonic-gate #include <sys/sunddi.h> 350Sstevel@tonic-gate #include <sys/kmem.h> 360Sstevel@tonic-gate #include <sys/socket.h> 370Sstevel@tonic-gate #include <sys/random.h> 381676Sjpk #include <sys/tsol/tndb.h> 391676Sjpk #include <sys/tsol/tnet.h> 400Sstevel@tonic-gate 410Sstevel@tonic-gate #include <netinet/in.h> 420Sstevel@tonic-gate #include <netinet/ip6.h> 430Sstevel@tonic-gate #include <netinet/sctp.h> 440Sstevel@tonic-gate 450Sstevel@tonic-gate #include <inet/common.h> 460Sstevel@tonic-gate #include <inet/ip.h> 470Sstevel@tonic-gate #include <inet/ip6.h> 480Sstevel@tonic-gate #include <inet/ip_ire.h> 490Sstevel@tonic-gate #include <inet/mib2.h> 500Sstevel@tonic-gate #include <inet/nd.h> 510Sstevel@tonic-gate #include <inet/optcom.h> 520Sstevel@tonic-gate #include <inet/sctp_ip.h> 530Sstevel@tonic-gate #include <inet/ipclassifier.h> 541676Sjpk 550Sstevel@tonic-gate #include "sctp_impl.h" 560Sstevel@tonic-gate #include "sctp_addr.h" 571932Svi117747 #include "sctp_asconf.h" 580Sstevel@tonic-gate 590Sstevel@tonic-gate static struct kmem_cache *sctp_kmem_faddr_cache; 601735Skcpoon static void sctp_init_faddr(sctp_t *, sctp_faddr_t *, in6_addr_t *, mblk_t *); 610Sstevel@tonic-gate 621735Skcpoon /* Set the source address. Refer to comments in sctp_get_ire(). 
*/ 631932Svi117747 void 641932Svi117747 sctp_set_saddr(sctp_t *sctp, sctp_faddr_t *fp) 650Sstevel@tonic-gate { 661719Sjarrett boolean_t v6 = !fp->isv4; 674818Skcpoon boolean_t addr_set; 681719Sjarrett 694818Skcpoon fp->saddr = sctp_get_valid_addr(sctp, v6, &addr_set); 704818Skcpoon /* 714818Skcpoon * If there is no source address avaialble, mark this peer address 724818Skcpoon * as unreachable for now. When the heartbeat timer fires, it will 734818Skcpoon * call sctp_get_ire() to re-check if there is any source address 744818Skcpoon * available. 754818Skcpoon */ 764818Skcpoon if (!addr_set) 774818Skcpoon fp->state = SCTP_FADDRS_UNREACH; 780Sstevel@tonic-gate } 790Sstevel@tonic-gate 800Sstevel@tonic-gate /* 810Sstevel@tonic-gate * Call this function to update the cached IRE of a peer addr fp. 820Sstevel@tonic-gate */ 830Sstevel@tonic-gate void 841735Skcpoon sctp_get_ire(sctp_t *sctp, sctp_faddr_t *fp) 850Sstevel@tonic-gate { 861735Skcpoon ire_t *ire; 871735Skcpoon ipaddr_t addr4; 881735Skcpoon in6_addr_t laddr; 890Sstevel@tonic-gate sctp_saddr_ipif_t *sp; 901735Skcpoon int hdrlen; 911735Skcpoon ts_label_t *tsl; 923448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 933448Sdh155122 ip_stack_t *ipst = sctps->sctps_netstack->netstack_ip; 940Sstevel@tonic-gate 950Sstevel@tonic-gate /* Remove the previous cache IRE */ 960Sstevel@tonic-gate if ((ire = fp->ire) != NULL) { 970Sstevel@tonic-gate IRE_REFRELE_NOTR(ire); 980Sstevel@tonic-gate fp->ire = NULL; 990Sstevel@tonic-gate } 1000Sstevel@tonic-gate 1010Sstevel@tonic-gate /* 1020Sstevel@tonic-gate * If this addr is not reachable, mark it as unconfirmed for now, the 1030Sstevel@tonic-gate * state will be changed back to unreachable later in this function 1040Sstevel@tonic-gate * if it is still the case. 
1050Sstevel@tonic-gate */ 1060Sstevel@tonic-gate if (fp->state == SCTP_FADDRS_UNREACH) { 1070Sstevel@tonic-gate fp->state = SCTP_FADDRS_UNCONFIRMED; 1080Sstevel@tonic-gate } 1090Sstevel@tonic-gate 1101676Sjpk tsl = crgetlabel(CONN_CRED(sctp->sctp_connp)); 1111676Sjpk 1120Sstevel@tonic-gate if (fp->isv4) { 1130Sstevel@tonic-gate IN6_V4MAPPED_TO_IPADDR(&fp->faddr, addr4); 1143448Sdh155122 ire = ire_cache_lookup(addr4, sctp->sctp_zoneid, tsl, ipst); 1151676Sjpk if (ire != NULL) 1161676Sjpk IN6_IPADDR_TO_V4MAPPED(ire->ire_src_addr, &laddr); 1171676Sjpk } else { 1183448Sdh155122 ire = ire_cache_lookup_v6(&fp->faddr, sctp->sctp_zoneid, tsl, 1193448Sdh155122 ipst); 1201676Sjpk if (ire != NULL) 1211676Sjpk laddr = ire->ire_src_addr_v6; 1221676Sjpk } 1230Sstevel@tonic-gate 1241676Sjpk if (ire == NULL) { 1251676Sjpk dprint(3, ("ire2faddr: no ire for %x:%x:%x:%x\n", 1261676Sjpk SCTP_PRINTADDR(fp->faddr))); 1271676Sjpk /* 1281676Sjpk * It is tempting to just leave the src addr 1291676Sjpk * unspecified and let IP figure it out, but we 1301676Sjpk * *cannot* do this, since IP may choose a src addr 1311676Sjpk * that is not part of this association... unless 1321676Sjpk * this sctp has bound to all addrs. So if the ire 1331676Sjpk * lookup fails, try to find one in our src addr 1341676Sjpk * list, unless the sctp has bound to all addrs, in 1351676Sjpk * which case we change the src addr to unspec. 1361676Sjpk * 1371676Sjpk * Note that if this is a v6 endpoint but it does 1381676Sjpk * not have any v4 address at this point (e.g. may 1391676Sjpk * have been deleted), sctp_get_valid_addr() will 1401676Sjpk * return mapped INADDR_ANY. In this case, this 1411676Sjpk * address should be marked not reachable so that 1421676Sjpk * it won't be used to send data. 
1431676Sjpk */ 1441932Svi117747 sctp_set_saddr(sctp, fp); 1451735Skcpoon if (fp->state == SCTP_FADDRS_UNREACH) 1461735Skcpoon return; 1471735Skcpoon goto check_current; 1481676Sjpk } 1491676Sjpk 1501735Skcpoon /* Make sure the laddr is part of this association */ 1513510Svi117747 if ((sp = sctp_saddr_lookup(sctp, &ire->ire_ipif->ipif_v6lcl_addr, 1523510Svi117747 0)) != NULL && !sp->saddr_ipif_dontsrc) { 1531676Sjpk if (sp->saddr_ipif_unconfirmed == 1) 1541676Sjpk sp->saddr_ipif_unconfirmed = 0; 1551676Sjpk fp->saddr = laddr; 1561676Sjpk } else { 1571676Sjpk dprint(2, ("ire2faddr: src addr is not part of assc\n")); 1581735Skcpoon 1591735Skcpoon /* 1601735Skcpoon * Set the src to the first saddr and hope for the best. 1611735Skcpoon * Note that we will still do the ire caching below. 1621735Skcpoon * Otherwise, whenever we send a packet, we need to do 1631735Skcpoon * the ire lookup again and still may not get the correct 1641735Skcpoon * source address. Note that this case should very seldomly 1651735Skcpoon * happen. One scenario this can happen is an app 1661735Skcpoon * explicitly bind() to an address. But that address is 1671735Skcpoon * not the preferred source address to send to the peer. 1681735Skcpoon */ 1691932Svi117747 sctp_set_saddr(sctp, fp); 1701735Skcpoon if (fp->state == SCTP_FADDRS_UNREACH) { 1711735Skcpoon IRE_REFRELE(ire); 1721735Skcpoon return; 1731735Skcpoon } 1740Sstevel@tonic-gate } 1750Sstevel@tonic-gate 1761735Skcpoon /* 1771735Skcpoon * Note that ire_cache_lookup_*() returns an ire with the tracing 1781735Skcpoon * bits enabled. This requires the thread holding the ire also 1791735Skcpoon * do the IRE_REFRELE(). Thus we need to do IRE_REFHOLD_NOTR() 1801735Skcpoon * and then IRE_REFRELE() the ire here to make the tracing bits 1811735Skcpoon * work. 
1821735Skcpoon */ 1831735Skcpoon IRE_REFHOLD_NOTR(ire); 1841735Skcpoon IRE_REFRELE(ire); 1851735Skcpoon 1860Sstevel@tonic-gate /* Cache the IRE */ 1870Sstevel@tonic-gate fp->ire = ire; 1880Sstevel@tonic-gate if (fp->ire->ire_type == IRE_LOOPBACK && !sctp->sctp_loopback) 1890Sstevel@tonic-gate sctp->sctp_loopback = 1; 1900Sstevel@tonic-gate 1910Sstevel@tonic-gate /* 1920Sstevel@tonic-gate * Pull out RTO information for this faddr and use it if we don't 1930Sstevel@tonic-gate * have any yet. 1940Sstevel@tonic-gate */ 1950Sstevel@tonic-gate if (fp->srtt == -1 && ire->ire_uinfo.iulp_rtt != 0) { 196116Skcpoon /* The cached value is in ms. */ 197116Skcpoon fp->srtt = MSEC_TO_TICK(ire->ire_uinfo.iulp_rtt); 198116Skcpoon fp->rttvar = MSEC_TO_TICK(ire->ire_uinfo.iulp_rtt_sd); 1990Sstevel@tonic-gate fp->rto = 3 * fp->srtt; 2000Sstevel@tonic-gate 2010Sstevel@tonic-gate /* Bound the RTO by configured min and max values */ 2020Sstevel@tonic-gate if (fp->rto < sctp->sctp_rto_min) { 2030Sstevel@tonic-gate fp->rto = sctp->sctp_rto_min; 2040Sstevel@tonic-gate } 2050Sstevel@tonic-gate if (fp->rto > sctp->sctp_rto_max) { 2060Sstevel@tonic-gate fp->rto = sctp->sctp_rto_max; 2070Sstevel@tonic-gate } 2080Sstevel@tonic-gate } 2090Sstevel@tonic-gate 2100Sstevel@tonic-gate /* 2110Sstevel@tonic-gate * Record the MTU for this faddr. If the MTU for this faddr has 2120Sstevel@tonic-gate * changed, check if the assc MTU will also change. 2130Sstevel@tonic-gate */ 2140Sstevel@tonic-gate if (fp->isv4) { 2150Sstevel@tonic-gate hdrlen = sctp->sctp_hdr_len; 2160Sstevel@tonic-gate } else { 2170Sstevel@tonic-gate hdrlen = sctp->sctp_hdr6_len; 2180Sstevel@tonic-gate } 2190Sstevel@tonic-gate if ((fp->sfa_pmss + hdrlen) != ire->ire_max_frag) { 2200Sstevel@tonic-gate /* Make sure that sfa_pmss is a multiple of SCTP_ALIGN. 
*/ 2210Sstevel@tonic-gate fp->sfa_pmss = (ire->ire_max_frag - hdrlen) & ~(SCTP_ALIGN - 1); 2220Sstevel@tonic-gate if (fp->cwnd < (fp->sfa_pmss * 2)) { 2233795Skcpoon SET_CWND(fp, fp->sfa_pmss, 2243795Skcpoon sctps->sctps_slow_start_initial); 2250Sstevel@tonic-gate } 2260Sstevel@tonic-gate } 2270Sstevel@tonic-gate 2281735Skcpoon check_current: 2291735Skcpoon if (fp == sctp->sctp_current) 2301735Skcpoon sctp_set_faddr_current(sctp, fp); 2310Sstevel@tonic-gate } 2320Sstevel@tonic-gate 2330Sstevel@tonic-gate void 2341735Skcpoon sctp_update_ire(sctp_t *sctp) 2350Sstevel@tonic-gate { 2361735Skcpoon ire_t *ire; 2371735Skcpoon sctp_faddr_t *fp; 2383448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 2390Sstevel@tonic-gate 2401735Skcpoon for (fp = sctp->sctp_faddrs; fp != NULL; fp = fp->next) { 2411735Skcpoon if ((ire = fp->ire) == NULL) 2421735Skcpoon continue; 2431735Skcpoon mutex_enter(&ire->ire_lock); 2440Sstevel@tonic-gate 2451735Skcpoon /* 2461735Skcpoon * If the cached IRE is going away, there is no point to 2471735Skcpoon * update it. 2481735Skcpoon */ 2491735Skcpoon if (ire->ire_marks & IRE_MARK_CONDEMNED) { 2501735Skcpoon mutex_exit(&ire->ire_lock); 2511735Skcpoon IRE_REFRELE_NOTR(ire); 2521735Skcpoon fp->ire = NULL; 2531735Skcpoon continue; 2540Sstevel@tonic-gate } 2550Sstevel@tonic-gate 2560Sstevel@tonic-gate /* 2571735Skcpoon * Only record the PMTU for this faddr if we actually have 2581735Skcpoon * done discovery. This prevents initialized default from 2591735Skcpoon * clobbering any real info that IP may have. 
2600Sstevel@tonic-gate */ 2611735Skcpoon if (fp->pmtu_discovered) { 2621735Skcpoon if (fp->isv4) { 2631735Skcpoon ire->ire_max_frag = fp->sfa_pmss + 2641735Skcpoon sctp->sctp_hdr_len; 2651735Skcpoon } else { 2661735Skcpoon ire->ire_max_frag = fp->sfa_pmss + 2671735Skcpoon sctp->sctp_hdr6_len; 2681735Skcpoon } 2690Sstevel@tonic-gate } 2701735Skcpoon 2713448Sdh155122 if (sctps->sctps_rtt_updates != 0 && 2723448Sdh155122 fp->rtt_updates >= sctps->sctps_rtt_updates) { 2731735Skcpoon /* 2741735Skcpoon * If there is no old cached values, initialize them 2751735Skcpoon * conservatively. Set them to be (1.5 * new value). 2761735Skcpoon * This code copied from ip_ire_advise(). The cached 2771735Skcpoon * value is in ms. 2781735Skcpoon */ 2791735Skcpoon if (ire->ire_uinfo.iulp_rtt != 0) { 2801735Skcpoon ire->ire_uinfo.iulp_rtt = 2811735Skcpoon (ire->ire_uinfo.iulp_rtt + 2821735Skcpoon TICK_TO_MSEC(fp->srtt)) >> 1; 2831735Skcpoon } else { 2841735Skcpoon ire->ire_uinfo.iulp_rtt = 2851735Skcpoon TICK_TO_MSEC(fp->srtt + (fp->srtt >> 1)); 2861735Skcpoon } 2871735Skcpoon if (ire->ire_uinfo.iulp_rtt_sd != 0) { 2881735Skcpoon ire->ire_uinfo.iulp_rtt_sd = 2894691Skcpoon (ire->ire_uinfo.iulp_rtt_sd + 2904691Skcpoon TICK_TO_MSEC(fp->rttvar)) >> 1; 2911735Skcpoon } else { 2921735Skcpoon ire->ire_uinfo.iulp_rtt_sd = 2931735Skcpoon TICK_TO_MSEC(fp->rttvar + 2941735Skcpoon (fp->rttvar >> 1)); 2951735Skcpoon } 2961735Skcpoon fp->rtt_updates = 0; 2970Sstevel@tonic-gate } 2981735Skcpoon mutex_exit(&ire->ire_lock); 2990Sstevel@tonic-gate } 3000Sstevel@tonic-gate } 3010Sstevel@tonic-gate 3020Sstevel@tonic-gate /* 3030Sstevel@tonic-gate * The sender must set the total length in the IP header. 3040Sstevel@tonic-gate * If sendto == NULL, the current will be used. 
3050Sstevel@tonic-gate */ 3060Sstevel@tonic-gate mblk_t * 3070Sstevel@tonic-gate sctp_make_mp(sctp_t *sctp, sctp_faddr_t *sendto, int trailer) 3080Sstevel@tonic-gate { 3090Sstevel@tonic-gate mblk_t *mp; 3100Sstevel@tonic-gate size_t ipsctplen; 3110Sstevel@tonic-gate int isv4; 3120Sstevel@tonic-gate sctp_faddr_t *fp; 3133448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 3144818Skcpoon boolean_t src_changed = B_FALSE; 3150Sstevel@tonic-gate 3160Sstevel@tonic-gate ASSERT(sctp->sctp_current != NULL || sendto != NULL); 3170Sstevel@tonic-gate if (sendto == NULL) { 3180Sstevel@tonic-gate fp = sctp->sctp_current; 3190Sstevel@tonic-gate } else { 3200Sstevel@tonic-gate fp = sendto; 3210Sstevel@tonic-gate } 3220Sstevel@tonic-gate isv4 = fp->isv4; 3230Sstevel@tonic-gate 3240Sstevel@tonic-gate /* Try to look for another IRE again. */ 3254818Skcpoon if (fp->ire == NULL) { 3261735Skcpoon sctp_get_ire(sctp, fp); 3274818Skcpoon /* 3284818Skcpoon * Although we still may not get an IRE, the source address 3294818Skcpoon * may be changed in sctp_get_ire(). Set src_changed to 3304818Skcpoon * true so that the source address is copied again. 3314818Skcpoon */ 3324818Skcpoon src_changed = B_TRUE; 3334818Skcpoon } 3340Sstevel@tonic-gate 3350Sstevel@tonic-gate /* There is no suitable source address to use, return. 
*/ 3360Sstevel@tonic-gate if (fp->state == SCTP_FADDRS_UNREACH) 3370Sstevel@tonic-gate return (NULL); 3384818Skcpoon ASSERT(!IN6_IS_ADDR_V4MAPPED_ANY(&fp->saddr)); 3390Sstevel@tonic-gate 3400Sstevel@tonic-gate if (isv4) { 3410Sstevel@tonic-gate ipsctplen = sctp->sctp_hdr_len; 3420Sstevel@tonic-gate } else { 3430Sstevel@tonic-gate ipsctplen = sctp->sctp_hdr6_len; 3440Sstevel@tonic-gate } 3450Sstevel@tonic-gate 3463448Sdh155122 mp = allocb_cred(ipsctplen + sctps->sctps_wroff_xtra + trailer, 3471676Sjpk CONN_CRED(sctp->sctp_connp)); 3480Sstevel@tonic-gate if (mp == NULL) { 3491676Sjpk ip1dbg(("sctp_make_mp: error making mp..\n")); 3500Sstevel@tonic-gate return (NULL); 3510Sstevel@tonic-gate } 3523448Sdh155122 mp->b_rptr += sctps->sctps_wroff_xtra; 3530Sstevel@tonic-gate mp->b_wptr = mp->b_rptr + ipsctplen; 3540Sstevel@tonic-gate 3550Sstevel@tonic-gate ASSERT(OK_32PTR(mp->b_wptr)); 3560Sstevel@tonic-gate 3570Sstevel@tonic-gate if (isv4) { 3580Sstevel@tonic-gate ipha_t *iph = (ipha_t *)mp->b_rptr; 3590Sstevel@tonic-gate 3600Sstevel@tonic-gate bcopy(sctp->sctp_iphc, mp->b_rptr, ipsctplen); 3614818Skcpoon if (fp != sctp->sctp_current || src_changed) { 3624818Skcpoon /* Fix the source and destination addresses. */ 3630Sstevel@tonic-gate IN6_V4MAPPED_TO_IPADDR(&fp->faddr, iph->ipha_dst); 3644818Skcpoon IN6_V4MAPPED_TO_IPADDR(&fp->saddr, iph->ipha_src); 3650Sstevel@tonic-gate } 3660Sstevel@tonic-gate /* set or clear the don't fragment bit */ 3670Sstevel@tonic-gate if (fp->df) { 3680Sstevel@tonic-gate iph->ipha_fragment_offset_and_flags = htons(IPH_DF); 3690Sstevel@tonic-gate } else { 3700Sstevel@tonic-gate iph->ipha_fragment_offset_and_flags = 0; 3710Sstevel@tonic-gate } 3720Sstevel@tonic-gate } else { 3730Sstevel@tonic-gate bcopy(sctp->sctp_iphc6, mp->b_rptr, ipsctplen); 3744818Skcpoon if (fp != sctp->sctp_current || src_changed) { 3754818Skcpoon /* Fix the source and destination addresses. 
*/ 3760Sstevel@tonic-gate ((ip6_t *)(mp->b_rptr))->ip6_dst = fp->faddr; 3774818Skcpoon ((ip6_t *)(mp->b_rptr))->ip6_src = fp->saddr; 3780Sstevel@tonic-gate } 3790Sstevel@tonic-gate } 3800Sstevel@tonic-gate ASSERT(sctp->sctp_connp != NULL); 3810Sstevel@tonic-gate 3820Sstevel@tonic-gate /* 3830Sstevel@tonic-gate * IP will not free this IRE if it is condemned. SCTP needs to 3840Sstevel@tonic-gate * free it. 3850Sstevel@tonic-gate */ 3860Sstevel@tonic-gate if ((fp->ire != NULL) && (fp->ire->ire_marks & IRE_MARK_CONDEMNED)) { 3870Sstevel@tonic-gate IRE_REFRELE_NOTR(fp->ire); 3880Sstevel@tonic-gate fp->ire = NULL; 3890Sstevel@tonic-gate } 3900Sstevel@tonic-gate /* Stash the conn and ire ptr info. for IP */ 3910Sstevel@tonic-gate SCTP_STASH_IPINFO(mp, fp->ire); 3920Sstevel@tonic-gate 3930Sstevel@tonic-gate return (mp); 3940Sstevel@tonic-gate } 3950Sstevel@tonic-gate 3960Sstevel@tonic-gate /* 3970Sstevel@tonic-gate * Notify upper layers about preferred write offset, write size. 3980Sstevel@tonic-gate */ 3990Sstevel@tonic-gate void 4000Sstevel@tonic-gate sctp_set_ulp_prop(sctp_t *sctp) 4010Sstevel@tonic-gate { 4020Sstevel@tonic-gate int hdrlen; 4033448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 4040Sstevel@tonic-gate 4050Sstevel@tonic-gate if (sctp->sctp_current->isv4) { 4060Sstevel@tonic-gate hdrlen = sctp->sctp_hdr_len; 4070Sstevel@tonic-gate } else { 4080Sstevel@tonic-gate hdrlen = sctp->sctp_hdr6_len; 4090Sstevel@tonic-gate } 4100Sstevel@tonic-gate ASSERT(sctp->sctp_ulpd); 4110Sstevel@tonic-gate 4120Sstevel@tonic-gate ASSERT(sctp->sctp_current->sfa_pmss == sctp->sctp_mss); 4130Sstevel@tonic-gate sctp->sctp_ulp_prop(sctp->sctp_ulpd, 4143448Sdh155122 sctps->sctps_wroff_xtra + hdrlen + sizeof (sctp_data_hdr_t), 4150Sstevel@tonic-gate sctp->sctp_mss - sizeof (sctp_data_hdr_t)); 4160Sstevel@tonic-gate } 4170Sstevel@tonic-gate 4180Sstevel@tonic-gate void 4190Sstevel@tonic-gate sctp_set_iplen(sctp_t *sctp, mblk_t *mp) 4200Sstevel@tonic-gate { 4210Sstevel@tonic-gate 
uint16_t sum = 0; 4220Sstevel@tonic-gate ipha_t *iph; 4230Sstevel@tonic-gate ip6_t *ip6h; 4240Sstevel@tonic-gate mblk_t *pmp = mp; 4250Sstevel@tonic-gate boolean_t isv4; 4260Sstevel@tonic-gate 4270Sstevel@tonic-gate isv4 = (IPH_HDR_VERSION(mp->b_rptr) == IPV4_VERSION); 4280Sstevel@tonic-gate for (; pmp; pmp = pmp->b_cont) 4290Sstevel@tonic-gate sum += pmp->b_wptr - pmp->b_rptr; 4300Sstevel@tonic-gate 4310Sstevel@tonic-gate if (isv4) { 4320Sstevel@tonic-gate iph = (ipha_t *)mp->b_rptr; 4330Sstevel@tonic-gate iph->ipha_length = htons(sum); 4340Sstevel@tonic-gate } else { 4350Sstevel@tonic-gate ip6h = (ip6_t *)mp->b_rptr; 436679Sseb /* 437679Sseb * If an ip6i_t is present, the real IPv6 header 438679Sseb * immediately follows. 439679Sseb */ 440679Sseb if (ip6h->ip6_nxt == IPPROTO_RAW) 441679Sseb ip6h = (ip6_t *)&ip6h[1]; 4420Sstevel@tonic-gate ip6h->ip6_plen = htons(sum - ((char *)&sctp->sctp_ip6h[1] - 4430Sstevel@tonic-gate sctp->sctp_iphc6)); 4440Sstevel@tonic-gate } 4450Sstevel@tonic-gate } 4460Sstevel@tonic-gate 4470Sstevel@tonic-gate int 4480Sstevel@tonic-gate sctp_compare_faddrsets(sctp_faddr_t *a1, sctp_faddr_t *a2) 4490Sstevel@tonic-gate { 4500Sstevel@tonic-gate int na1 = 0; 4510Sstevel@tonic-gate int overlap = 0; 4520Sstevel@tonic-gate int equal = 1; 4530Sstevel@tonic-gate int onematch; 4540Sstevel@tonic-gate sctp_faddr_t *fp1, *fp2; 4550Sstevel@tonic-gate 4560Sstevel@tonic-gate for (fp1 = a1; fp1; fp1 = fp1->next) { 4570Sstevel@tonic-gate onematch = 0; 4580Sstevel@tonic-gate for (fp2 = a2; fp2; fp2 = fp2->next) { 4590Sstevel@tonic-gate if (IN6_ARE_ADDR_EQUAL(&fp1->faddr, &fp2->faddr)) { 4600Sstevel@tonic-gate overlap++; 4610Sstevel@tonic-gate onematch = 1; 4620Sstevel@tonic-gate break; 4630Sstevel@tonic-gate } 4640Sstevel@tonic-gate if (!onematch) { 4650Sstevel@tonic-gate equal = 0; 4660Sstevel@tonic-gate } 4670Sstevel@tonic-gate } 4680Sstevel@tonic-gate na1++; 4690Sstevel@tonic-gate } 4700Sstevel@tonic-gate 4710Sstevel@tonic-gate if (equal) { 
4720Sstevel@tonic-gate return (SCTP_ADDR_EQUAL); 4730Sstevel@tonic-gate } 4740Sstevel@tonic-gate if (overlap == na1) { 4750Sstevel@tonic-gate return (SCTP_ADDR_SUBSET); 4760Sstevel@tonic-gate } 4770Sstevel@tonic-gate if (overlap) { 4780Sstevel@tonic-gate return (SCTP_ADDR_OVERLAP); 4790Sstevel@tonic-gate } 4800Sstevel@tonic-gate return (SCTP_ADDR_DISJOINT); 4810Sstevel@tonic-gate } 4820Sstevel@tonic-gate 4830Sstevel@tonic-gate /* 4841735Skcpoon * Returns 0 on success, -1 on memory allocation failure. If sleep 4851735Skcpoon * is true, this function should never fail. The boolean parameter 4861735Skcpoon * first decides whether the newly created faddr structure should be 4871735Skcpoon * added at the beginning of the list or at the end. 4881735Skcpoon * 4891735Skcpoon * Note: caller must hold conn fanout lock. 4900Sstevel@tonic-gate */ 4911735Skcpoon int 4921735Skcpoon sctp_add_faddr(sctp_t *sctp, in6_addr_t *addr, int sleep, boolean_t first) 4930Sstevel@tonic-gate { 4941735Skcpoon sctp_faddr_t *faddr; 4951735Skcpoon mblk_t *timer_mp; 4960Sstevel@tonic-gate 4971676Sjpk if (is_system_labeled()) { 4981676Sjpk ts_label_t *tsl; 4991676Sjpk tsol_tpc_t *rhtp; 5001676Sjpk int retv; 5011676Sjpk 5021676Sjpk tsl = crgetlabel(CONN_CRED(sctp->sctp_connp)); 5031676Sjpk ASSERT(tsl != NULL); 5041676Sjpk 5051676Sjpk /* find_tpc automatically does the right thing with IPv4 */ 5061676Sjpk rhtp = find_tpc(addr, IPV6_VERSION, B_FALSE); 5071676Sjpk if (rhtp == NULL) 5081676Sjpk return (EACCES); 5090Sstevel@tonic-gate 5101676Sjpk retv = EACCES; 5111676Sjpk if (tsl->tsl_doi == rhtp->tpc_tp.tp_doi) { 5121676Sjpk switch (rhtp->tpc_tp.host_type) { 5131676Sjpk case UNLABELED: 5141676Sjpk /* 5151676Sjpk * Can talk to unlabeled hosts if any of the 5161676Sjpk * following are true: 5171676Sjpk * 1. zone's label matches the remote host's 5181676Sjpk * default label, 5191676Sjpk * 2. mac_exempt is on and the zone dominates 5201676Sjpk * the remote host's label, or 5211676Sjpk * 3. 
mac_exempt is on and the socket is from 5221676Sjpk * the global zone. 5231676Sjpk */ 5241676Sjpk if (blequal(&rhtp->tpc_tp.tp_def_label, 5251676Sjpk &tsl->tsl_label) || 5261676Sjpk (sctp->sctp_mac_exempt && 5271676Sjpk (sctp->sctp_zoneid == GLOBAL_ZONEID || 5281676Sjpk bldominates(&tsl->tsl_label, 5291676Sjpk &rhtp->tpc_tp.tp_def_label)))) 5301676Sjpk retv = 0; 5311676Sjpk break; 5321676Sjpk case SUN_CIPSO: 5331676Sjpk if (_blinrange(&tsl->tsl_label, 5341676Sjpk &rhtp->tpc_tp.tp_sl_range_cipso) || 5351676Sjpk blinlset(&tsl->tsl_label, 5361676Sjpk rhtp->tpc_tp.tp_sl_set_cipso)) 5371676Sjpk retv = 0; 5381676Sjpk break; 5391676Sjpk } 5401676Sjpk } 5411676Sjpk TPC_RELE(rhtp); 5421676Sjpk if (retv != 0) 5431676Sjpk return (retv); 5440Sstevel@tonic-gate } 5450Sstevel@tonic-gate 5461676Sjpk if ((faddr = kmem_cache_alloc(sctp_kmem_faddr_cache, sleep)) == NULL) 5471676Sjpk return (ENOMEM); 5484691Skcpoon timer_mp = sctp_timer_alloc((sctp), sctp_rexmit_timer, sleep); 5491735Skcpoon if (timer_mp == NULL) { 5501735Skcpoon kmem_cache_free(sctp_kmem_faddr_cache, faddr); 5511735Skcpoon return (ENOMEM); 5521735Skcpoon } 5531735Skcpoon ((sctpt_t *)(timer_mp->b_rptr))->sctpt_faddr = faddr; 5541676Sjpk 5551735Skcpoon sctp_init_faddr(sctp, faddr, addr, timer_mp); 5564818Skcpoon 5574818Skcpoon /* Check for subnet broadcast. 
*/ 5584818Skcpoon if (faddr->ire != NULL && faddr->ire->ire_type & IRE_BROADCAST) { 5594818Skcpoon IRE_REFRELE_NOTR(faddr->ire); 5604818Skcpoon sctp_timer_free(timer_mp); 5614818Skcpoon kmem_cache_free(sctp_kmem_faddr_cache, faddr); 5624818Skcpoon return (EADDRNOTAVAIL); 5634818Skcpoon } 5640Sstevel@tonic-gate ASSERT(faddr->next == NULL); 5650Sstevel@tonic-gate 5661676Sjpk if (sctp->sctp_faddrs == NULL) { 5671676Sjpk ASSERT(sctp->sctp_lastfaddr == NULL); 5681676Sjpk /* only element on list; first and last are same */ 5691676Sjpk sctp->sctp_faddrs = sctp->sctp_lastfaddr = faddr; 5701676Sjpk } else if (first) { 5711676Sjpk ASSERT(sctp->sctp_lastfaddr != NULL); 5721676Sjpk faddr->next = sctp->sctp_faddrs; 5731676Sjpk sctp->sctp_faddrs = faddr; 5740Sstevel@tonic-gate } else { 5751676Sjpk sctp->sctp_lastfaddr->next = faddr; 5761676Sjpk sctp->sctp_lastfaddr = faddr; 5770Sstevel@tonic-gate } 578852Svi117747 sctp->sctp_nfaddrs++; 5790Sstevel@tonic-gate 5800Sstevel@tonic-gate return (0); 5810Sstevel@tonic-gate } 5820Sstevel@tonic-gate 5830Sstevel@tonic-gate sctp_faddr_t * 5840Sstevel@tonic-gate sctp_lookup_faddr(sctp_t *sctp, in6_addr_t *addr) 5850Sstevel@tonic-gate { 5860Sstevel@tonic-gate sctp_faddr_t *fp; 5870Sstevel@tonic-gate 5880Sstevel@tonic-gate for (fp = sctp->sctp_faddrs; fp != NULL; fp = fp->next) { 5890Sstevel@tonic-gate if (IN6_ARE_ADDR_EQUAL(&fp->faddr, addr)) 5900Sstevel@tonic-gate break; 5910Sstevel@tonic-gate } 5920Sstevel@tonic-gate 5930Sstevel@tonic-gate return (fp); 5940Sstevel@tonic-gate } 5950Sstevel@tonic-gate 5960Sstevel@tonic-gate sctp_faddr_t * 5970Sstevel@tonic-gate sctp_lookup_faddr_nosctp(sctp_faddr_t *fp, in6_addr_t *addr) 5980Sstevel@tonic-gate { 5990Sstevel@tonic-gate for (; fp; fp = fp->next) { 6000Sstevel@tonic-gate if (IN6_ARE_ADDR_EQUAL(&fp->faddr, addr)) { 6010Sstevel@tonic-gate break; 6020Sstevel@tonic-gate } 6030Sstevel@tonic-gate } 6040Sstevel@tonic-gate 6050Sstevel@tonic-gate return (fp); 6060Sstevel@tonic-gate } 
6070Sstevel@tonic-gate 6081735Skcpoon /* 6091735Skcpoon * To change the currently used peer address to the specified one. 6101735Skcpoon */ 6110Sstevel@tonic-gate void 6121735Skcpoon sctp_set_faddr_current(sctp_t *sctp, sctp_faddr_t *fp) 6130Sstevel@tonic-gate { 6141735Skcpoon /* Now setup the composite header. */ 6150Sstevel@tonic-gate if (fp->isv4) { 6160Sstevel@tonic-gate IN6_V4MAPPED_TO_IPADDR(&fp->faddr, 6170Sstevel@tonic-gate sctp->sctp_ipha->ipha_dst); 6180Sstevel@tonic-gate IN6_V4MAPPED_TO_IPADDR(&fp->saddr, sctp->sctp_ipha->ipha_src); 6190Sstevel@tonic-gate /* update don't fragment bit */ 6200Sstevel@tonic-gate if (fp->df) { 6210Sstevel@tonic-gate sctp->sctp_ipha->ipha_fragment_offset_and_flags = 6220Sstevel@tonic-gate htons(IPH_DF); 6230Sstevel@tonic-gate } else { 6240Sstevel@tonic-gate sctp->sctp_ipha->ipha_fragment_offset_and_flags = 0; 6250Sstevel@tonic-gate } 6260Sstevel@tonic-gate } else { 6270Sstevel@tonic-gate sctp->sctp_ip6h->ip6_dst = fp->faddr; 6280Sstevel@tonic-gate sctp->sctp_ip6h->ip6_src = fp->saddr; 6290Sstevel@tonic-gate } 6301735Skcpoon 6311735Skcpoon sctp->sctp_current = fp; 6321735Skcpoon sctp->sctp_mss = fp->sfa_pmss; 6331735Skcpoon 6341735Skcpoon /* Update the uppper layer for the change. 
*/ 6351735Skcpoon if (!SCTP_IS_DETACHED(sctp)) 6361735Skcpoon sctp_set_ulp_prop(sctp); 6370Sstevel@tonic-gate } 6380Sstevel@tonic-gate 6390Sstevel@tonic-gate void 6400Sstevel@tonic-gate sctp_redo_faddr_srcs(sctp_t *sctp) 6410Sstevel@tonic-gate { 6420Sstevel@tonic-gate sctp_faddr_t *fp; 6430Sstevel@tonic-gate 6440Sstevel@tonic-gate for (fp = sctp->sctp_faddrs; fp != NULL; fp = fp->next) { 6451735Skcpoon sctp_get_ire(sctp, fp); 6460Sstevel@tonic-gate } 6470Sstevel@tonic-gate } 6480Sstevel@tonic-gate 6490Sstevel@tonic-gate void 6500Sstevel@tonic-gate sctp_faddr_alive(sctp_t *sctp, sctp_faddr_t *fp) 6510Sstevel@tonic-gate { 6520Sstevel@tonic-gate int64_t now = lbolt64; 6530Sstevel@tonic-gate 6540Sstevel@tonic-gate fp->strikes = 0; 6550Sstevel@tonic-gate sctp->sctp_strikes = 0; 6560Sstevel@tonic-gate fp->lastactive = now; 6570Sstevel@tonic-gate fp->hb_expiry = now + SET_HB_INTVL(fp); 6580Sstevel@tonic-gate fp->hb_pending = B_FALSE; 6590Sstevel@tonic-gate if (fp->state != SCTP_FADDRS_ALIVE) { 6600Sstevel@tonic-gate fp->state = SCTP_FADDRS_ALIVE; 6610Sstevel@tonic-gate sctp_intf_event(sctp, fp->faddr, SCTP_ADDR_AVAILABLE, 0); 6624818Skcpoon /* Should have a full IRE now */ 6634818Skcpoon sctp_get_ire(sctp, fp); 6640Sstevel@tonic-gate 6651735Skcpoon /* 6661735Skcpoon * If this is the primary, switch back to it now. And 6671735Skcpoon * we probably want to reset the source addr used to reach 6681735Skcpoon * it. 
6691735Skcpoon */ 6700Sstevel@tonic-gate if (fp == sctp->sctp_primary) { 6714818Skcpoon ASSERT(fp->state != SCTP_FADDRS_UNREACH); 6721735Skcpoon sctp_set_faddr_current(sctp, fp); 6731735Skcpoon return; 6740Sstevel@tonic-gate } 6750Sstevel@tonic-gate } 6760Sstevel@tonic-gate } 6770Sstevel@tonic-gate 6780Sstevel@tonic-gate int 6790Sstevel@tonic-gate sctp_is_a_faddr_clean(sctp_t *sctp) 6800Sstevel@tonic-gate { 6810Sstevel@tonic-gate sctp_faddr_t *fp; 6820Sstevel@tonic-gate 6830Sstevel@tonic-gate for (fp = sctp->sctp_faddrs; fp; fp = fp->next) { 6840Sstevel@tonic-gate if (fp->state == SCTP_FADDRS_ALIVE && fp->strikes == 0) { 6850Sstevel@tonic-gate return (1); 6860Sstevel@tonic-gate } 6870Sstevel@tonic-gate } 6880Sstevel@tonic-gate 6890Sstevel@tonic-gate return (0); 6900Sstevel@tonic-gate } 6910Sstevel@tonic-gate 6920Sstevel@tonic-gate /* 6930Sstevel@tonic-gate * Returns 0 if there is at leave one other active faddr, -1 if there 6940Sstevel@tonic-gate * are none. If there are none left, faddr_dead() will start killing the 6950Sstevel@tonic-gate * association. 6960Sstevel@tonic-gate * If the downed faddr was the current faddr, a new current faddr 6970Sstevel@tonic-gate * will be chosen. 
6980Sstevel@tonic-gate */ 6990Sstevel@tonic-gate int 7000Sstevel@tonic-gate sctp_faddr_dead(sctp_t *sctp, sctp_faddr_t *fp, int newstate) 7010Sstevel@tonic-gate { 7020Sstevel@tonic-gate sctp_faddr_t *ofp; 7033448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 7040Sstevel@tonic-gate 7050Sstevel@tonic-gate if (fp->state == SCTP_FADDRS_ALIVE) { 7060Sstevel@tonic-gate sctp_intf_event(sctp, fp->faddr, SCTP_ADDR_UNREACHABLE, 0); 7070Sstevel@tonic-gate } 7080Sstevel@tonic-gate fp->state = newstate; 7090Sstevel@tonic-gate 7100Sstevel@tonic-gate dprint(1, ("sctp_faddr_dead: %x:%x:%x:%x down (state=%d)\n", 7110Sstevel@tonic-gate SCTP_PRINTADDR(fp->faddr), newstate)); 7120Sstevel@tonic-gate 7130Sstevel@tonic-gate if (fp == sctp->sctp_current) { 7140Sstevel@tonic-gate /* Current faddr down; need to switch it */ 7150Sstevel@tonic-gate sctp->sctp_current = NULL; 7160Sstevel@tonic-gate } 7170Sstevel@tonic-gate 7180Sstevel@tonic-gate /* Find next alive faddr */ 7190Sstevel@tonic-gate ofp = fp; 7201735Skcpoon for (fp = fp->next; fp != NULL; fp = fp->next) { 7210Sstevel@tonic-gate if (fp->state == SCTP_FADDRS_ALIVE) { 7220Sstevel@tonic-gate break; 7230Sstevel@tonic-gate } 7240Sstevel@tonic-gate } 7250Sstevel@tonic-gate 7260Sstevel@tonic-gate if (fp == NULL) { 7270Sstevel@tonic-gate /* Continue from beginning of list */ 7280Sstevel@tonic-gate for (fp = sctp->sctp_faddrs; fp != ofp; fp = fp->next) { 7290Sstevel@tonic-gate if (fp->state == SCTP_FADDRS_ALIVE) { 7300Sstevel@tonic-gate break; 7310Sstevel@tonic-gate } 7320Sstevel@tonic-gate } 7330Sstevel@tonic-gate } 7340Sstevel@tonic-gate 7351735Skcpoon /* 7361735Skcpoon * Find a new fp, so if the current faddr is dead, use the new fp 7371735Skcpoon * as the current one. 
7381735Skcpoon */ 7390Sstevel@tonic-gate if (fp != ofp) { 7400Sstevel@tonic-gate if (sctp->sctp_current == NULL) { 7410Sstevel@tonic-gate dprint(1, ("sctp_faddr_dead: failover->%x:%x:%x:%x\n", 7420Sstevel@tonic-gate SCTP_PRINTADDR(fp->faddr))); 7431735Skcpoon /* 7441735Skcpoon * Note that we don't need to reset the source addr 7451735Skcpoon * of the new fp. 7461735Skcpoon */ 7471735Skcpoon sctp_set_faddr_current(sctp, fp); 7480Sstevel@tonic-gate } 7490Sstevel@tonic-gate return (0); 7500Sstevel@tonic-gate } 7510Sstevel@tonic-gate 7520Sstevel@tonic-gate 7530Sstevel@tonic-gate /* All faddrs are down; kill the association */ 7540Sstevel@tonic-gate dprint(1, ("sctp_faddr_dead: all faddrs down, killing assoc\n")); 7553448Sdh155122 BUMP_MIB(&sctps->sctps_mib, sctpAborted); 7560Sstevel@tonic-gate sctp_assoc_event(sctp, sctp->sctp_state < SCTPS_ESTABLISHED ? 7570Sstevel@tonic-gate SCTP_CANT_STR_ASSOC : SCTP_COMM_LOST, 0, NULL); 7580Sstevel@tonic-gate sctp_clean_death(sctp, sctp->sctp_client_errno ? 
7590Sstevel@tonic-gate sctp->sctp_client_errno : ETIMEDOUT); 7600Sstevel@tonic-gate 7610Sstevel@tonic-gate return (-1); 7620Sstevel@tonic-gate } 7630Sstevel@tonic-gate 7640Sstevel@tonic-gate sctp_faddr_t * 7650Sstevel@tonic-gate sctp_rotate_faddr(sctp_t *sctp, sctp_faddr_t *ofp) 7660Sstevel@tonic-gate { 7670Sstevel@tonic-gate sctp_faddr_t *nfp = NULL; 7680Sstevel@tonic-gate 7690Sstevel@tonic-gate if (ofp == NULL) { 7700Sstevel@tonic-gate ofp = sctp->sctp_current; 7710Sstevel@tonic-gate } 7720Sstevel@tonic-gate 7730Sstevel@tonic-gate /* Find the next live one */ 7740Sstevel@tonic-gate for (nfp = ofp->next; nfp != NULL; nfp = nfp->next) { 7750Sstevel@tonic-gate if (nfp->state == SCTP_FADDRS_ALIVE) { 7760Sstevel@tonic-gate break; 7770Sstevel@tonic-gate } 7780Sstevel@tonic-gate } 7790Sstevel@tonic-gate 7800Sstevel@tonic-gate if (nfp == NULL) { 7810Sstevel@tonic-gate /* Continue from beginning of list */ 7820Sstevel@tonic-gate for (nfp = sctp->sctp_faddrs; nfp != ofp; nfp = nfp->next) { 7830Sstevel@tonic-gate if (nfp->state == SCTP_FADDRS_ALIVE) { 7840Sstevel@tonic-gate break; 7850Sstevel@tonic-gate } 7860Sstevel@tonic-gate } 7870Sstevel@tonic-gate } 7880Sstevel@tonic-gate 7890Sstevel@tonic-gate /* 7900Sstevel@tonic-gate * nfp could only be NULL if all faddrs are down, and when 7910Sstevel@tonic-gate * this happens, faddr_dead() should have killed the 7920Sstevel@tonic-gate * association. Hence this assertion... 
7930Sstevel@tonic-gate */ 7940Sstevel@tonic-gate ASSERT(nfp != NULL); 7950Sstevel@tonic-gate return (nfp); 7960Sstevel@tonic-gate } 7970Sstevel@tonic-gate 7980Sstevel@tonic-gate void 7990Sstevel@tonic-gate sctp_unlink_faddr(sctp_t *sctp, sctp_faddr_t *fp) 8000Sstevel@tonic-gate { 8010Sstevel@tonic-gate sctp_faddr_t *fpp; 8020Sstevel@tonic-gate 8030Sstevel@tonic-gate if (!sctp->sctp_faddrs) { 8040Sstevel@tonic-gate return; 8050Sstevel@tonic-gate } 8060Sstevel@tonic-gate 8070Sstevel@tonic-gate if (fp->timer_mp != NULL) { 8080Sstevel@tonic-gate sctp_timer_free(fp->timer_mp); 8090Sstevel@tonic-gate fp->timer_mp = NULL; 8100Sstevel@tonic-gate fp->timer_running = 0; 8110Sstevel@tonic-gate } 8120Sstevel@tonic-gate if (fp->rc_timer_mp != NULL) { 8130Sstevel@tonic-gate sctp_timer_free(fp->rc_timer_mp); 8140Sstevel@tonic-gate fp->rc_timer_mp = NULL; 8150Sstevel@tonic-gate fp->rc_timer_running = 0; 8160Sstevel@tonic-gate } 8170Sstevel@tonic-gate if (fp->ire != NULL) { 8180Sstevel@tonic-gate IRE_REFRELE_NOTR(fp->ire); 8190Sstevel@tonic-gate fp->ire = NULL; 8200Sstevel@tonic-gate } 8210Sstevel@tonic-gate 8220Sstevel@tonic-gate if (fp == sctp->sctp_faddrs) { 8230Sstevel@tonic-gate goto gotit; 8240Sstevel@tonic-gate } 8250Sstevel@tonic-gate 8260Sstevel@tonic-gate for (fpp = sctp->sctp_faddrs; fpp->next != fp; fpp = fpp->next) 8270Sstevel@tonic-gate ; 8280Sstevel@tonic-gate 8290Sstevel@tonic-gate gotit: 8300Sstevel@tonic-gate ASSERT(sctp->sctp_conn_tfp != NULL); 8310Sstevel@tonic-gate mutex_enter(&sctp->sctp_conn_tfp->tf_lock); 8320Sstevel@tonic-gate if (fp == sctp->sctp_faddrs) { 8330Sstevel@tonic-gate sctp->sctp_faddrs = fp->next; 8340Sstevel@tonic-gate } else { 8350Sstevel@tonic-gate fpp->next = fp->next; 8360Sstevel@tonic-gate } 8370Sstevel@tonic-gate mutex_exit(&sctp->sctp_conn_tfp->tf_lock); 8380Sstevel@tonic-gate /* XXX faddr2ire? 
*/ 8390Sstevel@tonic-gate kmem_cache_free(sctp_kmem_faddr_cache, fp); 840852Svi117747 sctp->sctp_nfaddrs--; 8410Sstevel@tonic-gate } 8420Sstevel@tonic-gate 8430Sstevel@tonic-gate void 8440Sstevel@tonic-gate sctp_zap_faddrs(sctp_t *sctp, int caller_holds_lock) 8450Sstevel@tonic-gate { 8460Sstevel@tonic-gate sctp_faddr_t *fp, *fpn; 8470Sstevel@tonic-gate 8480Sstevel@tonic-gate if (sctp->sctp_faddrs == NULL) { 8490Sstevel@tonic-gate ASSERT(sctp->sctp_lastfaddr == NULL); 8500Sstevel@tonic-gate return; 8510Sstevel@tonic-gate } 8520Sstevel@tonic-gate 8530Sstevel@tonic-gate ASSERT(sctp->sctp_lastfaddr != NULL); 8540Sstevel@tonic-gate sctp->sctp_lastfaddr = NULL; 8550Sstevel@tonic-gate sctp->sctp_current = NULL; 8560Sstevel@tonic-gate sctp->sctp_primary = NULL; 8570Sstevel@tonic-gate 8580Sstevel@tonic-gate sctp_free_faddr_timers(sctp); 8590Sstevel@tonic-gate 8600Sstevel@tonic-gate if (sctp->sctp_conn_tfp != NULL && !caller_holds_lock) { 8610Sstevel@tonic-gate /* in conn fanout; need to hold lock */ 8620Sstevel@tonic-gate mutex_enter(&sctp->sctp_conn_tfp->tf_lock); 8630Sstevel@tonic-gate } 8640Sstevel@tonic-gate 8650Sstevel@tonic-gate for (fp = sctp->sctp_faddrs; fp; fp = fpn) { 8660Sstevel@tonic-gate fpn = fp->next; 8670Sstevel@tonic-gate if (fp->ire != NULL) 8680Sstevel@tonic-gate IRE_REFRELE_NOTR(fp->ire); 8690Sstevel@tonic-gate kmem_cache_free(sctp_kmem_faddr_cache, fp); 870852Svi117747 sctp->sctp_nfaddrs--; 8710Sstevel@tonic-gate } 8720Sstevel@tonic-gate 8730Sstevel@tonic-gate sctp->sctp_faddrs = NULL; 874852Svi117747 ASSERT(sctp->sctp_nfaddrs == 0); 8750Sstevel@tonic-gate if (sctp->sctp_conn_tfp != NULL && !caller_holds_lock) { 8760Sstevel@tonic-gate mutex_exit(&sctp->sctp_conn_tfp->tf_lock); 8770Sstevel@tonic-gate } 8780Sstevel@tonic-gate 8790Sstevel@tonic-gate } 8800Sstevel@tonic-gate 8810Sstevel@tonic-gate void 8820Sstevel@tonic-gate sctp_zap_addrs(sctp_t *sctp) 8830Sstevel@tonic-gate { 8840Sstevel@tonic-gate sctp_zap_faddrs(sctp, 0); 8850Sstevel@tonic-gate 
sctp_free_saddrs(sctp); 8860Sstevel@tonic-gate } 8870Sstevel@tonic-gate 8880Sstevel@tonic-gate /* 8890Sstevel@tonic-gate * Initialize the IPv4 header. Loses any record of any IP options. 8900Sstevel@tonic-gate */ 8910Sstevel@tonic-gate int 8920Sstevel@tonic-gate sctp_header_init_ipv4(sctp_t *sctp, int sleep) 8930Sstevel@tonic-gate { 8940Sstevel@tonic-gate sctp_hdr_t *sctph; 8953448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 8960Sstevel@tonic-gate 8970Sstevel@tonic-gate /* 8980Sstevel@tonic-gate * This is a simple initialization. If there's 8990Sstevel@tonic-gate * already a template, it should never be too small, 9000Sstevel@tonic-gate * so reuse it. Otherwise, allocate space for the new one. 9010Sstevel@tonic-gate */ 9020Sstevel@tonic-gate if (sctp->sctp_iphc != NULL) { 9030Sstevel@tonic-gate ASSERT(sctp->sctp_iphc_len >= SCTP_MAX_COMBINED_HEADER_LENGTH); 9040Sstevel@tonic-gate bzero(sctp->sctp_iphc, sctp->sctp_iphc_len); 9050Sstevel@tonic-gate } else { 9060Sstevel@tonic-gate sctp->sctp_iphc_len = SCTP_MAX_COMBINED_HEADER_LENGTH; 9070Sstevel@tonic-gate sctp->sctp_iphc = kmem_zalloc(sctp->sctp_iphc_len, sleep); 9080Sstevel@tonic-gate if (sctp->sctp_iphc == NULL) { 9090Sstevel@tonic-gate sctp->sctp_iphc_len = 0; 9100Sstevel@tonic-gate return (ENOMEM); 9110Sstevel@tonic-gate } 9120Sstevel@tonic-gate } 9130Sstevel@tonic-gate 9140Sstevel@tonic-gate sctp->sctp_ipha = (ipha_t *)sctp->sctp_iphc; 9150Sstevel@tonic-gate 9160Sstevel@tonic-gate sctp->sctp_hdr_len = sizeof (ipha_t) + sizeof (sctp_hdr_t); 9170Sstevel@tonic-gate sctp->sctp_ip_hdr_len = sizeof (ipha_t); 9180Sstevel@tonic-gate sctp->sctp_ipha->ipha_length = htons(sizeof (ipha_t) + 9190Sstevel@tonic-gate sizeof (sctp_hdr_t)); 9204691Skcpoon sctp->sctp_ipha->ipha_version_and_hdr_length = 9214691Skcpoon (IP_VERSION << 4) | IP_SIMPLE_HDR_LENGTH_IN_WORDS; 9220Sstevel@tonic-gate 9230Sstevel@tonic-gate /* 9240Sstevel@tonic-gate * These two fields should be zero, and are already set above. 
9250Sstevel@tonic-gate * 9260Sstevel@tonic-gate * sctp->sctp_ipha->ipha_ident, 9270Sstevel@tonic-gate * sctp->sctp_ipha->ipha_fragment_offset_and_flags. 9280Sstevel@tonic-gate */ 9290Sstevel@tonic-gate 9303448Sdh155122 sctp->sctp_ipha->ipha_ttl = sctps->sctps_ipv4_ttl; 9310Sstevel@tonic-gate sctp->sctp_ipha->ipha_protocol = IPPROTO_SCTP; 9320Sstevel@tonic-gate 9330Sstevel@tonic-gate sctph = (sctp_hdr_t *)(sctp->sctp_iphc + sizeof (ipha_t)); 9340Sstevel@tonic-gate sctp->sctp_sctph = sctph; 9350Sstevel@tonic-gate 9360Sstevel@tonic-gate return (0); 9370Sstevel@tonic-gate } 9380Sstevel@tonic-gate 9390Sstevel@tonic-gate /* 9400Sstevel@tonic-gate * Update sctp_sticky_hdrs based on sctp_sticky_ipp. 9410Sstevel@tonic-gate * The headers include ip6i_t (if needed), ip6_t, any sticky extension 9420Sstevel@tonic-gate * headers, and the maximum size sctp header (to avoid reallocation 9430Sstevel@tonic-gate * on the fly for additional sctp options). 9440Sstevel@tonic-gate * Returns failure if can't allocate memory. 
9450Sstevel@tonic-gate */ 9460Sstevel@tonic-gate int 9470Sstevel@tonic-gate sctp_build_hdrs(sctp_t *sctp) 9480Sstevel@tonic-gate { 9490Sstevel@tonic-gate char *hdrs; 9500Sstevel@tonic-gate uint_t hdrs_len; 9510Sstevel@tonic-gate ip6i_t *ip6i; 9520Sstevel@tonic-gate char buf[SCTP_MAX_HDR_LENGTH]; 9530Sstevel@tonic-gate ip6_pkt_t *ipp = &sctp->sctp_sticky_ipp; 9540Sstevel@tonic-gate in6_addr_t src; 9550Sstevel@tonic-gate in6_addr_t dst; 9563448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 9571676Sjpk 9580Sstevel@tonic-gate /* 9590Sstevel@tonic-gate * save the existing sctp header and source/dest IP addresses 9600Sstevel@tonic-gate */ 9610Sstevel@tonic-gate bcopy(sctp->sctp_sctph6, buf, sizeof (sctp_hdr_t)); 9620Sstevel@tonic-gate src = sctp->sctp_ip6h->ip6_src; 9630Sstevel@tonic-gate dst = sctp->sctp_ip6h->ip6_dst; 9640Sstevel@tonic-gate hdrs_len = ip_total_hdrs_len_v6(ipp) + SCTP_MAX_HDR_LENGTH; 9650Sstevel@tonic-gate ASSERT(hdrs_len != 0); 9660Sstevel@tonic-gate if (hdrs_len > sctp->sctp_iphc6_len) { 9670Sstevel@tonic-gate /* Need to reallocate */ 9680Sstevel@tonic-gate hdrs = kmem_zalloc(hdrs_len, KM_NOSLEEP); 9690Sstevel@tonic-gate if (hdrs == NULL) 9700Sstevel@tonic-gate return (ENOMEM); 9710Sstevel@tonic-gate 9720Sstevel@tonic-gate if (sctp->sctp_iphc6_len != 0) 9730Sstevel@tonic-gate kmem_free(sctp->sctp_iphc6, sctp->sctp_iphc6_len); 9740Sstevel@tonic-gate sctp->sctp_iphc6 = hdrs; 9750Sstevel@tonic-gate sctp->sctp_iphc6_len = hdrs_len; 9760Sstevel@tonic-gate } 9770Sstevel@tonic-gate ip_build_hdrs_v6((uchar_t *)sctp->sctp_iphc6, 9780Sstevel@tonic-gate hdrs_len - SCTP_MAX_HDR_LENGTH, ipp, IPPROTO_SCTP); 9790Sstevel@tonic-gate 9800Sstevel@tonic-gate /* Set header fields not in ipp */ 9810Sstevel@tonic-gate if (ipp->ipp_fields & IPPF_HAS_IP6I) { 9820Sstevel@tonic-gate ip6i = (ip6i_t *)sctp->sctp_iphc6; 9830Sstevel@tonic-gate sctp->sctp_ip6h = (ip6_t *)&ip6i[1]; 9840Sstevel@tonic-gate } else { 9850Sstevel@tonic-gate sctp->sctp_ip6h = (ip6_t *)sctp->sctp_iphc6; 
9860Sstevel@tonic-gate } 9870Sstevel@tonic-gate /* 9880Sstevel@tonic-gate * sctp->sctp_ip_hdr_len will include ip6i_t if there is one. 9890Sstevel@tonic-gate */ 9900Sstevel@tonic-gate sctp->sctp_ip_hdr6_len = hdrs_len - SCTP_MAX_HDR_LENGTH; 9910Sstevel@tonic-gate sctp->sctp_sctph6 = (sctp_hdr_t *)(sctp->sctp_iphc6 + 9920Sstevel@tonic-gate sctp->sctp_ip_hdr6_len); 9930Sstevel@tonic-gate sctp->sctp_hdr6_len = sctp->sctp_ip_hdr6_len + sizeof (sctp_hdr_t); 9940Sstevel@tonic-gate 9950Sstevel@tonic-gate bcopy(buf, sctp->sctp_sctph6, sizeof (sctp_hdr_t)); 9960Sstevel@tonic-gate 9970Sstevel@tonic-gate sctp->sctp_ip6h->ip6_src = src; 9980Sstevel@tonic-gate sctp->sctp_ip6h->ip6_dst = dst; 9990Sstevel@tonic-gate /* 1000679Sseb * If the hoplimit was not set by ip_build_hdrs_v6(), we need to 1001679Sseb * set it to the default value for SCTP. 10020Sstevel@tonic-gate */ 1003679Sseb if (!(ipp->ipp_fields & IPPF_UNICAST_HOPS)) 10043448Sdh155122 sctp->sctp_ip6h->ip6_hops = sctps->sctps_ipv6_hoplimit; 10050Sstevel@tonic-gate /* 10060Sstevel@tonic-gate * If we're setting extension headers after a connection 10070Sstevel@tonic-gate * has been established, and if we have a routing header 10080Sstevel@tonic-gate * among the extension headers, call ip_massage_options_v6 to 10090Sstevel@tonic-gate * manipulate the routing header/ip6_dst set the checksum 10100Sstevel@tonic-gate * difference in the sctp header template. 10110Sstevel@tonic-gate * (This happens in sctp_connect_ipv6 if the routing header 10120Sstevel@tonic-gate * is set prior to the connect.) 
10130Sstevel@tonic-gate */ 10140Sstevel@tonic-gate 10150Sstevel@tonic-gate if ((sctp->sctp_state >= SCTPS_COOKIE_WAIT) && 10160Sstevel@tonic-gate (sctp->sctp_sticky_ipp.ipp_fields & IPPF_RTHDR)) { 10170Sstevel@tonic-gate ip6_rthdr_t *rth; 10180Sstevel@tonic-gate 10190Sstevel@tonic-gate rth = ip_find_rthdr_v6(sctp->sctp_ip6h, 10200Sstevel@tonic-gate (uint8_t *)sctp->sctp_sctph6); 10213448Sdh155122 if (rth != NULL) { 10223448Sdh155122 (void) ip_massage_options_v6(sctp->sctp_ip6h, rth, 10233448Sdh155122 sctps->sctps_netstack); 10243448Sdh155122 } 10250Sstevel@tonic-gate } 10260Sstevel@tonic-gate return (0); 10270Sstevel@tonic-gate } 10280Sstevel@tonic-gate 10290Sstevel@tonic-gate /* 10300Sstevel@tonic-gate * Initialize the IPv6 header. Loses any record of any IPv6 extension headers. 10310Sstevel@tonic-gate */ 10320Sstevel@tonic-gate int 10330Sstevel@tonic-gate sctp_header_init_ipv6(sctp_t *sctp, int sleep) 10340Sstevel@tonic-gate { 10350Sstevel@tonic-gate sctp_hdr_t *sctph; 10363448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 10370Sstevel@tonic-gate 10380Sstevel@tonic-gate /* 10390Sstevel@tonic-gate * This is a simple initialization. If there's 10400Sstevel@tonic-gate * already a template, it should never be too small, 10410Sstevel@tonic-gate * so reuse it. Otherwise, allocate space for the new one. 10420Sstevel@tonic-gate * Ensure that there is enough space to "downgrade" the sctp_t 10430Sstevel@tonic-gate * to an IPv4 sctp_t. 
This requires having space for a full load 10440Sstevel@tonic-gate * of IPv4 options 10450Sstevel@tonic-gate */ 10460Sstevel@tonic-gate if (sctp->sctp_iphc6 != NULL) { 10470Sstevel@tonic-gate ASSERT(sctp->sctp_iphc6_len >= 10480Sstevel@tonic-gate SCTP_MAX_COMBINED_HEADER_LENGTH); 10490Sstevel@tonic-gate bzero(sctp->sctp_iphc6, sctp->sctp_iphc6_len); 10500Sstevel@tonic-gate } else { 10510Sstevel@tonic-gate sctp->sctp_iphc6_len = SCTP_MAX_COMBINED_HEADER_LENGTH; 10520Sstevel@tonic-gate sctp->sctp_iphc6 = kmem_zalloc(sctp->sctp_iphc_len, sleep); 10530Sstevel@tonic-gate if (sctp->sctp_iphc6 == NULL) { 10540Sstevel@tonic-gate sctp->sctp_iphc6_len = 0; 10550Sstevel@tonic-gate return (ENOMEM); 10560Sstevel@tonic-gate } 10570Sstevel@tonic-gate } 10580Sstevel@tonic-gate sctp->sctp_hdr6_len = IPV6_HDR_LEN + sizeof (sctp_hdr_t); 10590Sstevel@tonic-gate sctp->sctp_ip_hdr6_len = IPV6_HDR_LEN; 10600Sstevel@tonic-gate sctp->sctp_ip6h = (ip6_t *)sctp->sctp_iphc6; 10610Sstevel@tonic-gate 10620Sstevel@tonic-gate /* Initialize the header template */ 10630Sstevel@tonic-gate 10640Sstevel@tonic-gate sctp->sctp_ip6h->ip6_vcf = IPV6_DEFAULT_VERS_AND_FLOW; 10650Sstevel@tonic-gate sctp->sctp_ip6h->ip6_plen = ntohs(sizeof (sctp_hdr_t)); 10660Sstevel@tonic-gate sctp->sctp_ip6h->ip6_nxt = IPPROTO_SCTP; 10673448Sdh155122 sctp->sctp_ip6h->ip6_hops = sctps->sctps_ipv6_hoplimit; 10680Sstevel@tonic-gate 10690Sstevel@tonic-gate sctph = (sctp_hdr_t *)(sctp->sctp_iphc6 + IPV6_HDR_LEN); 10700Sstevel@tonic-gate sctp->sctp_sctph6 = sctph; 10710Sstevel@tonic-gate 10720Sstevel@tonic-gate return (0); 10730Sstevel@tonic-gate } 10740Sstevel@tonic-gate 10751676Sjpk static int 10761676Sjpk sctp_v4_label(sctp_t *sctp) 10771676Sjpk { 10781676Sjpk uchar_t optbuf[IP_MAX_OPT_LENGTH]; 10791676Sjpk const cred_t *cr = CONN_CRED(sctp->sctp_connp); 10801676Sjpk int added; 10811676Sjpk 10821676Sjpk if (tsol_compute_label(cr, sctp->sctp_ipha->ipha_dst, optbuf, 10833448Sdh155122 sctp->sctp_mac_exempt, 10843448Sdh155122 
sctp->sctp_sctps->sctps_netstack->netstack_ip) != 0) 10851676Sjpk return (EACCES); 10861676Sjpk 10871676Sjpk added = tsol_remove_secopt(sctp->sctp_ipha, sctp->sctp_hdr_len); 10881676Sjpk if (added == -1) 10891676Sjpk return (EACCES); 10901676Sjpk sctp->sctp_hdr_len += added; 10911676Sjpk sctp->sctp_sctph = (sctp_hdr_t *)((uchar_t *)sctp->sctp_sctph + added); 10921676Sjpk sctp->sctp_ip_hdr_len += added; 10931676Sjpk if ((sctp->sctp_v4label_len = optbuf[IPOPT_OLEN]) != 0) { 10941676Sjpk sctp->sctp_v4label_len = (sctp->sctp_v4label_len + 3) & ~3; 10951676Sjpk added = tsol_prepend_option(optbuf, sctp->sctp_ipha, 10961676Sjpk sctp->sctp_hdr_len); 10971676Sjpk if (added == -1) 10981676Sjpk return (EACCES); 10991676Sjpk sctp->sctp_hdr_len += added; 11001676Sjpk sctp->sctp_sctph = (sctp_hdr_t *)((uchar_t *)sctp->sctp_sctph + 11011676Sjpk added); 11021676Sjpk sctp->sctp_ip_hdr_len += added; 11031676Sjpk } 11041676Sjpk return (0); 11051676Sjpk } 11061676Sjpk 11071676Sjpk static int 11081676Sjpk sctp_v6_label(sctp_t *sctp) 11091676Sjpk { 11101676Sjpk uchar_t optbuf[TSOL_MAX_IPV6_OPTION]; 11111676Sjpk const cred_t *cr = CONN_CRED(sctp->sctp_connp); 11121676Sjpk 11131676Sjpk if (tsol_compute_label_v6(cr, &sctp->sctp_ip6h->ip6_dst, optbuf, 11143448Sdh155122 sctp->sctp_mac_exempt, 11153448Sdh155122 sctp->sctp_sctps->sctps_netstack->netstack_ip) != 0) 11161676Sjpk return (EACCES); 11171676Sjpk if (tsol_update_sticky(&sctp->sctp_sticky_ipp, &sctp->sctp_v6label_len, 11181676Sjpk optbuf) != 0) 11191676Sjpk return (EACCES); 11201676Sjpk if (sctp_build_hdrs(sctp) != 0) 11211676Sjpk return (EACCES); 11221676Sjpk return (0); 11231676Sjpk } 11241676Sjpk 11250Sstevel@tonic-gate /* 11260Sstevel@tonic-gate * XXX implement more sophisticated logic 11270Sstevel@tonic-gate */ 11281676Sjpk int 11291735Skcpoon sctp_set_hdraddrs(sctp_t *sctp) 11300Sstevel@tonic-gate { 11310Sstevel@tonic-gate sctp_faddr_t *fp; 11320Sstevel@tonic-gate int gotv4 = 0; 11330Sstevel@tonic-gate int gotv6 = 0; 
11340Sstevel@tonic-gate 11350Sstevel@tonic-gate ASSERT(sctp->sctp_faddrs != NULL); 11360Sstevel@tonic-gate ASSERT(sctp->sctp_nsaddrs > 0); 11370Sstevel@tonic-gate 11380Sstevel@tonic-gate /* Set up using the primary first */ 11390Sstevel@tonic-gate if (IN6_IS_ADDR_V4MAPPED(&sctp->sctp_primary->faddr)) { 11400Sstevel@tonic-gate IN6_V4MAPPED_TO_IPADDR(&sctp->sctp_primary->faddr, 11410Sstevel@tonic-gate sctp->sctp_ipha->ipha_dst); 11420Sstevel@tonic-gate /* saddr may be unspec; make_mp() will handle this */ 11430Sstevel@tonic-gate IN6_V4MAPPED_TO_IPADDR(&sctp->sctp_primary->saddr, 11440Sstevel@tonic-gate sctp->sctp_ipha->ipha_src); 11451676Sjpk if (!is_system_labeled() || sctp_v4_label(sctp) == 0) { 11461676Sjpk gotv4 = 1; 11471676Sjpk if (sctp->sctp_ipversion == IPV4_VERSION) { 11481676Sjpk goto copyports; 11491676Sjpk } 11500Sstevel@tonic-gate } 11510Sstevel@tonic-gate } else { 11520Sstevel@tonic-gate sctp->sctp_ip6h->ip6_dst = sctp->sctp_primary->faddr; 11530Sstevel@tonic-gate /* saddr may be unspec; make_mp() will handle this */ 11540Sstevel@tonic-gate sctp->sctp_ip6h->ip6_src = sctp->sctp_primary->saddr; 11551676Sjpk if (!is_system_labeled() || sctp_v6_label(sctp) == 0) 11561676Sjpk gotv6 = 1; 11570Sstevel@tonic-gate } 11580Sstevel@tonic-gate 11590Sstevel@tonic-gate for (fp = sctp->sctp_faddrs; fp; fp = fp->next) { 11600Sstevel@tonic-gate if (!gotv4 && IN6_IS_ADDR_V4MAPPED(&fp->faddr)) { 11610Sstevel@tonic-gate IN6_V4MAPPED_TO_IPADDR(&fp->faddr, 11620Sstevel@tonic-gate sctp->sctp_ipha->ipha_dst); 11630Sstevel@tonic-gate /* copy in the faddr_t's saddr */ 11640Sstevel@tonic-gate IN6_V4MAPPED_TO_IPADDR(&fp->saddr, 11650Sstevel@tonic-gate sctp->sctp_ipha->ipha_src); 11661676Sjpk if (!is_system_labeled() || sctp_v4_label(sctp) == 0) { 11671676Sjpk gotv4 = 1; 11681676Sjpk if (sctp->sctp_ipversion == IPV4_VERSION || 11691676Sjpk gotv6) { 11701676Sjpk break; 11711676Sjpk } 11720Sstevel@tonic-gate } 11732283Skp158701 } else if (!gotv6 && !IN6_IS_ADDR_V4MAPPED(&fp->faddr)) 
{ 11740Sstevel@tonic-gate sctp->sctp_ip6h->ip6_dst = fp->faddr; 11750Sstevel@tonic-gate /* copy in the faddr_t's saddr */ 11760Sstevel@tonic-gate sctp->sctp_ip6h->ip6_src = fp->saddr; 11771676Sjpk if (!is_system_labeled() || sctp_v6_label(sctp) == 0) { 11781676Sjpk gotv6 = 1; 11791676Sjpk if (gotv4) 11801676Sjpk break; 11810Sstevel@tonic-gate } 11820Sstevel@tonic-gate } 11830Sstevel@tonic-gate } 11840Sstevel@tonic-gate 11850Sstevel@tonic-gate copyports: 11861676Sjpk if (!gotv4 && !gotv6) 11871676Sjpk return (EACCES); 11881676Sjpk 11890Sstevel@tonic-gate /* copy in the ports for good measure */ 11900Sstevel@tonic-gate sctp->sctp_sctph->sh_sport = sctp->sctp_lport; 11910Sstevel@tonic-gate sctp->sctp_sctph->sh_dport = sctp->sctp_fport; 11920Sstevel@tonic-gate 11930Sstevel@tonic-gate sctp->sctp_sctph6->sh_sport = sctp->sctp_lport; 11940Sstevel@tonic-gate sctp->sctp_sctph6->sh_dport = sctp->sctp_fport; 11951676Sjpk return (0); 11960Sstevel@tonic-gate } 11970Sstevel@tonic-gate 11980Sstevel@tonic-gate void 11990Sstevel@tonic-gate sctp_add_unrec_parm(sctp_parm_hdr_t *uph, mblk_t **errmp) 12000Sstevel@tonic-gate { 12010Sstevel@tonic-gate mblk_t *mp; 12020Sstevel@tonic-gate sctp_parm_hdr_t *ph; 12030Sstevel@tonic-gate size_t len; 12040Sstevel@tonic-gate int pad; 12050Sstevel@tonic-gate 12060Sstevel@tonic-gate len = sizeof (*ph) + ntohs(uph->sph_len); 12070Sstevel@tonic-gate if ((pad = len % 4) != 0) { 12080Sstevel@tonic-gate pad = 4 - pad; 12090Sstevel@tonic-gate len += pad; 12100Sstevel@tonic-gate } 12110Sstevel@tonic-gate mp = allocb(len, BPRI_MED); 12120Sstevel@tonic-gate if (mp == NULL) { 12130Sstevel@tonic-gate return; 12140Sstevel@tonic-gate } 12150Sstevel@tonic-gate 12160Sstevel@tonic-gate ph = (sctp_parm_hdr_t *)(mp->b_rptr); 12170Sstevel@tonic-gate ph->sph_type = htons(PARM_UNRECOGNIZED); 12180Sstevel@tonic-gate ph->sph_len = htons(len - pad); 12190Sstevel@tonic-gate 12200Sstevel@tonic-gate /* copy in the unrecognized parameter */ 12210Sstevel@tonic-gate bcopy(uph, 
ph + 1, ntohs(uph->sph_len)); 12220Sstevel@tonic-gate 12230Sstevel@tonic-gate mp->b_wptr = mp->b_rptr + len; 12240Sstevel@tonic-gate if (*errmp != NULL) { 12250Sstevel@tonic-gate linkb(*errmp, mp); 12260Sstevel@tonic-gate } else { 12270Sstevel@tonic-gate *errmp = mp; 12280Sstevel@tonic-gate } 12290Sstevel@tonic-gate } 12300Sstevel@tonic-gate 12310Sstevel@tonic-gate /* 12320Sstevel@tonic-gate * o Bounds checking 12330Sstevel@tonic-gate * o Updates remaining 12340Sstevel@tonic-gate * o Checks alignment 12350Sstevel@tonic-gate */ 12360Sstevel@tonic-gate sctp_parm_hdr_t * 12370Sstevel@tonic-gate sctp_next_parm(sctp_parm_hdr_t *current, ssize_t *remaining) 12380Sstevel@tonic-gate { 12390Sstevel@tonic-gate int pad; 12400Sstevel@tonic-gate uint16_t len; 12410Sstevel@tonic-gate 12420Sstevel@tonic-gate len = ntohs(current->sph_len); 12430Sstevel@tonic-gate *remaining -= len; 12440Sstevel@tonic-gate if (*remaining < sizeof (*current) || len < sizeof (*current)) { 12450Sstevel@tonic-gate return (NULL); 12460Sstevel@tonic-gate } 12470Sstevel@tonic-gate if ((pad = len & (SCTP_ALIGN - 1)) != 0) { 12480Sstevel@tonic-gate pad = SCTP_ALIGN - pad; 12490Sstevel@tonic-gate *remaining -= pad; 12500Sstevel@tonic-gate } 12510Sstevel@tonic-gate /*LINTED pointer cast may result in improper alignment*/ 12520Sstevel@tonic-gate current = (sctp_parm_hdr_t *)((char *)current + len + pad); 12530Sstevel@tonic-gate return (current); 12540Sstevel@tonic-gate } 12550Sstevel@tonic-gate 12560Sstevel@tonic-gate /* 12570Sstevel@tonic-gate * Sets the address parameters given in the INIT chunk into sctp's 12580Sstevel@tonic-gate * faddrs; if psctp is non-NULL, copies psctp's saddrs. If there are 12590Sstevel@tonic-gate * no address parameters in the INIT chunk, a single faddr is created 12600Sstevel@tonic-gate * from the ip hdr at the beginning of pkt. 
12610Sstevel@tonic-gate * If there already are existing addresses hanging from sctp, merge 12620Sstevel@tonic-gate * them in, if the old info contains addresses which are not present 12630Sstevel@tonic-gate * in this new info, get rid of them, and clean the pointers if there are 12640Sstevel@tonic-gate * messages which have this as their target address. 12650Sstevel@tonic-gate * 1266432Svi117747 * We also re-adjust the source address list here since the list may 1267432Svi117747 * contain more than what is actually part of the association. If 1268432Svi117747 * we get here from sctp_send_cookie_echo(), we are on the active 1269432Svi117747 * side and psctp will be NULL and ich will be the INIT-ACK chunk. 1270432Svi117747 * If we get here from sctp_accept_comm(), ich will be the INIT chunk 1271432Svi117747 * and psctp will be the listening endpoint. 1272432Svi117747 * 1273432Svi117747 * INIT processing: When processing the INIT we inherit the src address 1274432Svi117747 * list from the listener. For a loopback or linklocal association, we 1275432Svi117747 * delete the list and just take the address from the IP header (since 1276432Svi117747 * that's how we created the INIT-ACK). Additionally, for loopback we 1277432Svi117747 * ignore the address params in the INIT. For determining which address 1278432Svi117747 * types were sent in the INIT-ACK we follow the same logic as in 1279432Svi117747 * creating the INIT-ACK. We delete addresses of the type that are not 1280432Svi117747 * supported by the peer. 1281432Svi117747 * 1282432Svi117747 * INIT-ACK processing: When processing the INIT-ACK since we had not 1283432Svi117747 * included addr params for loopback or linklocal addresses when creating 1284432Svi117747 * the INIT, we just use the address from the IP header. Further, for 1285432Svi117747 * loopback we ignore the addr param list. We mark addresses of the 1286432Svi117747 * type not supported by the peer as unconfirmed.
1287432Svi117747 * 1288432Svi117747 * In case of INIT processing we look for supported address types in the 1289432Svi117747 * supported address param, if present. In both cases the address type in 1290432Svi117747 * the IP header is supported as well as types for addresses in the param 1291432Svi117747 * list, if any. 1292432Svi117747 * 1293432Svi117747 * Once we have the supported address types sctp_check_saddr() runs through 1294432Svi117747 * the source address list and deletes or marks as unconfirmed address of 1295432Svi117747 * types not supported by the peer. 1296432Svi117747 * 12970Sstevel@tonic-gate * Returns 0 on success, sys errno on failure 12980Sstevel@tonic-gate */ 12990Sstevel@tonic-gate int 13000Sstevel@tonic-gate sctp_get_addrparams(sctp_t *sctp, sctp_t *psctp, mblk_t *pkt, 13010Sstevel@tonic-gate sctp_chunk_hdr_t *ich, uint_t *sctp_options) 13020Sstevel@tonic-gate { 13030Sstevel@tonic-gate sctp_init_chunk_t *init; 13040Sstevel@tonic-gate ipha_t *iph; 13050Sstevel@tonic-gate ip6_t *ip6h; 1306432Svi117747 in6_addr_t hdrsaddr[1]; 1307432Svi117747 in6_addr_t hdrdaddr[1]; 13080Sstevel@tonic-gate sctp_parm_hdr_t *ph; 13090Sstevel@tonic-gate ssize_t remaining; 13100Sstevel@tonic-gate int isv4; 13110Sstevel@tonic-gate int err; 13120Sstevel@tonic-gate sctp_faddr_t *fp; 1313432Svi117747 int supp_af = 0; 1314432Svi117747 boolean_t check_saddr = B_TRUE; 1315852Svi117747 in6_addr_t curaddr; 13163448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 13170Sstevel@tonic-gate 13180Sstevel@tonic-gate if (sctp_options != NULL) 13190Sstevel@tonic-gate *sctp_options = 0; 13200Sstevel@tonic-gate 1321432Svi117747 /* extract the address from the IP header */ 1322432Svi117747 isv4 = (IPH_HDR_VERSION(pkt->b_rptr) == IPV4_VERSION); 1323432Svi117747 if (isv4) { 1324432Svi117747 iph = (ipha_t *)pkt->b_rptr; 1325432Svi117747 IN6_IPADDR_TO_V4MAPPED(iph->ipha_src, hdrsaddr); 1326432Svi117747 IN6_IPADDR_TO_V4MAPPED(iph->ipha_dst, hdrdaddr); 1327432Svi117747 supp_af |= 
PARM_SUPP_V4; 1328432Svi117747 } else { 1329432Svi117747 ip6h = (ip6_t *)pkt->b_rptr; 1330432Svi117747 hdrsaddr[0] = ip6h->ip6_src; 1331432Svi117747 hdrdaddr[0] = ip6h->ip6_dst; 1332432Svi117747 supp_af |= PARM_SUPP_V6; 1333432Svi117747 } 1334432Svi117747 1335432Svi117747 /* 1336432Svi117747 * Unfortunately, we can't delay this because adding an faddr 1337432Svi117747 * looks for the presence of the source address (from the ire 1338432Svi117747 * for the faddr) in the source address list. We could have 1339432Svi117747 * delayed this if, say, this was a loopback/linklocal connection. 1340432Svi117747 * Now, we just end up nuking this list and taking the addr from 1341432Svi117747 * the IP header for loopback/linklocal. 1342432Svi117747 */ 13430Sstevel@tonic-gate if (psctp != NULL && psctp->sctp_nsaddrs > 0) { 13440Sstevel@tonic-gate ASSERT(sctp->sctp_nsaddrs == 0); 13450Sstevel@tonic-gate 13460Sstevel@tonic-gate err = sctp_dup_saddrs(psctp, sctp, KM_NOSLEEP); 13470Sstevel@tonic-gate if (err != 0) 13480Sstevel@tonic-gate return (err); 13490Sstevel@tonic-gate } 1350432Svi117747 /* 1351432Svi117747 * We will add the faddr before parsing the address list as this 1352432Svi117747 * might be a loopback connection and we would not have to 1353432Svi117747 * go through the list. 
1354432Svi117747 * 1355432Svi117747 * Make sure the header's addr is in the list 1356432Svi117747 */ 1357432Svi117747 fp = sctp_lookup_faddr(sctp, hdrsaddr); 1358432Svi117747 if (fp == NULL) { 1359432Svi117747 /* not included; add it now */ 13601735Skcpoon err = sctp_add_faddr(sctp, hdrsaddr, KM_NOSLEEP, B_TRUE); 13611676Sjpk if (err != 0) 13621676Sjpk return (err); 13630Sstevel@tonic-gate 1364432Svi117747 /* sctp_faddrs will be the hdr addr */ 1365432Svi117747 fp = sctp->sctp_faddrs; 13660Sstevel@tonic-gate } 1367432Svi117747 /* make the header addr the primary */ 1368852Svi117747 1369852Svi117747 if (cl_sctp_assoc_change != NULL && psctp == NULL) 1370852Svi117747 curaddr = sctp->sctp_current->faddr; 1371852Svi117747 1372432Svi117747 sctp->sctp_primary = fp; 1373432Svi117747 sctp->sctp_current = fp; 1374432Svi117747 sctp->sctp_mss = fp->sfa_pmss; 13750Sstevel@tonic-gate 1376432Svi117747 /* For loopback connections & linklocal get address from the header */ 1377432Svi117747 if (sctp->sctp_loopback || sctp->sctp_linklocal) { 1378432Svi117747 if (sctp->sctp_nsaddrs != 0) 1379432Svi117747 sctp_free_saddrs(sctp); 1380852Svi117747 if ((err = sctp_saddr_add_addr(sctp, hdrdaddr, 0)) != 0) 1381432Svi117747 return (err); 1382432Svi117747 /* For loopback ignore address list */ 1383432Svi117747 if (sctp->sctp_loopback) 1384432Svi117747 return (0); 1385432Svi117747 check_saddr = B_FALSE; 1386432Svi117747 } 13870Sstevel@tonic-gate 13880Sstevel@tonic-gate /* Walk the params in the INIT [ACK], pulling out addr params */ 13890Sstevel@tonic-gate remaining = ntohs(ich->sch_len) - sizeof (*ich) - 13900Sstevel@tonic-gate sizeof (sctp_init_chunk_t); 13910Sstevel@tonic-gate if (remaining < sizeof (*ph)) { 1392432Svi117747 if (check_saddr) { 1393432Svi117747 sctp_check_saddr(sctp, supp_af, psctp == NULL ? 
13944818Skcpoon B_FALSE : B_TRUE, hdrdaddr); 1395432Svi117747 } 1396852Svi117747 ASSERT(sctp_saddr_lookup(sctp, hdrdaddr, 0) != NULL); 1397432Svi117747 return (0); 13980Sstevel@tonic-gate } 1399432Svi117747 14000Sstevel@tonic-gate init = (sctp_init_chunk_t *)(ich + 1); 14010Sstevel@tonic-gate ph = (sctp_parm_hdr_t *)(init + 1); 14020Sstevel@tonic-gate 1403432Svi117747 /* params will have already been byteordered when validating */ 14040Sstevel@tonic-gate while (ph != NULL) { 1405432Svi117747 if (ph->sph_type == htons(PARM_SUPP_ADDRS)) { 1406432Svi117747 int plen; 1407432Svi117747 uint16_t *p; 1408432Svi117747 uint16_t addrtype; 1409432Svi117747 1410432Svi117747 ASSERT(psctp != NULL); 1411432Svi117747 plen = ntohs(ph->sph_len); 1412432Svi117747 p = (uint16_t *)(ph + 1); 1413432Svi117747 while (plen > 0) { 1414432Svi117747 addrtype = ntohs(*p); 1415432Svi117747 switch (addrtype) { 1416432Svi117747 case PARM_ADDR6: 1417432Svi117747 supp_af |= PARM_SUPP_V6; 1418432Svi117747 break; 1419432Svi117747 case PARM_ADDR4: 1420432Svi117747 supp_af |= PARM_SUPP_V4; 1421432Svi117747 break; 1422432Svi117747 default: 1423432Svi117747 break; 1424432Svi117747 } 1425432Svi117747 p++; 1426432Svi117747 plen -= sizeof (*p); 1427432Svi117747 } 1428432Svi117747 } else if (ph->sph_type == htons(PARM_ADDR4)) { 14290Sstevel@tonic-gate if (remaining >= PARM_ADDR4_LEN) { 14300Sstevel@tonic-gate in6_addr_t addr; 14310Sstevel@tonic-gate ipaddr_t ta; 14320Sstevel@tonic-gate 1433432Svi117747 supp_af |= PARM_SUPP_V4; 14340Sstevel@tonic-gate /* 14350Sstevel@tonic-gate * Screen out broad/multicasts & loopback. 14360Sstevel@tonic-gate * If the endpoint only accepts v6 address, 14370Sstevel@tonic-gate * go to the next one. 14384818Skcpoon * 14394818Skcpoon * Subnet broadcast check is done in 14404818Skcpoon * sctp_add_faddr(). If the address is 14414818Skcpoon * a broadcast address, it won't be added. 
14420Sstevel@tonic-gate */ 14430Sstevel@tonic-gate bcopy(ph + 1, &ta, sizeof (ta)); 14440Sstevel@tonic-gate if (ta == 0 || 14450Sstevel@tonic-gate ta == INADDR_BROADCAST || 14460Sstevel@tonic-gate ta == htonl(INADDR_LOOPBACK) || 14470Sstevel@tonic-gate IN_MULTICAST(ta) || 14480Sstevel@tonic-gate sctp->sctp_connp->conn_ipv6_v6only) { 14490Sstevel@tonic-gate goto next; 14500Sstevel@tonic-gate } 14510Sstevel@tonic-gate IN6_INADDR_TO_V4MAPPED((struct in_addr *) 14520Sstevel@tonic-gate (ph + 1), &addr); 14534818Skcpoon 14540Sstevel@tonic-gate /* Check for duplicate. */ 14550Sstevel@tonic-gate if (sctp_lookup_faddr(sctp, &addr) != NULL) 14560Sstevel@tonic-gate goto next; 14570Sstevel@tonic-gate 14580Sstevel@tonic-gate /* OK, add it to the faddr set */ 14591735Skcpoon err = sctp_add_faddr(sctp, &addr, KM_NOSLEEP, 14601735Skcpoon B_FALSE); 14614818Skcpoon /* Something is wrong... Try the next one. */ 14621676Sjpk if (err != 0) 14634818Skcpoon goto next; 14640Sstevel@tonic-gate } 14650Sstevel@tonic-gate } else if (ph->sph_type == htons(PARM_ADDR6) && 14660Sstevel@tonic-gate sctp->sctp_family == AF_INET6) { 14670Sstevel@tonic-gate /* An v4 socket should not take v6 addresses. */ 14680Sstevel@tonic-gate if (remaining >= PARM_ADDR6_LEN) { 14690Sstevel@tonic-gate in6_addr_t *addr6; 14700Sstevel@tonic-gate 1471432Svi117747 supp_af |= PARM_SUPP_V6; 14720Sstevel@tonic-gate addr6 = (in6_addr_t *)(ph + 1); 14730Sstevel@tonic-gate /* 14740Sstevel@tonic-gate * Screen out link locals, mcast, loopback 14750Sstevel@tonic-gate * and bogus v6 address. 14760Sstevel@tonic-gate */ 14770Sstevel@tonic-gate if (IN6_IS_ADDR_LINKLOCAL(addr6) || 14780Sstevel@tonic-gate IN6_IS_ADDR_MULTICAST(addr6) || 14790Sstevel@tonic-gate IN6_IS_ADDR_LOOPBACK(addr6) || 14800Sstevel@tonic-gate IN6_IS_ADDR_V4MAPPED(addr6)) { 14810Sstevel@tonic-gate goto next; 14820Sstevel@tonic-gate } 14830Sstevel@tonic-gate /* Check for duplicate. 
*/ 14840Sstevel@tonic-gate if (sctp_lookup_faddr(sctp, addr6) != NULL) 14850Sstevel@tonic-gate goto next; 14860Sstevel@tonic-gate 14871676Sjpk err = sctp_add_faddr(sctp, 14881735Skcpoon (in6_addr_t *)(ph + 1), KM_NOSLEEP, 14891735Skcpoon B_FALSE); 14904818Skcpoon /* Something is wrong... Try the next one. */ 14911676Sjpk if (err != 0) 14924818Skcpoon goto next; 14930Sstevel@tonic-gate } 14940Sstevel@tonic-gate } else if (ph->sph_type == htons(PARM_FORWARD_TSN)) { 14950Sstevel@tonic-gate if (sctp_options != NULL) 14960Sstevel@tonic-gate *sctp_options |= SCTP_PRSCTP_OPTION; 14970Sstevel@tonic-gate } /* else; skip */ 14980Sstevel@tonic-gate 14990Sstevel@tonic-gate next: 15000Sstevel@tonic-gate ph = sctp_next_parm(ph, &remaining); 15010Sstevel@tonic-gate } 1502432Svi117747 if (check_saddr) { 1503432Svi117747 sctp_check_saddr(sctp, supp_af, psctp == NULL ? B_FALSE : 15044818Skcpoon B_TRUE, hdrdaddr); 15050Sstevel@tonic-gate } 1506852Svi117747 ASSERT(sctp_saddr_lookup(sctp, hdrdaddr, 0) != NULL); 1507852Svi117747 /* 1508852Svi117747 * We have the right address list now, update clustering's 1509852Svi117747 * knowledge because when we sent the INIT we had just added 1510852Svi117747 * the address the INIT was sent to. 1511852Svi117747 */ 1512852Svi117747 if (psctp == NULL && cl_sctp_assoc_change != NULL) { 1513852Svi117747 uchar_t *alist; 1514852Svi117747 size_t asize; 1515852Svi117747 uchar_t *dlist; 1516852Svi117747 size_t dsize; 1517852Svi117747 1518852Svi117747 asize = sizeof (in6_addr_t) * sctp->sctp_nfaddrs; 1519852Svi117747 alist = kmem_alloc(asize, KM_NOSLEEP); 15201735Skcpoon if (alist == NULL) { 15213448Sdh155122 SCTP_KSTAT(sctps, sctp_cl_assoc_change); 1522852Svi117747 return (ENOMEM); 15231735Skcpoon } 1524852Svi117747 /* 1525852Svi117747 * Just include the address the INIT was sent to in the 1526852Svi117747 * delete list and send the entire faddr list. 
We could 1527852Svi117747 * do it differently (i.e include all the addresses in the 1528852Svi117747 * add list even if it contains the original address OR 1529852Svi117747 * remove the original address from the add list etc.), but 1530852Svi117747 * this seems reasonable enough. 1531852Svi117747 */ 1532852Svi117747 dsize = sizeof (in6_addr_t); 1533852Svi117747 dlist = kmem_alloc(dsize, KM_NOSLEEP); 1534852Svi117747 if (dlist == NULL) { 1535852Svi117747 kmem_free(alist, asize); 15363448Sdh155122 SCTP_KSTAT(sctps, sctp_cl_assoc_change); 1537852Svi117747 return (ENOMEM); 1538852Svi117747 } 1539852Svi117747 bcopy(&curaddr, dlist, sizeof (curaddr)); 1540852Svi117747 sctp_get_faddr_list(sctp, alist, asize); 1541852Svi117747 (*cl_sctp_assoc_change)(sctp->sctp_family, alist, asize, 1542852Svi117747 sctp->sctp_nfaddrs, dlist, dsize, 1, SCTP_CL_PADDR, 1543852Svi117747 (cl_sctp_handle_t)sctp); 1544852Svi117747 /* alist and dlist will be freed by the clustering module */ 1545852Svi117747 } 15460Sstevel@tonic-gate return (0); 15470Sstevel@tonic-gate } 15480Sstevel@tonic-gate 15490Sstevel@tonic-gate /* 15500Sstevel@tonic-gate * Returns 0 if the check failed and the restart should be refused, 15510Sstevel@tonic-gate * 1 if the check succeeded. 
15520Sstevel@tonic-gate */ 15530Sstevel@tonic-gate int 15540Sstevel@tonic-gate sctp_secure_restart_check(mblk_t *pkt, sctp_chunk_hdr_t *ich, uint32_t ports, 15553448Sdh155122 int sleep, sctp_stack_t *sctps) 15560Sstevel@tonic-gate { 1557*4964Skcpoon sctp_faddr_t *fp, *fphead = NULL; 15580Sstevel@tonic-gate sctp_parm_hdr_t *ph; 15590Sstevel@tonic-gate ssize_t remaining; 15600Sstevel@tonic-gate int isv4; 15610Sstevel@tonic-gate ipha_t *iph; 15620Sstevel@tonic-gate ip6_t *ip6h; 15630Sstevel@tonic-gate in6_addr_t hdraddr[1]; 15640Sstevel@tonic-gate int retval = 0; 15650Sstevel@tonic-gate sctp_tf_t *tf; 15660Sstevel@tonic-gate sctp_t *sctp; 15670Sstevel@tonic-gate int compres; 15680Sstevel@tonic-gate sctp_init_chunk_t *init; 15690Sstevel@tonic-gate int nadded = 0; 15700Sstevel@tonic-gate 15710Sstevel@tonic-gate /* extract the address from the IP header */ 15720Sstevel@tonic-gate isv4 = (IPH_HDR_VERSION(pkt->b_rptr) == IPV4_VERSION); 15730Sstevel@tonic-gate if (isv4) { 15740Sstevel@tonic-gate iph = (ipha_t *)pkt->b_rptr; 15750Sstevel@tonic-gate IN6_IPADDR_TO_V4MAPPED(iph->ipha_src, hdraddr); 15760Sstevel@tonic-gate } else { 15770Sstevel@tonic-gate ip6h = (ip6_t *)pkt->b_rptr; 15780Sstevel@tonic-gate hdraddr[0] = ip6h->ip6_src; 15790Sstevel@tonic-gate } 15800Sstevel@tonic-gate 15810Sstevel@tonic-gate /* Walk the params in the INIT [ACK], pulling out addr params */ 15820Sstevel@tonic-gate remaining = ntohs(ich->sch_len) - sizeof (*ich) - 15830Sstevel@tonic-gate sizeof (sctp_init_chunk_t); 15840Sstevel@tonic-gate if (remaining < sizeof (*ph)) { 15850Sstevel@tonic-gate /* no parameters; restart OK */ 15860Sstevel@tonic-gate return (1); 15870Sstevel@tonic-gate } 15880Sstevel@tonic-gate init = (sctp_init_chunk_t *)(ich + 1); 15890Sstevel@tonic-gate ph = (sctp_parm_hdr_t *)(init + 1); 15900Sstevel@tonic-gate 15910Sstevel@tonic-gate while (ph != NULL) { 1592*4964Skcpoon sctp_faddr_t *fpa = NULL; 1593*4964Skcpoon 15940Sstevel@tonic-gate /* params will have already been 
byteordered when validating */ 15950Sstevel@tonic-gate if (ph->sph_type == htons(PARM_ADDR4)) { 15960Sstevel@tonic-gate if (remaining >= PARM_ADDR4_LEN) { 15970Sstevel@tonic-gate in6_addr_t addr; 15980Sstevel@tonic-gate IN6_INADDR_TO_V4MAPPED((struct in_addr *) 15990Sstevel@tonic-gate (ph + 1), &addr); 16000Sstevel@tonic-gate fpa = kmem_cache_alloc(sctp_kmem_faddr_cache, 16010Sstevel@tonic-gate sleep); 1602*4964Skcpoon if (fpa == NULL) { 16030Sstevel@tonic-gate goto done; 16040Sstevel@tonic-gate } 16050Sstevel@tonic-gate bzero(fpa, sizeof (*fpa)); 16060Sstevel@tonic-gate fpa->faddr = addr; 16070Sstevel@tonic-gate fpa->next = NULL; 16080Sstevel@tonic-gate } 16090Sstevel@tonic-gate } else if (ph->sph_type == htons(PARM_ADDR6)) { 16100Sstevel@tonic-gate if (remaining >= PARM_ADDR6_LEN) { 16110Sstevel@tonic-gate fpa = kmem_cache_alloc(sctp_kmem_faddr_cache, 16120Sstevel@tonic-gate sleep); 1613*4964Skcpoon if (fpa == NULL) { 16140Sstevel@tonic-gate goto done; 16150Sstevel@tonic-gate } 16160Sstevel@tonic-gate bzero(fpa, sizeof (*fpa)); 16170Sstevel@tonic-gate bcopy(ph + 1, &fpa->faddr, 16180Sstevel@tonic-gate sizeof (fpa->faddr)); 16190Sstevel@tonic-gate fpa->next = NULL; 16200Sstevel@tonic-gate } 16210Sstevel@tonic-gate } 16220Sstevel@tonic-gate /* link in the new addr, if it was an addr param */ 1623*4964Skcpoon if (fpa != NULL) { 1624*4964Skcpoon if (fphead == NULL) { 16250Sstevel@tonic-gate fphead = fpa; 16260Sstevel@tonic-gate } else { 1627*4964Skcpoon fpa->next = fphead; 1628*4964Skcpoon fphead = fpa; 16290Sstevel@tonic-gate } 16300Sstevel@tonic-gate } 16310Sstevel@tonic-gate 16320Sstevel@tonic-gate ph = sctp_next_parm(ph, &remaining); 16330Sstevel@tonic-gate } 16340Sstevel@tonic-gate 16350Sstevel@tonic-gate if (fphead == NULL) { 16360Sstevel@tonic-gate /* no addr parameters; restart OK */ 16370Sstevel@tonic-gate return (1); 16380Sstevel@tonic-gate } 16390Sstevel@tonic-gate 16400Sstevel@tonic-gate /* 16410Sstevel@tonic-gate * got at least one; make sure the 
header's addr is 16420Sstevel@tonic-gate * in the list 16430Sstevel@tonic-gate */ 16440Sstevel@tonic-gate fp = sctp_lookup_faddr_nosctp(fphead, hdraddr); 1645*4964Skcpoon if (fp == NULL) { 16460Sstevel@tonic-gate /* not included; add it now */ 16470Sstevel@tonic-gate fp = kmem_cache_alloc(sctp_kmem_faddr_cache, sleep); 1648*4964Skcpoon if (fp == NULL) { 16490Sstevel@tonic-gate goto done; 16500Sstevel@tonic-gate } 16510Sstevel@tonic-gate bzero(fp, sizeof (*fp)); 16520Sstevel@tonic-gate fp->faddr = *hdraddr; 16530Sstevel@tonic-gate fp->next = fphead; 16540Sstevel@tonic-gate fphead = fp; 16550Sstevel@tonic-gate } 16560Sstevel@tonic-gate 16570Sstevel@tonic-gate /* 16580Sstevel@tonic-gate * Now, we can finally do the check: For each sctp instance 16590Sstevel@tonic-gate * on the hash line for ports, compare its faddr set against 16600Sstevel@tonic-gate * the new one. If the new one is a strict subset of any 16610Sstevel@tonic-gate * existing sctp's faddrs, the restart is OK. However, if there 16620Sstevel@tonic-gate * is an overlap, this could be an attack, so return failure. 16630Sstevel@tonic-gate * If all sctp's faddrs are disjoint, this is a legitimate new 16640Sstevel@tonic-gate * association. 
16650Sstevel@tonic-gate */ 16663448Sdh155122 tf = &(sctps->sctps_conn_fanout[SCTP_CONN_HASH(sctps, ports)]); 16670Sstevel@tonic-gate mutex_enter(&tf->tf_lock); 16680Sstevel@tonic-gate 16690Sstevel@tonic-gate for (sctp = tf->tf_sctp; sctp; sctp = sctp->sctp_conn_hash_next) { 16700Sstevel@tonic-gate if (ports != sctp->sctp_ports) { 16710Sstevel@tonic-gate continue; 16720Sstevel@tonic-gate } 16730Sstevel@tonic-gate compres = sctp_compare_faddrsets(fphead, sctp->sctp_faddrs); 16740Sstevel@tonic-gate if (compres <= SCTP_ADDR_SUBSET) { 16750Sstevel@tonic-gate retval = 1; 16760Sstevel@tonic-gate mutex_exit(&tf->tf_lock); 16770Sstevel@tonic-gate goto done; 16780Sstevel@tonic-gate } 16790Sstevel@tonic-gate if (compres == SCTP_ADDR_OVERLAP) { 16800Sstevel@tonic-gate dprint(1, 16810Sstevel@tonic-gate ("new assoc from %x:%x:%x:%x overlaps with %p\n", 16821676Sjpk SCTP_PRINTADDR(*hdraddr), (void *)sctp)); 16830Sstevel@tonic-gate /* 16840Sstevel@tonic-gate * While we still hold the lock, we need to 16850Sstevel@tonic-gate * figure out which addresses have been 16860Sstevel@tonic-gate * added so we can include them in the abort 16870Sstevel@tonic-gate * we will send back. Since these faddrs will 16880Sstevel@tonic-gate * never be used, we overload the rto field 16890Sstevel@tonic-gate * here, setting it to 0 if the address was 16900Sstevel@tonic-gate * not added, 1 if it was added. 
16910Sstevel@tonic-gate */ 16920Sstevel@tonic-gate for (fp = fphead; fp; fp = fp->next) { 16930Sstevel@tonic-gate if (sctp_lookup_faddr(sctp, &fp->faddr)) { 16940Sstevel@tonic-gate fp->rto = 0; 16950Sstevel@tonic-gate } else { 16960Sstevel@tonic-gate fp->rto = 1; 16970Sstevel@tonic-gate nadded++; 16980Sstevel@tonic-gate } 16990Sstevel@tonic-gate } 17000Sstevel@tonic-gate mutex_exit(&tf->tf_lock); 17010Sstevel@tonic-gate goto done; 17020Sstevel@tonic-gate } 17030Sstevel@tonic-gate } 17040Sstevel@tonic-gate mutex_exit(&tf->tf_lock); 17050Sstevel@tonic-gate 17060Sstevel@tonic-gate /* All faddrs are disjoint; legit new association */ 17070Sstevel@tonic-gate retval = 1; 17080Sstevel@tonic-gate 17090Sstevel@tonic-gate done: 17100Sstevel@tonic-gate /* If are attempted adds, send back an abort listing the addrs */ 17110Sstevel@tonic-gate if (nadded > 0) { 17120Sstevel@tonic-gate void *dtail; 17130Sstevel@tonic-gate size_t dlen; 17140Sstevel@tonic-gate 17150Sstevel@tonic-gate dtail = kmem_alloc(PARM_ADDR6_LEN * nadded, KM_NOSLEEP); 17160Sstevel@tonic-gate if (dtail == NULL) { 17170Sstevel@tonic-gate goto cleanup; 17180Sstevel@tonic-gate } 17190Sstevel@tonic-gate 17200Sstevel@tonic-gate ph = dtail; 17210Sstevel@tonic-gate dlen = 0; 17220Sstevel@tonic-gate for (fp = fphead; fp; fp = fp->next) { 17230Sstevel@tonic-gate if (fp->rto == 0) { 17240Sstevel@tonic-gate continue; 17250Sstevel@tonic-gate } 17260Sstevel@tonic-gate if (IN6_IS_ADDR_V4MAPPED(&fp->faddr)) { 17270Sstevel@tonic-gate ipaddr_t addr4; 17280Sstevel@tonic-gate 17290Sstevel@tonic-gate ph->sph_type = htons(PARM_ADDR4); 17300Sstevel@tonic-gate ph->sph_len = htons(PARM_ADDR4_LEN); 17310Sstevel@tonic-gate IN6_V4MAPPED_TO_IPADDR(&fp->faddr, addr4); 17320Sstevel@tonic-gate ph++; 17330Sstevel@tonic-gate bcopy(&addr4, ph, sizeof (addr4)); 17340Sstevel@tonic-gate ph = (sctp_parm_hdr_t *) 17350Sstevel@tonic-gate ((char *)ph + sizeof (addr4)); 17360Sstevel@tonic-gate dlen += PARM_ADDR4_LEN; 17370Sstevel@tonic-gate } else { 
17380Sstevel@tonic-gate ph->sph_type = htons(PARM_ADDR6); 17390Sstevel@tonic-gate ph->sph_len = htons(PARM_ADDR6_LEN); 17400Sstevel@tonic-gate ph++; 17410Sstevel@tonic-gate bcopy(&fp->faddr, ph, sizeof (fp->faddr)); 17420Sstevel@tonic-gate ph = (sctp_parm_hdr_t *) 17430Sstevel@tonic-gate ((char *)ph + sizeof (fp->faddr)); 17440Sstevel@tonic-gate dlen += PARM_ADDR6_LEN; 17450Sstevel@tonic-gate } 17460Sstevel@tonic-gate } 17470Sstevel@tonic-gate 17480Sstevel@tonic-gate /* Send off the abort */ 17490Sstevel@tonic-gate sctp_send_abort(sctp, sctp_init2vtag(ich), 17500Sstevel@tonic-gate SCTP_ERR_RESTART_NEW_ADDRS, dtail, dlen, pkt, 0, B_TRUE); 17510Sstevel@tonic-gate 17520Sstevel@tonic-gate kmem_free(dtail, PARM_ADDR6_LEN * nadded); 17530Sstevel@tonic-gate } 17540Sstevel@tonic-gate 17550Sstevel@tonic-gate cleanup: 17560Sstevel@tonic-gate /* Clean up */ 17570Sstevel@tonic-gate if (fphead) { 17580Sstevel@tonic-gate sctp_faddr_t *fpn; 17590Sstevel@tonic-gate for (fp = fphead; fp; fp = fpn) { 17600Sstevel@tonic-gate fpn = fp->next; 17610Sstevel@tonic-gate kmem_cache_free(sctp_kmem_faddr_cache, fp); 17620Sstevel@tonic-gate } 17630Sstevel@tonic-gate } 17640Sstevel@tonic-gate 17650Sstevel@tonic-gate return (retval); 17660Sstevel@tonic-gate } 17670Sstevel@tonic-gate 17681932Svi117747 /* 17691932Svi117747 * Reset any state related to transmitted chunks. 
17701932Svi117747 */ 17710Sstevel@tonic-gate void 17720Sstevel@tonic-gate sctp_congest_reset(sctp_t *sctp) 17730Sstevel@tonic-gate { 17741932Svi117747 sctp_faddr_t *fp; 17753448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 17761932Svi117747 mblk_t *mp; 17770Sstevel@tonic-gate 17781932Svi117747 for (fp = sctp->sctp_faddrs; fp != NULL; fp = fp->next) { 17793448Sdh155122 fp->ssthresh = sctps->sctps_initial_mtu; 17803795Skcpoon SET_CWND(fp, fp->sfa_pmss, sctps->sctps_slow_start_initial); 17810Sstevel@tonic-gate fp->suna = 0; 17820Sstevel@tonic-gate fp->pba = 0; 17830Sstevel@tonic-gate } 17841932Svi117747 /* 17851932Svi117747 * Clean up the transmit list as well since we have reset accounting 17861932Svi117747 * on all the fps. Send event upstream, if required. 17871932Svi117747 */ 17881932Svi117747 while ((mp = sctp->sctp_xmit_head) != NULL) { 17891932Svi117747 sctp->sctp_xmit_head = mp->b_next; 17901932Svi117747 mp->b_next = NULL; 17911932Svi117747 if (sctp->sctp_xmit_head != NULL) 17921932Svi117747 sctp->sctp_xmit_head->b_prev = NULL; 17931932Svi117747 sctp_sendfail_event(sctp, mp, 0, B_TRUE); 17941932Svi117747 } 17951932Svi117747 sctp->sctp_xmit_head = NULL; 17961932Svi117747 sctp->sctp_xmit_tail = NULL; 17971932Svi117747 sctp->sctp_xmit_unacked = NULL; 17981932Svi117747 17991932Svi117747 sctp->sctp_unacked = 0; 18001932Svi117747 /* 18011932Svi117747 * Any control message as well. We will clean-up this list as well. 18021932Svi117747 * This contains any pending ASCONF request that we have queued/sent. 18031932Svi117747 * If we do get an ACK we will just drop it. However, given that 18041932Svi117747 * we are restarting chances are we aren't going to get any. 
18051932Svi117747 */ 18061932Svi117747 if (sctp->sctp_cxmit_list != NULL) 18071932Svi117747 sctp_asconf_free_cxmit(sctp, NULL); 18081932Svi117747 sctp->sctp_cxmit_list = NULL; 18091932Svi117747 sctp->sctp_cchunk_pend = 0; 18101932Svi117747 18111932Svi117747 sctp->sctp_rexmitting = B_FALSE; 18121932Svi117747 sctp->sctp_rxt_nxttsn = 0; 18131932Svi117747 sctp->sctp_rxt_maxtsn = 0; 18141932Svi117747 18151932Svi117747 sctp->sctp_zero_win_probe = B_FALSE; 18160Sstevel@tonic-gate } 18170Sstevel@tonic-gate 18180Sstevel@tonic-gate static void 18191735Skcpoon sctp_init_faddr(sctp_t *sctp, sctp_faddr_t *fp, in6_addr_t *addr, 18201735Skcpoon mblk_t *timer_mp) 18210Sstevel@tonic-gate { 18223448Sdh155122 sctp_stack_t *sctps = sctp->sctp_sctps; 18233448Sdh155122 18240Sstevel@tonic-gate bcopy(addr, &fp->faddr, sizeof (*addr)); 18250Sstevel@tonic-gate if (IN6_IS_ADDR_V4MAPPED(addr)) { 18260Sstevel@tonic-gate fp->isv4 = 1; 18270Sstevel@tonic-gate /* Make sure that sfa_pmss is a multiple of SCTP_ALIGN. */ 18284691Skcpoon fp->sfa_pmss = 18294691Skcpoon (sctps->sctps_initial_mtu - sctp->sctp_hdr_len) & 18304691Skcpoon ~(SCTP_ALIGN - 1); 18310Sstevel@tonic-gate } else { 18320Sstevel@tonic-gate fp->isv4 = 0; 18333448Sdh155122 fp->sfa_pmss = 18343448Sdh155122 (sctps->sctps_initial_mtu - sctp->sctp_hdr6_len) & 18353448Sdh155122 ~(SCTP_ALIGN - 1); 18360Sstevel@tonic-gate } 18373448Sdh155122 fp->cwnd = sctps->sctps_slow_start_initial * fp->sfa_pmss; 18380Sstevel@tonic-gate fp->rto = MIN(sctp->sctp_rto_initial, sctp->sctp_init_rto_max); 18390Sstevel@tonic-gate fp->srtt = -1; 18400Sstevel@tonic-gate fp->rtt_updates = 0; 18410Sstevel@tonic-gate fp->strikes = 0; 18420Sstevel@tonic-gate fp->max_retr = sctp->sctp_pp_max_rxt; 18430Sstevel@tonic-gate /* Mark it as not confirmed. 
*/ 18440Sstevel@tonic-gate fp->state = SCTP_FADDRS_UNCONFIRMED; 18450Sstevel@tonic-gate fp->hb_interval = sctp->sctp_hb_interval; 18463448Sdh155122 fp->ssthresh = sctps->sctps_initial_ssthresh; 18470Sstevel@tonic-gate fp->suna = 0; 18480Sstevel@tonic-gate fp->pba = 0; 18490Sstevel@tonic-gate fp->acked = 0; 18500Sstevel@tonic-gate fp->lastactive = lbolt64; 18511735Skcpoon fp->timer_mp = timer_mp; 18520Sstevel@tonic-gate fp->hb_pending = B_FALSE; 18534818Skcpoon fp->hb_enabled = B_TRUE; 18540Sstevel@tonic-gate fp->timer_running = 0; 18550Sstevel@tonic-gate fp->df = 1; 18560Sstevel@tonic-gate fp->pmtu_discovered = 0; 18570Sstevel@tonic-gate fp->rc_timer_mp = NULL; 18580Sstevel@tonic-gate fp->rc_timer_running = 0; 18590Sstevel@tonic-gate fp->next = NULL; 18600Sstevel@tonic-gate fp->ire = NULL; 18610Sstevel@tonic-gate fp->T3expire = 0; 18620Sstevel@tonic-gate (void) random_get_pseudo_bytes((uint8_t *)&fp->hb_secret, 18630Sstevel@tonic-gate sizeof (fp->hb_secret)); 18640Sstevel@tonic-gate fp->hb_expiry = lbolt64; 18653795Skcpoon fp->rxt_unacked = 0; 18660Sstevel@tonic-gate 18671735Skcpoon sctp_get_ire(sctp, fp); 18680Sstevel@tonic-gate } 18690Sstevel@tonic-gate 18700Sstevel@tonic-gate /*ARGSUSED*/ 18710Sstevel@tonic-gate static void 18720Sstevel@tonic-gate faddr_destructor(void *buf, void *cdrarg) 18730Sstevel@tonic-gate { 18740Sstevel@tonic-gate sctp_faddr_t *fp = buf; 18750Sstevel@tonic-gate 18760Sstevel@tonic-gate ASSERT(fp->timer_mp == NULL); 18770Sstevel@tonic-gate ASSERT(fp->timer_running == 0); 18780Sstevel@tonic-gate 18790Sstevel@tonic-gate ASSERT(fp->rc_timer_mp == NULL); 18800Sstevel@tonic-gate ASSERT(fp->rc_timer_running == 0); 18810Sstevel@tonic-gate } 18820Sstevel@tonic-gate 18830Sstevel@tonic-gate void 18841676Sjpk sctp_faddr_init(void) 18850Sstevel@tonic-gate { 18860Sstevel@tonic-gate sctp_kmem_faddr_cache = kmem_cache_create("sctp_faddr_cache", 18870Sstevel@tonic-gate sizeof (sctp_faddr_t), 0, NULL, faddr_destructor, 18880Sstevel@tonic-gate NULL, NULL, 
NULL, 0); 18890Sstevel@tonic-gate } 18900Sstevel@tonic-gate 18910Sstevel@tonic-gate void 18921676Sjpk sctp_faddr_fini(void) 18930Sstevel@tonic-gate { 18940Sstevel@tonic-gate kmem_cache_destroy(sctp_kmem_faddr_cache); 18950Sstevel@tonic-gate } 1896