18348SEric.Yu@Sun.COM /* 28348SEric.Yu@Sun.COM * CDDL HEADER START 38348SEric.Yu@Sun.COM * 48348SEric.Yu@Sun.COM * The contents of this file are subject to the terms of the 58348SEric.Yu@Sun.COM * Common Development and Distribution License (the "License"). 68348SEric.Yu@Sun.COM * You may not use this file except in compliance with the License. 78348SEric.Yu@Sun.COM * 88348SEric.Yu@Sun.COM * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 98348SEric.Yu@Sun.COM * or http://www.opensolaris.org/os/licensing. 108348SEric.Yu@Sun.COM * See the License for the specific language governing permissions 118348SEric.Yu@Sun.COM * and limitations under the License. 128348SEric.Yu@Sun.COM * 138348SEric.Yu@Sun.COM * When distributing Covered Code, include this CDDL HEADER in each 148348SEric.Yu@Sun.COM * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 158348SEric.Yu@Sun.COM * If applicable, add the following below this CDDL HEADER, with the 168348SEric.Yu@Sun.COM * fields enclosed by brackets "[]" replaced with your own identifying 178348SEric.Yu@Sun.COM * information: Portions Copyright [yyyy] [name of copyright owner] 188348SEric.Yu@Sun.COM * 198348SEric.Yu@Sun.COM * CDDL HEADER END 208348SEric.Yu@Sun.COM */ 218348SEric.Yu@Sun.COM 228348SEric.Yu@Sun.COM /* 238489Sshenjian * Copyright 2009 Sun Microsystems, Inc. All rights reserved. 248348SEric.Yu@Sun.COM * Use is subject to license terms. 258348SEric.Yu@Sun.COM */ 268348SEric.Yu@Sun.COM 278348SEric.Yu@Sun.COM #include <sys/types.h> 288348SEric.Yu@Sun.COM #include <sys/param.h> 298348SEric.Yu@Sun.COM #include <sys/systm.h> 308348SEric.Yu@Sun.COM #include <sys/sysmacros.h> 318348SEric.Yu@Sun.COM #include <sys/debug.h> 328348SEric.Yu@Sun.COM #include <sys/cmn_err.h> 338348SEric.Yu@Sun.COM 348348SEric.Yu@Sun.COM #include <sys/stropts.h> 358348SEric.Yu@Sun.COM #include <sys/socket.h> 368348SEric.Yu@Sun.COM #include <sys/socketvar.h> 378348SEric.Yu@Sun.COM 388348SEric.Yu@Sun.COM #define _SUN_TPI_VERSION 2 398348SEric.Yu@Sun.COM #include <sys/tihdr.h> 408348SEric.Yu@Sun.COM #include <sys/sockio.h> 418348SEric.Yu@Sun.COM #include <sys/sodirect.h> 428348SEric.Yu@Sun.COM #include <sys/kmem_impl.h> 438348SEric.Yu@Sun.COM 448348SEric.Yu@Sun.COM #include <sys/strsubr.h> 458348SEric.Yu@Sun.COM #include <sys/strsun.h> 468348SEric.Yu@Sun.COM #include <sys/ddi.h> 478348SEric.Yu@Sun.COM #include <netinet/in.h> 488348SEric.Yu@Sun.COM #include <inet/ip.h> 498348SEric.Yu@Sun.COM 508348SEric.Yu@Sun.COM #include <fs/sockfs/sockcommon.h> 518348SEric.Yu@Sun.COM 528348SEric.Yu@Sun.COM #include <sys/socket_proto.h> 538348SEric.Yu@Sun.COM 548348SEric.Yu@Sun.COM #include <fs/sockfs/socktpi_impl.h> 558348SEric.Yu@Sun.COM #include <sys/tihdr.h> 568348SEric.Yu@Sun.COM #include <fs/sockfs/nl7c.h> 578348SEric.Yu@Sun.COM #include <inet/kssl/ksslapi.h> 588348SEric.Yu@Sun.COM 598348SEric.Yu@Sun.COM 608348SEric.Yu@Sun.COM extern int xnet_skip_checks; 618348SEric.Yu@Sun.COM extern int xnet_check_print; 628348SEric.Yu@Sun.COM 638348SEric.Yu@Sun.COM static void so_queue_oob(sock_upper_handle_t, mblk_t *, size_t); 648348SEric.Yu@Sun.COM 658348SEric.Yu@Sun.COM 668348SEric.Yu@Sun.COM /*ARGSUSED*/ 678348SEric.Yu@Sun.COM int 688348SEric.Yu@Sun.COM so_accept_notsupp(struct sonode *lso, int fflag, 698348SEric.Yu@Sun.COM struct cred *cr, struct sonode **nsop) 708348SEric.Yu@Sun.COM { 718348SEric.Yu@Sun.COM return (EOPNOTSUPP); 728348SEric.Yu@Sun.COM } 738348SEric.Yu@Sun.COM 748348SEric.Yu@Sun.COM /*ARGSUSED*/ 758348SEric.Yu@Sun.COM int 768348SEric.Yu@Sun.COM so_listen_notsupp(struct sonode *so, int backlog, struct cred *cr) 778348SEric.Yu@Sun.COM { 788348SEric.Yu@Sun.COM return (EOPNOTSUPP); 798348SEric.Yu@Sun.COM } 808348SEric.Yu@Sun.COM 818348SEric.Yu@Sun.COM /*ARGSUSED*/ 828348SEric.Yu@Sun.COM int 838348SEric.Yu@Sun.COM so_getsockname_notsupp(struct sonode *so, struct sockaddr *sa, 848348SEric.Yu@Sun.COM socklen_t *len, struct cred *cr) 858348SEric.Yu@Sun.COM { 868348SEric.Yu@Sun.COM return (EOPNOTSUPP); 878348SEric.Yu@Sun.COM } 888348SEric.Yu@Sun.COM 898348SEric.Yu@Sun.COM /*ARGSUSED*/ 908348SEric.Yu@Sun.COM int 918348SEric.Yu@Sun.COM so_getpeername_notsupp(struct sonode *so, struct sockaddr *addr, 928348SEric.Yu@Sun.COM socklen_t *addrlen, boolean_t accept, struct cred *cr) 938348SEric.Yu@Sun.COM { 948348SEric.Yu@Sun.COM return (EOPNOTSUPP); 958348SEric.Yu@Sun.COM } 968348SEric.Yu@Sun.COM 978348SEric.Yu@Sun.COM /*ARGSUSED*/ 988348SEric.Yu@Sun.COM int 998348SEric.Yu@Sun.COM so_shutdown_notsupp(struct sonode *so, int how, struct cred *cr) 1008348SEric.Yu@Sun.COM { 1018348SEric.Yu@Sun.COM return (EOPNOTSUPP); 1028348SEric.Yu@Sun.COM } 1038348SEric.Yu@Sun.COM 1048348SEric.Yu@Sun.COM /*ARGSUSED*/ 1058348SEric.Yu@Sun.COM int 1068348SEric.Yu@Sun.COM so_sendmblk_notsupp(struct sonode *so, struct msghdr *msg, int fflag, 1078348SEric.Yu@Sun.COM struct cred *cr, mblk_t **mpp) 1088348SEric.Yu@Sun.COM { 1098348SEric.Yu@Sun.COM return (EOPNOTSUPP); 1108348SEric.Yu@Sun.COM } 1118348SEric.Yu@Sun.COM 1128348SEric.Yu@Sun.COM /* 1138348SEric.Yu@Sun.COM * Generic Socket Ops 1148348SEric.Yu@Sun.COM */ 1158348SEric.Yu@Sun.COM 1168348SEric.Yu@Sun.COM /* ARGSUSED */ 1178348SEric.Yu@Sun.COM int 1188348SEric.Yu@Sun.COM so_init(struct sonode *so, struct sonode *pso, struct cred *cr, int flags) 1198348SEric.Yu@Sun.COM { 1208348SEric.Yu@Sun.COM return (socket_init_common(so, pso, flags, cr)); 1218348SEric.Yu@Sun.COM } 1228348SEric.Yu@Sun.COM 1238348SEric.Yu@Sun.COM int 1248348SEric.Yu@Sun.COM so_bind(struct sonode *so, struct sockaddr *name, socklen_t namelen, 1258348SEric.Yu@Sun.COM int flags, struct cred *cr) 1268348SEric.Yu@Sun.COM { 1278348SEric.Yu@Sun.COM int error; 1288348SEric.Yu@Sun.COM 1298348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_BIND(so, name, namelen, flags, cr)); 1308348SEric.Yu@Sun.COM 1318348SEric.Yu@Sun.COM ASSERT(flags == _SOBIND_XPG4_2 || flags == _SOBIND_SOCKBSD); 1328348SEric.Yu@Sun.COM 1338348SEric.Yu@Sun.COM /* X/Open requires this check */ 1348348SEric.Yu@Sun.COM if ((so->so_state & SS_CANTSENDMORE) && !xnet_skip_checks) { 1358348SEric.Yu@Sun.COM if (xnet_check_print) { 1368348SEric.Yu@Sun.COM printf("sockfs: X/Open bind state check " 1378348SEric.Yu@Sun.COM "caused EINVAL\n"); 1388348SEric.Yu@Sun.COM } 1398348SEric.Yu@Sun.COM error = EINVAL; 1408348SEric.Yu@Sun.COM goto done; 1418348SEric.Yu@Sun.COM } 1428348SEric.Yu@Sun.COM 1438348SEric.Yu@Sun.COM /* 1448348SEric.Yu@Sun.COM * a bind to a NULL address is interpreted as unbind. So just 1458348SEric.Yu@Sun.COM * do the downcall. 1468348SEric.Yu@Sun.COM */ 1478348SEric.Yu@Sun.COM if (name == NULL) 1488348SEric.Yu@Sun.COM goto dobind; 1498348SEric.Yu@Sun.COM 1508348SEric.Yu@Sun.COM switch (so->so_family) { 1518348SEric.Yu@Sun.COM case AF_INET: 1528348SEric.Yu@Sun.COM if ((size_t)namelen != sizeof (sin_t)) { 1538348SEric.Yu@Sun.COM error = name->sa_family != so->so_family ? 1548348SEric.Yu@Sun.COM EAFNOSUPPORT : EINVAL; 1558348SEric.Yu@Sun.COM eprintsoline(so, error); 1568348SEric.Yu@Sun.COM goto done; 1578348SEric.Yu@Sun.COM } 1588348SEric.Yu@Sun.COM 1598348SEric.Yu@Sun.COM if ((flags & _SOBIND_XPG4_2) && 1608348SEric.Yu@Sun.COM (name->sa_family != so->so_family)) { 1618348SEric.Yu@Sun.COM /* 1628348SEric.Yu@Sun.COM * This check has to be made for X/Open 1638348SEric.Yu@Sun.COM * sockets however application failures have 1648348SEric.Yu@Sun.COM * been observed when it is applied to 1658348SEric.Yu@Sun.COM * all sockets. 1668348SEric.Yu@Sun.COM */ 1678348SEric.Yu@Sun.COM error = EAFNOSUPPORT; 1688348SEric.Yu@Sun.COM eprintsoline(so, error); 1698348SEric.Yu@Sun.COM goto done; 1708348SEric.Yu@Sun.COM } 1718348SEric.Yu@Sun.COM /* 1728348SEric.Yu@Sun.COM * Force a zero sa_family to match so_family. 1738348SEric.Yu@Sun.COM * 1748348SEric.Yu@Sun.COM * Some programs like inetd(1M) don't set the 1758348SEric.Yu@Sun.COM * family field. Other programs leave 1768348SEric.Yu@Sun.COM * sin_family set to garbage - SunOS 4.X does 1778348SEric.Yu@Sun.COM * not check the family field on a bind. 1788348SEric.Yu@Sun.COM * We use the family field that 1798348SEric.Yu@Sun.COM * was passed in to the socket() call. 1808348SEric.Yu@Sun.COM */ 1818348SEric.Yu@Sun.COM name->sa_family = so->so_family; 1828348SEric.Yu@Sun.COM break; 1838348SEric.Yu@Sun.COM 1848348SEric.Yu@Sun.COM case AF_INET6: { 1858348SEric.Yu@Sun.COM #ifdef DEBUG 1868348SEric.Yu@Sun.COM sin6_t *sin6 = (sin6_t *)name; 1878348SEric.Yu@Sun.COM #endif 1888348SEric.Yu@Sun.COM if ((size_t)namelen != sizeof (sin6_t)) { 1898348SEric.Yu@Sun.COM error = name->sa_family != so->so_family ? 1908348SEric.Yu@Sun.COM EAFNOSUPPORT : EINVAL; 1918348SEric.Yu@Sun.COM eprintsoline(so, error); 1928348SEric.Yu@Sun.COM goto done; 1938348SEric.Yu@Sun.COM } 1948348SEric.Yu@Sun.COM 1958348SEric.Yu@Sun.COM if (name->sa_family != so->so_family) { 1968348SEric.Yu@Sun.COM /* 1978348SEric.Yu@Sun.COM * With IPv6 we require the family to match 1988348SEric.Yu@Sun.COM * unlike in IPv4. 1998348SEric.Yu@Sun.COM */ 2008348SEric.Yu@Sun.COM error = EAFNOSUPPORT; 2018348SEric.Yu@Sun.COM eprintsoline(so, error); 2028348SEric.Yu@Sun.COM goto done; 2038348SEric.Yu@Sun.COM } 2048348SEric.Yu@Sun.COM #ifdef DEBUG 2058348SEric.Yu@Sun.COM /* 2068348SEric.Yu@Sun.COM * Verify that apps don't forget to clear 2078348SEric.Yu@Sun.COM * sin6_scope_id etc 2088348SEric.Yu@Sun.COM */ 2098348SEric.Yu@Sun.COM if (sin6->sin6_scope_id != 0 && 2108348SEric.Yu@Sun.COM !IN6_IS_ADDR_LINKSCOPE(&sin6->sin6_addr)) { 2118348SEric.Yu@Sun.COM zcmn_err(getzoneid(), CE_WARN, 2128348SEric.Yu@Sun.COM "bind with uninitialized sin6_scope_id " 2138348SEric.Yu@Sun.COM "(%d) on socket. Pid = %d\n", 2148348SEric.Yu@Sun.COM (int)sin6->sin6_scope_id, 2158348SEric.Yu@Sun.COM (int)curproc->p_pid); 2168348SEric.Yu@Sun.COM } 2178348SEric.Yu@Sun.COM if (sin6->__sin6_src_id != 0) { 2188348SEric.Yu@Sun.COM zcmn_err(getzoneid(), CE_WARN, 2198348SEric.Yu@Sun.COM "bind with uninitialized __sin6_src_id " 2208348SEric.Yu@Sun.COM "(%d) on socket. Pid = %d\n", 2218348SEric.Yu@Sun.COM (int)sin6->__sin6_src_id, 2228348SEric.Yu@Sun.COM (int)curproc->p_pid); 2238348SEric.Yu@Sun.COM } 2248348SEric.Yu@Sun.COM #endif /* DEBUG */ 2258348SEric.Yu@Sun.COM 2268348SEric.Yu@Sun.COM break; 2278348SEric.Yu@Sun.COM } 2288348SEric.Yu@Sun.COM default: 2298348SEric.Yu@Sun.COM /* Just pass the request to the protocol */ 2308348SEric.Yu@Sun.COM goto dobind; 2318348SEric.Yu@Sun.COM } 2328348SEric.Yu@Sun.COM 2338348SEric.Yu@Sun.COM /* 2348348SEric.Yu@Sun.COM * First we check if either NCA or KSSL has been enabled for 2358348SEric.Yu@Sun.COM * the requested address, and if so, we fall back to TPI. 2368348SEric.Yu@Sun.COM * If neither of those two services are enabled, then we just 2378348SEric.Yu@Sun.COM * pass the request to the protocol. 2388348SEric.Yu@Sun.COM * 2398348SEric.Yu@Sun.COM * Note that KSSL can only be enabled on a socket if NCA is NOT 2408348SEric.Yu@Sun.COM * enabled for that socket, hence the else-statement below. 2418348SEric.Yu@Sun.COM */ 2428348SEric.Yu@Sun.COM if (nl7c_enabled && ((so->so_family == AF_INET || 2438348SEric.Yu@Sun.COM so->so_family == AF_INET6) && 2448348SEric.Yu@Sun.COM nl7c_lookup_addr(name, namelen) != NULL)) { 2458348SEric.Yu@Sun.COM /* 2468348SEric.Yu@Sun.COM * NL7C is not supported in non-global zones, 2478348SEric.Yu@Sun.COM * we enforce this restriction here. 2488348SEric.Yu@Sun.COM */ 2498348SEric.Yu@Sun.COM if (so->so_zoneid == GLOBAL_ZONEID) { 2508348SEric.Yu@Sun.COM /* NCA should be used, so fall back to TPI */ 2518348SEric.Yu@Sun.COM error = so_tpi_fallback(so, cr); 2528348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 2538348SEric.Yu@Sun.COM if (error) 2548348SEric.Yu@Sun.COM return (error); 2558348SEric.Yu@Sun.COM else 2568348SEric.Yu@Sun.COM return (SOP_BIND(so, name, namelen, flags, cr)); 2578348SEric.Yu@Sun.COM } 2588348SEric.Yu@Sun.COM } else if (so->so_type == SOCK_STREAM) { 2598348SEric.Yu@Sun.COM /* Check if KSSL has been configured for this address */ 2608348SEric.Yu@Sun.COM kssl_ent_t ent; 2618348SEric.Yu@Sun.COM kssl_endpt_type_t type; 2628348SEric.Yu@Sun.COM struct T_bind_req bind_req; 2638348SEric.Yu@Sun.COM mblk_t *mp; 2648348SEric.Yu@Sun.COM 2658348SEric.Yu@Sun.COM /* 2668348SEric.Yu@Sun.COM * TODO: Check with KSSL team if we could add a function call 2678348SEric.Yu@Sun.COM * that only queries whether KSSL is enabled for the given 2688348SEric.Yu@Sun.COM * address. 2698348SEric.Yu@Sun.COM */ 2708348SEric.Yu@Sun.COM bind_req.PRIM_type = T_BIND_REQ; 2718348SEric.Yu@Sun.COM bind_req.ADDR_length = namelen; 2728348SEric.Yu@Sun.COM bind_req.ADDR_offset = (t_scalar_t)sizeof (bind_req); 2738348SEric.Yu@Sun.COM mp = soallocproto2(&bind_req, sizeof (bind_req), 2748778SErik.Nordmark@Sun.COM name, namelen, 0, _ALLOC_SLEEP, cr); 2758348SEric.Yu@Sun.COM 2768348SEric.Yu@Sun.COM type = kssl_check_proxy(mp, so, &ent); 2778348SEric.Yu@Sun.COM freemsg(mp); 2788348SEric.Yu@Sun.COM 2798348SEric.Yu@Sun.COM if (type != KSSL_NO_PROXY) { 2808348SEric.Yu@Sun.COM /* 2818348SEric.Yu@Sun.COM * KSSL has been configured for this address, so 2828348SEric.Yu@Sun.COM * we must fall back to TPI. 2838348SEric.Yu@Sun.COM */ 2848348SEric.Yu@Sun.COM kssl_release_ent(ent, so, type); 2858348SEric.Yu@Sun.COM error = so_tpi_fallback(so, cr); 2868348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 2878348SEric.Yu@Sun.COM if (error) 2888348SEric.Yu@Sun.COM return (error); 2898348SEric.Yu@Sun.COM else 2908348SEric.Yu@Sun.COM return (SOP_BIND(so, name, namelen, flags, cr)); 2918348SEric.Yu@Sun.COM } 2928348SEric.Yu@Sun.COM } 2938348SEric.Yu@Sun.COM 2948348SEric.Yu@Sun.COM dobind: 2958348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_bind) 2968348SEric.Yu@Sun.COM (so->so_proto_handle, name, namelen, cr); 2978348SEric.Yu@Sun.COM done: 2988348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 2998348SEric.Yu@Sun.COM 3008348SEric.Yu@Sun.COM return (error); 3018348SEric.Yu@Sun.COM } 3028348SEric.Yu@Sun.COM 3038348SEric.Yu@Sun.COM int 3048348SEric.Yu@Sun.COM so_listen(struct sonode *so, int backlog, struct cred *cr) 3058348SEric.Yu@Sun.COM { 3068348SEric.Yu@Sun.COM int error = 0; 3078348SEric.Yu@Sun.COM 3088348SEric.Yu@Sun.COM ASSERT(MUTEX_NOT_HELD(&so->so_lock)); 3098348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_LISTEN(so, backlog, cr)); 3108348SEric.Yu@Sun.COM 3118348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_listen)(so->so_proto_handle, backlog, 3128348SEric.Yu@Sun.COM cr); 3138348SEric.Yu@Sun.COM 3148348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 3158348SEric.Yu@Sun.COM 3168348SEric.Yu@Sun.COM return (error); 3178348SEric.Yu@Sun.COM } 3188348SEric.Yu@Sun.COM 3198348SEric.Yu@Sun.COM 3208348SEric.Yu@Sun.COM int 3218348SEric.Yu@Sun.COM so_connect(struct sonode *so, const struct sockaddr *name, 3228348SEric.Yu@Sun.COM socklen_t namelen, int fflag, int flags, struct cred *cr) 3238348SEric.Yu@Sun.COM { 3248348SEric.Yu@Sun.COM int error = 0; 3258348SEric.Yu@Sun.COM sock_connid_t id; 3268348SEric.Yu@Sun.COM 3278348SEric.Yu@Sun.COM ASSERT(MUTEX_NOT_HELD(&so->so_lock)); 3288348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_CONNECT(so, name, namelen, fflag, flags, cr)); 3298348SEric.Yu@Sun.COM 3308348SEric.Yu@Sun.COM /* 3318348SEric.Yu@Sun.COM * If there is a pending error, return error 3328348SEric.Yu@Sun.COM * This can happen if a non blocking operation caused an error. 3338348SEric.Yu@Sun.COM */ 3348348SEric.Yu@Sun.COM 3358348SEric.Yu@Sun.COM if (so->so_error != 0) { 3368348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 3378348SEric.Yu@Sun.COM error = sogeterr(so, B_TRUE); 3388348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 3398348SEric.Yu@Sun.COM if (error != 0) 3408348SEric.Yu@Sun.COM goto done; 3418348SEric.Yu@Sun.COM } 3428348SEric.Yu@Sun.COM 3438348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_connect)(so->so_proto_handle, 3448348SEric.Yu@Sun.COM name, namelen, &id, cr); 3458348SEric.Yu@Sun.COM 3468348SEric.Yu@Sun.COM if (error == EINPROGRESS) 3478348SEric.Yu@Sun.COM error = so_wait_connected(so, fflag & (FNONBLOCK|FNDELAY), id); 3488348SEric.Yu@Sun.COM 3498348SEric.Yu@Sun.COM done: 3508348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 3518348SEric.Yu@Sun.COM return (error); 3528348SEric.Yu@Sun.COM } 3538348SEric.Yu@Sun.COM 3548348SEric.Yu@Sun.COM /*ARGSUSED*/ 3558348SEric.Yu@Sun.COM int 3568348SEric.Yu@Sun.COM so_accept(struct sonode *so, int fflag, struct cred *cr, struct sonode **nsop) 3578348SEric.Yu@Sun.COM { 3588348SEric.Yu@Sun.COM int error = 0; 3598348SEric.Yu@Sun.COM struct sonode *nso; 3608348SEric.Yu@Sun.COM 3618348SEric.Yu@Sun.COM *nsop = NULL; 3628348SEric.Yu@Sun.COM 3638348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_ACCEPT(so, fflag, cr, nsop)); 3648348SEric.Yu@Sun.COM if ((so->so_state & SS_ACCEPTCONN) == 0) { 3658348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 3668348SEric.Yu@Sun.COM return ((so->so_type == SOCK_DGRAM || so->so_type == SOCK_RAW) ? 3678348SEric.Yu@Sun.COM EOPNOTSUPP : EINVAL); 3688348SEric.Yu@Sun.COM } 3698348SEric.Yu@Sun.COM 3708348SEric.Yu@Sun.COM if ((error = so_acceptq_dequeue(so, (fflag & (FNONBLOCK|FNDELAY)), 3718348SEric.Yu@Sun.COM &nso)) == 0) { 3728348SEric.Yu@Sun.COM ASSERT(nso != NULL); 3738348SEric.Yu@Sun.COM 3748348SEric.Yu@Sun.COM /* finish the accept */ 3758348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_accept)(so->so_proto_handle, 3768348SEric.Yu@Sun.COM nso->so_proto_handle, (sock_upper_handle_t)nso, cr); 3778348SEric.Yu@Sun.COM if (error != 0) { 3788348SEric.Yu@Sun.COM (void) socket_close(nso, 0, cr); 3798348SEric.Yu@Sun.COM socket_destroy(nso); 3808348SEric.Yu@Sun.COM } else { 3818348SEric.Yu@Sun.COM *nsop = nso; 3828348SEric.Yu@Sun.COM } 3838348SEric.Yu@Sun.COM } 3848348SEric.Yu@Sun.COM 3858348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 3868348SEric.Yu@Sun.COM return (error); 3878348SEric.Yu@Sun.COM } 3888348SEric.Yu@Sun.COM 3898348SEric.Yu@Sun.COM int 3908348SEric.Yu@Sun.COM so_sendmsg(struct sonode *so, struct nmsghdr *msg, struct uio *uiop, 3918348SEric.Yu@Sun.COM struct cred *cr) 3928348SEric.Yu@Sun.COM { 3938348SEric.Yu@Sun.COM int error, flags; 3948348SEric.Yu@Sun.COM boolean_t dontblock; 3958348SEric.Yu@Sun.COM ssize_t orig_resid; 3968348SEric.Yu@Sun.COM mblk_t *mp; 3978348SEric.Yu@Sun.COM 3988348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_SENDMSG(so, msg, uiop, cr)); 3998348SEric.Yu@Sun.COM 4008348SEric.Yu@Sun.COM flags = msg->msg_flags; 4018348SEric.Yu@Sun.COM error = 0; 4028348SEric.Yu@Sun.COM dontblock = (flags & MSG_DONTWAIT) || 4038348SEric.Yu@Sun.COM (uiop->uio_fmode & (FNONBLOCK|FNDELAY)); 4048348SEric.Yu@Sun.COM 4058348SEric.Yu@Sun.COM if (!(flags & MSG_XPG4_2) && msg->msg_controllen != 0) { 4068348SEric.Yu@Sun.COM /* 4078348SEric.Yu@Sun.COM * Old way of passing fd's is not supported 4088348SEric.Yu@Sun.COM */ 4098348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 4108348SEric.Yu@Sun.COM return (EOPNOTSUPP); 4118348SEric.Yu@Sun.COM } 4128348SEric.Yu@Sun.COM 4138348SEric.Yu@Sun.COM if ((so->so_mode & SM_ATOMIC) && 4148348SEric.Yu@Sun.COM uiop->uio_resid > so->so_proto_props.sopp_maxpsz && 4158348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxpsz != -1) { 4168348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 4178348SEric.Yu@Sun.COM return (EMSGSIZE); 4188348SEric.Yu@Sun.COM } 4198348SEric.Yu@Sun.COM 4208348SEric.Yu@Sun.COM /* 4218348SEric.Yu@Sun.COM * For atomic sends we will only do one iteration. 4228348SEric.Yu@Sun.COM */ 4238348SEric.Yu@Sun.COM do { 4248348SEric.Yu@Sun.COM if (so->so_state & SS_CANTSENDMORE) { 4258348SEric.Yu@Sun.COM error = EPIPE; 4268348SEric.Yu@Sun.COM break; 4278348SEric.Yu@Sun.COM } 4288348SEric.Yu@Sun.COM 4298348SEric.Yu@Sun.COM if (so->so_error != 0) { 4308348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 4318348SEric.Yu@Sun.COM error = sogeterr(so, B_TRUE); 4328348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 4338348SEric.Yu@Sun.COM if (error != 0) 4348348SEric.Yu@Sun.COM break; 4358348SEric.Yu@Sun.COM } 4368348SEric.Yu@Sun.COM 4378348SEric.Yu@Sun.COM /* 4388348SEric.Yu@Sun.COM * Send down OOB messages even if the send path is being 4398348SEric.Yu@Sun.COM * flow controlled (assuming the protocol supports OOB data). 4408348SEric.Yu@Sun.COM */ 4418348SEric.Yu@Sun.COM if (flags & MSG_OOB) { 4428348SEric.Yu@Sun.COM if ((so->so_mode & SM_EXDATA) == 0) { 4438348SEric.Yu@Sun.COM error = EOPNOTSUPP; 4448348SEric.Yu@Sun.COM break; 4458348SEric.Yu@Sun.COM } 4468348SEric.Yu@Sun.COM } else if (so->so_snd_qfull) { 4478348SEric.Yu@Sun.COM /* 4488348SEric.Yu@Sun.COM * Need to wait until the protocol is ready to receive 4498348SEric.Yu@Sun.COM * more data for transmission. 4508348SEric.Yu@Sun.COM */ 4518348SEric.Yu@Sun.COM if ((error = so_snd_wait_qnotfull(so, dontblock)) != 0) 4528348SEric.Yu@Sun.COM break; 4538348SEric.Yu@Sun.COM } 4548348SEric.Yu@Sun.COM 4558348SEric.Yu@Sun.COM /* 4568348SEric.Yu@Sun.COM * Time to send data to the protocol. We either copy the 4578348SEric.Yu@Sun.COM * data into mblks or pass the uio directly to the protocol. 4588348SEric.Yu@Sun.COM * We decide what to do based on the available down calls. 4598348SEric.Yu@Sun.COM */ 4608348SEric.Yu@Sun.COM if (so->so_downcalls->sd_send_uio != NULL) { 4618348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_send_uio) 4628348SEric.Yu@Sun.COM (so->so_proto_handle, uiop, msg, cr); 4638348SEric.Yu@Sun.COM if (error != 0) 4648348SEric.Yu@Sun.COM break; 4658348SEric.Yu@Sun.COM } else { 4668348SEric.Yu@Sun.COM /* save the resid in case of failure */ 4678348SEric.Yu@Sun.COM orig_resid = uiop->uio_resid; 4688348SEric.Yu@Sun.COM 4698348SEric.Yu@Sun.COM if ((mp = socopyinuio(uiop, 4708348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxpsz, 4718348SEric.Yu@Sun.COM so->so_proto_props.sopp_wroff, 4728348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxblk, 4738778SErik.Nordmark@Sun.COM so->so_proto_props.sopp_tail, &error, 4748778SErik.Nordmark@Sun.COM cr)) == NULL) { 4758348SEric.Yu@Sun.COM break; 4768348SEric.Yu@Sun.COM } 4778348SEric.Yu@Sun.COM ASSERT(uiop->uio_resid >= 0); 4788348SEric.Yu@Sun.COM 4798348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_send) 4808348SEric.Yu@Sun.COM (so->so_proto_handle, mp, msg, cr); 4818348SEric.Yu@Sun.COM if (error != 0) { 4828348SEric.Yu@Sun.COM /* 4838348SEric.Yu@Sun.COM * The send failed. We do not have to free the 4848348SEric.Yu@Sun.COM * mblks, because that is the protocol's 4858348SEric.Yu@Sun.COM * responsibility. However, uio_resid must 4868348SEric.Yu@Sun.COM * remain accurate, so adjust that here. 4878348SEric.Yu@Sun.COM */ 4888348SEric.Yu@Sun.COM uiop->uio_resid = orig_resid; 4898348SEric.Yu@Sun.COM break; 4908348SEric.Yu@Sun.COM } 4918348SEric.Yu@Sun.COM } 4928348SEric.Yu@Sun.COM } while (uiop->uio_resid > 0); 4938348SEric.Yu@Sun.COM 4948348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 4958348SEric.Yu@Sun.COM 4968348SEric.Yu@Sun.COM return (error); 4978348SEric.Yu@Sun.COM } 4988348SEric.Yu@Sun.COM 4998348SEric.Yu@Sun.COM int 5008348SEric.Yu@Sun.COM so_sendmblk(struct sonode *so, struct nmsghdr *msg, int fflag, 5018348SEric.Yu@Sun.COM struct cred *cr, mblk_t **mpp) 5028348SEric.Yu@Sun.COM { 5038348SEric.Yu@Sun.COM int error; 5048348SEric.Yu@Sun.COM boolean_t dontblock; 5058348SEric.Yu@Sun.COM size_t size; 5068348SEric.Yu@Sun.COM mblk_t *mp = *mpp; 5078348SEric.Yu@Sun.COM 5088348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_SENDMBLK(so, msg, fflag, cr, mpp)); 5098348SEric.Yu@Sun.COM 5108348SEric.Yu@Sun.COM error = 0; 5118348SEric.Yu@Sun.COM dontblock = (msg->msg_flags & MSG_DONTWAIT) || 5128348SEric.Yu@Sun.COM (fflag & (FNONBLOCK|FNDELAY)); 5138348SEric.Yu@Sun.COM size = msgdsize(mp); 5148348SEric.Yu@Sun.COM 5158401SAnders.Persson@Sun.COM if ((so->so_mode & SM_SENDFILESUPP) == 0 || 5168401SAnders.Persson@Sun.COM so->so_downcalls->sd_send == NULL) { 5178348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 5188348SEric.Yu@Sun.COM return (EOPNOTSUPP); 5198348SEric.Yu@Sun.COM } 5208348SEric.Yu@Sun.COM 5218348SEric.Yu@Sun.COM if ((so->so_mode & SM_ATOMIC) && 5228348SEric.Yu@Sun.COM size > so->so_proto_props.sopp_maxpsz && 5238348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxpsz != -1) { 5248348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 5258348SEric.Yu@Sun.COM return (EMSGSIZE); 5268348SEric.Yu@Sun.COM } 5278348SEric.Yu@Sun.COM 5288348SEric.Yu@Sun.COM while (mp != NULL) { 5298348SEric.Yu@Sun.COM mblk_t *nmp, *last_mblk; 5308348SEric.Yu@Sun.COM size_t mlen; 5318348SEric.Yu@Sun.COM 5328348SEric.Yu@Sun.COM if (so->so_state & SS_CANTSENDMORE) { 5338348SEric.Yu@Sun.COM error = EPIPE; 5348348SEric.Yu@Sun.COM break; 5358348SEric.Yu@Sun.COM } 5368348SEric.Yu@Sun.COM if (so->so_error != 0) { 5378348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 5388348SEric.Yu@Sun.COM error = sogeterr(so, B_TRUE); 5398348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 5408348SEric.Yu@Sun.COM if (error != 0) 5418348SEric.Yu@Sun.COM break; 5428348SEric.Yu@Sun.COM } 5438348SEric.Yu@Sun.COM if (so->so_snd_qfull) { 5448348SEric.Yu@Sun.COM /* 5458348SEric.Yu@Sun.COM * Need to wait until the protocol is ready to receive 5468348SEric.Yu@Sun.COM * more data for transmission. 5478348SEric.Yu@Sun.COM */ 5488348SEric.Yu@Sun.COM if ((error = so_snd_wait_qnotfull(so, dontblock)) != 0) 5498348SEric.Yu@Sun.COM break; 5508348SEric.Yu@Sun.COM } 5518348SEric.Yu@Sun.COM 5528348SEric.Yu@Sun.COM /* 5538348SEric.Yu@Sun.COM * We only allow so_maxpsz of data to be sent down to 5548348SEric.Yu@Sun.COM * the protocol at time. 5558348SEric.Yu@Sun.COM */ 5568348SEric.Yu@Sun.COM mlen = MBLKL(mp); 5578348SEric.Yu@Sun.COM nmp = mp->b_cont; 5588348SEric.Yu@Sun.COM last_mblk = mp; 5598348SEric.Yu@Sun.COM while (nmp != NULL) { 5608348SEric.Yu@Sun.COM mlen += MBLKL(nmp); 5618348SEric.Yu@Sun.COM if (mlen > so->so_proto_props.sopp_maxpsz) { 5628348SEric.Yu@Sun.COM last_mblk->b_cont = NULL; 5638348SEric.Yu@Sun.COM break; 5648348SEric.Yu@Sun.COM } 5658348SEric.Yu@Sun.COM last_mblk = nmp; 5668348SEric.Yu@Sun.COM nmp = nmp->b_cont; 5678348SEric.Yu@Sun.COM } 5688348SEric.Yu@Sun.COM 5698348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_send) 5708348SEric.Yu@Sun.COM (so->so_proto_handle, mp, msg, cr); 5718348SEric.Yu@Sun.COM if (error != 0) { 5728348SEric.Yu@Sun.COM /* 5738348SEric.Yu@Sun.COM * The send failed. The protocol will free the mblks 5748348SEric.Yu@Sun.COM * that were sent down. Let the caller deal with the 5758348SEric.Yu@Sun.COM * rest. 5768348SEric.Yu@Sun.COM */ 5778348SEric.Yu@Sun.COM *mpp = nmp; 5788348SEric.Yu@Sun.COM break; 5798348SEric.Yu@Sun.COM } 5808348SEric.Yu@Sun.COM 5818348SEric.Yu@Sun.COM *mpp = mp = nmp; 5828348SEric.Yu@Sun.COM } 5838348SEric.Yu@Sun.COM 5848348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 5858348SEric.Yu@Sun.COM 5868348SEric.Yu@Sun.COM return (error); 5878348SEric.Yu@Sun.COM } 5888348SEric.Yu@Sun.COM 5898348SEric.Yu@Sun.COM int 5908348SEric.Yu@Sun.COM so_shutdown(struct sonode *so, int how, struct cred *cr) 5918348SEric.Yu@Sun.COM { 5928348SEric.Yu@Sun.COM int error; 5938348SEric.Yu@Sun.COM 5948348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_SHUTDOWN(so, how, cr)); 5958348SEric.Yu@Sun.COM 5968348SEric.Yu@Sun.COM /* 5978348SEric.Yu@Sun.COM * SunOS 4.X has no check for datagram sockets. 5988348SEric.Yu@Sun.COM * 5.X checks that it is connected (ENOTCONN) 5998348SEric.Yu@Sun.COM * X/Open requires that we check the connected state. 6008348SEric.Yu@Sun.COM */ 6018348SEric.Yu@Sun.COM if (!(so->so_state & SS_ISCONNECTED)) { 6028348SEric.Yu@Sun.COM if (!xnet_skip_checks) { 6038348SEric.Yu@Sun.COM error = ENOTCONN; 6048348SEric.Yu@Sun.COM if (xnet_check_print) { 6058348SEric.Yu@Sun.COM printf("sockfs: X/Open shutdown check " 6068348SEric.Yu@Sun.COM "caused ENOTCONN\n"); 6078348SEric.Yu@Sun.COM } 6088348SEric.Yu@Sun.COM } 6098348SEric.Yu@Sun.COM goto done; 6108348SEric.Yu@Sun.COM } 6118348SEric.Yu@Sun.COM 6128348SEric.Yu@Sun.COM error = ((*so->so_downcalls->sd_shutdown)(so->so_proto_handle, 6138348SEric.Yu@Sun.COM how, cr)); 6148348SEric.Yu@Sun.COM 6158348SEric.Yu@Sun.COM /* 6168348SEric.Yu@Sun.COM * Protocol agreed to shutdown. We need to flush the 6178348SEric.Yu@Sun.COM * receive buffer if the receive side is being shutdown. 6188348SEric.Yu@Sun.COM */ 6198348SEric.Yu@Sun.COM if (error == 0 && how != SHUT_WR) { 6208348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 6218348SEric.Yu@Sun.COM /* wait for active reader to finish */ 6228348SEric.Yu@Sun.COM (void) so_lock_read(so, 0); 6238348SEric.Yu@Sun.COM 6248348SEric.Yu@Sun.COM so_rcv_flush(so); 6258348SEric.Yu@Sun.COM 6268348SEric.Yu@Sun.COM so_unlock_read(so); 6278348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 6288348SEric.Yu@Sun.COM } 6298348SEric.Yu@Sun.COM 6308348SEric.Yu@Sun.COM done: 6318348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 6328348SEric.Yu@Sun.COM return (error); 6338348SEric.Yu@Sun.COM } 6348348SEric.Yu@Sun.COM 6358348SEric.Yu@Sun.COM int 6368348SEric.Yu@Sun.COM so_getsockname(struct sonode *so, struct sockaddr *addr, 6378348SEric.Yu@Sun.COM socklen_t *addrlen, struct cred *cr) 6388348SEric.Yu@Sun.COM { 6398348SEric.Yu@Sun.COM int error; 6408348SEric.Yu@Sun.COM 6418348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_GETSOCKNAME(so, addr, addrlen, cr)); 6428348SEric.Yu@Sun.COM 6438348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_getsockname) 6448348SEric.Yu@Sun.COM (so->so_proto_handle, addr, addrlen, cr); 6458348SEric.Yu@Sun.COM 6468348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 6478348SEric.Yu@Sun.COM return (error); 6488348SEric.Yu@Sun.COM } 6498348SEric.Yu@Sun.COM 6508348SEric.Yu@Sun.COM int 6518348SEric.Yu@Sun.COM so_getpeername(struct sonode *so, struct sockaddr *addr, 6528348SEric.Yu@Sun.COM socklen_t *addrlen, boolean_t accept, struct cred *cr) 6538348SEric.Yu@Sun.COM { 6548348SEric.Yu@Sun.COM int error; 6558348SEric.Yu@Sun.COM 6568348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_GETPEERNAME(so, addr, addrlen, accept, cr)); 6578348SEric.Yu@Sun.COM 6588348SEric.Yu@Sun.COM if (accept) { 6598348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_getpeername) 6608348SEric.Yu@Sun.COM (so->so_proto_handle, addr, addrlen, cr); 6618348SEric.Yu@Sun.COM } else if (!(so->so_state & SS_ISCONNECTED)) { 6628348SEric.Yu@Sun.COM error = ENOTCONN; 6638348SEric.Yu@Sun.COM } else if ((so->so_state & SS_CANTSENDMORE) && !xnet_skip_checks) { 6648348SEric.Yu@Sun.COM /* Added this check for X/Open */ 6658348SEric.Yu@Sun.COM error = EINVAL; 6668348SEric.Yu@Sun.COM if (xnet_check_print) { 6678348SEric.Yu@Sun.COM printf("sockfs: X/Open getpeername check => EINVAL\n"); 6688348SEric.Yu@Sun.COM } 6698348SEric.Yu@Sun.COM } else { 6708348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_getpeername) 6718348SEric.Yu@Sun.COM (so->so_proto_handle, addr, addrlen, cr); 6728348SEric.Yu@Sun.COM } 6738348SEric.Yu@Sun.COM 6748348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 6758348SEric.Yu@Sun.COM return (error); 6768348SEric.Yu@Sun.COM } 6778348SEric.Yu@Sun.COM 6788348SEric.Yu@Sun.COM int 6798348SEric.Yu@Sun.COM so_getsockopt(struct sonode *so, int level, int option_name, 6808348SEric.Yu@Sun.COM void *optval, socklen_t *optlenp, int flags, struct cred *cr) 6818348SEric.Yu@Sun.COM { 6828348SEric.Yu@Sun.COM int error = 0; 6838348SEric.Yu@Sun.COM 6848348SEric.Yu@Sun.COM ASSERT(MUTEX_NOT_HELD(&so->so_lock)); 6858348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, 6868348SEric.Yu@Sun.COM SOP_GETSOCKOPT(so, level, option_name, optval, optlenp, flags, cr)); 6878348SEric.Yu@Sun.COM 6888465SEric.Yu@Sun.COM error = socket_getopt_common(so, level, option_name, optval, optlenp, 6898465SEric.Yu@Sun.COM flags); 6908348SEric.Yu@Sun.COM if (error < 0) { 6918348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_getsockopt) 6928348SEric.Yu@Sun.COM (so->so_proto_handle, level, option_name, optval, optlenp, 6938348SEric.Yu@Sun.COM cr); 6948348SEric.Yu@Sun.COM if (error == ENOPROTOOPT) { 6958348SEric.Yu@Sun.COM if (level == SOL_SOCKET) { 6968348SEric.Yu@Sun.COM /* 6978348SEric.Yu@Sun.COM * If a protocol does not support a particular 6988348SEric.Yu@Sun.COM * socket option, set can fail (not allowed) 6998348SEric.Yu@Sun.COM * but get can not fail. This is the previous 7008348SEric.Yu@Sun.COM * sockfs bahvior. 7018348SEric.Yu@Sun.COM */ 7028348SEric.Yu@Sun.COM switch (option_name) { 7038348SEric.Yu@Sun.COM case SO_LINGER: 7048348SEric.Yu@Sun.COM if (*optlenp < (t_uscalar_t) 7058348SEric.Yu@Sun.COM sizeof (struct linger)) { 7068348SEric.Yu@Sun.COM error = EINVAL; 7078348SEric.Yu@Sun.COM break; 7088348SEric.Yu@Sun.COM } 7098348SEric.Yu@Sun.COM error = 0; 7108348SEric.Yu@Sun.COM bzero(optval, sizeof (struct linger)); 7118348SEric.Yu@Sun.COM *optlenp = sizeof (struct linger); 7128348SEric.Yu@Sun.COM break; 7138348SEric.Yu@Sun.COM case SO_RCVTIMEO: 7148348SEric.Yu@Sun.COM case SO_SNDTIMEO: 7158348SEric.Yu@Sun.COM if (*optlenp < (t_uscalar_t) 7168348SEric.Yu@Sun.COM sizeof (struct timeval)) { 7178348SEric.Yu@Sun.COM error = EINVAL; 7188348SEric.Yu@Sun.COM break; 7198348SEric.Yu@Sun.COM } 7208348SEric.Yu@Sun.COM error = 0; 7218348SEric.Yu@Sun.COM bzero(optval, sizeof (struct timeval)); 7228348SEric.Yu@Sun.COM *optlenp = sizeof (struct timeval); 7238348SEric.Yu@Sun.COM break; 7248348SEric.Yu@Sun.COM case SO_SND_BUFINFO: 7258348SEric.Yu@Sun.COM if (*optlenp < (t_uscalar_t) 7268348SEric.Yu@Sun.COM sizeof (struct so_snd_bufinfo)) { 7278348SEric.Yu@Sun.COM error = EINVAL; 7288348SEric.Yu@Sun.COM break; 7298348SEric.Yu@Sun.COM } 7308348SEric.Yu@Sun.COM error = 0; 7318348SEric.Yu@Sun.COM bzero(optval, 7328348SEric.Yu@Sun.COM sizeof (struct so_snd_bufinfo)); 7338348SEric.Yu@Sun.COM *optlenp = 7348348SEric.Yu@Sun.COM sizeof (struct so_snd_bufinfo); 7358348SEric.Yu@Sun.COM break; 7368348SEric.Yu@Sun.COM case SO_DEBUG: 7378348SEric.Yu@Sun.COM case SO_REUSEADDR: 7388348SEric.Yu@Sun.COM case SO_KEEPALIVE: 7398348SEric.Yu@Sun.COM case SO_DONTROUTE: 7408348SEric.Yu@Sun.COM case SO_BROADCAST: 7418348SEric.Yu@Sun.COM case SO_USELOOPBACK: 7428348SEric.Yu@Sun.COM case SO_OOBINLINE: 7438348SEric.Yu@Sun.COM case SO_DGRAM_ERRIND: 7448348SEric.Yu@Sun.COM case SO_SNDBUF: 7458348SEric.Yu@Sun.COM case SO_RCVBUF: 7468348SEric.Yu@Sun.COM error = 0; 7478348SEric.Yu@Sun.COM *((int32_t *)optval) = 0; 7488348SEric.Yu@Sun.COM *optlenp = sizeof (int32_t); 7498348SEric.Yu@Sun.COM break; 7508348SEric.Yu@Sun.COM default: 7518348SEric.Yu@Sun.COM break; 7528348SEric.Yu@Sun.COM } 7538348SEric.Yu@Sun.COM } 7548348SEric.Yu@Sun.COM } 7558348SEric.Yu@Sun.COM } 7568348SEric.Yu@Sun.COM 7578348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 7588348SEric.Yu@Sun.COM return (error); 7598348SEric.Yu@Sun.COM } 7608348SEric.Yu@Sun.COM 7618348SEric.Yu@Sun.COM int 7628348SEric.Yu@Sun.COM so_setsockopt(struct sonode *so, int level, int option_name, 7638348SEric.Yu@Sun.COM const void *optval, socklen_t optlen, struct cred *cr) 7648348SEric.Yu@Sun.COM { 7658348SEric.Yu@Sun.COM int error = 0; 7668612SAnders.Persson@Sun.COM struct timeval tl; 7678612SAnders.Persson@Sun.COM const void *opt = optval; 7688348SEric.Yu@Sun.COM 7698348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, 7708348SEric.Yu@Sun.COM SOP_SETSOCKOPT(so, level, option_name, optval, optlen, cr)); 7718348SEric.Yu@Sun.COM 7728348SEric.Yu@Sun.COM /* X/Open requires this check */ 7738348SEric.Yu@Sun.COM if (so->so_state & SS_CANTSENDMORE && !xnet_skip_checks) { 7748348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 7758348SEric.Yu@Sun.COM if (xnet_check_print) 7768348SEric.Yu@Sun.COM printf("sockfs: X/Open setsockopt check => EINVAL\n"); 7778348SEric.Yu@Sun.COM return (EINVAL); 7788348SEric.Yu@Sun.COM } 7798348SEric.Yu@Sun.COM 7808465SEric.Yu@Sun.COM if (level == SOL_SOCKET) { 7818465SEric.Yu@Sun.COM switch (option_name) { 7828465SEric.Yu@Sun.COM case SO_RCVTIMEO: 7838465SEric.Yu@Sun.COM case SO_SNDTIMEO: { 7848586Sshenjian /* 7858586Sshenjian * We pass down these two options to protocol in order 7868586Sshenjian * to support some third part protocols which need to 7878586Sshenjian * know them. For those protocols which don't care 7888586Sshenjian * these two options, simply return 0. 7898586Sshenjian */ 7908465SEric.Yu@Sun.COM clock_t t_usec; 7918348SEric.Yu@Sun.COM 7928575Sshenjian if (get_udatamodel() == DATAMODEL_NONE || 7938575Sshenjian get_udatamodel() == DATAMODEL_NATIVE) { 7948489Sshenjian if (optlen != sizeof (struct timeval)) { 7958489Sshenjian error = EINVAL; 7968489Sshenjian goto done; 7978489Sshenjian } 7988489Sshenjian bcopy((struct timeval *)optval, &tl, 7998489Sshenjian sizeof (struct timeval)); 8008489Sshenjian } else { 8018489Sshenjian if (optlen != sizeof (struct timeval32)) { 8028489Sshenjian error = EINVAL; 8038489Sshenjian goto done; 8048489Sshenjian } 8058489Sshenjian TIMEVAL32_TO_TIMEVAL(&tl, 8068489Sshenjian (struct timeval32 *)optval); 8078465SEric.Yu@Sun.COM } 8088612SAnders.Persson@Sun.COM opt = &tl; 8098612SAnders.Persson@Sun.COM optlen = sizeof (tl); 8108489Sshenjian t_usec = tl.tv_sec * 1000 * 1000 + tl.tv_usec; 8118465SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 8128465SEric.Yu@Sun.COM if (option_name == SO_RCVTIMEO) 8138465SEric.Yu@Sun.COM so->so_rcvtimeo = drv_usectohz(t_usec); 8148465SEric.Yu@Sun.COM else 8158465SEric.Yu@Sun.COM so->so_sndtimeo = drv_usectohz(t_usec); 8168465SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 8178586Sshenjian break; 8188348SEric.Yu@Sun.COM } 8198465SEric.Yu@Sun.COM case SO_RCVBUF: 8208465SEric.Yu@Sun.COM /* 8218465SEric.Yu@Sun.COM * XXX XPG 4.2 applications retrieve SO_RCVBUF from 8228465SEric.Yu@Sun.COM * sockfs since the transport might adjust the value 8238465SEric.Yu@Sun.COM * and not return exactly what was set by the 8248465SEric.Yu@Sun.COM * application. 8258465SEric.Yu@Sun.COM */ 8268465SEric.Yu@Sun.COM so->so_xpg_rcvbuf = *(int32_t *)optval; 8278465SEric.Yu@Sun.COM break; 8288465SEric.Yu@Sun.COM } 8298348SEric.Yu@Sun.COM } 8308348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_setsockopt) 8318612SAnders.Persson@Sun.COM (so->so_proto_handle, level, option_name, opt, optlen, cr); 8328489Sshenjian done: 8338348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 8348348SEric.Yu@Sun.COM return (error); 8358348SEric.Yu@Sun.COM } 8368348SEric.Yu@Sun.COM 8378348SEric.Yu@Sun.COM int 8388348SEric.Yu@Sun.COM so_ioctl(struct sonode *so, int cmd, intptr_t arg, int mode, 8398348SEric.Yu@Sun.COM struct cred *cr, int32_t *rvalp) 8408348SEric.Yu@Sun.COM { 8418348SEric.Yu@Sun.COM int error = 0; 8428348SEric.Yu@Sun.COM 8438348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_IOCTL(so, cmd, arg, mode, cr, rvalp)); 8448348SEric.Yu@Sun.COM 8458348SEric.Yu@Sun.COM /* 8468348SEric.Yu@Sun.COM * If there is a pending error, return error 8478348SEric.Yu@Sun.COM * This can happen if a non blocking operation caused an error. 8488348SEric.Yu@Sun.COM */ 8498348SEric.Yu@Sun.COM if (so->so_error != 0) { 8508348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 8518348SEric.Yu@Sun.COM error = sogeterr(so, B_TRUE); 8528348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 8538348SEric.Yu@Sun.COM if (error != 0) 8548348SEric.Yu@Sun.COM goto done; 8558348SEric.Yu@Sun.COM } 8568348SEric.Yu@Sun.COM 8578348SEric.Yu@Sun.COM /* 8588348SEric.Yu@Sun.COM * calling strioc can result in the socket falling back to TPI, 8598348SEric.Yu@Sun.COM * if that is supported. 8608348SEric.Yu@Sun.COM */ 8618348SEric.Yu@Sun.COM if ((error = socket_ioctl_common(so, cmd, arg, mode, cr, rvalp)) < 0 && 8628348SEric.Yu@Sun.COM (error = socket_strioc_common(so, cmd, arg, mode, cr, rvalp)) < 0) { 8638348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_ioctl)(so->so_proto_handle, 8648348SEric.Yu@Sun.COM cmd, arg, mode, rvalp, cr); 8658348SEric.Yu@Sun.COM } 8668348SEric.Yu@Sun.COM 8678348SEric.Yu@Sun.COM done: 8688348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 8698348SEric.Yu@Sun.COM 8708348SEric.Yu@Sun.COM return (error); 8718348SEric.Yu@Sun.COM } 8728348SEric.Yu@Sun.COM 8738348SEric.Yu@Sun.COM int 8748348SEric.Yu@Sun.COM so_poll(struct sonode *so, short events, int anyyet, short *reventsp, 8758348SEric.Yu@Sun.COM struct pollhead **phpp) 8768348SEric.Yu@Sun.COM { 8778348SEric.Yu@Sun.COM int state = so->so_state; 8788348SEric.Yu@Sun.COM *reventsp = 0; 8798348SEric.Yu@Sun.COM 8808348SEric.Yu@Sun.COM if (so->so_error != 0 && 8818348SEric.Yu@Sun.COM ((POLLIN|POLLRDNORM|POLLOUT) & events) != 0) { 8828348SEric.Yu@Sun.COM *reventsp = (POLLIN|POLLRDNORM|POLLOUT) & events; 8838348SEric.Yu@Sun.COM return (0); 8848348SEric.Yu@Sun.COM } 8858348SEric.Yu@Sun.COM 8868348SEric.Yu@Sun.COM /* 8878348SEric.Yu@Sun.COM * As long as there is buffer to send data, and the socket is 8888348SEric.Yu@Sun.COM * in a state where it can send data (i.e., connected for 8898348SEric.Yu@Sun.COM * connection oriented protocols), then turn on POLLOUT events 8908348SEric.Yu@Sun.COM */ 8918348SEric.Yu@Sun.COM if (!so->so_snd_qfull && ((so->so_mode & SM_CONNREQUIRED) == 0 || 8928348SEric.Yu@Sun.COM state & SS_ISCONNECTED)) { 8938348SEric.Yu@Sun.COM *reventsp |= POLLOUT & events; 8948348SEric.Yu@Sun.COM } 8958348SEric.Yu@Sun.COM 8968348SEric.Yu@Sun.COM /* 8978348SEric.Yu@Sun.COM * Turn on POLLIN whenever there is data on the receive queue, 8988348SEric.Yu@Sun.COM * or the socket is in a state where no more data will be received. 8998348SEric.Yu@Sun.COM * Also, if the socket is accepting connections, flip the bit if 9008348SEric.Yu@Sun.COM * there is something on the queue. 9018427SAnders.Persson@Sun.COM * 9028427SAnders.Persson@Sun.COM * We do an initial check for events without holding locks. However, 9038427SAnders.Persson@Sun.COM * if there are no event available, then we redo the check for POLLIN 9048427SAnders.Persson@Sun.COM * events under the lock. 9058348SEric.Yu@Sun.COM */ 9068348SEric.Yu@Sun.COM 9078348SEric.Yu@Sun.COM /* Pending connections */ 9088348SEric.Yu@Sun.COM if (so->so_acceptq_len > 0) 9098348SEric.Yu@Sun.COM *reventsp |= (POLLIN|POLLRDNORM) & events; 9108348SEric.Yu@Sun.COM 9118348SEric.Yu@Sun.COM /* Data */ 9128348SEric.Yu@Sun.COM /* so_downcalls is null for sctp */ 9138348SEric.Yu@Sun.COM if (so->so_downcalls != NULL && so->so_downcalls->sd_poll != NULL) { 9148348SEric.Yu@Sun.COM *reventsp |= (*so->so_downcalls->sd_poll) 9158348SEric.Yu@Sun.COM (so->so_proto_handle, events & SO_PROTO_POLLEV, anyyet, 9168348SEric.Yu@Sun.COM CRED()) & events; 9178348SEric.Yu@Sun.COM ASSERT((*reventsp & ~events) == 0); 9188348SEric.Yu@Sun.COM /* do not recheck events */ 9198348SEric.Yu@Sun.COM events &= ~SO_PROTO_POLLEV; 9208348SEric.Yu@Sun.COM } else { 9218348SEric.Yu@Sun.COM if (SO_HAVE_DATA(so)) 9228348SEric.Yu@Sun.COM *reventsp |= (POLLIN|POLLRDNORM) & events; 9238348SEric.Yu@Sun.COM 9248348SEric.Yu@Sun.COM /* Urgent data */ 9258348SEric.Yu@Sun.COM if ((state & SS_OOBPEND) != 0) 9268348SEric.Yu@Sun.COM *reventsp |= (POLLRDBAND) & events; 9278348SEric.Yu@Sun.COM } 9288348SEric.Yu@Sun.COM 9298348SEric.Yu@Sun.COM if (!*reventsp && !anyyet) { 9308348SEric.Yu@Sun.COM /* Check for read events again, but this time under lock */ 9318348SEric.Yu@Sun.COM if (events & (POLLIN|POLLRDNORM)) { 9328348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 9338348SEric.Yu@Sun.COM if (SO_HAVE_DATA(so) || so->so_acceptq_len > 0) { 9348348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 9358348SEric.Yu@Sun.COM *reventsp |= (POLLIN|POLLRDNORM) & events; 9368348SEric.Yu@Sun.COM return (0); 9378348SEric.Yu@Sun.COM } else { 9388348SEric.Yu@Sun.COM so->so_pollev |= SO_POLLEV_IN; 9398348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 9408348SEric.Yu@Sun.COM } 9418348SEric.Yu@Sun.COM } 9428348SEric.Yu@Sun.COM *phpp = &so->so_poll_list; 9438348SEric.Yu@Sun.COM } 9448348SEric.Yu@Sun.COM return (0); 9458348SEric.Yu@Sun.COM } 9468348SEric.Yu@Sun.COM 9478348SEric.Yu@Sun.COM /* 9488348SEric.Yu@Sun.COM * Generic Upcalls 9498348SEric.Yu@Sun.COM */ 9508348SEric.Yu@Sun.COM void 9518348SEric.Yu@Sun.COM so_connected(sock_upper_handle_t sock_handle, sock_connid_t id, 9528348SEric.Yu@Sun.COM cred_t *peer_cred, pid_t peer_cpid) 9538348SEric.Yu@Sun.COM { 9548348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)sock_handle; 9558348SEric.Yu@Sun.COM 9568348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 9578348SEric.Yu@Sun.COM ASSERT(so->so_proto_handle != NULL); 9588348SEric.Yu@Sun.COM 9598348SEric.Yu@Sun.COM if (peer_cred != NULL) { 9608348SEric.Yu@Sun.COM if (so->so_peercred != NULL) 9618348SEric.Yu@Sun.COM crfree(so->so_peercred); 9628348SEric.Yu@Sun.COM crhold(peer_cred); 9638348SEric.Yu@Sun.COM so->so_peercred = peer_cred; 9648348SEric.Yu@Sun.COM so->so_cpid = peer_cpid; 9658348SEric.Yu@Sun.COM } 9668348SEric.Yu@Sun.COM 9678348SEric.Yu@Sun.COM so->so_proto_connid = id; 9688348SEric.Yu@Sun.COM soisconnected(so); 9698348SEric.Yu@Sun.COM /* 9708348SEric.Yu@Sun.COM * Wake ones who're waiting for conn to become established. 9718348SEric.Yu@Sun.COM */ 9728348SEric.Yu@Sun.COM so_notify_connected(so); 9738348SEric.Yu@Sun.COM } 9748348SEric.Yu@Sun.COM 9758348SEric.Yu@Sun.COM int 9768348SEric.Yu@Sun.COM so_disconnected(sock_upper_handle_t sock_handle, sock_connid_t id, int error) 9778348SEric.Yu@Sun.COM { 9788348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)sock_handle; 9798348SEric.Yu@Sun.COM 9808348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 9818348SEric.Yu@Sun.COM 9828348SEric.Yu@Sun.COM so->so_proto_connid = id; 9838348SEric.Yu@Sun.COM soisdisconnected(so, error); 9848348SEric.Yu@Sun.COM so_notify_disconnected(so, error); 9858348SEric.Yu@Sun.COM 9868348SEric.Yu@Sun.COM return (0); 9878348SEric.Yu@Sun.COM } 9888348SEric.Yu@Sun.COM 9898348SEric.Yu@Sun.COM void 9908348SEric.Yu@Sun.COM so_opctl(sock_upper_handle_t sock_handle, sock_opctl_action_t action, 9918348SEric.Yu@Sun.COM uintptr_t arg) 9928348SEric.Yu@Sun.COM { 9938348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)sock_handle; 9948348SEric.Yu@Sun.COM 9958348SEric.Yu@Sun.COM switch (action) { 9968348SEric.Yu@Sun.COM case SOCK_OPCTL_SHUT_SEND: 9978348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 9988348SEric.Yu@Sun.COM socantsendmore(so); 9998348SEric.Yu@Sun.COM so_notify_disconnecting(so); 10008348SEric.Yu@Sun.COM break; 10018348SEric.Yu@Sun.COM case SOCK_OPCTL_SHUT_RECV: { 10028348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 10038348SEric.Yu@Sun.COM socantrcvmore(so); 10048348SEric.Yu@Sun.COM so_notify_eof(so); 10058348SEric.Yu@Sun.COM break; 10068348SEric.Yu@Sun.COM } 10078348SEric.Yu@Sun.COM case SOCK_OPCTL_ENAB_ACCEPT: 10088348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 10098348SEric.Yu@Sun.COM so->so_state |= SS_ACCEPTCONN; 10108348SEric.Yu@Sun.COM so->so_backlog = (unsigned int)arg; 10118348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 10128348SEric.Yu@Sun.COM break; 10138348SEric.Yu@Sun.COM default: 10148348SEric.Yu@Sun.COM ASSERT(0); 10158348SEric.Yu@Sun.COM break; 10168348SEric.Yu@Sun.COM } 10178348SEric.Yu@Sun.COM } 10188348SEric.Yu@Sun.COM 10198348SEric.Yu@Sun.COM void 10208348SEric.Yu@Sun.COM so_txq_full(sock_upper_handle_t sock_handle, boolean_t qfull) 10218348SEric.Yu@Sun.COM { 10228348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)sock_handle; 10238348SEric.Yu@Sun.COM 10248348SEric.Yu@Sun.COM if (qfull) { 10258348SEric.Yu@Sun.COM so_snd_qfull(so); 10268348SEric.Yu@Sun.COM } else { 10278348SEric.Yu@Sun.COM so_snd_qnotfull(so); 10288348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 10298348SEric.Yu@Sun.COM so_notify_writable(so); 10308348SEric.Yu@Sun.COM } 10318348SEric.Yu@Sun.COM } 10328348SEric.Yu@Sun.COM 10338348SEric.Yu@Sun.COM sock_upper_handle_t 10348348SEric.Yu@Sun.COM so_newconn(sock_upper_handle_t parenthandle, 10358348SEric.Yu@Sun.COM sock_lower_handle_t proto_handle, sock_downcalls_t *sock_downcalls, 10368348SEric.Yu@Sun.COM struct cred *peer_cred, pid_t peer_cpid, sock_upcalls_t **sock_upcallsp) 10378348SEric.Yu@Sun.COM { 10388348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)parenthandle; 10398348SEric.Yu@Sun.COM struct sonode *nso; 10408348SEric.Yu@Sun.COM int error; 10418348SEric.Yu@Sun.COM 10428348SEric.Yu@Sun.COM ASSERT(proto_handle != NULL); 10438348SEric.Yu@Sun.COM 10448348SEric.Yu@Sun.COM if ((so->so_state & SS_ACCEPTCONN) == 0 || 10458348SEric.Yu@Sun.COM so->so_acceptq_len >= so->so_backlog) 10468348SEric.Yu@Sun.COM return (NULL); 10478348SEric.Yu@Sun.COM 10488348SEric.Yu@Sun.COM nso = socket_newconn(so, proto_handle, sock_downcalls, SOCKET_NOSLEEP, 10498348SEric.Yu@Sun.COM &error); 10508348SEric.Yu@Sun.COM if (nso == NULL) 10518348SEric.Yu@Sun.COM return (NULL); 10528348SEric.Yu@Sun.COM 10538348SEric.Yu@Sun.COM if (peer_cred != NULL) { 10548348SEric.Yu@Sun.COM crhold(peer_cred); 10558348SEric.Yu@Sun.COM nso->so_peercred = peer_cred; 10568348SEric.Yu@Sun.COM nso->so_cpid = peer_cpid; 10578348SEric.Yu@Sun.COM } 10588348SEric.Yu@Sun.COM 1059*8820SAnders.Persson@Sun.COM /* 1060*8820SAnders.Persson@Sun.COM * The new socket (nso), proto_handle and sock_upcallsp are all 1061*8820SAnders.Persson@Sun.COM * valid at this point. But as soon as nso is placed in the accept 1062*8820SAnders.Persson@Sun.COM * queue that can no longer be assumed (since an accept() thread may 1063*8820SAnders.Persson@Sun.COM * pull it off the queue and close the socket). 1064*8820SAnders.Persson@Sun.COM */ 1065*8820SAnders.Persson@Sun.COM *sock_upcallsp = &so_upcalls; 1066*8820SAnders.Persson@Sun.COM 10678348SEric.Yu@Sun.COM (void) so_acceptq_enqueue(so, nso); 1068*8820SAnders.Persson@Sun.COM 10698348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 10708348SEric.Yu@Sun.COM so_notify_newconn(so); 10718348SEric.Yu@Sun.COM 10728348SEric.Yu@Sun.COM return ((sock_upper_handle_t)nso); 10738348SEric.Yu@Sun.COM } 10748348SEric.Yu@Sun.COM 10758348SEric.Yu@Sun.COM void 10768348SEric.Yu@Sun.COM so_set_prop(sock_upper_handle_t sock_handle, struct sock_proto_props *soppp) 10778348SEric.Yu@Sun.COM { 10788348SEric.Yu@Sun.COM struct sonode *so; 10798348SEric.Yu@Sun.COM 10808348SEric.Yu@Sun.COM so = (struct sonode *)sock_handle; 10818348SEric.Yu@Sun.COM 10828348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 10838348SEric.Yu@Sun.COM 10848348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_MAXBLK) 10858348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxblk = soppp->sopp_maxblk; 10868348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_WROFF) 10878348SEric.Yu@Sun.COM so->so_proto_props.sopp_wroff = soppp->sopp_wroff; 10888348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_TAIL) 10898348SEric.Yu@Sun.COM so->so_proto_props.sopp_tail = soppp->sopp_tail; 10908348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_RCVHIWAT) 10918348SEric.Yu@Sun.COM so->so_proto_props.sopp_rxhiwat = soppp->sopp_rxhiwat; 10928348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_RCVLOWAT) 10938348SEric.Yu@Sun.COM so->so_proto_props.sopp_rxlowat = soppp->sopp_rxlowat; 10948348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_MAXPSZ) 10958348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxpsz = soppp->sopp_maxpsz; 10968348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_MINPSZ) 10978348SEric.Yu@Sun.COM so->so_proto_props.sopp_minpsz = soppp->sopp_minpsz; 10988348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_ZCOPY) { 10998348SEric.Yu@Sun.COM if (soppp->sopp_zcopyflag & ZCVMSAFE) { 11008348SEric.Yu@Sun.COM so->so_proto_props.sopp_zcopyflag |= STZCVMSAFE; 11018348SEric.Yu@Sun.COM so->so_proto_props.sopp_zcopyflag &= ~STZCVMUNSAFE; 11028348SEric.Yu@Sun.COM } else if (soppp->sopp_zcopyflag & ZCVMUNSAFE) { 11038348SEric.Yu@Sun.COM so->so_proto_props.sopp_zcopyflag |= STZCVMUNSAFE; 11048348SEric.Yu@Sun.COM so->so_proto_props.sopp_zcopyflag &= ~STZCVMSAFE; 11058348SEric.Yu@Sun.COM } 11068348SEric.Yu@Sun.COM 11078348SEric.Yu@Sun.COM if (soppp->sopp_zcopyflag & COPYCACHED) { 11088348SEric.Yu@Sun.COM so->so_proto_props.sopp_zcopyflag |= STRCOPYCACHED; 11098348SEric.Yu@Sun.COM } 11108348SEric.Yu@Sun.COM } 11118348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_OOBINLINE) 11128348SEric.Yu@Sun.COM so->so_proto_props.sopp_oobinline = soppp->sopp_oobinline; 11138348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_RCVTIMER) 11148348SEric.Yu@Sun.COM so->so_proto_props.sopp_rcvtimer = soppp->sopp_rcvtimer; 11158348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_RCVTHRESH) 11168348SEric.Yu@Sun.COM so->so_proto_props.sopp_rcvthresh = soppp->sopp_rcvthresh; 11178348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_MAXADDRLEN) 11188348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxaddrlen = soppp->sopp_maxaddrlen; 11198348SEric.Yu@Sun.COM 11208348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 11218348SEric.Yu@Sun.COM 11228348SEric.Yu@Sun.COM #ifdef DEBUG 11238348SEric.Yu@Sun.COM soppp->sopp_flags &= ~(SOCKOPT_MAXBLK | SOCKOPT_WROFF | SOCKOPT_TAIL | 11248348SEric.Yu@Sun.COM SOCKOPT_RCVHIWAT | SOCKOPT_RCVLOWAT | SOCKOPT_MAXPSZ | 11258348SEric.Yu@Sun.COM SOCKOPT_ZCOPY | SOCKOPT_OOBINLINE | SOCKOPT_RCVTIMER | 11268348SEric.Yu@Sun.COM SOCKOPT_RCVTHRESH | SOCKOPT_MAXADDRLEN | SOCKOPT_MINPSZ); 11278348SEric.Yu@Sun.COM ASSERT(soppp->sopp_flags == 0); 11288348SEric.Yu@Sun.COM #endif 11298348SEric.Yu@Sun.COM } 11308348SEric.Yu@Sun.COM 11318348SEric.Yu@Sun.COM /* ARGSUSED */ 11328348SEric.Yu@Sun.COM ssize_t 11338348SEric.Yu@Sun.COM so_queue_msg(sock_upper_handle_t sock_handle, mblk_t *mp, 11348348SEric.Yu@Sun.COM size_t msg_size, int flags, int *errorp, boolean_t *force_pushp) 11358348SEric.Yu@Sun.COM { 11368348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)sock_handle; 11378348SEric.Yu@Sun.COM boolean_t force_push = B_TRUE; 11388348SEric.Yu@Sun.COM int space_left; 11398348SEric.Yu@Sun.COM sodirect_t *sodp = so->so_direct; 11408348SEric.Yu@Sun.COM 11418348SEric.Yu@Sun.COM ASSERT(errorp != NULL); 11428348SEric.Yu@Sun.COM *errorp = 0; 11438348SEric.Yu@Sun.COM if (mp == NULL) { 11448348SEric.Yu@Sun.COM if (msg_size > 0) { 11458348SEric.Yu@Sun.COM ASSERT(so->so_downcalls->sd_recv_uio != NULL); 11468348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 11478348SEric.Yu@Sun.COM /* the notify functions will drop the lock */ 11488348SEric.Yu@Sun.COM if (flags & MSG_OOB) 11498348SEric.Yu@Sun.COM so_notify_oobdata(so, IS_SO_OOB_INLINE(so)); 11508348SEric.Yu@Sun.COM else 11518348SEric.Yu@Sun.COM so_notify_data(so, msg_size); 11528348SEric.Yu@Sun.COM return (0); 11538348SEric.Yu@Sun.COM } 11548348SEric.Yu@Sun.COM /* 11558348SEric.Yu@Sun.COM * recv space check 11568348SEric.Yu@Sun.COM */ 11578348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 11588348SEric.Yu@Sun.COM space_left = so->so_rcvbuf - so->so_rcv_queued; 11598348SEric.Yu@Sun.COM if (space_left <= 0) { 11608348SEric.Yu@Sun.COM so->so_flowctrld = B_TRUE; 11618348SEric.Yu@Sun.COM *errorp = ENOSPC; 11628348SEric.Yu@Sun.COM space_left = -1; 11638348SEric.Yu@Sun.COM } 11648348SEric.Yu@Sun.COM goto done_unlock; 11658348SEric.Yu@Sun.COM } 11668348SEric.Yu@Sun.COM 11678348SEric.Yu@Sun.COM ASSERT(mp->b_next == NULL); 11688348SEric.Yu@Sun.COM ASSERT(DB_TYPE(mp) == M_DATA || DB_TYPE(mp) == M_PROTO); 11698348SEric.Yu@Sun.COM ASSERT(msg_size == msgdsize(mp)); 11708348SEric.Yu@Sun.COM 11718348SEric.Yu@Sun.COM if (flags & MSG_OOB) { 11728348SEric.Yu@Sun.COM so_queue_oob(sock_handle, mp, msg_size); 11738348SEric.Yu@Sun.COM return (0); 11748348SEric.Yu@Sun.COM } 11758348SEric.Yu@Sun.COM 11768348SEric.Yu@Sun.COM if (force_pushp != NULL) 11778348SEric.Yu@Sun.COM force_push = *force_pushp; 11788348SEric.Yu@Sun.COM 11798348SEric.Yu@Sun.COM if (DB_TYPE(mp) == M_PROTO && !__TPI_PRIM_ISALIGNED(mp->b_rptr)) { 11808348SEric.Yu@Sun.COM /* The read pointer is not aligned correctly for TPI */ 11818348SEric.Yu@Sun.COM zcmn_err(getzoneid(), CE_WARN, 11828348SEric.Yu@Sun.COM "sockfs: Unaligned TPI message received. rptr = %p\n", 11838348SEric.Yu@Sun.COM (void *)mp->b_rptr); 11848348SEric.Yu@Sun.COM freemsg(mp); 11858348SEric.Yu@Sun.COM mutex_enter(sodp->sod_lockp); 11868348SEric.Yu@Sun.COM SOD_UIOAFINI(sodp); 11878348SEric.Yu@Sun.COM mutex_exit(sodp->sod_lockp); 11888348SEric.Yu@Sun.COM 11898348SEric.Yu@Sun.COM return (so->so_rcvbuf - so->so_rcv_queued); 11908348SEric.Yu@Sun.COM } 11918348SEric.Yu@Sun.COM 11928348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 11938348SEric.Yu@Sun.COM if (so->so_state & (SS_FALLBACK_PENDING | SS_FALLBACK_COMP)) { 11948348SEric.Yu@Sun.COM SOD_DISABLE(sodp); 11958348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 11968348SEric.Yu@Sun.COM *errorp = EOPNOTSUPP; 11978348SEric.Yu@Sun.COM return (-1); 11988348SEric.Yu@Sun.COM } 11998348SEric.Yu@Sun.COM if (so->so_state & SS_CANTRCVMORE) { 12008348SEric.Yu@Sun.COM freemsg(mp); 12018348SEric.Yu@Sun.COM SOD_DISABLE(sodp); 12028348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 12038348SEric.Yu@Sun.COM return (0); 12048348SEric.Yu@Sun.COM } 12058348SEric.Yu@Sun.COM 12068348SEric.Yu@Sun.COM /* process the mblk via I/OAT if capable */ 12078348SEric.Yu@Sun.COM if (sodp != NULL && (sodp->sod_state & SOD_ENABLED)) { 12088348SEric.Yu@Sun.COM if (DB_TYPE(mp) == M_DATA) { 12098348SEric.Yu@Sun.COM (void) sod_uioa_mblk_init(sodp, mp, msg_size); 12108348SEric.Yu@Sun.COM } else { 12118348SEric.Yu@Sun.COM SOD_UIOAFINI(sodp); 12128348SEric.Yu@Sun.COM } 12138348SEric.Yu@Sun.COM } 12148348SEric.Yu@Sun.COM 12158348SEric.Yu@Sun.COM if (mp->b_next == NULL) { 12168348SEric.Yu@Sun.COM so_enqueue_msg(so, mp, msg_size); 12178348SEric.Yu@Sun.COM } else { 12188348SEric.Yu@Sun.COM do { 12198348SEric.Yu@Sun.COM mblk_t *nmp; 12208348SEric.Yu@Sun.COM 12218348SEric.Yu@Sun.COM if ((nmp = mp->b_next) != NULL) { 12228348SEric.Yu@Sun.COM mp->b_next = NULL; 12238348SEric.Yu@Sun.COM } 12248348SEric.Yu@Sun.COM so_enqueue_msg(so, mp, msgdsize(mp)); 12258348SEric.Yu@Sun.COM mp = nmp; 12268348SEric.Yu@Sun.COM } while (mp != NULL); 12278348SEric.Yu@Sun.COM } 12288348SEric.Yu@Sun.COM 12298348SEric.Yu@Sun.COM space_left = so->so_rcvbuf - so->so_rcv_queued; 12308348SEric.Yu@Sun.COM if (space_left <= 0) { 12318348SEric.Yu@Sun.COM so->so_flowctrld = B_TRUE; 12328348SEric.Yu@Sun.COM *errorp = ENOSPC; 12338348SEric.Yu@Sun.COM space_left = -1; 12348348SEric.Yu@Sun.COM } 12358348SEric.Yu@Sun.COM 12368348SEric.Yu@Sun.COM if (force_push || so->so_rcv_queued >= so->so_rcv_thresh || 12378348SEric.Yu@Sun.COM so->so_rcv_queued >= so->so_rcv_wanted || 12388348SEric.Yu@Sun.COM (sodp != NULL && so->so_rcv_queued >= sodp->sod_want)) { 12398348SEric.Yu@Sun.COM SOCKET_TIMER_CANCEL(so); 12408348SEric.Yu@Sun.COM /* 12418348SEric.Yu@Sun.COM * so_notify_data will release the lock 12428348SEric.Yu@Sun.COM */ 12438348SEric.Yu@Sun.COM so_notify_data(so, so->so_rcv_queued); 12448348SEric.Yu@Sun.COM 12458348SEric.Yu@Sun.COM if (force_pushp != NULL) 12468348SEric.Yu@Sun.COM *force_pushp = B_TRUE; 12478348SEric.Yu@Sun.COM goto done; 12488348SEric.Yu@Sun.COM } else if (so->so_rcv_timer_tid == 0) { 12498348SEric.Yu@Sun.COM /* Make sure the recv push timer is running */ 12508348SEric.Yu@Sun.COM SOCKET_TIMER_START(so); 12518348SEric.Yu@Sun.COM } 12528348SEric.Yu@Sun.COM 12538348SEric.Yu@Sun.COM done_unlock: 12548348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 12558348SEric.Yu@Sun.COM done: 12568348SEric.Yu@Sun.COM return (space_left); 12578348SEric.Yu@Sun.COM } 12588348SEric.Yu@Sun.COM 12598348SEric.Yu@Sun.COM /* 12608348SEric.Yu@Sun.COM * Set the offset of where the oob data is relative to the bytes in 12618348SEric.Yu@Sun.COM * queued. Also generate SIGURG 12628348SEric.Yu@Sun.COM */ 12638348SEric.Yu@Sun.COM void 12648348SEric.Yu@Sun.COM so_signal_oob(sock_upper_handle_t sock_handle, ssize_t offset) 12658348SEric.Yu@Sun.COM { 12668348SEric.Yu@Sun.COM struct sonode *so; 12678348SEric.Yu@Sun.COM 12688348SEric.Yu@Sun.COM ASSERT(offset >= 0); 12698348SEric.Yu@Sun.COM so = (struct sonode *)sock_handle; 12708348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 12718348SEric.Yu@Sun.COM SOD_UIOAFINI(so->so_direct); 12728348SEric.Yu@Sun.COM 12738348SEric.Yu@Sun.COM /* 12748348SEric.Yu@Sun.COM * New urgent data on the way so forget about any old 12758348SEric.Yu@Sun.COM * urgent data. 12768348SEric.Yu@Sun.COM */ 12778348SEric.Yu@Sun.COM so->so_state &= ~(SS_HAVEOOBDATA|SS_HADOOBDATA); 12788348SEric.Yu@Sun.COM 12798348SEric.Yu@Sun.COM /* 12808348SEric.Yu@Sun.COM * Record that urgent data is pending. 12818348SEric.Yu@Sun.COM */ 12828348SEric.Yu@Sun.COM so->so_state |= SS_OOBPEND; 12838348SEric.Yu@Sun.COM 12848348SEric.Yu@Sun.COM if (so->so_oobmsg != NULL) { 12858348SEric.Yu@Sun.COM dprintso(so, 1, ("sock: discarding old oob\n")); 12868348SEric.Yu@Sun.COM freemsg(so->so_oobmsg); 12878348SEric.Yu@Sun.COM so->so_oobmsg = NULL; 12888348SEric.Yu@Sun.COM } 12898348SEric.Yu@Sun.COM 12908348SEric.Yu@Sun.COM /* 12918348SEric.Yu@Sun.COM * set the offset where the urgent byte is 12928348SEric.Yu@Sun.COM */ 12938348SEric.Yu@Sun.COM so->so_oobmark = so->so_rcv_queued + offset; 12948348SEric.Yu@Sun.COM if (so->so_oobmark == 0) 12958348SEric.Yu@Sun.COM so->so_state |= SS_RCVATMARK; 12968348SEric.Yu@Sun.COM else 12978348SEric.Yu@Sun.COM so->so_state &= ~SS_RCVATMARK; 12988348SEric.Yu@Sun.COM 12998348SEric.Yu@Sun.COM so_notify_oobsig(so); 13008348SEric.Yu@Sun.COM } 13018348SEric.Yu@Sun.COM 13028348SEric.Yu@Sun.COM /* 13038348SEric.Yu@Sun.COM * Queue the OOB byte 13048348SEric.Yu@Sun.COM */ 13058348SEric.Yu@Sun.COM static void 13068348SEric.Yu@Sun.COM so_queue_oob(sock_upper_handle_t sock_handle, mblk_t *mp, size_t len) 13078348SEric.Yu@Sun.COM { 13088348SEric.Yu@Sun.COM struct sonode *so; 13098348SEric.Yu@Sun.COM 13108348SEric.Yu@Sun.COM so = (struct sonode *)sock_handle; 13118348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 13128348SEric.Yu@Sun.COM SOD_UIOAFINI(so->so_direct); 13138348SEric.Yu@Sun.COM 13148348SEric.Yu@Sun.COM ASSERT(mp != NULL); 13158348SEric.Yu@Sun.COM if (!IS_SO_OOB_INLINE(so)) { 13168348SEric.Yu@Sun.COM so->so_oobmsg = mp; 13178348SEric.Yu@Sun.COM so->so_state |= SS_HAVEOOBDATA; 13188348SEric.Yu@Sun.COM } else { 13198348SEric.Yu@Sun.COM so_enqueue_msg(so, mp, len); 13208348SEric.Yu@Sun.COM } 13218348SEric.Yu@Sun.COM 13228348SEric.Yu@Sun.COM so_notify_oobdata(so, IS_SO_OOB_INLINE(so)); 13238348SEric.Yu@Sun.COM } 13248348SEric.Yu@Sun.COM 13258348SEric.Yu@Sun.COM int 13268348SEric.Yu@Sun.COM so_close(struct sonode *so, int flag, struct cred *cr) 13278348SEric.Yu@Sun.COM { 13288348SEric.Yu@Sun.COM int error; 13298348SEric.Yu@Sun.COM 13308348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_close)(so->so_proto_handle, flag, cr); 13318348SEric.Yu@Sun.COM 13328348SEric.Yu@Sun.COM /* 13338348SEric.Yu@Sun.COM * At this point there will be no more upcalls from the protocol 13348348SEric.Yu@Sun.COM */ 13358348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 13368399SRao.Shoaib@Sun.COM 13378399SRao.Shoaib@Sun.COM ASSERT(so_verify_oobstate(so)); 13388399SRao.Shoaib@Sun.COM 13398348SEric.Yu@Sun.COM so_rcv_flush(so); 13408348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 13418348SEric.Yu@Sun.COM 13428348SEric.Yu@Sun.COM return (error); 13438348SEric.Yu@Sun.COM } 13448348SEric.Yu@Sun.COM 13458348SEric.Yu@Sun.COM void 13468348SEric.Yu@Sun.COM so_zcopy_notify(sock_upper_handle_t sock_handle) 13478348SEric.Yu@Sun.COM { 13488348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)sock_handle; 13498348SEric.Yu@Sun.COM 13508348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 13518348SEric.Yu@Sun.COM so->so_copyflag |= STZCNOTIFY; 13528348SEric.Yu@Sun.COM cv_broadcast(&so->so_copy_cv); 13538348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 13548348SEric.Yu@Sun.COM } 13558348SEric.Yu@Sun.COM 13568348SEric.Yu@Sun.COM void 13578348SEric.Yu@Sun.COM so_set_error(sock_upper_handle_t sock_handle, int error) 13588348SEric.Yu@Sun.COM { 13598348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)sock_handle; 13608348SEric.Yu@Sun.COM 13618348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 13628348SEric.Yu@Sun.COM 13638348SEric.Yu@Sun.COM soseterror(so, error); 13648348SEric.Yu@Sun.COM 13658348SEric.Yu@Sun.COM so_notify_error(so); 13668348SEric.Yu@Sun.COM } 13678348SEric.Yu@Sun.COM 13688348SEric.Yu@Sun.COM /* 13698348SEric.Yu@Sun.COM * so_recvmsg - read data from the socket 13708348SEric.Yu@Sun.COM * 13718348SEric.Yu@Sun.COM * There are two ways of obtaining data; either we ask the protocol to 13728348SEric.Yu@Sun.COM * copy directly into the supplied buffer, or we copy data from the 13738348SEric.Yu@Sun.COM * sonode's receive queue. The decision which one to use depends on 13748348SEric.Yu@Sun.COM * whether the protocol has a sd_recv_uio down call. 13758348SEric.Yu@Sun.COM */ 13768348SEric.Yu@Sun.COM int 13778348SEric.Yu@Sun.COM so_recvmsg(struct sonode *so, struct nmsghdr *msg, struct uio *uiop, 13788348SEric.Yu@Sun.COM struct cred *cr) 13798348SEric.Yu@Sun.COM { 13808348SEric.Yu@Sun.COM rval_t rval; 13818348SEric.Yu@Sun.COM int flags = 0; 13828348SEric.Yu@Sun.COM t_uscalar_t controllen, namelen; 13838348SEric.Yu@Sun.COM int error = 0; 13848348SEric.Yu@Sun.COM int ret; 13858348SEric.Yu@Sun.COM mblk_t *mctlp = NULL; 13868348SEric.Yu@Sun.COM union T_primitives *tpr; 13878348SEric.Yu@Sun.COM void *control; 13888348SEric.Yu@Sun.COM ssize_t saved_resid; 13898348SEric.Yu@Sun.COM struct uio *suiop; 13908348SEric.Yu@Sun.COM 13918348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_RECVMSG(so, msg, uiop, cr)); 13928348SEric.Yu@Sun.COM 13938348SEric.Yu@Sun.COM if ((so->so_state & (SS_ISCONNECTED|SS_CANTRCVMORE)) == 0 && 13948348SEric.Yu@Sun.COM (so->so_mode & SM_CONNREQUIRED)) { 13958348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 13968348SEric.Yu@Sun.COM return (ENOTCONN); 13978348SEric.Yu@Sun.COM } 13988348SEric.Yu@Sun.COM 13998348SEric.Yu@Sun.COM if (msg->msg_flags & MSG_PEEK) 14008348SEric.Yu@Sun.COM msg->msg_flags &= ~MSG_WAITALL; 14018348SEric.Yu@Sun.COM 14028348SEric.Yu@Sun.COM if (so->so_mode & SM_ATOMIC) 14038348SEric.Yu@Sun.COM msg->msg_flags |= MSG_TRUNC; 14048348SEric.Yu@Sun.COM 14058348SEric.Yu@Sun.COM if (msg->msg_flags & MSG_OOB) { 14068348SEric.Yu@Sun.COM if ((so->so_mode & SM_EXDATA) == 0) { 14078348SEric.Yu@Sun.COM error = EOPNOTSUPP; 14088348SEric.Yu@Sun.COM } else if (so->so_downcalls->sd_recv_uio != NULL) { 14098348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_recv_uio) 14108348SEric.Yu@Sun.COM (so->so_proto_handle, uiop, msg, cr); 14118348SEric.Yu@Sun.COM } else { 14128348SEric.Yu@Sun.COM error = sorecvoob(so, msg, uiop, msg->msg_flags, 14138348SEric.Yu@Sun.COM IS_SO_OOB_INLINE(so)); 14148348SEric.Yu@Sun.COM } 14158348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 14168348SEric.Yu@Sun.COM return (error); 14178348SEric.Yu@Sun.COM } 14188348SEric.Yu@Sun.COM 14198348SEric.Yu@Sun.COM /* 14208348SEric.Yu@Sun.COM * If the protocol has the recv down call, then pass the request 14218348SEric.Yu@Sun.COM * down. 14228348SEric.Yu@Sun.COM */ 14238348SEric.Yu@Sun.COM if (so->so_downcalls->sd_recv_uio != NULL) { 14248348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_recv_uio) 14258348SEric.Yu@Sun.COM (so->so_proto_handle, uiop, msg, cr); 14268348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 14278348SEric.Yu@Sun.COM return (error); 14288348SEric.Yu@Sun.COM } 14298348SEric.Yu@Sun.COM 14308348SEric.Yu@Sun.COM /* 14318348SEric.Yu@Sun.COM * Reading data from the socket buffer 14328348SEric.Yu@Sun.COM */ 14338348SEric.Yu@Sun.COM flags = msg->msg_flags; 14348348SEric.Yu@Sun.COM msg->msg_flags = 0; 14358348SEric.Yu@Sun.COM 14368348SEric.Yu@Sun.COM /* 14378348SEric.Yu@Sun.COM * Set msg_controllen and msg_namelen to zero here to make it 14388348SEric.Yu@Sun.COM * simpler in the cases that no control or name is returned. 14398348SEric.Yu@Sun.COM */ 14408348SEric.Yu@Sun.COM controllen = msg->msg_controllen; 14418348SEric.Yu@Sun.COM namelen = msg->msg_namelen; 14428348SEric.Yu@Sun.COM msg->msg_controllen = 0; 14438348SEric.Yu@Sun.COM msg->msg_namelen = 0; 14448348SEric.Yu@Sun.COM 14458348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 14468348SEric.Yu@Sun.COM /* Set SOREADLOCKED */ 14478348SEric.Yu@Sun.COM error = so_lock_read_intr(so, 14488348SEric.Yu@Sun.COM uiop->uio_fmode | ((flags & MSG_DONTWAIT) ? FNONBLOCK : 0)); 14498348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 14508348SEric.Yu@Sun.COM if (error) { 14518348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 14528348SEric.Yu@Sun.COM return (error); 14538348SEric.Yu@Sun.COM } 14548348SEric.Yu@Sun.COM 14558348SEric.Yu@Sun.COM suiop = sod_rcv_init(so, flags, &uiop); 14568348SEric.Yu@Sun.COM retry: 14578348SEric.Yu@Sun.COM saved_resid = uiop->uio_resid; 14588348SEric.Yu@Sun.COM error = so_dequeue_msg(so, &mctlp, uiop, &rval, flags); 14598348SEric.Yu@Sun.COM if (error != 0) { 14608348SEric.Yu@Sun.COM goto out; 14618348SEric.Yu@Sun.COM } 14628348SEric.Yu@Sun.COM /* 14638348SEric.Yu@Sun.COM * For datagrams the MOREDATA flag is used to set MSG_TRUNC. 14648348SEric.Yu@Sun.COM * For non-datagrams MOREDATA is used to set MSG_EOR. 14658348SEric.Yu@Sun.COM */ 14668348SEric.Yu@Sun.COM ASSERT(!(rval.r_val1 & MORECTL)); 14678348SEric.Yu@Sun.COM if ((rval.r_val1 & MOREDATA) && (so->so_mode & SM_ATOMIC)) 14688348SEric.Yu@Sun.COM msg->msg_flags |= MSG_TRUNC; 14698348SEric.Yu@Sun.COM if (mctlp == NULL) { 14708348SEric.Yu@Sun.COM dprintso(so, 1, ("so_recvmsg: got M_DATA\n")); 14718348SEric.Yu@Sun.COM 14728348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 14738348SEric.Yu@Sun.COM /* Set MSG_EOR based on MOREDATA */ 14748348SEric.Yu@Sun.COM if (!(rval.r_val1 & MOREDATA)) { 14758348SEric.Yu@Sun.COM if (so->so_state & SS_SAVEDEOR) { 14768348SEric.Yu@Sun.COM msg->msg_flags |= MSG_EOR; 14778348SEric.Yu@Sun.COM so->so_state &= ~SS_SAVEDEOR; 14788348SEric.Yu@Sun.COM } 14798348SEric.Yu@Sun.COM } 14808348SEric.Yu@Sun.COM /* 14818348SEric.Yu@Sun.COM * If some data was received (i.e. not EOF) and the 14828348SEric.Yu@Sun.COM * read/recv* has not been satisfied wait for some more. 14838348SEric.Yu@Sun.COM */ 14848348SEric.Yu@Sun.COM if ((flags & MSG_WAITALL) && !(msg->msg_flags & MSG_EOR) && 14858348SEric.Yu@Sun.COM uiop->uio_resid != saved_resid && uiop->uio_resid > 0) { 14868348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 14878348SEric.Yu@Sun.COM goto retry; 14888348SEric.Yu@Sun.COM } 14898348SEric.Yu@Sun.COM 14908348SEric.Yu@Sun.COM goto out_locked; 14918348SEric.Yu@Sun.COM } 14928348SEric.Yu@Sun.COM /* strsock_proto has already verified length and alignment */ 14938348SEric.Yu@Sun.COM tpr = (union T_primitives *)mctlp->b_rptr; 14948348SEric.Yu@Sun.COM dprintso(so, 1, ("so_recvmsg: type %d\n", tpr->type)); 14958348SEric.Yu@Sun.COM switch (tpr->type) { 14968348SEric.Yu@Sun.COM case T_DATA_IND: { 14978348SEric.Yu@Sun.COM /* 14988348SEric.Yu@Sun.COM * Set msg_flags to MSG_EOR based on 14998348SEric.Yu@Sun.COM * MORE_flag and MOREDATA. 15008348SEric.Yu@Sun.COM */ 15018348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 15028348SEric.Yu@Sun.COM so->so_state &= ~SS_SAVEDEOR; 15038348SEric.Yu@Sun.COM if (!(tpr->data_ind.MORE_flag & 1)) { 15048348SEric.Yu@Sun.COM if (!(rval.r_val1 & MOREDATA)) 15058348SEric.Yu@Sun.COM msg->msg_flags |= MSG_EOR; 15068348SEric.Yu@Sun.COM else 15078348SEric.Yu@Sun.COM so->so_state |= SS_SAVEDEOR; 15088348SEric.Yu@Sun.COM } 15098348SEric.Yu@Sun.COM freemsg(mctlp); 15108348SEric.Yu@Sun.COM /* 15118348SEric.Yu@Sun.COM * If some data was received (i.e. not EOF) and the 15128348SEric.Yu@Sun.COM * read/recv* has not been satisfied wait for some more. 15138348SEric.Yu@Sun.COM */ 15148348SEric.Yu@Sun.COM if ((flags & MSG_WAITALL) && !(msg->msg_flags & MSG_EOR) && 15158348SEric.Yu@Sun.COM uiop->uio_resid != saved_resid && uiop->uio_resid > 0) { 15168348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 15178348SEric.Yu@Sun.COM goto retry; 15188348SEric.Yu@Sun.COM } 15198348SEric.Yu@Sun.COM goto out_locked; 15208348SEric.Yu@Sun.COM } 15218348SEric.Yu@Sun.COM case T_UNITDATA_IND: { 15228348SEric.Yu@Sun.COM void *addr; 15238348SEric.Yu@Sun.COM t_uscalar_t addrlen; 15248348SEric.Yu@Sun.COM void *abuf; 15258348SEric.Yu@Sun.COM t_uscalar_t optlen; 15268348SEric.Yu@Sun.COM void *opt; 15278348SEric.Yu@Sun.COM 15288348SEric.Yu@Sun.COM if (namelen != 0) { 15298348SEric.Yu@Sun.COM /* Caller wants source address */ 15308348SEric.Yu@Sun.COM addrlen = tpr->unitdata_ind.SRC_length; 15318348SEric.Yu@Sun.COM addr = sogetoff(mctlp, tpr->unitdata_ind.SRC_offset, 15328348SEric.Yu@Sun.COM addrlen, 1); 15338348SEric.Yu@Sun.COM if (addr == NULL) { 15348348SEric.Yu@Sun.COM freemsg(mctlp); 15358348SEric.Yu@Sun.COM error = EPROTO; 15368348SEric.Yu@Sun.COM eprintsoline(so, error); 15378348SEric.Yu@Sun.COM goto out; 15388348SEric.Yu@Sun.COM } 15398348SEric.Yu@Sun.COM ASSERT(so->so_family != AF_UNIX); 15408348SEric.Yu@Sun.COM } 15418348SEric.Yu@Sun.COM optlen = tpr->unitdata_ind.OPT_length; 15428348SEric.Yu@Sun.COM if (optlen != 0) { 15438348SEric.Yu@Sun.COM t_uscalar_t ncontrollen; 15448348SEric.Yu@Sun.COM 15458348SEric.Yu@Sun.COM /* 15468348SEric.Yu@Sun.COM * Extract any source address option. 15478348SEric.Yu@Sun.COM * Determine how large cmsg buffer is needed. 15488348SEric.Yu@Sun.COM */ 15498348SEric.Yu@Sun.COM opt = sogetoff(mctlp, tpr->unitdata_ind.OPT_offset, 15508348SEric.Yu@Sun.COM optlen, __TPI_ALIGN_SIZE); 15518348SEric.Yu@Sun.COM 15528348SEric.Yu@Sun.COM if (opt == NULL) { 15538348SEric.Yu@Sun.COM freemsg(mctlp); 15548348SEric.Yu@Sun.COM error = EPROTO; 15558348SEric.Yu@Sun.COM eprintsoline(so, error); 15568348SEric.Yu@Sun.COM goto out; 15578348SEric.Yu@Sun.COM } 15588348SEric.Yu@Sun.COM if (so->so_family == AF_UNIX) 15598348SEric.Yu@Sun.COM so_getopt_srcaddr(opt, optlen, &addr, &addrlen); 15608348SEric.Yu@Sun.COM ncontrollen = so_cmsglen(mctlp, opt, optlen, 15618348SEric.Yu@Sun.COM !(flags & MSG_XPG4_2)); 15628348SEric.Yu@Sun.COM if (controllen != 0) 15638348SEric.Yu@Sun.COM controllen = ncontrollen; 15648348SEric.Yu@Sun.COM else if (ncontrollen != 0) 15658348SEric.Yu@Sun.COM msg->msg_flags |= MSG_CTRUNC; 15668348SEric.Yu@Sun.COM } else { 15678348SEric.Yu@Sun.COM controllen = 0; 15688348SEric.Yu@Sun.COM } 15698348SEric.Yu@Sun.COM 15708348SEric.Yu@Sun.COM if (namelen != 0) { 15718348SEric.Yu@Sun.COM /* 15728348SEric.Yu@Sun.COM * Return address to caller. 15738348SEric.Yu@Sun.COM * Caller handles truncation if length 15748348SEric.Yu@Sun.COM * exceeds msg_namelen. 15758348SEric.Yu@Sun.COM * NOTE: AF_UNIX NUL termination is ensured by 15768348SEric.Yu@Sun.COM * the sender's copyin_name(). 15778348SEric.Yu@Sun.COM */ 15788348SEric.Yu@Sun.COM abuf = kmem_alloc(addrlen, KM_SLEEP); 15798348SEric.Yu@Sun.COM 15808348SEric.Yu@Sun.COM bcopy(addr, abuf, addrlen); 15818348SEric.Yu@Sun.COM msg->msg_name = abuf; 15828348SEric.Yu@Sun.COM msg->msg_namelen = addrlen; 15838348SEric.Yu@Sun.COM } 15848348SEric.Yu@Sun.COM 15858348SEric.Yu@Sun.COM if (controllen != 0) { 15868348SEric.Yu@Sun.COM /* 15878348SEric.Yu@Sun.COM * Return control msg to caller. 15888348SEric.Yu@Sun.COM * Caller handles truncation if length 15898348SEric.Yu@Sun.COM * exceeds msg_controllen. 15908348SEric.Yu@Sun.COM */ 15918348SEric.Yu@Sun.COM control = kmem_zalloc(controllen, KM_SLEEP); 15928348SEric.Yu@Sun.COM 15938348SEric.Yu@Sun.COM error = so_opt2cmsg(mctlp, opt, optlen, 15948348SEric.Yu@Sun.COM !(flags & MSG_XPG4_2), control, controllen); 15958348SEric.Yu@Sun.COM if (error) { 15968348SEric.Yu@Sun.COM freemsg(mctlp); 15978348SEric.Yu@Sun.COM if (msg->msg_namelen != 0) 15988348SEric.Yu@Sun.COM kmem_free(msg->msg_name, 15998348SEric.Yu@Sun.COM msg->msg_namelen); 16008348SEric.Yu@Sun.COM kmem_free(control, controllen); 16018348SEric.Yu@Sun.COM eprintsoline(so, error); 16028348SEric.Yu@Sun.COM goto out; 16038348SEric.Yu@Sun.COM } 16048348SEric.Yu@Sun.COM msg->msg_control = control; 16058348SEric.Yu@Sun.COM msg->msg_controllen = controllen; 16068348SEric.Yu@Sun.COM } 16078348SEric.Yu@Sun.COM 16088348SEric.Yu@Sun.COM freemsg(mctlp); 16098348SEric.Yu@Sun.COM goto out; 16108348SEric.Yu@Sun.COM } 16118348SEric.Yu@Sun.COM case T_OPTDATA_IND: { 16128348SEric.Yu@Sun.COM struct T_optdata_req *tdr; 16138348SEric.Yu@Sun.COM void *opt; 16148348SEric.Yu@Sun.COM t_uscalar_t optlen; 16158348SEric.Yu@Sun.COM 16168348SEric.Yu@Sun.COM tdr = (struct T_optdata_req *)mctlp->b_rptr; 16178348SEric.Yu@Sun.COM optlen = tdr->OPT_length; 16188348SEric.Yu@Sun.COM if (optlen != 0) { 16198348SEric.Yu@Sun.COM t_uscalar_t ncontrollen; 16208348SEric.Yu@Sun.COM /* 16218348SEric.Yu@Sun.COM * Determine how large cmsg buffer is needed. 16228348SEric.Yu@Sun.COM */ 16238348SEric.Yu@Sun.COM opt = sogetoff(mctlp, 16248348SEric.Yu@Sun.COM tpr->optdata_ind.OPT_offset, optlen, 16258348SEric.Yu@Sun.COM __TPI_ALIGN_SIZE); 16268348SEric.Yu@Sun.COM 16278348SEric.Yu@Sun.COM if (opt == NULL) { 16288348SEric.Yu@Sun.COM freemsg(mctlp); 16298348SEric.Yu@Sun.COM error = EPROTO; 16308348SEric.Yu@Sun.COM eprintsoline(so, error); 16318348SEric.Yu@Sun.COM goto out; 16328348SEric.Yu@Sun.COM } 16338348SEric.Yu@Sun.COM 16348348SEric.Yu@Sun.COM ncontrollen = so_cmsglen(mctlp, opt, optlen, 16358348SEric.Yu@Sun.COM !(flags & MSG_XPG4_2)); 16368348SEric.Yu@Sun.COM if (controllen != 0) 16378348SEric.Yu@Sun.COM controllen = ncontrollen; 16388348SEric.Yu@Sun.COM else if (ncontrollen != 0) 16398348SEric.Yu@Sun.COM msg->msg_flags |= MSG_CTRUNC; 16408348SEric.Yu@Sun.COM } else { 16418348SEric.Yu@Sun.COM controllen = 0; 16428348SEric.Yu@Sun.COM } 16438348SEric.Yu@Sun.COM 16448348SEric.Yu@Sun.COM if (controllen != 0) { 16458348SEric.Yu@Sun.COM /* 16468348SEric.Yu@Sun.COM * Return control msg to caller. 16478348SEric.Yu@Sun.COM * Caller handles truncation if length 16488348SEric.Yu@Sun.COM * exceeds msg_controllen. 16498348SEric.Yu@Sun.COM */ 16508348SEric.Yu@Sun.COM control = kmem_zalloc(controllen, KM_SLEEP); 16518348SEric.Yu@Sun.COM 16528348SEric.Yu@Sun.COM error = so_opt2cmsg(mctlp, opt, optlen, 16538348SEric.Yu@Sun.COM !(flags & MSG_XPG4_2), control, controllen); 16548348SEric.Yu@Sun.COM if (error) { 16558348SEric.Yu@Sun.COM freemsg(mctlp); 16568348SEric.Yu@Sun.COM kmem_free(control, controllen); 16578348SEric.Yu@Sun.COM eprintsoline(so, error); 16588348SEric.Yu@Sun.COM goto out; 16598348SEric.Yu@Sun.COM } 16608348SEric.Yu@Sun.COM msg->msg_control = control; 16618348SEric.Yu@Sun.COM msg->msg_controllen = controllen; 16628348SEric.Yu@Sun.COM } 16638348SEric.Yu@Sun.COM 16648348SEric.Yu@Sun.COM /* 16658348SEric.Yu@Sun.COM * Set msg_flags to MSG_EOR based on 16668348SEric.Yu@Sun.COM * DATA_flag and MOREDATA. 16678348SEric.Yu@Sun.COM */ 16688348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 16698348SEric.Yu@Sun.COM so->so_state &= ~SS_SAVEDEOR; 16708348SEric.Yu@Sun.COM if (!(tpr->data_ind.MORE_flag & 1)) { 16718348SEric.Yu@Sun.COM if (!(rval.r_val1 & MOREDATA)) 16728348SEric.Yu@Sun.COM msg->msg_flags |= MSG_EOR; 16738348SEric.Yu@Sun.COM else 16748348SEric.Yu@Sun.COM so->so_state |= SS_SAVEDEOR; 16758348SEric.Yu@Sun.COM } 16768348SEric.Yu@Sun.COM freemsg(mctlp); 16778348SEric.Yu@Sun.COM /* 16788348SEric.Yu@Sun.COM * If some data was received (i.e. not EOF) and the 16798348SEric.Yu@Sun.COM * read/recv* has not been satisfied wait for some more. 16808348SEric.Yu@Sun.COM * Not possible to wait if control info was received. 16818348SEric.Yu@Sun.COM */ 16828348SEric.Yu@Sun.COM if ((flags & MSG_WAITALL) && !(msg->msg_flags & MSG_EOR) && 16838348SEric.Yu@Sun.COM controllen == 0 && 16848348SEric.Yu@Sun.COM uiop->uio_resid != saved_resid && uiop->uio_resid > 0) { 16858348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 16868348SEric.Yu@Sun.COM goto retry; 16878348SEric.Yu@Sun.COM } 16888348SEric.Yu@Sun.COM goto out_locked; 16898348SEric.Yu@Sun.COM } 16908348SEric.Yu@Sun.COM default: 16918348SEric.Yu@Sun.COM cmn_err(CE_CONT, "so_recvmsg bad type %x \n", 16928348SEric.Yu@Sun.COM tpr->type); 16938348SEric.Yu@Sun.COM freemsg(mctlp); 16948348SEric.Yu@Sun.COM error = EPROTO; 16958348SEric.Yu@Sun.COM ASSERT(0); 16968348SEric.Yu@Sun.COM } 16978348SEric.Yu@Sun.COM out: 16988348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 16998348SEric.Yu@Sun.COM out_locked: 17008348SEric.Yu@Sun.COM /* The sod_lockp pointers to the sonode so_lock */ 17018348SEric.Yu@Sun.COM ret = sod_rcv_done(so, suiop, uiop); 17028348SEric.Yu@Sun.COM if (ret != 0 && error == 0) 17038348SEric.Yu@Sun.COM error = ret; 17048348SEric.Yu@Sun.COM 17058348SEric.Yu@Sun.COM so_unlock_read(so); /* Clear SOREADLOCKED */ 17068348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 17078348SEric.Yu@Sun.COM 17088348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 17098348SEric.Yu@Sun.COM 17108348SEric.Yu@Sun.COM return (error); 17118348SEric.Yu@Sun.COM } 17128348SEric.Yu@Sun.COM 17138348SEric.Yu@Sun.COM sonodeops_t so_sonodeops = { 17148348SEric.Yu@Sun.COM so_init, /* sop_init */ 17158348SEric.Yu@Sun.COM so_accept, /* sop_accept */ 17168348SEric.Yu@Sun.COM so_bind, /* sop_bind */ 17178348SEric.Yu@Sun.COM so_listen, /* sop_listen */ 17188348SEric.Yu@Sun.COM so_connect, /* sop_connect */ 17198348SEric.Yu@Sun.COM so_recvmsg, /* sop_recvmsg */ 17208348SEric.Yu@Sun.COM so_sendmsg, /* sop_sendmsg */ 17218348SEric.Yu@Sun.COM so_sendmblk, /* sop_sendmblk */ 17228348SEric.Yu@Sun.COM so_getpeername, /* sop_getpeername */ 17238348SEric.Yu@Sun.COM so_getsockname, /* sop_getsockname */ 17248348SEric.Yu@Sun.COM so_shutdown, /* sop_shutdown */ 17258348SEric.Yu@Sun.COM so_getsockopt, /* sop_getsockopt */ 17268348SEric.Yu@Sun.COM so_setsockopt, /* sop_setsockopt */ 17278348SEric.Yu@Sun.COM so_ioctl, /* sop_ioctl */ 17288348SEric.Yu@Sun.COM so_poll, /* sop_poll */ 17298348SEric.Yu@Sun.COM so_close, /* sop_close */ 17308348SEric.Yu@Sun.COM }; 17318348SEric.Yu@Sun.COM 17328348SEric.Yu@Sun.COM sock_upcalls_t so_upcalls = { 17338348SEric.Yu@Sun.COM so_newconn, 17348348SEric.Yu@Sun.COM so_connected, 17358348SEric.Yu@Sun.COM so_disconnected, 17368348SEric.Yu@Sun.COM so_opctl, 17378348SEric.Yu@Sun.COM so_queue_msg, 17388348SEric.Yu@Sun.COM so_set_prop, 17398348SEric.Yu@Sun.COM so_txq_full, 17408348SEric.Yu@Sun.COM so_signal_oob, 17418348SEric.Yu@Sun.COM so_zcopy_notify, 17428348SEric.Yu@Sun.COM so_set_error 17438348SEric.Yu@Sun.COM }; 1744