18348SEric.Yu@Sun.COM /* 28348SEric.Yu@Sun.COM * CDDL HEADER START 38348SEric.Yu@Sun.COM * 48348SEric.Yu@Sun.COM * The contents of this file are subject to the terms of the 58348SEric.Yu@Sun.COM * Common Development and Distribution License (the "License"). 68348SEric.Yu@Sun.COM * You may not use this file except in compliance with the License. 78348SEric.Yu@Sun.COM * 88348SEric.Yu@Sun.COM * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 98348SEric.Yu@Sun.COM * or http://www.opensolaris.org/os/licensing. 108348SEric.Yu@Sun.COM * See the License for the specific language governing permissions 118348SEric.Yu@Sun.COM * and limitations under the License. 128348SEric.Yu@Sun.COM * 138348SEric.Yu@Sun.COM * When distributing Covered Code, include this CDDL HEADER in each 148348SEric.Yu@Sun.COM * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 158348SEric.Yu@Sun.COM * If applicable, add the following below this CDDL HEADER, with the 168348SEric.Yu@Sun.COM * fields enclosed by brackets "[]" replaced with your own identifying 178348SEric.Yu@Sun.COM * information: Portions Copyright [yyyy] [name of copyright owner] 188348SEric.Yu@Sun.COM * 198348SEric.Yu@Sun.COM * CDDL HEADER END 208348SEric.Yu@Sun.COM */ 218348SEric.Yu@Sun.COM 228348SEric.Yu@Sun.COM /* 238348SEric.Yu@Sun.COM * Copyright 2008 Sun Microsystems, Inc. All rights reserved. 248348SEric.Yu@Sun.COM * Use is subject to license terms. 
258348SEric.Yu@Sun.COM */ 268348SEric.Yu@Sun.COM 278348SEric.Yu@Sun.COM #pragma ident "@(#)sockcommon_sops.c 1.1 07/06/14 SMI" 288348SEric.Yu@Sun.COM 298348SEric.Yu@Sun.COM #include <sys/types.h> 308348SEric.Yu@Sun.COM #include <sys/param.h> 318348SEric.Yu@Sun.COM #include <sys/systm.h> 328348SEric.Yu@Sun.COM #include <sys/sysmacros.h> 338348SEric.Yu@Sun.COM #include <sys/debug.h> 348348SEric.Yu@Sun.COM #include <sys/cmn_err.h> 358348SEric.Yu@Sun.COM 368348SEric.Yu@Sun.COM #include <sys/stropts.h> 378348SEric.Yu@Sun.COM #include <sys/socket.h> 388348SEric.Yu@Sun.COM #include <sys/socketvar.h> 398348SEric.Yu@Sun.COM 408348SEric.Yu@Sun.COM #define _SUN_TPI_VERSION 2 418348SEric.Yu@Sun.COM #include <sys/tihdr.h> 428348SEric.Yu@Sun.COM #include <sys/sockio.h> 438348SEric.Yu@Sun.COM #include <sys/sodirect.h> 448348SEric.Yu@Sun.COM #include <sys/kmem_impl.h> 458348SEric.Yu@Sun.COM 468348SEric.Yu@Sun.COM #include <sys/strsubr.h> 478348SEric.Yu@Sun.COM #include <sys/strsun.h> 488348SEric.Yu@Sun.COM #include <sys/ddi.h> 498348SEric.Yu@Sun.COM #include <netinet/in.h> 508348SEric.Yu@Sun.COM #include <inet/ip.h> 518348SEric.Yu@Sun.COM 528348SEric.Yu@Sun.COM #include <fs/sockfs/sockcommon.h> 538348SEric.Yu@Sun.COM 548348SEric.Yu@Sun.COM #include <sys/socket_proto.h> 558348SEric.Yu@Sun.COM 568348SEric.Yu@Sun.COM #include <fs/sockfs/socktpi_impl.h> 578348SEric.Yu@Sun.COM #include <sys/tihdr.h> 588348SEric.Yu@Sun.COM #include <fs/sockfs/nl7c.h> 598348SEric.Yu@Sun.COM #include <inet/kssl/ksslapi.h> 608348SEric.Yu@Sun.COM 618348SEric.Yu@Sun.COM 628348SEric.Yu@Sun.COM extern int xnet_skip_checks; 638348SEric.Yu@Sun.COM extern int xnet_check_print; 648348SEric.Yu@Sun.COM 658348SEric.Yu@Sun.COM static void so_queue_oob(sock_upper_handle_t, mblk_t *, size_t); 668348SEric.Yu@Sun.COM 678348SEric.Yu@Sun.COM 688348SEric.Yu@Sun.COM /*ARGSUSED*/ 698348SEric.Yu@Sun.COM int 708348SEric.Yu@Sun.COM so_accept_notsupp(struct sonode *lso, int fflag, 718348SEric.Yu@Sun.COM struct cred *cr, struct 
sonode **nsop) 728348SEric.Yu@Sun.COM { 738348SEric.Yu@Sun.COM return (EOPNOTSUPP); 748348SEric.Yu@Sun.COM } 758348SEric.Yu@Sun.COM 768348SEric.Yu@Sun.COM /*ARGSUSED*/ 778348SEric.Yu@Sun.COM int 788348SEric.Yu@Sun.COM so_listen_notsupp(struct sonode *so, int backlog, struct cred *cr) 798348SEric.Yu@Sun.COM { 808348SEric.Yu@Sun.COM return (EOPNOTSUPP); 818348SEric.Yu@Sun.COM } 828348SEric.Yu@Sun.COM 838348SEric.Yu@Sun.COM /*ARGSUSED*/ 848348SEric.Yu@Sun.COM int 858348SEric.Yu@Sun.COM so_getsockname_notsupp(struct sonode *so, struct sockaddr *sa, 868348SEric.Yu@Sun.COM socklen_t *len, struct cred *cr) 878348SEric.Yu@Sun.COM { 888348SEric.Yu@Sun.COM return (EOPNOTSUPP); 898348SEric.Yu@Sun.COM } 908348SEric.Yu@Sun.COM 918348SEric.Yu@Sun.COM /*ARGSUSED*/ 928348SEric.Yu@Sun.COM int 938348SEric.Yu@Sun.COM so_getpeername_notsupp(struct sonode *so, struct sockaddr *addr, 948348SEric.Yu@Sun.COM socklen_t *addrlen, boolean_t accept, struct cred *cr) 958348SEric.Yu@Sun.COM { 968348SEric.Yu@Sun.COM return (EOPNOTSUPP); 978348SEric.Yu@Sun.COM } 988348SEric.Yu@Sun.COM 998348SEric.Yu@Sun.COM /*ARGSUSED*/ 1008348SEric.Yu@Sun.COM int 1018348SEric.Yu@Sun.COM so_shutdown_notsupp(struct sonode *so, int how, struct cred *cr) 1028348SEric.Yu@Sun.COM { 1038348SEric.Yu@Sun.COM return (EOPNOTSUPP); 1048348SEric.Yu@Sun.COM } 1058348SEric.Yu@Sun.COM 1068348SEric.Yu@Sun.COM /*ARGSUSED*/ 1078348SEric.Yu@Sun.COM int 1088348SEric.Yu@Sun.COM so_sendmblk_notsupp(struct sonode *so, struct msghdr *msg, int fflag, 1098348SEric.Yu@Sun.COM struct cred *cr, mblk_t **mpp) 1108348SEric.Yu@Sun.COM { 1118348SEric.Yu@Sun.COM return (EOPNOTSUPP); 1128348SEric.Yu@Sun.COM } 1138348SEric.Yu@Sun.COM 1148348SEric.Yu@Sun.COM /* 1158348SEric.Yu@Sun.COM * Generic Socket Ops 1168348SEric.Yu@Sun.COM */ 1178348SEric.Yu@Sun.COM 1188348SEric.Yu@Sun.COM /* ARGSUSED */ 1198348SEric.Yu@Sun.COM int 1208348SEric.Yu@Sun.COM so_init(struct sonode *so, struct sonode *pso, struct cred *cr, int flags) 1218348SEric.Yu@Sun.COM { 
1228348SEric.Yu@Sun.COM return (socket_init_common(so, pso, flags, cr)); 1238348SEric.Yu@Sun.COM } 1248348SEric.Yu@Sun.COM 1258348SEric.Yu@Sun.COM int 1268348SEric.Yu@Sun.COM so_bind(struct sonode *so, struct sockaddr *name, socklen_t namelen, 1278348SEric.Yu@Sun.COM int flags, struct cred *cr) 1288348SEric.Yu@Sun.COM { 1298348SEric.Yu@Sun.COM int error; 1308348SEric.Yu@Sun.COM 1318348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_BIND(so, name, namelen, flags, cr)); 1328348SEric.Yu@Sun.COM 1338348SEric.Yu@Sun.COM ASSERT(flags == _SOBIND_XPG4_2 || flags == _SOBIND_SOCKBSD); 1348348SEric.Yu@Sun.COM 1358348SEric.Yu@Sun.COM /* X/Open requires this check */ 1368348SEric.Yu@Sun.COM if ((so->so_state & SS_CANTSENDMORE) && !xnet_skip_checks) { 1378348SEric.Yu@Sun.COM if (xnet_check_print) { 1388348SEric.Yu@Sun.COM printf("sockfs: X/Open bind state check " 1398348SEric.Yu@Sun.COM "caused EINVAL\n"); 1408348SEric.Yu@Sun.COM } 1418348SEric.Yu@Sun.COM error = EINVAL; 1428348SEric.Yu@Sun.COM goto done; 1438348SEric.Yu@Sun.COM } 1448348SEric.Yu@Sun.COM 1458348SEric.Yu@Sun.COM /* 1468348SEric.Yu@Sun.COM * a bind to a NULL address is interpreted as unbind. So just 1478348SEric.Yu@Sun.COM * do the downcall. 1488348SEric.Yu@Sun.COM */ 1498348SEric.Yu@Sun.COM if (name == NULL) 1508348SEric.Yu@Sun.COM goto dobind; 1518348SEric.Yu@Sun.COM 1528348SEric.Yu@Sun.COM switch (so->so_family) { 1538348SEric.Yu@Sun.COM case AF_INET: 1548348SEric.Yu@Sun.COM if ((size_t)namelen != sizeof (sin_t)) { 1558348SEric.Yu@Sun.COM error = name->sa_family != so->so_family ? 
1568348SEric.Yu@Sun.COM EAFNOSUPPORT : EINVAL; 1578348SEric.Yu@Sun.COM eprintsoline(so, error); 1588348SEric.Yu@Sun.COM goto done; 1598348SEric.Yu@Sun.COM } 1608348SEric.Yu@Sun.COM 1618348SEric.Yu@Sun.COM if ((flags & _SOBIND_XPG4_2) && 1628348SEric.Yu@Sun.COM (name->sa_family != so->so_family)) { 1638348SEric.Yu@Sun.COM /* 1648348SEric.Yu@Sun.COM * This check has to be made for X/Open 1658348SEric.Yu@Sun.COM * sockets however application failures have 1668348SEric.Yu@Sun.COM * been observed when it is applied to 1678348SEric.Yu@Sun.COM * all sockets. 1688348SEric.Yu@Sun.COM */ 1698348SEric.Yu@Sun.COM error = EAFNOSUPPORT; 1708348SEric.Yu@Sun.COM eprintsoline(so, error); 1718348SEric.Yu@Sun.COM goto done; 1728348SEric.Yu@Sun.COM } 1738348SEric.Yu@Sun.COM /* 1748348SEric.Yu@Sun.COM * Force a zero sa_family to match so_family. 1758348SEric.Yu@Sun.COM * 1768348SEric.Yu@Sun.COM * Some programs like inetd(1M) don't set the 1778348SEric.Yu@Sun.COM * family field. Other programs leave 1788348SEric.Yu@Sun.COM * sin_family set to garbage - SunOS 4.X does 1798348SEric.Yu@Sun.COM * not check the family field on a bind. 1808348SEric.Yu@Sun.COM * We use the family field that 1818348SEric.Yu@Sun.COM * was passed in to the socket() call. 1828348SEric.Yu@Sun.COM */ 1838348SEric.Yu@Sun.COM name->sa_family = so->so_family; 1848348SEric.Yu@Sun.COM break; 1858348SEric.Yu@Sun.COM 1868348SEric.Yu@Sun.COM case AF_INET6: { 1878348SEric.Yu@Sun.COM #ifdef DEBUG 1888348SEric.Yu@Sun.COM sin6_t *sin6 = (sin6_t *)name; 1898348SEric.Yu@Sun.COM #endif 1908348SEric.Yu@Sun.COM if ((size_t)namelen != sizeof (sin6_t)) { 1918348SEric.Yu@Sun.COM error = name->sa_family != so->so_family ? 
1928348SEric.Yu@Sun.COM EAFNOSUPPORT : EINVAL; 1938348SEric.Yu@Sun.COM eprintsoline(so, error); 1948348SEric.Yu@Sun.COM goto done; 1958348SEric.Yu@Sun.COM } 1968348SEric.Yu@Sun.COM 1978348SEric.Yu@Sun.COM if (name->sa_family != so->so_family) { 1988348SEric.Yu@Sun.COM /* 1998348SEric.Yu@Sun.COM * With IPv6 we require the family to match 2008348SEric.Yu@Sun.COM * unlike in IPv4. 2018348SEric.Yu@Sun.COM */ 2028348SEric.Yu@Sun.COM error = EAFNOSUPPORT; 2038348SEric.Yu@Sun.COM eprintsoline(so, error); 2048348SEric.Yu@Sun.COM goto done; 2058348SEric.Yu@Sun.COM } 2068348SEric.Yu@Sun.COM #ifdef DEBUG 2078348SEric.Yu@Sun.COM /* 2088348SEric.Yu@Sun.COM * Verify that apps don't forget to clear 2098348SEric.Yu@Sun.COM * sin6_scope_id etc 2108348SEric.Yu@Sun.COM */ 2118348SEric.Yu@Sun.COM if (sin6->sin6_scope_id != 0 && 2128348SEric.Yu@Sun.COM !IN6_IS_ADDR_LINKSCOPE(&sin6->sin6_addr)) { 2138348SEric.Yu@Sun.COM zcmn_err(getzoneid(), CE_WARN, 2148348SEric.Yu@Sun.COM "bind with uninitialized sin6_scope_id " 2158348SEric.Yu@Sun.COM "(%d) on socket. Pid = %d\n", 2168348SEric.Yu@Sun.COM (int)sin6->sin6_scope_id, 2178348SEric.Yu@Sun.COM (int)curproc->p_pid); 2188348SEric.Yu@Sun.COM } 2198348SEric.Yu@Sun.COM if (sin6->__sin6_src_id != 0) { 2208348SEric.Yu@Sun.COM zcmn_err(getzoneid(), CE_WARN, 2218348SEric.Yu@Sun.COM "bind with uninitialized __sin6_src_id " 2228348SEric.Yu@Sun.COM "(%d) on socket. 
Pid = %d\n", 2238348SEric.Yu@Sun.COM (int)sin6->__sin6_src_id, 2248348SEric.Yu@Sun.COM (int)curproc->p_pid); 2258348SEric.Yu@Sun.COM } 2268348SEric.Yu@Sun.COM #endif /* DEBUG */ 2278348SEric.Yu@Sun.COM 2288348SEric.Yu@Sun.COM break; 2298348SEric.Yu@Sun.COM } 2308348SEric.Yu@Sun.COM default: 2318348SEric.Yu@Sun.COM /* Just pass the request to the protocol */ 2328348SEric.Yu@Sun.COM goto dobind; 2338348SEric.Yu@Sun.COM } 2348348SEric.Yu@Sun.COM 2358348SEric.Yu@Sun.COM /* 2368348SEric.Yu@Sun.COM * First we check if either NCA or KSSL has been enabled for 2378348SEric.Yu@Sun.COM * the requested address, and if so, we fall back to TPI. 2388348SEric.Yu@Sun.COM * If neither of those two services are enabled, then we just 2398348SEric.Yu@Sun.COM * pass the request to the protocol. 2408348SEric.Yu@Sun.COM * 2418348SEric.Yu@Sun.COM * Note that KSSL can only be enabled on a socket if NCA is NOT 2428348SEric.Yu@Sun.COM * enabled for that socket, hence the else-statement below. 2438348SEric.Yu@Sun.COM */ 2448348SEric.Yu@Sun.COM if (nl7c_enabled && ((so->so_family == AF_INET || 2458348SEric.Yu@Sun.COM so->so_family == AF_INET6) && 2468348SEric.Yu@Sun.COM nl7c_lookup_addr(name, namelen) != NULL)) { 2478348SEric.Yu@Sun.COM /* 2488348SEric.Yu@Sun.COM * NL7C is not supported in non-global zones, 2498348SEric.Yu@Sun.COM * we enforce this restriction here. 
2508348SEric.Yu@Sun.COM */ 2518348SEric.Yu@Sun.COM if (so->so_zoneid == GLOBAL_ZONEID) { 2528348SEric.Yu@Sun.COM /* NCA should be used, so fall back to TPI */ 2538348SEric.Yu@Sun.COM error = so_tpi_fallback(so, cr); 2548348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 2558348SEric.Yu@Sun.COM if (error) 2568348SEric.Yu@Sun.COM return (error); 2578348SEric.Yu@Sun.COM else 2588348SEric.Yu@Sun.COM return (SOP_BIND(so, name, namelen, flags, cr)); 2598348SEric.Yu@Sun.COM } 2608348SEric.Yu@Sun.COM } else if (so->so_type == SOCK_STREAM) { 2618348SEric.Yu@Sun.COM /* Check if KSSL has been configured for this address */ 2628348SEric.Yu@Sun.COM kssl_ent_t ent; 2638348SEric.Yu@Sun.COM kssl_endpt_type_t type; 2648348SEric.Yu@Sun.COM struct T_bind_req bind_req; 2658348SEric.Yu@Sun.COM mblk_t *mp; 2668348SEric.Yu@Sun.COM 2678348SEric.Yu@Sun.COM /* 2688348SEric.Yu@Sun.COM * TODO: Check with KSSL team if we could add a function call 2698348SEric.Yu@Sun.COM * that only queries whether KSSL is enabled for the given 2708348SEric.Yu@Sun.COM * address. 2718348SEric.Yu@Sun.COM */ 2728348SEric.Yu@Sun.COM bind_req.PRIM_type = T_BIND_REQ; 2738348SEric.Yu@Sun.COM bind_req.ADDR_length = namelen; 2748348SEric.Yu@Sun.COM bind_req.ADDR_offset = (t_scalar_t)sizeof (bind_req); 2758348SEric.Yu@Sun.COM mp = soallocproto2(&bind_req, sizeof (bind_req), 2768348SEric.Yu@Sun.COM name, namelen, 0, _ALLOC_SLEEP); 2778348SEric.Yu@Sun.COM 2788348SEric.Yu@Sun.COM type = kssl_check_proxy(mp, so, &ent); 2798348SEric.Yu@Sun.COM freemsg(mp); 2808348SEric.Yu@Sun.COM 2818348SEric.Yu@Sun.COM if (type != KSSL_NO_PROXY) { 2828348SEric.Yu@Sun.COM /* 2838348SEric.Yu@Sun.COM * KSSL has been configured for this address, so 2848348SEric.Yu@Sun.COM * we must fall back to TPI. 
2858348SEric.Yu@Sun.COM */ 2868348SEric.Yu@Sun.COM kssl_release_ent(ent, so, type); 2878348SEric.Yu@Sun.COM error = so_tpi_fallback(so, cr); 2888348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 2898348SEric.Yu@Sun.COM if (error) 2908348SEric.Yu@Sun.COM return (error); 2918348SEric.Yu@Sun.COM else 2928348SEric.Yu@Sun.COM return (SOP_BIND(so, name, namelen, flags, cr)); 2938348SEric.Yu@Sun.COM } 2948348SEric.Yu@Sun.COM } 2958348SEric.Yu@Sun.COM 2968348SEric.Yu@Sun.COM dobind: 2978348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_bind) 2988348SEric.Yu@Sun.COM (so->so_proto_handle, name, namelen, cr); 2998348SEric.Yu@Sun.COM done: 3008348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 3018348SEric.Yu@Sun.COM 3028348SEric.Yu@Sun.COM return (error); 3038348SEric.Yu@Sun.COM } 3048348SEric.Yu@Sun.COM 3058348SEric.Yu@Sun.COM int 3068348SEric.Yu@Sun.COM so_listen(struct sonode *so, int backlog, struct cred *cr) 3078348SEric.Yu@Sun.COM { 3088348SEric.Yu@Sun.COM int error = 0; 3098348SEric.Yu@Sun.COM 3108348SEric.Yu@Sun.COM ASSERT(MUTEX_NOT_HELD(&so->so_lock)); 3118348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_LISTEN(so, backlog, cr)); 3128348SEric.Yu@Sun.COM 3138348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_listen)(so->so_proto_handle, backlog, 3148348SEric.Yu@Sun.COM cr); 3158348SEric.Yu@Sun.COM 3168348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 3178348SEric.Yu@Sun.COM 3188348SEric.Yu@Sun.COM return (error); 3198348SEric.Yu@Sun.COM } 3208348SEric.Yu@Sun.COM 3218348SEric.Yu@Sun.COM 3228348SEric.Yu@Sun.COM int 3238348SEric.Yu@Sun.COM so_connect(struct sonode *so, const struct sockaddr *name, 3248348SEric.Yu@Sun.COM socklen_t namelen, int fflag, int flags, struct cred *cr) 3258348SEric.Yu@Sun.COM { 3268348SEric.Yu@Sun.COM int error = 0; 3278348SEric.Yu@Sun.COM sock_connid_t id; 3288348SEric.Yu@Sun.COM 3298348SEric.Yu@Sun.COM ASSERT(MUTEX_NOT_HELD(&so->so_lock)); 3308348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_CONNECT(so, name, namelen, fflag, flags, cr)); 3318348SEric.Yu@Sun.COM 
3328348SEric.Yu@Sun.COM /* 3338348SEric.Yu@Sun.COM * If there is a pending error, return error 3348348SEric.Yu@Sun.COM * This can happen if a non blocking operation caused an error. 3358348SEric.Yu@Sun.COM */ 3368348SEric.Yu@Sun.COM 3378348SEric.Yu@Sun.COM if (so->so_error != 0) { 3388348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 3398348SEric.Yu@Sun.COM error = sogeterr(so, B_TRUE); 3408348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 3418348SEric.Yu@Sun.COM if (error != 0) 3428348SEric.Yu@Sun.COM goto done; 3438348SEric.Yu@Sun.COM } 3448348SEric.Yu@Sun.COM 3458348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_connect)(so->so_proto_handle, 3468348SEric.Yu@Sun.COM name, namelen, &id, cr); 3478348SEric.Yu@Sun.COM 3488348SEric.Yu@Sun.COM if (error == EINPROGRESS) 3498348SEric.Yu@Sun.COM error = so_wait_connected(so, fflag & (FNONBLOCK|FNDELAY), id); 3508348SEric.Yu@Sun.COM 3518348SEric.Yu@Sun.COM done: 3528348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 3538348SEric.Yu@Sun.COM return (error); 3548348SEric.Yu@Sun.COM } 3558348SEric.Yu@Sun.COM 3568348SEric.Yu@Sun.COM /*ARGSUSED*/ 3578348SEric.Yu@Sun.COM int 3588348SEric.Yu@Sun.COM so_accept(struct sonode *so, int fflag, struct cred *cr, struct sonode **nsop) 3598348SEric.Yu@Sun.COM { 3608348SEric.Yu@Sun.COM int error = 0; 3618348SEric.Yu@Sun.COM struct sonode *nso; 3628348SEric.Yu@Sun.COM 3638348SEric.Yu@Sun.COM *nsop = NULL; 3648348SEric.Yu@Sun.COM 3658348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_ACCEPT(so, fflag, cr, nsop)); 3668348SEric.Yu@Sun.COM if ((so->so_state & SS_ACCEPTCONN) == 0) { 3678348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 3688348SEric.Yu@Sun.COM return ((so->so_type == SOCK_DGRAM || so->so_type == SOCK_RAW) ? 
3698348SEric.Yu@Sun.COM EOPNOTSUPP : EINVAL); 3708348SEric.Yu@Sun.COM } 3718348SEric.Yu@Sun.COM 3728348SEric.Yu@Sun.COM if ((error = so_acceptq_dequeue(so, (fflag & (FNONBLOCK|FNDELAY)), 3738348SEric.Yu@Sun.COM &nso)) == 0) { 3748348SEric.Yu@Sun.COM ASSERT(nso != NULL); 3758348SEric.Yu@Sun.COM 3768348SEric.Yu@Sun.COM /* finish the accept */ 3778348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_accept)(so->so_proto_handle, 3788348SEric.Yu@Sun.COM nso->so_proto_handle, (sock_upper_handle_t)nso, cr); 3798348SEric.Yu@Sun.COM if (error != 0) { 3808348SEric.Yu@Sun.COM (void) socket_close(nso, 0, cr); 3818348SEric.Yu@Sun.COM socket_destroy(nso); 3828348SEric.Yu@Sun.COM } else { 3838348SEric.Yu@Sun.COM *nsop = nso; 3848348SEric.Yu@Sun.COM } 3858348SEric.Yu@Sun.COM } 3868348SEric.Yu@Sun.COM 3878348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 3888348SEric.Yu@Sun.COM return (error); 3898348SEric.Yu@Sun.COM } 3908348SEric.Yu@Sun.COM 3918348SEric.Yu@Sun.COM int 3928348SEric.Yu@Sun.COM so_sendmsg(struct sonode *so, struct nmsghdr *msg, struct uio *uiop, 3938348SEric.Yu@Sun.COM struct cred *cr) 3948348SEric.Yu@Sun.COM { 3958348SEric.Yu@Sun.COM int error, flags; 3968348SEric.Yu@Sun.COM boolean_t dontblock; 3978348SEric.Yu@Sun.COM ssize_t orig_resid; 3988348SEric.Yu@Sun.COM mblk_t *mp; 3998348SEric.Yu@Sun.COM 4008348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_SENDMSG(so, msg, uiop, cr)); 4018348SEric.Yu@Sun.COM 4028348SEric.Yu@Sun.COM flags = msg->msg_flags; 4038348SEric.Yu@Sun.COM error = 0; 4048348SEric.Yu@Sun.COM dontblock = (flags & MSG_DONTWAIT) || 4058348SEric.Yu@Sun.COM (uiop->uio_fmode & (FNONBLOCK|FNDELAY)); 4068348SEric.Yu@Sun.COM 4078348SEric.Yu@Sun.COM if (!(flags & MSG_XPG4_2) && msg->msg_controllen != 0) { 4088348SEric.Yu@Sun.COM /* 4098348SEric.Yu@Sun.COM * Old way of passing fd's is not supported 4108348SEric.Yu@Sun.COM */ 4118348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 4128348SEric.Yu@Sun.COM return (EOPNOTSUPP); 4138348SEric.Yu@Sun.COM } 4148348SEric.Yu@Sun.COM 
4158348SEric.Yu@Sun.COM if ((so->so_mode & SM_ATOMIC) && 4168348SEric.Yu@Sun.COM uiop->uio_resid > so->so_proto_props.sopp_maxpsz && 4178348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxpsz != -1) { 4188348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 4198348SEric.Yu@Sun.COM return (EMSGSIZE); 4208348SEric.Yu@Sun.COM } 4218348SEric.Yu@Sun.COM 4228348SEric.Yu@Sun.COM /* 4238348SEric.Yu@Sun.COM * For atomic sends we will only do one iteration. 4248348SEric.Yu@Sun.COM */ 4258348SEric.Yu@Sun.COM do { 4268348SEric.Yu@Sun.COM if (so->so_state & SS_CANTSENDMORE) { 4278348SEric.Yu@Sun.COM error = EPIPE; 4288348SEric.Yu@Sun.COM break; 4298348SEric.Yu@Sun.COM } 4308348SEric.Yu@Sun.COM 4318348SEric.Yu@Sun.COM if (so->so_error != 0) { 4328348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 4338348SEric.Yu@Sun.COM error = sogeterr(so, B_TRUE); 4348348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 4358348SEric.Yu@Sun.COM if (error != 0) 4368348SEric.Yu@Sun.COM break; 4378348SEric.Yu@Sun.COM } 4388348SEric.Yu@Sun.COM 4398348SEric.Yu@Sun.COM /* 4408348SEric.Yu@Sun.COM * Send down OOB messages even if the send path is being 4418348SEric.Yu@Sun.COM * flow controlled (assuming the protocol supports OOB data). 4428348SEric.Yu@Sun.COM */ 4438348SEric.Yu@Sun.COM if (flags & MSG_OOB) { 4448348SEric.Yu@Sun.COM if ((so->so_mode & SM_EXDATA) == 0) { 4458348SEric.Yu@Sun.COM error = EOPNOTSUPP; 4468348SEric.Yu@Sun.COM break; 4478348SEric.Yu@Sun.COM } 4488348SEric.Yu@Sun.COM } else if (so->so_snd_qfull) { 4498348SEric.Yu@Sun.COM /* 4508348SEric.Yu@Sun.COM * Need to wait until the protocol is ready to receive 4518348SEric.Yu@Sun.COM * more data for transmission. 4528348SEric.Yu@Sun.COM */ 4538348SEric.Yu@Sun.COM if ((error = so_snd_wait_qnotfull(so, dontblock)) != 0) 4548348SEric.Yu@Sun.COM break; 4558348SEric.Yu@Sun.COM } 4568348SEric.Yu@Sun.COM 4578348SEric.Yu@Sun.COM /* 4588348SEric.Yu@Sun.COM * Time to send data to the protocol. 
We either copy the 4598348SEric.Yu@Sun.COM * data into mblks or pass the uio directly to the protocol. 4608348SEric.Yu@Sun.COM * We decide what to do based on the available down calls. 4618348SEric.Yu@Sun.COM */ 4628348SEric.Yu@Sun.COM if (so->so_downcalls->sd_send_uio != NULL) { 4638348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_send_uio) 4648348SEric.Yu@Sun.COM (so->so_proto_handle, uiop, msg, cr); 4658348SEric.Yu@Sun.COM if (error != 0) 4668348SEric.Yu@Sun.COM break; 4678348SEric.Yu@Sun.COM } else { 4688348SEric.Yu@Sun.COM /* save the resid in case of failure */ 4698348SEric.Yu@Sun.COM orig_resid = uiop->uio_resid; 4708348SEric.Yu@Sun.COM 4718348SEric.Yu@Sun.COM if ((mp = socopyinuio(uiop, 4728348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxpsz, 4738348SEric.Yu@Sun.COM so->so_proto_props.sopp_wroff, 4748348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxblk, 4758348SEric.Yu@Sun.COM so->so_proto_props.sopp_tail, &error)) == NULL) { 4768348SEric.Yu@Sun.COM break; 4778348SEric.Yu@Sun.COM } 4788348SEric.Yu@Sun.COM ASSERT(uiop->uio_resid >= 0); 4798348SEric.Yu@Sun.COM 4808348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_send) 4818348SEric.Yu@Sun.COM (so->so_proto_handle, mp, msg, cr); 4828348SEric.Yu@Sun.COM if (error != 0) { 4838348SEric.Yu@Sun.COM /* 4848348SEric.Yu@Sun.COM * The send failed. We do not have to free the 4858348SEric.Yu@Sun.COM * mblks, because that is the protocol's 4868348SEric.Yu@Sun.COM * responsibility. However, uio_resid must 4878348SEric.Yu@Sun.COM * remain accurate, so adjust that here. 
4888348SEric.Yu@Sun.COM */ 4898348SEric.Yu@Sun.COM uiop->uio_resid = orig_resid; 4908348SEric.Yu@Sun.COM break; 4918348SEric.Yu@Sun.COM } 4928348SEric.Yu@Sun.COM } 4938348SEric.Yu@Sun.COM } while (uiop->uio_resid > 0); 4948348SEric.Yu@Sun.COM 4958348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 4968348SEric.Yu@Sun.COM 4978348SEric.Yu@Sun.COM return (error); 4988348SEric.Yu@Sun.COM } 4998348SEric.Yu@Sun.COM 5008348SEric.Yu@Sun.COM int 5018348SEric.Yu@Sun.COM so_sendmblk(struct sonode *so, struct nmsghdr *msg, int fflag, 5028348SEric.Yu@Sun.COM struct cred *cr, mblk_t **mpp) 5038348SEric.Yu@Sun.COM { 5048348SEric.Yu@Sun.COM int error; 5058348SEric.Yu@Sun.COM boolean_t dontblock; 5068348SEric.Yu@Sun.COM size_t size; 5078348SEric.Yu@Sun.COM mblk_t *mp = *mpp; 5088348SEric.Yu@Sun.COM 5098348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_SENDMBLK(so, msg, fflag, cr, mpp)); 5108348SEric.Yu@Sun.COM 5118348SEric.Yu@Sun.COM error = 0; 5128348SEric.Yu@Sun.COM dontblock = (msg->msg_flags & MSG_DONTWAIT) || 5138348SEric.Yu@Sun.COM (fflag & (FNONBLOCK|FNDELAY)); 5148348SEric.Yu@Sun.COM size = msgdsize(mp); 5158348SEric.Yu@Sun.COM 5168401SAnders.Persson@Sun.COM if ((so->so_mode & SM_SENDFILESUPP) == 0 || 5178401SAnders.Persson@Sun.COM so->so_downcalls->sd_send == NULL) { 5188348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 5198348SEric.Yu@Sun.COM return (EOPNOTSUPP); 5208348SEric.Yu@Sun.COM } 5218348SEric.Yu@Sun.COM 5228348SEric.Yu@Sun.COM if ((so->so_mode & SM_ATOMIC) && 5238348SEric.Yu@Sun.COM size > so->so_proto_props.sopp_maxpsz && 5248348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxpsz != -1) { 5258348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 5268348SEric.Yu@Sun.COM return (EMSGSIZE); 5278348SEric.Yu@Sun.COM } 5288348SEric.Yu@Sun.COM 5298348SEric.Yu@Sun.COM while (mp != NULL) { 5308348SEric.Yu@Sun.COM mblk_t *nmp, *last_mblk; 5318348SEric.Yu@Sun.COM size_t mlen; 5328348SEric.Yu@Sun.COM 5338348SEric.Yu@Sun.COM if (so->so_state & SS_CANTSENDMORE) { 5348348SEric.Yu@Sun.COM error = EPIPE; 
5358348SEric.Yu@Sun.COM break; 5368348SEric.Yu@Sun.COM } 5378348SEric.Yu@Sun.COM if (so->so_error != 0) { 5388348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 5398348SEric.Yu@Sun.COM error = sogeterr(so, B_TRUE); 5408348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 5418348SEric.Yu@Sun.COM if (error != 0) 5428348SEric.Yu@Sun.COM break; 5438348SEric.Yu@Sun.COM } 5448348SEric.Yu@Sun.COM if (so->so_snd_qfull) { 5458348SEric.Yu@Sun.COM /* 5468348SEric.Yu@Sun.COM * Need to wait until the protocol is ready to receive 5478348SEric.Yu@Sun.COM * more data for transmission. 5488348SEric.Yu@Sun.COM */ 5498348SEric.Yu@Sun.COM if ((error = so_snd_wait_qnotfull(so, dontblock)) != 0) 5508348SEric.Yu@Sun.COM break; 5518348SEric.Yu@Sun.COM } 5528348SEric.Yu@Sun.COM 5538348SEric.Yu@Sun.COM /* 5548348SEric.Yu@Sun.COM * We only allow so_maxpsz of data to be sent down to 5558348SEric.Yu@Sun.COM * the protocol at time. 5568348SEric.Yu@Sun.COM */ 5578348SEric.Yu@Sun.COM mlen = MBLKL(mp); 5588348SEric.Yu@Sun.COM nmp = mp->b_cont; 5598348SEric.Yu@Sun.COM last_mblk = mp; 5608348SEric.Yu@Sun.COM while (nmp != NULL) { 5618348SEric.Yu@Sun.COM mlen += MBLKL(nmp); 5628348SEric.Yu@Sun.COM if (mlen > so->so_proto_props.sopp_maxpsz) { 5638348SEric.Yu@Sun.COM last_mblk->b_cont = NULL; 5648348SEric.Yu@Sun.COM break; 5658348SEric.Yu@Sun.COM } 5668348SEric.Yu@Sun.COM last_mblk = nmp; 5678348SEric.Yu@Sun.COM nmp = nmp->b_cont; 5688348SEric.Yu@Sun.COM } 5698348SEric.Yu@Sun.COM 5708348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_send) 5718348SEric.Yu@Sun.COM (so->so_proto_handle, mp, msg, cr); 5728348SEric.Yu@Sun.COM if (error != 0) { 5738348SEric.Yu@Sun.COM /* 5748348SEric.Yu@Sun.COM * The send failed. The protocol will free the mblks 5758348SEric.Yu@Sun.COM * that were sent down. Let the caller deal with the 5768348SEric.Yu@Sun.COM * rest. 
5778348SEric.Yu@Sun.COM */ 5788348SEric.Yu@Sun.COM *mpp = nmp; 5798348SEric.Yu@Sun.COM break; 5808348SEric.Yu@Sun.COM } 5818348SEric.Yu@Sun.COM 5828348SEric.Yu@Sun.COM *mpp = mp = nmp; 5838348SEric.Yu@Sun.COM } 5848348SEric.Yu@Sun.COM 5858348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 5868348SEric.Yu@Sun.COM 5878348SEric.Yu@Sun.COM return (error); 5888348SEric.Yu@Sun.COM } 5898348SEric.Yu@Sun.COM 5908348SEric.Yu@Sun.COM int 5918348SEric.Yu@Sun.COM so_shutdown(struct sonode *so, int how, struct cred *cr) 5928348SEric.Yu@Sun.COM { 5938348SEric.Yu@Sun.COM int error; 5948348SEric.Yu@Sun.COM 5958348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_SHUTDOWN(so, how, cr)); 5968348SEric.Yu@Sun.COM 5978348SEric.Yu@Sun.COM /* 5988348SEric.Yu@Sun.COM * SunOS 4.X has no check for datagram sockets. 5998348SEric.Yu@Sun.COM * 5.X checks that it is connected (ENOTCONN) 6008348SEric.Yu@Sun.COM * X/Open requires that we check the connected state. 6018348SEric.Yu@Sun.COM */ 6028348SEric.Yu@Sun.COM if (!(so->so_state & SS_ISCONNECTED)) { 6038348SEric.Yu@Sun.COM if (!xnet_skip_checks) { 6048348SEric.Yu@Sun.COM error = ENOTCONN; 6058348SEric.Yu@Sun.COM if (xnet_check_print) { 6068348SEric.Yu@Sun.COM printf("sockfs: X/Open shutdown check " 6078348SEric.Yu@Sun.COM "caused ENOTCONN\n"); 6088348SEric.Yu@Sun.COM } 6098348SEric.Yu@Sun.COM } 6108348SEric.Yu@Sun.COM goto done; 6118348SEric.Yu@Sun.COM } 6128348SEric.Yu@Sun.COM 6138348SEric.Yu@Sun.COM error = ((*so->so_downcalls->sd_shutdown)(so->so_proto_handle, 6148348SEric.Yu@Sun.COM how, cr)); 6158348SEric.Yu@Sun.COM 6168348SEric.Yu@Sun.COM /* 6178348SEric.Yu@Sun.COM * Protocol agreed to shutdown. We need to flush the 6188348SEric.Yu@Sun.COM * receive buffer if the receive side is being shutdown. 
6198348SEric.Yu@Sun.COM */ 6208348SEric.Yu@Sun.COM if (error == 0 && how != SHUT_WR) { 6218348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 6228348SEric.Yu@Sun.COM /* wait for active reader to finish */ 6238348SEric.Yu@Sun.COM (void) so_lock_read(so, 0); 6248348SEric.Yu@Sun.COM 6258348SEric.Yu@Sun.COM so_rcv_flush(so); 6268348SEric.Yu@Sun.COM 6278348SEric.Yu@Sun.COM so_unlock_read(so); 6288348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 6298348SEric.Yu@Sun.COM } 6308348SEric.Yu@Sun.COM 6318348SEric.Yu@Sun.COM done: 6328348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 6338348SEric.Yu@Sun.COM return (error); 6348348SEric.Yu@Sun.COM } 6358348SEric.Yu@Sun.COM 6368348SEric.Yu@Sun.COM int 6378348SEric.Yu@Sun.COM so_getsockname(struct sonode *so, struct sockaddr *addr, 6388348SEric.Yu@Sun.COM socklen_t *addrlen, struct cred *cr) 6398348SEric.Yu@Sun.COM { 6408348SEric.Yu@Sun.COM int error; 6418348SEric.Yu@Sun.COM 6428348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_GETSOCKNAME(so, addr, addrlen, cr)); 6438348SEric.Yu@Sun.COM 6448348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_getsockname) 6458348SEric.Yu@Sun.COM (so->so_proto_handle, addr, addrlen, cr); 6468348SEric.Yu@Sun.COM 6478348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 6488348SEric.Yu@Sun.COM return (error); 6498348SEric.Yu@Sun.COM } 6508348SEric.Yu@Sun.COM 6518348SEric.Yu@Sun.COM int 6528348SEric.Yu@Sun.COM so_getpeername(struct sonode *so, struct sockaddr *addr, 6538348SEric.Yu@Sun.COM socklen_t *addrlen, boolean_t accept, struct cred *cr) 6548348SEric.Yu@Sun.COM { 6558348SEric.Yu@Sun.COM int error; 6568348SEric.Yu@Sun.COM 6578348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_GETPEERNAME(so, addr, addrlen, accept, cr)); 6588348SEric.Yu@Sun.COM 6598348SEric.Yu@Sun.COM if (accept) { 6608348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_getpeername) 6618348SEric.Yu@Sun.COM (so->so_proto_handle, addr, addrlen, cr); 6628348SEric.Yu@Sun.COM } else if (!(so->so_state & SS_ISCONNECTED)) { 6638348SEric.Yu@Sun.COM error = ENOTCONN; 
6648348SEric.Yu@Sun.COM } else if ((so->so_state & SS_CANTSENDMORE) && !xnet_skip_checks) { 6658348SEric.Yu@Sun.COM /* Added this check for X/Open */ 6668348SEric.Yu@Sun.COM error = EINVAL; 6678348SEric.Yu@Sun.COM if (xnet_check_print) { 6688348SEric.Yu@Sun.COM printf("sockfs: X/Open getpeername check => EINVAL\n"); 6698348SEric.Yu@Sun.COM } 6708348SEric.Yu@Sun.COM } else { 6718348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_getpeername) 6728348SEric.Yu@Sun.COM (so->so_proto_handle, addr, addrlen, cr); 6738348SEric.Yu@Sun.COM } 6748348SEric.Yu@Sun.COM 6758348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 6768348SEric.Yu@Sun.COM return (error); 6778348SEric.Yu@Sun.COM } 6788348SEric.Yu@Sun.COM 6798348SEric.Yu@Sun.COM int 6808348SEric.Yu@Sun.COM so_getsockopt(struct sonode *so, int level, int option_name, 6818348SEric.Yu@Sun.COM void *optval, socklen_t *optlenp, int flags, struct cred *cr) 6828348SEric.Yu@Sun.COM { 6838348SEric.Yu@Sun.COM int error = 0; 6848348SEric.Yu@Sun.COM 6858348SEric.Yu@Sun.COM ASSERT(MUTEX_NOT_HELD(&so->so_lock)); 6868348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, 6878348SEric.Yu@Sun.COM SOP_GETSOCKOPT(so, level, option_name, optval, optlenp, flags, cr)); 6888348SEric.Yu@Sun.COM 689*8465SEric.Yu@Sun.COM error = socket_getopt_common(so, level, option_name, optval, optlenp, 690*8465SEric.Yu@Sun.COM flags); 6918348SEric.Yu@Sun.COM if (error < 0) { 6928348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_getsockopt) 6938348SEric.Yu@Sun.COM (so->so_proto_handle, level, option_name, optval, optlenp, 6948348SEric.Yu@Sun.COM cr); 6958348SEric.Yu@Sun.COM if (error == ENOPROTOOPT) { 6968348SEric.Yu@Sun.COM if (level == SOL_SOCKET) { 6978348SEric.Yu@Sun.COM /* 6988348SEric.Yu@Sun.COM * If a protocol does not support a particular 6998348SEric.Yu@Sun.COM * socket option, set can fail (not allowed) 7008348SEric.Yu@Sun.COM * but get can not fail. This is the previous 7018348SEric.Yu@Sun.COM * sockfs bahvior. 
7028348SEric.Yu@Sun.COM */ 7038348SEric.Yu@Sun.COM switch (option_name) { 7048348SEric.Yu@Sun.COM case SO_LINGER: 7058348SEric.Yu@Sun.COM if (*optlenp < (t_uscalar_t) 7068348SEric.Yu@Sun.COM sizeof (struct linger)) { 7078348SEric.Yu@Sun.COM error = EINVAL; 7088348SEric.Yu@Sun.COM break; 7098348SEric.Yu@Sun.COM } 7108348SEric.Yu@Sun.COM error = 0; 7118348SEric.Yu@Sun.COM bzero(optval, sizeof (struct linger)); 7128348SEric.Yu@Sun.COM *optlenp = sizeof (struct linger); 7138348SEric.Yu@Sun.COM break; 7148348SEric.Yu@Sun.COM case SO_RCVTIMEO: 7158348SEric.Yu@Sun.COM case SO_SNDTIMEO: 7168348SEric.Yu@Sun.COM if (*optlenp < (t_uscalar_t) 7178348SEric.Yu@Sun.COM sizeof (struct timeval)) { 7188348SEric.Yu@Sun.COM error = EINVAL; 7198348SEric.Yu@Sun.COM break; 7208348SEric.Yu@Sun.COM } 7218348SEric.Yu@Sun.COM error = 0; 7228348SEric.Yu@Sun.COM bzero(optval, sizeof (struct timeval)); 7238348SEric.Yu@Sun.COM *optlenp = sizeof (struct timeval); 7248348SEric.Yu@Sun.COM break; 7258348SEric.Yu@Sun.COM case SO_SND_BUFINFO: 7268348SEric.Yu@Sun.COM if (*optlenp < (t_uscalar_t) 7278348SEric.Yu@Sun.COM sizeof (struct so_snd_bufinfo)) { 7288348SEric.Yu@Sun.COM error = EINVAL; 7298348SEric.Yu@Sun.COM break; 7308348SEric.Yu@Sun.COM } 7318348SEric.Yu@Sun.COM error = 0; 7328348SEric.Yu@Sun.COM bzero(optval, 7338348SEric.Yu@Sun.COM sizeof (struct so_snd_bufinfo)); 7348348SEric.Yu@Sun.COM *optlenp = 7358348SEric.Yu@Sun.COM sizeof (struct so_snd_bufinfo); 7368348SEric.Yu@Sun.COM break; 7378348SEric.Yu@Sun.COM case SO_DEBUG: 7388348SEric.Yu@Sun.COM case SO_REUSEADDR: 7398348SEric.Yu@Sun.COM case SO_KEEPALIVE: 7408348SEric.Yu@Sun.COM case SO_DONTROUTE: 7418348SEric.Yu@Sun.COM case SO_BROADCAST: 7428348SEric.Yu@Sun.COM case SO_USELOOPBACK: 7438348SEric.Yu@Sun.COM case SO_OOBINLINE: 7448348SEric.Yu@Sun.COM case SO_DGRAM_ERRIND: 7458348SEric.Yu@Sun.COM case SO_SNDBUF: 7468348SEric.Yu@Sun.COM case SO_RCVBUF: 7478348SEric.Yu@Sun.COM error = 0; 7488348SEric.Yu@Sun.COM *((int32_t *)optval) = 0; 
7498348SEric.Yu@Sun.COM *optlenp = sizeof (int32_t); 7508348SEric.Yu@Sun.COM break; 7518348SEric.Yu@Sun.COM default: 7528348SEric.Yu@Sun.COM break; 7538348SEric.Yu@Sun.COM } 7548348SEric.Yu@Sun.COM } 7558348SEric.Yu@Sun.COM } 7568348SEric.Yu@Sun.COM } 7578348SEric.Yu@Sun.COM 7588348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 7598348SEric.Yu@Sun.COM return (error); 7608348SEric.Yu@Sun.COM } 7618348SEric.Yu@Sun.COM 7628348SEric.Yu@Sun.COM int 7638348SEric.Yu@Sun.COM so_setsockopt(struct sonode *so, int level, int option_name, 7648348SEric.Yu@Sun.COM const void *optval, socklen_t optlen, struct cred *cr) 7658348SEric.Yu@Sun.COM { 7668348SEric.Yu@Sun.COM int error = 0; 7678348SEric.Yu@Sun.COM 7688348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, 7698348SEric.Yu@Sun.COM SOP_SETSOCKOPT(so, level, option_name, optval, optlen, cr)); 7708348SEric.Yu@Sun.COM 7718348SEric.Yu@Sun.COM /* X/Open requires this check */ 7728348SEric.Yu@Sun.COM if (so->so_state & SS_CANTSENDMORE && !xnet_skip_checks) { 7738348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 7748348SEric.Yu@Sun.COM if (xnet_check_print) 7758348SEric.Yu@Sun.COM printf("sockfs: X/Open setsockopt check => EINVAL\n"); 7768348SEric.Yu@Sun.COM return (EINVAL); 7778348SEric.Yu@Sun.COM } 7788348SEric.Yu@Sun.COM 779*8465SEric.Yu@Sun.COM if (level == SOL_SOCKET) { 780*8465SEric.Yu@Sun.COM switch (option_name) { 781*8465SEric.Yu@Sun.COM case SO_RCVTIMEO: 782*8465SEric.Yu@Sun.COM case SO_SNDTIMEO: { 783*8465SEric.Yu@Sun.COM struct timeval *tl = (struct timeval *)optval; 784*8465SEric.Yu@Sun.COM clock_t t_usec; 7858348SEric.Yu@Sun.COM 786*8465SEric.Yu@Sun.COM if (optlen != (t_uscalar_t)sizeof (struct timeval)) { 787*8465SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 788*8465SEric.Yu@Sun.COM return (EINVAL); 789*8465SEric.Yu@Sun.COM } 790*8465SEric.Yu@Sun.COM t_usec = tl->tv_sec * 1000 * 1000 + tl->tv_usec; 791*8465SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 792*8465SEric.Yu@Sun.COM if (option_name == SO_RCVTIMEO) 793*8465SEric.Yu@Sun.COM 
so->so_rcvtimeo = drv_usectohz(t_usec); 794*8465SEric.Yu@Sun.COM else 795*8465SEric.Yu@Sun.COM so->so_sndtimeo = drv_usectohz(t_usec); 796*8465SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 7978348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 798*8465SEric.Yu@Sun.COM return (0); 7998348SEric.Yu@Sun.COM } 800*8465SEric.Yu@Sun.COM case SO_RCVBUF: 801*8465SEric.Yu@Sun.COM /* 802*8465SEric.Yu@Sun.COM * XXX XPG 4.2 applications retrieve SO_RCVBUF from 803*8465SEric.Yu@Sun.COM * sockfs since the transport might adjust the value 804*8465SEric.Yu@Sun.COM * and not return exactly what was set by the 805*8465SEric.Yu@Sun.COM * application. 806*8465SEric.Yu@Sun.COM */ 807*8465SEric.Yu@Sun.COM so->so_xpg_rcvbuf = *(int32_t *)optval; 808*8465SEric.Yu@Sun.COM break; 809*8465SEric.Yu@Sun.COM } 8108348SEric.Yu@Sun.COM } 8118348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_setsockopt) 8128348SEric.Yu@Sun.COM (so->so_proto_handle, level, option_name, optval, optlen, cr); 8138348SEric.Yu@Sun.COM 8148348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 8158348SEric.Yu@Sun.COM return (error); 8168348SEric.Yu@Sun.COM } 8178348SEric.Yu@Sun.COM 8188348SEric.Yu@Sun.COM int 8198348SEric.Yu@Sun.COM so_ioctl(struct sonode *so, int cmd, intptr_t arg, int mode, 8208348SEric.Yu@Sun.COM struct cred *cr, int32_t *rvalp) 8218348SEric.Yu@Sun.COM { 8228348SEric.Yu@Sun.COM int error = 0; 8238348SEric.Yu@Sun.COM 8248348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_IOCTL(so, cmd, arg, mode, cr, rvalp)); 8258348SEric.Yu@Sun.COM 8268348SEric.Yu@Sun.COM /* 8278348SEric.Yu@Sun.COM * If there is a pending error, return error 8288348SEric.Yu@Sun.COM * This can happen if a non blocking operation caused an error. 
8298348SEric.Yu@Sun.COM */ 8308348SEric.Yu@Sun.COM if (so->so_error != 0) { 8318348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 8328348SEric.Yu@Sun.COM error = sogeterr(so, B_TRUE); 8338348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 8348348SEric.Yu@Sun.COM if (error != 0) 8358348SEric.Yu@Sun.COM goto done; 8368348SEric.Yu@Sun.COM } 8378348SEric.Yu@Sun.COM 8388348SEric.Yu@Sun.COM /* 8398348SEric.Yu@Sun.COM * calling strioc can result in the socket falling back to TPI, 8408348SEric.Yu@Sun.COM * if that is supported. 8418348SEric.Yu@Sun.COM */ 8428348SEric.Yu@Sun.COM if ((error = socket_ioctl_common(so, cmd, arg, mode, cr, rvalp)) < 0 && 8438348SEric.Yu@Sun.COM (error = socket_strioc_common(so, cmd, arg, mode, cr, rvalp)) < 0) { 8448348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_ioctl)(so->so_proto_handle, 8458348SEric.Yu@Sun.COM cmd, arg, mode, rvalp, cr); 8468348SEric.Yu@Sun.COM } 8478348SEric.Yu@Sun.COM 8488348SEric.Yu@Sun.COM done: 8498348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 8508348SEric.Yu@Sun.COM 8518348SEric.Yu@Sun.COM return (error); 8528348SEric.Yu@Sun.COM } 8538348SEric.Yu@Sun.COM 8548348SEric.Yu@Sun.COM int 8558348SEric.Yu@Sun.COM so_poll(struct sonode *so, short events, int anyyet, short *reventsp, 8568348SEric.Yu@Sun.COM struct pollhead **phpp) 8578348SEric.Yu@Sun.COM { 8588348SEric.Yu@Sun.COM int state = so->so_state; 8598348SEric.Yu@Sun.COM *reventsp = 0; 8608348SEric.Yu@Sun.COM 8618348SEric.Yu@Sun.COM if (so->so_error != 0 && 8628348SEric.Yu@Sun.COM ((POLLIN|POLLRDNORM|POLLOUT) & events) != 0) { 8638348SEric.Yu@Sun.COM *reventsp = (POLLIN|POLLRDNORM|POLLOUT) & events; 8648348SEric.Yu@Sun.COM return (0); 8658348SEric.Yu@Sun.COM } 8668348SEric.Yu@Sun.COM 8678348SEric.Yu@Sun.COM /* 8688348SEric.Yu@Sun.COM * As long as there is buffer to send data, and the socket is 8698348SEric.Yu@Sun.COM * in a state where it can send data (i.e., connected for 8708348SEric.Yu@Sun.COM * connection oriented protocols), then turn on POLLOUT events 
8718348SEric.Yu@Sun.COM */ 8728348SEric.Yu@Sun.COM if (!so->so_snd_qfull && ((so->so_mode & SM_CONNREQUIRED) == 0 || 8738348SEric.Yu@Sun.COM state & SS_ISCONNECTED)) { 8748348SEric.Yu@Sun.COM *reventsp |= POLLOUT & events; 8758348SEric.Yu@Sun.COM } 8768348SEric.Yu@Sun.COM 8778348SEric.Yu@Sun.COM /* 8788348SEric.Yu@Sun.COM * Turn on POLLIN whenever there is data on the receive queue, 8798348SEric.Yu@Sun.COM * or the socket is in a state where no more data will be received. 8808348SEric.Yu@Sun.COM * Also, if the socket is accepting connections, flip the bit if 8818348SEric.Yu@Sun.COM * there is something on the queue. 8828427SAnders.Persson@Sun.COM * 8838427SAnders.Persson@Sun.COM * We do an initial check for events without holding locks. However, 8848427SAnders.Persson@Sun.COM * if there are no event available, then we redo the check for POLLIN 8858427SAnders.Persson@Sun.COM * events under the lock. 8868348SEric.Yu@Sun.COM */ 8878348SEric.Yu@Sun.COM 8888348SEric.Yu@Sun.COM /* Pending connections */ 8898348SEric.Yu@Sun.COM if (so->so_acceptq_len > 0) 8908348SEric.Yu@Sun.COM *reventsp |= (POLLIN|POLLRDNORM) & events; 8918348SEric.Yu@Sun.COM 8928348SEric.Yu@Sun.COM /* Data */ 8938348SEric.Yu@Sun.COM /* so_downcalls is null for sctp */ 8948348SEric.Yu@Sun.COM if (so->so_downcalls != NULL && so->so_downcalls->sd_poll != NULL) { 8958348SEric.Yu@Sun.COM *reventsp |= (*so->so_downcalls->sd_poll) 8968348SEric.Yu@Sun.COM (so->so_proto_handle, events & SO_PROTO_POLLEV, anyyet, 8978348SEric.Yu@Sun.COM CRED()) & events; 8988348SEric.Yu@Sun.COM ASSERT((*reventsp & ~events) == 0); 8998348SEric.Yu@Sun.COM /* do not recheck events */ 9008348SEric.Yu@Sun.COM events &= ~SO_PROTO_POLLEV; 9018348SEric.Yu@Sun.COM } else { 9028348SEric.Yu@Sun.COM if (SO_HAVE_DATA(so)) 9038348SEric.Yu@Sun.COM *reventsp |= (POLLIN|POLLRDNORM) & events; 9048348SEric.Yu@Sun.COM 9058348SEric.Yu@Sun.COM /* Urgent data */ 9068348SEric.Yu@Sun.COM if ((state & SS_OOBPEND) != 0) 9078348SEric.Yu@Sun.COM *reventsp |= 
(POLLRDBAND) & events; 9088348SEric.Yu@Sun.COM } 9098348SEric.Yu@Sun.COM 9108348SEric.Yu@Sun.COM if (!*reventsp && !anyyet) { 9118348SEric.Yu@Sun.COM /* Check for read events again, but this time under lock */ 9128348SEric.Yu@Sun.COM if (events & (POLLIN|POLLRDNORM)) { 9138348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 9148348SEric.Yu@Sun.COM if (SO_HAVE_DATA(so) || so->so_acceptq_len > 0) { 9158348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 9168348SEric.Yu@Sun.COM *reventsp |= (POLLIN|POLLRDNORM) & events; 9178348SEric.Yu@Sun.COM return (0); 9188348SEric.Yu@Sun.COM } else { 9198348SEric.Yu@Sun.COM so->so_pollev |= SO_POLLEV_IN; 9208348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 9218348SEric.Yu@Sun.COM } 9228348SEric.Yu@Sun.COM } 9238348SEric.Yu@Sun.COM *phpp = &so->so_poll_list; 9248348SEric.Yu@Sun.COM } 9258348SEric.Yu@Sun.COM return (0); 9268348SEric.Yu@Sun.COM } 9278348SEric.Yu@Sun.COM 9288348SEric.Yu@Sun.COM /* 9298348SEric.Yu@Sun.COM * Generic Upcalls 9308348SEric.Yu@Sun.COM */ 9318348SEric.Yu@Sun.COM void 9328348SEric.Yu@Sun.COM so_connected(sock_upper_handle_t sock_handle, sock_connid_t id, 9338348SEric.Yu@Sun.COM cred_t *peer_cred, pid_t peer_cpid) 9348348SEric.Yu@Sun.COM { 9358348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)sock_handle; 9368348SEric.Yu@Sun.COM 9378348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 9388348SEric.Yu@Sun.COM ASSERT(so->so_proto_handle != NULL); 9398348SEric.Yu@Sun.COM 9408348SEric.Yu@Sun.COM if (peer_cred != NULL) { 9418348SEric.Yu@Sun.COM if (so->so_peercred != NULL) 9428348SEric.Yu@Sun.COM crfree(so->so_peercred); 9438348SEric.Yu@Sun.COM crhold(peer_cred); 9448348SEric.Yu@Sun.COM so->so_peercred = peer_cred; 9458348SEric.Yu@Sun.COM so->so_cpid = peer_cpid; 9468348SEric.Yu@Sun.COM } 9478348SEric.Yu@Sun.COM 9488348SEric.Yu@Sun.COM so->so_proto_connid = id; 9498348SEric.Yu@Sun.COM soisconnected(so); 9508348SEric.Yu@Sun.COM /* 9518348SEric.Yu@Sun.COM * Wake ones who're waiting for conn to become established. 
9528348SEric.Yu@Sun.COM */ 9538348SEric.Yu@Sun.COM so_notify_connected(so); 9548348SEric.Yu@Sun.COM } 9558348SEric.Yu@Sun.COM 9568348SEric.Yu@Sun.COM int 9578348SEric.Yu@Sun.COM so_disconnected(sock_upper_handle_t sock_handle, sock_connid_t id, int error) 9588348SEric.Yu@Sun.COM { 9598348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)sock_handle; 9608348SEric.Yu@Sun.COM 9618348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 9628348SEric.Yu@Sun.COM 9638348SEric.Yu@Sun.COM so->so_proto_connid = id; 9648348SEric.Yu@Sun.COM soisdisconnected(so, error); 9658348SEric.Yu@Sun.COM so_notify_disconnected(so, error); 9668348SEric.Yu@Sun.COM 9678348SEric.Yu@Sun.COM return (0); 9688348SEric.Yu@Sun.COM } 9698348SEric.Yu@Sun.COM 9708348SEric.Yu@Sun.COM void 9718348SEric.Yu@Sun.COM so_opctl(sock_upper_handle_t sock_handle, sock_opctl_action_t action, 9728348SEric.Yu@Sun.COM uintptr_t arg) 9738348SEric.Yu@Sun.COM { 9748348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)sock_handle; 9758348SEric.Yu@Sun.COM 9768348SEric.Yu@Sun.COM switch (action) { 9778348SEric.Yu@Sun.COM case SOCK_OPCTL_SHUT_SEND: 9788348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 9798348SEric.Yu@Sun.COM socantsendmore(so); 9808348SEric.Yu@Sun.COM so_notify_disconnecting(so); 9818348SEric.Yu@Sun.COM break; 9828348SEric.Yu@Sun.COM case SOCK_OPCTL_SHUT_RECV: { 9838348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 9848348SEric.Yu@Sun.COM socantrcvmore(so); 9858348SEric.Yu@Sun.COM so_notify_eof(so); 9868348SEric.Yu@Sun.COM break; 9878348SEric.Yu@Sun.COM } 9888348SEric.Yu@Sun.COM case SOCK_OPCTL_ENAB_ACCEPT: 9898348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 9908348SEric.Yu@Sun.COM so->so_state |= SS_ACCEPTCONN; 9918348SEric.Yu@Sun.COM so->so_backlog = (unsigned int)arg; 9928348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 9938348SEric.Yu@Sun.COM break; 9948348SEric.Yu@Sun.COM default: 9958348SEric.Yu@Sun.COM ASSERT(0); 9968348SEric.Yu@Sun.COM break; 9978348SEric.Yu@Sun.COM } 9988348SEric.Yu@Sun.COM } 
9998348SEric.Yu@Sun.COM 10008348SEric.Yu@Sun.COM void 10018348SEric.Yu@Sun.COM so_txq_full(sock_upper_handle_t sock_handle, boolean_t qfull) 10028348SEric.Yu@Sun.COM { 10038348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)sock_handle; 10048348SEric.Yu@Sun.COM 10058348SEric.Yu@Sun.COM if (qfull) { 10068348SEric.Yu@Sun.COM so_snd_qfull(so); 10078348SEric.Yu@Sun.COM } else { 10088348SEric.Yu@Sun.COM so_snd_qnotfull(so); 10098348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 10108348SEric.Yu@Sun.COM so_notify_writable(so); 10118348SEric.Yu@Sun.COM } 10128348SEric.Yu@Sun.COM } 10138348SEric.Yu@Sun.COM 10148348SEric.Yu@Sun.COM sock_upper_handle_t 10158348SEric.Yu@Sun.COM so_newconn(sock_upper_handle_t parenthandle, 10168348SEric.Yu@Sun.COM sock_lower_handle_t proto_handle, sock_downcalls_t *sock_downcalls, 10178348SEric.Yu@Sun.COM struct cred *peer_cred, pid_t peer_cpid, sock_upcalls_t **sock_upcallsp) 10188348SEric.Yu@Sun.COM { 10198348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)parenthandle; 10208348SEric.Yu@Sun.COM struct sonode *nso; 10218348SEric.Yu@Sun.COM int error; 10228348SEric.Yu@Sun.COM 10238348SEric.Yu@Sun.COM ASSERT(proto_handle != NULL); 10248348SEric.Yu@Sun.COM 10258348SEric.Yu@Sun.COM if ((so->so_state & SS_ACCEPTCONN) == 0 || 10268348SEric.Yu@Sun.COM so->so_acceptq_len >= so->so_backlog) 10278348SEric.Yu@Sun.COM return (NULL); 10288348SEric.Yu@Sun.COM 10298348SEric.Yu@Sun.COM nso = socket_newconn(so, proto_handle, sock_downcalls, SOCKET_NOSLEEP, 10308348SEric.Yu@Sun.COM &error); 10318348SEric.Yu@Sun.COM if (nso == NULL) 10328348SEric.Yu@Sun.COM return (NULL); 10338348SEric.Yu@Sun.COM 10348348SEric.Yu@Sun.COM if (peer_cred != NULL) { 10358348SEric.Yu@Sun.COM crhold(peer_cred); 10368348SEric.Yu@Sun.COM nso->so_peercred = peer_cred; 10378348SEric.Yu@Sun.COM nso->so_cpid = peer_cpid; 10388348SEric.Yu@Sun.COM } 10398348SEric.Yu@Sun.COM 10408348SEric.Yu@Sun.COM (void) so_acceptq_enqueue(so, nso); 10418348SEric.Yu@Sun.COM 
mutex_enter(&so->so_lock); 10428348SEric.Yu@Sun.COM so_notify_newconn(so); 10438348SEric.Yu@Sun.COM 10448348SEric.Yu@Sun.COM *sock_upcallsp = &so_upcalls; 10458348SEric.Yu@Sun.COM 10468348SEric.Yu@Sun.COM return ((sock_upper_handle_t)nso); 10478348SEric.Yu@Sun.COM } 10488348SEric.Yu@Sun.COM 10498348SEric.Yu@Sun.COM void 10508348SEric.Yu@Sun.COM so_set_prop(sock_upper_handle_t sock_handle, struct sock_proto_props *soppp) 10518348SEric.Yu@Sun.COM { 10528348SEric.Yu@Sun.COM struct sonode *so; 10538348SEric.Yu@Sun.COM 10548348SEric.Yu@Sun.COM so = (struct sonode *)sock_handle; 10558348SEric.Yu@Sun.COM 10568348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 10578348SEric.Yu@Sun.COM 10588348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_MAXBLK) 10598348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxblk = soppp->sopp_maxblk; 10608348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_WROFF) 10618348SEric.Yu@Sun.COM so->so_proto_props.sopp_wroff = soppp->sopp_wroff; 10628348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_TAIL) 10638348SEric.Yu@Sun.COM so->so_proto_props.sopp_tail = soppp->sopp_tail; 10648348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_RCVHIWAT) 10658348SEric.Yu@Sun.COM so->so_proto_props.sopp_rxhiwat = soppp->sopp_rxhiwat; 10668348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_RCVLOWAT) 10678348SEric.Yu@Sun.COM so->so_proto_props.sopp_rxlowat = soppp->sopp_rxlowat; 10688348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_MAXPSZ) 10698348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxpsz = soppp->sopp_maxpsz; 10708348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_MINPSZ) 10718348SEric.Yu@Sun.COM so->so_proto_props.sopp_minpsz = soppp->sopp_minpsz; 10728348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_ZCOPY) { 10738348SEric.Yu@Sun.COM if (soppp->sopp_zcopyflag & ZCVMSAFE) { 10748348SEric.Yu@Sun.COM so->so_proto_props.sopp_zcopyflag |= STZCVMSAFE; 10758348SEric.Yu@Sun.COM so->so_proto_props.sopp_zcopyflag &= ~STZCVMUNSAFE; 10768348SEric.Yu@Sun.COM } else if 
(soppp->sopp_zcopyflag & ZCVMUNSAFE) { 10778348SEric.Yu@Sun.COM so->so_proto_props.sopp_zcopyflag |= STZCVMUNSAFE; 10788348SEric.Yu@Sun.COM so->so_proto_props.sopp_zcopyflag &= ~STZCVMSAFE; 10798348SEric.Yu@Sun.COM } 10808348SEric.Yu@Sun.COM 10818348SEric.Yu@Sun.COM if (soppp->sopp_zcopyflag & COPYCACHED) { 10828348SEric.Yu@Sun.COM so->so_proto_props.sopp_zcopyflag |= STRCOPYCACHED; 10838348SEric.Yu@Sun.COM } 10848348SEric.Yu@Sun.COM } 10858348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_OOBINLINE) 10868348SEric.Yu@Sun.COM so->so_proto_props.sopp_oobinline = soppp->sopp_oobinline; 10878348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_RCVTIMER) 10888348SEric.Yu@Sun.COM so->so_proto_props.sopp_rcvtimer = soppp->sopp_rcvtimer; 10898348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_RCVTHRESH) 10908348SEric.Yu@Sun.COM so->so_proto_props.sopp_rcvthresh = soppp->sopp_rcvthresh; 10918348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_MAXADDRLEN) 10928348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxaddrlen = soppp->sopp_maxaddrlen; 10938348SEric.Yu@Sun.COM 10948348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 10958348SEric.Yu@Sun.COM 10968348SEric.Yu@Sun.COM #ifdef DEBUG 10978348SEric.Yu@Sun.COM soppp->sopp_flags &= ~(SOCKOPT_MAXBLK | SOCKOPT_WROFF | SOCKOPT_TAIL | 10988348SEric.Yu@Sun.COM SOCKOPT_RCVHIWAT | SOCKOPT_RCVLOWAT | SOCKOPT_MAXPSZ | 10998348SEric.Yu@Sun.COM SOCKOPT_ZCOPY | SOCKOPT_OOBINLINE | SOCKOPT_RCVTIMER | 11008348SEric.Yu@Sun.COM SOCKOPT_RCVTHRESH | SOCKOPT_MAXADDRLEN | SOCKOPT_MINPSZ); 11018348SEric.Yu@Sun.COM ASSERT(soppp->sopp_flags == 0); 11028348SEric.Yu@Sun.COM #endif 11038348SEric.Yu@Sun.COM } 11048348SEric.Yu@Sun.COM 11058348SEric.Yu@Sun.COM /* ARGSUSED */ 11068348SEric.Yu@Sun.COM ssize_t 11078348SEric.Yu@Sun.COM so_queue_msg(sock_upper_handle_t sock_handle, mblk_t *mp, 11088348SEric.Yu@Sun.COM size_t msg_size, int flags, int *errorp, boolean_t *force_pushp) 11098348SEric.Yu@Sun.COM { 11108348SEric.Yu@Sun.COM struct sonode *so = (struct sonode 
*)sock_handle; 11118348SEric.Yu@Sun.COM boolean_t force_push = B_TRUE; 11128348SEric.Yu@Sun.COM int space_left; 11138348SEric.Yu@Sun.COM sodirect_t *sodp = so->so_direct; 11148348SEric.Yu@Sun.COM 11158348SEric.Yu@Sun.COM ASSERT(errorp != NULL); 11168348SEric.Yu@Sun.COM *errorp = 0; 11178348SEric.Yu@Sun.COM if (mp == NULL) { 11188348SEric.Yu@Sun.COM if (msg_size > 0) { 11198348SEric.Yu@Sun.COM ASSERT(so->so_downcalls->sd_recv_uio != NULL); 11208348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 11218348SEric.Yu@Sun.COM /* the notify functions will drop the lock */ 11228348SEric.Yu@Sun.COM if (flags & MSG_OOB) 11238348SEric.Yu@Sun.COM so_notify_oobdata(so, IS_SO_OOB_INLINE(so)); 11248348SEric.Yu@Sun.COM else 11258348SEric.Yu@Sun.COM so_notify_data(so, msg_size); 11268348SEric.Yu@Sun.COM return (0); 11278348SEric.Yu@Sun.COM } 11288348SEric.Yu@Sun.COM /* 11298348SEric.Yu@Sun.COM * recv space check 11308348SEric.Yu@Sun.COM */ 11318348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 11328348SEric.Yu@Sun.COM space_left = so->so_rcvbuf - so->so_rcv_queued; 11338348SEric.Yu@Sun.COM if (space_left <= 0) { 11348348SEric.Yu@Sun.COM so->so_flowctrld = B_TRUE; 11358348SEric.Yu@Sun.COM *errorp = ENOSPC; 11368348SEric.Yu@Sun.COM space_left = -1; 11378348SEric.Yu@Sun.COM } 11388348SEric.Yu@Sun.COM goto done_unlock; 11398348SEric.Yu@Sun.COM } 11408348SEric.Yu@Sun.COM 11418348SEric.Yu@Sun.COM ASSERT(mp->b_next == NULL); 11428348SEric.Yu@Sun.COM ASSERT(DB_TYPE(mp) == M_DATA || DB_TYPE(mp) == M_PROTO); 11438348SEric.Yu@Sun.COM ASSERT(msg_size == msgdsize(mp)); 11448348SEric.Yu@Sun.COM 11458348SEric.Yu@Sun.COM if (flags & MSG_OOB) { 11468348SEric.Yu@Sun.COM so_queue_oob(sock_handle, mp, msg_size); 11478348SEric.Yu@Sun.COM return (0); 11488348SEric.Yu@Sun.COM } 11498348SEric.Yu@Sun.COM 11508348SEric.Yu@Sun.COM if (force_pushp != NULL) 11518348SEric.Yu@Sun.COM force_push = *force_pushp; 11528348SEric.Yu@Sun.COM 11538348SEric.Yu@Sun.COM if (DB_TYPE(mp) == M_PROTO && 
!__TPI_PRIM_ISALIGNED(mp->b_rptr)) { 11548348SEric.Yu@Sun.COM /* The read pointer is not aligned correctly for TPI */ 11558348SEric.Yu@Sun.COM zcmn_err(getzoneid(), CE_WARN, 11568348SEric.Yu@Sun.COM "sockfs: Unaligned TPI message received. rptr = %p\n", 11578348SEric.Yu@Sun.COM (void *)mp->b_rptr); 11588348SEric.Yu@Sun.COM freemsg(mp); 11598348SEric.Yu@Sun.COM mutex_enter(sodp->sod_lockp); 11608348SEric.Yu@Sun.COM SOD_UIOAFINI(sodp); 11618348SEric.Yu@Sun.COM mutex_exit(sodp->sod_lockp); 11628348SEric.Yu@Sun.COM 11638348SEric.Yu@Sun.COM return (so->so_rcvbuf - so->so_rcv_queued); 11648348SEric.Yu@Sun.COM } 11658348SEric.Yu@Sun.COM 11668348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 11678348SEric.Yu@Sun.COM if (so->so_state & (SS_FALLBACK_PENDING | SS_FALLBACK_COMP)) { 11688348SEric.Yu@Sun.COM SOD_DISABLE(sodp); 11698348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 11708348SEric.Yu@Sun.COM *errorp = EOPNOTSUPP; 11718348SEric.Yu@Sun.COM return (-1); 11728348SEric.Yu@Sun.COM } 11738348SEric.Yu@Sun.COM if (so->so_state & SS_CANTRCVMORE) { 11748348SEric.Yu@Sun.COM freemsg(mp); 11758348SEric.Yu@Sun.COM SOD_DISABLE(sodp); 11768348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 11778348SEric.Yu@Sun.COM return (0); 11788348SEric.Yu@Sun.COM } 11798348SEric.Yu@Sun.COM 11808348SEric.Yu@Sun.COM /* process the mblk via I/OAT if capable */ 11818348SEric.Yu@Sun.COM if (sodp != NULL && (sodp->sod_state & SOD_ENABLED)) { 11828348SEric.Yu@Sun.COM if (DB_TYPE(mp) == M_DATA) { 11838348SEric.Yu@Sun.COM (void) sod_uioa_mblk_init(sodp, mp, msg_size); 11848348SEric.Yu@Sun.COM } else { 11858348SEric.Yu@Sun.COM SOD_UIOAFINI(sodp); 11868348SEric.Yu@Sun.COM } 11878348SEric.Yu@Sun.COM } 11888348SEric.Yu@Sun.COM 11898348SEric.Yu@Sun.COM if (mp->b_next == NULL) { 11908348SEric.Yu@Sun.COM so_enqueue_msg(so, mp, msg_size); 11918348SEric.Yu@Sun.COM } else { 11928348SEric.Yu@Sun.COM do { 11938348SEric.Yu@Sun.COM mblk_t *nmp; 11948348SEric.Yu@Sun.COM 11958348SEric.Yu@Sun.COM if ((nmp = mp->b_next) != NULL) { 
11968348SEric.Yu@Sun.COM mp->b_next = NULL; 11978348SEric.Yu@Sun.COM } 11988348SEric.Yu@Sun.COM so_enqueue_msg(so, mp, msgdsize(mp)); 11998348SEric.Yu@Sun.COM mp = nmp; 12008348SEric.Yu@Sun.COM } while (mp != NULL); 12018348SEric.Yu@Sun.COM } 12028348SEric.Yu@Sun.COM 12038348SEric.Yu@Sun.COM space_left = so->so_rcvbuf - so->so_rcv_queued; 12048348SEric.Yu@Sun.COM if (space_left <= 0) { 12058348SEric.Yu@Sun.COM so->so_flowctrld = B_TRUE; 12068348SEric.Yu@Sun.COM *errorp = ENOSPC; 12078348SEric.Yu@Sun.COM space_left = -1; 12088348SEric.Yu@Sun.COM } 12098348SEric.Yu@Sun.COM 12108348SEric.Yu@Sun.COM if (force_push || so->so_rcv_queued >= so->so_rcv_thresh || 12118348SEric.Yu@Sun.COM so->so_rcv_queued >= so->so_rcv_wanted || 12128348SEric.Yu@Sun.COM (sodp != NULL && so->so_rcv_queued >= sodp->sod_want)) { 12138348SEric.Yu@Sun.COM SOCKET_TIMER_CANCEL(so); 12148348SEric.Yu@Sun.COM /* 12158348SEric.Yu@Sun.COM * so_notify_data will release the lock 12168348SEric.Yu@Sun.COM */ 12178348SEric.Yu@Sun.COM so_notify_data(so, so->so_rcv_queued); 12188348SEric.Yu@Sun.COM 12198348SEric.Yu@Sun.COM if (force_pushp != NULL) 12208348SEric.Yu@Sun.COM *force_pushp = B_TRUE; 12218348SEric.Yu@Sun.COM goto done; 12228348SEric.Yu@Sun.COM } else if (so->so_rcv_timer_tid == 0) { 12238348SEric.Yu@Sun.COM /* Make sure the recv push timer is running */ 12248348SEric.Yu@Sun.COM SOCKET_TIMER_START(so); 12258348SEric.Yu@Sun.COM } 12268348SEric.Yu@Sun.COM 12278348SEric.Yu@Sun.COM done_unlock: 12288348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 12298348SEric.Yu@Sun.COM done: 12308348SEric.Yu@Sun.COM return (space_left); 12318348SEric.Yu@Sun.COM } 12328348SEric.Yu@Sun.COM 12338348SEric.Yu@Sun.COM /* 12348348SEric.Yu@Sun.COM * Set the offset of where the oob data is relative to the bytes in 12358348SEric.Yu@Sun.COM * queued. 
Also generate SIGURG 12368348SEric.Yu@Sun.COM */ 12378348SEric.Yu@Sun.COM void 12388348SEric.Yu@Sun.COM so_signal_oob(sock_upper_handle_t sock_handle, ssize_t offset) 12398348SEric.Yu@Sun.COM { 12408348SEric.Yu@Sun.COM struct sonode *so; 12418348SEric.Yu@Sun.COM 12428348SEric.Yu@Sun.COM ASSERT(offset >= 0); 12438348SEric.Yu@Sun.COM so = (struct sonode *)sock_handle; 12448348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 12458348SEric.Yu@Sun.COM SOD_UIOAFINI(so->so_direct); 12468348SEric.Yu@Sun.COM 12478348SEric.Yu@Sun.COM /* 12488348SEric.Yu@Sun.COM * New urgent data on the way so forget about any old 12498348SEric.Yu@Sun.COM * urgent data. 12508348SEric.Yu@Sun.COM */ 12518348SEric.Yu@Sun.COM so->so_state &= ~(SS_HAVEOOBDATA|SS_HADOOBDATA); 12528348SEric.Yu@Sun.COM 12538348SEric.Yu@Sun.COM /* 12548348SEric.Yu@Sun.COM * Record that urgent data is pending. 12558348SEric.Yu@Sun.COM */ 12568348SEric.Yu@Sun.COM so->so_state |= SS_OOBPEND; 12578348SEric.Yu@Sun.COM 12588348SEric.Yu@Sun.COM if (so->so_oobmsg != NULL) { 12598348SEric.Yu@Sun.COM dprintso(so, 1, ("sock: discarding old oob\n")); 12608348SEric.Yu@Sun.COM freemsg(so->so_oobmsg); 12618348SEric.Yu@Sun.COM so->so_oobmsg = NULL; 12628348SEric.Yu@Sun.COM } 12638348SEric.Yu@Sun.COM 12648348SEric.Yu@Sun.COM /* 12658348SEric.Yu@Sun.COM * set the offset where the urgent byte is 12668348SEric.Yu@Sun.COM */ 12678348SEric.Yu@Sun.COM so->so_oobmark = so->so_rcv_queued + offset; 12688348SEric.Yu@Sun.COM if (so->so_oobmark == 0) 12698348SEric.Yu@Sun.COM so->so_state |= SS_RCVATMARK; 12708348SEric.Yu@Sun.COM else 12718348SEric.Yu@Sun.COM so->so_state &= ~SS_RCVATMARK; 12728348SEric.Yu@Sun.COM 12738348SEric.Yu@Sun.COM so_notify_oobsig(so); 12748348SEric.Yu@Sun.COM } 12758348SEric.Yu@Sun.COM 12768348SEric.Yu@Sun.COM /* 12778348SEric.Yu@Sun.COM * Queue the OOB byte 12788348SEric.Yu@Sun.COM */ 12798348SEric.Yu@Sun.COM static void 12808348SEric.Yu@Sun.COM so_queue_oob(sock_upper_handle_t sock_handle, mblk_t *mp, size_t len) 
12818348SEric.Yu@Sun.COM { 12828348SEric.Yu@Sun.COM struct sonode *so; 12838348SEric.Yu@Sun.COM 12848348SEric.Yu@Sun.COM so = (struct sonode *)sock_handle; 12858348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 12868348SEric.Yu@Sun.COM SOD_UIOAFINI(so->so_direct); 12878348SEric.Yu@Sun.COM 12888348SEric.Yu@Sun.COM ASSERT(mp != NULL); 12898348SEric.Yu@Sun.COM if (!IS_SO_OOB_INLINE(so)) { 12908348SEric.Yu@Sun.COM so->so_oobmsg = mp; 12918348SEric.Yu@Sun.COM so->so_state |= SS_HAVEOOBDATA; 12928348SEric.Yu@Sun.COM } else { 12938348SEric.Yu@Sun.COM so_enqueue_msg(so, mp, len); 12948348SEric.Yu@Sun.COM } 12958348SEric.Yu@Sun.COM 12968348SEric.Yu@Sun.COM so_notify_oobdata(so, IS_SO_OOB_INLINE(so)); 12978348SEric.Yu@Sun.COM } 12988348SEric.Yu@Sun.COM 12998348SEric.Yu@Sun.COM int 13008348SEric.Yu@Sun.COM so_close(struct sonode *so, int flag, struct cred *cr) 13018348SEric.Yu@Sun.COM { 13028348SEric.Yu@Sun.COM int error; 13038348SEric.Yu@Sun.COM 13048348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_close)(so->so_proto_handle, flag, cr); 13058348SEric.Yu@Sun.COM 13068348SEric.Yu@Sun.COM /* 13078348SEric.Yu@Sun.COM * At this point there will be no more upcalls from the protocol 13088348SEric.Yu@Sun.COM */ 13098348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 13108399SRao.Shoaib@Sun.COM 13118399SRao.Shoaib@Sun.COM ASSERT(so_verify_oobstate(so)); 13128399SRao.Shoaib@Sun.COM 13138348SEric.Yu@Sun.COM so_rcv_flush(so); 13148348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 13158348SEric.Yu@Sun.COM 13168348SEric.Yu@Sun.COM return (error); 13178348SEric.Yu@Sun.COM } 13188348SEric.Yu@Sun.COM 13198348SEric.Yu@Sun.COM void 13208348SEric.Yu@Sun.COM so_zcopy_notify(sock_upper_handle_t sock_handle) 13218348SEric.Yu@Sun.COM { 13228348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)sock_handle; 13238348SEric.Yu@Sun.COM 13248348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 13258348SEric.Yu@Sun.COM so->so_copyflag |= STZCNOTIFY; 13268348SEric.Yu@Sun.COM cv_broadcast(&so->so_copy_cv); 
13278348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 13288348SEric.Yu@Sun.COM } 13298348SEric.Yu@Sun.COM 13308348SEric.Yu@Sun.COM void 13318348SEric.Yu@Sun.COM so_set_error(sock_upper_handle_t sock_handle, int error) 13328348SEric.Yu@Sun.COM { 13338348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)sock_handle; 13348348SEric.Yu@Sun.COM 13358348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 13368348SEric.Yu@Sun.COM 13378348SEric.Yu@Sun.COM soseterror(so, error); 13388348SEric.Yu@Sun.COM 13398348SEric.Yu@Sun.COM so_notify_error(so); 13408348SEric.Yu@Sun.COM } 13418348SEric.Yu@Sun.COM 13428348SEric.Yu@Sun.COM /* 13438348SEric.Yu@Sun.COM * so_recvmsg - read data from the socket 13448348SEric.Yu@Sun.COM * 13458348SEric.Yu@Sun.COM * There are two ways of obtaining data; either we ask the protocol to 13468348SEric.Yu@Sun.COM * copy directly into the supplied buffer, or we copy data from the 13478348SEric.Yu@Sun.COM * sonode's receive queue. The decision which one to use depends on 13488348SEric.Yu@Sun.COM * whether the protocol has a sd_recv_uio down call. 
13498348SEric.Yu@Sun.COM */ 13508348SEric.Yu@Sun.COM int 13518348SEric.Yu@Sun.COM so_recvmsg(struct sonode *so, struct nmsghdr *msg, struct uio *uiop, 13528348SEric.Yu@Sun.COM struct cred *cr) 13538348SEric.Yu@Sun.COM { 13548348SEric.Yu@Sun.COM rval_t rval; 13558348SEric.Yu@Sun.COM int flags = 0; 13568348SEric.Yu@Sun.COM t_uscalar_t controllen, namelen; 13578348SEric.Yu@Sun.COM int error = 0; 13588348SEric.Yu@Sun.COM int ret; 13598348SEric.Yu@Sun.COM mblk_t *mctlp = NULL; 13608348SEric.Yu@Sun.COM union T_primitives *tpr; 13618348SEric.Yu@Sun.COM void *control; 13628348SEric.Yu@Sun.COM ssize_t saved_resid; 13638348SEric.Yu@Sun.COM struct uio *suiop; 13648348SEric.Yu@Sun.COM 13658348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_RECVMSG(so, msg, uiop, cr)); 13668348SEric.Yu@Sun.COM 13678348SEric.Yu@Sun.COM if ((so->so_state & (SS_ISCONNECTED|SS_CANTRCVMORE)) == 0 && 13688348SEric.Yu@Sun.COM (so->so_mode & SM_CONNREQUIRED)) { 13698348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 13708348SEric.Yu@Sun.COM return (ENOTCONN); 13718348SEric.Yu@Sun.COM } 13728348SEric.Yu@Sun.COM 13738348SEric.Yu@Sun.COM if (msg->msg_flags & MSG_PEEK) 13748348SEric.Yu@Sun.COM msg->msg_flags &= ~MSG_WAITALL; 13758348SEric.Yu@Sun.COM 13768348SEric.Yu@Sun.COM if (so->so_mode & SM_ATOMIC) 13778348SEric.Yu@Sun.COM msg->msg_flags |= MSG_TRUNC; 13788348SEric.Yu@Sun.COM 13798348SEric.Yu@Sun.COM if (msg->msg_flags & MSG_OOB) { 13808348SEric.Yu@Sun.COM if ((so->so_mode & SM_EXDATA) == 0) { 13818348SEric.Yu@Sun.COM error = EOPNOTSUPP; 13828348SEric.Yu@Sun.COM } else if (so->so_downcalls->sd_recv_uio != NULL) { 13838348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_recv_uio) 13848348SEric.Yu@Sun.COM (so->so_proto_handle, uiop, msg, cr); 13858348SEric.Yu@Sun.COM } else { 13868348SEric.Yu@Sun.COM error = sorecvoob(so, msg, uiop, msg->msg_flags, 13878348SEric.Yu@Sun.COM IS_SO_OOB_INLINE(so)); 13888348SEric.Yu@Sun.COM } 13898348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 13908348SEric.Yu@Sun.COM return (error); 
13918348SEric.Yu@Sun.COM } 13928348SEric.Yu@Sun.COM 13938348SEric.Yu@Sun.COM /* 13948348SEric.Yu@Sun.COM * If the protocol has the recv down call, then pass the request 13958348SEric.Yu@Sun.COM * down. 13968348SEric.Yu@Sun.COM */ 13978348SEric.Yu@Sun.COM if (so->so_downcalls->sd_recv_uio != NULL) { 13988348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_recv_uio) 13998348SEric.Yu@Sun.COM (so->so_proto_handle, uiop, msg, cr); 14008348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 14018348SEric.Yu@Sun.COM return (error); 14028348SEric.Yu@Sun.COM } 14038348SEric.Yu@Sun.COM 14048348SEric.Yu@Sun.COM /* 14058348SEric.Yu@Sun.COM * Reading data from the socket buffer 14068348SEric.Yu@Sun.COM */ 14078348SEric.Yu@Sun.COM flags = msg->msg_flags; 14088348SEric.Yu@Sun.COM msg->msg_flags = 0; 14098348SEric.Yu@Sun.COM 14108348SEric.Yu@Sun.COM /* 14118348SEric.Yu@Sun.COM * Set msg_controllen and msg_namelen to zero here to make it 14128348SEric.Yu@Sun.COM * simpler in the cases that no control or name is returned. 14138348SEric.Yu@Sun.COM */ 14148348SEric.Yu@Sun.COM controllen = msg->msg_controllen; 14158348SEric.Yu@Sun.COM namelen = msg->msg_namelen; 14168348SEric.Yu@Sun.COM msg->msg_controllen = 0; 14178348SEric.Yu@Sun.COM msg->msg_namelen = 0; 14188348SEric.Yu@Sun.COM 14198348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 14208348SEric.Yu@Sun.COM /* Set SOREADLOCKED */ 14218348SEric.Yu@Sun.COM error = so_lock_read_intr(so, 14228348SEric.Yu@Sun.COM uiop->uio_fmode | ((flags & MSG_DONTWAIT) ? 
FNONBLOCK : 0)); 14238348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 14248348SEric.Yu@Sun.COM if (error) { 14258348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 14268348SEric.Yu@Sun.COM return (error); 14278348SEric.Yu@Sun.COM } 14288348SEric.Yu@Sun.COM 14298348SEric.Yu@Sun.COM suiop = sod_rcv_init(so, flags, &uiop); 14308348SEric.Yu@Sun.COM retry: 14318348SEric.Yu@Sun.COM saved_resid = uiop->uio_resid; 14328348SEric.Yu@Sun.COM error = so_dequeue_msg(so, &mctlp, uiop, &rval, flags); 14338348SEric.Yu@Sun.COM if (error != 0) { 14348348SEric.Yu@Sun.COM goto out; 14358348SEric.Yu@Sun.COM } 14368348SEric.Yu@Sun.COM /* 14378348SEric.Yu@Sun.COM * For datagrams the MOREDATA flag is used to set MSG_TRUNC. 14388348SEric.Yu@Sun.COM * For non-datagrams MOREDATA is used to set MSG_EOR. 14398348SEric.Yu@Sun.COM */ 14408348SEric.Yu@Sun.COM ASSERT(!(rval.r_val1 & MORECTL)); 14418348SEric.Yu@Sun.COM if ((rval.r_val1 & MOREDATA) && (so->so_mode & SM_ATOMIC)) 14428348SEric.Yu@Sun.COM msg->msg_flags |= MSG_TRUNC; 14438348SEric.Yu@Sun.COM if (mctlp == NULL) { 14448348SEric.Yu@Sun.COM dprintso(so, 1, ("so_recvmsg: got M_DATA\n")); 14458348SEric.Yu@Sun.COM 14468348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 14478348SEric.Yu@Sun.COM /* Set MSG_EOR based on MOREDATA */ 14488348SEric.Yu@Sun.COM if (!(rval.r_val1 & MOREDATA)) { 14498348SEric.Yu@Sun.COM if (so->so_state & SS_SAVEDEOR) { 14508348SEric.Yu@Sun.COM msg->msg_flags |= MSG_EOR; 14518348SEric.Yu@Sun.COM so->so_state &= ~SS_SAVEDEOR; 14528348SEric.Yu@Sun.COM } 14538348SEric.Yu@Sun.COM } 14548348SEric.Yu@Sun.COM /* 14558348SEric.Yu@Sun.COM * If some data was received (i.e. not EOF) and the 14568348SEric.Yu@Sun.COM * read/recv* has not been satisfied wait for some more. 
14578348SEric.Yu@Sun.COM */ 14588348SEric.Yu@Sun.COM if ((flags & MSG_WAITALL) && !(msg->msg_flags & MSG_EOR) && 14598348SEric.Yu@Sun.COM uiop->uio_resid != saved_resid && uiop->uio_resid > 0) { 14608348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 14618348SEric.Yu@Sun.COM goto retry; 14628348SEric.Yu@Sun.COM } 14638348SEric.Yu@Sun.COM 14648348SEric.Yu@Sun.COM goto out_locked; 14658348SEric.Yu@Sun.COM } 14668348SEric.Yu@Sun.COM /* strsock_proto has already verified length and alignment */ 14678348SEric.Yu@Sun.COM tpr = (union T_primitives *)mctlp->b_rptr; 14688348SEric.Yu@Sun.COM dprintso(so, 1, ("so_recvmsg: type %d\n", tpr->type)); 14698348SEric.Yu@Sun.COM switch (tpr->type) { 14708348SEric.Yu@Sun.COM case T_DATA_IND: { 14718348SEric.Yu@Sun.COM /* 14728348SEric.Yu@Sun.COM * Set msg_flags to MSG_EOR based on 14738348SEric.Yu@Sun.COM * MORE_flag and MOREDATA. 14748348SEric.Yu@Sun.COM */ 14758348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 14768348SEric.Yu@Sun.COM so->so_state &= ~SS_SAVEDEOR; 14778348SEric.Yu@Sun.COM if (!(tpr->data_ind.MORE_flag & 1)) { 14788348SEric.Yu@Sun.COM if (!(rval.r_val1 & MOREDATA)) 14798348SEric.Yu@Sun.COM msg->msg_flags |= MSG_EOR; 14808348SEric.Yu@Sun.COM else 14818348SEric.Yu@Sun.COM so->so_state |= SS_SAVEDEOR; 14828348SEric.Yu@Sun.COM } 14838348SEric.Yu@Sun.COM freemsg(mctlp); 14848348SEric.Yu@Sun.COM /* 14858348SEric.Yu@Sun.COM * If some data was received (i.e. not EOF) and the 14868348SEric.Yu@Sun.COM * read/recv* has not been satisfied wait for some more. 
14878348SEric.Yu@Sun.COM */ 14888348SEric.Yu@Sun.COM if ((flags & MSG_WAITALL) && !(msg->msg_flags & MSG_EOR) && 14898348SEric.Yu@Sun.COM uiop->uio_resid != saved_resid && uiop->uio_resid > 0) { 14908348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 14918348SEric.Yu@Sun.COM goto retry; 14928348SEric.Yu@Sun.COM } 14938348SEric.Yu@Sun.COM goto out_locked; 14948348SEric.Yu@Sun.COM } 14958348SEric.Yu@Sun.COM case T_UNITDATA_IND: { 14968348SEric.Yu@Sun.COM void *addr; 14978348SEric.Yu@Sun.COM t_uscalar_t addrlen; 14988348SEric.Yu@Sun.COM void *abuf; 14998348SEric.Yu@Sun.COM t_uscalar_t optlen; 15008348SEric.Yu@Sun.COM void *opt; 15018348SEric.Yu@Sun.COM 15028348SEric.Yu@Sun.COM if (namelen != 0) { 15038348SEric.Yu@Sun.COM /* Caller wants source address */ 15048348SEric.Yu@Sun.COM addrlen = tpr->unitdata_ind.SRC_length; 15058348SEric.Yu@Sun.COM addr = sogetoff(mctlp, tpr->unitdata_ind.SRC_offset, 15068348SEric.Yu@Sun.COM addrlen, 1); 15078348SEric.Yu@Sun.COM if (addr == NULL) { 15088348SEric.Yu@Sun.COM freemsg(mctlp); 15098348SEric.Yu@Sun.COM error = EPROTO; 15108348SEric.Yu@Sun.COM eprintsoline(so, error); 15118348SEric.Yu@Sun.COM goto out; 15128348SEric.Yu@Sun.COM } 15138348SEric.Yu@Sun.COM ASSERT(so->so_family != AF_UNIX); 15148348SEric.Yu@Sun.COM } 15158348SEric.Yu@Sun.COM optlen = tpr->unitdata_ind.OPT_length; 15168348SEric.Yu@Sun.COM if (optlen != 0) { 15178348SEric.Yu@Sun.COM t_uscalar_t ncontrollen; 15188348SEric.Yu@Sun.COM 15198348SEric.Yu@Sun.COM /* 15208348SEric.Yu@Sun.COM * Extract any source address option. 15218348SEric.Yu@Sun.COM * Determine how large cmsg buffer is needed. 
15228348SEric.Yu@Sun.COM */ 15238348SEric.Yu@Sun.COM opt = sogetoff(mctlp, tpr->unitdata_ind.OPT_offset, 15248348SEric.Yu@Sun.COM optlen, __TPI_ALIGN_SIZE); 15258348SEric.Yu@Sun.COM 15268348SEric.Yu@Sun.COM if (opt == NULL) { 15278348SEric.Yu@Sun.COM freemsg(mctlp); 15288348SEric.Yu@Sun.COM error = EPROTO; 15298348SEric.Yu@Sun.COM eprintsoline(so, error); 15308348SEric.Yu@Sun.COM goto out; 15318348SEric.Yu@Sun.COM } 15328348SEric.Yu@Sun.COM if (so->so_family == AF_UNIX) 15338348SEric.Yu@Sun.COM so_getopt_srcaddr(opt, optlen, &addr, &addrlen); 15348348SEric.Yu@Sun.COM ncontrollen = so_cmsglen(mctlp, opt, optlen, 15358348SEric.Yu@Sun.COM !(flags & MSG_XPG4_2)); 15368348SEric.Yu@Sun.COM if (controllen != 0) 15378348SEric.Yu@Sun.COM controllen = ncontrollen; 15388348SEric.Yu@Sun.COM else if (ncontrollen != 0) 15398348SEric.Yu@Sun.COM msg->msg_flags |= MSG_CTRUNC; 15408348SEric.Yu@Sun.COM } else { 15418348SEric.Yu@Sun.COM controllen = 0; 15428348SEric.Yu@Sun.COM } 15438348SEric.Yu@Sun.COM 15448348SEric.Yu@Sun.COM if (namelen != 0) { 15458348SEric.Yu@Sun.COM /* 15468348SEric.Yu@Sun.COM * Return address to caller. 15478348SEric.Yu@Sun.COM * Caller handles truncation if length 15488348SEric.Yu@Sun.COM * exceeds msg_namelen. 15498348SEric.Yu@Sun.COM * NOTE: AF_UNIX NUL termination is ensured by 15508348SEric.Yu@Sun.COM * the sender's copyin_name(). 15518348SEric.Yu@Sun.COM */ 15528348SEric.Yu@Sun.COM abuf = kmem_alloc(addrlen, KM_SLEEP); 15538348SEric.Yu@Sun.COM 15548348SEric.Yu@Sun.COM bcopy(addr, abuf, addrlen); 15558348SEric.Yu@Sun.COM msg->msg_name = abuf; 15568348SEric.Yu@Sun.COM msg->msg_namelen = addrlen; 15578348SEric.Yu@Sun.COM } 15588348SEric.Yu@Sun.COM 15598348SEric.Yu@Sun.COM if (controllen != 0) { 15608348SEric.Yu@Sun.COM /* 15618348SEric.Yu@Sun.COM * Return control msg to caller. 15628348SEric.Yu@Sun.COM * Caller handles truncation if length 15638348SEric.Yu@Sun.COM * exceeds msg_controllen. 
15648348SEric.Yu@Sun.COM */ 15658348SEric.Yu@Sun.COM control = kmem_zalloc(controllen, KM_SLEEP); 15668348SEric.Yu@Sun.COM 15678348SEric.Yu@Sun.COM error = so_opt2cmsg(mctlp, opt, optlen, 15688348SEric.Yu@Sun.COM !(flags & MSG_XPG4_2), control, controllen); 15698348SEric.Yu@Sun.COM if (error) { 15708348SEric.Yu@Sun.COM freemsg(mctlp); 15718348SEric.Yu@Sun.COM if (msg->msg_namelen != 0) 15728348SEric.Yu@Sun.COM kmem_free(msg->msg_name, 15738348SEric.Yu@Sun.COM msg->msg_namelen); 15748348SEric.Yu@Sun.COM kmem_free(control, controllen); 15758348SEric.Yu@Sun.COM eprintsoline(so, error); 15768348SEric.Yu@Sun.COM goto out; 15778348SEric.Yu@Sun.COM } 15788348SEric.Yu@Sun.COM msg->msg_control = control; 15798348SEric.Yu@Sun.COM msg->msg_controllen = controllen; 15808348SEric.Yu@Sun.COM } 15818348SEric.Yu@Sun.COM 15828348SEric.Yu@Sun.COM freemsg(mctlp); 15838348SEric.Yu@Sun.COM goto out; 15848348SEric.Yu@Sun.COM } 15858348SEric.Yu@Sun.COM case T_OPTDATA_IND: { 15868348SEric.Yu@Sun.COM struct T_optdata_req *tdr; 15878348SEric.Yu@Sun.COM void *opt; 15888348SEric.Yu@Sun.COM t_uscalar_t optlen; 15898348SEric.Yu@Sun.COM 15908348SEric.Yu@Sun.COM tdr = (struct T_optdata_req *)mctlp->b_rptr; 15918348SEric.Yu@Sun.COM optlen = tdr->OPT_length; 15928348SEric.Yu@Sun.COM if (optlen != 0) { 15938348SEric.Yu@Sun.COM t_uscalar_t ncontrollen; 15948348SEric.Yu@Sun.COM /* 15958348SEric.Yu@Sun.COM * Determine how large cmsg buffer is needed. 
15968348SEric.Yu@Sun.COM */ 15978348SEric.Yu@Sun.COM opt = sogetoff(mctlp, 15988348SEric.Yu@Sun.COM tpr->optdata_ind.OPT_offset, optlen, 15998348SEric.Yu@Sun.COM __TPI_ALIGN_SIZE); 16008348SEric.Yu@Sun.COM 16018348SEric.Yu@Sun.COM if (opt == NULL) { 16028348SEric.Yu@Sun.COM freemsg(mctlp); 16038348SEric.Yu@Sun.COM error = EPROTO; 16048348SEric.Yu@Sun.COM eprintsoline(so, error); 16058348SEric.Yu@Sun.COM goto out; 16068348SEric.Yu@Sun.COM } 16078348SEric.Yu@Sun.COM 16088348SEric.Yu@Sun.COM ncontrollen = so_cmsglen(mctlp, opt, optlen, 16098348SEric.Yu@Sun.COM !(flags & MSG_XPG4_2)); 16108348SEric.Yu@Sun.COM if (controllen != 0) 16118348SEric.Yu@Sun.COM controllen = ncontrollen; 16128348SEric.Yu@Sun.COM else if (ncontrollen != 0) 16138348SEric.Yu@Sun.COM msg->msg_flags |= MSG_CTRUNC; 16148348SEric.Yu@Sun.COM } else { 16158348SEric.Yu@Sun.COM controllen = 0; 16168348SEric.Yu@Sun.COM } 16178348SEric.Yu@Sun.COM 16188348SEric.Yu@Sun.COM if (controllen != 0) { 16198348SEric.Yu@Sun.COM /* 16208348SEric.Yu@Sun.COM * Return control msg to caller. 16218348SEric.Yu@Sun.COM * Caller handles truncation if length 16228348SEric.Yu@Sun.COM * exceeds msg_controllen. 16238348SEric.Yu@Sun.COM */ 16248348SEric.Yu@Sun.COM control = kmem_zalloc(controllen, KM_SLEEP); 16258348SEric.Yu@Sun.COM 16268348SEric.Yu@Sun.COM error = so_opt2cmsg(mctlp, opt, optlen, 16278348SEric.Yu@Sun.COM !(flags & MSG_XPG4_2), control, controllen); 16288348SEric.Yu@Sun.COM if (error) { 16298348SEric.Yu@Sun.COM freemsg(mctlp); 16308348SEric.Yu@Sun.COM kmem_free(control, controllen); 16318348SEric.Yu@Sun.COM eprintsoline(so, error); 16328348SEric.Yu@Sun.COM goto out; 16338348SEric.Yu@Sun.COM } 16348348SEric.Yu@Sun.COM msg->msg_control = control; 16358348SEric.Yu@Sun.COM msg->msg_controllen = controllen; 16368348SEric.Yu@Sun.COM } 16378348SEric.Yu@Sun.COM 16388348SEric.Yu@Sun.COM /* 16398348SEric.Yu@Sun.COM * Set msg_flags to MSG_EOR based on 16408348SEric.Yu@Sun.COM * DATA_flag and MOREDATA. 
16418348SEric.Yu@Sun.COM */ 16428348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 16438348SEric.Yu@Sun.COM so->so_state &= ~SS_SAVEDEOR; 16448348SEric.Yu@Sun.COM if (!(tpr->data_ind.MORE_flag & 1)) { 16458348SEric.Yu@Sun.COM if (!(rval.r_val1 & MOREDATA)) 16468348SEric.Yu@Sun.COM msg->msg_flags |= MSG_EOR; 16478348SEric.Yu@Sun.COM else 16488348SEric.Yu@Sun.COM so->so_state |= SS_SAVEDEOR; 16498348SEric.Yu@Sun.COM } 16508348SEric.Yu@Sun.COM freemsg(mctlp); 16518348SEric.Yu@Sun.COM /* 16528348SEric.Yu@Sun.COM * If some data was received (i.e. not EOF) and the 16538348SEric.Yu@Sun.COM * read/recv* has not been satisfied wait for some more. 16548348SEric.Yu@Sun.COM * Not possible to wait if control info was received. 16558348SEric.Yu@Sun.COM */ 16568348SEric.Yu@Sun.COM if ((flags & MSG_WAITALL) && !(msg->msg_flags & MSG_EOR) && 16578348SEric.Yu@Sun.COM controllen == 0 && 16588348SEric.Yu@Sun.COM uiop->uio_resid != saved_resid && uiop->uio_resid > 0) { 16598348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 16608348SEric.Yu@Sun.COM goto retry; 16618348SEric.Yu@Sun.COM } 16628348SEric.Yu@Sun.COM goto out_locked; 16638348SEric.Yu@Sun.COM } 16648348SEric.Yu@Sun.COM default: 16658348SEric.Yu@Sun.COM cmn_err(CE_CONT, "so_recvmsg bad type %x \n", 16668348SEric.Yu@Sun.COM tpr->type); 16678348SEric.Yu@Sun.COM freemsg(mctlp); 16688348SEric.Yu@Sun.COM error = EPROTO; 16698348SEric.Yu@Sun.COM ASSERT(0); 16708348SEric.Yu@Sun.COM } 16718348SEric.Yu@Sun.COM out: 16728348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 16738348SEric.Yu@Sun.COM out_locked: 16748348SEric.Yu@Sun.COM /* The sod_lockp pointers to the sonode so_lock */ 16758348SEric.Yu@Sun.COM ret = sod_rcv_done(so, suiop, uiop); 16768348SEric.Yu@Sun.COM if (ret != 0 && error == 0) 16778348SEric.Yu@Sun.COM error = ret; 16788348SEric.Yu@Sun.COM 16798348SEric.Yu@Sun.COM so_unlock_read(so); /* Clear SOREADLOCKED */ 16808348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 16818348SEric.Yu@Sun.COM 16828348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 
16838348SEric.Yu@Sun.COM
16848348SEric.Yu@Sun.COM return (error);
16858348SEric.Yu@Sun.COM }
16868348SEric.Yu@Sun.COM
/*
 * so_sonodeops: table of so_* entry points, typed sonodeops_t.
 *
 * The initializer is positional, so the order of the entries below must
 * match the member order of sonodeops_t, which is declared outside this
 * section. The trailing comment on each entry names the slot that entry
 * is intended to fill.
 */
16878348SEric.Yu@Sun.COM sonodeops_t so_sonodeops = {
16888348SEric.Yu@Sun.COM so_init, /* sop_init */
16898348SEric.Yu@Sun.COM so_accept, /* sop_accept */
16908348SEric.Yu@Sun.COM so_bind, /* sop_bind */
16918348SEric.Yu@Sun.COM so_listen, /* sop_listen */
16928348SEric.Yu@Sun.COM so_connect, /* sop_connect */
16938348SEric.Yu@Sun.COM so_recvmsg, /* sop_recvmsg */
16948348SEric.Yu@Sun.COM so_sendmsg, /* sop_sendmsg */
16958348SEric.Yu@Sun.COM so_sendmblk, /* sop_sendmblk */
16968348SEric.Yu@Sun.COM so_getpeername, /* sop_getpeername */
16978348SEric.Yu@Sun.COM so_getsockname, /* sop_getsockname */
16988348SEric.Yu@Sun.COM so_shutdown, /* sop_shutdown */
16998348SEric.Yu@Sun.COM so_getsockopt, /* sop_getsockopt */
17008348SEric.Yu@Sun.COM so_setsockopt, /* sop_setsockopt */
17018348SEric.Yu@Sun.COM so_ioctl, /* sop_ioctl */
17028348SEric.Yu@Sun.COM so_poll, /* sop_poll */
17038348SEric.Yu@Sun.COM so_close, /* sop_close */
17048348SEric.Yu@Sun.COM };
17058348SEric.Yu@Sun.COM
/*
 * so_upcalls: table of so_* callbacks, typed sock_upcalls_t.
 *
 * Like so_sonodeops this is a positional initializer, so entry order must
 * match the member order of sock_upcalls_t. The member names are not
 * visible in this section, which is why the entries carry no slot labels.
 * NOTE(review): sock_upcalls_t is presumably declared in
 * <sys/socket_proto.h> (included at the top of this file) -- confirm, and
 * label each entry with its member name once verified.
 */
17068348SEric.Yu@Sun.COM sock_upcalls_t so_upcalls = {
17078348SEric.Yu@Sun.COM so_newconn,
17088348SEric.Yu@Sun.COM so_connected,
17098348SEric.Yu@Sun.COM so_disconnected,
17108348SEric.Yu@Sun.COM so_opctl,
17118348SEric.Yu@Sun.COM so_queue_msg,
17128348SEric.Yu@Sun.COM so_set_prop,
17138348SEric.Yu@Sun.COM so_txq_full,
17148348SEric.Yu@Sun.COM so_signal_oob,
17158348SEric.Yu@Sun.COM so_zcopy_notify,
17168348SEric.Yu@Sun.COM so_set_error
17178348SEric.Yu@Sun.COM };
1718