18348SEric.Yu@Sun.COM /* 28348SEric.Yu@Sun.COM * CDDL HEADER START 38348SEric.Yu@Sun.COM * 48348SEric.Yu@Sun.COM * The contents of this file are subject to the terms of the 58348SEric.Yu@Sun.COM * Common Development and Distribution License (the "License"). 68348SEric.Yu@Sun.COM * You may not use this file except in compliance with the License. 78348SEric.Yu@Sun.COM * 88348SEric.Yu@Sun.COM * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 98348SEric.Yu@Sun.COM * or http://www.opensolaris.org/os/licensing. 108348SEric.Yu@Sun.COM * See the License for the specific language governing permissions 118348SEric.Yu@Sun.COM * and limitations under the License. 128348SEric.Yu@Sun.COM * 138348SEric.Yu@Sun.COM * When distributing Covered Code, include this CDDL HEADER in each 148348SEric.Yu@Sun.COM * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 158348SEric.Yu@Sun.COM * If applicable, add the following below this CDDL HEADER, with the 168348SEric.Yu@Sun.COM * fields enclosed by brackets "[]" replaced with your own identifying 178348SEric.Yu@Sun.COM * information: Portions Copyright [yyyy] [name of copyright owner] 188348SEric.Yu@Sun.COM * 198348SEric.Yu@Sun.COM * CDDL HEADER END 208348SEric.Yu@Sun.COM */ 218348SEric.Yu@Sun.COM 228348SEric.Yu@Sun.COM /* 238489Sshenjian * Copyright 2009 Sun Microsystems, Inc. All rights reserved. 248348SEric.Yu@Sun.COM * Use is subject to license terms. 258348SEric.Yu@Sun.COM */ 268348SEric.Yu@Sun.COM 278348SEric.Yu@Sun.COM #pragma ident "@(#)sockcommon_sops.c 1.1 07/06/14 SMI" 288348SEric.Yu@Sun.COM 298348SEric.Yu@Sun.COM #include <sys/types.h> 308348SEric.Yu@Sun.COM #include <sys/param.h> 318348SEric.Yu@Sun.COM #include <sys/systm.h> 328348SEric.Yu@Sun.COM #include <sys/sysmacros.h> 338348SEric.Yu@Sun.COM #include <sys/debug.h> 348348SEric.Yu@Sun.COM #include <sys/cmn_err.h> 358348SEric.Yu@Sun.COM 368348SEric.Yu@Sun.COM #include <sys/stropts.h> 378348SEric.Yu@Sun.COM #include <sys/socket.h> 388348SEric.Yu@Sun.COM #include <sys/socketvar.h> 398348SEric.Yu@Sun.COM 408348SEric.Yu@Sun.COM #define _SUN_TPI_VERSION 2 418348SEric.Yu@Sun.COM #include <sys/tihdr.h> 428348SEric.Yu@Sun.COM #include <sys/sockio.h> 438348SEric.Yu@Sun.COM #include <sys/sodirect.h> 448348SEric.Yu@Sun.COM #include <sys/kmem_impl.h> 458348SEric.Yu@Sun.COM 468348SEric.Yu@Sun.COM #include <sys/strsubr.h> 478348SEric.Yu@Sun.COM #include <sys/strsun.h> 488348SEric.Yu@Sun.COM #include <sys/ddi.h> 498348SEric.Yu@Sun.COM #include <netinet/in.h> 508348SEric.Yu@Sun.COM #include <inet/ip.h> 518348SEric.Yu@Sun.COM 528348SEric.Yu@Sun.COM #include <fs/sockfs/sockcommon.h> 538348SEric.Yu@Sun.COM 548348SEric.Yu@Sun.COM #include <sys/socket_proto.h> 558348SEric.Yu@Sun.COM 568348SEric.Yu@Sun.COM #include <fs/sockfs/socktpi_impl.h> 578348SEric.Yu@Sun.COM #include <sys/tihdr.h> 588348SEric.Yu@Sun.COM #include <fs/sockfs/nl7c.h> 598348SEric.Yu@Sun.COM #include <inet/kssl/ksslapi.h> 608348SEric.Yu@Sun.COM 618348SEric.Yu@Sun.COM 628348SEric.Yu@Sun.COM extern int xnet_skip_checks; 638348SEric.Yu@Sun.COM extern int xnet_check_print; 648348SEric.Yu@Sun.COM 658348SEric.Yu@Sun.COM static void so_queue_oob(sock_upper_handle_t, mblk_t *, size_t); 668348SEric.Yu@Sun.COM 678348SEric.Yu@Sun.COM 688348SEric.Yu@Sun.COM /*ARGSUSED*/ 698348SEric.Yu@Sun.COM int 708348SEric.Yu@Sun.COM so_accept_notsupp(struct sonode *lso, int fflag, 718348SEric.Yu@Sun.COM struct cred *cr, struct sonode **nsop) 728348SEric.Yu@Sun.COM { 738348SEric.Yu@Sun.COM return (EOPNOTSUPP); 748348SEric.Yu@Sun.COM } 758348SEric.Yu@Sun.COM 768348SEric.Yu@Sun.COM /*ARGSUSED*/ 778348SEric.Yu@Sun.COM int 788348SEric.Yu@Sun.COM so_listen_notsupp(struct sonode *so, int backlog, struct cred *cr) 798348SEric.Yu@Sun.COM { 808348SEric.Yu@Sun.COM return (EOPNOTSUPP); 818348SEric.Yu@Sun.COM } 828348SEric.Yu@Sun.COM 838348SEric.Yu@Sun.COM /*ARGSUSED*/ 848348SEric.Yu@Sun.COM int 858348SEric.Yu@Sun.COM so_getsockname_notsupp(struct sonode *so, struct sockaddr *sa, 868348SEric.Yu@Sun.COM socklen_t *len, struct cred *cr) 878348SEric.Yu@Sun.COM { 888348SEric.Yu@Sun.COM return (EOPNOTSUPP); 898348SEric.Yu@Sun.COM } 908348SEric.Yu@Sun.COM 918348SEric.Yu@Sun.COM /*ARGSUSED*/ 928348SEric.Yu@Sun.COM int 938348SEric.Yu@Sun.COM so_getpeername_notsupp(struct sonode *so, struct sockaddr *addr, 948348SEric.Yu@Sun.COM socklen_t *addrlen, boolean_t accept, struct cred *cr) 958348SEric.Yu@Sun.COM { 968348SEric.Yu@Sun.COM return (EOPNOTSUPP); 978348SEric.Yu@Sun.COM } 988348SEric.Yu@Sun.COM 998348SEric.Yu@Sun.COM /*ARGSUSED*/ 1008348SEric.Yu@Sun.COM int 1018348SEric.Yu@Sun.COM so_shutdown_notsupp(struct sonode *so, int how, struct cred *cr) 1028348SEric.Yu@Sun.COM { 1038348SEric.Yu@Sun.COM return (EOPNOTSUPP); 1048348SEric.Yu@Sun.COM } 1058348SEric.Yu@Sun.COM 1068348SEric.Yu@Sun.COM /*ARGSUSED*/ 1078348SEric.Yu@Sun.COM int 1088348SEric.Yu@Sun.COM so_sendmblk_notsupp(struct sonode *so, struct msghdr *msg, int fflag, 1098348SEric.Yu@Sun.COM struct cred *cr, mblk_t **mpp) 1108348SEric.Yu@Sun.COM { 1118348SEric.Yu@Sun.COM return (EOPNOTSUPP); 1128348SEric.Yu@Sun.COM } 1138348SEric.Yu@Sun.COM 1148348SEric.Yu@Sun.COM /* 1158348SEric.Yu@Sun.COM * Generic Socket Ops 1168348SEric.Yu@Sun.COM */ 1178348SEric.Yu@Sun.COM 1188348SEric.Yu@Sun.COM /* ARGSUSED */ 1198348SEric.Yu@Sun.COM int 1208348SEric.Yu@Sun.COM so_init(struct sonode *so, struct sonode *pso, struct cred *cr, int flags) 1218348SEric.Yu@Sun.COM { 1228348SEric.Yu@Sun.COM return (socket_init_common(so, pso, flags, cr)); 1238348SEric.Yu@Sun.COM } 1248348SEric.Yu@Sun.COM 1258348SEric.Yu@Sun.COM int 1268348SEric.Yu@Sun.COM so_bind(struct sonode *so, struct sockaddr *name, socklen_t namelen, 1278348SEric.Yu@Sun.COM int flags, struct cred *cr) 1288348SEric.Yu@Sun.COM { 1298348SEric.Yu@Sun.COM int error; 1308348SEric.Yu@Sun.COM 1318348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_BIND(so, name, namelen, flags, cr)); 1328348SEric.Yu@Sun.COM 1338348SEric.Yu@Sun.COM ASSERT(flags == _SOBIND_XPG4_2 || flags == _SOBIND_SOCKBSD); 1348348SEric.Yu@Sun.COM 1358348SEric.Yu@Sun.COM /* X/Open requires this check */ 1368348SEric.Yu@Sun.COM if ((so->so_state & SS_CANTSENDMORE) && !xnet_skip_checks) { 1378348SEric.Yu@Sun.COM if (xnet_check_print) { 1388348SEric.Yu@Sun.COM printf("sockfs: X/Open bind state check " 1398348SEric.Yu@Sun.COM "caused EINVAL\n"); 1408348SEric.Yu@Sun.COM } 1418348SEric.Yu@Sun.COM error = EINVAL; 1428348SEric.Yu@Sun.COM goto done; 1438348SEric.Yu@Sun.COM } 1448348SEric.Yu@Sun.COM 1458348SEric.Yu@Sun.COM /* 1468348SEric.Yu@Sun.COM * a bind to a NULL address is interpreted as unbind. So just 1478348SEric.Yu@Sun.COM * do the downcall. 1488348SEric.Yu@Sun.COM */ 1498348SEric.Yu@Sun.COM if (name == NULL) 1508348SEric.Yu@Sun.COM goto dobind; 1518348SEric.Yu@Sun.COM 1528348SEric.Yu@Sun.COM switch (so->so_family) { 1538348SEric.Yu@Sun.COM case AF_INET: 1548348SEric.Yu@Sun.COM if ((size_t)namelen != sizeof (sin_t)) { 1558348SEric.Yu@Sun.COM error = name->sa_family != so->so_family ? 1568348SEric.Yu@Sun.COM EAFNOSUPPORT : EINVAL; 1578348SEric.Yu@Sun.COM eprintsoline(so, error); 1588348SEric.Yu@Sun.COM goto done; 1598348SEric.Yu@Sun.COM } 1608348SEric.Yu@Sun.COM 1618348SEric.Yu@Sun.COM if ((flags & _SOBIND_XPG4_2) && 1628348SEric.Yu@Sun.COM (name->sa_family != so->so_family)) { 1638348SEric.Yu@Sun.COM /* 1648348SEric.Yu@Sun.COM * This check has to be made for X/Open 1658348SEric.Yu@Sun.COM * sockets however application failures have 1668348SEric.Yu@Sun.COM * been observed when it is applied to 1678348SEric.Yu@Sun.COM * all sockets. 1688348SEric.Yu@Sun.COM */ 1698348SEric.Yu@Sun.COM error = EAFNOSUPPORT; 1708348SEric.Yu@Sun.COM eprintsoline(so, error); 1718348SEric.Yu@Sun.COM goto done; 1728348SEric.Yu@Sun.COM } 1738348SEric.Yu@Sun.COM /* 1748348SEric.Yu@Sun.COM * Force a zero sa_family to match so_family. 1758348SEric.Yu@Sun.COM * 1768348SEric.Yu@Sun.COM * Some programs like inetd(1M) don't set the 1778348SEric.Yu@Sun.COM * family field. Other programs leave 1788348SEric.Yu@Sun.COM * sin_family set to garbage - SunOS 4.X does 1798348SEric.Yu@Sun.COM * not check the family field on a bind. 1808348SEric.Yu@Sun.COM * We use the family field that 1818348SEric.Yu@Sun.COM * was passed in to the socket() call. 1828348SEric.Yu@Sun.COM */ 1838348SEric.Yu@Sun.COM name->sa_family = so->so_family; 1848348SEric.Yu@Sun.COM break; 1858348SEric.Yu@Sun.COM 1868348SEric.Yu@Sun.COM case AF_INET6: { 1878348SEric.Yu@Sun.COM #ifdef DEBUG 1888348SEric.Yu@Sun.COM sin6_t *sin6 = (sin6_t *)name; 1898348SEric.Yu@Sun.COM #endif 1908348SEric.Yu@Sun.COM if ((size_t)namelen != sizeof (sin6_t)) { 1918348SEric.Yu@Sun.COM error = name->sa_family != so->so_family ? 1928348SEric.Yu@Sun.COM EAFNOSUPPORT : EINVAL; 1938348SEric.Yu@Sun.COM eprintsoline(so, error); 1948348SEric.Yu@Sun.COM goto done; 1958348SEric.Yu@Sun.COM } 1968348SEric.Yu@Sun.COM 1978348SEric.Yu@Sun.COM if (name->sa_family != so->so_family) { 1988348SEric.Yu@Sun.COM /* 1998348SEric.Yu@Sun.COM * With IPv6 we require the family to match 2008348SEric.Yu@Sun.COM * unlike in IPv4. 2018348SEric.Yu@Sun.COM */ 2028348SEric.Yu@Sun.COM error = EAFNOSUPPORT; 2038348SEric.Yu@Sun.COM eprintsoline(so, error); 2048348SEric.Yu@Sun.COM goto done; 2058348SEric.Yu@Sun.COM } 2068348SEric.Yu@Sun.COM #ifdef DEBUG 2078348SEric.Yu@Sun.COM /* 2088348SEric.Yu@Sun.COM * Verify that apps don't forget to clear 2098348SEric.Yu@Sun.COM * sin6_scope_id etc 2108348SEric.Yu@Sun.COM */ 2118348SEric.Yu@Sun.COM if (sin6->sin6_scope_id != 0 && 2128348SEric.Yu@Sun.COM !IN6_IS_ADDR_LINKSCOPE(&sin6->sin6_addr)) { 2138348SEric.Yu@Sun.COM zcmn_err(getzoneid(), CE_WARN, 2148348SEric.Yu@Sun.COM "bind with uninitialized sin6_scope_id " 2158348SEric.Yu@Sun.COM "(%d) on socket. Pid = %d\n", 2168348SEric.Yu@Sun.COM (int)sin6->sin6_scope_id, 2178348SEric.Yu@Sun.COM (int)curproc->p_pid); 2188348SEric.Yu@Sun.COM } 2198348SEric.Yu@Sun.COM if (sin6->__sin6_src_id != 0) { 2208348SEric.Yu@Sun.COM zcmn_err(getzoneid(), CE_WARN, 2218348SEric.Yu@Sun.COM "bind with uninitialized __sin6_src_id " 2228348SEric.Yu@Sun.COM "(%d) on socket. Pid = %d\n", 2238348SEric.Yu@Sun.COM (int)sin6->__sin6_src_id, 2248348SEric.Yu@Sun.COM (int)curproc->p_pid); 2258348SEric.Yu@Sun.COM } 2268348SEric.Yu@Sun.COM #endif /* DEBUG */ 2278348SEric.Yu@Sun.COM 2288348SEric.Yu@Sun.COM break; 2298348SEric.Yu@Sun.COM } 2308348SEric.Yu@Sun.COM default: 2318348SEric.Yu@Sun.COM /* Just pass the request to the protocol */ 2328348SEric.Yu@Sun.COM goto dobind; 2338348SEric.Yu@Sun.COM } 2348348SEric.Yu@Sun.COM 2358348SEric.Yu@Sun.COM /* 2368348SEric.Yu@Sun.COM * First we check if either NCA or KSSL has been enabled for 2378348SEric.Yu@Sun.COM * the requested address, and if so, we fall back to TPI. 2388348SEric.Yu@Sun.COM * If neither of those two services are enabled, then we just 2398348SEric.Yu@Sun.COM * pass the request to the protocol. 2408348SEric.Yu@Sun.COM * 2418348SEric.Yu@Sun.COM * Note that KSSL can only be enabled on a socket if NCA is NOT 2428348SEric.Yu@Sun.COM * enabled for that socket, hence the else-statement below. 2438348SEric.Yu@Sun.COM */ 2448348SEric.Yu@Sun.COM if (nl7c_enabled && ((so->so_family == AF_INET || 2458348SEric.Yu@Sun.COM so->so_family == AF_INET6) && 2468348SEric.Yu@Sun.COM nl7c_lookup_addr(name, namelen) != NULL)) { 2478348SEric.Yu@Sun.COM /* 2488348SEric.Yu@Sun.COM * NL7C is not supported in non-global zones, 2498348SEric.Yu@Sun.COM * we enforce this restriction here. 2508348SEric.Yu@Sun.COM */ 2518348SEric.Yu@Sun.COM if (so->so_zoneid == GLOBAL_ZONEID) { 2528348SEric.Yu@Sun.COM /* NCA should be used, so fall back to TPI */ 2538348SEric.Yu@Sun.COM error = so_tpi_fallback(so, cr); 2548348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 2558348SEric.Yu@Sun.COM if (error) 2568348SEric.Yu@Sun.COM return (error); 2578348SEric.Yu@Sun.COM else 2588348SEric.Yu@Sun.COM return (SOP_BIND(so, name, namelen, flags, cr)); 2598348SEric.Yu@Sun.COM } 2608348SEric.Yu@Sun.COM } else if (so->so_type == SOCK_STREAM) { 2618348SEric.Yu@Sun.COM /* Check if KSSL has been configured for this address */ 2628348SEric.Yu@Sun.COM kssl_ent_t ent; 2638348SEric.Yu@Sun.COM kssl_endpt_type_t type; 2648348SEric.Yu@Sun.COM struct T_bind_req bind_req; 2658348SEric.Yu@Sun.COM mblk_t *mp; 2668348SEric.Yu@Sun.COM 2678348SEric.Yu@Sun.COM /* 2688348SEric.Yu@Sun.COM * TODO: Check with KSSL team if we could add a function call 2698348SEric.Yu@Sun.COM * that only queries whether KSSL is enabled for the given 2708348SEric.Yu@Sun.COM * address. 2718348SEric.Yu@Sun.COM */ 2728348SEric.Yu@Sun.COM bind_req.PRIM_type = T_BIND_REQ; 2738348SEric.Yu@Sun.COM bind_req.ADDR_length = namelen; 2748348SEric.Yu@Sun.COM bind_req.ADDR_offset = (t_scalar_t)sizeof (bind_req); 2758348SEric.Yu@Sun.COM mp = soallocproto2(&bind_req, sizeof (bind_req), 2768348SEric.Yu@Sun.COM name, namelen, 0, _ALLOC_SLEEP); 2778348SEric.Yu@Sun.COM 2788348SEric.Yu@Sun.COM type = kssl_check_proxy(mp, so, &ent); 2798348SEric.Yu@Sun.COM freemsg(mp); 2808348SEric.Yu@Sun.COM 2818348SEric.Yu@Sun.COM if (type != KSSL_NO_PROXY) { 2828348SEric.Yu@Sun.COM /* 2838348SEric.Yu@Sun.COM * KSSL has been configured for this address, so 2848348SEric.Yu@Sun.COM * we must fall back to TPI. 2858348SEric.Yu@Sun.COM */ 2868348SEric.Yu@Sun.COM kssl_release_ent(ent, so, type); 2878348SEric.Yu@Sun.COM error = so_tpi_fallback(so, cr); 2888348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 2898348SEric.Yu@Sun.COM if (error) 2908348SEric.Yu@Sun.COM return (error); 2918348SEric.Yu@Sun.COM else 2928348SEric.Yu@Sun.COM return (SOP_BIND(so, name, namelen, flags, cr)); 2938348SEric.Yu@Sun.COM } 2948348SEric.Yu@Sun.COM } 2958348SEric.Yu@Sun.COM 2968348SEric.Yu@Sun.COM dobind: 2978348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_bind) 2988348SEric.Yu@Sun.COM (so->so_proto_handle, name, namelen, cr); 2998348SEric.Yu@Sun.COM done: 3008348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 3018348SEric.Yu@Sun.COM 3028348SEric.Yu@Sun.COM return (error); 3038348SEric.Yu@Sun.COM } 3048348SEric.Yu@Sun.COM 3058348SEric.Yu@Sun.COM int 3068348SEric.Yu@Sun.COM so_listen(struct sonode *so, int backlog, struct cred *cr) 3078348SEric.Yu@Sun.COM { 3088348SEric.Yu@Sun.COM int error = 0; 3098348SEric.Yu@Sun.COM 3108348SEric.Yu@Sun.COM ASSERT(MUTEX_NOT_HELD(&so->so_lock)); 3118348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_LISTEN(so, backlog, cr)); 3128348SEric.Yu@Sun.COM 3138348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_listen)(so->so_proto_handle, backlog, 3148348SEric.Yu@Sun.COM cr); 3158348SEric.Yu@Sun.COM 3168348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 3178348SEric.Yu@Sun.COM 3188348SEric.Yu@Sun.COM return (error); 3198348SEric.Yu@Sun.COM } 3208348SEric.Yu@Sun.COM 3218348SEric.Yu@Sun.COM 3228348SEric.Yu@Sun.COM int 3238348SEric.Yu@Sun.COM so_connect(struct sonode *so, const struct sockaddr *name, 3248348SEric.Yu@Sun.COM socklen_t namelen, int fflag, int flags, struct cred *cr) 3258348SEric.Yu@Sun.COM { 3268348SEric.Yu@Sun.COM int error = 0; 3278348SEric.Yu@Sun.COM sock_connid_t id; 3288348SEric.Yu@Sun.COM 3298348SEric.Yu@Sun.COM ASSERT(MUTEX_NOT_HELD(&so->so_lock)); 3308348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_CONNECT(so, name, namelen, fflag, flags, cr)); 3318348SEric.Yu@Sun.COM 3328348SEric.Yu@Sun.COM /* 3338348SEric.Yu@Sun.COM * If there is a pending error, return error 3348348SEric.Yu@Sun.COM * This can happen if a non blocking operation caused an error. 3358348SEric.Yu@Sun.COM */ 3368348SEric.Yu@Sun.COM 3378348SEric.Yu@Sun.COM if (so->so_error != 0) { 3388348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 3398348SEric.Yu@Sun.COM error = sogeterr(so, B_TRUE); 3408348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 3418348SEric.Yu@Sun.COM if (error != 0) 3428348SEric.Yu@Sun.COM goto done; 3438348SEric.Yu@Sun.COM } 3448348SEric.Yu@Sun.COM 3458348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_connect)(so->so_proto_handle, 3468348SEric.Yu@Sun.COM name, namelen, &id, cr); 3478348SEric.Yu@Sun.COM 3488348SEric.Yu@Sun.COM if (error == EINPROGRESS) 3498348SEric.Yu@Sun.COM error = so_wait_connected(so, fflag & (FNONBLOCK|FNDELAY), id); 3508348SEric.Yu@Sun.COM 3518348SEric.Yu@Sun.COM done: 3528348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 3538348SEric.Yu@Sun.COM return (error); 3548348SEric.Yu@Sun.COM } 3558348SEric.Yu@Sun.COM 3568348SEric.Yu@Sun.COM /*ARGSUSED*/ 3578348SEric.Yu@Sun.COM int 3588348SEric.Yu@Sun.COM so_accept(struct sonode *so, int fflag, struct cred *cr, struct sonode **nsop) 3598348SEric.Yu@Sun.COM { 3608348SEric.Yu@Sun.COM int error = 0; 3618348SEric.Yu@Sun.COM struct sonode *nso; 3628348SEric.Yu@Sun.COM 3638348SEric.Yu@Sun.COM *nsop = NULL; 3648348SEric.Yu@Sun.COM 3658348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_ACCEPT(so, fflag, cr, nsop)); 3668348SEric.Yu@Sun.COM if ((so->so_state & SS_ACCEPTCONN) == 0) { 3678348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 3688348SEric.Yu@Sun.COM return ((so->so_type == SOCK_DGRAM || so->so_type == SOCK_RAW) ? 3698348SEric.Yu@Sun.COM EOPNOTSUPP : EINVAL); 3708348SEric.Yu@Sun.COM } 3718348SEric.Yu@Sun.COM 3728348SEric.Yu@Sun.COM if ((error = so_acceptq_dequeue(so, (fflag & (FNONBLOCK|FNDELAY)), 3738348SEric.Yu@Sun.COM &nso)) == 0) { 3748348SEric.Yu@Sun.COM ASSERT(nso != NULL); 3758348SEric.Yu@Sun.COM 3768348SEric.Yu@Sun.COM /* finish the accept */ 3778348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_accept)(so->so_proto_handle, 3788348SEric.Yu@Sun.COM nso->so_proto_handle, (sock_upper_handle_t)nso, cr); 3798348SEric.Yu@Sun.COM if (error != 0) { 3808348SEric.Yu@Sun.COM (void) socket_close(nso, 0, cr); 3818348SEric.Yu@Sun.COM socket_destroy(nso); 3828348SEric.Yu@Sun.COM } else { 3838348SEric.Yu@Sun.COM *nsop = nso; 3848348SEric.Yu@Sun.COM } 3858348SEric.Yu@Sun.COM } 3868348SEric.Yu@Sun.COM 3878348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 3888348SEric.Yu@Sun.COM return (error); 3898348SEric.Yu@Sun.COM } 3908348SEric.Yu@Sun.COM 3918348SEric.Yu@Sun.COM int 3928348SEric.Yu@Sun.COM so_sendmsg(struct sonode *so, struct nmsghdr *msg, struct uio *uiop, 3938348SEric.Yu@Sun.COM struct cred *cr) 3948348SEric.Yu@Sun.COM { 3958348SEric.Yu@Sun.COM int error, flags; 3968348SEric.Yu@Sun.COM boolean_t dontblock; 3978348SEric.Yu@Sun.COM ssize_t orig_resid; 3988348SEric.Yu@Sun.COM mblk_t *mp; 3998348SEric.Yu@Sun.COM 4008348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_SENDMSG(so, msg, uiop, cr)); 4018348SEric.Yu@Sun.COM 4028348SEric.Yu@Sun.COM flags = msg->msg_flags; 4038348SEric.Yu@Sun.COM error = 0; 4048348SEric.Yu@Sun.COM dontblock = (flags & MSG_DONTWAIT) || 4058348SEric.Yu@Sun.COM (uiop->uio_fmode & (FNONBLOCK|FNDELAY)); 4068348SEric.Yu@Sun.COM 4078348SEric.Yu@Sun.COM if (!(flags & MSG_XPG4_2) && msg->msg_controllen != 0) { 4088348SEric.Yu@Sun.COM /* 4098348SEric.Yu@Sun.COM * Old way of passing fd's is not supported 4108348SEric.Yu@Sun.COM */ 4118348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 4128348SEric.Yu@Sun.COM return (EOPNOTSUPP); 4138348SEric.Yu@Sun.COM } 4148348SEric.Yu@Sun.COM 4158348SEric.Yu@Sun.COM if ((so->so_mode & SM_ATOMIC) && 4168348SEric.Yu@Sun.COM uiop->uio_resid > so->so_proto_props.sopp_maxpsz && 4178348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxpsz != -1) { 4188348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 4198348SEric.Yu@Sun.COM return (EMSGSIZE); 4208348SEric.Yu@Sun.COM } 4218348SEric.Yu@Sun.COM 4228348SEric.Yu@Sun.COM /* 4238348SEric.Yu@Sun.COM * For atomic sends we will only do one iteration. 4248348SEric.Yu@Sun.COM */ 4258348SEric.Yu@Sun.COM do { 4268348SEric.Yu@Sun.COM if (so->so_state & SS_CANTSENDMORE) { 4278348SEric.Yu@Sun.COM error = EPIPE; 4288348SEric.Yu@Sun.COM break; 4298348SEric.Yu@Sun.COM } 4308348SEric.Yu@Sun.COM 4318348SEric.Yu@Sun.COM if (so->so_error != 0) { 4328348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 4338348SEric.Yu@Sun.COM error = sogeterr(so, B_TRUE); 4348348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 4358348SEric.Yu@Sun.COM if (error != 0) 4368348SEric.Yu@Sun.COM break; 4378348SEric.Yu@Sun.COM } 4388348SEric.Yu@Sun.COM 4398348SEric.Yu@Sun.COM /* 4408348SEric.Yu@Sun.COM * Send down OOB messages even if the send path is being 4418348SEric.Yu@Sun.COM * flow controlled (assuming the protocol supports OOB data). 4428348SEric.Yu@Sun.COM */ 4438348SEric.Yu@Sun.COM if (flags & MSG_OOB) { 4448348SEric.Yu@Sun.COM if ((so->so_mode & SM_EXDATA) == 0) { 4458348SEric.Yu@Sun.COM error = EOPNOTSUPP; 4468348SEric.Yu@Sun.COM break; 4478348SEric.Yu@Sun.COM } 4488348SEric.Yu@Sun.COM } else if (so->so_snd_qfull) { 4498348SEric.Yu@Sun.COM /* 4508348SEric.Yu@Sun.COM * Need to wait until the protocol is ready to receive 4518348SEric.Yu@Sun.COM * more data for transmission. 4528348SEric.Yu@Sun.COM */ 4538348SEric.Yu@Sun.COM if ((error = so_snd_wait_qnotfull(so, dontblock)) != 0) 4548348SEric.Yu@Sun.COM break; 4558348SEric.Yu@Sun.COM } 4568348SEric.Yu@Sun.COM 4578348SEric.Yu@Sun.COM /* 4588348SEric.Yu@Sun.COM * Time to send data to the protocol. We either copy the 4598348SEric.Yu@Sun.COM * data into mblks or pass the uio directly to the protocol. 4608348SEric.Yu@Sun.COM * We decide what to do based on the available down calls. 4618348SEric.Yu@Sun.COM */ 4628348SEric.Yu@Sun.COM if (so->so_downcalls->sd_send_uio != NULL) { 4638348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_send_uio) 4648348SEric.Yu@Sun.COM (so->so_proto_handle, uiop, msg, cr); 4658348SEric.Yu@Sun.COM if (error != 0) 4668348SEric.Yu@Sun.COM break; 4678348SEric.Yu@Sun.COM } else { 4688348SEric.Yu@Sun.COM /* save the resid in case of failure */ 4698348SEric.Yu@Sun.COM orig_resid = uiop->uio_resid; 4708348SEric.Yu@Sun.COM 4718348SEric.Yu@Sun.COM if ((mp = socopyinuio(uiop, 4728348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxpsz, 4738348SEric.Yu@Sun.COM so->so_proto_props.sopp_wroff, 4748348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxblk, 4758348SEric.Yu@Sun.COM so->so_proto_props.sopp_tail, &error)) == NULL) { 4768348SEric.Yu@Sun.COM break; 4778348SEric.Yu@Sun.COM } 4788348SEric.Yu@Sun.COM ASSERT(uiop->uio_resid >= 0); 4798348SEric.Yu@Sun.COM 4808348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_send) 4818348SEric.Yu@Sun.COM (so->so_proto_handle, mp, msg, cr); 4828348SEric.Yu@Sun.COM if (error != 0) { 4838348SEric.Yu@Sun.COM /* 4848348SEric.Yu@Sun.COM * The send failed. We do not have to free the 4858348SEric.Yu@Sun.COM * mblks, because that is the protocol's 4868348SEric.Yu@Sun.COM * responsibility. However, uio_resid must 4878348SEric.Yu@Sun.COM * remain accurate, so adjust that here. 4888348SEric.Yu@Sun.COM */ 4898348SEric.Yu@Sun.COM uiop->uio_resid = orig_resid; 4908348SEric.Yu@Sun.COM break; 4918348SEric.Yu@Sun.COM } 4928348SEric.Yu@Sun.COM } 4938348SEric.Yu@Sun.COM } while (uiop->uio_resid > 0); 4948348SEric.Yu@Sun.COM 4958348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 4968348SEric.Yu@Sun.COM 4978348SEric.Yu@Sun.COM return (error); 4988348SEric.Yu@Sun.COM } 4998348SEric.Yu@Sun.COM 5008348SEric.Yu@Sun.COM int 5018348SEric.Yu@Sun.COM so_sendmblk(struct sonode *so, struct nmsghdr *msg, int fflag, 5028348SEric.Yu@Sun.COM struct cred *cr, mblk_t **mpp) 5038348SEric.Yu@Sun.COM { 5048348SEric.Yu@Sun.COM int error; 5058348SEric.Yu@Sun.COM boolean_t dontblock; 5068348SEric.Yu@Sun.COM size_t size; 5078348SEric.Yu@Sun.COM mblk_t *mp = *mpp; 5088348SEric.Yu@Sun.COM 5098348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_SENDMBLK(so, msg, fflag, cr, mpp)); 5108348SEric.Yu@Sun.COM 5118348SEric.Yu@Sun.COM error = 0; 5128348SEric.Yu@Sun.COM dontblock = (msg->msg_flags & MSG_DONTWAIT) || 5138348SEric.Yu@Sun.COM (fflag & (FNONBLOCK|FNDELAY)); 5148348SEric.Yu@Sun.COM size = msgdsize(mp); 5158348SEric.Yu@Sun.COM 5168401SAnders.Persson@Sun.COM if ((so->so_mode & SM_SENDFILESUPP) == 0 || 5178401SAnders.Persson@Sun.COM so->so_downcalls->sd_send == NULL) { 5188348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 5198348SEric.Yu@Sun.COM return (EOPNOTSUPP); 5208348SEric.Yu@Sun.COM } 5218348SEric.Yu@Sun.COM 5228348SEric.Yu@Sun.COM if ((so->so_mode & SM_ATOMIC) && 5238348SEric.Yu@Sun.COM size > so->so_proto_props.sopp_maxpsz && 5248348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxpsz != -1) { 5258348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 5268348SEric.Yu@Sun.COM return (EMSGSIZE); 5278348SEric.Yu@Sun.COM } 5288348SEric.Yu@Sun.COM 5298348SEric.Yu@Sun.COM while (mp != NULL) { 5308348SEric.Yu@Sun.COM mblk_t *nmp, *last_mblk; 5318348SEric.Yu@Sun.COM size_t mlen; 5328348SEric.Yu@Sun.COM 5338348SEric.Yu@Sun.COM if (so->so_state & SS_CANTSENDMORE) { 5348348SEric.Yu@Sun.COM error = EPIPE; 5358348SEric.Yu@Sun.COM break; 5368348SEric.Yu@Sun.COM } 5378348SEric.Yu@Sun.COM if (so->so_error != 0) { 5388348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 5398348SEric.Yu@Sun.COM error = sogeterr(so, B_TRUE); 5408348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 5418348SEric.Yu@Sun.COM if (error != 0) 5428348SEric.Yu@Sun.COM break; 5438348SEric.Yu@Sun.COM } 5448348SEric.Yu@Sun.COM if (so->so_snd_qfull) { 5458348SEric.Yu@Sun.COM /* 5468348SEric.Yu@Sun.COM * Need to wait until the protocol is ready to receive 5478348SEric.Yu@Sun.COM * more data for transmission. 5488348SEric.Yu@Sun.COM */ 5498348SEric.Yu@Sun.COM if ((error = so_snd_wait_qnotfull(so, dontblock)) != 0) 5508348SEric.Yu@Sun.COM break; 5518348SEric.Yu@Sun.COM } 5528348SEric.Yu@Sun.COM 5538348SEric.Yu@Sun.COM /* 5548348SEric.Yu@Sun.COM * We only allow so_maxpsz of data to be sent down to 5558348SEric.Yu@Sun.COM * the protocol at time. 5568348SEric.Yu@Sun.COM */ 5578348SEric.Yu@Sun.COM mlen = MBLKL(mp); 5588348SEric.Yu@Sun.COM nmp = mp->b_cont; 5598348SEric.Yu@Sun.COM last_mblk = mp; 5608348SEric.Yu@Sun.COM while (nmp != NULL) { 5618348SEric.Yu@Sun.COM mlen += MBLKL(nmp); 5628348SEric.Yu@Sun.COM if (mlen > so->so_proto_props.sopp_maxpsz) { 5638348SEric.Yu@Sun.COM last_mblk->b_cont = NULL; 5648348SEric.Yu@Sun.COM break; 5658348SEric.Yu@Sun.COM } 5668348SEric.Yu@Sun.COM last_mblk = nmp; 5678348SEric.Yu@Sun.COM nmp = nmp->b_cont; 5688348SEric.Yu@Sun.COM } 5698348SEric.Yu@Sun.COM 5708348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_send) 5718348SEric.Yu@Sun.COM (so->so_proto_handle, mp, msg, cr); 5728348SEric.Yu@Sun.COM if (error != 0) { 5738348SEric.Yu@Sun.COM /* 5748348SEric.Yu@Sun.COM * The send failed. The protocol will free the mblks 5758348SEric.Yu@Sun.COM * that were sent down. Let the caller deal with the 5768348SEric.Yu@Sun.COM * rest. 5778348SEric.Yu@Sun.COM */ 5788348SEric.Yu@Sun.COM *mpp = nmp; 5798348SEric.Yu@Sun.COM break; 5808348SEric.Yu@Sun.COM } 5818348SEric.Yu@Sun.COM 5828348SEric.Yu@Sun.COM *mpp = mp = nmp; 5838348SEric.Yu@Sun.COM } 5848348SEric.Yu@Sun.COM 5858348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 5868348SEric.Yu@Sun.COM 5878348SEric.Yu@Sun.COM return (error); 5888348SEric.Yu@Sun.COM } 5898348SEric.Yu@Sun.COM 5908348SEric.Yu@Sun.COM int 5918348SEric.Yu@Sun.COM so_shutdown(struct sonode *so, int how, struct cred *cr) 5928348SEric.Yu@Sun.COM { 5938348SEric.Yu@Sun.COM int error; 5948348SEric.Yu@Sun.COM 5958348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_SHUTDOWN(so, how, cr)); 5968348SEric.Yu@Sun.COM 5978348SEric.Yu@Sun.COM /* 5988348SEric.Yu@Sun.COM * SunOS 4.X has no check for datagram sockets. 5998348SEric.Yu@Sun.COM * 5.X checks that it is connected (ENOTCONN) 6008348SEric.Yu@Sun.COM * X/Open requires that we check the connected state. 6018348SEric.Yu@Sun.COM */ 6028348SEric.Yu@Sun.COM if (!(so->so_state & SS_ISCONNECTED)) { 6038348SEric.Yu@Sun.COM if (!xnet_skip_checks) { 6048348SEric.Yu@Sun.COM error = ENOTCONN; 6058348SEric.Yu@Sun.COM if (xnet_check_print) { 6068348SEric.Yu@Sun.COM printf("sockfs: X/Open shutdown check " 6078348SEric.Yu@Sun.COM "caused ENOTCONN\n"); 6088348SEric.Yu@Sun.COM } 6098348SEric.Yu@Sun.COM } 6108348SEric.Yu@Sun.COM goto done; 6118348SEric.Yu@Sun.COM } 6128348SEric.Yu@Sun.COM 6138348SEric.Yu@Sun.COM error = ((*so->so_downcalls->sd_shutdown)(so->so_proto_handle, 6148348SEric.Yu@Sun.COM how, cr)); 6158348SEric.Yu@Sun.COM 6168348SEric.Yu@Sun.COM /* 6178348SEric.Yu@Sun.COM * Protocol agreed to shutdown. We need to flush the 6188348SEric.Yu@Sun.COM * receive buffer if the receive side is being shutdown. 6198348SEric.Yu@Sun.COM */ 6208348SEric.Yu@Sun.COM if (error == 0 && how != SHUT_WR) { 6218348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 6228348SEric.Yu@Sun.COM /* wait for active reader to finish */ 6238348SEric.Yu@Sun.COM (void) so_lock_read(so, 0); 6248348SEric.Yu@Sun.COM 6258348SEric.Yu@Sun.COM so_rcv_flush(so); 6268348SEric.Yu@Sun.COM 6278348SEric.Yu@Sun.COM so_unlock_read(so); 6288348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 6298348SEric.Yu@Sun.COM } 6308348SEric.Yu@Sun.COM 6318348SEric.Yu@Sun.COM done: 6328348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 6338348SEric.Yu@Sun.COM return (error); 6348348SEric.Yu@Sun.COM } 6358348SEric.Yu@Sun.COM 6368348SEric.Yu@Sun.COM int 6378348SEric.Yu@Sun.COM so_getsockname(struct sonode *so, struct sockaddr *addr, 6388348SEric.Yu@Sun.COM socklen_t *addrlen, struct cred *cr) 6398348SEric.Yu@Sun.COM { 6408348SEric.Yu@Sun.COM int error; 6418348SEric.Yu@Sun.COM 6428348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_GETSOCKNAME(so, addr, addrlen, cr)); 6438348SEric.Yu@Sun.COM 6448348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_getsockname) 6458348SEric.Yu@Sun.COM (so->so_proto_handle, addr, addrlen, cr); 6468348SEric.Yu@Sun.COM 6478348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 6488348SEric.Yu@Sun.COM return (error); 6498348SEric.Yu@Sun.COM } 6508348SEric.Yu@Sun.COM 6518348SEric.Yu@Sun.COM int 6528348SEric.Yu@Sun.COM so_getpeername(struct sonode *so, struct sockaddr *addr, 6538348SEric.Yu@Sun.COM socklen_t *addrlen, boolean_t accept, struct cred *cr) 6548348SEric.Yu@Sun.COM { 6558348SEric.Yu@Sun.COM int error; 6568348SEric.Yu@Sun.COM 6578348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_GETPEERNAME(so, addr, addrlen, accept, cr)); 6588348SEric.Yu@Sun.COM 6598348SEric.Yu@Sun.COM if (accept) { 6608348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_getpeername) 6618348SEric.Yu@Sun.COM (so->so_proto_handle, addr, addrlen, cr); 6628348SEric.Yu@Sun.COM } else if (!(so->so_state & SS_ISCONNECTED)) { 6638348SEric.Yu@Sun.COM error = ENOTCONN; 6648348SEric.Yu@Sun.COM } else if ((so->so_state & SS_CANTSENDMORE) && !xnet_skip_checks) { 6658348SEric.Yu@Sun.COM /* Added this check for X/Open */ 6668348SEric.Yu@Sun.COM error = EINVAL; 6678348SEric.Yu@Sun.COM if (xnet_check_print) { 6688348SEric.Yu@Sun.COM printf("sockfs: X/Open getpeername check => EINVAL\n"); 6698348SEric.Yu@Sun.COM } 6708348SEric.Yu@Sun.COM } else { 6718348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_getpeername) 6728348SEric.Yu@Sun.COM (so->so_proto_handle, addr, addrlen, cr); 6738348SEric.Yu@Sun.COM } 6748348SEric.Yu@Sun.COM 6758348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 6768348SEric.Yu@Sun.COM return (error); 6778348SEric.Yu@Sun.COM } 6788348SEric.Yu@Sun.COM 6798348SEric.Yu@Sun.COM int 6808348SEric.Yu@Sun.COM so_getsockopt(struct sonode *so, int level, int option_name, 6818348SEric.Yu@Sun.COM void *optval, socklen_t *optlenp, int flags, struct cred *cr) 6828348SEric.Yu@Sun.COM { 6838348SEric.Yu@Sun.COM int error = 0; 6848348SEric.Yu@Sun.COM 6858348SEric.Yu@Sun.COM ASSERT(MUTEX_NOT_HELD(&so->so_lock)); 6868348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, 6878348SEric.Yu@Sun.COM SOP_GETSOCKOPT(so, level, option_name, optval, optlenp, flags, cr)); 6888348SEric.Yu@Sun.COM 6898465SEric.Yu@Sun.COM error = socket_getopt_common(so, level, option_name, optval, optlenp, 6908465SEric.Yu@Sun.COM flags); 6918348SEric.Yu@Sun.COM if (error < 0) { 6928348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_getsockopt) 6938348SEric.Yu@Sun.COM (so->so_proto_handle, level, option_name, optval, optlenp, 6948348SEric.Yu@Sun.COM cr); 6958348SEric.Yu@Sun.COM if (error == ENOPROTOOPT) { 6968348SEric.Yu@Sun.COM if (level == SOL_SOCKET) { 6978348SEric.Yu@Sun.COM /* 6988348SEric.Yu@Sun.COM * If a protocol does not support a particular 6998348SEric.Yu@Sun.COM * socket option, set can fail (not allowed) 7008348SEric.Yu@Sun.COM * but get can not fail. This is the previous 7018348SEric.Yu@Sun.COM * sockfs bahvior. 7028348SEric.Yu@Sun.COM */ 7038348SEric.Yu@Sun.COM switch (option_name) { 7048348SEric.Yu@Sun.COM case SO_LINGER: 7058348SEric.Yu@Sun.COM if (*optlenp < (t_uscalar_t) 7068348SEric.Yu@Sun.COM sizeof (struct linger)) { 7078348SEric.Yu@Sun.COM error = EINVAL; 7088348SEric.Yu@Sun.COM break; 7098348SEric.Yu@Sun.COM } 7108348SEric.Yu@Sun.COM error = 0; 7118348SEric.Yu@Sun.COM bzero(optval, sizeof (struct linger)); 7128348SEric.Yu@Sun.COM *optlenp = sizeof (struct linger); 7138348SEric.Yu@Sun.COM break; 7148348SEric.Yu@Sun.COM case SO_RCVTIMEO: 7158348SEric.Yu@Sun.COM case SO_SNDTIMEO: 7168348SEric.Yu@Sun.COM if (*optlenp < (t_uscalar_t) 7178348SEric.Yu@Sun.COM sizeof (struct timeval)) { 7188348SEric.Yu@Sun.COM error = EINVAL; 7198348SEric.Yu@Sun.COM break; 7208348SEric.Yu@Sun.COM } 7218348SEric.Yu@Sun.COM error = 0; 7228348SEric.Yu@Sun.COM bzero(optval, sizeof (struct timeval)); 7238348SEric.Yu@Sun.COM *optlenp = sizeof (struct timeval); 7248348SEric.Yu@Sun.COM break; 7258348SEric.Yu@Sun.COM case SO_SND_BUFINFO: 7268348SEric.Yu@Sun.COM if (*optlenp < (t_uscalar_t) 7278348SEric.Yu@Sun.COM sizeof (struct so_snd_bufinfo)) { 7288348SEric.Yu@Sun.COM error = EINVAL; 7298348SEric.Yu@Sun.COM break; 7308348SEric.Yu@Sun.COM } 7318348SEric.Yu@Sun.COM error = 0; 7328348SEric.Yu@Sun.COM bzero(optval, 7338348SEric.Yu@Sun.COM sizeof (struct so_snd_bufinfo)); 7348348SEric.Yu@Sun.COM *optlenp = 7358348SEric.Yu@Sun.COM sizeof (struct so_snd_bufinfo); 7368348SEric.Yu@Sun.COM break; 7378348SEric.Yu@Sun.COM case SO_DEBUG: 7388348SEric.Yu@Sun.COM case SO_REUSEADDR: 7398348SEric.Yu@Sun.COM case SO_KEEPALIVE: 7408348SEric.Yu@Sun.COM case SO_DONTROUTE: 7418348SEric.Yu@Sun.COM case SO_BROADCAST: 7428348SEric.Yu@Sun.COM case SO_USELOOPBACK: 7438348SEric.Yu@Sun.COM case SO_OOBINLINE: 7448348SEric.Yu@Sun.COM case SO_DGRAM_ERRIND: 7458348SEric.Yu@Sun.COM case SO_SNDBUF: 7468348SEric.Yu@Sun.COM case SO_RCVBUF: 7478348SEric.Yu@Sun.COM error = 0; 7488348SEric.Yu@Sun.COM *((int32_t *)optval) = 0; 7498348SEric.Yu@Sun.COM *optlenp = sizeof (int32_t); 7508348SEric.Yu@Sun.COM break; 7518348SEric.Yu@Sun.COM default: 7528348SEric.Yu@Sun.COM break; 7538348SEric.Yu@Sun.COM } 7548348SEric.Yu@Sun.COM } 7558348SEric.Yu@Sun.COM } 7568348SEric.Yu@Sun.COM } 7578348SEric.Yu@Sun.COM 7588348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 7598348SEric.Yu@Sun.COM return (error); 7608348SEric.Yu@Sun.COM } 7618348SEric.Yu@Sun.COM 7628348SEric.Yu@Sun.COM int 7638348SEric.Yu@Sun.COM so_setsockopt(struct sonode *so, int level, int option_name, 7648348SEric.Yu@Sun.COM const void *optval, socklen_t optlen, struct cred *cr) 7658348SEric.Yu@Sun.COM { 7668348SEric.Yu@Sun.COM int error = 0; 7678348SEric.Yu@Sun.COM 7688348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, 7698348SEric.Yu@Sun.COM SOP_SETSOCKOPT(so, level, option_name, optval, optlen, cr)); 7708348SEric.Yu@Sun.COM 7718348SEric.Yu@Sun.COM /* X/Open requires this check */ 7728348SEric.Yu@Sun.COM if (so->so_state & SS_CANTSENDMORE && !xnet_skip_checks) { 7738348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 7748348SEric.Yu@Sun.COM if (xnet_check_print) 7758348SEric.Yu@Sun.COM printf("sockfs: X/Open setsockopt check => EINVAL\n"); 7768348SEric.Yu@Sun.COM return (EINVAL); 7778348SEric.Yu@Sun.COM } 7788348SEric.Yu@Sun.COM 7798465SEric.Yu@Sun.COM if (level == SOL_SOCKET) { 7808465SEric.Yu@Sun.COM switch (option_name) { 7818465SEric.Yu@Sun.COM case SO_RCVTIMEO: 7828465SEric.Yu@Sun.COM case SO_SNDTIMEO: { 7838489Sshenjian struct timeval tl; 7848465SEric.Yu@Sun.COM clock_t t_usec; 7858348SEric.Yu@Sun.COM 786*8575Sshenjian if (get_udatamodel() == DATAMODEL_NONE || 787*8575Sshenjian get_udatamodel() == DATAMODEL_NATIVE) { 7888489Sshenjian if (optlen != sizeof (struct timeval)) { 7898489Sshenjian error = EINVAL; 7908489Sshenjian goto done; 7918489Sshenjian } 7928489Sshenjian bcopy((struct timeval *)optval, &tl, 7938489Sshenjian sizeof (struct timeval)); 7948489Sshenjian } else { 7958489Sshenjian if (optlen != sizeof (struct timeval32)) { 7968489Sshenjian error = EINVAL; 7978489Sshenjian goto done; 7988489Sshenjian } 7998489Sshenjian TIMEVAL32_TO_TIMEVAL(&tl, 8008489Sshenjian (struct timeval32 *)optval); 8018465SEric.Yu@Sun.COM } 8028489Sshenjian t_usec = tl.tv_sec * 1000 * 1000 + tl.tv_usec; 8038465SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 8048465SEric.Yu@Sun.COM if (option_name == SO_RCVTIMEO) 8058465SEric.Yu@Sun.COM so->so_rcvtimeo = drv_usectohz(t_usec); 8068465SEric.Yu@Sun.COM else 8078465SEric.Yu@Sun.COM so->so_sndtimeo = drv_usectohz(t_usec); 8088465SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 8098348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 8108465SEric.Yu@Sun.COM return (0); 8118348SEric.Yu@Sun.COM } 8128465SEric.Yu@Sun.COM case SO_RCVBUF: 8138465SEric.Yu@Sun.COM /* 8148465SEric.Yu@Sun.COM * XXX XPG 4.2 applications retrieve SO_RCVBUF from 8158465SEric.Yu@Sun.COM * sockfs since the transport might adjust the value 8168465SEric.Yu@Sun.COM * and not return exactly what was set by the 8178465SEric.Yu@Sun.COM * application. 8188465SEric.Yu@Sun.COM */ 8198465SEric.Yu@Sun.COM so->so_xpg_rcvbuf = *(int32_t *)optval; 8208465SEric.Yu@Sun.COM break; 8218465SEric.Yu@Sun.COM } 8228348SEric.Yu@Sun.COM } 8238348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_setsockopt) 8248348SEric.Yu@Sun.COM (so->so_proto_handle, level, option_name, optval, optlen, cr); 8258489Sshenjian done: 8268348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 8278348SEric.Yu@Sun.COM return (error); 8288348SEric.Yu@Sun.COM } 8298348SEric.Yu@Sun.COM 8308348SEric.Yu@Sun.COM int 8318348SEric.Yu@Sun.COM so_ioctl(struct sonode *so, int cmd, intptr_t arg, int mode, 8328348SEric.Yu@Sun.COM struct cred *cr, int32_t *rvalp) 8338348SEric.Yu@Sun.COM { 8348348SEric.Yu@Sun.COM int error = 0; 8358348SEric.Yu@Sun.COM 8368348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_IOCTL(so, cmd, arg, mode, cr, rvalp)); 8378348SEric.Yu@Sun.COM 8388348SEric.Yu@Sun.COM /* 8398348SEric.Yu@Sun.COM * If there is a pending error, return error 8408348SEric.Yu@Sun.COM * This can happen if a non blocking operation caused an error. 8418348SEric.Yu@Sun.COM */ 8428348SEric.Yu@Sun.COM if (so->so_error != 0) { 8438348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 8448348SEric.Yu@Sun.COM error = sogeterr(so, B_TRUE); 8458348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 8468348SEric.Yu@Sun.COM if (error != 0) 8478348SEric.Yu@Sun.COM goto done; 8488348SEric.Yu@Sun.COM } 8498348SEric.Yu@Sun.COM 8508348SEric.Yu@Sun.COM /* 8518348SEric.Yu@Sun.COM * calling strioc can result in the socket falling back to TPI, 8528348SEric.Yu@Sun.COM * if that is supported. 8538348SEric.Yu@Sun.COM */ 8548348SEric.Yu@Sun.COM if ((error = socket_ioctl_common(so, cmd, arg, mode, cr, rvalp)) < 0 && 8558348SEric.Yu@Sun.COM (error = socket_strioc_common(so, cmd, arg, mode, cr, rvalp)) < 0) { 8568348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_ioctl)(so->so_proto_handle, 8578348SEric.Yu@Sun.COM cmd, arg, mode, rvalp, cr); 8588348SEric.Yu@Sun.COM } 8598348SEric.Yu@Sun.COM 8608348SEric.Yu@Sun.COM done: 8618348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 8628348SEric.Yu@Sun.COM 8638348SEric.Yu@Sun.COM return (error); 8648348SEric.Yu@Sun.COM } 8658348SEric.Yu@Sun.COM 8668348SEric.Yu@Sun.COM int 8678348SEric.Yu@Sun.COM so_poll(struct sonode *so, short events, int anyyet, short *reventsp, 8688348SEric.Yu@Sun.COM struct pollhead **phpp) 8698348SEric.Yu@Sun.COM { 8708348SEric.Yu@Sun.COM int state = so->so_state; 8718348SEric.Yu@Sun.COM *reventsp = 0; 8728348SEric.Yu@Sun.COM 8738348SEric.Yu@Sun.COM if (so->so_error != 0 && 8748348SEric.Yu@Sun.COM ((POLLIN|POLLRDNORM|POLLOUT) & events) != 0) { 8758348SEric.Yu@Sun.COM *reventsp = (POLLIN|POLLRDNORM|POLLOUT) & events; 8768348SEric.Yu@Sun.COM return (0); 8778348SEric.Yu@Sun.COM } 8788348SEric.Yu@Sun.COM 8798348SEric.Yu@Sun.COM /* 8808348SEric.Yu@Sun.COM * As long as there is buffer to send data, and the socket is 8818348SEric.Yu@Sun.COM * in a state where it can send data (i.e., connected for 8828348SEric.Yu@Sun.COM * connection oriented protocols), then turn on POLLOUT events 8838348SEric.Yu@Sun.COM */ 8848348SEric.Yu@Sun.COM if (!so->so_snd_qfull && ((so->so_mode & SM_CONNREQUIRED) == 0 || 8858348SEric.Yu@Sun.COM state & SS_ISCONNECTED)) { 8868348SEric.Yu@Sun.COM *reventsp |= POLLOUT & events; 8878348SEric.Yu@Sun.COM } 8888348SEric.Yu@Sun.COM 8898348SEric.Yu@Sun.COM /* 8908348SEric.Yu@Sun.COM * Turn on POLLIN whenever there is data on the receive queue, 8918348SEric.Yu@Sun.COM * or the socket is in a state where no more data will be received. 8928348SEric.Yu@Sun.COM * Also, if the socket is accepting connections, flip the bit if 8938348SEric.Yu@Sun.COM * there is something on the queue. 8948427SAnders.Persson@Sun.COM * 8958427SAnders.Persson@Sun.COM * We do an initial check for events without holding locks. However, 8968427SAnders.Persson@Sun.COM * if there are no event available, then we redo the check for POLLIN 8978427SAnders.Persson@Sun.COM * events under the lock. 8988348SEric.Yu@Sun.COM */ 8998348SEric.Yu@Sun.COM 9008348SEric.Yu@Sun.COM /* Pending connections */ 9018348SEric.Yu@Sun.COM if (so->so_acceptq_len > 0) 9028348SEric.Yu@Sun.COM *reventsp |= (POLLIN|POLLRDNORM) & events; 9038348SEric.Yu@Sun.COM 9048348SEric.Yu@Sun.COM /* Data */ 9058348SEric.Yu@Sun.COM /* so_downcalls is null for sctp */ 9068348SEric.Yu@Sun.COM if (so->so_downcalls != NULL && so->so_downcalls->sd_poll != NULL) { 9078348SEric.Yu@Sun.COM *reventsp |= (*so->so_downcalls->sd_poll) 9088348SEric.Yu@Sun.COM (so->so_proto_handle, events & SO_PROTO_POLLEV, anyyet, 9098348SEric.Yu@Sun.COM CRED()) & events; 9108348SEric.Yu@Sun.COM ASSERT((*reventsp & ~events) == 0); 9118348SEric.Yu@Sun.COM /* do not recheck events */ 9128348SEric.Yu@Sun.COM events &= ~SO_PROTO_POLLEV; 9138348SEric.Yu@Sun.COM } else { 9148348SEric.Yu@Sun.COM if (SO_HAVE_DATA(so)) 9158348SEric.Yu@Sun.COM *reventsp |= (POLLIN|POLLRDNORM) & events; 9168348SEric.Yu@Sun.COM 9178348SEric.Yu@Sun.COM /* Urgent data */ 9188348SEric.Yu@Sun.COM if ((state & SS_OOBPEND) != 0) 9198348SEric.Yu@Sun.COM *reventsp |= (POLLRDBAND) & events; 9208348SEric.Yu@Sun.COM } 9218348SEric.Yu@Sun.COM 9228348SEric.Yu@Sun.COM if (!*reventsp && !anyyet) { 9238348SEric.Yu@Sun.COM /* Check for read events again, but this time under lock */ 9248348SEric.Yu@Sun.COM if (events & (POLLIN|POLLRDNORM)) { 9258348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 9268348SEric.Yu@Sun.COM if (SO_HAVE_DATA(so) || so->so_acceptq_len > 0) { 9278348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 9288348SEric.Yu@Sun.COM *reventsp |= (POLLIN|POLLRDNORM) & events; 9298348SEric.Yu@Sun.COM return (0); 9308348SEric.Yu@Sun.COM } else { 9318348SEric.Yu@Sun.COM so->so_pollev |= SO_POLLEV_IN; 9328348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 9338348SEric.Yu@Sun.COM } 9348348SEric.Yu@Sun.COM } 9358348SEric.Yu@Sun.COM *phpp = &so->so_poll_list; 9368348SEric.Yu@Sun.COM } 9378348SEric.Yu@Sun.COM return (0); 9388348SEric.Yu@Sun.COM } 9398348SEric.Yu@Sun.COM 9408348SEric.Yu@Sun.COM /* 9418348SEric.Yu@Sun.COM * Generic Upcalls 9428348SEric.Yu@Sun.COM */ 9438348SEric.Yu@Sun.COM void 9448348SEric.Yu@Sun.COM so_connected(sock_upper_handle_t sock_handle, sock_connid_t id, 9458348SEric.Yu@Sun.COM cred_t *peer_cred, pid_t peer_cpid) 9468348SEric.Yu@Sun.COM { 9478348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)sock_handle; 9488348SEric.Yu@Sun.COM 9498348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 9508348SEric.Yu@Sun.COM ASSERT(so->so_proto_handle != NULL); 9518348SEric.Yu@Sun.COM 9528348SEric.Yu@Sun.COM if (peer_cred != NULL) { 9538348SEric.Yu@Sun.COM if (so->so_peercred != NULL) 9548348SEric.Yu@Sun.COM crfree(so->so_peercred); 9558348SEric.Yu@Sun.COM crhold(peer_cred); 9568348SEric.Yu@Sun.COM so->so_peercred = peer_cred; 9578348SEric.Yu@Sun.COM so->so_cpid = peer_cpid; 9588348SEric.Yu@Sun.COM } 9598348SEric.Yu@Sun.COM 9608348SEric.Yu@Sun.COM so->so_proto_connid = id; 9618348SEric.Yu@Sun.COM soisconnected(so); 9628348SEric.Yu@Sun.COM /* 9638348SEric.Yu@Sun.COM * Wake ones who're waiting for conn to become established. 9648348SEric.Yu@Sun.COM */ 9658348SEric.Yu@Sun.COM so_notify_connected(so); 9668348SEric.Yu@Sun.COM } 9678348SEric.Yu@Sun.COM 9688348SEric.Yu@Sun.COM int 9698348SEric.Yu@Sun.COM so_disconnected(sock_upper_handle_t sock_handle, sock_connid_t id, int error) 9708348SEric.Yu@Sun.COM { 9718348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)sock_handle; 9728348SEric.Yu@Sun.COM 9738348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 9748348SEric.Yu@Sun.COM 9758348SEric.Yu@Sun.COM so->so_proto_connid = id; 9768348SEric.Yu@Sun.COM soisdisconnected(so, error); 9778348SEric.Yu@Sun.COM so_notify_disconnected(so, error); 9788348SEric.Yu@Sun.COM 9798348SEric.Yu@Sun.COM return (0); 9808348SEric.Yu@Sun.COM } 9818348SEric.Yu@Sun.COM 9828348SEric.Yu@Sun.COM void 9838348SEric.Yu@Sun.COM so_opctl(sock_upper_handle_t sock_handle, sock_opctl_action_t action, 9848348SEric.Yu@Sun.COM uintptr_t arg) 9858348SEric.Yu@Sun.COM { 9868348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)sock_handle; 9878348SEric.Yu@Sun.COM 9888348SEric.Yu@Sun.COM switch (action) { 9898348SEric.Yu@Sun.COM case SOCK_OPCTL_SHUT_SEND: 9908348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 9918348SEric.Yu@Sun.COM socantsendmore(so); 9928348SEric.Yu@Sun.COM so_notify_disconnecting(so); 9938348SEric.Yu@Sun.COM break; 9948348SEric.Yu@Sun.COM case SOCK_OPCTL_SHUT_RECV: { 9958348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 9968348SEric.Yu@Sun.COM socantrcvmore(so); 9978348SEric.Yu@Sun.COM so_notify_eof(so); 9988348SEric.Yu@Sun.COM break; 9998348SEric.Yu@Sun.COM } 10008348SEric.Yu@Sun.COM case SOCK_OPCTL_ENAB_ACCEPT: 10018348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 10028348SEric.Yu@Sun.COM so->so_state |= SS_ACCEPTCONN; 10038348SEric.Yu@Sun.COM so->so_backlog = (unsigned int)arg; 10048348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 10058348SEric.Yu@Sun.COM break; 10068348SEric.Yu@Sun.COM default: 10078348SEric.Yu@Sun.COM ASSERT(0); 10088348SEric.Yu@Sun.COM break; 10098348SEric.Yu@Sun.COM } 10108348SEric.Yu@Sun.COM } 10118348SEric.Yu@Sun.COM 10128348SEric.Yu@Sun.COM void 10138348SEric.Yu@Sun.COM so_txq_full(sock_upper_handle_t sock_handle, boolean_t qfull) 10148348SEric.Yu@Sun.COM { 10158348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)sock_handle; 10168348SEric.Yu@Sun.COM 10178348SEric.Yu@Sun.COM if (qfull) { 10188348SEric.Yu@Sun.COM so_snd_qfull(so); 10198348SEric.Yu@Sun.COM } else { 10208348SEric.Yu@Sun.COM so_snd_qnotfull(so); 10218348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 10228348SEric.Yu@Sun.COM so_notify_writable(so); 10238348SEric.Yu@Sun.COM } 10248348SEric.Yu@Sun.COM } 10258348SEric.Yu@Sun.COM 10268348SEric.Yu@Sun.COM sock_upper_handle_t 10278348SEric.Yu@Sun.COM so_newconn(sock_upper_handle_t parenthandle, 10288348SEric.Yu@Sun.COM sock_lower_handle_t proto_handle, sock_downcalls_t *sock_downcalls, 10298348SEric.Yu@Sun.COM struct cred *peer_cred, pid_t peer_cpid, sock_upcalls_t **sock_upcallsp) 10308348SEric.Yu@Sun.COM { 10318348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)parenthandle; 10328348SEric.Yu@Sun.COM struct sonode *nso; 10338348SEric.Yu@Sun.COM int error; 10348348SEric.Yu@Sun.COM 10358348SEric.Yu@Sun.COM ASSERT(proto_handle != NULL); 10368348SEric.Yu@Sun.COM 10378348SEric.Yu@Sun.COM if ((so->so_state & SS_ACCEPTCONN) == 0 || 10388348SEric.Yu@Sun.COM so->so_acceptq_len >= so->so_backlog) 10398348SEric.Yu@Sun.COM return (NULL); 10408348SEric.Yu@Sun.COM 10418348SEric.Yu@Sun.COM nso = socket_newconn(so, proto_handle, sock_downcalls, SOCKET_NOSLEEP, 10428348SEric.Yu@Sun.COM &error); 10438348SEric.Yu@Sun.COM if (nso == NULL) 10448348SEric.Yu@Sun.COM return (NULL); 10458348SEric.Yu@Sun.COM 10468348SEric.Yu@Sun.COM if (peer_cred != NULL) { 10478348SEric.Yu@Sun.COM crhold(peer_cred); 10488348SEric.Yu@Sun.COM nso->so_peercred = peer_cred; 10498348SEric.Yu@Sun.COM nso->so_cpid = peer_cpid; 10508348SEric.Yu@Sun.COM } 10518348SEric.Yu@Sun.COM 10528348SEric.Yu@Sun.COM (void) so_acceptq_enqueue(so, nso); 10538348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 10548348SEric.Yu@Sun.COM so_notify_newconn(so); 10558348SEric.Yu@Sun.COM 10568348SEric.Yu@Sun.COM *sock_upcallsp = &so_upcalls; 10578348SEric.Yu@Sun.COM 10588348SEric.Yu@Sun.COM return ((sock_upper_handle_t)nso); 10598348SEric.Yu@Sun.COM } 10608348SEric.Yu@Sun.COM 10618348SEric.Yu@Sun.COM void 10628348SEric.Yu@Sun.COM so_set_prop(sock_upper_handle_t sock_handle, struct sock_proto_props *soppp) 10638348SEric.Yu@Sun.COM { 10648348SEric.Yu@Sun.COM struct sonode *so; 10658348SEric.Yu@Sun.COM 10668348SEric.Yu@Sun.COM so = (struct sonode *)sock_handle; 10678348SEric.Yu@Sun.COM 10688348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 10698348SEric.Yu@Sun.COM 10708348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_MAXBLK) 10718348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxblk = soppp->sopp_maxblk; 10728348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_WROFF) 10738348SEric.Yu@Sun.COM so->so_proto_props.sopp_wroff = soppp->sopp_wroff; 10748348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_TAIL) 10758348SEric.Yu@Sun.COM so->so_proto_props.sopp_tail = soppp->sopp_tail; 10768348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_RCVHIWAT) 10778348SEric.Yu@Sun.COM so->so_proto_props.sopp_rxhiwat = soppp->sopp_rxhiwat; 10788348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_RCVLOWAT) 10798348SEric.Yu@Sun.COM so->so_proto_props.sopp_rxlowat = soppp->sopp_rxlowat; 10808348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_MAXPSZ) 10818348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxpsz = soppp->sopp_maxpsz; 10828348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_MINPSZ) 10838348SEric.Yu@Sun.COM so->so_proto_props.sopp_minpsz = soppp->sopp_minpsz; 10848348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_ZCOPY) { 10858348SEric.Yu@Sun.COM if (soppp->sopp_zcopyflag & ZCVMSAFE) { 10868348SEric.Yu@Sun.COM so->so_proto_props.sopp_zcopyflag |= STZCVMSAFE; 10878348SEric.Yu@Sun.COM so->so_proto_props.sopp_zcopyflag &= ~STZCVMUNSAFE; 10888348SEric.Yu@Sun.COM } else if (soppp->sopp_zcopyflag & ZCVMUNSAFE) { 10898348SEric.Yu@Sun.COM so->so_proto_props.sopp_zcopyflag |= STZCVMUNSAFE; 10908348SEric.Yu@Sun.COM so->so_proto_props.sopp_zcopyflag &= ~STZCVMSAFE; 10918348SEric.Yu@Sun.COM } 10928348SEric.Yu@Sun.COM 10938348SEric.Yu@Sun.COM if (soppp->sopp_zcopyflag & COPYCACHED) { 10948348SEric.Yu@Sun.COM so->so_proto_props.sopp_zcopyflag |= STRCOPYCACHED; 10958348SEric.Yu@Sun.COM } 10968348SEric.Yu@Sun.COM } 10978348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_OOBINLINE) 10988348SEric.Yu@Sun.COM so->so_proto_props.sopp_oobinline = soppp->sopp_oobinline; 10998348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_RCVTIMER) 11008348SEric.Yu@Sun.COM so->so_proto_props.sopp_rcvtimer = soppp->sopp_rcvtimer; 11018348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_RCVTHRESH) 11028348SEric.Yu@Sun.COM so->so_proto_props.sopp_rcvthresh = soppp->sopp_rcvthresh; 11038348SEric.Yu@Sun.COM if (soppp->sopp_flags & SOCKOPT_MAXADDRLEN) 11048348SEric.Yu@Sun.COM so->so_proto_props.sopp_maxaddrlen = soppp->sopp_maxaddrlen; 11058348SEric.Yu@Sun.COM 11068348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 11078348SEric.Yu@Sun.COM 11088348SEric.Yu@Sun.COM #ifdef DEBUG 11098348SEric.Yu@Sun.COM soppp->sopp_flags &= ~(SOCKOPT_MAXBLK | SOCKOPT_WROFF | SOCKOPT_TAIL | 11108348SEric.Yu@Sun.COM SOCKOPT_RCVHIWAT | SOCKOPT_RCVLOWAT | SOCKOPT_MAXPSZ | 11118348SEric.Yu@Sun.COM SOCKOPT_ZCOPY | SOCKOPT_OOBINLINE | SOCKOPT_RCVTIMER | 11128348SEric.Yu@Sun.COM SOCKOPT_RCVTHRESH | SOCKOPT_MAXADDRLEN | SOCKOPT_MINPSZ); 11138348SEric.Yu@Sun.COM ASSERT(soppp->sopp_flags == 0); 11148348SEric.Yu@Sun.COM #endif 11158348SEric.Yu@Sun.COM } 11168348SEric.Yu@Sun.COM 11178348SEric.Yu@Sun.COM /* ARGSUSED */ 11188348SEric.Yu@Sun.COM ssize_t 11198348SEric.Yu@Sun.COM so_queue_msg(sock_upper_handle_t sock_handle, mblk_t *mp, 11208348SEric.Yu@Sun.COM size_t msg_size, int flags, int *errorp, boolean_t *force_pushp) 11218348SEric.Yu@Sun.COM { 11228348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)sock_handle; 11238348SEric.Yu@Sun.COM boolean_t force_push = B_TRUE; 11248348SEric.Yu@Sun.COM int space_left; 11258348SEric.Yu@Sun.COM sodirect_t *sodp = so->so_direct; 11268348SEric.Yu@Sun.COM 11278348SEric.Yu@Sun.COM ASSERT(errorp != NULL); 11288348SEric.Yu@Sun.COM *errorp = 0; 11298348SEric.Yu@Sun.COM if (mp == NULL) { 11308348SEric.Yu@Sun.COM if (msg_size > 0) { 11318348SEric.Yu@Sun.COM ASSERT(so->so_downcalls->sd_recv_uio != NULL); 11328348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 11338348SEric.Yu@Sun.COM /* the notify functions will drop the lock */ 11348348SEric.Yu@Sun.COM if (flags & MSG_OOB) 11358348SEric.Yu@Sun.COM so_notify_oobdata(so, IS_SO_OOB_INLINE(so)); 11368348SEric.Yu@Sun.COM else 11378348SEric.Yu@Sun.COM so_notify_data(so, msg_size); 11388348SEric.Yu@Sun.COM return (0); 11398348SEric.Yu@Sun.COM } 11408348SEric.Yu@Sun.COM /* 11418348SEric.Yu@Sun.COM * recv space check 11428348SEric.Yu@Sun.COM */ 11438348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 11448348SEric.Yu@Sun.COM space_left = so->so_rcvbuf - so->so_rcv_queued; 11458348SEric.Yu@Sun.COM if (space_left <= 0) { 11468348SEric.Yu@Sun.COM so->so_flowctrld = B_TRUE; 11478348SEric.Yu@Sun.COM *errorp = ENOSPC; 11488348SEric.Yu@Sun.COM space_left = -1; 11498348SEric.Yu@Sun.COM } 11508348SEric.Yu@Sun.COM goto done_unlock; 11518348SEric.Yu@Sun.COM } 11528348SEric.Yu@Sun.COM 11538348SEric.Yu@Sun.COM ASSERT(mp->b_next == NULL); 11548348SEric.Yu@Sun.COM ASSERT(DB_TYPE(mp) == M_DATA || DB_TYPE(mp) == M_PROTO); 11558348SEric.Yu@Sun.COM ASSERT(msg_size == msgdsize(mp)); 11568348SEric.Yu@Sun.COM 11578348SEric.Yu@Sun.COM if (flags & MSG_OOB) { 11588348SEric.Yu@Sun.COM so_queue_oob(sock_handle, mp, msg_size); 11598348SEric.Yu@Sun.COM return (0); 11608348SEric.Yu@Sun.COM } 11618348SEric.Yu@Sun.COM 11628348SEric.Yu@Sun.COM if (force_pushp != NULL) 11638348SEric.Yu@Sun.COM force_push = *force_pushp; 11648348SEric.Yu@Sun.COM 11658348SEric.Yu@Sun.COM if (DB_TYPE(mp) == M_PROTO && !__TPI_PRIM_ISALIGNED(mp->b_rptr)) { 11668348SEric.Yu@Sun.COM /* The read pointer is not aligned correctly for TPI */ 11678348SEric.Yu@Sun.COM zcmn_err(getzoneid(), CE_WARN, 11688348SEric.Yu@Sun.COM "sockfs: Unaligned TPI message received. rptr = %p\n", 11698348SEric.Yu@Sun.COM (void *)mp->b_rptr); 11708348SEric.Yu@Sun.COM freemsg(mp); 11718348SEric.Yu@Sun.COM mutex_enter(sodp->sod_lockp); 11728348SEric.Yu@Sun.COM SOD_UIOAFINI(sodp); 11738348SEric.Yu@Sun.COM mutex_exit(sodp->sod_lockp); 11748348SEric.Yu@Sun.COM 11758348SEric.Yu@Sun.COM return (so->so_rcvbuf - so->so_rcv_queued); 11768348SEric.Yu@Sun.COM } 11778348SEric.Yu@Sun.COM 11788348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 11798348SEric.Yu@Sun.COM if (so->so_state & (SS_FALLBACK_PENDING | SS_FALLBACK_COMP)) { 11808348SEric.Yu@Sun.COM SOD_DISABLE(sodp); 11818348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 11828348SEric.Yu@Sun.COM *errorp = EOPNOTSUPP; 11838348SEric.Yu@Sun.COM return (-1); 11848348SEric.Yu@Sun.COM } 11858348SEric.Yu@Sun.COM if (so->so_state & SS_CANTRCVMORE) { 11868348SEric.Yu@Sun.COM freemsg(mp); 11878348SEric.Yu@Sun.COM SOD_DISABLE(sodp); 11888348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 11898348SEric.Yu@Sun.COM return (0); 11908348SEric.Yu@Sun.COM } 11918348SEric.Yu@Sun.COM 11928348SEric.Yu@Sun.COM /* process the mblk via I/OAT if capable */ 11938348SEric.Yu@Sun.COM if (sodp != NULL && (sodp->sod_state & SOD_ENABLED)) { 11948348SEric.Yu@Sun.COM if (DB_TYPE(mp) == M_DATA) { 11958348SEric.Yu@Sun.COM (void) sod_uioa_mblk_init(sodp, mp, msg_size); 11968348SEric.Yu@Sun.COM } else { 11978348SEric.Yu@Sun.COM SOD_UIOAFINI(sodp); 11988348SEric.Yu@Sun.COM } 11998348SEric.Yu@Sun.COM } 12008348SEric.Yu@Sun.COM 12018348SEric.Yu@Sun.COM if (mp->b_next == NULL) { 12028348SEric.Yu@Sun.COM so_enqueue_msg(so, mp, msg_size); 12038348SEric.Yu@Sun.COM } else { 12048348SEric.Yu@Sun.COM do { 12058348SEric.Yu@Sun.COM mblk_t *nmp; 12068348SEric.Yu@Sun.COM 12078348SEric.Yu@Sun.COM if ((nmp = mp->b_next) != NULL) { 12088348SEric.Yu@Sun.COM mp->b_next = NULL; 12098348SEric.Yu@Sun.COM } 12108348SEric.Yu@Sun.COM so_enqueue_msg(so, mp, msgdsize(mp)); 12118348SEric.Yu@Sun.COM mp = nmp; 12128348SEric.Yu@Sun.COM } while (mp != NULL); 12138348SEric.Yu@Sun.COM } 12148348SEric.Yu@Sun.COM 12158348SEric.Yu@Sun.COM space_left = so->so_rcvbuf - so->so_rcv_queued; 12168348SEric.Yu@Sun.COM if (space_left <= 0) { 12178348SEric.Yu@Sun.COM so->so_flowctrld = B_TRUE; 12188348SEric.Yu@Sun.COM *errorp = ENOSPC; 12198348SEric.Yu@Sun.COM space_left = -1; 12208348SEric.Yu@Sun.COM } 12218348SEric.Yu@Sun.COM 12228348SEric.Yu@Sun.COM if (force_push || so->so_rcv_queued >= so->so_rcv_thresh || 12238348SEric.Yu@Sun.COM so->so_rcv_queued >= so->so_rcv_wanted || 12248348SEric.Yu@Sun.COM (sodp != NULL && so->so_rcv_queued >= sodp->sod_want)) { 12258348SEric.Yu@Sun.COM SOCKET_TIMER_CANCEL(so); 12268348SEric.Yu@Sun.COM /* 12278348SEric.Yu@Sun.COM * so_notify_data will release the lock 12288348SEric.Yu@Sun.COM */ 12298348SEric.Yu@Sun.COM so_notify_data(so, so->so_rcv_queued); 12308348SEric.Yu@Sun.COM 12318348SEric.Yu@Sun.COM if (force_pushp != NULL) 12328348SEric.Yu@Sun.COM *force_pushp = B_TRUE; 12338348SEric.Yu@Sun.COM goto done; 12348348SEric.Yu@Sun.COM } else if (so->so_rcv_timer_tid == 0) { 12358348SEric.Yu@Sun.COM /* Make sure the recv push timer is running */ 12368348SEric.Yu@Sun.COM SOCKET_TIMER_START(so); 12378348SEric.Yu@Sun.COM } 12388348SEric.Yu@Sun.COM 12398348SEric.Yu@Sun.COM done_unlock: 12408348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 12418348SEric.Yu@Sun.COM done: 12428348SEric.Yu@Sun.COM return (space_left); 12438348SEric.Yu@Sun.COM } 12448348SEric.Yu@Sun.COM 12458348SEric.Yu@Sun.COM /* 12468348SEric.Yu@Sun.COM * Set the offset of where the oob data is relative to the bytes in 12478348SEric.Yu@Sun.COM * queued. Also generate SIGURG 12488348SEric.Yu@Sun.COM */ 12498348SEric.Yu@Sun.COM void 12508348SEric.Yu@Sun.COM so_signal_oob(sock_upper_handle_t sock_handle, ssize_t offset) 12518348SEric.Yu@Sun.COM { 12528348SEric.Yu@Sun.COM struct sonode *so; 12538348SEric.Yu@Sun.COM 12548348SEric.Yu@Sun.COM ASSERT(offset >= 0); 12558348SEric.Yu@Sun.COM so = (struct sonode *)sock_handle; 12568348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 12578348SEric.Yu@Sun.COM SOD_UIOAFINI(so->so_direct); 12588348SEric.Yu@Sun.COM 12598348SEric.Yu@Sun.COM /* 12608348SEric.Yu@Sun.COM * New urgent data on the way so forget about any old 12618348SEric.Yu@Sun.COM * urgent data. 12628348SEric.Yu@Sun.COM */ 12638348SEric.Yu@Sun.COM so->so_state &= ~(SS_HAVEOOBDATA|SS_HADOOBDATA); 12648348SEric.Yu@Sun.COM 12658348SEric.Yu@Sun.COM /* 12668348SEric.Yu@Sun.COM * Record that urgent data is pending. 12678348SEric.Yu@Sun.COM */ 12688348SEric.Yu@Sun.COM so->so_state |= SS_OOBPEND; 12698348SEric.Yu@Sun.COM 12708348SEric.Yu@Sun.COM if (so->so_oobmsg != NULL) { 12718348SEric.Yu@Sun.COM dprintso(so, 1, ("sock: discarding old oob\n")); 12728348SEric.Yu@Sun.COM freemsg(so->so_oobmsg); 12738348SEric.Yu@Sun.COM so->so_oobmsg = NULL; 12748348SEric.Yu@Sun.COM } 12758348SEric.Yu@Sun.COM 12768348SEric.Yu@Sun.COM /* 12778348SEric.Yu@Sun.COM * set the offset where the urgent byte is 12788348SEric.Yu@Sun.COM */ 12798348SEric.Yu@Sun.COM so->so_oobmark = so->so_rcv_queued + offset; 12808348SEric.Yu@Sun.COM if (so->so_oobmark == 0) 12818348SEric.Yu@Sun.COM so->so_state |= SS_RCVATMARK; 12828348SEric.Yu@Sun.COM else 12838348SEric.Yu@Sun.COM so->so_state &= ~SS_RCVATMARK; 12848348SEric.Yu@Sun.COM 12858348SEric.Yu@Sun.COM so_notify_oobsig(so); 12868348SEric.Yu@Sun.COM } 12878348SEric.Yu@Sun.COM 12888348SEric.Yu@Sun.COM /* 12898348SEric.Yu@Sun.COM * Queue the OOB byte 12908348SEric.Yu@Sun.COM */ 12918348SEric.Yu@Sun.COM static void 12928348SEric.Yu@Sun.COM so_queue_oob(sock_upper_handle_t sock_handle, mblk_t *mp, size_t len) 12938348SEric.Yu@Sun.COM { 12948348SEric.Yu@Sun.COM struct sonode *so; 12958348SEric.Yu@Sun.COM 12968348SEric.Yu@Sun.COM so = (struct sonode *)sock_handle; 12978348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 12988348SEric.Yu@Sun.COM SOD_UIOAFINI(so->so_direct); 12998348SEric.Yu@Sun.COM 13008348SEric.Yu@Sun.COM ASSERT(mp != NULL); 13018348SEric.Yu@Sun.COM if (!IS_SO_OOB_INLINE(so)) { 13028348SEric.Yu@Sun.COM so->so_oobmsg = mp; 13038348SEric.Yu@Sun.COM so->so_state |= SS_HAVEOOBDATA; 13048348SEric.Yu@Sun.COM } else { 13058348SEric.Yu@Sun.COM so_enqueue_msg(so, mp, len); 13068348SEric.Yu@Sun.COM } 13078348SEric.Yu@Sun.COM 13088348SEric.Yu@Sun.COM so_notify_oobdata(so, IS_SO_OOB_INLINE(so)); 13098348SEric.Yu@Sun.COM } 13108348SEric.Yu@Sun.COM 13118348SEric.Yu@Sun.COM int 13128348SEric.Yu@Sun.COM so_close(struct sonode *so, int flag, struct cred *cr) 13138348SEric.Yu@Sun.COM { 13148348SEric.Yu@Sun.COM int error; 13158348SEric.Yu@Sun.COM 13168348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_close)(so->so_proto_handle, flag, cr); 13178348SEric.Yu@Sun.COM 13188348SEric.Yu@Sun.COM /* 13198348SEric.Yu@Sun.COM * At this point there will be no more upcalls from the protocol 13208348SEric.Yu@Sun.COM */ 13218348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 13228399SRao.Shoaib@Sun.COM 13238399SRao.Shoaib@Sun.COM ASSERT(so_verify_oobstate(so)); 13248399SRao.Shoaib@Sun.COM 13258348SEric.Yu@Sun.COM so_rcv_flush(so); 13268348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 13278348SEric.Yu@Sun.COM 13288348SEric.Yu@Sun.COM return (error); 13298348SEric.Yu@Sun.COM } 13308348SEric.Yu@Sun.COM 13318348SEric.Yu@Sun.COM void 13328348SEric.Yu@Sun.COM so_zcopy_notify(sock_upper_handle_t sock_handle) 13338348SEric.Yu@Sun.COM { 13348348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)sock_handle; 13358348SEric.Yu@Sun.COM 13368348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 13378348SEric.Yu@Sun.COM so->so_copyflag |= STZCNOTIFY; 13388348SEric.Yu@Sun.COM cv_broadcast(&so->so_copy_cv); 13398348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 13408348SEric.Yu@Sun.COM } 13418348SEric.Yu@Sun.COM 13428348SEric.Yu@Sun.COM void 13438348SEric.Yu@Sun.COM so_set_error(sock_upper_handle_t sock_handle, int error) 13448348SEric.Yu@Sun.COM { 13458348SEric.Yu@Sun.COM struct sonode *so = (struct sonode *)sock_handle; 13468348SEric.Yu@Sun.COM 13478348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 13488348SEric.Yu@Sun.COM 13498348SEric.Yu@Sun.COM soseterror(so, error); 13508348SEric.Yu@Sun.COM 13518348SEric.Yu@Sun.COM so_notify_error(so); 13528348SEric.Yu@Sun.COM } 13538348SEric.Yu@Sun.COM 13548348SEric.Yu@Sun.COM /* 13558348SEric.Yu@Sun.COM * so_recvmsg - read data from the socket 13568348SEric.Yu@Sun.COM * 13578348SEric.Yu@Sun.COM * There are two ways of obtaining data; either we ask the protocol to 13588348SEric.Yu@Sun.COM * copy directly into the supplied buffer, or we copy data from the 13598348SEric.Yu@Sun.COM * sonode's receive queue. The decision which one to use depends on 13608348SEric.Yu@Sun.COM * whether the protocol has a sd_recv_uio down call. 13618348SEric.Yu@Sun.COM */ 13628348SEric.Yu@Sun.COM int 13638348SEric.Yu@Sun.COM so_recvmsg(struct sonode *so, struct nmsghdr *msg, struct uio *uiop, 13648348SEric.Yu@Sun.COM struct cred *cr) 13658348SEric.Yu@Sun.COM { 13668348SEric.Yu@Sun.COM rval_t rval; 13678348SEric.Yu@Sun.COM int flags = 0; 13688348SEric.Yu@Sun.COM t_uscalar_t controllen, namelen; 13698348SEric.Yu@Sun.COM int error = 0; 13708348SEric.Yu@Sun.COM int ret; 13718348SEric.Yu@Sun.COM mblk_t *mctlp = NULL; 13728348SEric.Yu@Sun.COM union T_primitives *tpr; 13738348SEric.Yu@Sun.COM void *control; 13748348SEric.Yu@Sun.COM ssize_t saved_resid; 13758348SEric.Yu@Sun.COM struct uio *suiop; 13768348SEric.Yu@Sun.COM 13778348SEric.Yu@Sun.COM SO_BLOCK_FALLBACK(so, SOP_RECVMSG(so, msg, uiop, cr)); 13788348SEric.Yu@Sun.COM 13798348SEric.Yu@Sun.COM if ((so->so_state & (SS_ISCONNECTED|SS_CANTRCVMORE)) == 0 && 13808348SEric.Yu@Sun.COM (so->so_mode & SM_CONNREQUIRED)) { 13818348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 13828348SEric.Yu@Sun.COM return (ENOTCONN); 13838348SEric.Yu@Sun.COM } 13848348SEric.Yu@Sun.COM 13858348SEric.Yu@Sun.COM if (msg->msg_flags & MSG_PEEK) 13868348SEric.Yu@Sun.COM msg->msg_flags &= ~MSG_WAITALL; 13878348SEric.Yu@Sun.COM 13888348SEric.Yu@Sun.COM if (so->so_mode & SM_ATOMIC) 13898348SEric.Yu@Sun.COM msg->msg_flags |= MSG_TRUNC; 13908348SEric.Yu@Sun.COM 13918348SEric.Yu@Sun.COM if (msg->msg_flags & MSG_OOB) { 13928348SEric.Yu@Sun.COM if ((so->so_mode & SM_EXDATA) == 0) { 13938348SEric.Yu@Sun.COM error = EOPNOTSUPP; 13948348SEric.Yu@Sun.COM } else if (so->so_downcalls->sd_recv_uio != NULL) { 13958348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_recv_uio) 13968348SEric.Yu@Sun.COM (so->so_proto_handle, uiop, msg, cr); 13978348SEric.Yu@Sun.COM } else { 13988348SEric.Yu@Sun.COM error = sorecvoob(so, msg, uiop, msg->msg_flags, 13998348SEric.Yu@Sun.COM IS_SO_OOB_INLINE(so)); 14008348SEric.Yu@Sun.COM } 14018348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 14028348SEric.Yu@Sun.COM return (error); 14038348SEric.Yu@Sun.COM } 14048348SEric.Yu@Sun.COM 14058348SEric.Yu@Sun.COM /* 14068348SEric.Yu@Sun.COM * If the protocol has the recv down call, then pass the request 14078348SEric.Yu@Sun.COM * down. 14088348SEric.Yu@Sun.COM */ 14098348SEric.Yu@Sun.COM if (so->so_downcalls->sd_recv_uio != NULL) { 14108348SEric.Yu@Sun.COM error = (*so->so_downcalls->sd_recv_uio) 14118348SEric.Yu@Sun.COM (so->so_proto_handle, uiop, msg, cr); 14128348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 14138348SEric.Yu@Sun.COM return (error); 14148348SEric.Yu@Sun.COM } 14158348SEric.Yu@Sun.COM 14168348SEric.Yu@Sun.COM /* 14178348SEric.Yu@Sun.COM * Reading data from the socket buffer 14188348SEric.Yu@Sun.COM */ 14198348SEric.Yu@Sun.COM flags = msg->msg_flags; 14208348SEric.Yu@Sun.COM msg->msg_flags = 0; 14218348SEric.Yu@Sun.COM 14228348SEric.Yu@Sun.COM /* 14238348SEric.Yu@Sun.COM * Set msg_controllen and msg_namelen to zero here to make it 14248348SEric.Yu@Sun.COM * simpler in the cases that no control or name is returned. 14258348SEric.Yu@Sun.COM */ 14268348SEric.Yu@Sun.COM controllen = msg->msg_controllen; 14278348SEric.Yu@Sun.COM namelen = msg->msg_namelen; 14288348SEric.Yu@Sun.COM msg->msg_controllen = 0; 14298348SEric.Yu@Sun.COM msg->msg_namelen = 0; 14308348SEric.Yu@Sun.COM 14318348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 14328348SEric.Yu@Sun.COM /* Set SOREADLOCKED */ 14338348SEric.Yu@Sun.COM error = so_lock_read_intr(so, 14348348SEric.Yu@Sun.COM uiop->uio_fmode | ((flags & MSG_DONTWAIT) ? FNONBLOCK : 0)); 14358348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 14368348SEric.Yu@Sun.COM if (error) { 14378348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 14388348SEric.Yu@Sun.COM return (error); 14398348SEric.Yu@Sun.COM } 14408348SEric.Yu@Sun.COM 14418348SEric.Yu@Sun.COM suiop = sod_rcv_init(so, flags, &uiop); 14428348SEric.Yu@Sun.COM retry: 14438348SEric.Yu@Sun.COM saved_resid = uiop->uio_resid; 14448348SEric.Yu@Sun.COM error = so_dequeue_msg(so, &mctlp, uiop, &rval, flags); 14458348SEric.Yu@Sun.COM if (error != 0) { 14468348SEric.Yu@Sun.COM goto out; 14478348SEric.Yu@Sun.COM } 14488348SEric.Yu@Sun.COM /* 14498348SEric.Yu@Sun.COM * For datagrams the MOREDATA flag is used to set MSG_TRUNC. 14508348SEric.Yu@Sun.COM * For non-datagrams MOREDATA is used to set MSG_EOR. 14518348SEric.Yu@Sun.COM */ 14528348SEric.Yu@Sun.COM ASSERT(!(rval.r_val1 & MORECTL)); 14538348SEric.Yu@Sun.COM if ((rval.r_val1 & MOREDATA) && (so->so_mode & SM_ATOMIC)) 14548348SEric.Yu@Sun.COM msg->msg_flags |= MSG_TRUNC; 14558348SEric.Yu@Sun.COM if (mctlp == NULL) { 14568348SEric.Yu@Sun.COM dprintso(so, 1, ("so_recvmsg: got M_DATA\n")); 14578348SEric.Yu@Sun.COM 14588348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 14598348SEric.Yu@Sun.COM /* Set MSG_EOR based on MOREDATA */ 14608348SEric.Yu@Sun.COM if (!(rval.r_val1 & MOREDATA)) { 14618348SEric.Yu@Sun.COM if (so->so_state & SS_SAVEDEOR) { 14628348SEric.Yu@Sun.COM msg->msg_flags |= MSG_EOR; 14638348SEric.Yu@Sun.COM so->so_state &= ~SS_SAVEDEOR; 14648348SEric.Yu@Sun.COM } 14658348SEric.Yu@Sun.COM } 14668348SEric.Yu@Sun.COM /* 14678348SEric.Yu@Sun.COM * If some data was received (i.e. not EOF) and the 14688348SEric.Yu@Sun.COM * read/recv* has not been satisfied wait for some more. 14698348SEric.Yu@Sun.COM */ 14708348SEric.Yu@Sun.COM if ((flags & MSG_WAITALL) && !(msg->msg_flags & MSG_EOR) && 14718348SEric.Yu@Sun.COM uiop->uio_resid != saved_resid && uiop->uio_resid > 0) { 14728348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 14738348SEric.Yu@Sun.COM goto retry; 14748348SEric.Yu@Sun.COM } 14758348SEric.Yu@Sun.COM 14768348SEric.Yu@Sun.COM goto out_locked; 14778348SEric.Yu@Sun.COM } 14788348SEric.Yu@Sun.COM /* strsock_proto has already verified length and alignment */ 14798348SEric.Yu@Sun.COM tpr = (union T_primitives *)mctlp->b_rptr; 14808348SEric.Yu@Sun.COM dprintso(so, 1, ("so_recvmsg: type %d\n", tpr->type)); 14818348SEric.Yu@Sun.COM switch (tpr->type) { 14828348SEric.Yu@Sun.COM case T_DATA_IND: { 14838348SEric.Yu@Sun.COM /* 14848348SEric.Yu@Sun.COM * Set msg_flags to MSG_EOR based on 14858348SEric.Yu@Sun.COM * MORE_flag and MOREDATA. 14868348SEric.Yu@Sun.COM */ 14878348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 14888348SEric.Yu@Sun.COM so->so_state &= ~SS_SAVEDEOR; 14898348SEric.Yu@Sun.COM if (!(tpr->data_ind.MORE_flag & 1)) { 14908348SEric.Yu@Sun.COM if (!(rval.r_val1 & MOREDATA)) 14918348SEric.Yu@Sun.COM msg->msg_flags |= MSG_EOR; 14928348SEric.Yu@Sun.COM else 14938348SEric.Yu@Sun.COM so->so_state |= SS_SAVEDEOR; 14948348SEric.Yu@Sun.COM } 14958348SEric.Yu@Sun.COM freemsg(mctlp); 14968348SEric.Yu@Sun.COM /* 14978348SEric.Yu@Sun.COM * If some data was received (i.e. not EOF) and the 14988348SEric.Yu@Sun.COM * read/recv* has not been satisfied wait for some more. 14998348SEric.Yu@Sun.COM */ 15008348SEric.Yu@Sun.COM if ((flags & MSG_WAITALL) && !(msg->msg_flags & MSG_EOR) && 15018348SEric.Yu@Sun.COM uiop->uio_resid != saved_resid && uiop->uio_resid > 0) { 15028348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 15038348SEric.Yu@Sun.COM goto retry; 15048348SEric.Yu@Sun.COM } 15058348SEric.Yu@Sun.COM goto out_locked; 15068348SEric.Yu@Sun.COM } 15078348SEric.Yu@Sun.COM case T_UNITDATA_IND: { 15088348SEric.Yu@Sun.COM void *addr; 15098348SEric.Yu@Sun.COM t_uscalar_t addrlen; 15108348SEric.Yu@Sun.COM void *abuf; 15118348SEric.Yu@Sun.COM t_uscalar_t optlen; 15128348SEric.Yu@Sun.COM void *opt; 15138348SEric.Yu@Sun.COM 15148348SEric.Yu@Sun.COM if (namelen != 0) { 15158348SEric.Yu@Sun.COM /* Caller wants source address */ 15168348SEric.Yu@Sun.COM addrlen = tpr->unitdata_ind.SRC_length; 15178348SEric.Yu@Sun.COM addr = sogetoff(mctlp, tpr->unitdata_ind.SRC_offset, 15188348SEric.Yu@Sun.COM addrlen, 1); 15198348SEric.Yu@Sun.COM if (addr == NULL) { 15208348SEric.Yu@Sun.COM freemsg(mctlp); 15218348SEric.Yu@Sun.COM error = EPROTO; 15228348SEric.Yu@Sun.COM eprintsoline(so, error); 15238348SEric.Yu@Sun.COM goto out; 15248348SEric.Yu@Sun.COM } 15258348SEric.Yu@Sun.COM ASSERT(so->so_family != AF_UNIX); 15268348SEric.Yu@Sun.COM } 15278348SEric.Yu@Sun.COM optlen = tpr->unitdata_ind.OPT_length; 15288348SEric.Yu@Sun.COM if (optlen != 0) { 15298348SEric.Yu@Sun.COM t_uscalar_t ncontrollen; 15308348SEric.Yu@Sun.COM 15318348SEric.Yu@Sun.COM /* 15328348SEric.Yu@Sun.COM * Extract any source address option. 15338348SEric.Yu@Sun.COM * Determine how large cmsg buffer is needed. 15348348SEric.Yu@Sun.COM */ 15358348SEric.Yu@Sun.COM opt = sogetoff(mctlp, tpr->unitdata_ind.OPT_offset, 15368348SEric.Yu@Sun.COM optlen, __TPI_ALIGN_SIZE); 15378348SEric.Yu@Sun.COM 15388348SEric.Yu@Sun.COM if (opt == NULL) { 15398348SEric.Yu@Sun.COM freemsg(mctlp); 15408348SEric.Yu@Sun.COM error = EPROTO; 15418348SEric.Yu@Sun.COM eprintsoline(so, error); 15428348SEric.Yu@Sun.COM goto out; 15438348SEric.Yu@Sun.COM } 15448348SEric.Yu@Sun.COM if (so->so_family == AF_UNIX) 15458348SEric.Yu@Sun.COM so_getopt_srcaddr(opt, optlen, &addr, &addrlen); 15468348SEric.Yu@Sun.COM ncontrollen = so_cmsglen(mctlp, opt, optlen, 15478348SEric.Yu@Sun.COM !(flags & MSG_XPG4_2)); 15488348SEric.Yu@Sun.COM if (controllen != 0) 15498348SEric.Yu@Sun.COM controllen = ncontrollen; 15508348SEric.Yu@Sun.COM else if (ncontrollen != 0) 15518348SEric.Yu@Sun.COM msg->msg_flags |= MSG_CTRUNC; 15528348SEric.Yu@Sun.COM } else { 15538348SEric.Yu@Sun.COM controllen = 0; 15548348SEric.Yu@Sun.COM } 15558348SEric.Yu@Sun.COM 15568348SEric.Yu@Sun.COM if (namelen != 0) { 15578348SEric.Yu@Sun.COM /* 15588348SEric.Yu@Sun.COM * Return address to caller. 15598348SEric.Yu@Sun.COM * Caller handles truncation if length 15608348SEric.Yu@Sun.COM * exceeds msg_namelen. 15618348SEric.Yu@Sun.COM * NOTE: AF_UNIX NUL termination is ensured by 15628348SEric.Yu@Sun.COM * the sender's copyin_name(). 15638348SEric.Yu@Sun.COM */ 15648348SEric.Yu@Sun.COM abuf = kmem_alloc(addrlen, KM_SLEEP); 15658348SEric.Yu@Sun.COM 15668348SEric.Yu@Sun.COM bcopy(addr, abuf, addrlen); 15678348SEric.Yu@Sun.COM msg->msg_name = abuf; 15688348SEric.Yu@Sun.COM msg->msg_namelen = addrlen; 15698348SEric.Yu@Sun.COM } 15708348SEric.Yu@Sun.COM 15718348SEric.Yu@Sun.COM if (controllen != 0) { 15728348SEric.Yu@Sun.COM /* 15738348SEric.Yu@Sun.COM * Return control msg to caller. 15748348SEric.Yu@Sun.COM * Caller handles truncation if length 15758348SEric.Yu@Sun.COM * exceeds msg_controllen. 15768348SEric.Yu@Sun.COM */ 15778348SEric.Yu@Sun.COM control = kmem_zalloc(controllen, KM_SLEEP); 15788348SEric.Yu@Sun.COM 15798348SEric.Yu@Sun.COM error = so_opt2cmsg(mctlp, opt, optlen, 15808348SEric.Yu@Sun.COM !(flags & MSG_XPG4_2), control, controllen); 15818348SEric.Yu@Sun.COM if (error) { 15828348SEric.Yu@Sun.COM freemsg(mctlp); 15838348SEric.Yu@Sun.COM if (msg->msg_namelen != 0) 15848348SEric.Yu@Sun.COM kmem_free(msg->msg_name, 15858348SEric.Yu@Sun.COM msg->msg_namelen); 15868348SEric.Yu@Sun.COM kmem_free(control, controllen); 15878348SEric.Yu@Sun.COM eprintsoline(so, error); 15888348SEric.Yu@Sun.COM goto out; 15898348SEric.Yu@Sun.COM } 15908348SEric.Yu@Sun.COM msg->msg_control = control; 15918348SEric.Yu@Sun.COM msg->msg_controllen = controllen; 15928348SEric.Yu@Sun.COM } 15938348SEric.Yu@Sun.COM 15948348SEric.Yu@Sun.COM freemsg(mctlp); 15958348SEric.Yu@Sun.COM goto out; 15968348SEric.Yu@Sun.COM } 15978348SEric.Yu@Sun.COM case T_OPTDATA_IND: { 15988348SEric.Yu@Sun.COM struct T_optdata_req *tdr; 15998348SEric.Yu@Sun.COM void *opt; 16008348SEric.Yu@Sun.COM t_uscalar_t optlen; 16018348SEric.Yu@Sun.COM 16028348SEric.Yu@Sun.COM tdr = (struct T_optdata_req *)mctlp->b_rptr; 16038348SEric.Yu@Sun.COM optlen = tdr->OPT_length; 16048348SEric.Yu@Sun.COM if (optlen != 0) { 16058348SEric.Yu@Sun.COM t_uscalar_t ncontrollen; 16068348SEric.Yu@Sun.COM /* 16078348SEric.Yu@Sun.COM * Determine how large cmsg buffer is needed. 16088348SEric.Yu@Sun.COM */ 16098348SEric.Yu@Sun.COM opt = sogetoff(mctlp, 16108348SEric.Yu@Sun.COM tpr->optdata_ind.OPT_offset, optlen, 16118348SEric.Yu@Sun.COM __TPI_ALIGN_SIZE); 16128348SEric.Yu@Sun.COM 16138348SEric.Yu@Sun.COM if (opt == NULL) { 16148348SEric.Yu@Sun.COM freemsg(mctlp); 16158348SEric.Yu@Sun.COM error = EPROTO; 16168348SEric.Yu@Sun.COM eprintsoline(so, error); 16178348SEric.Yu@Sun.COM goto out; 16188348SEric.Yu@Sun.COM } 16198348SEric.Yu@Sun.COM 16208348SEric.Yu@Sun.COM ncontrollen = so_cmsglen(mctlp, opt, optlen, 16218348SEric.Yu@Sun.COM !(flags & MSG_XPG4_2)); 16228348SEric.Yu@Sun.COM if (controllen != 0) 16238348SEric.Yu@Sun.COM controllen = ncontrollen; 16248348SEric.Yu@Sun.COM else if (ncontrollen != 0) 16258348SEric.Yu@Sun.COM msg->msg_flags |= MSG_CTRUNC; 16268348SEric.Yu@Sun.COM } else { 16278348SEric.Yu@Sun.COM controllen = 0; 16288348SEric.Yu@Sun.COM } 16298348SEric.Yu@Sun.COM 16308348SEric.Yu@Sun.COM if (controllen != 0) { 16318348SEric.Yu@Sun.COM /* 16328348SEric.Yu@Sun.COM * Return control msg to caller. 16338348SEric.Yu@Sun.COM * Caller handles truncation if length 16348348SEric.Yu@Sun.COM * exceeds msg_controllen. 16358348SEric.Yu@Sun.COM */ 16368348SEric.Yu@Sun.COM control = kmem_zalloc(controllen, KM_SLEEP); 16378348SEric.Yu@Sun.COM 16388348SEric.Yu@Sun.COM error = so_opt2cmsg(mctlp, opt, optlen, 16398348SEric.Yu@Sun.COM !(flags & MSG_XPG4_2), control, controllen); 16408348SEric.Yu@Sun.COM if (error) { 16418348SEric.Yu@Sun.COM freemsg(mctlp); 16428348SEric.Yu@Sun.COM kmem_free(control, controllen); 16438348SEric.Yu@Sun.COM eprintsoline(so, error); 16448348SEric.Yu@Sun.COM goto out; 16458348SEric.Yu@Sun.COM } 16468348SEric.Yu@Sun.COM msg->msg_control = control; 16478348SEric.Yu@Sun.COM msg->msg_controllen = controllen; 16488348SEric.Yu@Sun.COM } 16498348SEric.Yu@Sun.COM 16508348SEric.Yu@Sun.COM /* 16518348SEric.Yu@Sun.COM * Set msg_flags to MSG_EOR based on 16528348SEric.Yu@Sun.COM * DATA_flag and MOREDATA. 16538348SEric.Yu@Sun.COM */ 16548348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 16558348SEric.Yu@Sun.COM so->so_state &= ~SS_SAVEDEOR; 16568348SEric.Yu@Sun.COM if (!(tpr->data_ind.MORE_flag & 1)) { 16578348SEric.Yu@Sun.COM if (!(rval.r_val1 & MOREDATA)) 16588348SEric.Yu@Sun.COM msg->msg_flags |= MSG_EOR; 16598348SEric.Yu@Sun.COM else 16608348SEric.Yu@Sun.COM so->so_state |= SS_SAVEDEOR; 16618348SEric.Yu@Sun.COM } 16628348SEric.Yu@Sun.COM freemsg(mctlp); 16638348SEric.Yu@Sun.COM /* 16648348SEric.Yu@Sun.COM * If some data was received (i.e. not EOF) and the 16658348SEric.Yu@Sun.COM * read/recv* has not been satisfied wait for some more. 16668348SEric.Yu@Sun.COM * Not possible to wait if control info was received. 16678348SEric.Yu@Sun.COM */ 16688348SEric.Yu@Sun.COM if ((flags & MSG_WAITALL) && !(msg->msg_flags & MSG_EOR) && 16698348SEric.Yu@Sun.COM controllen == 0 && 16708348SEric.Yu@Sun.COM uiop->uio_resid != saved_resid && uiop->uio_resid > 0) { 16718348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 16728348SEric.Yu@Sun.COM goto retry; 16738348SEric.Yu@Sun.COM } 16748348SEric.Yu@Sun.COM goto out_locked; 16758348SEric.Yu@Sun.COM } 16768348SEric.Yu@Sun.COM default: 16778348SEric.Yu@Sun.COM cmn_err(CE_CONT, "so_recvmsg bad type %x \n", 16788348SEric.Yu@Sun.COM tpr->type); 16798348SEric.Yu@Sun.COM freemsg(mctlp); 16808348SEric.Yu@Sun.COM error = EPROTO; 16818348SEric.Yu@Sun.COM ASSERT(0); 16828348SEric.Yu@Sun.COM } 16838348SEric.Yu@Sun.COM out: 16848348SEric.Yu@Sun.COM mutex_enter(&so->so_lock); 16858348SEric.Yu@Sun.COM out_locked: 16868348SEric.Yu@Sun.COM /* The sod_lockp pointers to the sonode so_lock */ 16878348SEric.Yu@Sun.COM ret = sod_rcv_done(so, suiop, uiop); 16888348SEric.Yu@Sun.COM if (ret != 0 && error == 0) 16898348SEric.Yu@Sun.COM error = ret; 16908348SEric.Yu@Sun.COM 16918348SEric.Yu@Sun.COM so_unlock_read(so); /* Clear SOREADLOCKED */ 16928348SEric.Yu@Sun.COM mutex_exit(&so->so_lock); 16938348SEric.Yu@Sun.COM 16948348SEric.Yu@Sun.COM SO_UNBLOCK_FALLBACK(so); 16958348SEric.Yu@Sun.COM 16968348SEric.Yu@Sun.COM return (error); 16978348SEric.Yu@Sun.COM } 16988348SEric.Yu@Sun.COM 16998348SEric.Yu@Sun.COM sonodeops_t so_sonodeops = { 17008348SEric.Yu@Sun.COM so_init, /* sop_init */ 17018348SEric.Yu@Sun.COM so_accept, /* sop_accept */ 17028348SEric.Yu@Sun.COM so_bind, /* sop_bind */ 17038348SEric.Yu@Sun.COM so_listen, /* sop_listen */ 17048348SEric.Yu@Sun.COM so_connect, /* sop_connect */ 17058348SEric.Yu@Sun.COM so_recvmsg, /* sop_recvmsg */ 17068348SEric.Yu@Sun.COM so_sendmsg, /* sop_sendmsg */ 17078348SEric.Yu@Sun.COM so_sendmblk, /* sop_sendmblk */ 17088348SEric.Yu@Sun.COM so_getpeername, /* sop_getpeername */ 17098348SEric.Yu@Sun.COM so_getsockname, /* sop_getsockname */ 17108348SEric.Yu@Sun.COM so_shutdown, /* sop_shutdown */ 17118348SEric.Yu@Sun.COM so_getsockopt, /* sop_getsockopt */ 17128348SEric.Yu@Sun.COM so_setsockopt, /* sop_setsockopt */ 17138348SEric.Yu@Sun.COM so_ioctl, /* sop_ioctl */ 17148348SEric.Yu@Sun.COM so_poll, /* sop_poll */ 17158348SEric.Yu@Sun.COM so_close, /* sop_close */ 17168348SEric.Yu@Sun.COM }; 17178348SEric.Yu@Sun.COM 17188348SEric.Yu@Sun.COM sock_upcalls_t so_upcalls = { 17198348SEric.Yu@Sun.COM so_newconn, 17208348SEric.Yu@Sun.COM so_connected, 17218348SEric.Yu@Sun.COM so_disconnected, 17228348SEric.Yu@Sun.COM so_opctl, 17238348SEric.Yu@Sun.COM so_queue_msg, 17248348SEric.Yu@Sun.COM so_set_prop, 17258348SEric.Yu@Sun.COM so_txq_full, 17268348SEric.Yu@Sun.COM so_signal_oob, 17278348SEric.Yu@Sun.COM so_zcopy_notify, 17288348SEric.Yu@Sun.COM so_set_error 17298348SEric.Yu@Sun.COM }; 1730