xref: /onnv-gate/usr/src/uts/common/fs/sockfs/sockcommon_sops.c (revision 8465:f9812c9a23b9)
18348SEric.Yu@Sun.COM /*
28348SEric.Yu@Sun.COM  * CDDL HEADER START
38348SEric.Yu@Sun.COM  *
48348SEric.Yu@Sun.COM  * The contents of this file are subject to the terms of the
58348SEric.Yu@Sun.COM  * Common Development and Distribution License (the "License").
68348SEric.Yu@Sun.COM  * You may not use this file except in compliance with the License.
78348SEric.Yu@Sun.COM  *
88348SEric.Yu@Sun.COM  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
98348SEric.Yu@Sun.COM  * or http://www.opensolaris.org/os/licensing.
108348SEric.Yu@Sun.COM  * See the License for the specific language governing permissions
118348SEric.Yu@Sun.COM  * and limitations under the License.
128348SEric.Yu@Sun.COM  *
138348SEric.Yu@Sun.COM  * When distributing Covered Code, include this CDDL HEADER in each
148348SEric.Yu@Sun.COM  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
158348SEric.Yu@Sun.COM  * If applicable, add the following below this CDDL HEADER, with the
168348SEric.Yu@Sun.COM  * fields enclosed by brackets "[]" replaced with your own identifying
178348SEric.Yu@Sun.COM  * information: Portions Copyright [yyyy] [name of copyright owner]
188348SEric.Yu@Sun.COM  *
198348SEric.Yu@Sun.COM  * CDDL HEADER END
208348SEric.Yu@Sun.COM  */
218348SEric.Yu@Sun.COM 
228348SEric.Yu@Sun.COM /*
238348SEric.Yu@Sun.COM  * Copyright 2008 Sun Microsystems, Inc.  All rights reserved.
248348SEric.Yu@Sun.COM  * Use is subject to license terms.
258348SEric.Yu@Sun.COM  */
268348SEric.Yu@Sun.COM 
278348SEric.Yu@Sun.COM #pragma ident	"@(#)sockcommon_sops.c	1.1	07/06/14 SMI"
288348SEric.Yu@Sun.COM 
298348SEric.Yu@Sun.COM #include <sys/types.h>
308348SEric.Yu@Sun.COM #include <sys/param.h>
318348SEric.Yu@Sun.COM #include <sys/systm.h>
328348SEric.Yu@Sun.COM #include <sys/sysmacros.h>
338348SEric.Yu@Sun.COM #include <sys/debug.h>
348348SEric.Yu@Sun.COM #include <sys/cmn_err.h>
358348SEric.Yu@Sun.COM 
368348SEric.Yu@Sun.COM #include <sys/stropts.h>
378348SEric.Yu@Sun.COM #include <sys/socket.h>
388348SEric.Yu@Sun.COM #include <sys/socketvar.h>
398348SEric.Yu@Sun.COM 
408348SEric.Yu@Sun.COM #define	_SUN_TPI_VERSION	2
418348SEric.Yu@Sun.COM #include <sys/tihdr.h>
428348SEric.Yu@Sun.COM #include <sys/sockio.h>
438348SEric.Yu@Sun.COM #include <sys/sodirect.h>
448348SEric.Yu@Sun.COM #include <sys/kmem_impl.h>
458348SEric.Yu@Sun.COM 
468348SEric.Yu@Sun.COM #include <sys/strsubr.h>
478348SEric.Yu@Sun.COM #include <sys/strsun.h>
488348SEric.Yu@Sun.COM #include <sys/ddi.h>
498348SEric.Yu@Sun.COM #include <netinet/in.h>
508348SEric.Yu@Sun.COM #include <inet/ip.h>
518348SEric.Yu@Sun.COM 
528348SEric.Yu@Sun.COM #include <fs/sockfs/sockcommon.h>
538348SEric.Yu@Sun.COM 
548348SEric.Yu@Sun.COM #include <sys/socket_proto.h>
558348SEric.Yu@Sun.COM 
568348SEric.Yu@Sun.COM #include <fs/sockfs/socktpi_impl.h>
578348SEric.Yu@Sun.COM #include <sys/tihdr.h>
588348SEric.Yu@Sun.COM #include <fs/sockfs/nl7c.h>
598348SEric.Yu@Sun.COM #include <inet/kssl/ksslapi.h>
608348SEric.Yu@Sun.COM 
618348SEric.Yu@Sun.COM 
628348SEric.Yu@Sun.COM extern int xnet_skip_checks;
638348SEric.Yu@Sun.COM extern int xnet_check_print;
648348SEric.Yu@Sun.COM 
658348SEric.Yu@Sun.COM static void so_queue_oob(sock_upper_handle_t, mblk_t *, size_t);
668348SEric.Yu@Sun.COM 
678348SEric.Yu@Sun.COM 
/*
 * Placeholder accept operation: every argument is ignored and the call
 * always fails with EOPNOTSUPP.
 */
/*ARGSUSED*/
int
so_accept_notsupp(struct sonode *lso, int fflag,
    struct cred *cr, struct sonode **nsop)
{
	return (EOPNOTSUPP);
}
758348SEric.Yu@Sun.COM 
/*
 * Placeholder listen operation: every argument is ignored and the call
 * always fails with EOPNOTSUPP.
 */
/*ARGSUSED*/
int
so_listen_notsupp(struct sonode *so, int backlog, struct cred *cr)
{
	return (EOPNOTSUPP);
}
828348SEric.Yu@Sun.COM 
/*
 * Placeholder getsockname operation: every argument is ignored and the
 * call always fails with EOPNOTSUPP.
 */
/*ARGSUSED*/
int
so_getsockname_notsupp(struct sonode *so, struct sockaddr *sa,
    socklen_t *len, struct cred *cr)
{
	return (EOPNOTSUPP);
}
908348SEric.Yu@Sun.COM 
918348SEric.Yu@Sun.COM /*ARGSUSED*/
928348SEric.Yu@Sun.COM int
938348SEric.Yu@Sun.COM so_getpeername_notsupp(struct sonode *so, struct sockaddr *addr,
948348SEric.Yu@Sun.COM     socklen_t *addrlen, boolean_t accept, struct cred *cr)
958348SEric.Yu@Sun.COM {
968348SEric.Yu@Sun.COM 	return (EOPNOTSUPP);
978348SEric.Yu@Sun.COM }
988348SEric.Yu@Sun.COM 
/*
 * Placeholder shutdown operation: every argument is ignored and the
 * call always fails with EOPNOTSUPP.
 */
/*ARGSUSED*/
int
so_shutdown_notsupp(struct sonode *so, int how, struct cred *cr)
{
	return (EOPNOTSUPP);
}
1058348SEric.Yu@Sun.COM 
1068348SEric.Yu@Sun.COM /*ARGSUSED*/
1078348SEric.Yu@Sun.COM int
1088348SEric.Yu@Sun.COM so_sendmblk_notsupp(struct sonode *so, struct msghdr *msg, int fflag,
1098348SEric.Yu@Sun.COM     struct cred *cr, mblk_t **mpp)
1108348SEric.Yu@Sun.COM {
1118348SEric.Yu@Sun.COM 	return (EOPNOTSUPP);
1128348SEric.Yu@Sun.COM }
1138348SEric.Yu@Sun.COM 
1148348SEric.Yu@Sun.COM /*
1158348SEric.Yu@Sun.COM  * Generic Socket Ops
1168348SEric.Yu@Sun.COM  */
1178348SEric.Yu@Sun.COM 
/*
 * Generic socket initialization: hands the work to
 * socket_init_common() and returns its result unchanged.
 */
/* ARGSUSED */
int
so_init(struct sonode *so, struct sonode *pso, struct cred *cr, int flags)
{
	int rval;

	rval = socket_init_common(so, pso, flags, cr);
	return (rval);
}
1248348SEric.Yu@Sun.COM 
1258348SEric.Yu@Sun.COM int
1268348SEric.Yu@Sun.COM so_bind(struct sonode *so, struct sockaddr *name, socklen_t namelen,
1278348SEric.Yu@Sun.COM     int flags, struct cred *cr)
1288348SEric.Yu@Sun.COM {
1298348SEric.Yu@Sun.COM 	int error;
1308348SEric.Yu@Sun.COM 
1318348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_BIND(so, name, namelen, flags, cr));
1328348SEric.Yu@Sun.COM 
1338348SEric.Yu@Sun.COM 	ASSERT(flags == _SOBIND_XPG4_2 || flags == _SOBIND_SOCKBSD);
1348348SEric.Yu@Sun.COM 
1358348SEric.Yu@Sun.COM 	/* X/Open requires this check */
1368348SEric.Yu@Sun.COM 	if ((so->so_state & SS_CANTSENDMORE) && !xnet_skip_checks) {
1378348SEric.Yu@Sun.COM 		if (xnet_check_print) {
1388348SEric.Yu@Sun.COM 			printf("sockfs: X/Open bind state check "
1398348SEric.Yu@Sun.COM 			    "caused EINVAL\n");
1408348SEric.Yu@Sun.COM 		}
1418348SEric.Yu@Sun.COM 		error = EINVAL;
1428348SEric.Yu@Sun.COM 		goto done;
1438348SEric.Yu@Sun.COM 	}
1448348SEric.Yu@Sun.COM 
1458348SEric.Yu@Sun.COM 	/*
1468348SEric.Yu@Sun.COM 	 * a bind to a NULL address is interpreted as unbind. So just
1478348SEric.Yu@Sun.COM 	 * do the downcall.
1488348SEric.Yu@Sun.COM 	 */
1498348SEric.Yu@Sun.COM 	if (name == NULL)
1508348SEric.Yu@Sun.COM 		goto dobind;
1518348SEric.Yu@Sun.COM 
1528348SEric.Yu@Sun.COM 	switch (so->so_family) {
1538348SEric.Yu@Sun.COM 	case AF_INET:
1548348SEric.Yu@Sun.COM 		if ((size_t)namelen != sizeof (sin_t)) {
1558348SEric.Yu@Sun.COM 			error = name->sa_family != so->so_family ?
1568348SEric.Yu@Sun.COM 			    EAFNOSUPPORT : EINVAL;
1578348SEric.Yu@Sun.COM 			eprintsoline(so, error);
1588348SEric.Yu@Sun.COM 			goto done;
1598348SEric.Yu@Sun.COM 		}
1608348SEric.Yu@Sun.COM 
1618348SEric.Yu@Sun.COM 		if ((flags & _SOBIND_XPG4_2) &&
1628348SEric.Yu@Sun.COM 		    (name->sa_family != so->so_family)) {
1638348SEric.Yu@Sun.COM 			/*
1648348SEric.Yu@Sun.COM 			 * This check has to be made for X/Open
1658348SEric.Yu@Sun.COM 			 * sockets however application failures have
1668348SEric.Yu@Sun.COM 			 * been observed when it is applied to
1678348SEric.Yu@Sun.COM 			 * all sockets.
1688348SEric.Yu@Sun.COM 			 */
1698348SEric.Yu@Sun.COM 			error = EAFNOSUPPORT;
1708348SEric.Yu@Sun.COM 			eprintsoline(so, error);
1718348SEric.Yu@Sun.COM 			goto done;
1728348SEric.Yu@Sun.COM 		}
1738348SEric.Yu@Sun.COM 		/*
1748348SEric.Yu@Sun.COM 		 * Force a zero sa_family to match so_family.
1758348SEric.Yu@Sun.COM 		 *
1768348SEric.Yu@Sun.COM 		 * Some programs like inetd(1M) don't set the
1778348SEric.Yu@Sun.COM 		 * family field. Other programs leave
1788348SEric.Yu@Sun.COM 		 * sin_family set to garbage - SunOS 4.X does
1798348SEric.Yu@Sun.COM 		 * not check the family field on a bind.
1808348SEric.Yu@Sun.COM 		 * We use the family field that
1818348SEric.Yu@Sun.COM 		 * was passed in to the socket() call.
1828348SEric.Yu@Sun.COM 		 */
1838348SEric.Yu@Sun.COM 		name->sa_family = so->so_family;
1848348SEric.Yu@Sun.COM 		break;
1858348SEric.Yu@Sun.COM 
1868348SEric.Yu@Sun.COM 	case AF_INET6: {
1878348SEric.Yu@Sun.COM #ifdef DEBUG
1888348SEric.Yu@Sun.COM 		sin6_t *sin6 = (sin6_t *)name;
1898348SEric.Yu@Sun.COM #endif
1908348SEric.Yu@Sun.COM 		if ((size_t)namelen != sizeof (sin6_t)) {
1918348SEric.Yu@Sun.COM 			error = name->sa_family != so->so_family ?
1928348SEric.Yu@Sun.COM 			    EAFNOSUPPORT : EINVAL;
1938348SEric.Yu@Sun.COM 			eprintsoline(so, error);
1948348SEric.Yu@Sun.COM 			goto done;
1958348SEric.Yu@Sun.COM 		}
1968348SEric.Yu@Sun.COM 
1978348SEric.Yu@Sun.COM 		if (name->sa_family != so->so_family) {
1988348SEric.Yu@Sun.COM 			/*
1998348SEric.Yu@Sun.COM 			 * With IPv6 we require the family to match
2008348SEric.Yu@Sun.COM 			 * unlike in IPv4.
2018348SEric.Yu@Sun.COM 			 */
2028348SEric.Yu@Sun.COM 			error = EAFNOSUPPORT;
2038348SEric.Yu@Sun.COM 			eprintsoline(so, error);
2048348SEric.Yu@Sun.COM 			goto done;
2058348SEric.Yu@Sun.COM 		}
2068348SEric.Yu@Sun.COM #ifdef DEBUG
2078348SEric.Yu@Sun.COM 		/*
2088348SEric.Yu@Sun.COM 		 * Verify that apps don't forget to clear
2098348SEric.Yu@Sun.COM 		 * sin6_scope_id etc
2108348SEric.Yu@Sun.COM 		 */
2118348SEric.Yu@Sun.COM 		if (sin6->sin6_scope_id != 0 &&
2128348SEric.Yu@Sun.COM 		    !IN6_IS_ADDR_LINKSCOPE(&sin6->sin6_addr)) {
2138348SEric.Yu@Sun.COM 			zcmn_err(getzoneid(), CE_WARN,
2148348SEric.Yu@Sun.COM 			    "bind with uninitialized sin6_scope_id "
2158348SEric.Yu@Sun.COM 			    "(%d) on socket. Pid = %d\n",
2168348SEric.Yu@Sun.COM 			    (int)sin6->sin6_scope_id,
2178348SEric.Yu@Sun.COM 			    (int)curproc->p_pid);
2188348SEric.Yu@Sun.COM 		}
2198348SEric.Yu@Sun.COM 		if (sin6->__sin6_src_id != 0) {
2208348SEric.Yu@Sun.COM 			zcmn_err(getzoneid(), CE_WARN,
2218348SEric.Yu@Sun.COM 			    "bind with uninitialized __sin6_src_id "
2228348SEric.Yu@Sun.COM 			    "(%d) on socket. Pid = %d\n",
2238348SEric.Yu@Sun.COM 			    (int)sin6->__sin6_src_id,
2248348SEric.Yu@Sun.COM 			    (int)curproc->p_pid);
2258348SEric.Yu@Sun.COM 		}
2268348SEric.Yu@Sun.COM #endif /* DEBUG */
2278348SEric.Yu@Sun.COM 
2288348SEric.Yu@Sun.COM 		break;
2298348SEric.Yu@Sun.COM 	}
2308348SEric.Yu@Sun.COM 	default:
2318348SEric.Yu@Sun.COM 		/* Just pass the request to the protocol */
2328348SEric.Yu@Sun.COM 		goto dobind;
2338348SEric.Yu@Sun.COM 	}
2348348SEric.Yu@Sun.COM 
2358348SEric.Yu@Sun.COM 	/*
2368348SEric.Yu@Sun.COM 	 * First we check if either NCA or KSSL has been enabled for
2378348SEric.Yu@Sun.COM 	 * the requested address, and if so, we fall back to TPI.
2388348SEric.Yu@Sun.COM 	 * If neither of those two services are enabled, then we just
2398348SEric.Yu@Sun.COM 	 * pass the request to the protocol.
2408348SEric.Yu@Sun.COM 	 *
2418348SEric.Yu@Sun.COM 	 * Note that KSSL can only be enabled on a socket if NCA is NOT
2428348SEric.Yu@Sun.COM 	 * enabled for that socket, hence the else-statement below.
2438348SEric.Yu@Sun.COM 	 */
2448348SEric.Yu@Sun.COM 	if (nl7c_enabled && ((so->so_family == AF_INET ||
2458348SEric.Yu@Sun.COM 	    so->so_family == AF_INET6) &&
2468348SEric.Yu@Sun.COM 	    nl7c_lookup_addr(name, namelen) != NULL)) {
2478348SEric.Yu@Sun.COM 		/*
2488348SEric.Yu@Sun.COM 		 * NL7C is not supported in non-global zones,
2498348SEric.Yu@Sun.COM 		 * we enforce this restriction here.
2508348SEric.Yu@Sun.COM 		 */
2518348SEric.Yu@Sun.COM 		if (so->so_zoneid == GLOBAL_ZONEID) {
2528348SEric.Yu@Sun.COM 			/* NCA should be used, so fall back to TPI */
2538348SEric.Yu@Sun.COM 			error = so_tpi_fallback(so, cr);
2548348SEric.Yu@Sun.COM 			SO_UNBLOCK_FALLBACK(so);
2558348SEric.Yu@Sun.COM 			if (error)
2568348SEric.Yu@Sun.COM 				return (error);
2578348SEric.Yu@Sun.COM 			else
2588348SEric.Yu@Sun.COM 				return (SOP_BIND(so, name, namelen, flags, cr));
2598348SEric.Yu@Sun.COM 		}
2608348SEric.Yu@Sun.COM 	} else if (so->so_type == SOCK_STREAM) {
2618348SEric.Yu@Sun.COM 		/* Check if KSSL has been configured for this address */
2628348SEric.Yu@Sun.COM 		kssl_ent_t ent;
2638348SEric.Yu@Sun.COM 		kssl_endpt_type_t type;
2648348SEric.Yu@Sun.COM 		struct T_bind_req bind_req;
2658348SEric.Yu@Sun.COM 		mblk_t *mp;
2668348SEric.Yu@Sun.COM 
2678348SEric.Yu@Sun.COM 		/*
2688348SEric.Yu@Sun.COM 		 * TODO: Check with KSSL team if we could add a function call
2698348SEric.Yu@Sun.COM 		 * that only queries whether KSSL is enabled for the given
2708348SEric.Yu@Sun.COM 		 * address.
2718348SEric.Yu@Sun.COM 		 */
2728348SEric.Yu@Sun.COM 		bind_req.PRIM_type = T_BIND_REQ;
2738348SEric.Yu@Sun.COM 		bind_req.ADDR_length = namelen;
2748348SEric.Yu@Sun.COM 		bind_req.ADDR_offset = (t_scalar_t)sizeof (bind_req);
2758348SEric.Yu@Sun.COM 		mp = soallocproto2(&bind_req, sizeof (bind_req),
2768348SEric.Yu@Sun.COM 		    name, namelen, 0, _ALLOC_SLEEP);
2778348SEric.Yu@Sun.COM 
2788348SEric.Yu@Sun.COM 		type = kssl_check_proxy(mp, so, &ent);
2798348SEric.Yu@Sun.COM 		freemsg(mp);
2808348SEric.Yu@Sun.COM 
2818348SEric.Yu@Sun.COM 		if (type != KSSL_NO_PROXY) {
2828348SEric.Yu@Sun.COM 			/*
2838348SEric.Yu@Sun.COM 			 * KSSL has been configured for this address, so
2848348SEric.Yu@Sun.COM 			 * we must fall back to TPI.
2858348SEric.Yu@Sun.COM 			 */
2868348SEric.Yu@Sun.COM 			kssl_release_ent(ent, so, type);
2878348SEric.Yu@Sun.COM 			error = so_tpi_fallback(so, cr);
2888348SEric.Yu@Sun.COM 			SO_UNBLOCK_FALLBACK(so);
2898348SEric.Yu@Sun.COM 			if (error)
2908348SEric.Yu@Sun.COM 				return (error);
2918348SEric.Yu@Sun.COM 			else
2928348SEric.Yu@Sun.COM 				return (SOP_BIND(so, name, namelen, flags, cr));
2938348SEric.Yu@Sun.COM 		}
2948348SEric.Yu@Sun.COM 	}
2958348SEric.Yu@Sun.COM 
2968348SEric.Yu@Sun.COM dobind:
2978348SEric.Yu@Sun.COM 	error = (*so->so_downcalls->sd_bind)
2988348SEric.Yu@Sun.COM 	    (so->so_proto_handle, name, namelen, cr);
2998348SEric.Yu@Sun.COM done:
3008348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
3018348SEric.Yu@Sun.COM 
3028348SEric.Yu@Sun.COM 	return (error);
3038348SEric.Yu@Sun.COM }
3048348SEric.Yu@Sun.COM 
3058348SEric.Yu@Sun.COM int
3068348SEric.Yu@Sun.COM so_listen(struct sonode *so, int backlog, struct cred *cr)
3078348SEric.Yu@Sun.COM {
3088348SEric.Yu@Sun.COM 	int	error = 0;
3098348SEric.Yu@Sun.COM 
3108348SEric.Yu@Sun.COM 	ASSERT(MUTEX_NOT_HELD(&so->so_lock));
3118348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_LISTEN(so, backlog, cr));
3128348SEric.Yu@Sun.COM 
3138348SEric.Yu@Sun.COM 	error = (*so->so_downcalls->sd_listen)(so->so_proto_handle, backlog,
3148348SEric.Yu@Sun.COM 	    cr);
3158348SEric.Yu@Sun.COM 
3168348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
3178348SEric.Yu@Sun.COM 
3188348SEric.Yu@Sun.COM 	return (error);
3198348SEric.Yu@Sun.COM }
3208348SEric.Yu@Sun.COM 
3218348SEric.Yu@Sun.COM 
3228348SEric.Yu@Sun.COM int
3238348SEric.Yu@Sun.COM so_connect(struct sonode *so, const struct sockaddr *name,
3248348SEric.Yu@Sun.COM     socklen_t namelen, int fflag, int flags, struct cred *cr)
3258348SEric.Yu@Sun.COM {
3268348SEric.Yu@Sun.COM 	int error = 0;
3278348SEric.Yu@Sun.COM 	sock_connid_t id;
3288348SEric.Yu@Sun.COM 
3298348SEric.Yu@Sun.COM 	ASSERT(MUTEX_NOT_HELD(&so->so_lock));
3308348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_CONNECT(so, name, namelen, fflag, flags, cr));
3318348SEric.Yu@Sun.COM 
3328348SEric.Yu@Sun.COM 	/*
3338348SEric.Yu@Sun.COM 	 * If there is a pending error, return error
3348348SEric.Yu@Sun.COM 	 * This can happen if a non blocking operation caused an error.
3358348SEric.Yu@Sun.COM 	 */
3368348SEric.Yu@Sun.COM 
3378348SEric.Yu@Sun.COM 	if (so->so_error != 0) {
3388348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
3398348SEric.Yu@Sun.COM 		error = sogeterr(so, B_TRUE);
3408348SEric.Yu@Sun.COM 		mutex_exit(&so->so_lock);
3418348SEric.Yu@Sun.COM 		if (error != 0)
3428348SEric.Yu@Sun.COM 			goto done;
3438348SEric.Yu@Sun.COM 	}
3448348SEric.Yu@Sun.COM 
3458348SEric.Yu@Sun.COM 	error = (*so->so_downcalls->sd_connect)(so->so_proto_handle,
3468348SEric.Yu@Sun.COM 	    name, namelen, &id, cr);
3478348SEric.Yu@Sun.COM 
3488348SEric.Yu@Sun.COM 	if (error == EINPROGRESS)
3498348SEric.Yu@Sun.COM 		error = so_wait_connected(so, fflag & (FNONBLOCK|FNDELAY), id);
3508348SEric.Yu@Sun.COM 
3518348SEric.Yu@Sun.COM done:
3528348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
3538348SEric.Yu@Sun.COM 	return (error);
3548348SEric.Yu@Sun.COM }
3558348SEric.Yu@Sun.COM 
3568348SEric.Yu@Sun.COM /*ARGSUSED*/
3578348SEric.Yu@Sun.COM int
3588348SEric.Yu@Sun.COM so_accept(struct sonode *so, int fflag, struct cred *cr, struct sonode **nsop)
3598348SEric.Yu@Sun.COM {
3608348SEric.Yu@Sun.COM 	int error = 0;
3618348SEric.Yu@Sun.COM 	struct sonode *nso;
3628348SEric.Yu@Sun.COM 
3638348SEric.Yu@Sun.COM 	*nsop = NULL;
3648348SEric.Yu@Sun.COM 
3658348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_ACCEPT(so, fflag, cr, nsop));
3668348SEric.Yu@Sun.COM 	if ((so->so_state & SS_ACCEPTCONN) == 0) {
3678348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
3688348SEric.Yu@Sun.COM 		return ((so->so_type == SOCK_DGRAM || so->so_type == SOCK_RAW) ?
3698348SEric.Yu@Sun.COM 		    EOPNOTSUPP : EINVAL);
3708348SEric.Yu@Sun.COM 	}
3718348SEric.Yu@Sun.COM 
3728348SEric.Yu@Sun.COM 	if ((error = so_acceptq_dequeue(so, (fflag & (FNONBLOCK|FNDELAY)),
3738348SEric.Yu@Sun.COM 	    &nso)) == 0) {
3748348SEric.Yu@Sun.COM 		ASSERT(nso != NULL);
3758348SEric.Yu@Sun.COM 
3768348SEric.Yu@Sun.COM 		/* finish the accept */
3778348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_accept)(so->so_proto_handle,
3788348SEric.Yu@Sun.COM 		    nso->so_proto_handle, (sock_upper_handle_t)nso, cr);
3798348SEric.Yu@Sun.COM 		if (error != 0) {
3808348SEric.Yu@Sun.COM 			(void) socket_close(nso, 0, cr);
3818348SEric.Yu@Sun.COM 			socket_destroy(nso);
3828348SEric.Yu@Sun.COM 		} else {
3838348SEric.Yu@Sun.COM 			*nsop = nso;
3848348SEric.Yu@Sun.COM 		}
3858348SEric.Yu@Sun.COM 	}
3868348SEric.Yu@Sun.COM 
3878348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
3888348SEric.Yu@Sun.COM 	return (error);
3898348SEric.Yu@Sun.COM }
3908348SEric.Yu@Sun.COM 
3918348SEric.Yu@Sun.COM int
3928348SEric.Yu@Sun.COM so_sendmsg(struct sonode *so, struct nmsghdr *msg, struct uio *uiop,
3938348SEric.Yu@Sun.COM     struct cred *cr)
3948348SEric.Yu@Sun.COM {
3958348SEric.Yu@Sun.COM 	int error, flags;
3968348SEric.Yu@Sun.COM 	boolean_t dontblock;
3978348SEric.Yu@Sun.COM 	ssize_t orig_resid;
3988348SEric.Yu@Sun.COM 	mblk_t  *mp;
3998348SEric.Yu@Sun.COM 
4008348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_SENDMSG(so, msg, uiop, cr));
4018348SEric.Yu@Sun.COM 
4028348SEric.Yu@Sun.COM 	flags = msg->msg_flags;
4038348SEric.Yu@Sun.COM 	error = 0;
4048348SEric.Yu@Sun.COM 	dontblock = (flags & MSG_DONTWAIT) ||
4058348SEric.Yu@Sun.COM 	    (uiop->uio_fmode & (FNONBLOCK|FNDELAY));
4068348SEric.Yu@Sun.COM 
4078348SEric.Yu@Sun.COM 	if (!(flags & MSG_XPG4_2) && msg->msg_controllen != 0) {
4088348SEric.Yu@Sun.COM 		/*
4098348SEric.Yu@Sun.COM 		 * Old way of passing fd's is not supported
4108348SEric.Yu@Sun.COM 		 */
4118348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
4128348SEric.Yu@Sun.COM 		return (EOPNOTSUPP);
4138348SEric.Yu@Sun.COM 	}
4148348SEric.Yu@Sun.COM 
4158348SEric.Yu@Sun.COM 	if ((so->so_mode & SM_ATOMIC) &&
4168348SEric.Yu@Sun.COM 	    uiop->uio_resid > so->so_proto_props.sopp_maxpsz &&
4178348SEric.Yu@Sun.COM 	    so->so_proto_props.sopp_maxpsz != -1) {
4188348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
4198348SEric.Yu@Sun.COM 		return (EMSGSIZE);
4208348SEric.Yu@Sun.COM 	}
4218348SEric.Yu@Sun.COM 
4228348SEric.Yu@Sun.COM 	/*
4238348SEric.Yu@Sun.COM 	 * For atomic sends we will only do one iteration.
4248348SEric.Yu@Sun.COM 	 */
4258348SEric.Yu@Sun.COM 	do {
4268348SEric.Yu@Sun.COM 		if (so->so_state & SS_CANTSENDMORE) {
4278348SEric.Yu@Sun.COM 			error = EPIPE;
4288348SEric.Yu@Sun.COM 			break;
4298348SEric.Yu@Sun.COM 		}
4308348SEric.Yu@Sun.COM 
4318348SEric.Yu@Sun.COM 		if (so->so_error != 0) {
4328348SEric.Yu@Sun.COM 			mutex_enter(&so->so_lock);
4338348SEric.Yu@Sun.COM 			error = sogeterr(so, B_TRUE);
4348348SEric.Yu@Sun.COM 			mutex_exit(&so->so_lock);
4358348SEric.Yu@Sun.COM 			if (error != 0)
4368348SEric.Yu@Sun.COM 				break;
4378348SEric.Yu@Sun.COM 		}
4388348SEric.Yu@Sun.COM 
4398348SEric.Yu@Sun.COM 		/*
4408348SEric.Yu@Sun.COM 		 * Send down OOB messages even if the send path is being
4418348SEric.Yu@Sun.COM 		 * flow controlled (assuming the protocol supports OOB data).
4428348SEric.Yu@Sun.COM 		 */
4438348SEric.Yu@Sun.COM 		if (flags & MSG_OOB) {
4448348SEric.Yu@Sun.COM 			if ((so->so_mode & SM_EXDATA) == 0) {
4458348SEric.Yu@Sun.COM 				error = EOPNOTSUPP;
4468348SEric.Yu@Sun.COM 				break;
4478348SEric.Yu@Sun.COM 			}
4488348SEric.Yu@Sun.COM 		} else if (so->so_snd_qfull) {
4498348SEric.Yu@Sun.COM 			/*
4508348SEric.Yu@Sun.COM 			 * Need to wait until the protocol is ready to receive
4518348SEric.Yu@Sun.COM 			 * more data for transmission.
4528348SEric.Yu@Sun.COM 			 */
4538348SEric.Yu@Sun.COM 			if ((error = so_snd_wait_qnotfull(so, dontblock)) != 0)
4548348SEric.Yu@Sun.COM 				break;
4558348SEric.Yu@Sun.COM 		}
4568348SEric.Yu@Sun.COM 
4578348SEric.Yu@Sun.COM 		/*
4588348SEric.Yu@Sun.COM 		 * Time to send data to the protocol. We either copy the
4598348SEric.Yu@Sun.COM 		 * data into mblks or pass the uio directly to the protocol.
4608348SEric.Yu@Sun.COM 		 * We decide what to do based on the available down calls.
4618348SEric.Yu@Sun.COM 		 */
4628348SEric.Yu@Sun.COM 		if (so->so_downcalls->sd_send_uio != NULL) {
4638348SEric.Yu@Sun.COM 			error = (*so->so_downcalls->sd_send_uio)
4648348SEric.Yu@Sun.COM 			    (so->so_proto_handle, uiop, msg, cr);
4658348SEric.Yu@Sun.COM 			if (error != 0)
4668348SEric.Yu@Sun.COM 				break;
4678348SEric.Yu@Sun.COM 		} else {
4688348SEric.Yu@Sun.COM 			/* save the resid in case of failure */
4698348SEric.Yu@Sun.COM 			orig_resid = uiop->uio_resid;
4708348SEric.Yu@Sun.COM 
4718348SEric.Yu@Sun.COM 			if ((mp = socopyinuio(uiop,
4728348SEric.Yu@Sun.COM 			    so->so_proto_props.sopp_maxpsz,
4738348SEric.Yu@Sun.COM 			    so->so_proto_props.sopp_wroff,
4748348SEric.Yu@Sun.COM 			    so->so_proto_props.sopp_maxblk,
4758348SEric.Yu@Sun.COM 			    so->so_proto_props.sopp_tail, &error)) == NULL) {
4768348SEric.Yu@Sun.COM 				break;
4778348SEric.Yu@Sun.COM 			}
4788348SEric.Yu@Sun.COM 			ASSERT(uiop->uio_resid >= 0);
4798348SEric.Yu@Sun.COM 
4808348SEric.Yu@Sun.COM 			error = (*so->so_downcalls->sd_send)
4818348SEric.Yu@Sun.COM 			    (so->so_proto_handle, mp, msg, cr);
4828348SEric.Yu@Sun.COM 			if (error != 0) {
4838348SEric.Yu@Sun.COM 				/*
4848348SEric.Yu@Sun.COM 				 * The send failed. We do not have to free the
4858348SEric.Yu@Sun.COM 				 * mblks, because that is the protocol's
4868348SEric.Yu@Sun.COM 				 * responsibility. However, uio_resid must
4878348SEric.Yu@Sun.COM 				 * remain accurate, so adjust that here.
4888348SEric.Yu@Sun.COM 				 */
4898348SEric.Yu@Sun.COM 				uiop->uio_resid = orig_resid;
4908348SEric.Yu@Sun.COM 					break;
4918348SEric.Yu@Sun.COM 			}
4928348SEric.Yu@Sun.COM 		}
4938348SEric.Yu@Sun.COM 	} while (uiop->uio_resid > 0);
4948348SEric.Yu@Sun.COM 
4958348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
4968348SEric.Yu@Sun.COM 
4978348SEric.Yu@Sun.COM 	return (error);
4988348SEric.Yu@Sun.COM }
4998348SEric.Yu@Sun.COM 
5008348SEric.Yu@Sun.COM int
5018348SEric.Yu@Sun.COM so_sendmblk(struct sonode *so, struct nmsghdr *msg, int fflag,
5028348SEric.Yu@Sun.COM     struct cred *cr, mblk_t **mpp)
5038348SEric.Yu@Sun.COM {
5048348SEric.Yu@Sun.COM 	int error;
5058348SEric.Yu@Sun.COM 	boolean_t dontblock;
5068348SEric.Yu@Sun.COM 	size_t size;
5078348SEric.Yu@Sun.COM 	mblk_t *mp = *mpp;
5088348SEric.Yu@Sun.COM 
5098348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_SENDMBLK(so, msg, fflag, cr, mpp));
5108348SEric.Yu@Sun.COM 
5118348SEric.Yu@Sun.COM 	error = 0;
5128348SEric.Yu@Sun.COM 	dontblock = (msg->msg_flags & MSG_DONTWAIT) ||
5138348SEric.Yu@Sun.COM 	    (fflag & (FNONBLOCK|FNDELAY));
5148348SEric.Yu@Sun.COM 	size = msgdsize(mp);
5158348SEric.Yu@Sun.COM 
5168401SAnders.Persson@Sun.COM 	if ((so->so_mode & SM_SENDFILESUPP) == 0 ||
5178401SAnders.Persson@Sun.COM 	    so->so_downcalls->sd_send == NULL) {
5188348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
5198348SEric.Yu@Sun.COM 		return (EOPNOTSUPP);
5208348SEric.Yu@Sun.COM 	}
5218348SEric.Yu@Sun.COM 
5228348SEric.Yu@Sun.COM 	if ((so->so_mode & SM_ATOMIC) &&
5238348SEric.Yu@Sun.COM 	    size > so->so_proto_props.sopp_maxpsz &&
5248348SEric.Yu@Sun.COM 	    so->so_proto_props.sopp_maxpsz != -1) {
5258348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
5268348SEric.Yu@Sun.COM 		return (EMSGSIZE);
5278348SEric.Yu@Sun.COM 	}
5288348SEric.Yu@Sun.COM 
5298348SEric.Yu@Sun.COM 	while (mp != NULL) {
5308348SEric.Yu@Sun.COM 		mblk_t *nmp, *last_mblk;
5318348SEric.Yu@Sun.COM 		size_t mlen;
5328348SEric.Yu@Sun.COM 
5338348SEric.Yu@Sun.COM 		if (so->so_state & SS_CANTSENDMORE) {
5348348SEric.Yu@Sun.COM 			error = EPIPE;
5358348SEric.Yu@Sun.COM 			break;
5368348SEric.Yu@Sun.COM 		}
5378348SEric.Yu@Sun.COM 		if (so->so_error != 0) {
5388348SEric.Yu@Sun.COM 			mutex_enter(&so->so_lock);
5398348SEric.Yu@Sun.COM 			error = sogeterr(so, B_TRUE);
5408348SEric.Yu@Sun.COM 			mutex_exit(&so->so_lock);
5418348SEric.Yu@Sun.COM 			if (error != 0)
5428348SEric.Yu@Sun.COM 				break;
5438348SEric.Yu@Sun.COM 		}
5448348SEric.Yu@Sun.COM 		if (so->so_snd_qfull) {
5458348SEric.Yu@Sun.COM 			/*
5468348SEric.Yu@Sun.COM 			 * Need to wait until the protocol is ready to receive
5478348SEric.Yu@Sun.COM 			 * more data for transmission.
5488348SEric.Yu@Sun.COM 			 */
5498348SEric.Yu@Sun.COM 			if ((error = so_snd_wait_qnotfull(so, dontblock)) != 0)
5508348SEric.Yu@Sun.COM 				break;
5518348SEric.Yu@Sun.COM 		}
5528348SEric.Yu@Sun.COM 
5538348SEric.Yu@Sun.COM 		/*
5548348SEric.Yu@Sun.COM 		 * We only allow so_maxpsz of data to be sent down to
5558348SEric.Yu@Sun.COM 		 * the protocol at time.
5568348SEric.Yu@Sun.COM 		 */
5578348SEric.Yu@Sun.COM 		mlen = MBLKL(mp);
5588348SEric.Yu@Sun.COM 		nmp = mp->b_cont;
5598348SEric.Yu@Sun.COM 		last_mblk = mp;
5608348SEric.Yu@Sun.COM 		while (nmp != NULL) {
5618348SEric.Yu@Sun.COM 			mlen += MBLKL(nmp);
5628348SEric.Yu@Sun.COM 			if (mlen > so->so_proto_props.sopp_maxpsz) {
5638348SEric.Yu@Sun.COM 				last_mblk->b_cont = NULL;
5648348SEric.Yu@Sun.COM 				break;
5658348SEric.Yu@Sun.COM 			}
5668348SEric.Yu@Sun.COM 			last_mblk = nmp;
5678348SEric.Yu@Sun.COM 			nmp = nmp->b_cont;
5688348SEric.Yu@Sun.COM 		}
5698348SEric.Yu@Sun.COM 
5708348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_send)
5718348SEric.Yu@Sun.COM 		    (so->so_proto_handle, mp, msg, cr);
5728348SEric.Yu@Sun.COM 		if (error != 0) {
5738348SEric.Yu@Sun.COM 			/*
5748348SEric.Yu@Sun.COM 			 * The send failed. The protocol will free the mblks
5758348SEric.Yu@Sun.COM 			 * that were sent down. Let the caller deal with the
5768348SEric.Yu@Sun.COM 			 * rest.
5778348SEric.Yu@Sun.COM 			 */
5788348SEric.Yu@Sun.COM 			*mpp = nmp;
5798348SEric.Yu@Sun.COM 			break;
5808348SEric.Yu@Sun.COM 		}
5818348SEric.Yu@Sun.COM 
5828348SEric.Yu@Sun.COM 		*mpp = mp = nmp;
5838348SEric.Yu@Sun.COM 	}
5848348SEric.Yu@Sun.COM 
5858348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
5868348SEric.Yu@Sun.COM 
5878348SEric.Yu@Sun.COM 	return (error);
5888348SEric.Yu@Sun.COM }
5898348SEric.Yu@Sun.COM 
5908348SEric.Yu@Sun.COM int
5918348SEric.Yu@Sun.COM so_shutdown(struct sonode *so, int how, struct cred *cr)
5928348SEric.Yu@Sun.COM {
5938348SEric.Yu@Sun.COM 	int error;
5948348SEric.Yu@Sun.COM 
5958348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_SHUTDOWN(so, how, cr));
5968348SEric.Yu@Sun.COM 
5978348SEric.Yu@Sun.COM 	/*
5988348SEric.Yu@Sun.COM 	 * SunOS 4.X has no check for datagram sockets.
5998348SEric.Yu@Sun.COM 	 * 5.X checks that it is connected (ENOTCONN)
6008348SEric.Yu@Sun.COM 	 * X/Open requires that we check the connected state.
6018348SEric.Yu@Sun.COM 	 */
6028348SEric.Yu@Sun.COM 	if (!(so->so_state & SS_ISCONNECTED)) {
6038348SEric.Yu@Sun.COM 		if (!xnet_skip_checks) {
6048348SEric.Yu@Sun.COM 			error = ENOTCONN;
6058348SEric.Yu@Sun.COM 			if (xnet_check_print) {
6068348SEric.Yu@Sun.COM 				printf("sockfs: X/Open shutdown check "
6078348SEric.Yu@Sun.COM 				    "caused ENOTCONN\n");
6088348SEric.Yu@Sun.COM 			}
6098348SEric.Yu@Sun.COM 		}
6108348SEric.Yu@Sun.COM 		goto done;
6118348SEric.Yu@Sun.COM 	}
6128348SEric.Yu@Sun.COM 
6138348SEric.Yu@Sun.COM 	error = ((*so->so_downcalls->sd_shutdown)(so->so_proto_handle,
6148348SEric.Yu@Sun.COM 	    how, cr));
6158348SEric.Yu@Sun.COM 
6168348SEric.Yu@Sun.COM 	/*
6178348SEric.Yu@Sun.COM 	 * Protocol agreed to shutdown. We need to flush the
6188348SEric.Yu@Sun.COM 	 * receive buffer if the receive side is being shutdown.
6198348SEric.Yu@Sun.COM 	 */
6208348SEric.Yu@Sun.COM 	if (error == 0 && how != SHUT_WR) {
6218348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
6228348SEric.Yu@Sun.COM 		/* wait for active reader to finish */
6238348SEric.Yu@Sun.COM 		(void) so_lock_read(so, 0);
6248348SEric.Yu@Sun.COM 
6258348SEric.Yu@Sun.COM 		so_rcv_flush(so);
6268348SEric.Yu@Sun.COM 
6278348SEric.Yu@Sun.COM 		so_unlock_read(so);
6288348SEric.Yu@Sun.COM 		mutex_exit(&so->so_lock);
6298348SEric.Yu@Sun.COM 	}
6308348SEric.Yu@Sun.COM 
6318348SEric.Yu@Sun.COM done:
6328348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
6338348SEric.Yu@Sun.COM 	return (error);
6348348SEric.Yu@Sun.COM }
6358348SEric.Yu@Sun.COM 
6368348SEric.Yu@Sun.COM int
6378348SEric.Yu@Sun.COM so_getsockname(struct sonode *so, struct sockaddr *addr,
6388348SEric.Yu@Sun.COM     socklen_t *addrlen, struct cred *cr)
6398348SEric.Yu@Sun.COM {
6408348SEric.Yu@Sun.COM 	int error;
6418348SEric.Yu@Sun.COM 
6428348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_GETSOCKNAME(so, addr, addrlen, cr));
6438348SEric.Yu@Sun.COM 
6448348SEric.Yu@Sun.COM 	error = (*so->so_downcalls->sd_getsockname)
6458348SEric.Yu@Sun.COM 	    (so->so_proto_handle, addr, addrlen, cr);
6468348SEric.Yu@Sun.COM 
6478348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
6488348SEric.Yu@Sun.COM 	return (error);
6498348SEric.Yu@Sun.COM }
6508348SEric.Yu@Sun.COM 
6518348SEric.Yu@Sun.COM int
6528348SEric.Yu@Sun.COM so_getpeername(struct sonode *so, struct sockaddr *addr,
6538348SEric.Yu@Sun.COM     socklen_t *addrlen, boolean_t accept, struct cred *cr)
6548348SEric.Yu@Sun.COM {
6558348SEric.Yu@Sun.COM 	int error;
6568348SEric.Yu@Sun.COM 
6578348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_GETPEERNAME(so, addr, addrlen, accept, cr));
6588348SEric.Yu@Sun.COM 
6598348SEric.Yu@Sun.COM 	if (accept) {
6608348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_getpeername)
6618348SEric.Yu@Sun.COM 		    (so->so_proto_handle, addr, addrlen, cr);
6628348SEric.Yu@Sun.COM 	} else if (!(so->so_state & SS_ISCONNECTED)) {
6638348SEric.Yu@Sun.COM 		error = ENOTCONN;
6648348SEric.Yu@Sun.COM 	} else if ((so->so_state & SS_CANTSENDMORE) && !xnet_skip_checks) {
6658348SEric.Yu@Sun.COM 		/* Added this check for X/Open */
6668348SEric.Yu@Sun.COM 		error = EINVAL;
6678348SEric.Yu@Sun.COM 		if (xnet_check_print) {
6688348SEric.Yu@Sun.COM 			printf("sockfs: X/Open getpeername check => EINVAL\n");
6698348SEric.Yu@Sun.COM 		}
6708348SEric.Yu@Sun.COM 	} else {
6718348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_getpeername)
6728348SEric.Yu@Sun.COM 		    (so->so_proto_handle, addr, addrlen, cr);
6738348SEric.Yu@Sun.COM 	}
6748348SEric.Yu@Sun.COM 
6758348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
6768348SEric.Yu@Sun.COM 	return (error);
6778348SEric.Yu@Sun.COM }
6788348SEric.Yu@Sun.COM 
6798348SEric.Yu@Sun.COM int
6808348SEric.Yu@Sun.COM so_getsockopt(struct sonode *so, int level, int option_name,
6818348SEric.Yu@Sun.COM     void *optval, socklen_t *optlenp, int flags, struct cred *cr)
6828348SEric.Yu@Sun.COM {
6838348SEric.Yu@Sun.COM 	int error = 0;
6848348SEric.Yu@Sun.COM 
6858348SEric.Yu@Sun.COM 	ASSERT(MUTEX_NOT_HELD(&so->so_lock));
6868348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so,
6878348SEric.Yu@Sun.COM 	    SOP_GETSOCKOPT(so, level, option_name, optval, optlenp, flags, cr));
6888348SEric.Yu@Sun.COM 
689*8465SEric.Yu@Sun.COM 	error = socket_getopt_common(so, level, option_name, optval, optlenp,
690*8465SEric.Yu@Sun.COM 	    flags);
6918348SEric.Yu@Sun.COM 	if (error < 0) {
6928348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_getsockopt)
6938348SEric.Yu@Sun.COM 		    (so->so_proto_handle, level, option_name, optval, optlenp,
6948348SEric.Yu@Sun.COM 		    cr);
6958348SEric.Yu@Sun.COM 		if (error ==  ENOPROTOOPT) {
6968348SEric.Yu@Sun.COM 			if (level == SOL_SOCKET) {
6978348SEric.Yu@Sun.COM 				/*
6988348SEric.Yu@Sun.COM 				 * If a protocol does not support a particular
6998348SEric.Yu@Sun.COM 				 * socket option, set can fail (not allowed)
7008348SEric.Yu@Sun.COM 				 * but get can not fail. This is the previous
7018348SEric.Yu@Sun.COM 				 * sockfs bahvior.
7028348SEric.Yu@Sun.COM 				 */
7038348SEric.Yu@Sun.COM 				switch (option_name) {
7048348SEric.Yu@Sun.COM 				case SO_LINGER:
7058348SEric.Yu@Sun.COM 					if (*optlenp < (t_uscalar_t)
7068348SEric.Yu@Sun.COM 					    sizeof (struct linger)) {
7078348SEric.Yu@Sun.COM 						error = EINVAL;
7088348SEric.Yu@Sun.COM 						break;
7098348SEric.Yu@Sun.COM 					}
7108348SEric.Yu@Sun.COM 					error = 0;
7118348SEric.Yu@Sun.COM 					bzero(optval, sizeof (struct linger));
7128348SEric.Yu@Sun.COM 					*optlenp = sizeof (struct linger);
7138348SEric.Yu@Sun.COM 					break;
7148348SEric.Yu@Sun.COM 				case SO_RCVTIMEO:
7158348SEric.Yu@Sun.COM 				case SO_SNDTIMEO:
7168348SEric.Yu@Sun.COM 					if (*optlenp < (t_uscalar_t)
7178348SEric.Yu@Sun.COM 					    sizeof (struct timeval)) {
7188348SEric.Yu@Sun.COM 						error = EINVAL;
7198348SEric.Yu@Sun.COM 						break;
7208348SEric.Yu@Sun.COM 					}
7218348SEric.Yu@Sun.COM 					error = 0;
7228348SEric.Yu@Sun.COM 					bzero(optval, sizeof (struct timeval));
7238348SEric.Yu@Sun.COM 					*optlenp = sizeof (struct timeval);
7248348SEric.Yu@Sun.COM 					break;
7258348SEric.Yu@Sun.COM 				case SO_SND_BUFINFO:
7268348SEric.Yu@Sun.COM 					if (*optlenp < (t_uscalar_t)
7278348SEric.Yu@Sun.COM 					    sizeof (struct so_snd_bufinfo)) {
7288348SEric.Yu@Sun.COM 						error = EINVAL;
7298348SEric.Yu@Sun.COM 						break;
7308348SEric.Yu@Sun.COM 					}
7318348SEric.Yu@Sun.COM 					error = 0;
7328348SEric.Yu@Sun.COM 					bzero(optval,
7338348SEric.Yu@Sun.COM 					    sizeof (struct so_snd_bufinfo));
7348348SEric.Yu@Sun.COM 					*optlenp =
7358348SEric.Yu@Sun.COM 					    sizeof (struct so_snd_bufinfo);
7368348SEric.Yu@Sun.COM 					break;
7378348SEric.Yu@Sun.COM 				case SO_DEBUG:
7388348SEric.Yu@Sun.COM 				case SO_REUSEADDR:
7398348SEric.Yu@Sun.COM 				case SO_KEEPALIVE:
7408348SEric.Yu@Sun.COM 				case SO_DONTROUTE:
7418348SEric.Yu@Sun.COM 				case SO_BROADCAST:
7428348SEric.Yu@Sun.COM 				case SO_USELOOPBACK:
7438348SEric.Yu@Sun.COM 				case SO_OOBINLINE:
7448348SEric.Yu@Sun.COM 				case SO_DGRAM_ERRIND:
7458348SEric.Yu@Sun.COM 				case SO_SNDBUF:
7468348SEric.Yu@Sun.COM 				case SO_RCVBUF:
7478348SEric.Yu@Sun.COM 					error = 0;
7488348SEric.Yu@Sun.COM 					*((int32_t *)optval) = 0;
7498348SEric.Yu@Sun.COM 					*optlenp = sizeof (int32_t);
7508348SEric.Yu@Sun.COM 					break;
7518348SEric.Yu@Sun.COM 				default:
7528348SEric.Yu@Sun.COM 					break;
7538348SEric.Yu@Sun.COM 				}
7548348SEric.Yu@Sun.COM 			}
7558348SEric.Yu@Sun.COM 		}
7568348SEric.Yu@Sun.COM 	}
7578348SEric.Yu@Sun.COM 
7588348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
7598348SEric.Yu@Sun.COM 	return (error);
7608348SEric.Yu@Sun.COM }
7618348SEric.Yu@Sun.COM 
7628348SEric.Yu@Sun.COM int
7638348SEric.Yu@Sun.COM so_setsockopt(struct sonode *so, int level, int option_name,
7648348SEric.Yu@Sun.COM     const void *optval, socklen_t optlen, struct cred *cr)
7658348SEric.Yu@Sun.COM {
7668348SEric.Yu@Sun.COM 	int error = 0;
7678348SEric.Yu@Sun.COM 
7688348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so,
7698348SEric.Yu@Sun.COM 	    SOP_SETSOCKOPT(so, level, option_name, optval, optlen, cr));
7708348SEric.Yu@Sun.COM 
7718348SEric.Yu@Sun.COM 	/* X/Open requires this check */
7728348SEric.Yu@Sun.COM 	if (so->so_state & SS_CANTSENDMORE && !xnet_skip_checks) {
7738348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
7748348SEric.Yu@Sun.COM 		if (xnet_check_print)
7758348SEric.Yu@Sun.COM 			printf("sockfs: X/Open setsockopt check => EINVAL\n");
7768348SEric.Yu@Sun.COM 		return (EINVAL);
7778348SEric.Yu@Sun.COM 	}
7788348SEric.Yu@Sun.COM 
779*8465SEric.Yu@Sun.COM 	if (level == SOL_SOCKET) {
780*8465SEric.Yu@Sun.COM 		switch (option_name) {
781*8465SEric.Yu@Sun.COM 		case SO_RCVTIMEO:
782*8465SEric.Yu@Sun.COM 		case SO_SNDTIMEO: {
783*8465SEric.Yu@Sun.COM 			struct timeval *tl = (struct timeval *)optval;
784*8465SEric.Yu@Sun.COM 			clock_t t_usec;
7858348SEric.Yu@Sun.COM 
786*8465SEric.Yu@Sun.COM 			if (optlen != (t_uscalar_t)sizeof (struct timeval)) {
787*8465SEric.Yu@Sun.COM 				SO_UNBLOCK_FALLBACK(so);
788*8465SEric.Yu@Sun.COM 				return (EINVAL);
789*8465SEric.Yu@Sun.COM 			}
790*8465SEric.Yu@Sun.COM 			t_usec = tl->tv_sec * 1000 * 1000 + tl->tv_usec;
791*8465SEric.Yu@Sun.COM 			mutex_enter(&so->so_lock);
792*8465SEric.Yu@Sun.COM 			if (option_name == SO_RCVTIMEO)
793*8465SEric.Yu@Sun.COM 				so->so_rcvtimeo = drv_usectohz(t_usec);
794*8465SEric.Yu@Sun.COM 			else
795*8465SEric.Yu@Sun.COM 				so->so_sndtimeo = drv_usectohz(t_usec);
796*8465SEric.Yu@Sun.COM 			mutex_exit(&so->so_lock);
7978348SEric.Yu@Sun.COM 			SO_UNBLOCK_FALLBACK(so);
798*8465SEric.Yu@Sun.COM 			return (0);
7998348SEric.Yu@Sun.COM 		}
800*8465SEric.Yu@Sun.COM 		case SO_RCVBUF:
801*8465SEric.Yu@Sun.COM 			/*
802*8465SEric.Yu@Sun.COM 			 * XXX XPG 4.2 applications retrieve SO_RCVBUF from
803*8465SEric.Yu@Sun.COM 			 * sockfs since the transport might adjust the value
804*8465SEric.Yu@Sun.COM 			 * and not return exactly what was set by the
805*8465SEric.Yu@Sun.COM 			 * application.
806*8465SEric.Yu@Sun.COM 			 */
807*8465SEric.Yu@Sun.COM 			so->so_xpg_rcvbuf = *(int32_t *)optval;
808*8465SEric.Yu@Sun.COM 			break;
809*8465SEric.Yu@Sun.COM 		}
8108348SEric.Yu@Sun.COM 	}
8118348SEric.Yu@Sun.COM 	error = (*so->so_downcalls->sd_setsockopt)
8128348SEric.Yu@Sun.COM 	    (so->so_proto_handle, level, option_name, optval, optlen, cr);
8138348SEric.Yu@Sun.COM 
8148348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
8158348SEric.Yu@Sun.COM 	return (error);
8168348SEric.Yu@Sun.COM }
8178348SEric.Yu@Sun.COM 
8188348SEric.Yu@Sun.COM int
8198348SEric.Yu@Sun.COM so_ioctl(struct sonode *so, int cmd, intptr_t arg, int mode,
8208348SEric.Yu@Sun.COM     struct cred *cr, int32_t *rvalp)
8218348SEric.Yu@Sun.COM {
8228348SEric.Yu@Sun.COM 	int error = 0;
8238348SEric.Yu@Sun.COM 
8248348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_IOCTL(so, cmd, arg, mode, cr, rvalp));
8258348SEric.Yu@Sun.COM 
8268348SEric.Yu@Sun.COM 	/*
8278348SEric.Yu@Sun.COM 	 * If there is a pending error, return error
8288348SEric.Yu@Sun.COM 	 * This can happen if a non blocking operation caused an error.
8298348SEric.Yu@Sun.COM 	 */
8308348SEric.Yu@Sun.COM 	if (so->so_error != 0) {
8318348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
8328348SEric.Yu@Sun.COM 		error = sogeterr(so, B_TRUE);
8338348SEric.Yu@Sun.COM 		mutex_exit(&so->so_lock);
8348348SEric.Yu@Sun.COM 		if (error != 0)
8358348SEric.Yu@Sun.COM 			goto done;
8368348SEric.Yu@Sun.COM 	}
8378348SEric.Yu@Sun.COM 
8388348SEric.Yu@Sun.COM 	/*
8398348SEric.Yu@Sun.COM 	 * calling strioc can result in the socket falling back to TPI,
8408348SEric.Yu@Sun.COM 	 * if that is supported.
8418348SEric.Yu@Sun.COM 	 */
8428348SEric.Yu@Sun.COM 	if ((error = socket_ioctl_common(so, cmd, arg, mode, cr, rvalp)) < 0 &&
8438348SEric.Yu@Sun.COM 	    (error = socket_strioc_common(so, cmd, arg, mode, cr, rvalp)) < 0) {
8448348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_ioctl)(so->so_proto_handle,
8458348SEric.Yu@Sun.COM 		    cmd, arg, mode, rvalp, cr);
8468348SEric.Yu@Sun.COM 	}
8478348SEric.Yu@Sun.COM 
8488348SEric.Yu@Sun.COM done:
8498348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
8508348SEric.Yu@Sun.COM 
8518348SEric.Yu@Sun.COM 	return (error);
8528348SEric.Yu@Sun.COM }
8538348SEric.Yu@Sun.COM 
8548348SEric.Yu@Sun.COM int
8558348SEric.Yu@Sun.COM so_poll(struct sonode *so, short events, int anyyet, short *reventsp,
8568348SEric.Yu@Sun.COM     struct pollhead **phpp)
8578348SEric.Yu@Sun.COM {
8588348SEric.Yu@Sun.COM 	int state = so->so_state;
8598348SEric.Yu@Sun.COM 	*reventsp = 0;
8608348SEric.Yu@Sun.COM 
8618348SEric.Yu@Sun.COM 	if (so->so_error != 0 &&
8628348SEric.Yu@Sun.COM 	    ((POLLIN|POLLRDNORM|POLLOUT) & events)  != 0) {
8638348SEric.Yu@Sun.COM 		*reventsp = (POLLIN|POLLRDNORM|POLLOUT) & events;
8648348SEric.Yu@Sun.COM 		return (0);
8658348SEric.Yu@Sun.COM 	}
8668348SEric.Yu@Sun.COM 
8678348SEric.Yu@Sun.COM 	/*
8688348SEric.Yu@Sun.COM 	 * As long as there is buffer to send data, and the socket is
8698348SEric.Yu@Sun.COM 	 * in a state where it can send data (i.e., connected for
8708348SEric.Yu@Sun.COM 	 * connection oriented protocols), then turn on POLLOUT events
8718348SEric.Yu@Sun.COM 	 */
8728348SEric.Yu@Sun.COM 	if (!so->so_snd_qfull && ((so->so_mode & SM_CONNREQUIRED) == 0 ||
8738348SEric.Yu@Sun.COM 	    state & SS_ISCONNECTED)) {
8748348SEric.Yu@Sun.COM 		*reventsp |= POLLOUT & events;
8758348SEric.Yu@Sun.COM 	}
8768348SEric.Yu@Sun.COM 
8778348SEric.Yu@Sun.COM 	/*
8788348SEric.Yu@Sun.COM 	 * Turn on POLLIN whenever there is data on the receive queue,
8798348SEric.Yu@Sun.COM 	 * or the socket is in a state where no more data will be received.
8808348SEric.Yu@Sun.COM 	 * Also, if the socket is accepting connections, flip the bit if
8818348SEric.Yu@Sun.COM 	 * there is something on the queue.
8828427SAnders.Persson@Sun.COM 	 *
8838427SAnders.Persson@Sun.COM 	 * We do an initial check for events without holding locks. However,
8848427SAnders.Persson@Sun.COM 	 * if there are no event available, then we redo the check for POLLIN
8858427SAnders.Persson@Sun.COM 	 * events under the lock.
8868348SEric.Yu@Sun.COM 	 */
8878348SEric.Yu@Sun.COM 
8888348SEric.Yu@Sun.COM 	/* Pending connections */
8898348SEric.Yu@Sun.COM 	if (so->so_acceptq_len > 0)
8908348SEric.Yu@Sun.COM 		*reventsp |= (POLLIN|POLLRDNORM) & events;
8918348SEric.Yu@Sun.COM 
8928348SEric.Yu@Sun.COM 	/* Data */
8938348SEric.Yu@Sun.COM 	/* so_downcalls is null for sctp */
8948348SEric.Yu@Sun.COM 	if (so->so_downcalls != NULL && so->so_downcalls->sd_poll != NULL) {
8958348SEric.Yu@Sun.COM 		*reventsp |= (*so->so_downcalls->sd_poll)
8968348SEric.Yu@Sun.COM 		    (so->so_proto_handle, events & SO_PROTO_POLLEV, anyyet,
8978348SEric.Yu@Sun.COM 		    CRED()) & events;
8988348SEric.Yu@Sun.COM 		ASSERT((*reventsp & ~events) == 0);
8998348SEric.Yu@Sun.COM 		/* do not recheck events */
9008348SEric.Yu@Sun.COM 		events &= ~SO_PROTO_POLLEV;
9018348SEric.Yu@Sun.COM 	} else {
9028348SEric.Yu@Sun.COM 		if (SO_HAVE_DATA(so))
9038348SEric.Yu@Sun.COM 			*reventsp |= (POLLIN|POLLRDNORM) & events;
9048348SEric.Yu@Sun.COM 
9058348SEric.Yu@Sun.COM 		/* Urgent data */
9068348SEric.Yu@Sun.COM 		if ((state & SS_OOBPEND) != 0)
9078348SEric.Yu@Sun.COM 			*reventsp |= (POLLRDBAND) & events;
9088348SEric.Yu@Sun.COM 	}
9098348SEric.Yu@Sun.COM 
9108348SEric.Yu@Sun.COM 	if (!*reventsp && !anyyet) {
9118348SEric.Yu@Sun.COM 		/* Check for read events again, but this time under lock */
9128348SEric.Yu@Sun.COM 		if (events & (POLLIN|POLLRDNORM)) {
9138348SEric.Yu@Sun.COM 			mutex_enter(&so->so_lock);
9148348SEric.Yu@Sun.COM 			if (SO_HAVE_DATA(so) || so->so_acceptq_len > 0) {
9158348SEric.Yu@Sun.COM 				mutex_exit(&so->so_lock);
9168348SEric.Yu@Sun.COM 				*reventsp |= (POLLIN|POLLRDNORM) & events;
9178348SEric.Yu@Sun.COM 				return (0);
9188348SEric.Yu@Sun.COM 			} else {
9198348SEric.Yu@Sun.COM 				so->so_pollev |= SO_POLLEV_IN;
9208348SEric.Yu@Sun.COM 				mutex_exit(&so->so_lock);
9218348SEric.Yu@Sun.COM 			}
9228348SEric.Yu@Sun.COM 		}
9238348SEric.Yu@Sun.COM 		*phpp = &so->so_poll_list;
9248348SEric.Yu@Sun.COM 	}
9258348SEric.Yu@Sun.COM 	return (0);
9268348SEric.Yu@Sun.COM }
9278348SEric.Yu@Sun.COM 
9288348SEric.Yu@Sun.COM /*
9298348SEric.Yu@Sun.COM  * Generic Upcalls
9308348SEric.Yu@Sun.COM  */
9318348SEric.Yu@Sun.COM void
9328348SEric.Yu@Sun.COM so_connected(sock_upper_handle_t sock_handle, sock_connid_t id,
9338348SEric.Yu@Sun.COM     cred_t *peer_cred, pid_t peer_cpid)
9348348SEric.Yu@Sun.COM {
9358348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
9368348SEric.Yu@Sun.COM 
9378348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
9388348SEric.Yu@Sun.COM 	ASSERT(so->so_proto_handle != NULL);
9398348SEric.Yu@Sun.COM 
9408348SEric.Yu@Sun.COM 	if (peer_cred != NULL) {
9418348SEric.Yu@Sun.COM 		if (so->so_peercred != NULL)
9428348SEric.Yu@Sun.COM 			crfree(so->so_peercred);
9438348SEric.Yu@Sun.COM 		crhold(peer_cred);
9448348SEric.Yu@Sun.COM 		so->so_peercred = peer_cred;
9458348SEric.Yu@Sun.COM 		so->so_cpid = peer_cpid;
9468348SEric.Yu@Sun.COM 	}
9478348SEric.Yu@Sun.COM 
9488348SEric.Yu@Sun.COM 	so->so_proto_connid = id;
9498348SEric.Yu@Sun.COM 	soisconnected(so);
9508348SEric.Yu@Sun.COM 	/*
9518348SEric.Yu@Sun.COM 	 * Wake ones who're waiting for conn to become established.
9528348SEric.Yu@Sun.COM 	 */
9538348SEric.Yu@Sun.COM 	so_notify_connected(so);
9548348SEric.Yu@Sun.COM }
9558348SEric.Yu@Sun.COM 
9568348SEric.Yu@Sun.COM int
9578348SEric.Yu@Sun.COM so_disconnected(sock_upper_handle_t sock_handle, sock_connid_t id, int error)
9588348SEric.Yu@Sun.COM {
9598348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
9608348SEric.Yu@Sun.COM 
9618348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
9628348SEric.Yu@Sun.COM 
9638348SEric.Yu@Sun.COM 	so->so_proto_connid = id;
9648348SEric.Yu@Sun.COM 	soisdisconnected(so, error);
9658348SEric.Yu@Sun.COM 	so_notify_disconnected(so, error);
9668348SEric.Yu@Sun.COM 
9678348SEric.Yu@Sun.COM 	return (0);
9688348SEric.Yu@Sun.COM }
9698348SEric.Yu@Sun.COM 
9708348SEric.Yu@Sun.COM void
9718348SEric.Yu@Sun.COM so_opctl(sock_upper_handle_t sock_handle, sock_opctl_action_t action,
9728348SEric.Yu@Sun.COM     uintptr_t arg)
9738348SEric.Yu@Sun.COM {
9748348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
9758348SEric.Yu@Sun.COM 
9768348SEric.Yu@Sun.COM 	switch (action) {
9778348SEric.Yu@Sun.COM 	case SOCK_OPCTL_SHUT_SEND:
9788348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
9798348SEric.Yu@Sun.COM 		socantsendmore(so);
9808348SEric.Yu@Sun.COM 		so_notify_disconnecting(so);
9818348SEric.Yu@Sun.COM 		break;
9828348SEric.Yu@Sun.COM 	case SOCK_OPCTL_SHUT_RECV: {
9838348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
9848348SEric.Yu@Sun.COM 		socantrcvmore(so);
9858348SEric.Yu@Sun.COM 		so_notify_eof(so);
9868348SEric.Yu@Sun.COM 		break;
9878348SEric.Yu@Sun.COM 	}
9888348SEric.Yu@Sun.COM 	case SOCK_OPCTL_ENAB_ACCEPT:
9898348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
9908348SEric.Yu@Sun.COM 		so->so_state |= SS_ACCEPTCONN;
9918348SEric.Yu@Sun.COM 		so->so_backlog = (unsigned int)arg;
9928348SEric.Yu@Sun.COM 		mutex_exit(&so->so_lock);
9938348SEric.Yu@Sun.COM 		break;
9948348SEric.Yu@Sun.COM 	default:
9958348SEric.Yu@Sun.COM 		ASSERT(0);
9968348SEric.Yu@Sun.COM 		break;
9978348SEric.Yu@Sun.COM 	}
9988348SEric.Yu@Sun.COM }
9998348SEric.Yu@Sun.COM 
10008348SEric.Yu@Sun.COM void
10018348SEric.Yu@Sun.COM so_txq_full(sock_upper_handle_t sock_handle, boolean_t qfull)
10028348SEric.Yu@Sun.COM {
10038348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
10048348SEric.Yu@Sun.COM 
10058348SEric.Yu@Sun.COM 	if (qfull) {
10068348SEric.Yu@Sun.COM 		so_snd_qfull(so);
10078348SEric.Yu@Sun.COM 	} else {
10088348SEric.Yu@Sun.COM 		so_snd_qnotfull(so);
10098348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
10108348SEric.Yu@Sun.COM 		so_notify_writable(so);
10118348SEric.Yu@Sun.COM 	}
10128348SEric.Yu@Sun.COM }
10138348SEric.Yu@Sun.COM 
10148348SEric.Yu@Sun.COM sock_upper_handle_t
10158348SEric.Yu@Sun.COM so_newconn(sock_upper_handle_t parenthandle,
10168348SEric.Yu@Sun.COM     sock_lower_handle_t proto_handle, sock_downcalls_t *sock_downcalls,
10178348SEric.Yu@Sun.COM     struct cred *peer_cred, pid_t peer_cpid, sock_upcalls_t **sock_upcallsp)
10188348SEric.Yu@Sun.COM {
10198348SEric.Yu@Sun.COM 	struct sonode	*so = (struct sonode *)parenthandle;
10208348SEric.Yu@Sun.COM 	struct sonode	*nso;
10218348SEric.Yu@Sun.COM 	int error;
10228348SEric.Yu@Sun.COM 
10238348SEric.Yu@Sun.COM 	ASSERT(proto_handle != NULL);
10248348SEric.Yu@Sun.COM 
10258348SEric.Yu@Sun.COM 	if ((so->so_state & SS_ACCEPTCONN) == 0 ||
10268348SEric.Yu@Sun.COM 	    so->so_acceptq_len >= so->so_backlog)
10278348SEric.Yu@Sun.COM 		return (NULL);
10288348SEric.Yu@Sun.COM 
10298348SEric.Yu@Sun.COM 	nso = socket_newconn(so, proto_handle, sock_downcalls, SOCKET_NOSLEEP,
10308348SEric.Yu@Sun.COM 	    &error);
10318348SEric.Yu@Sun.COM 	if (nso == NULL)
10328348SEric.Yu@Sun.COM 		return (NULL);
10338348SEric.Yu@Sun.COM 
10348348SEric.Yu@Sun.COM 	if (peer_cred != NULL) {
10358348SEric.Yu@Sun.COM 		crhold(peer_cred);
10368348SEric.Yu@Sun.COM 		nso->so_peercred = peer_cred;
10378348SEric.Yu@Sun.COM 		nso->so_cpid = peer_cpid;
10388348SEric.Yu@Sun.COM 	}
10398348SEric.Yu@Sun.COM 
10408348SEric.Yu@Sun.COM 	(void) so_acceptq_enqueue(so, nso);
10418348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
10428348SEric.Yu@Sun.COM 	so_notify_newconn(so);
10438348SEric.Yu@Sun.COM 
10448348SEric.Yu@Sun.COM 	*sock_upcallsp = &so_upcalls;
10458348SEric.Yu@Sun.COM 
10468348SEric.Yu@Sun.COM 	return ((sock_upper_handle_t)nso);
10478348SEric.Yu@Sun.COM }
10488348SEric.Yu@Sun.COM 
10498348SEric.Yu@Sun.COM void
10508348SEric.Yu@Sun.COM so_set_prop(sock_upper_handle_t sock_handle, struct sock_proto_props *soppp)
10518348SEric.Yu@Sun.COM {
10528348SEric.Yu@Sun.COM 	struct sonode *so;
10538348SEric.Yu@Sun.COM 
10548348SEric.Yu@Sun.COM 	so = (struct sonode *)sock_handle;
10558348SEric.Yu@Sun.COM 
10568348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
10578348SEric.Yu@Sun.COM 
10588348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_MAXBLK)
10598348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_maxblk = soppp->sopp_maxblk;
10608348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_WROFF)
10618348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_wroff = soppp->sopp_wroff;
10628348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_TAIL)
10638348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_tail = soppp->sopp_tail;
10648348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_RCVHIWAT)
10658348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_rxhiwat = soppp->sopp_rxhiwat;
10668348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_RCVLOWAT)
10678348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_rxlowat = soppp->sopp_rxlowat;
10688348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_MAXPSZ)
10698348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_maxpsz = soppp->sopp_maxpsz;
10708348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_MINPSZ)
10718348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_minpsz = soppp->sopp_minpsz;
10728348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_ZCOPY) {
10738348SEric.Yu@Sun.COM 		if (soppp->sopp_zcopyflag & ZCVMSAFE) {
10748348SEric.Yu@Sun.COM 			so->so_proto_props.sopp_zcopyflag |= STZCVMSAFE;
10758348SEric.Yu@Sun.COM 			so->so_proto_props.sopp_zcopyflag &= ~STZCVMUNSAFE;
10768348SEric.Yu@Sun.COM 		} else if (soppp->sopp_zcopyflag & ZCVMUNSAFE) {
10778348SEric.Yu@Sun.COM 			so->so_proto_props.sopp_zcopyflag |= STZCVMUNSAFE;
10788348SEric.Yu@Sun.COM 			so->so_proto_props.sopp_zcopyflag &= ~STZCVMSAFE;
10798348SEric.Yu@Sun.COM 		}
10808348SEric.Yu@Sun.COM 
10818348SEric.Yu@Sun.COM 		if (soppp->sopp_zcopyflag & COPYCACHED) {
10828348SEric.Yu@Sun.COM 			so->so_proto_props.sopp_zcopyflag |= STRCOPYCACHED;
10838348SEric.Yu@Sun.COM 		}
10848348SEric.Yu@Sun.COM 	}
10858348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_OOBINLINE)
10868348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_oobinline = soppp->sopp_oobinline;
10878348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_RCVTIMER)
10888348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_rcvtimer = soppp->sopp_rcvtimer;
10898348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_RCVTHRESH)
10908348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_rcvthresh = soppp->sopp_rcvthresh;
10918348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_MAXADDRLEN)
10928348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_maxaddrlen = soppp->sopp_maxaddrlen;
10938348SEric.Yu@Sun.COM 
10948348SEric.Yu@Sun.COM 	mutex_exit(&so->so_lock);
10958348SEric.Yu@Sun.COM 
10968348SEric.Yu@Sun.COM #ifdef DEBUG
10978348SEric.Yu@Sun.COM 	soppp->sopp_flags &= ~(SOCKOPT_MAXBLK | SOCKOPT_WROFF | SOCKOPT_TAIL |
10988348SEric.Yu@Sun.COM 	    SOCKOPT_RCVHIWAT | SOCKOPT_RCVLOWAT | SOCKOPT_MAXPSZ |
10998348SEric.Yu@Sun.COM 	    SOCKOPT_ZCOPY | SOCKOPT_OOBINLINE | SOCKOPT_RCVTIMER |
11008348SEric.Yu@Sun.COM 	    SOCKOPT_RCVTHRESH | SOCKOPT_MAXADDRLEN | SOCKOPT_MINPSZ);
11018348SEric.Yu@Sun.COM 	ASSERT(soppp->sopp_flags == 0);
11028348SEric.Yu@Sun.COM #endif
11038348SEric.Yu@Sun.COM }
11048348SEric.Yu@Sun.COM 
11058348SEric.Yu@Sun.COM /* ARGSUSED */
11068348SEric.Yu@Sun.COM ssize_t
11078348SEric.Yu@Sun.COM so_queue_msg(sock_upper_handle_t sock_handle, mblk_t *mp,
11088348SEric.Yu@Sun.COM     size_t msg_size, int flags, int *errorp,  boolean_t *force_pushp)
11098348SEric.Yu@Sun.COM {
11108348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
11118348SEric.Yu@Sun.COM 	boolean_t force_push = B_TRUE;
11128348SEric.Yu@Sun.COM 	int space_left;
11138348SEric.Yu@Sun.COM 	sodirect_t *sodp = so->so_direct;
11148348SEric.Yu@Sun.COM 
11158348SEric.Yu@Sun.COM 	ASSERT(errorp != NULL);
11168348SEric.Yu@Sun.COM 	*errorp = 0;
11178348SEric.Yu@Sun.COM 	if (mp == NULL) {
11188348SEric.Yu@Sun.COM 		if (msg_size > 0) {
11198348SEric.Yu@Sun.COM 			ASSERT(so->so_downcalls->sd_recv_uio != NULL);
11208348SEric.Yu@Sun.COM 			mutex_enter(&so->so_lock);
11218348SEric.Yu@Sun.COM 			/* the notify functions will drop the lock */
11228348SEric.Yu@Sun.COM 			if (flags & MSG_OOB)
11238348SEric.Yu@Sun.COM 				so_notify_oobdata(so, IS_SO_OOB_INLINE(so));
11248348SEric.Yu@Sun.COM 			else
11258348SEric.Yu@Sun.COM 				so_notify_data(so, msg_size);
11268348SEric.Yu@Sun.COM 			return (0);
11278348SEric.Yu@Sun.COM 		}
11288348SEric.Yu@Sun.COM 		/*
11298348SEric.Yu@Sun.COM 		 * recv space check
11308348SEric.Yu@Sun.COM 		 */
11318348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
11328348SEric.Yu@Sun.COM 		space_left = so->so_rcvbuf - so->so_rcv_queued;
11338348SEric.Yu@Sun.COM 		if (space_left <= 0) {
11348348SEric.Yu@Sun.COM 			so->so_flowctrld = B_TRUE;
11358348SEric.Yu@Sun.COM 			*errorp = ENOSPC;
11368348SEric.Yu@Sun.COM 			space_left = -1;
11378348SEric.Yu@Sun.COM 		}
11388348SEric.Yu@Sun.COM 		goto done_unlock;
11398348SEric.Yu@Sun.COM 	}
11408348SEric.Yu@Sun.COM 
11418348SEric.Yu@Sun.COM 	ASSERT(mp->b_next == NULL);
11428348SEric.Yu@Sun.COM 	ASSERT(DB_TYPE(mp) == M_DATA || DB_TYPE(mp) == M_PROTO);
11438348SEric.Yu@Sun.COM 	ASSERT(msg_size == msgdsize(mp));
11448348SEric.Yu@Sun.COM 
11458348SEric.Yu@Sun.COM 	if (flags & MSG_OOB) {
11468348SEric.Yu@Sun.COM 		so_queue_oob(sock_handle, mp, msg_size);
11478348SEric.Yu@Sun.COM 		return (0);
11488348SEric.Yu@Sun.COM 	}
11498348SEric.Yu@Sun.COM 
11508348SEric.Yu@Sun.COM 	if (force_pushp != NULL)
11518348SEric.Yu@Sun.COM 		force_push = *force_pushp;
11528348SEric.Yu@Sun.COM 
11538348SEric.Yu@Sun.COM 	if (DB_TYPE(mp) == M_PROTO && !__TPI_PRIM_ISALIGNED(mp->b_rptr)) {
11548348SEric.Yu@Sun.COM 		/* The read pointer is not aligned correctly for TPI */
11558348SEric.Yu@Sun.COM 		zcmn_err(getzoneid(), CE_WARN,
11568348SEric.Yu@Sun.COM 		    "sockfs: Unaligned TPI message received. rptr = %p\n",
11578348SEric.Yu@Sun.COM 		    (void *)mp->b_rptr);
11588348SEric.Yu@Sun.COM 		freemsg(mp);
11598348SEric.Yu@Sun.COM 		mutex_enter(sodp->sod_lockp);
11608348SEric.Yu@Sun.COM 		SOD_UIOAFINI(sodp);
11618348SEric.Yu@Sun.COM 		mutex_exit(sodp->sod_lockp);
11628348SEric.Yu@Sun.COM 
11638348SEric.Yu@Sun.COM 		return (so->so_rcvbuf - so->so_rcv_queued);
11648348SEric.Yu@Sun.COM 	}
11658348SEric.Yu@Sun.COM 
11668348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
11678348SEric.Yu@Sun.COM 	if (so->so_state & (SS_FALLBACK_PENDING | SS_FALLBACK_COMP)) {
11688348SEric.Yu@Sun.COM 		SOD_DISABLE(sodp);
11698348SEric.Yu@Sun.COM 		mutex_exit(&so->so_lock);
11708348SEric.Yu@Sun.COM 		*errorp = EOPNOTSUPP;
11718348SEric.Yu@Sun.COM 		return (-1);
11728348SEric.Yu@Sun.COM 	}
11738348SEric.Yu@Sun.COM 	if (so->so_state & SS_CANTRCVMORE) {
11748348SEric.Yu@Sun.COM 		freemsg(mp);
11758348SEric.Yu@Sun.COM 		SOD_DISABLE(sodp);
11768348SEric.Yu@Sun.COM 		mutex_exit(&so->so_lock);
11778348SEric.Yu@Sun.COM 		return (0);
11788348SEric.Yu@Sun.COM 	}
11798348SEric.Yu@Sun.COM 
11808348SEric.Yu@Sun.COM 	/* process the mblk via I/OAT if capable */
11818348SEric.Yu@Sun.COM 	if (sodp != NULL && (sodp->sod_state & SOD_ENABLED)) {
11828348SEric.Yu@Sun.COM 		if (DB_TYPE(mp) == M_DATA) {
11838348SEric.Yu@Sun.COM 			(void) sod_uioa_mblk_init(sodp, mp, msg_size);
11848348SEric.Yu@Sun.COM 		} else {
11858348SEric.Yu@Sun.COM 			SOD_UIOAFINI(sodp);
11868348SEric.Yu@Sun.COM 		}
11878348SEric.Yu@Sun.COM 	}
11888348SEric.Yu@Sun.COM 
11898348SEric.Yu@Sun.COM 	if (mp->b_next == NULL) {
11908348SEric.Yu@Sun.COM 		so_enqueue_msg(so, mp, msg_size);
11918348SEric.Yu@Sun.COM 	} else {
11928348SEric.Yu@Sun.COM 		do {
11938348SEric.Yu@Sun.COM 			mblk_t *nmp;
11948348SEric.Yu@Sun.COM 
11958348SEric.Yu@Sun.COM 			if ((nmp = mp->b_next) != NULL) {
11968348SEric.Yu@Sun.COM 				mp->b_next = NULL;
11978348SEric.Yu@Sun.COM 			}
11988348SEric.Yu@Sun.COM 			so_enqueue_msg(so, mp, msgdsize(mp));
11998348SEric.Yu@Sun.COM 			mp = nmp;
12008348SEric.Yu@Sun.COM 		} while (mp != NULL);
12018348SEric.Yu@Sun.COM 	}
12028348SEric.Yu@Sun.COM 
12038348SEric.Yu@Sun.COM 	space_left = so->so_rcvbuf - so->so_rcv_queued;
12048348SEric.Yu@Sun.COM 	if (space_left <= 0) {
12058348SEric.Yu@Sun.COM 		so->so_flowctrld = B_TRUE;
12068348SEric.Yu@Sun.COM 		*errorp = ENOSPC;
12078348SEric.Yu@Sun.COM 		space_left = -1;
12088348SEric.Yu@Sun.COM 	}
12098348SEric.Yu@Sun.COM 
12108348SEric.Yu@Sun.COM 	if (force_push || so->so_rcv_queued >= so->so_rcv_thresh ||
12118348SEric.Yu@Sun.COM 	    so->so_rcv_queued >= so->so_rcv_wanted ||
12128348SEric.Yu@Sun.COM 	    (sodp != NULL && so->so_rcv_queued >= sodp->sod_want)) {
12138348SEric.Yu@Sun.COM 		SOCKET_TIMER_CANCEL(so);
12148348SEric.Yu@Sun.COM 		/*
12158348SEric.Yu@Sun.COM 		 * so_notify_data will release the lock
12168348SEric.Yu@Sun.COM 		 */
12178348SEric.Yu@Sun.COM 		so_notify_data(so, so->so_rcv_queued);
12188348SEric.Yu@Sun.COM 
12198348SEric.Yu@Sun.COM 		if (force_pushp != NULL)
12208348SEric.Yu@Sun.COM 			*force_pushp = B_TRUE;
12218348SEric.Yu@Sun.COM 		goto done;
12228348SEric.Yu@Sun.COM 	} else if (so->so_rcv_timer_tid == 0) {
12238348SEric.Yu@Sun.COM 		/* Make sure the recv push timer is running */
12248348SEric.Yu@Sun.COM 		SOCKET_TIMER_START(so);
12258348SEric.Yu@Sun.COM 	}
12268348SEric.Yu@Sun.COM 
12278348SEric.Yu@Sun.COM done_unlock:
12288348SEric.Yu@Sun.COM 	mutex_exit(&so->so_lock);
12298348SEric.Yu@Sun.COM done:
12308348SEric.Yu@Sun.COM 	return (space_left);
12318348SEric.Yu@Sun.COM }
12328348SEric.Yu@Sun.COM 
12338348SEric.Yu@Sun.COM /*
12348348SEric.Yu@Sun.COM  * Set the offset of where the oob data is relative to the bytes in
12358348SEric.Yu@Sun.COM  * queued. Also generate SIGURG
12368348SEric.Yu@Sun.COM  */
12378348SEric.Yu@Sun.COM void
12388348SEric.Yu@Sun.COM so_signal_oob(sock_upper_handle_t sock_handle, ssize_t offset)
12398348SEric.Yu@Sun.COM {
12408348SEric.Yu@Sun.COM 	struct sonode *so;
12418348SEric.Yu@Sun.COM 
12428348SEric.Yu@Sun.COM 	ASSERT(offset >= 0);
12438348SEric.Yu@Sun.COM 	so = (struct sonode *)sock_handle;
12448348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
12458348SEric.Yu@Sun.COM 	SOD_UIOAFINI(so->so_direct);
12468348SEric.Yu@Sun.COM 
12478348SEric.Yu@Sun.COM 	/*
12488348SEric.Yu@Sun.COM 	 * New urgent data on the way so forget about any old
12498348SEric.Yu@Sun.COM 	 * urgent data.
12508348SEric.Yu@Sun.COM 	 */
12518348SEric.Yu@Sun.COM 	so->so_state &= ~(SS_HAVEOOBDATA|SS_HADOOBDATA);
12528348SEric.Yu@Sun.COM 
12538348SEric.Yu@Sun.COM 	/*
12548348SEric.Yu@Sun.COM 	 * Record that urgent data is pending.
12558348SEric.Yu@Sun.COM 	 */
12568348SEric.Yu@Sun.COM 	so->so_state |= SS_OOBPEND;
12578348SEric.Yu@Sun.COM 
12588348SEric.Yu@Sun.COM 	if (so->so_oobmsg != NULL) {
12598348SEric.Yu@Sun.COM 		dprintso(so, 1, ("sock: discarding old oob\n"));
12608348SEric.Yu@Sun.COM 		freemsg(so->so_oobmsg);
12618348SEric.Yu@Sun.COM 		so->so_oobmsg = NULL;
12628348SEric.Yu@Sun.COM 	}
12638348SEric.Yu@Sun.COM 
12648348SEric.Yu@Sun.COM 	/*
12658348SEric.Yu@Sun.COM 	 * set the offset where the urgent byte is
12668348SEric.Yu@Sun.COM 	 */
12678348SEric.Yu@Sun.COM 	so->so_oobmark = so->so_rcv_queued + offset;
12688348SEric.Yu@Sun.COM 	if (so->so_oobmark == 0)
12698348SEric.Yu@Sun.COM 		so->so_state |= SS_RCVATMARK;
12708348SEric.Yu@Sun.COM 	else
12718348SEric.Yu@Sun.COM 		so->so_state &= ~SS_RCVATMARK;
12728348SEric.Yu@Sun.COM 
12738348SEric.Yu@Sun.COM 	so_notify_oobsig(so);
12748348SEric.Yu@Sun.COM }
12758348SEric.Yu@Sun.COM 
12768348SEric.Yu@Sun.COM /*
12778348SEric.Yu@Sun.COM  * Queue the OOB byte
12788348SEric.Yu@Sun.COM  */
12798348SEric.Yu@Sun.COM static void
12808348SEric.Yu@Sun.COM so_queue_oob(sock_upper_handle_t sock_handle, mblk_t *mp, size_t len)
12818348SEric.Yu@Sun.COM {
12828348SEric.Yu@Sun.COM 	struct sonode *so;
12838348SEric.Yu@Sun.COM 
12848348SEric.Yu@Sun.COM 	so = (struct sonode *)sock_handle;
12858348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
12868348SEric.Yu@Sun.COM 	SOD_UIOAFINI(so->so_direct);
12878348SEric.Yu@Sun.COM 
12888348SEric.Yu@Sun.COM 	ASSERT(mp != NULL);
12898348SEric.Yu@Sun.COM 	if (!IS_SO_OOB_INLINE(so)) {
12908348SEric.Yu@Sun.COM 		so->so_oobmsg = mp;
12918348SEric.Yu@Sun.COM 		so->so_state |= SS_HAVEOOBDATA;
12928348SEric.Yu@Sun.COM 	} else {
12938348SEric.Yu@Sun.COM 		so_enqueue_msg(so, mp, len);
12948348SEric.Yu@Sun.COM 	}
12958348SEric.Yu@Sun.COM 
12968348SEric.Yu@Sun.COM 	so_notify_oobdata(so, IS_SO_OOB_INLINE(so));
12978348SEric.Yu@Sun.COM }
12988348SEric.Yu@Sun.COM 
12998348SEric.Yu@Sun.COM int
13008348SEric.Yu@Sun.COM so_close(struct sonode *so, int flag, struct cred *cr)
13018348SEric.Yu@Sun.COM {
13028348SEric.Yu@Sun.COM 	int error;
13038348SEric.Yu@Sun.COM 
13048348SEric.Yu@Sun.COM 	error = (*so->so_downcalls->sd_close)(so->so_proto_handle, flag, cr);
13058348SEric.Yu@Sun.COM 
13068348SEric.Yu@Sun.COM 	/*
13078348SEric.Yu@Sun.COM 	 * At this point there will be no more upcalls from the protocol
13088348SEric.Yu@Sun.COM 	 */
13098348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
13108399SRao.Shoaib@Sun.COM 
13118399SRao.Shoaib@Sun.COM 	ASSERT(so_verify_oobstate(so));
13128399SRao.Shoaib@Sun.COM 
13138348SEric.Yu@Sun.COM 	so_rcv_flush(so);
13148348SEric.Yu@Sun.COM 	mutex_exit(&so->so_lock);
13158348SEric.Yu@Sun.COM 
13168348SEric.Yu@Sun.COM 	return (error);
13178348SEric.Yu@Sun.COM }
13188348SEric.Yu@Sun.COM 
13198348SEric.Yu@Sun.COM void
13208348SEric.Yu@Sun.COM so_zcopy_notify(sock_upper_handle_t sock_handle)
13218348SEric.Yu@Sun.COM {
13228348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
13238348SEric.Yu@Sun.COM 
13248348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
13258348SEric.Yu@Sun.COM 	so->so_copyflag |= STZCNOTIFY;
13268348SEric.Yu@Sun.COM 	cv_broadcast(&so->so_copy_cv);
13278348SEric.Yu@Sun.COM 	mutex_exit(&so->so_lock);
13288348SEric.Yu@Sun.COM }
13298348SEric.Yu@Sun.COM 
13308348SEric.Yu@Sun.COM void
13318348SEric.Yu@Sun.COM so_set_error(sock_upper_handle_t sock_handle, int error)
13328348SEric.Yu@Sun.COM {
13338348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
13348348SEric.Yu@Sun.COM 
13358348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
13368348SEric.Yu@Sun.COM 
13378348SEric.Yu@Sun.COM 	soseterror(so, error);
13388348SEric.Yu@Sun.COM 
13398348SEric.Yu@Sun.COM 	so_notify_error(so);
13408348SEric.Yu@Sun.COM }
13418348SEric.Yu@Sun.COM 
13428348SEric.Yu@Sun.COM /*
13438348SEric.Yu@Sun.COM  * so_recvmsg - read data from the socket
13448348SEric.Yu@Sun.COM  *
13458348SEric.Yu@Sun.COM  * There are two ways of obtaining data; either we ask the protocol to
13468348SEric.Yu@Sun.COM  * copy directly into the supplied buffer, or we copy data from the
13478348SEric.Yu@Sun.COM  * sonode's receive queue. The decision which one to use depends on
13488348SEric.Yu@Sun.COM  * whether the protocol has a sd_recv_uio down call.
13498348SEric.Yu@Sun.COM  */
13508348SEric.Yu@Sun.COM int
13518348SEric.Yu@Sun.COM so_recvmsg(struct sonode *so, struct nmsghdr *msg, struct uio *uiop,
13528348SEric.Yu@Sun.COM     struct cred *cr)
13538348SEric.Yu@Sun.COM {
13548348SEric.Yu@Sun.COM 	rval_t 		rval;
13558348SEric.Yu@Sun.COM 	int 		flags = 0;
13568348SEric.Yu@Sun.COM 	t_uscalar_t	controllen, namelen;
13578348SEric.Yu@Sun.COM 	int 		error = 0;
13588348SEric.Yu@Sun.COM 	int ret;
13598348SEric.Yu@Sun.COM 	mblk_t		*mctlp = NULL;
13608348SEric.Yu@Sun.COM 	union T_primitives *tpr;
13618348SEric.Yu@Sun.COM 	void		*control;
13628348SEric.Yu@Sun.COM 	ssize_t		saved_resid;
13638348SEric.Yu@Sun.COM 	struct uio	*suiop;
13648348SEric.Yu@Sun.COM 
13658348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_RECVMSG(so, msg, uiop, cr));
13668348SEric.Yu@Sun.COM 
13678348SEric.Yu@Sun.COM 	if ((so->so_state & (SS_ISCONNECTED|SS_CANTRCVMORE)) == 0 &&
13688348SEric.Yu@Sun.COM 	    (so->so_mode & SM_CONNREQUIRED)) {
13698348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
13708348SEric.Yu@Sun.COM 		return (ENOTCONN);
13718348SEric.Yu@Sun.COM 	}
13728348SEric.Yu@Sun.COM 
13738348SEric.Yu@Sun.COM 	if (msg->msg_flags & MSG_PEEK)
13748348SEric.Yu@Sun.COM 		msg->msg_flags &= ~MSG_WAITALL;
13758348SEric.Yu@Sun.COM 
13768348SEric.Yu@Sun.COM 	if (so->so_mode & SM_ATOMIC)
13778348SEric.Yu@Sun.COM 		msg->msg_flags |= MSG_TRUNC;
13788348SEric.Yu@Sun.COM 
13798348SEric.Yu@Sun.COM 	if (msg->msg_flags & MSG_OOB) {
13808348SEric.Yu@Sun.COM 		if ((so->so_mode & SM_EXDATA) == 0) {
13818348SEric.Yu@Sun.COM 			error = EOPNOTSUPP;
13828348SEric.Yu@Sun.COM 		} else if (so->so_downcalls->sd_recv_uio != NULL) {
13838348SEric.Yu@Sun.COM 			error = (*so->so_downcalls->sd_recv_uio)
13848348SEric.Yu@Sun.COM 			    (so->so_proto_handle, uiop, msg, cr);
13858348SEric.Yu@Sun.COM 		} else {
13868348SEric.Yu@Sun.COM 			error = sorecvoob(so, msg, uiop, msg->msg_flags,
13878348SEric.Yu@Sun.COM 			    IS_SO_OOB_INLINE(so));
13888348SEric.Yu@Sun.COM 		}
13898348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
13908348SEric.Yu@Sun.COM 		return (error);
13918348SEric.Yu@Sun.COM 	}
13928348SEric.Yu@Sun.COM 
13938348SEric.Yu@Sun.COM 	/*
13948348SEric.Yu@Sun.COM 	 * If the protocol has the recv down call, then pass the request
13958348SEric.Yu@Sun.COM 	 * down.
13968348SEric.Yu@Sun.COM 	 */
13978348SEric.Yu@Sun.COM 	if (so->so_downcalls->sd_recv_uio != NULL) {
13988348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_recv_uio)
13998348SEric.Yu@Sun.COM 		    (so->so_proto_handle, uiop, msg, cr);
14008348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
14018348SEric.Yu@Sun.COM 		return (error);
14028348SEric.Yu@Sun.COM 	}
14038348SEric.Yu@Sun.COM 
14048348SEric.Yu@Sun.COM 	/*
14058348SEric.Yu@Sun.COM 	 * Reading data from the socket buffer
14068348SEric.Yu@Sun.COM 	 */
14078348SEric.Yu@Sun.COM 	flags = msg->msg_flags;
14088348SEric.Yu@Sun.COM 	msg->msg_flags = 0;
14098348SEric.Yu@Sun.COM 
14108348SEric.Yu@Sun.COM 	/*
14118348SEric.Yu@Sun.COM 	 * Set msg_controllen and msg_namelen to zero here to make it
14128348SEric.Yu@Sun.COM 	 * simpler in the cases that no control or name is returned.
14138348SEric.Yu@Sun.COM 	 */
14148348SEric.Yu@Sun.COM 	controllen = msg->msg_controllen;
14158348SEric.Yu@Sun.COM 	namelen = msg->msg_namelen;
14168348SEric.Yu@Sun.COM 	msg->msg_controllen = 0;
14178348SEric.Yu@Sun.COM 	msg->msg_namelen = 0;
14188348SEric.Yu@Sun.COM 
14198348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
14208348SEric.Yu@Sun.COM 	/* Set SOREADLOCKED */
14218348SEric.Yu@Sun.COM 	error = so_lock_read_intr(so,
14228348SEric.Yu@Sun.COM 	    uiop->uio_fmode | ((flags & MSG_DONTWAIT) ? FNONBLOCK : 0));
14238348SEric.Yu@Sun.COM 	mutex_exit(&so->so_lock);
14248348SEric.Yu@Sun.COM 	if (error) {
14258348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
14268348SEric.Yu@Sun.COM 		return (error);
14278348SEric.Yu@Sun.COM 	}
14288348SEric.Yu@Sun.COM 
14298348SEric.Yu@Sun.COM 	suiop = sod_rcv_init(so, flags, &uiop);
14308348SEric.Yu@Sun.COM retry:
14318348SEric.Yu@Sun.COM 	saved_resid = uiop->uio_resid;
14328348SEric.Yu@Sun.COM 	error = so_dequeue_msg(so, &mctlp, uiop, &rval, flags);
14338348SEric.Yu@Sun.COM 	if (error != 0) {
14348348SEric.Yu@Sun.COM 		goto out;
14358348SEric.Yu@Sun.COM 	}
14368348SEric.Yu@Sun.COM 	/*
14378348SEric.Yu@Sun.COM 	 * For datagrams the MOREDATA flag is used to set MSG_TRUNC.
14388348SEric.Yu@Sun.COM 	 * For non-datagrams MOREDATA is used to set MSG_EOR.
14398348SEric.Yu@Sun.COM 	 */
14408348SEric.Yu@Sun.COM 	ASSERT(!(rval.r_val1 & MORECTL));
14418348SEric.Yu@Sun.COM 	if ((rval.r_val1 & MOREDATA) && (so->so_mode & SM_ATOMIC))
14428348SEric.Yu@Sun.COM 		msg->msg_flags |= MSG_TRUNC;
14438348SEric.Yu@Sun.COM 	if (mctlp == NULL) {
14448348SEric.Yu@Sun.COM 		dprintso(so, 1, ("so_recvmsg: got M_DATA\n"));
14458348SEric.Yu@Sun.COM 
14468348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
14478348SEric.Yu@Sun.COM 		/* Set MSG_EOR based on MOREDATA */
14488348SEric.Yu@Sun.COM 		if (!(rval.r_val1 & MOREDATA)) {
14498348SEric.Yu@Sun.COM 			if (so->so_state & SS_SAVEDEOR) {
14508348SEric.Yu@Sun.COM 				msg->msg_flags |= MSG_EOR;
14518348SEric.Yu@Sun.COM 				so->so_state &= ~SS_SAVEDEOR;
14528348SEric.Yu@Sun.COM 			}
14538348SEric.Yu@Sun.COM 		}
14548348SEric.Yu@Sun.COM 		/*
14558348SEric.Yu@Sun.COM 		 * If some data was received (i.e. not EOF) and the
14568348SEric.Yu@Sun.COM 		 * read/recv* has not been satisfied wait for some more.
14578348SEric.Yu@Sun.COM 		 */
14588348SEric.Yu@Sun.COM 		if ((flags & MSG_WAITALL) && !(msg->msg_flags & MSG_EOR) &&
14598348SEric.Yu@Sun.COM 		    uiop->uio_resid != saved_resid && uiop->uio_resid > 0) {
14608348SEric.Yu@Sun.COM 			mutex_exit(&so->so_lock);
14618348SEric.Yu@Sun.COM 			goto retry;
14628348SEric.Yu@Sun.COM 		}
14638348SEric.Yu@Sun.COM 
14648348SEric.Yu@Sun.COM 		goto out_locked;
14658348SEric.Yu@Sun.COM 	}
14668348SEric.Yu@Sun.COM 	/* strsock_proto has already verified length and alignment */
14678348SEric.Yu@Sun.COM 	tpr = (union T_primitives *)mctlp->b_rptr;
14688348SEric.Yu@Sun.COM 	dprintso(so, 1, ("so_recvmsg: type %d\n", tpr->type));
14698348SEric.Yu@Sun.COM 	switch (tpr->type) {
14708348SEric.Yu@Sun.COM 	case T_DATA_IND: {
14718348SEric.Yu@Sun.COM 		/*
14728348SEric.Yu@Sun.COM 		 * Set msg_flags to MSG_EOR based on
14738348SEric.Yu@Sun.COM 		 * MORE_flag and MOREDATA.
14748348SEric.Yu@Sun.COM 		 */
14758348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
14768348SEric.Yu@Sun.COM 		so->so_state &= ~SS_SAVEDEOR;
14778348SEric.Yu@Sun.COM 		if (!(tpr->data_ind.MORE_flag & 1)) {
14788348SEric.Yu@Sun.COM 			if (!(rval.r_val1 & MOREDATA))
14798348SEric.Yu@Sun.COM 				msg->msg_flags |= MSG_EOR;
14808348SEric.Yu@Sun.COM 			else
14818348SEric.Yu@Sun.COM 				so->so_state |= SS_SAVEDEOR;
14828348SEric.Yu@Sun.COM 		}
14838348SEric.Yu@Sun.COM 		freemsg(mctlp);
14848348SEric.Yu@Sun.COM 		/*
14858348SEric.Yu@Sun.COM 		 * If some data was received (i.e. not EOF) and the
14868348SEric.Yu@Sun.COM 		 * read/recv* has not been satisfied wait for some more.
14878348SEric.Yu@Sun.COM 		 */
14888348SEric.Yu@Sun.COM 		if ((flags & MSG_WAITALL) && !(msg->msg_flags & MSG_EOR) &&
14898348SEric.Yu@Sun.COM 		    uiop->uio_resid != saved_resid && uiop->uio_resid > 0) {
14908348SEric.Yu@Sun.COM 			mutex_exit(&so->so_lock);
14918348SEric.Yu@Sun.COM 			goto retry;
14928348SEric.Yu@Sun.COM 		}
14938348SEric.Yu@Sun.COM 		goto out_locked;
14948348SEric.Yu@Sun.COM 	}
14958348SEric.Yu@Sun.COM 	case T_UNITDATA_IND: {
14968348SEric.Yu@Sun.COM 		void *addr;
14978348SEric.Yu@Sun.COM 		t_uscalar_t addrlen;
14988348SEric.Yu@Sun.COM 		void *abuf;
14998348SEric.Yu@Sun.COM 		t_uscalar_t optlen;
15008348SEric.Yu@Sun.COM 		void *opt;
15018348SEric.Yu@Sun.COM 
15028348SEric.Yu@Sun.COM 		if (namelen != 0) {
15038348SEric.Yu@Sun.COM 			/* Caller wants source address */
15048348SEric.Yu@Sun.COM 			addrlen = tpr->unitdata_ind.SRC_length;
15058348SEric.Yu@Sun.COM 			addr = sogetoff(mctlp, tpr->unitdata_ind.SRC_offset,
15068348SEric.Yu@Sun.COM 			    addrlen, 1);
15078348SEric.Yu@Sun.COM 			if (addr == NULL) {
15088348SEric.Yu@Sun.COM 				freemsg(mctlp);
15098348SEric.Yu@Sun.COM 				error = EPROTO;
15108348SEric.Yu@Sun.COM 				eprintsoline(so, error);
15118348SEric.Yu@Sun.COM 				goto out;
15128348SEric.Yu@Sun.COM 			}
15138348SEric.Yu@Sun.COM 			ASSERT(so->so_family != AF_UNIX);
15148348SEric.Yu@Sun.COM 		}
15158348SEric.Yu@Sun.COM 		optlen = tpr->unitdata_ind.OPT_length;
15168348SEric.Yu@Sun.COM 		if (optlen != 0) {
15178348SEric.Yu@Sun.COM 			t_uscalar_t ncontrollen;
15188348SEric.Yu@Sun.COM 
15198348SEric.Yu@Sun.COM 			/*
15208348SEric.Yu@Sun.COM 			 * Extract any source address option.
15218348SEric.Yu@Sun.COM 			 * Determine how large cmsg buffer is needed.
15228348SEric.Yu@Sun.COM 			 */
15238348SEric.Yu@Sun.COM 			opt = sogetoff(mctlp, tpr->unitdata_ind.OPT_offset,
15248348SEric.Yu@Sun.COM 			    optlen, __TPI_ALIGN_SIZE);
15258348SEric.Yu@Sun.COM 
15268348SEric.Yu@Sun.COM 			if (opt == NULL) {
15278348SEric.Yu@Sun.COM 				freemsg(mctlp);
15288348SEric.Yu@Sun.COM 				error = EPROTO;
15298348SEric.Yu@Sun.COM 				eprintsoline(so, error);
15308348SEric.Yu@Sun.COM 				goto out;
15318348SEric.Yu@Sun.COM 			}
15328348SEric.Yu@Sun.COM 			if (so->so_family == AF_UNIX)
15338348SEric.Yu@Sun.COM 				so_getopt_srcaddr(opt, optlen, &addr, &addrlen);
15348348SEric.Yu@Sun.COM 			ncontrollen = so_cmsglen(mctlp, opt, optlen,
15358348SEric.Yu@Sun.COM 			    !(flags & MSG_XPG4_2));
15368348SEric.Yu@Sun.COM 			if (controllen != 0)
15378348SEric.Yu@Sun.COM 				controllen = ncontrollen;
15388348SEric.Yu@Sun.COM 			else if (ncontrollen != 0)
15398348SEric.Yu@Sun.COM 				msg->msg_flags |= MSG_CTRUNC;
15408348SEric.Yu@Sun.COM 		} else {
15418348SEric.Yu@Sun.COM 			controllen = 0;
15428348SEric.Yu@Sun.COM 		}
15438348SEric.Yu@Sun.COM 
15448348SEric.Yu@Sun.COM 		if (namelen != 0) {
15458348SEric.Yu@Sun.COM 			/*
15468348SEric.Yu@Sun.COM 			 * Return address to caller.
15478348SEric.Yu@Sun.COM 			 * Caller handles truncation if length
15488348SEric.Yu@Sun.COM 			 * exceeds msg_namelen.
15498348SEric.Yu@Sun.COM 			 * NOTE: AF_UNIX NUL termination is ensured by
15508348SEric.Yu@Sun.COM 			 * the sender's copyin_name().
15518348SEric.Yu@Sun.COM 			 */
15528348SEric.Yu@Sun.COM 			abuf = kmem_alloc(addrlen, KM_SLEEP);
15538348SEric.Yu@Sun.COM 
15548348SEric.Yu@Sun.COM 			bcopy(addr, abuf, addrlen);
15558348SEric.Yu@Sun.COM 			msg->msg_name = abuf;
15568348SEric.Yu@Sun.COM 			msg->msg_namelen = addrlen;
15578348SEric.Yu@Sun.COM 		}
15588348SEric.Yu@Sun.COM 
15598348SEric.Yu@Sun.COM 		if (controllen != 0) {
15608348SEric.Yu@Sun.COM 			/*
15618348SEric.Yu@Sun.COM 			 * Return control msg to caller.
15628348SEric.Yu@Sun.COM 			 * Caller handles truncation if length
15638348SEric.Yu@Sun.COM 			 * exceeds msg_controllen.
15648348SEric.Yu@Sun.COM 			 */
15658348SEric.Yu@Sun.COM 			control = kmem_zalloc(controllen, KM_SLEEP);
15668348SEric.Yu@Sun.COM 
15678348SEric.Yu@Sun.COM 			error = so_opt2cmsg(mctlp, opt, optlen,
15688348SEric.Yu@Sun.COM 			    !(flags & MSG_XPG4_2), control, controllen);
15698348SEric.Yu@Sun.COM 			if (error) {
15708348SEric.Yu@Sun.COM 				freemsg(mctlp);
15718348SEric.Yu@Sun.COM 				if (msg->msg_namelen != 0)
15728348SEric.Yu@Sun.COM 					kmem_free(msg->msg_name,
15738348SEric.Yu@Sun.COM 					    msg->msg_namelen);
15748348SEric.Yu@Sun.COM 				kmem_free(control, controllen);
15758348SEric.Yu@Sun.COM 				eprintsoline(so, error);
15768348SEric.Yu@Sun.COM 				goto out;
15778348SEric.Yu@Sun.COM 			}
15788348SEric.Yu@Sun.COM 			msg->msg_control = control;
15798348SEric.Yu@Sun.COM 			msg->msg_controllen = controllen;
15808348SEric.Yu@Sun.COM 		}
15818348SEric.Yu@Sun.COM 
15828348SEric.Yu@Sun.COM 		freemsg(mctlp);
15838348SEric.Yu@Sun.COM 		goto out;
15848348SEric.Yu@Sun.COM 	}
15858348SEric.Yu@Sun.COM 	case T_OPTDATA_IND: {
15868348SEric.Yu@Sun.COM 		struct T_optdata_req *tdr;
15878348SEric.Yu@Sun.COM 		void *opt;
15888348SEric.Yu@Sun.COM 		t_uscalar_t optlen;
15898348SEric.Yu@Sun.COM 
15908348SEric.Yu@Sun.COM 		tdr = (struct T_optdata_req *)mctlp->b_rptr;
15918348SEric.Yu@Sun.COM 		optlen = tdr->OPT_length;
15928348SEric.Yu@Sun.COM 		if (optlen != 0) {
15938348SEric.Yu@Sun.COM 			t_uscalar_t ncontrollen;
15948348SEric.Yu@Sun.COM 			/*
15958348SEric.Yu@Sun.COM 			 * Determine how large cmsg buffer is needed.
15968348SEric.Yu@Sun.COM 			 */
15978348SEric.Yu@Sun.COM 			opt = sogetoff(mctlp,
15988348SEric.Yu@Sun.COM 			    tpr->optdata_ind.OPT_offset, optlen,
15998348SEric.Yu@Sun.COM 			    __TPI_ALIGN_SIZE);
16008348SEric.Yu@Sun.COM 
16018348SEric.Yu@Sun.COM 			if (opt == NULL) {
16028348SEric.Yu@Sun.COM 				freemsg(mctlp);
16038348SEric.Yu@Sun.COM 				error = EPROTO;
16048348SEric.Yu@Sun.COM 				eprintsoline(so, error);
16058348SEric.Yu@Sun.COM 				goto out;
16068348SEric.Yu@Sun.COM 			}
16078348SEric.Yu@Sun.COM 
16088348SEric.Yu@Sun.COM 			ncontrollen = so_cmsglen(mctlp, opt, optlen,
16098348SEric.Yu@Sun.COM 			    !(flags & MSG_XPG4_2));
16108348SEric.Yu@Sun.COM 			if (controllen != 0)
16118348SEric.Yu@Sun.COM 				controllen = ncontrollen;
16128348SEric.Yu@Sun.COM 			else if (ncontrollen != 0)
16138348SEric.Yu@Sun.COM 				msg->msg_flags |= MSG_CTRUNC;
16148348SEric.Yu@Sun.COM 		} else {
16158348SEric.Yu@Sun.COM 			controllen = 0;
16168348SEric.Yu@Sun.COM 		}
16178348SEric.Yu@Sun.COM 
16188348SEric.Yu@Sun.COM 		if (controllen != 0) {
16198348SEric.Yu@Sun.COM 			/*
16208348SEric.Yu@Sun.COM 			 * Return control msg to caller.
16218348SEric.Yu@Sun.COM 			 * Caller handles truncation if length
16228348SEric.Yu@Sun.COM 			 * exceeds msg_controllen.
16238348SEric.Yu@Sun.COM 			 */
16248348SEric.Yu@Sun.COM 			control = kmem_zalloc(controllen, KM_SLEEP);
16258348SEric.Yu@Sun.COM 
16268348SEric.Yu@Sun.COM 			error = so_opt2cmsg(mctlp, opt, optlen,
16278348SEric.Yu@Sun.COM 			    !(flags & MSG_XPG4_2), control, controllen);
16288348SEric.Yu@Sun.COM 			if (error) {
16298348SEric.Yu@Sun.COM 				freemsg(mctlp);
16308348SEric.Yu@Sun.COM 				kmem_free(control, controllen);
16318348SEric.Yu@Sun.COM 				eprintsoline(so, error);
16328348SEric.Yu@Sun.COM 				goto out;
16338348SEric.Yu@Sun.COM 			}
16348348SEric.Yu@Sun.COM 			msg->msg_control = control;
16358348SEric.Yu@Sun.COM 			msg->msg_controllen = controllen;
16368348SEric.Yu@Sun.COM 		}
16378348SEric.Yu@Sun.COM 
16388348SEric.Yu@Sun.COM 		/*
16398348SEric.Yu@Sun.COM 		 * Set msg_flags to MSG_EOR based on
16408348SEric.Yu@Sun.COM 		 * DATA_flag and MOREDATA.
16418348SEric.Yu@Sun.COM 		 */
16428348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
16438348SEric.Yu@Sun.COM 		so->so_state &= ~SS_SAVEDEOR;
16448348SEric.Yu@Sun.COM 		if (!(tpr->data_ind.MORE_flag & 1)) {
16458348SEric.Yu@Sun.COM 			if (!(rval.r_val1 & MOREDATA))
16468348SEric.Yu@Sun.COM 				msg->msg_flags |= MSG_EOR;
16478348SEric.Yu@Sun.COM 			else
16488348SEric.Yu@Sun.COM 				so->so_state |= SS_SAVEDEOR;
16498348SEric.Yu@Sun.COM 		}
16508348SEric.Yu@Sun.COM 		freemsg(mctlp);
16518348SEric.Yu@Sun.COM 		/*
16528348SEric.Yu@Sun.COM 		 * If some data was received (i.e. not EOF) and the
16538348SEric.Yu@Sun.COM 		 * read/recv* has not been satisfied wait for some more.
16548348SEric.Yu@Sun.COM 		 * Not possible to wait if control info was received.
16558348SEric.Yu@Sun.COM 		 */
16568348SEric.Yu@Sun.COM 		if ((flags & MSG_WAITALL) && !(msg->msg_flags & MSG_EOR) &&
16578348SEric.Yu@Sun.COM 		    controllen == 0 &&
16588348SEric.Yu@Sun.COM 		    uiop->uio_resid != saved_resid && uiop->uio_resid > 0) {
16598348SEric.Yu@Sun.COM 			mutex_exit(&so->so_lock);
16608348SEric.Yu@Sun.COM 			goto retry;
16618348SEric.Yu@Sun.COM 		}
16628348SEric.Yu@Sun.COM 		goto out_locked;
16638348SEric.Yu@Sun.COM 	}
16648348SEric.Yu@Sun.COM 	default:
16658348SEric.Yu@Sun.COM 		cmn_err(CE_CONT, "so_recvmsg bad type %x \n",
16668348SEric.Yu@Sun.COM 		    tpr->type);
16678348SEric.Yu@Sun.COM 		freemsg(mctlp);
16688348SEric.Yu@Sun.COM 		error = EPROTO;
16698348SEric.Yu@Sun.COM 		ASSERT(0);
16708348SEric.Yu@Sun.COM 	}
16718348SEric.Yu@Sun.COM out:
16728348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
16738348SEric.Yu@Sun.COM out_locked:
16748348SEric.Yu@Sun.COM 	/* The sod_lockp pointers to the sonode so_lock */
16758348SEric.Yu@Sun.COM 	ret = sod_rcv_done(so, suiop, uiop);
16768348SEric.Yu@Sun.COM 	if (ret != 0 && error == 0)
16778348SEric.Yu@Sun.COM 		error = ret;
16788348SEric.Yu@Sun.COM 
16798348SEric.Yu@Sun.COM 	so_unlock_read(so);	/* Clear SOREADLOCKED */
16808348SEric.Yu@Sun.COM 	mutex_exit(&so->so_lock);
16818348SEric.Yu@Sun.COM 
16828348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
16838348SEric.Yu@Sun.COM 
16848348SEric.Yu@Sun.COM 	return (error);
16858348SEric.Yu@Sun.COM }
16868348SEric.Yu@Sun.COM 
16878348SEric.Yu@Sun.COM sonodeops_t so_sonodeops = {
16888348SEric.Yu@Sun.COM 	so_init,		/* sop_init	*/
16898348SEric.Yu@Sun.COM 	so_accept,		/* sop_accept   */
16908348SEric.Yu@Sun.COM 	so_bind,		/* sop_bind	*/
16918348SEric.Yu@Sun.COM 	so_listen,		/* sop_listen   */
16928348SEric.Yu@Sun.COM 	so_connect,		/* sop_connect  */
16938348SEric.Yu@Sun.COM 	so_recvmsg,		/* sop_recvmsg  */
16948348SEric.Yu@Sun.COM 	so_sendmsg,		/* sop_sendmsg  */
16958348SEric.Yu@Sun.COM 	so_sendmblk,		/* sop_sendmblk */
16968348SEric.Yu@Sun.COM 	so_getpeername,		/* sop_getpeername */
16978348SEric.Yu@Sun.COM 	so_getsockname,		/* sop_getsockname */
16988348SEric.Yu@Sun.COM 	so_shutdown,		/* sop_shutdown */
16998348SEric.Yu@Sun.COM 	so_getsockopt,		/* sop_getsockopt */
17008348SEric.Yu@Sun.COM 	so_setsockopt,		/* sop_setsockopt */
17018348SEric.Yu@Sun.COM 	so_ioctl,		/* sop_ioctl    */
17028348SEric.Yu@Sun.COM 	so_poll,		/* sop_poll	*/
17038348SEric.Yu@Sun.COM 	so_close,		/* sop_close */
17048348SEric.Yu@Sun.COM };
17058348SEric.Yu@Sun.COM 
17068348SEric.Yu@Sun.COM sock_upcalls_t so_upcalls = {
17078348SEric.Yu@Sun.COM 	so_newconn,
17088348SEric.Yu@Sun.COM 	so_connected,
17098348SEric.Yu@Sun.COM 	so_disconnected,
17108348SEric.Yu@Sun.COM 	so_opctl,
17118348SEric.Yu@Sun.COM 	so_queue_msg,
17128348SEric.Yu@Sun.COM 	so_set_prop,
17138348SEric.Yu@Sun.COM 	so_txq_full,
17148348SEric.Yu@Sun.COM 	so_signal_oob,
17158348SEric.Yu@Sun.COM 	so_zcopy_notify,
17168348SEric.Yu@Sun.COM 	so_set_error
17178348SEric.Yu@Sun.COM };
1718