xref: /onnv-gate/usr/src/uts/common/fs/sockfs/sockcommon_sops.c (revision 8575:586f608c7ab7)
18348SEric.Yu@Sun.COM /*
28348SEric.Yu@Sun.COM  * CDDL HEADER START
38348SEric.Yu@Sun.COM  *
48348SEric.Yu@Sun.COM  * The contents of this file are subject to the terms of the
58348SEric.Yu@Sun.COM  * Common Development and Distribution License (the "License").
68348SEric.Yu@Sun.COM  * You may not use this file except in compliance with the License.
78348SEric.Yu@Sun.COM  *
88348SEric.Yu@Sun.COM  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
98348SEric.Yu@Sun.COM  * or http://www.opensolaris.org/os/licensing.
108348SEric.Yu@Sun.COM  * See the License for the specific language governing permissions
118348SEric.Yu@Sun.COM  * and limitations under the License.
128348SEric.Yu@Sun.COM  *
138348SEric.Yu@Sun.COM  * When distributing Covered Code, include this CDDL HEADER in each
148348SEric.Yu@Sun.COM  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
158348SEric.Yu@Sun.COM  * If applicable, add the following below this CDDL HEADER, with the
168348SEric.Yu@Sun.COM  * fields enclosed by brackets "[]" replaced with your own identifying
178348SEric.Yu@Sun.COM  * information: Portions Copyright [yyyy] [name of copyright owner]
188348SEric.Yu@Sun.COM  *
198348SEric.Yu@Sun.COM  * CDDL HEADER END
208348SEric.Yu@Sun.COM  */
218348SEric.Yu@Sun.COM 
228348SEric.Yu@Sun.COM /*
238489Sshenjian  * Copyright 2009 Sun Microsystems, Inc.  All rights reserved.
248348SEric.Yu@Sun.COM  * Use is subject to license terms.
258348SEric.Yu@Sun.COM  */
268348SEric.Yu@Sun.COM 
278348SEric.Yu@Sun.COM #pragma ident	"@(#)sockcommon_sops.c	1.1	07/06/14 SMI"
288348SEric.Yu@Sun.COM 
298348SEric.Yu@Sun.COM #include <sys/types.h>
308348SEric.Yu@Sun.COM #include <sys/param.h>
318348SEric.Yu@Sun.COM #include <sys/systm.h>
328348SEric.Yu@Sun.COM #include <sys/sysmacros.h>
338348SEric.Yu@Sun.COM #include <sys/debug.h>
348348SEric.Yu@Sun.COM #include <sys/cmn_err.h>
358348SEric.Yu@Sun.COM 
368348SEric.Yu@Sun.COM #include <sys/stropts.h>
378348SEric.Yu@Sun.COM #include <sys/socket.h>
388348SEric.Yu@Sun.COM #include <sys/socketvar.h>
398348SEric.Yu@Sun.COM 
408348SEric.Yu@Sun.COM #define	_SUN_TPI_VERSION	2
418348SEric.Yu@Sun.COM #include <sys/tihdr.h>
428348SEric.Yu@Sun.COM #include <sys/sockio.h>
438348SEric.Yu@Sun.COM #include <sys/sodirect.h>
448348SEric.Yu@Sun.COM #include <sys/kmem_impl.h>
458348SEric.Yu@Sun.COM 
468348SEric.Yu@Sun.COM #include <sys/strsubr.h>
478348SEric.Yu@Sun.COM #include <sys/strsun.h>
488348SEric.Yu@Sun.COM #include <sys/ddi.h>
498348SEric.Yu@Sun.COM #include <netinet/in.h>
508348SEric.Yu@Sun.COM #include <inet/ip.h>
518348SEric.Yu@Sun.COM 
528348SEric.Yu@Sun.COM #include <fs/sockfs/sockcommon.h>
538348SEric.Yu@Sun.COM 
548348SEric.Yu@Sun.COM #include <sys/socket_proto.h>
558348SEric.Yu@Sun.COM 
568348SEric.Yu@Sun.COM #include <fs/sockfs/socktpi_impl.h>
578348SEric.Yu@Sun.COM #include <sys/tihdr.h>
588348SEric.Yu@Sun.COM #include <fs/sockfs/nl7c.h>
598348SEric.Yu@Sun.COM #include <inet/kssl/ksslapi.h>
608348SEric.Yu@Sun.COM 
618348SEric.Yu@Sun.COM 
628348SEric.Yu@Sun.COM extern int xnet_skip_checks;
638348SEric.Yu@Sun.COM extern int xnet_check_print;
648348SEric.Yu@Sun.COM 
658348SEric.Yu@Sun.COM static void so_queue_oob(sock_upper_handle_t, mblk_t *, size_t);
668348SEric.Yu@Sun.COM 
678348SEric.Yu@Sun.COM 
688348SEric.Yu@Sun.COM /*ARGSUSED*/
698348SEric.Yu@Sun.COM int
708348SEric.Yu@Sun.COM so_accept_notsupp(struct sonode *lso, int fflag,
718348SEric.Yu@Sun.COM     struct cred *cr, struct sonode **nsop)
728348SEric.Yu@Sun.COM {
738348SEric.Yu@Sun.COM 	return (EOPNOTSUPP);
748348SEric.Yu@Sun.COM }
758348SEric.Yu@Sun.COM 
768348SEric.Yu@Sun.COM /*ARGSUSED*/
778348SEric.Yu@Sun.COM int
788348SEric.Yu@Sun.COM so_listen_notsupp(struct sonode *so, int backlog, struct cred *cr)
798348SEric.Yu@Sun.COM {
808348SEric.Yu@Sun.COM 	return (EOPNOTSUPP);
818348SEric.Yu@Sun.COM }
828348SEric.Yu@Sun.COM 
838348SEric.Yu@Sun.COM /*ARGSUSED*/
848348SEric.Yu@Sun.COM int
858348SEric.Yu@Sun.COM so_getsockname_notsupp(struct sonode *so, struct sockaddr *sa,
868348SEric.Yu@Sun.COM     socklen_t *len, struct cred *cr)
878348SEric.Yu@Sun.COM {
888348SEric.Yu@Sun.COM 	return (EOPNOTSUPP);
898348SEric.Yu@Sun.COM }
908348SEric.Yu@Sun.COM 
918348SEric.Yu@Sun.COM /*ARGSUSED*/
928348SEric.Yu@Sun.COM int
938348SEric.Yu@Sun.COM so_getpeername_notsupp(struct sonode *so, struct sockaddr *addr,
948348SEric.Yu@Sun.COM     socklen_t *addrlen, boolean_t accept, struct cred *cr)
958348SEric.Yu@Sun.COM {
968348SEric.Yu@Sun.COM 	return (EOPNOTSUPP);
978348SEric.Yu@Sun.COM }
988348SEric.Yu@Sun.COM 
998348SEric.Yu@Sun.COM /*ARGSUSED*/
1008348SEric.Yu@Sun.COM int
1018348SEric.Yu@Sun.COM so_shutdown_notsupp(struct sonode *so, int how, struct cred *cr)
1028348SEric.Yu@Sun.COM {
1038348SEric.Yu@Sun.COM 	return (EOPNOTSUPP);
1048348SEric.Yu@Sun.COM }
1058348SEric.Yu@Sun.COM 
1068348SEric.Yu@Sun.COM /*ARGSUSED*/
1078348SEric.Yu@Sun.COM int
1088348SEric.Yu@Sun.COM so_sendmblk_notsupp(struct sonode *so, struct msghdr *msg, int fflag,
1098348SEric.Yu@Sun.COM     struct cred *cr, mblk_t **mpp)
1108348SEric.Yu@Sun.COM {
1118348SEric.Yu@Sun.COM 	return (EOPNOTSUPP);
1128348SEric.Yu@Sun.COM }
1138348SEric.Yu@Sun.COM 
1148348SEric.Yu@Sun.COM /*
1158348SEric.Yu@Sun.COM  * Generic Socket Ops
1168348SEric.Yu@Sun.COM  */
1178348SEric.Yu@Sun.COM 
/*
 * Generic socket initialization. All of the work is delegated to
 * socket_init_common(); note that it takes flags before cr, i.e. in the
 * opposite order from this function's own parameter list.
 *
 * Returns whatever socket_init_common() returns.
 */
/* ARGSUSED */
int
so_init(struct sonode *so, struct sonode *pso, struct cred *cr, int flags)
{
	int rval;

	rval = socket_init_common(so, pso, flags, cr);
	return (rval);
}
1248348SEric.Yu@Sun.COM 
1258348SEric.Yu@Sun.COM int
1268348SEric.Yu@Sun.COM so_bind(struct sonode *so, struct sockaddr *name, socklen_t namelen,
1278348SEric.Yu@Sun.COM     int flags, struct cred *cr)
1288348SEric.Yu@Sun.COM {
1298348SEric.Yu@Sun.COM 	int error;
1308348SEric.Yu@Sun.COM 
1318348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_BIND(so, name, namelen, flags, cr));
1328348SEric.Yu@Sun.COM 
1338348SEric.Yu@Sun.COM 	ASSERT(flags == _SOBIND_XPG4_2 || flags == _SOBIND_SOCKBSD);
1348348SEric.Yu@Sun.COM 
1358348SEric.Yu@Sun.COM 	/* X/Open requires this check */
1368348SEric.Yu@Sun.COM 	if ((so->so_state & SS_CANTSENDMORE) && !xnet_skip_checks) {
1378348SEric.Yu@Sun.COM 		if (xnet_check_print) {
1388348SEric.Yu@Sun.COM 			printf("sockfs: X/Open bind state check "
1398348SEric.Yu@Sun.COM 			    "caused EINVAL\n");
1408348SEric.Yu@Sun.COM 		}
1418348SEric.Yu@Sun.COM 		error = EINVAL;
1428348SEric.Yu@Sun.COM 		goto done;
1438348SEric.Yu@Sun.COM 	}
1448348SEric.Yu@Sun.COM 
1458348SEric.Yu@Sun.COM 	/*
1468348SEric.Yu@Sun.COM 	 * a bind to a NULL address is interpreted as unbind. So just
1478348SEric.Yu@Sun.COM 	 * do the downcall.
1488348SEric.Yu@Sun.COM 	 */
1498348SEric.Yu@Sun.COM 	if (name == NULL)
1508348SEric.Yu@Sun.COM 		goto dobind;
1518348SEric.Yu@Sun.COM 
1528348SEric.Yu@Sun.COM 	switch (so->so_family) {
1538348SEric.Yu@Sun.COM 	case AF_INET:
1548348SEric.Yu@Sun.COM 		if ((size_t)namelen != sizeof (sin_t)) {
1558348SEric.Yu@Sun.COM 			error = name->sa_family != so->so_family ?
1568348SEric.Yu@Sun.COM 			    EAFNOSUPPORT : EINVAL;
1578348SEric.Yu@Sun.COM 			eprintsoline(so, error);
1588348SEric.Yu@Sun.COM 			goto done;
1598348SEric.Yu@Sun.COM 		}
1608348SEric.Yu@Sun.COM 
1618348SEric.Yu@Sun.COM 		if ((flags & _SOBIND_XPG4_2) &&
1628348SEric.Yu@Sun.COM 		    (name->sa_family != so->so_family)) {
1638348SEric.Yu@Sun.COM 			/*
1648348SEric.Yu@Sun.COM 			 * This check has to be made for X/Open
1658348SEric.Yu@Sun.COM 			 * sockets however application failures have
1668348SEric.Yu@Sun.COM 			 * been observed when it is applied to
1678348SEric.Yu@Sun.COM 			 * all sockets.
1688348SEric.Yu@Sun.COM 			 */
1698348SEric.Yu@Sun.COM 			error = EAFNOSUPPORT;
1708348SEric.Yu@Sun.COM 			eprintsoline(so, error);
1718348SEric.Yu@Sun.COM 			goto done;
1728348SEric.Yu@Sun.COM 		}
1738348SEric.Yu@Sun.COM 		/*
1748348SEric.Yu@Sun.COM 		 * Force a zero sa_family to match so_family.
1758348SEric.Yu@Sun.COM 		 *
1768348SEric.Yu@Sun.COM 		 * Some programs like inetd(1M) don't set the
1778348SEric.Yu@Sun.COM 		 * family field. Other programs leave
1788348SEric.Yu@Sun.COM 		 * sin_family set to garbage - SunOS 4.X does
1798348SEric.Yu@Sun.COM 		 * not check the family field on a bind.
1808348SEric.Yu@Sun.COM 		 * We use the family field that
1818348SEric.Yu@Sun.COM 		 * was passed in to the socket() call.
1828348SEric.Yu@Sun.COM 		 */
1838348SEric.Yu@Sun.COM 		name->sa_family = so->so_family;
1848348SEric.Yu@Sun.COM 		break;
1858348SEric.Yu@Sun.COM 
1868348SEric.Yu@Sun.COM 	case AF_INET6: {
1878348SEric.Yu@Sun.COM #ifdef DEBUG
1888348SEric.Yu@Sun.COM 		sin6_t *sin6 = (sin6_t *)name;
1898348SEric.Yu@Sun.COM #endif
1908348SEric.Yu@Sun.COM 		if ((size_t)namelen != sizeof (sin6_t)) {
1918348SEric.Yu@Sun.COM 			error = name->sa_family != so->so_family ?
1928348SEric.Yu@Sun.COM 			    EAFNOSUPPORT : EINVAL;
1938348SEric.Yu@Sun.COM 			eprintsoline(so, error);
1948348SEric.Yu@Sun.COM 			goto done;
1958348SEric.Yu@Sun.COM 		}
1968348SEric.Yu@Sun.COM 
1978348SEric.Yu@Sun.COM 		if (name->sa_family != so->so_family) {
1988348SEric.Yu@Sun.COM 			/*
1998348SEric.Yu@Sun.COM 			 * With IPv6 we require the family to match
2008348SEric.Yu@Sun.COM 			 * unlike in IPv4.
2018348SEric.Yu@Sun.COM 			 */
2028348SEric.Yu@Sun.COM 			error = EAFNOSUPPORT;
2038348SEric.Yu@Sun.COM 			eprintsoline(so, error);
2048348SEric.Yu@Sun.COM 			goto done;
2058348SEric.Yu@Sun.COM 		}
2068348SEric.Yu@Sun.COM #ifdef DEBUG
2078348SEric.Yu@Sun.COM 		/*
2088348SEric.Yu@Sun.COM 		 * Verify that apps don't forget to clear
2098348SEric.Yu@Sun.COM 		 * sin6_scope_id etc
2108348SEric.Yu@Sun.COM 		 */
2118348SEric.Yu@Sun.COM 		if (sin6->sin6_scope_id != 0 &&
2128348SEric.Yu@Sun.COM 		    !IN6_IS_ADDR_LINKSCOPE(&sin6->sin6_addr)) {
2138348SEric.Yu@Sun.COM 			zcmn_err(getzoneid(), CE_WARN,
2148348SEric.Yu@Sun.COM 			    "bind with uninitialized sin6_scope_id "
2158348SEric.Yu@Sun.COM 			    "(%d) on socket. Pid = %d\n",
2168348SEric.Yu@Sun.COM 			    (int)sin6->sin6_scope_id,
2178348SEric.Yu@Sun.COM 			    (int)curproc->p_pid);
2188348SEric.Yu@Sun.COM 		}
2198348SEric.Yu@Sun.COM 		if (sin6->__sin6_src_id != 0) {
2208348SEric.Yu@Sun.COM 			zcmn_err(getzoneid(), CE_WARN,
2218348SEric.Yu@Sun.COM 			    "bind with uninitialized __sin6_src_id "
2228348SEric.Yu@Sun.COM 			    "(%d) on socket. Pid = %d\n",
2238348SEric.Yu@Sun.COM 			    (int)sin6->__sin6_src_id,
2248348SEric.Yu@Sun.COM 			    (int)curproc->p_pid);
2258348SEric.Yu@Sun.COM 		}
2268348SEric.Yu@Sun.COM #endif /* DEBUG */
2278348SEric.Yu@Sun.COM 
2288348SEric.Yu@Sun.COM 		break;
2298348SEric.Yu@Sun.COM 	}
2308348SEric.Yu@Sun.COM 	default:
2318348SEric.Yu@Sun.COM 		/* Just pass the request to the protocol */
2328348SEric.Yu@Sun.COM 		goto dobind;
2338348SEric.Yu@Sun.COM 	}
2348348SEric.Yu@Sun.COM 
2358348SEric.Yu@Sun.COM 	/*
2368348SEric.Yu@Sun.COM 	 * First we check if either NCA or KSSL has been enabled for
2378348SEric.Yu@Sun.COM 	 * the requested address, and if so, we fall back to TPI.
2388348SEric.Yu@Sun.COM 	 * If neither of those two services are enabled, then we just
2398348SEric.Yu@Sun.COM 	 * pass the request to the protocol.
2408348SEric.Yu@Sun.COM 	 *
2418348SEric.Yu@Sun.COM 	 * Note that KSSL can only be enabled on a socket if NCA is NOT
2428348SEric.Yu@Sun.COM 	 * enabled for that socket, hence the else-statement below.
2438348SEric.Yu@Sun.COM 	 */
2448348SEric.Yu@Sun.COM 	if (nl7c_enabled && ((so->so_family == AF_INET ||
2458348SEric.Yu@Sun.COM 	    so->so_family == AF_INET6) &&
2468348SEric.Yu@Sun.COM 	    nl7c_lookup_addr(name, namelen) != NULL)) {
2478348SEric.Yu@Sun.COM 		/*
2488348SEric.Yu@Sun.COM 		 * NL7C is not supported in non-global zones,
2498348SEric.Yu@Sun.COM 		 * we enforce this restriction here.
2508348SEric.Yu@Sun.COM 		 */
2518348SEric.Yu@Sun.COM 		if (so->so_zoneid == GLOBAL_ZONEID) {
2528348SEric.Yu@Sun.COM 			/* NCA should be used, so fall back to TPI */
2538348SEric.Yu@Sun.COM 			error = so_tpi_fallback(so, cr);
2548348SEric.Yu@Sun.COM 			SO_UNBLOCK_FALLBACK(so);
2558348SEric.Yu@Sun.COM 			if (error)
2568348SEric.Yu@Sun.COM 				return (error);
2578348SEric.Yu@Sun.COM 			else
2588348SEric.Yu@Sun.COM 				return (SOP_BIND(so, name, namelen, flags, cr));
2598348SEric.Yu@Sun.COM 		}
2608348SEric.Yu@Sun.COM 	} else if (so->so_type == SOCK_STREAM) {
2618348SEric.Yu@Sun.COM 		/* Check if KSSL has been configured for this address */
2628348SEric.Yu@Sun.COM 		kssl_ent_t ent;
2638348SEric.Yu@Sun.COM 		kssl_endpt_type_t type;
2648348SEric.Yu@Sun.COM 		struct T_bind_req bind_req;
2658348SEric.Yu@Sun.COM 		mblk_t *mp;
2668348SEric.Yu@Sun.COM 
2678348SEric.Yu@Sun.COM 		/*
2688348SEric.Yu@Sun.COM 		 * TODO: Check with KSSL team if we could add a function call
2698348SEric.Yu@Sun.COM 		 * that only queries whether KSSL is enabled for the given
2708348SEric.Yu@Sun.COM 		 * address.
2718348SEric.Yu@Sun.COM 		 */
2728348SEric.Yu@Sun.COM 		bind_req.PRIM_type = T_BIND_REQ;
2738348SEric.Yu@Sun.COM 		bind_req.ADDR_length = namelen;
2748348SEric.Yu@Sun.COM 		bind_req.ADDR_offset = (t_scalar_t)sizeof (bind_req);
2758348SEric.Yu@Sun.COM 		mp = soallocproto2(&bind_req, sizeof (bind_req),
2768348SEric.Yu@Sun.COM 		    name, namelen, 0, _ALLOC_SLEEP);
2778348SEric.Yu@Sun.COM 
2788348SEric.Yu@Sun.COM 		type = kssl_check_proxy(mp, so, &ent);
2798348SEric.Yu@Sun.COM 		freemsg(mp);
2808348SEric.Yu@Sun.COM 
2818348SEric.Yu@Sun.COM 		if (type != KSSL_NO_PROXY) {
2828348SEric.Yu@Sun.COM 			/*
2838348SEric.Yu@Sun.COM 			 * KSSL has been configured for this address, so
2848348SEric.Yu@Sun.COM 			 * we must fall back to TPI.
2858348SEric.Yu@Sun.COM 			 */
2868348SEric.Yu@Sun.COM 			kssl_release_ent(ent, so, type);
2878348SEric.Yu@Sun.COM 			error = so_tpi_fallback(so, cr);
2888348SEric.Yu@Sun.COM 			SO_UNBLOCK_FALLBACK(so);
2898348SEric.Yu@Sun.COM 			if (error)
2908348SEric.Yu@Sun.COM 				return (error);
2918348SEric.Yu@Sun.COM 			else
2928348SEric.Yu@Sun.COM 				return (SOP_BIND(so, name, namelen, flags, cr));
2938348SEric.Yu@Sun.COM 		}
2948348SEric.Yu@Sun.COM 	}
2958348SEric.Yu@Sun.COM 
2968348SEric.Yu@Sun.COM dobind:
2978348SEric.Yu@Sun.COM 	error = (*so->so_downcalls->sd_bind)
2988348SEric.Yu@Sun.COM 	    (so->so_proto_handle, name, namelen, cr);
2998348SEric.Yu@Sun.COM done:
3008348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
3018348SEric.Yu@Sun.COM 
3028348SEric.Yu@Sun.COM 	return (error);
3038348SEric.Yu@Sun.COM }
3048348SEric.Yu@Sun.COM 
3058348SEric.Yu@Sun.COM int
3068348SEric.Yu@Sun.COM so_listen(struct sonode *so, int backlog, struct cred *cr)
3078348SEric.Yu@Sun.COM {
3088348SEric.Yu@Sun.COM 	int	error = 0;
3098348SEric.Yu@Sun.COM 
3108348SEric.Yu@Sun.COM 	ASSERT(MUTEX_NOT_HELD(&so->so_lock));
3118348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_LISTEN(so, backlog, cr));
3128348SEric.Yu@Sun.COM 
3138348SEric.Yu@Sun.COM 	error = (*so->so_downcalls->sd_listen)(so->so_proto_handle, backlog,
3148348SEric.Yu@Sun.COM 	    cr);
3158348SEric.Yu@Sun.COM 
3168348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
3178348SEric.Yu@Sun.COM 
3188348SEric.Yu@Sun.COM 	return (error);
3198348SEric.Yu@Sun.COM }
3208348SEric.Yu@Sun.COM 
3218348SEric.Yu@Sun.COM 
3228348SEric.Yu@Sun.COM int
3238348SEric.Yu@Sun.COM so_connect(struct sonode *so, const struct sockaddr *name,
3248348SEric.Yu@Sun.COM     socklen_t namelen, int fflag, int flags, struct cred *cr)
3258348SEric.Yu@Sun.COM {
3268348SEric.Yu@Sun.COM 	int error = 0;
3278348SEric.Yu@Sun.COM 	sock_connid_t id;
3288348SEric.Yu@Sun.COM 
3298348SEric.Yu@Sun.COM 	ASSERT(MUTEX_NOT_HELD(&so->so_lock));
3308348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_CONNECT(so, name, namelen, fflag, flags, cr));
3318348SEric.Yu@Sun.COM 
3328348SEric.Yu@Sun.COM 	/*
3338348SEric.Yu@Sun.COM 	 * If there is a pending error, return error
3348348SEric.Yu@Sun.COM 	 * This can happen if a non blocking operation caused an error.
3358348SEric.Yu@Sun.COM 	 */
3368348SEric.Yu@Sun.COM 
3378348SEric.Yu@Sun.COM 	if (so->so_error != 0) {
3388348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
3398348SEric.Yu@Sun.COM 		error = sogeterr(so, B_TRUE);
3408348SEric.Yu@Sun.COM 		mutex_exit(&so->so_lock);
3418348SEric.Yu@Sun.COM 		if (error != 0)
3428348SEric.Yu@Sun.COM 			goto done;
3438348SEric.Yu@Sun.COM 	}
3448348SEric.Yu@Sun.COM 
3458348SEric.Yu@Sun.COM 	error = (*so->so_downcalls->sd_connect)(so->so_proto_handle,
3468348SEric.Yu@Sun.COM 	    name, namelen, &id, cr);
3478348SEric.Yu@Sun.COM 
3488348SEric.Yu@Sun.COM 	if (error == EINPROGRESS)
3498348SEric.Yu@Sun.COM 		error = so_wait_connected(so, fflag & (FNONBLOCK|FNDELAY), id);
3508348SEric.Yu@Sun.COM 
3518348SEric.Yu@Sun.COM done:
3528348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
3538348SEric.Yu@Sun.COM 	return (error);
3548348SEric.Yu@Sun.COM }
3558348SEric.Yu@Sun.COM 
3568348SEric.Yu@Sun.COM /*ARGSUSED*/
3578348SEric.Yu@Sun.COM int
3588348SEric.Yu@Sun.COM so_accept(struct sonode *so, int fflag, struct cred *cr, struct sonode **nsop)
3598348SEric.Yu@Sun.COM {
3608348SEric.Yu@Sun.COM 	int error = 0;
3618348SEric.Yu@Sun.COM 	struct sonode *nso;
3628348SEric.Yu@Sun.COM 
3638348SEric.Yu@Sun.COM 	*nsop = NULL;
3648348SEric.Yu@Sun.COM 
3658348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_ACCEPT(so, fflag, cr, nsop));
3668348SEric.Yu@Sun.COM 	if ((so->so_state & SS_ACCEPTCONN) == 0) {
3678348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
3688348SEric.Yu@Sun.COM 		return ((so->so_type == SOCK_DGRAM || so->so_type == SOCK_RAW) ?
3698348SEric.Yu@Sun.COM 		    EOPNOTSUPP : EINVAL);
3708348SEric.Yu@Sun.COM 	}
3718348SEric.Yu@Sun.COM 
3728348SEric.Yu@Sun.COM 	if ((error = so_acceptq_dequeue(so, (fflag & (FNONBLOCK|FNDELAY)),
3738348SEric.Yu@Sun.COM 	    &nso)) == 0) {
3748348SEric.Yu@Sun.COM 		ASSERT(nso != NULL);
3758348SEric.Yu@Sun.COM 
3768348SEric.Yu@Sun.COM 		/* finish the accept */
3778348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_accept)(so->so_proto_handle,
3788348SEric.Yu@Sun.COM 		    nso->so_proto_handle, (sock_upper_handle_t)nso, cr);
3798348SEric.Yu@Sun.COM 		if (error != 0) {
3808348SEric.Yu@Sun.COM 			(void) socket_close(nso, 0, cr);
3818348SEric.Yu@Sun.COM 			socket_destroy(nso);
3828348SEric.Yu@Sun.COM 		} else {
3838348SEric.Yu@Sun.COM 			*nsop = nso;
3848348SEric.Yu@Sun.COM 		}
3858348SEric.Yu@Sun.COM 	}
3868348SEric.Yu@Sun.COM 
3878348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
3888348SEric.Yu@Sun.COM 	return (error);
3898348SEric.Yu@Sun.COM }
3908348SEric.Yu@Sun.COM 
3918348SEric.Yu@Sun.COM int
3928348SEric.Yu@Sun.COM so_sendmsg(struct sonode *so, struct nmsghdr *msg, struct uio *uiop,
3938348SEric.Yu@Sun.COM     struct cred *cr)
3948348SEric.Yu@Sun.COM {
3958348SEric.Yu@Sun.COM 	int error, flags;
3968348SEric.Yu@Sun.COM 	boolean_t dontblock;
3978348SEric.Yu@Sun.COM 	ssize_t orig_resid;
3988348SEric.Yu@Sun.COM 	mblk_t  *mp;
3998348SEric.Yu@Sun.COM 
4008348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_SENDMSG(so, msg, uiop, cr));
4018348SEric.Yu@Sun.COM 
4028348SEric.Yu@Sun.COM 	flags = msg->msg_flags;
4038348SEric.Yu@Sun.COM 	error = 0;
4048348SEric.Yu@Sun.COM 	dontblock = (flags & MSG_DONTWAIT) ||
4058348SEric.Yu@Sun.COM 	    (uiop->uio_fmode & (FNONBLOCK|FNDELAY));
4068348SEric.Yu@Sun.COM 
4078348SEric.Yu@Sun.COM 	if (!(flags & MSG_XPG4_2) && msg->msg_controllen != 0) {
4088348SEric.Yu@Sun.COM 		/*
4098348SEric.Yu@Sun.COM 		 * Old way of passing fd's is not supported
4108348SEric.Yu@Sun.COM 		 */
4118348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
4128348SEric.Yu@Sun.COM 		return (EOPNOTSUPP);
4138348SEric.Yu@Sun.COM 	}
4148348SEric.Yu@Sun.COM 
4158348SEric.Yu@Sun.COM 	if ((so->so_mode & SM_ATOMIC) &&
4168348SEric.Yu@Sun.COM 	    uiop->uio_resid > so->so_proto_props.sopp_maxpsz &&
4178348SEric.Yu@Sun.COM 	    so->so_proto_props.sopp_maxpsz != -1) {
4188348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
4198348SEric.Yu@Sun.COM 		return (EMSGSIZE);
4208348SEric.Yu@Sun.COM 	}
4218348SEric.Yu@Sun.COM 
4228348SEric.Yu@Sun.COM 	/*
4238348SEric.Yu@Sun.COM 	 * For atomic sends we will only do one iteration.
4248348SEric.Yu@Sun.COM 	 */
4258348SEric.Yu@Sun.COM 	do {
4268348SEric.Yu@Sun.COM 		if (so->so_state & SS_CANTSENDMORE) {
4278348SEric.Yu@Sun.COM 			error = EPIPE;
4288348SEric.Yu@Sun.COM 			break;
4298348SEric.Yu@Sun.COM 		}
4308348SEric.Yu@Sun.COM 
4318348SEric.Yu@Sun.COM 		if (so->so_error != 0) {
4328348SEric.Yu@Sun.COM 			mutex_enter(&so->so_lock);
4338348SEric.Yu@Sun.COM 			error = sogeterr(so, B_TRUE);
4348348SEric.Yu@Sun.COM 			mutex_exit(&so->so_lock);
4358348SEric.Yu@Sun.COM 			if (error != 0)
4368348SEric.Yu@Sun.COM 				break;
4378348SEric.Yu@Sun.COM 		}
4388348SEric.Yu@Sun.COM 
4398348SEric.Yu@Sun.COM 		/*
4408348SEric.Yu@Sun.COM 		 * Send down OOB messages even if the send path is being
4418348SEric.Yu@Sun.COM 		 * flow controlled (assuming the protocol supports OOB data).
4428348SEric.Yu@Sun.COM 		 */
4438348SEric.Yu@Sun.COM 		if (flags & MSG_OOB) {
4448348SEric.Yu@Sun.COM 			if ((so->so_mode & SM_EXDATA) == 0) {
4458348SEric.Yu@Sun.COM 				error = EOPNOTSUPP;
4468348SEric.Yu@Sun.COM 				break;
4478348SEric.Yu@Sun.COM 			}
4488348SEric.Yu@Sun.COM 		} else if (so->so_snd_qfull) {
4498348SEric.Yu@Sun.COM 			/*
4508348SEric.Yu@Sun.COM 			 * Need to wait until the protocol is ready to receive
4518348SEric.Yu@Sun.COM 			 * more data for transmission.
4528348SEric.Yu@Sun.COM 			 */
4538348SEric.Yu@Sun.COM 			if ((error = so_snd_wait_qnotfull(so, dontblock)) != 0)
4548348SEric.Yu@Sun.COM 				break;
4558348SEric.Yu@Sun.COM 		}
4568348SEric.Yu@Sun.COM 
4578348SEric.Yu@Sun.COM 		/*
4588348SEric.Yu@Sun.COM 		 * Time to send data to the protocol. We either copy the
4598348SEric.Yu@Sun.COM 		 * data into mblks or pass the uio directly to the protocol.
4608348SEric.Yu@Sun.COM 		 * We decide what to do based on the available down calls.
4618348SEric.Yu@Sun.COM 		 */
4628348SEric.Yu@Sun.COM 		if (so->so_downcalls->sd_send_uio != NULL) {
4638348SEric.Yu@Sun.COM 			error = (*so->so_downcalls->sd_send_uio)
4648348SEric.Yu@Sun.COM 			    (so->so_proto_handle, uiop, msg, cr);
4658348SEric.Yu@Sun.COM 			if (error != 0)
4668348SEric.Yu@Sun.COM 				break;
4678348SEric.Yu@Sun.COM 		} else {
4688348SEric.Yu@Sun.COM 			/* save the resid in case of failure */
4698348SEric.Yu@Sun.COM 			orig_resid = uiop->uio_resid;
4708348SEric.Yu@Sun.COM 
4718348SEric.Yu@Sun.COM 			if ((mp = socopyinuio(uiop,
4728348SEric.Yu@Sun.COM 			    so->so_proto_props.sopp_maxpsz,
4738348SEric.Yu@Sun.COM 			    so->so_proto_props.sopp_wroff,
4748348SEric.Yu@Sun.COM 			    so->so_proto_props.sopp_maxblk,
4758348SEric.Yu@Sun.COM 			    so->so_proto_props.sopp_tail, &error)) == NULL) {
4768348SEric.Yu@Sun.COM 				break;
4778348SEric.Yu@Sun.COM 			}
4788348SEric.Yu@Sun.COM 			ASSERT(uiop->uio_resid >= 0);
4798348SEric.Yu@Sun.COM 
4808348SEric.Yu@Sun.COM 			error = (*so->so_downcalls->sd_send)
4818348SEric.Yu@Sun.COM 			    (so->so_proto_handle, mp, msg, cr);
4828348SEric.Yu@Sun.COM 			if (error != 0) {
4838348SEric.Yu@Sun.COM 				/*
4848348SEric.Yu@Sun.COM 				 * The send failed. We do not have to free the
4858348SEric.Yu@Sun.COM 				 * mblks, because that is the protocol's
4868348SEric.Yu@Sun.COM 				 * responsibility. However, uio_resid must
4878348SEric.Yu@Sun.COM 				 * remain accurate, so adjust that here.
4888348SEric.Yu@Sun.COM 				 */
4898348SEric.Yu@Sun.COM 				uiop->uio_resid = orig_resid;
4908348SEric.Yu@Sun.COM 					break;
4918348SEric.Yu@Sun.COM 			}
4928348SEric.Yu@Sun.COM 		}
4938348SEric.Yu@Sun.COM 	} while (uiop->uio_resid > 0);
4948348SEric.Yu@Sun.COM 
4958348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
4968348SEric.Yu@Sun.COM 
4978348SEric.Yu@Sun.COM 	return (error);
4988348SEric.Yu@Sun.COM }
4998348SEric.Yu@Sun.COM 
5008348SEric.Yu@Sun.COM int
5018348SEric.Yu@Sun.COM so_sendmblk(struct sonode *so, struct nmsghdr *msg, int fflag,
5028348SEric.Yu@Sun.COM     struct cred *cr, mblk_t **mpp)
5038348SEric.Yu@Sun.COM {
5048348SEric.Yu@Sun.COM 	int error;
5058348SEric.Yu@Sun.COM 	boolean_t dontblock;
5068348SEric.Yu@Sun.COM 	size_t size;
5078348SEric.Yu@Sun.COM 	mblk_t *mp = *mpp;
5088348SEric.Yu@Sun.COM 
5098348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_SENDMBLK(so, msg, fflag, cr, mpp));
5108348SEric.Yu@Sun.COM 
5118348SEric.Yu@Sun.COM 	error = 0;
5128348SEric.Yu@Sun.COM 	dontblock = (msg->msg_flags & MSG_DONTWAIT) ||
5138348SEric.Yu@Sun.COM 	    (fflag & (FNONBLOCK|FNDELAY));
5148348SEric.Yu@Sun.COM 	size = msgdsize(mp);
5158348SEric.Yu@Sun.COM 
5168401SAnders.Persson@Sun.COM 	if ((so->so_mode & SM_SENDFILESUPP) == 0 ||
5178401SAnders.Persson@Sun.COM 	    so->so_downcalls->sd_send == NULL) {
5188348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
5198348SEric.Yu@Sun.COM 		return (EOPNOTSUPP);
5208348SEric.Yu@Sun.COM 	}
5218348SEric.Yu@Sun.COM 
5228348SEric.Yu@Sun.COM 	if ((so->so_mode & SM_ATOMIC) &&
5238348SEric.Yu@Sun.COM 	    size > so->so_proto_props.sopp_maxpsz &&
5248348SEric.Yu@Sun.COM 	    so->so_proto_props.sopp_maxpsz != -1) {
5258348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
5268348SEric.Yu@Sun.COM 		return (EMSGSIZE);
5278348SEric.Yu@Sun.COM 	}
5288348SEric.Yu@Sun.COM 
5298348SEric.Yu@Sun.COM 	while (mp != NULL) {
5308348SEric.Yu@Sun.COM 		mblk_t *nmp, *last_mblk;
5318348SEric.Yu@Sun.COM 		size_t mlen;
5328348SEric.Yu@Sun.COM 
5338348SEric.Yu@Sun.COM 		if (so->so_state & SS_CANTSENDMORE) {
5348348SEric.Yu@Sun.COM 			error = EPIPE;
5358348SEric.Yu@Sun.COM 			break;
5368348SEric.Yu@Sun.COM 		}
5378348SEric.Yu@Sun.COM 		if (so->so_error != 0) {
5388348SEric.Yu@Sun.COM 			mutex_enter(&so->so_lock);
5398348SEric.Yu@Sun.COM 			error = sogeterr(so, B_TRUE);
5408348SEric.Yu@Sun.COM 			mutex_exit(&so->so_lock);
5418348SEric.Yu@Sun.COM 			if (error != 0)
5428348SEric.Yu@Sun.COM 				break;
5438348SEric.Yu@Sun.COM 		}
5448348SEric.Yu@Sun.COM 		if (so->so_snd_qfull) {
5458348SEric.Yu@Sun.COM 			/*
5468348SEric.Yu@Sun.COM 			 * Need to wait until the protocol is ready to receive
5478348SEric.Yu@Sun.COM 			 * more data for transmission.
5488348SEric.Yu@Sun.COM 			 */
5498348SEric.Yu@Sun.COM 			if ((error = so_snd_wait_qnotfull(so, dontblock)) != 0)
5508348SEric.Yu@Sun.COM 				break;
5518348SEric.Yu@Sun.COM 		}
5528348SEric.Yu@Sun.COM 
5538348SEric.Yu@Sun.COM 		/*
5548348SEric.Yu@Sun.COM 		 * We only allow so_maxpsz of data to be sent down to
5558348SEric.Yu@Sun.COM 		 * the protocol at time.
5568348SEric.Yu@Sun.COM 		 */
5578348SEric.Yu@Sun.COM 		mlen = MBLKL(mp);
5588348SEric.Yu@Sun.COM 		nmp = mp->b_cont;
5598348SEric.Yu@Sun.COM 		last_mblk = mp;
5608348SEric.Yu@Sun.COM 		while (nmp != NULL) {
5618348SEric.Yu@Sun.COM 			mlen += MBLKL(nmp);
5628348SEric.Yu@Sun.COM 			if (mlen > so->so_proto_props.sopp_maxpsz) {
5638348SEric.Yu@Sun.COM 				last_mblk->b_cont = NULL;
5648348SEric.Yu@Sun.COM 				break;
5658348SEric.Yu@Sun.COM 			}
5668348SEric.Yu@Sun.COM 			last_mblk = nmp;
5678348SEric.Yu@Sun.COM 			nmp = nmp->b_cont;
5688348SEric.Yu@Sun.COM 		}
5698348SEric.Yu@Sun.COM 
5708348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_send)
5718348SEric.Yu@Sun.COM 		    (so->so_proto_handle, mp, msg, cr);
5728348SEric.Yu@Sun.COM 		if (error != 0) {
5738348SEric.Yu@Sun.COM 			/*
5748348SEric.Yu@Sun.COM 			 * The send failed. The protocol will free the mblks
5758348SEric.Yu@Sun.COM 			 * that were sent down. Let the caller deal with the
5768348SEric.Yu@Sun.COM 			 * rest.
5778348SEric.Yu@Sun.COM 			 */
5788348SEric.Yu@Sun.COM 			*mpp = nmp;
5798348SEric.Yu@Sun.COM 			break;
5808348SEric.Yu@Sun.COM 		}
5818348SEric.Yu@Sun.COM 
5828348SEric.Yu@Sun.COM 		*mpp = mp = nmp;
5838348SEric.Yu@Sun.COM 	}
5848348SEric.Yu@Sun.COM 
5858348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
5868348SEric.Yu@Sun.COM 
5878348SEric.Yu@Sun.COM 	return (error);
5888348SEric.Yu@Sun.COM }
5898348SEric.Yu@Sun.COM 
5908348SEric.Yu@Sun.COM int
5918348SEric.Yu@Sun.COM so_shutdown(struct sonode *so, int how, struct cred *cr)
5928348SEric.Yu@Sun.COM {
5938348SEric.Yu@Sun.COM 	int error;
5948348SEric.Yu@Sun.COM 
5958348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_SHUTDOWN(so, how, cr));
5968348SEric.Yu@Sun.COM 
5978348SEric.Yu@Sun.COM 	/*
5988348SEric.Yu@Sun.COM 	 * SunOS 4.X has no check for datagram sockets.
5998348SEric.Yu@Sun.COM 	 * 5.X checks that it is connected (ENOTCONN)
6008348SEric.Yu@Sun.COM 	 * X/Open requires that we check the connected state.
6018348SEric.Yu@Sun.COM 	 */
6028348SEric.Yu@Sun.COM 	if (!(so->so_state & SS_ISCONNECTED)) {
6038348SEric.Yu@Sun.COM 		if (!xnet_skip_checks) {
6048348SEric.Yu@Sun.COM 			error = ENOTCONN;
6058348SEric.Yu@Sun.COM 			if (xnet_check_print) {
6068348SEric.Yu@Sun.COM 				printf("sockfs: X/Open shutdown check "
6078348SEric.Yu@Sun.COM 				    "caused ENOTCONN\n");
6088348SEric.Yu@Sun.COM 			}
6098348SEric.Yu@Sun.COM 		}
6108348SEric.Yu@Sun.COM 		goto done;
6118348SEric.Yu@Sun.COM 	}
6128348SEric.Yu@Sun.COM 
6138348SEric.Yu@Sun.COM 	error = ((*so->so_downcalls->sd_shutdown)(so->so_proto_handle,
6148348SEric.Yu@Sun.COM 	    how, cr));
6158348SEric.Yu@Sun.COM 
6168348SEric.Yu@Sun.COM 	/*
6178348SEric.Yu@Sun.COM 	 * Protocol agreed to shutdown. We need to flush the
6188348SEric.Yu@Sun.COM 	 * receive buffer if the receive side is being shutdown.
6198348SEric.Yu@Sun.COM 	 */
6208348SEric.Yu@Sun.COM 	if (error == 0 && how != SHUT_WR) {
6218348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
6228348SEric.Yu@Sun.COM 		/* wait for active reader to finish */
6238348SEric.Yu@Sun.COM 		(void) so_lock_read(so, 0);
6248348SEric.Yu@Sun.COM 
6258348SEric.Yu@Sun.COM 		so_rcv_flush(so);
6268348SEric.Yu@Sun.COM 
6278348SEric.Yu@Sun.COM 		so_unlock_read(so);
6288348SEric.Yu@Sun.COM 		mutex_exit(&so->so_lock);
6298348SEric.Yu@Sun.COM 	}
6308348SEric.Yu@Sun.COM 
6318348SEric.Yu@Sun.COM done:
6328348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
6338348SEric.Yu@Sun.COM 	return (error);
6348348SEric.Yu@Sun.COM }
6358348SEric.Yu@Sun.COM 
6368348SEric.Yu@Sun.COM int
6378348SEric.Yu@Sun.COM so_getsockname(struct sonode *so, struct sockaddr *addr,
6388348SEric.Yu@Sun.COM     socklen_t *addrlen, struct cred *cr)
6398348SEric.Yu@Sun.COM {
6408348SEric.Yu@Sun.COM 	int error;
6418348SEric.Yu@Sun.COM 
6428348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_GETSOCKNAME(so, addr, addrlen, cr));
6438348SEric.Yu@Sun.COM 
6448348SEric.Yu@Sun.COM 	error = (*so->so_downcalls->sd_getsockname)
6458348SEric.Yu@Sun.COM 	    (so->so_proto_handle, addr, addrlen, cr);
6468348SEric.Yu@Sun.COM 
6478348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
6488348SEric.Yu@Sun.COM 	return (error);
6498348SEric.Yu@Sun.COM }
6508348SEric.Yu@Sun.COM 
6518348SEric.Yu@Sun.COM int
6528348SEric.Yu@Sun.COM so_getpeername(struct sonode *so, struct sockaddr *addr,
6538348SEric.Yu@Sun.COM     socklen_t *addrlen, boolean_t accept, struct cred *cr)
6548348SEric.Yu@Sun.COM {
6558348SEric.Yu@Sun.COM 	int error;
6568348SEric.Yu@Sun.COM 
6578348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_GETPEERNAME(so, addr, addrlen, accept, cr));
6588348SEric.Yu@Sun.COM 
6598348SEric.Yu@Sun.COM 	if (accept) {
6608348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_getpeername)
6618348SEric.Yu@Sun.COM 		    (so->so_proto_handle, addr, addrlen, cr);
6628348SEric.Yu@Sun.COM 	} else if (!(so->so_state & SS_ISCONNECTED)) {
6638348SEric.Yu@Sun.COM 		error = ENOTCONN;
6648348SEric.Yu@Sun.COM 	} else if ((so->so_state & SS_CANTSENDMORE) && !xnet_skip_checks) {
6658348SEric.Yu@Sun.COM 		/* Added this check for X/Open */
6668348SEric.Yu@Sun.COM 		error = EINVAL;
6678348SEric.Yu@Sun.COM 		if (xnet_check_print) {
6688348SEric.Yu@Sun.COM 			printf("sockfs: X/Open getpeername check => EINVAL\n");
6698348SEric.Yu@Sun.COM 		}
6708348SEric.Yu@Sun.COM 	} else {
6718348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_getpeername)
6728348SEric.Yu@Sun.COM 		    (so->so_proto_handle, addr, addrlen, cr);
6738348SEric.Yu@Sun.COM 	}
6748348SEric.Yu@Sun.COM 
6758348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
6768348SEric.Yu@Sun.COM 	return (error);
6778348SEric.Yu@Sun.COM }
6788348SEric.Yu@Sun.COM 
6798348SEric.Yu@Sun.COM int
6808348SEric.Yu@Sun.COM so_getsockopt(struct sonode *so, int level, int option_name,
6818348SEric.Yu@Sun.COM     void *optval, socklen_t *optlenp, int flags, struct cred *cr)
6828348SEric.Yu@Sun.COM {
6838348SEric.Yu@Sun.COM 	int error = 0;
6848348SEric.Yu@Sun.COM 
6858348SEric.Yu@Sun.COM 	ASSERT(MUTEX_NOT_HELD(&so->so_lock));
6868348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so,
6878348SEric.Yu@Sun.COM 	    SOP_GETSOCKOPT(so, level, option_name, optval, optlenp, flags, cr));
6888348SEric.Yu@Sun.COM 
6898465SEric.Yu@Sun.COM 	error = socket_getopt_common(so, level, option_name, optval, optlenp,
6908465SEric.Yu@Sun.COM 	    flags);
6918348SEric.Yu@Sun.COM 	if (error < 0) {
6928348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_getsockopt)
6938348SEric.Yu@Sun.COM 		    (so->so_proto_handle, level, option_name, optval, optlenp,
6948348SEric.Yu@Sun.COM 		    cr);
6958348SEric.Yu@Sun.COM 		if (error ==  ENOPROTOOPT) {
6968348SEric.Yu@Sun.COM 			if (level == SOL_SOCKET) {
6978348SEric.Yu@Sun.COM 				/*
6988348SEric.Yu@Sun.COM 				 * If a protocol does not support a particular
6998348SEric.Yu@Sun.COM 				 * socket option, set can fail (not allowed)
7008348SEric.Yu@Sun.COM 				 * but get can not fail. This is the previous
7018348SEric.Yu@Sun.COM 				 * sockfs bahvior.
7028348SEric.Yu@Sun.COM 				 */
7038348SEric.Yu@Sun.COM 				switch (option_name) {
7048348SEric.Yu@Sun.COM 				case SO_LINGER:
7058348SEric.Yu@Sun.COM 					if (*optlenp < (t_uscalar_t)
7068348SEric.Yu@Sun.COM 					    sizeof (struct linger)) {
7078348SEric.Yu@Sun.COM 						error = EINVAL;
7088348SEric.Yu@Sun.COM 						break;
7098348SEric.Yu@Sun.COM 					}
7108348SEric.Yu@Sun.COM 					error = 0;
7118348SEric.Yu@Sun.COM 					bzero(optval, sizeof (struct linger));
7128348SEric.Yu@Sun.COM 					*optlenp = sizeof (struct linger);
7138348SEric.Yu@Sun.COM 					break;
7148348SEric.Yu@Sun.COM 				case SO_RCVTIMEO:
7158348SEric.Yu@Sun.COM 				case SO_SNDTIMEO:
7168348SEric.Yu@Sun.COM 					if (*optlenp < (t_uscalar_t)
7178348SEric.Yu@Sun.COM 					    sizeof (struct timeval)) {
7188348SEric.Yu@Sun.COM 						error = EINVAL;
7198348SEric.Yu@Sun.COM 						break;
7208348SEric.Yu@Sun.COM 					}
7218348SEric.Yu@Sun.COM 					error = 0;
7228348SEric.Yu@Sun.COM 					bzero(optval, sizeof (struct timeval));
7238348SEric.Yu@Sun.COM 					*optlenp = sizeof (struct timeval);
7248348SEric.Yu@Sun.COM 					break;
7258348SEric.Yu@Sun.COM 				case SO_SND_BUFINFO:
7268348SEric.Yu@Sun.COM 					if (*optlenp < (t_uscalar_t)
7278348SEric.Yu@Sun.COM 					    sizeof (struct so_snd_bufinfo)) {
7288348SEric.Yu@Sun.COM 						error = EINVAL;
7298348SEric.Yu@Sun.COM 						break;
7308348SEric.Yu@Sun.COM 					}
7318348SEric.Yu@Sun.COM 					error = 0;
7328348SEric.Yu@Sun.COM 					bzero(optval,
7338348SEric.Yu@Sun.COM 					    sizeof (struct so_snd_bufinfo));
7348348SEric.Yu@Sun.COM 					*optlenp =
7358348SEric.Yu@Sun.COM 					    sizeof (struct so_snd_bufinfo);
7368348SEric.Yu@Sun.COM 					break;
7378348SEric.Yu@Sun.COM 				case SO_DEBUG:
7388348SEric.Yu@Sun.COM 				case SO_REUSEADDR:
7398348SEric.Yu@Sun.COM 				case SO_KEEPALIVE:
7408348SEric.Yu@Sun.COM 				case SO_DONTROUTE:
7418348SEric.Yu@Sun.COM 				case SO_BROADCAST:
7428348SEric.Yu@Sun.COM 				case SO_USELOOPBACK:
7438348SEric.Yu@Sun.COM 				case SO_OOBINLINE:
7448348SEric.Yu@Sun.COM 				case SO_DGRAM_ERRIND:
7458348SEric.Yu@Sun.COM 				case SO_SNDBUF:
7468348SEric.Yu@Sun.COM 				case SO_RCVBUF:
7478348SEric.Yu@Sun.COM 					error = 0;
7488348SEric.Yu@Sun.COM 					*((int32_t *)optval) = 0;
7498348SEric.Yu@Sun.COM 					*optlenp = sizeof (int32_t);
7508348SEric.Yu@Sun.COM 					break;
7518348SEric.Yu@Sun.COM 				default:
7528348SEric.Yu@Sun.COM 					break;
7538348SEric.Yu@Sun.COM 				}
7548348SEric.Yu@Sun.COM 			}
7558348SEric.Yu@Sun.COM 		}
7568348SEric.Yu@Sun.COM 	}
7578348SEric.Yu@Sun.COM 
7588348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
7598348SEric.Yu@Sun.COM 	return (error);
7608348SEric.Yu@Sun.COM }
7618348SEric.Yu@Sun.COM 
7628348SEric.Yu@Sun.COM int
7638348SEric.Yu@Sun.COM so_setsockopt(struct sonode *so, int level, int option_name,
7648348SEric.Yu@Sun.COM     const void *optval, socklen_t optlen, struct cred *cr)
7658348SEric.Yu@Sun.COM {
7668348SEric.Yu@Sun.COM 	int error = 0;
7678348SEric.Yu@Sun.COM 
7688348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so,
7698348SEric.Yu@Sun.COM 	    SOP_SETSOCKOPT(so, level, option_name, optval, optlen, cr));
7708348SEric.Yu@Sun.COM 
7718348SEric.Yu@Sun.COM 	/* X/Open requires this check */
7728348SEric.Yu@Sun.COM 	if (so->so_state & SS_CANTSENDMORE && !xnet_skip_checks) {
7738348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
7748348SEric.Yu@Sun.COM 		if (xnet_check_print)
7758348SEric.Yu@Sun.COM 			printf("sockfs: X/Open setsockopt check => EINVAL\n");
7768348SEric.Yu@Sun.COM 		return (EINVAL);
7778348SEric.Yu@Sun.COM 	}
7788348SEric.Yu@Sun.COM 
7798465SEric.Yu@Sun.COM 	if (level == SOL_SOCKET) {
7808465SEric.Yu@Sun.COM 		switch (option_name) {
7818465SEric.Yu@Sun.COM 		case SO_RCVTIMEO:
7828465SEric.Yu@Sun.COM 		case SO_SNDTIMEO: {
7838489Sshenjian 			struct timeval tl;
7848465SEric.Yu@Sun.COM 			clock_t t_usec;
7858348SEric.Yu@Sun.COM 
786*8575Sshenjian 			if (get_udatamodel() == DATAMODEL_NONE ||
787*8575Sshenjian 			    get_udatamodel() == DATAMODEL_NATIVE) {
7888489Sshenjian 				if (optlen != sizeof (struct timeval)) {
7898489Sshenjian 					error = EINVAL;
7908489Sshenjian 					goto done;
7918489Sshenjian 				}
7928489Sshenjian 				bcopy((struct timeval *)optval, &tl,
7938489Sshenjian 				    sizeof (struct timeval));
7948489Sshenjian 			} else {
7958489Sshenjian 				if (optlen != sizeof (struct timeval32)) {
7968489Sshenjian 					error = EINVAL;
7978489Sshenjian 					goto done;
7988489Sshenjian 				}
7998489Sshenjian 				TIMEVAL32_TO_TIMEVAL(&tl,
8008489Sshenjian 				    (struct timeval32 *)optval);
8018465SEric.Yu@Sun.COM 			}
8028489Sshenjian 			t_usec = tl.tv_sec * 1000 * 1000 + tl.tv_usec;
8038465SEric.Yu@Sun.COM 			mutex_enter(&so->so_lock);
8048465SEric.Yu@Sun.COM 			if (option_name == SO_RCVTIMEO)
8058465SEric.Yu@Sun.COM 				so->so_rcvtimeo = drv_usectohz(t_usec);
8068465SEric.Yu@Sun.COM 			else
8078465SEric.Yu@Sun.COM 				so->so_sndtimeo = drv_usectohz(t_usec);
8088465SEric.Yu@Sun.COM 			mutex_exit(&so->so_lock);
8098348SEric.Yu@Sun.COM 			SO_UNBLOCK_FALLBACK(so);
8108465SEric.Yu@Sun.COM 			return (0);
8118348SEric.Yu@Sun.COM 		}
8128465SEric.Yu@Sun.COM 		case SO_RCVBUF:
8138465SEric.Yu@Sun.COM 			/*
8148465SEric.Yu@Sun.COM 			 * XXX XPG 4.2 applications retrieve SO_RCVBUF from
8158465SEric.Yu@Sun.COM 			 * sockfs since the transport might adjust the value
8168465SEric.Yu@Sun.COM 			 * and not return exactly what was set by the
8178465SEric.Yu@Sun.COM 			 * application.
8188465SEric.Yu@Sun.COM 			 */
8198465SEric.Yu@Sun.COM 			so->so_xpg_rcvbuf = *(int32_t *)optval;
8208465SEric.Yu@Sun.COM 			break;
8218465SEric.Yu@Sun.COM 		}
8228348SEric.Yu@Sun.COM 	}
8238348SEric.Yu@Sun.COM 	error = (*so->so_downcalls->sd_setsockopt)
8248348SEric.Yu@Sun.COM 	    (so->so_proto_handle, level, option_name, optval, optlen, cr);
8258489Sshenjian done:
8268348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
8278348SEric.Yu@Sun.COM 	return (error);
8288348SEric.Yu@Sun.COM }
8298348SEric.Yu@Sun.COM 
8308348SEric.Yu@Sun.COM int
8318348SEric.Yu@Sun.COM so_ioctl(struct sonode *so, int cmd, intptr_t arg, int mode,
8328348SEric.Yu@Sun.COM     struct cred *cr, int32_t *rvalp)
8338348SEric.Yu@Sun.COM {
8348348SEric.Yu@Sun.COM 	int error = 0;
8358348SEric.Yu@Sun.COM 
8368348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_IOCTL(so, cmd, arg, mode, cr, rvalp));
8378348SEric.Yu@Sun.COM 
8388348SEric.Yu@Sun.COM 	/*
8398348SEric.Yu@Sun.COM 	 * If there is a pending error, return error
8408348SEric.Yu@Sun.COM 	 * This can happen if a non blocking operation caused an error.
8418348SEric.Yu@Sun.COM 	 */
8428348SEric.Yu@Sun.COM 	if (so->so_error != 0) {
8438348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
8448348SEric.Yu@Sun.COM 		error = sogeterr(so, B_TRUE);
8458348SEric.Yu@Sun.COM 		mutex_exit(&so->so_lock);
8468348SEric.Yu@Sun.COM 		if (error != 0)
8478348SEric.Yu@Sun.COM 			goto done;
8488348SEric.Yu@Sun.COM 	}
8498348SEric.Yu@Sun.COM 
8508348SEric.Yu@Sun.COM 	/*
8518348SEric.Yu@Sun.COM 	 * calling strioc can result in the socket falling back to TPI,
8528348SEric.Yu@Sun.COM 	 * if that is supported.
8538348SEric.Yu@Sun.COM 	 */
8548348SEric.Yu@Sun.COM 	if ((error = socket_ioctl_common(so, cmd, arg, mode, cr, rvalp)) < 0 &&
8558348SEric.Yu@Sun.COM 	    (error = socket_strioc_common(so, cmd, arg, mode, cr, rvalp)) < 0) {
8568348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_ioctl)(so->so_proto_handle,
8578348SEric.Yu@Sun.COM 		    cmd, arg, mode, rvalp, cr);
8588348SEric.Yu@Sun.COM 	}
8598348SEric.Yu@Sun.COM 
8608348SEric.Yu@Sun.COM done:
8618348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
8628348SEric.Yu@Sun.COM 
8638348SEric.Yu@Sun.COM 	return (error);
8648348SEric.Yu@Sun.COM }
8658348SEric.Yu@Sun.COM 
8668348SEric.Yu@Sun.COM int
8678348SEric.Yu@Sun.COM so_poll(struct sonode *so, short events, int anyyet, short *reventsp,
8688348SEric.Yu@Sun.COM     struct pollhead **phpp)
8698348SEric.Yu@Sun.COM {
8708348SEric.Yu@Sun.COM 	int state = so->so_state;
8718348SEric.Yu@Sun.COM 	*reventsp = 0;
8728348SEric.Yu@Sun.COM 
8738348SEric.Yu@Sun.COM 	if (so->so_error != 0 &&
8748348SEric.Yu@Sun.COM 	    ((POLLIN|POLLRDNORM|POLLOUT) & events)  != 0) {
8758348SEric.Yu@Sun.COM 		*reventsp = (POLLIN|POLLRDNORM|POLLOUT) & events;
8768348SEric.Yu@Sun.COM 		return (0);
8778348SEric.Yu@Sun.COM 	}
8788348SEric.Yu@Sun.COM 
8798348SEric.Yu@Sun.COM 	/*
8808348SEric.Yu@Sun.COM 	 * As long as there is buffer to send data, and the socket is
8818348SEric.Yu@Sun.COM 	 * in a state where it can send data (i.e., connected for
8828348SEric.Yu@Sun.COM 	 * connection oriented protocols), then turn on POLLOUT events
8838348SEric.Yu@Sun.COM 	 */
8848348SEric.Yu@Sun.COM 	if (!so->so_snd_qfull && ((so->so_mode & SM_CONNREQUIRED) == 0 ||
8858348SEric.Yu@Sun.COM 	    state & SS_ISCONNECTED)) {
8868348SEric.Yu@Sun.COM 		*reventsp |= POLLOUT & events;
8878348SEric.Yu@Sun.COM 	}
8888348SEric.Yu@Sun.COM 
8898348SEric.Yu@Sun.COM 	/*
8908348SEric.Yu@Sun.COM 	 * Turn on POLLIN whenever there is data on the receive queue,
8918348SEric.Yu@Sun.COM 	 * or the socket is in a state where no more data will be received.
8928348SEric.Yu@Sun.COM 	 * Also, if the socket is accepting connections, flip the bit if
8938348SEric.Yu@Sun.COM 	 * there is something on the queue.
8948427SAnders.Persson@Sun.COM 	 *
8958427SAnders.Persson@Sun.COM 	 * We do an initial check for events without holding locks. However,
8968427SAnders.Persson@Sun.COM 	 * if there are no event available, then we redo the check for POLLIN
8978427SAnders.Persson@Sun.COM 	 * events under the lock.
8988348SEric.Yu@Sun.COM 	 */
8998348SEric.Yu@Sun.COM 
9008348SEric.Yu@Sun.COM 	/* Pending connections */
9018348SEric.Yu@Sun.COM 	if (so->so_acceptq_len > 0)
9028348SEric.Yu@Sun.COM 		*reventsp |= (POLLIN|POLLRDNORM) & events;
9038348SEric.Yu@Sun.COM 
9048348SEric.Yu@Sun.COM 	/* Data */
9058348SEric.Yu@Sun.COM 	/* so_downcalls is null for sctp */
9068348SEric.Yu@Sun.COM 	if (so->so_downcalls != NULL && so->so_downcalls->sd_poll != NULL) {
9078348SEric.Yu@Sun.COM 		*reventsp |= (*so->so_downcalls->sd_poll)
9088348SEric.Yu@Sun.COM 		    (so->so_proto_handle, events & SO_PROTO_POLLEV, anyyet,
9098348SEric.Yu@Sun.COM 		    CRED()) & events;
9108348SEric.Yu@Sun.COM 		ASSERT((*reventsp & ~events) == 0);
9118348SEric.Yu@Sun.COM 		/* do not recheck events */
9128348SEric.Yu@Sun.COM 		events &= ~SO_PROTO_POLLEV;
9138348SEric.Yu@Sun.COM 	} else {
9148348SEric.Yu@Sun.COM 		if (SO_HAVE_DATA(so))
9158348SEric.Yu@Sun.COM 			*reventsp |= (POLLIN|POLLRDNORM) & events;
9168348SEric.Yu@Sun.COM 
9178348SEric.Yu@Sun.COM 		/* Urgent data */
9188348SEric.Yu@Sun.COM 		if ((state & SS_OOBPEND) != 0)
9198348SEric.Yu@Sun.COM 			*reventsp |= (POLLRDBAND) & events;
9208348SEric.Yu@Sun.COM 	}
9218348SEric.Yu@Sun.COM 
9228348SEric.Yu@Sun.COM 	if (!*reventsp && !anyyet) {
9238348SEric.Yu@Sun.COM 		/* Check for read events again, but this time under lock */
9248348SEric.Yu@Sun.COM 		if (events & (POLLIN|POLLRDNORM)) {
9258348SEric.Yu@Sun.COM 			mutex_enter(&so->so_lock);
9268348SEric.Yu@Sun.COM 			if (SO_HAVE_DATA(so) || so->so_acceptq_len > 0) {
9278348SEric.Yu@Sun.COM 				mutex_exit(&so->so_lock);
9288348SEric.Yu@Sun.COM 				*reventsp |= (POLLIN|POLLRDNORM) & events;
9298348SEric.Yu@Sun.COM 				return (0);
9308348SEric.Yu@Sun.COM 			} else {
9318348SEric.Yu@Sun.COM 				so->so_pollev |= SO_POLLEV_IN;
9328348SEric.Yu@Sun.COM 				mutex_exit(&so->so_lock);
9338348SEric.Yu@Sun.COM 			}
9348348SEric.Yu@Sun.COM 		}
9358348SEric.Yu@Sun.COM 		*phpp = &so->so_poll_list;
9368348SEric.Yu@Sun.COM 	}
9378348SEric.Yu@Sun.COM 	return (0);
9388348SEric.Yu@Sun.COM }
9398348SEric.Yu@Sun.COM 
9408348SEric.Yu@Sun.COM /*
9418348SEric.Yu@Sun.COM  * Generic Upcalls
9428348SEric.Yu@Sun.COM  */
9438348SEric.Yu@Sun.COM void
9448348SEric.Yu@Sun.COM so_connected(sock_upper_handle_t sock_handle, sock_connid_t id,
9458348SEric.Yu@Sun.COM     cred_t *peer_cred, pid_t peer_cpid)
9468348SEric.Yu@Sun.COM {
9478348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
9488348SEric.Yu@Sun.COM 
9498348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
9508348SEric.Yu@Sun.COM 	ASSERT(so->so_proto_handle != NULL);
9518348SEric.Yu@Sun.COM 
9528348SEric.Yu@Sun.COM 	if (peer_cred != NULL) {
9538348SEric.Yu@Sun.COM 		if (so->so_peercred != NULL)
9548348SEric.Yu@Sun.COM 			crfree(so->so_peercred);
9558348SEric.Yu@Sun.COM 		crhold(peer_cred);
9568348SEric.Yu@Sun.COM 		so->so_peercred = peer_cred;
9578348SEric.Yu@Sun.COM 		so->so_cpid = peer_cpid;
9588348SEric.Yu@Sun.COM 	}
9598348SEric.Yu@Sun.COM 
9608348SEric.Yu@Sun.COM 	so->so_proto_connid = id;
9618348SEric.Yu@Sun.COM 	soisconnected(so);
9628348SEric.Yu@Sun.COM 	/*
9638348SEric.Yu@Sun.COM 	 * Wake ones who're waiting for conn to become established.
9648348SEric.Yu@Sun.COM 	 */
9658348SEric.Yu@Sun.COM 	so_notify_connected(so);
9668348SEric.Yu@Sun.COM }
9678348SEric.Yu@Sun.COM 
9688348SEric.Yu@Sun.COM int
9698348SEric.Yu@Sun.COM so_disconnected(sock_upper_handle_t sock_handle, sock_connid_t id, int error)
9708348SEric.Yu@Sun.COM {
9718348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
9728348SEric.Yu@Sun.COM 
9738348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
9748348SEric.Yu@Sun.COM 
9758348SEric.Yu@Sun.COM 	so->so_proto_connid = id;
9768348SEric.Yu@Sun.COM 	soisdisconnected(so, error);
9778348SEric.Yu@Sun.COM 	so_notify_disconnected(so, error);
9788348SEric.Yu@Sun.COM 
9798348SEric.Yu@Sun.COM 	return (0);
9808348SEric.Yu@Sun.COM }
9818348SEric.Yu@Sun.COM 
9828348SEric.Yu@Sun.COM void
9838348SEric.Yu@Sun.COM so_opctl(sock_upper_handle_t sock_handle, sock_opctl_action_t action,
9848348SEric.Yu@Sun.COM     uintptr_t arg)
9858348SEric.Yu@Sun.COM {
9868348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
9878348SEric.Yu@Sun.COM 
9888348SEric.Yu@Sun.COM 	switch (action) {
9898348SEric.Yu@Sun.COM 	case SOCK_OPCTL_SHUT_SEND:
9908348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
9918348SEric.Yu@Sun.COM 		socantsendmore(so);
9928348SEric.Yu@Sun.COM 		so_notify_disconnecting(so);
9938348SEric.Yu@Sun.COM 		break;
9948348SEric.Yu@Sun.COM 	case SOCK_OPCTL_SHUT_RECV: {
9958348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
9968348SEric.Yu@Sun.COM 		socantrcvmore(so);
9978348SEric.Yu@Sun.COM 		so_notify_eof(so);
9988348SEric.Yu@Sun.COM 		break;
9998348SEric.Yu@Sun.COM 	}
10008348SEric.Yu@Sun.COM 	case SOCK_OPCTL_ENAB_ACCEPT:
10018348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
10028348SEric.Yu@Sun.COM 		so->so_state |= SS_ACCEPTCONN;
10038348SEric.Yu@Sun.COM 		so->so_backlog = (unsigned int)arg;
10048348SEric.Yu@Sun.COM 		mutex_exit(&so->so_lock);
10058348SEric.Yu@Sun.COM 		break;
10068348SEric.Yu@Sun.COM 	default:
10078348SEric.Yu@Sun.COM 		ASSERT(0);
10088348SEric.Yu@Sun.COM 		break;
10098348SEric.Yu@Sun.COM 	}
10108348SEric.Yu@Sun.COM }
10118348SEric.Yu@Sun.COM 
10128348SEric.Yu@Sun.COM void
10138348SEric.Yu@Sun.COM so_txq_full(sock_upper_handle_t sock_handle, boolean_t qfull)
10148348SEric.Yu@Sun.COM {
10158348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
10168348SEric.Yu@Sun.COM 
10178348SEric.Yu@Sun.COM 	if (qfull) {
10188348SEric.Yu@Sun.COM 		so_snd_qfull(so);
10198348SEric.Yu@Sun.COM 	} else {
10208348SEric.Yu@Sun.COM 		so_snd_qnotfull(so);
10218348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
10228348SEric.Yu@Sun.COM 		so_notify_writable(so);
10238348SEric.Yu@Sun.COM 	}
10248348SEric.Yu@Sun.COM }
10258348SEric.Yu@Sun.COM 
10268348SEric.Yu@Sun.COM sock_upper_handle_t
10278348SEric.Yu@Sun.COM so_newconn(sock_upper_handle_t parenthandle,
10288348SEric.Yu@Sun.COM     sock_lower_handle_t proto_handle, sock_downcalls_t *sock_downcalls,
10298348SEric.Yu@Sun.COM     struct cred *peer_cred, pid_t peer_cpid, sock_upcalls_t **sock_upcallsp)
10308348SEric.Yu@Sun.COM {
10318348SEric.Yu@Sun.COM 	struct sonode	*so = (struct sonode *)parenthandle;
10328348SEric.Yu@Sun.COM 	struct sonode	*nso;
10338348SEric.Yu@Sun.COM 	int error;
10348348SEric.Yu@Sun.COM 
10358348SEric.Yu@Sun.COM 	ASSERT(proto_handle != NULL);
10368348SEric.Yu@Sun.COM 
10378348SEric.Yu@Sun.COM 	if ((so->so_state & SS_ACCEPTCONN) == 0 ||
10388348SEric.Yu@Sun.COM 	    so->so_acceptq_len >= so->so_backlog)
10398348SEric.Yu@Sun.COM 		return (NULL);
10408348SEric.Yu@Sun.COM 
10418348SEric.Yu@Sun.COM 	nso = socket_newconn(so, proto_handle, sock_downcalls, SOCKET_NOSLEEP,
10428348SEric.Yu@Sun.COM 	    &error);
10438348SEric.Yu@Sun.COM 	if (nso == NULL)
10448348SEric.Yu@Sun.COM 		return (NULL);
10458348SEric.Yu@Sun.COM 
10468348SEric.Yu@Sun.COM 	if (peer_cred != NULL) {
10478348SEric.Yu@Sun.COM 		crhold(peer_cred);
10488348SEric.Yu@Sun.COM 		nso->so_peercred = peer_cred;
10498348SEric.Yu@Sun.COM 		nso->so_cpid = peer_cpid;
10508348SEric.Yu@Sun.COM 	}
10518348SEric.Yu@Sun.COM 
10528348SEric.Yu@Sun.COM 	(void) so_acceptq_enqueue(so, nso);
10538348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
10548348SEric.Yu@Sun.COM 	so_notify_newconn(so);
10558348SEric.Yu@Sun.COM 
10568348SEric.Yu@Sun.COM 	*sock_upcallsp = &so_upcalls;
10578348SEric.Yu@Sun.COM 
10588348SEric.Yu@Sun.COM 	return ((sock_upper_handle_t)nso);
10598348SEric.Yu@Sun.COM }
10608348SEric.Yu@Sun.COM 
10618348SEric.Yu@Sun.COM void
10628348SEric.Yu@Sun.COM so_set_prop(sock_upper_handle_t sock_handle, struct sock_proto_props *soppp)
10638348SEric.Yu@Sun.COM {
10648348SEric.Yu@Sun.COM 	struct sonode *so;
10658348SEric.Yu@Sun.COM 
10668348SEric.Yu@Sun.COM 	so = (struct sonode *)sock_handle;
10678348SEric.Yu@Sun.COM 
10688348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
10698348SEric.Yu@Sun.COM 
10708348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_MAXBLK)
10718348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_maxblk = soppp->sopp_maxblk;
10728348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_WROFF)
10738348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_wroff = soppp->sopp_wroff;
10748348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_TAIL)
10758348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_tail = soppp->sopp_tail;
10768348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_RCVHIWAT)
10778348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_rxhiwat = soppp->sopp_rxhiwat;
10788348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_RCVLOWAT)
10798348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_rxlowat = soppp->sopp_rxlowat;
10808348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_MAXPSZ)
10818348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_maxpsz = soppp->sopp_maxpsz;
10828348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_MINPSZ)
10838348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_minpsz = soppp->sopp_minpsz;
10848348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_ZCOPY) {
10858348SEric.Yu@Sun.COM 		if (soppp->sopp_zcopyflag & ZCVMSAFE) {
10868348SEric.Yu@Sun.COM 			so->so_proto_props.sopp_zcopyflag |= STZCVMSAFE;
10878348SEric.Yu@Sun.COM 			so->so_proto_props.sopp_zcopyflag &= ~STZCVMUNSAFE;
10888348SEric.Yu@Sun.COM 		} else if (soppp->sopp_zcopyflag & ZCVMUNSAFE) {
10898348SEric.Yu@Sun.COM 			so->so_proto_props.sopp_zcopyflag |= STZCVMUNSAFE;
10908348SEric.Yu@Sun.COM 			so->so_proto_props.sopp_zcopyflag &= ~STZCVMSAFE;
10918348SEric.Yu@Sun.COM 		}
10928348SEric.Yu@Sun.COM 
10938348SEric.Yu@Sun.COM 		if (soppp->sopp_zcopyflag & COPYCACHED) {
10948348SEric.Yu@Sun.COM 			so->so_proto_props.sopp_zcopyflag |= STRCOPYCACHED;
10958348SEric.Yu@Sun.COM 		}
10968348SEric.Yu@Sun.COM 	}
10978348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_OOBINLINE)
10988348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_oobinline = soppp->sopp_oobinline;
10998348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_RCVTIMER)
11008348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_rcvtimer = soppp->sopp_rcvtimer;
11018348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_RCVTHRESH)
11028348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_rcvthresh = soppp->sopp_rcvthresh;
11038348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_MAXADDRLEN)
11048348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_maxaddrlen = soppp->sopp_maxaddrlen;
11058348SEric.Yu@Sun.COM 
11068348SEric.Yu@Sun.COM 	mutex_exit(&so->so_lock);
11078348SEric.Yu@Sun.COM 
11088348SEric.Yu@Sun.COM #ifdef DEBUG
11098348SEric.Yu@Sun.COM 	soppp->sopp_flags &= ~(SOCKOPT_MAXBLK | SOCKOPT_WROFF | SOCKOPT_TAIL |
11108348SEric.Yu@Sun.COM 	    SOCKOPT_RCVHIWAT | SOCKOPT_RCVLOWAT | SOCKOPT_MAXPSZ |
11118348SEric.Yu@Sun.COM 	    SOCKOPT_ZCOPY | SOCKOPT_OOBINLINE | SOCKOPT_RCVTIMER |
11128348SEric.Yu@Sun.COM 	    SOCKOPT_RCVTHRESH | SOCKOPT_MAXADDRLEN | SOCKOPT_MINPSZ);
11138348SEric.Yu@Sun.COM 	ASSERT(soppp->sopp_flags == 0);
11148348SEric.Yu@Sun.COM #endif
11158348SEric.Yu@Sun.COM }
11168348SEric.Yu@Sun.COM 
11178348SEric.Yu@Sun.COM /* ARGSUSED */
11188348SEric.Yu@Sun.COM ssize_t
11198348SEric.Yu@Sun.COM so_queue_msg(sock_upper_handle_t sock_handle, mblk_t *mp,
11208348SEric.Yu@Sun.COM     size_t msg_size, int flags, int *errorp,  boolean_t *force_pushp)
11218348SEric.Yu@Sun.COM {
11228348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
11238348SEric.Yu@Sun.COM 	boolean_t force_push = B_TRUE;
11248348SEric.Yu@Sun.COM 	int space_left;
11258348SEric.Yu@Sun.COM 	sodirect_t *sodp = so->so_direct;
11268348SEric.Yu@Sun.COM 
11278348SEric.Yu@Sun.COM 	ASSERT(errorp != NULL);
11288348SEric.Yu@Sun.COM 	*errorp = 0;
11298348SEric.Yu@Sun.COM 	if (mp == NULL) {
11308348SEric.Yu@Sun.COM 		if (msg_size > 0) {
11318348SEric.Yu@Sun.COM 			ASSERT(so->so_downcalls->sd_recv_uio != NULL);
11328348SEric.Yu@Sun.COM 			mutex_enter(&so->so_lock);
11338348SEric.Yu@Sun.COM 			/* the notify functions will drop the lock */
11348348SEric.Yu@Sun.COM 			if (flags & MSG_OOB)
11358348SEric.Yu@Sun.COM 				so_notify_oobdata(so, IS_SO_OOB_INLINE(so));
11368348SEric.Yu@Sun.COM 			else
11378348SEric.Yu@Sun.COM 				so_notify_data(so, msg_size);
11388348SEric.Yu@Sun.COM 			return (0);
11398348SEric.Yu@Sun.COM 		}
11408348SEric.Yu@Sun.COM 		/*
11418348SEric.Yu@Sun.COM 		 * recv space check
11428348SEric.Yu@Sun.COM 		 */
11438348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
11448348SEric.Yu@Sun.COM 		space_left = so->so_rcvbuf - so->so_rcv_queued;
11458348SEric.Yu@Sun.COM 		if (space_left <= 0) {
11468348SEric.Yu@Sun.COM 			so->so_flowctrld = B_TRUE;
11478348SEric.Yu@Sun.COM 			*errorp = ENOSPC;
11488348SEric.Yu@Sun.COM 			space_left = -1;
11498348SEric.Yu@Sun.COM 		}
11508348SEric.Yu@Sun.COM 		goto done_unlock;
11518348SEric.Yu@Sun.COM 	}
11528348SEric.Yu@Sun.COM 
11538348SEric.Yu@Sun.COM 	ASSERT(mp->b_next == NULL);
11548348SEric.Yu@Sun.COM 	ASSERT(DB_TYPE(mp) == M_DATA || DB_TYPE(mp) == M_PROTO);
11558348SEric.Yu@Sun.COM 	ASSERT(msg_size == msgdsize(mp));
11568348SEric.Yu@Sun.COM 
11578348SEric.Yu@Sun.COM 	if (flags & MSG_OOB) {
11588348SEric.Yu@Sun.COM 		so_queue_oob(sock_handle, mp, msg_size);
11598348SEric.Yu@Sun.COM 		return (0);
11608348SEric.Yu@Sun.COM 	}
11618348SEric.Yu@Sun.COM 
11628348SEric.Yu@Sun.COM 	if (force_pushp != NULL)
11638348SEric.Yu@Sun.COM 		force_push = *force_pushp;
11648348SEric.Yu@Sun.COM 
11658348SEric.Yu@Sun.COM 	if (DB_TYPE(mp) == M_PROTO && !__TPI_PRIM_ISALIGNED(mp->b_rptr)) {
11668348SEric.Yu@Sun.COM 		/* The read pointer is not aligned correctly for TPI */
11678348SEric.Yu@Sun.COM 		zcmn_err(getzoneid(), CE_WARN,
11688348SEric.Yu@Sun.COM 		    "sockfs: Unaligned TPI message received. rptr = %p\n",
11698348SEric.Yu@Sun.COM 		    (void *)mp->b_rptr);
11708348SEric.Yu@Sun.COM 		freemsg(mp);
11718348SEric.Yu@Sun.COM 		mutex_enter(sodp->sod_lockp);
11728348SEric.Yu@Sun.COM 		SOD_UIOAFINI(sodp);
11738348SEric.Yu@Sun.COM 		mutex_exit(sodp->sod_lockp);
11748348SEric.Yu@Sun.COM 
11758348SEric.Yu@Sun.COM 		return (so->so_rcvbuf - so->so_rcv_queued);
11768348SEric.Yu@Sun.COM 	}
11778348SEric.Yu@Sun.COM 
11788348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
11798348SEric.Yu@Sun.COM 	if (so->so_state & (SS_FALLBACK_PENDING | SS_FALLBACK_COMP)) {
11808348SEric.Yu@Sun.COM 		SOD_DISABLE(sodp);
11818348SEric.Yu@Sun.COM 		mutex_exit(&so->so_lock);
11828348SEric.Yu@Sun.COM 		*errorp = EOPNOTSUPP;
11838348SEric.Yu@Sun.COM 		return (-1);
11848348SEric.Yu@Sun.COM 	}
11858348SEric.Yu@Sun.COM 	if (so->so_state & SS_CANTRCVMORE) {
11868348SEric.Yu@Sun.COM 		freemsg(mp);
11878348SEric.Yu@Sun.COM 		SOD_DISABLE(sodp);
11888348SEric.Yu@Sun.COM 		mutex_exit(&so->so_lock);
11898348SEric.Yu@Sun.COM 		return (0);
11908348SEric.Yu@Sun.COM 	}
11918348SEric.Yu@Sun.COM 
11928348SEric.Yu@Sun.COM 	/* process the mblk via I/OAT if capable */
11938348SEric.Yu@Sun.COM 	if (sodp != NULL && (sodp->sod_state & SOD_ENABLED)) {
11948348SEric.Yu@Sun.COM 		if (DB_TYPE(mp) == M_DATA) {
11958348SEric.Yu@Sun.COM 			(void) sod_uioa_mblk_init(sodp, mp, msg_size);
11968348SEric.Yu@Sun.COM 		} else {
11978348SEric.Yu@Sun.COM 			SOD_UIOAFINI(sodp);
11988348SEric.Yu@Sun.COM 		}
11998348SEric.Yu@Sun.COM 	}
12008348SEric.Yu@Sun.COM 
12018348SEric.Yu@Sun.COM 	if (mp->b_next == NULL) {
12028348SEric.Yu@Sun.COM 		so_enqueue_msg(so, mp, msg_size);
12038348SEric.Yu@Sun.COM 	} else {
12048348SEric.Yu@Sun.COM 		do {
12058348SEric.Yu@Sun.COM 			mblk_t *nmp;
12068348SEric.Yu@Sun.COM 
12078348SEric.Yu@Sun.COM 			if ((nmp = mp->b_next) != NULL) {
12088348SEric.Yu@Sun.COM 				mp->b_next = NULL;
12098348SEric.Yu@Sun.COM 			}
12108348SEric.Yu@Sun.COM 			so_enqueue_msg(so, mp, msgdsize(mp));
12118348SEric.Yu@Sun.COM 			mp = nmp;
12128348SEric.Yu@Sun.COM 		} while (mp != NULL);
12138348SEric.Yu@Sun.COM 	}
12148348SEric.Yu@Sun.COM 
12158348SEric.Yu@Sun.COM 	space_left = so->so_rcvbuf - so->so_rcv_queued;
12168348SEric.Yu@Sun.COM 	if (space_left <= 0) {
12178348SEric.Yu@Sun.COM 		so->so_flowctrld = B_TRUE;
12188348SEric.Yu@Sun.COM 		*errorp = ENOSPC;
12198348SEric.Yu@Sun.COM 		space_left = -1;
12208348SEric.Yu@Sun.COM 	}
12218348SEric.Yu@Sun.COM 
12228348SEric.Yu@Sun.COM 	if (force_push || so->so_rcv_queued >= so->so_rcv_thresh ||
12238348SEric.Yu@Sun.COM 	    so->so_rcv_queued >= so->so_rcv_wanted ||
12248348SEric.Yu@Sun.COM 	    (sodp != NULL && so->so_rcv_queued >= sodp->sod_want)) {
12258348SEric.Yu@Sun.COM 		SOCKET_TIMER_CANCEL(so);
12268348SEric.Yu@Sun.COM 		/*
12278348SEric.Yu@Sun.COM 		 * so_notify_data will release the lock
12288348SEric.Yu@Sun.COM 		 */
12298348SEric.Yu@Sun.COM 		so_notify_data(so, so->so_rcv_queued);
12308348SEric.Yu@Sun.COM 
12318348SEric.Yu@Sun.COM 		if (force_pushp != NULL)
12328348SEric.Yu@Sun.COM 			*force_pushp = B_TRUE;
12338348SEric.Yu@Sun.COM 		goto done;
12348348SEric.Yu@Sun.COM 	} else if (so->so_rcv_timer_tid == 0) {
12358348SEric.Yu@Sun.COM 		/* Make sure the recv push timer is running */
12368348SEric.Yu@Sun.COM 		SOCKET_TIMER_START(so);
12378348SEric.Yu@Sun.COM 	}
12388348SEric.Yu@Sun.COM 
12398348SEric.Yu@Sun.COM done_unlock:
12408348SEric.Yu@Sun.COM 	mutex_exit(&so->so_lock);
12418348SEric.Yu@Sun.COM done:
12428348SEric.Yu@Sun.COM 	return (space_left);
12438348SEric.Yu@Sun.COM }
12448348SEric.Yu@Sun.COM 
12458348SEric.Yu@Sun.COM /*
12468348SEric.Yu@Sun.COM  * Set the offset of where the oob data is relative to the bytes in
12478348SEric.Yu@Sun.COM  * queued. Also generate SIGURG
12488348SEric.Yu@Sun.COM  */
12498348SEric.Yu@Sun.COM void
12508348SEric.Yu@Sun.COM so_signal_oob(sock_upper_handle_t sock_handle, ssize_t offset)
12518348SEric.Yu@Sun.COM {
12528348SEric.Yu@Sun.COM 	struct sonode *so;
12538348SEric.Yu@Sun.COM 
12548348SEric.Yu@Sun.COM 	ASSERT(offset >= 0);
12558348SEric.Yu@Sun.COM 	so = (struct sonode *)sock_handle;
12568348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
12578348SEric.Yu@Sun.COM 	SOD_UIOAFINI(so->so_direct);
12588348SEric.Yu@Sun.COM 
12598348SEric.Yu@Sun.COM 	/*
12608348SEric.Yu@Sun.COM 	 * New urgent data on the way so forget about any old
12618348SEric.Yu@Sun.COM 	 * urgent data.
12628348SEric.Yu@Sun.COM 	 */
12638348SEric.Yu@Sun.COM 	so->so_state &= ~(SS_HAVEOOBDATA|SS_HADOOBDATA);
12648348SEric.Yu@Sun.COM 
12658348SEric.Yu@Sun.COM 	/*
12668348SEric.Yu@Sun.COM 	 * Record that urgent data is pending.
12678348SEric.Yu@Sun.COM 	 */
12688348SEric.Yu@Sun.COM 	so->so_state |= SS_OOBPEND;
12698348SEric.Yu@Sun.COM 
12708348SEric.Yu@Sun.COM 	if (so->so_oobmsg != NULL) {
12718348SEric.Yu@Sun.COM 		dprintso(so, 1, ("sock: discarding old oob\n"));
12728348SEric.Yu@Sun.COM 		freemsg(so->so_oobmsg);
12738348SEric.Yu@Sun.COM 		so->so_oobmsg = NULL;
12748348SEric.Yu@Sun.COM 	}
12758348SEric.Yu@Sun.COM 
12768348SEric.Yu@Sun.COM 	/*
12778348SEric.Yu@Sun.COM 	 * set the offset where the urgent byte is
12788348SEric.Yu@Sun.COM 	 */
12798348SEric.Yu@Sun.COM 	so->so_oobmark = so->so_rcv_queued + offset;
12808348SEric.Yu@Sun.COM 	if (so->so_oobmark == 0)
12818348SEric.Yu@Sun.COM 		so->so_state |= SS_RCVATMARK;
12828348SEric.Yu@Sun.COM 	else
12838348SEric.Yu@Sun.COM 		so->so_state &= ~SS_RCVATMARK;
12848348SEric.Yu@Sun.COM 
12858348SEric.Yu@Sun.COM 	so_notify_oobsig(so);
12868348SEric.Yu@Sun.COM }
12878348SEric.Yu@Sun.COM 
12888348SEric.Yu@Sun.COM /*
12898348SEric.Yu@Sun.COM  * Queue the OOB byte
12908348SEric.Yu@Sun.COM  */
12918348SEric.Yu@Sun.COM static void
12928348SEric.Yu@Sun.COM so_queue_oob(sock_upper_handle_t sock_handle, mblk_t *mp, size_t len)
12938348SEric.Yu@Sun.COM {
12948348SEric.Yu@Sun.COM 	struct sonode *so;
12958348SEric.Yu@Sun.COM 
12968348SEric.Yu@Sun.COM 	so = (struct sonode *)sock_handle;
12978348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
12988348SEric.Yu@Sun.COM 	SOD_UIOAFINI(so->so_direct);
12998348SEric.Yu@Sun.COM 
13008348SEric.Yu@Sun.COM 	ASSERT(mp != NULL);
13018348SEric.Yu@Sun.COM 	if (!IS_SO_OOB_INLINE(so)) {
13028348SEric.Yu@Sun.COM 		so->so_oobmsg = mp;
13038348SEric.Yu@Sun.COM 		so->so_state |= SS_HAVEOOBDATA;
13048348SEric.Yu@Sun.COM 	} else {
13058348SEric.Yu@Sun.COM 		so_enqueue_msg(so, mp, len);
13068348SEric.Yu@Sun.COM 	}
13078348SEric.Yu@Sun.COM 
13088348SEric.Yu@Sun.COM 	so_notify_oobdata(so, IS_SO_OOB_INLINE(so));
13098348SEric.Yu@Sun.COM }
13108348SEric.Yu@Sun.COM 
13118348SEric.Yu@Sun.COM int
13128348SEric.Yu@Sun.COM so_close(struct sonode *so, int flag, struct cred *cr)
13138348SEric.Yu@Sun.COM {
13148348SEric.Yu@Sun.COM 	int error;
13158348SEric.Yu@Sun.COM 
13168348SEric.Yu@Sun.COM 	error = (*so->so_downcalls->sd_close)(so->so_proto_handle, flag, cr);
13178348SEric.Yu@Sun.COM 
13188348SEric.Yu@Sun.COM 	/*
13198348SEric.Yu@Sun.COM 	 * At this point there will be no more upcalls from the protocol
13208348SEric.Yu@Sun.COM 	 */
13218348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
13228399SRao.Shoaib@Sun.COM 
13238399SRao.Shoaib@Sun.COM 	ASSERT(so_verify_oobstate(so));
13248399SRao.Shoaib@Sun.COM 
13258348SEric.Yu@Sun.COM 	so_rcv_flush(so);
13268348SEric.Yu@Sun.COM 	mutex_exit(&so->so_lock);
13278348SEric.Yu@Sun.COM 
13288348SEric.Yu@Sun.COM 	return (error);
13298348SEric.Yu@Sun.COM }
13308348SEric.Yu@Sun.COM 
13318348SEric.Yu@Sun.COM void
13328348SEric.Yu@Sun.COM so_zcopy_notify(sock_upper_handle_t sock_handle)
13338348SEric.Yu@Sun.COM {
13348348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
13358348SEric.Yu@Sun.COM 
13368348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
13378348SEric.Yu@Sun.COM 	so->so_copyflag |= STZCNOTIFY;
13388348SEric.Yu@Sun.COM 	cv_broadcast(&so->so_copy_cv);
13398348SEric.Yu@Sun.COM 	mutex_exit(&so->so_lock);
13408348SEric.Yu@Sun.COM }
13418348SEric.Yu@Sun.COM 
13428348SEric.Yu@Sun.COM void
13438348SEric.Yu@Sun.COM so_set_error(sock_upper_handle_t sock_handle, int error)
13448348SEric.Yu@Sun.COM {
13458348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
13468348SEric.Yu@Sun.COM 
13478348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
13488348SEric.Yu@Sun.COM 
13498348SEric.Yu@Sun.COM 	soseterror(so, error);
13508348SEric.Yu@Sun.COM 
13518348SEric.Yu@Sun.COM 	so_notify_error(so);
13528348SEric.Yu@Sun.COM }
13538348SEric.Yu@Sun.COM 
13548348SEric.Yu@Sun.COM /*
13558348SEric.Yu@Sun.COM  * so_recvmsg - read data from the socket
13568348SEric.Yu@Sun.COM  *
13578348SEric.Yu@Sun.COM  * There are two ways of obtaining data; either we ask the protocol to
13588348SEric.Yu@Sun.COM  * copy directly into the supplied buffer, or we copy data from the
13598348SEric.Yu@Sun.COM  * sonode's receive queue. The decision which one to use depends on
13608348SEric.Yu@Sun.COM  * whether the protocol has a sd_recv_uio down call.
13618348SEric.Yu@Sun.COM  */
13628348SEric.Yu@Sun.COM int
13638348SEric.Yu@Sun.COM so_recvmsg(struct sonode *so, struct nmsghdr *msg, struct uio *uiop,
13648348SEric.Yu@Sun.COM     struct cred *cr)
13658348SEric.Yu@Sun.COM {
13668348SEric.Yu@Sun.COM 	rval_t 		rval;
13678348SEric.Yu@Sun.COM 	int 		flags = 0;
13688348SEric.Yu@Sun.COM 	t_uscalar_t	controllen, namelen;
13698348SEric.Yu@Sun.COM 	int 		error = 0;
13708348SEric.Yu@Sun.COM 	int ret;
13718348SEric.Yu@Sun.COM 	mblk_t		*mctlp = NULL;
13728348SEric.Yu@Sun.COM 	union T_primitives *tpr;
13738348SEric.Yu@Sun.COM 	void		*control;
13748348SEric.Yu@Sun.COM 	ssize_t		saved_resid;
13758348SEric.Yu@Sun.COM 	struct uio	*suiop;
13768348SEric.Yu@Sun.COM 
13778348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_RECVMSG(so, msg, uiop, cr));
13788348SEric.Yu@Sun.COM 
13798348SEric.Yu@Sun.COM 	if ((so->so_state & (SS_ISCONNECTED|SS_CANTRCVMORE)) == 0 &&
13808348SEric.Yu@Sun.COM 	    (so->so_mode & SM_CONNREQUIRED)) {
13818348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
13828348SEric.Yu@Sun.COM 		return (ENOTCONN);
13838348SEric.Yu@Sun.COM 	}
13848348SEric.Yu@Sun.COM 
13858348SEric.Yu@Sun.COM 	if (msg->msg_flags & MSG_PEEK)
13868348SEric.Yu@Sun.COM 		msg->msg_flags &= ~MSG_WAITALL;
13878348SEric.Yu@Sun.COM 
13888348SEric.Yu@Sun.COM 	if (so->so_mode & SM_ATOMIC)
13898348SEric.Yu@Sun.COM 		msg->msg_flags |= MSG_TRUNC;
13908348SEric.Yu@Sun.COM 
13918348SEric.Yu@Sun.COM 	if (msg->msg_flags & MSG_OOB) {
13928348SEric.Yu@Sun.COM 		if ((so->so_mode & SM_EXDATA) == 0) {
13938348SEric.Yu@Sun.COM 			error = EOPNOTSUPP;
13948348SEric.Yu@Sun.COM 		} else if (so->so_downcalls->sd_recv_uio != NULL) {
13958348SEric.Yu@Sun.COM 			error = (*so->so_downcalls->sd_recv_uio)
13968348SEric.Yu@Sun.COM 			    (so->so_proto_handle, uiop, msg, cr);
13978348SEric.Yu@Sun.COM 		} else {
13988348SEric.Yu@Sun.COM 			error = sorecvoob(so, msg, uiop, msg->msg_flags,
13998348SEric.Yu@Sun.COM 			    IS_SO_OOB_INLINE(so));
14008348SEric.Yu@Sun.COM 		}
14018348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
14028348SEric.Yu@Sun.COM 		return (error);
14038348SEric.Yu@Sun.COM 	}
14048348SEric.Yu@Sun.COM 
14058348SEric.Yu@Sun.COM 	/*
14068348SEric.Yu@Sun.COM 	 * If the protocol has the recv down call, then pass the request
14078348SEric.Yu@Sun.COM 	 * down.
14088348SEric.Yu@Sun.COM 	 */
14098348SEric.Yu@Sun.COM 	if (so->so_downcalls->sd_recv_uio != NULL) {
14108348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_recv_uio)
14118348SEric.Yu@Sun.COM 		    (so->so_proto_handle, uiop, msg, cr);
14128348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
14138348SEric.Yu@Sun.COM 		return (error);
14148348SEric.Yu@Sun.COM 	}
14158348SEric.Yu@Sun.COM 
14168348SEric.Yu@Sun.COM 	/*
14178348SEric.Yu@Sun.COM 	 * Reading data from the socket buffer
14188348SEric.Yu@Sun.COM 	 */
14198348SEric.Yu@Sun.COM 	flags = msg->msg_flags;
14208348SEric.Yu@Sun.COM 	msg->msg_flags = 0;
14218348SEric.Yu@Sun.COM 
14228348SEric.Yu@Sun.COM 	/*
14238348SEric.Yu@Sun.COM 	 * Set msg_controllen and msg_namelen to zero here to make it
14248348SEric.Yu@Sun.COM 	 * simpler in the cases that no control or name is returned.
14258348SEric.Yu@Sun.COM 	 */
14268348SEric.Yu@Sun.COM 	controllen = msg->msg_controllen;
14278348SEric.Yu@Sun.COM 	namelen = msg->msg_namelen;
14288348SEric.Yu@Sun.COM 	msg->msg_controllen = 0;
14298348SEric.Yu@Sun.COM 	msg->msg_namelen = 0;
14308348SEric.Yu@Sun.COM 
14318348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
14328348SEric.Yu@Sun.COM 	/* Set SOREADLOCKED */
14338348SEric.Yu@Sun.COM 	error = so_lock_read_intr(so,
14348348SEric.Yu@Sun.COM 	    uiop->uio_fmode | ((flags & MSG_DONTWAIT) ? FNONBLOCK : 0));
14358348SEric.Yu@Sun.COM 	mutex_exit(&so->so_lock);
14368348SEric.Yu@Sun.COM 	if (error) {
14378348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
14388348SEric.Yu@Sun.COM 		return (error);
14398348SEric.Yu@Sun.COM 	}
14408348SEric.Yu@Sun.COM 
14418348SEric.Yu@Sun.COM 	suiop = sod_rcv_init(so, flags, &uiop);
14428348SEric.Yu@Sun.COM retry:
14438348SEric.Yu@Sun.COM 	saved_resid = uiop->uio_resid;
14448348SEric.Yu@Sun.COM 	error = so_dequeue_msg(so, &mctlp, uiop, &rval, flags);
14458348SEric.Yu@Sun.COM 	if (error != 0) {
14468348SEric.Yu@Sun.COM 		goto out;
14478348SEric.Yu@Sun.COM 	}
14488348SEric.Yu@Sun.COM 	/*
14498348SEric.Yu@Sun.COM 	 * For datagrams the MOREDATA flag is used to set MSG_TRUNC.
14508348SEric.Yu@Sun.COM 	 * For non-datagrams MOREDATA is used to set MSG_EOR.
14518348SEric.Yu@Sun.COM 	 */
14528348SEric.Yu@Sun.COM 	ASSERT(!(rval.r_val1 & MORECTL));
14538348SEric.Yu@Sun.COM 	if ((rval.r_val1 & MOREDATA) && (so->so_mode & SM_ATOMIC))
14548348SEric.Yu@Sun.COM 		msg->msg_flags |= MSG_TRUNC;
14558348SEric.Yu@Sun.COM 	if (mctlp == NULL) {
14568348SEric.Yu@Sun.COM 		dprintso(so, 1, ("so_recvmsg: got M_DATA\n"));
14578348SEric.Yu@Sun.COM 
14588348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
14598348SEric.Yu@Sun.COM 		/* Set MSG_EOR based on MOREDATA */
14608348SEric.Yu@Sun.COM 		if (!(rval.r_val1 & MOREDATA)) {
14618348SEric.Yu@Sun.COM 			if (so->so_state & SS_SAVEDEOR) {
14628348SEric.Yu@Sun.COM 				msg->msg_flags |= MSG_EOR;
14638348SEric.Yu@Sun.COM 				so->so_state &= ~SS_SAVEDEOR;
14648348SEric.Yu@Sun.COM 			}
14658348SEric.Yu@Sun.COM 		}
14668348SEric.Yu@Sun.COM 		/*
14678348SEric.Yu@Sun.COM 		 * If some data was received (i.e. not EOF) and the
14688348SEric.Yu@Sun.COM 		 * read/recv* has not been satisfied wait for some more.
14698348SEric.Yu@Sun.COM 		 */
14708348SEric.Yu@Sun.COM 		if ((flags & MSG_WAITALL) && !(msg->msg_flags & MSG_EOR) &&
14718348SEric.Yu@Sun.COM 		    uiop->uio_resid != saved_resid && uiop->uio_resid > 0) {
14728348SEric.Yu@Sun.COM 			mutex_exit(&so->so_lock);
14738348SEric.Yu@Sun.COM 			goto retry;
14748348SEric.Yu@Sun.COM 		}
14758348SEric.Yu@Sun.COM 
14768348SEric.Yu@Sun.COM 		goto out_locked;
14778348SEric.Yu@Sun.COM 	}
14788348SEric.Yu@Sun.COM 	/* strsock_proto has already verified length and alignment */
14798348SEric.Yu@Sun.COM 	tpr = (union T_primitives *)mctlp->b_rptr;
14808348SEric.Yu@Sun.COM 	dprintso(so, 1, ("so_recvmsg: type %d\n", tpr->type));
14818348SEric.Yu@Sun.COM 	switch (tpr->type) {
14828348SEric.Yu@Sun.COM 	case T_DATA_IND: {
14838348SEric.Yu@Sun.COM 		/*
14848348SEric.Yu@Sun.COM 		 * Set msg_flags to MSG_EOR based on
14858348SEric.Yu@Sun.COM 		 * MORE_flag and MOREDATA.
14868348SEric.Yu@Sun.COM 		 */
14878348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
14888348SEric.Yu@Sun.COM 		so->so_state &= ~SS_SAVEDEOR;
14898348SEric.Yu@Sun.COM 		if (!(tpr->data_ind.MORE_flag & 1)) {
14908348SEric.Yu@Sun.COM 			if (!(rval.r_val1 & MOREDATA))
14918348SEric.Yu@Sun.COM 				msg->msg_flags |= MSG_EOR;
14928348SEric.Yu@Sun.COM 			else
14938348SEric.Yu@Sun.COM 				so->so_state |= SS_SAVEDEOR;
14948348SEric.Yu@Sun.COM 		}
14958348SEric.Yu@Sun.COM 		freemsg(mctlp);
14968348SEric.Yu@Sun.COM 		/*
14978348SEric.Yu@Sun.COM 		 * If some data was received (i.e. not EOF) and the
14988348SEric.Yu@Sun.COM 		 * read/recv* has not been satisfied wait for some more.
14998348SEric.Yu@Sun.COM 		 */
15008348SEric.Yu@Sun.COM 		if ((flags & MSG_WAITALL) && !(msg->msg_flags & MSG_EOR) &&
15018348SEric.Yu@Sun.COM 		    uiop->uio_resid != saved_resid && uiop->uio_resid > 0) {
15028348SEric.Yu@Sun.COM 			mutex_exit(&so->so_lock);
15038348SEric.Yu@Sun.COM 			goto retry;
15048348SEric.Yu@Sun.COM 		}
15058348SEric.Yu@Sun.COM 		goto out_locked;
15068348SEric.Yu@Sun.COM 	}
15078348SEric.Yu@Sun.COM 	case T_UNITDATA_IND: {
15088348SEric.Yu@Sun.COM 		void *addr;
15098348SEric.Yu@Sun.COM 		t_uscalar_t addrlen;
15108348SEric.Yu@Sun.COM 		void *abuf;
15118348SEric.Yu@Sun.COM 		t_uscalar_t optlen;
15128348SEric.Yu@Sun.COM 		void *opt;
15138348SEric.Yu@Sun.COM 
15148348SEric.Yu@Sun.COM 		if (namelen != 0) {
15158348SEric.Yu@Sun.COM 			/* Caller wants source address */
15168348SEric.Yu@Sun.COM 			addrlen = tpr->unitdata_ind.SRC_length;
15178348SEric.Yu@Sun.COM 			addr = sogetoff(mctlp, tpr->unitdata_ind.SRC_offset,
15188348SEric.Yu@Sun.COM 			    addrlen, 1);
15198348SEric.Yu@Sun.COM 			if (addr == NULL) {
15208348SEric.Yu@Sun.COM 				freemsg(mctlp);
15218348SEric.Yu@Sun.COM 				error = EPROTO;
15228348SEric.Yu@Sun.COM 				eprintsoline(so, error);
15238348SEric.Yu@Sun.COM 				goto out;
15248348SEric.Yu@Sun.COM 			}
15258348SEric.Yu@Sun.COM 			ASSERT(so->so_family != AF_UNIX);
15268348SEric.Yu@Sun.COM 		}
15278348SEric.Yu@Sun.COM 		optlen = tpr->unitdata_ind.OPT_length;
15288348SEric.Yu@Sun.COM 		if (optlen != 0) {
15298348SEric.Yu@Sun.COM 			t_uscalar_t ncontrollen;
15308348SEric.Yu@Sun.COM 
15318348SEric.Yu@Sun.COM 			/*
15328348SEric.Yu@Sun.COM 			 * Extract any source address option.
15338348SEric.Yu@Sun.COM 			 * Determine how large cmsg buffer is needed.
15348348SEric.Yu@Sun.COM 			 */
15358348SEric.Yu@Sun.COM 			opt = sogetoff(mctlp, tpr->unitdata_ind.OPT_offset,
15368348SEric.Yu@Sun.COM 			    optlen, __TPI_ALIGN_SIZE);
15378348SEric.Yu@Sun.COM 
15388348SEric.Yu@Sun.COM 			if (opt == NULL) {
15398348SEric.Yu@Sun.COM 				freemsg(mctlp);
15408348SEric.Yu@Sun.COM 				error = EPROTO;
15418348SEric.Yu@Sun.COM 				eprintsoline(so, error);
15428348SEric.Yu@Sun.COM 				goto out;
15438348SEric.Yu@Sun.COM 			}
15448348SEric.Yu@Sun.COM 			if (so->so_family == AF_UNIX)
15458348SEric.Yu@Sun.COM 				so_getopt_srcaddr(opt, optlen, &addr, &addrlen);
15468348SEric.Yu@Sun.COM 			ncontrollen = so_cmsglen(mctlp, opt, optlen,
15478348SEric.Yu@Sun.COM 			    !(flags & MSG_XPG4_2));
15488348SEric.Yu@Sun.COM 			if (controllen != 0)
15498348SEric.Yu@Sun.COM 				controllen = ncontrollen;
15508348SEric.Yu@Sun.COM 			else if (ncontrollen != 0)
15518348SEric.Yu@Sun.COM 				msg->msg_flags |= MSG_CTRUNC;
15528348SEric.Yu@Sun.COM 		} else {
15538348SEric.Yu@Sun.COM 			controllen = 0;
15548348SEric.Yu@Sun.COM 		}
15558348SEric.Yu@Sun.COM 
15568348SEric.Yu@Sun.COM 		if (namelen != 0) {
15578348SEric.Yu@Sun.COM 			/*
15588348SEric.Yu@Sun.COM 			 * Return address to caller.
15598348SEric.Yu@Sun.COM 			 * Caller handles truncation if length
15608348SEric.Yu@Sun.COM 			 * exceeds msg_namelen.
15618348SEric.Yu@Sun.COM 			 * NOTE: AF_UNIX NUL termination is ensured by
15628348SEric.Yu@Sun.COM 			 * the sender's copyin_name().
15638348SEric.Yu@Sun.COM 			 */
15648348SEric.Yu@Sun.COM 			abuf = kmem_alloc(addrlen, KM_SLEEP);
15658348SEric.Yu@Sun.COM 
15668348SEric.Yu@Sun.COM 			bcopy(addr, abuf, addrlen);
15678348SEric.Yu@Sun.COM 			msg->msg_name = abuf;
15688348SEric.Yu@Sun.COM 			msg->msg_namelen = addrlen;
15698348SEric.Yu@Sun.COM 		}
15708348SEric.Yu@Sun.COM 
15718348SEric.Yu@Sun.COM 		if (controllen != 0) {
15728348SEric.Yu@Sun.COM 			/*
15738348SEric.Yu@Sun.COM 			 * Return control msg to caller.
15748348SEric.Yu@Sun.COM 			 * Caller handles truncation if length
15758348SEric.Yu@Sun.COM 			 * exceeds msg_controllen.
15768348SEric.Yu@Sun.COM 			 */
15778348SEric.Yu@Sun.COM 			control = kmem_zalloc(controllen, KM_SLEEP);
15788348SEric.Yu@Sun.COM 
15798348SEric.Yu@Sun.COM 			error = so_opt2cmsg(mctlp, opt, optlen,
15808348SEric.Yu@Sun.COM 			    !(flags & MSG_XPG4_2), control, controllen);
15818348SEric.Yu@Sun.COM 			if (error) {
15828348SEric.Yu@Sun.COM 				freemsg(mctlp);
15838348SEric.Yu@Sun.COM 				if (msg->msg_namelen != 0)
15848348SEric.Yu@Sun.COM 					kmem_free(msg->msg_name,
15858348SEric.Yu@Sun.COM 					    msg->msg_namelen);
15868348SEric.Yu@Sun.COM 				kmem_free(control, controllen);
15878348SEric.Yu@Sun.COM 				eprintsoline(so, error);
15888348SEric.Yu@Sun.COM 				goto out;
15898348SEric.Yu@Sun.COM 			}
15908348SEric.Yu@Sun.COM 			msg->msg_control = control;
15918348SEric.Yu@Sun.COM 			msg->msg_controllen = controllen;
15928348SEric.Yu@Sun.COM 		}
15938348SEric.Yu@Sun.COM 
15948348SEric.Yu@Sun.COM 		freemsg(mctlp);
15958348SEric.Yu@Sun.COM 		goto out;
15968348SEric.Yu@Sun.COM 	}
15978348SEric.Yu@Sun.COM 	case T_OPTDATA_IND: {
15988348SEric.Yu@Sun.COM 		struct T_optdata_req *tdr;
15998348SEric.Yu@Sun.COM 		void *opt;
16008348SEric.Yu@Sun.COM 		t_uscalar_t optlen;
16018348SEric.Yu@Sun.COM 
16028348SEric.Yu@Sun.COM 		tdr = (struct T_optdata_req *)mctlp->b_rptr;
16038348SEric.Yu@Sun.COM 		optlen = tdr->OPT_length;
16048348SEric.Yu@Sun.COM 		if (optlen != 0) {
16058348SEric.Yu@Sun.COM 			t_uscalar_t ncontrollen;
16068348SEric.Yu@Sun.COM 			/*
16078348SEric.Yu@Sun.COM 			 * Determine how large cmsg buffer is needed.
16088348SEric.Yu@Sun.COM 			 */
16098348SEric.Yu@Sun.COM 			opt = sogetoff(mctlp,
16108348SEric.Yu@Sun.COM 			    tpr->optdata_ind.OPT_offset, optlen,
16118348SEric.Yu@Sun.COM 			    __TPI_ALIGN_SIZE);
16128348SEric.Yu@Sun.COM 
16138348SEric.Yu@Sun.COM 			if (opt == NULL) {
16148348SEric.Yu@Sun.COM 				freemsg(mctlp);
16158348SEric.Yu@Sun.COM 				error = EPROTO;
16168348SEric.Yu@Sun.COM 				eprintsoline(so, error);
16178348SEric.Yu@Sun.COM 				goto out;
16188348SEric.Yu@Sun.COM 			}
16198348SEric.Yu@Sun.COM 
16208348SEric.Yu@Sun.COM 			ncontrollen = so_cmsglen(mctlp, opt, optlen,
16218348SEric.Yu@Sun.COM 			    !(flags & MSG_XPG4_2));
16228348SEric.Yu@Sun.COM 			if (controllen != 0)
16238348SEric.Yu@Sun.COM 				controllen = ncontrollen;
16248348SEric.Yu@Sun.COM 			else if (ncontrollen != 0)
16258348SEric.Yu@Sun.COM 				msg->msg_flags |= MSG_CTRUNC;
16268348SEric.Yu@Sun.COM 		} else {
16278348SEric.Yu@Sun.COM 			controllen = 0;
16288348SEric.Yu@Sun.COM 		}
16298348SEric.Yu@Sun.COM 
16308348SEric.Yu@Sun.COM 		if (controllen != 0) {
16318348SEric.Yu@Sun.COM 			/*
16328348SEric.Yu@Sun.COM 			 * Return control msg to caller.
16338348SEric.Yu@Sun.COM 			 * Caller handles truncation if length
16348348SEric.Yu@Sun.COM 			 * exceeds msg_controllen.
16358348SEric.Yu@Sun.COM 			 */
16368348SEric.Yu@Sun.COM 			control = kmem_zalloc(controllen, KM_SLEEP);
16378348SEric.Yu@Sun.COM 
16388348SEric.Yu@Sun.COM 			error = so_opt2cmsg(mctlp, opt, optlen,
16398348SEric.Yu@Sun.COM 			    !(flags & MSG_XPG4_2), control, controllen);
16408348SEric.Yu@Sun.COM 			if (error) {
16418348SEric.Yu@Sun.COM 				freemsg(mctlp);
16428348SEric.Yu@Sun.COM 				kmem_free(control, controllen);
16438348SEric.Yu@Sun.COM 				eprintsoline(so, error);
16448348SEric.Yu@Sun.COM 				goto out;
16458348SEric.Yu@Sun.COM 			}
16468348SEric.Yu@Sun.COM 			msg->msg_control = control;
16478348SEric.Yu@Sun.COM 			msg->msg_controllen = controllen;
16488348SEric.Yu@Sun.COM 		}
16498348SEric.Yu@Sun.COM 
16508348SEric.Yu@Sun.COM 		/*
16518348SEric.Yu@Sun.COM 		 * Set msg_flags to MSG_EOR based on
16528348SEric.Yu@Sun.COM 		 * DATA_flag and MOREDATA.
16538348SEric.Yu@Sun.COM 		 */
16548348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
16558348SEric.Yu@Sun.COM 		so->so_state &= ~SS_SAVEDEOR;
16568348SEric.Yu@Sun.COM 		if (!(tpr->data_ind.MORE_flag & 1)) {
16578348SEric.Yu@Sun.COM 			if (!(rval.r_val1 & MOREDATA))
16588348SEric.Yu@Sun.COM 				msg->msg_flags |= MSG_EOR;
16598348SEric.Yu@Sun.COM 			else
16608348SEric.Yu@Sun.COM 				so->so_state |= SS_SAVEDEOR;
16618348SEric.Yu@Sun.COM 		}
16628348SEric.Yu@Sun.COM 		freemsg(mctlp);
16638348SEric.Yu@Sun.COM 		/*
16648348SEric.Yu@Sun.COM 		 * If some data was received (i.e. not EOF) and the
16658348SEric.Yu@Sun.COM 		 * read/recv* has not been satisfied wait for some more.
16668348SEric.Yu@Sun.COM 		 * Not possible to wait if control info was received.
16678348SEric.Yu@Sun.COM 		 */
16688348SEric.Yu@Sun.COM 		if ((flags & MSG_WAITALL) && !(msg->msg_flags & MSG_EOR) &&
16698348SEric.Yu@Sun.COM 		    controllen == 0 &&
16708348SEric.Yu@Sun.COM 		    uiop->uio_resid != saved_resid && uiop->uio_resid > 0) {
16718348SEric.Yu@Sun.COM 			mutex_exit(&so->so_lock);
16728348SEric.Yu@Sun.COM 			goto retry;
16738348SEric.Yu@Sun.COM 		}
16748348SEric.Yu@Sun.COM 		goto out_locked;
16758348SEric.Yu@Sun.COM 	}
16768348SEric.Yu@Sun.COM 	default:
16778348SEric.Yu@Sun.COM 		cmn_err(CE_CONT, "so_recvmsg bad type %x \n",
16788348SEric.Yu@Sun.COM 		    tpr->type);
16798348SEric.Yu@Sun.COM 		freemsg(mctlp);
16808348SEric.Yu@Sun.COM 		error = EPROTO;
16818348SEric.Yu@Sun.COM 		ASSERT(0);
16828348SEric.Yu@Sun.COM 	}
16838348SEric.Yu@Sun.COM out:
16848348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
16858348SEric.Yu@Sun.COM out_locked:
16868348SEric.Yu@Sun.COM 	/* The sod_lockp pointers to the sonode so_lock */
16878348SEric.Yu@Sun.COM 	ret = sod_rcv_done(so, suiop, uiop);
16888348SEric.Yu@Sun.COM 	if (ret != 0 && error == 0)
16898348SEric.Yu@Sun.COM 		error = ret;
16908348SEric.Yu@Sun.COM 
16918348SEric.Yu@Sun.COM 	so_unlock_read(so);	/* Clear SOREADLOCKED */
16928348SEric.Yu@Sun.COM 	mutex_exit(&so->so_lock);
16938348SEric.Yu@Sun.COM 
16948348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
16958348SEric.Yu@Sun.COM 
16968348SEric.Yu@Sun.COM 	return (error);
16978348SEric.Yu@Sun.COM }
16988348SEric.Yu@Sun.COM 
/*
 * Socket operations vector built from the so_* entry points.
 *
 * The initializer is positional, so the entries must stay in the same
 * order as the members of sonodeops_t; the trailing comment on each
 * line names the member that entry fills.
 */
sonodeops_t so_sonodeops = {
	so_init,		/* sop_init	*/
	so_accept,		/* sop_accept   */
	so_bind,		/* sop_bind	*/
	so_listen,		/* sop_listen   */
	so_connect,		/* sop_connect  */
	so_recvmsg,		/* sop_recvmsg  */
	so_sendmsg,		/* sop_sendmsg  */
	so_sendmblk,		/* sop_sendmblk */
	so_getpeername,		/* sop_getpeername */
	so_getsockname,		/* sop_getsockname */
	so_shutdown,		/* sop_shutdown */
	so_getsockopt,		/* sop_getsockopt */
	so_setsockopt,		/* sop_setsockopt */
	so_ioctl,		/* sop_ioctl    */
	so_poll,		/* sop_poll	*/
	so_close,		/* sop_close */
};
17178348SEric.Yu@Sun.COM 
/*
 * Upcall vector of type sock_upcalls_t, populated with the so_* upcall
 * handlers.
 *
 * The initializer is positional, so the entries must stay in the same
 * order as the members of sock_upcalls_t.
 */
sock_upcalls_t so_upcalls = {
	so_newconn,
	so_connected,
	so_disconnected,
	so_opctl,
	so_queue_msg,
	so_set_prop,
	so_txq_full,
	so_signal_oob,
	so_zcopy_notify,
	so_set_error
};
1730