xref: /onnv-gate/usr/src/uts/common/fs/sockfs/sockcommon_sops.c (revision 8399:b13f9ee6bce2)
18348SEric.Yu@Sun.COM /*
28348SEric.Yu@Sun.COM  * CDDL HEADER START
38348SEric.Yu@Sun.COM  *
48348SEric.Yu@Sun.COM  * The contents of this file are subject to the terms of the
58348SEric.Yu@Sun.COM  * Common Development and Distribution License (the "License").
68348SEric.Yu@Sun.COM  * You may not use this file except in compliance with the License.
78348SEric.Yu@Sun.COM  *
88348SEric.Yu@Sun.COM  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
98348SEric.Yu@Sun.COM  * or http://www.opensolaris.org/os/licensing.
108348SEric.Yu@Sun.COM  * See the License for the specific language governing permissions
118348SEric.Yu@Sun.COM  * and limitations under the License.
128348SEric.Yu@Sun.COM  *
138348SEric.Yu@Sun.COM  * When distributing Covered Code, include this CDDL HEADER in each
148348SEric.Yu@Sun.COM  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
158348SEric.Yu@Sun.COM  * If applicable, add the following below this CDDL HEADER, with the
168348SEric.Yu@Sun.COM  * fields enclosed by brackets "[]" replaced with your own identifying
178348SEric.Yu@Sun.COM  * information: Portions Copyright [yyyy] [name of copyright owner]
188348SEric.Yu@Sun.COM  *
198348SEric.Yu@Sun.COM  * CDDL HEADER END
208348SEric.Yu@Sun.COM  */
218348SEric.Yu@Sun.COM 
228348SEric.Yu@Sun.COM /*
238348SEric.Yu@Sun.COM  * Copyright 2008 Sun Microsystems, Inc.  All rights reserved.
248348SEric.Yu@Sun.COM  * Use is subject to license terms.
258348SEric.Yu@Sun.COM  */
268348SEric.Yu@Sun.COM 
278348SEric.Yu@Sun.COM #pragma ident	"@(#)sockcommon_sops.c	1.1	07/06/14 SMI"
288348SEric.Yu@Sun.COM 
298348SEric.Yu@Sun.COM #include <sys/types.h>
308348SEric.Yu@Sun.COM #include <sys/param.h>
318348SEric.Yu@Sun.COM #include <sys/systm.h>
328348SEric.Yu@Sun.COM #include <sys/sysmacros.h>
338348SEric.Yu@Sun.COM #include <sys/debug.h>
348348SEric.Yu@Sun.COM #include <sys/cmn_err.h>
358348SEric.Yu@Sun.COM 
368348SEric.Yu@Sun.COM #include <sys/stropts.h>
378348SEric.Yu@Sun.COM #include <sys/socket.h>
388348SEric.Yu@Sun.COM #include <sys/socketvar.h>
398348SEric.Yu@Sun.COM 
408348SEric.Yu@Sun.COM #define	_SUN_TPI_VERSION	2
418348SEric.Yu@Sun.COM #include <sys/tihdr.h>
428348SEric.Yu@Sun.COM #include <sys/sockio.h>
438348SEric.Yu@Sun.COM #include <sys/sodirect.h>
448348SEric.Yu@Sun.COM #include <sys/kmem_impl.h>
458348SEric.Yu@Sun.COM 
468348SEric.Yu@Sun.COM #include <sys/strsubr.h>
478348SEric.Yu@Sun.COM #include <sys/strsun.h>
488348SEric.Yu@Sun.COM #include <sys/ddi.h>
498348SEric.Yu@Sun.COM #include <netinet/in.h>
508348SEric.Yu@Sun.COM #include <inet/ip.h>
518348SEric.Yu@Sun.COM 
528348SEric.Yu@Sun.COM #include <fs/sockfs/sockcommon.h>
538348SEric.Yu@Sun.COM 
548348SEric.Yu@Sun.COM #include <sys/socket_proto.h>
558348SEric.Yu@Sun.COM 
568348SEric.Yu@Sun.COM #include <fs/sockfs/socktpi_impl.h>
578348SEric.Yu@Sun.COM #include <sys/tihdr.h>
588348SEric.Yu@Sun.COM #include <fs/sockfs/nl7c.h>
598348SEric.Yu@Sun.COM #include <inet/kssl/ksslapi.h>
608348SEric.Yu@Sun.COM 
618348SEric.Yu@Sun.COM 
628348SEric.Yu@Sun.COM extern int xnet_skip_checks;
638348SEric.Yu@Sun.COM extern int xnet_check_print;
648348SEric.Yu@Sun.COM 
658348SEric.Yu@Sun.COM static void so_queue_oob(sock_upper_handle_t, mblk_t *, size_t);
668348SEric.Yu@Sun.COM 
678348SEric.Yu@Sun.COM 
/*
 * accept() stub for sockets that cannot accept connections.
 * Ignores every argument and always fails with EOPNOTSUPP.
 */
/*ARGSUSED*/
int
so_accept_notsupp(struct sonode *lso, int fflag,
    struct cred *cr, struct sonode **nsop)
{
	return (EOPNOTSUPP);
}
758348SEric.Yu@Sun.COM 
/*
 * listen() stub for sockets that cannot listen.
 * Ignores every argument and always fails with EOPNOTSUPP.
 */
/*ARGSUSED*/
int
so_listen_notsupp(struct sonode *so, int backlog, struct cred *cr)
{
	return (EOPNOTSUPP);
}
828348SEric.Yu@Sun.COM 
/*
 * getsockname() stub for sockets without a local name.
 * Neither sa nor len is touched; the call always fails with EOPNOTSUPP.
 */
/*ARGSUSED*/
int
so_getsockname_notsupp(struct sonode *so, struct sockaddr *sa,
    socklen_t *len, struct cred *cr)
{
	return (EOPNOTSUPP);
}
908348SEric.Yu@Sun.COM 
918348SEric.Yu@Sun.COM /*ARGSUSED*/
928348SEric.Yu@Sun.COM int
938348SEric.Yu@Sun.COM so_getpeername_notsupp(struct sonode *so, struct sockaddr *addr,
948348SEric.Yu@Sun.COM     socklen_t *addrlen, boolean_t accept, struct cred *cr)
958348SEric.Yu@Sun.COM {
968348SEric.Yu@Sun.COM 	return (EOPNOTSUPP);
978348SEric.Yu@Sun.COM }
988348SEric.Yu@Sun.COM 
/*
 * shutdown() stub for sockets that cannot be shut down.
 * Ignores every argument and always fails with EOPNOTSUPP.
 */
/*ARGSUSED*/
int
so_shutdown_notsupp(struct sonode *so, int how, struct cred *cr)
{
	return (EOPNOTSUPP);
}
1058348SEric.Yu@Sun.COM 
1068348SEric.Yu@Sun.COM /*ARGSUSED*/
1078348SEric.Yu@Sun.COM int
1088348SEric.Yu@Sun.COM so_sendmblk_notsupp(struct sonode *so, struct msghdr *msg, int fflag,
1098348SEric.Yu@Sun.COM     struct cred *cr, mblk_t **mpp)
1108348SEric.Yu@Sun.COM {
1118348SEric.Yu@Sun.COM 	return (EOPNOTSUPP);
1128348SEric.Yu@Sun.COM }
1138348SEric.Yu@Sun.COM 
1148348SEric.Yu@Sun.COM /*
1158348SEric.Yu@Sun.COM  * Generic Socket Ops
1168348SEric.Yu@Sun.COM  */
1178348SEric.Yu@Sun.COM 
/*
 * Generic socket initialisation: a thin wrapper around
 * socket_init_common().  Note that the wrapped routine takes flags
 * before cr, the reverse of this function's parameter order.
 *
 * Returns whatever socket_init_common() returns.
 */
/* ARGSUSED */
int
so_init(struct sonode *so, struct sonode *pso, struct cred *cr, int flags)
{
	int rc;

	rc = socket_init_common(so, pso, flags, cr);
	return (rc);
}
1248348SEric.Yu@Sun.COM 
1258348SEric.Yu@Sun.COM int
1268348SEric.Yu@Sun.COM so_bind(struct sonode *so, struct sockaddr *name, socklen_t namelen,
1278348SEric.Yu@Sun.COM     int flags, struct cred *cr)
1288348SEric.Yu@Sun.COM {
1298348SEric.Yu@Sun.COM 	int error;
1308348SEric.Yu@Sun.COM 
1318348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_BIND(so, name, namelen, flags, cr));
1328348SEric.Yu@Sun.COM 
1338348SEric.Yu@Sun.COM 	ASSERT(flags == _SOBIND_XPG4_2 || flags == _SOBIND_SOCKBSD);
1348348SEric.Yu@Sun.COM 
1358348SEric.Yu@Sun.COM 	/* X/Open requires this check */
1368348SEric.Yu@Sun.COM 	if ((so->so_state & SS_CANTSENDMORE) && !xnet_skip_checks) {
1378348SEric.Yu@Sun.COM 		if (xnet_check_print) {
1388348SEric.Yu@Sun.COM 			printf("sockfs: X/Open bind state check "
1398348SEric.Yu@Sun.COM 			    "caused EINVAL\n");
1408348SEric.Yu@Sun.COM 		}
1418348SEric.Yu@Sun.COM 		error = EINVAL;
1428348SEric.Yu@Sun.COM 		goto done;
1438348SEric.Yu@Sun.COM 	}
1448348SEric.Yu@Sun.COM 
1458348SEric.Yu@Sun.COM 	/*
1468348SEric.Yu@Sun.COM 	 * a bind to a NULL address is interpreted as unbind. So just
1478348SEric.Yu@Sun.COM 	 * do the downcall.
1488348SEric.Yu@Sun.COM 	 */
1498348SEric.Yu@Sun.COM 	if (name == NULL)
1508348SEric.Yu@Sun.COM 		goto dobind;
1518348SEric.Yu@Sun.COM 
1528348SEric.Yu@Sun.COM 	switch (so->so_family) {
1538348SEric.Yu@Sun.COM 	case AF_INET:
1548348SEric.Yu@Sun.COM 		if ((size_t)namelen != sizeof (sin_t)) {
1558348SEric.Yu@Sun.COM 			error = name->sa_family != so->so_family ?
1568348SEric.Yu@Sun.COM 			    EAFNOSUPPORT : EINVAL;
1578348SEric.Yu@Sun.COM 			eprintsoline(so, error);
1588348SEric.Yu@Sun.COM 			goto done;
1598348SEric.Yu@Sun.COM 		}
1608348SEric.Yu@Sun.COM 
1618348SEric.Yu@Sun.COM 		if ((flags & _SOBIND_XPG4_2) &&
1628348SEric.Yu@Sun.COM 		    (name->sa_family != so->so_family)) {
1638348SEric.Yu@Sun.COM 			/*
1648348SEric.Yu@Sun.COM 			 * This check has to be made for X/Open
1658348SEric.Yu@Sun.COM 			 * sockets however application failures have
1668348SEric.Yu@Sun.COM 			 * been observed when it is applied to
1678348SEric.Yu@Sun.COM 			 * all sockets.
1688348SEric.Yu@Sun.COM 			 */
1698348SEric.Yu@Sun.COM 			error = EAFNOSUPPORT;
1708348SEric.Yu@Sun.COM 			eprintsoline(so, error);
1718348SEric.Yu@Sun.COM 			goto done;
1728348SEric.Yu@Sun.COM 		}
1738348SEric.Yu@Sun.COM 		/*
1748348SEric.Yu@Sun.COM 		 * Force a zero sa_family to match so_family.
1758348SEric.Yu@Sun.COM 		 *
1768348SEric.Yu@Sun.COM 		 * Some programs like inetd(1M) don't set the
1778348SEric.Yu@Sun.COM 		 * family field. Other programs leave
1788348SEric.Yu@Sun.COM 		 * sin_family set to garbage - SunOS 4.X does
1798348SEric.Yu@Sun.COM 		 * not check the family field on a bind.
1808348SEric.Yu@Sun.COM 		 * We use the family field that
1818348SEric.Yu@Sun.COM 		 * was passed in to the socket() call.
1828348SEric.Yu@Sun.COM 		 */
1838348SEric.Yu@Sun.COM 		name->sa_family = so->so_family;
1848348SEric.Yu@Sun.COM 		break;
1858348SEric.Yu@Sun.COM 
1868348SEric.Yu@Sun.COM 	case AF_INET6: {
1878348SEric.Yu@Sun.COM #ifdef DEBUG
1888348SEric.Yu@Sun.COM 		sin6_t *sin6 = (sin6_t *)name;
1898348SEric.Yu@Sun.COM #endif
1908348SEric.Yu@Sun.COM 		if ((size_t)namelen != sizeof (sin6_t)) {
1918348SEric.Yu@Sun.COM 			error = name->sa_family != so->so_family ?
1928348SEric.Yu@Sun.COM 			    EAFNOSUPPORT : EINVAL;
1938348SEric.Yu@Sun.COM 			eprintsoline(so, error);
1948348SEric.Yu@Sun.COM 			goto done;
1958348SEric.Yu@Sun.COM 		}
1968348SEric.Yu@Sun.COM 
1978348SEric.Yu@Sun.COM 		if (name->sa_family != so->so_family) {
1988348SEric.Yu@Sun.COM 			/*
1998348SEric.Yu@Sun.COM 			 * With IPv6 we require the family to match
2008348SEric.Yu@Sun.COM 			 * unlike in IPv4.
2018348SEric.Yu@Sun.COM 			 */
2028348SEric.Yu@Sun.COM 			error = EAFNOSUPPORT;
2038348SEric.Yu@Sun.COM 			eprintsoline(so, error);
2048348SEric.Yu@Sun.COM 			goto done;
2058348SEric.Yu@Sun.COM 		}
2068348SEric.Yu@Sun.COM #ifdef DEBUG
2078348SEric.Yu@Sun.COM 		/*
2088348SEric.Yu@Sun.COM 		 * Verify that apps don't forget to clear
2098348SEric.Yu@Sun.COM 		 * sin6_scope_id etc
2108348SEric.Yu@Sun.COM 		 */
2118348SEric.Yu@Sun.COM 		if (sin6->sin6_scope_id != 0 &&
2128348SEric.Yu@Sun.COM 		    !IN6_IS_ADDR_LINKSCOPE(&sin6->sin6_addr)) {
2138348SEric.Yu@Sun.COM 			zcmn_err(getzoneid(), CE_WARN,
2148348SEric.Yu@Sun.COM 			    "bind with uninitialized sin6_scope_id "
2158348SEric.Yu@Sun.COM 			    "(%d) on socket. Pid = %d\n",
2168348SEric.Yu@Sun.COM 			    (int)sin6->sin6_scope_id,
2178348SEric.Yu@Sun.COM 			    (int)curproc->p_pid);
2188348SEric.Yu@Sun.COM 		}
2198348SEric.Yu@Sun.COM 		if (sin6->__sin6_src_id != 0) {
2208348SEric.Yu@Sun.COM 			zcmn_err(getzoneid(), CE_WARN,
2218348SEric.Yu@Sun.COM 			    "bind with uninitialized __sin6_src_id "
2228348SEric.Yu@Sun.COM 			    "(%d) on socket. Pid = %d\n",
2238348SEric.Yu@Sun.COM 			    (int)sin6->__sin6_src_id,
2248348SEric.Yu@Sun.COM 			    (int)curproc->p_pid);
2258348SEric.Yu@Sun.COM 		}
2268348SEric.Yu@Sun.COM #endif /* DEBUG */
2278348SEric.Yu@Sun.COM 
2288348SEric.Yu@Sun.COM 		break;
2298348SEric.Yu@Sun.COM 	}
2308348SEric.Yu@Sun.COM 	default:
2318348SEric.Yu@Sun.COM 		/* Just pass the request to the protocol */
2328348SEric.Yu@Sun.COM 		goto dobind;
2338348SEric.Yu@Sun.COM 	}
2348348SEric.Yu@Sun.COM 
2358348SEric.Yu@Sun.COM 	/*
2368348SEric.Yu@Sun.COM 	 * First we check if either NCA or KSSL has been enabled for
2378348SEric.Yu@Sun.COM 	 * the requested address, and if so, we fall back to TPI.
2388348SEric.Yu@Sun.COM 	 * If neither of those two services are enabled, then we just
2398348SEric.Yu@Sun.COM 	 * pass the request to the protocol.
2408348SEric.Yu@Sun.COM 	 *
2418348SEric.Yu@Sun.COM 	 * Note that KSSL can only be enabled on a socket if NCA is NOT
2428348SEric.Yu@Sun.COM 	 * enabled for that socket, hence the else-statement below.
2438348SEric.Yu@Sun.COM 	 */
2448348SEric.Yu@Sun.COM 	if (nl7c_enabled && ((so->so_family == AF_INET ||
2458348SEric.Yu@Sun.COM 	    so->so_family == AF_INET6) &&
2468348SEric.Yu@Sun.COM 	    nl7c_lookup_addr(name, namelen) != NULL)) {
2478348SEric.Yu@Sun.COM 		/*
2488348SEric.Yu@Sun.COM 		 * NL7C is not supported in non-global zones,
2498348SEric.Yu@Sun.COM 		 * we enforce this restriction here.
2508348SEric.Yu@Sun.COM 		 */
2518348SEric.Yu@Sun.COM 		if (so->so_zoneid == GLOBAL_ZONEID) {
2528348SEric.Yu@Sun.COM 			/* NCA should be used, so fall back to TPI */
2538348SEric.Yu@Sun.COM 			error = so_tpi_fallback(so, cr);
2548348SEric.Yu@Sun.COM 			SO_UNBLOCK_FALLBACK(so);
2558348SEric.Yu@Sun.COM 			if (error)
2568348SEric.Yu@Sun.COM 				return (error);
2578348SEric.Yu@Sun.COM 			else
2588348SEric.Yu@Sun.COM 				return (SOP_BIND(so, name, namelen, flags, cr));
2598348SEric.Yu@Sun.COM 		}
2608348SEric.Yu@Sun.COM 	} else if (so->so_type == SOCK_STREAM) {
2618348SEric.Yu@Sun.COM 		/* Check if KSSL has been configured for this address */
2628348SEric.Yu@Sun.COM 		kssl_ent_t ent;
2638348SEric.Yu@Sun.COM 		kssl_endpt_type_t type;
2648348SEric.Yu@Sun.COM 		struct T_bind_req bind_req;
2658348SEric.Yu@Sun.COM 		mblk_t *mp;
2668348SEric.Yu@Sun.COM 
2678348SEric.Yu@Sun.COM 		/*
2688348SEric.Yu@Sun.COM 		 * TODO: Check with KSSL team if we could add a function call
2698348SEric.Yu@Sun.COM 		 * that only queries whether KSSL is enabled for the given
2708348SEric.Yu@Sun.COM 		 * address.
2718348SEric.Yu@Sun.COM 		 */
2728348SEric.Yu@Sun.COM 		bind_req.PRIM_type = T_BIND_REQ;
2738348SEric.Yu@Sun.COM 		bind_req.ADDR_length = namelen;
2748348SEric.Yu@Sun.COM 		bind_req.ADDR_offset = (t_scalar_t)sizeof (bind_req);
2758348SEric.Yu@Sun.COM 		mp = soallocproto2(&bind_req, sizeof (bind_req),
2768348SEric.Yu@Sun.COM 		    name, namelen, 0, _ALLOC_SLEEP);
2778348SEric.Yu@Sun.COM 
2788348SEric.Yu@Sun.COM 		type = kssl_check_proxy(mp, so, &ent);
2798348SEric.Yu@Sun.COM 		freemsg(mp);
2808348SEric.Yu@Sun.COM 
2818348SEric.Yu@Sun.COM 		if (type != KSSL_NO_PROXY) {
2828348SEric.Yu@Sun.COM 			/*
2838348SEric.Yu@Sun.COM 			 * KSSL has been configured for this address, so
2848348SEric.Yu@Sun.COM 			 * we must fall back to TPI.
2858348SEric.Yu@Sun.COM 			 */
2868348SEric.Yu@Sun.COM 			kssl_release_ent(ent, so, type);
2878348SEric.Yu@Sun.COM 			error = so_tpi_fallback(so, cr);
2888348SEric.Yu@Sun.COM 			SO_UNBLOCK_FALLBACK(so);
2898348SEric.Yu@Sun.COM 			if (error)
2908348SEric.Yu@Sun.COM 				return (error);
2918348SEric.Yu@Sun.COM 			else
2928348SEric.Yu@Sun.COM 				return (SOP_BIND(so, name, namelen, flags, cr));
2938348SEric.Yu@Sun.COM 		}
2948348SEric.Yu@Sun.COM 	}
2958348SEric.Yu@Sun.COM 
2968348SEric.Yu@Sun.COM dobind:
2978348SEric.Yu@Sun.COM 	error = (*so->so_downcalls->sd_bind)
2988348SEric.Yu@Sun.COM 	    (so->so_proto_handle, name, namelen, cr);
2998348SEric.Yu@Sun.COM done:
3008348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
3018348SEric.Yu@Sun.COM 
3028348SEric.Yu@Sun.COM 	return (error);
3038348SEric.Yu@Sun.COM }
3048348SEric.Yu@Sun.COM 
3058348SEric.Yu@Sun.COM int
3068348SEric.Yu@Sun.COM so_listen(struct sonode *so, int backlog, struct cred *cr)
3078348SEric.Yu@Sun.COM {
3088348SEric.Yu@Sun.COM 	int	error = 0;
3098348SEric.Yu@Sun.COM 
3108348SEric.Yu@Sun.COM 	ASSERT(MUTEX_NOT_HELD(&so->so_lock));
3118348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_LISTEN(so, backlog, cr));
3128348SEric.Yu@Sun.COM 
3138348SEric.Yu@Sun.COM 	error = (*so->so_downcalls->sd_listen)(so->so_proto_handle, backlog,
3148348SEric.Yu@Sun.COM 	    cr);
3158348SEric.Yu@Sun.COM 
3168348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
3178348SEric.Yu@Sun.COM 
3188348SEric.Yu@Sun.COM 	return (error);
3198348SEric.Yu@Sun.COM }
3208348SEric.Yu@Sun.COM 
3218348SEric.Yu@Sun.COM 
3228348SEric.Yu@Sun.COM int
3238348SEric.Yu@Sun.COM so_connect(struct sonode *so, const struct sockaddr *name,
3248348SEric.Yu@Sun.COM     socklen_t namelen, int fflag, int flags, struct cred *cr)
3258348SEric.Yu@Sun.COM {
3268348SEric.Yu@Sun.COM 	int error = 0;
3278348SEric.Yu@Sun.COM 	sock_connid_t id;
3288348SEric.Yu@Sun.COM 
3298348SEric.Yu@Sun.COM 	ASSERT(MUTEX_NOT_HELD(&so->so_lock));
3308348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_CONNECT(so, name, namelen, fflag, flags, cr));
3318348SEric.Yu@Sun.COM 
3328348SEric.Yu@Sun.COM 	/*
3338348SEric.Yu@Sun.COM 	 * If there is a pending error, return error
3348348SEric.Yu@Sun.COM 	 * This can happen if a non blocking operation caused an error.
3358348SEric.Yu@Sun.COM 	 */
3368348SEric.Yu@Sun.COM 
3378348SEric.Yu@Sun.COM 	if (so->so_error != 0) {
3388348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
3398348SEric.Yu@Sun.COM 		error = sogeterr(so, B_TRUE);
3408348SEric.Yu@Sun.COM 		mutex_exit(&so->so_lock);
3418348SEric.Yu@Sun.COM 		if (error != 0)
3428348SEric.Yu@Sun.COM 			goto done;
3438348SEric.Yu@Sun.COM 	}
3448348SEric.Yu@Sun.COM 
3458348SEric.Yu@Sun.COM 	error = (*so->so_downcalls->sd_connect)(so->so_proto_handle,
3468348SEric.Yu@Sun.COM 	    name, namelen, &id, cr);
3478348SEric.Yu@Sun.COM 
3488348SEric.Yu@Sun.COM 	if (error == EINPROGRESS)
3498348SEric.Yu@Sun.COM 		error = so_wait_connected(so, fflag & (FNONBLOCK|FNDELAY), id);
3508348SEric.Yu@Sun.COM 
3518348SEric.Yu@Sun.COM done:
3528348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
3538348SEric.Yu@Sun.COM 	return (error);
3548348SEric.Yu@Sun.COM }
3558348SEric.Yu@Sun.COM 
3568348SEric.Yu@Sun.COM /*ARGSUSED*/
3578348SEric.Yu@Sun.COM int
3588348SEric.Yu@Sun.COM so_accept(struct sonode *so, int fflag, struct cred *cr, struct sonode **nsop)
3598348SEric.Yu@Sun.COM {
3608348SEric.Yu@Sun.COM 	int error = 0;
3618348SEric.Yu@Sun.COM 	struct sonode *nso;
3628348SEric.Yu@Sun.COM 
3638348SEric.Yu@Sun.COM 	*nsop = NULL;
3648348SEric.Yu@Sun.COM 
3658348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_ACCEPT(so, fflag, cr, nsop));
3668348SEric.Yu@Sun.COM 	if ((so->so_state & SS_ACCEPTCONN) == 0) {
3678348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
3688348SEric.Yu@Sun.COM 		return ((so->so_type == SOCK_DGRAM || so->so_type == SOCK_RAW) ?
3698348SEric.Yu@Sun.COM 		    EOPNOTSUPP : EINVAL);
3708348SEric.Yu@Sun.COM 	}
3718348SEric.Yu@Sun.COM 
3728348SEric.Yu@Sun.COM 	if ((error = so_acceptq_dequeue(so, (fflag & (FNONBLOCK|FNDELAY)),
3738348SEric.Yu@Sun.COM 	    &nso)) == 0) {
3748348SEric.Yu@Sun.COM 		ASSERT(nso != NULL);
3758348SEric.Yu@Sun.COM 
3768348SEric.Yu@Sun.COM 		/* finish the accept */
3778348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_accept)(so->so_proto_handle,
3788348SEric.Yu@Sun.COM 		    nso->so_proto_handle, (sock_upper_handle_t)nso, cr);
3798348SEric.Yu@Sun.COM 		if (error != 0) {
3808348SEric.Yu@Sun.COM 			(void) socket_close(nso, 0, cr);
3818348SEric.Yu@Sun.COM 			socket_destroy(nso);
3828348SEric.Yu@Sun.COM 		} else {
3838348SEric.Yu@Sun.COM 			*nsop = nso;
3848348SEric.Yu@Sun.COM 		}
3858348SEric.Yu@Sun.COM 	}
3868348SEric.Yu@Sun.COM 
3878348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
3888348SEric.Yu@Sun.COM 	return (error);
3898348SEric.Yu@Sun.COM }
3908348SEric.Yu@Sun.COM 
3918348SEric.Yu@Sun.COM int
3928348SEric.Yu@Sun.COM so_sendmsg(struct sonode *so, struct nmsghdr *msg, struct uio *uiop,
3938348SEric.Yu@Sun.COM     struct cred *cr)
3948348SEric.Yu@Sun.COM {
3958348SEric.Yu@Sun.COM 	int error, flags;
3968348SEric.Yu@Sun.COM 	boolean_t dontblock;
3978348SEric.Yu@Sun.COM 	ssize_t orig_resid;
3988348SEric.Yu@Sun.COM 	mblk_t  *mp;
3998348SEric.Yu@Sun.COM 
4008348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_SENDMSG(so, msg, uiop, cr));
4018348SEric.Yu@Sun.COM 
4028348SEric.Yu@Sun.COM 	flags = msg->msg_flags;
4038348SEric.Yu@Sun.COM 	error = 0;
4048348SEric.Yu@Sun.COM 	dontblock = (flags & MSG_DONTWAIT) ||
4058348SEric.Yu@Sun.COM 	    (uiop->uio_fmode & (FNONBLOCK|FNDELAY));
4068348SEric.Yu@Sun.COM 
4078348SEric.Yu@Sun.COM 	if (!(flags & MSG_XPG4_2) && msg->msg_controllen != 0) {
4088348SEric.Yu@Sun.COM 		/*
4098348SEric.Yu@Sun.COM 		 * Old way of passing fd's is not supported
4108348SEric.Yu@Sun.COM 		 */
4118348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
4128348SEric.Yu@Sun.COM 		return (EOPNOTSUPP);
4138348SEric.Yu@Sun.COM 	}
4148348SEric.Yu@Sun.COM 
4158348SEric.Yu@Sun.COM 	if ((so->so_mode & SM_ATOMIC) &&
4168348SEric.Yu@Sun.COM 	    uiop->uio_resid > so->so_proto_props.sopp_maxpsz &&
4178348SEric.Yu@Sun.COM 	    so->so_proto_props.sopp_maxpsz != -1) {
4188348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
4198348SEric.Yu@Sun.COM 		return (EMSGSIZE);
4208348SEric.Yu@Sun.COM 	}
4218348SEric.Yu@Sun.COM 
4228348SEric.Yu@Sun.COM 	/*
4238348SEric.Yu@Sun.COM 	 * For atomic sends we will only do one iteration.
4248348SEric.Yu@Sun.COM 	 */
4258348SEric.Yu@Sun.COM 	do {
4268348SEric.Yu@Sun.COM 		if (so->so_state & SS_CANTSENDMORE) {
4278348SEric.Yu@Sun.COM 			error = EPIPE;
4288348SEric.Yu@Sun.COM 			break;
4298348SEric.Yu@Sun.COM 		}
4308348SEric.Yu@Sun.COM 
4318348SEric.Yu@Sun.COM 		if (so->so_error != 0) {
4328348SEric.Yu@Sun.COM 			mutex_enter(&so->so_lock);
4338348SEric.Yu@Sun.COM 			error = sogeterr(so, B_TRUE);
4348348SEric.Yu@Sun.COM 			mutex_exit(&so->so_lock);
4358348SEric.Yu@Sun.COM 			if (error != 0)
4368348SEric.Yu@Sun.COM 				break;
4378348SEric.Yu@Sun.COM 		}
4388348SEric.Yu@Sun.COM 
4398348SEric.Yu@Sun.COM 		/*
4408348SEric.Yu@Sun.COM 		 * Send down OOB messages even if the send path is being
4418348SEric.Yu@Sun.COM 		 * flow controlled (assuming the protocol supports OOB data).
4428348SEric.Yu@Sun.COM 		 */
4438348SEric.Yu@Sun.COM 		if (flags & MSG_OOB) {
4448348SEric.Yu@Sun.COM 			if ((so->so_mode & SM_EXDATA) == 0) {
4458348SEric.Yu@Sun.COM 				error = EOPNOTSUPP;
4468348SEric.Yu@Sun.COM 				break;
4478348SEric.Yu@Sun.COM 			}
4488348SEric.Yu@Sun.COM 		} else if (so->so_snd_qfull) {
4498348SEric.Yu@Sun.COM 			/*
4508348SEric.Yu@Sun.COM 			 * Need to wait until the protocol is ready to receive
4518348SEric.Yu@Sun.COM 			 * more data for transmission.
4528348SEric.Yu@Sun.COM 			 */
4538348SEric.Yu@Sun.COM 			if ((error = so_snd_wait_qnotfull(so, dontblock)) != 0)
4548348SEric.Yu@Sun.COM 				break;
4558348SEric.Yu@Sun.COM 		}
4568348SEric.Yu@Sun.COM 
4578348SEric.Yu@Sun.COM 		/*
4588348SEric.Yu@Sun.COM 		 * Time to send data to the protocol. We either copy the
4598348SEric.Yu@Sun.COM 		 * data into mblks or pass the uio directly to the protocol.
4608348SEric.Yu@Sun.COM 		 * We decide what to do based on the available down calls.
4618348SEric.Yu@Sun.COM 		 */
4628348SEric.Yu@Sun.COM 		if (so->so_downcalls->sd_send_uio != NULL) {
4638348SEric.Yu@Sun.COM 			error = (*so->so_downcalls->sd_send_uio)
4648348SEric.Yu@Sun.COM 			    (so->so_proto_handle, uiop, msg, cr);
4658348SEric.Yu@Sun.COM 			if (error != 0)
4668348SEric.Yu@Sun.COM 				break;
4678348SEric.Yu@Sun.COM 		} else {
4688348SEric.Yu@Sun.COM 			/* save the resid in case of failure */
4698348SEric.Yu@Sun.COM 			orig_resid = uiop->uio_resid;
4708348SEric.Yu@Sun.COM 
4718348SEric.Yu@Sun.COM 			if ((mp = socopyinuio(uiop,
4728348SEric.Yu@Sun.COM 			    so->so_proto_props.sopp_maxpsz,
4738348SEric.Yu@Sun.COM 			    so->so_proto_props.sopp_wroff,
4748348SEric.Yu@Sun.COM 			    so->so_proto_props.sopp_maxblk,
4758348SEric.Yu@Sun.COM 			    so->so_proto_props.sopp_tail, &error)) == NULL) {
4768348SEric.Yu@Sun.COM 				break;
4778348SEric.Yu@Sun.COM 			}
4788348SEric.Yu@Sun.COM 			ASSERT(uiop->uio_resid >= 0);
4798348SEric.Yu@Sun.COM 
4808348SEric.Yu@Sun.COM 			error = (*so->so_downcalls->sd_send)
4818348SEric.Yu@Sun.COM 			    (so->so_proto_handle, mp, msg, cr);
4828348SEric.Yu@Sun.COM 			if (error != 0) {
4838348SEric.Yu@Sun.COM 				/*
4848348SEric.Yu@Sun.COM 				 * The send failed. We do not have to free the
4858348SEric.Yu@Sun.COM 				 * mblks, because that is the protocol's
4868348SEric.Yu@Sun.COM 				 * responsibility. However, uio_resid must
4878348SEric.Yu@Sun.COM 				 * remain accurate, so adjust that here.
4888348SEric.Yu@Sun.COM 				 */
4898348SEric.Yu@Sun.COM 				uiop->uio_resid = orig_resid;
4908348SEric.Yu@Sun.COM 					break;
4918348SEric.Yu@Sun.COM 			}
4928348SEric.Yu@Sun.COM 		}
4938348SEric.Yu@Sun.COM 	} while (uiop->uio_resid > 0);
4948348SEric.Yu@Sun.COM 
4958348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
4968348SEric.Yu@Sun.COM 
4978348SEric.Yu@Sun.COM 	return (error);
4988348SEric.Yu@Sun.COM }
4998348SEric.Yu@Sun.COM 
5008348SEric.Yu@Sun.COM int
5018348SEric.Yu@Sun.COM so_sendmblk(struct sonode *so, struct nmsghdr *msg, int fflag,
5028348SEric.Yu@Sun.COM     struct cred *cr, mblk_t **mpp)
5038348SEric.Yu@Sun.COM {
5048348SEric.Yu@Sun.COM 	int error;
5058348SEric.Yu@Sun.COM 	boolean_t dontblock;
5068348SEric.Yu@Sun.COM 	size_t size;
5078348SEric.Yu@Sun.COM 	mblk_t *mp = *mpp;
5088348SEric.Yu@Sun.COM 
5098348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_SENDMBLK(so, msg, fflag, cr, mpp));
5108348SEric.Yu@Sun.COM 
5118348SEric.Yu@Sun.COM 	error = 0;
5128348SEric.Yu@Sun.COM 	dontblock = (msg->msg_flags & MSG_DONTWAIT) ||
5138348SEric.Yu@Sun.COM 	    (fflag & (FNONBLOCK|FNDELAY));
5148348SEric.Yu@Sun.COM 	size = msgdsize(mp);
5158348SEric.Yu@Sun.COM 
5168348SEric.Yu@Sun.COM 	if (so->so_downcalls->sd_send == NULL) {
5178348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
5188348SEric.Yu@Sun.COM 		return (EOPNOTSUPP);
5198348SEric.Yu@Sun.COM 	}
5208348SEric.Yu@Sun.COM 
5218348SEric.Yu@Sun.COM 	if ((so->so_mode & SM_ATOMIC) &&
5228348SEric.Yu@Sun.COM 	    size > so->so_proto_props.sopp_maxpsz &&
5238348SEric.Yu@Sun.COM 	    so->so_proto_props.sopp_maxpsz != -1) {
5248348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
5258348SEric.Yu@Sun.COM 		return (EMSGSIZE);
5268348SEric.Yu@Sun.COM 	}
5278348SEric.Yu@Sun.COM 
5288348SEric.Yu@Sun.COM 	while (mp != NULL) {
5298348SEric.Yu@Sun.COM 		mblk_t *nmp, *last_mblk;
5308348SEric.Yu@Sun.COM 		size_t mlen;
5318348SEric.Yu@Sun.COM 
5328348SEric.Yu@Sun.COM 		if (so->so_state & SS_CANTSENDMORE) {
5338348SEric.Yu@Sun.COM 			error = EPIPE;
5348348SEric.Yu@Sun.COM 			break;
5358348SEric.Yu@Sun.COM 		}
5368348SEric.Yu@Sun.COM 		if (so->so_error != 0) {
5378348SEric.Yu@Sun.COM 			mutex_enter(&so->so_lock);
5388348SEric.Yu@Sun.COM 			error = sogeterr(so, B_TRUE);
5398348SEric.Yu@Sun.COM 			mutex_exit(&so->so_lock);
5408348SEric.Yu@Sun.COM 			if (error != 0)
5418348SEric.Yu@Sun.COM 				break;
5428348SEric.Yu@Sun.COM 		}
5438348SEric.Yu@Sun.COM 		if (so->so_snd_qfull) {
5448348SEric.Yu@Sun.COM 			/*
5458348SEric.Yu@Sun.COM 			 * Need to wait until the protocol is ready to receive
5468348SEric.Yu@Sun.COM 			 * more data for transmission.
5478348SEric.Yu@Sun.COM 			 */
5488348SEric.Yu@Sun.COM 			if ((error = so_snd_wait_qnotfull(so, dontblock)) != 0)
5498348SEric.Yu@Sun.COM 				break;
5508348SEric.Yu@Sun.COM 		}
5518348SEric.Yu@Sun.COM 
5528348SEric.Yu@Sun.COM 		/*
5538348SEric.Yu@Sun.COM 		 * We only allow so_maxpsz of data to be sent down to
5548348SEric.Yu@Sun.COM 		 * the protocol at time.
5558348SEric.Yu@Sun.COM 		 */
5568348SEric.Yu@Sun.COM 		mlen = MBLKL(mp);
5578348SEric.Yu@Sun.COM 		nmp = mp->b_cont;
5588348SEric.Yu@Sun.COM 		last_mblk = mp;
5598348SEric.Yu@Sun.COM 		while (nmp != NULL) {
5608348SEric.Yu@Sun.COM 			mlen += MBLKL(nmp);
5618348SEric.Yu@Sun.COM 			if (mlen > so->so_proto_props.sopp_maxpsz) {
5628348SEric.Yu@Sun.COM 				last_mblk->b_cont = NULL;
5638348SEric.Yu@Sun.COM 				break;
5648348SEric.Yu@Sun.COM 			}
5658348SEric.Yu@Sun.COM 			last_mblk = nmp;
5668348SEric.Yu@Sun.COM 			nmp = nmp->b_cont;
5678348SEric.Yu@Sun.COM 		}
5688348SEric.Yu@Sun.COM 
5698348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_send)
5708348SEric.Yu@Sun.COM 		    (so->so_proto_handle, mp, msg, cr);
5718348SEric.Yu@Sun.COM 		if (error != 0) {
5728348SEric.Yu@Sun.COM 			/*
5738348SEric.Yu@Sun.COM 			 * The send failed. The protocol will free the mblks
5748348SEric.Yu@Sun.COM 			 * that were sent down. Let the caller deal with the
5758348SEric.Yu@Sun.COM 			 * rest.
5768348SEric.Yu@Sun.COM 			 */
5778348SEric.Yu@Sun.COM 			*mpp = nmp;
5788348SEric.Yu@Sun.COM 			break;
5798348SEric.Yu@Sun.COM 		}
5808348SEric.Yu@Sun.COM 
5818348SEric.Yu@Sun.COM 		*mpp = mp = nmp;
5828348SEric.Yu@Sun.COM 	}
5838348SEric.Yu@Sun.COM 
5848348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
5858348SEric.Yu@Sun.COM 
5868348SEric.Yu@Sun.COM 	return (error);
5878348SEric.Yu@Sun.COM }
5888348SEric.Yu@Sun.COM 
5898348SEric.Yu@Sun.COM int
5908348SEric.Yu@Sun.COM so_shutdown(struct sonode *so, int how, struct cred *cr)
5918348SEric.Yu@Sun.COM {
5928348SEric.Yu@Sun.COM 	int error;
5938348SEric.Yu@Sun.COM 
5948348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_SHUTDOWN(so, how, cr));
5958348SEric.Yu@Sun.COM 
5968348SEric.Yu@Sun.COM 	/*
5978348SEric.Yu@Sun.COM 	 * SunOS 4.X has no check for datagram sockets.
5988348SEric.Yu@Sun.COM 	 * 5.X checks that it is connected (ENOTCONN)
5998348SEric.Yu@Sun.COM 	 * X/Open requires that we check the connected state.
6008348SEric.Yu@Sun.COM 	 */
6018348SEric.Yu@Sun.COM 	if (!(so->so_state & SS_ISCONNECTED)) {
6028348SEric.Yu@Sun.COM 		if (!xnet_skip_checks) {
6038348SEric.Yu@Sun.COM 			error = ENOTCONN;
6048348SEric.Yu@Sun.COM 			if (xnet_check_print) {
6058348SEric.Yu@Sun.COM 				printf("sockfs: X/Open shutdown check "
6068348SEric.Yu@Sun.COM 				    "caused ENOTCONN\n");
6078348SEric.Yu@Sun.COM 			}
6088348SEric.Yu@Sun.COM 		}
6098348SEric.Yu@Sun.COM 		goto done;
6108348SEric.Yu@Sun.COM 	}
6118348SEric.Yu@Sun.COM 
6128348SEric.Yu@Sun.COM 	error = ((*so->so_downcalls->sd_shutdown)(so->so_proto_handle,
6138348SEric.Yu@Sun.COM 	    how, cr));
6148348SEric.Yu@Sun.COM 
6158348SEric.Yu@Sun.COM 	/*
6168348SEric.Yu@Sun.COM 	 * Protocol agreed to shutdown. We need to flush the
6178348SEric.Yu@Sun.COM 	 * receive buffer if the receive side is being shutdown.
6188348SEric.Yu@Sun.COM 	 */
6198348SEric.Yu@Sun.COM 	if (error == 0 && how != SHUT_WR) {
6208348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
6218348SEric.Yu@Sun.COM 		/* wait for active reader to finish */
6228348SEric.Yu@Sun.COM 		(void) so_lock_read(so, 0);
6238348SEric.Yu@Sun.COM 
6248348SEric.Yu@Sun.COM 		so_rcv_flush(so);
6258348SEric.Yu@Sun.COM 
6268348SEric.Yu@Sun.COM 		so_unlock_read(so);
6278348SEric.Yu@Sun.COM 		mutex_exit(&so->so_lock);
6288348SEric.Yu@Sun.COM 	}
6298348SEric.Yu@Sun.COM 
6308348SEric.Yu@Sun.COM done:
6318348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
6328348SEric.Yu@Sun.COM 	return (error);
6338348SEric.Yu@Sun.COM }
6348348SEric.Yu@Sun.COM 
6358348SEric.Yu@Sun.COM int
6368348SEric.Yu@Sun.COM so_getsockname(struct sonode *so, struct sockaddr *addr,
6378348SEric.Yu@Sun.COM     socklen_t *addrlen, struct cred *cr)
6388348SEric.Yu@Sun.COM {
6398348SEric.Yu@Sun.COM 	int error;
6408348SEric.Yu@Sun.COM 
6418348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_GETSOCKNAME(so, addr, addrlen, cr));
6428348SEric.Yu@Sun.COM 
6438348SEric.Yu@Sun.COM 	error = (*so->so_downcalls->sd_getsockname)
6448348SEric.Yu@Sun.COM 	    (so->so_proto_handle, addr, addrlen, cr);
6458348SEric.Yu@Sun.COM 
6468348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
6478348SEric.Yu@Sun.COM 	return (error);
6488348SEric.Yu@Sun.COM }
6498348SEric.Yu@Sun.COM 
6508348SEric.Yu@Sun.COM int
6518348SEric.Yu@Sun.COM so_getpeername(struct sonode *so, struct sockaddr *addr,
6528348SEric.Yu@Sun.COM     socklen_t *addrlen, boolean_t accept, struct cred *cr)
6538348SEric.Yu@Sun.COM {
6548348SEric.Yu@Sun.COM 	int error;
6558348SEric.Yu@Sun.COM 
6568348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_GETPEERNAME(so, addr, addrlen, accept, cr));
6578348SEric.Yu@Sun.COM 
6588348SEric.Yu@Sun.COM 	if (accept) {
6598348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_getpeername)
6608348SEric.Yu@Sun.COM 		    (so->so_proto_handle, addr, addrlen, cr);
6618348SEric.Yu@Sun.COM 	} else if (!(so->so_state & SS_ISCONNECTED)) {
6628348SEric.Yu@Sun.COM 		error = ENOTCONN;
6638348SEric.Yu@Sun.COM 	} else if ((so->so_state & SS_CANTSENDMORE) && !xnet_skip_checks) {
6648348SEric.Yu@Sun.COM 		/* Added this check for X/Open */
6658348SEric.Yu@Sun.COM 		error = EINVAL;
6668348SEric.Yu@Sun.COM 		if (xnet_check_print) {
6678348SEric.Yu@Sun.COM 			printf("sockfs: X/Open getpeername check => EINVAL\n");
6688348SEric.Yu@Sun.COM 		}
6698348SEric.Yu@Sun.COM 	} else {
6708348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_getpeername)
6718348SEric.Yu@Sun.COM 		    (so->so_proto_handle, addr, addrlen, cr);
6728348SEric.Yu@Sun.COM 	}
6738348SEric.Yu@Sun.COM 
6748348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
6758348SEric.Yu@Sun.COM 	return (error);
6768348SEric.Yu@Sun.COM }
6778348SEric.Yu@Sun.COM 
6788348SEric.Yu@Sun.COM int
6798348SEric.Yu@Sun.COM so_getsockopt(struct sonode *so, int level, int option_name,
6808348SEric.Yu@Sun.COM     void *optval, socklen_t *optlenp, int flags, struct cred *cr)
6818348SEric.Yu@Sun.COM {
6828348SEric.Yu@Sun.COM 	int error = 0;
6838348SEric.Yu@Sun.COM 
6848348SEric.Yu@Sun.COM 	ASSERT(MUTEX_NOT_HELD(&so->so_lock));
6858348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so,
6868348SEric.Yu@Sun.COM 	    SOP_GETSOCKOPT(so, level, option_name, optval, optlenp, flags, cr));
6878348SEric.Yu@Sun.COM 
6888348SEric.Yu@Sun.COM 	error = socket_getopt_common(so, level, option_name, optval,
6898348SEric.Yu@Sun.COM 	    optlenp);
6908348SEric.Yu@Sun.COM 	if (error < 0) {
6918348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_getsockopt)
6928348SEric.Yu@Sun.COM 		    (so->so_proto_handle, level, option_name, optval, optlenp,
6938348SEric.Yu@Sun.COM 		    cr);
6948348SEric.Yu@Sun.COM 		if (error ==  ENOPROTOOPT) {
6958348SEric.Yu@Sun.COM 			if (level == SOL_SOCKET) {
6968348SEric.Yu@Sun.COM 				/*
6978348SEric.Yu@Sun.COM 				 * If a protocol does not support a particular
6988348SEric.Yu@Sun.COM 				 * socket option, set can fail (not allowed)
6998348SEric.Yu@Sun.COM 				 * but get can not fail. This is the previous
7008348SEric.Yu@Sun.COM 				 * sockfs bahvior.
7018348SEric.Yu@Sun.COM 				 */
7028348SEric.Yu@Sun.COM 				switch (option_name) {
7038348SEric.Yu@Sun.COM 				case SO_LINGER:
7048348SEric.Yu@Sun.COM 					if (*optlenp < (t_uscalar_t)
7058348SEric.Yu@Sun.COM 					    sizeof (struct linger)) {
7068348SEric.Yu@Sun.COM 						error = EINVAL;
7078348SEric.Yu@Sun.COM 						break;
7088348SEric.Yu@Sun.COM 					}
7098348SEric.Yu@Sun.COM 					error = 0;
7108348SEric.Yu@Sun.COM 					bzero(optval, sizeof (struct linger));
7118348SEric.Yu@Sun.COM 					*optlenp = sizeof (struct linger);
7128348SEric.Yu@Sun.COM 					break;
7138348SEric.Yu@Sun.COM 				case SO_RCVTIMEO:
7148348SEric.Yu@Sun.COM 				case SO_SNDTIMEO:
7158348SEric.Yu@Sun.COM 					if (*optlenp < (t_uscalar_t)
7168348SEric.Yu@Sun.COM 					    sizeof (struct timeval)) {
7178348SEric.Yu@Sun.COM 						error = EINVAL;
7188348SEric.Yu@Sun.COM 						break;
7198348SEric.Yu@Sun.COM 					}
7208348SEric.Yu@Sun.COM 					error = 0;
7218348SEric.Yu@Sun.COM 					bzero(optval, sizeof (struct timeval));
7228348SEric.Yu@Sun.COM 					*optlenp = sizeof (struct timeval);
7238348SEric.Yu@Sun.COM 					break;
7248348SEric.Yu@Sun.COM 				case SO_SND_BUFINFO:
7258348SEric.Yu@Sun.COM 					if (*optlenp < (t_uscalar_t)
7268348SEric.Yu@Sun.COM 					    sizeof (struct so_snd_bufinfo)) {
7278348SEric.Yu@Sun.COM 						error = EINVAL;
7288348SEric.Yu@Sun.COM 						break;
7298348SEric.Yu@Sun.COM 					}
7308348SEric.Yu@Sun.COM 					error = 0;
7318348SEric.Yu@Sun.COM 					bzero(optval,
7328348SEric.Yu@Sun.COM 					    sizeof (struct so_snd_bufinfo));
7338348SEric.Yu@Sun.COM 					*optlenp =
7348348SEric.Yu@Sun.COM 					    sizeof (struct so_snd_bufinfo);
7358348SEric.Yu@Sun.COM 					break;
7368348SEric.Yu@Sun.COM 				case SO_DEBUG:
7378348SEric.Yu@Sun.COM 				case SO_REUSEADDR:
7388348SEric.Yu@Sun.COM 				case SO_KEEPALIVE:
7398348SEric.Yu@Sun.COM 				case SO_DONTROUTE:
7408348SEric.Yu@Sun.COM 				case SO_BROADCAST:
7418348SEric.Yu@Sun.COM 				case SO_USELOOPBACK:
7428348SEric.Yu@Sun.COM 				case SO_OOBINLINE:
7438348SEric.Yu@Sun.COM 				case SO_DGRAM_ERRIND:
7448348SEric.Yu@Sun.COM 				case SO_SNDBUF:
7458348SEric.Yu@Sun.COM 				case SO_RCVBUF:
7468348SEric.Yu@Sun.COM 					error = 0;
7478348SEric.Yu@Sun.COM 					*((int32_t *)optval) = 0;
7488348SEric.Yu@Sun.COM 					*optlenp = sizeof (int32_t);
7498348SEric.Yu@Sun.COM 					break;
7508348SEric.Yu@Sun.COM 				default:
7518348SEric.Yu@Sun.COM 					break;
7528348SEric.Yu@Sun.COM 				}
7538348SEric.Yu@Sun.COM 			}
7548348SEric.Yu@Sun.COM 		}
7558348SEric.Yu@Sun.COM 	}
7568348SEric.Yu@Sun.COM 
7578348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
7588348SEric.Yu@Sun.COM 	return (error);
7598348SEric.Yu@Sun.COM }
7608348SEric.Yu@Sun.COM 
7618348SEric.Yu@Sun.COM int
7628348SEric.Yu@Sun.COM so_setsockopt(struct sonode *so, int level, int option_name,
7638348SEric.Yu@Sun.COM     const void *optval, socklen_t optlen, struct cred *cr)
7648348SEric.Yu@Sun.COM {
7658348SEric.Yu@Sun.COM 	int error = 0;
7668348SEric.Yu@Sun.COM 
7678348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so,
7688348SEric.Yu@Sun.COM 	    SOP_SETSOCKOPT(so, level, option_name, optval, optlen, cr));
7698348SEric.Yu@Sun.COM 
7708348SEric.Yu@Sun.COM 	/* X/Open requires this check */
7718348SEric.Yu@Sun.COM 	if (so->so_state & SS_CANTSENDMORE && !xnet_skip_checks) {
7728348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
7738348SEric.Yu@Sun.COM 		if (xnet_check_print)
7748348SEric.Yu@Sun.COM 			printf("sockfs: X/Open setsockopt check => EINVAL\n");
7758348SEric.Yu@Sun.COM 		return (EINVAL);
7768348SEric.Yu@Sun.COM 	}
7778348SEric.Yu@Sun.COM 
7788348SEric.Yu@Sun.COM 	if (level == SOL_SOCKET &&
7798348SEric.Yu@Sun.COM 	    ((option_name == SO_RCVTIMEO) || (option_name == SO_SNDTIMEO))) {
7808348SEric.Yu@Sun.COM 		struct timeval *tl = (struct timeval *)optval;
7818348SEric.Yu@Sun.COM 		clock_t t_usec;
7828348SEric.Yu@Sun.COM 
7838348SEric.Yu@Sun.COM 		if (optlen != (t_uscalar_t)sizeof (struct timeval)) {
7848348SEric.Yu@Sun.COM 			SO_UNBLOCK_FALLBACK(so);
7858348SEric.Yu@Sun.COM 			return (EINVAL);
7868348SEric.Yu@Sun.COM 		}
7878348SEric.Yu@Sun.COM 		t_usec = tl->tv_sec * 1000 * 1000 + tl->tv_usec;
7888348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
7898348SEric.Yu@Sun.COM 		if (option_name == SO_RCVTIMEO)
7908348SEric.Yu@Sun.COM 			so->so_rcvtimeo = drv_usectohz(t_usec);
7918348SEric.Yu@Sun.COM 		else
7928348SEric.Yu@Sun.COM 			so->so_sndtimeo = drv_usectohz(t_usec);
7938348SEric.Yu@Sun.COM 		mutex_exit(&so->so_lock);
7948348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
7958348SEric.Yu@Sun.COM 		return (0);
7968348SEric.Yu@Sun.COM 	}
7978348SEric.Yu@Sun.COM 	error = (*so->so_downcalls->sd_setsockopt)
7988348SEric.Yu@Sun.COM 	    (so->so_proto_handle, level, option_name, optval, optlen, cr);
7998348SEric.Yu@Sun.COM 
8008348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
8018348SEric.Yu@Sun.COM 	return (error);
8028348SEric.Yu@Sun.COM }
8038348SEric.Yu@Sun.COM 
8048348SEric.Yu@Sun.COM int
8058348SEric.Yu@Sun.COM so_ioctl(struct sonode *so, int cmd, intptr_t arg, int mode,
8068348SEric.Yu@Sun.COM     struct cred *cr, int32_t *rvalp)
8078348SEric.Yu@Sun.COM {
8088348SEric.Yu@Sun.COM 	int error = 0;
8098348SEric.Yu@Sun.COM 
8108348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_IOCTL(so, cmd, arg, mode, cr, rvalp));
8118348SEric.Yu@Sun.COM 
8128348SEric.Yu@Sun.COM 	/*
8138348SEric.Yu@Sun.COM 	 * If there is a pending error, return error
8148348SEric.Yu@Sun.COM 	 * This can happen if a non blocking operation caused an error.
8158348SEric.Yu@Sun.COM 	 */
8168348SEric.Yu@Sun.COM 	if (so->so_error != 0) {
8178348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
8188348SEric.Yu@Sun.COM 		error = sogeterr(so, B_TRUE);
8198348SEric.Yu@Sun.COM 		mutex_exit(&so->so_lock);
8208348SEric.Yu@Sun.COM 		if (error != 0)
8218348SEric.Yu@Sun.COM 			goto done;
8228348SEric.Yu@Sun.COM 	}
8238348SEric.Yu@Sun.COM 
8248348SEric.Yu@Sun.COM 	/*
8258348SEric.Yu@Sun.COM 	 * calling strioc can result in the socket falling back to TPI,
8268348SEric.Yu@Sun.COM 	 * if that is supported.
8278348SEric.Yu@Sun.COM 	 */
8288348SEric.Yu@Sun.COM 	if ((error = socket_ioctl_common(so, cmd, arg, mode, cr, rvalp)) < 0 &&
8298348SEric.Yu@Sun.COM 	    (error = socket_strioc_common(so, cmd, arg, mode, cr, rvalp)) < 0) {
8308348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_ioctl)(so->so_proto_handle,
8318348SEric.Yu@Sun.COM 		    cmd, arg, mode, rvalp, cr);
8328348SEric.Yu@Sun.COM 	}
8338348SEric.Yu@Sun.COM 
8348348SEric.Yu@Sun.COM done:
8358348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
8368348SEric.Yu@Sun.COM 
8378348SEric.Yu@Sun.COM 	return (error);
8388348SEric.Yu@Sun.COM }
8398348SEric.Yu@Sun.COM 
8408348SEric.Yu@Sun.COM int
8418348SEric.Yu@Sun.COM so_poll(struct sonode *so, short events, int anyyet, short *reventsp,
8428348SEric.Yu@Sun.COM     struct pollhead **phpp)
8438348SEric.Yu@Sun.COM {
8448348SEric.Yu@Sun.COM 	int state = so->so_state;
8458348SEric.Yu@Sun.COM 	*reventsp = 0;
8468348SEric.Yu@Sun.COM 
8478348SEric.Yu@Sun.COM 	if (so->so_error != 0 &&
8488348SEric.Yu@Sun.COM 	    ((POLLIN|POLLRDNORM|POLLOUT) & events)  != 0) {
8498348SEric.Yu@Sun.COM 		*reventsp = (POLLIN|POLLRDNORM|POLLOUT) & events;
8508348SEric.Yu@Sun.COM 		return (0);
8518348SEric.Yu@Sun.COM 	}
8528348SEric.Yu@Sun.COM 
8538348SEric.Yu@Sun.COM 	/*
8548348SEric.Yu@Sun.COM 	 * As long as there is buffer to send data, and the socket is
8558348SEric.Yu@Sun.COM 	 * in a state where it can send data (i.e., connected for
8568348SEric.Yu@Sun.COM 	 * connection oriented protocols), then turn on POLLOUT events
8578348SEric.Yu@Sun.COM 	 */
8588348SEric.Yu@Sun.COM 	if (!so->so_snd_qfull && ((so->so_mode & SM_CONNREQUIRED) == 0 ||
8598348SEric.Yu@Sun.COM 	    state & SS_ISCONNECTED)) {
8608348SEric.Yu@Sun.COM 		*reventsp |= POLLOUT & events;
8618348SEric.Yu@Sun.COM 	}
8628348SEric.Yu@Sun.COM 
8638348SEric.Yu@Sun.COM 	/*
8648348SEric.Yu@Sun.COM 	 * Turn on POLLIN whenever there is data on the receive queue,
8658348SEric.Yu@Sun.COM 	 * or the socket is in a state where no more data will be received.
8668348SEric.Yu@Sun.COM 	 * Also, if the socket is accepting connections, flip the bit if
8678348SEric.Yu@Sun.COM 	 * there is something on the queue.
8688348SEric.Yu@Sun.COM 	 */
8698348SEric.Yu@Sun.COM 
8708348SEric.Yu@Sun.COM 	/* Pending connections */
8718348SEric.Yu@Sun.COM 	if (so->so_acceptq_len > 0)
8728348SEric.Yu@Sun.COM 		*reventsp |= (POLLIN|POLLRDNORM) & events;
8738348SEric.Yu@Sun.COM 
8748348SEric.Yu@Sun.COM 	/* Data */
8758348SEric.Yu@Sun.COM 	/* so_downcalls is null for sctp */
8768348SEric.Yu@Sun.COM 	if (so->so_downcalls != NULL && so->so_downcalls->sd_poll != NULL) {
8778348SEric.Yu@Sun.COM 		*reventsp |= (*so->so_downcalls->sd_poll)
8788348SEric.Yu@Sun.COM 		    (so->so_proto_handle, events & SO_PROTO_POLLEV, anyyet,
8798348SEric.Yu@Sun.COM 		    CRED()) & events;
8808348SEric.Yu@Sun.COM 		ASSERT((*reventsp & ~events) == 0);
8818348SEric.Yu@Sun.COM 		/* do not recheck events */
8828348SEric.Yu@Sun.COM 		events &= ~SO_PROTO_POLLEV;
8838348SEric.Yu@Sun.COM 	} else {
8848348SEric.Yu@Sun.COM 		if (SO_HAVE_DATA(so))
8858348SEric.Yu@Sun.COM 			*reventsp |= (POLLIN|POLLRDNORM) & events;
8868348SEric.Yu@Sun.COM 
8878348SEric.Yu@Sun.COM 		/* Urgent data */
8888348SEric.Yu@Sun.COM 		if ((state & SS_OOBPEND) != 0)
8898348SEric.Yu@Sun.COM 			*reventsp |= (POLLRDBAND) & events;
8908348SEric.Yu@Sun.COM 	}
8918348SEric.Yu@Sun.COM 
8928348SEric.Yu@Sun.COM 	if (!*reventsp && !anyyet) {
8938348SEric.Yu@Sun.COM 		/* Check for read events again, but this time under lock */
8948348SEric.Yu@Sun.COM 		if (events & (POLLIN|POLLRDNORM)) {
8958348SEric.Yu@Sun.COM 			mutex_enter(&so->so_lock);
8968348SEric.Yu@Sun.COM 			if (SO_HAVE_DATA(so) || so->so_acceptq_len > 0) {
8978348SEric.Yu@Sun.COM 				mutex_exit(&so->so_lock);
8988348SEric.Yu@Sun.COM 				*reventsp |= (POLLIN|POLLRDNORM) & events;
8998348SEric.Yu@Sun.COM 				return (0);
9008348SEric.Yu@Sun.COM 			} else {
9018348SEric.Yu@Sun.COM 				so->so_pollev |= SO_POLLEV_IN;
9028348SEric.Yu@Sun.COM 				mutex_exit(&so->so_lock);
9038348SEric.Yu@Sun.COM 			}
9048348SEric.Yu@Sun.COM 		}
9058348SEric.Yu@Sun.COM 		*phpp = &so->so_poll_list;
9068348SEric.Yu@Sun.COM 	}
9078348SEric.Yu@Sun.COM 	return (0);
9088348SEric.Yu@Sun.COM }
9098348SEric.Yu@Sun.COM 
9108348SEric.Yu@Sun.COM /*
9118348SEric.Yu@Sun.COM  * Generic Upcalls
9128348SEric.Yu@Sun.COM  */
9138348SEric.Yu@Sun.COM void
9148348SEric.Yu@Sun.COM so_connected(sock_upper_handle_t sock_handle, sock_connid_t id,
9158348SEric.Yu@Sun.COM     cred_t *peer_cred, pid_t peer_cpid)
9168348SEric.Yu@Sun.COM {
9178348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
9188348SEric.Yu@Sun.COM 
9198348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
9208348SEric.Yu@Sun.COM 	ASSERT(so->so_proto_handle != NULL);
9218348SEric.Yu@Sun.COM 
9228348SEric.Yu@Sun.COM 	if (peer_cred != NULL) {
9238348SEric.Yu@Sun.COM 		if (so->so_peercred != NULL)
9248348SEric.Yu@Sun.COM 			crfree(so->so_peercred);
9258348SEric.Yu@Sun.COM 		crhold(peer_cred);
9268348SEric.Yu@Sun.COM 		so->so_peercred = peer_cred;
9278348SEric.Yu@Sun.COM 		so->so_cpid = peer_cpid;
9288348SEric.Yu@Sun.COM 	}
9298348SEric.Yu@Sun.COM 
9308348SEric.Yu@Sun.COM 	so->so_proto_connid = id;
9318348SEric.Yu@Sun.COM 	soisconnected(so);
9328348SEric.Yu@Sun.COM 	/*
9338348SEric.Yu@Sun.COM 	 * Wake ones who're waiting for conn to become established.
9348348SEric.Yu@Sun.COM 	 */
9358348SEric.Yu@Sun.COM 	so_notify_connected(so);
9368348SEric.Yu@Sun.COM }
9378348SEric.Yu@Sun.COM 
9388348SEric.Yu@Sun.COM int
9398348SEric.Yu@Sun.COM so_disconnected(sock_upper_handle_t sock_handle, sock_connid_t id, int error)
9408348SEric.Yu@Sun.COM {
9418348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
9428348SEric.Yu@Sun.COM 
9438348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
9448348SEric.Yu@Sun.COM 
9458348SEric.Yu@Sun.COM 	so->so_proto_connid = id;
9468348SEric.Yu@Sun.COM 	soisdisconnected(so, error);
9478348SEric.Yu@Sun.COM 	so_notify_disconnected(so, error);
9488348SEric.Yu@Sun.COM 
9498348SEric.Yu@Sun.COM 	return (0);
9508348SEric.Yu@Sun.COM }
9518348SEric.Yu@Sun.COM 
9528348SEric.Yu@Sun.COM void
9538348SEric.Yu@Sun.COM so_opctl(sock_upper_handle_t sock_handle, sock_opctl_action_t action,
9548348SEric.Yu@Sun.COM     uintptr_t arg)
9558348SEric.Yu@Sun.COM {
9568348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
9578348SEric.Yu@Sun.COM 
9588348SEric.Yu@Sun.COM 	switch (action) {
9598348SEric.Yu@Sun.COM 	case SOCK_OPCTL_SHUT_SEND:
9608348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
9618348SEric.Yu@Sun.COM 		socantsendmore(so);
9628348SEric.Yu@Sun.COM 		so_notify_disconnecting(so);
9638348SEric.Yu@Sun.COM 		break;
9648348SEric.Yu@Sun.COM 	case SOCK_OPCTL_SHUT_RECV: {
9658348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
9668348SEric.Yu@Sun.COM 		socantrcvmore(so);
9678348SEric.Yu@Sun.COM 		so_notify_eof(so);
9688348SEric.Yu@Sun.COM 		break;
9698348SEric.Yu@Sun.COM 	}
9708348SEric.Yu@Sun.COM 	case SOCK_OPCTL_ENAB_ACCEPT:
9718348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
9728348SEric.Yu@Sun.COM 		so->so_state |= SS_ACCEPTCONN;
9738348SEric.Yu@Sun.COM 		so->so_backlog = (unsigned int)arg;
9748348SEric.Yu@Sun.COM 		mutex_exit(&so->so_lock);
9758348SEric.Yu@Sun.COM 		break;
9768348SEric.Yu@Sun.COM 	default:
9778348SEric.Yu@Sun.COM 		ASSERT(0);
9788348SEric.Yu@Sun.COM 		break;
9798348SEric.Yu@Sun.COM 	}
9808348SEric.Yu@Sun.COM }
9818348SEric.Yu@Sun.COM 
9828348SEric.Yu@Sun.COM void
9838348SEric.Yu@Sun.COM so_txq_full(sock_upper_handle_t sock_handle, boolean_t qfull)
9848348SEric.Yu@Sun.COM {
9858348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
9868348SEric.Yu@Sun.COM 
9878348SEric.Yu@Sun.COM 	if (qfull) {
9888348SEric.Yu@Sun.COM 		so_snd_qfull(so);
9898348SEric.Yu@Sun.COM 	} else {
9908348SEric.Yu@Sun.COM 		so_snd_qnotfull(so);
9918348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
9928348SEric.Yu@Sun.COM 		so_notify_writable(so);
9938348SEric.Yu@Sun.COM 	}
9948348SEric.Yu@Sun.COM }
9958348SEric.Yu@Sun.COM 
9968348SEric.Yu@Sun.COM sock_upper_handle_t
9978348SEric.Yu@Sun.COM so_newconn(sock_upper_handle_t parenthandle,
9988348SEric.Yu@Sun.COM     sock_lower_handle_t proto_handle, sock_downcalls_t *sock_downcalls,
9998348SEric.Yu@Sun.COM     struct cred *peer_cred, pid_t peer_cpid, sock_upcalls_t **sock_upcallsp)
10008348SEric.Yu@Sun.COM {
10018348SEric.Yu@Sun.COM 	struct sonode	*so = (struct sonode *)parenthandle;
10028348SEric.Yu@Sun.COM 	struct sonode	*nso;
10038348SEric.Yu@Sun.COM 	int error;
10048348SEric.Yu@Sun.COM 
10058348SEric.Yu@Sun.COM 	ASSERT(proto_handle != NULL);
10068348SEric.Yu@Sun.COM 
10078348SEric.Yu@Sun.COM 	if ((so->so_state & SS_ACCEPTCONN) == 0 ||
10088348SEric.Yu@Sun.COM 	    so->so_acceptq_len >= so->so_backlog)
10098348SEric.Yu@Sun.COM 		return (NULL);
10108348SEric.Yu@Sun.COM 
10118348SEric.Yu@Sun.COM 	nso = socket_newconn(so, proto_handle, sock_downcalls, SOCKET_NOSLEEP,
10128348SEric.Yu@Sun.COM 	    &error);
10138348SEric.Yu@Sun.COM 	if (nso == NULL)
10148348SEric.Yu@Sun.COM 		return (NULL);
10158348SEric.Yu@Sun.COM 
10168348SEric.Yu@Sun.COM 	if (peer_cred != NULL) {
10178348SEric.Yu@Sun.COM 		crhold(peer_cred);
10188348SEric.Yu@Sun.COM 		nso->so_peercred = peer_cred;
10198348SEric.Yu@Sun.COM 		nso->so_cpid = peer_cpid;
10208348SEric.Yu@Sun.COM 	}
10218348SEric.Yu@Sun.COM 
10228348SEric.Yu@Sun.COM 	(void) so_acceptq_enqueue(so, nso);
10238348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
10248348SEric.Yu@Sun.COM 	so_notify_newconn(so);
10258348SEric.Yu@Sun.COM 
10268348SEric.Yu@Sun.COM 	*sock_upcallsp = &so_upcalls;
10278348SEric.Yu@Sun.COM 
10288348SEric.Yu@Sun.COM 	return ((sock_upper_handle_t)nso);
10298348SEric.Yu@Sun.COM }
10308348SEric.Yu@Sun.COM 
10318348SEric.Yu@Sun.COM void
10328348SEric.Yu@Sun.COM so_set_prop(sock_upper_handle_t sock_handle, struct sock_proto_props *soppp)
10338348SEric.Yu@Sun.COM {
10348348SEric.Yu@Sun.COM 	struct sonode *so;
10358348SEric.Yu@Sun.COM 
10368348SEric.Yu@Sun.COM 	so = (struct sonode *)sock_handle;
10378348SEric.Yu@Sun.COM 
10388348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
10398348SEric.Yu@Sun.COM 
10408348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_MAXBLK)
10418348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_maxblk = soppp->sopp_maxblk;
10428348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_WROFF)
10438348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_wroff = soppp->sopp_wroff;
10448348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_TAIL)
10458348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_tail = soppp->sopp_tail;
10468348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_RCVHIWAT)
10478348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_rxhiwat = soppp->sopp_rxhiwat;
10488348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_RCVLOWAT)
10498348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_rxlowat = soppp->sopp_rxlowat;
10508348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_MAXPSZ)
10518348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_maxpsz = soppp->sopp_maxpsz;
10528348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_MINPSZ)
10538348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_minpsz = soppp->sopp_minpsz;
10548348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_ZCOPY) {
10558348SEric.Yu@Sun.COM 		if (soppp->sopp_zcopyflag & ZCVMSAFE) {
10568348SEric.Yu@Sun.COM 			so->so_proto_props.sopp_zcopyflag |= STZCVMSAFE;
10578348SEric.Yu@Sun.COM 			so->so_proto_props.sopp_zcopyflag &= ~STZCVMUNSAFE;
10588348SEric.Yu@Sun.COM 		} else if (soppp->sopp_zcopyflag & ZCVMUNSAFE) {
10598348SEric.Yu@Sun.COM 			so->so_proto_props.sopp_zcopyflag |= STZCVMUNSAFE;
10608348SEric.Yu@Sun.COM 			so->so_proto_props.sopp_zcopyflag &= ~STZCVMSAFE;
10618348SEric.Yu@Sun.COM 		}
10628348SEric.Yu@Sun.COM 
10638348SEric.Yu@Sun.COM 		if (soppp->sopp_zcopyflag & COPYCACHED) {
10648348SEric.Yu@Sun.COM 			so->so_proto_props.sopp_zcopyflag |= STRCOPYCACHED;
10658348SEric.Yu@Sun.COM 		}
10668348SEric.Yu@Sun.COM 	}
10678348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_OOBINLINE)
10688348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_oobinline = soppp->sopp_oobinline;
10698348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_RCVTIMER)
10708348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_rcvtimer = soppp->sopp_rcvtimer;
10718348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_RCVTHRESH)
10728348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_rcvthresh = soppp->sopp_rcvthresh;
10738348SEric.Yu@Sun.COM 	if (soppp->sopp_flags & SOCKOPT_MAXADDRLEN)
10748348SEric.Yu@Sun.COM 		so->so_proto_props.sopp_maxaddrlen = soppp->sopp_maxaddrlen;
10758348SEric.Yu@Sun.COM 
10768348SEric.Yu@Sun.COM 	mutex_exit(&so->so_lock);
10778348SEric.Yu@Sun.COM 
10788348SEric.Yu@Sun.COM #ifdef DEBUG
10798348SEric.Yu@Sun.COM 	soppp->sopp_flags &= ~(SOCKOPT_MAXBLK | SOCKOPT_WROFF | SOCKOPT_TAIL |
10808348SEric.Yu@Sun.COM 	    SOCKOPT_RCVHIWAT | SOCKOPT_RCVLOWAT | SOCKOPT_MAXPSZ |
10818348SEric.Yu@Sun.COM 	    SOCKOPT_ZCOPY | SOCKOPT_OOBINLINE | SOCKOPT_RCVTIMER |
10828348SEric.Yu@Sun.COM 	    SOCKOPT_RCVTHRESH | SOCKOPT_MAXADDRLEN | SOCKOPT_MINPSZ);
10838348SEric.Yu@Sun.COM 	ASSERT(soppp->sopp_flags == 0);
10848348SEric.Yu@Sun.COM #endif
10858348SEric.Yu@Sun.COM }
10868348SEric.Yu@Sun.COM 
10878348SEric.Yu@Sun.COM /* ARGSUSED */
10888348SEric.Yu@Sun.COM ssize_t
10898348SEric.Yu@Sun.COM so_queue_msg(sock_upper_handle_t sock_handle, mblk_t *mp,
10908348SEric.Yu@Sun.COM     size_t msg_size, int flags, int *errorp,  boolean_t *force_pushp)
10918348SEric.Yu@Sun.COM {
10928348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
10938348SEric.Yu@Sun.COM 	boolean_t force_push = B_TRUE;
10948348SEric.Yu@Sun.COM 	int space_left;
10958348SEric.Yu@Sun.COM 	sodirect_t *sodp = so->so_direct;
10968348SEric.Yu@Sun.COM 
10978348SEric.Yu@Sun.COM 	ASSERT(errorp != NULL);
10988348SEric.Yu@Sun.COM 	*errorp = 0;
10998348SEric.Yu@Sun.COM 	if (mp == NULL) {
11008348SEric.Yu@Sun.COM 		if (msg_size > 0) {
11018348SEric.Yu@Sun.COM 			ASSERT(so->so_downcalls->sd_recv_uio != NULL);
11028348SEric.Yu@Sun.COM 			mutex_enter(&so->so_lock);
11038348SEric.Yu@Sun.COM 			/* the notify functions will drop the lock */
11048348SEric.Yu@Sun.COM 			if (flags & MSG_OOB)
11058348SEric.Yu@Sun.COM 				so_notify_oobdata(so, IS_SO_OOB_INLINE(so));
11068348SEric.Yu@Sun.COM 			else
11078348SEric.Yu@Sun.COM 				so_notify_data(so, msg_size);
11088348SEric.Yu@Sun.COM 			return (0);
11098348SEric.Yu@Sun.COM 		}
11108348SEric.Yu@Sun.COM 		/*
11118348SEric.Yu@Sun.COM 		 * recv space check
11128348SEric.Yu@Sun.COM 		 */
11138348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
11148348SEric.Yu@Sun.COM 		space_left = so->so_rcvbuf - so->so_rcv_queued;
11158348SEric.Yu@Sun.COM 		if (space_left <= 0) {
11168348SEric.Yu@Sun.COM 			so->so_flowctrld = B_TRUE;
11178348SEric.Yu@Sun.COM 			*errorp = ENOSPC;
11188348SEric.Yu@Sun.COM 			space_left = -1;
11198348SEric.Yu@Sun.COM 		}
11208348SEric.Yu@Sun.COM 		goto done_unlock;
11218348SEric.Yu@Sun.COM 	}
11228348SEric.Yu@Sun.COM 
11238348SEric.Yu@Sun.COM 	ASSERT(mp->b_next == NULL);
11248348SEric.Yu@Sun.COM 	ASSERT(DB_TYPE(mp) == M_DATA || DB_TYPE(mp) == M_PROTO);
11258348SEric.Yu@Sun.COM 	ASSERT(msg_size == msgdsize(mp));
11268348SEric.Yu@Sun.COM 
11278348SEric.Yu@Sun.COM 	if (flags & MSG_OOB) {
11288348SEric.Yu@Sun.COM 		so_queue_oob(sock_handle, mp, msg_size);
11298348SEric.Yu@Sun.COM 		return (0);
11308348SEric.Yu@Sun.COM 	}
11318348SEric.Yu@Sun.COM 
11328348SEric.Yu@Sun.COM 	if (force_pushp != NULL)
11338348SEric.Yu@Sun.COM 		force_push = *force_pushp;
11348348SEric.Yu@Sun.COM 
11358348SEric.Yu@Sun.COM 	if (DB_TYPE(mp) == M_PROTO && !__TPI_PRIM_ISALIGNED(mp->b_rptr)) {
11368348SEric.Yu@Sun.COM 		/* The read pointer is not aligned correctly for TPI */
11378348SEric.Yu@Sun.COM 		zcmn_err(getzoneid(), CE_WARN,
11388348SEric.Yu@Sun.COM 		    "sockfs: Unaligned TPI message received. rptr = %p\n",
11398348SEric.Yu@Sun.COM 		    (void *)mp->b_rptr);
11408348SEric.Yu@Sun.COM 		freemsg(mp);
11418348SEric.Yu@Sun.COM 		mutex_enter(sodp->sod_lockp);
11428348SEric.Yu@Sun.COM 		SOD_UIOAFINI(sodp);
11438348SEric.Yu@Sun.COM 		mutex_exit(sodp->sod_lockp);
11448348SEric.Yu@Sun.COM 
11458348SEric.Yu@Sun.COM 		return (so->so_rcvbuf - so->so_rcv_queued);
11468348SEric.Yu@Sun.COM 	}
11478348SEric.Yu@Sun.COM 
11488348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
11498348SEric.Yu@Sun.COM 	if (so->so_state & (SS_FALLBACK_PENDING | SS_FALLBACK_COMP)) {
11508348SEric.Yu@Sun.COM 		SOD_DISABLE(sodp);
11518348SEric.Yu@Sun.COM 		mutex_exit(&so->so_lock);
11528348SEric.Yu@Sun.COM 		*errorp = EOPNOTSUPP;
11538348SEric.Yu@Sun.COM 		return (-1);
11548348SEric.Yu@Sun.COM 	}
11558348SEric.Yu@Sun.COM 	if (so->so_state & SS_CANTRCVMORE) {
11568348SEric.Yu@Sun.COM 		freemsg(mp);
11578348SEric.Yu@Sun.COM 		SOD_DISABLE(sodp);
11588348SEric.Yu@Sun.COM 		mutex_exit(&so->so_lock);
11598348SEric.Yu@Sun.COM 		return (0);
11608348SEric.Yu@Sun.COM 	}
11618348SEric.Yu@Sun.COM 
11628348SEric.Yu@Sun.COM 	/* process the mblk via I/OAT if capable */
11638348SEric.Yu@Sun.COM 	if (sodp != NULL && (sodp->sod_state & SOD_ENABLED)) {
11648348SEric.Yu@Sun.COM 		if (DB_TYPE(mp) == M_DATA) {
11658348SEric.Yu@Sun.COM 			(void) sod_uioa_mblk_init(sodp, mp, msg_size);
11668348SEric.Yu@Sun.COM 		} else {
11678348SEric.Yu@Sun.COM 			SOD_UIOAFINI(sodp);
11688348SEric.Yu@Sun.COM 		}
11698348SEric.Yu@Sun.COM 	}
11708348SEric.Yu@Sun.COM 
11718348SEric.Yu@Sun.COM 	if (mp->b_next == NULL) {
11728348SEric.Yu@Sun.COM 		so_enqueue_msg(so, mp, msg_size);
11738348SEric.Yu@Sun.COM 	} else {
11748348SEric.Yu@Sun.COM 		do {
11758348SEric.Yu@Sun.COM 			mblk_t *nmp;
11768348SEric.Yu@Sun.COM 
11778348SEric.Yu@Sun.COM 			if ((nmp = mp->b_next) != NULL) {
11788348SEric.Yu@Sun.COM 				mp->b_next = NULL;
11798348SEric.Yu@Sun.COM 			}
11808348SEric.Yu@Sun.COM 			so_enqueue_msg(so, mp, msgdsize(mp));
11818348SEric.Yu@Sun.COM 			mp = nmp;
11828348SEric.Yu@Sun.COM 		} while (mp != NULL);
11838348SEric.Yu@Sun.COM 	}
11848348SEric.Yu@Sun.COM 
11858348SEric.Yu@Sun.COM 	space_left = so->so_rcvbuf - so->so_rcv_queued;
11868348SEric.Yu@Sun.COM 	if (space_left <= 0) {
11878348SEric.Yu@Sun.COM 		so->so_flowctrld = B_TRUE;
11888348SEric.Yu@Sun.COM 		*errorp = ENOSPC;
11898348SEric.Yu@Sun.COM 		space_left = -1;
11908348SEric.Yu@Sun.COM 	}
11918348SEric.Yu@Sun.COM 
11928348SEric.Yu@Sun.COM 	if (force_push || so->so_rcv_queued >= so->so_rcv_thresh ||
11938348SEric.Yu@Sun.COM 	    so->so_rcv_queued >= so->so_rcv_wanted ||
11948348SEric.Yu@Sun.COM 	    (sodp != NULL && so->so_rcv_queued >= sodp->sod_want)) {
11958348SEric.Yu@Sun.COM 		SOCKET_TIMER_CANCEL(so);
11968348SEric.Yu@Sun.COM 		/*
11978348SEric.Yu@Sun.COM 		 * so_notify_data will release the lock
11988348SEric.Yu@Sun.COM 		 */
11998348SEric.Yu@Sun.COM 		so_notify_data(so, so->so_rcv_queued);
12008348SEric.Yu@Sun.COM 
12018348SEric.Yu@Sun.COM 		if (force_pushp != NULL)
12028348SEric.Yu@Sun.COM 			*force_pushp = B_TRUE;
12038348SEric.Yu@Sun.COM 		goto done;
12048348SEric.Yu@Sun.COM 	} else if (so->so_rcv_timer_tid == 0) {
12058348SEric.Yu@Sun.COM 		/* Make sure the recv push timer is running */
12068348SEric.Yu@Sun.COM 		SOCKET_TIMER_START(so);
12078348SEric.Yu@Sun.COM 	}
12088348SEric.Yu@Sun.COM 
12098348SEric.Yu@Sun.COM done_unlock:
12108348SEric.Yu@Sun.COM 	mutex_exit(&so->so_lock);
12118348SEric.Yu@Sun.COM done:
12128348SEric.Yu@Sun.COM 	return (space_left);
12138348SEric.Yu@Sun.COM }
12148348SEric.Yu@Sun.COM 
12158348SEric.Yu@Sun.COM /*
12168348SEric.Yu@Sun.COM  * Set the offset of where the oob data is relative to the bytes in
12178348SEric.Yu@Sun.COM  * queued. Also generate SIGURG
12188348SEric.Yu@Sun.COM  */
12198348SEric.Yu@Sun.COM void
12208348SEric.Yu@Sun.COM so_signal_oob(sock_upper_handle_t sock_handle, ssize_t offset)
12218348SEric.Yu@Sun.COM {
12228348SEric.Yu@Sun.COM 	struct sonode *so;
12238348SEric.Yu@Sun.COM 
12248348SEric.Yu@Sun.COM 	ASSERT(offset >= 0);
12258348SEric.Yu@Sun.COM 	so = (struct sonode *)sock_handle;
12268348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
12278348SEric.Yu@Sun.COM 	SOD_UIOAFINI(so->so_direct);
12288348SEric.Yu@Sun.COM 
12298348SEric.Yu@Sun.COM 	/*
12308348SEric.Yu@Sun.COM 	 * New urgent data on the way so forget about any old
12318348SEric.Yu@Sun.COM 	 * urgent data.
12328348SEric.Yu@Sun.COM 	 */
12338348SEric.Yu@Sun.COM 	so->so_state &= ~(SS_HAVEOOBDATA|SS_HADOOBDATA);
12348348SEric.Yu@Sun.COM 
12358348SEric.Yu@Sun.COM 	/*
12368348SEric.Yu@Sun.COM 	 * Record that urgent data is pending.
12378348SEric.Yu@Sun.COM 	 */
12388348SEric.Yu@Sun.COM 	so->so_state |= SS_OOBPEND;
12398348SEric.Yu@Sun.COM 
12408348SEric.Yu@Sun.COM 	if (so->so_oobmsg != NULL) {
12418348SEric.Yu@Sun.COM 		dprintso(so, 1, ("sock: discarding old oob\n"));
12428348SEric.Yu@Sun.COM 		freemsg(so->so_oobmsg);
12438348SEric.Yu@Sun.COM 		so->so_oobmsg = NULL;
12448348SEric.Yu@Sun.COM 	}
12458348SEric.Yu@Sun.COM 
12468348SEric.Yu@Sun.COM 	/*
12478348SEric.Yu@Sun.COM 	 * set the offset where the urgent byte is
12488348SEric.Yu@Sun.COM 	 */
12498348SEric.Yu@Sun.COM 	so->so_oobmark = so->so_rcv_queued + offset;
12508348SEric.Yu@Sun.COM 	if (so->so_oobmark == 0)
12518348SEric.Yu@Sun.COM 		so->so_state |= SS_RCVATMARK;
12528348SEric.Yu@Sun.COM 	else
12538348SEric.Yu@Sun.COM 		so->so_state &= ~SS_RCVATMARK;
12548348SEric.Yu@Sun.COM 
12558348SEric.Yu@Sun.COM 	so_notify_oobsig(so);
12568348SEric.Yu@Sun.COM }
12578348SEric.Yu@Sun.COM 
12588348SEric.Yu@Sun.COM /*
12598348SEric.Yu@Sun.COM  * Queue the OOB byte
12608348SEric.Yu@Sun.COM  */
12618348SEric.Yu@Sun.COM static void
12628348SEric.Yu@Sun.COM so_queue_oob(sock_upper_handle_t sock_handle, mblk_t *mp, size_t len)
12638348SEric.Yu@Sun.COM {
12648348SEric.Yu@Sun.COM 	struct sonode *so;
12658348SEric.Yu@Sun.COM 
12668348SEric.Yu@Sun.COM 	so = (struct sonode *)sock_handle;
12678348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
12688348SEric.Yu@Sun.COM 	SOD_UIOAFINI(so->so_direct);
12698348SEric.Yu@Sun.COM 
12708348SEric.Yu@Sun.COM 	ASSERT(mp != NULL);
12718348SEric.Yu@Sun.COM 	if (!IS_SO_OOB_INLINE(so)) {
12728348SEric.Yu@Sun.COM 		so->so_oobmsg = mp;
12738348SEric.Yu@Sun.COM 		so->so_state |= SS_HAVEOOBDATA;
12748348SEric.Yu@Sun.COM 	} else {
12758348SEric.Yu@Sun.COM 		so_enqueue_msg(so, mp, len);
12768348SEric.Yu@Sun.COM 	}
12778348SEric.Yu@Sun.COM 
12788348SEric.Yu@Sun.COM 	so_notify_oobdata(so, IS_SO_OOB_INLINE(so));
12798348SEric.Yu@Sun.COM }
12808348SEric.Yu@Sun.COM 
12818348SEric.Yu@Sun.COM int
12828348SEric.Yu@Sun.COM so_close(struct sonode *so, int flag, struct cred *cr)
12838348SEric.Yu@Sun.COM {
12848348SEric.Yu@Sun.COM 	int error;
12858348SEric.Yu@Sun.COM 
12868348SEric.Yu@Sun.COM 	error = (*so->so_downcalls->sd_close)(so->so_proto_handle, flag, cr);
12878348SEric.Yu@Sun.COM 
12888348SEric.Yu@Sun.COM 	/*
12898348SEric.Yu@Sun.COM 	 * At this point there will be no more upcalls from the protocol
12908348SEric.Yu@Sun.COM 	 */
12918348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
1292*8399SRao.Shoaib@Sun.COM 
1293*8399SRao.Shoaib@Sun.COM 	ASSERT(so_verify_oobstate(so));
1294*8399SRao.Shoaib@Sun.COM 
12958348SEric.Yu@Sun.COM 	so_rcv_flush(so);
12968348SEric.Yu@Sun.COM 	mutex_exit(&so->so_lock);
12978348SEric.Yu@Sun.COM 
12988348SEric.Yu@Sun.COM 	return (error);
12998348SEric.Yu@Sun.COM }
13008348SEric.Yu@Sun.COM 
13018348SEric.Yu@Sun.COM void
13028348SEric.Yu@Sun.COM so_zcopy_notify(sock_upper_handle_t sock_handle)
13038348SEric.Yu@Sun.COM {
13048348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
13058348SEric.Yu@Sun.COM 
13068348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
13078348SEric.Yu@Sun.COM 	so->so_copyflag |= STZCNOTIFY;
13088348SEric.Yu@Sun.COM 	cv_broadcast(&so->so_copy_cv);
13098348SEric.Yu@Sun.COM 	mutex_exit(&so->so_lock);
13108348SEric.Yu@Sun.COM }
13118348SEric.Yu@Sun.COM 
13128348SEric.Yu@Sun.COM void
13138348SEric.Yu@Sun.COM so_set_error(sock_upper_handle_t sock_handle, int error)
13148348SEric.Yu@Sun.COM {
13158348SEric.Yu@Sun.COM 	struct sonode *so = (struct sonode *)sock_handle;
13168348SEric.Yu@Sun.COM 
13178348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
13188348SEric.Yu@Sun.COM 
13198348SEric.Yu@Sun.COM 	soseterror(so, error);
13208348SEric.Yu@Sun.COM 
13218348SEric.Yu@Sun.COM 	so_notify_error(so);
13228348SEric.Yu@Sun.COM }
13238348SEric.Yu@Sun.COM 
13248348SEric.Yu@Sun.COM /*
13258348SEric.Yu@Sun.COM  * so_recvmsg - read data from the socket
13268348SEric.Yu@Sun.COM  *
13278348SEric.Yu@Sun.COM  * There are two ways of obtaining data; either we ask the protocol to
13288348SEric.Yu@Sun.COM  * copy directly into the supplied buffer, or we copy data from the
13298348SEric.Yu@Sun.COM  * sonode's receive queue. The decision which one to use depends on
13308348SEric.Yu@Sun.COM  * whether the protocol has a sd_recv_uio down call.
13318348SEric.Yu@Sun.COM  */
13328348SEric.Yu@Sun.COM int
13338348SEric.Yu@Sun.COM so_recvmsg(struct sonode *so, struct nmsghdr *msg, struct uio *uiop,
13348348SEric.Yu@Sun.COM     struct cred *cr)
13358348SEric.Yu@Sun.COM {
13368348SEric.Yu@Sun.COM 	rval_t 		rval;
13378348SEric.Yu@Sun.COM 	int 		flags = 0;
13388348SEric.Yu@Sun.COM 	t_uscalar_t	controllen, namelen;
13398348SEric.Yu@Sun.COM 	int 		error = 0;
13408348SEric.Yu@Sun.COM 	int ret;
13418348SEric.Yu@Sun.COM 	mblk_t		*mctlp = NULL;
13428348SEric.Yu@Sun.COM 	union T_primitives *tpr;
13438348SEric.Yu@Sun.COM 	void		*control;
13448348SEric.Yu@Sun.COM 	ssize_t		saved_resid;
13458348SEric.Yu@Sun.COM 	struct uio	*suiop;
13468348SEric.Yu@Sun.COM 
13478348SEric.Yu@Sun.COM 	SO_BLOCK_FALLBACK(so, SOP_RECVMSG(so, msg, uiop, cr));
13488348SEric.Yu@Sun.COM 
13498348SEric.Yu@Sun.COM 	if ((so->so_state & (SS_ISCONNECTED|SS_CANTRCVMORE)) == 0 &&
13508348SEric.Yu@Sun.COM 	    (so->so_mode & SM_CONNREQUIRED)) {
13518348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
13528348SEric.Yu@Sun.COM 		return (ENOTCONN);
13538348SEric.Yu@Sun.COM 	}
13548348SEric.Yu@Sun.COM 
13558348SEric.Yu@Sun.COM 	if (msg->msg_flags & MSG_PEEK)
13568348SEric.Yu@Sun.COM 		msg->msg_flags &= ~MSG_WAITALL;
13578348SEric.Yu@Sun.COM 
13588348SEric.Yu@Sun.COM 	if (so->so_mode & SM_ATOMIC)
13598348SEric.Yu@Sun.COM 		msg->msg_flags |= MSG_TRUNC;
13608348SEric.Yu@Sun.COM 
13618348SEric.Yu@Sun.COM 	if (msg->msg_flags & MSG_OOB) {
13628348SEric.Yu@Sun.COM 		if ((so->so_mode & SM_EXDATA) == 0) {
13638348SEric.Yu@Sun.COM 			error = EOPNOTSUPP;
13648348SEric.Yu@Sun.COM 		} else if (so->so_downcalls->sd_recv_uio != NULL) {
13658348SEric.Yu@Sun.COM 			error = (*so->so_downcalls->sd_recv_uio)
13668348SEric.Yu@Sun.COM 			    (so->so_proto_handle, uiop, msg, cr);
13678348SEric.Yu@Sun.COM 		} else {
13688348SEric.Yu@Sun.COM 			error = sorecvoob(so, msg, uiop, msg->msg_flags,
13698348SEric.Yu@Sun.COM 			    IS_SO_OOB_INLINE(so));
13708348SEric.Yu@Sun.COM 		}
13718348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
13728348SEric.Yu@Sun.COM 		return (error);
13738348SEric.Yu@Sun.COM 	}
13748348SEric.Yu@Sun.COM 
13758348SEric.Yu@Sun.COM 	/*
13768348SEric.Yu@Sun.COM 	 * If the protocol has the recv down call, then pass the request
13778348SEric.Yu@Sun.COM 	 * down.
13788348SEric.Yu@Sun.COM 	 */
13798348SEric.Yu@Sun.COM 	if (so->so_downcalls->sd_recv_uio != NULL) {
13808348SEric.Yu@Sun.COM 		error = (*so->so_downcalls->sd_recv_uio)
13818348SEric.Yu@Sun.COM 		    (so->so_proto_handle, uiop, msg, cr);
13828348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
13838348SEric.Yu@Sun.COM 		return (error);
13848348SEric.Yu@Sun.COM 	}
13858348SEric.Yu@Sun.COM 
13868348SEric.Yu@Sun.COM 	/*
13878348SEric.Yu@Sun.COM 	 * Reading data from the socket buffer
13888348SEric.Yu@Sun.COM 	 */
13898348SEric.Yu@Sun.COM 	flags = msg->msg_flags;
13908348SEric.Yu@Sun.COM 	msg->msg_flags = 0;
13918348SEric.Yu@Sun.COM 
13928348SEric.Yu@Sun.COM 	/*
13938348SEric.Yu@Sun.COM 	 * Set msg_controllen and msg_namelen to zero here to make it
13948348SEric.Yu@Sun.COM 	 * simpler in the cases that no control or name is returned.
13958348SEric.Yu@Sun.COM 	 */
13968348SEric.Yu@Sun.COM 	controllen = msg->msg_controllen;
13978348SEric.Yu@Sun.COM 	namelen = msg->msg_namelen;
13988348SEric.Yu@Sun.COM 	msg->msg_controllen = 0;
13998348SEric.Yu@Sun.COM 	msg->msg_namelen = 0;
14008348SEric.Yu@Sun.COM 
14018348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
14028348SEric.Yu@Sun.COM 	/* Set SOREADLOCKED */
14038348SEric.Yu@Sun.COM 	error = so_lock_read_intr(so,
14048348SEric.Yu@Sun.COM 	    uiop->uio_fmode | ((flags & MSG_DONTWAIT) ? FNONBLOCK : 0));
14058348SEric.Yu@Sun.COM 	mutex_exit(&so->so_lock);
14068348SEric.Yu@Sun.COM 	if (error) {
14078348SEric.Yu@Sun.COM 		SO_UNBLOCK_FALLBACK(so);
14088348SEric.Yu@Sun.COM 		return (error);
14098348SEric.Yu@Sun.COM 	}
14108348SEric.Yu@Sun.COM 
14118348SEric.Yu@Sun.COM 	suiop = sod_rcv_init(so, flags, &uiop);
14128348SEric.Yu@Sun.COM retry:
14138348SEric.Yu@Sun.COM 	saved_resid = uiop->uio_resid;
14148348SEric.Yu@Sun.COM 	error = so_dequeue_msg(so, &mctlp, uiop, &rval, flags);
14158348SEric.Yu@Sun.COM 	if (error != 0) {
14168348SEric.Yu@Sun.COM 		goto out;
14178348SEric.Yu@Sun.COM 	}
14188348SEric.Yu@Sun.COM 	/*
14198348SEric.Yu@Sun.COM 	 * For datagrams the MOREDATA flag is used to set MSG_TRUNC.
14208348SEric.Yu@Sun.COM 	 * For non-datagrams MOREDATA is used to set MSG_EOR.
14218348SEric.Yu@Sun.COM 	 */
14228348SEric.Yu@Sun.COM 	ASSERT(!(rval.r_val1 & MORECTL));
14238348SEric.Yu@Sun.COM 	if ((rval.r_val1 & MOREDATA) && (so->so_mode & SM_ATOMIC))
14248348SEric.Yu@Sun.COM 		msg->msg_flags |= MSG_TRUNC;
14258348SEric.Yu@Sun.COM 	if (mctlp == NULL) {
14268348SEric.Yu@Sun.COM 		dprintso(so, 1, ("so_recvmsg: got M_DATA\n"));
14278348SEric.Yu@Sun.COM 
14288348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
14298348SEric.Yu@Sun.COM 		/* Set MSG_EOR based on MOREDATA */
14308348SEric.Yu@Sun.COM 		if (!(rval.r_val1 & MOREDATA)) {
14318348SEric.Yu@Sun.COM 			if (so->so_state & SS_SAVEDEOR) {
14328348SEric.Yu@Sun.COM 				msg->msg_flags |= MSG_EOR;
14338348SEric.Yu@Sun.COM 				so->so_state &= ~SS_SAVEDEOR;
14348348SEric.Yu@Sun.COM 			}
14358348SEric.Yu@Sun.COM 		}
14368348SEric.Yu@Sun.COM 		/*
14378348SEric.Yu@Sun.COM 		 * If some data was received (i.e. not EOF) and the
14388348SEric.Yu@Sun.COM 		 * read/recv* has not been satisfied wait for some more.
14398348SEric.Yu@Sun.COM 		 */
14408348SEric.Yu@Sun.COM 		if ((flags & MSG_WAITALL) && !(msg->msg_flags & MSG_EOR) &&
14418348SEric.Yu@Sun.COM 		    uiop->uio_resid != saved_resid && uiop->uio_resid > 0) {
14428348SEric.Yu@Sun.COM 			mutex_exit(&so->so_lock);
14438348SEric.Yu@Sun.COM 			goto retry;
14448348SEric.Yu@Sun.COM 		}
14458348SEric.Yu@Sun.COM 
14468348SEric.Yu@Sun.COM 		goto out_locked;
14478348SEric.Yu@Sun.COM 	}
14488348SEric.Yu@Sun.COM 	/* strsock_proto has already verified length and alignment */
14498348SEric.Yu@Sun.COM 	tpr = (union T_primitives *)mctlp->b_rptr;
14508348SEric.Yu@Sun.COM 	dprintso(so, 1, ("so_recvmsg: type %d\n", tpr->type));
14518348SEric.Yu@Sun.COM 	switch (tpr->type) {
14528348SEric.Yu@Sun.COM 	case T_DATA_IND: {
14538348SEric.Yu@Sun.COM 		/*
14548348SEric.Yu@Sun.COM 		 * Set msg_flags to MSG_EOR based on
14558348SEric.Yu@Sun.COM 		 * MORE_flag and MOREDATA.
14568348SEric.Yu@Sun.COM 		 */
14578348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
14588348SEric.Yu@Sun.COM 		so->so_state &= ~SS_SAVEDEOR;
14598348SEric.Yu@Sun.COM 		if (!(tpr->data_ind.MORE_flag & 1)) {
14608348SEric.Yu@Sun.COM 			if (!(rval.r_val1 & MOREDATA))
14618348SEric.Yu@Sun.COM 				msg->msg_flags |= MSG_EOR;
14628348SEric.Yu@Sun.COM 			else
14638348SEric.Yu@Sun.COM 				so->so_state |= SS_SAVEDEOR;
14648348SEric.Yu@Sun.COM 		}
14658348SEric.Yu@Sun.COM 		freemsg(mctlp);
14668348SEric.Yu@Sun.COM 		/*
14678348SEric.Yu@Sun.COM 		 * If some data was received (i.e. not EOF) and the
14688348SEric.Yu@Sun.COM 		 * read/recv* has not been satisfied wait for some more.
14698348SEric.Yu@Sun.COM 		 */
14708348SEric.Yu@Sun.COM 		if ((flags & MSG_WAITALL) && !(msg->msg_flags & MSG_EOR) &&
14718348SEric.Yu@Sun.COM 		    uiop->uio_resid != saved_resid && uiop->uio_resid > 0) {
14728348SEric.Yu@Sun.COM 			mutex_exit(&so->so_lock);
14738348SEric.Yu@Sun.COM 			goto retry;
14748348SEric.Yu@Sun.COM 		}
14758348SEric.Yu@Sun.COM 		goto out_locked;
14768348SEric.Yu@Sun.COM 	}
14778348SEric.Yu@Sun.COM 	case T_UNITDATA_IND: {
14788348SEric.Yu@Sun.COM 		void *addr;
14798348SEric.Yu@Sun.COM 		t_uscalar_t addrlen;
14808348SEric.Yu@Sun.COM 		void *abuf;
14818348SEric.Yu@Sun.COM 		t_uscalar_t optlen;
14828348SEric.Yu@Sun.COM 		void *opt;
14838348SEric.Yu@Sun.COM 
14848348SEric.Yu@Sun.COM 		if (namelen != 0) {
14858348SEric.Yu@Sun.COM 			/* Caller wants source address */
14868348SEric.Yu@Sun.COM 			addrlen = tpr->unitdata_ind.SRC_length;
14878348SEric.Yu@Sun.COM 			addr = sogetoff(mctlp, tpr->unitdata_ind.SRC_offset,
14888348SEric.Yu@Sun.COM 			    addrlen, 1);
14898348SEric.Yu@Sun.COM 			if (addr == NULL) {
14908348SEric.Yu@Sun.COM 				freemsg(mctlp);
14918348SEric.Yu@Sun.COM 				error = EPROTO;
14928348SEric.Yu@Sun.COM 				eprintsoline(so, error);
14938348SEric.Yu@Sun.COM 				goto out;
14948348SEric.Yu@Sun.COM 			}
14958348SEric.Yu@Sun.COM 			ASSERT(so->so_family != AF_UNIX);
14968348SEric.Yu@Sun.COM 		}
14978348SEric.Yu@Sun.COM 		optlen = tpr->unitdata_ind.OPT_length;
14988348SEric.Yu@Sun.COM 		if (optlen != 0) {
14998348SEric.Yu@Sun.COM 			t_uscalar_t ncontrollen;
15008348SEric.Yu@Sun.COM 
15018348SEric.Yu@Sun.COM 			/*
15028348SEric.Yu@Sun.COM 			 * Extract any source address option.
15038348SEric.Yu@Sun.COM 			 * Determine how large cmsg buffer is needed.
15048348SEric.Yu@Sun.COM 			 */
15058348SEric.Yu@Sun.COM 			opt = sogetoff(mctlp, tpr->unitdata_ind.OPT_offset,
15068348SEric.Yu@Sun.COM 			    optlen, __TPI_ALIGN_SIZE);
15078348SEric.Yu@Sun.COM 
15088348SEric.Yu@Sun.COM 			if (opt == NULL) {
15098348SEric.Yu@Sun.COM 				freemsg(mctlp);
15108348SEric.Yu@Sun.COM 				error = EPROTO;
15118348SEric.Yu@Sun.COM 				eprintsoline(so, error);
15128348SEric.Yu@Sun.COM 				goto out;
15138348SEric.Yu@Sun.COM 			}
15148348SEric.Yu@Sun.COM 			if (so->so_family == AF_UNIX)
15158348SEric.Yu@Sun.COM 				so_getopt_srcaddr(opt, optlen, &addr, &addrlen);
15168348SEric.Yu@Sun.COM 			ncontrollen = so_cmsglen(mctlp, opt, optlen,
15178348SEric.Yu@Sun.COM 			    !(flags & MSG_XPG4_2));
15188348SEric.Yu@Sun.COM 			if (controllen != 0)
15198348SEric.Yu@Sun.COM 				controllen = ncontrollen;
15208348SEric.Yu@Sun.COM 			else if (ncontrollen != 0)
15218348SEric.Yu@Sun.COM 				msg->msg_flags |= MSG_CTRUNC;
15228348SEric.Yu@Sun.COM 		} else {
15238348SEric.Yu@Sun.COM 			controllen = 0;
15248348SEric.Yu@Sun.COM 		}
15258348SEric.Yu@Sun.COM 
15268348SEric.Yu@Sun.COM 		if (namelen != 0) {
15278348SEric.Yu@Sun.COM 			/*
15288348SEric.Yu@Sun.COM 			 * Return address to caller.
15298348SEric.Yu@Sun.COM 			 * Caller handles truncation if length
15308348SEric.Yu@Sun.COM 			 * exceeds msg_namelen.
15318348SEric.Yu@Sun.COM 			 * NOTE: AF_UNIX NUL termination is ensured by
15328348SEric.Yu@Sun.COM 			 * the sender's copyin_name().
15338348SEric.Yu@Sun.COM 			 */
15348348SEric.Yu@Sun.COM 			abuf = kmem_alloc(addrlen, KM_SLEEP);
15358348SEric.Yu@Sun.COM 
15368348SEric.Yu@Sun.COM 			bcopy(addr, abuf, addrlen);
15378348SEric.Yu@Sun.COM 			msg->msg_name = abuf;
15388348SEric.Yu@Sun.COM 			msg->msg_namelen = addrlen;
15398348SEric.Yu@Sun.COM 		}
15408348SEric.Yu@Sun.COM 
15418348SEric.Yu@Sun.COM 		if (controllen != 0) {
15428348SEric.Yu@Sun.COM 			/*
15438348SEric.Yu@Sun.COM 			 * Return control msg to caller.
15448348SEric.Yu@Sun.COM 			 * Caller handles truncation if length
15458348SEric.Yu@Sun.COM 			 * exceeds msg_controllen.
15468348SEric.Yu@Sun.COM 			 */
15478348SEric.Yu@Sun.COM 			control = kmem_zalloc(controllen, KM_SLEEP);
15488348SEric.Yu@Sun.COM 
15498348SEric.Yu@Sun.COM 			error = so_opt2cmsg(mctlp, opt, optlen,
15508348SEric.Yu@Sun.COM 			    !(flags & MSG_XPG4_2), control, controllen);
15518348SEric.Yu@Sun.COM 			if (error) {
15528348SEric.Yu@Sun.COM 				freemsg(mctlp);
15538348SEric.Yu@Sun.COM 				if (msg->msg_namelen != 0)
15548348SEric.Yu@Sun.COM 					kmem_free(msg->msg_name,
15558348SEric.Yu@Sun.COM 					    msg->msg_namelen);
15568348SEric.Yu@Sun.COM 				kmem_free(control, controllen);
15578348SEric.Yu@Sun.COM 				eprintsoline(so, error);
15588348SEric.Yu@Sun.COM 				goto out;
15598348SEric.Yu@Sun.COM 			}
15608348SEric.Yu@Sun.COM 			msg->msg_control = control;
15618348SEric.Yu@Sun.COM 			msg->msg_controllen = controllen;
15628348SEric.Yu@Sun.COM 		}
15638348SEric.Yu@Sun.COM 
15648348SEric.Yu@Sun.COM 		freemsg(mctlp);
15658348SEric.Yu@Sun.COM 		goto out;
15668348SEric.Yu@Sun.COM 	}
15678348SEric.Yu@Sun.COM 	case T_OPTDATA_IND: {
15688348SEric.Yu@Sun.COM 		struct T_optdata_req *tdr;
15698348SEric.Yu@Sun.COM 		void *opt;
15708348SEric.Yu@Sun.COM 		t_uscalar_t optlen;
15718348SEric.Yu@Sun.COM 
15728348SEric.Yu@Sun.COM 		tdr = (struct T_optdata_req *)mctlp->b_rptr;
15738348SEric.Yu@Sun.COM 		optlen = tdr->OPT_length;
15748348SEric.Yu@Sun.COM 		if (optlen != 0) {
15758348SEric.Yu@Sun.COM 			t_uscalar_t ncontrollen;
15768348SEric.Yu@Sun.COM 			/*
15778348SEric.Yu@Sun.COM 			 * Determine how large cmsg buffer is needed.
15788348SEric.Yu@Sun.COM 			 */
15798348SEric.Yu@Sun.COM 			opt = sogetoff(mctlp,
15808348SEric.Yu@Sun.COM 			    tpr->optdata_ind.OPT_offset, optlen,
15818348SEric.Yu@Sun.COM 			    __TPI_ALIGN_SIZE);
15828348SEric.Yu@Sun.COM 
15838348SEric.Yu@Sun.COM 			if (opt == NULL) {
15848348SEric.Yu@Sun.COM 				freemsg(mctlp);
15858348SEric.Yu@Sun.COM 				error = EPROTO;
15868348SEric.Yu@Sun.COM 				eprintsoline(so, error);
15878348SEric.Yu@Sun.COM 				goto out;
15888348SEric.Yu@Sun.COM 			}
15898348SEric.Yu@Sun.COM 
15908348SEric.Yu@Sun.COM 			ncontrollen = so_cmsglen(mctlp, opt, optlen,
15918348SEric.Yu@Sun.COM 			    !(flags & MSG_XPG4_2));
15928348SEric.Yu@Sun.COM 			if (controllen != 0)
15938348SEric.Yu@Sun.COM 				controllen = ncontrollen;
15948348SEric.Yu@Sun.COM 			else if (ncontrollen != 0)
15958348SEric.Yu@Sun.COM 				msg->msg_flags |= MSG_CTRUNC;
15968348SEric.Yu@Sun.COM 		} else {
15978348SEric.Yu@Sun.COM 			controllen = 0;
15988348SEric.Yu@Sun.COM 		}
15998348SEric.Yu@Sun.COM 
16008348SEric.Yu@Sun.COM 		if (controllen != 0) {
16018348SEric.Yu@Sun.COM 			/*
16028348SEric.Yu@Sun.COM 			 * Return control msg to caller.
16038348SEric.Yu@Sun.COM 			 * Caller handles truncation if length
16048348SEric.Yu@Sun.COM 			 * exceeds msg_controllen.
16058348SEric.Yu@Sun.COM 			 */
16068348SEric.Yu@Sun.COM 			control = kmem_zalloc(controllen, KM_SLEEP);
16078348SEric.Yu@Sun.COM 
16088348SEric.Yu@Sun.COM 			error = so_opt2cmsg(mctlp, opt, optlen,
16098348SEric.Yu@Sun.COM 			    !(flags & MSG_XPG4_2), control, controllen);
16108348SEric.Yu@Sun.COM 			if (error) {
16118348SEric.Yu@Sun.COM 				freemsg(mctlp);
16128348SEric.Yu@Sun.COM 				kmem_free(control, controllen);
16138348SEric.Yu@Sun.COM 				eprintsoline(so, error);
16148348SEric.Yu@Sun.COM 				goto out;
16158348SEric.Yu@Sun.COM 			}
16168348SEric.Yu@Sun.COM 			msg->msg_control = control;
16178348SEric.Yu@Sun.COM 			msg->msg_controllen = controllen;
16188348SEric.Yu@Sun.COM 		}
16198348SEric.Yu@Sun.COM 
16208348SEric.Yu@Sun.COM 		/*
16218348SEric.Yu@Sun.COM 		 * Set msg_flags to MSG_EOR based on
16228348SEric.Yu@Sun.COM 		 * DATA_flag and MOREDATA.
16238348SEric.Yu@Sun.COM 		 */
16248348SEric.Yu@Sun.COM 		mutex_enter(&so->so_lock);
16258348SEric.Yu@Sun.COM 		so->so_state &= ~SS_SAVEDEOR;
16268348SEric.Yu@Sun.COM 		if (!(tpr->data_ind.MORE_flag & 1)) {
16278348SEric.Yu@Sun.COM 			if (!(rval.r_val1 & MOREDATA))
16288348SEric.Yu@Sun.COM 				msg->msg_flags |= MSG_EOR;
16298348SEric.Yu@Sun.COM 			else
16308348SEric.Yu@Sun.COM 				so->so_state |= SS_SAVEDEOR;
16318348SEric.Yu@Sun.COM 		}
16328348SEric.Yu@Sun.COM 		freemsg(mctlp);
16338348SEric.Yu@Sun.COM 		/*
16348348SEric.Yu@Sun.COM 		 * If some data was received (i.e. not EOF) and the
16358348SEric.Yu@Sun.COM 		 * read/recv* has not been satisfied wait for some more.
16368348SEric.Yu@Sun.COM 		 * Not possible to wait if control info was received.
16378348SEric.Yu@Sun.COM 		 */
16388348SEric.Yu@Sun.COM 		if ((flags & MSG_WAITALL) && !(msg->msg_flags & MSG_EOR) &&
16398348SEric.Yu@Sun.COM 		    controllen == 0 &&
16408348SEric.Yu@Sun.COM 		    uiop->uio_resid != saved_resid && uiop->uio_resid > 0) {
16418348SEric.Yu@Sun.COM 			mutex_exit(&so->so_lock);
16428348SEric.Yu@Sun.COM 			goto retry;
16438348SEric.Yu@Sun.COM 		}
16448348SEric.Yu@Sun.COM 		goto out_locked;
16458348SEric.Yu@Sun.COM 	}
16468348SEric.Yu@Sun.COM 	default:
16478348SEric.Yu@Sun.COM 		cmn_err(CE_CONT, "so_recvmsg bad type %x \n",
16488348SEric.Yu@Sun.COM 		    tpr->type);
16498348SEric.Yu@Sun.COM 		freemsg(mctlp);
16508348SEric.Yu@Sun.COM 		error = EPROTO;
16518348SEric.Yu@Sun.COM 		ASSERT(0);
16528348SEric.Yu@Sun.COM 	}
16538348SEric.Yu@Sun.COM out:
16548348SEric.Yu@Sun.COM 	mutex_enter(&so->so_lock);
16558348SEric.Yu@Sun.COM out_locked:
16568348SEric.Yu@Sun.COM 	/* The sod_lockp pointers to the sonode so_lock */
16578348SEric.Yu@Sun.COM 	ret = sod_rcv_done(so, suiop, uiop);
16588348SEric.Yu@Sun.COM 	if (ret != 0 && error == 0)
16598348SEric.Yu@Sun.COM 		error = ret;
16608348SEric.Yu@Sun.COM 
16618348SEric.Yu@Sun.COM 	so_unlock_read(so);	/* Clear SOREADLOCKED */
16628348SEric.Yu@Sun.COM 	mutex_exit(&so->so_lock);
16638348SEric.Yu@Sun.COM 
16648348SEric.Yu@Sun.COM 	SO_UNBLOCK_FALLBACK(so);
16658348SEric.Yu@Sun.COM 
16668348SEric.Yu@Sun.COM 	return (error);
16678348SEric.Yu@Sun.COM }
16688348SEric.Yu@Sun.COM 
16698348SEric.Yu@Sun.COM sonodeops_t so_sonodeops = {
16708348SEric.Yu@Sun.COM 	so_init,		/* sop_init	*/
16718348SEric.Yu@Sun.COM 	so_accept,		/* sop_accept   */
16728348SEric.Yu@Sun.COM 	so_bind,		/* sop_bind	*/
16738348SEric.Yu@Sun.COM 	so_listen,		/* sop_listen   */
16748348SEric.Yu@Sun.COM 	so_connect,		/* sop_connect  */
16758348SEric.Yu@Sun.COM 	so_recvmsg,		/* sop_recvmsg  */
16768348SEric.Yu@Sun.COM 	so_sendmsg,		/* sop_sendmsg  */
16778348SEric.Yu@Sun.COM 	so_sendmblk,		/* sop_sendmblk */
16788348SEric.Yu@Sun.COM 	so_getpeername,		/* sop_getpeername */
16798348SEric.Yu@Sun.COM 	so_getsockname,		/* sop_getsockname */
16808348SEric.Yu@Sun.COM 	so_shutdown,		/* sop_shutdown */
16818348SEric.Yu@Sun.COM 	so_getsockopt,		/* sop_getsockopt */
16828348SEric.Yu@Sun.COM 	so_setsockopt,		/* sop_setsockopt */
16838348SEric.Yu@Sun.COM 	so_ioctl,		/* sop_ioctl    */
16848348SEric.Yu@Sun.COM 	so_poll,		/* sop_poll	*/
16858348SEric.Yu@Sun.COM 	so_close,		/* sop_close */
16868348SEric.Yu@Sun.COM };
16878348SEric.Yu@Sun.COM 
16888348SEric.Yu@Sun.COM sock_upcalls_t so_upcalls = {
16898348SEric.Yu@Sun.COM 	so_newconn,
16908348SEric.Yu@Sun.COM 	so_connected,
16918348SEric.Yu@Sun.COM 	so_disconnected,
16928348SEric.Yu@Sun.COM 	so_opctl,
16938348SEric.Yu@Sun.COM 	so_queue_msg,
16948348SEric.Yu@Sun.COM 	so_set_prop,
16958348SEric.Yu@Sun.COM 	so_txq_full,
16968348SEric.Yu@Sun.COM 	so_signal_oob,
16978348SEric.Yu@Sun.COM 	so_zcopy_notify,
16988348SEric.Yu@Sun.COM 	so_set_error
16998348SEric.Yu@Sun.COM };
1700