xref: /freebsd-src/sys/ofed/drivers/infiniband/ulp/sdp/sdp_main.c (revision 296a4cb5c5b18f82da7a365d9f209cb9fc09003b)
1aa0a1e58SJeff Roberson /*-
251369649SPedro F. Giffuni  * SPDX-License-Identifier: BSD-3-Clause
351369649SPedro F. Giffuni  *
4aa0a1e58SJeff Roberson  * Copyright (c) 1982, 1986, 1988, 1990, 1993, 1995
5aa0a1e58SJeff Roberson  *      The Regents of the University of California.  All rights reserved.
6aa0a1e58SJeff Roberson  * Copyright (c) 2004 The FreeBSD Foundation.  All rights reserved.
7aa0a1e58SJeff Roberson  * Copyright (c) 2004-2008 Robert N. M. Watson.  All rights reserved.
8aa0a1e58SJeff Roberson  *
9aa0a1e58SJeff Roberson  * Redistribution and use in source and binary forms, with or without
10aa0a1e58SJeff Roberson  * modification, are permitted provided that the following conditions
11aa0a1e58SJeff Roberson  * are met:
12aa0a1e58SJeff Roberson  * 1. Redistributions of source code must retain the above copyright
13aa0a1e58SJeff Roberson  *    notice, this list of conditions and the following disclaimer.
14aa0a1e58SJeff Roberson  * 2. Redistributions in binary form must reproduce the above copyright
15aa0a1e58SJeff Roberson  *    notice, this list of conditions and the following disclaimer in the
16aa0a1e58SJeff Roberson  *    documentation and/or other materials provided with the distribution.
17fbbd9655SWarner Losh  * 3. Neither the name of the University nor the names of its contributors
18aa0a1e58SJeff Roberson  *    may be used to endorse or promote products derived from this software
19aa0a1e58SJeff Roberson  *    without specific prior written permission.
20aa0a1e58SJeff Roberson  *
21aa0a1e58SJeff Roberson  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
22aa0a1e58SJeff Roberson  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23aa0a1e58SJeff Roberson  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24aa0a1e58SJeff Roberson  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25aa0a1e58SJeff Roberson  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
26aa0a1e58SJeff Roberson  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
27aa0a1e58SJeff Roberson  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
28aa0a1e58SJeff Roberson  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
29aa0a1e58SJeff Roberson  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
30aa0a1e58SJeff Roberson  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
31aa0a1e58SJeff Roberson  * SUCH DAMAGE.
32aa0a1e58SJeff Roberson  *
33aa0a1e58SJeff Roberson  * Excerpts taken from tcp_subr.c, tcp_usrreq.c, uipc_socket.c
34aa0a1e58SJeff Roberson  */
35aa0a1e58SJeff Roberson 
36aa0a1e58SJeff Roberson /*
37aa0a1e58SJeff Roberson  *
38aa0a1e58SJeff Roberson  * Copyright (c) 2010 Isilon Systems, Inc.
39aa0a1e58SJeff Roberson  * Copyright (c) 2010 iX Systems, Inc.
40aa0a1e58SJeff Roberson  * Copyright (c) 2010 Panasas, Inc.
41aa0a1e58SJeff Roberson  * All rights reserved.
42aa0a1e58SJeff Roberson  *
43aa0a1e58SJeff Roberson  * Redistribution and use in source and binary forms, with or without
44aa0a1e58SJeff Roberson  * modification, are permitted provided that the following conditions
45aa0a1e58SJeff Roberson  * are met:
46aa0a1e58SJeff Roberson  * 1. Redistributions of source code must retain the above copyright
47aa0a1e58SJeff Roberson  *    notice unmodified, this list of conditions, and the following
48aa0a1e58SJeff Roberson  *    disclaimer.
49aa0a1e58SJeff Roberson  * 2. Redistributions in binary form must reproduce the above copyright
50aa0a1e58SJeff Roberson  *    notice, this list of conditions and the following disclaimer in the
51aa0a1e58SJeff Roberson  *    documentation and/or other materials provided with the distribution.
52aa0a1e58SJeff Roberson  *
53aa0a1e58SJeff Roberson  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
54aa0a1e58SJeff Roberson  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
55aa0a1e58SJeff Roberson  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
56aa0a1e58SJeff Roberson  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
57aa0a1e58SJeff Roberson  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
58aa0a1e58SJeff Roberson  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
59aa0a1e58SJeff Roberson  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
60aa0a1e58SJeff Roberson  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
61aa0a1e58SJeff Roberson  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
62aa0a1e58SJeff Roberson  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
63aa0a1e58SJeff Roberson  *
64aa0a1e58SJeff Roberson  */
65fdafd315SWarner Losh 
66d3461164SMark Johnston #include <sys/param.h>
67e12be321SConrad Meyer #include <sys/eventhandler.h>
68d3461164SMark Johnston #include <sys/kernel.h>
69d3461164SMark Johnston #include <sys/malloc.h>
70d3461164SMark Johnston 
71aa0a1e58SJeff Roberson #include "sdp.h"
72aa0a1e58SJeff Roberson 
73aa0a1e58SJeff Roberson #include <net/if.h>
74aa0a1e58SJeff Roberson #include <net/route.h>
75aa0a1e58SJeff Roberson #include <net/vnet.h>
764813ad54SHans Petter Selasky #include <sys/sysctl.h>
77aa0a1e58SJeff Roberson 
78aa0a1e58SJeff Roberson uma_zone_t	sdp_zone;
79aa0a1e58SJeff Roberson struct rwlock	sdp_lock;
80aa0a1e58SJeff Roberson LIST_HEAD(, sdp_sock) sdp_list;
81aa0a1e58SJeff Roberson 
82aa0a1e58SJeff Roberson struct workqueue_struct *rx_comp_wq;
83aa0a1e58SJeff Roberson 
84aa0a1e58SJeff Roberson RW_SYSINIT(sdplockinit, &sdp_lock, "SDP lock");
85aa0a1e58SJeff Roberson #define	SDP_LIST_WLOCK()	rw_wlock(&sdp_lock)
86aa0a1e58SJeff Roberson #define	SDP_LIST_RLOCK()	rw_rlock(&sdp_lock)
87aa0a1e58SJeff Roberson #define	SDP_LIST_WUNLOCK()	rw_wunlock(&sdp_lock)
88aa0a1e58SJeff Roberson #define	SDP_LIST_RUNLOCK()	rw_runlock(&sdp_lock)
89aa0a1e58SJeff Roberson #define	SDP_LIST_WLOCK_ASSERT()	rw_assert(&sdp_lock, RW_WLOCKED)
90aa0a1e58SJeff Roberson #define	SDP_LIST_RLOCK_ASSERT()	rw_assert(&sdp_lock, RW_RLOCKED)
91aa0a1e58SJeff Roberson #define	SDP_LIST_LOCK_ASSERT()	rw_assert(&sdp_lock, RW_LOCKED)
92aa0a1e58SJeff Roberson 
93d3461164SMark Johnston MALLOC_DEFINE(M_SDP, "sdp", "Sockets Direct Protocol");
94aa0a1e58SJeff Roberson 
95aa0a1e58SJeff Roberson static void sdp_stop_keepalive_timer(struct socket *so);
96aa0a1e58SJeff Roberson 
97aa0a1e58SJeff Roberson /*
98aa0a1e58SJeff Roberson  * SDP protocol interface to socket abstraction.
99aa0a1e58SJeff Roberson  */
100aa0a1e58SJeff Roberson /*
101aa0a1e58SJeff Roberson  * sdp_sendspace and sdp_recvspace are the default send and receive window
102aa0a1e58SJeff Roberson  * sizes, respectively.
103aa0a1e58SJeff Roberson  */
104aa0a1e58SJeff Roberson u_long	sdp_sendspace = 1024*32;
105aa0a1e58SJeff Roberson u_long	sdp_recvspace = 1024*64;
106aa0a1e58SJeff Roberson 
107aa0a1e58SJeff Roberson static int sdp_count;
108aa0a1e58SJeff Roberson 
109aa0a1e58SJeff Roberson /*
110aa0a1e58SJeff Roberson  * Disable async. CMA events for sockets which are being torn down.
111aa0a1e58SJeff Roberson  */
112aa0a1e58SJeff Roberson static void
sdp_destroy_cma(struct sdp_sock * ssk)113aa0a1e58SJeff Roberson sdp_destroy_cma(struct sdp_sock *ssk)
114aa0a1e58SJeff Roberson {
115aa0a1e58SJeff Roberson 
116aa0a1e58SJeff Roberson 	if (ssk->id == NULL)
117aa0a1e58SJeff Roberson 		return;
118aa0a1e58SJeff Roberson 	rdma_destroy_id(ssk->id);
119aa0a1e58SJeff Roberson 	ssk->id = NULL;
120aa0a1e58SJeff Roberson }
121aa0a1e58SJeff Roberson 
122aa0a1e58SJeff Roberson static int
sdp_pcbbind(struct sdp_sock * ssk,struct sockaddr * nam,struct ucred * cred)123aa0a1e58SJeff Roberson sdp_pcbbind(struct sdp_sock *ssk, struct sockaddr *nam, struct ucred *cred)
124aa0a1e58SJeff Roberson {
125aa0a1e58SJeff Roberson 	struct sockaddr_in *sin;
126aa0a1e58SJeff Roberson 	struct sockaddr_in null;
127aa0a1e58SJeff Roberson 	int error;
128aa0a1e58SJeff Roberson 
129aa0a1e58SJeff Roberson 	SDP_WLOCK_ASSERT(ssk);
130aa0a1e58SJeff Roberson 
131aa0a1e58SJeff Roberson 	if (ssk->lport != 0 || ssk->laddr != INADDR_ANY)
132aa0a1e58SJeff Roberson 		return (EINVAL);
133aa0a1e58SJeff Roberson 	/* rdma_bind_addr handles bind races.  */
134aa0a1e58SJeff Roberson 	SDP_WUNLOCK(ssk);
135aa0a1e58SJeff Roberson 	if (ssk->id == NULL)
136c69c74b8SHans Petter Selasky 		ssk->id = rdma_create_id(&init_net, sdp_cma_handler, ssk, RDMA_PS_SDP, IB_QPT_RC);
137aa0a1e58SJeff Roberson 	if (ssk->id == NULL) {
138aa0a1e58SJeff Roberson 		SDP_WLOCK(ssk);
139aa0a1e58SJeff Roberson 		return (ENOMEM);
140aa0a1e58SJeff Roberson 	}
141aa0a1e58SJeff Roberson 	if (nam == NULL) {
142aa0a1e58SJeff Roberson 		null.sin_family = AF_INET;
143aa0a1e58SJeff Roberson 		null.sin_len = sizeof(null);
144aa0a1e58SJeff Roberson 		null.sin_addr.s_addr = INADDR_ANY;
145aa0a1e58SJeff Roberson 		null.sin_port = 0;
146aa0a1e58SJeff Roberson 		bzero(&null.sin_zero, sizeof(null.sin_zero));
147aa0a1e58SJeff Roberson 		nam = (struct sockaddr *)&null;
148aa0a1e58SJeff Roberson 	}
149aa0a1e58SJeff Roberson 	error = -rdma_bind_addr(ssk->id, nam);
150aa0a1e58SJeff Roberson 	SDP_WLOCK(ssk);
151aa0a1e58SJeff Roberson 	if (error == 0) {
152aa0a1e58SJeff Roberson 		sin = (struct sockaddr_in *)&ssk->id->route.addr.src_addr;
153aa0a1e58SJeff Roberson 		ssk->laddr = sin->sin_addr.s_addr;
154aa0a1e58SJeff Roberson 		ssk->lport = sin->sin_port;
155aa0a1e58SJeff Roberson 	} else
156aa0a1e58SJeff Roberson 		sdp_destroy_cma(ssk);
157aa0a1e58SJeff Roberson 	return (error);
158aa0a1e58SJeff Roberson }
159aa0a1e58SJeff Roberson 
160aa0a1e58SJeff Roberson static void
sdp_pcbfree(struct sdp_sock * ssk)161aa0a1e58SJeff Roberson sdp_pcbfree(struct sdp_sock *ssk)
162aa0a1e58SJeff Roberson {
163adaf3c49SMark Johnston 
164aa0a1e58SJeff Roberson 	KASSERT(ssk->socket == NULL, ("ssk %p socket still attached", ssk));
165adaf3c49SMark Johnston 	KASSERT((ssk->flags & SDP_DESTROY) == 0,
166adaf3c49SMark Johnston 	    ("ssk %p already destroyed", ssk));
167aa0a1e58SJeff Roberson 
168aa0a1e58SJeff Roberson 	sdp_dbg(ssk->socket, "Freeing pcb");
169aa0a1e58SJeff Roberson 	SDP_WLOCK_ASSERT(ssk);
170aa0a1e58SJeff Roberson 	ssk->flags |= SDP_DESTROY;
171aa0a1e58SJeff Roberson 	SDP_WUNLOCK(ssk);
172aa0a1e58SJeff Roberson 	SDP_LIST_WLOCK();
173aa0a1e58SJeff Roberson 	sdp_count--;
174aa0a1e58SJeff Roberson 	LIST_REMOVE(ssk, list);
175aa0a1e58SJeff Roberson 	SDP_LIST_WUNLOCK();
176aa0a1e58SJeff Roberson 	crfree(ssk->cred);
177aa0a1e58SJeff Roberson 	ssk->qp_active = 0;
178aa0a1e58SJeff Roberson 	if (ssk->qp) {
179aa0a1e58SJeff Roberson 		ib_destroy_qp(ssk->qp);
180aa0a1e58SJeff Roberson 		ssk->qp = NULL;
181aa0a1e58SJeff Roberson 	}
182aa0a1e58SJeff Roberson 	sdp_tx_ring_destroy(ssk);
183aa0a1e58SJeff Roberson 	sdp_rx_ring_destroy(ssk);
184adaf3c49SMark Johnston 	sdp_destroy_cma(ssk);
185aa0a1e58SJeff Roberson 	rw_destroy(&ssk->rx_ring.destroyed_lock);
186aa0a1e58SJeff Roberson 	rw_destroy(&ssk->lock);
187fa46ade8SMark Johnston 	uma_zfree(sdp_zone, ssk);
188aa0a1e58SJeff Roberson }
189aa0a1e58SJeff Roberson 
190aa0a1e58SJeff Roberson static int
sdp_getsockaddr(struct socket * so,struct sockaddr * sa)1910fac350cSGleb Smirnoff sdp_getsockaddr(struct socket *so, struct sockaddr *sa)
192aa0a1e58SJeff Roberson {
1930fac350cSGleb Smirnoff 	struct sdp_sock *ssk = sdp_sk(so);
194aa0a1e58SJeff Roberson 
195aa0a1e58SJeff Roberson 	SDP_RLOCK(ssk);
1960fac350cSGleb Smirnoff 	*(struct sockaddr_in *)sa = (struct sockaddr_in ){
1970fac350cSGleb Smirnoff 		.sin_family = AF_INET,
1980fac350cSGleb Smirnoff 		.sin_len = sizeof(struct sockaddr_in),
1990fac350cSGleb Smirnoff 		.sin_addr.s_addr = ssk->laddr,
2000fac350cSGleb Smirnoff 		.sin_port = ssk->lport,
2010fac350cSGleb Smirnoff 	};
202aa0a1e58SJeff Roberson 	SDP_RUNLOCK(ssk);
203aa0a1e58SJeff Roberson 
2040fac350cSGleb Smirnoff 	return (0);
205aa0a1e58SJeff Roberson }
206aa0a1e58SJeff Roberson 
207aa0a1e58SJeff Roberson static int
sdp_getpeeraddr(struct socket * so,struct sockaddr * sa)2080fac350cSGleb Smirnoff sdp_getpeeraddr(struct socket *so, struct sockaddr *sa)
209aa0a1e58SJeff Roberson {
2100fac350cSGleb Smirnoff 	struct sdp_sock *ssk = sdp_sk(so);
211aa0a1e58SJeff Roberson 
212aa0a1e58SJeff Roberson 	SDP_RLOCK(ssk);
2130fac350cSGleb Smirnoff 	*(struct sockaddr_in *)sa = (struct sockaddr_in ){
2140fac350cSGleb Smirnoff 		.sin_family = AF_INET,
2150fac350cSGleb Smirnoff 		.sin_len = sizeof(struct sockaddr_in),
2160fac350cSGleb Smirnoff 		.sin_addr.s_addr = ssk->faddr,
2170fac350cSGleb Smirnoff 		.sin_port = ssk->fport,
2180fac350cSGleb Smirnoff 	};
219aa0a1e58SJeff Roberson 	SDP_RUNLOCK(ssk);
220aa0a1e58SJeff Roberson 
2210fac350cSGleb Smirnoff 	return (0);
222aa0a1e58SJeff Roberson }
223aa0a1e58SJeff Roberson 
224aa0a1e58SJeff Roberson #if 0
225aa0a1e58SJeff Roberson static void
226aa0a1e58SJeff Roberson sdp_apply_all(void (*func)(struct sdp_sock *, void *), void *arg)
227aa0a1e58SJeff Roberson {
228aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
229aa0a1e58SJeff Roberson 
230aa0a1e58SJeff Roberson 	SDP_LIST_RLOCK();
231aa0a1e58SJeff Roberson 	LIST_FOREACH(ssk, &sdp_list, list) {
232aa0a1e58SJeff Roberson 		SDP_WLOCK(ssk);
233aa0a1e58SJeff Roberson 		func(ssk, arg);
234aa0a1e58SJeff Roberson 		SDP_WUNLOCK(ssk);
235aa0a1e58SJeff Roberson 	}
236aa0a1e58SJeff Roberson 	SDP_LIST_RUNLOCK();
237aa0a1e58SJeff Roberson }
238aa0a1e58SJeff Roberson #endif
239aa0a1e58SJeff Roberson 
240aa0a1e58SJeff Roberson static void
sdp_output_reset(struct sdp_sock * ssk)241aa0a1e58SJeff Roberson sdp_output_reset(struct sdp_sock *ssk)
242aa0a1e58SJeff Roberson {
243aa0a1e58SJeff Roberson 	struct rdma_cm_id *id;
244aa0a1e58SJeff Roberson 
245aa0a1e58SJeff Roberson 	SDP_WLOCK_ASSERT(ssk);
246aa0a1e58SJeff Roberson 	if (ssk->id) {
247aa0a1e58SJeff Roberson 		id = ssk->id;
248aa0a1e58SJeff Roberson 		ssk->qp_active = 0;
249aa0a1e58SJeff Roberson 		SDP_WUNLOCK(ssk);
250aa0a1e58SJeff Roberson 		rdma_disconnect(id);
251aa0a1e58SJeff Roberson 		SDP_WLOCK(ssk);
252aa0a1e58SJeff Roberson 	}
253aa0a1e58SJeff Roberson 	ssk->state = TCPS_CLOSED;
254aa0a1e58SJeff Roberson }
255aa0a1e58SJeff Roberson 
256aa0a1e58SJeff Roberson /*
257aa0a1e58SJeff Roberson  * Attempt to close a SDP socket, marking it as dropped, and freeing
258aa0a1e58SJeff Roberson  * the socket if we hold the only reference.
259aa0a1e58SJeff Roberson  */
260aa0a1e58SJeff Roberson static struct sdp_sock *
sdp_closed(struct sdp_sock * ssk)261aa0a1e58SJeff Roberson sdp_closed(struct sdp_sock *ssk)
262aa0a1e58SJeff Roberson {
263aa0a1e58SJeff Roberson 	struct socket *so;
264aa0a1e58SJeff Roberson 
265aa0a1e58SJeff Roberson 	SDP_WLOCK_ASSERT(ssk);
266aa0a1e58SJeff Roberson 
267aa0a1e58SJeff Roberson 	ssk->flags |= SDP_DROPPED;
268aa0a1e58SJeff Roberson 	so = ssk->socket;
269aa0a1e58SJeff Roberson 	soisdisconnected(so);
270aa0a1e58SJeff Roberson 	if (ssk->flags & SDP_SOCKREF) {
271aa0a1e58SJeff Roberson 		ssk->flags &= ~SDP_SOCKREF;
272aa0a1e58SJeff Roberson 		SDP_WUNLOCK(ssk);
273d8596171SGleb Smirnoff 		sorele(so);
274aa0a1e58SJeff Roberson 		return (NULL);
275aa0a1e58SJeff Roberson 	}
276aa0a1e58SJeff Roberson 	return (ssk);
277aa0a1e58SJeff Roberson }
278aa0a1e58SJeff Roberson 
279aa0a1e58SJeff Roberson /*
280aa0a1e58SJeff Roberson  * Perform timer based shutdowns which can not operate in
281aa0a1e58SJeff Roberson  * callout context.
282aa0a1e58SJeff Roberson  */
283aa0a1e58SJeff Roberson static void
sdp_shutdown_task(void * data,int pending)284aa0a1e58SJeff Roberson sdp_shutdown_task(void *data, int pending)
285aa0a1e58SJeff Roberson {
286aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
287aa0a1e58SJeff Roberson 
288aa0a1e58SJeff Roberson 	ssk = data;
289aa0a1e58SJeff Roberson 	SDP_WLOCK(ssk);
290aa0a1e58SJeff Roberson 	/*
291aa0a1e58SJeff Roberson 	 * I don't think this can race with another call to pcbfree()
292aa0a1e58SJeff Roberson 	 * because SDP_TIMEWAIT protects it.  SDP_DESTROY may be redundant.
293aa0a1e58SJeff Roberson 	 */
294aa0a1e58SJeff Roberson 	if (ssk->flags & SDP_DESTROY)
295aa0a1e58SJeff Roberson 		panic("sdp_shutdown_task: Racing with pcbfree for ssk %p",
296aa0a1e58SJeff Roberson 		    ssk);
297aa0a1e58SJeff Roberson 	if (ssk->flags & SDP_DISCON)
298aa0a1e58SJeff Roberson 		sdp_output_reset(ssk);
299aa0a1e58SJeff Roberson 	/* We have to clear this so sdp_detach() will call pcbfree(). */
300aa0a1e58SJeff Roberson 	ssk->flags &= ~(SDP_TIMEWAIT | SDP_DREQWAIT);
301aa0a1e58SJeff Roberson 	if ((ssk->flags & SDP_DROPPED) == 0 &&
302aa0a1e58SJeff Roberson 	    sdp_closed(ssk) == NULL)
303aa0a1e58SJeff Roberson 		return;
304aa0a1e58SJeff Roberson 	if (ssk->socket == NULL) {
305aa0a1e58SJeff Roberson 		sdp_pcbfree(ssk);
306aa0a1e58SJeff Roberson 		return;
307aa0a1e58SJeff Roberson 	}
308aa0a1e58SJeff Roberson 	SDP_WUNLOCK(ssk);
309aa0a1e58SJeff Roberson }
310aa0a1e58SJeff Roberson 
311aa0a1e58SJeff Roberson /*
312aa0a1e58SJeff Roberson  * 2msl has expired, schedule the shutdown task.
313aa0a1e58SJeff Roberson  */
314aa0a1e58SJeff Roberson static void
sdp_2msl_timeout(void * data)315aa0a1e58SJeff Roberson sdp_2msl_timeout(void *data)
316aa0a1e58SJeff Roberson {
317aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
318aa0a1e58SJeff Roberson 
319aa0a1e58SJeff Roberson 	ssk = data;
320aa0a1e58SJeff Roberson 	/* Callout canceled. */
321aa0a1e58SJeff Roberson         if (!callout_active(&ssk->keep2msl))
322aa0a1e58SJeff Roberson 		goto out;
323aa0a1e58SJeff Roberson         callout_deactivate(&ssk->keep2msl);
324aa0a1e58SJeff Roberson 	/* Should be impossible, defensive programming. */
325aa0a1e58SJeff Roberson 	if ((ssk->flags & SDP_TIMEWAIT) == 0)
326aa0a1e58SJeff Roberson 		goto out;
327aa0a1e58SJeff Roberson 	taskqueue_enqueue(taskqueue_thread, &ssk->shutdown_task);
328aa0a1e58SJeff Roberson out:
329aa0a1e58SJeff Roberson 	SDP_WUNLOCK(ssk);
330aa0a1e58SJeff Roberson 	return;
331aa0a1e58SJeff Roberson }
332aa0a1e58SJeff Roberson 
333aa0a1e58SJeff Roberson /*
334aa0a1e58SJeff Roberson  * Schedule the 2msl wait timer.
335aa0a1e58SJeff Roberson  */
336aa0a1e58SJeff Roberson static void
sdp_2msl_wait(struct sdp_sock * ssk)337aa0a1e58SJeff Roberson sdp_2msl_wait(struct sdp_sock *ssk)
338aa0a1e58SJeff Roberson {
339aa0a1e58SJeff Roberson 
340aa0a1e58SJeff Roberson 	SDP_WLOCK_ASSERT(ssk);
341aa0a1e58SJeff Roberson 	ssk->flags |= SDP_TIMEWAIT;
342aa0a1e58SJeff Roberson 	ssk->state = TCPS_TIME_WAIT;
343aa0a1e58SJeff Roberson 	soisdisconnected(ssk->socket);
344aa0a1e58SJeff Roberson 	callout_reset(&ssk->keep2msl, TCPTV_MSL, sdp_2msl_timeout, ssk);
345aa0a1e58SJeff Roberson }
346aa0a1e58SJeff Roberson 
347aa0a1e58SJeff Roberson /*
348aa0a1e58SJeff Roberson  * Timed out waiting for the final fin/ack from rdma_disconnect().
349aa0a1e58SJeff Roberson  */
350aa0a1e58SJeff Roberson static void
sdp_dreq_timeout(void * data)351aa0a1e58SJeff Roberson sdp_dreq_timeout(void *data)
352aa0a1e58SJeff Roberson {
353aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
354aa0a1e58SJeff Roberson 
355aa0a1e58SJeff Roberson 	ssk = data;
356aa0a1e58SJeff Roberson 	/* Callout canceled. */
357aa0a1e58SJeff Roberson         if (!callout_active(&ssk->keep2msl))
358aa0a1e58SJeff Roberson 		goto out;
359aa0a1e58SJeff Roberson 	/* Callout rescheduled, probably as a different timer. */
360aa0a1e58SJeff Roberson 	if (callout_pending(&ssk->keep2msl))
361aa0a1e58SJeff Roberson 		goto out;
362aa0a1e58SJeff Roberson         callout_deactivate(&ssk->keep2msl);
363aa0a1e58SJeff Roberson 	if (ssk->state != TCPS_FIN_WAIT_1 && ssk->state != TCPS_LAST_ACK)
364aa0a1e58SJeff Roberson 		goto out;
365aa0a1e58SJeff Roberson 	if ((ssk->flags & SDP_DREQWAIT) == 0)
366aa0a1e58SJeff Roberson 		goto out;
367aa0a1e58SJeff Roberson 	ssk->flags &= ~SDP_DREQWAIT;
368aa0a1e58SJeff Roberson 	ssk->flags |= SDP_DISCON;
369aa0a1e58SJeff Roberson 	sdp_2msl_wait(ssk);
370aa0a1e58SJeff Roberson 	ssk->qp_active = 0;
371aa0a1e58SJeff Roberson out:
372aa0a1e58SJeff Roberson 	SDP_WUNLOCK(ssk);
373aa0a1e58SJeff Roberson }
374aa0a1e58SJeff Roberson 
375aa0a1e58SJeff Roberson /*
376aa0a1e58SJeff Roberson  * Received the final fin/ack.  Cancel the 2msl.
377aa0a1e58SJeff Roberson  */
378aa0a1e58SJeff Roberson void
sdp_cancel_dreq_wait_timeout(struct sdp_sock * ssk)379aa0a1e58SJeff Roberson sdp_cancel_dreq_wait_timeout(struct sdp_sock *ssk)
380aa0a1e58SJeff Roberson {
381aa0a1e58SJeff Roberson 	sdp_dbg(ssk->socket, "cancelling dreq wait timeout\n");
382aa0a1e58SJeff Roberson 	ssk->flags &= ~SDP_DREQWAIT;
383aa0a1e58SJeff Roberson 	sdp_2msl_wait(ssk);
384aa0a1e58SJeff Roberson }
385aa0a1e58SJeff Roberson 
386aa0a1e58SJeff Roberson static int
sdp_init_sock(struct socket * sk)387aa0a1e58SJeff Roberson sdp_init_sock(struct socket *sk)
388aa0a1e58SJeff Roberson {
389aa0a1e58SJeff Roberson 	struct sdp_sock *ssk = sdp_sk(sk);
390aa0a1e58SJeff Roberson 
391aa0a1e58SJeff Roberson 	sdp_dbg(sk, "%s\n", __func__);
392aa0a1e58SJeff Roberson 
393aa0a1e58SJeff Roberson 	callout_init_rw(&ssk->keep2msl, &ssk->lock, CALLOUT_RETURNUNLOCKED);
394aa0a1e58SJeff Roberson 	TASK_INIT(&ssk->shutdown_task, 0, sdp_shutdown_task, ssk);
395aa0a1e58SJeff Roberson #ifdef SDP_ZCOPY
396aa0a1e58SJeff Roberson 	INIT_DELAYED_WORK(&ssk->srcavail_cancel_work, srcavail_cancel_timeout);
397aa0a1e58SJeff Roberson 	ssk->zcopy_thresh = -1; /* use global sdp_zcopy_thresh */
398aa0a1e58SJeff Roberson 	ssk->tx_ring.rdma_inflight = NULL;
399aa0a1e58SJeff Roberson #endif
400aa0a1e58SJeff Roberson 	atomic_set(&ssk->mseq_ack, 0);
401aa0a1e58SJeff Roberson 	sdp_rx_ring_init(ssk);
402aa0a1e58SJeff Roberson 	ssk->tx_ring.buffer = NULL;
403aa0a1e58SJeff Roberson 
404aa0a1e58SJeff Roberson 	return 0;
405aa0a1e58SJeff Roberson }
406aa0a1e58SJeff Roberson 
407aa0a1e58SJeff Roberson /*
408aa0a1e58SJeff Roberson  * Allocate an sdp_sock for the socket and reserve socket buffer space.
409aa0a1e58SJeff Roberson  */
410aa0a1e58SJeff Roberson static int
sdp_attach(struct socket * so,int proto,struct thread * td)411aa0a1e58SJeff Roberson sdp_attach(struct socket *so, int proto, struct thread *td)
412aa0a1e58SJeff Roberson {
413aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
414aa0a1e58SJeff Roberson 	int error;
415aa0a1e58SJeff Roberson 
416aa0a1e58SJeff Roberson 	ssk = sdp_sk(so);
417aa0a1e58SJeff Roberson 	KASSERT(ssk == NULL, ("sdp_attach: ssk already set on so %p", so));
418aa0a1e58SJeff Roberson 	if (so->so_snd.sb_hiwat == 0 || so->so_rcv.sb_hiwat == 0) {
419aa0a1e58SJeff Roberson 		error = soreserve(so, sdp_sendspace, sdp_recvspace);
420aa0a1e58SJeff Roberson 		if (error)
421aa0a1e58SJeff Roberson 			return (error);
422aa0a1e58SJeff Roberson 	}
423aa0a1e58SJeff Roberson 	so->so_rcv.sb_flags |= SB_AUTOSIZE;
424aa0a1e58SJeff Roberson 	so->so_snd.sb_flags |= SB_AUTOSIZE;
425aa0a1e58SJeff Roberson 	ssk = uma_zalloc(sdp_zone, M_NOWAIT | M_ZERO);
426aa0a1e58SJeff Roberson 	if (ssk == NULL)
427aa0a1e58SJeff Roberson 		return (ENOBUFS);
428aa0a1e58SJeff Roberson 	rw_init(&ssk->lock, "sdpsock");
429aa0a1e58SJeff Roberson 	ssk->socket = so;
430aa0a1e58SJeff Roberson 	ssk->cred = crhold(so->so_cred);
431aa0a1e58SJeff Roberson 	so->so_pcb = (caddr_t)ssk;
432aa0a1e58SJeff Roberson 	sdp_init_sock(so);
433aa0a1e58SJeff Roberson 	ssk->flags = 0;
434aa0a1e58SJeff Roberson 	ssk->qp_active = 0;
435aa0a1e58SJeff Roberson 	ssk->state = TCPS_CLOSED;
4362cefa87bSMark Johnston 	mbufq_init(&ssk->rxctlq, INT_MAX);
437aa0a1e58SJeff Roberson 	SDP_LIST_WLOCK();
438aa0a1e58SJeff Roberson 	LIST_INSERT_HEAD(&sdp_list, ssk, list);
439aa0a1e58SJeff Roberson 	sdp_count++;
440aa0a1e58SJeff Roberson 	SDP_LIST_WUNLOCK();
441aa0a1e58SJeff Roberson 
442aa0a1e58SJeff Roberson 	return (0);
443aa0a1e58SJeff Roberson }
444aa0a1e58SJeff Roberson 
445aa0a1e58SJeff Roberson /*
446aa0a1e58SJeff Roberson  * Detach SDP from the socket, potentially leaving it around for the
447aa0a1e58SJeff Roberson  * timewait to expire.
448aa0a1e58SJeff Roberson  */
449aa0a1e58SJeff Roberson static void
sdp_detach(struct socket * so)450aa0a1e58SJeff Roberson sdp_detach(struct socket *so)
451aa0a1e58SJeff Roberson {
452aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
453aa0a1e58SJeff Roberson 
454aa0a1e58SJeff Roberson 	ssk = sdp_sk(so);
455aa0a1e58SJeff Roberson 	SDP_WLOCK(ssk);
456aa0a1e58SJeff Roberson 	KASSERT(ssk->socket != NULL, ("sdp_detach: socket is NULL"));
457aa0a1e58SJeff Roberson 	ssk->socket->so_pcb = NULL;
458aa0a1e58SJeff Roberson 	ssk->socket = NULL;
459aa0a1e58SJeff Roberson 	if (ssk->flags & (SDP_TIMEWAIT | SDP_DREQWAIT))
460aa0a1e58SJeff Roberson 		SDP_WUNLOCK(ssk);
461aa0a1e58SJeff Roberson 	else if (ssk->flags & SDP_DROPPED || ssk->state < TCPS_SYN_SENT)
462aa0a1e58SJeff Roberson 		sdp_pcbfree(ssk);
463aa0a1e58SJeff Roberson 	else
464aa0a1e58SJeff Roberson 		panic("sdp_detach: Unexpected state, ssk %p.\n", ssk);
465aa0a1e58SJeff Roberson }
466aa0a1e58SJeff Roberson 
467aa0a1e58SJeff Roberson /*
468aa0a1e58SJeff Roberson  * Allocate a local address for the socket.
469aa0a1e58SJeff Roberson  */
470aa0a1e58SJeff Roberson static int
sdp_bind(struct socket * so,struct sockaddr * nam,struct thread * td)471aa0a1e58SJeff Roberson sdp_bind(struct socket *so, struct sockaddr *nam, struct thread *td)
472aa0a1e58SJeff Roberson {
473aa0a1e58SJeff Roberson 	int error = 0;
474aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
475aa0a1e58SJeff Roberson 	struct sockaddr_in *sin;
476aa0a1e58SJeff Roberson 
477aa0a1e58SJeff Roberson 	sin = (struct sockaddr_in *)nam;
478aa0a1e58SJeff Roberson 	if (sin->sin_family != AF_INET)
479f161d294SMark Johnston 		return (EAFNOSUPPORT);
480f161d294SMark Johnston 	if (nam->sa_len != sizeof(*sin))
481aa0a1e58SJeff Roberson 		return (EINVAL);
482aa0a1e58SJeff Roberson 	if (IN_MULTICAST(ntohl(sin->sin_addr.s_addr)))
483aa0a1e58SJeff Roberson 		return (EAFNOSUPPORT);
484aa0a1e58SJeff Roberson 
485aa0a1e58SJeff Roberson 	ssk = sdp_sk(so);
486aa0a1e58SJeff Roberson 	SDP_WLOCK(ssk);
487aa0a1e58SJeff Roberson 	if (ssk->flags & (SDP_TIMEWAIT | SDP_DROPPED)) {
488aa0a1e58SJeff Roberson 		error = EINVAL;
489aa0a1e58SJeff Roberson 		goto out;
490aa0a1e58SJeff Roberson 	}
491aa0a1e58SJeff Roberson 	error = sdp_pcbbind(ssk, nam, td->td_ucred);
492aa0a1e58SJeff Roberson out:
493aa0a1e58SJeff Roberson 	SDP_WUNLOCK(ssk);
494aa0a1e58SJeff Roberson 
495aa0a1e58SJeff Roberson 	return (error);
496aa0a1e58SJeff Roberson }
497aa0a1e58SJeff Roberson 
498aa0a1e58SJeff Roberson /*
499aa0a1e58SJeff Roberson  * Prepare to accept connections.
500aa0a1e58SJeff Roberson  */
501aa0a1e58SJeff Roberson static int
sdp_listen(struct socket * so,int backlog,struct thread * td)502aa0a1e58SJeff Roberson sdp_listen(struct socket *so, int backlog, struct thread *td)
503aa0a1e58SJeff Roberson {
504aa0a1e58SJeff Roberson 	int error = 0;
505aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
506aa0a1e58SJeff Roberson 
507aa0a1e58SJeff Roberson 	ssk = sdp_sk(so);
508aa0a1e58SJeff Roberson 	SDP_WLOCK(ssk);
509aa0a1e58SJeff Roberson 	if (ssk->flags & (SDP_TIMEWAIT | SDP_DROPPED)) {
510aa0a1e58SJeff Roberson 		error = EINVAL;
511aa0a1e58SJeff Roberson 		goto out;
512aa0a1e58SJeff Roberson 	}
513aa0a1e58SJeff Roberson 	if (error == 0 && ssk->lport == 0)
514aa0a1e58SJeff Roberson 		error = sdp_pcbbind(ssk, (struct sockaddr *)0, td->td_ucred);
515aa0a1e58SJeff Roberson 	SOCK_LOCK(so);
516aa0a1e58SJeff Roberson 	if (error == 0)
517aa0a1e58SJeff Roberson 		error = solisten_proto_check(so);
518aa0a1e58SJeff Roberson 	if (error == 0) {
519aa0a1e58SJeff Roberson 		solisten_proto(so, backlog);
520aa0a1e58SJeff Roberson 		ssk->state = TCPS_LISTEN;
521aa0a1e58SJeff Roberson 	}
522aa0a1e58SJeff Roberson 	SOCK_UNLOCK(so);
523aa0a1e58SJeff Roberson 
524aa0a1e58SJeff Roberson out:
525aa0a1e58SJeff Roberson 	SDP_WUNLOCK(ssk);
526aa0a1e58SJeff Roberson 	if (error == 0)
527aa0a1e58SJeff Roberson 		error = -rdma_listen(ssk->id, backlog);
528aa0a1e58SJeff Roberson 	return (error);
529aa0a1e58SJeff Roberson }
530aa0a1e58SJeff Roberson 
531aa0a1e58SJeff Roberson /*
532aa0a1e58SJeff Roberson  * Initiate a SDP connection to nam.
533aa0a1e58SJeff Roberson  */
534aa0a1e58SJeff Roberson static int
sdp_start_connect(struct sdp_sock * ssk,struct sockaddr * nam,struct thread * td)535aa0a1e58SJeff Roberson sdp_start_connect(struct sdp_sock *ssk, struct sockaddr *nam, struct thread *td)
536aa0a1e58SJeff Roberson {
537aa0a1e58SJeff Roberson 	struct sockaddr_in src;
538aa0a1e58SJeff Roberson 	struct socket *so;
539aa0a1e58SJeff Roberson 	int error;
540aa0a1e58SJeff Roberson 
541aa0a1e58SJeff Roberson 	so = ssk->socket;
542aa0a1e58SJeff Roberson 
543aa0a1e58SJeff Roberson 	SDP_WLOCK_ASSERT(ssk);
544aa0a1e58SJeff Roberson 	if (ssk->lport == 0) {
545aa0a1e58SJeff Roberson 		error = sdp_pcbbind(ssk, (struct sockaddr *)0, td->td_ucred);
546aa0a1e58SJeff Roberson 		if (error)
547aa0a1e58SJeff Roberson 			return error;
548aa0a1e58SJeff Roberson 	}
549aa0a1e58SJeff Roberson 	src.sin_family = AF_INET;
550aa0a1e58SJeff Roberson 	src.sin_len = sizeof(src);
551aa0a1e58SJeff Roberson 	bzero(&src.sin_zero, sizeof(src.sin_zero));
552aa0a1e58SJeff Roberson 	src.sin_port = ssk->lport;
553aa0a1e58SJeff Roberson 	src.sin_addr.s_addr = ssk->laddr;
554aa0a1e58SJeff Roberson 	soisconnecting(so);
555aa0a1e58SJeff Roberson 	SDP_WUNLOCK(ssk);
556aa0a1e58SJeff Roberson 	error = -rdma_resolve_addr(ssk->id, (struct sockaddr *)&src, nam,
557aa0a1e58SJeff Roberson 	    SDP_RESOLVE_TIMEOUT);
558aa0a1e58SJeff Roberson 	SDP_WLOCK(ssk);
559aa0a1e58SJeff Roberson 	if (error == 0)
560aa0a1e58SJeff Roberson 		ssk->state = TCPS_SYN_SENT;
561aa0a1e58SJeff Roberson 
562aa0a1e58SJeff Roberson 	return 0;
563aa0a1e58SJeff Roberson }
564aa0a1e58SJeff Roberson 
565aa0a1e58SJeff Roberson /*
566aa0a1e58SJeff Roberson  * Initiate SDP connection.
567aa0a1e58SJeff Roberson  */
568aa0a1e58SJeff Roberson static int
sdp_connect(struct socket * so,struct sockaddr * nam,struct thread * td)569aa0a1e58SJeff Roberson sdp_connect(struct socket *so, struct sockaddr *nam, struct thread *td)
570aa0a1e58SJeff Roberson {
571aa0a1e58SJeff Roberson 	int error = 0;
572aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
573aa0a1e58SJeff Roberson 	struct sockaddr_in *sin;
574aa0a1e58SJeff Roberson 
575aa0a1e58SJeff Roberson 	sin = (struct sockaddr_in *)nam;
576aa0a1e58SJeff Roberson 	if (nam->sa_len != sizeof(*sin))
577aa0a1e58SJeff Roberson 		return (EINVAL);
578aa0a1e58SJeff Roberson 	if (sin->sin_family != AF_INET)
579f161d294SMark Johnston 		return (EAFNOSUPPORT);
580aa0a1e58SJeff Roberson 	if (IN_MULTICAST(ntohl(sin->sin_addr.s_addr)))
581aa0a1e58SJeff Roberson 		return (EAFNOSUPPORT);
582aa0a1e58SJeff Roberson 	if ((error = prison_remote_ip4(td->td_ucred, &sin->sin_addr)) != 0)
583aa0a1e58SJeff Roberson 		return (error);
584aa0a1e58SJeff Roberson 	ssk = sdp_sk(so);
585aa0a1e58SJeff Roberson 	SDP_WLOCK(ssk);
586aa0a1e58SJeff Roberson 	if (ssk->flags & (SDP_TIMEWAIT | SDP_DROPPED))
587aa0a1e58SJeff Roberson 		error = EINVAL;
588aa0a1e58SJeff Roberson 	else
589aa0a1e58SJeff Roberson 		error = sdp_start_connect(ssk, nam, td);
590aa0a1e58SJeff Roberson 	SDP_WUNLOCK(ssk);
591aa0a1e58SJeff Roberson 	return (error);
592aa0a1e58SJeff Roberson }
593aa0a1e58SJeff Roberson 
594aa0a1e58SJeff Roberson /*
595aa0a1e58SJeff Roberson  * Drop a SDP socket, reporting
596aa0a1e58SJeff Roberson  * the specified error.  If connection is synchronized,
597aa0a1e58SJeff Roberson  * then send a RST to peer.
598aa0a1e58SJeff Roberson  */
599aa0a1e58SJeff Roberson static struct sdp_sock *
sdp_drop(struct sdp_sock * ssk,int errno)600aa0a1e58SJeff Roberson sdp_drop(struct sdp_sock *ssk, int errno)
601aa0a1e58SJeff Roberson {
602aa0a1e58SJeff Roberson 	struct socket *so;
603aa0a1e58SJeff Roberson 
604aa0a1e58SJeff Roberson 	SDP_WLOCK_ASSERT(ssk);
605aa0a1e58SJeff Roberson 	so = ssk->socket;
606aa0a1e58SJeff Roberson 	if (TCPS_HAVERCVDSYN(ssk->state))
607aa0a1e58SJeff Roberson 		sdp_output_reset(ssk);
608aa0a1e58SJeff Roberson 	if (errno == ETIMEDOUT && ssk->softerror)
609aa0a1e58SJeff Roberson 		errno = ssk->softerror;
610aa0a1e58SJeff Roberson 	so->so_error = errno;
611aa0a1e58SJeff Roberson 	return (sdp_closed(ssk));
612aa0a1e58SJeff Roberson }
613aa0a1e58SJeff Roberson 
614aa0a1e58SJeff Roberson /*
615aa0a1e58SJeff Roberson  * User issued close, and wish to trail through shutdown states:
616aa0a1e58SJeff Roberson  * if never received SYN, just forget it.  If got a SYN from peer,
617aa0a1e58SJeff Roberson  * but haven't sent FIN, then go to FIN_WAIT_1 state to send peer a FIN.
618aa0a1e58SJeff Roberson  * If already got a FIN from peer, then almost done; go to LAST_ACK
619aa0a1e58SJeff Roberson  * state.  In all other cases, have already sent FIN to peer (e.g.
620aa0a1e58SJeff Roberson  * after PRU_SHUTDOWN), and just have to play tedious game waiting
621aa0a1e58SJeff Roberson  * for peer to send FIN or not respond to keep-alives, etc.
622aa0a1e58SJeff Roberson  * We can let the user exit from the close as soon as the FIN is acked.
623aa0a1e58SJeff Roberson  */
624aa0a1e58SJeff Roberson static void
sdp_usrclosed(struct sdp_sock * ssk)625aa0a1e58SJeff Roberson sdp_usrclosed(struct sdp_sock *ssk)
626aa0a1e58SJeff Roberson {
627aa0a1e58SJeff Roberson 
628aa0a1e58SJeff Roberson 	SDP_WLOCK_ASSERT(ssk);
629aa0a1e58SJeff Roberson 
630aa0a1e58SJeff Roberson 	switch (ssk->state) {
631aa0a1e58SJeff Roberson 	case TCPS_LISTEN:
632aa0a1e58SJeff Roberson 		ssk->state = TCPS_CLOSED;
633aa0a1e58SJeff Roberson 		SDP_WUNLOCK(ssk);
634aa0a1e58SJeff Roberson 		sdp_destroy_cma(ssk);
635aa0a1e58SJeff Roberson 		SDP_WLOCK(ssk);
636aa0a1e58SJeff Roberson 		/* FALLTHROUGH */
637aa0a1e58SJeff Roberson 	case TCPS_CLOSED:
638aa0a1e58SJeff Roberson 		ssk = sdp_closed(ssk);
639aa0a1e58SJeff Roberson 		/*
640aa0a1e58SJeff Roberson 		 * sdp_closed() should never return NULL here as the socket is
641aa0a1e58SJeff Roberson 		 * still open.
642aa0a1e58SJeff Roberson 		 */
643aa0a1e58SJeff Roberson 		KASSERT(ssk != NULL,
644aa0a1e58SJeff Roberson 		    ("sdp_usrclosed: sdp_closed() returned NULL"));
645aa0a1e58SJeff Roberson 		break;
646aa0a1e58SJeff Roberson 
647aa0a1e58SJeff Roberson 	case TCPS_SYN_SENT:
648aa0a1e58SJeff Roberson 		/* FALLTHROUGH */
649aa0a1e58SJeff Roberson 	case TCPS_SYN_RECEIVED:
650aa0a1e58SJeff Roberson 		ssk->flags |= SDP_NEEDFIN;
651aa0a1e58SJeff Roberson 		break;
652aa0a1e58SJeff Roberson 
653aa0a1e58SJeff Roberson 	case TCPS_ESTABLISHED:
654aa0a1e58SJeff Roberson 		ssk->flags |= SDP_NEEDFIN;
655aa0a1e58SJeff Roberson 		ssk->state = TCPS_FIN_WAIT_1;
656aa0a1e58SJeff Roberson 		break;
657aa0a1e58SJeff Roberson 
658aa0a1e58SJeff Roberson 	case TCPS_CLOSE_WAIT:
659aa0a1e58SJeff Roberson 		ssk->state = TCPS_LAST_ACK;
660aa0a1e58SJeff Roberson 		break;
661aa0a1e58SJeff Roberson 	}
662aa0a1e58SJeff Roberson 	if (ssk->state >= TCPS_FIN_WAIT_2) {
663aa0a1e58SJeff Roberson 		/* Prevent the connection hanging in FIN_WAIT_2 forever. */
664aa0a1e58SJeff Roberson 		if (ssk->state == TCPS_FIN_WAIT_2)
665aa0a1e58SJeff Roberson 			sdp_2msl_wait(ssk);
666aa0a1e58SJeff Roberson 		else
667aa0a1e58SJeff Roberson 			soisdisconnected(ssk->socket);
668aa0a1e58SJeff Roberson 	}
669aa0a1e58SJeff Roberson }
670aa0a1e58SJeff Roberson 
671aa0a1e58SJeff Roberson static void
sdp_output_disconnect(struct sdp_sock * ssk)672aa0a1e58SJeff Roberson sdp_output_disconnect(struct sdp_sock *ssk)
673aa0a1e58SJeff Roberson {
674aa0a1e58SJeff Roberson 
675aa0a1e58SJeff Roberson 	SDP_WLOCK_ASSERT(ssk);
676aa0a1e58SJeff Roberson 	callout_reset(&ssk->keep2msl, SDP_FIN_WAIT_TIMEOUT,
677aa0a1e58SJeff Roberson 	    sdp_dreq_timeout, ssk);
678aa0a1e58SJeff Roberson 	ssk->flags |= SDP_NEEDFIN | SDP_DREQWAIT;
679aa0a1e58SJeff Roberson 	sdp_post_sends(ssk, M_NOWAIT);
680aa0a1e58SJeff Roberson }
681aa0a1e58SJeff Roberson 
682aa0a1e58SJeff Roberson /*
683aa0a1e58SJeff Roberson  * Initiate or continue a disconnect.
684aa0a1e58SJeff Roberson  * If embryonic state, just send reset (once).
685aa0a1e58SJeff Roberson  * If in ``let data drain'' option and linger null, just drop.
686aa0a1e58SJeff Roberson  * Otherwise (hard), mark socket disconnecting and drop
687aa0a1e58SJeff Roberson  * current input data; switch states based on user close, and
688aa0a1e58SJeff Roberson  * send segment to peer (with FIN).
689aa0a1e58SJeff Roberson  */
690aa0a1e58SJeff Roberson static void
sdp_start_disconnect(struct sdp_sock * ssk)691aa0a1e58SJeff Roberson sdp_start_disconnect(struct sdp_sock *ssk)
692aa0a1e58SJeff Roberson {
693aa0a1e58SJeff Roberson 	struct socket *so;
694aa0a1e58SJeff Roberson 	int unread;
695aa0a1e58SJeff Roberson 
696aa0a1e58SJeff Roberson 	so = ssk->socket;
697aa0a1e58SJeff Roberson 	SDP_WLOCK_ASSERT(ssk);
698aa0a1e58SJeff Roberson 	sdp_stop_keepalive_timer(so);
699aa0a1e58SJeff Roberson 	/*
700aa0a1e58SJeff Roberson 	 * Neither sdp_closed() nor sdp_drop() should return NULL, as the
701aa0a1e58SJeff Roberson 	 * socket is still open.
702aa0a1e58SJeff Roberson 	 */
703aa0a1e58SJeff Roberson 	if (ssk->state < TCPS_ESTABLISHED) {
704aa0a1e58SJeff Roberson 		ssk = sdp_closed(ssk);
705aa0a1e58SJeff Roberson 		KASSERT(ssk != NULL,
706aa0a1e58SJeff Roberson 		    ("sdp_start_disconnect: sdp_close() returned NULL"));
707aa0a1e58SJeff Roberson 	} else if ((so->so_options & SO_LINGER) && so->so_linger == 0) {
708aa0a1e58SJeff Roberson 		ssk = sdp_drop(ssk, 0);
709aa0a1e58SJeff Roberson 		KASSERT(ssk != NULL,
710aa0a1e58SJeff Roberson 		    ("sdp_start_disconnect: sdp_drop() returned NULL"));
711aa0a1e58SJeff Roberson 	} else {
712aa0a1e58SJeff Roberson 		soisdisconnecting(so);
713cfa6009eSGleb Smirnoff 		unread = sbused(&so->so_rcv);
714aa0a1e58SJeff Roberson 		sbflush(&so->so_rcv);
715aa0a1e58SJeff Roberson 		sdp_usrclosed(ssk);
716aa0a1e58SJeff Roberson 		if (!(ssk->flags & SDP_DROPPED)) {
717aa0a1e58SJeff Roberson 			if (unread)
718aa0a1e58SJeff Roberson 				sdp_output_reset(ssk);
719aa0a1e58SJeff Roberson 			else
720aa0a1e58SJeff Roberson 				sdp_output_disconnect(ssk);
721aa0a1e58SJeff Roberson 		}
722aa0a1e58SJeff Roberson 	}
723aa0a1e58SJeff Roberson }
724aa0a1e58SJeff Roberson 
725aa0a1e58SJeff Roberson /*
726aa0a1e58SJeff Roberson  * User initiated disconnect.
727aa0a1e58SJeff Roberson  */
728aa0a1e58SJeff Roberson static int
sdp_disconnect(struct socket * so)729aa0a1e58SJeff Roberson sdp_disconnect(struct socket *so)
730aa0a1e58SJeff Roberson {
731aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
732aa0a1e58SJeff Roberson 	int error = 0;
733aa0a1e58SJeff Roberson 
734aa0a1e58SJeff Roberson 	ssk = sdp_sk(so);
735aa0a1e58SJeff Roberson 	SDP_WLOCK(ssk);
736aa0a1e58SJeff Roberson 	if (ssk->flags & (SDP_TIMEWAIT | SDP_DROPPED)) {
737aa0a1e58SJeff Roberson 		error = ECONNRESET;
738aa0a1e58SJeff Roberson 		goto out;
739aa0a1e58SJeff Roberson 	}
740aa0a1e58SJeff Roberson 	sdp_start_disconnect(ssk);
741aa0a1e58SJeff Roberson out:
742aa0a1e58SJeff Roberson 	SDP_WUNLOCK(ssk);
743aa0a1e58SJeff Roberson 	return (error);
744aa0a1e58SJeff Roberson }
745aa0a1e58SJeff Roberson 
746aa0a1e58SJeff Roberson /*
747aa0a1e58SJeff Roberson  * Accept a connection.  Essentially all the work is done at higher levels;
748aa0a1e58SJeff Roberson  * just return the address of the peer, storing through addr.
749aa0a1e58SJeff Roberson  *
750aa0a1e58SJeff Roberson  *
751aa0a1e58SJeff Roberson  * XXX This is broken XXX
752aa0a1e58SJeff Roberson  *
753aa0a1e58SJeff Roberson  * The rationale for acquiring the sdp lock here is somewhat complicated,
754aa0a1e58SJeff Roberson  * and is described in detail in the commit log entry for r175612.  Acquiring
755aa0a1e58SJeff Roberson  * it delays an accept(2) racing with sonewconn(), which inserts the socket
756aa0a1e58SJeff Roberson  * before the address/port fields are initialized.  A better fix would
757aa0a1e58SJeff Roberson  * prevent the socket from being placed in the listen queue until all fields
758aa0a1e58SJeff Roberson  * are fully initialized.
759aa0a1e58SJeff Roberson  */
760aa0a1e58SJeff Roberson static int
sdp_accept(struct socket * so,struct sockaddr * sa)761cfb1e929SGleb Smirnoff sdp_accept(struct socket *so, struct sockaddr *sa)
762aa0a1e58SJeff Roberson {
763aa0a1e58SJeff Roberson 	struct sdp_sock *ssk = NULL;
764aa0a1e58SJeff Roberson 	int error;
765aa0a1e58SJeff Roberson 
766aa0a1e58SJeff Roberson 	if (so->so_state & SS_ISDISCONNECTED)
767aa0a1e58SJeff Roberson 		return (ECONNABORTED);
768aa0a1e58SJeff Roberson 
769aa0a1e58SJeff Roberson 	error = 0;
770aa0a1e58SJeff Roberson 	ssk = sdp_sk(so);
771aa0a1e58SJeff Roberson 	SDP_WLOCK(ssk);
772cfb1e929SGleb Smirnoff 	if (ssk->flags & (SDP_TIMEWAIT | SDP_DROPPED))
773aa0a1e58SJeff Roberson 		error = ECONNABORTED;
774cfb1e929SGleb Smirnoff 	else
775cfb1e929SGleb Smirnoff 		*(struct sockaddr_in *)sa = (struct sockaddr_in ){
776cfb1e929SGleb Smirnoff 			.sin_family = AF_INET,
777cfb1e929SGleb Smirnoff 			.sin_len = sizeof(struct sockaddr_in),
778cfb1e929SGleb Smirnoff 			.sin_addr.s_addr = ssk->faddr,
779cfb1e929SGleb Smirnoff 			.sin_port = ssk->fport,
780cfb1e929SGleb Smirnoff 		};
781aa0a1e58SJeff Roberson 	SDP_WUNLOCK(ssk);
782cfb1e929SGleb Smirnoff 
783cfb1e929SGleb Smirnoff 	return (error);
784aa0a1e58SJeff Roberson }
785aa0a1e58SJeff Roberson 
786aa0a1e58SJeff Roberson /*
787aa0a1e58SJeff Roberson  * Mark the connection as being incapable of further output.
788aa0a1e58SJeff Roberson  */
789aa0a1e58SJeff Roberson static int
sdp_shutdown(struct socket * so,enum shutdown_how how)790*296a4cb5SGleb Smirnoff sdp_shutdown(struct socket *so, enum shutdown_how how)
791aa0a1e58SJeff Roberson {
792*296a4cb5SGleb Smirnoff 	struct sdp_sock *ssk = sdp_sk(so);
793aa0a1e58SJeff Roberson 	int error = 0;
794aa0a1e58SJeff Roberson 
795*296a4cb5SGleb Smirnoff 	SOCK_LOCK(so);
796*296a4cb5SGleb Smirnoff 	if ((so->so_state &
797*296a4cb5SGleb Smirnoff 	    (SS_ISCONNECTED | SS_ISCONNECTING | SS_ISDISCONNECTING)) == 0) {
798*296a4cb5SGleb Smirnoff 		SOCK_UNLOCK(so);
799*296a4cb5SGleb Smirnoff 		return (ENOTCONN);
800*296a4cb5SGleb Smirnoff 	}
801*296a4cb5SGleb Smirnoff 	if (SOLISTENING(so)) {
802*296a4cb5SGleb Smirnoff 		if (how != SHUT_WR) {
803*296a4cb5SGleb Smirnoff 			so->so_error = ECONNABORTED;
804*296a4cb5SGleb Smirnoff 			solisten_wakeup(so);	/* unlocks so */
805*296a4cb5SGleb Smirnoff 		} else
806*296a4cb5SGleb Smirnoff 			SOCK_UNLOCK(so);
807*296a4cb5SGleb Smirnoff 		return (0);
808*296a4cb5SGleb Smirnoff 	}
809*296a4cb5SGleb Smirnoff 	SOCK_UNLOCK(so);
810*296a4cb5SGleb Smirnoff 
811*296a4cb5SGleb Smirnoff 	switch (how) {
812*296a4cb5SGleb Smirnoff 	case SHUT_RD:
813*296a4cb5SGleb Smirnoff 		socantrcvmore(so);
814*296a4cb5SGleb Smirnoff 		sbrelease(so, SO_RCV);
815*296a4cb5SGleb Smirnoff 		break;
816*296a4cb5SGleb Smirnoff 	case SHUT_RDWR:
817*296a4cb5SGleb Smirnoff 		socantrcvmore(so);
818*296a4cb5SGleb Smirnoff 		sbrelease(so, SO_RCV);
819*296a4cb5SGleb Smirnoff 		/* FALLTHROUGH */
820*296a4cb5SGleb Smirnoff 	case SHUT_WR:
821aa0a1e58SJeff Roberson 		SDP_WLOCK(ssk);
822aa0a1e58SJeff Roberson 		if (ssk->flags & (SDP_TIMEWAIT | SDP_DROPPED)) {
823*296a4cb5SGleb Smirnoff 			SDP_WUNLOCK(ssk);
824aa0a1e58SJeff Roberson 			error = ECONNRESET;
825*296a4cb5SGleb Smirnoff 			break;
826aa0a1e58SJeff Roberson 		}
827aa0a1e58SJeff Roberson 		socantsendmore(so);
828aa0a1e58SJeff Roberson 		sdp_usrclosed(ssk);
829aa0a1e58SJeff Roberson 		if (!(ssk->flags & SDP_DROPPED))
830aa0a1e58SJeff Roberson 			sdp_output_disconnect(ssk);
831aa0a1e58SJeff Roberson 		SDP_WUNLOCK(ssk);
832*296a4cb5SGleb Smirnoff 	}
833*296a4cb5SGleb Smirnoff 	wakeup(&so->so_timeo);
834aa0a1e58SJeff Roberson 
835aa0a1e58SJeff Roberson 	return (error);
836aa0a1e58SJeff Roberson }
837aa0a1e58SJeff Roberson 
838aa0a1e58SJeff Roberson static void
sdp_append(struct sdp_sock * ssk,struct sockbuf * sb,struct mbuf * mb,int cnt)839aa0a1e58SJeff Roberson sdp_append(struct sdp_sock *ssk, struct sockbuf *sb, struct mbuf *mb, int cnt)
840aa0a1e58SJeff Roberson {
841aa0a1e58SJeff Roberson 	struct mbuf *n;
842aa0a1e58SJeff Roberson 	int ncnt;
843aa0a1e58SJeff Roberson 
844aa0a1e58SJeff Roberson 	SOCKBUF_LOCK_ASSERT(sb);
8458317ddc8SJohn Baldwin 	SBLASTRECORDCHK(sb);
846aa0a1e58SJeff Roberson 	KASSERT(mb->m_flags & M_PKTHDR,
847aa0a1e58SJeff Roberson 		("sdp_append: %p Missing packet header.\n", mb));
848aa0a1e58SJeff Roberson 	n = sb->sb_lastrecord;
849aa0a1e58SJeff Roberson 	/*
850aa0a1e58SJeff Roberson 	 * If the queue is empty just set all pointers and proceed.
851aa0a1e58SJeff Roberson 	 */
852aa0a1e58SJeff Roberson 	if (n == NULL) {
853aa0a1e58SJeff Roberson 		sb->sb_lastrecord = sb->sb_mb = sb->sb_sndptr = mb;
854aa0a1e58SJeff Roberson 		for (; mb; mb = mb->m_next) {
855aa0a1e58SJeff Roberson 	                sb->sb_mbtail = mb;
856aa0a1e58SJeff Roberson 			sballoc(sb, mb);
857aa0a1e58SJeff Roberson 		}
858aa0a1e58SJeff Roberson 		return;
859aa0a1e58SJeff Roberson 	}
860aa0a1e58SJeff Roberson 	/*
861aa0a1e58SJeff Roberson 	 * Count the number of mbufs in the current tail.
862aa0a1e58SJeff Roberson 	 */
863aa0a1e58SJeff Roberson 	for (ncnt = 0; n->m_next; n = n->m_next)
864aa0a1e58SJeff Roberson 		ncnt++;
865aa0a1e58SJeff Roberson 	n = sb->sb_lastrecord;
866aa0a1e58SJeff Roberson 	/*
867aa0a1e58SJeff Roberson 	 * If the two chains can fit in a single sdp packet and
868aa0a1e58SJeff Roberson 	 * the last record has not been sent yet (WRITABLE) coalesce
869aa0a1e58SJeff Roberson 	 * them.  The lastrecord remains the same but we must strip the
870aa0a1e58SJeff Roberson 	 * packet header and then let sbcompress do the hard part.
871aa0a1e58SJeff Roberson 	 */
872aa0a1e58SJeff Roberson 	if (M_WRITABLE(n) && ncnt + cnt < SDP_MAX_SEND_SGES &&
873aa0a1e58SJeff Roberson 	    n->m_pkthdr.len + mb->m_pkthdr.len - SDP_HEAD_SIZE <
874aa0a1e58SJeff Roberson 	    ssk->xmit_size_goal) {
875aa0a1e58SJeff Roberson 		m_adj(mb, SDP_HEAD_SIZE);
876aa0a1e58SJeff Roberson 		n->m_pkthdr.len += mb->m_pkthdr.len;
877aa0a1e58SJeff Roberson 		n->m_flags |= mb->m_flags & (M_PUSH | M_URG);
878651e4e6aSGleb Smirnoff 		m_demote(mb, 1, 0);
879aa0a1e58SJeff Roberson 		sbcompress(sb, mb, sb->sb_mbtail);
880aa0a1e58SJeff Roberson 		return;
881aa0a1e58SJeff Roberson 	}
882aa0a1e58SJeff Roberson 	/*
883aa0a1e58SJeff Roberson 	 * Not compressible, just append to the end and adjust counters.
884aa0a1e58SJeff Roberson 	 */
885aa0a1e58SJeff Roberson 	sb->sb_lastrecord->m_flags |= M_PUSH;
886aa0a1e58SJeff Roberson 	sb->sb_lastrecord->m_nextpkt = mb;
887aa0a1e58SJeff Roberson 	sb->sb_lastrecord = mb;
888aa0a1e58SJeff Roberson 	if (sb->sb_sndptr == NULL)
889aa0a1e58SJeff Roberson 		sb->sb_sndptr = mb;
890aa0a1e58SJeff Roberson 	for (; mb; mb = mb->m_next) {
891aa0a1e58SJeff Roberson 		sb->sb_mbtail = mb;
892aa0a1e58SJeff Roberson 		sballoc(sb, mb);
893aa0a1e58SJeff Roberson 	}
894aa0a1e58SJeff Roberson }
895aa0a1e58SJeff Roberson 
896aa0a1e58SJeff Roberson /*
897aa0a1e58SJeff Roberson  * Do a send by putting data in output queue and updating urgent
898aa0a1e58SJeff Roberson  * marker if URG set.  Possibly send more data.  Unlike the other
899aa0a1e58SJeff Roberson  * pru_*() routines, the mbuf chains are our responsibility.  We
900aa0a1e58SJeff Roberson  * must either enqueue them or free them.  The other pru_* routines
901aa0a1e58SJeff Roberson  * generally are caller-frees.
902aa0a1e58SJeff Roberson  *
903aa0a1e58SJeff Roberson  * This comes from sendfile, normal sends will come from sdp_sosend().
904aa0a1e58SJeff Roberson  */
905aa0a1e58SJeff Roberson static int
sdp_send(struct socket * so,int flags,struct mbuf * m,struct sockaddr * nam,struct mbuf * control,struct thread * td)906aa0a1e58SJeff Roberson sdp_send(struct socket *so, int flags, struct mbuf *m,
907aa0a1e58SJeff Roberson     struct sockaddr *nam, struct mbuf *control, struct thread *td)
908aa0a1e58SJeff Roberson {
909aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
910aa0a1e58SJeff Roberson 	struct mbuf *n;
911aa0a1e58SJeff Roberson 	int error;
912aa0a1e58SJeff Roberson 	int cnt;
913aa0a1e58SJeff Roberson 
914f161d294SMark Johnston 	if (nam != NULL) {
915f161d294SMark Johnston 		if (nam->sa_family != AF_INET) {
916f161d294SMark Johnston 			if (control)
917f161d294SMark Johnston 				m_freem(control);
918f161d294SMark Johnston 			m_freem(m);
919f161d294SMark Johnston 			return (EAFNOSUPPORT);
920f161d294SMark Johnston 		}
921f161d294SMark Johnston 		if (nam->sa_len != sizeof(struct sockaddr_in)) {
922f161d294SMark Johnston 			if (control)
923f161d294SMark Johnston 				m_freem(control);
924f161d294SMark Johnston 			m_freem(m);
925f161d294SMark Johnston 			return (EINVAL);
926f161d294SMark Johnston 		}
927f161d294SMark Johnston 	}
928f161d294SMark Johnston 
929aa0a1e58SJeff Roberson 	error = 0;
930aa0a1e58SJeff Roberson 	ssk = sdp_sk(so);
931aa0a1e58SJeff Roberson 	KASSERT(m->m_flags & M_PKTHDR,
932aa0a1e58SJeff Roberson 	    ("sdp_send: %p no packet header", m));
933eb1b1807SGleb Smirnoff 	M_PREPEND(m, SDP_HEAD_SIZE, M_WAITOK);
934aa0a1e58SJeff Roberson 	mtod(m, struct sdp_bsdh *)->mid = SDP_MID_DATA;
935aa0a1e58SJeff Roberson 	for (n = m, cnt = 0; n->m_next; n = n->m_next)
936aa0a1e58SJeff Roberson 		cnt++;
937aa0a1e58SJeff Roberson 	if (cnt > SDP_MAX_SEND_SGES) {
938eb1b1807SGleb Smirnoff 		n = m_collapse(m, M_WAITOK, SDP_MAX_SEND_SGES);
939aa0a1e58SJeff Roberson 		if (n == NULL) {
940aa0a1e58SJeff Roberson 			m_freem(m);
941aa0a1e58SJeff Roberson 			return (EMSGSIZE);
942aa0a1e58SJeff Roberson 		}
943aa0a1e58SJeff Roberson 		m = n;
944aa0a1e58SJeff Roberson 		for (cnt = 0; n->m_next; n = n->m_next)
945aa0a1e58SJeff Roberson 			cnt++;
946aa0a1e58SJeff Roberson 	}
947aa0a1e58SJeff Roberson 	SDP_WLOCK(ssk);
948aa0a1e58SJeff Roberson 	if (ssk->flags & (SDP_TIMEWAIT | SDP_DROPPED)) {
949aa0a1e58SJeff Roberson 		if (control)
950aa0a1e58SJeff Roberson 			m_freem(control);
951aa0a1e58SJeff Roberson 		if (m)
952aa0a1e58SJeff Roberson 			m_freem(m);
953aa0a1e58SJeff Roberson 		error = ECONNRESET;
954aa0a1e58SJeff Roberson 		goto out;
955aa0a1e58SJeff Roberson 	}
956aa0a1e58SJeff Roberson 	if (control) {
957aa0a1e58SJeff Roberson 		/* SDP doesn't support control messages. */
958aa0a1e58SJeff Roberson 		if (control->m_len) {
959aa0a1e58SJeff Roberson 			m_freem(control);
960aa0a1e58SJeff Roberson 			if (m)
961aa0a1e58SJeff Roberson 				m_freem(m);
962aa0a1e58SJeff Roberson 			error = EINVAL;
963aa0a1e58SJeff Roberson 			goto out;
964aa0a1e58SJeff Roberson 		}
965aa0a1e58SJeff Roberson 		m_freem(control);	/* empty control, just free it */
966aa0a1e58SJeff Roberson 	}
967aa0a1e58SJeff Roberson 	if (!(flags & PRUS_OOB)) {
968aa0a1e58SJeff Roberson 		SOCKBUF_LOCK(&so->so_snd);
969aa0a1e58SJeff Roberson 		sdp_append(ssk, &so->so_snd, m, cnt);
970aa0a1e58SJeff Roberson 		SOCKBUF_UNLOCK(&so->so_snd);
971aa0a1e58SJeff Roberson 		if (nam && ssk->state < TCPS_SYN_SENT) {
972aa0a1e58SJeff Roberson 			/*
973aa0a1e58SJeff Roberson 			 * Do implied connect if not yet connected.
974aa0a1e58SJeff Roberson 			 */
975aa0a1e58SJeff Roberson 			error = sdp_start_connect(ssk, nam, td);
976aa0a1e58SJeff Roberson 			if (error)
977aa0a1e58SJeff Roberson 				goto out;
978aa0a1e58SJeff Roberson 		}
979aa0a1e58SJeff Roberson 		if (flags & PRUS_EOF) {
980aa0a1e58SJeff Roberson 			/*
981aa0a1e58SJeff Roberson 			 * Close the send side of the connection after
982aa0a1e58SJeff Roberson 			 * the data is sent.
983aa0a1e58SJeff Roberson 			 */
984aa0a1e58SJeff Roberson 			socantsendmore(so);
985aa0a1e58SJeff Roberson 			sdp_usrclosed(ssk);
986aa0a1e58SJeff Roberson 			if (!(ssk->flags & SDP_DROPPED))
987aa0a1e58SJeff Roberson 				sdp_output_disconnect(ssk);
988aa0a1e58SJeff Roberson 		} else if (!(ssk->flags & SDP_DROPPED) &&
989aa0a1e58SJeff Roberson 		    !(flags & PRUS_MORETOCOME))
990aa0a1e58SJeff Roberson 			sdp_post_sends(ssk, M_NOWAIT);
991aa0a1e58SJeff Roberson 		SDP_WUNLOCK(ssk);
992aa0a1e58SJeff Roberson 		return (0);
993aa0a1e58SJeff Roberson 	} else {
994aa0a1e58SJeff Roberson 		SOCKBUF_LOCK(&so->so_snd);
995aa0a1e58SJeff Roberson 		if (sbspace(&so->so_snd) < -512) {
996aa0a1e58SJeff Roberson 			SOCKBUF_UNLOCK(&so->so_snd);
997aa0a1e58SJeff Roberson 			m_freem(m);
998aa0a1e58SJeff Roberson 			error = ENOBUFS;
999aa0a1e58SJeff Roberson 			goto out;
1000aa0a1e58SJeff Roberson 		}
1001aa0a1e58SJeff Roberson 		/*
1002aa0a1e58SJeff Roberson 		 * According to RFC961 (Assigned Protocols),
1003aa0a1e58SJeff Roberson 		 * the urgent pointer points to the last octet
1004aa0a1e58SJeff Roberson 		 * of urgent data.  We continue, however,
1005aa0a1e58SJeff Roberson 		 * to consider it to indicate the first octet
1006aa0a1e58SJeff Roberson 		 * of data past the urgent section.
1007aa0a1e58SJeff Roberson 		 * Otherwise, snd_up should be one lower.
1008aa0a1e58SJeff Roberson 		 */
1009aa0a1e58SJeff Roberson 		m->m_flags |= M_URG | M_PUSH;
1010aa0a1e58SJeff Roberson 		sdp_append(ssk, &so->so_snd, m, cnt);
1011aa0a1e58SJeff Roberson 		SOCKBUF_UNLOCK(&so->so_snd);
1012aa0a1e58SJeff Roberson 		if (nam && ssk->state < TCPS_SYN_SENT) {
1013aa0a1e58SJeff Roberson 			/*
1014aa0a1e58SJeff Roberson 			 * Do implied connect if not yet connected.
1015aa0a1e58SJeff Roberson 			 */
1016aa0a1e58SJeff Roberson 			error = sdp_start_connect(ssk, nam, td);
1017aa0a1e58SJeff Roberson 			if (error)
1018aa0a1e58SJeff Roberson 				goto out;
1019aa0a1e58SJeff Roberson 		}
1020aa0a1e58SJeff Roberson 		sdp_post_sends(ssk, M_NOWAIT);
1021aa0a1e58SJeff Roberson 		SDP_WUNLOCK(ssk);
1022aa0a1e58SJeff Roberson 		return (0);
1023aa0a1e58SJeff Roberson 	}
1024aa0a1e58SJeff Roberson out:
1025aa0a1e58SJeff Roberson 	SDP_WUNLOCK(ssk);
1026aa0a1e58SJeff Roberson 	return (error);
1027aa0a1e58SJeff Roberson }
1028aa0a1e58SJeff Roberson 
1029aa0a1e58SJeff Roberson /*
1030aa0a1e58SJeff Roberson  * Send on a socket.  If send must go all at once and message is larger than
1031aa0a1e58SJeff Roberson  * send buffering, then hard error.  Lock against other senders.  If must go
1032aa0a1e58SJeff Roberson  * all at once and not enough room now, then inform user that this would
1033aa0a1e58SJeff Roberson  * block and do nothing.  Otherwise, if nonblocking, send as much as
1034aa0a1e58SJeff Roberson  * possible.  The data to be sent is described by "uio" if nonzero, otherwise
1035aa0a1e58SJeff Roberson  * by the mbuf chain "top" (which must be null if uio is not).  Data provided
1036aa0a1e58SJeff Roberson  * in mbuf chain must be small enough to send all at once.
1037aa0a1e58SJeff Roberson  *
1038aa0a1e58SJeff Roberson  * Returns nonzero on error, timeout or signal; callers must check for short
1039aa0a1e58SJeff Roberson  * counts if EINTR/ERESTART are returned.  Data and control buffers are freed
1040aa0a1e58SJeff Roberson  * on return.
1041aa0a1e58SJeff Roberson  */
1042aa0a1e58SJeff Roberson static int
sdp_sosend(struct socket * so,struct sockaddr * addr,struct uio * uio,struct mbuf * top,struct mbuf * control,int flags,struct thread * td)1043aa0a1e58SJeff Roberson sdp_sosend(struct socket *so, struct sockaddr *addr, struct uio *uio,
1044aa0a1e58SJeff Roberson     struct mbuf *top, struct mbuf *control, int flags, struct thread *td)
1045aa0a1e58SJeff Roberson {
1046aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
1047aa0a1e58SJeff Roberson 	long space, resid;
1048aa0a1e58SJeff Roberson 	int atomic;
1049aa0a1e58SJeff Roberson 	int error;
1050aa0a1e58SJeff Roberson 	int copy;
1051aa0a1e58SJeff Roberson 
1052aa0a1e58SJeff Roberson 	if (uio != NULL)
1053aa0a1e58SJeff Roberson 		resid = uio->uio_resid;
1054aa0a1e58SJeff Roberson 	else
1055aa0a1e58SJeff Roberson 		resid = top->m_pkthdr.len;
1056aa0a1e58SJeff Roberson 	atomic = top != NULL;
1057aa0a1e58SJeff Roberson 	if (control != NULL) {
1058aa0a1e58SJeff Roberson 		if (control->m_len) {
1059aa0a1e58SJeff Roberson 			m_freem(control);
1060aa0a1e58SJeff Roberson 			if (top)
1061aa0a1e58SJeff Roberson 				m_freem(top);
1062aa0a1e58SJeff Roberson 			return (EINVAL);
1063aa0a1e58SJeff Roberson 		}
1064aa0a1e58SJeff Roberson 		m_freem(control);
1065aa0a1e58SJeff Roberson 		control = NULL;
1066aa0a1e58SJeff Roberson 	}
1067aa0a1e58SJeff Roberson 	/*
1068aa0a1e58SJeff Roberson 	 * In theory resid should be unsigned.  However, space must be
1069aa0a1e58SJeff Roberson 	 * signed, as it might be less than 0 if we over-committed, and we
1070aa0a1e58SJeff Roberson 	 * must use a signed comparison of space and resid.  On the other
1071aa0a1e58SJeff Roberson 	 * hand, a negative resid causes us to loop sending 0-length
1072aa0a1e58SJeff Roberson 	 * segments to the protocol.
1073aa0a1e58SJeff Roberson 	 *
1074aa0a1e58SJeff Roberson 	 * Also check to make sure that MSG_EOR isn't used on SOCK_STREAM
1075aa0a1e58SJeff Roberson 	 * type sockets since that's an error.
1076aa0a1e58SJeff Roberson 	 */
1077aa0a1e58SJeff Roberson 	if (resid < 0 || (so->so_type == SOCK_STREAM && (flags & MSG_EOR))) {
1078aa0a1e58SJeff Roberson 		error = EINVAL;
1079aa0a1e58SJeff Roberson 		goto out;
1080aa0a1e58SJeff Roberson 	}
1081aa0a1e58SJeff Roberson 	if (td != NULL)
1082aa0a1e58SJeff Roberson 		td->td_ru.ru_msgsnd++;
1083aa0a1e58SJeff Roberson 
1084aa0a1e58SJeff Roberson 	ssk = sdp_sk(so);
1085f94acf52SMark Johnston 	error = SOCK_IO_SEND_LOCK(so, SBLOCKWAIT(flags));
1086aa0a1e58SJeff Roberson 	if (error)
1087aa0a1e58SJeff Roberson 		goto out;
1088aa0a1e58SJeff Roberson 
1089aa0a1e58SJeff Roberson restart:
1090aa0a1e58SJeff Roberson 	do {
1091aa0a1e58SJeff Roberson 		SOCKBUF_LOCK(&so->so_snd);
1092aa0a1e58SJeff Roberson 		if (so->so_snd.sb_state & SBS_CANTSENDMORE) {
1093aa0a1e58SJeff Roberson 			SOCKBUF_UNLOCK(&so->so_snd);
1094aa0a1e58SJeff Roberson 			error = EPIPE;
1095aa0a1e58SJeff Roberson 			goto release;
1096aa0a1e58SJeff Roberson 		}
1097aa0a1e58SJeff Roberson 		if (so->so_error) {
1098aa0a1e58SJeff Roberson 			error = so->so_error;
1099aa0a1e58SJeff Roberson 			so->so_error = 0;
1100aa0a1e58SJeff Roberson 			SOCKBUF_UNLOCK(&so->so_snd);
1101aa0a1e58SJeff Roberson 			goto release;
1102aa0a1e58SJeff Roberson 		}
1103aa0a1e58SJeff Roberson 		if ((so->so_state & SS_ISCONNECTED) == 0 && addr == NULL) {
1104aa0a1e58SJeff Roberson 			SOCKBUF_UNLOCK(&so->so_snd);
1105aa0a1e58SJeff Roberson 			error = ENOTCONN;
1106aa0a1e58SJeff Roberson 			goto release;
1107aa0a1e58SJeff Roberson 		}
1108aa0a1e58SJeff Roberson 		space = sbspace(&so->so_snd);
1109aa0a1e58SJeff Roberson 		if (flags & MSG_OOB)
1110aa0a1e58SJeff Roberson 			space += 1024;
1111aa0a1e58SJeff Roberson 		if (atomic && resid > ssk->xmit_size_goal - SDP_HEAD_SIZE) {
1112aa0a1e58SJeff Roberson 			SOCKBUF_UNLOCK(&so->so_snd);
1113aa0a1e58SJeff Roberson 			error = EMSGSIZE;
1114aa0a1e58SJeff Roberson 			goto release;
1115aa0a1e58SJeff Roberson 		}
1116aa0a1e58SJeff Roberson 		if (space < resid &&
1117aa0a1e58SJeff Roberson 		    (atomic || space < so->so_snd.sb_lowat)) {
11182f2ddd68SMark Johnston 			if ((so->so_state & SS_NBIO) ||
11192f2ddd68SMark Johnston 			    (flags & (MSG_NBIO | MSG_DONTWAIT)) != 0) {
1120aa0a1e58SJeff Roberson 				SOCKBUF_UNLOCK(&so->so_snd);
1121aa0a1e58SJeff Roberson 				error = EWOULDBLOCK;
1122aa0a1e58SJeff Roberson 				goto release;
1123aa0a1e58SJeff Roberson 			}
112443283184SGleb Smirnoff 			error = sbwait(so, SO_SND);
1125aa0a1e58SJeff Roberson 			SOCKBUF_UNLOCK(&so->so_snd);
1126aa0a1e58SJeff Roberson 			if (error)
1127aa0a1e58SJeff Roberson 				goto release;
1128aa0a1e58SJeff Roberson 			goto restart;
1129aa0a1e58SJeff Roberson 		}
1130aa0a1e58SJeff Roberson 		SOCKBUF_UNLOCK(&so->so_snd);
1131aa0a1e58SJeff Roberson 		do {
1132aa0a1e58SJeff Roberson 			if (uio == NULL) {
1133aa0a1e58SJeff Roberson 				resid = 0;
1134aa0a1e58SJeff Roberson 				if (flags & MSG_EOR)
1135aa0a1e58SJeff Roberson 					top->m_flags |= M_EOR;
1136aa0a1e58SJeff Roberson 			} else {
1137aa0a1e58SJeff Roberson 				/*
1138aa0a1e58SJeff Roberson 				 * Copy the data from userland into a mbuf
1139aa0a1e58SJeff Roberson 				 * chain.  If no data is to be copied in,
1140aa0a1e58SJeff Roberson 				 * a single empty mbuf is returned.
1141aa0a1e58SJeff Roberson 				 */
1142aa0a1e58SJeff Roberson 				copy = min(space,
1143aa0a1e58SJeff Roberson 				    ssk->xmit_size_goal - SDP_HEAD_SIZE);
1144aa0a1e58SJeff Roberson 				top = m_uiotombuf(uio, M_WAITOK, copy,
1145aa0a1e58SJeff Roberson 				    0, M_PKTHDR |
1146aa0a1e58SJeff Roberson 				    ((flags & MSG_EOR) ? M_EOR : 0));
1147aa0a1e58SJeff Roberson 				if (top == NULL) {
1148aa0a1e58SJeff Roberson 					/* only possible error */
1149aa0a1e58SJeff Roberson 					error = EFAULT;
1150aa0a1e58SJeff Roberson 					goto release;
1151aa0a1e58SJeff Roberson 				}
1152aa0a1e58SJeff Roberson 				space -= resid - uio->uio_resid;
1153aa0a1e58SJeff Roberson 				resid = uio->uio_resid;
1154aa0a1e58SJeff Roberson 			}
1155aa0a1e58SJeff Roberson 			/*
1156aa0a1e58SJeff Roberson 			 * XXX all the SBS_CANTSENDMORE checks previously
1157aa0a1e58SJeff Roberson 			 * done could be out of date after dropping the
1158aa0a1e58SJeff Roberson 			 * socket lock.
1159aa0a1e58SJeff Roberson 			 */
1160aa0a1e58SJeff Roberson 			error = sdp_send(so, (flags & MSG_OOB) ? PRUS_OOB :
1161aa0a1e58SJeff Roberson 			/*
1162aa0a1e58SJeff Roberson 			 * Set EOF on the last send if the user specified
1163aa0a1e58SJeff Roberson 			 * MSG_EOF.
1164aa0a1e58SJeff Roberson 			 */
1165aa0a1e58SJeff Roberson 			    ((flags & MSG_EOF) && (resid <= 0)) ? PRUS_EOF :
1166aa0a1e58SJeff Roberson 			/* If there is more to send set PRUS_MORETOCOME. */
1167aa0a1e58SJeff Roberson 			    (resid > 0 && space > 0) ? PRUS_MORETOCOME : 0,
1168aa0a1e58SJeff Roberson 			    top, addr, NULL, td);
1169aa0a1e58SJeff Roberson 			top = NULL;
1170aa0a1e58SJeff Roberson 			if (error)
1171aa0a1e58SJeff Roberson 				goto release;
1172aa0a1e58SJeff Roberson 		} while (resid && space > 0);
1173aa0a1e58SJeff Roberson 	} while (resid);
1174aa0a1e58SJeff Roberson 
1175aa0a1e58SJeff Roberson release:
1176f94acf52SMark Johnston 	SOCK_IO_SEND_UNLOCK(so);
1177aa0a1e58SJeff Roberson out:
1178aa0a1e58SJeff Roberson 	if (top != NULL)
1179aa0a1e58SJeff Roberson 		m_freem(top);
1180aa0a1e58SJeff Roberson 	return (error);
1181aa0a1e58SJeff Roberson }
1182aa0a1e58SJeff Roberson 
1183aa0a1e58SJeff Roberson /*
1184aa0a1e58SJeff Roberson  * The part of soreceive() that implements reading non-inline out-of-band
1185aa0a1e58SJeff Roberson  * data from a socket.  For more complete comments, see soreceive(), from
1186aa0a1e58SJeff Roberson  * which this code originated.
1187aa0a1e58SJeff Roberson  *
1188aa0a1e58SJeff Roberson  * Note that soreceive_rcvoob(), unlike the remainder of soreceive(), is
1189aa0a1e58SJeff Roberson  * unable to return an mbuf chain to the caller.
1190aa0a1e58SJeff Roberson  */
1191aa0a1e58SJeff Roberson static int
soreceive_rcvoob(struct socket * so,struct uio * uio,int flags)1192aa0a1e58SJeff Roberson soreceive_rcvoob(struct socket *so, struct uio *uio, int flags)
1193aa0a1e58SJeff Roberson {
1194aa0a1e58SJeff Roberson 	struct protosw *pr = so->so_proto;
1195aa0a1e58SJeff Roberson 	struct mbuf *m;
1196aa0a1e58SJeff Roberson 	int error;
1197aa0a1e58SJeff Roberson 
1198aa0a1e58SJeff Roberson 	KASSERT(flags & MSG_OOB, ("soreceive_rcvoob: (flags & MSG_OOB) == 0"));
1199aa0a1e58SJeff Roberson 
1200eb1b1807SGleb Smirnoff 	m = m_get(M_WAITOK, MT_DATA);
1201e7d02be1SGleb Smirnoff 	error = pr->pr_rcvoob(so, m, flags & MSG_PEEK);
1202aa0a1e58SJeff Roberson 	if (error)
1203aa0a1e58SJeff Roberson 		goto bad;
1204aa0a1e58SJeff Roberson 	do {
1205aa0a1e58SJeff Roberson 		error = uiomove(mtod(m, void *),
1206aa0a1e58SJeff Roberson 		    (int) min(uio->uio_resid, m->m_len), uio);
1207aa0a1e58SJeff Roberson 		m = m_free(m);
1208aa0a1e58SJeff Roberson 	} while (uio->uio_resid && error == 0 && m);
1209aa0a1e58SJeff Roberson bad:
1210aa0a1e58SJeff Roberson 	if (m != NULL)
1211aa0a1e58SJeff Roberson 		m_freem(m);
1212aa0a1e58SJeff Roberson 	return (error);
1213aa0a1e58SJeff Roberson }
1214aa0a1e58SJeff Roberson 
1215aa0a1e58SJeff Roberson /*
1216aa0a1e58SJeff Roberson  * Optimized version of soreceive() for stream (TCP) sockets.
1217aa0a1e58SJeff Roberson  */
1218aa0a1e58SJeff Roberson static int
sdp_sorecv(struct socket * so,struct sockaddr ** psa,struct uio * uio,struct mbuf ** mp0,struct mbuf ** controlp,int * flagsp)1219aa0a1e58SJeff Roberson sdp_sorecv(struct socket *so, struct sockaddr **psa, struct uio *uio,
1220aa0a1e58SJeff Roberson     struct mbuf **mp0, struct mbuf **controlp, int *flagsp)
1221aa0a1e58SJeff Roberson {
1222aa0a1e58SJeff Roberson 	int len = 0, error = 0, flags, oresid;
1223aa0a1e58SJeff Roberson 	struct sockbuf *sb;
1224aa0a1e58SJeff Roberson 	struct mbuf *m, *n = NULL;
1225aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
1226aa0a1e58SJeff Roberson 
1227aa0a1e58SJeff Roberson 	/* We only do stream sockets. */
1228aa0a1e58SJeff Roberson 	if (so->so_type != SOCK_STREAM)
1229aa0a1e58SJeff Roberson 		return (EINVAL);
1230aa0a1e58SJeff Roberson 	if (psa != NULL)
1231aa0a1e58SJeff Roberson 		*psa = NULL;
1232aa0a1e58SJeff Roberson 	if (controlp != NULL)
1233aa0a1e58SJeff Roberson 		return (EINVAL);
1234aa0a1e58SJeff Roberson 	if (flagsp != NULL)
1235aa0a1e58SJeff Roberson 		flags = *flagsp &~ MSG_EOR;
1236aa0a1e58SJeff Roberson 	else
1237aa0a1e58SJeff Roberson 		flags = 0;
1238aa0a1e58SJeff Roberson 	if (flags & MSG_OOB)
1239aa0a1e58SJeff Roberson 		return (soreceive_rcvoob(so, uio, flags));
1240aa0a1e58SJeff Roberson 	if (mp0 != NULL)
1241aa0a1e58SJeff Roberson 		*mp0 = NULL;
1242aa0a1e58SJeff Roberson 
1243aa0a1e58SJeff Roberson 	sb = &so->so_rcv;
1244aa0a1e58SJeff Roberson 	ssk = sdp_sk(so);
1245aa0a1e58SJeff Roberson 
1246aa0a1e58SJeff Roberson 	/* Prevent other readers from entering the socket. */
1247f94acf52SMark Johnston 	error = SOCK_IO_RECV_LOCK(so, SBLOCKWAIT(flags));
1248aa0a1e58SJeff Roberson 	if (error)
1249f94acf52SMark Johnston 		return (error);
1250aa0a1e58SJeff Roberson 	SOCKBUF_LOCK(sb);
1251aa0a1e58SJeff Roberson 
1252aa0a1e58SJeff Roberson 	/* Easy one, no space to copyout anything. */
1253aa0a1e58SJeff Roberson 	if (uio->uio_resid == 0) {
1254aa0a1e58SJeff Roberson 		error = EINVAL;
1255aa0a1e58SJeff Roberson 		goto out;
1256aa0a1e58SJeff Roberson 	}
1257aa0a1e58SJeff Roberson 	oresid = uio->uio_resid;
1258aa0a1e58SJeff Roberson 
1259aa0a1e58SJeff Roberson 	/* We will never ever get anything unless we are connected. */
1260aa0a1e58SJeff Roberson 	if (!(so->so_state & (SS_ISCONNECTED|SS_ISDISCONNECTED))) {
1261aa0a1e58SJeff Roberson 		/* When disconnecting there may be still some data left. */
1262cfa6009eSGleb Smirnoff 		if (sbavail(sb))
1263aa0a1e58SJeff Roberson 			goto deliver;
1264aa0a1e58SJeff Roberson 		if (!(so->so_state & SS_ISDISCONNECTED))
1265aa0a1e58SJeff Roberson 			error = ENOTCONN;
1266aa0a1e58SJeff Roberson 		goto out;
1267aa0a1e58SJeff Roberson 	}
1268aa0a1e58SJeff Roberson 
1269aa0a1e58SJeff Roberson 	/* Socket buffer is empty and we shall not block. */
1270cfa6009eSGleb Smirnoff 	if (sbavail(sb) == 0 &&
1271e5fb5622SJohn Baldwin 	    ((so->so_state & SS_NBIO) || (flags & (MSG_DONTWAIT|MSG_NBIO)))) {
1272aa0a1e58SJeff Roberson 		error = EAGAIN;
1273aa0a1e58SJeff Roberson 		goto out;
1274aa0a1e58SJeff Roberson 	}
1275aa0a1e58SJeff Roberson 
1276aa0a1e58SJeff Roberson restart:
1277aa0a1e58SJeff Roberson 	SOCKBUF_LOCK_ASSERT(&so->so_rcv);
1278aa0a1e58SJeff Roberson 
1279aa0a1e58SJeff Roberson 	/* Abort if socket has reported problems. */
1280aa0a1e58SJeff Roberson 	if (so->so_error) {
1281cfa6009eSGleb Smirnoff 		if (sbavail(sb))
1282aa0a1e58SJeff Roberson 			goto deliver;
1283aa0a1e58SJeff Roberson 		if (oresid > uio->uio_resid)
1284aa0a1e58SJeff Roberson 			goto out;
1285aa0a1e58SJeff Roberson 		error = so->so_error;
1286aa0a1e58SJeff Roberson 		if (!(flags & MSG_PEEK))
1287aa0a1e58SJeff Roberson 			so->so_error = 0;
1288aa0a1e58SJeff Roberson 		goto out;
1289aa0a1e58SJeff Roberson 	}
1290aa0a1e58SJeff Roberson 
1291aa0a1e58SJeff Roberson 	/* Door is closed.  Deliver what is left, if any. */
1292aa0a1e58SJeff Roberson 	if (sb->sb_state & SBS_CANTRCVMORE) {
1293cfa6009eSGleb Smirnoff 		if (sbavail(sb))
1294aa0a1e58SJeff Roberson 			goto deliver;
1295aa0a1e58SJeff Roberson 		else
1296aa0a1e58SJeff Roberson 			goto out;
1297aa0a1e58SJeff Roberson 	}
1298aa0a1e58SJeff Roberson 
1299aa0a1e58SJeff Roberson 	/* Socket buffer got some data that we shall deliver now. */
1300cfa6009eSGleb Smirnoff 	if (sbavail(sb) && !(flags & MSG_WAITALL) &&
1301e5fb5622SJohn Baldwin 	    ((so->so_state & SS_NBIO) ||
1302aa0a1e58SJeff Roberson 	     (flags & (MSG_DONTWAIT|MSG_NBIO)) ||
1303cfa6009eSGleb Smirnoff 	     sbavail(sb) >= sb->sb_lowat ||
1304cfa6009eSGleb Smirnoff 	     sbavail(sb) >= uio->uio_resid ||
1305cfa6009eSGleb Smirnoff 	     sbavail(sb) >= sb->sb_hiwat) ) {
1306aa0a1e58SJeff Roberson 		goto deliver;
1307aa0a1e58SJeff Roberson 	}
1308aa0a1e58SJeff Roberson 
1309aa0a1e58SJeff Roberson 	/* On MSG_WAITALL we must wait until all data or error arrives. */
1310aa0a1e58SJeff Roberson 	if ((flags & MSG_WAITALL) &&
1311cfa6009eSGleb Smirnoff 	    (sbavail(sb) >= uio->uio_resid || sbavail(sb) >= sb->sb_lowat))
1312aa0a1e58SJeff Roberson 		goto deliver;
1313aa0a1e58SJeff Roberson 
1314aa0a1e58SJeff Roberson 	/*
1315aa0a1e58SJeff Roberson 	 * Wait and block until (more) data comes in.
1316aa0a1e58SJeff Roberson 	 * NB: Drops the sockbuf lock during wait.
1317aa0a1e58SJeff Roberson 	 */
131843283184SGleb Smirnoff 	error = sbwait(so, SO_RCV);
1319aa0a1e58SJeff Roberson 	if (error)
1320aa0a1e58SJeff Roberson 		goto out;
1321aa0a1e58SJeff Roberson 	goto restart;
1322aa0a1e58SJeff Roberson 
1323aa0a1e58SJeff Roberson deliver:
1324aa0a1e58SJeff Roberson 	SOCKBUF_LOCK_ASSERT(&so->so_rcv);
1325cfa6009eSGleb Smirnoff 	KASSERT(sbavail(sb), ("%s: sockbuf empty", __func__));
1326aa0a1e58SJeff Roberson 	KASSERT(sb->sb_mb != NULL, ("%s: sb_mb == NULL", __func__));
1327aa0a1e58SJeff Roberson 
1328aa0a1e58SJeff Roberson 	/* Statistics. */
1329aa0a1e58SJeff Roberson 	if (uio->uio_td)
1330aa0a1e58SJeff Roberson 		uio->uio_td->td_ru.ru_msgrcv++;
1331aa0a1e58SJeff Roberson 
1332aa0a1e58SJeff Roberson 	/* Fill uio until full or current end of socket buffer is reached. */
1333cfa6009eSGleb Smirnoff 	len = min(uio->uio_resid, sbavail(sb));
1334aa0a1e58SJeff Roberson 	if (mp0 != NULL) {
1335aa0a1e58SJeff Roberson 		/* Dequeue as many mbufs as possible. */
1336aa0a1e58SJeff Roberson 		if (!(flags & MSG_PEEK) && len >= sb->sb_mb->m_len) {
1337aa0a1e58SJeff Roberson 			for (*mp0 = m = sb->sb_mb;
1338aa0a1e58SJeff Roberson 			     m != NULL && m->m_len <= len;
1339aa0a1e58SJeff Roberson 			     m = m->m_next) {
1340aa0a1e58SJeff Roberson 				len -= m->m_len;
1341aa0a1e58SJeff Roberson 				uio->uio_resid -= m->m_len;
1342aa0a1e58SJeff Roberson 				sbfree(sb, m);
1343aa0a1e58SJeff Roberson 				n = m;
1344aa0a1e58SJeff Roberson 			}
1345aa0a1e58SJeff Roberson 			sb->sb_mb = m;
1346aa0a1e58SJeff Roberson 			if (sb->sb_mb == NULL)
1347aa0a1e58SJeff Roberson 				SB_EMPTY_FIXUP(sb);
1348aa0a1e58SJeff Roberson 			n->m_next = NULL;
1349aa0a1e58SJeff Roberson 		}
1350aa0a1e58SJeff Roberson 		/* Copy the remainder. */
1351aa0a1e58SJeff Roberson 		if (len > 0) {
1352aa0a1e58SJeff Roberson 			KASSERT(sb->sb_mb != NULL,
1353aa0a1e58SJeff Roberson 			    ("%s: len > 0 && sb->sb_mb empty", __func__));
1354aa0a1e58SJeff Roberson 
1355eb1b1807SGleb Smirnoff 			m = m_copym(sb->sb_mb, 0, len, M_NOWAIT);
1356aa0a1e58SJeff Roberson 			if (m == NULL)
1357aa0a1e58SJeff Roberson 				len = 0;	/* Don't flush data from sockbuf. */
1358aa0a1e58SJeff Roberson 			else
1359aa0a1e58SJeff Roberson 				uio->uio_resid -= m->m_len;
1360aa0a1e58SJeff Roberson 			if (*mp0 != NULL)
1361aa0a1e58SJeff Roberson 				n->m_next = m;
1362aa0a1e58SJeff Roberson 			else
1363aa0a1e58SJeff Roberson 				*mp0 = m;
1364aa0a1e58SJeff Roberson 			if (*mp0 == NULL) {
1365aa0a1e58SJeff Roberson 				error = ENOBUFS;
1366aa0a1e58SJeff Roberson 				goto out;
1367aa0a1e58SJeff Roberson 			}
1368aa0a1e58SJeff Roberson 		}
1369aa0a1e58SJeff Roberson 	} else {
1370aa0a1e58SJeff Roberson 		/* NB: Must unlock socket buffer as uiomove may sleep. */
1371aa0a1e58SJeff Roberson 		SOCKBUF_UNLOCK(sb);
1372aa0a1e58SJeff Roberson 		error = m_mbuftouio(uio, sb->sb_mb, len);
1373aa0a1e58SJeff Roberson 		SOCKBUF_LOCK(sb);
1374aa0a1e58SJeff Roberson 		if (error)
1375aa0a1e58SJeff Roberson 			goto out;
1376aa0a1e58SJeff Roberson 	}
1377aa0a1e58SJeff Roberson 	SBLASTRECORDCHK(sb);
1378aa0a1e58SJeff Roberson 	SBLASTMBUFCHK(sb);
1379aa0a1e58SJeff Roberson 
1380aa0a1e58SJeff Roberson 	/*
1381aa0a1e58SJeff Roberson 	 * Remove the delivered data from the socket buffer unless we
1382aa0a1e58SJeff Roberson 	 * were only peeking.
1383aa0a1e58SJeff Roberson 	 */
1384aa0a1e58SJeff Roberson 	if (!(flags & MSG_PEEK)) {
1385aa0a1e58SJeff Roberson 		if (len > 0)
1386aa0a1e58SJeff Roberson 			sbdrop_locked(sb, len);
1387aa0a1e58SJeff Roberson 
1388aa0a1e58SJeff Roberson 		/* Notify protocol that we drained some data. */
1389aa0a1e58SJeff Roberson 		SOCKBUF_UNLOCK(sb);
1390aa0a1e58SJeff Roberson 		SDP_WLOCK(ssk);
1391aa0a1e58SJeff Roberson 		sdp_do_posts(ssk);
1392aa0a1e58SJeff Roberson 		SDP_WUNLOCK(ssk);
1393aa0a1e58SJeff Roberson 		SOCKBUF_LOCK(sb);
1394aa0a1e58SJeff Roberson 	}
1395aa0a1e58SJeff Roberson 
1396aa0a1e58SJeff Roberson 	/*
1397aa0a1e58SJeff Roberson 	 * For MSG_WAITALL we may have to loop again and wait for
1398aa0a1e58SJeff Roberson 	 * more data to come in.
1399aa0a1e58SJeff Roberson 	 */
1400aa0a1e58SJeff Roberson 	if ((flags & MSG_WAITALL) && uio->uio_resid > 0)
1401aa0a1e58SJeff Roberson 		goto restart;
1402aa0a1e58SJeff Roberson out:
1403aa0a1e58SJeff Roberson 	SBLASTRECORDCHK(sb);
1404aa0a1e58SJeff Roberson 	SBLASTMBUFCHK(sb);
1405aa0a1e58SJeff Roberson 	SOCKBUF_UNLOCK(sb);
1406f94acf52SMark Johnston 	SOCK_IO_RECV_UNLOCK(so);
1407aa0a1e58SJeff Roberson 	return (error);
1408aa0a1e58SJeff Roberson }
1409aa0a1e58SJeff Roberson 
1410aa0a1e58SJeff Roberson /*
1411aa0a1e58SJeff Roberson  * Abort is used to teardown a connection typically while sitting in
1412aa0a1e58SJeff Roberson  * the accept queue.
1413aa0a1e58SJeff Roberson  */
1414aa0a1e58SJeff Roberson void
sdp_abort(struct socket * so)1415aa0a1e58SJeff Roberson sdp_abort(struct socket *so)
1416aa0a1e58SJeff Roberson {
1417aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
1418aa0a1e58SJeff Roberson 
1419aa0a1e58SJeff Roberson 	ssk = sdp_sk(so);
1420aa0a1e58SJeff Roberson 	SDP_WLOCK(ssk);
1421aa0a1e58SJeff Roberson 	/*
1422aa0a1e58SJeff Roberson 	 * If we have not yet dropped, do it now.
1423aa0a1e58SJeff Roberson 	 */
1424aa0a1e58SJeff Roberson 	if (!(ssk->flags & SDP_TIMEWAIT) &&
1425aa0a1e58SJeff Roberson 	    !(ssk->flags & SDP_DROPPED))
1426aa0a1e58SJeff Roberson 		sdp_drop(ssk, ECONNABORTED);
1427aa0a1e58SJeff Roberson 	KASSERT(ssk->flags & SDP_DROPPED, ("sdp_abort: %p not dropped 0x%X",
1428aa0a1e58SJeff Roberson 	    ssk, ssk->flags));
1429aa0a1e58SJeff Roberson 	SDP_WUNLOCK(ssk);
1430aa0a1e58SJeff Roberson }
1431aa0a1e58SJeff Roberson 
1432aa0a1e58SJeff Roberson /*
1433aa0a1e58SJeff Roberson  * Close a SDP socket and initiate a friendly disconnect.
1434aa0a1e58SJeff Roberson  */
1435aa0a1e58SJeff Roberson static void
sdp_close(struct socket * so)1436aa0a1e58SJeff Roberson sdp_close(struct socket *so)
1437aa0a1e58SJeff Roberson {
1438aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
1439aa0a1e58SJeff Roberson 
1440aa0a1e58SJeff Roberson 	ssk = sdp_sk(so);
1441aa0a1e58SJeff Roberson 	SDP_WLOCK(ssk);
1442aa0a1e58SJeff Roberson 	/*
1443aa0a1e58SJeff Roberson 	 * If we have not yet dropped, do it now.
1444aa0a1e58SJeff Roberson 	 */
1445aa0a1e58SJeff Roberson 	if (!(ssk->flags & SDP_TIMEWAIT) &&
1446aa0a1e58SJeff Roberson 	    !(ssk->flags & SDP_DROPPED))
1447aa0a1e58SJeff Roberson 		sdp_start_disconnect(ssk);
1448aa0a1e58SJeff Roberson 
1449aa0a1e58SJeff Roberson 	/*
1450aa0a1e58SJeff Roberson 	 * If we've still not dropped let the socket layer know we're
1451aa0a1e58SJeff Roberson 	 * holding on to the socket and pcb for a while.
1452aa0a1e58SJeff Roberson 	 */
1453aa0a1e58SJeff Roberson 	if (!(ssk->flags & SDP_DROPPED)) {
1454aa0a1e58SJeff Roberson 		ssk->flags |= SDP_SOCKREF;
1455d8596171SGleb Smirnoff 		soref(so);
1456aa0a1e58SJeff Roberson 	}
1457aa0a1e58SJeff Roberson 	SDP_WUNLOCK(ssk);
1458aa0a1e58SJeff Roberson }
1459aa0a1e58SJeff Roberson 
1460aa0a1e58SJeff Roberson /*
1461aa0a1e58SJeff Roberson  * User requests out-of-band data.
1462aa0a1e58SJeff Roberson  */
1463aa0a1e58SJeff Roberson static int
sdp_rcvoob(struct socket * so,struct mbuf * m,int flags)1464aa0a1e58SJeff Roberson sdp_rcvoob(struct socket *so, struct mbuf *m, int flags)
1465aa0a1e58SJeff Roberson {
1466aa0a1e58SJeff Roberson 	int error = 0;
1467aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
1468aa0a1e58SJeff Roberson 
1469aa0a1e58SJeff Roberson 	ssk = sdp_sk(so);
1470aa0a1e58SJeff Roberson 	SDP_WLOCK(ssk);
1471aa0a1e58SJeff Roberson 	if (!rx_ring_trylock(&ssk->rx_ring)) {
1472aa0a1e58SJeff Roberson 		SDP_WUNLOCK(ssk);
1473aa0a1e58SJeff Roberson 		return (ECONNRESET);
1474aa0a1e58SJeff Roberson 	}
1475aa0a1e58SJeff Roberson 	if (ssk->flags & (SDP_TIMEWAIT | SDP_DROPPED)) {
1476aa0a1e58SJeff Roberson 		error = ECONNRESET;
1477aa0a1e58SJeff Roberson 		goto out;
1478aa0a1e58SJeff Roberson 	}
1479aa0a1e58SJeff Roberson 	if ((so->so_oobmark == 0 &&
1480aa0a1e58SJeff Roberson 	     (so->so_rcv.sb_state & SBS_RCVATMARK) == 0) ||
1481aa0a1e58SJeff Roberson 	    so->so_options & SO_OOBINLINE ||
1482aa0a1e58SJeff Roberson 	    ssk->oobflags & SDP_HADOOB) {
1483aa0a1e58SJeff Roberson 		error = EINVAL;
1484aa0a1e58SJeff Roberson 		goto out;
1485aa0a1e58SJeff Roberson 	}
1486aa0a1e58SJeff Roberson 	if ((ssk->oobflags & SDP_HAVEOOB) == 0) {
1487aa0a1e58SJeff Roberson 		error = EWOULDBLOCK;
1488aa0a1e58SJeff Roberson 		goto out;
1489aa0a1e58SJeff Roberson 	}
1490aa0a1e58SJeff Roberson 	m->m_len = 1;
1491aa0a1e58SJeff Roberson 	*mtod(m, caddr_t) = ssk->iobc;
1492aa0a1e58SJeff Roberson 	if ((flags & MSG_PEEK) == 0)
1493aa0a1e58SJeff Roberson 		ssk->oobflags ^= (SDP_HAVEOOB | SDP_HADOOB);
1494aa0a1e58SJeff Roberson out:
1495aa0a1e58SJeff Roberson 	rx_ring_unlock(&ssk->rx_ring);
1496aa0a1e58SJeff Roberson 	SDP_WUNLOCK(ssk);
1497aa0a1e58SJeff Roberson 	return (error);
1498aa0a1e58SJeff Roberson }
1499aa0a1e58SJeff Roberson 
1500aa0a1e58SJeff Roberson void
sdp_urg(struct sdp_sock * ssk,struct mbuf * mb)1501aa0a1e58SJeff Roberson sdp_urg(struct sdp_sock *ssk, struct mbuf *mb)
1502aa0a1e58SJeff Roberson {
1503aa0a1e58SJeff Roberson 	struct mbuf *m;
1504aa0a1e58SJeff Roberson 	struct socket *so;
1505aa0a1e58SJeff Roberson 
1506aa0a1e58SJeff Roberson 	so = ssk->socket;
1507aa0a1e58SJeff Roberson 	if (so == NULL)
1508aa0a1e58SJeff Roberson 		return;
1509aa0a1e58SJeff Roberson 
1510cfa6009eSGleb Smirnoff 	so->so_oobmark = sbused(&so->so_rcv) + mb->m_pkthdr.len - 1;
1511aa0a1e58SJeff Roberson 	sohasoutofband(so);
1512aa0a1e58SJeff Roberson 	ssk->oobflags &= ~(SDP_HAVEOOB | SDP_HADOOB);
1513aa0a1e58SJeff Roberson 	if (!(so->so_options & SO_OOBINLINE)) {
1514aa0a1e58SJeff Roberson 		for (m = mb; m->m_next != NULL; m = m->m_next);
1515aa0a1e58SJeff Roberson 		ssk->iobc = *(mtod(m, char *) + m->m_len - 1);
1516aa0a1e58SJeff Roberson 		ssk->oobflags |= SDP_HAVEOOB;
1517aa0a1e58SJeff Roberson 		m->m_len--;
1518aa0a1e58SJeff Roberson 		mb->m_pkthdr.len--;
1519aa0a1e58SJeff Roberson 	}
1520aa0a1e58SJeff Roberson }
1521aa0a1e58SJeff Roberson 
1522aa0a1e58SJeff Roberson /*
1523aa0a1e58SJeff Roberson  * Notify a sdp socket of an asynchronous error.
1524aa0a1e58SJeff Roberson  *
1525aa0a1e58SJeff Roberson  * Do not wake up user since there currently is no mechanism for
1526aa0a1e58SJeff Roberson  * reporting soft errors (yet - a kqueue filter may be added).
1527aa0a1e58SJeff Roberson  */
1528aa0a1e58SJeff Roberson struct sdp_sock *
sdp_notify(struct sdp_sock * ssk,int error)1529aa0a1e58SJeff Roberson sdp_notify(struct sdp_sock *ssk, int error)
1530aa0a1e58SJeff Roberson {
1531aa0a1e58SJeff Roberson 
1532aa0a1e58SJeff Roberson 	SDP_WLOCK_ASSERT(ssk);
1533aa0a1e58SJeff Roberson 
1534aa0a1e58SJeff Roberson 	if ((ssk->flags & SDP_TIMEWAIT) ||
1535aa0a1e58SJeff Roberson 	    (ssk->flags & SDP_DROPPED))
1536aa0a1e58SJeff Roberson 		return (ssk);
1537aa0a1e58SJeff Roberson 
1538aa0a1e58SJeff Roberson 	/*
1539aa0a1e58SJeff Roberson 	 * Ignore some errors if we are hooked up.
1540aa0a1e58SJeff Roberson 	 */
1541aa0a1e58SJeff Roberson 	if (ssk->state == TCPS_ESTABLISHED &&
1542aa0a1e58SJeff Roberson 	    (error == EHOSTUNREACH || error == ENETUNREACH ||
1543aa0a1e58SJeff Roberson 	     error == EHOSTDOWN))
1544aa0a1e58SJeff Roberson 		return (ssk);
1545aa0a1e58SJeff Roberson 	ssk->softerror = error;
1546aa0a1e58SJeff Roberson 	return sdp_drop(ssk, error);
1547aa0a1e58SJeff Roberson }
1548aa0a1e58SJeff Roberson 
1549aa0a1e58SJeff Roberson static void
sdp_keepalive_timeout(void * data)1550aa0a1e58SJeff Roberson sdp_keepalive_timeout(void *data)
1551aa0a1e58SJeff Roberson {
1552aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
1553aa0a1e58SJeff Roberson 
1554aa0a1e58SJeff Roberson 	ssk = data;
1555aa0a1e58SJeff Roberson 	/* Callout canceled. */
1556aa0a1e58SJeff Roberson         if (!callout_active(&ssk->keep2msl))
1557aa0a1e58SJeff Roberson                 return;
1558aa0a1e58SJeff Roberson 	/* Callout rescheduled as a different kind of timer. */
1559aa0a1e58SJeff Roberson 	if (callout_pending(&ssk->keep2msl))
1560aa0a1e58SJeff Roberson 		goto out;
1561aa0a1e58SJeff Roberson         callout_deactivate(&ssk->keep2msl);
1562aa0a1e58SJeff Roberson 	if (ssk->flags & SDP_DROPPED ||
1563aa0a1e58SJeff Roberson 	    (ssk->socket->so_options & SO_KEEPALIVE) == 0)
1564aa0a1e58SJeff Roberson 		goto out;
1565aa0a1e58SJeff Roberson 	sdp_post_keepalive(ssk);
1566aa0a1e58SJeff Roberson 	callout_reset(&ssk->keep2msl, SDP_KEEPALIVE_TIME,
1567aa0a1e58SJeff Roberson 	    sdp_keepalive_timeout, ssk);
1568aa0a1e58SJeff Roberson out:
1569aa0a1e58SJeff Roberson 	SDP_WUNLOCK(ssk);
1570aa0a1e58SJeff Roberson }
1571aa0a1e58SJeff Roberson 
1572aa0a1e58SJeff Roberson 
1573aa0a1e58SJeff Roberson void
sdp_start_keepalive_timer(struct socket * so)1574aa0a1e58SJeff Roberson sdp_start_keepalive_timer(struct socket *so)
1575aa0a1e58SJeff Roberson {
1576aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
1577aa0a1e58SJeff Roberson 
1578aa0a1e58SJeff Roberson 	ssk = sdp_sk(so);
1579aa0a1e58SJeff Roberson 	if (!callout_pending(&ssk->keep2msl))
1580aa0a1e58SJeff Roberson                 callout_reset(&ssk->keep2msl, SDP_KEEPALIVE_TIME,
1581aa0a1e58SJeff Roberson                     sdp_keepalive_timeout, ssk);
1582aa0a1e58SJeff Roberson }
1583aa0a1e58SJeff Roberson 
1584aa0a1e58SJeff Roberson static void
sdp_stop_keepalive_timer(struct socket * so)1585aa0a1e58SJeff Roberson sdp_stop_keepalive_timer(struct socket *so)
1586aa0a1e58SJeff Roberson {
1587aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
1588aa0a1e58SJeff Roberson 
1589aa0a1e58SJeff Roberson 	ssk = sdp_sk(so);
1590aa0a1e58SJeff Roberson 	callout_stop(&ssk->keep2msl);
1591aa0a1e58SJeff Roberson }
1592aa0a1e58SJeff Roberson 
1593aa0a1e58SJeff Roberson /*
1594aa0a1e58SJeff Roberson  * sdp_ctloutput() must drop the inpcb lock before performing copyin on
1595aa0a1e58SJeff Roberson  * socket option arguments.  When it re-acquires the lock after the copy, it
1596aa0a1e58SJeff Roberson  * has to revalidate that the connection is still valid for the socket
1597aa0a1e58SJeff Roberson  * option.
1598aa0a1e58SJeff Roberson  */
1599aa0a1e58SJeff Roberson #define SDP_WLOCK_RECHECK(inp) do {					\
1600aa0a1e58SJeff Roberson 	SDP_WLOCK(ssk);							\
1601aa0a1e58SJeff Roberson 	if (ssk->flags & (SDP_TIMEWAIT | SDP_DROPPED)) {		\
1602aa0a1e58SJeff Roberson 		SDP_WUNLOCK(ssk);					\
1603aa0a1e58SJeff Roberson 		return (ECONNRESET);					\
1604aa0a1e58SJeff Roberson 	}								\
1605aa0a1e58SJeff Roberson } while(0)
1606aa0a1e58SJeff Roberson 
1607aa0a1e58SJeff Roberson static int
sdp_ctloutput(struct socket * so,struct sockopt * sopt)1608aa0a1e58SJeff Roberson sdp_ctloutput(struct socket *so, struct sockopt *sopt)
1609aa0a1e58SJeff Roberson {
1610aa0a1e58SJeff Roberson 	int	error, opt, optval;
1611aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
1612aa0a1e58SJeff Roberson 
1613aa0a1e58SJeff Roberson 	error = 0;
1614aa0a1e58SJeff Roberson 	ssk = sdp_sk(so);
1615aa0a1e58SJeff Roberson 	if (sopt->sopt_level == SOL_SOCKET && sopt->sopt_name == SO_KEEPALIVE) {
1616aa0a1e58SJeff Roberson 		SDP_WLOCK(ssk);
1617aa0a1e58SJeff Roberson 		if (so->so_options & SO_KEEPALIVE)
1618aa0a1e58SJeff Roberson 			sdp_start_keepalive_timer(so);
1619aa0a1e58SJeff Roberson 		else
1620aa0a1e58SJeff Roberson 			sdp_stop_keepalive_timer(so);
1621aa0a1e58SJeff Roberson 		SDP_WUNLOCK(ssk);
1622aa0a1e58SJeff Roberson 	}
1623aa0a1e58SJeff Roberson 	if (sopt->sopt_level != IPPROTO_TCP)
1624aa0a1e58SJeff Roberson 		return (error);
1625aa0a1e58SJeff Roberson 
1626aa0a1e58SJeff Roberson 	SDP_WLOCK(ssk);
1627aa0a1e58SJeff Roberson 	if (ssk->flags & (SDP_TIMEWAIT | SDP_DROPPED)) {
1628aa0a1e58SJeff Roberson 		SDP_WUNLOCK(ssk);
1629aa0a1e58SJeff Roberson 		return (ECONNRESET);
1630aa0a1e58SJeff Roberson 	}
1631aa0a1e58SJeff Roberson 
1632aa0a1e58SJeff Roberson 	switch (sopt->sopt_dir) {
1633aa0a1e58SJeff Roberson 	case SOPT_SET:
1634aa0a1e58SJeff Roberson 		switch (sopt->sopt_name) {
1635aa0a1e58SJeff Roberson 		case TCP_NODELAY:
1636aa0a1e58SJeff Roberson 			SDP_WUNLOCK(ssk);
1637aa0a1e58SJeff Roberson 			error = sooptcopyin(sopt, &optval, sizeof optval,
1638aa0a1e58SJeff Roberson 			    sizeof optval);
1639aa0a1e58SJeff Roberson 			if (error)
1640aa0a1e58SJeff Roberson 				return (error);
1641aa0a1e58SJeff Roberson 
1642aa0a1e58SJeff Roberson 			SDP_WLOCK_RECHECK(ssk);
1643aa0a1e58SJeff Roberson 			opt = SDP_NODELAY;
1644aa0a1e58SJeff Roberson 			if (optval)
1645aa0a1e58SJeff Roberson 				ssk->flags |= opt;
1646aa0a1e58SJeff Roberson 			else
1647aa0a1e58SJeff Roberson 				ssk->flags &= ~opt;
1648aa0a1e58SJeff Roberson 			sdp_do_posts(ssk);
1649aa0a1e58SJeff Roberson 			SDP_WUNLOCK(ssk);
1650aa0a1e58SJeff Roberson 			break;
1651aa0a1e58SJeff Roberson 
1652aa0a1e58SJeff Roberson 		default:
1653aa0a1e58SJeff Roberson 			SDP_WUNLOCK(ssk);
1654aa0a1e58SJeff Roberson 			error = ENOPROTOOPT;
1655aa0a1e58SJeff Roberson 			break;
1656aa0a1e58SJeff Roberson 		}
1657aa0a1e58SJeff Roberson 		break;
1658aa0a1e58SJeff Roberson 
1659aa0a1e58SJeff Roberson 	case SOPT_GET:
1660aa0a1e58SJeff Roberson 		switch (sopt->sopt_name) {
1661aa0a1e58SJeff Roberson 		case TCP_NODELAY:
1662aa0a1e58SJeff Roberson 			optval = ssk->flags & SDP_NODELAY;
1663aa0a1e58SJeff Roberson 			SDP_WUNLOCK(ssk);
1664aa0a1e58SJeff Roberson 			error = sooptcopyout(sopt, &optval, sizeof optval);
1665aa0a1e58SJeff Roberson 			break;
1666aa0a1e58SJeff Roberson 		default:
1667aa0a1e58SJeff Roberson 			SDP_WUNLOCK(ssk);
1668aa0a1e58SJeff Roberson 			error = ENOPROTOOPT;
1669aa0a1e58SJeff Roberson 			break;
1670aa0a1e58SJeff Roberson 		}
1671aa0a1e58SJeff Roberson 		break;
1672aa0a1e58SJeff Roberson 	}
1673aa0a1e58SJeff Roberson 	return (error);
1674aa0a1e58SJeff Roberson }
1675aa0a1e58SJeff Roberson #undef SDP_WLOCK_RECHECK
1676aa0a1e58SJeff Roberson 
1677aa0a1e58SJeff Roberson int sdp_mod_count = 0;
1678aa0a1e58SJeff Roberson int sdp_mod_usec = 0;
1679aa0a1e58SJeff Roberson 
1680aa0a1e58SJeff Roberson void
sdp_set_default_moderation(struct sdp_sock * ssk)1681aa0a1e58SJeff Roberson sdp_set_default_moderation(struct sdp_sock *ssk)
1682aa0a1e58SJeff Roberson {
1683aa0a1e58SJeff Roberson 	if (sdp_mod_count <= 0 || sdp_mod_usec <= 0)
1684aa0a1e58SJeff Roberson 		return;
1685c69c74b8SHans Petter Selasky 	ib_modify_cq(ssk->rx_ring.cq, sdp_mod_count, sdp_mod_usec);
16868a8f7d5bSHans Petter Selasky }
1687aa0a1e58SJeff Roberson 
1688aa0a1e58SJeff Roberson static void
sdp_dev_add(struct ib_device * device)1689aa0a1e58SJeff Roberson sdp_dev_add(struct ib_device *device)
1690aa0a1e58SJeff Roberson {
1691aa0a1e58SJeff Roberson 	struct ib_fmr_pool_param param;
1692aa0a1e58SJeff Roberson 	struct sdp_device *sdp_dev;
1693aa0a1e58SJeff Roberson 
1694aa0a1e58SJeff Roberson 	sdp_dev = malloc(sizeof(*sdp_dev), M_SDP, M_WAITOK | M_ZERO);
1695c69c74b8SHans Petter Selasky 	sdp_dev->pd = ib_alloc_pd(device, 0);
1696aa0a1e58SJeff Roberson 	if (IS_ERR(sdp_dev->pd))
1697aa0a1e58SJeff Roberson 		goto out_pd;
1698aa0a1e58SJeff Roberson 	memset(&param, 0, sizeof param);
1699aa0a1e58SJeff Roberson 	param.max_pages_per_fmr = SDP_FMR_SIZE;
1700aa0a1e58SJeff Roberson 	param.page_shift = PAGE_SHIFT;
1701aa0a1e58SJeff Roberson 	param.access = (IB_ACCESS_LOCAL_WRITE | IB_ACCESS_REMOTE_READ);
1702aa0a1e58SJeff Roberson 	param.pool_size = SDP_FMR_POOL_SIZE;
1703aa0a1e58SJeff Roberson 	param.dirty_watermark = SDP_FMR_DIRTY_SIZE;
1704aa0a1e58SJeff Roberson 	param.cache = 1;
1705aa0a1e58SJeff Roberson 	sdp_dev->fmr_pool = ib_create_fmr_pool(sdp_dev->pd, &param);
1706aa0a1e58SJeff Roberson 	if (IS_ERR(sdp_dev->fmr_pool))
1707aa0a1e58SJeff Roberson 		goto out_fmr;
1708aa0a1e58SJeff Roberson 	ib_set_client_data(device, &sdp_client, sdp_dev);
1709aa0a1e58SJeff Roberson 	return;
1710aa0a1e58SJeff Roberson 
1711aa0a1e58SJeff Roberson out_fmr:
1712aa0a1e58SJeff Roberson 	ib_dealloc_pd(sdp_dev->pd);
1713aa0a1e58SJeff Roberson out_pd:
1714aa0a1e58SJeff Roberson 	free(sdp_dev, M_SDP);
1715aa0a1e58SJeff Roberson }
1716aa0a1e58SJeff Roberson 
1717aa0a1e58SJeff Roberson static void
sdp_dev_rem(struct ib_device * device,void * client_data)1718c69c74b8SHans Petter Selasky sdp_dev_rem(struct ib_device *device, void *client_data)
1719aa0a1e58SJeff Roberson {
1720aa0a1e58SJeff Roberson 	struct sdp_device *sdp_dev;
1721aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
1722aa0a1e58SJeff Roberson 
1723aa0a1e58SJeff Roberson 	SDP_LIST_WLOCK();
1724aa0a1e58SJeff Roberson 	LIST_FOREACH(ssk, &sdp_list, list) {
1725aa0a1e58SJeff Roberson 		if (ssk->ib_device != device)
1726aa0a1e58SJeff Roberson 			continue;
1727aa0a1e58SJeff Roberson 		SDP_WLOCK(ssk);
1728aa0a1e58SJeff Roberson 		if ((ssk->flags & SDP_DESTROY) == 0)
1729aa0a1e58SJeff Roberson 			ssk = sdp_notify(ssk, ECONNRESET);
1730aa0a1e58SJeff Roberson 		if (ssk)
1731aa0a1e58SJeff Roberson 			SDP_WUNLOCK(ssk);
1732aa0a1e58SJeff Roberson 	}
1733aa0a1e58SJeff Roberson 	SDP_LIST_WUNLOCK();
1734aa0a1e58SJeff Roberson 	/*
1735aa0a1e58SJeff Roberson 	 * XXX Do I need to wait between these two?
1736aa0a1e58SJeff Roberson 	 */
1737aa0a1e58SJeff Roberson 	sdp_dev = ib_get_client_data(device, &sdp_client);
1738aa0a1e58SJeff Roberson 	if (!sdp_dev)
1739aa0a1e58SJeff Roberson 		return;
1740aa0a1e58SJeff Roberson 	ib_flush_fmr_pool(sdp_dev->fmr_pool);
1741aa0a1e58SJeff Roberson 	ib_destroy_fmr_pool(sdp_dev->fmr_pool);
1742aa0a1e58SJeff Roberson 	ib_dealloc_pd(sdp_dev->pd);
1743aa0a1e58SJeff Roberson 	free(sdp_dev, M_SDP);
1744aa0a1e58SJeff Roberson }
1745aa0a1e58SJeff Roberson 
1746aa0a1e58SJeff Roberson struct ib_client sdp_client =
1747aa0a1e58SJeff Roberson     { .name = "sdp", .add = sdp_dev_add, .remove = sdp_dev_rem };
1748aa0a1e58SJeff Roberson 
1749aa0a1e58SJeff Roberson 
1750aa0a1e58SJeff Roberson static int
sdp_pcblist(SYSCTL_HANDLER_ARGS)1751aa0a1e58SJeff Roberson sdp_pcblist(SYSCTL_HANDLER_ARGS)
1752aa0a1e58SJeff Roberson {
1753aa0a1e58SJeff Roberson 	int error, n, i;
1754aa0a1e58SJeff Roberson 	struct sdp_sock *ssk;
1755aa0a1e58SJeff Roberson 	struct xinpgen xig;
1756aa0a1e58SJeff Roberson 
1757aa0a1e58SJeff Roberson 	/*
1758aa0a1e58SJeff Roberson 	 * The process of preparing the TCB list is too time-consuming and
1759aa0a1e58SJeff Roberson 	 * resource-intensive to repeat twice on every request.
1760aa0a1e58SJeff Roberson 	 */
1761aa0a1e58SJeff Roberson 	if (req->oldptr == NULL) {
1762aa0a1e58SJeff Roberson 		n = sdp_count;
1763aa0a1e58SJeff Roberson 		n += imax(n / 8, 10);
1764aa0a1e58SJeff Roberson 		req->oldidx = 2 * (sizeof xig) + n * sizeof(struct xtcpcb);
1765aa0a1e58SJeff Roberson 		return (0);
1766aa0a1e58SJeff Roberson 	}
1767aa0a1e58SJeff Roberson 
1768aa0a1e58SJeff Roberson 	if (req->newptr != NULL)
1769aa0a1e58SJeff Roberson 		return (EPERM);
1770aa0a1e58SJeff Roberson 
1771aa0a1e58SJeff Roberson 	/*
1772aa0a1e58SJeff Roberson 	 * OK, now we're committed to doing something.
1773aa0a1e58SJeff Roberson 	 */
1774aa0a1e58SJeff Roberson 	SDP_LIST_RLOCK();
1775aa0a1e58SJeff Roberson 	n = sdp_count;
1776aa0a1e58SJeff Roberson 	SDP_LIST_RUNLOCK();
1777aa0a1e58SJeff Roberson 
1778aa0a1e58SJeff Roberson 	error = sysctl_wire_old_buffer(req, 2 * (sizeof xig)
1779aa0a1e58SJeff Roberson 		+ n * sizeof(struct xtcpcb));
1780aa0a1e58SJeff Roberson 	if (error != 0)
1781aa0a1e58SJeff Roberson 		return (error);
1782aa0a1e58SJeff Roberson 
178379db6fe7SMark Johnston 	bzero(&xig, sizeof(xig));
1784aa0a1e58SJeff Roberson 	xig.xig_len = sizeof xig;
1785aa0a1e58SJeff Roberson 	xig.xig_count = n;
1786aa0a1e58SJeff Roberson 	xig.xig_gen = 0;
1787aa0a1e58SJeff Roberson 	xig.xig_sogen = so_gencnt;
1788aa0a1e58SJeff Roberson 	error = SYSCTL_OUT(req, &xig, sizeof xig);
1789aa0a1e58SJeff Roberson 	if (error)
1790aa0a1e58SJeff Roberson 		return (error);
1791aa0a1e58SJeff Roberson 
1792aa0a1e58SJeff Roberson 	SDP_LIST_RLOCK();
1793aa0a1e58SJeff Roberson 	for (ssk = LIST_FIRST(&sdp_list), i = 0;
1794aa0a1e58SJeff Roberson 	    ssk != NULL && i < n; ssk = LIST_NEXT(ssk, list)) {
1795aa0a1e58SJeff Roberson 		struct xtcpcb xt;
1796aa0a1e58SJeff Roberson 
1797aa0a1e58SJeff Roberson 		SDP_RLOCK(ssk);
1798aa0a1e58SJeff Roberson 		if (ssk->flags & SDP_TIMEWAIT) {
1799aa0a1e58SJeff Roberson 			if (ssk->cred != NULL)
1800aa0a1e58SJeff Roberson 				error = cr_cansee(req->td->td_ucred,
1801aa0a1e58SJeff Roberson 				    ssk->cred);
1802aa0a1e58SJeff Roberson 			else
1803aa0a1e58SJeff Roberson 				error = EINVAL;	/* Skip this inp. */
1804aa0a1e58SJeff Roberson 		} else if (ssk->socket)
1805aa0a1e58SJeff Roberson 			error = cr_canseesocket(req->td->td_ucred,
1806aa0a1e58SJeff Roberson 			    ssk->socket);
1807aa0a1e58SJeff Roberson 		else
1808aa0a1e58SJeff Roberson 			error = EINVAL;
1809aa0a1e58SJeff Roberson 		if (error) {
1810aa0a1e58SJeff Roberson 			error = 0;
1811aa0a1e58SJeff Roberson 			goto next;
1812aa0a1e58SJeff Roberson 		}
1813aa0a1e58SJeff Roberson 
1814aa0a1e58SJeff Roberson 		bzero(&xt, sizeof(xt));
1815aa0a1e58SJeff Roberson 		xt.xt_len = sizeof xt;
1816aa0a1e58SJeff Roberson 		xt.xt_inp.inp_gencnt = 0;
1817aa0a1e58SJeff Roberson 		xt.xt_inp.inp_vflag = INP_IPV4;
1818aa0a1e58SJeff Roberson 		memcpy(&xt.xt_inp.inp_laddr, &ssk->laddr, sizeof(ssk->laddr));
1819aa0a1e58SJeff Roberson 		xt.xt_inp.inp_lport = ssk->lport;
1820aa0a1e58SJeff Roberson 		memcpy(&xt.xt_inp.inp_faddr, &ssk->faddr, sizeof(ssk->faddr));
1821aa0a1e58SJeff Roberson 		xt.xt_inp.inp_fport = ssk->fport;
1822817e1ad9SGleb Smirnoff 		xt.t_state = ssk->state;
1823aa0a1e58SJeff Roberson 		if (ssk->socket != NULL)
1824817e1ad9SGleb Smirnoff 			sotoxsocket(ssk->socket, &xt.xt_inp.xi_socket);
1825817e1ad9SGleb Smirnoff 		xt.xt_inp.xi_socket.xso_protocol = IPPROTO_TCP;
1826aa0a1e58SJeff Roberson 		SDP_RUNLOCK(ssk);
1827aa0a1e58SJeff Roberson 		error = SYSCTL_OUT(req, &xt, sizeof xt);
1828aa0a1e58SJeff Roberson 		if (error)
1829aa0a1e58SJeff Roberson 			break;
1830aa0a1e58SJeff Roberson 		i++;
1831aa0a1e58SJeff Roberson 		continue;
1832aa0a1e58SJeff Roberson next:
1833aa0a1e58SJeff Roberson 		SDP_RUNLOCK(ssk);
1834aa0a1e58SJeff Roberson 	}
1835aa0a1e58SJeff Roberson 	if (!error) {
1836aa0a1e58SJeff Roberson 		/*
1837aa0a1e58SJeff Roberson 		 * Give the user an updated idea of our state.
1838aa0a1e58SJeff Roberson 		 * If the generation differs from what we told
1839aa0a1e58SJeff Roberson 		 * her before, she knows that something happened
1840aa0a1e58SJeff Roberson 		 * while we were processing this request, and it
1841aa0a1e58SJeff Roberson 		 * might be necessary to retry.
1842aa0a1e58SJeff Roberson 		 */
1843aa0a1e58SJeff Roberson 		xig.xig_gen = 0;
1844aa0a1e58SJeff Roberson 		xig.xig_sogen = so_gencnt;
1845aa0a1e58SJeff Roberson 		xig.xig_count = sdp_count;
1846aa0a1e58SJeff Roberson 		error = SYSCTL_OUT(req, &xig, sizeof xig);
1847aa0a1e58SJeff Roberson 	}
1848aa0a1e58SJeff Roberson 	SDP_LIST_RUNLOCK();
1849aa0a1e58SJeff Roberson 	return (error);
1850aa0a1e58SJeff Roberson }
1851aa0a1e58SJeff Roberson 
18527029da5cSPawel Biernacki SYSCTL_NODE(_net_inet, -1, sdp, CTLFLAG_RW | CTLFLAG_MPSAFE, 0,
18537029da5cSPawel Biernacki     "SDP");
1854aa0a1e58SJeff Roberson 
1855aa0a1e58SJeff Roberson SYSCTL_PROC(_net_inet_sdp, TCPCTL_PCBLIST, pcblist,
18567029da5cSPawel Biernacki     CTLFLAG_RD | CTLTYPE_STRUCT | CTLFLAG_MPSAFE,
18577029da5cSPawel Biernacki     0, 0, sdp_pcblist, "S,xtcpcb",
1858aa0a1e58SJeff Roberson     "List of active SDP connections");
1859aa0a1e58SJeff Roberson 
1860aa0a1e58SJeff Roberson static void
sdp_zone_change(void * tag)1861aa0a1e58SJeff Roberson sdp_zone_change(void *tag)
1862aa0a1e58SJeff Roberson {
1863aa0a1e58SJeff Roberson 
1864aa0a1e58SJeff Roberson 	uma_zone_set_max(sdp_zone, maxsockets);
1865aa0a1e58SJeff Roberson }
1866aa0a1e58SJeff Roberson 
1867aa0a1e58SJeff Roberson static void
sdp_init(void * arg __unused)186824e1c6aeSGleb Smirnoff sdp_init(void *arg __unused)
1869aa0a1e58SJeff Roberson {
1870aa0a1e58SJeff Roberson 
1871aa0a1e58SJeff Roberson 	LIST_INIT(&sdp_list);
1872aa0a1e58SJeff Roberson 	sdp_zone = uma_zcreate("sdp_sock", sizeof(struct sdp_sock),
1873aa0a1e58SJeff Roberson 	    NULL, NULL, NULL, NULL, UMA_ALIGN_PTR, UMA_ZONE_NOFREE);
1874aa0a1e58SJeff Roberson 	uma_zone_set_max(sdp_zone, maxsockets);
1875aa0a1e58SJeff Roberson 	EVENTHANDLER_REGISTER(maxsockets_change, sdp_zone_change, NULL,
1876aa0a1e58SJeff Roberson 		EVENTHANDLER_PRI_ANY);
1877aa0a1e58SJeff Roberson 	rx_comp_wq = create_singlethread_workqueue("rx_comp_wq");
1878aa0a1e58SJeff Roberson 	ib_register_client(&sdp_client);
1879aa0a1e58SJeff Roberson }
188024e1c6aeSGleb Smirnoff SYSINIT(sdp_init, SI_SUB_PROTO_DOMAIN, SI_ORDER_SECOND, sdp_init, NULL);
1881aa0a1e58SJeff Roberson 
1882e7d02be1SGleb Smirnoff #define	SDP_PROTOSW							\
1883e7d02be1SGleb Smirnoff 	.pr_type =		SOCK_STREAM,				\
1884e7d02be1SGleb Smirnoff 	.pr_flags =		PR_CONNREQUIRED|PR_IMPLOPCL|PR_WANTRCVD,\
1885e7d02be1SGleb Smirnoff 	.pr_ctloutput =		sdp_ctloutput,				\
1886e7d02be1SGleb Smirnoff 	.pr_abort =		sdp_abort,				\
1887e7d02be1SGleb Smirnoff 	.pr_accept =		sdp_accept,				\
1888e7d02be1SGleb Smirnoff 	.pr_attach =		sdp_attach,				\
1889e7d02be1SGleb Smirnoff 	.pr_bind =		sdp_bind,				\
1890e7d02be1SGleb Smirnoff 	.pr_connect =		sdp_connect,				\
1891e7d02be1SGleb Smirnoff 	.pr_detach =		sdp_detach,				\
1892e7d02be1SGleb Smirnoff 	.pr_disconnect =	sdp_disconnect,				\
1893e7d02be1SGleb Smirnoff 	.pr_listen =		sdp_listen,				\
1894e7d02be1SGleb Smirnoff 	.pr_peeraddr =		sdp_getpeeraddr,			\
1895e7d02be1SGleb Smirnoff 	.pr_rcvoob =		sdp_rcvoob,				\
1896e7d02be1SGleb Smirnoff 	.pr_send =		sdp_send,				\
1897e7d02be1SGleb Smirnoff 	.pr_sosend =		sdp_sosend,				\
1898e7d02be1SGleb Smirnoff 	.pr_soreceive =		sdp_sorecv,				\
1899e7d02be1SGleb Smirnoff 	.pr_shutdown =		sdp_shutdown,				\
1900e7d02be1SGleb Smirnoff 	.pr_sockaddr =		sdp_getsockaddr,			\
1901e7d02be1SGleb Smirnoff 	.pr_close =		sdp_close
1902aa0a1e58SJeff Roberson 
1903aa0a1e58SJeff Roberson 
1904e7d02be1SGleb Smirnoff static struct protosw sdp_ip_protosw = {
1905aa0a1e58SJeff Roberson 	.pr_protocol =		IPPROTO_IP,
1906e7d02be1SGleb Smirnoff 	SDP_PROTOSW
1907e7d02be1SGleb Smirnoff };
1908e7d02be1SGleb Smirnoff static struct protosw sdp_tcp_protosw = {
1909aa0a1e58SJeff Roberson 	.pr_protocol =		IPPROTO_TCP,
1910e7d02be1SGleb Smirnoff 	SDP_PROTOSW
1911aa0a1e58SJeff Roberson };
1912aa0a1e58SJeff Roberson 
1913e7d02be1SGleb Smirnoff static struct domain sdpdomain = {
1914aa0a1e58SJeff Roberson 	.dom_family =		AF_INET_SDP,
1915aa0a1e58SJeff Roberson 	.dom_name =		"SDP",
1916e7d02be1SGleb Smirnoff 	.dom_nprotosw =		2,
1917e7d02be1SGleb Smirnoff 	.dom_protosw = {
1918e7d02be1SGleb Smirnoff 		&sdp_ip_protosw,
1919e7d02be1SGleb Smirnoff 		&sdp_tcp_protosw,
1920e7d02be1SGleb Smirnoff 	},
1921aa0a1e58SJeff Roberson };
1922aa0a1e58SJeff Roberson 
1923aa0a1e58SJeff Roberson DOMAIN_SET(sdp);
1924aa0a1e58SJeff Roberson 
1925aa0a1e58SJeff Roberson int sdp_debug_level = 1;
1926aa0a1e58SJeff Roberson int sdp_data_debug_level = 0;
1927