clnt_vc.c revision 213756
1177633Sdfr/*	$NetBSD: clnt_vc.c,v 1.4 2000/07/14 08:40:42 fvdl Exp $	*/
2177633Sdfr
3177633Sdfr/*
4177633Sdfr * Sun RPC is a product of Sun Microsystems, Inc. and is provided for
5177633Sdfr * unrestricted use provided that this legend is included on all tape
6177633Sdfr * media and as a part of the software program in whole or part.  Users
7177633Sdfr * may copy or modify Sun RPC without charge, but are not authorized
8177633Sdfr * to license or distribute it to anyone else except as part of a product or
9177633Sdfr * program developed by the user.
10177633Sdfr *
11177633Sdfr * SUN RPC IS PROVIDED AS IS WITH NO WARRANTIES OF ANY KIND INCLUDING THE
12177633Sdfr * WARRANTIES OF DESIGN, MERCHANTIBILITY AND FITNESS FOR A PARTICULAR
13177633Sdfr * PURPOSE, OR ARISING FROM A COURSE OF DEALING, USAGE OR TRADE PRACTICE.
14177633Sdfr *
15177633Sdfr * Sun RPC is provided with no support and without any obligation on the
16177633Sdfr * part of Sun Microsystems, Inc. to assist in its use, correction,
17177633Sdfr * modification or enhancement.
18177633Sdfr *
19177633Sdfr * SUN MICROSYSTEMS, INC. SHALL HAVE NO LIABILITY WITH RESPECT TO THE
20177633Sdfr * INFRINGEMENT OF COPYRIGHTS, TRADE SECRETS OR ANY PATENTS BY SUN RPC
21177633Sdfr * OR ANY PART THEREOF.
22177633Sdfr *
23177633Sdfr * In no event will Sun Microsystems, Inc. be liable for any lost revenue
24177633Sdfr * or profits or other special, indirect and consequential damages, even if
25177633Sdfr * Sun has been advised of the possibility of such damages.
26177633Sdfr *
27177633Sdfr * Sun Microsystems, Inc.
28177633Sdfr * 2550 Garcia Avenue
29177633Sdfr * Mountain View, California  94043
30177633Sdfr */
31177633Sdfr
32177633Sdfr#if defined(LIBC_SCCS) && !defined(lint)
33177633Sdfrstatic char *sccsid2 = "@(#)clnt_tcp.c 1.37 87/10/05 Copyr 1984 Sun Micro";
34177633Sdfrstatic char *sccsid = "@(#)clnt_tcp.c	2.2 88/08/01 4.0 RPCSRC";
35177633Sdfrstatic char sccsid3[] = "@(#)clnt_vc.c 1.19 89/03/16 Copyr 1988 Sun Micro";
36177633Sdfr#endif
37177633Sdfr#include <sys/cdefs.h>
38177633Sdfr__FBSDID("$FreeBSD: head/sys/rpc/clnt_vc.c 213756 2010-10-13 00:57:14Z rmacklem $");
39177633Sdfr
40177633Sdfr/*
41177633Sdfr * clnt_tcp.c, Implements a TCP/IP based, client side RPC.
42177633Sdfr *
43177633Sdfr * Copyright (C) 1984, Sun Microsystems, Inc.
44177633Sdfr *
45177633Sdfr * TCP based RPC supports 'batched calls'.
 * A sequence of calls may be batched-up in a send buffer.  The rpc call
 * returns immediately to the client even though the call was not necessarily
48177633Sdfr * sent.  The batching occurs if the results' xdr routine is NULL (0) AND
49177633Sdfr * the rpc timeout value is zero (see clnt.h, rpc).
50177633Sdfr *
51177633Sdfr * Clients should NOT casually batch calls that in fact return results; that is,
52177633Sdfr * the server side should be aware that a call is batched and not produce any
53177633Sdfr * return message.  Batched calls that produce many result messages can
54177633Sdfr * deadlock (netlock) the client and the server....
55177633Sdfr *
56177633Sdfr * Now go hang yourself.
57177633Sdfr */
58177633Sdfr
59177633Sdfr#include <sys/param.h>
60177633Sdfr#include <sys/systm.h>
61177633Sdfr#include <sys/lock.h>
62177633Sdfr#include <sys/malloc.h>
63177633Sdfr#include <sys/mbuf.h>
64177633Sdfr#include <sys/mutex.h>
65177633Sdfr#include <sys/pcpu.h>
66177633Sdfr#include <sys/proc.h>
67184588Sdfr#include <sys/protosw.h>
68177633Sdfr#include <sys/socket.h>
69177633Sdfr#include <sys/socketvar.h>
70177633Sdfr#include <sys/syslog.h>
71177633Sdfr#include <sys/time.h>
72177633Sdfr#include <sys/uio.h>
73196503Szec
74196503Szec#include <net/vnet.h>
75196503Szec
76184588Sdfr#include <netinet/tcp.h>
77177633Sdfr
78177633Sdfr#include <rpc/rpc.h>
79177685Sdfr#include <rpc/rpc_com.h>
80177633Sdfr
81177633Sdfr#define MCALL_MSG_SIZE 24
82177633Sdfr
83177633Sdfrstruct cmessage {
84177633Sdfr        struct cmsghdr cmsg;
85177633Sdfr        struct cmsgcred cmcred;
86177633Sdfr};
87177633Sdfr
88180025Sdfrstatic enum clnt_stat clnt_vc_call(CLIENT *, struct rpc_callextra *,
89184588Sdfr    rpcproc_t, struct mbuf *, struct mbuf **, struct timeval);
90177633Sdfrstatic void clnt_vc_geterr(CLIENT *, struct rpc_err *);
91177633Sdfrstatic bool_t clnt_vc_freeres(CLIENT *, xdrproc_t, void *);
92177633Sdfrstatic void clnt_vc_abort(CLIENT *);
93177633Sdfrstatic bool_t clnt_vc_control(CLIENT *, u_int, void *);
94184588Sdfrstatic void clnt_vc_close(CLIENT *);
95177633Sdfrstatic void clnt_vc_destroy(CLIENT *);
96177633Sdfrstatic bool_t time_not_ok(struct timeval *);
97193272Sjhbstatic int clnt_vc_soupcall(struct socket *so, void *arg, int waitflag);
98177633Sdfr
99177633Sdfrstatic struct clnt_ops clnt_vc_ops = {
100177633Sdfr	.cl_call =	clnt_vc_call,
101177633Sdfr	.cl_abort =	clnt_vc_abort,
102177633Sdfr	.cl_geterr =	clnt_vc_geterr,
103177633Sdfr	.cl_freeres =	clnt_vc_freeres,
104184588Sdfr	.cl_close =	clnt_vc_close,
105177633Sdfr	.cl_destroy =	clnt_vc_destroy,
106177633Sdfr	.cl_control =	clnt_vc_control
107177633Sdfr};
108177633Sdfr
109177633Sdfr/*
110180025Sdfr * A pending RPC request which awaits a reply. Requests which have
111180025Sdfr * received their reply will have cr_xid set to zero and cr_mrep to
112180025Sdfr * the mbuf chain of the reply.
113177633Sdfr */
114177633Sdfrstruct ct_request {
115177633Sdfr	TAILQ_ENTRY(ct_request) cr_link;
116177633Sdfr	uint32_t		cr_xid;		/* XID of request */
117177633Sdfr	struct mbuf		*cr_mrep;	/* reply received by upcall */
118177633Sdfr	int			cr_error;	/* any error from upcall */
119184588Sdfr	char			cr_verf[MAX_AUTH_BYTES]; /* reply verf */
120177633Sdfr};
121177633Sdfr
122177633SdfrTAILQ_HEAD(ct_request_list, ct_request);
123177633Sdfr
124177633Sdfrstruct ct_data {
125177633Sdfr	struct mtx	ct_lock;
126180025Sdfr	int		ct_threads;	/* number of threads in clnt_vc_call */
127184588Sdfr	bool_t		ct_closing;	/* TRUE if we are closing */
128184588Sdfr	bool_t		ct_closed;	/* TRUE if we are closed */
129177633Sdfr	struct socket	*ct_socket;	/* connection socket */
130177633Sdfr	bool_t		ct_closeit;	/* close it on destroy */
131177633Sdfr	struct timeval	ct_wait;	/* wait interval in milliseconds */
132177633Sdfr	struct sockaddr_storage	ct_addr; /* remote addr */
133177633Sdfr	struct rpc_err	ct_error;
134177633Sdfr	uint32_t	ct_xid;
135177633Sdfr	char		ct_mcallc[MCALL_MSG_SIZE]; /* marshalled callmsg */
136177633Sdfr	size_t		ct_mpos;	/* pos after marshal */
137177633Sdfr	const char	*ct_waitchan;
138177633Sdfr	int		ct_waitflag;
139177633Sdfr	struct mbuf	*ct_record;	/* current reply record */
140177633Sdfr	size_t		ct_record_resid; /* how much left of reply to read */
141177633Sdfr	bool_t		ct_record_eor;	 /* true if reading last fragment */
142177633Sdfr	struct ct_request_list ct_pending;
143193437Srmacklem	int		ct_upcallrefs;	/* Ref cnt of upcalls in prog. */
144177633Sdfr};
145177633Sdfr
/* Forward declaration; called from clnt_vc_close() with the so_rcv lock held. */
static void clnt_vc_upcallsdone(struct ct_data *ct);
147193437Srmacklem
/* Message fragments shared by this file's diagnostics. */
static const char clnt_vc_errstr[] = "%s : %s";		/* "<who> : <what>" */
static const char clnt_vc_str[] = "clnt_vc_create";
static const char clnt_read_vc_str[] = "read_vc";
static const char __no_mem_str[] = "out of memory";
152177633Sdfr
153177633Sdfr/*
154177633Sdfr * Create a client handle for a connection.
155177633Sdfr * Default options are set, which the user can change using clnt_control()'s.
156177633Sdfr * The rpc/vc package does buffering similar to stdio, so the client
157177633Sdfr * must pick send and receive buffer sizes, 0 => use the default.
158177633Sdfr * NB: fd is copied into a private area.
159177633Sdfr * NB: The rpch->cl_auth is set null authentication. Caller may wish to
160177633Sdfr * set this something more useful.
161177633Sdfr *
162177633Sdfr * fd should be an open socket
163177633Sdfr */
164177633SdfrCLIENT *
165177633Sdfrclnt_vc_create(
166177633Sdfr	struct socket *so,		/* open file descriptor */
167177633Sdfr	struct sockaddr *raddr,		/* servers address */
168177633Sdfr	const rpcprog_t prog,		/* program number */
169177633Sdfr	const rpcvers_t vers,		/* version number */
170177633Sdfr	size_t sendsz,			/* buffer recv size */
171177633Sdfr	size_t recvsz)			/* buffer send size */
172177633Sdfr{
173177633Sdfr	CLIENT *cl;			/* client handle */
174177633Sdfr	struct ct_data *ct = NULL;	/* client handle */
175177633Sdfr	struct timeval now;
176177633Sdfr	struct rpc_msg call_msg;
177177633Sdfr	static uint32_t disrupt;
178177633Sdfr	struct __rpc_sockinfo si;
179177633Sdfr	XDR xdrs;
180184588Sdfr	int error, interrupted, one = 1;
181184588Sdfr	struct sockopt sopt;
182177633Sdfr
183177633Sdfr	if (disrupt == 0)
184177633Sdfr		disrupt = (uint32_t)(long)raddr;
185177633Sdfr
186177633Sdfr	cl = (CLIENT *)mem_alloc(sizeof (*cl));
187177633Sdfr	ct = (struct ct_data *)mem_alloc(sizeof (*ct));
188177633Sdfr
189177633Sdfr	mtx_init(&ct->ct_lock, "ct->ct_lock", NULL, MTX_DEF);
190180025Sdfr	ct->ct_threads = 0;
191180025Sdfr	ct->ct_closing = FALSE;
192184588Sdfr	ct->ct_closed = FALSE;
193193437Srmacklem	ct->ct_upcallrefs = 0;
194177633Sdfr
195177633Sdfr	if ((so->so_state & (SS_ISCONNECTED|SS_ISCONFIRMING)) == 0) {
196177633Sdfr		error = soconnect(so, raddr, curthread);
197180025Sdfr		SOCK_LOCK(so);
198180025Sdfr		interrupted = 0;
199180025Sdfr		while ((so->so_state & SS_ISCONNECTING)
200180025Sdfr		    && so->so_error == 0) {
201180025Sdfr			error = msleep(&so->so_timeo, SOCK_MTX(so),
202195703Skib			    PSOCK | PCATCH | PBDRY, "connec", 0);
203180025Sdfr			if (error) {
204180025Sdfr				if (error == EINTR || error == ERESTART)
205180025Sdfr					interrupted = 1;
206180025Sdfr				break;
207180025Sdfr			}
208180025Sdfr		}
209180025Sdfr		if (error == 0) {
210180025Sdfr			error = so->so_error;
211180025Sdfr			so->so_error = 0;
212180025Sdfr		}
213180025Sdfr		SOCK_UNLOCK(so);
214177633Sdfr		if (error) {
215180025Sdfr			if (!interrupted)
216180025Sdfr				so->so_state &= ~SS_ISCONNECTING;
217177633Sdfr			rpc_createerr.cf_stat = RPC_SYSTEMERROR;
218177633Sdfr			rpc_createerr.cf_error.re_errno = error;
219177633Sdfr			goto err;
220177633Sdfr		}
221177633Sdfr	}
222177633Sdfr
223196503Szec	CURVNET_SET(so->so_vnet);
224196503Szec	if (!__rpc_socket2sockinfo(so, &si)) {
225196503Szec		CURVNET_RESTORE();
226177633Sdfr		goto err;
227196503Szec	}
228177633Sdfr
229184588Sdfr	if (so->so_proto->pr_flags & PR_CONNREQUIRED) {
230184588Sdfr		bzero(&sopt, sizeof(sopt));
231184588Sdfr		sopt.sopt_dir = SOPT_SET;
232184588Sdfr		sopt.sopt_level = SOL_SOCKET;
233184588Sdfr		sopt.sopt_name = SO_KEEPALIVE;
234184588Sdfr		sopt.sopt_val = &one;
235184588Sdfr		sopt.sopt_valsize = sizeof(one);
236184588Sdfr		sosetopt(so, &sopt);
237184588Sdfr	}
238184588Sdfr
239184588Sdfr	if (so->so_proto->pr_protocol == IPPROTO_TCP) {
240184588Sdfr		bzero(&sopt, sizeof(sopt));
241184588Sdfr		sopt.sopt_dir = SOPT_SET;
242184588Sdfr		sopt.sopt_level = IPPROTO_TCP;
243184588Sdfr		sopt.sopt_name = TCP_NODELAY;
244184588Sdfr		sopt.sopt_val = &one;
245184588Sdfr		sopt.sopt_valsize = sizeof(one);
246184588Sdfr		sosetopt(so, &sopt);
247184588Sdfr	}
248196503Szec	CURVNET_RESTORE();
249184588Sdfr
250177633Sdfr	ct->ct_closeit = FALSE;
251177633Sdfr
252177633Sdfr	/*
253177633Sdfr	 * Set up private data struct
254177633Sdfr	 */
255177633Sdfr	ct->ct_socket = so;
256177633Sdfr	ct->ct_wait.tv_sec = -1;
257177633Sdfr	ct->ct_wait.tv_usec = -1;
258177633Sdfr	memcpy(&ct->ct_addr, raddr, raddr->sa_len);
259177633Sdfr
260177633Sdfr	/*
261177633Sdfr	 * Initialize call message
262177633Sdfr	 */
263177633Sdfr	getmicrotime(&now);
264177633Sdfr	ct->ct_xid = ((uint32_t)++disrupt) ^ __RPC_GETXID(&now);
265177633Sdfr	call_msg.rm_xid = ct->ct_xid;
266177633Sdfr	call_msg.rm_direction = CALL;
267177633Sdfr	call_msg.rm_call.cb_rpcvers = RPC_MSG_VERSION;
268177633Sdfr	call_msg.rm_call.cb_prog = (uint32_t)prog;
269177633Sdfr	call_msg.rm_call.cb_vers = (uint32_t)vers;
270177633Sdfr
271177633Sdfr	/*
272177633Sdfr	 * pre-serialize the static part of the call msg and stash it away
273177633Sdfr	 */
274177633Sdfr	xdrmem_create(&xdrs, ct->ct_mcallc, MCALL_MSG_SIZE,
275177633Sdfr	    XDR_ENCODE);
276177633Sdfr	if (! xdr_callhdr(&xdrs, &call_msg)) {
277177633Sdfr		if (ct->ct_closeit) {
278177633Sdfr			soclose(ct->ct_socket);
279177633Sdfr		}
280177633Sdfr		goto err;
281177633Sdfr	}
282177633Sdfr	ct->ct_mpos = XDR_GETPOS(&xdrs);
283177633Sdfr	XDR_DESTROY(&xdrs);
284177633Sdfr	ct->ct_waitchan = "rpcrecv";
285177633Sdfr	ct->ct_waitflag = 0;
286177633Sdfr
287177633Sdfr	/*
288177633Sdfr	 * Create a client handle which uses xdrrec for serialization
289177633Sdfr	 * and authnone for authentication.
290177633Sdfr	 */
291213756Srmacklem	sendsz = __rpc_get_t_size(si.si_af, si.si_proto, (int)sendsz);
292213756Srmacklem	recvsz = __rpc_get_t_size(si.si_af, si.si_proto, (int)recvsz);
293213756Srmacklem	error = soreserve(ct->ct_socket, sendsz, recvsz);
294213756Srmacklem	if (error != 0) {
295213756Srmacklem		if (ct->ct_closeit) {
296213756Srmacklem			soclose(ct->ct_socket);
297213756Srmacklem		}
298213756Srmacklem		goto err;
299213756Srmacklem	}
300180025Sdfr	cl->cl_refs = 1;
301177633Sdfr	cl->cl_ops = &clnt_vc_ops;
302177633Sdfr	cl->cl_private = ct;
303177633Sdfr	cl->cl_auth = authnone_create();
304177633Sdfr
305177633Sdfr	SOCKBUF_LOCK(&ct->ct_socket->so_rcv);
306193272Sjhb	soupcall_set(ct->ct_socket, SO_RCV, clnt_vc_soupcall, ct);
307177633Sdfr	SOCKBUF_UNLOCK(&ct->ct_socket->so_rcv);
308177633Sdfr
309177633Sdfr	ct->ct_record = NULL;
310177633Sdfr	ct->ct_record_resid = 0;
311177633Sdfr	TAILQ_INIT(&ct->ct_pending);
312177633Sdfr	return (cl);
313177633Sdfr
314177633Sdfrerr:
315177633Sdfr	if (cl) {
316177633Sdfr		if (ct) {
317184877Sdfr			mtx_destroy(&ct->ct_lock);
318177633Sdfr			mem_free(ct, sizeof (struct ct_data));
319177633Sdfr		}
320177633Sdfr		if (cl)
321177633Sdfr			mem_free(cl, sizeof (CLIENT));
322177633Sdfr	}
323177633Sdfr	return ((CLIENT *)NULL);
324177633Sdfr}
325177633Sdfr
326177633Sdfrstatic enum clnt_stat
327177633Sdfrclnt_vc_call(
328184588Sdfr	CLIENT		*cl,		/* client handle */
329184588Sdfr	struct rpc_callextra *ext,	/* call metadata */
330184588Sdfr	rpcproc_t	proc,		/* procedure number */
331184588Sdfr	struct mbuf	*args,		/* pointer to args */
332184588Sdfr	struct mbuf	**resultsp,	/* pointer to results */
333184588Sdfr	struct timeval	utimeout)
334177633Sdfr{
335177633Sdfr	struct ct_data *ct = (struct ct_data *) cl->cl_private;
336180025Sdfr	AUTH *auth;
337184588Sdfr	struct rpc_err *errp;
338184588Sdfr	enum clnt_stat stat;
339177633Sdfr	XDR xdrs;
340177633Sdfr	struct rpc_msg reply_msg;
341177633Sdfr	bool_t ok;
342177633Sdfr	int nrefreshes = 2;		/* number of times to refresh cred */
343177633Sdfr	struct timeval timeout;
344177633Sdfr	uint32_t xid;
345184588Sdfr	struct mbuf *mreq = NULL, *results;
346180025Sdfr	struct ct_request *cr;
347177633Sdfr	int error;
348177633Sdfr
349180025Sdfr	cr = malloc(sizeof(struct ct_request), M_RPC, M_WAITOK);
350180025Sdfr
351177633Sdfr	mtx_lock(&ct->ct_lock);
352177633Sdfr
353184588Sdfr	if (ct->ct_closing || ct->ct_closed) {
354180025Sdfr		mtx_unlock(&ct->ct_lock);
355180025Sdfr		free(cr, M_RPC);
356180025Sdfr		return (RPC_CANTSEND);
357180025Sdfr	}
358180025Sdfr	ct->ct_threads++;
359177633Sdfr
360184588Sdfr	if (ext) {
361180025Sdfr		auth = ext->rc_auth;
362184588Sdfr		errp = &ext->rc_err;
363184588Sdfr	} else {
364180025Sdfr		auth = cl->cl_auth;
365184588Sdfr		errp = &ct->ct_error;
366184588Sdfr	}
367180025Sdfr
368180025Sdfr	cr->cr_mrep = NULL;
369180025Sdfr	cr->cr_error = 0;
370180025Sdfr
371177633Sdfr	if (ct->ct_wait.tv_usec == -1) {
372177633Sdfr		timeout = utimeout;	/* use supplied timeout */
373177633Sdfr	} else {
374177633Sdfr		timeout = ct->ct_wait;	/* use default timeout */
375177633Sdfr	}
376177633Sdfr
377177633Sdfrcall_again:
378177633Sdfr	mtx_assert(&ct->ct_lock, MA_OWNED);
379177633Sdfr
380177633Sdfr	ct->ct_xid++;
381177633Sdfr	xid = ct->ct_xid;
382177633Sdfr
383177633Sdfr	mtx_unlock(&ct->ct_lock);
384177633Sdfr
385177633Sdfr	/*
386177633Sdfr	 * Leave space to pre-pend the record mark.
387177633Sdfr	 */
388177633Sdfr	MGETHDR(mreq, M_WAIT, MT_DATA);
389177633Sdfr	mreq->m_data += sizeof(uint32_t);
390184588Sdfr	KASSERT(ct->ct_mpos + sizeof(uint32_t) <= MHLEN,
391184588Sdfr	    ("RPC header too big"));
392184588Sdfr	bcopy(ct->ct_mcallc, mreq->m_data, ct->ct_mpos);
393184588Sdfr	mreq->m_len = ct->ct_mpos;
394177633Sdfr
395177633Sdfr	/*
396177633Sdfr	 * The XID is the first thing in the request.
397177633Sdfr	 */
398177633Sdfr	*mtod(mreq, uint32_t *) = htonl(xid);
399177633Sdfr
400177633Sdfr	xdrmbuf_create(&xdrs, mreq, XDR_ENCODE);
401177633Sdfr
402184588Sdfr	errp->re_status = stat = RPC_SUCCESS;
403177633Sdfr
404177633Sdfr	if ((! XDR_PUTINT32(&xdrs, &proc)) ||
405184588Sdfr	    (! AUTH_MARSHALL(auth, xid, &xdrs,
406184588Sdfr		m_copym(args, 0, M_COPYALL, M_WAITOK)))) {
407184588Sdfr		errp->re_status = stat = RPC_CANTENCODEARGS;
408180025Sdfr		mtx_lock(&ct->ct_lock);
409180025Sdfr		goto out;
410177633Sdfr	}
411184588Sdfr	mreq->m_pkthdr.len = m_length(mreq, NULL);
412177633Sdfr
413177633Sdfr	/*
414177633Sdfr	 * Prepend a record marker containing the packet length.
415177633Sdfr	 */
416177633Sdfr	M_PREPEND(mreq, sizeof(uint32_t), M_WAIT);
417177633Sdfr	*mtod(mreq, uint32_t *) =
418177633Sdfr		htonl(0x80000000 | (mreq->m_pkthdr.len - sizeof(uint32_t)));
419177633Sdfr
420180025Sdfr	cr->cr_xid = xid;
421177633Sdfr	mtx_lock(&ct->ct_lock);
422199053Srmacklem	/*
423199053Srmacklem	 * Check to see if the other end has already started to close down
424199053Srmacklem	 * the connection. The upcall will have set ct_error.re_status
425199053Srmacklem	 * to RPC_CANTRECV if this is the case.
426199053Srmacklem	 * If the other end starts to close down the connection after this
427199053Srmacklem	 * point, it will be detected later when cr_error is checked,
428199053Srmacklem	 * since the request is in the ct_pending queue.
429199053Srmacklem	 */
430199053Srmacklem	if (ct->ct_error.re_status == RPC_CANTRECV) {
431199053Srmacklem		if (errp != &ct->ct_error) {
432199053Srmacklem			errp->re_errno = ct->ct_error.re_errno;
433199053Srmacklem			errp->re_status = RPC_CANTRECV;
434199053Srmacklem		}
435199053Srmacklem		stat = RPC_CANTRECV;
436199053Srmacklem		goto out;
437199053Srmacklem	}
438180025Sdfr	TAILQ_INSERT_TAIL(&ct->ct_pending, cr, cr_link);
439177633Sdfr	mtx_unlock(&ct->ct_lock);
440177633Sdfr
441177633Sdfr	/*
442177633Sdfr	 * sosend consumes mreq.
443177633Sdfr	 */
444177633Sdfr	error = sosend(ct->ct_socket, NULL, NULL, mreq, NULL, 0, curthread);
445177633Sdfr	mreq = NULL;
446184588Sdfr	if (error == EMSGSIZE) {
447184588Sdfr		SOCKBUF_LOCK(&ct->ct_socket->so_snd);
448184588Sdfr		sbwait(&ct->ct_socket->so_snd);
449184588Sdfr		SOCKBUF_UNLOCK(&ct->ct_socket->so_snd);
450184588Sdfr		AUTH_VALIDATE(auth, xid, NULL, NULL);
451184588Sdfr		mtx_lock(&ct->ct_lock);
452184588Sdfr		TAILQ_REMOVE(&ct->ct_pending, cr, cr_link);
453184588Sdfr		goto call_again;
454184588Sdfr	}
455177633Sdfr
456184588Sdfr	reply_msg.acpted_rply.ar_verf.oa_flavor = AUTH_NULL;
457184588Sdfr	reply_msg.acpted_rply.ar_verf.oa_base = cr->cr_verf;
458184588Sdfr	reply_msg.acpted_rply.ar_verf.oa_length = 0;
459184588Sdfr	reply_msg.acpted_rply.ar_results.where = NULL;
460184588Sdfr	reply_msg.acpted_rply.ar_results.proc = (xdrproc_t)xdr_void;
461177633Sdfr
462177633Sdfr	mtx_lock(&ct->ct_lock);
463177633Sdfr	if (error) {
464180025Sdfr		TAILQ_REMOVE(&ct->ct_pending, cr, cr_link);
465184588Sdfr		errp->re_errno = error;
466184588Sdfr		errp->re_status = stat = RPC_CANTSEND;
467177633Sdfr		goto out;
468177633Sdfr	}
469177633Sdfr
470177633Sdfr	/*
471177633Sdfr	 * Check to see if we got an upcall while waiting for the
472177633Sdfr	 * lock. In both these cases, the request has been removed
473177633Sdfr	 * from ct->ct_pending.
474177633Sdfr	 */
475180025Sdfr	if (cr->cr_error) {
476180025Sdfr		TAILQ_REMOVE(&ct->ct_pending, cr, cr_link);
477184588Sdfr		errp->re_errno = cr->cr_error;
478184588Sdfr		errp->re_status = stat = RPC_CANTRECV;
479177633Sdfr		goto out;
480177633Sdfr	}
481180025Sdfr	if (cr->cr_mrep) {
482180025Sdfr		TAILQ_REMOVE(&ct->ct_pending, cr, cr_link);
483177633Sdfr		goto got_reply;
484177633Sdfr	}
485177633Sdfr
486177633Sdfr	/*
487177633Sdfr	 * Hack to provide rpc-based message passing
488177633Sdfr	 */
489177633Sdfr	if (timeout.tv_sec == 0 && timeout.tv_usec == 0) {
490180025Sdfr		TAILQ_REMOVE(&ct->ct_pending, cr, cr_link);
491184588Sdfr		errp->re_status = stat = RPC_TIMEDOUT;
492177633Sdfr		goto out;
493177633Sdfr	}
494177633Sdfr
495180025Sdfr	error = msleep(cr, &ct->ct_lock, ct->ct_waitflag, ct->ct_waitchan,
496177633Sdfr	    tvtohz(&timeout));
497177633Sdfr
498180025Sdfr	TAILQ_REMOVE(&ct->ct_pending, cr, cr_link);
499180025Sdfr
500177633Sdfr	if (error) {
501177633Sdfr		/*
502177633Sdfr		 * The sleep returned an error so our request is still
503177633Sdfr		 * on the list. Turn the error code into an
504177633Sdfr		 * appropriate client status.
505177633Sdfr		 */
506184588Sdfr		errp->re_errno = error;
507177633Sdfr		switch (error) {
508177633Sdfr		case EINTR:
509195703Skib		case ERESTART:
510184588Sdfr			stat = RPC_INTR;
511177633Sdfr			break;
512177633Sdfr		case EWOULDBLOCK:
513184588Sdfr			stat = RPC_TIMEDOUT;
514177633Sdfr			break;
515177633Sdfr		default:
516184588Sdfr			stat = RPC_CANTRECV;
517177633Sdfr		}
518184588Sdfr		errp->re_status = stat;
519177633Sdfr		goto out;
520177633Sdfr	} else {
521177633Sdfr		/*
522177633Sdfr		 * We were woken up by the upcall.  If the
523177633Sdfr		 * upcall had a receive error, report that,
524177633Sdfr		 * otherwise we have a reply.
525177633Sdfr		 */
526180025Sdfr		if (cr->cr_error) {
527184588Sdfr			errp->re_errno = cr->cr_error;
528184588Sdfr			errp->re_status = stat = RPC_CANTRECV;
529177633Sdfr			goto out;
530177633Sdfr		}
531177633Sdfr	}
532177633Sdfr
533177633Sdfrgot_reply:
534177633Sdfr	/*
535177633Sdfr	 * Now decode and validate the response. We need to drop the
536177633Sdfr	 * lock since xdr_replymsg may end up sleeping in malloc.
537177633Sdfr	 */
538177633Sdfr	mtx_unlock(&ct->ct_lock);
539177633Sdfr
540184588Sdfr	if (ext && ext->rc_feedback)
541184588Sdfr		ext->rc_feedback(FEEDBACK_OK, proc, ext->rc_feedback_arg);
542184588Sdfr
543180025Sdfr	xdrmbuf_create(&xdrs, cr->cr_mrep, XDR_DECODE);
544177633Sdfr	ok = xdr_replymsg(&xdrs, &reply_msg);
545180025Sdfr	cr->cr_mrep = NULL;
546177633Sdfr
547177633Sdfr	if (ok) {
548177633Sdfr		if ((reply_msg.rm_reply.rp_stat == MSG_ACCEPTED) &&
549184588Sdfr		    (reply_msg.acpted_rply.ar_stat == SUCCESS))
550184588Sdfr			errp->re_status = stat = RPC_SUCCESS;
551177633Sdfr		else
552184588Sdfr			stat = _seterr_reply(&reply_msg, errp);
553177633Sdfr
554184588Sdfr		if (stat == RPC_SUCCESS) {
555184588Sdfr			results = xdrmbuf_getall(&xdrs);
556184588Sdfr			if (!AUTH_VALIDATE(auth, xid,
557184588Sdfr				&reply_msg.acpted_rply.ar_verf,
558184588Sdfr				&results)) {
559184588Sdfr				errp->re_status = stat = RPC_AUTHERROR;
560184588Sdfr				errp->re_why = AUTH_INVALIDRESP;
561184588Sdfr			} else {
562184588Sdfr				KASSERT(results,
563184588Sdfr				    ("auth validated but no result"));
564184588Sdfr				*resultsp = results;
565177633Sdfr			}
566177633Sdfr		}		/* end successful completion */
567177633Sdfr		/*
568177633Sdfr		 * If unsuccesful AND error is an authentication error
569177633Sdfr		 * then refresh credentials and try again, else break
570177633Sdfr		 */
571184588Sdfr		else if (stat == RPC_AUTHERROR)
572177633Sdfr			/* maybe our credentials need to be refreshed ... */
573177633Sdfr			if (nrefreshes > 0 &&
574184588Sdfr			    AUTH_REFRESH(auth, &reply_msg)) {
575177633Sdfr				nrefreshes--;
576184588Sdfr				XDR_DESTROY(&xdrs);
577184588Sdfr				mtx_lock(&ct->ct_lock);
578177633Sdfr				goto call_again;
579177633Sdfr			}
580177633Sdfr		/* end of unsuccessful completion */
581177633Sdfr	}	/* end of valid reply message */
582177633Sdfr	else {
583184588Sdfr		errp->re_status = stat = RPC_CANTDECODERES;
584177633Sdfr	}
585184588Sdfr	XDR_DESTROY(&xdrs);
586184588Sdfr	mtx_lock(&ct->ct_lock);
587177633Sdfrout:
588177633Sdfr	mtx_assert(&ct->ct_lock, MA_OWNED);
589177633Sdfr
590184588Sdfr	KASSERT(stat != RPC_SUCCESS || *resultsp,
591184588Sdfr	    ("RPC_SUCCESS without reply"));
592184588Sdfr
593177633Sdfr	if (mreq)
594177633Sdfr		m_freem(mreq);
595180025Sdfr	if (cr->cr_mrep)
596180025Sdfr		m_freem(cr->cr_mrep);
597177633Sdfr
598180025Sdfr	ct->ct_threads--;
599180025Sdfr	if (ct->ct_closing)
600180025Sdfr		wakeup(ct);
601180025Sdfr
602177633Sdfr	mtx_unlock(&ct->ct_lock);
603180025Sdfr
604184588Sdfr	if (auth && stat != RPC_SUCCESS)
605184588Sdfr		AUTH_VALIDATE(auth, xid, NULL, NULL);
606184588Sdfr
607180025Sdfr	free(cr, M_RPC);
608180025Sdfr
609184588Sdfr	return (stat);
610177633Sdfr}
611177633Sdfr
612177633Sdfrstatic void
613177633Sdfrclnt_vc_geterr(CLIENT *cl, struct rpc_err *errp)
614177633Sdfr{
615177633Sdfr	struct ct_data *ct = (struct ct_data *) cl->cl_private;
616177633Sdfr
617177633Sdfr	*errp = ct->ct_error;
618177633Sdfr}
619177633Sdfr
620177633Sdfrstatic bool_t
621177633Sdfrclnt_vc_freeres(CLIENT *cl, xdrproc_t xdr_res, void *res_ptr)
622177633Sdfr{
623177633Sdfr	XDR xdrs;
624177633Sdfr	bool_t dummy;
625177633Sdfr
626177633Sdfr	xdrs.x_op = XDR_FREE;
627177633Sdfr	dummy = (*xdr_res)(&xdrs, res_ptr);
628177633Sdfr
629177633Sdfr	return (dummy);
630177633Sdfr}
631177633Sdfr
632177633Sdfr/*ARGSUSED*/
633177633Sdfrstatic void
634177633Sdfrclnt_vc_abort(CLIENT *cl)
635177633Sdfr{
636177633Sdfr}
637177633Sdfr
638177633Sdfrstatic bool_t
639177633Sdfrclnt_vc_control(CLIENT *cl, u_int request, void *info)
640177633Sdfr{
641177633Sdfr	struct ct_data *ct = (struct ct_data *)cl->cl_private;
642177633Sdfr	void *infop = info;
643177633Sdfr
644177633Sdfr	mtx_lock(&ct->ct_lock);
645177633Sdfr
646177633Sdfr	switch (request) {
647177633Sdfr	case CLSET_FD_CLOSE:
648177633Sdfr		ct->ct_closeit = TRUE;
649177633Sdfr		mtx_unlock(&ct->ct_lock);
650177633Sdfr		return (TRUE);
651177633Sdfr	case CLSET_FD_NCLOSE:
652177633Sdfr		ct->ct_closeit = FALSE;
653177633Sdfr		mtx_unlock(&ct->ct_lock);
654177633Sdfr		return (TRUE);
655177633Sdfr	default:
656177633Sdfr		break;
657177633Sdfr	}
658177633Sdfr
659177633Sdfr	/* for other requests which use info */
660177633Sdfr	if (info == NULL) {
661177633Sdfr		mtx_unlock(&ct->ct_lock);
662177633Sdfr		return (FALSE);
663177633Sdfr	}
664177633Sdfr	switch (request) {
665177633Sdfr	case CLSET_TIMEOUT:
666177633Sdfr		if (time_not_ok((struct timeval *)info)) {
667177633Sdfr			mtx_unlock(&ct->ct_lock);
668177633Sdfr			return (FALSE);
669177633Sdfr		}
670177633Sdfr		ct->ct_wait = *(struct timeval *)infop;
671177633Sdfr		break;
672177633Sdfr	case CLGET_TIMEOUT:
673177633Sdfr		*(struct timeval *)infop = ct->ct_wait;
674177633Sdfr		break;
675177633Sdfr	case CLGET_SERVER_ADDR:
676177633Sdfr		(void) memcpy(info, &ct->ct_addr, (size_t)ct->ct_addr.ss_len);
677177633Sdfr		break;
678177633Sdfr	case CLGET_SVC_ADDR:
679177633Sdfr		/*
680177633Sdfr		 * Slightly different semantics to userland - we use
681177633Sdfr		 * sockaddr instead of netbuf.
682177633Sdfr		 */
683177633Sdfr		memcpy(info, &ct->ct_addr, ct->ct_addr.ss_len);
684177633Sdfr		break;
685177633Sdfr	case CLSET_SVC_ADDR:		/* set to new address */
686177633Sdfr		mtx_unlock(&ct->ct_lock);
687177633Sdfr		return (FALSE);
688177633Sdfr	case CLGET_XID:
689177633Sdfr		*(uint32_t *)info = ct->ct_xid;
690177633Sdfr		break;
691177633Sdfr	case CLSET_XID:
692177633Sdfr		/* This will set the xid of the NEXT call */
693177633Sdfr		/* decrement by 1 as clnt_vc_call() increments once */
694177633Sdfr		ct->ct_xid = *(uint32_t *)info - 1;
695177633Sdfr		break;
696177633Sdfr	case CLGET_VERS:
697177633Sdfr		/*
698177633Sdfr		 * This RELIES on the information that, in the call body,
699177633Sdfr		 * the version number field is the fifth field from the
700177633Sdfr		 * begining of the RPC header. MUST be changed if the
701177633Sdfr		 * call_struct is changed
702177633Sdfr		 */
703177633Sdfr		*(uint32_t *)info =
704177633Sdfr		    ntohl(*(uint32_t *)(void *)(ct->ct_mcallc +
705177633Sdfr		    4 * BYTES_PER_XDR_UNIT));
706177633Sdfr		break;
707177633Sdfr
708177633Sdfr	case CLSET_VERS:
709177633Sdfr		*(uint32_t *)(void *)(ct->ct_mcallc +
710177633Sdfr		    4 * BYTES_PER_XDR_UNIT) =
711177633Sdfr		    htonl(*(uint32_t *)info);
712177633Sdfr		break;
713177633Sdfr
714177633Sdfr	case CLGET_PROG:
715177633Sdfr		/*
716177633Sdfr		 * This RELIES on the information that, in the call body,
717177633Sdfr		 * the program number field is the fourth field from the
718177633Sdfr		 * begining of the RPC header. MUST be changed if the
719177633Sdfr		 * call_struct is changed
720177633Sdfr		 */
721177633Sdfr		*(uint32_t *)info =
722177633Sdfr		    ntohl(*(uint32_t *)(void *)(ct->ct_mcallc +
723177633Sdfr		    3 * BYTES_PER_XDR_UNIT));
724177633Sdfr		break;
725177633Sdfr
726177633Sdfr	case CLSET_PROG:
727177633Sdfr		*(uint32_t *)(void *)(ct->ct_mcallc +
728177633Sdfr		    3 * BYTES_PER_XDR_UNIT) =
729177633Sdfr		    htonl(*(uint32_t *)info);
730177633Sdfr		break;
731177633Sdfr
732177633Sdfr	case CLSET_WAITCHAN:
733184588Sdfr		ct->ct_waitchan = (const char *)info;
734177633Sdfr		break;
735177633Sdfr
736177633Sdfr	case CLGET_WAITCHAN:
737177633Sdfr		*(const char **) info = ct->ct_waitchan;
738177633Sdfr		break;
739177633Sdfr
740177633Sdfr	case CLSET_INTERRUPTIBLE:
741177633Sdfr		if (*(int *) info)
742195703Skib			ct->ct_waitflag = PCATCH | PBDRY;
743177633Sdfr		else
744177633Sdfr			ct->ct_waitflag = 0;
745177633Sdfr		break;
746177633Sdfr
747177633Sdfr	case CLGET_INTERRUPTIBLE:
748177633Sdfr		if (ct->ct_waitflag)
749177633Sdfr			*(int *) info = TRUE;
750177633Sdfr		else
751177633Sdfr			*(int *) info = FALSE;
752177633Sdfr		break;
753177633Sdfr
754177633Sdfr	default:
755177633Sdfr		mtx_unlock(&ct->ct_lock);
756177633Sdfr		return (FALSE);
757177633Sdfr	}
758177633Sdfr
759177633Sdfr	mtx_unlock(&ct->ct_lock);
760177633Sdfr	return (TRUE);
761177633Sdfr}
762177633Sdfr
763177633Sdfrstatic void
764184588Sdfrclnt_vc_close(CLIENT *cl)
765177633Sdfr{
766177633Sdfr	struct ct_data *ct = (struct ct_data *) cl->cl_private;
767180025Sdfr	struct ct_request *cr;
768177633Sdfr
769177633Sdfr	mtx_lock(&ct->ct_lock);
770177633Sdfr
771184588Sdfr	if (ct->ct_closed) {
772184588Sdfr		mtx_unlock(&ct->ct_lock);
773184588Sdfr		return;
774184588Sdfr	}
775184588Sdfr
776184588Sdfr	if (ct->ct_closing) {
777184588Sdfr		while (ct->ct_closing)
778184588Sdfr			msleep(ct, &ct->ct_lock, 0, "rpcclose", 0);
779184588Sdfr		KASSERT(ct->ct_closed, ("client should be closed"));
780184588Sdfr		mtx_unlock(&ct->ct_lock);
781184588Sdfr		return;
782184588Sdfr	}
783184588Sdfr
784177633Sdfr	if (ct->ct_socket) {
785193272Sjhb		ct->ct_closing = TRUE;
786193272Sjhb		mtx_unlock(&ct->ct_lock);
787193272Sjhb
788177633Sdfr		SOCKBUF_LOCK(&ct->ct_socket->so_rcv);
789193272Sjhb		soupcall_clear(ct->ct_socket, SO_RCV);
790193437Srmacklem		clnt_vc_upcallsdone(ct);
791177633Sdfr		SOCKBUF_UNLOCK(&ct->ct_socket->so_rcv);
792177633Sdfr
793180025Sdfr		/*
794180025Sdfr		 * Abort any pending requests and wait until everyone
795180025Sdfr		 * has finished with clnt_vc_call.
796180025Sdfr		 */
797193272Sjhb		mtx_lock(&ct->ct_lock);
798180025Sdfr		TAILQ_FOREACH(cr, &ct->ct_pending, cr_link) {
799180025Sdfr			cr->cr_xid = 0;
800180025Sdfr			cr->cr_error = ESHUTDOWN;
801180025Sdfr			wakeup(cr);
802180025Sdfr		}
803177633Sdfr
804180025Sdfr		while (ct->ct_threads)
805180025Sdfr			msleep(ct, &ct->ct_lock, 0, "rpcclose", 0);
806184588Sdfr	}
807180025Sdfr
808184588Sdfr	ct->ct_closing = FALSE;
809184588Sdfr	ct->ct_closed = TRUE;
810184588Sdfr	mtx_unlock(&ct->ct_lock);
811184588Sdfr	wakeup(ct);
812184588Sdfr}
813184588Sdfr
814184588Sdfrstatic void
815184588Sdfrclnt_vc_destroy(CLIENT *cl)
816184588Sdfr{
817184588Sdfr	struct ct_data *ct = (struct ct_data *) cl->cl_private;
818184588Sdfr	struct socket *so = NULL;
819184588Sdfr
820184588Sdfr	clnt_vc_close(cl);
821184588Sdfr
822184588Sdfr	mtx_lock(&ct->ct_lock);
823184588Sdfr
824184588Sdfr	if (ct->ct_socket) {
825177633Sdfr		if (ct->ct_closeit) {
826177633Sdfr			so = ct->ct_socket;
827177633Sdfr		}
828177633Sdfr	}
829177633Sdfr
830177633Sdfr	mtx_unlock(&ct->ct_lock);
831177633Sdfr
832177633Sdfr	mtx_destroy(&ct->ct_lock);
833177633Sdfr	if (so) {
834177633Sdfr		soshutdown(so, SHUT_WR);
835177633Sdfr		soclose(so);
836177633Sdfr	}
837177633Sdfr	mem_free(ct, sizeof(struct ct_data));
838177633Sdfr	mem_free(cl, sizeof(CLIENT));
839177633Sdfr}
840177633Sdfr
/*
 * Make sure that the time is not garbage.  Negative fields (including
 * the -1 value) are disallowed, seconds are capped at 100000000, and the
 * microseconds field must be a proper sub-second fraction (0..999999).
 * Note this is different from time_not_ok in clnt_dg.c
 *
 * Returns non-zero if *t must be rejected, zero if it is acceptable.
 */
static bool_t
time_not_ok(struct timeval *t)
{
	return (t->tv_sec < 0 || t->tv_sec > 100000000 ||
		t->tv_usec < 0 || t->tv_usec >= 1000000);
}
851177633Sdfr
852193272Sjhbint
853177633Sdfrclnt_vc_soupcall(struct socket *so, void *arg, int waitflag)
854177633Sdfr{
855177633Sdfr	struct ct_data *ct = (struct ct_data *) arg;
856177633Sdfr	struct uio uio;
857177633Sdfr	struct mbuf *m;
858177633Sdfr	struct ct_request *cr;
859177633Sdfr	int error, rcvflag, foundreq;
860177633Sdfr	uint32_t xid, header;
861184588Sdfr	bool_t do_read;
862177633Sdfr
863193437Srmacklem	ct->ct_upcallrefs++;
864177633Sdfr	uio.uio_td = curthread;
865177633Sdfr	do {
866177633Sdfr		/*
867177633Sdfr		 * If ct_record_resid is zero, we are waiting for a
868177633Sdfr		 * record mark.
869177633Sdfr		 */
870177633Sdfr		if (ct->ct_record_resid == 0) {
871177633Sdfr
872177633Sdfr			/*
873177633Sdfr			 * Make sure there is either a whole record
874177633Sdfr			 * mark in the buffer or there is some other
875177633Sdfr			 * error condition
876177633Sdfr			 */
877177633Sdfr			do_read = FALSE;
878177633Sdfr			if (so->so_rcv.sb_cc >= sizeof(uint32_t)
879177633Sdfr			    || (so->so_rcv.sb_state & SBS_CANTRCVMORE)
880177633Sdfr			    || so->so_error)
881177633Sdfr				do_read = TRUE;
882177633Sdfr
883177633Sdfr			if (!do_read)
884193437Srmacklem				break;
885177633Sdfr
886193272Sjhb			SOCKBUF_UNLOCK(&so->so_rcv);
887177633Sdfr			uio.uio_resid = sizeof(uint32_t);
888177633Sdfr			m = NULL;
889177633Sdfr			rcvflag = MSG_DONTWAIT | MSG_SOCALLBCK;
890177633Sdfr			error = soreceive(so, NULL, &uio, &m, NULL, &rcvflag);
891193272Sjhb			SOCKBUF_LOCK(&so->so_rcv);
892177633Sdfr
893177633Sdfr			if (error == EWOULDBLOCK)
894177633Sdfr				break;
895177633Sdfr
896177633Sdfr			/*
897177633Sdfr			 * If there was an error, wake up all pending
898177633Sdfr			 * requests.
899177633Sdfr			 */
900177633Sdfr			if (error || uio.uio_resid > 0) {
901177633Sdfr			wakeup_all:
902177633Sdfr				mtx_lock(&ct->ct_lock);
903177633Sdfr				if (!error) {
904177633Sdfr					/*
905177633Sdfr					 * We must have got EOF trying
906177633Sdfr					 * to read from the stream.
907177633Sdfr					 */
908177633Sdfr					error = ECONNRESET;
909177633Sdfr				}
910177633Sdfr				ct->ct_error.re_status = RPC_CANTRECV;
911177633Sdfr				ct->ct_error.re_errno = error;
912177633Sdfr				TAILQ_FOREACH(cr, &ct->ct_pending, cr_link) {
913177633Sdfr					cr->cr_error = error;
914177633Sdfr					wakeup(cr);
915177633Sdfr				}
916177633Sdfr				mtx_unlock(&ct->ct_lock);
917177633Sdfr				break;
918177633Sdfr			}
919184588Sdfr			bcopy(mtod(m, uint32_t *), &header, sizeof(uint32_t));
920177633Sdfr			header = ntohl(header);
921177633Sdfr			ct->ct_record = NULL;
922177633Sdfr			ct->ct_record_resid = header & 0x7fffffff;
923177633Sdfr			ct->ct_record_eor = ((header & 0x80000000) != 0);
924177633Sdfr			m_freem(m);
925177633Sdfr		} else {
926177633Sdfr			/*
927184588Sdfr			 * Wait until the socket has the whole record
928184588Sdfr			 * buffered.
929184588Sdfr			 */
930184588Sdfr			do_read = FALSE;
931184588Sdfr			if (so->so_rcv.sb_cc >= ct->ct_record_resid
932184588Sdfr			    || (so->so_rcv.sb_state & SBS_CANTRCVMORE)
933184588Sdfr			    || so->so_error)
934184588Sdfr				do_read = TRUE;
935184588Sdfr
936184588Sdfr			if (!do_read)
937193437Srmacklem				break;
938184588Sdfr
939184588Sdfr			/*
940177633Sdfr			 * We have the record mark. Read as much as
941177633Sdfr			 * the socket has buffered up to the end of
942177633Sdfr			 * this record.
943177633Sdfr			 */
944193272Sjhb			SOCKBUF_UNLOCK(&so->so_rcv);
945177633Sdfr			uio.uio_resid = ct->ct_record_resid;
946177633Sdfr			m = NULL;
947177633Sdfr			rcvflag = MSG_DONTWAIT | MSG_SOCALLBCK;
948177633Sdfr			error = soreceive(so, NULL, &uio, &m, NULL, &rcvflag);
949193272Sjhb			SOCKBUF_LOCK(&so->so_rcv);
950177633Sdfr
951177633Sdfr			if (error == EWOULDBLOCK)
952177633Sdfr				break;
953177633Sdfr
954177633Sdfr			if (error || uio.uio_resid == ct->ct_record_resid)
955177633Sdfr				goto wakeup_all;
956177633Sdfr
957177633Sdfr			/*
958177633Sdfr			 * If we have part of the record already,
959177633Sdfr			 * chain this bit onto the end.
960177633Sdfr			 */
961177633Sdfr			if (ct->ct_record)
962177633Sdfr				m_last(ct->ct_record)->m_next = m;
963177633Sdfr			else
964177633Sdfr				ct->ct_record = m;
965177633Sdfr
966177633Sdfr			ct->ct_record_resid = uio.uio_resid;
967177633Sdfr
968177633Sdfr			/*
969177633Sdfr			 * If we have the entire record, see if we can
970177633Sdfr			 * match it to a request.
971177633Sdfr			 */
972177633Sdfr			if (ct->ct_record_resid == 0
973177633Sdfr			    && ct->ct_record_eor) {
974177633Sdfr				/*
975177633Sdfr				 * The XID is in the first uint32_t of
976177633Sdfr				 * the reply.
977177633Sdfr				 */
978184588Sdfr				if (ct->ct_record->m_len < sizeof(xid))
979184588Sdfr					ct->ct_record =
980184588Sdfr						m_pullup(ct->ct_record,
981184588Sdfr						    sizeof(xid));
982177633Sdfr				if (!ct->ct_record)
983177633Sdfr					break;
984184588Sdfr				bcopy(mtod(ct->ct_record, uint32_t *),
985184588Sdfr				    &xid, sizeof(uint32_t));
986177633Sdfr				xid = ntohl(xid);
987177633Sdfr
988177633Sdfr				mtx_lock(&ct->ct_lock);
989177633Sdfr				foundreq = 0;
990177633Sdfr				TAILQ_FOREACH(cr, &ct->ct_pending, cr_link) {
991177633Sdfr					if (cr->cr_xid == xid) {
992177633Sdfr						/*
993177633Sdfr						 * This one
994180025Sdfr						 * matches. We leave
995180025Sdfr						 * the reply mbuf in
996177633Sdfr						 * cr->cr_mrep. Set
997177633Sdfr						 * the XID to zero so
998180025Sdfr						 * that we will ignore
999180025Sdfr						 * any duplicaed
1000180025Sdfr						 * replies.
1001177633Sdfr						 */
1002177633Sdfr						cr->cr_xid = 0;
1003177633Sdfr						cr->cr_mrep = ct->ct_record;
1004177633Sdfr						cr->cr_error = 0;
1005177633Sdfr						foundreq = 1;
1006177633Sdfr						wakeup(cr);
1007177633Sdfr						break;
1008177633Sdfr					}
1009177633Sdfr				}
1010177633Sdfr				mtx_unlock(&ct->ct_lock);
1011177633Sdfr
1012177633Sdfr				if (!foundreq)
1013177633Sdfr					m_freem(ct->ct_record);
1014177633Sdfr				ct->ct_record = NULL;
1015177633Sdfr			}
1016177633Sdfr		}
1017177633Sdfr	} while (m);
1018193437Srmacklem	ct->ct_upcallrefs--;
1019193437Srmacklem	if (ct->ct_upcallrefs < 0)
1020193437Srmacklem		panic("rpcvc upcall refcnt");
1021193437Srmacklem	if (ct->ct_upcallrefs == 0)
1022193437Srmacklem		wakeup(&ct->ct_upcallrefs);
1023193272Sjhb	return (SU_OK);
1024177633Sdfr}
1025193437Srmacklem
1026193437Srmacklem/*
1027193437Srmacklem * Wait for all upcalls in progress to complete.
1028193437Srmacklem */
1029193437Srmacklemstatic void
1030193437Srmacklemclnt_vc_upcallsdone(struct ct_data *ct)
1031193437Srmacklem{
1032193437Srmacklem
1033193437Srmacklem	SOCKBUF_LOCK_ASSERT(&ct->ct_socket->so_rcv);
1034193437Srmacklem
1035193437Srmacklem	while (ct->ct_upcallrefs > 0)
1036193437Srmacklem		(void) msleep(&ct->ct_upcallrefs,
1037193437Srmacklem		    SOCKBUF_MTX(&ct->ct_socket->so_rcv), 0, "rpcvcup", 0);
1038193437Srmacklem}
1039