/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
/*
 * Copyright 2007 Sun Microsystems, Inc. All rights reserved.
 * Use is subject to license terms.
 */
/* Copyright (c) 1990 Mentat Inc.
*/ 260Sstevel@tonic-gate 270Sstevel@tonic-gate /* Copyright (c) 1984, 1986, 1987, 1988, 1989 AT&T */ 280Sstevel@tonic-gate /* All Rights Reserved */ 290Sstevel@tonic-gate 300Sstevel@tonic-gate #pragma ident "%Z%%M% %I% %E% SMI" 310Sstevel@tonic-gate 320Sstevel@tonic-gate /* 330Sstevel@tonic-gate * Kernel RPC filtering module 340Sstevel@tonic-gate */ 350Sstevel@tonic-gate 360Sstevel@tonic-gate #include <sys/param.h> 370Sstevel@tonic-gate #include <sys/types.h> 380Sstevel@tonic-gate #include <sys/stream.h> 390Sstevel@tonic-gate #include <sys/stropts.h> 400Sstevel@tonic-gate #include <sys/tihdr.h> 410Sstevel@tonic-gate #include <sys/timod.h> 420Sstevel@tonic-gate #include <sys/tiuser.h> 430Sstevel@tonic-gate #include <sys/debug.h> 440Sstevel@tonic-gate #include <sys/signal.h> 450Sstevel@tonic-gate #include <sys/pcb.h> 460Sstevel@tonic-gate #include <sys/user.h> 470Sstevel@tonic-gate #include <sys/errno.h> 480Sstevel@tonic-gate #include <sys/cred.h> 490Sstevel@tonic-gate #include <sys/policy.h> 500Sstevel@tonic-gate #include <sys/inline.h> 510Sstevel@tonic-gate #include <sys/cmn_err.h> 520Sstevel@tonic-gate #include <sys/kmem.h> 530Sstevel@tonic-gate #include <sys/file.h> 540Sstevel@tonic-gate #include <sys/sysmacros.h> 550Sstevel@tonic-gate #include <sys/systm.h> 560Sstevel@tonic-gate #include <sys/t_lock.h> 570Sstevel@tonic-gate #include <sys/ddi.h> 580Sstevel@tonic-gate #include <sys/vtrace.h> 590Sstevel@tonic-gate #include <sys/callb.h> 600Sstevel@tonic-gate 610Sstevel@tonic-gate #include <sys/strlog.h> 620Sstevel@tonic-gate #include <rpc/rpc_com.h> 630Sstevel@tonic-gate #include <inet/common.h> 640Sstevel@tonic-gate #include <rpc/types.h> 650Sstevel@tonic-gate #include <sys/time.h> 660Sstevel@tonic-gate #include <rpc/xdr.h> 670Sstevel@tonic-gate #include <rpc/auth.h> 680Sstevel@tonic-gate #include <rpc/clnt.h> 690Sstevel@tonic-gate #include <rpc/rpc_msg.h> 700Sstevel@tonic-gate #include <rpc/clnt.h> 710Sstevel@tonic-gate #include <rpc/svc.h> 720Sstevel@tonic-gate 
#include <rpc/rpcsys.h> 730Sstevel@tonic-gate #include <rpc/rpc_rdma.h> 740Sstevel@tonic-gate 750Sstevel@tonic-gate /* 760Sstevel@tonic-gate * This is the loadable module wrapper. 770Sstevel@tonic-gate */ 780Sstevel@tonic-gate #include <sys/conf.h> 790Sstevel@tonic-gate #include <sys/modctl.h> 800Sstevel@tonic-gate #include <sys/syscall.h> 810Sstevel@tonic-gate 820Sstevel@tonic-gate extern struct streamtab rpcinfo; 830Sstevel@tonic-gate 840Sstevel@tonic-gate static struct fmodsw fsw = { 850Sstevel@tonic-gate "rpcmod", 860Sstevel@tonic-gate &rpcinfo, 870Sstevel@tonic-gate D_NEW|D_MP, 880Sstevel@tonic-gate }; 890Sstevel@tonic-gate 900Sstevel@tonic-gate /* 910Sstevel@tonic-gate * Module linkage information for the kernel. 920Sstevel@tonic-gate */ 930Sstevel@tonic-gate 940Sstevel@tonic-gate static struct modlstrmod modlstrmod = { 950Sstevel@tonic-gate &mod_strmodops, "rpc interface str mod", &fsw 960Sstevel@tonic-gate }; 970Sstevel@tonic-gate 980Sstevel@tonic-gate /* 990Sstevel@tonic-gate * For the RPC system call. 
1000Sstevel@tonic-gate */ 1010Sstevel@tonic-gate static struct sysent rpcsysent = { 1020Sstevel@tonic-gate 2, 1030Sstevel@tonic-gate SE_32RVAL1 | SE_ARGC | SE_NOUNLOAD, 1040Sstevel@tonic-gate rpcsys 1050Sstevel@tonic-gate }; 1060Sstevel@tonic-gate 1070Sstevel@tonic-gate static struct modlsys modlsys = { 1080Sstevel@tonic-gate &mod_syscallops, 1090Sstevel@tonic-gate "RPC syscall", 1100Sstevel@tonic-gate &rpcsysent 1110Sstevel@tonic-gate }; 1120Sstevel@tonic-gate 1130Sstevel@tonic-gate #ifdef _SYSCALL32_IMPL 1140Sstevel@tonic-gate static struct modlsys modlsys32 = { 1150Sstevel@tonic-gate &mod_syscallops32, 1160Sstevel@tonic-gate "32-bit RPC syscall", 1170Sstevel@tonic-gate &rpcsysent 1180Sstevel@tonic-gate }; 1190Sstevel@tonic-gate #endif /* _SYSCALL32_IMPL */ 1200Sstevel@tonic-gate 1210Sstevel@tonic-gate static struct modlinkage modlinkage = { 1220Sstevel@tonic-gate MODREV_1, 1230Sstevel@tonic-gate { 1240Sstevel@tonic-gate &modlsys, 1250Sstevel@tonic-gate #ifdef _SYSCALL32_IMPL 1260Sstevel@tonic-gate &modlsys32, 1270Sstevel@tonic-gate #endif 1280Sstevel@tonic-gate &modlstrmod, 1290Sstevel@tonic-gate NULL 1300Sstevel@tonic-gate } 1310Sstevel@tonic-gate }; 1320Sstevel@tonic-gate 1330Sstevel@tonic-gate int 1340Sstevel@tonic-gate _init(void) 1350Sstevel@tonic-gate { 1360Sstevel@tonic-gate int error = 0; 1370Sstevel@tonic-gate callb_id_t cid; 1380Sstevel@tonic-gate int status; 1390Sstevel@tonic-gate 1400Sstevel@tonic-gate svc_init(); 1410Sstevel@tonic-gate clnt_init(); 1420Sstevel@tonic-gate cid = callb_add(connmgr_cpr_reset, 0, CB_CL_CPR_RPC, "rpc"); 1430Sstevel@tonic-gate 1440Sstevel@tonic-gate if (error = mod_install(&modlinkage)) { 1450Sstevel@tonic-gate /* 1460Sstevel@tonic-gate * Could not install module, cleanup previous 1470Sstevel@tonic-gate * initialization work. 
1480Sstevel@tonic-gate */ 1490Sstevel@tonic-gate clnt_fini(); 1500Sstevel@tonic-gate if (cid != NULL) 1510Sstevel@tonic-gate (void) callb_delete(cid); 1520Sstevel@tonic-gate 1530Sstevel@tonic-gate return (error); 1540Sstevel@tonic-gate } 1550Sstevel@tonic-gate 1560Sstevel@tonic-gate /* 1570Sstevel@tonic-gate * Load up the RDMA plugins and initialize the stats. Even if the 1580Sstevel@tonic-gate * plugins loadup fails, but rpcmod was successfully installed the 1590Sstevel@tonic-gate * counters still get initialized. 1600Sstevel@tonic-gate */ 1610Sstevel@tonic-gate rw_init(&rdma_lock, NULL, RW_DEFAULT, NULL); 1620Sstevel@tonic-gate mutex_init(&rdma_modload_lock, NULL, MUTEX_DEFAULT, NULL); 1630Sstevel@tonic-gate mt_kstat_init(); 1640Sstevel@tonic-gate 1650Sstevel@tonic-gate /* 1660Sstevel@tonic-gate * Get our identification into ldi. This is used for loading 1670Sstevel@tonic-gate * other modules, e.g. rpcib. 1680Sstevel@tonic-gate */ 1690Sstevel@tonic-gate status = ldi_ident_from_mod(&modlinkage, &rpcmod_li); 1700Sstevel@tonic-gate if (status != 0) { 1710Sstevel@tonic-gate cmn_err(CE_WARN, "ldi_ident_from_mod fails with %d", status); 1720Sstevel@tonic-gate rpcmod_li = NULL; 1730Sstevel@tonic-gate } 1740Sstevel@tonic-gate 1750Sstevel@tonic-gate return (error); 1760Sstevel@tonic-gate } 1770Sstevel@tonic-gate 1780Sstevel@tonic-gate /* 1790Sstevel@tonic-gate * The unload entry point fails, because we advertise entry points into 1800Sstevel@tonic-gate * rpcmod from the rest of kRPC: rpcmod_release(). 
1810Sstevel@tonic-gate */ 1820Sstevel@tonic-gate int 1830Sstevel@tonic-gate _fini(void) 1840Sstevel@tonic-gate { 1850Sstevel@tonic-gate return (EBUSY); 1860Sstevel@tonic-gate } 1870Sstevel@tonic-gate 1880Sstevel@tonic-gate int 1890Sstevel@tonic-gate _info(struct modinfo *modinfop) 1900Sstevel@tonic-gate { 1910Sstevel@tonic-gate return (mod_info(&modlinkage, modinfop)); 1920Sstevel@tonic-gate } 1930Sstevel@tonic-gate 1940Sstevel@tonic-gate extern int nulldev(); 1950Sstevel@tonic-gate 1960Sstevel@tonic-gate #define RPCMOD_ID 2049 1970Sstevel@tonic-gate 1980Sstevel@tonic-gate int rmm_open(), rmm_close(); 1990Sstevel@tonic-gate 2000Sstevel@tonic-gate /* 2010Sstevel@tonic-gate * To save instructions, since STREAMS ignores the return value 2020Sstevel@tonic-gate * from these functions, they are defined as void here. Kind of icky, but... 2030Sstevel@tonic-gate */ 2040Sstevel@tonic-gate void rmm_rput(queue_t *, mblk_t *); 2050Sstevel@tonic-gate void rmm_wput(queue_t *, mblk_t *); 2060Sstevel@tonic-gate void rmm_rsrv(queue_t *); 2070Sstevel@tonic-gate void rmm_wsrv(queue_t *); 2080Sstevel@tonic-gate 2090Sstevel@tonic-gate int rpcmodopen(), rpcmodclose(); 2100Sstevel@tonic-gate void rpcmodrput(), rpcmodwput(); 2110Sstevel@tonic-gate void rpcmodrsrv(), rpcmodwsrv(); 2120Sstevel@tonic-gate 2130Sstevel@tonic-gate static void rpcmodwput_other(queue_t *, mblk_t *); 2140Sstevel@tonic-gate static int mir_close(queue_t *q); 2150Sstevel@tonic-gate static int mir_open(queue_t *q, dev_t *devp, int flag, int sflag, 2160Sstevel@tonic-gate cred_t *credp); 2170Sstevel@tonic-gate static void mir_rput(queue_t *q, mblk_t *mp); 2180Sstevel@tonic-gate static void mir_rsrv(queue_t *q); 2190Sstevel@tonic-gate static void mir_wput(queue_t *q, mblk_t *mp); 2200Sstevel@tonic-gate static void mir_wsrv(queue_t *q); 2210Sstevel@tonic-gate 2220Sstevel@tonic-gate static struct module_info rpcmod_info = 2230Sstevel@tonic-gate {RPCMOD_ID, "rpcmod", 0, INFPSZ, 256*1024, 1024}; 2240Sstevel@tonic-gate 
2250Sstevel@tonic-gate /* 2260Sstevel@tonic-gate * Read side has no service procedure. 2270Sstevel@tonic-gate */ 2280Sstevel@tonic-gate static struct qinit rpcmodrinit = { 2290Sstevel@tonic-gate (int (*)())rmm_rput, 2300Sstevel@tonic-gate (int (*)())rmm_rsrv, 2310Sstevel@tonic-gate rmm_open, 2320Sstevel@tonic-gate rmm_close, 2330Sstevel@tonic-gate nulldev, 2340Sstevel@tonic-gate &rpcmod_info, 2350Sstevel@tonic-gate NULL 2360Sstevel@tonic-gate }; 2370Sstevel@tonic-gate 2380Sstevel@tonic-gate /* 2390Sstevel@tonic-gate * The write put procedure is simply putnext to conserve stack space. 2400Sstevel@tonic-gate * The write service procedure is not used to queue data, but instead to 2410Sstevel@tonic-gate * synchronize with flow control. 2420Sstevel@tonic-gate */ 2430Sstevel@tonic-gate static struct qinit rpcmodwinit = { 2440Sstevel@tonic-gate (int (*)())rmm_wput, 2450Sstevel@tonic-gate (int (*)())rmm_wsrv, 2460Sstevel@tonic-gate rmm_open, 2470Sstevel@tonic-gate rmm_close, 2480Sstevel@tonic-gate nulldev, 2490Sstevel@tonic-gate &rpcmod_info, 2500Sstevel@tonic-gate NULL 2510Sstevel@tonic-gate }; 2520Sstevel@tonic-gate struct streamtab rpcinfo = { &rpcmodrinit, &rpcmodwinit, NULL, NULL }; 2530Sstevel@tonic-gate 2540Sstevel@tonic-gate struct xprt_style_ops { 2550Sstevel@tonic-gate int (*xo_open)(); 2560Sstevel@tonic-gate int (*xo_close)(); 2570Sstevel@tonic-gate void (*xo_wput)(); 2580Sstevel@tonic-gate void (*xo_wsrv)(); 2590Sstevel@tonic-gate void (*xo_rput)(); 2600Sstevel@tonic-gate void (*xo_rsrv)(); 2610Sstevel@tonic-gate }; 2620Sstevel@tonic-gate 2630Sstevel@tonic-gate static struct xprt_style_ops xprt_clts_ops = { 2640Sstevel@tonic-gate rpcmodopen, 2650Sstevel@tonic-gate rpcmodclose, 2660Sstevel@tonic-gate rpcmodwput, 2670Sstevel@tonic-gate rpcmodwsrv, 2680Sstevel@tonic-gate rpcmodrput, 2690Sstevel@tonic-gate NULL 2700Sstevel@tonic-gate }; 2710Sstevel@tonic-gate 2720Sstevel@tonic-gate static struct xprt_style_ops xprt_cots_ops = { 2730Sstevel@tonic-gate mir_open, 
2740Sstevel@tonic-gate mir_close, 2750Sstevel@tonic-gate mir_wput, 2760Sstevel@tonic-gate mir_wsrv, 2770Sstevel@tonic-gate mir_rput, 2780Sstevel@tonic-gate mir_rsrv 2790Sstevel@tonic-gate }; 2800Sstevel@tonic-gate 2810Sstevel@tonic-gate /* 2820Sstevel@tonic-gate * Per rpcmod "slot" data structure. q->q_ptr points to one of these. 2830Sstevel@tonic-gate */ 2840Sstevel@tonic-gate struct rpcm { 2850Sstevel@tonic-gate void *rm_krpc_cell; /* Reserved for use by KRPC */ 2860Sstevel@tonic-gate struct xprt_style_ops *rm_ops; 2870Sstevel@tonic-gate int rm_type; /* Client or server side stream */ 2880Sstevel@tonic-gate #define RM_CLOSING 0x1 /* somebody is trying to close slot */ 2890Sstevel@tonic-gate uint_t rm_state; /* state of the slot. see above */ 2900Sstevel@tonic-gate uint_t rm_ref; /* cnt of external references to slot */ 2910Sstevel@tonic-gate kmutex_t rm_lock; /* mutex protecting above fields */ 2920Sstevel@tonic-gate kcondvar_t rm_cwait; /* condition for closing */ 2930Sstevel@tonic-gate zoneid_t rm_zoneid; /* zone which pushed rpcmod */ 2940Sstevel@tonic-gate }; 2950Sstevel@tonic-gate 2960Sstevel@tonic-gate struct temp_slot { 2970Sstevel@tonic-gate void *cell; 2980Sstevel@tonic-gate struct xprt_style_ops *ops; 2990Sstevel@tonic-gate int type; 3000Sstevel@tonic-gate mblk_t *info_ack; 3010Sstevel@tonic-gate kmutex_t lock; 3020Sstevel@tonic-gate kcondvar_t wait; 3030Sstevel@tonic-gate }; 3040Sstevel@tonic-gate 3054386Sgeorges typedef struct mir_s { 3064386Sgeorges void *mir_krpc_cell; /* Reserved for KRPC use. This field */ 3074386Sgeorges /* must be first in the structure. */ 3084386Sgeorges struct xprt_style_ops *rm_ops; 3094386Sgeorges int mir_type; /* Client or server side stream */ 3104386Sgeorges 3114386Sgeorges mblk_t *mir_head_mp; /* RPC msg in progress */ 3124386Sgeorges /* 3134386Sgeorges * mir_head_mp points the first mblk being collected in 3144386Sgeorges * the current RPC message. 
Record headers are removed 3154386Sgeorges * before data is linked into mir_head_mp. 3164386Sgeorges */ 3174386Sgeorges mblk_t *mir_tail_mp; /* Last mblk in mir_head_mp */ 3184386Sgeorges /* 3194386Sgeorges * mir_tail_mp points to the last mblk in the message 3204386Sgeorges * chain starting at mir_head_mp. It is only valid 3214386Sgeorges * if mir_head_mp is non-NULL and is used to add new 3224386Sgeorges * data blocks to the end of chain quickly. 3234386Sgeorges */ 3244386Sgeorges 3254386Sgeorges int32_t mir_frag_len; /* Bytes seen in the current frag */ 3264386Sgeorges /* 3274386Sgeorges * mir_frag_len starts at -4 for beginning of each fragment. 3284386Sgeorges * When this length is negative, it indicates the number of 3294386Sgeorges * bytes that rpcmod needs to complete the record marker 3304386Sgeorges * header. When it is positive or zero, it holds the number 3314386Sgeorges * of bytes that have arrived for the current fragment and 3324386Sgeorges * are held in mir_header_mp. 3334386Sgeorges */ 3344386Sgeorges 3354386Sgeorges int32_t mir_frag_header; 3364386Sgeorges /* 3374386Sgeorges * Fragment header as collected for the current fragment. 3384386Sgeorges * It holds the last-fragment indicator and the number 3394386Sgeorges * of bytes in the fragment. 3404386Sgeorges */ 3414386Sgeorges 3424386Sgeorges unsigned int 3434386Sgeorges mir_ordrel_pending : 1, /* Sent T_ORDREL_REQ */ 3444386Sgeorges mir_hold_inbound : 1, /* Hold inbound messages on server */ 3454386Sgeorges /* side until outbound flow control */ 3464386Sgeorges /* is relieved. 
*/ 3474386Sgeorges mir_closing : 1, /* The stream is being closed */ 3484386Sgeorges mir_inrservice : 1, /* data queued or rd srv proc running */ 3494386Sgeorges mir_inwservice : 1, /* data queued or wr srv proc running */ 3504386Sgeorges mir_inwflushdata : 1, /* flush M_DATAs when srv runs */ 3514386Sgeorges /* 3524386Sgeorges * On client streams, mir_clntreq is 0 or 1; it is set 3534386Sgeorges * to 1 whenever a new request is sent out (mir_wput) 3544386Sgeorges * and cleared when the timer fires (mir_timer). If 3554386Sgeorges * the timer fires with this value equal to 0, then the 3564386Sgeorges * stream is considered idle and KRPC is notified. 3574386Sgeorges */ 3584386Sgeorges mir_clntreq : 1, 3594386Sgeorges /* 3604386Sgeorges * On server streams, stop accepting messages 3614386Sgeorges */ 3624386Sgeorges mir_svc_no_more_msgs : 1, 3634386Sgeorges mir_listen_stream : 1, /* listen end point */ 3644386Sgeorges mir_unused : 1, /* no longer used */ 3654386Sgeorges mir_timer_call : 1, 3664386Sgeorges mir_junk_fill_thru_bit_31 : 21; 3674386Sgeorges 3684386Sgeorges int mir_setup_complete; /* server has initialized everything */ 3694386Sgeorges timeout_id_t mir_timer_id; /* Timer for idle checks */ 3704386Sgeorges clock_t mir_idle_timeout; /* Allowed idle time before shutdown */ 3714386Sgeorges /* 3724386Sgeorges * This value is copied from clnt_idle_timeout or 3734386Sgeorges * svc_idle_timeout during the appropriate ioctl. 3744386Sgeorges * Kept in milliseconds 3754386Sgeorges */ 3764386Sgeorges clock_t mir_use_timestamp; /* updated on client with each use */ 3774386Sgeorges /* 3784386Sgeorges * This value is set to lbolt 3794386Sgeorges * every time a client stream sends or receives data. 3804386Sgeorges * Even if the timer message arrives, we don't shutdown 3814386Sgeorges * client unless: 3824386Sgeorges * lbolt >= MSEC_TO_TICK(mir_idle_timeout)+mir_use_timestamp. 3834386Sgeorges * This value is kept in HZ. 
3844386Sgeorges */ 3854386Sgeorges 3864386Sgeorges uint_t *mir_max_msg_sizep; /* Reference to sanity check size */ 3874386Sgeorges /* 3884386Sgeorges * This pointer is set to &clnt_max_msg_size or 3894386Sgeorges * &svc_max_msg_size during the appropriate ioctl. 3904386Sgeorges */ 3914386Sgeorges zoneid_t mir_zoneid; /* zone which pushed rpcmod */ 3924386Sgeorges /* Server-side fields. */ 3934386Sgeorges int mir_ref_cnt; /* Reference count: server side only */ 3944386Sgeorges /* counts the number of references */ 3954386Sgeorges /* that a kernel RPC server thread */ 3964386Sgeorges /* (see svc_run()) has on this rpcmod */ 3974386Sgeorges /* slot. Effectively, it is the */ 3984386Sgeorges /* number * of unprocessed messages */ 3994386Sgeorges /* that have been passed up to the */ 4004386Sgeorges /* KRPC layer */ 4014386Sgeorges 4024386Sgeorges mblk_t *mir_svc_pend_mp; /* Pending T_ORDREL_IND or */ 4034386Sgeorges /* T_DISCON_IND */ 4044386Sgeorges 4054386Sgeorges /* 4064386Sgeorges * these fields are for both client and server, but for debugging, 4074386Sgeorges * it is easier to have these last in the structure. 4084386Sgeorges */ 4094386Sgeorges kmutex_t mir_mutex; /* Mutex and condvar for close */ 4104386Sgeorges kcondvar_t mir_condvar; /* synchronization. */ 4114386Sgeorges kcondvar_t mir_timer_cv; /* Timer routine sync. 
*/ 4124386Sgeorges } mir_t; 4134386Sgeorges 4140Sstevel@tonic-gate void tmp_rput(queue_t *q, mblk_t *mp); 4150Sstevel@tonic-gate 4160Sstevel@tonic-gate struct xprt_style_ops tmpops = { 4170Sstevel@tonic-gate NULL, 4180Sstevel@tonic-gate NULL, 4190Sstevel@tonic-gate putnext, 4200Sstevel@tonic-gate NULL, 4210Sstevel@tonic-gate tmp_rput, 4220Sstevel@tonic-gate NULL 4230Sstevel@tonic-gate }; 4240Sstevel@tonic-gate 4250Sstevel@tonic-gate void 4260Sstevel@tonic-gate tmp_rput(queue_t *q, mblk_t *mp) 4270Sstevel@tonic-gate { 4280Sstevel@tonic-gate struct temp_slot *t = (struct temp_slot *)(q->q_ptr); 4290Sstevel@tonic-gate struct T_info_ack *pptr; 4300Sstevel@tonic-gate 4310Sstevel@tonic-gate switch (mp->b_datap->db_type) { 4320Sstevel@tonic-gate case M_PCPROTO: 4330Sstevel@tonic-gate pptr = (struct T_info_ack *)mp->b_rptr; 4340Sstevel@tonic-gate switch (pptr->PRIM_type) { 4350Sstevel@tonic-gate case T_INFO_ACK: 4360Sstevel@tonic-gate mutex_enter(&t->lock); 4370Sstevel@tonic-gate t->info_ack = mp; 4380Sstevel@tonic-gate cv_signal(&t->wait); 4390Sstevel@tonic-gate mutex_exit(&t->lock); 4400Sstevel@tonic-gate return; 4410Sstevel@tonic-gate default: 4420Sstevel@tonic-gate break; 4430Sstevel@tonic-gate } 4440Sstevel@tonic-gate default: 4450Sstevel@tonic-gate break; 4460Sstevel@tonic-gate } 4470Sstevel@tonic-gate 4480Sstevel@tonic-gate /* 4490Sstevel@tonic-gate * Not an info-ack, so free it. This is ok because we should 4500Sstevel@tonic-gate * not be receiving data until the open finishes: rpcmod 4510Sstevel@tonic-gate * is pushed well before the end-point is bound to an address. 
4520Sstevel@tonic-gate */ 4530Sstevel@tonic-gate freemsg(mp); 4540Sstevel@tonic-gate } 4550Sstevel@tonic-gate 4560Sstevel@tonic-gate int 4570Sstevel@tonic-gate rmm_open(queue_t *q, dev_t *devp, int flag, int sflag, cred_t *crp) 4580Sstevel@tonic-gate { 4590Sstevel@tonic-gate mblk_t *bp; 4600Sstevel@tonic-gate struct temp_slot ts, *t; 4610Sstevel@tonic-gate struct T_info_ack *pptr; 4620Sstevel@tonic-gate int error = 0; 4630Sstevel@tonic-gate 4640Sstevel@tonic-gate ASSERT(q != NULL); 4650Sstevel@tonic-gate /* 4660Sstevel@tonic-gate * Check for re-opens. 4670Sstevel@tonic-gate */ 4680Sstevel@tonic-gate if (q->q_ptr) { 4690Sstevel@tonic-gate TRACE_1(TR_FAC_KRPC, TR_RPCMODOPEN_END, 4700Sstevel@tonic-gate "rpcmodopen_end:(%s)", "q->qptr"); 4710Sstevel@tonic-gate return (0); 4720Sstevel@tonic-gate } 4730Sstevel@tonic-gate 4740Sstevel@tonic-gate t = &ts; 4750Sstevel@tonic-gate bzero(t, sizeof (*t)); 4760Sstevel@tonic-gate q->q_ptr = (void *)t; 4774386Sgeorges WR(q)->q_ptr = (void *)t; 4780Sstevel@tonic-gate 4790Sstevel@tonic-gate /* 4800Sstevel@tonic-gate * Allocate the required messages upfront. 
4810Sstevel@tonic-gate */ 4820Sstevel@tonic-gate if ((bp = allocb(sizeof (struct T_info_req) + 4830Sstevel@tonic-gate sizeof (struct T_info_ack), BPRI_LO)) == (mblk_t *)NULL) { 4840Sstevel@tonic-gate return (ENOBUFS); 4850Sstevel@tonic-gate } 4860Sstevel@tonic-gate 4870Sstevel@tonic-gate mutex_init(&t->lock, NULL, MUTEX_DEFAULT, NULL); 4880Sstevel@tonic-gate cv_init(&t->wait, NULL, CV_DEFAULT, NULL); 4890Sstevel@tonic-gate 4900Sstevel@tonic-gate t->ops = &tmpops; 4910Sstevel@tonic-gate 4920Sstevel@tonic-gate qprocson(q); 4930Sstevel@tonic-gate bp->b_datap->db_type = M_PCPROTO; 4940Sstevel@tonic-gate *(int32_t *)bp->b_wptr = (int32_t)T_INFO_REQ; 4950Sstevel@tonic-gate bp->b_wptr += sizeof (struct T_info_req); 4960Sstevel@tonic-gate putnext(WR(q), bp); 4970Sstevel@tonic-gate 4980Sstevel@tonic-gate mutex_enter(&t->lock); 4994386Sgeorges while (t->info_ack == NULL) { 5000Sstevel@tonic-gate if (cv_wait_sig(&t->wait, &t->lock) == 0) { 5010Sstevel@tonic-gate error = EINTR; 5020Sstevel@tonic-gate break; 5030Sstevel@tonic-gate } 5040Sstevel@tonic-gate } 5050Sstevel@tonic-gate mutex_exit(&t->lock); 5064386Sgeorges 5070Sstevel@tonic-gate if (error) 5080Sstevel@tonic-gate goto out; 5090Sstevel@tonic-gate 5100Sstevel@tonic-gate pptr = (struct T_info_ack *)t->info_ack->b_rptr; 5110Sstevel@tonic-gate 5120Sstevel@tonic-gate if (pptr->SERV_type == T_CLTS) { 5134386Sgeorges if ((error = rpcmodopen(q, devp, flag, sflag, crp)) == 0) 5144386Sgeorges ((struct rpcm *)q->q_ptr)->rm_ops = &xprt_clts_ops; 5150Sstevel@tonic-gate } else { 5164386Sgeorges if ((error = mir_open(q, devp, flag, sflag, crp)) == 0) 5174386Sgeorges ((mir_t *)q->q_ptr)->rm_ops = &xprt_cots_ops; 5180Sstevel@tonic-gate } 5190Sstevel@tonic-gate 5200Sstevel@tonic-gate out: 5214386Sgeorges if (error) 5220Sstevel@tonic-gate qprocsoff(q); 5230Sstevel@tonic-gate 5244386Sgeorges freemsg(t->info_ack); 5254386Sgeorges mutex_destroy(&t->lock); 5264386Sgeorges cv_destroy(&t->wait); 5274386Sgeorges 5280Sstevel@tonic-gate return 
(error); 5290Sstevel@tonic-gate } 5300Sstevel@tonic-gate 5310Sstevel@tonic-gate void 5320Sstevel@tonic-gate rmm_rput(queue_t *q, mblk_t *mp) 5330Sstevel@tonic-gate { 5340Sstevel@tonic-gate (*((struct temp_slot *)q->q_ptr)->ops->xo_rput)(q, mp); 5350Sstevel@tonic-gate } 5360Sstevel@tonic-gate 5370Sstevel@tonic-gate void 5380Sstevel@tonic-gate rmm_rsrv(queue_t *q) 5390Sstevel@tonic-gate { 5400Sstevel@tonic-gate (*((struct temp_slot *)q->q_ptr)->ops->xo_rsrv)(q); 5410Sstevel@tonic-gate } 5420Sstevel@tonic-gate 5430Sstevel@tonic-gate void 5440Sstevel@tonic-gate rmm_wput(queue_t *q, mblk_t *mp) 5450Sstevel@tonic-gate { 5460Sstevel@tonic-gate (*((struct temp_slot *)q->q_ptr)->ops->xo_wput)(q, mp); 5470Sstevel@tonic-gate } 5480Sstevel@tonic-gate 5490Sstevel@tonic-gate void 5500Sstevel@tonic-gate rmm_wsrv(queue_t *q) 5510Sstevel@tonic-gate { 5520Sstevel@tonic-gate (*((struct temp_slot *)q->q_ptr)->ops->xo_wsrv)(q); 5530Sstevel@tonic-gate } 5540Sstevel@tonic-gate 5550Sstevel@tonic-gate int 5560Sstevel@tonic-gate rmm_close(queue_t *q, int flag, cred_t *crp) 5570Sstevel@tonic-gate { 5580Sstevel@tonic-gate return ((*((struct temp_slot *)q->q_ptr)->ops->xo_close)(q, flag, crp)); 5590Sstevel@tonic-gate } 5600Sstevel@tonic-gate 5610Sstevel@tonic-gate /* 5620Sstevel@tonic-gate * rpcmodopen - open routine gets called when the module gets pushed 5630Sstevel@tonic-gate * onto the stream. 
5640Sstevel@tonic-gate */ 5650Sstevel@tonic-gate /*ARGSUSED*/ 5660Sstevel@tonic-gate int 5670Sstevel@tonic-gate rpcmodopen(queue_t *q, dev_t *devp, int flag, int sflag, cred_t *crp) 5680Sstevel@tonic-gate { 5690Sstevel@tonic-gate struct rpcm *rmp; 5700Sstevel@tonic-gate 5710Sstevel@tonic-gate extern void (*rpc_rele)(queue_t *, mblk_t *); 5720Sstevel@tonic-gate static void rpcmod_release(queue_t *, mblk_t *); 5730Sstevel@tonic-gate 5740Sstevel@tonic-gate TRACE_0(TR_FAC_KRPC, TR_RPCMODOPEN_START, "rpcmodopen_start:"); 5750Sstevel@tonic-gate 5760Sstevel@tonic-gate /* 5770Sstevel@tonic-gate * Initialize entry points to release a rpcmod slot (and an input 5780Sstevel@tonic-gate * message if supplied) and to send an output message to the module 5790Sstevel@tonic-gate * below rpcmod. 5800Sstevel@tonic-gate */ 5810Sstevel@tonic-gate if (rpc_rele == NULL) 5820Sstevel@tonic-gate rpc_rele = rpcmod_release; 5830Sstevel@tonic-gate 5840Sstevel@tonic-gate /* 5850Sstevel@tonic-gate * Only sufficiently privileged users can use this module, and it 5860Sstevel@tonic-gate * is assumed that they will use this module properly, and NOT send 5870Sstevel@tonic-gate * bulk data from downstream. 5880Sstevel@tonic-gate */ 5890Sstevel@tonic-gate if (secpolicy_rpcmod_open(crp) != 0) 5900Sstevel@tonic-gate return (EPERM); 5910Sstevel@tonic-gate 5920Sstevel@tonic-gate /* 5930Sstevel@tonic-gate * Allocate slot data structure. 
5940Sstevel@tonic-gate */ 5950Sstevel@tonic-gate rmp = kmem_zalloc(sizeof (*rmp), KM_SLEEP); 5960Sstevel@tonic-gate 5970Sstevel@tonic-gate mutex_init(&rmp->rm_lock, NULL, MUTEX_DEFAULT, NULL); 5980Sstevel@tonic-gate cv_init(&rmp->rm_cwait, NULL, CV_DEFAULT, NULL); 599766Scarlsonj rmp->rm_zoneid = rpc_zoneid(); 6000Sstevel@tonic-gate /* 6010Sstevel@tonic-gate * slot type will be set by kRPC client and server ioctl's 6020Sstevel@tonic-gate */ 6030Sstevel@tonic-gate rmp->rm_type = 0; 6040Sstevel@tonic-gate 6050Sstevel@tonic-gate q->q_ptr = (void *)rmp; 6060Sstevel@tonic-gate WR(q)->q_ptr = (void *)rmp; 6070Sstevel@tonic-gate 6080Sstevel@tonic-gate TRACE_1(TR_FAC_KRPC, TR_RPCMODOPEN_END, "rpcmodopen_end:(%s)", "end"); 6090Sstevel@tonic-gate return (0); 6100Sstevel@tonic-gate } 6110Sstevel@tonic-gate 6120Sstevel@tonic-gate /* 6130Sstevel@tonic-gate * rpcmodclose - This routine gets called when the module gets popped 6140Sstevel@tonic-gate * off of the stream. 6150Sstevel@tonic-gate */ 6160Sstevel@tonic-gate /*ARGSUSED*/ 6170Sstevel@tonic-gate int 6180Sstevel@tonic-gate rpcmodclose(queue_t *q, int flag, cred_t *crp) 6190Sstevel@tonic-gate { 6200Sstevel@tonic-gate struct rpcm *rmp; 6210Sstevel@tonic-gate 6220Sstevel@tonic-gate ASSERT(q != NULL); 6230Sstevel@tonic-gate rmp = (struct rpcm *)q->q_ptr; 6240Sstevel@tonic-gate 6250Sstevel@tonic-gate /* 6260Sstevel@tonic-gate * Mark our state as closing. 6270Sstevel@tonic-gate */ 6280Sstevel@tonic-gate mutex_enter(&rmp->rm_lock); 6290Sstevel@tonic-gate rmp->rm_state |= RM_CLOSING; 6300Sstevel@tonic-gate 6310Sstevel@tonic-gate /* 6320Sstevel@tonic-gate * Check and see if there are any messages on the queue. If so, send 6330Sstevel@tonic-gate * the messages, regardless whether the downstream module is ready to 6340Sstevel@tonic-gate * accept data. 
6350Sstevel@tonic-gate */ 6360Sstevel@tonic-gate if (rmp->rm_type == RPC_SERVER) { 6370Sstevel@tonic-gate flushq(q, FLUSHDATA); 6380Sstevel@tonic-gate 6390Sstevel@tonic-gate qenable(WR(q)); 6400Sstevel@tonic-gate 6410Sstevel@tonic-gate if (rmp->rm_ref) { 6420Sstevel@tonic-gate mutex_exit(&rmp->rm_lock); 6430Sstevel@tonic-gate /* 6440Sstevel@tonic-gate * call into SVC to clean the queue 6450Sstevel@tonic-gate */ 6460Sstevel@tonic-gate svc_queueclean(q); 6470Sstevel@tonic-gate mutex_enter(&rmp->rm_lock); 6480Sstevel@tonic-gate 6490Sstevel@tonic-gate /* 6500Sstevel@tonic-gate * Block while there are kRPC threads with a reference 6510Sstevel@tonic-gate * to this message. 6520Sstevel@tonic-gate */ 6530Sstevel@tonic-gate while (rmp->rm_ref) 6540Sstevel@tonic-gate cv_wait(&rmp->rm_cwait, &rmp->rm_lock); 6550Sstevel@tonic-gate } 6560Sstevel@tonic-gate 6570Sstevel@tonic-gate mutex_exit(&rmp->rm_lock); 6580Sstevel@tonic-gate 6590Sstevel@tonic-gate /* 6600Sstevel@tonic-gate * It is now safe to remove this queue from the stream. No kRPC 6610Sstevel@tonic-gate * threads have a reference to the stream, and none ever will, 6620Sstevel@tonic-gate * because RM_CLOSING is set. 6630Sstevel@tonic-gate */ 6640Sstevel@tonic-gate qprocsoff(q); 6650Sstevel@tonic-gate 6660Sstevel@tonic-gate /* Notify kRPC that this stream is going away. 
*/ 6670Sstevel@tonic-gate svc_queueclose(q); 6680Sstevel@tonic-gate } else { 6690Sstevel@tonic-gate mutex_exit(&rmp->rm_lock); 6700Sstevel@tonic-gate qprocsoff(q); 6710Sstevel@tonic-gate } 6720Sstevel@tonic-gate 6730Sstevel@tonic-gate q->q_ptr = NULL; 6740Sstevel@tonic-gate WR(q)->q_ptr = NULL; 6750Sstevel@tonic-gate mutex_destroy(&rmp->rm_lock); 6760Sstevel@tonic-gate cv_destroy(&rmp->rm_cwait); 6770Sstevel@tonic-gate kmem_free(rmp, sizeof (*rmp)); 6780Sstevel@tonic-gate return (0); 6790Sstevel@tonic-gate } 6800Sstevel@tonic-gate 6810Sstevel@tonic-gate #ifdef DEBUG 6820Sstevel@tonic-gate int rpcmod_send_msg_up = 0; 6830Sstevel@tonic-gate int rpcmod_send_uderr = 0; 6840Sstevel@tonic-gate int rpcmod_send_dup = 0; 6850Sstevel@tonic-gate int rpcmod_send_dup_cnt = 0; 6860Sstevel@tonic-gate #endif 6870Sstevel@tonic-gate 6880Sstevel@tonic-gate /* 6890Sstevel@tonic-gate * rpcmodrput - Module read put procedure. This is called from 6900Sstevel@tonic-gate * the module, driver, or stream head downstream. 
6910Sstevel@tonic-gate */ 6920Sstevel@tonic-gate void 6930Sstevel@tonic-gate rpcmodrput(queue_t *q, mblk_t *mp) 6940Sstevel@tonic-gate { 6950Sstevel@tonic-gate struct rpcm *rmp; 6960Sstevel@tonic-gate union T_primitives *pptr; 6970Sstevel@tonic-gate int hdrsz; 6980Sstevel@tonic-gate 6990Sstevel@tonic-gate TRACE_0(TR_FAC_KRPC, TR_RPCMODRPUT_START, "rpcmodrput_start:"); 7000Sstevel@tonic-gate 7010Sstevel@tonic-gate ASSERT(q != NULL); 7020Sstevel@tonic-gate rmp = (struct rpcm *)q->q_ptr; 7030Sstevel@tonic-gate 7040Sstevel@tonic-gate if (rmp->rm_type == 0) { 7050Sstevel@tonic-gate freemsg(mp); 7060Sstevel@tonic-gate return; 7070Sstevel@tonic-gate } 7080Sstevel@tonic-gate 7090Sstevel@tonic-gate #ifdef DEBUG 7100Sstevel@tonic-gate if (rpcmod_send_msg_up > 0) { 7110Sstevel@tonic-gate mblk_t *nmp = copymsg(mp); 7120Sstevel@tonic-gate if (nmp) { 7130Sstevel@tonic-gate putnext(q, nmp); 7140Sstevel@tonic-gate rpcmod_send_msg_up--; 7150Sstevel@tonic-gate } 7160Sstevel@tonic-gate } 7170Sstevel@tonic-gate if ((rpcmod_send_uderr > 0) && mp->b_datap->db_type == M_PROTO) { 7180Sstevel@tonic-gate mblk_t *nmp; 7190Sstevel@tonic-gate struct T_unitdata_ind *data; 7200Sstevel@tonic-gate struct T_uderror_ind *ud; 7210Sstevel@tonic-gate int d; 7220Sstevel@tonic-gate data = (struct T_unitdata_ind *)mp->b_rptr; 7230Sstevel@tonic-gate if (data->PRIM_type == T_UNITDATA_IND) { 7240Sstevel@tonic-gate d = sizeof (*ud) - sizeof (*data); 7250Sstevel@tonic-gate nmp = allocb(mp->b_wptr - mp->b_rptr + d, BPRI_HI); 7260Sstevel@tonic-gate if (nmp) { 7270Sstevel@tonic-gate ud = (struct T_uderror_ind *)nmp->b_rptr; 7280Sstevel@tonic-gate ud->PRIM_type = T_UDERROR_IND; 7290Sstevel@tonic-gate ud->DEST_length = data->SRC_length; 7300Sstevel@tonic-gate ud->DEST_offset = data->SRC_offset + d; 7310Sstevel@tonic-gate ud->OPT_length = data->OPT_length; 7320Sstevel@tonic-gate ud->OPT_offset = data->OPT_offset + d; 7330Sstevel@tonic-gate ud->ERROR_type = ENETDOWN; 7340Sstevel@tonic-gate if (data->SRC_length) { 
7350Sstevel@tonic-gate bcopy(mp->b_rptr + 7360Sstevel@tonic-gate data->SRC_offset, 7370Sstevel@tonic-gate nmp->b_rptr + 7380Sstevel@tonic-gate ud->DEST_offset, 7390Sstevel@tonic-gate data->SRC_length); 7400Sstevel@tonic-gate } 7410Sstevel@tonic-gate if (data->OPT_length) { 7420Sstevel@tonic-gate bcopy(mp->b_rptr + 7430Sstevel@tonic-gate data->OPT_offset, 7440Sstevel@tonic-gate nmp->b_rptr + 7450Sstevel@tonic-gate ud->OPT_offset, 7460Sstevel@tonic-gate data->OPT_length); 7470Sstevel@tonic-gate } 7480Sstevel@tonic-gate nmp->b_wptr += d; 7490Sstevel@tonic-gate nmp->b_wptr += (mp->b_wptr - mp->b_rptr); 7500Sstevel@tonic-gate nmp->b_datap->db_type = M_PROTO; 7510Sstevel@tonic-gate putnext(q, nmp); 7520Sstevel@tonic-gate rpcmod_send_uderr--; 7530Sstevel@tonic-gate } 7540Sstevel@tonic-gate } 7550Sstevel@tonic-gate } 7560Sstevel@tonic-gate #endif 7570Sstevel@tonic-gate switch (mp->b_datap->db_type) { 7580Sstevel@tonic-gate default: 7590Sstevel@tonic-gate putnext(q, mp); 7600Sstevel@tonic-gate break; 7610Sstevel@tonic-gate 7620Sstevel@tonic-gate case M_PROTO: 7630Sstevel@tonic-gate case M_PCPROTO: 7640Sstevel@tonic-gate ASSERT((mp->b_wptr - mp->b_rptr) >= sizeof (int32_t)); 7650Sstevel@tonic-gate pptr = (union T_primitives *)mp->b_rptr; 7660Sstevel@tonic-gate 7670Sstevel@tonic-gate /* 7680Sstevel@tonic-gate * Forward this message to krpc if it is data. 7690Sstevel@tonic-gate */ 7700Sstevel@tonic-gate if (pptr->type == T_UNITDATA_IND) { 771*4741Sgt29601 mblk_t *nmp; 7720Sstevel@tonic-gate 7730Sstevel@tonic-gate /* 7740Sstevel@tonic-gate * Check if the module is being popped. 
7750Sstevel@tonic-gate */ 776*4741Sgt29601 mutex_enter(&rmp->rm_lock); 777*4741Sgt29601 if (rmp->rm_state & RM_CLOSING) { 778*4741Sgt29601 mutex_exit(&rmp->rm_lock); 779*4741Sgt29601 putnext(q, mp); 780*4741Sgt29601 break; 781*4741Sgt29601 } 782*4741Sgt29601 783*4741Sgt29601 switch (rmp->rm_type) { 784*4741Sgt29601 case RPC_CLIENT: 785*4741Sgt29601 mutex_exit(&rmp->rm_lock); 786*4741Sgt29601 hdrsz = mp->b_wptr - mp->b_rptr; 787*4741Sgt29601 788*4741Sgt29601 /* 789*4741Sgt29601 * Make sure the header is sane. 790*4741Sgt29601 */ 791*4741Sgt29601 if (hdrsz < TUNITDATAINDSZ || 792*4741Sgt29601 hdrsz < (pptr->unitdata_ind.OPT_length + 793*4741Sgt29601 pptr->unitdata_ind.OPT_offset) || 794*4741Sgt29601 hdrsz < (pptr->unitdata_ind.SRC_length + 795*4741Sgt29601 pptr->unitdata_ind.SRC_offset)) { 796*4741Sgt29601 freemsg(mp); 797*4741Sgt29601 return; 798*4741Sgt29601 } 799*4741Sgt29601 800*4741Sgt29601 /* 801*4741Sgt29601 * Call clnt_clts_dispatch_notify, so that it 802*4741Sgt29601 * can pass the message to the proper caller. 803*4741Sgt29601 * Don't discard the header just yet since the 804*4741Sgt29601 * client may need the sender's address. 805*4741Sgt29601 */ 806*4741Sgt29601 clnt_clts_dispatch_notify(mp, hdrsz, 807*4741Sgt29601 rmp->rm_zoneid); 808*4741Sgt29601 return; 809*4741Sgt29601 case RPC_SERVER: 810*4741Sgt29601 /* 811*4741Sgt29601 * rm_krpc_cell is exclusively used by the kRPC 812*4741Sgt29601 * CLTS server 813*4741Sgt29601 */ 814*4741Sgt29601 if (rmp->rm_krpc_cell) { 815*4741Sgt29601 #ifdef DEBUG 816*4741Sgt29601 /* 817*4741Sgt29601 * Test duplicate request cache and 818*4741Sgt29601 * rm_ref count handling by sending a 819*4741Sgt29601 * duplicate every so often, if 820*4741Sgt29601 * desired. 
821*4741Sgt29601 */ 822*4741Sgt29601 if (rpcmod_send_dup && 823*4741Sgt29601 rpcmod_send_dup_cnt++ % 824*4741Sgt29601 rpcmod_send_dup) 825*4741Sgt29601 nmp = copymsg(mp); 826*4741Sgt29601 else 827*4741Sgt29601 nmp = NULL; 828*4741Sgt29601 #endif 829*4741Sgt29601 /* 830*4741Sgt29601 * Raise the reference count on this 831*4741Sgt29601 * module to prevent it from being 832*4741Sgt29601 * popped before krpc generates the 833*4741Sgt29601 * reply. 834*4741Sgt29601 */ 835*4741Sgt29601 rmp->rm_ref++; 836*4741Sgt29601 mutex_exit(&rmp->rm_lock); 837*4741Sgt29601 838*4741Sgt29601 /* 839*4741Sgt29601 * Submit the message to krpc. 840*4741Sgt29601 */ 841*4741Sgt29601 svc_queuereq(q, mp); 842*4741Sgt29601 #ifdef DEBUG 843*4741Sgt29601 /* 844*4741Sgt29601 * Send duplicate if we created one. 845*4741Sgt29601 */ 846*4741Sgt29601 if (nmp) { 847*4741Sgt29601 mutex_enter(&rmp->rm_lock); 848*4741Sgt29601 rmp->rm_ref++; 849*4741Sgt29601 mutex_exit(&rmp->rm_lock); 850*4741Sgt29601 svc_queuereq(q, nmp); 851*4741Sgt29601 } 852*4741Sgt29601 #endif 853*4741Sgt29601 } else { 854*4741Sgt29601 mutex_exit(&rmp->rm_lock); 855*4741Sgt29601 freemsg(mp); 856*4741Sgt29601 } 857*4741Sgt29601 return; 858*4741Sgt29601 default: 859*4741Sgt29601 mutex_exit(&rmp->rm_lock); 860*4741Sgt29601 freemsg(mp); 861*4741Sgt29601 return; 862*4741Sgt29601 } /* end switch(rmp->rm_type) */ 863*4741Sgt29601 } else if (pptr->type == T_UDERROR_IND) { 864*4741Sgt29601 mutex_enter(&rmp->rm_lock); 8650Sstevel@tonic-gate hdrsz = mp->b_wptr - mp->b_rptr; 8660Sstevel@tonic-gate 8670Sstevel@tonic-gate /* 868*4741Sgt29601 * Make sure the header is sane 8690Sstevel@tonic-gate */ 870*4741Sgt29601 if (hdrsz < TUDERRORINDSZ || 871*4741Sgt29601 hdrsz < (pptr->uderror_ind.OPT_length + 872*4741Sgt29601 pptr->uderror_ind.OPT_offset) || 873*4741Sgt29601 hdrsz < (pptr->uderror_ind.DEST_length + 874*4741Sgt29601 pptr->uderror_ind.DEST_offset)) { 875*4741Sgt29601 mutex_exit(&rmp->rm_lock); 876*4741Sgt29601 freemsg(mp); 877*4741Sgt29601 
return; 8780Sstevel@tonic-gate } 8790Sstevel@tonic-gate 8800Sstevel@tonic-gate /* 881*4741Sgt29601 * In the case where a unit data error has been 882*4741Sgt29601 * received, all we need to do is clear the message from 883*4741Sgt29601 * the queue. 8840Sstevel@tonic-gate */ 8850Sstevel@tonic-gate mutex_exit(&rmp->rm_lock); 8860Sstevel@tonic-gate freemsg(mp); 887*4741Sgt29601 RPCLOG(32, "rpcmodrput: unitdata error received at " 888*4741Sgt29601 "%ld\n", gethrestime_sec()); 8890Sstevel@tonic-gate return; 8900Sstevel@tonic-gate } /* end else if (pptr->type == T_UDERROR_IND) */ 8910Sstevel@tonic-gate 8920Sstevel@tonic-gate putnext(q, mp); 8930Sstevel@tonic-gate break; 8940Sstevel@tonic-gate } /* end switch (mp->b_datap->db_type) */ 8950Sstevel@tonic-gate 8960Sstevel@tonic-gate TRACE_0(TR_FAC_KRPC, TR_RPCMODRPUT_END, 897*4741Sgt29601 "rpcmodrput_end:"); 8980Sstevel@tonic-gate /* 8990Sstevel@tonic-gate * Return codes are not looked at by the STREAMS framework. 9000Sstevel@tonic-gate */ 9010Sstevel@tonic-gate } 9020Sstevel@tonic-gate 9030Sstevel@tonic-gate /* 9040Sstevel@tonic-gate * write put procedure 9050Sstevel@tonic-gate */ 9060Sstevel@tonic-gate void 9070Sstevel@tonic-gate rpcmodwput(queue_t *q, mblk_t *mp) 9080Sstevel@tonic-gate { 9090Sstevel@tonic-gate struct rpcm *rmp; 9100Sstevel@tonic-gate 9110Sstevel@tonic-gate ASSERT(q != NULL); 9120Sstevel@tonic-gate 9130Sstevel@tonic-gate switch (mp->b_datap->db_type) { 914*4741Sgt29601 case M_PROTO: 915*4741Sgt29601 case M_PCPROTO: 916*4741Sgt29601 break; 917*4741Sgt29601 default: 918*4741Sgt29601 rpcmodwput_other(q, mp); 919*4741Sgt29601 return; 9200Sstevel@tonic-gate } 9210Sstevel@tonic-gate 9220Sstevel@tonic-gate /* 9230Sstevel@tonic-gate * Check to see if we can send the message downstream. 
9240Sstevel@tonic-gate */ 9250Sstevel@tonic-gate if (canputnext(q)) { 9260Sstevel@tonic-gate putnext(q, mp); 9270Sstevel@tonic-gate return; 9280Sstevel@tonic-gate } 9290Sstevel@tonic-gate 9300Sstevel@tonic-gate rmp = (struct rpcm *)q->q_ptr; 9310Sstevel@tonic-gate ASSERT(rmp != NULL); 9320Sstevel@tonic-gate 9330Sstevel@tonic-gate /* 9340Sstevel@tonic-gate * The first canputnext failed. Try again except this time with the 9350Sstevel@tonic-gate * lock held, so that we can check the state of the stream to see if 9360Sstevel@tonic-gate * it is closing. If either of these conditions evaluate to true 9370Sstevel@tonic-gate * then send the meesage. 9380Sstevel@tonic-gate */ 9390Sstevel@tonic-gate mutex_enter(&rmp->rm_lock); 9400Sstevel@tonic-gate if (canputnext(q) || (rmp->rm_state & RM_CLOSING)) { 9410Sstevel@tonic-gate mutex_exit(&rmp->rm_lock); 9420Sstevel@tonic-gate putnext(q, mp); 9430Sstevel@tonic-gate } else { 9440Sstevel@tonic-gate /* 9450Sstevel@tonic-gate * canputnext failed again and the stream is not closing. 9460Sstevel@tonic-gate * Place the message on the queue and let the service 9470Sstevel@tonic-gate * procedure handle the message. 
9480Sstevel@tonic-gate */ 9490Sstevel@tonic-gate mutex_exit(&rmp->rm_lock); 9500Sstevel@tonic-gate (void) putq(q, mp); 9510Sstevel@tonic-gate } 9520Sstevel@tonic-gate } 9530Sstevel@tonic-gate 9540Sstevel@tonic-gate static void 9550Sstevel@tonic-gate rpcmodwput_other(queue_t *q, mblk_t *mp) 9560Sstevel@tonic-gate { 9570Sstevel@tonic-gate struct rpcm *rmp; 9580Sstevel@tonic-gate struct iocblk *iocp; 9590Sstevel@tonic-gate 9600Sstevel@tonic-gate rmp = (struct rpcm *)q->q_ptr; 9610Sstevel@tonic-gate ASSERT(rmp != NULL); 9620Sstevel@tonic-gate 9630Sstevel@tonic-gate switch (mp->b_datap->db_type) { 9640Sstevel@tonic-gate case M_IOCTL: 9650Sstevel@tonic-gate iocp = (struct iocblk *)mp->b_rptr; 9660Sstevel@tonic-gate ASSERT(iocp != NULL); 9670Sstevel@tonic-gate switch (iocp->ioc_cmd) { 968*4741Sgt29601 case RPC_CLIENT: 969*4741Sgt29601 case RPC_SERVER: 970*4741Sgt29601 mutex_enter(&rmp->rm_lock); 971*4741Sgt29601 rmp->rm_type = iocp->ioc_cmd; 972*4741Sgt29601 mutex_exit(&rmp->rm_lock); 973*4741Sgt29601 mp->b_datap->db_type = M_IOCACK; 974*4741Sgt29601 qreply(q, mp); 975*4741Sgt29601 return; 976*4741Sgt29601 default: 9770Sstevel@tonic-gate /* 9780Sstevel@tonic-gate * pass the ioctl downstream and hope someone 9790Sstevel@tonic-gate * down there knows how to handle it. 9800Sstevel@tonic-gate */ 981*4741Sgt29601 putnext(q, mp); 982*4741Sgt29601 return; 9830Sstevel@tonic-gate } 9840Sstevel@tonic-gate default: 9850Sstevel@tonic-gate break; 9860Sstevel@tonic-gate } 9870Sstevel@tonic-gate /* 9880Sstevel@tonic-gate * This is something we definitely do not know how to handle, just 9890Sstevel@tonic-gate * pass the message downstream 9900Sstevel@tonic-gate */ 9910Sstevel@tonic-gate putnext(q, mp); 9920Sstevel@tonic-gate } 9930Sstevel@tonic-gate 9940Sstevel@tonic-gate /* 9950Sstevel@tonic-gate * Module write service procedure. This is called by downstream modules 9960Sstevel@tonic-gate * for back enabling during flow control. 
9970Sstevel@tonic-gate */ 9980Sstevel@tonic-gate void 9990Sstevel@tonic-gate rpcmodwsrv(queue_t *q) 10000Sstevel@tonic-gate { 10010Sstevel@tonic-gate struct rpcm *rmp; 10020Sstevel@tonic-gate mblk_t *mp = NULL; 10030Sstevel@tonic-gate 10040Sstevel@tonic-gate rmp = (struct rpcm *)q->q_ptr; 10050Sstevel@tonic-gate ASSERT(rmp != NULL); 10060Sstevel@tonic-gate 10070Sstevel@tonic-gate /* 10080Sstevel@tonic-gate * Get messages that may be queued and send them down stream 10090Sstevel@tonic-gate */ 10100Sstevel@tonic-gate while ((mp = getq(q)) != NULL) { 10110Sstevel@tonic-gate /* 10120Sstevel@tonic-gate * Optimize the service procedure for the server-side, by 10130Sstevel@tonic-gate * avoiding a call to canputnext(). 10140Sstevel@tonic-gate */ 10150Sstevel@tonic-gate if (rmp->rm_type == RPC_SERVER || canputnext(q)) { 10160Sstevel@tonic-gate putnext(q, mp); 10170Sstevel@tonic-gate continue; 10180Sstevel@tonic-gate } 10190Sstevel@tonic-gate (void) putbq(q, mp); 10200Sstevel@tonic-gate return; 10210Sstevel@tonic-gate } 10220Sstevel@tonic-gate } 10230Sstevel@tonic-gate 10240Sstevel@tonic-gate static void 10250Sstevel@tonic-gate rpcmod_release(queue_t *q, mblk_t *bp) 10260Sstevel@tonic-gate { 10270Sstevel@tonic-gate struct rpcm *rmp; 10280Sstevel@tonic-gate 10290Sstevel@tonic-gate /* 10300Sstevel@tonic-gate * For now, just free the message. 
10310Sstevel@tonic-gate */ 10320Sstevel@tonic-gate if (bp) 10330Sstevel@tonic-gate freemsg(bp); 10340Sstevel@tonic-gate rmp = (struct rpcm *)q->q_ptr; 10350Sstevel@tonic-gate 10360Sstevel@tonic-gate mutex_enter(&rmp->rm_lock); 10370Sstevel@tonic-gate rmp->rm_ref--; 10380Sstevel@tonic-gate 10390Sstevel@tonic-gate if (rmp->rm_ref == 0 && (rmp->rm_state & RM_CLOSING)) { 10400Sstevel@tonic-gate cv_broadcast(&rmp->rm_cwait); 10410Sstevel@tonic-gate } 10420Sstevel@tonic-gate 10430Sstevel@tonic-gate mutex_exit(&rmp->rm_lock); 10440Sstevel@tonic-gate } 10450Sstevel@tonic-gate 10460Sstevel@tonic-gate /* 10470Sstevel@tonic-gate * This part of rpcmod is pushed on a connection-oriented transport for use 10480Sstevel@tonic-gate * by RPC. It serves to bypass the Stream head, implements 10490Sstevel@tonic-gate * the record marking protocol, and dispatches incoming RPC messages. 10500Sstevel@tonic-gate */ 10510Sstevel@tonic-gate 10520Sstevel@tonic-gate /* Default idle timer values */ 10530Sstevel@tonic-gate #define MIR_CLNT_IDLE_TIMEOUT (5 * (60 * 1000L)) /* 5 minutes */ 10540Sstevel@tonic-gate #define MIR_SVC_IDLE_TIMEOUT (6 * (60 * 1000L)) /* 6 minutes */ 10550Sstevel@tonic-gate #define MIR_SVC_ORDREL_TIMEOUT (10 * (60 * 1000L)) /* 10 minutes */ 10560Sstevel@tonic-gate #define MIR_LASTFRAG 0x80000000 /* Record marker */ 10570Sstevel@tonic-gate 10580Sstevel@tonic-gate #define DLEN(mp) (mp->b_cont ? 
msgdsize(mp) : (mp->b_wptr - mp->b_rptr)) 10590Sstevel@tonic-gate 10600Sstevel@tonic-gate #define MIR_SVC_QUIESCED(mir) \ 10610Sstevel@tonic-gate (mir->mir_ref_cnt == 0 && mir->mir_inrservice == 0) 10620Sstevel@tonic-gate 10630Sstevel@tonic-gate #define MIR_CLEAR_INRSRV(mir_ptr) { \ 10640Sstevel@tonic-gate (mir_ptr)->mir_inrservice = 0; \ 10650Sstevel@tonic-gate if ((mir_ptr)->mir_type == RPC_SERVER && \ 10660Sstevel@tonic-gate (mir_ptr)->mir_closing) \ 10670Sstevel@tonic-gate cv_signal(&(mir_ptr)->mir_condvar); \ 10680Sstevel@tonic-gate } 10690Sstevel@tonic-gate 10700Sstevel@tonic-gate /* 10710Sstevel@tonic-gate * Don't block service procedure (and mir_close) if 10720Sstevel@tonic-gate * we are in the process of closing. 10730Sstevel@tonic-gate */ 10740Sstevel@tonic-gate #define MIR_WCANPUTNEXT(mir_ptr, write_q) \ 10750Sstevel@tonic-gate (canputnext(write_q) || ((mir_ptr)->mir_svc_no_more_msgs == 1)) 10760Sstevel@tonic-gate 10770Sstevel@tonic-gate static int mir_clnt_dup_request(queue_t *q, mblk_t *mp); 10780Sstevel@tonic-gate static void mir_rput_proto(queue_t *q, mblk_t *mp); 10790Sstevel@tonic-gate static int mir_svc_policy_notify(queue_t *q, int event); 10800Sstevel@tonic-gate static void mir_svc_release(queue_t *wq, mblk_t *mp); 10810Sstevel@tonic-gate static void mir_svc_start(queue_t *wq); 10820Sstevel@tonic-gate static void mir_svc_idle_start(queue_t *, mir_t *); 10830Sstevel@tonic-gate static void mir_svc_idle_stop(queue_t *, mir_t *); 10840Sstevel@tonic-gate static void mir_svc_start_close(queue_t *, mir_t *); 10850Sstevel@tonic-gate static void mir_clnt_idle_do_stop(queue_t *); 10860Sstevel@tonic-gate static void mir_clnt_idle_stop(queue_t *, mir_t *); 10870Sstevel@tonic-gate static void mir_clnt_idle_start(queue_t *, mir_t *); 10880Sstevel@tonic-gate static void mir_wput(queue_t *q, mblk_t *mp); 10890Sstevel@tonic-gate static void mir_wput_other(queue_t *q, mblk_t *mp); 10900Sstevel@tonic-gate static void mir_wsrv(queue_t *q); 10910Sstevel@tonic-gate 
static void mir_disconnect(queue_t *, mir_t *ir); 10920Sstevel@tonic-gate static int mir_check_len(queue_t *, int32_t, mblk_t *); 10930Sstevel@tonic-gate static void mir_timer(void *); 10940Sstevel@tonic-gate 10950Sstevel@tonic-gate extern void (*mir_rele)(queue_t *, mblk_t *); 10960Sstevel@tonic-gate extern void (*mir_start)(queue_t *); 10970Sstevel@tonic-gate extern void (*clnt_stop_idle)(queue_t *); 10980Sstevel@tonic-gate 10990Sstevel@tonic-gate clock_t clnt_idle_timeout = MIR_CLNT_IDLE_TIMEOUT; 11000Sstevel@tonic-gate clock_t svc_idle_timeout = MIR_SVC_IDLE_TIMEOUT; 11010Sstevel@tonic-gate 11020Sstevel@tonic-gate /* 11030Sstevel@tonic-gate * Timeout for subsequent notifications of idle connection. This is 11040Sstevel@tonic-gate * typically used to clean up after a wedged orderly release. 11050Sstevel@tonic-gate */ 11060Sstevel@tonic-gate clock_t svc_ordrel_timeout = MIR_SVC_ORDREL_TIMEOUT; /* milliseconds */ 11070Sstevel@tonic-gate 11080Sstevel@tonic-gate extern uint_t *clnt_max_msg_sizep; 11090Sstevel@tonic-gate extern uint_t *svc_max_msg_sizep; 11100Sstevel@tonic-gate uint_t clnt_max_msg_size = RPC_MAXDATASIZE; 11110Sstevel@tonic-gate uint_t svc_max_msg_size = RPC_MAXDATASIZE; 11120Sstevel@tonic-gate uint_t mir_krpc_cell_null; 11130Sstevel@tonic-gate 11140Sstevel@tonic-gate static void 11150Sstevel@tonic-gate mir_timer_stop(mir_t *mir) 11160Sstevel@tonic-gate { 11170Sstevel@tonic-gate timeout_id_t tid; 11180Sstevel@tonic-gate 11190Sstevel@tonic-gate ASSERT(MUTEX_HELD(&mir->mir_mutex)); 11200Sstevel@tonic-gate 11210Sstevel@tonic-gate /* 11220Sstevel@tonic-gate * Since the mir_mutex lock needs to be released to call 11230Sstevel@tonic-gate * untimeout(), we need to make sure that no other thread 11240Sstevel@tonic-gate * can start/stop the timer (changing mir_timer_id) during 11250Sstevel@tonic-gate * that time. The mir_timer_call bit and the mir_timer_cv 11260Sstevel@tonic-gate * condition variable are used to synchronize this. 
Setting 11270Sstevel@tonic-gate * mir_timer_call also tells mir_timer() (refer to the comments 11280Sstevel@tonic-gate * in mir_timer()) that it does not need to do anything. 11290Sstevel@tonic-gate */ 11300Sstevel@tonic-gate while (mir->mir_timer_call) 11310Sstevel@tonic-gate cv_wait(&mir->mir_timer_cv, &mir->mir_mutex); 11320Sstevel@tonic-gate mir->mir_timer_call = B_TRUE; 11330Sstevel@tonic-gate 11340Sstevel@tonic-gate if ((tid = mir->mir_timer_id) != 0) { 11350Sstevel@tonic-gate mir->mir_timer_id = 0; 11360Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 11370Sstevel@tonic-gate (void) untimeout(tid); 11380Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 11390Sstevel@tonic-gate } 11400Sstevel@tonic-gate mir->mir_timer_call = B_FALSE; 11410Sstevel@tonic-gate cv_broadcast(&mir->mir_timer_cv); 11420Sstevel@tonic-gate } 11430Sstevel@tonic-gate 11440Sstevel@tonic-gate static void 11450Sstevel@tonic-gate mir_timer_start(queue_t *q, mir_t *mir, clock_t intrvl) 11460Sstevel@tonic-gate { 11470Sstevel@tonic-gate timeout_id_t tid; 11480Sstevel@tonic-gate 11490Sstevel@tonic-gate ASSERT(MUTEX_HELD(&mir->mir_mutex)); 11500Sstevel@tonic-gate 11510Sstevel@tonic-gate while (mir->mir_timer_call) 11520Sstevel@tonic-gate cv_wait(&mir->mir_timer_cv, &mir->mir_mutex); 11530Sstevel@tonic-gate mir->mir_timer_call = B_TRUE; 11540Sstevel@tonic-gate 11550Sstevel@tonic-gate if ((tid = mir->mir_timer_id) != 0) { 11560Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 11570Sstevel@tonic-gate (void) untimeout(tid); 11580Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 11590Sstevel@tonic-gate } 11600Sstevel@tonic-gate /* Only start the timer when it is not closing. 
*/ 11610Sstevel@tonic-gate if (!mir->mir_closing) { 11620Sstevel@tonic-gate mir->mir_timer_id = timeout(mir_timer, q, 11630Sstevel@tonic-gate MSEC_TO_TICK(intrvl)); 11640Sstevel@tonic-gate } 11650Sstevel@tonic-gate mir->mir_timer_call = B_FALSE; 11660Sstevel@tonic-gate cv_broadcast(&mir->mir_timer_cv); 11670Sstevel@tonic-gate } 11680Sstevel@tonic-gate 11690Sstevel@tonic-gate static int 11700Sstevel@tonic-gate mir_clnt_dup_request(queue_t *q, mblk_t *mp) 11710Sstevel@tonic-gate { 11720Sstevel@tonic-gate mblk_t *mp1; 11730Sstevel@tonic-gate uint32_t new_xid; 11740Sstevel@tonic-gate uint32_t old_xid; 11750Sstevel@tonic-gate 11760Sstevel@tonic-gate ASSERT(MUTEX_HELD(&((mir_t *)q->q_ptr)->mir_mutex)); 11770Sstevel@tonic-gate new_xid = BE32_TO_U32(&mp->b_rptr[4]); 11780Sstevel@tonic-gate /* 11790Sstevel@tonic-gate * This loop is a bit tacky -- it walks the STREAMS list of 11800Sstevel@tonic-gate * flow-controlled messages. 11810Sstevel@tonic-gate */ 11820Sstevel@tonic-gate if ((mp1 = q->q_first) != NULL) { 11830Sstevel@tonic-gate do { 11840Sstevel@tonic-gate old_xid = BE32_TO_U32(&mp1->b_rptr[4]); 11850Sstevel@tonic-gate if (new_xid == old_xid) 11860Sstevel@tonic-gate return (1); 11870Sstevel@tonic-gate } while ((mp1 = mp1->b_next) != NULL); 11880Sstevel@tonic-gate } 11890Sstevel@tonic-gate return (0); 11900Sstevel@tonic-gate } 11910Sstevel@tonic-gate 11920Sstevel@tonic-gate static int 11930Sstevel@tonic-gate mir_close(queue_t *q) 11940Sstevel@tonic-gate { 11950Sstevel@tonic-gate mir_t *mir; 11960Sstevel@tonic-gate mblk_t *mp; 11970Sstevel@tonic-gate bool_t queue_cleaned = FALSE; 11980Sstevel@tonic-gate 11990Sstevel@tonic-gate RPCLOG(32, "rpcmod: mir_close of q 0x%p\n", (void *)q); 12000Sstevel@tonic-gate mir = (mir_t *)q->q_ptr; 12010Sstevel@tonic-gate ASSERT(MUTEX_NOT_HELD(&mir->mir_mutex)); 12020Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 12030Sstevel@tonic-gate if ((mp = mir->mir_head_mp) != NULL) { 12040Sstevel@tonic-gate mir->mir_head_mp = (mblk_t *)0; 
12050Sstevel@tonic-gate freemsg(mp); 12060Sstevel@tonic-gate } 12070Sstevel@tonic-gate /* 12080Sstevel@tonic-gate * Set mir_closing so we get notified when MIR_SVC_QUIESCED() 12090Sstevel@tonic-gate * is TRUE. And mir_timer_start() won't start the timer again. 12100Sstevel@tonic-gate */ 12110Sstevel@tonic-gate mir->mir_closing = B_TRUE; 12120Sstevel@tonic-gate mir_timer_stop(mir); 12130Sstevel@tonic-gate 12140Sstevel@tonic-gate if (mir->mir_type == RPC_SERVER) { 12150Sstevel@tonic-gate flushq(q, FLUSHDATA); /* Ditch anything waiting on read q */ 12160Sstevel@tonic-gate 12170Sstevel@tonic-gate /* 12180Sstevel@tonic-gate * This will prevent more requests from arriving and 12190Sstevel@tonic-gate * will force rpcmod to ignore flow control. 12200Sstevel@tonic-gate */ 12210Sstevel@tonic-gate mir_svc_start_close(WR(q), mir); 12220Sstevel@tonic-gate 12230Sstevel@tonic-gate while ((!MIR_SVC_QUIESCED(mir)) || mir->mir_inwservice == 1) { 12240Sstevel@tonic-gate 12250Sstevel@tonic-gate if (mir->mir_ref_cnt && !mir->mir_inrservice && 1226*4741Sgt29601 (queue_cleaned == FALSE)) { 12270Sstevel@tonic-gate /* 12280Sstevel@tonic-gate * call into SVC to clean the queue 12290Sstevel@tonic-gate */ 12300Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 12310Sstevel@tonic-gate svc_queueclean(q); 12320Sstevel@tonic-gate queue_cleaned = TRUE; 12330Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 12340Sstevel@tonic-gate continue; 12350Sstevel@tonic-gate } 12360Sstevel@tonic-gate 12370Sstevel@tonic-gate /* 12380Sstevel@tonic-gate * Bugid 1253810 - Force the write service 12390Sstevel@tonic-gate * procedure to send its messages, regardless 12400Sstevel@tonic-gate * whether the downstream module is ready 12410Sstevel@tonic-gate * to accept data. 
12420Sstevel@tonic-gate */ 12430Sstevel@tonic-gate if (mir->mir_inwservice == 1) 12440Sstevel@tonic-gate qenable(WR(q)); 12450Sstevel@tonic-gate 12460Sstevel@tonic-gate cv_wait(&mir->mir_condvar, &mir->mir_mutex); 12470Sstevel@tonic-gate } 12480Sstevel@tonic-gate 12490Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 12500Sstevel@tonic-gate qprocsoff(q); 12510Sstevel@tonic-gate 12520Sstevel@tonic-gate /* Notify KRPC that this stream is going away. */ 12530Sstevel@tonic-gate svc_queueclose(q); 12540Sstevel@tonic-gate } else { 12550Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 12560Sstevel@tonic-gate qprocsoff(q); 12570Sstevel@tonic-gate } 12580Sstevel@tonic-gate 12590Sstevel@tonic-gate mutex_destroy(&mir->mir_mutex); 12600Sstevel@tonic-gate cv_destroy(&mir->mir_condvar); 12610Sstevel@tonic-gate cv_destroy(&mir->mir_timer_cv); 12620Sstevel@tonic-gate kmem_free(mir, sizeof (mir_t)); 12630Sstevel@tonic-gate return (0); 12640Sstevel@tonic-gate } 12650Sstevel@tonic-gate 12660Sstevel@tonic-gate /* 12670Sstevel@tonic-gate * This is server side only (RPC_SERVER). 12680Sstevel@tonic-gate * 12690Sstevel@tonic-gate * Exit idle mode. 12700Sstevel@tonic-gate */ 12710Sstevel@tonic-gate static void 12720Sstevel@tonic-gate mir_svc_idle_stop(queue_t *q, mir_t *mir) 12730Sstevel@tonic-gate { 12740Sstevel@tonic-gate ASSERT(MUTEX_HELD(&mir->mir_mutex)); 12750Sstevel@tonic-gate ASSERT((q->q_flag & QREADR) == 0); 12760Sstevel@tonic-gate ASSERT(mir->mir_type == RPC_SERVER); 12770Sstevel@tonic-gate RPCLOG(16, "rpcmod: mir_svc_idle_stop of q 0x%p\n", (void *)q); 12780Sstevel@tonic-gate 12790Sstevel@tonic-gate mir_timer_stop(mir); 12800Sstevel@tonic-gate } 12810Sstevel@tonic-gate 12820Sstevel@tonic-gate /* 12830Sstevel@tonic-gate * This is server side only (RPC_SERVER). 12840Sstevel@tonic-gate * 12850Sstevel@tonic-gate * Start idle processing, which will include setting idle timer if the 12860Sstevel@tonic-gate * stream is not being closed. 
12870Sstevel@tonic-gate */ 12880Sstevel@tonic-gate static void 12890Sstevel@tonic-gate mir_svc_idle_start(queue_t *q, mir_t *mir) 12900Sstevel@tonic-gate { 12910Sstevel@tonic-gate ASSERT(MUTEX_HELD(&mir->mir_mutex)); 12920Sstevel@tonic-gate ASSERT((q->q_flag & QREADR) == 0); 12930Sstevel@tonic-gate ASSERT(mir->mir_type == RPC_SERVER); 12940Sstevel@tonic-gate RPCLOG(16, "rpcmod: mir_svc_idle_start q 0x%p\n", (void *)q); 12950Sstevel@tonic-gate 12960Sstevel@tonic-gate /* 12970Sstevel@tonic-gate * Don't re-start idle timer if we are closing queues. 12980Sstevel@tonic-gate */ 12990Sstevel@tonic-gate if (mir->mir_closing) { 13000Sstevel@tonic-gate RPCLOG(16, "mir_svc_idle_start - closing: 0x%p\n", 1301*4741Sgt29601 (void *)q); 13020Sstevel@tonic-gate 13030Sstevel@tonic-gate /* 13040Sstevel@tonic-gate * We will call mir_svc_idle_start() whenever MIR_SVC_QUIESCED() 13050Sstevel@tonic-gate * is true. When it is true, and we are in the process of 13060Sstevel@tonic-gate * closing the stream, signal any thread waiting in 13070Sstevel@tonic-gate * mir_close(). 13080Sstevel@tonic-gate */ 13090Sstevel@tonic-gate if (mir->mir_inwservice == 0) 13100Sstevel@tonic-gate cv_signal(&mir->mir_condvar); 13110Sstevel@tonic-gate 13120Sstevel@tonic-gate } else { 13130Sstevel@tonic-gate RPCLOG(16, "mir_svc_idle_start - reset %s timer\n", 1314*4741Sgt29601 mir->mir_ordrel_pending ? "ordrel" : "normal"); 13150Sstevel@tonic-gate /* 13160Sstevel@tonic-gate * Normal condition, start the idle timer. If an orderly 13170Sstevel@tonic-gate * release has been sent, set the timeout to wait for the 13180Sstevel@tonic-gate * client to close its side of the connection. Otherwise, 13190Sstevel@tonic-gate * use the normal idle timeout. 13200Sstevel@tonic-gate */ 13210Sstevel@tonic-gate mir_timer_start(q, mir, mir->mir_ordrel_pending ? 
13220Sstevel@tonic-gate svc_ordrel_timeout : mir->mir_idle_timeout); 13230Sstevel@tonic-gate } 13240Sstevel@tonic-gate } 13250Sstevel@tonic-gate 13260Sstevel@tonic-gate /* ARGSUSED */ 13270Sstevel@tonic-gate static int 13280Sstevel@tonic-gate mir_open(queue_t *q, dev_t *devp, int flag, int sflag, cred_t *credp) 13290Sstevel@tonic-gate { 13300Sstevel@tonic-gate mir_t *mir; 13310Sstevel@tonic-gate 13320Sstevel@tonic-gate RPCLOG(32, "rpcmod: mir_open of q 0x%p\n", (void *)q); 13330Sstevel@tonic-gate /* Set variables used directly by KRPC. */ 13340Sstevel@tonic-gate if (!mir_rele) 13350Sstevel@tonic-gate mir_rele = mir_svc_release; 13360Sstevel@tonic-gate if (!mir_start) 13370Sstevel@tonic-gate mir_start = mir_svc_start; 13380Sstevel@tonic-gate if (!clnt_stop_idle) 13390Sstevel@tonic-gate clnt_stop_idle = mir_clnt_idle_do_stop; 13400Sstevel@tonic-gate if (!clnt_max_msg_sizep) 13410Sstevel@tonic-gate clnt_max_msg_sizep = &clnt_max_msg_size; 13420Sstevel@tonic-gate if (!svc_max_msg_sizep) 13430Sstevel@tonic-gate svc_max_msg_sizep = &svc_max_msg_size; 13440Sstevel@tonic-gate 13450Sstevel@tonic-gate /* Allocate a zero'ed out mir structure for this stream. */ 13460Sstevel@tonic-gate mir = kmem_zalloc(sizeof (mir_t), KM_SLEEP); 13470Sstevel@tonic-gate 13480Sstevel@tonic-gate /* 13490Sstevel@tonic-gate * We set hold inbound here so that incoming messages will 13500Sstevel@tonic-gate * be held on the read-side queue until the stream is completely 13510Sstevel@tonic-gate * initialized with a RPC_CLIENT or RPC_SERVER ioctl. During 13520Sstevel@tonic-gate * the ioctl processing, the flag is cleared and any messages that 13530Sstevel@tonic-gate * arrived between the open and the ioctl are delivered to KRPC. 13540Sstevel@tonic-gate * 13550Sstevel@tonic-gate * Early data should never arrive on a client stream since 13560Sstevel@tonic-gate * servers only respond to our requests and we do not send any. 13570Sstevel@tonic-gate * until after the stream is initialized. 
Early data is 13580Sstevel@tonic-gate * very common on a server stream where the client will start 13590Sstevel@tonic-gate * sending data as soon as the connection is made (and this 13600Sstevel@tonic-gate * is especially true with TCP where the protocol accepts the 13610Sstevel@tonic-gate * connection before nfsd or KRPC is notified about it). 13620Sstevel@tonic-gate */ 13630Sstevel@tonic-gate 13640Sstevel@tonic-gate mir->mir_hold_inbound = 1; 13650Sstevel@tonic-gate 13660Sstevel@tonic-gate /* 13670Sstevel@tonic-gate * Start the record marker looking for a 4-byte header. When 13680Sstevel@tonic-gate * this length is negative, it indicates that rpcmod is looking 13690Sstevel@tonic-gate * for bytes to consume for the record marker header. When it 13700Sstevel@tonic-gate * is positive, it holds the number of bytes that have arrived 13710Sstevel@tonic-gate * for the current fragment and are being held in mir_header_mp. 13720Sstevel@tonic-gate */ 13730Sstevel@tonic-gate 13740Sstevel@tonic-gate mir->mir_frag_len = -(int32_t)sizeof (uint32_t); 13750Sstevel@tonic-gate 1376766Scarlsonj mir->mir_zoneid = rpc_zoneid(); 13770Sstevel@tonic-gate mutex_init(&mir->mir_mutex, NULL, MUTEX_DEFAULT, NULL); 13780Sstevel@tonic-gate cv_init(&mir->mir_condvar, NULL, CV_DRIVER, NULL); 13790Sstevel@tonic-gate cv_init(&mir->mir_timer_cv, NULL, CV_DRIVER, NULL); 13800Sstevel@tonic-gate 13810Sstevel@tonic-gate q->q_ptr = (char *)mir; 13820Sstevel@tonic-gate WR(q)->q_ptr = (char *)mir; 13830Sstevel@tonic-gate 13840Sstevel@tonic-gate /* 13850Sstevel@tonic-gate * We noenable the read-side queue because we don't want it 13860Sstevel@tonic-gate * automatically enabled by putq. We enable it explicitly 13870Sstevel@tonic-gate * in mir_wsrv when appropriate. (See additional comments on 13880Sstevel@tonic-gate * flow control at the beginning of mir_rsrv.) 
13890Sstevel@tonic-gate */ 13900Sstevel@tonic-gate noenable(q); 13910Sstevel@tonic-gate 13920Sstevel@tonic-gate qprocson(q); 13930Sstevel@tonic-gate return (0); 13940Sstevel@tonic-gate } 13950Sstevel@tonic-gate 13960Sstevel@tonic-gate /* 13970Sstevel@tonic-gate * Read-side put routine for both the client and server side. Does the 13980Sstevel@tonic-gate * record marking for incoming RPC messages, and when complete, dispatches 13990Sstevel@tonic-gate * the message to either the client or server. 14000Sstevel@tonic-gate */ 14010Sstevel@tonic-gate static void 14020Sstevel@tonic-gate mir_do_rput(queue_t *q, mblk_t *mp, int srv) 14030Sstevel@tonic-gate { 14040Sstevel@tonic-gate mblk_t *cont_mp; 14050Sstevel@tonic-gate int excess; 14060Sstevel@tonic-gate int32_t frag_len; 14070Sstevel@tonic-gate int32_t frag_header; 14080Sstevel@tonic-gate mblk_t *head_mp; 14090Sstevel@tonic-gate int len; 14100Sstevel@tonic-gate mir_t *mir; 14110Sstevel@tonic-gate mblk_t *mp1; 14120Sstevel@tonic-gate unsigned char *rptr; 14130Sstevel@tonic-gate mblk_t *tail_mp; 14140Sstevel@tonic-gate unsigned char *wptr; 14150Sstevel@tonic-gate boolean_t stop_timer = B_FALSE; 14160Sstevel@tonic-gate 14170Sstevel@tonic-gate mir = (mir_t *)q->q_ptr; 14180Sstevel@tonic-gate ASSERT(mir != NULL); 14190Sstevel@tonic-gate 14200Sstevel@tonic-gate /* 14210Sstevel@tonic-gate * If the stream has not been set up as a RPC_CLIENT or RPC_SERVER 14220Sstevel@tonic-gate * with the corresponding ioctl, then don't accept 14230Sstevel@tonic-gate * any inbound data. This should never happen for streams 14240Sstevel@tonic-gate * created by nfsd or client-side KRPC because they are careful 14250Sstevel@tonic-gate * to set the mode of the stream before doing anything else. 
14260Sstevel@tonic-gate */ 14270Sstevel@tonic-gate if (mir->mir_type == 0) { 14280Sstevel@tonic-gate freemsg(mp); 14290Sstevel@tonic-gate return; 14300Sstevel@tonic-gate } 14310Sstevel@tonic-gate 14320Sstevel@tonic-gate ASSERT(MUTEX_NOT_HELD(&mir->mir_mutex)); 14330Sstevel@tonic-gate 14340Sstevel@tonic-gate switch (mp->b_datap->db_type) { 14350Sstevel@tonic-gate case M_DATA: 14360Sstevel@tonic-gate break; 14370Sstevel@tonic-gate case M_PROTO: 14380Sstevel@tonic-gate case M_PCPROTO: 14390Sstevel@tonic-gate rptr = mp->b_rptr; 14400Sstevel@tonic-gate if (mp->b_wptr - rptr < sizeof (uint32_t)) { 14410Sstevel@tonic-gate RPCLOG(1, "mir_rput: runt TPI message (%d bytes)\n", 14420Sstevel@tonic-gate (int)(mp->b_wptr - rptr)); 14430Sstevel@tonic-gate freemsg(mp); 14440Sstevel@tonic-gate return; 14450Sstevel@tonic-gate } 14460Sstevel@tonic-gate if (((union T_primitives *)rptr)->type != T_DATA_IND) { 14470Sstevel@tonic-gate mir_rput_proto(q, mp); 14480Sstevel@tonic-gate return; 14490Sstevel@tonic-gate } 14500Sstevel@tonic-gate 14510Sstevel@tonic-gate /* Throw away the T_DATA_IND block and continue with data. */ 14520Sstevel@tonic-gate mp1 = mp; 14530Sstevel@tonic-gate mp = mp->b_cont; 14540Sstevel@tonic-gate freeb(mp1); 14550Sstevel@tonic-gate break; 14560Sstevel@tonic-gate case M_SETOPTS: 14570Sstevel@tonic-gate /* 14580Sstevel@tonic-gate * If a module on the stream is trying set the Stream head's 14590Sstevel@tonic-gate * high water mark, then set our hiwater to the requested 14600Sstevel@tonic-gate * value. We are the "stream head" for all inbound 14610Sstevel@tonic-gate * data messages since messages are passed directly to KRPC. 
14620Sstevel@tonic-gate */ 14630Sstevel@tonic-gate if ((mp->b_wptr - mp->b_rptr) >= sizeof (struct stroptions)) { 14640Sstevel@tonic-gate struct stroptions *stropts; 14650Sstevel@tonic-gate 14660Sstevel@tonic-gate stropts = (struct stroptions *)mp->b_rptr; 14670Sstevel@tonic-gate if ((stropts->so_flags & SO_HIWAT) && 1468*4741Sgt29601 !(stropts->so_flags & SO_BAND)) { 14690Sstevel@tonic-gate (void) strqset(q, QHIWAT, 0, stropts->so_hiwat); 14700Sstevel@tonic-gate } 14710Sstevel@tonic-gate } 14720Sstevel@tonic-gate putnext(q, mp); 14730Sstevel@tonic-gate return; 14740Sstevel@tonic-gate case M_FLUSH: 14750Sstevel@tonic-gate RPCLOG(32, "mir_do_rput: ignoring M_FLUSH on q 0x%p. ", 14760Sstevel@tonic-gate (void *)q); 14770Sstevel@tonic-gate RPCLOG(32, "M_FLUSH is %x\n", (uint_t)*mp->b_rptr); 14780Sstevel@tonic-gate 14790Sstevel@tonic-gate putnext(q, mp); 14800Sstevel@tonic-gate return; 14810Sstevel@tonic-gate default: 14820Sstevel@tonic-gate putnext(q, mp); 14830Sstevel@tonic-gate return; 14840Sstevel@tonic-gate } 14850Sstevel@tonic-gate 14860Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 14870Sstevel@tonic-gate 14880Sstevel@tonic-gate /* 14890Sstevel@tonic-gate * If this connection is closing, don't accept any new messages. 14900Sstevel@tonic-gate */ 14910Sstevel@tonic-gate if (mir->mir_svc_no_more_msgs) { 14920Sstevel@tonic-gate ASSERT(mir->mir_type == RPC_SERVER); 14930Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 14940Sstevel@tonic-gate freemsg(mp); 14950Sstevel@tonic-gate return; 14960Sstevel@tonic-gate } 14970Sstevel@tonic-gate 14980Sstevel@tonic-gate /* Get local copies for quicker access. */ 14990Sstevel@tonic-gate frag_len = mir->mir_frag_len; 15000Sstevel@tonic-gate frag_header = mir->mir_frag_header; 15010Sstevel@tonic-gate head_mp = mir->mir_head_mp; 15020Sstevel@tonic-gate tail_mp = mir->mir_tail_mp; 15030Sstevel@tonic-gate 15040Sstevel@tonic-gate /* Loop, processing each message block in the mp chain separately. 
*/ 15050Sstevel@tonic-gate do { 15060Sstevel@tonic-gate /* 15070Sstevel@tonic-gate * cont_mp is used in the do/while condition below to 15080Sstevel@tonic-gate * walk to the next block in the STREAMS message. 15090Sstevel@tonic-gate * mp->b_cont may be nil'ed during processing so we 15100Sstevel@tonic-gate * can't rely on it to find the next block. 15110Sstevel@tonic-gate */ 15120Sstevel@tonic-gate cont_mp = mp->b_cont; 15130Sstevel@tonic-gate 15140Sstevel@tonic-gate /* 15150Sstevel@tonic-gate * Get local copies of rptr and wptr for our processing. 15160Sstevel@tonic-gate * These always point into "mp" (the current block being 15170Sstevel@tonic-gate * processed), but rptr is updated as we consume any 15180Sstevel@tonic-gate * record header in this message, and wptr is updated to 15190Sstevel@tonic-gate * point to the end of the data for the current fragment, 15200Sstevel@tonic-gate * if it ends in this block. The main point is that 15210Sstevel@tonic-gate * they are not always the same as b_rptr and b_wptr. 15220Sstevel@tonic-gate * b_rptr and b_wptr will be updated when appropriate. 15230Sstevel@tonic-gate */ 15240Sstevel@tonic-gate rptr = mp->b_rptr; 15250Sstevel@tonic-gate wptr = mp->b_wptr; 15260Sstevel@tonic-gate same_mblk:; 15270Sstevel@tonic-gate len = (int)(wptr - rptr); 15280Sstevel@tonic-gate if (len <= 0) { 15290Sstevel@tonic-gate /* 15300Sstevel@tonic-gate * If we have processed all of the data in the message 15310Sstevel@tonic-gate * or the block is empty to begin with, then we're 15320Sstevel@tonic-gate * done with this block and can go on to cont_mp, 15330Sstevel@tonic-gate * if there is one. 15340Sstevel@tonic-gate * 15350Sstevel@tonic-gate * First, we check to see if the current block is 15360Sstevel@tonic-gate * now zero-length and, if so, we free it. 15370Sstevel@tonic-gate * This happens when either the block was empty 15380Sstevel@tonic-gate * to begin with or we consumed all of the data 15390Sstevel@tonic-gate * for the record marking header. 
15400Sstevel@tonic-gate */ 15410Sstevel@tonic-gate if (rptr <= mp->b_rptr) { 15420Sstevel@tonic-gate /* 15430Sstevel@tonic-gate * If head_mp is non-NULL, add cont_mp to the 15440Sstevel@tonic-gate * mblk list. XXX But there is a possibility 15450Sstevel@tonic-gate * that tail_mp = mp or even head_mp = mp XXX 15460Sstevel@tonic-gate */ 15470Sstevel@tonic-gate if (head_mp) { 15480Sstevel@tonic-gate if (head_mp == mp) 15490Sstevel@tonic-gate head_mp = NULL; 15500Sstevel@tonic-gate else if (tail_mp != mp) { 15510Sstevel@tonic-gate ASSERT((tail_mp->b_cont == NULL) || (tail_mp->b_cont == mp)); 15520Sstevel@tonic-gate tail_mp->b_cont = cont_mp; 15530Sstevel@tonic-gate /* 15540Sstevel@tonic-gate * It's possible that, because 15550Sstevel@tonic-gate * of a very short mblk (0-3 15560Sstevel@tonic-gate * bytes), we've ended up here 15570Sstevel@tonic-gate * and that cont_mp could be 15580Sstevel@tonic-gate * NULL (if we're at the end 15590Sstevel@tonic-gate * of an mblk chain). If so, 15600Sstevel@tonic-gate * don't set tail_mp to 15610Sstevel@tonic-gate * cont_mp, because the next 15620Sstevel@tonic-gate * time we access it, we'll 15630Sstevel@tonic-gate * dereference a NULL pointer 15640Sstevel@tonic-gate * and crash. Just leave 15650Sstevel@tonic-gate * tail_mp pointing at the 15660Sstevel@tonic-gate * current end of chain. 15670Sstevel@tonic-gate */ 15680Sstevel@tonic-gate if (cont_mp) 15690Sstevel@tonic-gate tail_mp = cont_mp; 15700Sstevel@tonic-gate } else { 15710Sstevel@tonic-gate mblk_t *smp = head_mp; 15720Sstevel@tonic-gate 15730Sstevel@tonic-gate while ((smp->b_cont != NULL) && 1574*4741Sgt29601 (smp->b_cont != mp)) 15750Sstevel@tonic-gate smp = smp->b_cont; 15760Sstevel@tonic-gate smp->b_cont = cont_mp; 15770Sstevel@tonic-gate /* 15780Sstevel@tonic-gate * Don't set tail_mp to cont_mp 15790Sstevel@tonic-gate * if it's NULL. 
Instead, set 15800Sstevel@tonic-gate * tail_mp to smp, which is the 15810Sstevel@tonic-gate * end of the chain starting 15820Sstevel@tonic-gate * at head_mp. 15830Sstevel@tonic-gate */ 15840Sstevel@tonic-gate if (cont_mp) 15850Sstevel@tonic-gate tail_mp = cont_mp; 15860Sstevel@tonic-gate else 15870Sstevel@tonic-gate tail_mp = smp; 15880Sstevel@tonic-gate } 15890Sstevel@tonic-gate } 15900Sstevel@tonic-gate freeb(mp); 15910Sstevel@tonic-gate } 15920Sstevel@tonic-gate continue; 15930Sstevel@tonic-gate } 15940Sstevel@tonic-gate 15950Sstevel@tonic-gate /* 15960Sstevel@tonic-gate * frag_len starts at -4 and is incremented past the record 15970Sstevel@tonic-gate * marking header to 0, and then becomes positive as real data 15980Sstevel@tonic-gate * bytes are received for the message. While frag_len is less 15990Sstevel@tonic-gate * than zero, we need more bytes for the record marking 16000Sstevel@tonic-gate * header. 16010Sstevel@tonic-gate */ 16020Sstevel@tonic-gate if (frag_len < 0) { 16030Sstevel@tonic-gate uchar_t *up = rptr; 16040Sstevel@tonic-gate /* 16050Sstevel@tonic-gate * Collect as many bytes as we need for the record 16060Sstevel@tonic-gate * marking header and that are available in this block. 16070Sstevel@tonic-gate */ 16080Sstevel@tonic-gate do { 16090Sstevel@tonic-gate --len; 16100Sstevel@tonic-gate frag_len++; 16110Sstevel@tonic-gate frag_header <<= 8; 16120Sstevel@tonic-gate frag_header += (*up++ & 0xFF); 16130Sstevel@tonic-gate } while (len > 0 && frag_len < 0); 16140Sstevel@tonic-gate 16150Sstevel@tonic-gate if (rptr == mp->b_rptr) { 16160Sstevel@tonic-gate /* 16170Sstevel@tonic-gate * The record header is located at the 16180Sstevel@tonic-gate * beginning of the block, so just walk 16190Sstevel@tonic-gate * b_rptr past it. 
16200Sstevel@tonic-gate */ 16210Sstevel@tonic-gate mp->b_rptr = rptr = up; 16220Sstevel@tonic-gate } else { 16230Sstevel@tonic-gate /* 16240Sstevel@tonic-gate * The record header is located in the middle 16250Sstevel@tonic-gate * of a block, so copy any remaining data up. 16260Sstevel@tonic-gate * This happens when an RPC message is 16270Sstevel@tonic-gate * fragmented into multiple pieces and 16280Sstevel@tonic-gate * a middle (or end) fragment immediately 16290Sstevel@tonic-gate * follows a previous fragment in the same 16300Sstevel@tonic-gate * message block. 16310Sstevel@tonic-gate */ 16320Sstevel@tonic-gate wptr = &rptr[len]; 16330Sstevel@tonic-gate mp->b_wptr = wptr; 16340Sstevel@tonic-gate if (len) { 16350Sstevel@tonic-gate RPCLOG(32, "mir_do_rput: copying %d " 16360Sstevel@tonic-gate "bytes of data up", len); 16370Sstevel@tonic-gate RPCLOG(32, " db_ref %d\n", 16380Sstevel@tonic-gate (uint_t)mp->b_datap->db_ref); 16390Sstevel@tonic-gate bcopy(up, rptr, len); 16400Sstevel@tonic-gate } 16410Sstevel@tonic-gate } 16420Sstevel@tonic-gate 16430Sstevel@tonic-gate /* 16440Sstevel@tonic-gate * If we haven't received the complete record header 16450Sstevel@tonic-gate * yet, then loop around to get the next block in the 16460Sstevel@tonic-gate * STREAMS message. The logic at same_mblk label will 16470Sstevel@tonic-gate * free the current block if it has become empty. 
16480Sstevel@tonic-gate */ 16490Sstevel@tonic-gate if (frag_len < 0) { 16500Sstevel@tonic-gate RPCLOG(32, "mir_do_rput: frag_len is still < 0 " 16510Sstevel@tonic-gate "(%d)", len); 16520Sstevel@tonic-gate goto same_mblk; 16530Sstevel@tonic-gate } 16540Sstevel@tonic-gate 16550Sstevel@tonic-gate #ifdef RPCDEBUG 16560Sstevel@tonic-gate if ((frag_header & MIR_LASTFRAG) == 0) { 16570Sstevel@tonic-gate RPCLOG0(32, "mir_do_rput: multi-fragment " 16580Sstevel@tonic-gate "record\n"); 16590Sstevel@tonic-gate } 16600Sstevel@tonic-gate { 16610Sstevel@tonic-gate uint_t l = frag_header & ~MIR_LASTFRAG; 16620Sstevel@tonic-gate 16630Sstevel@tonic-gate if (l != 0 && mir->mir_max_msg_sizep && 16640Sstevel@tonic-gate l >= *mir->mir_max_msg_sizep) { 16650Sstevel@tonic-gate RPCLOG(32, "mir_do_rput: fragment size" 16660Sstevel@tonic-gate " (%d) > maximum", l); 16670Sstevel@tonic-gate RPCLOG(32, " (%u)\n", 16680Sstevel@tonic-gate *mir->mir_max_msg_sizep); 16690Sstevel@tonic-gate } 16700Sstevel@tonic-gate } 16710Sstevel@tonic-gate #endif 16720Sstevel@tonic-gate /* 16730Sstevel@tonic-gate * At this point we have retrieved the complete record 16740Sstevel@tonic-gate * header for this fragment. If the current block is 16750Sstevel@tonic-gate * empty, then we need to free it and walk to the next 16760Sstevel@tonic-gate * block. 16770Sstevel@tonic-gate */ 16780Sstevel@tonic-gate if (mp->b_rptr >= wptr) { 16790Sstevel@tonic-gate /* 16800Sstevel@tonic-gate * If this is not the last fragment or if we 16810Sstevel@tonic-gate * have not received all the data for this 16820Sstevel@tonic-gate * RPC message, then loop around to the next 16830Sstevel@tonic-gate * block. 
16840Sstevel@tonic-gate */ 16850Sstevel@tonic-gate if (!(frag_header & MIR_LASTFRAG) || 1686*4741Sgt29601 (frag_len - 1687*4741Sgt29601 (frag_header & ~MIR_LASTFRAG)) || 1688*4741Sgt29601 !head_mp) 16890Sstevel@tonic-gate goto same_mblk; 16900Sstevel@tonic-gate 16910Sstevel@tonic-gate /* 16920Sstevel@tonic-gate * Quick walk to next block in the 16930Sstevel@tonic-gate * STREAMS message. 16940Sstevel@tonic-gate */ 16950Sstevel@tonic-gate freeb(mp); 16960Sstevel@tonic-gate continue; 16970Sstevel@tonic-gate } 16980Sstevel@tonic-gate } 16990Sstevel@tonic-gate 17000Sstevel@tonic-gate /* 17010Sstevel@tonic-gate * We've collected the complete record header. The data 17020Sstevel@tonic-gate * in the current block is added to the end of the RPC 17030Sstevel@tonic-gate * message. Note that tail_mp is the same as mp after 17040Sstevel@tonic-gate * this linkage. 17050Sstevel@tonic-gate */ 17060Sstevel@tonic-gate if (!head_mp) 17070Sstevel@tonic-gate head_mp = mp; 17080Sstevel@tonic-gate else if (tail_mp != mp) { 17090Sstevel@tonic-gate ASSERT((tail_mp->b_cont == NULL) || 17100Sstevel@tonic-gate (tail_mp->b_cont == mp)); 17110Sstevel@tonic-gate tail_mp->b_cont = mp; 17120Sstevel@tonic-gate } 17130Sstevel@tonic-gate tail_mp = mp; 17140Sstevel@tonic-gate 17150Sstevel@tonic-gate /* 17160Sstevel@tonic-gate * Add the length of this block to the accumulated 17170Sstevel@tonic-gate * fragment length. 17180Sstevel@tonic-gate */ 17190Sstevel@tonic-gate frag_len += len; 17200Sstevel@tonic-gate excess = frag_len - (frag_header & ~MIR_LASTFRAG); 17210Sstevel@tonic-gate /* 17220Sstevel@tonic-gate * If we have not received all the data for this fragment, 17230Sstevel@tonic-gate * then walk to the next block. 17240Sstevel@tonic-gate */ 17250Sstevel@tonic-gate if (excess < 0) 17260Sstevel@tonic-gate continue; 17270Sstevel@tonic-gate 17280Sstevel@tonic-gate /* 17290Sstevel@tonic-gate * We've received a complete fragment, so reset frag_len 17300Sstevel@tonic-gate * for the next one. 
17310Sstevel@tonic-gate */ 17320Sstevel@tonic-gate frag_len = -(int32_t)sizeof (uint32_t); 17330Sstevel@tonic-gate 17340Sstevel@tonic-gate /* 17350Sstevel@tonic-gate * Update rptr to point to the beginning of the next 17360Sstevel@tonic-gate * fragment in this block. If there are no more bytes 17370Sstevel@tonic-gate * in the block (excess is 0), then rptr will be equal 17380Sstevel@tonic-gate * to wptr. 17390Sstevel@tonic-gate */ 17400Sstevel@tonic-gate rptr = wptr - excess; 17410Sstevel@tonic-gate 17420Sstevel@tonic-gate /* 17430Sstevel@tonic-gate * Now we check to see if this fragment is the last one in 17440Sstevel@tonic-gate * the RPC message. 17450Sstevel@tonic-gate */ 17460Sstevel@tonic-gate if (!(frag_header & MIR_LASTFRAG)) { 17470Sstevel@tonic-gate /* 17480Sstevel@tonic-gate * This isn't the last one, so start processing the 17490Sstevel@tonic-gate * next fragment. 17500Sstevel@tonic-gate */ 17510Sstevel@tonic-gate frag_header = 0; 17520Sstevel@tonic-gate 17530Sstevel@tonic-gate /* 17540Sstevel@tonic-gate * If excess is 0, the next fragment 17550Sstevel@tonic-gate * starts at the beginning of the next block -- 17560Sstevel@tonic-gate * we "continue" to the end of the while loop and 17570Sstevel@tonic-gate * walk to cont_mp. 17580Sstevel@tonic-gate */ 17590Sstevel@tonic-gate if (excess == 0) 17600Sstevel@tonic-gate continue; 17610Sstevel@tonic-gate RPCLOG0(32, "mir_do_rput: multi-fragment message with " 17620Sstevel@tonic-gate "two or more fragments in one mblk\n"); 17630Sstevel@tonic-gate 17640Sstevel@tonic-gate /* 17650Sstevel@tonic-gate * If excess is non-0, then the next fragment starts 17660Sstevel@tonic-gate * in this block. rptr points to the beginning 17670Sstevel@tonic-gate * of the next fragment and we "goto same_mblk" 17680Sstevel@tonic-gate * to continue processing. 
17690Sstevel@tonic-gate */ 17700Sstevel@tonic-gate goto same_mblk; 17710Sstevel@tonic-gate } 17720Sstevel@tonic-gate 17730Sstevel@tonic-gate /* 17740Sstevel@tonic-gate * We've got a complete RPC message. Before passing it 17750Sstevel@tonic-gate * upstream, check to see if there is extra data in this 17760Sstevel@tonic-gate * message block. If so, then we separate the excess 17770Sstevel@tonic-gate * from the complete message. The excess data is processed 17780Sstevel@tonic-gate * after the current message goes upstream. 17790Sstevel@tonic-gate */ 17800Sstevel@tonic-gate if (excess > 0) { 17810Sstevel@tonic-gate RPCLOG(32, "mir_do_rput: end of record, but excess " 17820Sstevel@tonic-gate "data (%d bytes) in this mblk. dupb/copyb " 17830Sstevel@tonic-gate "needed\n", excess); 17840Sstevel@tonic-gate 17850Sstevel@tonic-gate /* Duplicate only the overlapping block. */ 17860Sstevel@tonic-gate mp1 = dupb(tail_mp); 17870Sstevel@tonic-gate 17880Sstevel@tonic-gate /* 17890Sstevel@tonic-gate * dupb() might have failed due to ref count wrap around 17900Sstevel@tonic-gate * so try a copyb(). 17910Sstevel@tonic-gate */ 17920Sstevel@tonic-gate if (mp1 == NULL) 17930Sstevel@tonic-gate mp1 = copyb(tail_mp); 17940Sstevel@tonic-gate 17950Sstevel@tonic-gate /* 17960Sstevel@tonic-gate * Do not use bufcall() to schedule a "buffer 17970Sstevel@tonic-gate * availability event." The reason is that 17980Sstevel@tonic-gate * bufcall() has problems. For example, if memory 17990Sstevel@tonic-gate * runs out, bufcall() itself will fail since it 18000Sstevel@tonic-gate * needs to allocate memory. The most appropriate 18010Sstevel@tonic-gate * action right now is to disconnect this connection 18020Sstevel@tonic-gate * as the system is under stress. We should try to 18030Sstevel@tonic-gate * free up resources. 
18040Sstevel@tonic-gate */ 18050Sstevel@tonic-gate if (mp1 == NULL) { 18060Sstevel@tonic-gate freemsg(head_mp); 18070Sstevel@tonic-gate RPCLOG0(1, "mir_do_rput: dupb/copyb failed\n"); 18080Sstevel@tonic-gate mir->mir_frag_header = 0; 18090Sstevel@tonic-gate mir->mir_frag_len = -(int)sizeof (uint32_t); 18100Sstevel@tonic-gate mir->mir_head_mp = NULL; 18110Sstevel@tonic-gate mir->mir_tail_mp = NULL; 18120Sstevel@tonic-gate 18130Sstevel@tonic-gate mir_disconnect(q, mir); 18140Sstevel@tonic-gate return; 18150Sstevel@tonic-gate } 18160Sstevel@tonic-gate 18170Sstevel@tonic-gate /* 18180Sstevel@tonic-gate * The new message block is linked with the 18190Sstevel@tonic-gate * continuation block in cont_mp. We then point 18200Sstevel@tonic-gate * cont_mp to the new block so that we will 18210Sstevel@tonic-gate * process it next. 18220Sstevel@tonic-gate */ 18230Sstevel@tonic-gate mp1->b_cont = cont_mp; 18240Sstevel@tonic-gate cont_mp = mp1; 18250Sstevel@tonic-gate /* 18260Sstevel@tonic-gate * Data in the new block begins at the 18270Sstevel@tonic-gate * next fragment (rptr). 18280Sstevel@tonic-gate */ 18290Sstevel@tonic-gate cont_mp->b_rptr += (rptr - tail_mp->b_rptr); 18300Sstevel@tonic-gate ASSERT(cont_mp->b_rptr >= cont_mp->b_datap->db_base); 18310Sstevel@tonic-gate ASSERT(cont_mp->b_rptr <= cont_mp->b_wptr); 18320Sstevel@tonic-gate 18330Sstevel@tonic-gate /* Data in the current fragment ends at rptr. */ 18340Sstevel@tonic-gate tail_mp->b_wptr = rptr; 18350Sstevel@tonic-gate ASSERT(tail_mp->b_wptr <= tail_mp->b_datap->db_lim); 18360Sstevel@tonic-gate ASSERT(tail_mp->b_wptr >= tail_mp->b_rptr); 18370Sstevel@tonic-gate 18380Sstevel@tonic-gate } 18390Sstevel@tonic-gate 18400Sstevel@tonic-gate /* tail_mp is the last block with data for this RPC message. */ 18410Sstevel@tonic-gate tail_mp->b_cont = NULL; 18420Sstevel@tonic-gate 18430Sstevel@tonic-gate /* Pass the RPC message to the current consumer. 
*/ 18440Sstevel@tonic-gate switch (mir->mir_type) { 18450Sstevel@tonic-gate case RPC_CLIENT: 18460Sstevel@tonic-gate if (clnt_dispatch_notify(head_mp, mir->mir_zoneid)) { 18470Sstevel@tonic-gate /* 18480Sstevel@tonic-gate * Mark this stream as active. This marker 18490Sstevel@tonic-gate * is used in mir_timer(). 18500Sstevel@tonic-gate */ 18510Sstevel@tonic-gate 18520Sstevel@tonic-gate mir->mir_clntreq = 1; 18530Sstevel@tonic-gate mir->mir_use_timestamp = lbolt; 18540Sstevel@tonic-gate } else 18550Sstevel@tonic-gate freemsg(head_mp); 18560Sstevel@tonic-gate break; 18570Sstevel@tonic-gate 18580Sstevel@tonic-gate case RPC_SERVER: 18590Sstevel@tonic-gate /* 18600Sstevel@tonic-gate * Check for flow control before passing the 18610Sstevel@tonic-gate * message to KRPC. 18620Sstevel@tonic-gate */ 18630Sstevel@tonic-gate 18640Sstevel@tonic-gate if (!mir->mir_hold_inbound) { 1865*4741Sgt29601 if (mir->mir_krpc_cell) { 1866*4741Sgt29601 /* 1867*4741Sgt29601 * If the reference count is 0 1868*4741Sgt29601 * (not including this request), 1869*4741Sgt29601 * then the stream is transitioning 1870*4741Sgt29601 * from idle to non-idle. In this case, 1871*4741Sgt29601 * we cancel the idle timer. 1872*4741Sgt29601 */ 1873*4741Sgt29601 if (mir->mir_ref_cnt++ == 0) 1874*4741Sgt29601 stop_timer = B_TRUE; 1875*4741Sgt29601 if (mir_check_len(q, 1876*4741Sgt29601 (int32_t)msgdsize(mp), mp)) 18770Sstevel@tonic-gate return; 1878*4741Sgt29601 svc_queuereq(q, head_mp); /* to KRPC */ 1879*4741Sgt29601 } else { 1880*4741Sgt29601 /* 1881*4741Sgt29601 * Count # of times this happens. Should 1882*4741Sgt29601 * be never, but experience shows 1883*4741Sgt29601 * otherwise. 
1884*4741Sgt29601 */ 1885*4741Sgt29601 mir_krpc_cell_null++; 1886*4741Sgt29601 freemsg(head_mp); 1887*4741Sgt29601 } 18880Sstevel@tonic-gate 18890Sstevel@tonic-gate } else { 18900Sstevel@tonic-gate /* 18910Sstevel@tonic-gate * If the outbound side of the stream is 18920Sstevel@tonic-gate * flow controlled, then hold this message 18930Sstevel@tonic-gate * until client catches up. mir_hold_inbound 18940Sstevel@tonic-gate * is set in mir_wput and cleared in mir_wsrv. 18950Sstevel@tonic-gate */ 18960Sstevel@tonic-gate if (srv) 18970Sstevel@tonic-gate (void) putbq(q, head_mp); 18980Sstevel@tonic-gate else 18990Sstevel@tonic-gate (void) putq(q, head_mp); 19000Sstevel@tonic-gate mir->mir_inrservice = B_TRUE; 19010Sstevel@tonic-gate } 19020Sstevel@tonic-gate break; 19030Sstevel@tonic-gate default: 19040Sstevel@tonic-gate RPCLOG(1, "mir_rput: unknown mir_type %d\n", 1905*4741Sgt29601 mir->mir_type); 19060Sstevel@tonic-gate freemsg(head_mp); 19070Sstevel@tonic-gate break; 19080Sstevel@tonic-gate } 19090Sstevel@tonic-gate 19100Sstevel@tonic-gate /* 19110Sstevel@tonic-gate * Reset head_mp and frag_header since we're starting on a 19120Sstevel@tonic-gate * new RPC fragment and message. 19130Sstevel@tonic-gate */ 19140Sstevel@tonic-gate head_mp = NULL; 19150Sstevel@tonic-gate tail_mp = NULL; 19160Sstevel@tonic-gate frag_header = 0; 19170Sstevel@tonic-gate } while ((mp = cont_mp) != NULL); 19180Sstevel@tonic-gate 19190Sstevel@tonic-gate /* 19200Sstevel@tonic-gate * Do a sanity check on the message length. If this message is 19210Sstevel@tonic-gate * getting excessively large, shut down the connection. 19220Sstevel@tonic-gate */ 19230Sstevel@tonic-gate if (head_mp != NULL && mir->mir_setup_complete && 1924*4741Sgt29601 mir_check_len(q, frag_len, head_mp)) 19250Sstevel@tonic-gate return; 19260Sstevel@tonic-gate 19270Sstevel@tonic-gate /* Save our local copies back in the mir structure. 
*/ 19280Sstevel@tonic-gate mir->mir_frag_header = frag_header; 19290Sstevel@tonic-gate mir->mir_frag_len = frag_len; 19300Sstevel@tonic-gate mir->mir_head_mp = head_mp; 19310Sstevel@tonic-gate mir->mir_tail_mp = tail_mp; 19320Sstevel@tonic-gate 19330Sstevel@tonic-gate /* 19340Sstevel@tonic-gate * The timer is stopped after the whole message chain is processed. 19350Sstevel@tonic-gate * The reason is that stopping the timer releases the mir_mutex 19360Sstevel@tonic-gate * lock temporarily. This means that the request can be serviced 19370Sstevel@tonic-gate * while we are still processing the message chain. This is not 19380Sstevel@tonic-gate * good. So we stop the timer here instead. 19390Sstevel@tonic-gate * 19400Sstevel@tonic-gate * Note that if the timer fires before we stop it, it will not 19410Sstevel@tonic-gate * do any harm as MIR_SVC_QUIESCED() is false and mir_timer() 19420Sstevel@tonic-gate * will just return; 19430Sstevel@tonic-gate */ 19440Sstevel@tonic-gate if (stop_timer) { 19450Sstevel@tonic-gate RPCLOG(16, "mir_do_rput stopping idle timer on 0x%p because " 19460Sstevel@tonic-gate "ref cnt going to non zero\n", (void *) WR(q)); 19470Sstevel@tonic-gate mir_svc_idle_stop(WR(q), mir); 19480Sstevel@tonic-gate } 19490Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 19500Sstevel@tonic-gate } 19510Sstevel@tonic-gate 19520Sstevel@tonic-gate static void 19530Sstevel@tonic-gate mir_rput(queue_t *q, mblk_t *mp) 19540Sstevel@tonic-gate { 19550Sstevel@tonic-gate mir_do_rput(q, mp, 0); 19560Sstevel@tonic-gate } 19570Sstevel@tonic-gate 19580Sstevel@tonic-gate static void 19590Sstevel@tonic-gate mir_rput_proto(queue_t *q, mblk_t *mp) 19600Sstevel@tonic-gate { 19610Sstevel@tonic-gate mir_t *mir = (mir_t *)q->q_ptr; 19620Sstevel@tonic-gate uint32_t type; 19630Sstevel@tonic-gate uint32_t reason = 0; 19640Sstevel@tonic-gate 19650Sstevel@tonic-gate ASSERT(MUTEX_NOT_HELD(&mir->mir_mutex)); 19660Sstevel@tonic-gate 19670Sstevel@tonic-gate type = ((union T_primitives 
*)mp->b_rptr)->type; 19680Sstevel@tonic-gate switch (mir->mir_type) { 19690Sstevel@tonic-gate case RPC_CLIENT: 19700Sstevel@tonic-gate switch (type) { 19710Sstevel@tonic-gate case T_DISCON_IND: 1972*4741Sgt29601 reason = ((struct T_discon_ind *) 1973*4741Sgt29601 (mp->b_rptr))->DISCON_reason; 19740Sstevel@tonic-gate /*FALLTHROUGH*/ 19750Sstevel@tonic-gate case T_ORDREL_IND: 19760Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 19770Sstevel@tonic-gate if (mir->mir_head_mp) { 19780Sstevel@tonic-gate freemsg(mir->mir_head_mp); 19790Sstevel@tonic-gate mir->mir_head_mp = (mblk_t *)0; 19800Sstevel@tonic-gate mir->mir_tail_mp = (mblk_t *)0; 19810Sstevel@tonic-gate } 19820Sstevel@tonic-gate /* 19830Sstevel@tonic-gate * We are disconnecting, but not necessarily 19840Sstevel@tonic-gate * closing. By not closing, we will fail to 19850Sstevel@tonic-gate * pick up a possibly changed global timeout value, 19860Sstevel@tonic-gate * unless we store it now. 19870Sstevel@tonic-gate */ 19880Sstevel@tonic-gate mir->mir_idle_timeout = clnt_idle_timeout; 19890Sstevel@tonic-gate mir_clnt_idle_stop(WR(q), mir); 19900Sstevel@tonic-gate 19910Sstevel@tonic-gate /* 19920Sstevel@tonic-gate * Even though we are unconnected, we still 19930Sstevel@tonic-gate * leave the idle timer going on the client. The 19940Sstevel@tonic-gate * reason for is that if we've disconnected due 19950Sstevel@tonic-gate * to a server-side disconnect, reset, or connection 19960Sstevel@tonic-gate * timeout, there is a possibility the client may 19970Sstevel@tonic-gate * retry the RPC request. This retry needs to done on 19980Sstevel@tonic-gate * the same bound address for the server to interpret 19990Sstevel@tonic-gate * it as such. However, we don't want 20000Sstevel@tonic-gate * to wait forever for that possibility. 
If the 20010Sstevel@tonic-gate * end-point stays unconnected for mir_idle_timeout 20020Sstevel@tonic-gate * units of time, then that is a signal to the 20030Sstevel@tonic-gate * connection manager to give up waiting for the 20040Sstevel@tonic-gate * application (eg. NFS) to send a retry. 20050Sstevel@tonic-gate */ 20060Sstevel@tonic-gate mir_clnt_idle_start(WR(q), mir); 20070Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 20080Sstevel@tonic-gate clnt_dispatch_notifyall(WR(q), type, reason); 20090Sstevel@tonic-gate freemsg(mp); 20100Sstevel@tonic-gate return; 20110Sstevel@tonic-gate case T_ERROR_ACK: 20120Sstevel@tonic-gate { 20130Sstevel@tonic-gate struct T_error_ack *terror; 20140Sstevel@tonic-gate 20150Sstevel@tonic-gate terror = (struct T_error_ack *)mp->b_rptr; 20160Sstevel@tonic-gate RPCLOG(1, "mir_rput_proto T_ERROR_ACK for queue 0x%p", 2017*4741Sgt29601 (void *)q); 20180Sstevel@tonic-gate RPCLOG(1, " ERROR_prim: %s,", 2019*4741Sgt29601 rpc_tpiprim2name(terror->ERROR_prim)); 20200Sstevel@tonic-gate RPCLOG(1, " TLI_error: %s,", 2021*4741Sgt29601 rpc_tpierr2name(terror->TLI_error)); 20220Sstevel@tonic-gate RPCLOG(1, " UNIX_error: %d\n", terror->UNIX_error); 20230Sstevel@tonic-gate if (terror->ERROR_prim == T_DISCON_REQ) { 20240Sstevel@tonic-gate clnt_dispatch_notifyall(WR(q), type, reason); 20250Sstevel@tonic-gate freemsg(mp); 20260Sstevel@tonic-gate return; 20270Sstevel@tonic-gate } else { 20280Sstevel@tonic-gate if (clnt_dispatch_notifyconn(WR(q), mp)) 20290Sstevel@tonic-gate return; 20300Sstevel@tonic-gate } 20310Sstevel@tonic-gate break; 20320Sstevel@tonic-gate } 20330Sstevel@tonic-gate case T_OK_ACK: 20340Sstevel@tonic-gate { 20350Sstevel@tonic-gate struct T_ok_ack *tok = (struct T_ok_ack *)mp->b_rptr; 20360Sstevel@tonic-gate 20370Sstevel@tonic-gate if (tok->CORRECT_prim == T_DISCON_REQ) { 20380Sstevel@tonic-gate clnt_dispatch_notifyall(WR(q), type, reason); 20390Sstevel@tonic-gate freemsg(mp); 20400Sstevel@tonic-gate return; 20410Sstevel@tonic-gate } else 
{ 20420Sstevel@tonic-gate if (clnt_dispatch_notifyconn(WR(q), mp)) 20430Sstevel@tonic-gate return; 20440Sstevel@tonic-gate } 20450Sstevel@tonic-gate break; 20460Sstevel@tonic-gate } 20470Sstevel@tonic-gate case T_CONN_CON: 20480Sstevel@tonic-gate case T_INFO_ACK: 20490Sstevel@tonic-gate case T_OPTMGMT_ACK: 20500Sstevel@tonic-gate if (clnt_dispatch_notifyconn(WR(q), mp)) 20510Sstevel@tonic-gate return; 20520Sstevel@tonic-gate break; 20530Sstevel@tonic-gate case T_BIND_ACK: 20540Sstevel@tonic-gate break; 20550Sstevel@tonic-gate default: 20560Sstevel@tonic-gate RPCLOG(1, "mir_rput: unexpected message %d " 20570Sstevel@tonic-gate "for KRPC client\n", 20580Sstevel@tonic-gate ((union T_primitives *)mp->b_rptr)->type); 20590Sstevel@tonic-gate break; 20600Sstevel@tonic-gate } 20610Sstevel@tonic-gate break; 20620Sstevel@tonic-gate 20630Sstevel@tonic-gate case RPC_SERVER: 20640Sstevel@tonic-gate switch (type) { 20650Sstevel@tonic-gate case T_BIND_ACK: 20660Sstevel@tonic-gate { 20670Sstevel@tonic-gate struct T_bind_ack *tbind; 20680Sstevel@tonic-gate 20690Sstevel@tonic-gate /* 20700Sstevel@tonic-gate * If this is a listening stream, then shut 20710Sstevel@tonic-gate * off the idle timer. 20720Sstevel@tonic-gate */ 20730Sstevel@tonic-gate tbind = (struct T_bind_ack *)mp->b_rptr; 20740Sstevel@tonic-gate if (tbind->CONIND_number > 0) { 20750Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 20760Sstevel@tonic-gate mir_svc_idle_stop(WR(q), mir); 20770Sstevel@tonic-gate 20780Sstevel@tonic-gate /* 20790Sstevel@tonic-gate * mark this as a listen endpoint 20800Sstevel@tonic-gate * for special handling. 
20810Sstevel@tonic-gate */ 20820Sstevel@tonic-gate 20830Sstevel@tonic-gate mir->mir_listen_stream = 1; 20840Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 20850Sstevel@tonic-gate } 20860Sstevel@tonic-gate break; 20870Sstevel@tonic-gate } 20880Sstevel@tonic-gate case T_DISCON_IND: 20890Sstevel@tonic-gate case T_ORDREL_IND: 20900Sstevel@tonic-gate RPCLOG(16, "mir_rput_proto: got %s indication\n", 2091*4741Sgt29601 type == T_DISCON_IND ? "disconnect" 2092*4741Sgt29601 : "orderly release"); 20930Sstevel@tonic-gate 20940Sstevel@tonic-gate /* 20950Sstevel@tonic-gate * For listen endpoint just pass 20960Sstevel@tonic-gate * on the message. 20970Sstevel@tonic-gate */ 20980Sstevel@tonic-gate 20990Sstevel@tonic-gate if (mir->mir_listen_stream) 21000Sstevel@tonic-gate break; 21010Sstevel@tonic-gate 21020Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 21030Sstevel@tonic-gate 21040Sstevel@tonic-gate /* 21050Sstevel@tonic-gate * If client wants to break off connection, record 21060Sstevel@tonic-gate * that fact. 21070Sstevel@tonic-gate */ 21080Sstevel@tonic-gate mir_svc_start_close(WR(q), mir); 21090Sstevel@tonic-gate 21100Sstevel@tonic-gate /* 21110Sstevel@tonic-gate * If we are idle, then send the orderly release 21120Sstevel@tonic-gate * or disconnect indication to nfsd. 21130Sstevel@tonic-gate */ 21140Sstevel@tonic-gate if (MIR_SVC_QUIESCED(mir)) { 21150Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 21160Sstevel@tonic-gate break; 21170Sstevel@tonic-gate } 21180Sstevel@tonic-gate 21190Sstevel@tonic-gate RPCLOG(16, "mir_rput_proto: not idle, so " 2120*4741Sgt29601 "disconnect/ord rel indication not passed " 2121*4741Sgt29601 "upstream on 0x%p\n", (void *)q); 21220Sstevel@tonic-gate 21230Sstevel@tonic-gate /* 21240Sstevel@tonic-gate * Hold the indication until we get idle 21250Sstevel@tonic-gate * If there already is an indication stored, 21260Sstevel@tonic-gate * replace it if the new one is a disconnect. 
The 21270Sstevel@tonic-gate * reasoning is that disconnection takes less time 21280Sstevel@tonic-gate * to process, and once a client decides to 21290Sstevel@tonic-gate * disconnect, we should do that. 21300Sstevel@tonic-gate */ 21310Sstevel@tonic-gate if (mir->mir_svc_pend_mp) { 21320Sstevel@tonic-gate if (type == T_DISCON_IND) { 21330Sstevel@tonic-gate RPCLOG(16, "mir_rput_proto: replacing" 21340Sstevel@tonic-gate " held disconnect/ord rel" 21350Sstevel@tonic-gate " indication with disconnect on" 21360Sstevel@tonic-gate " 0x%p\n", (void *)q); 21370Sstevel@tonic-gate 21380Sstevel@tonic-gate freemsg(mir->mir_svc_pend_mp); 21390Sstevel@tonic-gate mir->mir_svc_pend_mp = mp; 21400Sstevel@tonic-gate } else { 21410Sstevel@tonic-gate RPCLOG(16, "mir_rput_proto: already " 21420Sstevel@tonic-gate "held a disconnect/ord rel " 21430Sstevel@tonic-gate "indication. freeing ord rel " 21440Sstevel@tonic-gate "ind on 0x%p\n", (void *)q); 21450Sstevel@tonic-gate freemsg(mp); 21460Sstevel@tonic-gate } 21470Sstevel@tonic-gate } else 21480Sstevel@tonic-gate mir->mir_svc_pend_mp = mp; 21490Sstevel@tonic-gate 21500Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 21510Sstevel@tonic-gate return; 21520Sstevel@tonic-gate 21530Sstevel@tonic-gate default: 21540Sstevel@tonic-gate /* nfsd handles server-side non-data messages. */ 21550Sstevel@tonic-gate break; 21560Sstevel@tonic-gate } 21570Sstevel@tonic-gate break; 21580Sstevel@tonic-gate 21590Sstevel@tonic-gate default: 21600Sstevel@tonic-gate break; 21610Sstevel@tonic-gate } 21620Sstevel@tonic-gate 21630Sstevel@tonic-gate putnext(q, mp); 21640Sstevel@tonic-gate } 21650Sstevel@tonic-gate 21660Sstevel@tonic-gate /* 21670Sstevel@tonic-gate * The server-side read queues are used to hold inbound messages while 21680Sstevel@tonic-gate * outbound flow control is exerted. When outbound flow control is 21690Sstevel@tonic-gate * relieved, mir_wsrv qenables the read-side queue. 
Read-side queues
 * are not enabled by STREAMS and are explicitly noenable'ed in mir_open.
 *
 * For the server side, we have two types of messages queued. The first type
 * are messages that are ready to be XDR decoded and then sent to the
 * RPC program's dispatch routine. The second type are "raw" messages that
 * haven't been processed, i.e. assembled from rpc record fragments into
 * full requests. The only time we will see the second type of message
 * queued is if we have a memory allocation failure while processing a
 * raw message. The field mir_first_non_processed_mblk will mark the
 * first such raw message. So the flow for server side is:
 *
 *	- send processed queued messages to kRPC until we run out or find
 *	  one that needs additional processing because we were short on memory
 *	  earlier
 *	- process a message that was deferred because of lack of
 *	  memory
 *	- continue processing messages until the queue empties or we
 *	  have to stop because of lack of memory
 *	- during each of the above phases, if the queue is empty and
 *	  there are no pending messages that were passed to the RPC
 *	  layer, send upstream the pending disconnect/ordrel indication if
 *	  there is one
 *
 * The read-side queue is also enabled by a bufcall callback if dupmsg
 * fails in mir_rput.
21950Sstevel@tonic-gate */ 21960Sstevel@tonic-gate static void 21970Sstevel@tonic-gate mir_rsrv(queue_t *q) 21980Sstevel@tonic-gate { 21990Sstevel@tonic-gate mir_t *mir; 22000Sstevel@tonic-gate mblk_t *mp; 22010Sstevel@tonic-gate mblk_t *cmp = NULL; 22020Sstevel@tonic-gate boolean_t stop_timer = B_FALSE; 22030Sstevel@tonic-gate 22040Sstevel@tonic-gate mir = (mir_t *)q->q_ptr; 22050Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 22060Sstevel@tonic-gate 22070Sstevel@tonic-gate mp = NULL; 22080Sstevel@tonic-gate switch (mir->mir_type) { 22090Sstevel@tonic-gate case RPC_SERVER: 22100Sstevel@tonic-gate if (mir->mir_ref_cnt == 0) 22110Sstevel@tonic-gate mir->mir_hold_inbound = 0; 22120Sstevel@tonic-gate if (mir->mir_hold_inbound) { 22130Sstevel@tonic-gate 22140Sstevel@tonic-gate ASSERT(cmp == NULL); 22150Sstevel@tonic-gate if (q->q_first == NULL) { 22160Sstevel@tonic-gate 22170Sstevel@tonic-gate MIR_CLEAR_INRSRV(mir); 22180Sstevel@tonic-gate 22190Sstevel@tonic-gate if (MIR_SVC_QUIESCED(mir)) { 22200Sstevel@tonic-gate cmp = mir->mir_svc_pend_mp; 22210Sstevel@tonic-gate mir->mir_svc_pend_mp = NULL; 22220Sstevel@tonic-gate } 22230Sstevel@tonic-gate } 22240Sstevel@tonic-gate 22250Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 22260Sstevel@tonic-gate 22270Sstevel@tonic-gate if (cmp != NULL) { 22280Sstevel@tonic-gate RPCLOG(16, "mir_rsrv: line %d: sending a held " 22290Sstevel@tonic-gate "disconnect/ord rel indication upstream\n", 22300Sstevel@tonic-gate __LINE__); 22310Sstevel@tonic-gate putnext(q, cmp); 22320Sstevel@tonic-gate } 22330Sstevel@tonic-gate 22340Sstevel@tonic-gate return; 22350Sstevel@tonic-gate } 22360Sstevel@tonic-gate while (mp = getq(q)) { 2237*4741Sgt29601 if (mir->mir_krpc_cell && 2238*4741Sgt29601 (mir->mir_svc_no_more_msgs == 0)) { 22390Sstevel@tonic-gate /* 22400Sstevel@tonic-gate * If we were idle, turn off idle timer since 22410Sstevel@tonic-gate * we aren't idle any more. 
22420Sstevel@tonic-gate */ 22430Sstevel@tonic-gate if (mir->mir_ref_cnt++ == 0) 22440Sstevel@tonic-gate stop_timer = B_TRUE; 22450Sstevel@tonic-gate if (mir_check_len(q, 2246*4741Sgt29601 (int32_t)msgdsize(mp), mp)) 2247*4741Sgt29601 return; 22480Sstevel@tonic-gate svc_queuereq(q, mp); 22490Sstevel@tonic-gate } else { 22500Sstevel@tonic-gate /* 22510Sstevel@tonic-gate * Count # of times this happens. Should be 22520Sstevel@tonic-gate * never, but experience shows otherwise. 22530Sstevel@tonic-gate */ 2254*4741Sgt29601 if (mir->mir_krpc_cell == NULL) 2255*4741Sgt29601 mir_krpc_cell_null++; 22560Sstevel@tonic-gate freemsg(mp); 22570Sstevel@tonic-gate } 22580Sstevel@tonic-gate } 22590Sstevel@tonic-gate break; 22600Sstevel@tonic-gate case RPC_CLIENT: 22610Sstevel@tonic-gate break; 22620Sstevel@tonic-gate default: 22630Sstevel@tonic-gate RPCLOG(1, "mir_rsrv: unexpected mir_type %d\n", mir->mir_type); 22640Sstevel@tonic-gate 22650Sstevel@tonic-gate if (q->q_first == NULL) 22660Sstevel@tonic-gate MIR_CLEAR_INRSRV(mir); 22670Sstevel@tonic-gate 22680Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 22690Sstevel@tonic-gate 22700Sstevel@tonic-gate return; 22710Sstevel@tonic-gate } 22720Sstevel@tonic-gate 22730Sstevel@tonic-gate /* 22740Sstevel@tonic-gate * The timer is stopped after all the messages are processed. 22750Sstevel@tonic-gate * The reason is that stopping the timer releases the mir_mutex 22760Sstevel@tonic-gate * lock temporarily. This means that the request can be serviced 22770Sstevel@tonic-gate * while we are still processing the message queue. This is not 22780Sstevel@tonic-gate * good. So we stop the timer here instead. 
22790Sstevel@tonic-gate */ 22800Sstevel@tonic-gate if (stop_timer) { 22810Sstevel@tonic-gate RPCLOG(16, "mir_rsrv stopping idle timer on 0x%p because ref " 22820Sstevel@tonic-gate "cnt going to non zero\n", (void *)WR(q)); 22830Sstevel@tonic-gate mir_svc_idle_stop(WR(q), mir); 22840Sstevel@tonic-gate } 22850Sstevel@tonic-gate 22860Sstevel@tonic-gate if (q->q_first == NULL) { 22870Sstevel@tonic-gate 22880Sstevel@tonic-gate MIR_CLEAR_INRSRV(mir); 22890Sstevel@tonic-gate 22900Sstevel@tonic-gate ASSERT(cmp == NULL); 22910Sstevel@tonic-gate if (mir->mir_type == RPC_SERVER && MIR_SVC_QUIESCED(mir)) { 22920Sstevel@tonic-gate cmp = mir->mir_svc_pend_mp; 22930Sstevel@tonic-gate mir->mir_svc_pend_mp = NULL; 22940Sstevel@tonic-gate } 22950Sstevel@tonic-gate 22960Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 22970Sstevel@tonic-gate 22980Sstevel@tonic-gate if (cmp != NULL) { 22990Sstevel@tonic-gate RPCLOG(16, "mir_rsrv: line %d: sending a held " 2300*4741Sgt29601 "disconnect/ord rel indication upstream\n", 2301*4741Sgt29601 __LINE__); 23020Sstevel@tonic-gate putnext(q, cmp); 23030Sstevel@tonic-gate } 23040Sstevel@tonic-gate 23050Sstevel@tonic-gate return; 23060Sstevel@tonic-gate } 23070Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 23080Sstevel@tonic-gate } 23090Sstevel@tonic-gate 23100Sstevel@tonic-gate static int mir_svc_policy_fails; 23110Sstevel@tonic-gate 23120Sstevel@tonic-gate /* 23130Sstevel@tonic-gate * Called to send an event code to nfsd/lockd so that it initiates 23140Sstevel@tonic-gate * connection close. 
23150Sstevel@tonic-gate */ 23160Sstevel@tonic-gate static int 23170Sstevel@tonic-gate mir_svc_policy_notify(queue_t *q, int event) 23180Sstevel@tonic-gate { 23190Sstevel@tonic-gate mblk_t *mp; 23200Sstevel@tonic-gate #ifdef DEBUG 23210Sstevel@tonic-gate mir_t *mir = (mir_t *)q->q_ptr; 23220Sstevel@tonic-gate ASSERT(MUTEX_NOT_HELD(&mir->mir_mutex)); 23230Sstevel@tonic-gate #endif 23240Sstevel@tonic-gate ASSERT(q->q_flag & QREADR); 23250Sstevel@tonic-gate 23260Sstevel@tonic-gate /* 23270Sstevel@tonic-gate * Create an M_DATA message with the event code and pass it to the 23280Sstevel@tonic-gate * Stream head (nfsd or whoever created the stream will consume it). 23290Sstevel@tonic-gate */ 23300Sstevel@tonic-gate mp = allocb(sizeof (int), BPRI_HI); 23310Sstevel@tonic-gate 23320Sstevel@tonic-gate if (!mp) { 23330Sstevel@tonic-gate 23340Sstevel@tonic-gate mir_svc_policy_fails++; 23350Sstevel@tonic-gate RPCLOG(16, "mir_svc_policy_notify: could not allocate event " 2336*4741Sgt29601 "%d\n", event); 23370Sstevel@tonic-gate return (ENOMEM); 23380Sstevel@tonic-gate } 23390Sstevel@tonic-gate 23400Sstevel@tonic-gate U32_TO_BE32(event, mp->b_rptr); 23410Sstevel@tonic-gate mp->b_wptr = mp->b_rptr + sizeof (int); 23420Sstevel@tonic-gate putnext(q, mp); 23430Sstevel@tonic-gate return (0); 23440Sstevel@tonic-gate } 23450Sstevel@tonic-gate 23460Sstevel@tonic-gate /* 23470Sstevel@tonic-gate * Server side: start the close phase. We want to get this rpcmod slot in an 23480Sstevel@tonic-gate * idle state before mir_close() is called. 
23490Sstevel@tonic-gate */ 23500Sstevel@tonic-gate static void 23510Sstevel@tonic-gate mir_svc_start_close(queue_t *wq, mir_t *mir) 23520Sstevel@tonic-gate { 23530Sstevel@tonic-gate ASSERT(MUTEX_HELD(&mir->mir_mutex)); 23540Sstevel@tonic-gate ASSERT((wq->q_flag & QREADR) == 0); 23550Sstevel@tonic-gate ASSERT(mir->mir_type == RPC_SERVER); 23560Sstevel@tonic-gate 23570Sstevel@tonic-gate 23580Sstevel@tonic-gate /* 23590Sstevel@tonic-gate * Do not accept any more messages. 23600Sstevel@tonic-gate */ 23610Sstevel@tonic-gate mir->mir_svc_no_more_msgs = 1; 23620Sstevel@tonic-gate 23630Sstevel@tonic-gate /* 23640Sstevel@tonic-gate * Next two statements will make the read service procedure invoke 23650Sstevel@tonic-gate * svc_queuereq() on everything stuck in the streams read queue. 23660Sstevel@tonic-gate * It's not necessary because enabling the write queue will 23670Sstevel@tonic-gate * have the same effect, but why not speed the process along? 23680Sstevel@tonic-gate */ 23690Sstevel@tonic-gate mir->mir_hold_inbound = 0; 23700Sstevel@tonic-gate qenable(RD(wq)); 23710Sstevel@tonic-gate 23720Sstevel@tonic-gate /* 23730Sstevel@tonic-gate * Meanwhile force the write service procedure to send the 23740Sstevel@tonic-gate * responses downstream, regardless of flow control. 23750Sstevel@tonic-gate */ 23760Sstevel@tonic-gate qenable(wq); 23770Sstevel@tonic-gate } 23780Sstevel@tonic-gate 23790Sstevel@tonic-gate /* 23800Sstevel@tonic-gate * This routine is called directly by KRPC after a request is completed, 23810Sstevel@tonic-gate * whether a reply was sent or the request was dropped. 
23820Sstevel@tonic-gate */ 23830Sstevel@tonic-gate static void 23840Sstevel@tonic-gate mir_svc_release(queue_t *wq, mblk_t *mp) 23850Sstevel@tonic-gate { 23860Sstevel@tonic-gate mir_t *mir = (mir_t *)wq->q_ptr; 23870Sstevel@tonic-gate mblk_t *cmp = NULL; 23880Sstevel@tonic-gate 23890Sstevel@tonic-gate ASSERT((wq->q_flag & QREADR) == 0); 23900Sstevel@tonic-gate if (mp) 23910Sstevel@tonic-gate freemsg(mp); 23920Sstevel@tonic-gate 23930Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 23940Sstevel@tonic-gate 23950Sstevel@tonic-gate /* 23960Sstevel@tonic-gate * Start idle processing if this is the last reference. 23970Sstevel@tonic-gate */ 23982610Smaheshvs if ((mir->mir_ref_cnt == 1) && (mir->mir_inrservice == 0)) { 23990Sstevel@tonic-gate 24000Sstevel@tonic-gate RPCLOG(16, "mir_svc_release starting idle timer on 0x%p " 24010Sstevel@tonic-gate "because ref cnt is zero\n", (void *) wq); 24020Sstevel@tonic-gate 24030Sstevel@tonic-gate cmp = mir->mir_svc_pend_mp; 24040Sstevel@tonic-gate mir->mir_svc_pend_mp = NULL; 24050Sstevel@tonic-gate mir_svc_idle_start(wq, mir); 24060Sstevel@tonic-gate } 24070Sstevel@tonic-gate 24082610Smaheshvs mir->mir_ref_cnt--; 24092610Smaheshvs ASSERT(mir->mir_ref_cnt >= 0); 24102610Smaheshvs 24112610Smaheshvs /* 24122610Smaheshvs * Wake up the thread waiting to close. 
24132610Smaheshvs */ 24142610Smaheshvs 24152610Smaheshvs if ((mir->mir_ref_cnt == 0) && mir->mir_closing) 24162610Smaheshvs cv_signal(&mir->mir_condvar); 24172610Smaheshvs 24180Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 24190Sstevel@tonic-gate 24200Sstevel@tonic-gate if (cmp) { 24210Sstevel@tonic-gate RPCLOG(16, "mir_svc_release: sending a held " 24220Sstevel@tonic-gate "disconnect/ord rel indication upstream on queue 0x%p\n", 24230Sstevel@tonic-gate (void *)RD(wq)); 24240Sstevel@tonic-gate 24250Sstevel@tonic-gate putnext(RD(wq), cmp); 24260Sstevel@tonic-gate } 24270Sstevel@tonic-gate } 24280Sstevel@tonic-gate 24290Sstevel@tonic-gate /* 24300Sstevel@tonic-gate * This routine is called by server-side KRPC when it is ready to 24310Sstevel@tonic-gate * handle inbound messages on the stream. 24320Sstevel@tonic-gate */ 24330Sstevel@tonic-gate static void 24340Sstevel@tonic-gate mir_svc_start(queue_t *wq) 24350Sstevel@tonic-gate { 24360Sstevel@tonic-gate mir_t *mir = (mir_t *)wq->q_ptr; 24370Sstevel@tonic-gate 24382470Sgt29601 /* 24392470Sgt29601 * no longer need to take the mir_mutex because the 24402470Sgt29601 * mir_setup_complete field has been moved out of 24412470Sgt29601 * the binary field protected by the mir_mutex. 24422470Sgt29601 */ 24432470Sgt29601 24440Sstevel@tonic-gate mir->mir_setup_complete = 1; 24450Sstevel@tonic-gate qenable(RD(wq)); 24460Sstevel@tonic-gate } 24470Sstevel@tonic-gate 24480Sstevel@tonic-gate /* 24490Sstevel@tonic-gate * client side wrapper for stopping timer with normal idle timeout. 
24500Sstevel@tonic-gate */ 24510Sstevel@tonic-gate static void 24520Sstevel@tonic-gate mir_clnt_idle_stop(queue_t *wq, mir_t *mir) 24530Sstevel@tonic-gate { 24540Sstevel@tonic-gate ASSERT(MUTEX_HELD(&mir->mir_mutex)); 24550Sstevel@tonic-gate ASSERT((wq->q_flag & QREADR) == 0); 24560Sstevel@tonic-gate ASSERT(mir->mir_type == RPC_CLIENT); 24570Sstevel@tonic-gate 24580Sstevel@tonic-gate mir_timer_stop(mir); 24590Sstevel@tonic-gate } 24600Sstevel@tonic-gate 24610Sstevel@tonic-gate /* 24620Sstevel@tonic-gate * client side wrapper for stopping timer with normal idle timeout. 24630Sstevel@tonic-gate */ 24640Sstevel@tonic-gate static void 24650Sstevel@tonic-gate mir_clnt_idle_start(queue_t *wq, mir_t *mir) 24660Sstevel@tonic-gate { 24670Sstevel@tonic-gate ASSERT(MUTEX_HELD(&mir->mir_mutex)); 24680Sstevel@tonic-gate ASSERT((wq->q_flag & QREADR) == 0); 24690Sstevel@tonic-gate ASSERT(mir->mir_type == RPC_CLIENT); 24700Sstevel@tonic-gate 24710Sstevel@tonic-gate mir_timer_start(wq, mir, mir->mir_idle_timeout); 24720Sstevel@tonic-gate } 24730Sstevel@tonic-gate 24740Sstevel@tonic-gate /* 24750Sstevel@tonic-gate * client side only. Forces rpcmod to stop sending T_ORDREL_REQs on 24760Sstevel@tonic-gate * end-points that aren't connected. 24770Sstevel@tonic-gate */ 24780Sstevel@tonic-gate static void 24790Sstevel@tonic-gate mir_clnt_idle_do_stop(queue_t *wq) 24800Sstevel@tonic-gate { 24810Sstevel@tonic-gate mir_t *mir = (mir_t *)wq->q_ptr; 24820Sstevel@tonic-gate 24830Sstevel@tonic-gate RPCLOG(1, "mir_clnt_idle_do_stop: wq 0x%p\n", (void *)wq); 24840Sstevel@tonic-gate ASSERT(MUTEX_NOT_HELD(&mir->mir_mutex)); 24850Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 24860Sstevel@tonic-gate mir_clnt_idle_stop(wq, mir); 24870Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 24880Sstevel@tonic-gate } 24890Sstevel@tonic-gate 24900Sstevel@tonic-gate /* 24910Sstevel@tonic-gate * Timer handler. It handles idle timeout and memory shortage problem. 
24920Sstevel@tonic-gate */ 24930Sstevel@tonic-gate static void 24940Sstevel@tonic-gate mir_timer(void *arg) 24950Sstevel@tonic-gate { 24960Sstevel@tonic-gate queue_t *wq = (queue_t *)arg; 24970Sstevel@tonic-gate mir_t *mir = (mir_t *)wq->q_ptr; 24980Sstevel@tonic-gate boolean_t notify; 24990Sstevel@tonic-gate 25000Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 25010Sstevel@tonic-gate 25020Sstevel@tonic-gate /* 25030Sstevel@tonic-gate * mir_timer_call is set only when either mir_timer_[start|stop] 25040Sstevel@tonic-gate * is progressing. And mir_timer() can only be run while they 25050Sstevel@tonic-gate * are progressing if the timer is being stopped. So just 25060Sstevel@tonic-gate * return. 25070Sstevel@tonic-gate */ 25080Sstevel@tonic-gate if (mir->mir_timer_call) { 25090Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 25100Sstevel@tonic-gate return; 25110Sstevel@tonic-gate } 25120Sstevel@tonic-gate mir->mir_timer_id = 0; 25130Sstevel@tonic-gate 25140Sstevel@tonic-gate switch (mir->mir_type) { 25150Sstevel@tonic-gate case RPC_CLIENT: 25160Sstevel@tonic-gate 25170Sstevel@tonic-gate /* 25180Sstevel@tonic-gate * For clients, the timer fires at clnt_idle_timeout 25190Sstevel@tonic-gate * intervals. If the activity marker (mir_clntreq) is 25200Sstevel@tonic-gate * zero, then the stream has been idle since the last 25210Sstevel@tonic-gate * timer event and we notify KRPC. If mir_clntreq is 25220Sstevel@tonic-gate * non-zero, then the stream is active and we just 25230Sstevel@tonic-gate * restart the timer for another interval. mir_clntreq 25240Sstevel@tonic-gate * is set to 1 in mir_wput for every request passed 25250Sstevel@tonic-gate * downstream. 25260Sstevel@tonic-gate * 25270Sstevel@tonic-gate * If this was a memory shortage timer reset the idle 25280Sstevel@tonic-gate * timeout regardless; the mir_clntreq will not be a 25290Sstevel@tonic-gate * valid indicator. 
25300Sstevel@tonic-gate * 25310Sstevel@tonic-gate * The timer is initially started in mir_wput during 25320Sstevel@tonic-gate * RPC_CLIENT ioctl processing. 25330Sstevel@tonic-gate * 25340Sstevel@tonic-gate * The timer interval can be changed for individual 25350Sstevel@tonic-gate * streams with the ND variable "mir_idle_timeout". 25360Sstevel@tonic-gate */ 25370Sstevel@tonic-gate if (mir->mir_clntreq > 0 && mir->mir_use_timestamp + 25380Sstevel@tonic-gate MSEC_TO_TICK(mir->mir_idle_timeout) - lbolt >= 0) { 25390Sstevel@tonic-gate clock_t tout; 25400Sstevel@tonic-gate 25410Sstevel@tonic-gate tout = mir->mir_idle_timeout - 2542*4741Sgt29601 TICK_TO_MSEC(lbolt - mir->mir_use_timestamp); 25430Sstevel@tonic-gate if (tout < 0) 25440Sstevel@tonic-gate tout = 1000; 25450Sstevel@tonic-gate #if 0 2546*4741Sgt29601 printf("mir_timer[%d < %d + %d]: reset client timer " 2547*4741Sgt29601 "to %d (ms)\n", TICK_TO_MSEC(lbolt), 2548*4741Sgt29601 TICK_TO_MSEC(mir->mir_use_timestamp), 2549*4741Sgt29601 mir->mir_idle_timeout, tout); 25500Sstevel@tonic-gate #endif 25510Sstevel@tonic-gate mir->mir_clntreq = 0; 25520Sstevel@tonic-gate mir_timer_start(wq, mir, tout); 25530Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 25540Sstevel@tonic-gate return; 25550Sstevel@tonic-gate } 25560Sstevel@tonic-gate #if 0 25570Sstevel@tonic-gate printf("mir_timer[%d]: doing client timeout\n", lbolt / hz); 25580Sstevel@tonic-gate #endif 25590Sstevel@tonic-gate /* 25600Sstevel@tonic-gate * We are disconnecting, but not necessarily 25610Sstevel@tonic-gate * closing. By not closing, we will fail to 25620Sstevel@tonic-gate * pick up a possibly changed global timeout value, 25630Sstevel@tonic-gate * unless we store it now. 
25640Sstevel@tonic-gate */ 25650Sstevel@tonic-gate mir->mir_idle_timeout = clnt_idle_timeout; 25660Sstevel@tonic-gate mir_clnt_idle_start(wq, mir); 25670Sstevel@tonic-gate 25680Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 25690Sstevel@tonic-gate /* 25700Sstevel@tonic-gate * We pass T_ORDREL_REQ as an integer value 25710Sstevel@tonic-gate * to KRPC as the indication that the stream 25720Sstevel@tonic-gate * is idle. This is not a T_ORDREL_REQ message, 25730Sstevel@tonic-gate * it is just a convenient value since we call 25740Sstevel@tonic-gate * the same KRPC routine for T_ORDREL_INDs and 25750Sstevel@tonic-gate * T_DISCON_INDs. 25760Sstevel@tonic-gate */ 25770Sstevel@tonic-gate clnt_dispatch_notifyall(wq, T_ORDREL_REQ, 0); 25780Sstevel@tonic-gate return; 25790Sstevel@tonic-gate 25800Sstevel@tonic-gate case RPC_SERVER: 25810Sstevel@tonic-gate 25820Sstevel@tonic-gate /* 25830Sstevel@tonic-gate * For servers, the timer is only running when the stream 25840Sstevel@tonic-gate * is really idle or memory is short. The timer is started 25850Sstevel@tonic-gate * by mir_wput when mir_type is set to RPC_SERVER and 25860Sstevel@tonic-gate * by mir_svc_idle_start whenever the stream goes idle 25870Sstevel@tonic-gate * (mir_ref_cnt == 0). The timer is cancelled in 25880Sstevel@tonic-gate * mir_rput whenever a new inbound request is passed to KRPC 25890Sstevel@tonic-gate * and the stream was previously idle. 25900Sstevel@tonic-gate * 25910Sstevel@tonic-gate * The timer interval can be changed for individual 25920Sstevel@tonic-gate * streams with the ND variable "mir_idle_timeout". 25930Sstevel@tonic-gate * 25940Sstevel@tonic-gate * If the stream is not idle do nothing. 
25950Sstevel@tonic-gate */ 25960Sstevel@tonic-gate if (!MIR_SVC_QUIESCED(mir)) { 25970Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 25980Sstevel@tonic-gate return; 25990Sstevel@tonic-gate } 26000Sstevel@tonic-gate 26010Sstevel@tonic-gate notify = !mir->mir_inrservice; 26020Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 26030Sstevel@tonic-gate 26040Sstevel@tonic-gate /* 26050Sstevel@tonic-gate * If there is no packet queued up in read queue, the stream 26060Sstevel@tonic-gate * is really idle so notify nfsd to close it. 26070Sstevel@tonic-gate */ 26080Sstevel@tonic-gate if (notify) { 26090Sstevel@tonic-gate RPCLOG(16, "mir_timer: telling stream head listener " 26100Sstevel@tonic-gate "to close stream (0x%p)\n", (void *) RD(wq)); 26110Sstevel@tonic-gate (void) mir_svc_policy_notify(RD(wq), 1); 26120Sstevel@tonic-gate } 26130Sstevel@tonic-gate return; 26140Sstevel@tonic-gate default: 26150Sstevel@tonic-gate RPCLOG(1, "mir_timer: unexpected mir_type %d\n", 2616*4741Sgt29601 mir->mir_type); 26170Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 26180Sstevel@tonic-gate return; 26190Sstevel@tonic-gate } 26200Sstevel@tonic-gate } 26210Sstevel@tonic-gate 26220Sstevel@tonic-gate /* 26230Sstevel@tonic-gate * Called by the RPC package to send either a call or a return, or a 26240Sstevel@tonic-gate * transport connection request. Adds the record marking header. 
26250Sstevel@tonic-gate */ 26260Sstevel@tonic-gate static void 26270Sstevel@tonic-gate mir_wput(queue_t *q, mblk_t *mp) 26280Sstevel@tonic-gate { 26290Sstevel@tonic-gate uint_t frag_header; 26300Sstevel@tonic-gate mir_t *mir = (mir_t *)q->q_ptr; 26310Sstevel@tonic-gate uchar_t *rptr = mp->b_rptr; 26320Sstevel@tonic-gate 26330Sstevel@tonic-gate if (!mir) { 26340Sstevel@tonic-gate freemsg(mp); 26350Sstevel@tonic-gate return; 26360Sstevel@tonic-gate } 26370Sstevel@tonic-gate 26380Sstevel@tonic-gate if (mp->b_datap->db_type != M_DATA) { 26390Sstevel@tonic-gate mir_wput_other(q, mp); 26400Sstevel@tonic-gate return; 26410Sstevel@tonic-gate } 26420Sstevel@tonic-gate 26430Sstevel@tonic-gate if (mir->mir_ordrel_pending == 1) { 26440Sstevel@tonic-gate freemsg(mp); 26450Sstevel@tonic-gate RPCLOG(16, "mir_wput wq 0x%p: got data after T_ORDREL_REQ\n", 2646*4741Sgt29601 (void *)q); 26470Sstevel@tonic-gate return; 26480Sstevel@tonic-gate } 26490Sstevel@tonic-gate 26500Sstevel@tonic-gate frag_header = (uint_t)DLEN(mp); 26510Sstevel@tonic-gate frag_header |= MIR_LASTFRAG; 26520Sstevel@tonic-gate 26530Sstevel@tonic-gate /* Stick in the 4 byte record marking header. */ 26540Sstevel@tonic-gate if ((rptr - mp->b_datap->db_base) < sizeof (uint32_t) || 26550Sstevel@tonic-gate !IS_P2ALIGNED(mp->b_rptr, sizeof (uint32_t))) { 26560Sstevel@tonic-gate /* 26570Sstevel@tonic-gate * Since we know that M_DATA messages are created exclusively 26580Sstevel@tonic-gate * by KRPC, we expect that KRPC will leave room for our header 26590Sstevel@tonic-gate * and 4 byte align which is normal for XDR. 26600Sstevel@tonic-gate * If KRPC (or someone else) does not cooperate, then we 26610Sstevel@tonic-gate * just throw away the message. 
26620Sstevel@tonic-gate */ 26630Sstevel@tonic-gate RPCLOG(1, "mir_wput: KRPC did not leave space for record " 26640Sstevel@tonic-gate "fragment header (%d bytes left)\n", 26650Sstevel@tonic-gate (int)(rptr - mp->b_datap->db_base)); 26660Sstevel@tonic-gate freemsg(mp); 26670Sstevel@tonic-gate return; 26680Sstevel@tonic-gate } 26690Sstevel@tonic-gate rptr -= sizeof (uint32_t); 26700Sstevel@tonic-gate *(uint32_t *)rptr = htonl(frag_header); 26710Sstevel@tonic-gate mp->b_rptr = rptr; 26720Sstevel@tonic-gate 26730Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 26740Sstevel@tonic-gate if (mir->mir_type == RPC_CLIENT) { 26750Sstevel@tonic-gate /* 26760Sstevel@tonic-gate * For the client, set mir_clntreq to indicate that the 26770Sstevel@tonic-gate * connection is active. 26780Sstevel@tonic-gate */ 26790Sstevel@tonic-gate mir->mir_clntreq = 1; 26800Sstevel@tonic-gate mir->mir_use_timestamp = lbolt; 26810Sstevel@tonic-gate } 26820Sstevel@tonic-gate 26830Sstevel@tonic-gate /* 26840Sstevel@tonic-gate * If we haven't already queued some data and the downstream module 26850Sstevel@tonic-gate * can accept more data, send it on, otherwise we queue the message 26860Sstevel@tonic-gate * and take other actions depending on mir_type. 26870Sstevel@tonic-gate */ 26880Sstevel@tonic-gate if (!mir->mir_inwservice && MIR_WCANPUTNEXT(mir, q)) { 26890Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 26900Sstevel@tonic-gate 26910Sstevel@tonic-gate /* 26920Sstevel@tonic-gate * Now we pass the RPC message downstream. 26930Sstevel@tonic-gate */ 26940Sstevel@tonic-gate putnext(q, mp); 26950Sstevel@tonic-gate return; 26960Sstevel@tonic-gate } 26970Sstevel@tonic-gate 26980Sstevel@tonic-gate switch (mir->mir_type) { 26990Sstevel@tonic-gate case RPC_CLIENT: 27000Sstevel@tonic-gate /* 27010Sstevel@tonic-gate * Check for a previous duplicate request on the 27020Sstevel@tonic-gate * queue. 
If there is one, then we throw away 27030Sstevel@tonic-gate * the current message and let the previous one 27040Sstevel@tonic-gate * go through. If we can't find a duplicate, then 27050Sstevel@tonic-gate * send this one. This tap dance is an effort 27060Sstevel@tonic-gate * to reduce traffic and processing requirements 27070Sstevel@tonic-gate * under load conditions. 27080Sstevel@tonic-gate */ 27090Sstevel@tonic-gate if (mir_clnt_dup_request(q, mp)) { 27100Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 27110Sstevel@tonic-gate freemsg(mp); 27120Sstevel@tonic-gate return; 27130Sstevel@tonic-gate } 27140Sstevel@tonic-gate break; 27150Sstevel@tonic-gate case RPC_SERVER: 27160Sstevel@tonic-gate /* 27170Sstevel@tonic-gate * Set mir_hold_inbound so that new inbound RPC 27180Sstevel@tonic-gate * messages will be held until the client catches 27190Sstevel@tonic-gate * up on the earlier replies. This flag is cleared 27200Sstevel@tonic-gate * in mir_wsrv after flow control is relieved; 27210Sstevel@tonic-gate * the read-side queue is also enabled at that time. 
27220Sstevel@tonic-gate */ 27230Sstevel@tonic-gate mir->mir_hold_inbound = 1; 27240Sstevel@tonic-gate break; 27250Sstevel@tonic-gate default: 27260Sstevel@tonic-gate RPCLOG(1, "mir_wput: unexpected mir_type %d\n", mir->mir_type); 27270Sstevel@tonic-gate break; 27280Sstevel@tonic-gate } 27290Sstevel@tonic-gate mir->mir_inwservice = 1; 27300Sstevel@tonic-gate (void) putq(q, mp); 27310Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 27320Sstevel@tonic-gate } 27330Sstevel@tonic-gate 27340Sstevel@tonic-gate static void 27350Sstevel@tonic-gate mir_wput_other(queue_t *q, mblk_t *mp) 27360Sstevel@tonic-gate { 27370Sstevel@tonic-gate mir_t *mir = (mir_t *)q->q_ptr; 27380Sstevel@tonic-gate struct iocblk *iocp; 27390Sstevel@tonic-gate uchar_t *rptr = mp->b_rptr; 27400Sstevel@tonic-gate bool_t flush_in_svc = FALSE; 27410Sstevel@tonic-gate 27420Sstevel@tonic-gate ASSERT(MUTEX_NOT_HELD(&mir->mir_mutex)); 27430Sstevel@tonic-gate switch (mp->b_datap->db_type) { 27440Sstevel@tonic-gate case M_IOCTL: 27450Sstevel@tonic-gate iocp = (struct iocblk *)rptr; 27460Sstevel@tonic-gate switch (iocp->ioc_cmd) { 27470Sstevel@tonic-gate case RPC_CLIENT: 27480Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 27490Sstevel@tonic-gate if (mir->mir_type != 0 && 27500Sstevel@tonic-gate mir->mir_type != iocp->ioc_cmd) { 27510Sstevel@tonic-gate ioc_eperm: 27520Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 27530Sstevel@tonic-gate iocp->ioc_error = EPERM; 27540Sstevel@tonic-gate iocp->ioc_count = 0; 27550Sstevel@tonic-gate mp->b_datap->db_type = M_IOCACK; 27560Sstevel@tonic-gate qreply(q, mp); 27570Sstevel@tonic-gate return; 27580Sstevel@tonic-gate } 27590Sstevel@tonic-gate 27600Sstevel@tonic-gate mir->mir_type = iocp->ioc_cmd; 27610Sstevel@tonic-gate 27620Sstevel@tonic-gate /* 27630Sstevel@tonic-gate * Clear mir_hold_inbound which was set to 1 by 27640Sstevel@tonic-gate * mir_open. This flag is not used on client 27650Sstevel@tonic-gate * streams. 
27660Sstevel@tonic-gate */ 27670Sstevel@tonic-gate mir->mir_hold_inbound = 0; 27680Sstevel@tonic-gate mir->mir_max_msg_sizep = &clnt_max_msg_size; 27690Sstevel@tonic-gate 27700Sstevel@tonic-gate /* 27710Sstevel@tonic-gate * Start the idle timer. See mir_timer() for more 27720Sstevel@tonic-gate * information on how client timers work. 27730Sstevel@tonic-gate */ 27740Sstevel@tonic-gate mir->mir_idle_timeout = clnt_idle_timeout; 27750Sstevel@tonic-gate mir_clnt_idle_start(q, mir); 27760Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 27770Sstevel@tonic-gate 27780Sstevel@tonic-gate mp->b_datap->db_type = M_IOCACK; 27790Sstevel@tonic-gate qreply(q, mp); 27800Sstevel@tonic-gate return; 27810Sstevel@tonic-gate case RPC_SERVER: 27820Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 27830Sstevel@tonic-gate if (mir->mir_type != 0 && 27840Sstevel@tonic-gate mir->mir_type != iocp->ioc_cmd) 27850Sstevel@tonic-gate goto ioc_eperm; 27860Sstevel@tonic-gate 27870Sstevel@tonic-gate /* 27880Sstevel@tonic-gate * We don't clear mir_hold_inbound here because 27890Sstevel@tonic-gate * mir_hold_inbound is used in the flow control 27900Sstevel@tonic-gate * model. If we cleared it here, then we'd commit 27910Sstevel@tonic-gate * a small violation to the model where the transport 27920Sstevel@tonic-gate * might immediately block downstream flow. 27930Sstevel@tonic-gate */ 27940Sstevel@tonic-gate 27950Sstevel@tonic-gate mir->mir_type = iocp->ioc_cmd; 27960Sstevel@tonic-gate mir->mir_max_msg_sizep = &svc_max_msg_size; 27970Sstevel@tonic-gate 27980Sstevel@tonic-gate /* 27990Sstevel@tonic-gate * Start the idle timer. See mir_timer() for more 28000Sstevel@tonic-gate * information on how server timers work. 28010Sstevel@tonic-gate * 28020Sstevel@tonic-gate * Note that it is important to start the idle timer 28030Sstevel@tonic-gate * here so that connections time out even if we 28040Sstevel@tonic-gate * never receive any data on them. 
28050Sstevel@tonic-gate */ 28060Sstevel@tonic-gate mir->mir_idle_timeout = svc_idle_timeout; 28070Sstevel@tonic-gate RPCLOG(16, "mir_wput_other starting idle timer on 0x%p " 28080Sstevel@tonic-gate "because we got RPC_SERVER ioctl\n", (void *)q); 28090Sstevel@tonic-gate mir_svc_idle_start(q, mir); 28100Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 28110Sstevel@tonic-gate 28120Sstevel@tonic-gate mp->b_datap->db_type = M_IOCACK; 28130Sstevel@tonic-gate qreply(q, mp); 28140Sstevel@tonic-gate return; 28150Sstevel@tonic-gate default: 28160Sstevel@tonic-gate break; 28170Sstevel@tonic-gate } 28180Sstevel@tonic-gate break; 28190Sstevel@tonic-gate 28200Sstevel@tonic-gate case M_PROTO: 28210Sstevel@tonic-gate if (mir->mir_type == RPC_CLIENT) { 28220Sstevel@tonic-gate /* 28230Sstevel@tonic-gate * We are likely being called from the context of a 28240Sstevel@tonic-gate * service procedure. So we need to enqueue. However 28250Sstevel@tonic-gate * enqueing may put our message behind data messages. 28260Sstevel@tonic-gate * So flush the data first. 28270Sstevel@tonic-gate */ 28280Sstevel@tonic-gate flush_in_svc = TRUE; 28290Sstevel@tonic-gate } 28300Sstevel@tonic-gate if ((mp->b_wptr - rptr) < sizeof (uint32_t) || 2831*4741Sgt29601 !IS_P2ALIGNED(rptr, sizeof (uint32_t))) 28320Sstevel@tonic-gate break; 28330Sstevel@tonic-gate 28340Sstevel@tonic-gate switch (((union T_primitives *)rptr)->type) { 28350Sstevel@tonic-gate case T_DATA_REQ: 28360Sstevel@tonic-gate /* Don't pass T_DATA_REQ messages downstream. */ 28370Sstevel@tonic-gate freemsg(mp); 28380Sstevel@tonic-gate return; 28390Sstevel@tonic-gate case T_ORDREL_REQ: 28400Sstevel@tonic-gate RPCLOG(8, "mir_wput_other wq 0x%p: got T_ORDREL_REQ\n", 28410Sstevel@tonic-gate (void *)q); 28420Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 28430Sstevel@tonic-gate if (mir->mir_type != RPC_SERVER) { 28440Sstevel@tonic-gate /* 28450Sstevel@tonic-gate * We are likely being called from 28460Sstevel@tonic-gate * clnt_dispatch_notifyall(). 
Sending 28470Sstevel@tonic-gate * a T_ORDREL_REQ will result in 28480Sstevel@tonic-gate * a some kind of _IND message being sent, 28490Sstevel@tonic-gate * will be another call to 28500Sstevel@tonic-gate * clnt_dispatch_notifyall(). To keep the stack 28510Sstevel@tonic-gate * lean, queue this message. 28520Sstevel@tonic-gate */ 28530Sstevel@tonic-gate mir->mir_inwservice = 1; 28540Sstevel@tonic-gate (void) putq(q, mp); 28550Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 28560Sstevel@tonic-gate return; 28570Sstevel@tonic-gate } 28580Sstevel@tonic-gate 28590Sstevel@tonic-gate /* 28600Sstevel@tonic-gate * Mark the structure such that we don't accept any 28610Sstevel@tonic-gate * more requests from client. We could defer this 28620Sstevel@tonic-gate * until we actually send the orderly release 28630Sstevel@tonic-gate * request downstream, but all that does is delay 28640Sstevel@tonic-gate * the closing of this stream. 28650Sstevel@tonic-gate */ 28660Sstevel@tonic-gate RPCLOG(16, "mir_wput_other wq 0x%p: got T_ORDREL_REQ " 28670Sstevel@tonic-gate " so calling mir_svc_start_close\n", (void *)q); 28680Sstevel@tonic-gate 28690Sstevel@tonic-gate mir_svc_start_close(q, mir); 28700Sstevel@tonic-gate 28710Sstevel@tonic-gate /* 28720Sstevel@tonic-gate * If we have sent down a T_ORDREL_REQ, don't send 28730Sstevel@tonic-gate * any more. 28740Sstevel@tonic-gate */ 28750Sstevel@tonic-gate if (mir->mir_ordrel_pending) { 28760Sstevel@tonic-gate freemsg(mp); 28770Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 28780Sstevel@tonic-gate return; 28790Sstevel@tonic-gate } 28800Sstevel@tonic-gate 28810Sstevel@tonic-gate /* 28820Sstevel@tonic-gate * If the stream is not idle, then we hold the 28830Sstevel@tonic-gate * orderly release until it becomes idle. This 28840Sstevel@tonic-gate * ensures that KRPC will be able to reply to 28850Sstevel@tonic-gate * all requests that we have passed to it. 
28860Sstevel@tonic-gate * 28870Sstevel@tonic-gate * We also queue the request if there is data already 28880Sstevel@tonic-gate * queued, because we cannot allow the T_ORDREL_REQ 28890Sstevel@tonic-gate * to go before data. When we had a separate reply 28900Sstevel@tonic-gate * count, this was not a problem, because the 28910Sstevel@tonic-gate * reply count was reconciled when mir_wsrv() 28920Sstevel@tonic-gate * completed. 28930Sstevel@tonic-gate */ 28940Sstevel@tonic-gate if (!MIR_SVC_QUIESCED(mir) || 28950Sstevel@tonic-gate mir->mir_inwservice == 1) { 28960Sstevel@tonic-gate mir->mir_inwservice = 1; 28970Sstevel@tonic-gate (void) putq(q, mp); 28980Sstevel@tonic-gate 28990Sstevel@tonic-gate RPCLOG(16, "mir_wput_other: queuing " 29000Sstevel@tonic-gate "T_ORDREL_REQ on 0x%p\n", (void *)q); 29010Sstevel@tonic-gate 29020Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 29030Sstevel@tonic-gate return; 29040Sstevel@tonic-gate } 29050Sstevel@tonic-gate 29060Sstevel@tonic-gate /* 29070Sstevel@tonic-gate * Mark the structure so that we know we sent 29080Sstevel@tonic-gate * an orderly release request, and reset the idle timer. 29090Sstevel@tonic-gate */ 29100Sstevel@tonic-gate mir->mir_ordrel_pending = 1; 29110Sstevel@tonic-gate 29120Sstevel@tonic-gate RPCLOG(16, "mir_wput_other: calling mir_svc_idle_start" 29130Sstevel@tonic-gate " on 0x%p because we got T_ORDREL_REQ\n", 29140Sstevel@tonic-gate (void *)q); 29150Sstevel@tonic-gate 29160Sstevel@tonic-gate mir_svc_idle_start(q, mir); 29170Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 29180Sstevel@tonic-gate 29190Sstevel@tonic-gate /* 29200Sstevel@tonic-gate * When we break, we will putnext the T_ORDREL_REQ. 
29210Sstevel@tonic-gate */ 29220Sstevel@tonic-gate break; 29230Sstevel@tonic-gate 29240Sstevel@tonic-gate case T_CONN_REQ: 29250Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 29260Sstevel@tonic-gate if (mir->mir_head_mp != NULL) { 29270Sstevel@tonic-gate freemsg(mir->mir_head_mp); 29280Sstevel@tonic-gate mir->mir_head_mp = NULL; 29290Sstevel@tonic-gate mir->mir_tail_mp = NULL; 29300Sstevel@tonic-gate } 29310Sstevel@tonic-gate mir->mir_frag_len = -(int32_t)sizeof (uint32_t); 29320Sstevel@tonic-gate /* 29330Sstevel@tonic-gate * Restart timer in case mir_clnt_idle_do_stop() was 29340Sstevel@tonic-gate * called. 29350Sstevel@tonic-gate */ 29360Sstevel@tonic-gate mir->mir_idle_timeout = clnt_idle_timeout; 29370Sstevel@tonic-gate mir_clnt_idle_stop(q, mir); 29380Sstevel@tonic-gate mir_clnt_idle_start(q, mir); 29390Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 29400Sstevel@tonic-gate break; 29410Sstevel@tonic-gate 29420Sstevel@tonic-gate default: 29430Sstevel@tonic-gate /* 29440Sstevel@tonic-gate * T_DISCON_REQ is one of the interesting default 29450Sstevel@tonic-gate * cases here. Ideally, an M_FLUSH is done before 29460Sstevel@tonic-gate * T_DISCON_REQ is done. However, that is somewhat 29470Sstevel@tonic-gate * cumbersome for clnt_cots.c to do. So we queue 29480Sstevel@tonic-gate * T_DISCON_REQ, and let the service procedure 29490Sstevel@tonic-gate * flush all M_DATA. 
29500Sstevel@tonic-gate */ 29510Sstevel@tonic-gate break; 29520Sstevel@tonic-gate } 29530Sstevel@tonic-gate /* fallthru */; 29540Sstevel@tonic-gate default: 29550Sstevel@tonic-gate if (mp->b_datap->db_type >= QPCTL) { 29560Sstevel@tonic-gate if (mp->b_datap->db_type == M_FLUSH) { 29570Sstevel@tonic-gate if (mir->mir_type == RPC_CLIENT && 29580Sstevel@tonic-gate *mp->b_rptr & FLUSHW) { 29590Sstevel@tonic-gate RPCLOG(32, "mir_wput_other: flushing " 29600Sstevel@tonic-gate "wq 0x%p\n", (void *)q); 29610Sstevel@tonic-gate if (*mp->b_rptr & FLUSHBAND) { 29620Sstevel@tonic-gate flushband(q, *(mp->b_rptr + 1), 2963*4741Sgt29601 FLUSHDATA); 29640Sstevel@tonic-gate } else { 29650Sstevel@tonic-gate flushq(q, FLUSHDATA); 29660Sstevel@tonic-gate } 29670Sstevel@tonic-gate } else { 29680Sstevel@tonic-gate RPCLOG(32, "mir_wput_other: ignoring " 29690Sstevel@tonic-gate "M_FLUSH on wq 0x%p\n", (void *)q); 29700Sstevel@tonic-gate } 29710Sstevel@tonic-gate } 29720Sstevel@tonic-gate break; 29730Sstevel@tonic-gate } 29740Sstevel@tonic-gate 29750Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 29760Sstevel@tonic-gate if (mir->mir_inwservice == 0 && MIR_WCANPUTNEXT(mir, q)) { 29770Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 29780Sstevel@tonic-gate break; 29790Sstevel@tonic-gate } 29800Sstevel@tonic-gate mir->mir_inwservice = 1; 29810Sstevel@tonic-gate mir->mir_inwflushdata = flush_in_svc; 29820Sstevel@tonic-gate (void) putq(q, mp); 29830Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 29840Sstevel@tonic-gate qenable(q); 29850Sstevel@tonic-gate 29860Sstevel@tonic-gate return; 29870Sstevel@tonic-gate } 29880Sstevel@tonic-gate putnext(q, mp); 29890Sstevel@tonic-gate } 29900Sstevel@tonic-gate 29910Sstevel@tonic-gate static void 29920Sstevel@tonic-gate mir_wsrv(queue_t *q) 29930Sstevel@tonic-gate { 29940Sstevel@tonic-gate mblk_t *mp; 29950Sstevel@tonic-gate mir_t *mir; 29960Sstevel@tonic-gate bool_t flushdata; 29970Sstevel@tonic-gate 29980Sstevel@tonic-gate mir = (mir_t *)q->q_ptr; 
29990Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 30000Sstevel@tonic-gate 30010Sstevel@tonic-gate flushdata = mir->mir_inwflushdata; 30020Sstevel@tonic-gate mir->mir_inwflushdata = 0; 30030Sstevel@tonic-gate 30040Sstevel@tonic-gate while (mp = getq(q)) { 30050Sstevel@tonic-gate if (mp->b_datap->db_type == M_DATA) { 30060Sstevel@tonic-gate /* 30070Sstevel@tonic-gate * Do not send any more data if we have sent 30080Sstevel@tonic-gate * a T_ORDREL_REQ. 30090Sstevel@tonic-gate */ 30100Sstevel@tonic-gate if (flushdata || mir->mir_ordrel_pending == 1) { 30110Sstevel@tonic-gate freemsg(mp); 30120Sstevel@tonic-gate continue; 30130Sstevel@tonic-gate } 30140Sstevel@tonic-gate 30150Sstevel@tonic-gate /* 30160Sstevel@tonic-gate * Make sure that the stream can really handle more 30170Sstevel@tonic-gate * data. 30180Sstevel@tonic-gate */ 30190Sstevel@tonic-gate if (!MIR_WCANPUTNEXT(mir, q)) { 30200Sstevel@tonic-gate (void) putbq(q, mp); 30210Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 30220Sstevel@tonic-gate return; 30230Sstevel@tonic-gate } 30240Sstevel@tonic-gate 30250Sstevel@tonic-gate /* 30260Sstevel@tonic-gate * Now we pass the RPC message downstream. 30270Sstevel@tonic-gate */ 30280Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 30290Sstevel@tonic-gate putnext(q, mp); 30300Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 30310Sstevel@tonic-gate continue; 30320Sstevel@tonic-gate } 30330Sstevel@tonic-gate 30340Sstevel@tonic-gate /* 30350Sstevel@tonic-gate * This is not an RPC message, pass it downstream 30360Sstevel@tonic-gate * (ignoring flow control) if the server side is not sending a 30370Sstevel@tonic-gate * T_ORDREL_REQ downstream. 
30380Sstevel@tonic-gate */ 30390Sstevel@tonic-gate if (mir->mir_type != RPC_SERVER || 3040*4741Sgt29601 ((union T_primitives *)mp->b_rptr)->type != 3041*4741Sgt29601 T_ORDREL_REQ) { 30420Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 30430Sstevel@tonic-gate putnext(q, mp); 30440Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 30450Sstevel@tonic-gate continue; 30460Sstevel@tonic-gate } 30470Sstevel@tonic-gate 30480Sstevel@tonic-gate if (mir->mir_ordrel_pending == 1) { 30490Sstevel@tonic-gate /* 30500Sstevel@tonic-gate * Don't send two T_ORDRELs 30510Sstevel@tonic-gate */ 30520Sstevel@tonic-gate freemsg(mp); 30530Sstevel@tonic-gate continue; 30540Sstevel@tonic-gate } 30550Sstevel@tonic-gate 30560Sstevel@tonic-gate /* 30570Sstevel@tonic-gate * Mark the structure so that we know we sent an orderly 30580Sstevel@tonic-gate * release request. We will check to see slot is idle at the 30590Sstevel@tonic-gate * end of this routine, and if so, reset the idle timer to 30600Sstevel@tonic-gate * handle orderly release timeouts. 30610Sstevel@tonic-gate */ 30620Sstevel@tonic-gate mir->mir_ordrel_pending = 1; 30630Sstevel@tonic-gate RPCLOG(16, "mir_wsrv: sending ordrel req on q 0x%p\n", 3064*4741Sgt29601 (void *)q); 30650Sstevel@tonic-gate /* 30660Sstevel@tonic-gate * Send the orderly release downstream. If there are other 30670Sstevel@tonic-gate * pending replies we won't be able to send them. However, 30680Sstevel@tonic-gate * the only reason we should send the orderly release is if 30690Sstevel@tonic-gate * we were idle, or if an unusual event occurred. 
30700Sstevel@tonic-gate */ 30710Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 30720Sstevel@tonic-gate putnext(q, mp); 30730Sstevel@tonic-gate mutex_enter(&mir->mir_mutex); 30740Sstevel@tonic-gate } 30750Sstevel@tonic-gate 30760Sstevel@tonic-gate if (q->q_first == NULL) 30770Sstevel@tonic-gate /* 30780Sstevel@tonic-gate * If we call mir_svc_idle_start() below, then 30790Sstevel@tonic-gate * clearing mir_inwservice here will also result in 30800Sstevel@tonic-gate * any thread waiting in mir_close() to be signaled. 30810Sstevel@tonic-gate */ 30820Sstevel@tonic-gate mir->mir_inwservice = 0; 30830Sstevel@tonic-gate 30840Sstevel@tonic-gate if (mir->mir_type != RPC_SERVER) { 30850Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 30860Sstevel@tonic-gate return; 30870Sstevel@tonic-gate } 30880Sstevel@tonic-gate 30890Sstevel@tonic-gate /* 30900Sstevel@tonic-gate * If idle we call mir_svc_idle_start to start the timer (or wakeup 30910Sstevel@tonic-gate * a close). Also make sure not to start the idle timer on the 30920Sstevel@tonic-gate * listener stream. This can cause nfsd to send an orderly release 30930Sstevel@tonic-gate * command on the listener stream. 30940Sstevel@tonic-gate */ 30950Sstevel@tonic-gate if (MIR_SVC_QUIESCED(mir) && !(mir->mir_listen_stream)) { 30960Sstevel@tonic-gate RPCLOG(16, "mir_wsrv: calling mir_svc_idle_start on 0x%p " 30970Sstevel@tonic-gate "because mir slot is idle\n", (void *)q); 30980Sstevel@tonic-gate mir_svc_idle_start(q, mir); 30990Sstevel@tonic-gate } 31000Sstevel@tonic-gate 31010Sstevel@tonic-gate /* 31020Sstevel@tonic-gate * If outbound flow control has been relieved, then allow new 31030Sstevel@tonic-gate * inbound requests to be processed. 
31040Sstevel@tonic-gate */ 31050Sstevel@tonic-gate if (mir->mir_hold_inbound) { 31060Sstevel@tonic-gate mir->mir_hold_inbound = 0; 31070Sstevel@tonic-gate qenable(RD(q)); 31080Sstevel@tonic-gate } 31090Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 31100Sstevel@tonic-gate } 31110Sstevel@tonic-gate 31120Sstevel@tonic-gate static void 31130Sstevel@tonic-gate mir_disconnect(queue_t *q, mir_t *mir) 31140Sstevel@tonic-gate { 31150Sstevel@tonic-gate ASSERT(MUTEX_HELD(&mir->mir_mutex)); 31160Sstevel@tonic-gate 31170Sstevel@tonic-gate switch (mir->mir_type) { 31180Sstevel@tonic-gate case RPC_CLIENT: 31190Sstevel@tonic-gate /* 31200Sstevel@tonic-gate * We are disconnecting, but not necessarily 31210Sstevel@tonic-gate * closing. By not closing, we will fail to 31220Sstevel@tonic-gate * pick up a possibly changed global timeout value, 31230Sstevel@tonic-gate * unless we store it now. 31240Sstevel@tonic-gate */ 31250Sstevel@tonic-gate mir->mir_idle_timeout = clnt_idle_timeout; 31260Sstevel@tonic-gate mir_clnt_idle_start(WR(q), mir); 31270Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 31280Sstevel@tonic-gate 31290Sstevel@tonic-gate /* 31300Sstevel@tonic-gate * T_DISCON_REQ is passed to KRPC as an integer value 31310Sstevel@tonic-gate * (this is not a TPI message). It is used as a 31320Sstevel@tonic-gate * convenient value to indicate a sanity check 31330Sstevel@tonic-gate * failure -- the same KRPC routine is also called 31340Sstevel@tonic-gate * for T_DISCON_INDs and T_ORDREL_INDs. 
31350Sstevel@tonic-gate */ 31360Sstevel@tonic-gate clnt_dispatch_notifyall(WR(q), T_DISCON_REQ, 0); 31370Sstevel@tonic-gate break; 31380Sstevel@tonic-gate 31390Sstevel@tonic-gate case RPC_SERVER: 31400Sstevel@tonic-gate mir->mir_svc_no_more_msgs = 1; 31410Sstevel@tonic-gate mir_svc_idle_stop(WR(q), mir); 31420Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 31430Sstevel@tonic-gate RPCLOG(16, "mir_disconnect: telling " 3144*4741Sgt29601 "stream head listener to disconnect stream " 3145*4741Sgt29601 "(0x%p)\n", (void *) q); 31460Sstevel@tonic-gate (void) mir_svc_policy_notify(q, 2); 31470Sstevel@tonic-gate break; 31480Sstevel@tonic-gate 31490Sstevel@tonic-gate default: 31500Sstevel@tonic-gate mutex_exit(&mir->mir_mutex); 31510Sstevel@tonic-gate break; 31520Sstevel@tonic-gate } 31530Sstevel@tonic-gate } 31540Sstevel@tonic-gate 31550Sstevel@tonic-gate /* 31560Sstevel@tonic-gate * do a sanity check on the length of the fragment. 31570Sstevel@tonic-gate * returns 1 if bad else 0. 31580Sstevel@tonic-gate */ 31590Sstevel@tonic-gate static int 31600Sstevel@tonic-gate mir_check_len(queue_t *q, int32_t frag_len, 31610Sstevel@tonic-gate mblk_t *head_mp) 31620Sstevel@tonic-gate { 31630Sstevel@tonic-gate mir_t *mir; 31640Sstevel@tonic-gate 31650Sstevel@tonic-gate mir = (mir_t *)q->q_ptr; 31660Sstevel@tonic-gate 31670Sstevel@tonic-gate /* 31680Sstevel@tonic-gate * Do a sanity check on the message length. If this message is 31690Sstevel@tonic-gate * getting excessively large, shut down the connection. 
31700Sstevel@tonic-gate */ 31710Sstevel@tonic-gate 31720Sstevel@tonic-gate if ((frag_len <= 0) || (mir->mir_max_msg_sizep == NULL) || 3173*4741Sgt29601 (frag_len <= *mir->mir_max_msg_sizep)) { 31740Sstevel@tonic-gate return (0); 31750Sstevel@tonic-gate } 31760Sstevel@tonic-gate 31770Sstevel@tonic-gate freemsg(head_mp); 31780Sstevel@tonic-gate mir->mir_head_mp = (mblk_t *)0; 31790Sstevel@tonic-gate mir->mir_frag_len = -(int)sizeof (uint32_t); 31800Sstevel@tonic-gate if (mir->mir_type != RPC_SERVER || mir->mir_setup_complete) { 31810Sstevel@tonic-gate cmn_err(CE_NOTE, 3182*4741Sgt29601 "KRPC: record fragment from %s of size(%d) exceeds " 3183*4741Sgt29601 "maximum (%u). Disconnecting", 3184*4741Sgt29601 (mir->mir_type == RPC_CLIENT) ? "server" : 3185*4741Sgt29601 (mir->mir_type == RPC_SERVER) ? "client" : 3186*4741Sgt29601 "test tool", 3187*4741Sgt29601 frag_len, *mir->mir_max_msg_sizep); 31880Sstevel@tonic-gate } 31890Sstevel@tonic-gate 31900Sstevel@tonic-gate mir_disconnect(q, mir); 31910Sstevel@tonic-gate return (1); 31920Sstevel@tonic-gate } 3193